[PATCH] REST: Fix duplicate project queries
Stephen Finucane
stephen at that.guru
Sun Feb 2 21:50:59 AEDT 2020
On Sun, 2020-02-02 at 11:29 +0100, Mete Polat wrote:
> Hi Stephen,
>
> On 01.02.20 15:05, Stephen Finucane wrote:
> > On Wed, 2020-01-29 at 20:01 +0100, Mete Polat wrote:
> > > Eliminates duplicate project queries caused by calling
> > > get_absolute_url() in the embedded serializers. Following foreign keys
> > > with 'series__project' will cache the project of the series as well as
> > > the series itself.
> > >
> > > Signed-off-by: Mete Polat <metepolat2000 at gmail.com>
> >
> > Hey Mete,
> >
> > > ---
> > > There are still some duplicates in various /api/ views but it looks like
> > > those are caused by the REST framework itself.
> > >
> > > patchwork/api/cover.py | 2 +-
> > > patchwork/api/event.py | 4 ++--
> > > patchwork/api/patch.py | 2 +-
> > > patchwork/api/series.py | 5 +++--
> > > 4 files changed, 7 insertions(+), 6 deletions(-)
> > >
> > > diff --git a/patchwork/api/cover.py b/patchwork/api/cover.py
> > > index caf9a386efa5..9e86d47e00e5 100644
> > > --- a/patchwork/api/cover.py
> > > +++ b/patchwork/api/cover.py
> > > @@ -101,7 +101,7 @@ class CoverLetterList(ListAPIView):
> > >
> > > def get_queryset(self):
> > > return CoverLetter.objects.all()\
> > > - .select_related('project', 'submitter', 'series')\
> > > + .select_related('project', 'submitter', 'series__project')\
> > > .defer('content', 'headers')
> > >
> > >
> > > diff --git a/patchwork/api/event.py b/patchwork/api/event.py
> > > index a066faaec63b..fdff6a4f2fa6 100644
> > > --- a/patchwork/api/event.py
> > > +++ b/patchwork/api/event.py
> > > @@ -86,7 +86,7 @@ class EventList(ListAPIView):
> > >
> > > def get_queryset(self):
> > > return Event.objects.all()\
> > > - .prefetch_related('project', 'patch', 'series', 'cover',
> > > - 'previous_state', 'current_state',
> > > + .prefetch_related('project', 'patch__project', 'series__project',
> > > + 'cover', 'previous_state', 'current_state',
> > > 'previous_delegate', 'current_delegate',
> > > 'created_check')
> >
> > The rest of these look good but I wasn't able to produce a test that
> > proved this particular change was doing anything. Are you sure this
> > particular change works and, if so, could you suggest one or more
> > scenarios that I could use to validate this?
> >
>
> Just checked it again. Without patch__project, I get tons of these
> duplicate queries:
>
> SELECT `patchwork_project`.`id`,
> `patchwork_project`.`linkname`,
> `patchwork_project`.`name`,
> `patchwork_project`.`listid`,
> `patchwork_project`.`listemail`,
> `patchwork_project`.`subject_match`,
> `patchwork_project`.`web_url`,
> `patchwork_project`.`scm_url`,
> `patchwork_project`.`webscm_url`,
> `patchwork_project`.`list_archive_url`,
> `patchwork_project`.`list_archive_url_format`,
> `patchwork_project`.`commit_url_format`,
> `patchwork_project`.`send_notifications`,
> `patchwork_project`.`use_tags`
> FROM `patchwork_project`
> WHERE `patchwork_project`.`id` = 2
>
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/django/contrib/staticfiles/handlers.py
> in __call__(65)
> return self.application(environ, start_response)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/django/views/decorators/csrf.py
> in wrapped_view(54)
> return view_func(*args, **kwargs)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/django/views/generic/base.py
> in view(71)
> return self.dispatch(request, *args, **kwargs)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/views.py
> in dispatch(502)
> response = handler(request, *args, **kwargs)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/generics.py
> in get(199)
> return self.list(request, *args, **kwargs)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/mixins.py
> in list(43)
> return self.get_paginated_response(serializer.data)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/serializers.py
> in data(757)
> ret = super().data
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/serializers.py
> in data(261)
> self._data = self.to_representation(self.instance)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/serializers.py
> in to_representation(674)
> return [
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/serializers.py
> in <listcomp>(675)
> self.child.to_representation(item) for item in iterable
> /home/patchwork/patchwork/patchwork/api/event.py in to_representation(51)
> data = super(EventSerializer, self).to_representation(instance)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/serializers.py
> in to_representation(526)
> ret[field.field_name] = field.to_representation(attribute)
> /home/patchwork/patchwork/patchwork/api/embedded.py in to_representation(57)
> return self._Serializer(context=self.context).to_representation(data)
> /home/patchwork/patchwork/patchwork/api/base.py in to_representation(90)
> data = super(BaseHyperlinkedModelSerializer, self).to_representation(
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/serializers.py
> in to_representation(526)
> ret[field.field_name] = field.to_representation(attribute)
> /opt/pyenv/versions/3.8.0/lib/python3.8/site-packages/rest_framework/fields.py
> in to_representation(1873)
> return method(value)
> /home/patchwork/patchwork/patchwork/api/embedded.py in get_web_url(81)
> return request.build_absolute_uri(instance.get_absolute_url())
> /home/patchwork/patchwork/patchwork/models.py in get_absolute_url(600)
> kwargs={'project_id': self.project.linkname,
>
> Same goes for series__project.
> I didn't write a test case but I was able to manually produce this
> behavior by just viewing the /api/events on my local instance and by
> optionally filtering for patch/series_created events. I think you should
> be able to reproduce this when there are enough of these patch/series
> events.
Ok, managed to get this to have an effect once I started creating a few
more events. Have applied this along with the test patch I sent
yesterday. Thanks!
Stephen
> Best regards,
>
> Mete
>
> > Cheers,
> > Stephen
> >
> > > diff --git a/patchwork/api/patch.py b/patchwork/api/patch.py
> > > index a29a1ab0eb71..1a3ce9057490 100644
> > > --- a/patchwork/api/patch.py
> > > +++ b/patchwork/api/patch.py
> > > @@ -176,7 +176,7 @@ class PatchList(ListAPIView):
> > > return Patch.objects.all()\
> > > .prefetch_related('check_set')\
> > > .select_related('project', 'state', 'submitter', 'delegate',
> > > - 'series')\
> > > + 'series__project')\
> > > .defer('content', 'diff', 'headers')
> > >
> > >
> > > diff --git a/patchwork/api/series.py b/patchwork/api/series.py
> > > index f7bb8c06a6c9..df28f95dab1b 100644
> > > --- a/patchwork/api/series.py
> > > +++ b/patchwork/api/series.py
> > > @@ -55,8 +55,9 @@ class SeriesMixin(object):
> > > serializer_class = SeriesSerializer
> > >
> > > def get_queryset(self):
> > > - return Series.objects.all().prefetch_related('patches',)\
> > > - .select_related('submitter', 'cover_letter', 'project')
> > > + return Series.objects.all()\
> > > + .prefetch_related('patches__project',)\
> > > + .select_related('submitter', 'cover_letter__project', 'project')
> > >
> > >
> > > class SeriesList(SeriesMixin, ListAPIView):
More information about the Patchwork mailing list