1
0
mirror of https://github.com/django/django.git synced 2025-10-24 22:26:08 +00:00

[1.0.X] This fixes a group of problems in the SQL created by QuerySet.exclude() when used in a few situations where NULL results can appear.

Fixed #8921 (the only ticket I know of that noticed any of these).

Backport of r9590 from trunk.


git-svn-id: http://code.djangoproject.com/svn/django/branches/releases/1.0.X@9591 bcc190cf-cafb-0310-a4f2-bffc1f526a37
This commit is contained in:
Malcolm Tredinnick
2008-12-08 02:47:05 +00:00
parent a8a4743b1d
commit 61e36bd7d1
2 changed files with 53 additions and 20 deletions

View File

@@ -54,7 +54,6 @@ class BaseQuery(object):
self.default_ordering = True self.default_ordering = True
self.standard_ordering = True self.standard_ordering = True
self.ordering_aliases = [] self.ordering_aliases = []
self.start_meta = None
self.select_fields = [] self.select_fields = []
self.related_select_fields = [] self.related_select_fields = []
self.dupe_avoidance = {} self.dupe_avoidance = {}
@@ -125,10 +124,9 @@ class BaseQuery(object):
def get_meta(self): def get_meta(self):
""" """
Returns the Options instance (the model._meta) from which to start Returns the Options instance (the model._meta) from which to start
processing. Normally, this is self.model._meta, but it can change. processing. Normally, this is self.model._meta, but it can be changed
by subclasses.
""" """
if self.start_meta:
return self.start_meta
return self.model._meta return self.model._meta
def quote_name_unless_alias(self, name): def quote_name_unless_alias(self, name):
@@ -166,7 +164,6 @@ class BaseQuery(object):
obj.default_ordering = self.default_ordering obj.default_ordering = self.default_ordering
obj.standard_ordering = self.standard_ordering obj.standard_ordering = self.standard_ordering
obj.ordering_aliases = [] obj.ordering_aliases = []
obj.start_meta = self.start_meta
obj.select_fields = self.select_fields[:] obj.select_fields = self.select_fields[:]
obj.related_select_fields = self.related_select_fields[:] obj.related_select_fields = self.related_select_fields[:]
obj.dupe_avoidance = self.dupe_avoidance.copy() obj.dupe_avoidance = self.dupe_avoidance.copy()
@@ -1485,11 +1482,24 @@ class BaseQuery(object):
query = Query(self.model, self.connection) query = Query(self.model, self.connection)
query.add_filter(filter_expr, can_reuse=can_reuse) query.add_filter(filter_expr, can_reuse=can_reuse)
query.bump_prefix() query.bump_prefix()
query.set_start(prefix)
query.clear_ordering(True) query.clear_ordering(True)
query.set_start(prefix)
self.add_filter(('%s__in' % prefix, query), negate=True, trim=True, self.add_filter(('%s__in' % prefix, query), negate=True, trim=True,
can_reuse=can_reuse) can_reuse=can_reuse)
# If there's more than one join in the inner query (before any initial
# bits were trimmed -- which means the last active table is more than
# two places into the alias list), we need to also handle the
# possibility that the earlier joins don't match anything by adding a
# comparison to NULL (e.g. in
# Tag.objects.exclude(parent__parent__name='t1'), a tag with no parent
# would otherwise be overlooked).
active_positions = [pos for (pos, count) in
enumerate(query.alias_refcount.itervalues()) if count]
if active_positions[-1] > 1:
self.add_filter(('%s__isnull' % prefix, False), negate=True,
trim=True, can_reuse=can_reuse)
def set_limits(self, low=None, high=None): def set_limits(self, low=None, high=None):
""" """
Adjusts the limits on the rows retrieved. We use low/high to set these, Adjusts the limits on the rows retrieved. We use low/high to set these,
@@ -1695,18 +1705,26 @@ class BaseQuery(object):
alias = self.get_initial_alias() alias = self.get_initial_alias()
field, col, opts, joins, last, extra = self.setup_joins( field, col, opts, joins, last, extra = self.setup_joins(
start.split(LOOKUP_SEP), opts, alias, False) start.split(LOOKUP_SEP), opts, alias, False)
alias = joins[last[-1]] select_col = self.alias_map[joins[1]][LHS_JOIN_COL]
self.select = [(alias, self.alias_map[alias][RHS_JOIN_COL])] select_alias = alias
self.select_fields = [field]
self.start_meta = opts
# The call to setup_joins add an extra reference to everything in # The call to setup_joins added an extra reference to everything in
# joins. So we need to unref everything once, and everything prior to # joins. Reverse that.
# the final join a second time.
for alias in joins: for alias in joins:
self.unref_alias(alias) self.unref_alias(alias)
for alias in joins[:last[-1]]:
self.unref_alias(alias) # We might be able to trim some joins from the front of this query,
# providing that we only traverse "always equal" connections (i.e. rhs
# is *always* the same value as lhs).
for alias in joins[1:]:
join_info = self.alias_map[alias]
if (join_info[LHS_JOIN_COL] != select_col
or join_info[JOIN_TYPE] != self.INNER):
break
self.unref_alias(select_alias)
select_alias = join_info[RHS_ALIAS]
select_col = join_info[RHS_JOIN_COL]
self.select = [(select_alias, select_col)]
def execute_sql(self, result_type=MULTI): def execute_sql(self, result_type=MULTI):
""" """

View File

@@ -675,7 +675,7 @@ thus fail.)
... s.reverse() ... s.reverse()
... params.reverse() ... params.reverse()
# This slightly odd comparison works aorund the fact that PostgreSQL will # This slightly odd comparison works around the fact that PostgreSQL will
# return 'one' and 'two' as strings, not Unicode objects. It's a side-effect of # return 'one' and 'two' as strings, not Unicode objects. It's a side-effect of
# using constants here and not a real concern. # using constants here and not a real concern.
>>> d = Item.objects.extra(select=SortedDict(s), select_params=params).values('a', 'b')[0] >>> d = Item.objects.extra(select=SortedDict(s), select_params=params).values('a', 'b')[0]
@@ -742,7 +742,7 @@ We can do slicing beyond what is currently in the result cache, too.
## only apparent much later when the full test suite runs. I don't understand ## only apparent much later when the full test suite runs. I don't understand
## what's going on here yet. ## what's going on here yet.
## ##
## # We need to mess with the implemenation internals a bit here to decrease the ## # We need to mess with the implementation internals a bit here to decrease the
## # cache fill size so that we don't read all the results at once. ## # cache fill size so that we don't read all the results at once.
## >>> from django.db.models import query ## >>> from django.db.models import query
## >>> query.ITER_CHUNK_SIZE = 2 ## >>> query.ITER_CHUNK_SIZE = 2
@@ -795,7 +795,7 @@ More twisted cases, involving nested negations.
[<Item: four>, <Item: one>, <Item: three>] [<Item: four>, <Item: one>, <Item: three>]
Bug #7095 Bug #7095
Updates that are filtered on the model being updated are somewhat tricky to get Updates that are filtered on the model being updated are somewhat tricky
in MySQL. This exercises that case. in MySQL. This exercises that case.
>>> mm = ManagedModel.objects.create(data='mm1', tag=t1, public=True) >>> mm = ManagedModel.objects.create(data='mm1', tag=t1, public=True)
>>> ManagedModel.objects.update(data='mm') >>> ManagedModel.objects.update(data='mm')
@@ -998,13 +998,28 @@ model. But it should still be possible to add new ordering after that.
>>> 'ORDER BY' in qs.query.as_sql()[0] >>> 'ORDER BY' in qs.query.as_sql()[0]
True True
Bug #9188 -- incorrect SQL was being generated for certain types of Incorrect SQL was being generated for certain types of exclude() queries that
exclude() queries that crossed multi-valued relations. crossed multi-valued relations (#8921, #9188 and some pre-emptively discovered
cases).
>>> PointerA.objects.filter(connection__pointerb__id=1) >>> PointerA.objects.filter(connection__pointerb__id=1)
[] []
>>> PointerA.objects.exclude(connection__pointerb__id=1) >>> PointerA.objects.exclude(connection__pointerb__id=1)
[] []
>>> Tag.objects.exclude(children=None)
[<Tag: t1>, <Tag: t3>]
# This example is tricky because the parent could be NULL, so only checking
# parents with annotations omits some results (tag t1, in this case).
>>> Tag.objects.exclude(parent__annotation__name="a1")
[<Tag: t1>, <Tag: t4>, <Tag: t5>]
# The annotation->tag link is single-valued and the tag->children link is
# multi-valued. So we have to split the exclude filter in the middle and then
# optimise the inner query without losing results.
>>> Annotation.objects.exclude(tag__children__name="t2")
[<Annotation: a2>]
"""} """}
# In Python 2.3 and the Python 2.6 beta releases, exceptions raised in __len__ # In Python 2.3 and the Python 2.6 beta releases, exceptions raised in __len__