queryset-refactor: Moved the Query subclasses into their own file.

Trying to keep file lengths to something manageable. git-svn-id: http://code.djangoproject.com/svn/django/branches/queryset-refactor@7164 bcc190cf-cafb-0310-a4f2-bffc1f526a37
2025-07-05 18:29:11 +00:00 · 2008-02-27 02:15:41 +00:00 · 2008-02-27 02:15:41 +00:00 · 231e735c07
commit 231e735c07
parent 014373b459
5 changed files with 328 additions and 312 deletions
--- a/django/db/models/sql/init.py
+++ b/django/db/models/sql/init.py
@ -1,4 +1,5 @@
 from query import *
+from subqueries import *
 from where import AND, OR

 __all__ = ['Query', 'AND', 'OR']
--- a/django/db/models/sql/constants.py
+++ b/django/db/models/sql/constants.py
@ -0,0 +1,40 @@
+import re
+
+# Valid query types (a dictionary is used for speedy lookups).
+QUERY_TERMS = dict([(x, None) for x in (
+    'exact', 'iexact', 'contains', 'icontains', 'gt', 'gte', 'lt', 'lte', 'in',
+    'startswith', 'istartswith', 'endswith', 'iendswith', 'range', 'year',
+    'month', 'day', 'isnull', 'search', 'regex', 'iregex',
+    )])
+
+# Size of each "chunk" for get_iterator calls.
+# Larger values are slightly faster at the expense of more storage space.
+GET_ITERATOR_CHUNK_SIZE = 100
+
+# Separator used to split filter strings apart.
+LOOKUP_SEP = '__'
+
+# Constants to make looking up tuple values clearer.
+# Join lists
+TABLE_NAME = 0
+RHS_ALIAS = 1
+JOIN_TYPE = 2
+LHS_ALIAS = 3
+LHS_JOIN_COL = 4
+RHS_JOIN_COL = 5
+# Alias map lists
+ALIAS_TABLE = 0
+ALIAS_REFCOUNT = 1
+ALIAS_JOIN = 2
+ALIAS_NULLABLE=3
+
+# How many results to expect from a cursor.execute call
+MULTI = 'multi'
+SINGLE = 'single'
+
+ORDER_PATTERN = re.compile(r'\?|[-+]?\w+$')
+ORDER_DIR = {
+    'ASC': ('ASC', 'DESC'),
+    'DESC': ('DESC', 'ASC')}
+
+
--- a/django/db/models/sql/datastructures.py
+++ b/django/db/models/sql/datastructures.py
@ -9,6 +9,13 @@ class EmptyResultSet(Exception):
 class FullResultSet(Exception):
    pass

+class Empty(object):
+    pass
+
+class RawValue(object):
+    def __init__(self, value):
+        self.value = value
+
 class Aggregate(object):
    """
    Base class for all aggregate-related classes (min, max, avg, count, sum).
--- a/django/db/models/sql/query.py
+++ b/django/db/models/sql/query.py
@ -8,69 +8,23 @@ all about the internals of models in order to get the information it needs.
 """

 import copy
-import operator
-import re

 from django.utils.tree import Node
 from django.utils.datastructures import SortedDict
 from django.dispatch import dispatcher
 from django.db.models import signals
 from django.db.models.sql.where import WhereNode, EverythingNode, AND, OR
-from django.db.models.sql.datastructures import Count, Date
+from django.db.models.sql.datastructures import Count
 from django.db.models.fields import FieldDoesNotExist, Field, related
-from django.contrib.contenttypes import generic
 from django.core.exceptions import FieldError
-from datastructures import EmptyResultSet
+from datastructures import EmptyResultSet, Empty
+from constants import *

 try:
    reversed
 except NameError:
    from django.utils.itercompat import reversed    # For python 2.3.

-# Valid query types (a dictionary is used for speedy lookups).
-QUERY_TERMS = dict([(x, None) for x in (
-    'exact', 'iexact', 'contains', 'icontains', 'gt', 'gte', 'lt', 'lte', 'in',
-    'startswith', 'istartswith', 'endswith', 'iendswith', 'range', 'year',
-    'month', 'day', 'isnull', 'search', 'regex', 'iregex',
-    )])
-
-# Size of each "chunk" for get_iterator calls.
-# Larger values are slightly faster at the expense of more storage space.
-GET_ITERATOR_CHUNK_SIZE = 100
-
-# Separator used to split filter strings apart.
-LOOKUP_SEP = '__'
-
-# Constants to make looking up tuple values clearer.
-# Join lists
-TABLE_NAME = 0
-RHS_ALIAS = 1
-JOIN_TYPE = 2
-LHS_ALIAS = 3
-LHS_JOIN_COL = 4
-RHS_JOIN_COL = 5
-# Alias map lists
-ALIAS_TABLE = 0
-ALIAS_REFCOUNT = 1
-ALIAS_JOIN = 2
-ALIAS_NULLABLE=3
-
-# How many results to expect from a cursor.execute call
-MULTI = 'multi'
-SINGLE = 'single'
-
-ORDER_PATTERN = re.compile(r'\?|[-+]?\w+$')
-ORDER_DIR = {
-    'ASC': ('ASC', 'DESC'),
-    'DESC': ('DESC', 'ASC')}
-
-class Empty(object):
-    pass
-
-class RawValue(object):
-    def __init__(self, value):
-        self.value = value
-
 class Query(object):
    """
    A single SQL query.
@ -200,6 +154,7 @@ class Query(object):
        """
        Performs a COUNT() query using the current filter constraints.
        """
+        from subqueries import CountQuery
        obj = self.clone()
        obj.clear_ordering(True)
        obj.clear_limits()
@ -1126,269 +1081,6 @@ class Query(object):
        # The MULTI case.
        return results_iter(cursor)

-class DeleteQuery(Query):
-    """
-    Delete queries are done through this class, since they are more constrained
-    than general queries.
-    """
-    def as_sql(self):
-        """
-        Creates the SQL for this query. Returns the SQL string and list of
-        parameters.
-        """
-        assert len(self.tables) == 1, \
-                "Can only delete from one table at a time."
-        result = ['DELETE FROM %s' % self.tables[0]]
-        where, params = self.where.as_sql()
-        result.append('WHERE %s' % where)
-        return ' '.join(result), tuple(params)
-
-    def do_query(self, table, where):
-        self.tables = [table]
-        self.where = where
-        self.execute_sql(None)
-
-    def delete_batch_related(self, pk_list):
-        """
-        Set up and execute delete queries for all the objects related to the
-        primary key values in pk_list. To delete the objects themselves, use
-        the delete_batch() method.
-
-        More than one physical query may be executed if there are a
-        lot of values in pk_list.
-        """
-        cls = self.model
-        for related in cls._meta.get_all_related_many_to_many_objects():
-            if not isinstance(related.field, generic.GenericRelation):
-                for offset in range(0, len(pk_list), GET_ITERATOR_CHUNK_SIZE):
-                    where = self.where_class()
-                    where.add((None, related.field.m2m_reverse_name(),
-                            related.field, 'in',
-                            pk_list[offset : offset+GET_ITERATOR_CHUNK_SIZE]),
-                            AND)
-                    self.do_query(related.field.m2m_db_table(), where)
-
-        for f in cls._meta.many_to_many:
-            w1 = self.where_class()
-            if isinstance(f, generic.GenericRelation):
-                from django.contrib.contenttypes.models import ContentType
-                field = f.rel.to._meta.get_field(f.content_type_field_name)
-                w1.add((None, field.column, field, 'exact',
-                        ContentType.objects.get_for_model(cls).id), AND)
-            for offset in range(0, len(pk_list), GET_ITERATOR_CHUNK_SIZE):
-                where = self.where_class()
-                where.add((None, f.m2m_column_name(), f, 'in',
-                        pk_list[offset : offset + GET_ITERATOR_CHUNK_SIZE]),
-                        AND)
-                if w1:
-                    where.add(w1, AND)
-                self.do_query(f.m2m_db_table(), where)
-
-    def delete_batch(self, pk_list):
-        """
-        Set up and execute delete queries for all the objects in pk_list. This
-        should be called after delete_batch_related(), if necessary.
-
-        More than one physical query may be executed if there are a
-        lot of values in pk_list.
-        """
-        for offset in range(0, len(pk_list), GET_ITERATOR_CHUNK_SIZE):
-            where = self.where_class()
-            field = self.model._meta.pk
-            where.add((None, field.column, field, 'in',
-                    pk_list[offset : offset + GET_ITERATOR_CHUNK_SIZE]), AND)
-            self.do_query(self.model._meta.db_table, where)
-
-class UpdateQuery(Query):
-    """
-    Represents an "update" SQL query.
-    """
-    def __init__(self, *args, **kwargs):
-        super(UpdateQuery, self).__init__(*args, **kwargs)
-        self._setup_query()
-
-    def _setup_query(self):
-        """
-        Run on initialisation and after cloning.
-        """
-        self.values = []
-
-    def as_sql(self):
-        """
-        Creates the SQL for this query. Returns the SQL string and list of
-        parameters.
-        """
-        self.select_related = False
-        self.pre_sql_setup()
-
-        if len(self.tables) != 1:
-            # We can only update one table at a time, so we need to check that
-            # only one alias has a nonzero refcount.
-            table = None
-            for alias_list in self.table_map.values():
-                for alias in alias_list:
-                    if self.alias_map[alias][ALIAS_REFCOUNT]:
-                        if table:
-                            raise FieldError('Updates can only access a single database table at a time.')
-                        table = alias
-        else:
-            table = self.tables[0]
-
-        qn = self.quote_name_unless_alias
-        result = ['UPDATE %s' % qn(table)]
-        result.append('SET')
-        values, update_params = [], []
-        for name, val in self.values:
-            if val is not None:
-                values.append('%s = %%s' % qn(name))
-                update_params.append(val)
-            else:
-                values.append('%s = NULL' % qn(name))
-        result.append(', '.join(values))
-        where, params = self.where.as_sql()
-        if where:
-            result.append('WHERE %s' % where)
-        return ' '.join(result), tuple(update_params + params)
-
-    def clear_related(self, related_field, pk_list):
-        """
-        Set up and execute an update query that clears related entries for the
-        keys in pk_list.
-
-        This is used by the QuerySet.delete_objects() method.
-        """
-        for offset in range(0, len(pk_list), GET_ITERATOR_CHUNK_SIZE):
-            self.where = self.where_class()
-            f = self.model._meta.pk
-            self.where.add((None, f.column, f, 'in',
-                    pk_list[offset : offset + GET_ITERATOR_CHUNK_SIZE]),
-                    AND)
-            self.values = [(related_field.column, None)]
-            self.execute_sql(None)
-
-    def add_update_values(self, values):
-        from django.db.models.base import Model
-        for name, val in values.items():
-            field, model, direct, m2m = self.model._meta.get_field_by_name(name)
-            if not direct or m2m:
-                # Can only update non-relation fields and foreign keys.
-                raise fieldError('Cannot update model field %r (only non-relations and foreign keys permitted).' % field)
-            if field.rel and isinstance(val, Model):
-                val = val.pk
-            self.values.append((field.column, val))
-
-class InsertQuery(Query):
-    def __init__(self, *args, **kwargs):
-        super(InsertQuery, self).__init__(*args, **kwargs)
-        self._setup_query()
-
-    def _setup_query(self):
-        """
-        Run on initialisation and after cloning.
-        """
-        self.columns = []
-        self.values = []
-
-    def as_sql(self):
-        self.select_related = False
-        self.pre_sql_setup()
-        qn = self.quote_name_unless_alias
-        result = ['INSERT INTO %s' % qn(self.tables[0])]
-        result.append('(%s)' % ', '.join([qn(c) for c in self.columns]))
-        result.append('VALUES (')
-        params = []
-        first = True
-        for value in self.values:
-            prefix = not first and ', ' or ''
-            if isinstance(value, RawValue):
-                result.append('%s%s' % (prefix, value.value))
-            else:
-                result.append('%s%%s' % prefix)
-                params.append(value)
-            first = False
-        result.append(')')
-        return ' '.join(result), tuple(params)
-
-    def execute_sql(self, return_id=False):
-        cursor = super(InsertQuery, self).execute_sql(None)
-        if return_id:
-            return self.connection.ops.last_insert_id(cursor, self.tables[0],
-                    self.model._meta.pk.column)
-
-    def insert_values(self, insert_values, raw_values=False):
-        """
-        Set up the insert query from the 'insert_values' dictionary. The
-        dictionary gives the model field names and their target values.
-
-        If 'raw_values' is True, the values in the 'insert_values' dictionary
-        are inserted directly into the query, rather than passed as SQL
-        parameters. This provides a way to insert NULL and DEFAULT keywords
-        into the query, for example.
-        """
-        func = lambda x: self.model._meta.get_field_by_name(x)[0].column
-        # keys() and values() return items in the same order, providing the
-        # dictionary hasn't changed between calls. So these lines work as
-        # intended.
-        for name in insert_values:
-            if name == 'pk':
-                name = self.model._meta.pk.name
-            self.columns.append(func(name))
-        if raw_values:
-            self.values.extend([RawValue(v) for v in insert_values.values()])
-        else:
-            self.values.extend(insert_values.values())
-
-class DateQuery(Query):
-    """
-    A DateQuery is a normal query, except that it specifically selects a single
-    date field. This requires some special handling when converting the results
-    back to Python objects, so we put it in a separate class.
-    """
-    def results_iter(self):
-        """
-        Returns an iterator over the results from executing this query.
-        """
-        resolve_columns = hasattr(self, 'resolve_columns')
-        if resolve_columns:
-            from django.db.models.fields import DateTimeField
-            fields = [DateTimeField()]
-        else:
-            from django.db.backends.util import typecast_timestamp
-            needs_string_cast = self.connection.features.needs_datetime_string_cast
-
-        for rows in self.execute_sql(MULTI):
-            for row in rows:
-                date = row[0]
-                if resolve_columns:
-                    date = self.resolve_columns([date], fields)[0]
-                elif needs_string_cast:
-                    date = typecast_timestamp(str(date))
-                yield date
-
-    def add_date_select(self, column, lookup_type, order='ASC'):
-        """
-        Converts the query into a date extraction query.
-        """
-        alias = self.join((None, self.model._meta.db_table, None, None))
-        select = Date((alias, column), lookup_type,
-                self.connection.ops.date_trunc_sql)
-        self.select = [select]
-        self.distinct = True
-        self.order_by = order == 'ASC' and [1] or [-1]
-
-class CountQuery(Query):
-    """
-    A CountQuery knows how to take a normal query which would select over
-    multiple distinct columns and turn it into SQL that can be used on a
-    variety of backends (it requires a select in the FROM clause).
-    """
-    def get_from_clause(self):
-        result, params = self._query.as_sql()
-        return ['(%s) AS A1' % result], params
-
-    def get_ordering(self):
-        return ()
-
 def get_order_dir(field, default='ASC'):
    """
    Returns the field name and direction for an order specification. For
--- a/django/db/models/sql/subqueries.py
+++ b/django/db/models/sql/subqueries.py
@ -0,0 +1,276 @@
+"""
+Query subclasses which provide extra functionality beyond simple data retrieval.
+"""
+from django.contrib.contenttypes import generic
+from django.core.exceptions import FieldError
+from django.db.models.sql.constants import *
+from django.db.models.sql.datastructures import RawValue, Date
+from django.db.models.sql.query import Query
+from django.db.models.sql.where import AND
+
+__all__ = ['DeleteQuery', 'UpdateQuery', 'InsertQuery', 'DateQuery',
+        'CountQuery']
+
+class DeleteQuery(Query):
+    """
+    Delete queries are done through this class, since they are more constrained
+    than general queries.
+    """
+    def as_sql(self):
+        """
+        Creates the SQL for this query. Returns the SQL string and list of
+        parameters.
+        """
+        assert len(self.tables) == 1, \
+                "Can only delete from one table at a time."
+        result = ['DELETE FROM %s' % self.tables[0]]
+        where, params = self.where.as_sql()
+        result.append('WHERE %s' % where)
+        return ' '.join(result), tuple(params)
+
+    def do_query(self, table, where):
+        self.tables = [table]
+        self.where = where
+        self.execute_sql(None)
+
+    def delete_batch_related(self, pk_list):
+        """
+        Set up and execute delete queries for all the objects related to the
+        primary key values in pk_list. To delete the objects themselves, use
+        the delete_batch() method.
+
+        More than one physical query may be executed if there are a
+        lot of values in pk_list.
+        """
+        cls = self.model
+        for related in cls._meta.get_all_related_many_to_many_objects():
+            if not isinstance(related.field, generic.GenericRelation):
+                for offset in range(0, len(pk_list), GET_ITERATOR_CHUNK_SIZE):
+                    where = self.where_class()
+                    where.add((None, related.field.m2m_reverse_name(),
+                            related.field, 'in',
+                            pk_list[offset : offset+GET_ITERATOR_CHUNK_SIZE]),
+                            AND)
+                    self.do_query(related.field.m2m_db_table(), where)
+
+        for f in cls._meta.many_to_many:
+            w1 = self.where_class()
+            if isinstance(f, generic.GenericRelation):
+                from django.contrib.contenttypes.models import ContentType
+                field = f.rel.to._meta.get_field(f.content_type_field_name)
+                w1.add((None, field.column, field, 'exact',
+                        ContentType.objects.get_for_model(cls).id), AND)
+            for offset in range(0, len(pk_list), GET_ITERATOR_CHUNK_SIZE):
+                where = self.where_class()
+                where.add((None, f.m2m_column_name(), f, 'in',
+                        pk_list[offset : offset + GET_ITERATOR_CHUNK_SIZE]),
+                        AND)
+                if w1:
+                    where.add(w1, AND)
+                self.do_query(f.m2m_db_table(), where)
+
+    def delete_batch(self, pk_list):
+        """
+        Set up and execute delete queries for all the objects in pk_list. This
+        should be called after delete_batch_related(), if necessary.
+
+        More than one physical query may be executed if there are a
+        lot of values in pk_list.
+        """
+        for offset in range(0, len(pk_list), GET_ITERATOR_CHUNK_SIZE):
+            where = self.where_class()
+            field = self.model._meta.pk
+            where.add((None, field.column, field, 'in',
+                    pk_list[offset : offset + GET_ITERATOR_CHUNK_SIZE]), AND)
+            self.do_query(self.model._meta.db_table, where)
+
+class UpdateQuery(Query):
+    """
+    Represents an "update" SQL query.
+    """
+    def __init__(self, *args, **kwargs):
+        super(UpdateQuery, self).__init__(*args, **kwargs)
+        self._setup_query()
+
+    def _setup_query(self):
+        """
+        Run on initialisation and after cloning.
+        """
+        self.values = []
+
+    def as_sql(self):
+        """
+        Creates the SQL for this query. Returns the SQL string and list of
+        parameters.
+        """
+        self.select_related = False
+        self.pre_sql_setup()
+
+        if len(self.tables) != 1:
+            # We can only update one table at a time, so we need to check that
+            # only one alias has a nonzero refcount.
+            table = None
+            for alias_list in self.table_map.values():
+                for alias in alias_list:
+                    if self.alias_map[alias][ALIAS_REFCOUNT]:
+                        if table:
+                            raise FieldError('Updates can only access a single database table at a time.')
+                        table = alias
+        else:
+            table = self.tables[0]
+
+        qn = self.quote_name_unless_alias
+        result = ['UPDATE %s' % qn(table)]
+        result.append('SET')
+        values, update_params = [], []
+        for name, val in self.values:
+            if val is not None:
+                values.append('%s = %%s' % qn(name))
+                update_params.append(val)
+            else:
+                values.append('%s = NULL' % qn(name))
+        result.append(', '.join(values))
+        where, params = self.where.as_sql()
+        if where:
+            result.append('WHERE %s' % where)
+        return ' '.join(result), tuple(update_params + params)
+
+    def clear_related(self, related_field, pk_list):
+        """
+        Set up and execute an update query that clears related entries for the
+        keys in pk_list.
+
+        This is used by the QuerySet.delete_objects() method.
+        """
+        for offset in range(0, len(pk_list), GET_ITERATOR_CHUNK_SIZE):
+            self.where = self.where_class()
+            f = self.model._meta.pk
+            self.where.add((None, f.column, f, 'in',
+                    pk_list[offset : offset + GET_ITERATOR_CHUNK_SIZE]),
+                    AND)
+            self.values = [(related_field.column, None)]
+            self.execute_sql(None)
+
+    def add_update_values(self, values):
+        from django.db.models.base import Model
+        for name, val in values.items():
+            field, model, direct, m2m = self.model._meta.get_field_by_name(name)
+            if not direct or m2m:
+                # Can only update non-relation fields and foreign keys.
+                raise fieldError('Cannot update model field %r (only non-relations and foreign keys permitted).' % field)
+            if field.rel and isinstance(val, Model):
+                val = val.pk
+            self.values.append((field.column, val))
+
+class InsertQuery(Query):
+    def __init__(self, *args, **kwargs):
+        super(InsertQuery, self).__init__(*args, **kwargs)
+        self._setup_query()
+
+    def _setup_query(self):
+        """
+        Run on initialisation and after cloning.
+        """
+        self.columns = []
+        self.values = []
+
+    def as_sql(self):
+        self.select_related = False
+        self.pre_sql_setup()
+        qn = self.quote_name_unless_alias
+        result = ['INSERT INTO %s' % qn(self.tables[0])]
+        result.append('(%s)' % ', '.join([qn(c) for c in self.columns]))
+        result.append('VALUES (')
+        params = []
+        first = True
+        for value in self.values:
+            prefix = not first and ', ' or ''
+            if isinstance(value, RawValue):
+                result.append('%s%s' % (prefix, value.value))
+            else:
+                result.append('%s%%s' % prefix)
+                params.append(value)
+            first = False
+        result.append(')')
+        return ' '.join(result), tuple(params)
+
+    def execute_sql(self, return_id=False):
+        cursor = super(InsertQuery, self).execute_sql(None)
+        if return_id:
+            return self.connection.ops.last_insert_id(cursor, self.tables[0],
+                    self.model._meta.pk.column)
+
+    def insert_values(self, insert_values, raw_values=False):
+        """
+        Set up the insert query from the 'insert_values' dictionary. The
+        dictionary gives the model field names and their target values.
+
+        If 'raw_values' is True, the values in the 'insert_values' dictionary
+        are inserted directly into the query, rather than passed as SQL
+        parameters. This provides a way to insert NULL and DEFAULT keywords
+        into the query, for example.
+        """
+        func = lambda x: self.model._meta.get_field_by_name(x)[0].column
+        # keys() and values() return items in the same order, providing the
+        # dictionary hasn't changed between calls. So these lines work as
+        # intended.
+        for name in insert_values:
+            if name == 'pk':
+                name = self.model._meta.pk.name
+            self.columns.append(func(name))
+        if raw_values:
+            self.values.extend([RawValue(v) for v in insert_values.values()])
+        else:
+            self.values.extend(insert_values.values())
+
+class DateQuery(Query):
+    """
+    A DateQuery is a normal query, except that it specifically selects a single
+    date field. This requires some special handling when converting the results
+    back to Python objects, so we put it in a separate class.
+    """
+    def results_iter(self):
+        """
+        Returns an iterator over the results from executing this query.
+        """
+        resolve_columns = hasattr(self, 'resolve_columns')
+        if resolve_columns:
+            from django.db.models.fields import DateTimeField
+            fields = [DateTimeField()]
+        else:
+            from django.db.backends.util import typecast_timestamp
+            needs_string_cast = self.connection.features.needs_datetime_string_cast
+
+        for rows in self.execute_sql(MULTI):
+            for row in rows:
+                date = row[0]
+                if resolve_columns:
+                    date = self.resolve_columns([date], fields)[0]
+                elif needs_string_cast:
+                    date = typecast_timestamp(str(date))
+                yield date
+
+    def add_date_select(self, column, lookup_type, order='ASC'):
+        """
+        Converts the query into a date extraction query.
+        """
+        alias = self.join((None, self.model._meta.db_table, None, None))
+        select = Date((alias, column), lookup_type,
+                self.connection.ops.date_trunc_sql)
+        self.select = [select]
+        self.distinct = True
+        self.order_by = order == 'ASC' and [1] or [-1]
+
+class CountQuery(Query):
+    """
+    A CountQuery knows how to take a normal query which would select over
+    multiple distinct columns and turn it into SQL that can be used on a
+    variety of backends (it requires a select in the FROM clause).
+    """
+    def get_from_clause(self):
+        result, params = self._query.as_sql()
+        return ['(%s) AS A1' % result], params
+
+    def get_ordering(self):
+        return ()
+