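Refactor SQLCompiler.pre_sql_setup() into smaller helper methods and replace the randomly generated group-key separator with a fixed SEPARATOR class constant.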

WaVEV · WaVEV · commit 7e80c1ae3643 · 2024-07-26T01:56:15.000-03:00
diff --git a/django_mongodb/compiler.py b/django_mongodb/compiler.py
@@ -1,4 +1,4 @@
-from itertools import chain
+import itertools
 
 from django.core.exceptions import EmptyResultSet, FullResultSet
 from django.db import DatabaseError, IntegrityError, NotSupportedError
@@ -19,22 +19,33 @@ class SQLCompiler(compiler.SQLCompiler):
     """Base class for all Mongo compilers."""
 
     query_class = MongoQuery
-    _group_pipeline = None
-    aggregation_idx = 0
-
-    def _get_colum_from_expression(self, expr, alias):
+    SEPARATOR = "10__MESSI__3"
+
+    def _get_group_alias_column(self, col, annotation_group_idx):
+        """Generate alias and replacement for group columns."""
+        replacement = None
+        if not isinstance(col, Col):
+            alias = f"__annotation_group{next(annotation_group_idx)}"
+            col_expr = self._get_column_from_expression(col, alias)
+            replacement = col_expr
+            col = col_expr
+        if self.collection_name == col.alias:
+            return col.target.column, replacement
+        return f"{col.alias}{self.SEPARATOR}{col.target.column}", replacement
+
+    def _get_column_from_expression(self, expr, alias):
+        """Get column target from expression."""
         column_target = expr.output_field.__class__()
         column_target.db_column = alias
         column_target.set_attributes_from_name(alias)
         return Col(self.collection_name, column_target)
 
-    def _prepare_expressions_for_pipeline(self, expression, target):
+    def _prepare_expressions_for_pipeline(self, expression, target, count):
+        """Prepare expressions for the MongoDB aggregation pipeline."""
         replacements = {}
         group = {}
         for sub_expr in self._get_aggregate_expressions(expression):
-            alias = f"__aggregation{self.aggregation_idx}" if sub_expr != expression else target
-            self.aggregation_idx += 1
-
+            alias = f"__aggregation{next(count)}" if sub_expr != expression else target
             column_target = sub_expr.output_field.__class__()
             column_target.db_column = alias
             column_target.set_attributes_from_name(alias)
@@ -57,127 +68,109 @@ def _prepare_expressions_for_pipeline(self, expression, target):
             replacements[sub_expr] = replacing_expr
         return replacements, group
 
-    @staticmethod
-    def _random_separtor():
-        import random
-        import string
-
-        size = 6
-        chars = string.ascii_uppercase + string.digits
-        return "".join(random.choice(chars) for _ in range(size))  # noqa: S311
-
-    def pre_sql_setup(self, with_col_aliases=False):
-        pre_setup = super().pre_sql_setup(with_col_aliases=with_col_aliases)
-        self.annotations = {}
+    def _prepare_annotations_for_group_pipeline(self):
+        """Prepare annotations for the MongoDB aggregation pipeline."""
+        replacements = {}
         group = {}
-        group_expressions = set()
-        all_replacements = {}
-        self.aggregation_idx = 0
+        count = itertools.count(start=1)
         for target, expr in self.query.annotation_select.items():
             if expr.contains_aggregate:
-                replacements, expr_group = self._prepare_expressions_for_pipeline(expr, target)
-                all_replacements.update(replacements)
+                new_replacements, expr_group = self._prepare_expressions_for_pipeline(
+                    expr, target, count
+                )
+                replacements.update(new_replacements)
                 group.update(expr_group)
-            group_expressions |= set(expr.get_group_by_cols())
 
         having_replacements, having_group = self._prepare_expressions_for_pipeline(
-            self.having, None
+            self.having, None, count
         )
-        all_replacements.update(having_replacements)
+        replacements.update(having_replacements)
         group.update(having_group)
+        return group, replacements
 
-        if group or self.query.group_by:
-            order_by = self.get_order_by()
-            for expr, (_, _, is_ref) in order_by:
-                # Skip references to the SELECT clause, as all expressions in
-                # the SELECT clause are already part of the GROUP BY.
-                if not is_ref:
-                    group_expressions |= set(expr.get_group_by_cols())
-
-            for expr, *_ in self.select:
+    def _get_group_id_expressions(self):
+        """Generate group ID expressions for the aggregation pipeline."""
+        group_expressions = set()
+        replacements = {}
+        order_by = self.get_order_by()
+        for expr, (_, _, is_ref) in order_by:
+            if not is_ref:
                 group_expressions |= set(expr.get_group_by_cols())
 
-            having_group_by = self.having.get_group_by_cols() if self.having else ()
-            for expr in having_group_by:
-                group_expressions.add(expr)
-            if isinstance(self.query.group_by, tuple | list):
-                group_expressions |= set(self.query.group_by)
-            elif self.query.group_by is None:
-                group_expressions = set()
+        for expr, *_ in self.select:
+            group_expressions |= set(expr.get_group_by_cols())
 
-            all_strings = "".join(
-                str(col.as_mql(self, self.connection)) for col in group_expressions
-            )
+        having_group_by = self.having.get_group_by_cols() if self.having else ()
+        for expr in having_group_by:
+            group_expressions.add(expr)
+        if isinstance(self.query.group_by, tuple | list):
+            group_expressions |= set(self.query.group_by)
+        elif self.query.group_by is None:
+            group_expressions = set()
 
-            while True:
-                random_string = self._random_separtor()
-                if random_string not in all_strings:
-                    break
-            SEPARATOR = f"__{random_string}__"
-
-            annotation_group_idx = 0
-
-            def _ccc(col):
-                nonlocal annotation_group_idx
-
-                if not isinstance(col, Col):
-                    annotation_group_idx += 1
-                    alias = f"__annotation_group_{annotation_group_idx}"
-                    col_expr = self._get_colum_from_expression(col, alias)
-                    all_replacements[col] = col_expr
-                    col = col_expr
-                if self.collection_name == col.alias:
-                    return col.target.column
-                return f"{col.alias}{SEPARATOR}{col.target.column}"
-
-            ids = (
-                None
-                if not group_expressions
-                else {
-                    _ccc(col): col.as_mql(self, self.connection)
-                    # expression aren't needed in the group by clouse ()
-                    for col in group_expressions
-                }
-            )
-            self.annotations = {
-                target: expr.replace_expressions(all_replacements)
-                for target, expr in self.query.annotation_select.items()
-            }
-            pipeline = []
-            if not ids:
-                group["_id"] = None
-                pipeline.append({"$facet": {"group": [{"$group": group}]}})
-                pipeline.append(
-                    {
-                        "$addFields": {
-                            key: {
-                                "$getField": {
-                                    "input": {"$arrayElemAt": ["$group", 0]},
-                                    "field": key,
-                                }
+        if not group_expressions:
+            ids = None
+        else:
+            annotation_group_idx = itertools.count(start=1)
+            ids = {}
+            for col in group_expressions:
+                alias, replacement = self._get_group_alias_column(col, annotation_group_idx)
+                ids[alias] = col.as_mql(self, self.connection)
+                if replacement is not None:
+                    replacements[col] = replacement
+
+        return ids, replacements
+
+    def _build_group_pipeline(self, ids, group):
+        """Build the aggregation pipeline for grouping."""
+        pipeline = []
+        if not ids:
+            group["_id"] = None
+            pipeline.append({"$facet": {"group": [{"$group": group}]}})
+            pipeline.append(
+                {
+                    "$addFields": {
+                        key: {
+                            "$getField": {
+                                "input": {"$arrayElemAt": ["$group", 0]},
+                                "field": key,
                             }
-                            for key in group
                         }
+                        for key in group
                     }
-                )
-            else:
-                group["_id"] = ids
-                pipeline.append({"$group": group})
-                sets = {}
-                for key in ids:
-                    value = f"$_id.{key}"
-                    if SEPARATOR in key:
-                        subtable, field = key.split(SEPARATOR)
-                        if subtable not in sets:
-                            sets[subtable] = {}
-                        sets[subtable][field] = value
-                    else:
-                        sets[key] = value
-
-                pipeline.append({"$addFields": sets})
-                if "_id" not in sets:
-                    pipeline.append({"$unset": "_id"})
+                }
+            )
+        else:
+            group["_id"] = ids
+            pipeline.append({"$group": group})
+            sets = {}
+            for key in ids:
+                value = f"$_id.{key}"
+                if self.SEPARATOR in key:
+                    subtable, field = key.split(self.SEPARATOR)
+                    if subtable not in sets:
+                        sets[subtable] = {}
+                    sets[subtable][field] = value
+                else:
+                    sets[key] = value
+
+            pipeline.append({"$addFields": sets})
+            if "_id" not in sets:
+                pipeline.append({"$unset": "_id"})
 
+        return pipeline
+
+    def pre_sql_setup(self, with_col_aliases=False):
+        pre_setup = super().pre_sql_setup(with_col_aliases=with_col_aliases)
+        group, all_replacements = self._prepare_annotations_for_group_pipeline()
+
+        # The query.group_by is either None (no GROUP BY at all), True
+        # (group by select fields), or a list of expressions to be added
+        # to the group by.
+        if group or self.query.group_by:
+            ids, replacements = self._get_group_id_expressions()
+            all_replacements.update(replacements)
+            pipeline = self._build_group_pipeline(ids, group)
             if self.having:
                 pipeline.append(
                     {
@@ -188,7 +181,6 @@ def _ccc(col):
                         }
                     }
                 )
-
             self._group_pipeline = pipeline
         else:
             self._group_pipeline = None
@@ -203,7 +195,6 @@ def _ccc(col):
     def execute_sql(
         self, result_type=MULTI, chunked_fetch=False, chunk_size=GET_ITERATOR_CHUNK_SIZE
     ):
-        # QuerySet.count()
         self.pre_sql_setup()
         columns = self.get_columns()
         try:
@@ -256,7 +247,7 @@ def results_iter(
 
         fields = [s[0] for s in self.select[0 : self.col_count]]
         converters = self.get_converters(fields)
-        rows = chain.from_iterable(results)
+        rows = itertools.chain.from_iterable(results)
         if converters:
             rows = self.apply_converters(rows, converters)
         if tuple_expected:
@@ -320,34 +311,6 @@ def check_query(self):
             if any(key.startswith("_prefetch_related_") for key in self.query.extra):
                 raise NotSupportedError("QuerySet.prefetch_related() is not supported on MongoDB.")
             raise NotSupportedError("QuerySet.extra() is not supported on MongoDB.")
-        if any(
-            isinstance(a, Aggregate) and not isinstance(a, Count)
-            for a in self.query.annotations.values()
-        ):
-            # raise NotSupportedError("QuerySet.aggregate() isn't supported on MongoDB.")
-            pass
-
-    def get_count(self, check_exists=False):
-        """
-        Count objects matching the current filters / constraints.
-
-        If `check_exists` is True, only check if any object matches.
-        """
-        kwargs = {}
-        # If this query is sliced, the limits will be set on the subquery.
-        inner_query = getattr(self.query, "inner_query", None)
-        low_mark = inner_query.low_mark if inner_query else 0
-        high_mark = inner_query.high_mark if inner_query else None
-        if low_mark > 0:
-            kwargs["skip"] = low_mark
-        if check_exists:
-            kwargs["limit"] = 1
-        elif high_mark is not None:
-            kwargs["limit"] = high_mark - low_mark
-        try:
-            return self.build_query().count(**kwargs)
-        except EmptyResultSet:
-            return 0
 
     def build_query(self, columns=None):
         """Check if the query is supported and prepare a MongoQuery."""
@@ -540,6 +503,7 @@ def insert(self, docs, returning_fields=None):
 
 class SQLDeleteCompiler(compiler.SQLDeleteCompiler, SQLCompiler):
     def execute_sql(self, result_type=MULTI):
+        self.pre_sql_setup()
         cursor = Cursor()
         cursor.rowcount = self.build_query().delete()
         return cursor
diff --git a/django_mongodb/query.py b/django_mongodb/query.py
@@ -89,6 +89,23 @@ def delete(self):
         options = self.connection.operation_flags.get("delete", {})
         return self.collection.delete_many(self.mongo_query, **options).deleted_count
 
+    @wrap_database_errors
+    def get_cursor(self, count=False, limit=None, skip=None):
+        """
+        Return a pymongo CommandCursor that can be iterated on to give the
+        results of the query.
+
+        If `count` is True, return a single document with the number of
+        documents that match the query.
+
+        Use `limit` or `skip` to override those options of the query.
+        """
+        if self.query.low_mark == self.query.high_mark:
+            return []
+
+        pipeline = self.get_pipeline()
+        return self.collection.aggregate(pipeline)
+
     def get_pipeline(self, count=False, limit=None, skip=None):
         pipeline = [] if self.subquery is None else self.subquery.get_pipeline()
         if self.lookup_pipeline:
@@ -114,23 +131,6 @@ def get_pipeline(self, count=False, limit=None, skip=None):
 
         return pipeline
 
-    @wrap_database_errors
-    def get_cursor(self, count=False, limit=None, skip=None):
-        """
-        Return a pymongo CommandCursor that can be iterated on to give the
-        results of the query.
-
-        If `count` is True, return a single document with the number of
-        documents that match the query.
-
-        Use `limit` or `skip` to override those options of the query.
-        """
-        if self.query.low_mark == self.query.high_mark:
-            return []
-
-        pipeline = self.get_pipeline()
-        return self.collection.aggregate(pipeline)
-
 
 def join(self, compiler, connection):
     lookup_pipeline = []