Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions django_mongodb_backend/aggregates.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@
Variance,
)
from django.db.models.expressions import Case, Value, When
from django.db.models.functions.comparison import Coalesce
from django.db.models.lookups import IsNull
from django.db.models.sql.where import WhereNode

Expand Down Expand Up @@ -69,6 +70,8 @@ def count(self, compiler, connection, resolve_inner_expression=False):
if resolve_inner_expression:
return lhs_mql
return {"$sum": lhs_mql}
# Normalize empty documents when the extra placeholder document
# (inserted via $unionWith during query generation) yields an empty result.
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

"introduced upstream" could be clarified. When I think "upstream" I think of Django itself. I guess you mean "upstream" in the query generation process. Perhaps it's something like "introduced by aggregation wrapping or a subquery wrapping pipeline".

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Yes, in the query generation. Ok, will change.

Copy link
Collaborator Author

@WaVEV WaVEV Dec 12, 2025

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Something like:

# Normalize empty documents when the extra placeholder document
# yields an empty result.

The extra placeholder is the document inserted with unionWith when the discussed flag is on.

agg_expression = Coalesce(agg_expression, [])
# If distinct=True or resolve_inner_expression=False, sum the size of the
# set.
return {"$size": agg_expression.as_mql(compiler, connection, as_expr=True)}
Expand Down
23 changes: 8 additions & 15 deletions django_mongodb_backend/compiler.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,10 @@ def __init__(self, *args, **kwargs):
self.subqueries = []
# Atlas search stage.
self.search_pipeline = []
# Whether the query aggregates without any GROUP BY fields (e.g.
# SELECT AVG(age) FROM people) and therefore needs wrapping so a
# single result document is produced even for an empty collection.
self.wrap_for_global_aggregation = False
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Need a comment to explain what "global aggregation" is.

Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I'm still not sure what "global" is meant to signify. Would it have a different meaning to say "wrap_for_aggregation". The comment should explain what it means to wrap a query.

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

🤔 Yes — maybe I think too much in SQL terms. The idea of "global" applies when a query has the following shape:

SELECT avg(age)
FROM people;

So it is a "global" aggregation because there isn't any GROUP BY expression. What should we call those kinds of queries?
wrap_for_aggregation isn't for every kind of aggregation; it only applies to the empty group, i.e. _id = None in the group. Also, previously it was wrapped — wrapped as a lookup inside a $collstats — but now it is no longer wrapped. I think QE will preserve the wrap. I am thinking of needs_wrap_aggregation?

# The MQL equivalent to a SQL HAVING clause.
self.having_match_mql = None

def _get_group_alias_column(self, expr, annotation_group_idx):
"""Generate a dummy field for use in the ids fields in $group."""
Expand Down Expand Up @@ -234,21 +238,10 @@ def _build_aggregation_pipeline(self, ids, group):
"""Build the aggregation pipeline for grouping."""
pipeline = []
if not ids:
group["_id"] = None
pipeline.append({"$facet": {"group": [{"$group": group}]}})
pipeline.append(
{
"$addFields": {
key: {
"$getField": {
"input": {"$arrayElemAt": ["$group", 0]},
"field": key,
}
}
for key in group
}
}
)
pipeline.append({"$group": {"_id": None, **group}})
# Apply a global aggregation if there are no ids and no having
# clause.
self.wrap_for_global_aggregation = not bool(self.having)
else:
group["_id"] = ids
pipeline.append({"$group": group})
Expand Down
42 changes: 14 additions & 28 deletions django_mongodb_backend/fields/array.py
Original file line number Diff line number Diff line change
Expand Up @@ -310,37 +310,23 @@ class ArrayOverlap(ArrayRHSMixin, FieldGetDbPrepValueMixin, Lookup):

def get_subquery_wrapping_pipeline(self, compiler, connection, field_name, expr):
return [
{"$project": {"subquery_results": expr.as_mql(compiler, connection, as_expr=True)}},
{"$unwind": "$subquery_results"},
{
"$facet": {
"group": [
{"$project": {"tmp_name": expr.as_mql(compiler, connection, as_expr=True)}},
{
"$unwind": "$tmp_name",
},
{
"$group": {
"_id": None,
"tmp_name": {"$addToSet": "$tmp_name"},
}
},
]
}
},
{
"$project": {
field_name: {
"$ifNull": [
{
"$getField": {
"input": {"$arrayElemAt": ["$group", 0]},
"field": "tmp_name",
}
},
[],
]
}
"$group": {
"_id": None,
"subquery_results": {"$addToSet": "$subquery_results"},
}
},
# Workaround for https://jira.mongodb.org/browse/SERVER-114196:
# $$NOW becomes unavailable after $unionWith, so it must be stored
# beforehand to ensure it remains accessible later in the pipeline.
{"$addFields": {"__now": "$$NOW"}},
# Add an extra empty document to handle default values on empty
# results.
{"$unionWith": {"pipeline": [{"$documents": [{"subquery_results": []}]}]}},
{"$limit": 1},
{"$project": {field_name: "$subquery_results"}},
]

def as_mql_expr(self, compiler, connection):
Expand Down
54 changes: 19 additions & 35 deletions django_mongodb_backend/fields/embedded_model_array.py
Original file line number Diff line number Diff line change
Expand Up @@ -150,44 +150,28 @@ def get_subquery_wrapping_pipeline(self, compiler, connection, field_name, expr)
# structure of EmbeddedModelArrayField on the RHS behaves similar to
# ArrayField.
return [
{"$project": {"subquery_results": expr.as_mql(compiler, connection, as_expr=True)}},
# Use an $unwind followed by a $group to concatenate all the values
# from the RHS subquery.
{"$unwind": "$subquery_results"},
# The $group stage collects values into an array using $addToSet.
# The use of {_id: null} results in a single grouped array, but
# because arrays from multiple documents are aggregated, the result
# is a list of lists.
{
"$facet": {
"gathered_data": [
{"$project": {"tmp_name": expr.as_mql(compiler, connection, as_expr=True)}},
# To concatenate all the values from the RHS subquery,
# use an $unwind followed by a $group.
{
"$unwind": "$tmp_name",
},
# The $group stage collects values into an array using
# $addToSet. The use of {_id: null} results in a
# single grouped array. However, because arrays from
# multiple documents are aggregated, the result is a
# list of lists.
{
"$group": {
"_id": None,
"tmp_name": {"$addToSet": "$tmp_name"},
}
},
]
}
},
{
"$project": {
field_name: {
"$ifNull": [
{
"$getField": {
"input": {"$arrayElemAt": ["$gathered_data", 0]},
"field": "tmp_name",
}
},
[],
]
}
"$group": {
"_id": None,
"subquery_results": {"$addToSet": "$subquery_results"},
}
},
# Workaround for https://jira.mongodb.org/browse/SERVER-114196:
# $$NOW becomes unavailable after $unionWith, so it must be stored
# beforehand to ensure it remains accessible later in the pipeline.
{"$addFields": {"__now": "$$NOW"}},
# Add a dummy document in case of an empty result.
{"$unionWith": {"pipeline": [{"$documents": [{"subquery_results": []}]}]}},
{"$limit": 1},
{"$project": {field_name: "$subquery_results"}},
]


Expand Down
39 changes: 13 additions & 26 deletions django_mongodb_backend/lookups.py
Original file line number Diff line number Diff line change
Expand Up @@ -56,34 +56,21 @@ def inner(self, compiler, connection):
def get_subquery_wrapping_pipeline(self, compiler, connection, field_name, expr): # noqa: ARG001
return [
{
"$facet": {
"group": [
{
"$group": {
"_id": None,
"tmp_name": {
"$addToSet": expr.as_mql(compiler, connection, as_expr=True)
},
}
}
]
}
},
{
"$project": {
field_name: {
"$ifNull": [
{
"$getField": {
"input": {"$arrayElemAt": ["$group", 0]},
"field": "tmp_name",
}
},
[],
]
}
"$group": {
"_id": None,
# Use a temporary name in order to support field_name="_id".
"subquery_results": {"$addToSet": expr.as_mql(compiler, connection, as_expr=True)},
}
},
# Workaround for https://jira.mongodb.org/browse/SERVER-114196:
# $$NOW becomes unavailable after $unionWith, so it must be stored
# beforehand to ensure it remains accessible later in the pipeline.
{"$addFields": {"__now": "$$NOW"}},
# Add an extra empty document to handle default values on empty
# results.
{"$unionWith": {"pipeline": [{"$documents": [{"subquery_results": []}]}]}},
{"$limit": 1},
{"$project": {field_name: "$subquery_results"}},
]


Expand Down
18 changes: 18 additions & 0 deletions django_mongodb_backend/query.py
Original file line number Diff line number Diff line change
Expand Up @@ -56,6 +56,7 @@ def __init__(self, compiler):
# $lookup stage that encapsulates the pipeline for performing a nested
# subquery.
self.subquery_lookup = None
self.wrap_for_global_aggregation = compiler.wrap_for_global_aggregation

def __repr__(self):
return f"<MongoQuery: {self.match_mql!r} ORDER {self.ordering!r}>"
Expand Down Expand Up @@ -91,6 +92,23 @@ def get_pipeline(self):
pipeline.append({"$match": self.match_mql})
if self.aggregation_pipeline:
pipeline.extend(self.aggregation_pipeline)
if self.wrap_for_global_aggregation:
pipeline.extend(
[
# Workaround for https://jira.mongodb.org/browse/SERVER-114196:
# $$NOW becomes unavailable after $unionWith, so it must be
# stored beforehand to ensure it remains accessible later
# in the pipeline.
{"$addFields": {"__now": "$$NOW"}},
# Add an empty extra document to handle default values on
# empty results.
{"$unionWith": {"pipeline": [{"$documents": [{}]}]}},
# Limiting to one document ensures the original result
# takes precedence when present, otherwise the injected
# empty document is used.
{"$limit": 1},
]
)
if self.project_fields:
pipeline.append({"$project": self.project_fields})
if self.combinator_pipeline:
Expand Down
5 changes: 5 additions & 0 deletions docs/releases/6.0.x.rst
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,11 @@ Bug fixes

- ...

Performance improvements
------------------------

- Removed usage of ``$facet`` from aggregate queries.

6.0.0
=====

Expand Down
25 changes: 6 additions & 19 deletions tests/lookup_/tests.py
Original file line number Diff line number Diff line change
Expand Up @@ -137,28 +137,15 @@ def test_subquery_filter_constant(self):
"let": {},
"pipeline": [
{"$match": {"num": {"$gt": 2}}},
{"$group": {"_id": None, "subquery_results": {"$addToSet": "$num"}}},
{"$addFields": {"__now": "$$NOW"}},
{
"$facet": {
"group": [
{"$group": {"_id": None, "tmp_name": {"$addToSet": "$num"}}}
]
}
},
{
"$project": {
"num": {
"$ifNull": [
{
"$getField": {
"input": {"$arrayElemAt": ["$group", 0]},
"field": "tmp_name",
}
},
[],
]
}
"$unionWith": {
"pipeline": [{"$documents": [{"subquery_results": []}]}]
}
},
{"$limit": 1},
{"$project": {"num": "$subquery_results"}},
],
}
},
Expand Down
15 changes: 15 additions & 0 deletions tests/model_fields_/test_arrayfield.py
Original file line number Diff line number Diff line change
Expand Up @@ -634,6 +634,21 @@ def test_overlap_values(self):
self.objs[:3],
)

def test_overlap_empty_values(self):
qs = NullableIntegerArrayModel.objects.filter(order__lt=-30)
self.assertCountEqual(
NullableIntegerArrayModel.objects.filter(
field__overlap=qs.values_list("field"),
),
[],
)
self.assertCountEqual(
NullableIntegerArrayModel.objects.filter(
field__overlap=qs.values("field"),
),
[],
)

def test_index(self):
self.assertSequenceEqual(
NullableIntegerArrayModel.objects.filter(field__0=2), self.objs[1:3]
Expand Down
5 changes: 5 additions & 0 deletions tests/model_fields_/test_embedded_model_array.py
Original file line number Diff line number Diff line change
Expand Up @@ -520,6 +520,11 @@ def test_subquery_in_lookup(self):
result = Exhibit.objects.filter(sections__number__in=subquery)
self.assertCountEqual(result, [self.wonders, self.new_discoveries, self.egypt])

def test_subquery_empty_in_lookup(self):
subquery = Audit.objects.filter(section_number=10).values_list("section_number", flat=True)
result = Exhibit.objects.filter(sections__number__in=subquery)
self.assertCountEqual(result, [])

def test_array_as_rhs(self):
result = Exhibit.objects.filter(main_section__number__in=models.F("sections__number"))
self.assertCountEqual(result, [self.new_discoveries])
Expand Down