From d074c7530b812a7b78c9a201c8a70f281ed3a36e Mon Sep 17 00:00:00 2001 From: Simon Charette Date: Sat, 13 Jan 2024 14:21:36 -0500 Subject: [PATCH 1/4] Refs #35102 -- Optimized Expression.identity used for equality and hashing. inspect.signature() is quite slow and produces the same object for each instance of the same class as they share their __init__ method which makes it a prime candidate for caching. Thanks Anthony Shaw for the report. --- django/db/models/expressions.py | 13 +++++++++---- 1 file changed, 9 insertions(+), 4 deletions(-) diff --git a/django/db/models/expressions.py b/django/db/models/expressions.py index c20de5995a34..9ee2d65c8af6 100644 --- a/django/db/models/expressions.py +++ b/django/db/models/expressions.py @@ -14,7 +14,7 @@ from django.db.models.constants import LOOKUP_SEP from django.db.models.query_utils import Q from django.utils.deconstruct import deconstructible -from django.utils.functional import cached_property +from django.utils.functional import cached_property, classproperty from django.utils.hashable import make_hashable @@ -485,13 +485,18 @@ def select_format(self, compiler, sql, params): class Expression(BaseExpression, Combinable): """An expression that can be combined with other expressions.""" + @classproperty + @functools.lru_cache(maxsize=128) + def _constructor_signature(cls): + return inspect.signature(cls.__init__) + @cached_property def identity(self): - constructor_signature = inspect.signature(self.__init__) args, kwargs = self._constructor_args - signature = constructor_signature.bind_partial(*args, **kwargs) + signature = self._constructor_signature.bind_partial(self, *args, **kwargs) signature.apply_defaults() - arguments = signature.arguments.items() + arguments = iter(signature.arguments.items()) + next(arguments) identity = [self.__class__] for arg, value in arguments: if isinstance(value, fields.Field): From f3d10546a850df4fe3796f972d5b7e16adf52f54 Mon Sep 17 00:00:00 2001 From: Mariusz Felisiak Date: Sat, 13 Jan 2024 14:33:20 -0500 Subject: [PATCH 2/4] Refs #35102 -- Optimized replace_expressions()/relabelling aliases by adding early return. This avoids costly hashing. Thanks Anthony Shaw for the report. Co-Authored-By: Simon Charette --- django/db/models/expressions.py | 5 ++++- django/db/models/sql/query.py | 2 ++ django/db/models/sql/where.py | 4 ++++ 3 files changed, 10 insertions(+), 1 deletion(-) diff --git a/django/db/models/expressions.py b/django/db/models/expressions.py index 9ee2d65c8af6..f25ad1af12cc 100644 --- a/django/db/models/expressions.py +++ b/django/db/models/expressions.py @@ -402,10 +402,13 @@ def relabeled_clone(self, change_map): return clone def replace_expressions(self, replacements): + if not replacements: + return self if replacement := replacements.get(self): return replacement + if not (source_expressions := self.get_source_expressions()): + return self clone = self.copy() - source_expressions = clone.get_source_expressions() clone.set_source_expressions( [ expr.replace_expressions(replacements) if expr else None diff --git a/django/db/models/sql/query.py b/django/db/models/sql/query.py index a79d66eb21e9..ce4fafb1e2bc 100644 --- a/django/db/models/sql/query.py +++ b/django/db/models/sql/query.py @@ -972,6 +972,8 @@ def change_aliases(self, change_map): relabelling any references to them in select columns and the where clause. """ + if not change_map: + return self # If keys and values of change_map were to intersect, an alias might be # updated twice (e.g. T4 -> T5, T5 -> T6, so also T4 -> T6) depending # on their order in change_map. diff --git a/django/db/models/sql/where.py b/django/db/models/sql/where.py index 2f23a2932ce5..8423fcb52892 100644 --- a/django/db/models/sql/where.py +++ b/django/db/models/sql/where.py @@ -204,6 +204,8 @@ def relabel_aliases(self, change_map): Relabel the alias values of any children. 'change_map' is a dictionary mapping old (current) alias values to the new values. """ + if not change_map: + return self for pos, child in enumerate(self.children): if hasattr(child, "relabel_aliases"): # For example another WhereNode @@ -225,6 +227,8 @@ def relabeled_clone(self, change_map): return clone def replace_expressions(self, replacements): + if not replacements: + return self if replacement := replacements.get(self): return replacement clone = self.create(connector=self.connector, negated=self.negated) From f92641a636a8cb75fc9851396cef4345510a4b52 Mon Sep 17 00:00:00 2001 From: Aivars Kalvans Date: Sun, 10 Dec 2023 21:43:34 +0200 Subject: [PATCH 3/4] Fixed #28344 -- Allowed customizing queryset in Model.refresh_from_db()/arefresh_from_db(). The from_queryset parameter can be used to: - use a custom Manager - lock the row until the end of transaction - select additional related objects --- django/db/models/base.py | 28 ++++++++----- docs/ref/models/instances.txt | 25 ++++++++++- docs/releases/5.1.txt | 5 +++ tests/async/test_async_model_methods.py | 11 +++++ tests/basic/tests.py | 56 ++++++++++++++++++++++++- 5 files changed, 111 insertions(+), 14 deletions(-) diff --git a/django/db/models/base.py b/django/db/models/base.py index 46ac762ccd46..b15bdd032ab0 100644 --- a/django/db/models/base.py +++ b/django/db/models/base.py @@ -673,7 +673,7 @@ def get_deferred_fields(self): if f.attname not in self.__dict__ } - def refresh_from_db(self, using=None, fields=None): + def refresh_from_db(self, using=None, fields=None, from_queryset=None): """ Reload field values from the database. @@ -705,10 +705,13 @@ def refresh_from_db(self, using=None, fields=None): "are not allowed in fields." % LOOKUP_SEP ) - hints = {"instance": self} - db_instance_qs = self.__class__._base_manager.db_manager( - using, hints=hints - ).filter(pk=self.pk) + if from_queryset is None: + hints = {"instance": self} + from_queryset = self.__class__._base_manager.db_manager(using, hints=hints) + elif using is not None: + from_queryset = from_queryset.using(using) + + db_instance_qs = from_queryset.filter(pk=self.pk) # Use provided fields, if not set then reload all non-deferred fields. deferred_fields = self.get_deferred_fields() @@ -729,9 +732,12 @@ def refresh_from_db(self, using=None, fields=None): # This field wasn't refreshed - skip ahead. continue setattr(self, field.attname, getattr(db_instance, field.attname)) - # Clear cached foreign keys. - if field.is_relation and field.is_cached(self): - field.delete_cached_value(self) + # Clear or copy cached foreign keys. + if field.is_relation: + if field.is_cached(db_instance): + field.set_cached_value(self, field.get_cached_value(db_instance)) + elif field.is_cached(self): + field.delete_cached_value(self) # Clear cached relations. for field in self._meta.related_objects: @@ -745,8 +751,10 @@ def refresh_from_db(self, using=None, fields=None): self._state.db = db_instance._state.db - async def arefresh_from_db(self, using=None, fields=None): - return await sync_to_async(self.refresh_from_db)(using=using, fields=fields) + async def arefresh_from_db(self, using=None, fields=None, from_queryset=None): + return await sync_to_async(self.refresh_from_db)( + using=using, fields=fields, from_queryset=from_queryset + ) def serializable_value(self, field_name): """ diff --git a/docs/ref/models/instances.txt b/docs/ref/models/instances.txt index 45af7f244fc1..6d1a7e5db458 100644 --- a/docs/ref/models/instances.txt +++ b/docs/ref/models/instances.txt @@ -142,8 +142,8 @@ value from the database: >>> del obj.field >>> obj.field # Loads the field from the database -.. method:: Model.refresh_from_db(using=None, fields=None) -.. method:: Model.arefresh_from_db(using=None, fields=None) +.. method:: Model.refresh_from_db(using=None, fields=None, from_queryset=None) +.. method:: Model.arefresh_from_db(using=None, fields=None, from_queryset=None) *Asynchronous version*: ``arefresh_from_db()`` @@ -197,6 +197,27 @@ all of the instance's fields when a deferred field is reloaded:: fields = fields.union(deferred_fields) super().refresh_from_db(using, fields, **kwargs) +The ``from_queryset`` argument allows using a different queryset than the one +created from :attr:`~django.db.models.Model._base_manager`. It gives you more +control over how the model is reloaded. For example, when your model uses soft +deletion you can make ``refresh_from_db()`` to take this into account:: + + obj.refresh_from_db(from_queryset=MyModel.active_objects.all()) + +You can cache related objects that otherwise would be cleared from the reloaded +instance:: + + obj.refresh_from_db(from_queryset=MyModel.objects.select_related("related_field")) + +You can lock the row until the end of transaction before reloading a model's +values:: + + obj.refresh_from_db(from_queryset=MyModel.objects.select_for_update()) + +.. versionchanged:: 5.1 + + The ``from_queryset`` argument was added. + .. method:: Model.get_deferred_fields() A helper method that returns a set containing the attribute names of all those diff --git a/docs/releases/5.1.txt b/docs/releases/5.1.txt index 2f672e3dce0c..30317eaa1916 100644 --- a/docs/releases/5.1.txt +++ b/docs/releases/5.1.txt @@ -208,6 +208,11 @@ Models :class:`~django.contrib.postgres.fields.ArrayField` can now be :ref:`sliced `. +* The new ``from_queryset`` argument of :meth:`.Model.refresh_from_db` and + :meth:`.Model.arefresh_from_db` allows customizing the queryset used to + reload a model's value. This can be used to lock the row before reloading or + to select related objects. + Requests and Responses ~~~~~~~~~~~~~~~~~~~~~~ diff --git a/tests/async/test_async_model_methods.py b/tests/async/test_async_model_methods.py index 94e0370e3560..d988d7befcb4 100644 --- a/tests/async/test_async_model_methods.py +++ b/tests/async/test_async_model_methods.py @@ -23,3 +23,14 @@ async def test_arefresh_from_db(self): await SimpleModel.objects.filter(pk=self.s1.pk).aupdate(field=20) await self.s1.arefresh_from_db() self.assertEqual(self.s1.field, 20) + + async def test_arefresh_from_db_from_queryset(self): + await SimpleModel.objects.filter(pk=self.s1.pk).aupdate(field=20) + with self.assertRaises(SimpleModel.DoesNotExist): + await self.s1.arefresh_from_db( + from_queryset=SimpleModel.objects.filter(field=0) + ) + await self.s1.arefresh_from_db( + from_queryset=SimpleModel.objects.filter(field__gt=0) + ) + self.assertEqual(self.s1.field, 20) diff --git a/tests/basic/tests.py b/tests/basic/tests.py index 990549edfc4b..8a304e9ace04 100644 --- a/tests/basic/tests.py +++ b/tests/basic/tests.py @@ -4,7 +4,14 @@ from unittest import mock from django.core.exceptions import MultipleObjectsReturned, ObjectDoesNotExist -from django.db import DEFAULT_DB_ALIAS, DatabaseError, connections, models +from django.db import ( + DEFAULT_DB_ALIAS, + DatabaseError, + connection, + connections, + models, + transaction, +) from django.db.models.manager import BaseManager from django.db.models.query import MAX_GET_RESULTS, EmptyQuerySet from django.test import ( @@ -13,7 +20,8 @@ TransactionTestCase, skipUnlessDBFeature, ) -from django.test.utils import ignore_warnings +from django.test.utils import CaptureQueriesContext, ignore_warnings +from django.utils.connection import ConnectionDoesNotExist from django.utils.deprecation import RemovedInDjango60Warning from django.utils.translation import gettext_lazy @@ -1003,3 +1011,47 @@ def test_prefetched_cache_cleared(self): # Cache was cleared and new results are available. self.assertCountEqual(a2_prefetched.selfref_set.all(), [s]) self.assertCountEqual(a2_prefetched.cited.all(), [s]) + + @skipUnlessDBFeature("has_select_for_update") + def test_refresh_for_update(self): + a = Article.objects.create(pub_date=datetime.now()) + for_update_sql = connection.ops.for_update_sql() + + with transaction.atomic(), CaptureQueriesContext(connection) as ctx: + a.refresh_from_db(from_queryset=Article.objects.select_for_update()) + self.assertTrue( + any(for_update_sql in query["sql"] for query in ctx.captured_queries) + ) + + def test_refresh_with_related(self): + a = Article.objects.create(pub_date=datetime.now()) + fa = FeaturedArticle.objects.create(article=a) + + from_queryset = FeaturedArticle.objects.select_related("article") + with self.assertNumQueries(1): + fa.refresh_from_db(from_queryset=from_queryset) + self.assertEqual(fa.article.pub_date, a.pub_date) + with self.assertNumQueries(2): + fa.refresh_from_db() + self.assertEqual(fa.article.pub_date, a.pub_date) + + def test_refresh_overwrites_queryset_using(self): + a = Article.objects.create(pub_date=datetime.now()) + + from_queryset = Article.objects.using("nonexistent") + with self.assertRaises(ConnectionDoesNotExist): + a.refresh_from_db(from_queryset=from_queryset) + a.refresh_from_db(using="default", from_queryset=from_queryset) + + def test_refresh_overwrites_queryset_fields(self): + a = Article.objects.create(pub_date=datetime.now()) + headline = "headline" + Article.objects.filter(pk=a.pk).update(headline=headline) + + from_queryset = Article.objects.only("pub_date") + with self.assertNumQueries(1): + a.refresh_from_db(from_queryset=from_queryset) + self.assertNotEqual(a.headline, headline) + with self.assertNumQueries(1): + a.refresh_from_db(fields=["headline"], from_queryset=from_queryset) + self.assertEqual(a.headline, headline) From 4fec1d2ce37241fb8fa001971c441d360ed2a196 Mon Sep 17 00:00:00 2001 From: jordanbae Date: Tue, 9 Jan 2024 23:04:31 +0900 Subject: [PATCH 4/4] Fixed #34949 -- Clarified when UniqueConstraints with include/nulls_distinct are not created. --- docs/ref/models/constraints.txt | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/docs/ref/models/constraints.txt b/docs/ref/models/constraints.txt index efe63a8ac183..cc308cedf225 100644 --- a/docs/ref/models/constraints.txt +++ b/docs/ref/models/constraints.txt @@ -229,7 +229,8 @@ For example:: will allow filtering on ``room`` and ``date``, also selecting ``full_name``, while fetching data only from the index. -``include`` is supported only on PostgreSQL. +Unique constraints with non-key columns are ignored for databases besides +PostgreSQL. Non-key columns have the same database restrictions as :attr:`Index.include`. @@ -272,7 +273,8 @@ For example:: creates a unique constraint that only allows one row to store a ``NULL`` value in the ``ordering`` column. -``nulls_distinct`` is ignored for databases besides PostgreSQL 15+. +Unique constraints with ``nulls_distinct`` are ignored for databases besides +PostgreSQL 15+. ``violation_error_code`` ------------------------