-
Notifications
You must be signed in to change notification settings - Fork 66
/
Copy pathfields.py
550 lines (446 loc) · 22.3 KB
/
fields.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
from __future__ import unicode_literals
from django import VERSION as DJANGO_VERSION
from django.core import checks
from django.db import IntegrityError, connections, router
from django.db.models import CASCADE
from django.db.models.fields.related import ForeignKey, ManyToManyField
from django.utils.functional import cached_property
from django.db.models.fields.related import ReverseManyToOneDescriptor, ManyToManyDescriptor
from modelcluster.utils import sort_by_fields
from modelcluster.queryset import FakeQuerySet
def create_deferring_foreign_related_manager(related, original_manager_cls):
"""
Create a DeferringRelatedManager class that wraps an ordinary RelatedManager
with 'deferring' behaviour: any updates to the object set (via e.g. add() or clear())
are written to a holding area rather than committed to the database immediately.
Writing to the database is deferred until the model is saved.
"""
relation_name = related.get_accessor_name()
rel_field = related.field
rel_model = related.related_model
superclass = rel_model._default_manager.__class__
class DeferringRelatedManager(superclass):
def __init__(self, instance):
super().__init__()
self.model = rel_model
self.instance = instance
@property
def is_deferring(self):
return relation_name in getattr(
self.instance, '_cluster_related_objects', {}
)
def _get_cluster_related_objects(self):
# Helper to retrieve the instance's _cluster_related_objects dict,
# creating it if it does not already exist
try:
return self.instance._cluster_related_objects
except AttributeError:
cluster_related_objects = {}
self.instance._cluster_related_objects = cluster_related_objects
return cluster_related_objects
def get_live_query_set(self):
# deprecated; renamed to get_live_queryset to match the move from
# get_query_set to get_queryset in Django 1.6
return self.get_live_queryset()
def get_live_queryset(self):
"""
return the original manager's queryset, which reflects the live database
"""
return original_manager_cls(self.instance).get_queryset()
def get_queryset(self):
"""
return the current object set with any updates applied,
wrapped up in a FakeQuerySet if it doesn't match the database state
"""
try:
results = self.instance._cluster_related_objects[relation_name]
except (AttributeError, KeyError):
if self.instance.pk is None:
# use an empty fake queryset if the instance is unsaved
results = []
else:
return self.get_live_queryset()
return FakeQuerySet(related.related_model, results)
def _apply_rel_filters(self, queryset):
# Implemented as empty for compatibility sake
# But there is probably a better implementation of this function
#
# NOTE: _apply_rel_filters() must return a copy of the queryset
# to work correctly with prefetch
return queryset._next_is_sticky().all()
def get_prefetch_querysets(self, instances, querysets=None):
if querysets and len(querysets) != 1:
raise ValueError("get_prefetch_querysets() must be passed exactly one queryset")
queryset = querysets[0] if querysets else None
if queryset is None:
db = self._db or router.db_for_read(self.model, instance=instances[0])
queryset = super().get_queryset().using(db)
rel_obj_attr = rel_field.get_local_related_value
instance_attr = rel_field.get_foreign_related_value
instances_dict = dict((instance_attr(inst), inst) for inst in instances)
query = {'%s__in' % rel_field.name: instances}
qs = queryset.filter(**query)
# Since we just bypassed this class' get_queryset(), we must manage
# the reverse relation manually.
for rel_obj in qs:
instance = instances_dict[rel_obj_attr(rel_obj)]
setattr(rel_obj, rel_field.name, instance)
cache_name = rel_field.related_query_name()
return qs, rel_obj_attr, instance_attr, False, cache_name, False
# Remove once we only support Django 5.0+
if not DJANGO_VERSION >= (5, 0):
def get_prefetch_queryset(self, instances, queryset=None):
if queryset is None:
return self.get_prefetch_querysets(instances)
return self.get_prefetch_querysets(instances, querysets=[queryset])
def get_object_list(self):
"""
return the mutable list that forms the current in-memory state of
this relation. If there is no such list (i.e. the manager is returning
querysets from the live database instead), one is created, populating it
with the live database state
"""
cluster_related_objects = self._get_cluster_related_objects()
try:
object_list = cluster_related_objects[relation_name]
except KeyError:
if self.instance.pk is None:
object_list = []
else:
object_list = list(self.get_live_queryset())
cluster_related_objects[relation_name] = object_list
return object_list
def add(self, *new_items):
"""
Add the passed items to the stored object set, but do not commit them
to the database
"""
items = self.get_object_list()
for target in new_items:
item_matched = False
for i, item in enumerate(items):
if item == target:
# Replace the matched item with the new one. This ensures that any
# modifications to that item's fields take effect within the recordset -
# i.e. we can perform a virtual UPDATE to an object in the list
# by calling add(updated_object). Which is semantically a bit dubious,
# but it does the job...
items[i] = target
item_matched = True
break
if not item_matched:
items.append(target)
# update the foreign key on the added item to point back to the parent instance
setattr(target, related.field.name, self.instance)
# Sort list
if rel_model._meta.ordering and len(items) > 1:
sort_by_fields(items, rel_model._meta.ordering)
def remove(self, *items_to_remove):
"""
Remove the passed items from the stored object set, but do not commit the change
to the database
"""
items = self.get_object_list()
# filter items list in place: see http://stackoverflow.com/a/1208792/1853523
items[:] = [item for item in items if item not in items_to_remove]
def create(self, **kwargs):
items = self.get_object_list()
new_item = related.related_model(**kwargs)
items.append(new_item)
return new_item
def clear(self):
"""
Clear the stored object set, without affecting the database
"""
self.set([])
def set(self, objs, bulk=True, clear=False):
# cast objs to a list so that:
# 1) we can call len() on it (which we can't do on, say, a queryset)
# 2) if we need to sort it, we can do so without mutating the original
objs = list(objs)
cluster_related_objects = self._get_cluster_related_objects()
for obj in objs:
# update the foreign key on the added item to point back to the parent instance
setattr(obj, related.field.name, self.instance)
# Clone and sort the 'objs' list, if necessary
if rel_model._meta.ordering and len(objs) > 1:
sort_by_fields(objs, rel_model._meta.ordering)
cluster_related_objects[relation_name] = objs
def commit(self):
"""
Apply any changes made to the stored object set to the database.
Any objects removed from the initial set will be deleted entirely
from the database.
"""
if self.instance.pk is None:
raise IntegrityError("Cannot commit relation %r on an unsaved model" % relation_name)
try:
final_items = self.instance._cluster_related_objects[relation_name]
except (AttributeError, KeyError):
# _cluster_related_objects entry never created => no changes to make
return
original_manager = original_manager_cls(self.instance)
live_items = list(original_manager.get_queryset())
for item in live_items:
if item not in final_items:
item.delete()
for item in final_items:
# Django 1.9+ bulk updates items by default which assumes
# that they have already been saved to the database.
# Disable this behaviour.
# https://code.djangoproject.com/ticket/18556
# https://github.com/django/django/commit/adc0c4fbac98f9cb975e8fa8220323b2de638b46
original_manager.add(item, bulk=False)
# purge the _cluster_related_objects entry, so we switch back to live SQL
del self.instance._cluster_related_objects[relation_name]
return DeferringRelatedManager
class ChildObjectsDescriptor(ReverseManyToOneDescriptor):
def __get__(self, instance, instance_type=None):
if instance is None:
return self
return self.child_object_manager_cls(instance)
def __set__(self, instance, value):
manager = self.__get__(instance)
manager.set(value)
@cached_property
def child_object_manager_cls(self):
return create_deferring_foreign_related_manager(self.rel, self.related_manager_cls)
class ParentalKey(ForeignKey):
related_accessor_class = ChildObjectsDescriptor
def __init__(self, *args, **kwargs):
kwargs.setdefault('on_delete', CASCADE)
super().__init__(*args, **kwargs)
def check(self, **kwargs):
from modelcluster.models import ClusterableModel
errors = super().check(**kwargs)
# Check that the destination model is a subclass of ClusterableModel.
# If self.rel.to is a string at this point, it means that Django has been unable
# to resolve it as a model name; if so, skip this test so that Django's own
# system checks can report the appropriate error
if isinstance(self.remote_field.model, type) and not issubclass(self.remote_field.model, ClusterableModel):
errors.append(
checks.Error(
'ParentalKey must point to a subclass of ClusterableModel.',
hint='Change {model_name} into a ClusterableModel or use a ForeignKey instead.'.format(
model_name=self.remote_field.model._meta.app_label + '.' + self.remote_field.model.__name__,
),
obj=self,
id='modelcluster.E001',
)
)
# ParentalKeys must have an accessor name (#49)
if self.remote_field.get_accessor_name() == '+':
errors.append(
checks.Error(
"related_name='+' is not allowed on ParentalKey fields",
hint="Either change it to a valid name or remove it",
obj=self,
id='modelcluster.E002',
)
)
return errors
def create_deferring_forward_many_to_many_manager(rel, original_manager_cls):
rel_field = rel.field
relation_name = rel_field.name
query_field_name = rel_field.related_query_name()
source_field_name = rel_field.m2m_field_name()
rel_model = rel.model
superclass = rel_model._default_manager.__class__
rel_through = rel.through
class DeferringManyRelatedManager(superclass):
def __init__(self, instance=None):
super().__init__()
self.model = rel_model
self.through = rel_through
self.instance = instance
def get_original_manager(self):
return original_manager_cls(self.instance)
def get_live_queryset(self):
"""
return the original manager's queryset, which reflects the live database
"""
return self.get_original_manager().get_queryset()
def _get_cluster_related_objects(self):
# Helper to retrieve the instance's _cluster_related_objects dict,
# creating it if it does not already exist
try:
return self.instance._cluster_related_objects
except AttributeError:
cluster_related_objects = {}
self.instance._cluster_related_objects = cluster_related_objects
return cluster_related_objects
def get_queryset(self):
"""
return the current object set with any updates applied,
wrapped up in a FakeQuerySet if it doesn't match the database state
"""
try:
results = self.instance._cluster_related_objects[relation_name]
except (AttributeError, KeyError):
if self.instance.pk:
return self.get_live_queryset()
else:
# the standard M2M manager fails on unsaved instances,
# so bypass it and return an empty queryset
return rel_model.objects.none()
return FakeQuerySet(rel_model, results)
def get_prefetch_querysets(self, instances, querysets=None):
# Derived from Django's ManyRelatedManager.get_prefetch_queryset.
if querysets and len(querysets) != 1:
raise ValueError("get_prefetch_querysets() must be passed exactly one queryset")
queryset = querysets[0] if querysets else None
if queryset is None:
queryset = super().get_queryset()
queryset._add_hints(instance=instances[0])
queryset = queryset.using(queryset._db or self._db)
query = {'%s__in' % query_field_name: instances}
queryset = queryset._next_is_sticky().filter(**query)
fk = self.through._meta.get_field(source_field_name)
join_table = fk.model._meta.db_table
connection = connections[queryset.db]
qn = connection.ops.quote_name
queryset = queryset.extra(select={
'_prefetch_related_val_%s' % f.attname:
'%s.%s' % (qn(join_table), qn(f.column)) for f in fk.local_related_fields})
return (
queryset,
lambda result: tuple(
getattr(result, '_prefetch_related_val_%s' % f.attname)
for f in fk.local_related_fields
),
lambda inst: tuple(
f.get_db_prep_value(getattr(inst, f.attname), connection)
for f in fk.foreign_related_fields
),
False,
relation_name,
False,
)
# Remove once we only support Django 5.0+
if not DJANGO_VERSION >= (5, 0):
def get_prefetch_queryset(self, instances, queryset=None):
if queryset is None:
return self.get_prefetch_querysets(instances)
return self.get_prefetch_querysets(instances, querysets=[queryset])
def _apply_rel_filters(self, queryset):
# Required for get_prefetch_queryset.
return queryset._next_is_sticky()
def get_object_list(self):
"""
return the mutable list that forms the current in-memory state of
this relation. If there is no such list (i.e. the manager is returning
querysets from the live database instead), one is created, populating it
with the live database state
"""
cluster_related_objects = self._get_cluster_related_objects()
try:
object_list = cluster_related_objects[relation_name]
except KeyError:
object_list = list(self.get_live_queryset())
cluster_related_objects[relation_name] = object_list
return object_list
def add(self, *new_items):
"""
Add the passed items to the stored object set, but do not commit them
to the database
"""
items = self.get_object_list()
for target in new_items:
if target.pk is None:
raise ValueError('"%r" needs to have a primary key value before '
'it can be added to a parental many-to-many relation.' % target)
item_matched = False
for i, item in enumerate(items):
if item == target:
# Replace the matched item with the new one. This ensures that any
# modifications to that item's fields take effect within the recordset -
# i.e. we can perform a virtual UPDATE to an object in the list
# by calling add(updated_object). Which is semantically a bit dubious,
# but it does the job...
items[i] = target
item_matched = True
break
if not item_matched:
items.append(target)
# Sort list
if rel_model._meta.ordering and len(items) > 1:
sort_by_fields(items, rel_model._meta.ordering)
def clear(self):
"""
Clear the stored object set, without affecting the database
"""
self.set([])
def set(self, objs, bulk=True, clear=False):
# cast objs to a list so that:
# 1) we can call len() on it (which we can't do on, say, a queryset)
# 2) if we need to sort it, we can do so without mutating the original
objs = list(objs)
if objs and not isinstance(objs[0], rel_model):
# assume objs is a list of pks (like when loading data from a
# fixture), and allow the orignal manager to handle things
original_manager = self.get_original_manager()
original_manager.set(objs)
return
cluster_related_objects = self._get_cluster_related_objects()
# Clone and sort the 'objs' list, if necessary
if rel_model._meta.ordering and len(objs) > 1:
sort_by_fields(objs, rel_model._meta.ordering)
cluster_related_objects[relation_name] = objs
def remove(self, *items_to_remove):
"""
Remove the passed items from the stored object set, but do not commit the change
to the database
"""
items = self.get_object_list()
# filter items list in place: see http://stackoverflow.com/a/1208792/1853523
items[:] = [item for item in items if item not in items_to_remove]
def commit(self):
"""
Apply any changes made to the stored object set to the database.
"""
if not self.instance.pk:
raise IntegrityError("Cannot commit relation %r on an unsaved model" % relation_name)
try:
final_items = self.instance._cluster_related_objects[relation_name]
except (AttributeError, KeyError):
# _cluster_related_objects entry never created => no changes to make
return
original_manager = self.get_original_manager()
live_items = list(original_manager.get_queryset())
items_to_remove = [item for item in live_items if item not in final_items]
items_to_add = [item for item in final_items if item not in live_items]
if items_to_remove:
original_manager.remove(*items_to_remove)
if items_to_add:
original_manager.add(*items_to_add)
# purge the _cluster_related_objects entry, so we switch back to live SQL
del self.instance._cluster_related_objects[relation_name]
return DeferringManyRelatedManager
class ParentalManyToManyDescriptor(ManyToManyDescriptor):
def __get__(self, instance, instance_type=None):
if instance is None:
return self
return self.child_object_manager_cls(instance)
def __set__(self, instance, value):
manager = self.__get__(instance)
manager.set(value)
@cached_property
def child_object_manager_cls(self):
rel = self.rel
return create_deferring_forward_many_to_many_manager(rel, self.related_manager_cls)
class ParentalManyToManyField(ManyToManyField):
related_accessor_class = ParentalManyToManyDescriptor
_need_commit_after_assignment = True
def contribute_to_class(self, cls, name, **kwargs):
# ManyToManyField does not (as of Django 1.10) respect related_accessor_class,
# but hard-codes ManyToManyDescriptor instead:
# https://github.com/django/django/blob/6157cd6da1b27716e8f3d1ed692a6e33d970ae46/django/db/models/fields/related.py#L1538
# So, we'll let the original contribute_to_class do its thing, and then overwrite
# the accessor...
super().contribute_to_class(cls, name, **kwargs)
setattr(cls, self.name, self.related_accessor_class(self.remote_field))
def value_from_object(self, obj):
# In Django >=1.10, ManyToManyField.value_from_object special-cases objects with no PK,
# returning an empty list on the basis that unsaved objects can't have related objects.
# Remove that special case.
return getattr(obj, self.attname).all()