123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329 |
- from collections import Counter, OrderedDict
- from operator import attrgetter
-
- from django.db import IntegrityError, connections, transaction
- from django.db.models import signals, sql
-
-
- class ProtectedError(IntegrityError):
- def __init__(self, msg, protected_objects):
- self.protected_objects = protected_objects
- super().__init__(msg, protected_objects)
-
-
- def CASCADE(collector, field, sub_objs, using):
- collector.collect(sub_objs, source=field.remote_field.model,
- source_attr=field.name, nullable=field.null)
- if field.null and not connections[using].features.can_defer_constraint_checks:
- collector.add_field_update(field, None, sub_objs)
-
-
- def PROTECT(collector, field, sub_objs, using):
- raise ProtectedError(
- "Cannot delete some instances of model '%s' because they are "
- "referenced through a protected foreign key: '%s.%s'" % (
- field.remote_field.model.__name__, sub_objs[0].__class__.__name__, field.name
- ),
- sub_objs
- )
-
-
- def SET(value):
- if callable(value):
- def set_on_delete(collector, field, sub_objs, using):
- collector.add_field_update(field, value(), sub_objs)
- else:
- def set_on_delete(collector, field, sub_objs, using):
- collector.add_field_update(field, value, sub_objs)
- set_on_delete.deconstruct = lambda: ('django.db.models.SET', (value,), {})
- return set_on_delete
-
-
- def SET_NULL(collector, field, sub_objs, using):
- collector.add_field_update(field, None, sub_objs)
-
-
- def SET_DEFAULT(collector, field, sub_objs, using):
- collector.add_field_update(field, field.get_default(), sub_objs)
-
-
- def DO_NOTHING(collector, field, sub_objs, using):
- pass
-
-
- def get_candidate_relations_to_delete(opts):
- # The candidate relations are the ones that come from N-1 and 1-1 relations.
- # N-N (i.e., many-to-many) relations aren't candidates for deletion.
- return (
- f for f in opts.get_fields(include_hidden=True)
- if f.auto_created and not f.concrete and (f.one_to_one or f.one_to_many)
- )
-
-
- class Collector:
- def __init__(self, using):
- self.using = using
- # Initially, {model: {instances}}, later values become lists.
- self.data = OrderedDict()
- self.field_updates = {} # {model: {(field, value): {instances}}}
- # fast_deletes is a list of queryset-likes that can be deleted without
- # fetching the objects into memory.
- self.fast_deletes = []
-
- # Tracks deletion-order dependency for databases without transactions
- # or ability to defer constraint checks. Only concrete model classes
- # should be included, as the dependencies exist only between actual
- # database tables; proxy models are represented here by their concrete
- # parent.
- self.dependencies = {} # {model: {models}}
-
- def add(self, objs, source=None, nullable=False, reverse_dependency=False):
- """
- Add 'objs' to the collection of objects to be deleted. If the call is
- the result of a cascade, 'source' should be the model that caused it,
- and 'nullable' should be set to True if the relation can be null.
-
- Return a list of all objects that were not already collected.
- """
- if not objs:
- return []
- new_objs = []
- model = objs[0].__class__
- instances = self.data.setdefault(model, set())
- for obj in objs:
- if obj not in instances:
- new_objs.append(obj)
- instances.update(new_objs)
- # Nullable relationships can be ignored -- they are nulled out before
- # deleting, and therefore do not affect the order in which objects have
- # to be deleted.
- if source is not None and not nullable:
- if reverse_dependency:
- source, model = model, source
- self.dependencies.setdefault(
- source._meta.concrete_model, set()).add(model._meta.concrete_model)
- return new_objs
-
- def add_field_update(self, field, value, objs):
- """
- Schedule a field update. 'objs' must be a homogeneous iterable
- collection of model instances (e.g. a QuerySet).
- """
- if not objs:
- return
- model = objs[0].__class__
- self.field_updates.setdefault(
- model, {}).setdefault(
- (field, value), set()).update(objs)
-
- def can_fast_delete(self, objs, from_field=None):
- """
- Determine if the objects in the given queryset-like or single object
- can be fast-deleted. This can be done if there are no cascades, no
- parents and no signal listeners for the object class.
-
- The 'from_field' tells where we are coming from - we need this to
- determine if the objects are in fact to be deleted. Allow also
- skipping parent -> child -> parent chain preventing fast delete of
- the child.
- """
- if from_field and from_field.remote_field.on_delete is not CASCADE:
- return False
- if hasattr(objs, '_meta'):
- model = type(objs)
- elif hasattr(objs, 'model') and hasattr(objs, '_raw_delete'):
- model = objs.model
- else:
- return False
- if (signals.pre_delete.has_listeners(model) or
- signals.post_delete.has_listeners(model) or
- signals.m2m_changed.has_listeners(model)):
- return False
- # The use of from_field comes from the need to avoid cascade back to
- # parent when parent delete is cascading to child.
- opts = model._meta
- return (
- all(link == from_field for link in opts.concrete_model._meta.parents.values()) and
- # Foreign keys pointing to this model.
- all(
- related.field.remote_field.on_delete is DO_NOTHING
- for related in get_candidate_relations_to_delete(opts)
- ) and (
- # Something like generic foreign key.
- not any(hasattr(field, 'bulk_related_objects') for field in opts.private_fields)
- )
- )
-
- def get_del_batches(self, objs, field):
- """
- Return the objs in suitably sized batches for the used connection.
- """
- conn_batch_size = max(
- connections[self.using].ops.bulk_batch_size([field.name], objs), 1)
- if len(objs) > conn_batch_size:
- return [objs[i:i + conn_batch_size]
- for i in range(0, len(objs), conn_batch_size)]
- else:
- return [objs]
-
- def collect(self, objs, source=None, nullable=False, collect_related=True,
- source_attr=None, reverse_dependency=False, keep_parents=False):
- """
- Add 'objs' to the collection of objects to be deleted as well as all
- parent instances. 'objs' must be a homogeneous iterable collection of
- model instances (e.g. a QuerySet). If 'collect_related' is True,
- related objects will be handled by their respective on_delete handler.
-
- If the call is the result of a cascade, 'source' should be the model
- that caused it and 'nullable' should be set to True, if the relation
- can be null.
-
- If 'reverse_dependency' is True, 'source' will be deleted before the
- current model, rather than after. (Needed for cascading to parent
- models, the one case in which the cascade follows the forwards
- direction of an FK rather than the reverse direction.)
-
- If 'keep_parents' is True, data of parent model's will be not deleted.
- """
- if self.can_fast_delete(objs):
- self.fast_deletes.append(objs)
- return
- new_objs = self.add(objs, source, nullable,
- reverse_dependency=reverse_dependency)
- if not new_objs:
- return
-
- model = new_objs[0].__class__
-
- if not keep_parents:
- # Recursively collect concrete model's parent models, but not their
- # related objects. These will be found by meta.get_fields()
- concrete_model = model._meta.concrete_model
- for ptr in concrete_model._meta.parents.values():
- if ptr:
- parent_objs = [getattr(obj, ptr.name) for obj in new_objs]
- self.collect(parent_objs, source=model,
- source_attr=ptr.remote_field.related_name,
- collect_related=False,
- reverse_dependency=True)
- if collect_related:
- parents = model._meta.parents
- for related in get_candidate_relations_to_delete(model._meta):
- # Preserve parent reverse relationships if keep_parents=True.
- if keep_parents and related.model in parents:
- continue
- field = related.field
- if field.remote_field.on_delete == DO_NOTHING:
- continue
- batches = self.get_del_batches(new_objs, field)
- for batch in batches:
- sub_objs = self.related_objects(related, batch)
- if self.can_fast_delete(sub_objs, from_field=field):
- self.fast_deletes.append(sub_objs)
- elif sub_objs:
- field.remote_field.on_delete(self, field, sub_objs, self.using)
- for field in model._meta.private_fields:
- if hasattr(field, 'bulk_related_objects'):
- # It's something like generic foreign key.
- sub_objs = field.bulk_related_objects(new_objs, self.using)
- self.collect(sub_objs, source=model, nullable=True)
-
- def related_objects(self, related, objs):
- """
- Get a QuerySet of objects related to `objs` via the relation `related`.
- """
- return related.related_model._base_manager.using(self.using).filter(
- **{"%s__in" % related.field.name: objs}
- )
-
- def instances_with_model(self):
- for model, instances in self.data.items():
- for obj in instances:
- yield model, obj
-
- def sort(self):
- sorted_models = []
- concrete_models = set()
- models = list(self.data)
- while len(sorted_models) < len(models):
- found = False
- for model in models:
- if model in sorted_models:
- continue
- dependencies = self.dependencies.get(model._meta.concrete_model)
- if not (dependencies and dependencies.difference(concrete_models)):
- sorted_models.append(model)
- concrete_models.add(model._meta.concrete_model)
- found = True
- if not found:
- return
- self.data = OrderedDict((model, self.data[model])
- for model in sorted_models)
-
- def delete(self):
- # sort instance collections
- for model, instances in self.data.items():
- self.data[model] = sorted(instances, key=attrgetter("pk"))
-
- # if possible, bring the models in an order suitable for databases that
- # don't support transactions or cannot defer constraint checks until the
- # end of a transaction.
- self.sort()
- # number of objects deleted for each model label
- deleted_counter = Counter()
-
- # Optimize for the case with a single obj and no dependencies
- if len(self.data) == 1 and len(instances) == 1:
- instance = list(instances)[0]
- if self.can_fast_delete(instance):
- with transaction.mark_for_rollback_on_error():
- count = sql.DeleteQuery(model).delete_batch([instance.pk], self.using)
- setattr(instance, model._meta.pk.attname, None)
- return count, {model._meta.label: count}
-
- with transaction.atomic(using=self.using, savepoint=False):
- # send pre_delete signals
- for model, obj in self.instances_with_model():
- if not model._meta.auto_created:
- signals.pre_delete.send(
- sender=model, instance=obj, using=self.using
- )
-
- # fast deletes
- for qs in self.fast_deletes:
- count = qs._raw_delete(using=self.using)
- deleted_counter[qs.model._meta.label] += count
-
- # update fields
- for model, instances_for_fieldvalues in self.field_updates.items():
- for (field, value), instances in instances_for_fieldvalues.items():
- query = sql.UpdateQuery(model)
- query.update_batch([obj.pk for obj in instances],
- {field.name: value}, self.using)
-
- # reverse instance collections
- for instances in self.data.values():
- instances.reverse()
-
- # delete instances
- for model, instances in self.data.items():
- query = sql.DeleteQuery(model)
- pk_list = [obj.pk for obj in instances]
- count = query.delete_batch(pk_list, self.using)
- deleted_counter[model._meta.label] += count
-
- if not model._meta.auto_created:
- for obj in instances:
- signals.post_delete.send(
- sender=model, instance=obj, using=self.using
- )
-
- # update collected instances
- for instances_for_fieldvalues in self.field_updates.values():
- for (field, value), instances in instances_for_fieldvalues.items():
- for obj in instances:
- setattr(obj, field.attname, value)
- for model, instances in self.data.items():
- for instance in instances:
- setattr(instance, model._meta.pk.attname, None)
- return sum(deleted_counter.values()), dict(deleted_counter)
|