Commit d61da2c

perf: replace per-object async delete with SQL cascade walker (#14566)
* Optimize prepare_duplicates_for_delete and add test coverage
  Replace the per-original O(n×m) loop with a single bulk UPDATE for the
  inside-scope duplicate reset. Outside-scope reconfiguration still runs
  per-original, but now uses .iterator() and .exists() to avoid loading full
  querysets into memory. Also adds WARN-level logging to fix_loop_duplicates
  for visibility into how often duplicate loops occur in production, and a
  comment on removeLoop explaining the optimization opportunity.

* fix: remove unused import and fix docstring lint warning

* perf: eliminate per-original queries with prefetch and bulk reset
  Remove redundant .exclude() and .exists() calls by leveraging the bulk
  UPDATE that already unlinks inside-scope duplicates. Add prefetch_related
  to fetch all reverse relations in a single query.

* add comment

* perf: replace per-object async delete with SQL cascade walker
  Replace the per-object obj.delete() approach in async_delete_crawl_task
  with a recursive SQL cascade walker that compiles QuerySets to raw SQL and
  walks model._meta.related_objects bottom-up. This auto-discovers all FK
  relations at runtime, including those added by plugins.
  Key changes:
  - New dojo/utils_cascade_delete.py: cascade_delete() utility
  - New dojo/signals.py: pre_bulk_delete_findings signal for extensibility
  - New bulk_clear_finding_m2m() in finding/helper.py for M2M cleanup with
    FileUpload disk cleanup and orphaned Notes deletion
  - Rewritten async_delete_crawl_task with chunked cascade deletion
  - Removed async_delete_chunk_task (no longer needed)
  - Product grading recalculated once at the end instead of per-object

* perf: replace mass_model_updater with single UPDATE in reconfigure_duplicate_cluster
  Use QuerySet.update() instead of mass_model_updater to re-point duplicates
  to the new original: a single SQL query instead of loading all findings into
  Python and calling bulk_update.
* cleanup: remove dead code from duplicate handling
  Remove reset_duplicate_before_delete, reset_duplicates_before_delete, and
  set_new_original, all replaced by the bulk UPDATE in
  prepare_duplicates_for_delete and .update() in reconfigure_duplicate_cluster.
  Remove the unused mass_model_updater import.

* fix: delete outside-scope duplicates before main scope to avoid FK violations
  When bulk-deleting findings in chunks, an original in an earlier chunk could
  fail to delete because its duplicate (higher ID) in a later chunk still
  references it via the duplicate_finding FK. Fix by deleting outside-scope
  duplicates first, then the main scope. Also moves the
  pre_bulk_delete_findings signal into bulk_delete_findings so it fires
  automatically.

* fix: use bool type for the DD_DUPLICATE_CLUSTER_CASCADE_DELETE env var

* fix: replace save_no_options with .update() in reconfigure_duplicate_cluster
  Avoids triggering Finding.save() signals (pre_save_changed,
  execute_prioritization_calculations) when reconfiguring duplicate clusters
  during deletion. Adds tests for cross-engagement duplicate reconfiguration
  and product deletion with duplicates.

* refactor: scope prepare_duplicates_for_delete to the full object, not per-engagement
  Adds product= and product_type= parameters so the entire deletion scope is
  handled in one call, avoiding unnecessary reconfiguration of findings that
  are about to be deleted anyway. Uses subqueries instead of materializing ID
  sets, and chunks the originals loop with prefetch to bound memory. Reverts
  finding_delete to use ORM .delete() for single-finding cascade deletes.

* refactor: remove ASYNC_DELETE_MAPPING, use FINDING_SCOPE_FILTERS
  Replace the model_list-based mapping with a simple scope filter dict.
  prepare_duplicates_for_delete now accepts a single object and derives the
  scope via FINDING_SCOPE_FILTERS. Removes the redundant non-Finding model
  deletion loop (cascade_delete on the top-level object handles all remaining
  children) and cleans up the async_delete class.
* fix: resolve ruff lint violations in helper and tests

* remove obsolete test

* perf: add bulk_delete_findings, fix CASCADE_DELETE and scope expansion
  - Add a bulk_delete_findings() wrapper: M2M cleanup + chunked cascade_delete
  - reconfigure_duplicate_cluster: return early when CASCADE_DELETE=True
    instead of calling Django .delete(), which fires signals per finding
  - finding_delete: use bulk_delete_findings when CASCADE_DELETE=True
  - async_delete_crawl_task: expand the scope to include outside-scope
    duplicates, and use bulk_delete_findings instead of manual M2M +
    cascade_delete calls
  - Fix a test to use the async_delete class instead of a direct task import

* fix: handle M2M and tag cleanup in cascade_delete
  Adds generic M2M through-table cleanup to cascade_delete so tags and other
  M2M relations are cleared before row deletion. Introduces
  bulk_remove_all_tags in tag_utils to properly decrement tagulous tag counts
  during bulk deletion. Adds a test for product deletion with tagged objects.

* refactor: auto-discover TagFields in bulk_remove_all_tags
  Instead of hardcoding field names, iterate over all fields on the model and
  select those with tag_options. This avoids unexpected side effects when
  callers pass a specific tag_field_name parameter.

* perf: address PR review feedback for large-scale delete safety
  - Stream finding IDs via iterator() + batching instead of materializing the
    full ID list into memory. Prevents OOM on 4.5M+ finding deletes.
  - Add SET LOCAL statement_timeout (300s) and deadlock error logging to
    cascade_delete SQL execution. Prevents runaway queries from holding locks
    indefinitely and surfaces deadlock errors in logs.
  - Reuse the scope_ids subquery variable and replace .exists() + .count()
    with a single .count() call to avoid evaluating the subquery twice.
  - Add a comment explaining why FileUpload uses per-object ORM delete (its
    custom delete() removes files from disk; file attachments are rare).
  - Scope fix_loop_duplicates to the deletion set instead of scanning the full
    findings table. The double self-join is cheap when filtered to only the
    findings in the scope being deleted.
  - Document that pre_bulk_delete_findings signal receivers must not
    materialize the full queryset (use .filter()/.iterator() instead).
  - Add a skip_m2m_for parameter to cascade_delete so bulk_delete_findings can
    tell it that Finding M2M was already cleaned by bulk_clear_finding_m2m,
    avoiding redundant tag count aggregation queries.

* refactor: rename cascade_delete to cascade_delete_related_objects
  The function now only deletes related objects, not the root record. This
  allows async_delete_task to call obj.delete() on the top-level object via
  the ORM, which fires Django signals (post_delete notifications, pghistory
  audit, Pro signals like product_post_delete). bulk_delete_findings uses
  execute_delete_sql to delete the finding rows themselves after
  cascade_delete_related_objects cleans up the children.

* Update dojo/settings/settings.dist.py
  Co-authored-by: Cody Maffucci <46459665+Maffooch@users.noreply.github.com>

---------

Co-authored-by: Cody Maffucci <46459665+Maffooch@users.noreply.github.com>
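The bottom-up walk over model._meta.related_objects described in the commit message can be illustrated with a minimal pure-Python sketch. The names `related_children` and `walk_delete_order` are hypothetical stand-ins for illustration only; the real walker operates on Django model metadata and compiles QuerySets to raw SQL rather than working with model names.

```python
# Minimal sketch of a bottom-up cascade walk over FK relations.
# `related_children` stands in for Django's model._meta.related_objects:
# it maps a model name to the models holding a FK pointing at it.
related_children = {
    "Product": ["Engagement"],
    "Engagement": ["Test"],
    "Test": ["Finding"],
    "Finding": ["Note", "FileUpload"],
    "Note": [],
    "FileUpload": [],
}

def walk_delete_order(model, seen=None):
    """Return models in child-first order so DELETEs never violate FKs."""
    if seen is None:
        seen = set()
    if model in seen:
        return []
    seen.add(model)
    order = []
    for child in related_children[model]:
        order.extend(walk_delete_order(child, seen))
    order.append(model)  # delete the parent only after all of its children
    return order

print(walk_delete_order("Product"))
# → ['Note', 'FileUpload', 'Finding', 'Test', 'Engagement', 'Product']
```

Because the order is discovered at runtime from the relation graph, any model a plugin adds with a FK into this graph is picked up automatically, which is the property the commit relies on.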
1 parent f0f0f7f commit d61da2c

9 files changed: 975 additions & 245 deletions

File tree

dojo/finding/helper.py

Lines changed: 199 additions & 91 deletions
Large diffs are not rendered by default.
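Since the helper.py diff is not rendered here, the chunked ID streaming it implements ("Stream finding IDs via iterator()+batched" in the commit message) can be sketched standalone. `batched_ids` is a hypothetical name; in the real code the IDs would come from something like `queryset.values_list("id", flat=True).iterator()`.

```python
from itertools import islice

def batched_ids(id_iter, batch_size):
    """Yield lists of at most batch_size IDs from a streaming iterator.

    Only one batch is held in memory at a time, so a 4.5M-row ID stream
    never materializes as a single Python list.
    """
    it = iter(id_iter)
    while batch := list(islice(it, batch_size)):
        yield batch

print(list(batched_ids(range(1, 11), 4)))
# → [[1, 2, 3, 4], [5, 6, 7, 8], [9, 10]]
```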

dojo/models.py

Lines changed: 1 addition & 1 deletion
@@ -1647,7 +1647,7 @@ def is_ci_cd(self):
     def delete(self, *args, **kwargs):
         logger.debug("%d engagement delete", self.id)
         from dojo.finding import helper as finding_helper  # noqa: PLC0415 circular import
-        finding_helper.prepare_duplicates_for_delete(engagement=self)
+        finding_helper.prepare_duplicates_for_delete(self)
         super().delete(*args, **kwargs)
         with suppress(Engagement.DoesNotExist, Product.DoesNotExist):
             # Suppressing a potential issue created from async delete removing
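prepare_duplicates_for_delete exists because findings reference each other through the duplicate_finding FK, and that same FK is why the commit deletes outside-scope duplicates before the main scope. A toy simulation of the constraint (all names and data hypothetical, for illustration only):

```python
# Each finding may point at an "original" via a duplicate_finding FK;
# deleting the original while a duplicate still references it would
# violate the constraint in the database.
findings = {
    1: None,   # original, inside the deletion scope
    2: 1,      # duplicate of 1, inside the scope
    9: 1,      # duplicate of 1, OUTSIDE the scope (e.g. another engagement)
}
scope = {1, 2}

def delete_batch(ids, table):
    """Delete rows, refusing if a surviving row still references a deleted one."""
    survivors = {k: v for k, v in table.items() if k not in ids}
    if any(v in ids for v in survivors.values() if v is not None):
        raise RuntimeError("FK violation: surviving duplicate references deleted original")
    return survivors

# Wrong order: deleting the scope first leaves finding 9 pointing at 1.
try:
    delete_batch(scope, findings)
except RuntimeError:
    pass  # exactly the failure mode the fix avoids

# Fixed order: outside-scope duplicates first, then the main scope.
outside = {fid for fid, orig in findings.items() if orig in scope and fid not in scope}
remaining = delete_batch(outside, findings)
remaining = delete_batch(scope, remaining)
assert remaining == {}
```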

dojo/settings/settings.dist.py

Lines changed: 1 addition & 1 deletion
@@ -302,7 +302,7 @@
     # Initial behaviour in Defect Dojo was to delete all duplicates when an original was deleted
     # New behaviour is to leave the duplicates in place, but set the oldest of duplicates as new original
     # Set to True to revert to the old behaviour where all duplicates are deleted
-    DD_DUPLICATE_CLUSTER_CASCADE_DELETE=(str, False),
+    DD_DUPLICATE_CLUSTER_CASCADE_DELETE=(bool, True),
     # Enable Rate Limiting for the login page
     DD_RATE_LIMITER_ENABLED=(bool, False),
     # Examples include 5/m 100/h and more https://django-ratelimit.readthedocs.io/en/stable/rates.html#simple-rates

dojo/signals.py

Lines changed: 10 additions & 0 deletions
@@ -0,0 +1,10 @@
+from django.dispatch import Signal
+
+# Sent before bulk-deleting findings via cascade_delete.
+# Receivers can dispatch integrator notifications, collect metrics, etc.
+# Provides: finding_qs (QuerySet of findings about to be deleted)
+#
+# IMPORTANT: The queryset may contain millions of rows. Receivers MUST NOT
+# call list(), len(), or otherwise materialize the full queryset into memory.
+# Use .filter(), .iterator(), or aggregation queries instead.
+pre_bulk_delete_findings = Signal()
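A receiver honoring the no-materialization contract might look like the following sketch. The receiver name is hypothetical, and `FakeQuerySet` is a stand-in so the example runs without Django; a real receiver would be connected with `pre_bulk_delete_findings.connect(on_bulk_delete)` and receive an actual QuerySet.

```python
class FakeQuerySet:
    """Stand-in for a Django QuerySet so the sketch runs standalone."""
    def __init__(self, rows):
        self._rows = rows
    def count(self):
        return len(self._rows)   # SELECT COUNT(*) in the real ORM
    def iterator(self, chunk_size=2000):
        yield from self._rows    # server-side cursor in the real ORM

def on_bulk_delete(sender, finding_qs, **kwargs):
    # OK: aggregate in the database instead of materializing rows.
    total = finding_qs.count()
    # OK: stream a bounded sample if per-row work is unavoidable.
    sample = [f for _, f in zip(range(3), finding_qs.iterator())]
    return total, sample
    # NOT OK: list(finding_qs) or len(finding_qs) -- both load every row.

total, sample = on_bulk_delete(None, FakeQuerySet(list(range(10))))
# → total == 10, sample == [0, 1, 2]
```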

dojo/tag_utils.py

Lines changed: 66 additions & 1 deletion
@@ -1,5 +1,6 @@
 from __future__ import annotations

+import logging
 from collections.abc import Iterable

 from django.conf import settings
@@ -8,6 +9,8 @@

 from dojo.models import Product  # local import to avoid circulars at import time

+logger = logging.getLogger(__name__)
+

 def bulk_add_tags_to_instances(tag_or_tags, instances, tag_field_name: str = "tags", batch_size: int | None = None) -> int:
     """
@@ -161,4 +164,66 @@ def bulk_add_tags_to_instances(tag_or_tags, instances, tag_field_name: str = "ta
     return total_created


-__all__ = ["bulk_add_tags_to_instances"]
+def bulk_remove_all_tags(model_class, instance_ids_qs):
+    """
+    Remove all tags from instances identified by the given ID subquery.
+
+    Auto-discovers all TagFields on the model, decrements tag counts correctly,
+    and deletes through-table rows.
+    Accepts a QuerySet of IDs (as a subquery) to avoid materializing large ID lists.
+
+    Args:
+        model_class: The model class (e.g. Finding, Product).
+        instance_ids_qs: A QuerySet producing instance PKs (used as subquery).
+
+    """
+    tag_fields = [
+        field for field in model_class._meta.get_fields()
+        if hasattr(field, "tag_options")
+    ]
+
+    for tag_field in tag_fields:
+        tag_model = tag_field.related_model
+        through_model = tag_field.remote_field.through
+
+        # Find the FK columns that point to the source model and the tag model
+        source_field_name = None
+        target_field_name = None
+        for field in through_model._meta.get_fields():
+            if hasattr(field, "remote_field") and field.remote_field:
+                if field.remote_field.model == model_class:
+                    source_field_name = field.name
+                elif field.remote_field.model == tag_model:
+                    target_field_name = field.name
+
+        if not source_field_name or not target_field_name:
+            continue
+
+        # Get affected tag IDs and their counts before deletion
+        affected_tags = (
+            through_model.objects.filter(**{f"{source_field_name}__in": instance_ids_qs})
+            .values(target_field_name)
+            .annotate(num=models.Count("id"))
+        )
+
+        # Decrement tag counts. Tag counts are not used in DefectDojo, but we
+        # maintain them to avoid breaking tagulous's internal bookkeeping.
+        for entry in affected_tags:
+            tag_model.objects.filter(pk=entry[target_field_name]).update(
+                count=models.F("count") - entry["num"],
+            )
+
+        # Delete through-table rows
+        count, _ = through_model.objects.filter(
+            **{f"{source_field_name}__in": instance_ids_qs},
+        ).delete()
+
+        if count:
+            logger.debug(
+                "bulk_remove_all_tags: removed %d %s.%s through-table rows",
+                count, model_class.__name__, tag_field.name,
+            )
+
+
+__all__ = ["bulk_add_tags_to_instances", "bulk_remove_all_tags"]
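The count-maintenance step in bulk_remove_all_tags boils down to grouping the through-table rows being deleted by tag and decrementing each tag's count by its group size. A standalone sketch of that bookkeeping, with hypothetical stand-in data in place of the ORM aggregation:

```python
from collections import Counter

# Stand-ins: through-table rows as (instance_id, tag_id) pairs, plus
# tagulous-style usage counts per tag.
through_rows = [(1, "red"), (2, "red"), (3, "blue"), (4, "red"), (5, "blue")]
tag_counts = {"red": 5, "blue": 3}

deleted_instance_ids = {1, 2, 3}

# Group the rows being deleted by tag, like the
# .values(...).annotate(Count("id")) aggregation in bulk_remove_all_tags.
decrements = Counter(tag for inst, tag in through_rows if inst in deleted_instance_ids)

for tag, num in decrements.items():
    tag_counts[tag] -= num   # UPDATE ... SET count = count - num

print(tag_counts)
# → {'red': 3, 'blue': 2}
```

Doing the decrement from an aggregate keeps it at one UPDATE per distinct tag rather than one per through-row, which matters at bulk-delete scale.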
