cern-nextgen
diff --git a/src/pquant/__init__.py b/src/pquant/__init__.py
Lines changed: 4 additions & 4 deletions
diff --git a/src/pquant/core/constants.py b/src/pquant/core/constants.py
Lines changed: 0 additions & 21 deletions
diff --git a/src/pquant/core/keras/layers.py b/src/pquant/core/keras/layers.py
Lines changed: 1 addition & 1 deletion
diff --git a/src/pquant/pruning_methods/__init__.py b/src/pquant/core/keras/pruning_methods/__init__.py
rename from src/pquant/pruning_methods/__init__.py
rename to src/pquant/core/keras/pruning_methods/__init__.py
diff --git a/src/pquant/pruning_methods/activation_pruning.py b/src/pquant/core/keras/pruning_methods/activation_pruning.py
rename from src/pquant/pruning_methods/activation_pruning.py
rename to src/pquant/core/keras/pruning_methods/activation_pruning.py
diff --git a/src/pquant/pruning_methods/autosparse.py b/src/pquant/core/keras/pruning_methods/autosparse.py
rename from src/pquant/pruning_methods/autosparse.py
rename to src/pquant/core/keras/pruning_methods/autosparse.py
Lines changed: 3 additions & 1 deletion
diff --git a/src/pquant/pruning_methods/constraint_functions.py b/src/pquant/core/keras/pruning_methods/constraint_functions.py
rename from src/pquant/pruning_methods/constraint_functions.py
rename to src/pquant/core/keras/pruning_methods/constraint_functions.py
diff --git a/src/pquant/pruning_methods/cs.py b/src/pquant/core/keras/pruning_methods/cs.py
rename from src/pquant/pruning_methods/cs.py
rename to src/pquant/core/keras/pruning_methods/cs.py
diff --git a/src/pquant/pruning_methods/dst.py b/src/pquant/core/keras/pruning_methods/dst.py
rename from src/pquant/pruning_methods/dst.py
rename to src/pquant/core/keras/pruning_methods/dst.py
diff --git a/src/pquant/pruning_methods/mdmm.py b/src/pquant/core/keras/pruning_methods/mdmm.py
rename from src/pquant/pruning_methods/mdmm.py
rename to src/pquant/core/keras/pruning_methods/mdmm.py
Lines changed: 35 additions & 4 deletions
@@ -5,7 +5,7 @@
 # flake8: noqa
 backend = os.getenv("KERAS_BACKEND", "tensorflow")
 if backend == "torch":
-    from . import configs, pruning_methods
+    from . import configs
     from .core.hyperparameter_optimization import (
         PQConfig,
         ap_config,
@@ -19,7 +19,7 @@
         pdp_config,
         wanda_config,
     )
-    from .core.torch import activations, layers, optimizers, quantizer
+    from .core.torch import activations, layers, optimizers, pruning_methods, quantizer
     from .core.torch.layers import (
         add_compression_layers,
         apply_final_compression,
@@ -61,7 +61,7 @@
     __all__ = _forwards
 
 else:
-    from . import configs, pruning_methods
+    from . import configs
     from .core.hyperparameter_optimization import (
         PQConfig,
         ap_config,
@@ -74,7 +74,7 @@
         pdp_config,
         wanda_config,
     )
-    from .core.keras import activations, layers, quantizer
+    from .core.keras import activations, layers, pruning_methods, quantizer
     from .core.keras.layers import (
         add_compression_layers,
         apply_final_compression,
 
@@ -10,15 +10,6 @@
     PDPPruningModel,
     WandaPruningModel,
 )
-from pquant.pruning_methods.constraint_functions import (
-    EqualityConstraint,
-    GreaterThanOrEqualConstraint,
-    LessThanOrEqualConstraint,
-)
-from pquant.pruning_methods.metric_functions import (
-    StructuredSparsityMetric,
-    UnstructuredSparsityMetric,
-)
 
 PRUNING_MODEL_REGISTRY = {
     "cs": CSPruningModel,
@@ -53,15 +44,3 @@
 CONFIG_FILE = "config.yaml"
 
 N_JOBS = 1
-
-
-METRIC_REGISTRY = {
-    "UnstructuredSparsity": UnstructuredSparsityMetric,
-    "StructuredSparsity": StructuredSparsityMetric,
-}
-
-CONSTRAINT_REGISTRY = {
-    "Equality": EqualityConstraint,
-    "LessThanOrEqual": LessThanOrEqualConstraint,
-    "GreaterThanOrEqual": GreaterThanOrEqualConstraint,
-}
@@ -25,7 +25,7 @@
 from pquant.core.hyperparameter_optimization import PQConfig
 from pquant.core.keras.activations import PQActivation
 from pquant.core.keras.quantizer import Quantizer
-from pquant.core.utils import get_pruning_layer
+from pquant.core.keras.utils import get_pruning_layer
 
 T = TypeVar("T")
 
 
@@ -113,7 +113,9 @@ def call(self, weight):
         is_training = ops.logical_not(ops.logical_or(self.is_pretraining, self.is_finetuning))
         self.mask.assign(ops.where(is_training, new_binary_mask, ops.convert_to_tensor(self.mask)))
 
-        sparse_weight = ops.sign(weight) * ops.reshape(autosparse_prune(w_t, self.alpha), weight.shape)
+        sparse_weight = ops.sign(weight) * ops.reshape(
+            autosparse_prune(w_t, ops.convert_to_tensor(self.alpha)), weight.shape
+        )
 
         return ops.where(
             self.is_pretraining,
 
@@ -8,7 +8,26 @@
 import keras
 from keras import ops
 
-from pquant.core.constants import CONSTRAINT_REGISTRY, METRIC_REGISTRY
+from pquant.core.keras.pruning_methods.constraint_functions import (
+    EqualityConstraint,
+    GreaterThanOrEqualConstraint,
+    LessThanOrEqualConstraint,
+)
+from pquant.core.keras.pruning_methods.metric_functions import (
+    StructuredSparsityMetric,
+    UnstructuredSparsityMetric,
+)
+
+METRIC_REGISTRY = {
+    "UnstructuredSparsity": UnstructuredSparsityMetric,
+    "StructuredSparsity": StructuredSparsityMetric,
+}
+
+CONSTRAINT_REGISTRY = {
+    "Equality": EqualityConstraint,
+    "LessThanOrEqual": LessThanOrEqualConstraint,
+    "GreaterThanOrEqual": GreaterThanOrEqualConstraint,
+}
 
 # -------------------------------------------------------------------
 #                   MDMM Layer
@@ -28,6 +47,10 @@ def __init__(self, config, layer_type, *args, **kwargs):
         self.constraint_layer = None
         self._is_finetuning = False
         self._is_pretraining = True
+        # TEMP: cache last penalty so calculate_additional_loss() works in
+        # custom training loops via get_model_losses(). Remove once the
+        # add_loss()/model.fit path is the only supported path.
+        self._last_penalty = None
 
     def build(self, input_shape):
         pruning_parameters = self.config.pruning_parameters
@@ -94,8 +117,11 @@ def call(self, weight):
         self.mask.assign(ops.where(not_active, ops.convert_to_tensor(self.mask), hard_mask))
 
         penalty = ops.sum(self.constraint_layer(weight))
-        self.add_loss(ops.where(not_active, ops.zeros_like(penalty), penalty))
-
+        gated_penalty = ops.where(not_active, ops.zeros_like(penalty), penalty)
+        self.add_loss(gated_penalty)
+        # TEMP: cache for calculate_additional_loss() — remove with the
+        # _last_penalty attribute once custom-loop callers move to model.losses.
+        self._last_penalty = gated_penalty
         return ops.where(self.is_finetuning, weight * hard_mask, weight)
 
     def get_hard_mask(self, weight=None):
@@ -109,7 +135,12 @@ def get_layer_sparsity(self, weight):
 
     def calculate_additional_loss(self):
         # Loss is added via self.add_loss() in call() for model.fit.
-        # For custom training loops, accumulate model.losses from the last forward pass instead.
+        # TEMP: also return the penalty cached by the last call() so custom loops
+        # using get_model_losses() see the constraint term. NOTE(review): call()
+        # also add_loss()es this tensor; confirm no caller sums both. Remove with
+        # _last_penalty once callers use model.losses; then just `return 0.0`.
+        if self._last_penalty is not None:
+            return self._last_penalty
         return 0.0
 
     def pre_epoch_function(self, epoch, total_epochs):