Change the local scale identification method: use an explicit `is_local` flag instead of checking `reduce_dims is not None`

shubhra · shubhra · commit 053183365f13 · 2025-09-25T13:56:00.000-04:00
Signed-off-by: Shubhra Pandit <shubhra.pandit@gmail.com>
diff --git a/src/llmcompressor/observers/mse.py b/src/llmcompressor/observers/mse.py
@@ -145,6 +145,7 @@ def calculate_updated_min_max(
         reduce_dims: Optional[Tuple[int]] = None,
         tensor_id: Optional[Any] = None,
         global_scale: Optional[torch.Tensor] = None,
+        is_local: Optional[bool]= False,
     ) -> Tuple[FloatTensor, IntTensor]:
         """
         Updates the mse-clipped min and max values of the observed tensor using
@@ -164,7 +165,7 @@ def calculate_updated_min_max(
         """
 
         # Skip local scales updates for dynamic activations (this will happen at runtime)
-        if self.is_activation and reduce_dims is not None:
+        if self.is_activation and is_local:
             # Activations local scales: min–max
             min_val = torch.amin(observed, dim=reduce_dims, keepdims=True)
             max_val = torch.amax(observed, dim=reduce_dims, keepdims=True)
@@ -219,6 +220,7 @@ def calculate_qparams(
             tensor_id=tensor_id,
             reduce_dims=reduce_dims,
             global_scale=global_scale,
+            is_local=True,
         )
         scale, zero_point = calculate_qparams(
             min_vals=updated_min_val,