
Commit 06bcaae

Fix
1 parent 8f6d656 commit 06bcaae

2 files changed, +8 −5 lines changed


src/brevitas/graph/equalize.py

+7 −5
@@ -437,12 +437,14 @@ def _no_equalize():
 
     # Instead of clipping very low values, which would cause their reciprocal to be very large
     # thus hindering quantization, we set them to one, which is the no-op equivalent for equalization
-    sinks_range = torch.where(
-        sinks_range > EPSILON, sinks_range, torch.tensor(1., dtype=dtype, device=device))
-    srcs_range = torch.where(
-        srcs_range > EPSILON, srcs_range, torch.tensor(1., dtype=dtype, device=device))
-    srcs_range = torch.pow(srcs_range, alpha)
+    sinks_range = torch.where((sinks_range < EPSILON) | (srcs_range < EPSILON),
+                              torch.tensor(1., dtype=dtype, device=device),
+                              sinks_range)
+    srcs_range = torch.where((sinks_range < EPSILON) | (srcs_range < EPSILON),
+                             torch.tensor(1., dtype=dtype, device=device),
+                             srcs_range)
 
+    srcs_range = torch.pow(srcs_range, alpha)
     sinks_range = torch.pow(sinks_range, 1 - alpha)
     scaling_factors = srcs_range / sinks_range
     inverse_scaling_factors = torch.reciprocal(scaling_factors)
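
The change couples the two guards: where the old code reset srcs_range and sinks_range to 1. independently, the new condition resets both whenever either falls below EPSILON, so the scaling factor for that channel becomes exactly 1 (a true no-op) instead of a partial rescale against a degenerate range. Below is a minimal standalone sketch of the guarded computation; the EPSILON and alpha values and the example tensors are illustrative only, not Brevitas defaults, and the mask is hoisted into a single degenerate tensor for readability rather than repeated inside each torch.where as in the committed code.

    import torch

    # Names mirror equalize.py; the values below are illustrative only.
    EPSILON = 1e-9
    alpha = 0.5
    dtype = torch.float32
    device = 'cpu'

    srcs_range = torch.tensor([0.5, 2.0, 1e-12], dtype=dtype, device=device)
    sinks_range = torch.tensor([1e-12, 4.0, 3.0], dtype=dtype, device=device)

    # If either range is (near) zero, equalizing that channel is numerically meaningless and
    # its reciprocal would blow up, so both ranges are forced to 1., the no-op for equalization.
    degenerate = (sinks_range < EPSILON) | (srcs_range < EPSILON)
    one = torch.tensor(1., dtype=dtype, device=device)
    sinks_range = torch.where(degenerate, one, sinks_range)
    srcs_range = torch.where(degenerate, one, srcs_range)

    srcs_range = torch.pow(srcs_range, alpha)
    sinks_range = torch.pow(sinks_range, 1 - alpha)
    scaling_factors = srcs_range / sinks_range
    inverse_scaling_factors = torch.reciprocal(scaling_factors)

    print(scaling_factors)          # tensor([1.0000, 0.7071, 1.0000]) -- degenerate channels left untouched
    print(inverse_scaling_factors)  # tensor([1.0000, 1.4142, 1.0000])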

src/brevitas_examples/llm/llm_quant/equalize.py

+1 −0
@@ -32,6 +32,7 @@ def trace_and_standardize(model, ref_kwargs):
     graph_model = value_trace(model, value_args=ref_kwargs)
     graph_model = TorchFunctionalToModule().apply(graph_model)
     graph_model = DuplicateSharedStatelessModule().apply(graph_model)
+    return graph_model
 
 
 @torch.no_grad()
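
For context, trace_and_standardize previously built graph_model but fell through without returning it, so every caller received None. The snippet below is not Brevitas code, just a self-contained illustration of that failure mode and of the one-line fix:

    def standardize(x):            # pre-commit shape: result computed but never returned
        x = x * 2
        x = x + 1

    def standardize_fixed(x):      # post-commit shape: the result is handed back to the caller
        x = x * 2
        x = x + 1
        return x

    assert standardize(3) is None      # caller silently gets None
    assert standardize_fixed(3) == 7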
