apple · NehalBhandari · Jun 18, 2024 · Jun 17, 2024
diff --git a/coremltools/optimize/torch/layerwise_compression/_quant.py b/coremltools/optimize/torch/layerwise_compression/_quant.py
@@ -120,10 +120,10 @@ def find_params(self, x, weight=False):
         x_max = _torch.maximum(x.max(1)[0], tmp)
 
         if self._symmetric:
-            xmax = _torch.maximum(_torch.abs(x_min), x_max)
+            x_max = _torch.maximum(_torch.abs(x_min), x_max)
             tmp = x_min < 0
             if _torch.any(tmp):
-                x_min[tmp] = -xmax[tmp]
+                x_min[tmp] = -x_max[tmp]
         tmp = (x_min == 0) & (x_max == 0)
         x_min[tmp] = -1
         x_max[tmp] = +1

diff --git a/coremltools/test/optimize/torch/layerwise_compression/test_quant.py b/coremltools/test/optimize/torch/layerwise_compression/test_quant.py
@@ -0,0 +1,83 @@
+#  Copyright (c) 2024, Apple Inc. All rights reserved.
+#
+#  Use of this source code is governed by a BSD-3-clause license that can be
+#  found in the LICENSE.txt file or at https://opensource.org/licenses/BSD-3-Clause
+
+import pytest
+import torch
+
+from coremltools.optimize.torch.layerwise_compression._quant import Quantizer
+
+
+@pytest.mark.parametrize(
+    "quantizer, expected_scale, expected_zp",
+    [
+        (
+            Quantizer(n_bits=4, per_channel=True, symmetric=True),
+            torch.tensor([[0.48], [1.4]]),
+            torch.tensor([[8.0], [8.0]]),
+        ),
+        (
+            Quantizer(n_bits=4, per_channel=False, symmetric=True),
+            torch.tensor([[1.4], [1.4]]),
+            torch.tensor([[8.0], [8.0]]),
+        ),
+        (
+            Quantizer(n_bits=4, per_channel=True, symmetric=False),
+            torch.tensor([[0.32], [0.76]]),
+            torch.tensor([[11.0], [1.0]]),
+        ),
+        (
+            Quantizer(n_bits=4, per_channel=False, symmetric=False),
+            torch.tensor([[0.94], [0.94]]),
+            torch.tensor([[4.0], [4.0]]),
+        ),
+        (
+            Quantizer(n_bits=8, per_channel=True, symmetric=True),
+            torch.tensor([[0.028], [0.0824]]),
+            torch.tensor([[128.0], [128.0]]),
+        ),
+        (
+            Quantizer(n_bits=8, per_channel=False, symmetric=True),
+            torch.tensor([[0.0824], [0.0824]]),
+            torch.tensor([[128.0], [128.0]]),
+        ),
+        (
+            Quantizer(n_bits=8, per_channel=True, symmetric=False),
+            torch.tensor([[0.0188], [0.0447]]),
+            torch.tensor([[191.0], [20.0]]),
+        ),
+        (
+            Quantizer(n_bits=8, per_channel=False, symmetric=False),
+            torch.tensor([[0.0553], [0.0553]]),
+            torch.tensor([[65.0], [65.0]]),
+        ),
+    ],
+)
+def test_find_params(quantizer, expected_scale, expected_zp):
+    # input
+    x = torch.tensor([[1.2, -3.6, 0.4], [-0.9, 1.5, 10.5]])
+    # fine quantization params
+    quantizer.find_params(x, weight=True)
+    # compare
+    assert torch.all(
+        torch.isclose(quantizer.scale, expected_scale, rtol=0.001, atol=0.001)
+    )
+    assert torch.all(torch.isclose(quantizer.zero_point, expected_zp))
+
+
+@pytest.mark.parametrize(
+    "input, weight, expected_shape",
+    [
+        (torch.rand(2, 3), True, (2, 1)),
+        (torch.rand(2, 3, 4), True, (2, 1, 1)),
+        (torch.rand(2, 3, 4, 5), True, (2, 1, 1, 1)),
+        (torch.rand(2, 3), False, (1, 3)),
+        (torch.rand(2, 3, 4), False, (1, 1, 4)),
+        (torch.rand(2, 3, 4, 5), False, (1, 3, 1, 1)),
+    ],
+)
+def test_find_params_reshape(input, weight, expected_shape):
+    quantizer = Quantizer(n_bits=4, per_channel=True, symmetric=True)
+    quantizer.find_params(input, weight=weight)
+    assert quantizer.scale.shape == expected_shape