fix ut

Signed-off-by: yuwenzho <[email protected]>
onnx · Jul 3, 2024 · 56c27ef · 56c27ef
1 parent 2340f61
commit 56c27ef
Show file tree

Hide file tree

Showing 4 changed files with 10 additions and 41 deletions.
diff --git a/onnx_neural_compressor/algorithms/utility.py b/onnx_neural_compressor/algorithms/utility.py
@@ -386,7 +386,7 @@ def make_matmul_weight_only_node(
             # require onnxruntime > 1.16.3
             kwargs["accuracy_level"] = accuracy_level
 
-    else: # pragma: no cover
+    else:  # pragma: no cover
         offset = 5 if zero_point is not None else 4
         op_type = "MatMulFpQ4"
 

diff --git a/test/quantization/layer_wise/test_layer_wise.py b/test/quantization/layer_wise/test_layer_wise.py
@@ -15,7 +15,6 @@
 from onnx_neural_compressor.quantization import config, matmul_4bits_quantizer
 
 
-
 def find_onnx_file(folder_path):
     # return first .onnx file path in folder_path
     for root, dirs, files in os.walk(folder_path):
@@ -217,6 +216,7 @@ def test_gptq_layer_wise_with_ort_like_api(self):
 
     def test__check_model_with_infer_shapes(self):
         from onnx_neural_compressor.algorithms.layer_wise import core as lwq_core
+
         self.assertFalse(lwq_core._check_model_with_infer_shapes(self.llama))
         self.assertTrue(lwq_core._check_model_with_infer_shapes(self.llama_optimized))
         self.assertTrue(

diff --git a/test/quantization/test_algorithm_utility.py b/test/quantization/test_algorithm_utility.py
@@ -1,9 +1,10 @@
 """Tests for algorithm utility components."""
 
 import os
-import onnx
 import unittest
+
 import numpy as np
+import onnx
 
 from onnx_neural_compressor.algorithms import utility as quant_utils
 
@@ -16,6 +17,7 @@ def find_onnx_file(folder_path):
                 return os.path.join(root, file)
     return None
 
+
 class TestUtilityFunctions(unittest.TestCase):
 
     def test_is_B_transposed(self):

diff --git a/test/utils/test_onnx_model.py b/test/utils/test_onnx_model.py
@@ -242,55 +242,22 @@ def test_remove_unused_nodes(self):
         model.remove_unused_nodes()
         self.assertTrue("Constant" not in [node.op_type for node in model.nodes()])
 
-        # test unused QuantizeLinear and DequantizeLinear
-        A = onnx.helper.make_tensor_value_info("A", onnx.TensorProto.FLOAT, [1, 1, 5, 5])
-        A_scale = onnx.helper.make_tensor_value_info("A_scale", onnx.TensorProto.FLOAT, [1])
-        a_scale = onnx.numpy_helper.from_array(np.random.ranf([1]).astype(np.float32), "A_scale")
-        A_zero = onnx.helper.make_tensor_value_info("A_zero_point", onnx.TensorProto.INT8, [1])
-        a_zero_point = onnx.numpy_helper.from_array(np.random.ranf([1]).astype(np.int8), "A_zero_point")
-        quantize_node = onnx.helper.make_node(
-            "QuantizeLinear", ["A", "A_scale", "A_zero_point"], ["B_quantized"], name="quantizelinear"
-        )
-
-        B_scale = onnx.helper.make_tensor_value_info("B_scale", onnx.TensorProto.FLOAT, [1])
-        b_scale = onnx.numpy_helper.from_array(np.random.ranf([1]).astype(np.float32), "B_scale")
-        B_zero = onnx.helper.make_tensor_value_info("B_zero_point", onnx.TensorProto.INT8, [1])
-        b_zero_point = onnx.numpy_helper.from_array(np.random.ranf([1]).astype(np.int8), "B_zero_point")
-        C = onnx.helper.make_tensor_value_info("C", onnx.TensorProto.FLOAT, [1, 1, 5, 5])
-        dequantize_node = onnx.helper.make_node(
-            "DequantizeLinear", ["B_quantized", "B_scale", "B_zero_point"], ["C"], name="dequantizelinear"
-        )
-
-        graph = onnx.helper.make_graph(
-            [quantize_node, dequantize_node],
-            "test_model",
-            [A],
-            [C],
-            initializer=[a_scale, a_zero_point, b_scale, b_zero_point],
-        )
-        model = onnx.helper.make_model(graph, opset_imports=[onnx.helper.make_opsetid("", 13)])
-        model.ir_version = 7
-        model = onnx_model.ONNXModel(model)
-        self.assertTrue("QuantizeLinear" in [node.op_type for node in model.nodes()])
-        self.assertTrue("DequantizeLinear" in [node.op_type for node in model.nodes()])
-        model.remove_unused_nodes()
-        self.assertTrue("QuantizeLinear" not in [node.op_type for node in model.nodes()])
-        self.assertTrue("DequantizeLinear" not in [node.op_type for node in model.nodes()])
-
         # test node which does not serve as the input or output of any other nodes
         matmul2_weight = onnx.helper.make_tensor(
             "matmul2_weight", onnx.TensorProto.FLOAT, [1, 3], np.random.random((1, 3)).reshape(3).tolist()
         )
         matmul2_output = onnx.helper.make_tensor_value_info("matmul2_output", onnx.TensorProto.FLOAT, [3, 3])
-        matmul2_node = onnx.helper.make_node("MatMul", ["input", "matmul2_weight"], ["matmul2_output"], name="Matmul_1")
+        matmul2_node = onnx.helper.make_node("MatMul", ["A", "matmul2_weight"], ["matmul2_output"], name="Matmul_1")
         graph.node.append(matmul2_node)
         graph.initializer.append(matmul2_weight)
         model = onnx.helper.make_model(graph, opset_imports=[onnx.helper.make_opsetid("", 13)])
         model.ir_version = 7
+
+        onnx.save(model, "model1.onnx")
         model = onnx_model.ONNXModel(model)
-        self.assertTrue("MatMul" in [node.op_type for node in model.nodes()])
+        self.assertTrue("Matmul_1" in [node.name for node in model.nodes()])
         model.remove_unused_nodes()
-        self.assertTrue("MatMul" not in [node.op_type for node in model.nodes()])
+        self.assertTrue("Matmul_1" not in [node.name for node in model.nodes()])
 
     def test_add_or_remove_tensors_to_outputs(self):
         model = onnx_model.ONNXModel(self.matmul_add_model)