Skip to content

Commit e829998

Browse files
committed
Update tests
Signed-off-by: ajrasane <[email protected]>
1 parent 4dde5eb commit e829998

File tree

1 file changed

+10
-4
lines changed

1 file changed

+10
-4
lines changed

tests/unit/onnx/test_qdq_utils.py

Lines changed: 10 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -17,11 +17,11 @@
1717
import pytest
1818
from onnx import TensorProto, helper, numpy_helper
1919

20+
from modelopt.onnx.export.quant_exporter import INT4QuantExporter
2021
from modelopt.onnx.quantization.qdq_utils import (
2122
_cast_fp4,
2223
_cast_fp8,
2324
fp4qdq_to_2dq,
24-
quantize_weights_to_int4,
2525
quantize_weights_to_mxfp8,
2626
)
2727

@@ -337,7 +337,9 @@ def test_basic_quantization_with_reshape_transpose(self):
337337
model = create_test_model_with_int4_dq_reshape_transpose_matmul()
338338

339339
# Run quantization
340-
quantized_model = quantize_weights_to_int4(model)
340+
quantized_model = INT4QuantExporter.compute_scales(model)
341+
quantized_model = INT4QuantExporter.compress_weights(quantized_model)
342+
quantized_model = INT4QuantExporter.post_process(quantized_model)
341343

342344
# Verify weight is converted to INT4
343345
weight_tensor = next(
@@ -362,7 +364,9 @@ def test_quantization_with_constant_scale(self):
362364
model = create_test_model_with_int4_dq_reshape_transpose_matmul(constant_scale=True)
363365

364366
# Run quantization
365-
quantized_model = quantize_weights_to_int4(model)
367+
quantized_model = INT4QuantExporter.compute_scales(model)
368+
quantized_model = INT4QuantExporter.compress_weights(quantized_model)
369+
quantized_model = INT4QuantExporter.post_process(quantized_model)
366370

367371
# Verify Constant node is removed
368372
constant_nodes = [node for node in quantized_model.graph.node if node.op_type == "Constant"]
@@ -385,7 +389,9 @@ def test_projection_bias_and_scale_casting(self):
385389
model = create_test_model_with_proj_nodes()
386390

387391
# Run quantization
388-
quantized_model = quantize_weights_to_int4(model)
392+
quantized_model = INT4QuantExporter.compute_scales(model)
393+
quantized_model = INT4QuantExporter.compress_weights(quantized_model)
394+
quantized_model = INT4QuantExporter.post_process(quantized_model)
389395

390396
# Verify bias tensor is cast to float16
391397
bias_tensor = next(

0 commit comments

Comments (0)