Adjust Quantization Preprocessing on Opset Handling (#26503)

qti-hungjuiw · web-flow · commit 3e8be0e88795 · 2025-12-06T00:01:29.000Z
### Description
&lt;!-- Describe your changes. --&gt;
- Moved `ReplaceUpsampleWithResize` in the quantization preprocessing
pipeline to occur before `SymbolicShapeInference`, due to the current
lack of shape inference support for the `Upsample` operator.
Prevented unnecessary modifications to `model.opset_import`. Setting
`model.opset_import` prior to invoking `onnx.version_converter` can
interfere with successful opset conversion.


### Motivation and Context
&lt;!-- - Why is this change required? What problem does it solve?
- If it fixes an open issue, please link to the issue here. --&gt;
- This change ensures the quantization preprocessing functions correctly
by addressing limitations in shape inference for `Upsample`.
- It also avoids potential issues with opset conversion caused by
premature modification of `model.opset_import`.
diff --git a/onnxruntime/python/tools/quantization/shape_inference.py b/onnxruntime/python/tools/quantization/shape_inference.py
@@ -74,34 +74,29 @@ def quant_pre_process(
 
     with tempfile.TemporaryDirectory(prefix="pre.quant.") as quant_tmp_dir:
         temp_path = Path(quant_tmp_dir)
-        model = None
+        model = input_model if isinstance(input_model, onnx.ModelProto) else onnx.load(input_model)
+
+        # Since Upsample is deprecated after opset v10, and the model's opset will
+        # be upgraded to at least v11 during quantization, we need to replace Upsample
+        # with Resize first to avoid generating an invalid model.
+        ai_onnx_domain = [opset for opset in model.opset_import if not opset.domain or opset.domain == "ai.onnx"]
+        if len(ai_onnx_domain) == 1:
+            opset_version = ai_onnx_domain[0].version
+            if opset_version <= 10:
+                ReplaceUpsampleWithResize(ONNXModel(model), opset_version).apply()
+                model = onnx.version_converter.convert_version(model, 11)
+                model = save_and_reload_model_with_shape_infer(model)
 
         if not skip_symbolic_shape:
             logger.info("Performing symbolic shape inference...")
-            loaded_model = input_model if isinstance(input_model, onnx.ModelProto) else onnx.load(input_model)
             model = SymbolicShapeInference.infer_shapes(
-                loaded_model,
+                model,
                 int_max,
                 auto_merge,
                 guess_output_rank,
                 verbose,
             )
 
-        # Since Upsample is deprecated after opset v10, and the model's opset will
-        # be upgraded to at least v11 during quantization, we need to replace Upsample
-        # with Resize first to avoid generating an invalid model.
-        if model:
-            ai_onnx_domain = [opset for opset in model.opset_import if not opset.domain or opset.domain == "ai.onnx"]
-            if len(ai_onnx_domain) == 1:
-                opset_version = ai_onnx_domain[0].version
-                if opset_version < 10:
-                    ReplaceUpsampleWithResize(ONNXModel(model), opset_version).apply()
-                    model.opset_import.remove(ai_onnx_domain[0])
-                    opset_version = 11
-                    model.opset_import.extend([onnx.helper.make_opsetid("", opset_version)])
-                    model = onnx.version_converter.convert_version(model, opset_version)
-                    model = save_and_reload_model_with_shape_infer(model)
-
         if not skip_optimization:
             # Use ORT optimizers (native code) to optimize model
             if not skip_symbolic_shape:
diff --git a/onnxruntime/test/python/quantization/test_quant_preprocess.py b/onnxruntime/test/python/quantization/test_quant_preprocess.py
@@ -0,0 +1,162 @@
+#!/usr/bin/env python
+# -------------------------------------------------------------------------
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License. See License.txt in the project root for
+# license information.
+# --------------------------------------------------------------------------
+
+import tempfile
+import unittest
+from pathlib import Path
+
+import numpy as np
+import onnx
+
+from onnxruntime.quantization.shape_inference import quant_pre_process
+
+
+class TestUpsample(unittest.TestCase):
+    def setUp(self):
+        self.temp_dir = tempfile.TemporaryDirectory(prefix="ort.quant_preprocess_")
+        self.temp_path = Path(self.temp_dir.name)
+
+    def tearDown(self):
+        self.temp_dir.cleanup()
+
+    def build_upsample_model(self, input_shape=(1, 3, 32, 32)):
+        """
+        Build a model with deprecated Upsample op (opset <= 10) for testing version conversion.
+        """
+        input_tensor = onnx.helper.make_tensor_value_info("input", onnx.TensorProto.FLOAT, input_shape)
+        output_shape = (input_shape[0], input_shape[1], input_shape[2] * 2, input_shape[3] * 2)
+        output_tensor = onnx.helper.make_tensor_value_info("output", onnx.TensorProto.FLOAT, output_shape)
+
+        # Create scales for upsample
+        scales = np.array([1.0, 1.0, 2.0, 2.0], dtype=np.float32)
+        scales_initializer = onnx.numpy_helper.from_array(scales, "scales")
+
+        upsample_node = onnx.helper.make_node(
+            "Upsample",
+            ["input", "scales"],
+            ["output"],
+            name="upsample_node",
+            mode="nearest",
+        )
+
+        graph = onnx.helper.make_graph(
+            [upsample_node],
+            "upsample_graph",
+            [input_tensor],
+            [output_tensor],
+            initializer=[scales_initializer],
+        )
+        # Use opset 10 to trigger Upsample -> Resize conversion
+        opset_imports = [onnx.helper.make_opsetid("", 10)]
+        model = onnx.helper.make_model(graph, opset_imports=opset_imports)
+        return model
+
+    def test_upsample_to_resize_conversion(self):
+        """
+        Test that deprecated Upsample ops are converted to Resize ops.
+        """
+        model = self.build_upsample_model()
+        input_path = self.temp_path / "input_model.onnx"
+        output_path = self.temp_path / "preprocessed_model.onnx"
+
+        onnx.save_model(model, input_path)
+
+        # Verify original model has Upsample op
+        self.assertEqual(model.graph.node[0].op_type, "Upsample")
+        self.assertEqual(model.opset_import[0].version, 10)
+
+        quant_pre_process(
+            input_model=str(input_path),
+            output_model_path=str(output_path),
+            skip_optimization=True,
+            skip_onnx_shape=True,
+            skip_symbolic_shape=True,
+        )
+
+        self.assertTrue(output_path.exists())
+        preprocessed_model = onnx.load(str(output_path))
+
+        # Verify Upsample was converted to Resize and opset was upgraded
+        node_types = [node.op_type for node in preprocessed_model.graph.node]
+        assert "Resize" in node_types
+        assert "Upsample" not in node_types
+        assert preprocessed_model.opset_import[0].version >= 11
+
+
+class TestClip(unittest.TestCase):
+    def setUp(self):
+        self.temp_dir = tempfile.TemporaryDirectory(prefix="ort.quant_preprocess_")
+        self.temp_path = Path(self.temp_dir.name)
+
+    def tearDown(self):
+        self.temp_dir.cleanup()
+
+    def build_clip_model(self, input_shape=(1, 3, 32, 32)):
+        """
+        Build a model with Clip op using ai.onnx v6 for testing version conversion.
+        """
+        input_tensor = onnx.helper.make_tensor_value_info("input", onnx.TensorProto.FLOAT, input_shape)
+        output_tensor = onnx.helper.make_tensor_value_info("output", onnx.TensorProto.FLOAT, input_shape)
+
+        # Create min and max values for clip
+        min_val = np.array(0.0, dtype=np.float32)
+        max_val = np.array(6.0, dtype=np.float32)
+        min_initializer = onnx.numpy_helper.from_array(min_val, "min")
+        max_initializer = onnx.numpy_helper.from_array(max_val, "max")
+
+        clip_node = onnx.helper.make_node(
+            "Clip",
+            ["input", "min", "max"],
+            ["output"],
+            name="clip_node",
+        )
+
+        graph = onnx.helper.make_graph(
+            [clip_node],
+            "clip_graph",
+            [input_tensor],
+            [output_tensor],
+            initializer=[min_initializer, max_initializer],
+        )
+        # Use opset 6 to trigger version conversion
+        opset_imports = [onnx.helper.make_opsetid("", 6)]
+        model = onnx.helper.make_model(graph, opset_imports=opset_imports)
+        return model
+
+    def test_clip_version_conversion(self):
+        """
+        Test that Clip op from ai.onnx v6 is upgraded to v11 after quant_pre_process.
+        """
+        model = self.build_clip_model()
+        input_path = self.temp_path / "input_clip_model.onnx"
+        output_path = self.temp_path / "preprocessed_clip_model.onnx"
+
+        onnx.save_model(model, input_path)
+
+        # Verify original model has Clip op with opset 6
+        self.assertEqual(model.graph.node[0].op_type, "Clip")
+        self.assertEqual(model.opset_import[0].version, 6)
+
+        quant_pre_process(
+            input_model=str(input_path),
+            output_model_path=str(output_path),
+            skip_optimization=True,
+            skip_onnx_shape=True,
+            skip_symbolic_shape=True,
+        )
+
+        self.assertTrue(output_path.exists())
+        preprocessed_model = onnx.load(str(output_path))
+
+        # Verify Clip op is still present and opset was upgraded to v11 or higher
+        node_types = [node.op_type for node in preprocessed_model.graph.node]
+        assert "Clip" in node_types
+        assert preprocessed_model.opset_import[0].version >= 11
+
+
+if __name__ == "__main__":
+    unittest.main()