Skip to content

Commit 16f3c6d

Browse files
committed: move workflow test to gpu tests
Signed-off-by: Will Guo <willg@nvidia.com>
1 parent 88b0bc0 commit 16f3c6d

3 files changed

Lines changed: 4 additions & 6 deletions

File tree

modelopt/onnx/quantization/autotune/__main__.py

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -112,8 +112,6 @@ def run_autotune() -> int:
112112
logger.error("Failed to initialize TensorRT benchmark")
113113
return 1
114114

115-
logger.info("Autotuning Mode: Pattern-Based")
116-
117115
try:
118116
node_filter_list = None
119117
if args.node_filter_list:

tests/_test_utils/onnx/quantization/autotune/models.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -25,9 +25,9 @@
2525

2626
def _create_simple_conv_onnx_model():
2727
"""Build ONNX model: Input -> Conv -> Relu -> Output (minimal for autotuner tests)."""
28-
input_tensor = helper.make_tensor_value_info("input", onnx.TensorProto.FLOAT, [1, 3, 224, 224])
28+
input_tensor = helper.make_tensor_value_info("input", onnx.TensorProto.FLOAT, [32, 3, 224, 224])
2929
output_tensor = helper.make_tensor_value_info(
30-
"output", onnx.TensorProto.FLOAT, [1, 64, 224, 224]
30+
"output", onnx.TensorProto.FLOAT, [32, 64, 224, 224]
3131
)
3232
conv_node = helper.make_node(
3333
"Conv", inputs=["input", "conv_weight"], outputs=["conv_out"], name="conv"

tests/unit/onnx/quantization/autotune/test_workflow.py renamed to tests/gpu/onnx/quantization/autotune/test_workflow.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -52,11 +52,11 @@ def test_export_quantized_model(use_trtexec, simple_conv_model):
5252
output_path = output_dir + ".quant.onnx"
5353

5454
try:
55-
init_benchmark_instance(use_trtexec=use_trtexec)
55+
init_benchmark_instance(use_trtexec=use_trtexec, timing_runs=100)
5656
autotuner = region_pattern_autotuning_workflow(baseline_model_path, Path(output_dir))
5757

5858
# Export model with Q/DQ insertion
59-
autotuner.export_onnx(output_path, insert_qdq=True)
59+
autotuner.export_onnx(output_path, insert_qdq=True, best=True)
6060

6161
# Verify file was created
6262
assert os.path.exists(output_path)

0 commit comments

Comments (0)