test: skip NNX int8 parameter-only checkpoint generation for GPU dot product test

hsuan-lun-chiang · ecnal-cienet · commit 450ef8da960a · 2026-05-25T15:25:35.000Z
NNX int8 parameter-only generation requires a convert-on-load setup, which causes a ValueError since the fp32 training checkpoint lacks the AqtDotGeneral state that the target int8 model expects. This aligns the GPU/dot-product test with the existing skip in the TPU/autoselected test variant.
diff --git a/tests/integration/generate_param_only_checkpoint_test.py b/tests/integration/generate_param_only_checkpoint_test.py
@@ -127,7 +127,20 @@ def test_param_ckpt_generation_with_autoselected_attention(quantization, capsys)
 @pytest.mark.external_serving
 @pytest.mark.integration_test
 @pytest.mark.gpu_only
-@pytest.mark.parametrize("quantization", [(""), ("int8")])
+@pytest.mark.parametrize(
+    "quantization",
+    [
+        (""),
+        pytest.param(
+            "int8",
+            marks=pytest.mark.skip(
+                reason="NNX int8 param-only generation is a convert-on-load case (the fp32 training "
+                "checkpoint has no AqtDotGeneral state the int8 model expects); tracked as a follow-up "
+                "alongside layerwise_quantization."
+            ),
+        ),
+    ],
+)
 def test_param_ckpt_generation_with_dot_product(quantization, capsys):
   """Tests the parameter-only checkpoint generation and decode flow on GPU with dot product attention."""
   os.environ["NVTE_FUSED_ATTN"] = "1"  # Enable fused attention