File tree Expand file tree Collapse file tree
unittest/auto_deploy/singlegpu/shim Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -358,7 +358,6 @@ unittest/_torch/thop/serial/test_moe.py::TestMoeFp4::test_no_autotune[use_score_
358358unittest/_torch/thop/serial/test_moe.py::TestMoeFp4::test_no_autotune[use_score_as_input-RoutingRenormalize_qwen_next-swiglu-1024-1024-150] SKIP (https://nvbugs/5908070)
359359unittest/_torch/thop/serial/test_moe.py::TestMoeFp4::test_no_autotune[use_score_as_input-RoutingRenormalize_topk_4-swiglu-1024-1024-150] SKIP (https://nvbugs/5908070)
360360unittest/_torch/visual_gen/test_flux_pipeline.py::TestFluxCombinedOptimizations::test_all_optimizations_combined SKIP (https://nvbugs/6199854)
361- unittest/auto_deploy/singlegpu/shim/test_llm_config.py::test_speculative_flashinfer_fallback_disables_piecewise SKIP (https://nvbugs/6309375)
362361unittest/auto_deploy/singlegpu/smoke SKIP (https://nvbugs/6306936)
363362unittest/auto_deploy/singlegpu/smoke/test_disagg.py::test_autodeploy_disaggregated_batch_smoke[deepseek-trtllm-simple] SKIP (https://nvbugs/6307525)
364363unittest/auto_deploy/singlegpu/smoke/test_disagg.py::test_autodeploy_disaggregated_batch_smoke[llama-flashinfer-cudagraph] SKIP (https://nvbugs/6307525)
Original file line number Diff line number Diff line change @@ -95,25 +95,6 @@ def test_yaml_compile_backend_disables_default_piecewise(tmp_path):
9595 assert args .transforms ["compile_model" ]["piecewise_enabled" ] is False
9696
9797
98- def test_speculative_flashinfer_fallback_disables_piecewise ():
99- from tensorrt_llm .llmapi import EagleDecodingConfig
100-
101- spec_config = EagleDecodingConfig (
102- max_draft_len = 3 ,
103- speculative_model = "some/model" ,
104- eagle3_one_model = True ,
105- )
106-
107- args = LlmArgs (
108- model = "test-model" ,
109- attn_backend = "flashinfer" ,
110- speculative_config = spec_config ,
111- )
112-
113- assert args .compile_backend == "torch-simple"
114- assert args .transforms ["compile_model" ]["piecewise_enabled" ] is False
115-
116-
11798def test_cache_transceiver_rejects_unmanaged_persistent_caches ():
11899 """Cache transceiver rejects unmanaged persistent cache resources."""
119100 args = LlmArgs (
You can’t perform that action at this time.
0 commit comments