@@ -539,7 +539,7 @@ def test_pard_sa_global_pool(self):
539539 task = GSM8K (self .MODEL_NAME )
540540 task .evaluate (llm , extra_acc_spec = "use_sa_spec" )
541541
542- @pytest . mark . skip_less_device_memory ( 60000 )
542+ @skip_pre_hopper
543543 @parametrize_with_ids ("enable_max_concurrency,enable_draft_len_schedule" , [
544544 (False , True ),
545545 (True , False ),
@@ -577,7 +577,7 @@ def test_pard_dynamic_draft_len(self, enable_max_concurrency,
577577 task = GSM8K (self .MODEL_NAME )
578578 task .evaluate (llm )
579579
580- @pytest . mark . skip_less_device_memory ( 60000 )
580+ @skip_pre_hopper
581581 @parametrize_with_ids ("enable_max_concurrency,enable_draft_len_schedule" , [
582582 (False , True ),
583583 (True , False ),
@@ -1937,6 +1937,7 @@ def test_bfloat16_mtp_sa_global_pool(self):
19371937 task = GSM8K (self .MODEL_NAME )
19381938 task .evaluate (llm , extra_acc_spec = "use_sa_spec" )
19391939
1940+ @pytest .mark .skip_less_device_memory (60000 )
19401941 @parametrize_with_ids ("enable_max_concurrency,enable_draft_len_schedule" , [
19411942 (False , True ),
19421943 (True , False ),
@@ -2052,7 +2053,6 @@ def test_mtp_eagle_dynamic_draft_len(self, enable_max_concurrency,
20522053 task = GSM8K (self .MODEL_NAME )
20532054 task .evaluate (llm )
20542055
2055- @pytest .mark .skip_less_device_memory (60000 )
20562056 @parametrize_with_ids ("enable_max_concurrency,enable_draft_len_schedule" , [
20572057 (False , True ),
20582058 (True , False ),
0 commit comments