Skip to content

Commit d135f5d

Browse files
committed
Add SM constraint
Signed-off-by: Zheyu Fu <zheyuf@NVIDIA.com>
1 parent b8ec221 commit d135f5d

1 file changed

Lines changed: 3 additions & 3 deletions

File tree

tests/integration/defs/accuracy/test_llm_api_pytorch.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -539,7 +539,7 @@ def test_pard_sa_global_pool(self):
539 539
task = GSM8K(self.MODEL_NAME)
540 540
task.evaluate(llm, extra_acc_spec="use_sa_spec")
541 541

542 -
@pytest.mark.skip_less_device_memory(60000)
542 +
@skip_pre_hopper
543 543
@parametrize_with_ids("enable_max_concurrency,enable_draft_len_schedule", [
544 544
(False, True),
545 545
(True, False),
@@ -577,7 +577,7 @@ def test_pard_dynamic_draft_len(self, enable_max_concurrency,
577 577
task = GSM8K(self.MODEL_NAME)
578 578
task.evaluate(llm)
579 579

580 -
@pytest.mark.skip_less_device_memory(60000)
580 +
@skip_pre_hopper
581 581
@parametrize_with_ids("enable_max_concurrency,enable_draft_len_schedule", [
582 582
(False, True),
583 583
(True, False),
@@ -1937,6 +1937,7 @@ def test_bfloat16_mtp_sa_global_pool(self):
1937 1937
task = GSM8K(self.MODEL_NAME)
1938 1938
task.evaluate(llm, extra_acc_spec="use_sa_spec")
1939 1939

1940 +
@pytest.mark.skip_less_device_memory(60000)
1940 1941
@parametrize_with_ids("enable_max_concurrency,enable_draft_len_schedule", [
1941 1942
(False, True),
1942 1943
(True, False),
@@ -2052,7 +2053,6 @@ def test_mtp_eagle_dynamic_draft_len(self, enable_max_concurrency,
2052 2053
task = GSM8K(self.MODEL_NAME)
2053 2054
task.evaluate(llm)
2054 2055

2055 -
@pytest.mark.skip_less_device_memory(60000)
2056 2056
@parametrize_with_ids("enable_max_concurrency,enable_draft_len_schedule", [
2057 2057
(False, True),
2058 2058
(True, False),

0 commit comments

Comments
 (0)