Skip to content

Commit fbacddf

Browse files
committed
add test_hy_v3.py and test_ministral3.py
1 parent a96b39f commit fbacddf

4 files changed

Lines changed: 62 additions & 6 deletions

File tree

tests/models/test_hunyuan_v1_dense.py

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@
66
from model_test import ModelTest
77

88

9-
class TestNemotronUltra(ModelTest):
9+
class TestHunyuanV1Dense(ModelTest):
1010
NATIVE_MODEL_ID = "/monster/data/model/HY-MT1.5-1.8B" # tencent/HY-MT1.5-1.8B
1111
EVAL_TASKS_SLOW = {
1212
"arc_challenge": {
@@ -24,6 +24,5 @@ class TestNemotronUltra(ModelTest):
2424
}
2525
EVAL_TASKS_FAST = ModelTest.derive_fast_eval_tasks(EVAL_TASKS_SLOW)
2626

27-
def test_nemotron_ultra(self):
28-
# self.quantize_and_evaluate()
29-
print(self.evaluate_model(self.SAVE_PATH))
27+
def test_hunyuan_v1_dense(self):
28+
self.quantize_and_evaluate()

tests/models/test_hunyuan_v1_moe.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@
66
from model_test import ModelTest
77

88

9-
class TestNemotronUltra(ModelTest):
9+
class TestHunyuanV1MoE(ModelTest):
1010
NATIVE_MODEL_ID = "/monster/data/model/Hunyuan-A13B-Instruct" # tencent/Hunyuan-A13B-Instruct
1111
EVAL_TASKS_SLOW = {
1212
"arc_challenge": {
@@ -24,5 +24,5 @@ class TestNemotronUltra(ModelTest):
2424
}
2525
EVAL_TASKS_FAST = ModelTest.derive_fast_eval_tasks(EVAL_TASKS_SLOW)
2626

27-
def test_nemotron_ultra(self):
27+
def test_hunyuan_v1_moe(self):
2828
self.quantize_and_evaluate()

tests/models/test_hy_v3.py

Lines changed: 28 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
# SPDX-FileCopyrightText: 2024-2025 ModelCloud.ai
2+
# SPDX-FileCopyrightText: 2024-2025 qubitium@modelcloud.ai
3+
# SPDX-License-Identifier: Apache-2.0
4+
# Contact: qubitium@modelcloud.ai, x.com/qubitium
5+
6+
from model_test import ModelTest
7+
8+
9+
class TestHyV3(ModelTest):
    """Model test for the Hy-MT2-30B-A3B checkpoint.

    Declares where the checkpoint lives and the reference evaluation
    scores, then delegates the actual run to ``quantize_and_evaluate``.
    """

    # Local checkpoint directory; upstream id: tencent/Hy-MT2-30B-A3B
    NATIVE_MODEL_ID = "/monster/data/model/Hy-MT2-30B-A3B"

    # Reference scores per evaluation task.
    # NOTE(review): "floor_pct" presumably bounds how far a score may fall
    # below "value" -- confirm against ModelTest before tuning it.
    EVAL_TASKS_SLOW = {
        "arc_challenge": {
            "chat_template": True,
            "acc": {
                "value": 0.3182,
                "floor_pct": 0.36,
            },
            "acc_norm": {
                "value": 0.3472,
                "floor_pct": 0.36,
            },
        },
        "mmlu_stem": {
            "chat_template": False,
            "acc": {"value": 0.4024, "floor_pct": 0.04},
        },
    }

    # The fast table is produced from the slow one by the ModelTest helper.
    EVAL_TASKS_FAST = ModelTest.derive_fast_eval_tasks(EVAL_TASKS_SLOW)

    def test_hy_v3(self):
        # The whole flow is handled by the shared helper.
        self.quantize_and_evaluate()

tests/models/test_ministral3.py

Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
# SPDX-FileCopyrightText: 2024-2025 ModelCloud.ai
2+
# SPDX-FileCopyrightText: 2024-2025 qubitium@modelcloud.ai
3+
# SPDX-License-Identifier: Apache-2.0
4+
# Contact: qubitium@modelcloud.ai, x.com/qubitium
5+
6+
from model_test import ModelTest
7+
8+
9+
class TestMinistral3(ModelTest):
    """Model test for the Ministral-3-3B-Instruct-2512-TextOnly checkpoint.

    Declares the checkpoint location, the reference arc_challenge scores and
    the evaluation settings, then delegates to ``quantize_and_evaluate``.
    """

    # Local checkpoint directory; upstream id:
    # "Aratako/Ministral-3-3B-Instruct-2512-TextOnly"
    NATIVE_MODEL_ID = "/monster/data/model/Ministral-3-3B-Instruct-2512-TextOnly"

    # Reference arc_challenge scores.
    NATIVE_ARC_CHALLENGE_ACC = 0.4974
    NATIVE_ARC_CHALLENGE_ACC_NORM = 0.5256

    # The slow and fast aliases all carry the same reference values.
    NATIVE_ARC_CHALLENGE_ACC_SLOW = NATIVE_ARC_CHALLENGE_ACC_FAST = NATIVE_ARC_CHALLENGE_ACC
    NATIVE_ARC_CHALLENGE_ACC_NORM_SLOW = NATIVE_ARC_CHALLENGE_ACC_NORM_FAST = NATIVE_ARC_CHALLENGE_ACC_NORM

    TRUST_REMOTE_CODE = False
    EVAL_BATCH_SIZE = 6

    # Single-task table; expected values come from the constants above.
    EVAL_TASKS_SLOW = {
        "arc_challenge": {
            "chat_template": False,
            "acc": {
                "value": NATIVE_ARC_CHALLENGE_ACC,
            },
            "acc_norm": {
                "value": NATIVE_ARC_CHALLENGE_ACC_NORM,
            },
        },
    }

    # The fast table is produced from the slow one by the ModelTest helper.
    EVAL_TASKS_FAST = ModelTest.derive_fast_eval_tasks(EVAL_TASKS_SLOW)

    def test_ministral3(self):
        # The whole flow is handled by the shared helper.
        self.quantize_and_evaluate()

0 commit comments

Comments
 (0)