Skip to content

Commit 1002e69

Browse files
[FIX] ci test (#2843)
* fix test_llama3_2_exllamav3.py

  Signed-off-by: ZX-ModelCloud <zx@modelcloud.ai>

* fix test_falcon.py and test_gpt_oss.py

  Signed-off-by: ZX-ModelCloud <zx@modelcloud.ai>

---------

Signed-off-by: ZX-ModelCloud <zx@modelcloud.ai>
1 parent bb0e0eb commit 1002e69

3 files changed

Lines changed: 6 additions & 1 deletion

File tree

gptqmodel/looper/exllamav3_processor.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -141,6 +141,7 @@ def preprocess(self, module: NamedModule, fallback=None, **kwargs):
141141
sym=True,
142142
device=module_qcfg.device,
143143
pack_dtype=module_qcfg.pack_dtype,
144+
act_group_aware=False,
144145
)
145146

146147
task = GPTQ(module=module, qcfg=capture_qcfg)

tests/models/test_falcon.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,8 @@
44
# Contact: qubitium@modelcloud.ai, x.com/qubitium
55

66
import torch # noqa: E402
7+
8+
from gptqmodel import BACKEND
79
from model_test import ModelTest
810

911

@@ -22,6 +24,7 @@ class TestFalcon(ModelTest):
2224
EVAL_BATCH_SIZE = 6
2325
USE_VLLM = False
2426
ACT_GROUP_AWARE = False
27+
LOAD_BACKEND = BACKEND.AUTO
2528

2629
def test_falcon(self):
2730
self.quantize_and_evaluate()

tests/models/test_gpt_oss.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
# SPDX-FileCopyrightText: 2024-2025 qubitium@modelcloud.ai
33
# SPDX-License-Identifier: Apache-2.0
44
# Contact: qubitium@modelcloud.ai, x.com/qubitium
5-
5+
from gptqmodel import BACKEND
66
from model_test import ModelTest
77

88

@@ -21,6 +21,7 @@ class TestGPTOSS(ModelTest):
2121
EVAL_BATCH_SIZE = 6
2222
USE_VLLM = False
2323
ACT_GROUP_AWARE = False
24+
LOAD_BACKEND = BACKEND.AUTO
2425

2526
def test_gpt_oss(self):
2627
self.quantize_and_evaluate()

0 commit comments

Comments
 (0)