We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent d575ebf; commit cde1604. Copy full SHA for cde1604
1 file changed
tests/models/test_llama3_2_exllamav3.py
@@ -8,7 +8,6 @@
8
9
import torch
10
11
-
12
TESTS_MODELS_ROOT = os.path.abspath(os.path.join(os.path.dirname(__file__), ".."))
13
if TESTS_MODELS_ROOT not in sys.path:
14
sys.path.insert(0, TESTS_MODELS_ROOT)
@@ -67,6 +66,7 @@ class TestLlama3_2_ExllamaV3(ModelTest):
67
66
TORCH_DTYPE = torch.float16
68
QUANT_BACKEND = BACKEND.EXLLAMA_V3
69
LOAD_BACKEND = BACKEND.EXLLAMA_V3
+ MODEL_COMPAT_FAST_LAYER_POSITION = "first"
70
71
def test_llama3_2_exllamav3(self):
72
self.quantize_and_evaluate()
0 commit comments