|
101 | 101 | from .definitions.glm4_moe import GLM4MoEGPTQ # noqa: E402 |
102 | 102 | from .definitions.glm4_moe_lite import Glm4MoeLiteQModel # noqa: E402 |
103 | 103 | from .definitions.glm4v import Glm4vGPTQ # noqa: E402 |
104 | | -from .definitions.glm4v_moe import Glm4vMoeQModel # noqa: E402 |
| 104 | +from .definitions.glm4v_moe import Glm4vMoeQModel, Glm4vMoeTextQModel # noqa: E402 |
105 | 105 | from .definitions.glm_moe_dsa import GlmMoeDsaQModel # noqa: E402 |
106 | 106 | from .definitions.glm_ocr import GlmOCRGPTQ # noqa: E402 |
107 | 107 | from .definitions.glmasr import GlmASRGPTQ # noqa: E402 |
|
128 | 128 | from .definitions.lfm2_moe import LFM2MoeQModel # noqa: E402 |
129 | 129 | from .definitions.llada2 import LLaDA2MoeQModel |
130 | 130 | from .definitions.llama import LlamaQModel # noqa: E402 |
131 | | -from .definitions.llama4 import Llama4QModel # noqa: E402 |
| 131 | +from .definitions.llama4 import Llama4QModel, Llama4TextQModel # noqa: E402 |
132 | 132 | from .definitions.llava_qwen2 import LlavaQwen2QModel # noqa: E402 |
133 | 133 | from .definitions.longcat_flash import LongCatFlashQModel # noqa: E402 |
134 | 134 | from .definitions.mimo import MimoQModel # noqa: E402 |
|
141 | 141 | from .definitions.minimax_m2 import MiniMaxM2GPTQ # noqa: E402 |
142 | 142 | from .definitions.mistral3 import Mistral3GPTQ |
143 | 143 | from .definitions.mixtral import MixtralQModel # noqa: E402 |
144 | | -from .definitions.mllama import MLlamaQModel # noqa: E402 |
| 144 | +from .definitions.mllama import MLlamaQModel, MLlamaTextQModel # noqa: E402 |
145 | 145 | from .definitions.mobilellm import MobileLLMQModel # noqa: E402 |
146 | 146 | from .definitions.moss import MossQModel # noqa: E402 |
147 | 147 | from .definitions.mpt import MptQModel # noqa: E402 |
|
206 | 206 | "gpt2": GPT2QModel, |
207 | 207 | "llama": LlamaQModel, |
208 | 208 | "llama4": Llama4QModel, |
| 209 | + "llama4_text": Llama4TextQModel, |
209 | 210 | "opt": OptQModel, |
210 | 211 | "moss": MossQModel, |
211 | 212 | "chatglm": ChatGLMQModel, |
212 | 213 | "glm": GlmQModel, |
213 | 214 | "glm4": GlmQModel, |
214 | 215 | "glm4v": Glm4vGPTQ, |
215 | 216 | "glm4v_moe": Glm4vMoeQModel, |
| 217 | + "glm4v_moe_text": Glm4vMoeTextQModel, |
216 | 218 | "glmasr": GlmASRGPTQ, |
217 | 219 | "glm_ocr": GlmOCRGPTQ, |
218 | 220 | "glm4_moe": GLM4MoEGPTQ, |
|
287 | 289 | "exaone4": Exaone4QModel, |
288 | 290 | "grinmoe": GrinMoeQModel, |
289 | 291 | "mllama": MLlamaQModel, |
| 292 | + "mllama_text_model": MLlamaTextQModel, |
290 | 293 | "marin": Qwen3QModel, |
291 | 294 | "granite": LlamaQModel, # 100% llama clone |
292 | 295 | "granitemoehybrid": GraniteMoeHybridQModel, |
@@ -449,25 +452,6 @@ def _get_config_load_kwargs(kwargs: dict) -> dict: |
449 | 452 | return get_hf_gguf_load_kwargs(kwargs) |
450 | 453 |
|
451 | 454 |
|
452 | | -def _normalize_supported_model_type(config) -> str: |
453 | | - model_type = config.model_type.lower() |
454 | | - config_class_name = type(config).__name__ |
455 | | - |
456 | | - if model_type == "qwen3_5": |
457 | | - if config_class_name == "Qwen3_5TextConfig": |
458 | | - return "qwen3_5_text" |
459 | | - if not hasattr(config, "text_config") and not hasattr(config, "vision_config"): |
460 | | - return "qwen3_5_text" |
461 | | - |
462 | | - if model_type == "qwen3_5_moe": |
463 | | - if config_class_name == "Qwen3_5MoeTextConfig": |
464 | | - return "qwen3_5_moe_text" |
465 | | - if not hasattr(config, "text_config") and not hasattr(config, "vision_config"): |
466 | | - return "qwen3_5_moe_text" |
467 | | - |
468 | | - return model_type |
469 | | - |
470 | | - |
471 | 455 | def check_and_get_model_definition(model_dir, trust_remote_code=False, **config_load_kwargs): |
472 | 456 | if "gguf_file" not in config_load_kwargs: |
473 | 457 | model_dir = normalize_model_id_or_path_for_hf_gguf( |
|
0 commit comments