Added embedding_dtype and vocabulary_quantization to config

Pringled · Pringled · commit fb3b2f74848b · 2025-09-11T12:44:57.000+02:00
diff --git a/model2vec/hf_utils.py b/model2vec/hf_utils.py
@@ -53,6 +53,9 @@ def save_pretrained(
 
     save_file(model_weights, folder_path / "model.safetensors")
     tokenizer.save(str(folder_path / "tokenizer.json"), pretty=False)
+
+    # Add embedding dtype to config
+    config["embedding_dtype"] = np.dtype(embeddings.dtype).name
     json.dump(config, open(folder_path / "config.json", "w"), indent=4)
 
     # Create modules.json
diff --git a/model2vec/model.py b/model2vec/model.py
@@ -506,6 +506,7 @@ def quantize_model(
         embeddings, token_mapping, weights = quantize_vocabulary(
             n_clusters=vocabulary_quantization, weights=model.weights, embeddings=model.embedding
         )
+        model.config["vocabulary_quantization"] = vocabulary_quantization
     else:
         embeddings = model.embedding
         token_mapping = model.token_mapping

| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -506,6 +506,7 @@ def quantize_model(` |
| `506` | `506` | `embeddings, token_mapping, weights = quantize_vocabulary(` |
| `507` | `507` | `n_clusters=vocabulary_quantization, weights=model.weights, embeddings=model.embedding` |
| `508` | `508` | `)` |
|  | `509` | `+ model.config["vocabulary_quantization"] = vocabulary_quantization` |
| `509` | `510` | `else:` |
| `510` | `511` | `embeddings = model.embedding` |
| `511` | `512` | `token_mapping = model.token_mapping` |