diff --git a/fastembed/text/onnx_embedding.py b/fastembed/text/onnx_embedding.py index 1e9978f75..de1f4e0b6 100644 --- a/fastembed/text/onnx_embedding.py +++ b/fastembed/text/onnx_embedding.py @@ -180,6 +180,19 @@ sources=ModelSource(hf="jinaai/jina-clip-v1"), model_file="onnx/text_model.onnx", ), + DenseModelDescription( + model="intfloat/multilingual-e5-large-instruct", + dim=1024, + description=( + "Text embeddings, Unimodal (text), Multilingual, 512 input tokens truncation, " + "Prefixes for queries/documents: necessary, 2024 year." + ), + license="mit", + size_in_GB=2.25, + sources=ModelSource(hf="intfloat/multilingual-e5-large-instruct"), + model_file="onnx/model.onnx", + additional_files=["onnx/model.onnx_data"] + ) ] diff --git a/tests/test_text_onnx_embeddings.py b/tests/test_text_onnx_embeddings.py index cdd22d79a..f81d9034f 100644 --- a/tests/test_text_onnx_embeddings.py +++ b/tests/test_text_onnx_embeddings.py @@ -36,6 +36,7 @@ [0.0361, 0.1862, 0.2776, 0.2461, -0.1904] ), "intfloat/multilingual-e5-large": np.array([0.4544, -0.0968, 0.1054, -1.3753, 0.1500]), + "intfloat/multilingual-e5-large-instruct": np.array([0.01044649, 0.02897520, 0.00060697, -0.04193532, 0.02606634]), "sentence-transformers/paraphrase-multilingual-mpnet-base-v2": np.array( [0.0047, 0.1334, -0.0102, 0.0714, 0.1930] ),