diff --git a/docs/examples/Supported_Models.ipynb b/docs/examples/Supported_Models.ipynb index 699fb405d..71888f15f 100644 --- a/docs/examples/Supported_Models.ipynb +++ b/docs/examples/Supported_Models.ipynb @@ -178,6 +178,14 @@ " Multilingual model, e5-large. Recommend using ...\n", " 2.240\n", " \n", + " \n", + " \n", + " 16\n", + " intfloat/multilingual-e5-large-instruct \n", + " 1024\n", + " Multilingual model, e5-large-instruct\n", + " 1.120\n", + " \n", " \n", "\n", "" @@ -200,6 +208,7 @@ "13 BAAI/bge-large-en-v1.5 1024 \n", "14 thenlper/gte-large 1024 \n", "15 intfloat/multilingual-e5-large 1024 \n", + "16 intfloat/multilingual-e5-large-instruct 1024 \n", "\n", " description size_in_GB \n", "0 Fast and Default English model 0.067 \n", @@ -217,7 +226,8 @@ "12 Sentence-transformers model for tasks like clu... 1.000 \n", "13 Large English model, v1.5 1.200 \n", "14 Large general text embeddings model 1.200 \n", - "15 Multilingual model, e5-large. Recommend using ... 2.240 " + "15 Multilingual model, e5-large. Recommend using ... 2.240 \n", + "16 Multilingual model, e5-large-instruct. 1.120 " ] }, "execution_count": 6, diff --git a/fastembed/text/e5_onnx_embedding.py b/fastembed/text/e5_onnx_embedding.py index 9c37174cd..28fda2522 100644 --- a/fastembed/text/e5_onnx_embedding.py +++ b/fastembed/text/e5_onnx_embedding.py @@ -25,6 +25,15 @@ "hf": "xenova/paraphrase-multilingual-mpnet-base-v2", }, }, + { + "model": "intfloat/multilingual-e5-large-instruct", + "dim": 1024, + "description": "multilingual model, e5-large-instruct", + "size_in_GB": 1.12, + "sources": { + "hf": "yashvardhan7/multilingual-e5-large-instruct", + }, + }, ] diff --git a/tests/test_text_onnx_embeddings.py b/tests/test_text_onnx_embeddings.py index be7105259..7929fefb3 100644 --- a/tests/test_text_onnx_embeddings.py +++ b/tests/test_text_onnx_embeddings.py @@ -28,6 +28,7 @@ ), "thenlper/gte-large": np.array([-0.01920587, 0.00113156, -0.00708992, -0.00632304, -0.04025577]), "mixedbread-ai/mxbai-embed-large-v1": np.array([0.02295546, 0.03196154, 0.016512, -0.04031524, -0.0219634]), + "intfloat/multilingual-e5-large-instruct": np.array([ 0.01020065, 0.0236722, 0.00117698, -0.04327101, 0.02887568]), }