diff --git a/fastembed/text/pooled_normalized_embedding.py b/fastembed/text/pooled_normalized_embedding.py
index 70660420..47ec91a1 100644
--- a/fastembed/text/pooled_normalized_embedding.py
+++ b/fastembed/text/pooled_normalized_embedding.py
@@ -75,6 +75,15 @@
         "sources": {"hf": "jinaai/jina-embeddings-v2-base-es"},
         "model_file": "onnx/model.onnx",
     },
+    {
+        "model": "thenlper/gte-base",
+        "dim": 768,
+        "description": "General text embeddings, Unimodal (text), supports English only input text, 512 input tokens truncation, Prefixes for queries/documents: not necessary, 2024 year.",
+        "license": "mit",
+        "size_in_GB": 0.44,
+        "sources": {"hf": "thenlper/gte-base"},
+        "model_file": "onnx/model.onnx",
+    },
 ]
 
 
diff --git a/tests/test_text_onnx_embeddings.py b/tests/test_text_onnx_embeddings.py
index f576330c..a40794be 100644
--- a/tests/test_text_onnx_embeddings.py
+++ b/tests/test_text_onnx_embeddings.py
@@ -64,6 +64,7 @@
     ),
     "snowflake/snowflake-arctic-embed-l": np.array([0.0189, -0.0673, 0.0183, 0.0124, 0.0146]),
     "Qdrant/clip-ViT-B-32-text": np.array([0.0083, 0.0103, -0.0138, 0.0199, -0.0069]),
+    "thenlper/gte-base": np.array([0.0038, 0.0355, 0.0181, 0.0092, 0.0654]),
 }
 
 