Skip to content

Commit 2e6c8ab

Browse files
fix: Updated nomic ai with mean pooling
1 parent fa11d0f commit 2e6c8ab

File tree

4 files changed: 21 additions and 12 deletions.

4 files changed: 21 additions and 12 deletions.

fastembed/text/pooled_embedding.py

Lines changed: 0 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -18,17 +18,6 @@
1818
},
1919
"model_file": "onnx/model.onnx",
2020
},
21-
{
22-
"model": "nomic-ai/nomic-embed-text-v1.5-Q",
23-
"dim": 768,
24-
"description": "Text embeddings, Multimodal (text, image), English, 8192 input tokens truncation, Prefixes for queries/documents: necessary, 2024 year.",
25-
"license": "apache-2.0",
26-
"size_in_GB": 0.13,
27-
"sources": {
28-
"hf": "nomic-ai/nomic-embed-text-v1.5",
29-
},
30-
"model_file": "onnx/model_quantized.onnx",
31-
},
3221
{
3322
"model": "nomic-ai/nomic-embed-text-v1",
3423
"dim": 768,

fastembed/text/pooled_normalized_embedding.py

Lines changed: 11 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,17 @@
99
from fastembed.text.pooled_embedding import PooledEmbedding
1010

1111
supported_pooled_normalized_models = [
12+
{
13+
"model": "nomic-ai/nomic-embed-text-v1.5-Q",
14+
"dim": 768,
15+
"description": "Text embeddings, Multimodal (text, image), English, 8192 input tokens truncation, Prefixes for queries/documents: necessary, 2024 year.",
16+
"license": "apache-2.0",
17+
"size_in_GB": 0.13,
18+
"sources": {
19+
"hf": "nomic-ai/nomic-embed-text-v1.5",
20+
},
21+
"model_file": "onnx/model_quantized.onnx",
22+
},
1223
{
1324
"model": "sentence-transformers/all-MiniLM-L6-v2",
1425
"dim": 384,

fastembed/text/text_embedding.py

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,4 @@
1+
import warnings
12
from typing import Any, Iterable, Optional, Sequence, Type, Union
23

34
import numpy as np
@@ -62,6 +63,14 @@ def __init__(
6263
**kwargs,
6364
):
6465
super().__init__(model_name, cache_dir, threads, **kwargs)
66+
if model_name == "nomic-ai/nomic-embed-text-v1.5-Q":
67+
warnings.warn(
68+
"The model 'nomic-ai/nomic-embed-text-v1.5-Q' has been updated to include a mean pooling layer. "
69+
"Please ensure your usage aligns with the new functionality. "
70+
"Support for the previous version without mean pooling will be removed as of version 0.5.2.",
71+
UserWarning,
72+
stacklevel=2,
73+
)
6574
for EMBEDDING_MODEL_TYPE in self.EMBEDDINGS_REGISTRY:
6675
supported_models = EMBEDDING_MODEL_TYPE.list_supported_models()
6776
if any(model_name.lower() == model["model"].lower() for model in supported_models):

tests/test_text_onnx_embeddings.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -48,7 +48,7 @@
4848
[-0.15407836, -0.03053198, -3.9138033, 0.1910364, 0.13224715]
4949
),
5050
"nomic-ai/nomic-embed-text-v1.5-Q": np.array(
51-
[-0.12525563, 0.38030425, -3.961622, 0.04176439, -0.0758301]
51+
[0.0035279, 0.0162738, -0.1893193, 0.0194878, -0.0119418]
5252
),
5353
"thenlper/gte-large": np.array(
5454
[-0.01920587, 0.00113156, -0.00708992, -0.00632304, -0.04025577]

0 commit comments

Comments
 (0)