Skip to content

Commit fd0b26f

Browse files
deichrenner and joein authored
Add support for jinaai/jina-embeddings-v2-base-de (#270)
* feat: add support for SOTA German embedding model with long context length jinaai/jina-embeddings-v2-base-de
* Fix jina de model weight

---------

Co-authored-by: George <[email protected]>
1 parent 5461012 commit fd0b26f

File tree

2 files changed

+9
-0
lines changed

2 files changed

+9
-0
lines changed

fastembed/text/jina_onnx_embedding.py

+8
Original file line number | Diff line number | Diff line change
@@ -24,6 +24,14 @@
2424
"sources": {"hf": "xenova/jina-embeddings-v2-small-en"},
2525
"model_file": "onnx/model.onnx",
2626
},
27+
{
28+
"model": "jinaai/jina-embeddings-v2-base-de",
29+
"dim": 768,
30+
"description": "German embedding model supporting 8192 sequence length",
31+
"size_in_GB": 0.32,
32+
"sources": {"hf": "jinaai/jina-embeddings-v2-base-de"},
33+
"model_file": "onnx/model_fp16.onnx",
34+
},
2735
]
2836

2937

tests/test_text_onnx_embeddings.py

+1
Original file line number | Diff line number | Diff line change
@@ -36,6 +36,7 @@
3636
),
3737
"jinaai/jina-embeddings-v2-small-en": np.array([-0.0455, -0.0428, -0.0122, 0.0613, 0.0015]),
3838
"jinaai/jina-embeddings-v2-base-en": np.array([-0.0332, -0.0509, 0.0287, -0.0043, -0.0077]),
39+
"jinaai/jina-embeddings-v2-base-de": np.array([-0.0085, 0.0417, 0.0342, 0.0309, -0.0149]),
3940
"nomic-ai/nomic-embed-text-v1": np.array([0.0061, 0.0103, -0.0296, -0.0242, -0.0170]),
4041
"nomic-ai/nomic-embed-text-v1.5": np.array(
4142
[-1.6531514e-02, 8.5380634e-05, -1.8171231e-01, -3.9333291e-03, 1.2763254e-02]

0 commit comments

Comments
 (0)