Skip to content

Commit

Permalink
chore: xenova jina
Browse files Browse the repository at this point in the history
  • Loading branch information
Anush008 committed Jan 30, 2024
1 parent ede507e commit 3caeeeb
Show file tree
Hide file tree
Showing 2 changed files with 16 additions and 3 deletions.
15 changes: 14 additions & 1 deletion fastembed/embedding.py
Original file line number Diff line number Diff line change
Expand Up @@ -95,13 +95,26 @@ def __init__(
model_path = self.path / "model.onnx"
optimized_model_path = self.path / "model_optimized.onnx"

xenova_model_path = self.path / "onnx" / "model.onnx"
xenova_optimized_model_path = self.path / "onnx" / "model_optimized.onnx"

# List of Execution Providers: https://onnxruntime.ai/docs/execution-providers
onnx_providers = ["CPUExecutionProvider"]

if not model_path.exists():
# Rename file model_optimized.onnx to model.onnx if it exists
if optimized_model_path.exists():
optimized_model_path.rename(model_path)

# Patch for inconsistent repo structure at
# - https://huggingface.co/Xenova/jina-embeddings-v2-small-en
# - https://huggingface.co/Xenova/jina-embeddings-v2-base-en
elif xenova_model_path.exists():
model_path = xenova_model_path

elif xenova_optimized_model_path.exists():
model_path = xenova_optimized_model_path

else:
raise ValueError(f"Could not find model.onnx in {self.path}")

Expand All @@ -118,7 +131,7 @@ def __init__(
so.inter_op_num_threads = max_threads

self.tokenizer = self.load_tokenizer(self.path, max_length=max_length)
self.model = ort.InferenceSession(str(model_path), providers=onnx_providers, sess_options=so)
self.model = ort.InferenceSession(str(model_path), providers=onnx_providers, sess_options=so)

def onnx_embed(self, documents: List[str]) -> Tuple[np.ndarray, np.ndarray]:
encoded = self.tokenizer.encode_batch(documents)
Expand Down
4 changes: 2 additions & 2 deletions fastembed/models.json
Original file line number Diff line number Diff line change
Expand Up @@ -83,7 +83,7 @@
"description": " English embedding model supporting 8192 sequence length",
"size_in_GB": 0.55,
"hf_sources": [
"jinaai/jina-embeddings-v2-base-en"
"xenova/jina-embeddings-v2-base-en"
],
"compressed_url_sources": []
},
Expand All @@ -93,7 +93,7 @@
"description": " English embedding model supporting 8192 sequence length",
"size_in_GB": 0.13,
"hf_sources": [
"jinaai/jina-embeddings-v2-small-en"
"xenova/jina-embeddings-v2-small-en"
],
"compressed_url_sources": []
},
Expand Down

0 comments on commit 3caeeeb

Please sign in to comment.