meet4150's picture
download
raw
655 Bytes
import os
from langchain_huggingface import HuggingFaceEmbeddings
_embedder = None
def get_embedder() -> HuggingFaceEmbeddings:
"""
Local HuggingFace embedding model — BAAI/bge-small-en-v1.5
Downloaded once to ~/.cache/huggingface on first run.
normalize_embeddings=True required for correct cosine similarity with BGE.
"""
global _embedder
if _embedder is None:
_embedder = HuggingFaceEmbeddings(
model_name=os.getenv("HF_EMBEDDING_MODEL", "BAAI/bge-small-en-v1.5"),
model_kwargs={"device": "cpu"},
encode_kwargs={"normalize_embeddings": True},
)
return _embedder

Xet Storage Details

Size:
655 Bytes
·
Xet hash:
3e97154d5be15d164f4c3b4e0dc02a99138a351c40aa5ab303c30ea554c1cbe5

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.