Buckets:
| import os | |
| from langchain_huggingface import HuggingFaceEmbeddings | |
| _embedder = None | |
| def get_embedder() -> HuggingFaceEmbeddings: | |
| """ | |
| Local HuggingFace embedding model — BAAI/bge-small-en-v1.5 | |
| Downloaded once to ~/.cache/huggingface on first run. | |
| normalize_embeddings=True required for correct cosine similarity with BGE. | |
| """ | |
| global _embedder | |
| if _embedder is None: | |
| _embedder = HuggingFaceEmbeddings( | |
| model_name=os.getenv("HF_EMBEDDING_MODEL", "BAAI/bge-small-en-v1.5"), | |
| model_kwargs={"device": "cpu"}, | |
| encode_kwargs={"normalize_embeddings": True}, | |
| ) | |
| return _embedder | |
Xet Storage Details
- Size:
- 655 Bytes
- Xet hash:
- 3e97154d5be15d164f4c3b4e0dc02a99138a351c40aa5ab303c30ea554c1cbe5
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.