# Text Embeddings Inference (TEI) CPU image that serves an embedding model.
# The base tag is pinned for reproducible builds; override it with
#   docker build --build-arg TEI_TAG=<tag> .
ARG TEI_TAG=cpu-1.8
FROM ghcr.io/huggingface/text-embeddings-inference:${TEI_TAG}


# Optional: Hugging Face mirror for faster downloads from mainland China.
# NOTE(review): the URL was truncated to "https:" before this change;
# hf-mirror.com is the assumed mirror -- confirm, or remove this line to use
# the default hub endpoint.
ENV HF_ENDPOINT=https://hf-mirror.com
ENV HF_HOME=/data/huggingface


# Key step (currently disabled): upgrade the transformers library to support
# newer architectures such as Gemma3.
# RUN pip install --upgrade transformers sentence-transformers huggingface-hub


# Model selection (lightweight model, suitable for a free CPU tier).
# MODEL_ID is the single place to switch models: the TEI router reads it from
# the environment, so the CMD below does not repeat it.
# ENV MODEL_ID="Maxi-Lein/Qwen3-Embedding-4B-onnx"
ENV MODEL_ID="Qwen/Qwen3-Embedding-0.6B"
# ENV MODEL_ID="BAAI/bge-small-zh-v1.5"


# ENV INFINITY_MODEL_ID="microsoft/harrier-oss-v1-0.6b"
# BAAI/bge-small-zh-v1.5 (Chinese + English, lightweight, 24M parameters)


# Start TEI listening on port 7860 (required by HF).
# EXPOSE is documentation only; it does not publish the port.
EXPOSE 7860
# NOTE(review): the Qwen3-Embedding model card uses last-token pooling; confirm
# that "mean" is intentional before changing it, since switching pooling
# changes the vectors returned to existing clients.
# CMD ["--model-id", "Maxi-Lein/Qwen3-Embedding-4B-onnx", "--pooling", "mean", "--port", "7860"]
CMD ["--pooling", "mean", "--port", "7860"]