# Image that serves a Hugging Face embedding model with
# text-embeddings-inference (TEI) on CPU, listening on port 7860.
#
# NOTE(review): `cpu-latest` is a floating tag, so rebuilds are not
# reproducible. Consider pinning a specific release tag or digest once a
# version known to support the chosen model has been confirmed.
FROM ghcr.io/huggingface/text-embeddings-inference:cpu-latest

# Optional: download acceleration for mainland China via a Hub mirror, and
# the directory used for Hugging Face data.
ENV HF_ENDPOINT=https://hf-mirror.com \
    HF_HOME=/data/huggingface

# Key step (currently disabled): upgrade the transformers libraries to support
# newer architectures such as Gemma3.
# RUN pip install --upgrade transformers sentence-transformers huggingface-hub

# Model selection (lightweight models, suitable for a free CPU tier).
# Keep this value in sync with the --model-id argument in CMD below.
# ENV MODEL_ID="Maxi-Lein/Qwen3-Embedding-4B-onnx"
ENV MODEL_ID="Qwen/Qwen3-Embedding-0.6B"
# ENV MODEL_ID="BAAI/bge-small-zh-v1.5"
# ENV INFINITY_MODEL_ID="microsoft/harrier-oss-v1-0.6b"
# BAAI/bge-small-zh-v1.5 (Chinese + English, lightweight, 24M parameters)

# Documentation only: the port passed to the server in CMD below.
EXPOSE 7860

# Start TEI listening on port 7860 (required by HF). These are default
# arguments only; the executable comes from the base image's ENTRYPOINT.
# NOTE(review): the Qwen3-Embedding model card describes last-token pooling;
# confirm that overriding it with `--pooling mean` is intended before changing
# it, since switching pooling changes the vectors already produced.
# CMD ["--model-id", "Maxi-Lein/Qwen3-Embedding-4B-onnx", "--pooling", "mean", "--port", "7860"]
CMD ["--model-id", "Qwen/Qwen3-Embedding-0.6B", "--pooling", "mean", "--port", "7860"]