ex510 commited on
Commit
40b4ddb
·
verified ·
1 Parent(s): 3a33bda

Create main.py

Browse files
Files changed (1) hide show
  1. main.py +35 -0
main.py ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from fastapi import FastAPI, HTTPException
2
+ from pydantic import BaseModel
3
+ from sentence_transformers import SentenceTransformer
4
+ import uvicorn
5
+
6
+ app = FastAPI(title="Text Embedding API (KaLM-Embedding-Gemma3-12B)")
7
+
8
+ class TextRequest(BaseModel):
9
+ text: str
10
+
11
+ # Load Model
12
+ model_id = 'tencent/KaLM-Embedding-Gemma3-12B-2511'
13
+ model = SentenceTransformer(model_id)
14
+
15
+ @app.get("/")
16
+ def home():
17
+ return {"status": "online", "model": model_id, "endpoint": "/embed/text"}
18
+
19
+ @app.post("/embed/text")
20
+ async def embed_text(request: TextRequest):
21
+ try:
22
+ # Generate embedding
23
+ embedding = model.encode(request.text).tolist()
24
+
25
+ return {
26
+ "success": True,
27
+ "model": model_id,
28
+ "dimension": len(embedding),
29
+ "embedding": embedding
30
+ }
31
+ except Exception as e:
32
+ raise HTTPException(status_code=400, detail=str(e))
33
+
34
+ if __name__ == "__main__":
35
+ uvicorn.run(app, host="0.0.0.0", port=7860)