Gaykar commited on
Commit
b49655b
·
verified ·
1 Parent(s): f8ab8c8

Update app.py

Browse files

removed the uvicorn line

Files changed (1) hide show
  1. app.py +32 -33
app.py CHANGED
@@ -1,33 +1,32 @@
1
- from fastapi import FastAPI
2
- from pydantic import BaseModel
3
- from typing import List
4
- from sentence_transformers import SentenceTransformer
5
- import uvicorn
6
-
7
- app = FastAPI(title="Medical Embedding Service")
8
-
9
- # Load model ONCE at startup
10
- print("Loading Medical RAG Model... this may take a moment.")
11
- model = SentenceTransformer("Gaykar/all-MiniLM-L6-medical-rag")
12
- print("Model loaded successfully!")
13
-
14
- class QueryRequest(BaseModel):
15
- text: str
16
-
17
- class DocumentRequest(BaseModel):
18
- texts: List[str]
19
-
20
- @app.post("/embed_query")
21
- async def embed_query(request: QueryRequest):
22
- # Uses specialized encode_query for IR tasks
23
- embedding = model.encode_query(request.text).tolist()
24
- return {"embedding": embedding}
25
-
26
- @app.post("/embed_docs")
27
- async def embed_docs(request: DocumentRequest):
28
- # Uses specialized encode_document for IR tasks
29
- embeddings = model.encode_document(request.texts).tolist()
30
- return {"embeddings": embeddings}
31
-
32
- if __name__ == "__main__":
33
- uvicorn.run(app, host="0.0.0.0", port=8001)
 
1
+ from fastapi import FastAPI
2
+ from pydantic import BaseModel
3
+ from typing import List
4
+ from sentence_transformers import SentenceTransformer
5
+ import uvicorn
6
+
7
+ app = FastAPI(title="Medical Embedding Service")
8
+
9
+ # Load model ONCE at startup
10
+ print("Loading Medical RAG Model... this may take a moment.")
11
+ model = SentenceTransformer("Gaykar/all-MiniLM-L6-medical-rag")
12
+ print("Model loaded successfully!")
13
+
14
+ class QueryRequest(BaseModel):
15
+ text: str
16
+
17
+ class DocumentRequest(BaseModel):
18
+ texts: List[str]
19
+
20
+ @app.post("/embed_query")
21
+ async def embed_query(request: QueryRequest):
22
+ # Uses specialized encode_query for IR tasks
23
+ embedding = model.encode_query(request.text).tolist()
24
+ return {"embedding": embedding}
25
+
26
+ @app.post("/embed_docs")
27
+ async def embed_docs(request: DocumentRequest):
28
+ # Uses specialized encode_document for IR tasks
29
+ embeddings = model.encode_document(request.texts).tolist()
30
+ return {"embeddings": embeddings}
31
+
32
+