Spaces:

skkalwar
/

LLM_Model

Sleeping

Shreekant Kalwar (Nokia) committed on Sep 4

Commit

4815889

1 Parent(s): 6707a85

model change

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,6 +1,7 @@
 from fastapi import FastAPI
 from pydantic import BaseModel
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import torch
 import os
@@ -10,11 +11,24 @@ os.environ["HF_HOME"] = "/app/.cache"
 app = FastAPI()
 class ChatRequest(BaseModel):
     message: str
 # Load DeepSeek model (small one for local use)
-model_name = "deepseek-ai/deepseek-coder-1.3b-instruct"
 print("Loading model... this may take a minute ⏳")
 tokenizer = AutoTokenizer.from_pretrained(model_name)
@@ -34,5 +48,8 @@ def chat(request: ChatRequest):
     """Chat endpoint using DeepSeek model"""
     inputs = tokenizer(request.message, return_tensors="pt").to(model.device)
     outputs = model.generate(**inputs, max_new_tokens=200)
     reply = tokenizer.decode(outputs[0], skip_special_tokens=True)
     return {"reply": reply}

 from fastapi import FastAPI
 from pydantic import BaseModel
 from transformers import AutoTokenizer, AutoModelForCausalLM
+from fastapi.middleware.cors import CORSMiddleware
 import torch
 import os
 app = FastAPI()
+# ✅ Allow all origins
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],  # allow all origins
+    allow_credentials=True,
+    allow_methods=["*"],  # allow all HTTP methods
+    allow_headers=["*"],  # allow all headers
+)
 class ChatRequest(BaseModel):
     message: str
 # Load DeepSeek model (small one for local use)
+#model_name = "deepseek-ai/deepseek-coder-1.3b-instruct"
+model_name="Qwen/Qwen2.5-1.5B-Instruct"
+#model_name="TinyLlama/TinyLlama-1.1B-Chat-v1.0"
 print("Loading model... this may take a minute ⏳")
 tokenizer = AutoTokenizer.from_pretrained(model_name)
     """Chat endpoint using DeepSeek model"""
     inputs = tokenizer(request.message, return_tensors="pt").to(model.device)
     outputs = model.generate(**inputs, max_new_tokens=200)
     reply = tokenizer.decode(outputs[0], skip_special_tokens=True)
     return {"reply": reply}