ciyidogan committed on
Commit
933f767
·
verified ·
1 Parent(s): 9a84c07

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -6
app.py CHANGED
@@ -21,10 +21,12 @@ def log(message):
21
  # === FastAPI başlat
22
  app = FastAPI()
23
  pipe = None
 
 
24
 
25
  @app.on_event("startup")
26
  def load_model():
27
- global pipe
28
  model_name = "atasoglu/Turkish-Llama-3-8B-function-calling"
29
  log(f"⬇️ Model yükleniyor: {model_name}")
30
  model, tokenizer = FastLanguageModel.from_pretrained(
@@ -48,16 +50,19 @@ class TestRequest(BaseModel):
48
  def test(req: TestRequest):
49
  prompt = f"Kullanıcı: {req.user_input}\nAsistan:"
50
  log(f"💬 Prompt alındı: {req.user_input}")
51
- outputs = pipe(
52
- prompt,
 
53
  max_new_tokens=256,
54
  temperature=0.2,
55
  top_p=0.95,
56
- repetition_penalty=1.1
 
57
  )
58
- answer = outputs[0]["generated_text"].replace(prompt, "").strip()
 
59
  log("✅ Cevap üretildi.")
60
- return {"response": answer}
61
 
62
  @app.get("/")
63
  def health():
 
21
  # === FastAPI başlat
22
  app = FastAPI()
23
  pipe = None
24
+ model = None
25
+ tokenizer = None
26
 
27
  @app.on_event("startup")
28
  def load_model():
29
+ global pipe, model, tokenizer
30
  model_name = "atasoglu/Turkish-Llama-3-8B-function-calling"
31
  log(f"⬇️ Model yükleniyor: {model_name}")
32
  model, tokenizer = FastLanguageModel.from_pretrained(
 
50
  def test(req: TestRequest):
51
  prompt = f"Kullanıcı: {req.user_input}\nAsistan:"
52
  log(f"💬 Prompt alındı: {req.user_input}")
53
+ inputs = tokenizer([prompt], return_tensors="pt") # ❌ .to("cuda") KALDIRILDI
54
+ outputs = model.generate(
55
+ **inputs,
56
  max_new_tokens=256,
57
  temperature=0.2,
58
  top_p=0.95,
59
+ repetition_penalty=1.1,
60
+ do_sample=True
61
  )
62
+ answer = tokenizer.decode(outputs[0], skip_special_tokens=True)
63
+ answer_clean = answer.split("Asistan:")[-1].strip()
64
  log("✅ Cevap üretildi.")
65
+ return {"response": answer_clean}
66
 
67
  @app.get("/")
68
  def health():