Spaces:

UcsTurkey
/

oncu

Paused

ciyidogan committed on May 28, 2025

Commit

d72f235

verified ·

1 Parent(s): 6557064

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -58,7 +58,7 @@ def load_model():
         log(f"✅ Model indirildi: {model_path}")
         log("📦 GGUF model yükleniyor...")
-        llm = Llama(model_path=model_path, n_gpu_layers=-1, n_ctx=1024)
         log("✅ Model başarıyla yüklendi ve kullanılmaya hazır.")
         log("💡 Artık /chat endpoint'ine POST isteği gönderebilirsiniz.")
     except Exception as e:
@@ -75,7 +75,7 @@ def chat(req: ChatRequest):
         response = llm(
             prompt,
-            max_tokens=512,
             stop=["Kullanıcı:", "Asistan:"],
             echo=False
         )

         log(f"✅ Model indirildi: {model_path}")
         log("📦 GGUF model yükleniyor...")
+        llm = Llama(model_path=model_path, n_gpu_layers=40, n_ctx=1024)
         log("✅ Model başarıyla yüklendi ve kullanılmaya hazır.")
         log("💡 Artık /chat endpoint'ine POST isteği gönderebilirsiniz.")
     except Exception as e:
         response = llm(
             prompt,
+            max_tokens=256,
             stop=["Kullanıcı:", "Asistan:"],
             echo=False
         )