viskav committed on
Commit
442962e
·
verified ·
1 Parent(s): 9d5787f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +41 -21
app.py CHANGED
@@ -23,19 +23,27 @@ llm = None
23
@asynccontextmanager
async def lifespan(app: FastAPI):
    """Download and load the GGUF model once at application startup.

    Sets the module-level ``llm``. On failure the error is logged and
    ``llm`` is left as ``None`` so request handlers can respond with a
    503 instead of the whole app crashing at startup.
    """
    global llm
    try:
        # hf_hub_download caches the file locally, so repeated startups
        # do not re-download the model.
        model_path = hf_hub_download(
            repo_id=MODEL_REPO,
            filename=MODEL_FILE,
        )

        llm = Llama(
            model_path=model_path,
            n_ctx=N_CTX,
            n_threads=N_THREADS,
            n_batch=N_BATCH,
            verbose=False,
        )
    except Exception as e:
        # Best-effort startup: keep serving so /humanize can report 503.
        print("Model load failed:", e)
        llm = None

    yield
41
 
@@ -127,19 +135,31 @@ Return ONLY the humanized text.
127
  # ==================================================
128
@app.post("/humanize")
def humanize(req: HumanizeRequest):
    """Rewrite ``req.text`` using the locally loaded llama.cpp model.

    Raises:
        HTTPException 503: the model has not finished loading.
        HTTPException 400: the input text is empty or whitespace.
    """
    # Model loads asynchronously in lifespan(); guard against calling None.
    if llm is None:
        raise HTTPException(
            status_code=503,
            detail="Model is still loading. Please try again in a few seconds."
        )

    if not req.text.strip():
        raise HTTPException(status_code=400, detail="Input text is empty")

    prompt = build_prompt(req.text, req.section, req.author_notes)

    response = llm(
        prompt,
        max_tokens=512,
        temperature=0.4,
        top_p=0.9,
        # llama-cpp-python's completion API takes `repeat_penalty`;
        # `repetition_penalty` is rejected as an unexpected keyword.
        repeat_penalty=1.1,
    )

    return {
        "humanized_text": response["choices"][0]["text"].strip()
    }
 
23
@asynccontextmanager
async def lifespan(app: FastAPI):
    """FastAPI lifespan hook: fetch and load the GGUF model before serving.

    On any failure the exception is printed and the module-level ``llm``
    stays ``None``, letting endpoints answer 503 rather than killing the
    process at startup.
    """
    global llm
    try:
        print("⏳ Downloading model...")
        model_path = hf_hub_download(repo_id=MODEL_REPO, filename=MODEL_FILE)

        print("✅ Model downloaded. Loading...")
        llm = Llama(
            model_path=model_path,
            n_ctx=N_CTX,
            n_threads=N_THREADS,
            n_batch=N_BATCH,
            verbose=False,
        )

        print("🚀 Model loaded successfully")

    except Exception as exc:
        print("❌ Model load failed:", exc)
        llm = None

    yield
49
 
 
135
  # ==================================================
136
@app.post("/humanize")
def humanize(req: HumanizeRequest):
    """Humanize ``req.text`` with the locally loaded llama.cpp model.

    Raises:
        HTTPException 503: model not loaded yet (startup running or failed).
        HTTPException 400: input text is empty or whitespace.
        HTTPException 500: the underlying inference call raised.
    """
    if llm is None:
        raise HTTPException(
            status_code=503,
            detail="Model is still loading. Please try again in a few seconds."
        )

    if not req.text.strip():
        raise HTTPException(status_code=400, detail="Input text is empty")

    prompt = build_prompt(req.text, req.section, req.author_notes)

    try:
        response = llm(
            prompt,
            max_tokens=400,
            temperature=0.4,
            top_p=0.9,
            # FIX: llama-cpp-python's completion API takes `repeat_penalty`;
            # passing `repetition_penalty` raises TypeError on every request.
            repeat_penalty=1.1,
        )
    except Exception as e:
        # Chain the cause so the original traceback is preserved in logs.
        raise HTTPException(
            status_code=500,
            detail=f"Inference error: {str(e)}"
        ) from e

    return {
        "humanized_text": response["choices"][0]["text"].strip()
    }