Spaces:

benkada
/

aiWeb

Sleeping

benkada committed on Apr 27, 2025

Commit

b273b4c

verified ·

1 Parent(s): cf9785c

Update main.py

Files changed (1) hide show

main.py CHANGED Viewed

@@ -20,7 +20,7 @@ PORT              = int(os.getenv("PORT", 7860))
 app = FastAPI(
     title       = "AI-Powered Web-App API",
     description = "Backend for summarisation, captioning & QA",
-    version     = "1.2.4",               # <-- bumped
 )
 app.add_middleware(
@@ -47,12 +47,15 @@ summary_client        = InferenceClient(
     timeout = 120,
 )
-# ➜ Upgraded QA model to a BigBird-RoBERTa checkpoint (better for documents)
 qa_client             = InferenceClient(
-    "google/bigbird-roberta-base-squad2",
     token   = HUGGINGFACE_TOKEN,
-    timeout = 180,
 )
 image_caption_client  = InferenceClient(
     "nlpconnect/vit-gpt2-image-captioning",
@@ -111,6 +114,7 @@ async def summarize_document(file: UploadFile = File(...)):
 # -------------------- Image Caption ------------------------------------------
 @app.post("/api/caption")
 async def caption_image(image: UploadFile = File(...)):
     try:
         img_bytes = await image.read()
         img       = Image.open(io.BytesIO(img_bytes)).convert("RGB")
@@ -145,7 +149,7 @@ async def question_answering(file: UploadFile = File(...),
             context  = (res.get("generated_text") if isinstance(res, dict)
                         else str(res))
         else:
-            context = process_uploaded_file(file)[:4096]   # BigBird handles longer
         if not context:
             return {"result": "No context – cannot answer."}

 app = FastAPI(
     title       = "AI-Powered Web-App API",
     description = "Backend for summarisation, captioning & QA",
+    version     = "1.2.3",               # <-- bumped
 )
 app.add_middleware(
     timeout = 120,
 )
+# ➜ Upgraded QA model (higher accuracy than roberta-base)
 qa_client             = InferenceClient(
+    "deepset/roberta-large-squad2",
     token   = HUGGINGFACE_TOKEN,
+    timeout = 120,
 )
+# If you need multilingual support, swap for:
+# qa_client = InferenceClient("deepset/xlm-roberta-large-squad2",
+#                             token=HUGGINGFACE_TOKEN, timeout=120)
 image_caption_client  = InferenceClient(
     "nlpconnect/vit-gpt2-image-captioning",
 # -------------------- Image Caption ------------------------------------------
 @app.post("/api/caption")
 async def caption_image(image: UploadFile = File(...)):
+    """`image` field name matches frontend (was `file` before)."""
     try:
         img_bytes = await image.read()
         img       = Image.open(io.BytesIO(img_bytes)).convert("RGB")
             context  = (res.get("generated_text") if isinstance(res, dict)
                         else str(res))
         else:
+            context = process_uploaded_file(file)[:3000]
         if not context:
             return {"result": "No context – cannot answer."}