Spaces:

benkada
/

aiWeb

Sleeping

App Files Files Community

benkada committed on Apr 27, 2025

Commit

e4872e8

verified ·

1 Parent(s): cb57f04

Update main.py

Browse files

Files changed (1) hide show

main.py +126 -213

main.py CHANGED Viewed

@@ -1,213 +1,126 @@
-from fastapi import FastAPI, UploadFile, File, Form, HTTPException
-from fastapi.responses import JSONResponse
-from fastapi.middleware.cors import CORSMiddleware
-from pydantic import BaseModel
-from typing import Optional
-import os
-import tempfile
-from transformers import pipeline
-import torch
-from PIL import Image
-import pytesseract
-from langchain.chains import LLMChain
-from langchain.prompts import PromptTemplate
-from langchain_community.llms import HuggingFaceHub
-# Initialize FastAPI app
-app = FastAPI(
-    title="AI-Powered Web Application API",
-    description="API for document analysis, image captioning, and question answering",
-    version="1.0.0"
-)
-# CORS configuration
-app.add_middleware(
-    CORSMiddleware,
-    allow_origins=["*"],
-    allow_credentials=True,
-    allow_methods=["*"],
-    allow_headers=["*"],
-)
-# Initialize AI models (lazy loading)
-summarizer = None
-image_captioner = None
-qa_chain = None
-class SummaryRequest(BaseModel):
-    file: UploadFile = File(...)
-class CaptionRequest(BaseModel):
-    file: UploadFile = File(...)
-class QARequest(BaseModel):
-    file: UploadFile = File(...)
-    question: str = Form(...)
-def initialize_models():
-    """Initialize AI models with optimized prompts"""
-    global summarizer, image_captioner, qa_chain
-    # Document summarization model
-    if summarizer is None:
-        summarizer = pipeline(
-            "summarization",
-            model="facebook/bart-large-cnn",
-            device=0 if torch.cuda.is_available() else -1
-        )
-    # Image captioning model
-    if image_captioner is None:
-        image_captioner = pipeline(
-            "image-to-text",
-            model="nlpconnect/vit-gpt2-image-captioning",
-            device=0 if torch.cuda.is_available() else -1
-        )
-    # Question answering chain
-    if qa_chain is None:
-        llm = HuggingFaceHub(
-            repo_id="google/flan-t5-large",
-            model_kwargs={"temperature": 0.1, "max_length": 512}
-        )
-        qa_prompt = PromptTemplate(
-            input_variables=["document", "question"],
-            template="""
-            Using the provided document, answer the following question precisely.
-            If the answer cannot be determined from the document, respond with
-            'The answer cannot be determined from the provided document.'
-            Question: {question}
-            Rules:
-            1. Provide a concise answer (1-3 sentences maximum)
-            2. When possible, reference the specific section of the document that supports your answer
-            3. Maintain numerical precision when answering quantitative questions
-            4. For comparison questions, highlight both items being compared
-            Document: {document}
-            """
-        )
-        qa_chain = LLMChain(llm=llm, prompt=qa_prompt)
-def extract_text_from_file(file: UploadFile) -> str:
-    """Extract text from various file formats"""
-    # Create a temporary file
-    with tempfile.NamedTemporaryFile(delete=False) as temp_file:
-        temp_file.write(file.file.read())
-        temp_path = temp_file.name
-    try:
-        # PDF, DOCX, PPTX, XLSX would need appropriate libraries here
-        # For simplicity, we'll just read text files in this example
-        if file.filename.endswith('.txt'):
-            with open(temp_path, 'r', encoding='utf-8') as f:
-                return f.read()
-        else:
-            # In a real implementation, use libraries like PyPDF2, python-docx, etc.
-            raise HTTPException(
-                status_code=415,
-                detail="File type not supported in this example implementation"
-            )
-    finally:
-        os.unlink(temp_path)
-@app.post("/api/summarize")
-async def summarize_document(file: UploadFile = File(...)):
-    """Summarize a document"""
-    initialize_models()
-    try:
-        # Extract text from the document
-        document_text = extract_text_from_file(file)
-        # Generate summary with optimized prompt
-        summary = summarizer(
-            document_text,
-            max_length=150,
-            min_length=30,
-            do_sample=False,
-            truncation=True
-        )
-        return JSONResponse(
-            content={"status": "success", "result": summary[0]['summary_text']},
-            status_code=200
-        )
-    except Exception as e:
-        raise HTTPException(
-            status_code=500,
-            detail=f"Error processing document: {str(e)}"
-        )
-@app.post("/api/caption")
-async def generate_image_caption(file: UploadFile = File(...)):
-    """Generate caption for an image"""
-    initialize_models()
-    try:
-        # Save the uploaded image temporarily
-        with tempfile.NamedTemporaryFile(suffix=".jpg", delete=False) as temp_file:
-            temp_file.write(file.file.read())
-            temp_path = temp_file.name
-        # Open the image
-        image = Image.open(temp_path)
-        # Generate caption with optimized prompt
-        caption = image_captioner(
-            image,
-            generate_kwargs={
-                "max_length": 50,
-                "num_beams": 4,
-                "early_stopping": True
-            }
-        )
-        return JSONResponse(
-            content={"status": "success", "result": caption[0]['generated_text']},
-            status_code=200
-        )
-    except Exception as e:
-        raise HTTPException(
-            status_code=500,
-            detail=f"Error processing image: {str(e)}"
-        )
-    finally:
-        if 'temp_path' in locals() and os.path.exists(temp_path):
-            os.unlink(temp_path)
-@app.post("/api/qa")
-async def answer_question(
-    file: UploadFile = File(...),
-    question: str = Form(...)
-):
-    """Answer questions based on document content"""
-    initialize_models()
-    try:
-        # Extract text from the document
-        document_text = extract_text_from_file(file)
-        # Get answer using the QA chain
-        answer = qa_chain.run(document=document_text, question=question)
-        return JSONResponse(
-            content={"status": "success", "result": answer},
-            status_code=200
-        )
-    except Exception as e:
-        raise HTTPException(
-            status_code=500,
-            detail=f"Error processing question: {str(e)}"
-        )
-@app.get("/")
-async def health_check():
-    """Health check endpoint"""
-    return {"status": "healthy", "version": "1.0.0"}
-if __name__ == "__main__":
-    import uvicorn
-    uvicorn.run(app, host="0.0.0.0", port=8000)

+import os
+# Hugging Face libraries resolve their cache location from HF_HOME when they
+# are first imported, so the default has to be in place BEFORE transformers
+# and langchain_community are imported below. A value already present in the
+# environment is left untouched.
+os.environ.setdefault("HF_HOME", "/app/cache")
+from fastapi import FastAPI, UploadFile, File, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import JSONResponse
+from pydantic import BaseModel
+from typing import Optional
+from PIL import Image
+import pytesseract
+from transformers import pipeline
+from langchain.chains import LLMChain
+from langchain.prompts import PromptTemplate
+from langchain_community.llms import HuggingFaceHub
+# FastAPI application object; the routes in this module are registered on it.
+app = FastAPI(
+    title="AI-Powered Web Application API",
+    description="API for document summarization, image captioning, and question answering",
+    version="1.0.0"
+)
+# CORS middleware: the API is open to any origin, method and header.
+# Credentials (cookies / Authorization) are deliberately NOT allowed: wildcard
+# origins combined with allow_credentials=True is not a valid CORS setup and
+# would let any site issue credentialed requests. If credentialed requests are
+# needed later, list the trusted origins explicitly instead of using "*".
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=False,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# ----------------
+# Schemas
+# ----------------
+class SummarizeRequest(BaseModel):
+    """JSON body accepted by the POST /summarize route."""
+    # Text to summarize (required).
+    text: str
+    # Forwarded to the summarization pipeline as max_length; defaults to 150.
+    max_length: Optional[int] = 150
+    # Forwarded to the summarization pipeline as min_length; defaults to 40.
+    min_length: Optional[int] = 40
+class QARequest(BaseModel):
+    """JSON body accepted by the POST /qa route."""
+    # Question to answer (required).
+    question: str
+    # Optional background text; the /qa route substitutes "" when it is missing or empty.
+    context: Optional[str] = None
+# ----------------
+# Model loaders (lazy)
+# ----------------
+# Cache directory used by the model loaders in this module; read once at
+# import time from HF_HOME, falling back to /app/cache.
+_cache_dir = os.getenv("HF_HOME", "/app/cache")
+# Lazily built singletons: each stays None until its get_*() loader first runs.
+_summarizer = None
+_captioner = None
+_qa_chain = None
+def get_summarizer():
+    """Return the shared summarization pipeline, building it on first use.
+    The pipeline (facebook/bart-large-cnn) is created once and kept in the
+    module-level _summarizer, so later calls return the same object.
+    """
+    global _summarizer
+    if _summarizer is None:
+        _summarizer = pipeline(
+            "summarization",
+            model="facebook/bart-large-cnn",
+            # cache_dir is a from_pretrained() option, so it must travel in
+            # model_kwargs. Passed as a bare pipeline() keyword it is treated
+            # as a pipeline call/generation parameter and never reaches the
+            # model loader.
+            model_kwargs={"cache_dir": _cache_dir},
+        )
+    return _summarizer
+def get_image_captioner():
+    """Return the shared image-to-text pipeline, building it on first use.
+    The pipeline (nlpconnect/vit-gpt2-image-captioning) is created once and
+    kept in the module-level _captioner, so later calls return the same object.
+    """
+    global _captioner
+    if _captioner is None:
+        _captioner = pipeline(
+            "image-to-text",
+            model="nlpconnect/vit-gpt2-image-captioning",
+            # cache_dir is a from_pretrained() option, so it must travel in
+            # model_kwargs rather than as a bare pipeline() keyword, which the
+            # image-to-text pipeline does not accept.
+            model_kwargs={"cache_dir": _cache_dir},
+        )
+    return _captioner
+def get_qa_chain():
+    """Return the shared question-answering chain, building it on first use.
+    The chain sends a context/question prompt to google/flan-t5-large through
+    the Hugging Face Hub, authenticating with the HUGGINGFACEHUB_API_TOKEN
+    environment variable. It is created once and kept in the module-level
+    _qa_chain.
+    """
+    global _qa_chain
+    if _qa_chain is None:
+        # No cache_dir here: HuggingFaceHub forwards model_kwargs to the hosted
+        # model as request parameters, where a local cache path has no meaning.
+        llm = HuggingFaceHub(
+            repo_id="google/flan-t5-large",
+            huggingfacehub_api_token=os.getenv("HUGGINGFACEHUB_API_TOKEN"),
+        )
+        prompt = PromptTemplate(
+            input_variables=["context", "question"],
+            template="""
+Use the following context to answer the question:
+{context}
+Question: {question}
+Answer:"""
+        )
+        _qa_chain = LLMChain(llm=llm, prompt=prompt)
+    return _qa_chain
+# ----------------
+# Routes
+# ----------------
+@app.post("/summarize")
+def summarize(req: SummarizeRequest):
+    """Summarize req.text and return it as {"summary": <text>}.
+    Raises HTTPException(400) when the text is blank or when min_length is
+    greater than max_length, so bad requests fail before the model is loaded.
+    """
+    if not req.text.strip():
+        raise HTTPException(status_code=400, detail="text must not be empty")
+    if (
+        req.min_length is not None
+        and req.max_length is not None
+        and req.min_length > req.max_length
+    ):
+        raise HTTPException(
+            status_code=400,
+            detail="min_length must not be greater than max_length"
+        )
+    summarizer = get_summarizer()
+    result = summarizer(
+        req.text,
+        max_length=req.max_length,
+        min_length=req.min_length,
+        clean_up_tokenization_spaces=True,
+        # Cut inputs that exceed the model's maximum sequence length instead
+        # of letting the model fail on them.
+        truncation=True,
+    )
+    return JSONResponse(content={"summary": result[0]["summary_text"]})
+@app.post("/caption")
+async def caption_image(file: UploadFile = File(...)):
+    """Caption the uploaded image and return it as {"caption": <text>}.
+    Raises HTTPException(400) when the upload cannot be decoded as an image.
+    Failures while loading or running the captioning model are not caught
+    here, so they surface as server errors rather than as client errors.
+    """
+    # Only the decode step is a client-side problem; keep the try body to it.
+    try:
+        img = Image.open(file.file).convert("RGB")
+    except (OSError, ValueError, SyntaxError, Image.DecompressionBombError) as exc:
+        raise HTTPException(status_code=400, detail=str(exc)) from exc
+    captioner = get_image_captioner()
+    result = captioner(img)
+    return JSONResponse(content={"caption": result[0]["generated_text"]})
+@app.post("/qa")
+def question_answer(req: QARequest):
+    """Run the QA chain on the request and return {"answer": <text>}.
+    A missing or empty context is sent to the chain as an empty string.
+    """
+    qa = get_qa_chain()
+    chain_inputs = {
+        "context": req.context if req.context else "",
+        "question": req.question,
+    }
+    return JSONResponse(content={"answer": qa.run(chain_inputs)})