Spaces:

Trigger82
/

Hmm

Build error

App Files Community

Trigger82 committed on May 31, 2025

Commit

955e737

verified ·

1 Parent(s): 81cbe70

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -9

app.py CHANGED Viewed

@@ -12,8 +12,8 @@ logger = logging.getLogger(__name__)
 # Initialize FastAPI
 app = FastAPI(
-    title="PHI Chatbot API",
-    description="Chatbot API using Microsoft's Phi-2 model",
     version="1.0",
 )
@@ -23,9 +23,12 @@ logger.info(f"Using base path: '{BASE_PATH}'")
 # Load model and tokenizer
 try:
-    logger.info("Loading tokenizer and model...")
-    tokenizer = AutoTokenizer.from_pretrained("microsoft/phi-2")
-    model = AutoModelForCausalLM.from_pretrained("microsoft/phi-2")
     model.eval()
     logger.info("Model loaded successfully!")
 except Exception as e:
@@ -46,7 +49,7 @@ async def add_base_path(request: Request, call_next):
 @app.get("/")
 async def root():
     return {
-        "message": "🟢 PHI API is running",
         "endpoints": {
             "chat": f"{BASE_PATH}/ai?query=Hello&user_id=yourname",
             "health": f"{BASE_PATH}/health",
@@ -67,7 +70,7 @@ async def chat(request: Request):
         if len(user_input) > 200:
             raise HTTPException(status_code=400, detail="Query too long (max 200 characters)")
-        # Prompt style: phi models work best with natural instructions
         memory = chat_history.get(user_id, [])
         prompt = "You are a friendly, funny AI assistant called Trigger.\n\n"
         for q, a in memory:
@@ -105,7 +108,7 @@ async def chat(request: Request):
 async def health():
     return {
         "status": "healthy",
-        "model": "microsoft/phi-2",
         "users": len(chat_history),
         "base_path": BASE_PATH
     }
@@ -121,7 +124,7 @@ async def test_page():
     return f"""
     <html>
         <body>
-            <h1>PHI Chatbot Test</h1>
             <p>Base path: {BASE_PATH}</p>
             <ul>
                 <li><a href="{BASE_PATH}/">Root endpoint</a></li>

 # Initialize FastAPI
 app = FastAPI(
+    title="Trigger Chatbot API",
+    description="Chatbot API using TinyLlama-1.1B-Chat model",
     version="1.0",
 )
 # Load model and tokenizer
 try:
+    logger.info("Loading TinyLlama tokenizer and model...")
+    tokenizer = AutoTokenizer.from_pretrained("TinyLlama/TinyLlama-1.1B-Chat-v1.0")
+    model = AutoModelForCausalLM.from_pretrained(
+        "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
+        torch_dtype=torch.float16  # Reduces RAM usage
+    )
     model.eval()
     logger.info("Model loaded successfully!")
 except Exception as e:
 @app.get("/")
 async def root():
     return {
+        "message": "🟢 Trigger API is running",
         "endpoints": {
             "chat": f"{BASE_PATH}/ai?query=Hello&user_id=yourname",
             "health": f"{BASE_PATH}/health",
         if len(user_input) > 200:
             raise HTTPException(status_code=400, detail="Query too long (max 200 characters)")
+        # Prompt style: natural chat history
         memory = chat_history.get(user_id, [])
         prompt = "You are a friendly, funny AI assistant called Trigger.\n\n"
         for q, a in memory:
 async def health():
     return {
         "status": "healthy",
+        "model": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
         "users": len(chat_history),
         "base_path": BASE_PATH
     }
     return f"""
     <html>
         <body>
+            <h1>Trigger Chatbot Test</h1>
             <p>Base path: {BASE_PATH}</p>
             <ul>
                 <li><a href="{BASE_PATH}/">Root endpoint</a></li>