Spaces:

roshnn24
/

Figr-DataScience-Assignment

Sleeping

App Files Community

roshnn24 committed on Jan 16, 2025

Commit

b545a36

verified ·

1 Parent(s): b936fed

Update app.py

Browse files

Files changed (1) hide show

app.py +37 -28

app.py CHANGED Viewed

@@ -142,28 +142,22 @@ def init_db():
         conn.commit()
 def initialize_llm():
-    """Initialize the model in the simplest way possible"""
     try:
-        # Get API token
         api_token = os.environ.get('HF_TOKEN')
         if not api_token:
             raise ValueError("No API token found")
-        # Initialize with minimal settings
-        llm = HuggingFaceHub(
-            repo_id="mistralai/Mistral-7B-Instruct-v0.3",  # Using a simpler model for testing
-            huggingfacehub_api_token=api_token,
-            task="text-generation"        )
-        # Quick test
-        test = llm("Say hello")
-        print(f"Test response: {test}")
-        return llm
     except Exception as e:
         print(f"LLM initialization error: {str(e)}")
-        raise
 class ChatSession:
@@ -278,14 +272,12 @@ try:
     print("Database initialized successfully")
     print("Initializing LLM...")
-    llm = initialize_llm()
-    if llm is None:
         raise ValueError("LLM initialization failed")
     print("LLM initialized successfully")
-    print("Creating LLM chain...")
-    llm_chain = LLMChain(llm=llm, prompt=prompt)
-    print("LLM chain created successfully")
 except Exception as e:
     print(f"Fatal initialization error: {e}")
@@ -472,24 +464,41 @@ def get_chat_list():
 @app.route("/api/chat", methods=["POST"])
 def chat():
     try:
-        # Get the user's message
         data = request.json
         user_input = data.get("message", "")
         print(f"Received message: {user_input}")
         # Very simple prompt for testing
-        prompt = f"You are a helpful assistant. Keep your response short and simple. User says: {user_input}"
         try:
-            # Get response directly from model
-            response = llm(prompt)
-            print(f"Raw response received: {response}")
-            # Return whatever response we get
-            return jsonify({
-                "success": True,
-                "response": response
-            })
         except Exception as e:
             print(f"Model error: {str(e)}")

         conn.commit()
 def initialize_llm():
+    """Initialize the LLM using InferenceClient."""
     try:
+        # Get API token from environment variable
         api_token = os.environ.get('HF_TOKEN')
         if not api_token:
             raise ValueError("No API token found")
+        # Initialize the InferenceClient
+        client = InferenceClient(api_key=api_token)
+        print("LLM initialized successfully!")
+        return client
     except Exception as e:
         print(f"LLM initialization error: {str(e)}")
+        return None
 class ChatSession:
     print("Database initialized successfully")
     print("Initializing LLM...")
+    llm_client = initialize_llm()
+    if llm_client is None:
         raise ValueError("LLM initialization failed")
     print("LLM initialized successfully")
 except Exception as e:
     print(f"Fatal initialization error: {e}")
 @app.route("/api/chat", methods=["POST"])
 def chat():
     try:
+        # Get the user's message from the request
         data = request.json
         user_input = data.get("message", "")
         print(f"Received message: {user_input}")
+        if not user_input:
+            return jsonify({
+                "success": False,
+                "response": "No message provided."
+            })
         # Very simple prompt for testing
+        messages = [
+            {"role": "user", "content": user_input}
+        ]
         try:
+            # Get response from the model using InferenceClient
+            if llm_client:
+                completion = llm_client.chat.completions.create(
+                    model="mistralai/Mistral-7B-Instruct-v0.3",  # Replace with the appropriate model
+                    messages=messages,
+                    max_tokens=150  # Adjust the max tokens as needed
+                )
+                response = completion['choices'][0]['message']['content']
+                print(f"Raw response received: {response}")
+                # Return the model's response
+                return jsonify({
+                    "success": True,
+                    "response": response
+                })
+            else:
+                raise ValueError("LLM client not initialized properly.")
         except Exception as e:
             print(f"Model error: {str(e)}")