Final_Assignment_Template

Sleeping

App Files Community

Facelook committed on Apr 26

Commit

b918222

1 Parent(s): 3273c0a

Trial and error.

Browse files

Files changed (1) hide show

app.py +21 -9

app.py CHANGED Viewed

@@ -18,11 +18,24 @@ class BasicAgent:
         print("BasicAgent initialized.")
         print("Loading Qwen2.5-7B-Instruct model...")
-        self.model_name = "Qwen/Qwen2.5-7B-Instruct"
-        self.client = InferenceClient(model=self.model_name)
-        self.tokenizer = None
-        self.model = None
     def __call__(self, question: str) -> str:
         print(f"Agent received question (first 50 chars): {question[:50]}...")
@@ -54,9 +67,8 @@ class BasicAgent:
                 answer = self.tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
             else:
-                # Fallback to Inference API - using the correct method call for chat completion
-                response = self.client.chat_completion(messages)
-                answer = response.choices[0].message.content
             print(f"Agent generated response (first 50 chars): {answer[:50]}...")
             return answer
@@ -192,7 +204,7 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
 # --- Build Gradio Interface using Blocks ---
 with gr.Blocks() as demo:
-    gr.Markdown("# Basic Agent Evaluation Runner (Attempt #1)")
     gr.Markdown(
         """
         **Instructions:**

         print("BasicAgent initialized.")
         print("Loading Qwen2.5-7B-Instruct model...")
+        self.model_name = "Qwen/Qwen2.5-1.5B-Instruct"
+        # Load model and tokenizer
+        try:
+            self.tokenizer = AutoTokenizer.from_pretrained(self.model_name)
+            self.model = AutoModelForCausalLM.from_pretrained(
+                self.model_name,
+                torch_dtype="auto",
+                device_map="auto"
+            )
+            print(f"Successfully loaded {self.model_name}")
+        except Exception as e:
+            print(f"Error loading model: {e}")
+            # Fallback to HuggingFace Inference API if local loading fails
+            print("Falling back to InferenceClient")
+            self.client = InferenceClient(model=self.model_name)
+            self.tokenizer = None
+            self.model = None
     def __call__(self, question: str) -> str:
         print(f"Agent received question (first 50 chars): {question[:50]}...")
                 answer = self.tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
             else:
+                # Fallback to Inference API
+                answer = self.client.chat(messages=messages)
             print(f"Agent generated response (first 50 chars): {answer[:50]}...")
             return answer
 # --- Build Gradio Interface using Blocks ---
 with gr.Blocks() as demo:
+    gr.Markdown("# Basic Agent Evaluation Runner")
     gr.Markdown(
         """
         **Instructions:**