Update app.py
app.py CHANGED
@@ -18,32 +18,48 @@ from huggingface_hub import InferenceClient, login
 
 class BasicAgent:
     def __init__(self):
-        #
+        # Initialize with GAIA-proven Qwen model
         self.client = InferenceClient(
-            model="Qwen/Qwen2-
-            token=os.
+            model="Qwen/Qwen2-72B-Instruct",
+            token=os.environ["HF_TOKEN"],
+            timeout=120
         )
-
+
+        # Verify model access
+        test_response = self._call_model("2+2=")
+        if not test_response.startswith("4"):
+            raise RuntimeError("Model initialization failed")
+
+    def _call_model(self, question: str) -> str:
+        """Core model call with GAIA-optimized prompt"""
+        prompt = f"""<|im_start|>system
+Answer with ONLY the exact value requested, no explanations. Follow GAIA format strictly.<|im_end|>
+<|im_start|>user
+{question}<|im_end|>
+<|im_start|>assistant
+"""
+        return self.client.text_generation(
+            prompt=prompt,
+            temperature=0.05,
+            max_new_tokens=100,
+            stop_sequences=["<|im_end|>"],
+            repetition_penalty=1.1
+        )
+
     def __call__(self, question: str) -> str:
-        """Optimized for GAIA scoring without hardware upgrades"""
         try:
-            #
-
-            prompt=f"""<|im_start|>system
-Answer with ONLY the exact value requested, no explanations.<|im_end|>
-<|im_start|>user
-{question}<|im_end|>
-<|im_start|>assistant
-""",
-            max_new_tokens=50,
-            temperature=0.01,
-            stop_sequences=["<|im_end|>"]
-            )
+            # Get raw model response
+            raw_response = self._call_model(question)
 
-            # Strict
-
-
-
+            # Strict GAIA-compliant extraction
+            answer = raw_response.split("<|im_start|>assistant")[-1]
+            answer = answer.split("<|im_end|>")[0].strip()
+
+            # Normalization for exact matching
+            return re.sub(r'[^a-zA-Z0-9, ]', '', answer).lower()
+        except Exception as e:
+            print(f"Error: {str(e)}")
+            return ""
 
 
 
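The new normalization line is easy to misread, so here is a short illustration of what it actually does. The `normalize` helper is a stand-in name (not part of the commit) that mirrors the `re.sub` call in `__call__`: only letters, digits, commas, and spaces survive, and the result is lowercased.

import re

def normalize(answer: str) -> str:
    # Stand-in for the post-processing in __call__: strip every character
    # except letters, digits, commas, and spaces, then lowercase.
    return re.sub(r'[^a-zA-Z0-9, ]', '', answer).lower()

assert normalize("Paris.") == "paris"
assert normalize("$1,234.56") == "1,23456"   # '$' and '.' are stripped too

Note that this also strips periods and currency symbols from numeric answers, which matters for exact-match scoring.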
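For a fuller picture, a minimal smoke-test sketch of the updated agent. The import path, the sample question, and the expected output are assumptions for illustration, not part of the commit; it presumes `HF_TOKEN` is exported and that the Inference API can serve `Qwen/Qwen2-72B-Instruct`.

# Hypothetical local smoke test for the updated BasicAgent (not part of
# the commit). Assumes app.py is importable and HF_TOKEN is set.
import os

from app import BasicAgent  # assumed import path for this Space's app.py

assert "HF_TOKEN" in os.environ, "export HF_TOKEN before running"

agent = BasicAgent()  # __init__ already runs the built-in "2+2=" access check
print(agent("What is the capital of France? Answer with one word."))
# After normalization, the expected output would be: paris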