Final_Assignment_Template

Sleeping

App Files Community

s1144662 committed on Jan 1

Commit

9df76c7

verified ·

1 Parent(s): 70676c7

Update app.py

Browse files

Files changed (1) hide show

app.py +46 -33

app.py CHANGED Viewed

@@ -20,9 +20,13 @@ GROQ_API_URL = "https://api.groq.com/openai/v1/chat/completions"
 def perform_search(query: str) -> str:
     """搜尋工具：只抓重點，並有隨機延遲"""
     print(f"🕵️ Searching: {query[:50]}...")
     try:
-        time.sleep(random.uniform(1.0, 2.0)) # 隨機延遲
         with DDGS() as ddgs:
             results = list(ddgs.text(query, max_results=2, backend="lite"))
@@ -39,8 +43,8 @@ class GroqClient:
     def __init__(self):
         self.api_key = os.getenv("GROQ_API_KEY")
-    def query(self, messages, model, max_retries=3):
-        """發送請求給 Groq，包含自動重試機制"""
         if not self.api_key:
             return "Error: No API Key"
@@ -49,11 +53,21 @@ class GroqClient:
             "Content-Type": "application/json"
         }
         payload = {
             "model": model,
-            "messages": messages,
             "temperature": 0.1,
-            "max_tokens": 500
         }
         for attempt in range(max_retries):
@@ -62,63 +76,59 @@ class GroqClient:
                 # 如果成功
                 if response.status_code == 200:
-                    return response.json()['choices'][0]['message']['content']
-                # 如果遇到 429 (太快了)，休息久一點再試
                 if response.status_code == 429:
-                    wait_time = (attempt + 1) * 10 # 第一次等10秒，第二次等20秒...
-                    print(f"⚠️ Rate limit (429). Waiting {wait_time}s...")
                     time.sleep(wait_time)
                     continue
-                return f"API Error {response.status_code}"
             except Exception as e:
                 print(f"Connection Error: {e}")
-                time.sleep(5)
-        return "Failed after retries."
 def solve_question(question, client):
     """分析題目類型並選擇策略"""
     # 1. 檢查是否有圖片網址 (Vision 任務)
-    # 常見格式：https://... .png 或 .jpg
     img_match = re.search(r'(https?://[^\s]+\.(?:jpg|jpeg|png|webp))', question)
     if img_match:
         image_url = img_match.group(1)
-        print(f"👁️ Vision Task Detected! URL: {image_url}")
-        # 使用 Groq 的視覺模型
         messages = [
             {
                 "role": "user",
                 "content": [
-                    {"type": "text", "text": f"Answer this question directly: {question}"},
                     {"type": "image_url", "image_url": {"url": image_url}}
                 ]
             }
         ]
-        # 使用具備視覺能力的模型
         return client.query(messages, model="llama-3.2-11b-vision-preview")
     else:
         # 2. 一般文字/搜尋任務
-        # 先搜尋
         context = perform_search(question)
-        # 組合 Prompt
-        system_msg = "You are a helpful AI. Answer concisely using the provided context."
         if context:
-            user_msg = f"Context: {context}\n\nQuestion: {question}"
         else:
-            user_msg = question
-        messages = [
-            {"role": "system", "content": system_msg},
-            {"role": "user", "content": user_msg}
-        ]
         # 使用最強的文字模型
         return client.query(messages, model="llama-3.3-70b-versatile")
@@ -150,18 +160,21 @@ def run_and_submit_all(profile: Optional[gr.OAuthProfile] = None):
         # 核心：解題
         ans = solve_question(q, client)
         answers.append({"task_id": tid, "submitted_answer": ans})
-        logs.append({"Task": tid, "Type": "Image" if "http" in q and ".jpg" in q else "Text", "Answer": str(ans)[:100]})
-        # !!! 關鍵保命符 !!!
-        # 每題解完強制休息 5 秒，防止 429 錯誤
-        time.sleep(5)
     try:
         print("Submitting...")
         res = requests.post(f"{DEFAULT_API_URL}/submit", json={
             "username": profile.username,
-            "agent_code": "https://huggingface.co/spaces/test/test", # 這裡隨意填
             "answers": answers
         }, timeout=60)
@@ -172,8 +185,8 @@ def run_and_submit_all(profile: Optional[gr.OAuthProfile] = None):
     except Exception as e:
         return f"Submit error: {str(e)}", pd.DataFrame(logs)
-with gr.Blocks(title="Final Agent (Vision + Anti-429)") as demo:
-    gr.Markdown("# 🚀 Final Agent (Slow & Steady)")
     with gr.Row():
         gr.LoginButton()
         btn = gr.Button("Run Evaluation", variant="primary")

 def perform_search(query: str) -> str:
     """搜尋工具：只抓重點，並有隨機延遲"""
+    # 針對一些明顯的邏輯題，跳過搜尋以節省時間和 Token
+    if "reverse" in query.lower() or "tfel" in query.lower() or "python" in query.lower():
+        return ""
     print(f"🕵️ Searching: {query[:50]}...")
     try:
+        time.sleep(random.uniform(2.0, 4.0)) # 增加延遲
         with DDGS() as ddgs:
             results = list(ddgs.text(query, max_results=2, backend="lite"))
     def __init__(self):
         self.api_key = os.getenv("GROQ_API_KEY")
+    def query(self, messages, model, max_retries=5): # 增加重試次數到 5 次
+        """發送請求給 Groq，包含超強自動重試機制"""
         if not self.api_key:
             return "Error: No API Key"
             "Content-Type": "application/json"
         }
+        # 針對這門課的特殊要求：強制簡潔
+        # 這是拿分的關鍵，避免模型講廢話
+        system_instruction = {
+            "role": "system",
+            "content": "You are taking a test. Provide ONLY the exact answer. No sentences, no punctuation, no explanations. Example: if the answer is 5, output '5'. If the answer is Paris, output 'Paris'."
+        }
+        # 確保 system instruction 在最前面
+        final_messages = [system_instruction] + messages
         payload = {
             "model": model,
+            "messages": final_messages,
             "temperature": 0.1,
+            "max_tokens": 100 # 限制回答長度
         }
         for attempt in range(max_retries):
                 # 如果成功
                 if response.status_code == 200:
+                    content = response.json()['choices'][0]['message']['content'].strip()
+                    # 移除最後的句號 (常見錯誤)
+                    if content.endswith('.'):
+                        content = content[:-1]
+                    return content
+                # 如果遇到 429 (太快了)，休息很久再試
                 if response.status_code == 429:
+                    wait_time = (attempt + 1) * 20 # 20s, 40s, 60s, 80s, 100s
+                    print(f"⚠️ Rate limit (429). Waiting {wait_time}s... (Attempt {attempt+1}/{max_retries})")
                     time.sleep(wait_time)
                     continue
+                print(f"API Error {response.status_code}: {response.text[:100]}")
+                return f"Error"
             except Exception as e:
                 print(f"Connection Error: {e}")
+                time.sleep(10)
+        return "Error"
 def solve_question(question, client):
     """分析題目類型並選擇策略"""
     # 1. 檢查是否有圖片網址 (Vision 任務)
     img_match = re.search(r'(https?://[^\s]+\.(?:jpg|jpeg|png|webp))', question)
     if img_match:
         image_url = img_match.group(1)
+        print(f"👁️ Vision Task: {image_url}")
         messages = [
             {
                 "role": "user",
                 "content": [
+                    {"type": "text", "text": f"What is the answer to this question? {question}"},
                     {"type": "image_url", "image_url": {"url": image_url}}
                 ]
             }
         ]
         return client.query(messages, model="llama-3.2-11b-vision-preview")
     else:
         # 2. 一般文字/搜尋任務
         context = perform_search(question)
         if context:
+            user_msg = f"Context from search:\n{context}\n\nQuestion: {question}\nAnswer:"
         else:
+            user_msg = f"Question: {question}\nAnswer:"
+        messages = [{"role": "user", "content": user_msg}]
         # 使用最強的文字模型
         return client.query(messages, model="llama-3.3-70b-versatile")
         # 核心：解題
         ans = solve_question(q, client)
+        print(f"✅ Answer: {ans}") # 在 Log 顯示答案確認
         answers.append({"task_id": tid, "submitted_answer": ans})
+        logs.append({"Task": tid, "Answer": str(ans)[:100]})
+        # !!! 強制休息 10 秒 !!!
+        # 這是為了確保下一題不會立刻觸發 429
+        print("💤 Sleeping 10s to respect rate limits...")
+        time.sleep(10)
     try:
         print("Submitting...")
         res = requests.post(f"{DEFAULT_API_URL}/submit", json={
             "username": profile.username,
+            "agent_code": "https://huggingface.co/spaces/test/test",
             "answers": answers
         }, timeout=60)
     except Exception as e:
         return f"Submit error: {str(e)}", pd.DataFrame(logs)
+with gr.Blocks(title="Final Agent (Anti-429 v2)") as demo:
+    gr.Markdown("# 🚀 Final Agent (Strict Format + Slow Mode)")
     with gr.Row():
         gr.LoginButton()
         btn = gr.Button("Run Evaluation", variant="primary")