Final_Assignment_Template

Runtime error

0r0b0r0s committed on Apr 30

Commit

2cff5f4

verified ·

1 Parent(s): a1b8b57

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -18,10 +18,11 @@ from huggingface_hub import InferenceClient, login
 class BasicAgent:
     def __init__(self):
         login(token=os.environ["HF_TOKEN"])
         self.client = InferenceClient(
-            model="Qwen/Qwen2-7B-Instruct",
             token=os.environ["HF_TOKEN"],
             timeout=120
         )
@@ -43,12 +44,11 @@ Answer with ONLY the exact value requested.<|im_end|>
                 prompt=prompt,
                 temperature=0.01,
                 max_new_tokens=100,
-                stop_sequences=["<|im_end|>"],
-                repetition_penalty=1.1
             )
             return response.split("<|im_start|>assistant")[-1].split("<|im_end|>")[0].strip()
         except Exception as e:
-            print(f"Error processing '{question[:50]}...': {str(e)}")
             return ""
 def run_and_submit_all( profile: gr.OAuthProfile | None):

 class BasicAgent:
     def __init__(self):
+        # Required for gated models
         login(token=os.environ["HF_TOKEN"])
         self.client = InferenceClient(
+            model="Qwen/Qwen2-7B-Instruct-GPTQ-Int8",
             token=os.environ["HF_TOKEN"],
             timeout=120
         )
                 prompt=prompt,
                 temperature=0.01,
                 max_new_tokens=100,
+                stop_sequences=["<|im_end|>"]
             )
             return response.split("<|im_start|>assistant")[-1].split("<|im_end|>")[0].strip()
         except Exception as e:
+            print(f"Error: {str(e)}")
             return ""
 def run_and_submit_all( profile: gr.OAuthProfile | None):