Final_Assignment_Template

Sleeping

App Files Files Community

Freddolin committed on Jul 7, 2025

Commit

9666d9f

verified ·

1 Parent(s): 059c116

Update agent.py

Browse files

Files changed (1) hide show

agent.py +20 -16

agent.py CHANGED Viewed

@@ -1,4 +1,5 @@
-from transformers import pipeline
 SYSTEM_PROMPT = """
 You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the following template:
@@ -9,28 +10,31 @@ If you are asked for a string, don't use articles, neither abbreviations (e.g. f
 If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
 """
 class GaiaAgent:
-    def __init__(self, model_id="google/flan-t5-base"):
-        self.generator = pipeline(
-            "text2text-generation",
-            model=model_id,
-            tokenizer=model_id,
-            max_new_tokens=512,
-            device="cpu"
-        )
     def __call__(self, question: str) -> tuple[str, str]:
         try:
             prompt = f"{SYSTEM_PROMPT}\n\n{question}\nFINAL ANSWER:"
-            output = self.generator(prompt)[0]["generated_text"]
-            if "FINAL ANSWER:" in output:
-                final = output.split("FINAL ANSWER:")[-1].strip().split("\n")[0].strip()
             else:
-                final = output.strip()
-            return final, output
         except Exception as e:
             return "ERROR", f"Agent failed: {e}"

+from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+import torch
 SYSTEM_PROMPT = """
 You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the following template:
 If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
 """
 class GaiaAgent:
+    def __init__(self, model_id="tiiuae/falcon-rw-1b"):
+        self.tokenizer = AutoTokenizer.from_pretrained(model_id)
+        self.model = AutoModelForCausalLM.from_pretrained(model_id)
+        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        self.model.to(self.device)
     def __call__(self, question: str) -> tuple[str, str]:
         try:
             prompt = f"{SYSTEM_PROMPT}\n\n{question}\nFINAL ANSWER:"
+            inputs = self.tokenizer(prompt, return_tensors="pt").to(self.device)
+            outputs = self.model.generate(
+                **inputs,
+                max_new_tokens=256,
+                do_sample=True,
+                temperature=0.7,
+                pad_token_id=self.tokenizer.eos_token_id
+            )
+            output_text = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
+            if "FINAL ANSWER:" in output_text:
+                final = output_text.split("FINAL ANSWER:")[-1].strip().split("\n")[0].strip()
             else:
+                final = output_text.strip()
+            return final, output_text
         except Exception as e:
             return "ERROR", f"Agent failed: {e}"