Final_Assignment_Template_rubenml

Runtime error

App Files Files Community

rubenml committed on Apr 25, 2025

Commit

f4c9709

verified ·

1 Parent(s): d861b0a

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -13

app.py CHANGED Viewed

@@ -22,51 +22,49 @@ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 class GeneralAgent:
     def __init__(self):
         print("Initializing GPT-2 based QA agent...")
-        # Cargar modelo y tokenizador de GPT-2
         self.model = GPT2LMHeadModel.from_pretrained("gpt2")
         self.tokenizer = GPT2Tokenizer.from_pretrained("gpt2")
     def __call__(self, question: str, context: str = None) -> str:
         """
-        Procesa la pregunta y genera una respuesta basada en el contexto proporcionado.
-        Usa un prompt específico para guiar la respuesta del modelo GPT-2.
         """
         if context is None:
-            return "FINAL ANSWER: No context provided."
-        # Crear el prompt para el modelo GPT-2
         prompt = f"""
-You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the following template: FINAL ANSWER: [YOUR FINAL ANSWER]. YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
 Question: {question}
 Context: {context}
 """
-        # Tokenizar el prompt
         inputs = self.tokenizer.encode(prompt, return_tensors="pt")
-        # Generar la respuesta con GPT-2
         outputs = self.model.generate(inputs, max_length=500, num_return_sequences=1, no_repeat_ngram_size=2, early_stopping=True)
-        # Decodificar la salida
         answer = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
-        # Extraer la respuesta final
         final_answer = self._extract_final_answer(answer)
         return f"FINAL ANSWER: {final_answer}"
     def _extract_final_answer(self, answer: str) -> str:
         """
-        Extrae la parte relevante de la respuesta generada por GPT-2 según el formato solicitado.
         """
-        # Buscar la sección que comienza con "FINAL ANSWER:"
         final_answer_start = "FINAL ANSWER:"
         start_idx = answer.find(final_answer_start)
         if start_idx == -1:
             return "Error processing question."
-        # Extraer la respuesta que sigue a "FINAL ANSWER:"
         final_answer = answer[start_idx + len(final_answer_start):].strip()
         return final_answer.strip()
@@ -76,6 +74,7 @@ Context: {context}
 def run_and_submit_all(profile: gr.OAuthProfile | None):

 class GeneralAgent:
     def __init__(self):
         print("Initializing GPT-2 based QA agent...")
         self.model = GPT2LMHeadModel.from_pretrained("gpt2")
         self.tokenizer = GPT2Tokenizer.from_pretrained("gpt2")
     def __call__(self, question: str, context: str = None) -> str:
         """
+        Process the question and generate an answer based on the provided context.
         """
         if context is None:
+            context = "No context provided."  # Default context if none is given
+        # Create a clear, structured prompt
         prompt = f"""
+You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the following template: FINAL ANSWER: [YOUR FINAL ANSWER].
+YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma-separated list of numbers and/or strings. If you are asked for a number, don't use commas to write your number nor use units such as $ or percent sign unless specified otherwise.
+If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise.
+If you are asked for a comma-separated list, apply the above rules depending on whether the element to be put in the list is a number or a string.
 Question: {question}
 Context: {context}
 """
         inputs = self.tokenizer.encode(prompt, return_tensors="pt")
+        # Generate the answer with GPT-2
         outputs = self.model.generate(inputs, max_length=500, num_return_sequences=1, no_repeat_ngram_size=2, early_stopping=True)
+        # Decode the generated answer
         answer = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
+        # Extract the relevant part of the answer
         final_answer = self._extract_final_answer(answer)
         return f"FINAL ANSWER: {final_answer}"
     def _extract_final_answer(self, answer: str) -> str:
         """
+        Extract the relevant part of the generated answer.
         """
         final_answer_start = "FINAL ANSWER:"
         start_idx = answer.find(final_answer_start)
         if start_idx == -1:
             return "Error processing question."
         final_answer = answer[start_idx + len(final_answer_start):].strip()
         return final_answer.strip()
 def run_and_submit_all(profile: gr.OAuthProfile | None):