Update llm_node.py
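Swaps the generation model from HuggingFaceH4/zephyr-7b-beta to the smaller free-tier google/flan-t5-small, caps max_new_tokens at 200 to fit the model's limits, and drops the repetition_penalty argument.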
llm_node.py  CHANGED  +3 -9
```diff
@@ -2,13 +2,10 @@ import os
 from huggingface_hub import InferenceClient
 
 def llm_node(question, search_result):
-    # Initialize the client (no repo_id here!)
     client = InferenceClient(token=os.getenv("HUGGINGFACEHUB_API_TOKEN"))
 
-
-    model_id = "HuggingFaceH4/zephyr-7b-beta"  # You can swap this with e.g., mistralai/Mistral-7B-Instruct-v0.2
+    model_id = "google/flan-t5-small"  # ✅ Small free-tier model
 
-    # Craft the prompt carefully
     prompt = f"""You are solving a GAIA benchmark evaluation question.
 
 Here’s the question:
@@ -24,15 +21,12 @@ Here’s retrieved information:
 
 Your answer:"""
 
-    # Call the model (pass model ID here)
     response = client.text_generation(
         model=model_id,
         prompt=prompt,
-        max_new_tokens=
+        max_new_tokens=200,  # smaller due to model limits
         temperature=0.1,
-        top_p=0.
-        repetition_penalty=1.1
+        top_p=0.9
     )
 
-    # Clean up response text
     return response.strip()
```
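For a quick local check of the updated node, something like the sketch below should work. It assumes HUGGINGFACEHUB_API_TOKEN is exported and llm_node.py is on the import path; the question and search_result values are hypothetical placeholders, not real GAIA inputs.

```python
import os

# Hypothetical smoke test for the updated llm_node.
# Assumes HUGGINGFACEHUB_API_TOKEN is set and llm_node.py is importable.
from llm_node import llm_node

assert os.getenv("HUGGINGFACEHUB_API_TOKEN"), "export HUGGINGFACEHUB_API_TOKEN first"

# Placeholder inputs standing in for a GAIA question and its retrieved context.
question = "In what year did the Eiffel Tower open to the public?"
search_result = "The Eiffel Tower opened to the public on 31 March 1889."

print(llm_node(question, search_result))
```

The tighter max_new_tokens=200 follows the comment in the diff: flan-t5-small has a far smaller generation budget than zephyr-7b-beta, so the old settings would exceed what the free-tier model can serve.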