jdesiree committed on
Commit
56eab31
·
verified ·
1 Parent(s): 62075fe

Model Change

Browse files

Switched to Qwen3-4B-Instruct-2507, a better-fitting model for the anticipated task types.

Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -18,13 +18,13 @@ if "HUGGINGFACEHUB_API_TOKEN" not in os.environ:
18
 
19
  # --- LLM and Template Configuration ---
20
  llm = HuggingFaceEndpoint(
21
- repo_id="HuggingFaceH4/zephyr-7b-alpha", # inference-ready model
22
  temperature=0.7,
23
- max_new_tokens=512,
24
- huggingfacehub_api_token=os.getenv("HUGGINGFACEHUB_API_TOKEN"),
25
- task="conversational"
 
26
  )
27
-
28
  math_template = ChatPromptTemplate.from_messages([
29
  ("system", """{system_message}
30
  You are an expert math tutor. For every math problem:
 
18
 
19
  # --- LLM and Template Configuration ---
20
  llm = HuggingFaceEndpoint(
21
+ repo_id="Qwen/Qwen3-4B-Instruct-2507",
22
  temperature=0.7,
23
+ top_p=0.8,
24
+ top_k=20,
25
+ max_new_tokens=1024,
26
+ huggingfacehub_api_token=os.getenv("HUGGINGFACEHUB_API_TOKEN")
27
  )
 
28
  math_template = ChatPromptTemplate.from_messages([
29
  ("system", """{system_message}
30
  You are an expert math tutor. For every math problem: