Proposed Changes

- Replace the default model `moonshotai/Kimi-K2.5` with `Qwen/Qwen3-32B`.
- Remove the provider-specific `extra_body={"thinking": {"type": "disabled"}}` parameter.
- Update the inference examples to use a model that is currently supported through Hugging Face Inference Providers.
- Improve out-of-the-box execution for users running the notebook on Colab or in local environments.

#138
Files changed (1) hide show
  1. unit1/dummy_agent_library.ipynb +1 -5
unit1/dummy_agent_library.ipynb CHANGED
@@ -52,7 +52,7 @@
52
  "except ImportError:\n",
53
  " HF_TOKEN = os.environ.get(\"HF_TOKEN\")\n",
54
  "\n",
55
- "client = InferenceClient(model=\"moonshotai/Kimi-K2.5\", token=HF_TOKEN)"
56
  ]
57
  },
58
  {
@@ -74,7 +74,6 @@
74
  " ],\n",
75
  " stream=False,\n",
76
  " max_tokens=1024,\n",
77
- " extra_body={'thinking': {'type': 'disabled'}},\n",
78
  ")\n",
79
  "print(output.choices[0].message.content)"
80
  ]
@@ -183,7 +182,6 @@
183
  " messages=messages,\n",
184
  " stream=False,\n",
185
  " max_tokens=200,\n",
186
- " extra_body={'thinking': {'type': 'disabled'}},\n",
187
  ")\n",
188
  "print(output.choices[0].message.content)"
189
  ]
@@ -210,7 +208,6 @@
210
  " messages=messages,\n",
211
  " max_tokens=150,\n",
212
  " stop=[\"Observation:\"], # Let's stop before any actual function is called\n",
213
- " extra_body={'thinking': {'type': 'disabled'}},\n",
214
  ")\n",
215
  "\n",
216
  "print(output.choices[0].message.content)"
@@ -261,7 +258,6 @@
261
  " messages=messages,\n",
262
  " stream=False,\n",
263
  " max_tokens=200,\n",
264
- " extra_body={'thinking': {'type': 'disabled'}},\n",
265
  ")\n",
266
  "\n",
267
  "print(output.choices[0].message.content)"
 
52
  "except ImportError:\n",
53
  " HF_TOKEN = os.environ.get(\"HF_TOKEN\")\n",
54
  "\n",
55
+ "client = InferenceClient(model=\"Qwen/Qwen3-32B\", token=HF_TOKEN)"
56
  ]
57
  },
58
  {
 
74
  " ],\n",
75
  " stream=False,\n",
76
  " max_tokens=1024,\n",
 
77
  ")\n",
78
  "print(output.choices[0].message.content)"
79
  ]
 
182
  " messages=messages,\n",
183
  " stream=False,\n",
184
  " max_tokens=200,\n",
 
185
  ")\n",
186
  "print(output.choices[0].message.content)"
187
  ]
 
208
  " messages=messages,\n",
209
  " max_tokens=150,\n",
210
  " stop=[\"Observation:\"], # Let's stop before any actual function is called\n",
 
211
  ")\n",
212
  "\n",
213
  "print(output.choices[0].message.content)"
 
258
  " messages=messages,\n",
259
  " stream=False,\n",
260
  " max_tokens=200,\n",
 
261
  ")\n",
262
  "\n",
263
  "print(output.choices[0].message.content)"