Proposed Changes
- Change the default model from `moonshotai/Kimi-K2.5` to `Qwen/Qwen3-32B`.
- Remove the provider-specific `extra_body={"thinking": {"type": "disabled"}}` parameter.
- Update the inference examples to use a model that is currently supported through Hugging Face Inference Providers.
- Improve out-of-the-box execution for users running the notebook on Colab or in local environments.
#138
by Sourav6991 - opened
unit1/dummy_agent_library.ipynb
CHANGED
|
@@ -52,7 +52,7 @@
|
|
| 52 |
"except ImportError:\n",
|
| 53 |
" HF_TOKEN = os.environ.get(\"HF_TOKEN\")\n",
|
| 54 |
"\n",
|
| 55 |
-
"client = InferenceClient(model=\"moonshotai/Kimi-K2.5\", token=HF_TOKEN)"
|
| 56 |
]
|
| 57 |
},
|
| 58 |
{
|
|
@@ -74,7 +74,6 @@
|
|
| 74 |
" ],\n",
|
| 75 |
" stream=False,\n",
|
| 76 |
" max_tokens=1024,\n",
|
| 77 |
-
" extra_body={'thinking': {'type': 'disabled'}},\n",
|
| 78 |
")\n",
|
| 79 |
"print(output.choices[0].message.content)"
|
| 80 |
]
|
|
@@ -183,7 +182,6 @@
|
|
| 183 |
" messages=messages,\n",
|
| 184 |
" stream=False,\n",
|
| 185 |
" max_tokens=200,\n",
|
| 186 |
-
" extra_body={'thinking': {'type': 'disabled'}},\n",
|
| 187 |
")\n",
|
| 188 |
"print(output.choices[0].message.content)"
|
| 189 |
]
|
|
@@ -210,7 +208,6 @@
|
|
| 210 |
" messages=messages,\n",
|
| 211 |
" max_tokens=150,\n",
|
| 212 |
" stop=[\"Observation:\"], # Let's stop before any actual function is called\n",
|
| 213 |
-
" extra_body={'thinking': {'type': 'disabled'}},\n",
|
| 214 |
")\n",
|
| 215 |
"\n",
|
| 216 |
"print(output.choices[0].message.content)"
|
|
@@ -261,7 +258,6 @@
|
|
| 261 |
" messages=messages,\n",
|
| 262 |
" stream=False,\n",
|
| 263 |
" max_tokens=200,\n",
|
| 264 |
-
" extra_body={'thinking': {'type': 'disabled'}},\n",
|
| 265 |
")\n",
|
| 266 |
"\n",
|
| 267 |
"print(output.choices[0].message.content)"
|
|
|
|
| 52 |
"except ImportError:\n",
|
| 53 |
" HF_TOKEN = os.environ.get(\"HF_TOKEN\")\n",
|
| 54 |
"\n",
|
| 55 |
+
"client = InferenceClient(model=\"Qwen/Qwen3-32B\", token=HF_TOKEN)"
|
| 56 |
]
|
| 57 |
},
|
| 58 |
{
|
|
|
|
| 74 |
" ],\n",
|
| 75 |
" stream=False,\n",
|
| 76 |
" max_tokens=1024,\n",
|
|
|
|
| 77 |
")\n",
|
| 78 |
"print(output.choices[0].message.content)"
|
| 79 |
]
|
|
|
|
| 182 |
" messages=messages,\n",
|
| 183 |
" stream=False,\n",
|
| 184 |
" max_tokens=200,\n",
|
|
|
|
| 185 |
")\n",
|
| 186 |
"print(output.choices[0].message.content)"
|
| 187 |
]
|
|
|
|
| 208 |
" messages=messages,\n",
|
| 209 |
" max_tokens=150,\n",
|
| 210 |
" stop=[\"Observation:\"], # Let's stop before any actual function is called\n",
|
|
|
|
| 211 |
")\n",
|
| 212 |
"\n",
|
| 213 |
"print(output.choices[0].message.content)"
|
|
|
|
| 258 |
" messages=messages,\n",
|
| 259 |
" stream=False,\n",
|
| 260 |
" max_tokens=200,\n",
|
|
|
|
| 261 |
")\n",
|
| 262 |
"\n",
|
| 263 |
"print(output.choices[0].message.content)"
|