Peter Larnholt committed on
Commit
80b0386
·
1 Parent(s): 55381a2

Remove --enable-auto-tool-choice flag (Qwen has native tool calling)

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -26,7 +26,7 @@ VLLM_ARGS = [
26
  "--max-model-len", "8192", # fits A10G 24GB
27
  "--gpu-memory-utilization", "0.90",
28
  "--trust-remote-code",
29
- "--enable-auto-tool-choice", # Enable automatic tool selection
30
  ]
31
  if "AWQ" in MODEL_ID.upper():
32
  VLLM_ARGS += ["--quantization", "awq_marlin"] # faster AWQ kernel if available
 
26
  "--max-model-len", "8192", # fits A10G 24GB
27
  "--gpu-memory-utilization", "0.90",
28
  "--trust-remote-code",
29
+ # Qwen 2.5 has native tool calling - no parser override needed
30
  ]
31
  if "AWQ" in MODEL_ID.upper():
32
  VLLM_ARGS += ["--quantization", "awq_marlin"] # faster AWQ kernel if available