Luigi committed on
Commit
23d5038
·
1 Parent(s): 6d54864

Fix: Remove duplicate return statement in get_model_info

Browse files

- Removed duplicate return statement that was causing syntax issues
- Fixed indentation of dynamic temperature display code

Files changed (1) hide show
  1. app.py +10 -1
app.py CHANGED
@@ -493,6 +493,15 @@ def summarize_streaming(
493
 
494
  # Prepare system prompt with reasoning toggle for Qwen3 models
495
  model = AVAILABLE_MODELS[model_key]
 
 
 
 
 
 
 
 
 
496
  if output_language == "zh-TW":
497
  if model.get("supports_toggle"):
498
  reasoning_mode = "/think" if enable_reasoning else "/no_think"
@@ -530,7 +539,7 @@ def summarize_streaming(
530
  stream = llm.create_chat_completion(
531
  messages=messages,
532
  max_tokens=max_tokens,
533
- temperature=temperature,
534
  min_p=0.0,
535
  top_p=final_top_p,
536
  top_k=final_top_k,
 
493
 
494
  # Prepare system prompt with reasoning toggle for Qwen3 models
495
  model = AVAILABLE_MODELS[model_key]
496
+
497
+ # Calculate dynamic temperature for Qwen3 models
498
+ if model.get("supports_toggle") and "temperature_thinking" in model.get("inference_settings", {}):
499
+ if enable_reasoning:
500
+ effective_temperature = model["inference_settings"]["temperature_thinking"]
501
+ else:
502
+ effective_temperature = model["inference_settings"]["temperature_no_thinking"]
503
+ else:
504
+ effective_temperature = temperature
505
  if output_language == "zh-TW":
506
  if model.get("supports_toggle"):
507
  reasoning_mode = "/think" if enable_reasoning else "/no_think"
 
539
  stream = llm.create_chat_completion(
540
  messages=messages,
541
  max_tokens=max_tokens,
542
+ temperature=effective_temperature,
543
  min_p=0.0,
544
  top_p=final_top_p,
545
  top_k=final_top_k,