Spaces:

DocSA
/

LP_2-AI_Assistant

Sleeping

App Files Community

DocUA committed on Mar 3

Commit

28552c9

1 Parent(s): 09efcd1

Re-enable extended thinking for Claude Haiku 4.5 models

Browse files

Files changed (1) hide show

main.py +19 -23

main.py CHANGED Viewed

@@ -995,30 +995,26 @@ def generate_legal_position(
             # Add thinking config if enabled
             if thinking_enabled and "claude" in model_name.lower():
-                # Claude Haiku typically does not support thinking mode
-                if "haiku" in model_name.lower():
-                    print(f"[WARNING] Thinking mode is not supported for Haiku models. Disabling thinking for {model_name}.")
                 else:
-                    # For Claude 4.6 models, we can use Adaptive
-                    if thinking_type.lower() == "adaptive" and "-4-6" in str(model_name).lower():
-                        message_params["thinking"] = {"type": "adaptive"}
-                        message_params["temperature"] = 1.0
-                    else:
-                        # 'Enabled' type works for both 4.5 and 4.6 models
-                        budget = max(1024, int(thinking_budget))
-                        # Anthropic REQUIRES max_tokens > budget_tokens.
-                        # If the user sets a low max_tokens (e.g. 4000) and high budget (10000), it will fail.
-                        if message_params["max_tokens"] <= budget:
-                            recommended_max = budget + 4000
-                            print(f"[WARNING] max_tokens ({message_params['max_tokens']}) is <= thinking_budget ({budget}). Increasing max_tokens to {recommended_max}.")
-                            message_params["max_tokens"] = recommended_max
-                        message_params["thinking"] = {
-                            "type": "enabled",
-                            "budget_tokens": budget
-                        }
-                        message_params["temperature"] = 1.0
             # Log full prompts in debug mode
             _log_prompt("anthropic", model_name, system_prompt, content)

             # Add thinking config if enabled
             if thinking_enabled and "claude" in model_name.lower():
+                # For Claude 4.6 models, we can use Adaptive
+                if thinking_type.lower() == "adaptive" and "-4-6" in str(model_name).lower():
+                    message_params["thinking"] = {"type": "adaptive"}
+                    message_params["temperature"] = 1.0
                 else:
+                    # 'Enabled' type works for both 4.5 and 4.6 models
+                    budget = max(1024, int(thinking_budget))
+                    # Anthropic REQUIRES max_tokens > budget_tokens.
+                    # If the user sets a low max_tokens (e.g. 4000) and high budget (10000), it will fail.
+                    if message_params["max_tokens"] <= budget:
+                        recommended_max = budget + 4000
+                        print(f"[WARNING] max_tokens ({message_params['max_tokens']}) is <= thinking_budget ({budget}). Increasing max_tokens to {recommended_max}.")
+                        message_params["max_tokens"] = recommended_max
+                    message_params["thinking"] = {
+                        "type": "enabled",
+                        "budget_tokens": budget
+                    }
+                    message_params["temperature"] = 1.0
             # Log full prompts in debug mode
             _log_prompt("anthropic", model_name, system_prompt, content)