Spaces:

peijun1
/

AIstudioProxyAPI

Paused

App Files Files Community

AIstudioProxyAPI / browser_utils /auth_rotation.py

peijun1

Deploy AI Studio Proxy API to Hugging Face Spaces

a5784e9 17 days ago

Raw

History Blame Contribute Delete

32.2 kB

	import asyncio
	import glob
	import json
	import logging
	import os
	import random
	import time
	from datetime import datetime, timedelta
	from typing import Optional

	from playwright.async_api import Page, TimeoutError

	from api_utils.server_state import state
	from api_utils.utils_ext.cooldown_manager import (
	load_cooldown_profiles,
	save_cooldown_profiles,
	)
	from api_utils.utils_ext.usage_tracker import get_profile_usage
	from config import AI_STUDIO_URL_PATTERN
	from config.global_state import GlobalState
	from config.selectors import PROMPT_TEXTAREA_SELECTOR
	from config.settings import (
	AUTO_ROTATE_AUTH_PROFILE,
	HIGH_TRAFFIC_QUEUE_THRESHOLD,
	ROTATION_DEPLETION_GUARD_HIGH_TRAFFIC,
	)
	from config.timeouts import QUOTA_EXCEEDED_COOLDOWN_SECONDS, RATE_LIMIT_COOLDOWN_SECONDS

	logger = logging.getLogger("AuthRotation")

	# Track recently used profiles to avoid rapid cycling/reuse
	# Maps filename -> timestamp of last use
	_USED_PROFILES_HISTORY = {}
	_HISTORY_RETENTION_SECONDS = 3600 * 2 # 2 hours retention for history

	# Profiles currently in cooldown (e.g. due to quota limit)
	# Maps filename -> Dict[model_id, expiry_timestamp] OR filename -> expiry_timestamp (legacy/global)
	_COOLDOWN_PROFILES = load_cooldown_profiles()

	# [FINAL-02] Depletion Guard: Track rotation attempts
	_ROTATION_TIMESTAMPS = []
	_ROTATION_LIMIT_WINDOW = 60 # seconds
	_ROTATION_LIMIT_COUNT = 3 # max attempts per window


	def _normalize_model_id(model_id: str) -> str:
	"""
	Normalize model ID to match cooldown key format.
	Converts "gemini 3 pro preview" to "gemini-3-pro-preview"
	"""
	if not model_id:
	return "default"

	# Convert to lowercase and replace spaces/dots with hyphens
	normalized = model_id.lower()
	normalized = normalized.replace(" ", "-")
	normalized = normalized.replace(".", "-")

	# Handle specific model patterns
	if "gemini" in normalized:
	# Ensure consistent gemini model naming
	if "gemini-1-5-pro" in normalized:
	return "gemini-1.5-pro"
	elif "gemini-2-5-pro" in normalized:
	return "gemini-2.5-pro"
	elif "gemini-3-1-pro" in normalized:
	return "gemini-3.1-pro"
	elif "gemini-3-pro-preview" in normalized:
	return "gemini-3-pro-preview"
	elif "gemini-pro" in normalized:
	return "gemini-pro"

	return normalized


	def _calculate_smart_priority(
	profile_path: str, target_model_id: str, cooldown_dict: dict
	) -> tuple:
	"""
	Calculates a sorting priority for a profile based on 'Efficiency' logic.

	Priority Tuple: (neg_efficiency_score, usage_count, random_factor)
	1. efficiency_score (Higher is better): Count of ACTIVE cooldowns for OTHER models.
	Rationale: Prefer profiles that are already "damaged" (in cooldown) for other models
	but valid for the current target, over "fresh" profiles that can serve everything.
	2. usage_count (Lower is better): Standard wear leveling.
	3. random_factor: Tie-breaker.
	"""
	efficiency_score = 0
	now = time.time()

	# Check cooldown data for this profile
	if profile_path in cooldown_dict:
	data = cooldown_dict[profile_path]
	if isinstance(data, dict):
	# Iterate through model cooldowns
	for model, ts in data.items():
	# Skip global cooldowns (already filtered out) and target model (already filtered out)
	if model == "global":
	continue

	# Check if this model is different from target
	if target_model_id and model == target_model_id:
	continue

	# If cooldown is active for this OTHER model, increase efficiency score
	ts_val = ts.timestamp() if hasattr(ts, "timestamp") else ts
	if ts_val > now:
	efficiency_score += 1

	usage = get_profile_usage(profile_path)

	# Return tuple for sorting:
	# 1. Negative efficiency_score (Ascending sort -> Higher score comes first)
	# 2. Positive usage (Ascending sort -> Lower usage comes first)
	# 3. Random (Ascending sort -> Random tie breaker)
	return (-efficiency_score, usage, random.random())


	def check_profile_cookie_health(profile_path: str) -> dict:
	"""
	Check the health of cookies in an auth profile.

	Returns a dict with:
	- total: total number of cookies
	- expired: number of expired cookies
	- valid: number of valid cookies
	- critical_expired: list of critical expired cookie names (auth-related)
	- health_status: 'healthy', 'warning', or 'critical'
	"""
	result = {
	"total": 0,
	"expired": 0,
	"valid": 0,
	"session": 0,
	"critical_expired": [],
	"health_status": "healthy",
	}

	# Critical cookies that affect authentication
	CRITICAL_COOKIES = {
	"SID",
	"HSID",
	"SSID",
	"APISID",
	"SAPISID",
	"SIDCC",
	"__Secure-1PSID",
	"__Secure-3PSID",
	}

	try:
	with open(profile_path, "r", encoding="utf-8") as f:
	data = json.load(f)

	cookies = data.get("cookies", [])
	result["total"] = len(cookies)
	now = time.time()

	for cookie in cookies:
	name = cookie.get("name", "")
	expires = cookie.get("expires", -1)

	if expires == -1:
	# Session cookie (no expiry)
	result["session"] += 1
	result["valid"] += 1
	elif expires < now:
	# Expired
	result["expired"] += 1
	if name in CRITICAL_COOKIES:
	result["critical_expired"].append(name)
	else:
	# Valid
	result["valid"] += 1

	# Determine health status
	if result["critical_expired"]:
	result["health_status"] = "critical"
	logger.warning(
	f"🔴 Auth profile '{os.path.basename(profile_path)}' has expired critical cookies: {result['critical_expired']}"
	)
	elif result["expired"] > result["total"] * 0.3: # More than 30% expired
	result["health_status"] = "warning"
	logger.warning(
	f"🟡 Auth profile '{os.path.basename(profile_path)}' has {result['expired']}/{result['total']} expired cookies"
	)
	else:
	logger.debug(
	f"🟢 Auth profile '{os.path.basename(profile_path)}' cookie health: {result['valid']}/{result['total']} valid"
	)

	except (json.JSONDecodeError, OSError) as e:
	logger.error(f"Failed to check cookie health for '{profile_path}': {e}")
	result["health_status"] = "error"

	return result


	def _find_best_profile_in_dirs(
	directories: list[str], target_model_id: str = None
	) -> Optional[str]:
	"""
	Finds the best available profile within a given list of directories.
	- Scans for .json files.
	- Excludes profiles in cooldown (Global or Model-Specific).
	- Sorts by usage count (ascending) and then randomly.
	"""
	if not directories or not isinstance(directories, list):
	return None

	logger.info(f"[DEBUG] Scanning directories: {directories}")
	all_profiles = []
	for d in directories:
	if d and isinstance(d, str) and os.path.exists(d):
	files = glob.glob(os.path.join(d, "*.json"))
	logger.info(f"[DEBUG] Found {len(files)} profiles in {d}")
	all_profiles.extend([os.path.abspath(f) for f in files])
	else:
	logger.warning(
	f"[DEBUG] Directory missing or invalid: {d} (Abs: {os.path.abspath(d) if d else 'None'})"
	)

	if not all_profiles:
	logger.warning(f"[DEBUG] No profiles found in {directories}")
	return None

	# Normalize target model ID for cooldown checking
	normalized_target_model = (
	_normalize_model_id(target_model_id) if target_model_id else None
	)
	logger.info(
	f"[DEBUG] Target model: {target_model_id} -> Normalized: {normalized_target_model}"
	)

	# Filter out profiles that don't exist or are in cooldown
	valid_profiles = []
	now = time.time()

	for p in all_profiles:
	if not os.path.exists(p):
	continue

	if p in _COOLDOWN_PROFILES:
	cooldown_data = _COOLDOWN_PROFILES[p]

	# Check if cooldown is active
	is_cooldown_active = False

	if isinstance(cooldown_data, dict):
	# New Format: Dict[model_id, timestamp]
	# Check Global Cooldown
	if "global" in cooldown_data:
	ts = cooldown_data["global"]
	ts_val = ts.timestamp() if hasattr(ts, "timestamp") else ts
	if ts_val > now:
	is_cooldown_active = True

	# Check Specific Model Cooldown
	if not is_cooldown_active and normalized_target_model:
	# Try both the normalized model ID and the original
	for model_key in [
	normalized_target_model,
	target_model_id.lower() if target_model_id else None,
	]:
	if model_key and model_key in cooldown_data:
	ts = cooldown_data[model_key]
	ts_val = ts.timestamp() if hasattr(ts, "timestamp") else ts
	if ts_val > now:
	is_cooldown_active = True
	logger.info(
	f"[DEBUG] Profile {os.path.basename(p)} is in cooldown for model '{model_key}'"
	)
	break
	else:
	# Legacy Format: timestamp direct
	if cooldown_data:
	ts = cooldown_data
	ts_val = ts.timestamp() if hasattr(ts, "timestamp") else ts
	if isinstance(ts_val, (int, float)) and ts_val > now:
	is_cooldown_active = True

	if is_cooldown_active:
	continue

	valid_profiles.append(p)

	if not valid_profiles:
	return None

	# Smart Efficiency Selection Logic:
	# Sort candidates using the smart priority tuple
	# Key: (-efficiency_score, usage, random)
	valid_profiles.sort(
	key=lambda p: _calculate_smart_priority(
	p, normalized_target_model, _COOLDOWN_PROFILES
	)
	)

	logger.info(f"[DEBUG] Best profile selected: {os.path.basename(valid_profiles[0])}")
	return valid_profiles[0]


	def _get_next_profile(target_model_id: str = None) -> Optional[str]:
	"""
	Implements a two-tiered profile selection system: Standard and Emergency.

	Tier 1 (Standard):
	- Scans `auth_profiles/saved` and `auth_profiles/active`.
	- Selects the best profile based on usage and cooldown status.

	Tier 2 (Emergency):
	- If no standard profiles are available, falls back to `auth_profiles/emergency`.
	- Selects the best emergency profile using the same logic.
	"""
	# Ensure the emergency directory exists
	emergency_dir = "auth_profiles/emergency"
	abs_emergency = os.path.abspath(emergency_dir)
	logger.info(f"[DEBUG] Emergency Dir: {emergency_dir} (Absolute: {abs_emergency})")
	os.makedirs(emergency_dir, exist_ok=True)

	# Note: Cooldown cleanup is complex with nested structure.
	# We rely on check-time filtering in _find_best_profile_in_dirs to handle expired entries effectively.

	# --- Tier 1: Standard Profiles ---
	logger.info(
	f"Tier 1: Searching for standard profiles... (Target Model: {target_model_id or 'Any'})"
	)
	# [FIX] Explicitly include emergency profiles in standard rotation scan if they are healthy
	# This ensures we don't artificially ignore valid profiles just because they are in the 'emergency' folder
	# The 'emergency' fallback logic (Tier 2) below is still useful for specific logging or aggressive fallback if needed,
	# but primarily we want to treat all available profiles as candidates.
	standard_dirs = [
	"auth_profiles/saved",
	"auth_profiles/active",
	"auth_profiles/emergency",
	]
	best_profile = _find_best_profile_in_dirs(standard_dirs, target_model_id)

	if best_profile:
	usage_val = get_profile_usage(best_profile)
	logger.info(
	f"🎯 Selected standard profile '{os.path.basename(best_profile)}' with usage: {usage_val}"
	)
	return best_profile

	# --- Tier 2: Emergency Profiles ---
	logger.warning(
	"Tier 1 yielded no profiles. Falling back to Tier 2: Emergency Pool."
	)
	emergency_dirs = [emergency_dir]
	best_emergency_profile = _find_best_profile_in_dirs(emergency_dirs, target_model_id)

	if best_emergency_profile:
	usage_val = get_profile_usage(best_emergency_profile)
	logger.info(
	f"🚨 Selected emergency profile '{os.path.basename(best_emergency_profile)}' with usage: {usage_val}"
	)
	return best_emergency_profile

	logger.error("No available profiles in standard or emergency pools.")
	return None


	async def _perform_canary_test(page: Page) -> bool:
	"""
	Performs a simple check to ensure the new profile is healthy.
	Navigates to the chat page and verifies a key element is present.
	"""
	if not page or page.is_closed():
	logger.warning("⚠️ Canary Test: Page is not available.")
	return False

	# Early exit during shutdown to avoid proxy connection issues
	if GlobalState.IS_SHUTTING_DOWN.is_set():
	logger.info("🔬 Canary Test Skipped: System is shutting down.")
	return True # Return True to allow rotation to complete during shutdown

	try:
	logger.info("🔬 Performing Canary Test on new profile...")
	target_url = f"https://{AI_STUDIO_URL_PATTERN}prompts/new_chat"
	await page.goto(target_url, wait_until="domcontentloaded", timeout=30000)

	# Check for a reliable element that indicates a logged-in state
	await page.wait_for_selector(PROMPT_TEXTAREA_SELECTOR, timeout=15000)

	logger.info("✅ Canary Test Passed: Profile is healthy.")
	return True
	except TimeoutError:
	logger.warning(
	"❌ Canary Test Failed: Timed out waiting for key element. Profile is likely bad."
	)
	return False
	except Exception as e:
	# Special handling for proxy connection errors during shutdown
	if (
	"NS_ERROR_PROXY_CONNECTION_REFUSED" in str(e)
	and GlobalState.IS_SHUTTING_DOWN.is_set()
	):
	logger.info(
	"🔬 Canary Test Skipped: Proxy connection refused during shutdown."
	)
	return True # Allow rotation to complete during shutdown

	logger.error(f"❌ Canary Test Failed: Unexpected error - {e}", exc_info=True)
	return False


	async def perform_auth_rotation(target_model_id: str = None) -> bool:
	"""
	Performs the authentication profile rotation with a soft-swap and canary test.

	Checks AUTO_ROTATE_AUTH_PROFILE environment variable to determine if rotation should proceed.

	1. Acquires Hard Lock (stops requests).
	2. Enters a loop to find a healthy profile.
	3. Selects next profile, puts the old one in cooldown.
	4. Performs a soft-swap of cookies.
	5. Runs a canary test to validate the new profile.
	6. If healthy, breaks the loop and releases the lock.
	7. If unhealthy, adds the profile to cooldown and repeats.
	"""

	# Check if auto-rotation is enabled via environment variable
	if not AUTO_ROTATE_AUTH_PROFILE:
	logger.info(
	"🔒 Auth rotation is disabled via AUTO_ROTATE_AUTH_PROFILE environment variable"
	)
	logger.info("♻️ ROTATION SKIPPED - Auto-rotation disabled")
	logger.info("♻️ =========================================")
	return False

	# [OBS-04] Explicit Rotation Logging with Visual Separators
	logger.info("♻️ =========================================")
	logger.info("♻️ INITIATING AUTH ROTATION")
	logger.info("♻️ =========================================")

	# Avoid re-entry if already rotating (Atomic Check & Wait)
	if not GlobalState.AUTH_ROTATION_LOCK.is_set():
	logger.info(
	"⚠️ Rotation already in progress (Lock is cleared). Waiting for completion..."
	)
	await GlobalState.AUTH_ROTATION_LOCK.wait()
	logger.info("♻️ Rotation skipped - already in progress (Waited for completion)")
	logger.info("♻️ =========================================")
	return True

	# Atomically acquire the lock
	GlobalState.AUTH_ROTATION_LOCK.clear()
	logger.info("🔒 Request processing locked.")

	should_release_lock = True

	try:
	# [FINAL-02] Depletion Guard Check
	global _ROTATION_TIMESTAMPS
	current_time = time.time()

	# Dynamic "Rotation Window" Adjustment
	if GlobalState.queued_request_count > HIGH_TRAFFIC_QUEUE_THRESHOLD:
	effective_rotation_limit = ROTATION_DEPLETION_GUARD_HIGH_TRAFFIC
	logger.info(
	f"High traffic detected ({GlobalState.queued_request_count} queued). Using lenient rotation guard: {effective_rotation_limit}"
	)
	else:
	effective_rotation_limit = _ROTATION_LIMIT_COUNT

	# Filter timestamps within the window, ensuring we only process numeric values
	_ROTATION_TIMESTAMPS = [
	t
	for t in _ROTATION_TIMESTAMPS
	if isinstance(t, (int, float)) and current_time - t < _ROTATION_LIMIT_WINDOW
	]

	if len(_ROTATION_TIMESTAMPS) >= effective_rotation_limit:
	logger.critical(
	f"🚨 CRITICAL: TOO MANY ROTATIONS! (limit: {effective_rotation_limit}) All accounts may be exhausted. Stopping Browser & Locking API."
	)
	logger.critical("♻️ ROTATION ABORTED - System Exhausted")
	logger.critical("♻️ =========================================")

	# SOFT DEPLETION STRATEGY: Avoid hard shutdown to maintain "No Downtime" goal
	logger.critical(
	"🚨 DEPLETION DETECTED: Switching to emergency operation mode"
	)
	logger.critical("🚨 All profiles exhausted, but avoiding hard shutdown")

	# Set emergency mode flag
	GlobalState.DEPLOYMENT_EMERGENCY_MODE = True

	# Try to perform soft profile rotation even during depletion
	# This maintains the "No Downtime" requirement
	try:
	# Attempt one final soft rotation with emergency profiles
	emergency_profile = _find_best_profile_in_dirs(
	["auth_profiles/emergency"]
	)
	if emergency_profile:
	logger.critical("🚨 Attempting emergency profile activation...")
	# Perform minimal soft swap for emergency operation
	if state.page_instance and not state.page_instance.is_closed():
	with open(emergency_profile, "r", encoding="utf-8") as f:
	storage_state = json.load(f)
	context = state.page_instance.context
	await context.clear_cookies()
	await context.add_cookies(storage_state.get("cookies", []))
	logger.critical(
	"🚨 Emergency profile activated - continuing operation"
	)
	return True
	except Exception as e:
	logger.critical(f"🚨 Emergency activation failed: {e}")

	# Only if soft emergency operation fails, then consider partial shutdown
	# But still try to maintain some level of service
	logger.critical(
	"🚨 Entering minimal operation mode - limited service available"
	)

	# PERMANENT LOCK (Do not release GlobalState.AUTH_ROTATION_LOCK)
	# We leave the lock cleared so no new requests can proceed.
	should_release_lock = False
	return False

	# Record this attempt
	_ROTATION_TIMESTAMPS.append(current_time)
	logger.info(
	f"🔄 Rotation attempt #{len(_ROTATION_TIMESTAMPS)} in current window"
	)

	# (Lock is already acquired above)

	max_retries = 5
	failed_attempts = 0

	# Note: Nested try block removed, logic flattened into main try/finally
	while failed_attempts < max_retries:
	# 2. Select next profile
	logger.info("🔍 Selecting next auth profile...")
	next_profile_path = _get_next_profile(target_model_id)

	if not next_profile_path:
	logger.warning("All profiles are on cooldown. Calculating wait time...")

	now = time.time()
	min_expiry = float("inf")

	# Find the soonest expiry time among all cooldown profiles
	for _, cooldown_data in _COOLDOWN_PROFILES.items():
	if isinstance(cooldown_data, dict):
	for ts in cooldown_data.values():
	ts_val = ts.timestamp() if hasattr(ts, "timestamp") else ts
	if ts_val > now and ts_val < min_expiry:
	min_expiry = ts_val
	else: # Legacy timestamp format
	ts_val = (
	cooldown_data.timestamp()
	if hasattr(cooldown_data, "timestamp")
	else cooldown_data
	)
	if (
	isinstance(ts_val, (int, float))
	and ts_val > now
	and ts_val < min_expiry
	):
	min_expiry = ts_val

	if min_expiry != float("inf"):
	# Add a small buffer to avoid timing issues
	wait_time = (min_expiry - now) + 1
	if wait_time > 0:
	logger.info(
	f"🕒 Waiting for {wait_time:.2f} seconds for the next profile to become available."
	)
	await asyncio.sleep(wait_time)

	# Retry getting the profile
	logger.info("Retrying to get next profile after waiting.")
	next_profile_path = _get_next_profile(target_model_id)

	# Final check after waiting
	if not next_profile_path:
	logger.critical(
	"❌ Rotation Failed: No available auth profiles found even after waiting!"
	)
	logger.critical("♻️ ROTATION FAILED - No profiles available")
	logger.critical("♻️ =========================================")
	return False

	# Always place the previous profile on cooldown on the first attempt
	if failed_attempts == 0:
	old_profile = getattr(state, "current_auth_profile_path", "unknown")
	if old_profile != "unknown" and os.path.exists(old_profile):
	# Calculate cooldown based on error type
	error_type = GlobalState.last_error_type

	# Ensure existing entry is a dict if it exists
	if old_profile not in _COOLDOWN_PROFILES or not isinstance(
	_COOLDOWN_PROFILES[old_profile], dict
	):
	_COOLDOWN_PROFILES[old_profile] = {}

	expiry_ts = (
	datetime.now()
	+ timedelta(seconds=QUOTA_EXCEEDED_COOLDOWN_SECONDS)
	).timestamp()
	rate_limit_ts = (
	datetime.now() + timedelta(seconds=RATE_LIMIT_COOLDOWN_SECONDS)
	).timestamp()

	if error_type == "RATE_LIMIT":
	# Rate Limit -> Global Cooldown
	_COOLDOWN_PROFILES[old_profile]["global"] = rate_limit_ts
	logger.info(
	f"❄️ Placing profile in GLOBAL cooldown for {RATE_LIMIT_COOLDOWN_SECONDS}s (Rate Limit)."
	)
	else:
	# Quota Exceeded -> Model Specific Cooldowns

	# 1. Identify models to cooldown
	models_to_cooldown = set(
	GlobalState.current_profile_exhausted_models
	)
	logger.info(
	f"🔍 Model cooldown analysis: exhausted_models={GlobalState.current_profile_exhausted_models}, target_model={target_model_id}"
	)

	# 2. Ensure target/current model is included if appropriate
	# If a specific target was requested, it's likely the one failing
	if target_model_id:
	models_to_cooldown.add(target_model_id.lower())

	# 3. Fallback: Only use "default" as absolute last resort
	# Prioritize target_model_id and avoid unnecessary "default" entries
	if not models_to_cooldown:
	if target_model_id:
	models_to_cooldown.add(target_model_id.lower())
	logger.info(
	f"🔍 Using target_model_id as fallback: {target_model_id}"
	)
	elif state.current_ai_studio_model_id:
	models_to_cooldown.add(
	state.current_ai_studio_model_id.lower()
	)
	logger.info(
	f"🔍 Using state.current_ai_studio_model_id as fallback: {state.current_ai_studio_model_id}"
	)
	else:
	# Only use "default" if we truly cannot identify any model
	logger.warning(
	"⚠️ Unable to identify specific model, falling back to 'default'. This should be rare."
	)
	models_to_cooldown.add("default")

	# 4. Apply cooldowns
	logger.info(
	f"🎯 Applying cooldown to models: {list(models_to_cooldown)}"
	)
	for m_id in models_to_cooldown:
	_COOLDOWN_PROFILES[old_profile][m_id] = expiry_ts
	logger.info(
	f"❄️ Placing profile in cooldown for model '{m_id}' for {QUOTA_EXCEEDED_COOLDOWN_SECONDS}s."
	)

	save_cooldown_profiles(_COOLDOWN_PROFILES)

	new_profile_name = os.path.basename(next_profile_path)
	logger.info(f"👉 Attempting to rotate to profile: {new_profile_name}")

	# Update global state for the new profile path
	state.current_auth_profile_path = next_profile_path
	os.environ["ACTIVE_AUTH_JSON_PATH"] = next_profile_path

	# 3. Soft Context Swap
	logger.info("🚀 Performing Soft Context Swap...")
	if not state.page_instance or state.page_instance.is_closed():
	logger.error(
	"❌ Page instance not found or closed, cannot perform soft swap."
	)
	return False

	try:
	try:
	with open(next_profile_path, "r", encoding="utf-8") as f:
	storage_state = json.load(f)
	except (json.JSONDecodeError, OSError) as json_err:
	logger.error(
	f"❌ Corrupt or inaccessible profile file '{new_profile_name}': {json_err}"
	)
	# Treat as a failed attempt, will trigger cooldown logic in outer except/continue
	raise

	if not isinstance(storage_state, dict):
	raise ValueError(f"Invalid profile format in '{new_profile_name}'")

	context = state.page_instance.context
	await context.clear_cookies()
	await context.add_cookies(storage_state.get("cookies", []))
	logger.info("✅ Injected new cookies.")

	# 4. Perform Canary Test
	if await _perform_canary_test(state.page_instance):
	# Healthy profile found, break the loop
	GlobalState.reset_quota_status()
	# GlobalState.current_profile_token_count = 0 # Removed: handled by reset_quota_status
	logger.info(
	f"♻️ ROTATION SUCCESSFUL with profile: {new_profile_name}"
	)
	logger.info("♻️ =========================================")
	return True
	else:
	# Canary test failed, profile is bad
	logger.warning(
	f" Canary test failed for {new_profile_name}. Adding to cooldown and retrying."
	)
	failed_attempts += 1

	# Place failed profile in cooldown immediately
	expiry_time = datetime.now() + timedelta(
	seconds=QUOTA_EXCEEDED_COOLDOWN_SECONDS
	)
	_COOLDOWN_PROFILES[next_profile_path] = expiry_time
	save_cooldown_profiles(_COOLDOWN_PROFILES)
	logger.info(
	f"❄️ Placing unhealthy profile '{new_profile_name}' in cooldown for {QUOTA_EXCEEDED_COOLDOWN_SECONDS}s."
	)
	continue # Try next profile

	except Exception as swap_err:
	logger.error(
	f"❌ Failed to perform soft swap for {new_profile_name}: {swap_err}"
	)
	failed_attempts += 1
	# Also place this profile on cooldown
	expiry_time = datetime.now() + timedelta(
	seconds=QUOTA_EXCEEDED_COOLDOWN_SECONDS
	)
	_COOLDOWN_PROFILES[next_profile_path] = expiry_time
	save_cooldown_profiles(_COOLDOWN_PROFILES)
	logger.info(
	f"❄️ Placing swap-failed profile '{new_profile_name}' in cooldown."
	)
	continue

	# If loop finishes without success
	logger.critical(
	f"🚨 ROTATION FAILED: All {max_retries} attempts to find a healthy profile failed."
	)
	return False
	except Exception as e:
	logger.error(
	f"❌ Unexpected error during auth rotation loop: {e}", exc_info=True
	)
	logger.error("♻️ ROTATION FAILED - Unexpected error")
	logger.error("♻️ =========================================")
	return False
	finally:
	# 5. Release lock (if not permanently locked)
	if should_release_lock:
	GlobalState.AUTH_ROTATION_LOCK.set()
	logger.info("🔓 Request processing unlocked.")
	logger.info("♻️ Rotation flow completed")
	logger.info("♻️ =========================================")