Spaces:
Paused
fix(logging): preserve full credential filenames in logs
Resolved logging truncation issue where OAuth credential filenames were
being aggressively abbreviated (e.g., `...6.json` instead of
`antigravity_oauth_16.json`), causing ambiguity when debugging or
auditing specific credentials.
**Changes:**
- Enhanced `mask_credential()` utility in error_handler.py:
- Now explicitly detects `.json` file extensions
- Returns full basename for file paths (e.g., `antigravity_oauth_16.json`)
- Maintains security by masking API keys to last 6 characters (`...xyz123`)
- Replaced all manual credential truncation with centralized `mask_credential()`:
- client.py: 15 instances (stream handling, retry logging, model discovery)
- usage_manager.py: 16 instances (key acquisition, release, cooldown tracking)
- failure_logger.py: 2 instances (failure logging and summaries)
- Code quality improvements:
- Fixed indentation error in client.py during refactoring
- Ensured consistent, safe credential logging across entire application
- Configuration:
- Added `oauth_creds/` to .gitignore to prevent accidental credential commits
**Impact:**
This standardizes credential display throughout the application, enabling
accurate debugging and auditing while maintaining security for raw API keys.
Logs now clearly distinguish between multiple OAuth files (e.g., `6.json`
vs `16.json`) without exposing sensitive key material.
**Files Modified:**
- .gitignore (added oauth_creds exclusion)
- src/rotator_library/client.py (15 replacements)
- src/rotator_library/error_handler.py (enhanced mask_credential logic)
- src/rotator_library/failure_logger.py (2 replacements)
- src/rotator_library/usage_manager.py (16 replacements)
- .gitignore +2 -0
- src/rotator_library/client.py +16 -24
- src/rotator_library/error_handler.py +1 -1
- src/rotator_library/failure_logger.py +3 -2
- src/rotator_library/usage_manager.py +16 -16
|
@@ -128,3 +128,5 @@ cache/antigravity/thought_signatures.json
|
|
| 128 |
logs/
|
| 129 |
cache/
|
| 130 |
*.env
|
|
|
|
|
|
|
|
|
| 128 |
logs/
|
| 129 |
cache/
|
| 130 |
*.env
|
| 131 |
+
|
| 132 |
+
oauth_creds
|
|
@@ -537,7 +537,7 @@ class RotatingClient:
|
|
| 537 |
while True:
|
| 538 |
if request and await request.is_disconnected():
|
| 539 |
lib_logger.info(
|
| 540 |
-
f"Client disconnected. Aborting stream for credential
|
| 541 |
)
|
| 542 |
break
|
| 543 |
|
|
@@ -695,7 +695,7 @@ class RotatingClient:
|
|
| 695 |
# Catch any other unexpected errors during streaming.
|
| 696 |
lib_logger.error(f"Caught unexpected exception of type: {type(e).__name__}")
|
| 697 |
lib_logger.error(
|
| 698 |
-
f"An unexpected error occurred during the stream for credential
|
| 699 |
)
|
| 700 |
# We still need to raise it so the client knows something went wrong.
|
| 701 |
raise
|
|
@@ -705,7 +705,7 @@ class RotatingClient:
|
|
| 705 |
# The primary goal is to ensure usage is always logged internally.
|
| 706 |
await self.usage_manager.release_key(key, model)
|
| 707 |
lib_logger.info(
|
| 708 |
-
f"STREAM FINISHED and lock released for credential
|
| 709 |
)
|
| 710 |
|
| 711 |
# Only send [DONE] if the stream completed naturally and the client is still there.
|
|
@@ -1006,7 +1006,7 @@ class RotatingClient:
|
|
| 1006 |
for attempt in range(self.max_retries):
|
| 1007 |
try:
|
| 1008 |
lib_logger.info(
|
| 1009 |
-
f"Attempting call with credential
|
| 1010 |
)
|
| 1011 |
|
| 1012 |
if pre_request_callback:
|
|
@@ -1495,9 +1495,9 @@ class RotatingClient:
|
|
| 1495 |
for attempt in range(self.max_retries):
|
| 1496 |
try:
|
| 1497 |
lib_logger.info(
|
| 1498 |
-
f"Attempting stream with credential
|
| 1499 |
)
|
| 1500 |
-
|
| 1501 |
if pre_request_callback:
|
| 1502 |
try:
|
| 1503 |
await pre_request_callback(
|
|
@@ -1518,7 +1518,7 @@ class RotatingClient:
|
|
| 1518 |
)
|
| 1519 |
|
| 1520 |
lib_logger.info(
|
| 1521 |
-
f"Stream connection established for credential
|
| 1522 |
)
|
| 1523 |
|
| 1524 |
key_acquired = False
|
|
@@ -1735,7 +1735,7 @@ class RotatingClient:
|
|
| 1735 |
for attempt in range(self.max_retries):
|
| 1736 |
try:
|
| 1737 |
lib_logger.info(
|
| 1738 |
-
f"Attempting stream with credential
|
| 1739 |
)
|
| 1740 |
|
| 1741 |
if pre_request_callback:
|
|
@@ -1763,7 +1763,7 @@ class RotatingClient:
|
|
| 1763 |
)
|
| 1764 |
|
| 1765 |
lib_logger.info(
|
| 1766 |
-
f"Stream connection established for credential
|
| 1767 |
)
|
| 1768 |
|
| 1769 |
key_acquired = False
|
|
@@ -1935,7 +1935,7 @@ class RotatingClient:
|
|
| 1935 |
|
| 1936 |
if attempt >= self.max_retries - 1:
|
| 1937 |
lib_logger.warning(
|
| 1938 |
-
f"Credential
|
| 1939 |
)
|
| 1940 |
# [MODIFIED] Do not yield to the client here.
|
| 1941 |
break
|
|
@@ -1951,7 +1951,7 @@ class RotatingClient:
|
|
| 1951 |
break
|
| 1952 |
|
| 1953 |
lib_logger.warning(
|
| 1954 |
-
f"Credential
|
| 1955 |
)
|
| 1956 |
await asyncio.sleep(wait_time)
|
| 1957 |
continue
|
|
@@ -1977,7 +1977,7 @@ class RotatingClient:
|
|
| 1977 |
)
|
| 1978 |
|
| 1979 |
lib_logger.warning(
|
| 1980 |
-
f"Credential
|
| 1981 |
)
|
| 1982 |
|
| 1983 |
# Handle rate limits with cooldown
|
|
@@ -2179,13 +2179,9 @@ class RotatingClient:
|
|
| 2179 |
for credential in shuffled_credentials:
|
| 2180 |
try:
|
| 2181 |
# Display last 6 chars for API keys, or the filename for OAuth paths
|
| 2182 |
-
cred_display = (
|
| 2183 |
-
credential[-6:]
|
| 2184 |
-
if not os.path.isfile(credential)
|
| 2185 |
-
else os.path.basename(credential)
|
| 2186 |
-
)
|
| 2187 |
lib_logger.debug(
|
| 2188 |
-
f"Attempting to get models for {provider} with credential
|
| 2189 |
)
|
| 2190 |
models = await provider_instance.get_models(
|
| 2191 |
credential, self.http_client
|
|
@@ -2216,13 +2212,9 @@ class RotatingClient:
|
|
| 2216 |
return final_models
|
| 2217 |
except Exception as e:
|
| 2218 |
classified_error = classify_error(e)
|
| 2219 |
-
cred_display = (
|
| 2220 |
-
credential[-6:]
|
| 2221 |
-
if not os.path.isfile(credential)
|
| 2222 |
-
else os.path.basename(credential)
|
| 2223 |
-
)
|
| 2224 |
lib_logger.debug(
|
| 2225 |
-
f"Failed to get models for provider {provider} with credential
|
| 2226 |
)
|
| 2227 |
continue # Try the next credential
|
| 2228 |
|
|
|
|
| 537 |
while True:
|
| 538 |
if request and await request.is_disconnected():
|
| 539 |
lib_logger.info(
|
| 540 |
+
f"Client disconnected. Aborting stream for credential {mask_credential(key)}."
|
| 541 |
)
|
| 542 |
break
|
| 543 |
|
|
|
|
| 695 |
# Catch any other unexpected errors during streaming.
|
| 696 |
lib_logger.error(f"Caught unexpected exception of type: {type(e).__name__}")
|
| 697 |
lib_logger.error(
|
| 698 |
+
f"An unexpected error occurred during the stream for credential {mask_credential(key)}: {e}"
|
| 699 |
)
|
| 700 |
# We still need to raise it so the client knows something went wrong.
|
| 701 |
raise
|
|
|
|
| 705 |
# The primary goal is to ensure usage is always logged internally.
|
| 706 |
await self.usage_manager.release_key(key, model)
|
| 707 |
lib_logger.info(
|
| 708 |
+
f"STREAM FINISHED and lock released for credential {mask_credential(key)}."
|
| 709 |
)
|
| 710 |
|
| 711 |
# Only send [DONE] if the stream completed naturally and the client is still there.
|
|
|
|
| 1006 |
for attempt in range(self.max_retries):
|
| 1007 |
try:
|
| 1008 |
lib_logger.info(
|
| 1009 |
+
f"Attempting call with credential {mask_credential(current_cred)} (Attempt {attempt + 1}/{self.max_retries})"
|
| 1010 |
)
|
| 1011 |
|
| 1012 |
if pre_request_callback:
|
|
|
|
| 1495 |
for attempt in range(self.max_retries):
|
| 1496 |
try:
|
| 1497 |
lib_logger.info(
|
| 1498 |
+
f"Attempting stream with credential {mask_credential(current_cred)} (Attempt {attempt + 1}/{self.max_retries})"
|
| 1499 |
)
|
| 1500 |
+
|
| 1501 |
if pre_request_callback:
|
| 1502 |
try:
|
| 1503 |
await pre_request_callback(
|
|
|
|
| 1518 |
)
|
| 1519 |
|
| 1520 |
lib_logger.info(
|
| 1521 |
+
f"Stream connection established for credential {mask_credential(current_cred)}. Processing response."
|
| 1522 |
)
|
| 1523 |
|
| 1524 |
key_acquired = False
|
|
|
|
| 1735 |
for attempt in range(self.max_retries):
|
| 1736 |
try:
|
| 1737 |
lib_logger.info(
|
| 1738 |
+
f"Attempting stream with credential {mask_credential(current_cred)} (Attempt {attempt + 1}/{self.max_retries})"
|
| 1739 |
)
|
| 1740 |
|
| 1741 |
if pre_request_callback:
|
|
|
|
| 1763 |
)
|
| 1764 |
|
| 1765 |
lib_logger.info(
|
| 1766 |
+
f"Stream connection established for credential {mask_credential(current_cred)}. Processing response."
|
| 1767 |
)
|
| 1768 |
|
| 1769 |
key_acquired = False
|
|
|
|
| 1935 |
|
| 1936 |
if attempt >= self.max_retries - 1:
|
| 1937 |
lib_logger.warning(
|
| 1938 |
+
f"Credential {mask_credential(current_cred)} failed after max retries for model {model} due to a server error. Rotating key silently."
|
| 1939 |
)
|
| 1940 |
# [MODIFIED] Do not yield to the client here.
|
| 1941 |
break
|
|
|
|
| 1951 |
break
|
| 1952 |
|
| 1953 |
lib_logger.warning(
|
| 1954 |
+
f"Credential {mask_credential(current_cred)} encountered a server error for model {model}. Reason: '{error_message_text}'. Retrying in {wait_time:.2f}s."
|
| 1955 |
)
|
| 1956 |
await asyncio.sleep(wait_time)
|
| 1957 |
continue
|
|
|
|
| 1977 |
)
|
| 1978 |
|
| 1979 |
lib_logger.warning(
|
| 1980 |
+
f"Credential {mask_credential(current_cred)} failed with {classified_error.error_type} (Status: {classified_error.status_code}). Error: {error_message_text}."
|
| 1981 |
)
|
| 1982 |
|
| 1983 |
# Handle rate limits with cooldown
|
|
|
|
| 2179 |
for credential in shuffled_credentials:
|
| 2180 |
try:
|
| 2181 |
# Display last 6 chars for API keys, or the filename for OAuth paths
|
| 2182 |
+
cred_display = mask_credential(credential)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2183 |
lib_logger.debug(
|
| 2184 |
+
f"Attempting to get models for {provider} with credential {cred_display}"
|
| 2185 |
)
|
| 2186 |
models = await provider_instance.get_models(
|
| 2187 |
credential, self.http_client
|
|
|
|
| 2212 |
return final_models
|
| 2213 |
except Exception as e:
|
| 2214 |
classified_error = classify_error(e)
|
| 2215 |
+
cred_display = mask_credential(credential)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2216 |
lib_logger.debug(
|
| 2217 |
+
f"Failed to get models for provider {provider} with credential {cred_display}: {classified_error.error_type}. Trying next credential."
|
| 2218 |
)
|
| 2219 |
continue # Try the next credential
|
| 2220 |
|
|
@@ -112,7 +112,7 @@ def mask_credential(credential: str) -> str:
|
|
| 112 |
- For API keys: shows last 6 characters (e.g., "...xyz123")
|
| 113 |
- For OAuth file paths: shows just the filename (e.g., "antigravity_oauth_1.json")
|
| 114 |
"""
|
| 115 |
-
if os.path.isfile(credential):
|
| 116 |
return os.path.basename(credential)
|
| 117 |
elif len(credential) > 6:
|
| 118 |
return f"...{credential[-6:]}"
|
|
|
|
| 112 |
- For API keys: shows last 6 characters (e.g., "...xyz123")
|
| 113 |
- For OAuth file paths: shows just the filename (e.g., "antigravity_oauth_1.json")
|
| 114 |
"""
|
| 115 |
+
if os.path.isfile(credential) or credential.endswith(".json"):
|
| 116 |
return os.path.basename(credential)
|
| 117 |
elif len(credential) > 6:
|
| 118 |
return f"...{credential[-6:]}"
|
|
@@ -3,6 +3,7 @@ import json
|
|
| 3 |
from logging.handlers import RotatingFileHandler
|
| 4 |
import os
|
| 5 |
from datetime import datetime
|
|
|
|
| 6 |
|
| 7 |
|
| 8 |
def setup_failure_logger():
|
|
@@ -133,7 +134,7 @@ def log_failure(
|
|
| 133 |
|
| 134 |
detailed_log_data = {
|
| 135 |
"timestamp": datetime.utcnow().isoformat(),
|
| 136 |
-
"api_key_ending":
|
| 137 |
"model": model,
|
| 138 |
"attempt_number": attempt,
|
| 139 |
"error_type": type(error).__name__,
|
|
@@ -148,7 +149,7 @@ def log_failure(
|
|
| 148 |
|
| 149 |
# 2. Log a concise summary to the main library logger, which will propagate
|
| 150 |
summary_message = (
|
| 151 |
-
f"API call failed for model {model} with key
|
| 152 |
f"Error: {type(error).__name__}. See failures.log for details."
|
| 153 |
)
|
| 154 |
main_lib_logger.error(summary_message)
|
|
|
|
| 3 |
from logging.handlers import RotatingFileHandler
|
| 4 |
import os
|
| 5 |
from datetime import datetime
|
| 6 |
+
from .error_handler import mask_credential
|
| 7 |
|
| 8 |
|
| 9 |
def setup_failure_logger():
|
|
|
|
| 134 |
|
| 135 |
detailed_log_data = {
|
| 136 |
"timestamp": datetime.utcnow().isoformat(),
|
| 137 |
+
"api_key_ending": mask_credential(api_key),
|
| 138 |
"model": model,
|
| 139 |
"attempt_number": attempt,
|
| 140 |
"error_type": type(error).__name__,
|
|
|
|
| 149 |
|
| 150 |
# 2. Log a concise summary to the main library logger, which will propagate
|
| 151 |
summary_message = (
|
| 152 |
+
f"API call failed for model {model} with key {mask_credential(api_key)}. "
|
| 153 |
f"Error: {type(error).__name__}. See failures.log for details."
|
| 154 |
)
|
| 155 |
main_lib_logger.error(summary_message)
|
|
@@ -9,7 +9,7 @@ from typing import Any, Dict, List, Optional, Set
|
|
| 9 |
import aiofiles
|
| 10 |
import litellm
|
| 11 |
|
| 12 |
-
from .error_handler import ClassifiedError, NoAvailableKeysError
|
| 13 |
from .providers import PROVIDER_PLUGINS
|
| 14 |
|
| 15 |
lib_logger = logging.getLogger("rotator_library")
|
|
@@ -139,7 +139,7 @@ class UsageManager:
|
|
| 139 |
last_reset_dt is None
|
| 140 |
or last_reset_dt < reset_threshold_today <= now_utc
|
| 141 |
):
|
| 142 |
-
lib_logger.debug(f"Performing daily reset for key
|
| 143 |
needs_saving = True
|
| 144 |
|
| 145 |
# Reset cooldowns
|
|
@@ -237,7 +237,7 @@ class UsageManager:
|
|
| 237 |
if lib_logger.isEnabledFor(logging.DEBUG):
|
| 238 |
total_weight = sum(weights)
|
| 239 |
weight_info = ", ".join(
|
| 240 |
-
f"
|
| 241 |
for (cred, _), w in zip(candidates, weights)
|
| 242 |
)
|
| 243 |
#lib_logger.debug(f"Weighted selection candidates: {weight_info}")
|
|
@@ -358,7 +358,7 @@ class UsageManager:
|
|
| 358 |
if not state["models_in_use"]:
|
| 359 |
state["models_in_use"][model] = 1
|
| 360 |
lib_logger.info(
|
| 361 |
-
f"Acquired Priority-{priority_level} Tier-1 key
|
| 362 |
f"(selection: {selection_method}, usage: {usage})"
|
| 363 |
)
|
| 364 |
return key
|
|
@@ -371,7 +371,7 @@ class UsageManager:
|
|
| 371 |
if current_count < max_concurrent:
|
| 372 |
state["models_in_use"][model] = current_count + 1
|
| 373 |
lib_logger.info(
|
| 374 |
-
f"Acquired Priority-{priority_level} Tier-2 key
|
| 375 |
f"(selection: {selection_method}, concurrent: {state['models_in_use'][model]}/{max_concurrent}, usage: {usage})"
|
| 376 |
)
|
| 377 |
return key
|
|
@@ -452,7 +452,7 @@ class UsageManager:
|
|
| 452 |
if not state["models_in_use"]:
|
| 453 |
state["models_in_use"][model] = 1
|
| 454 |
lib_logger.info(
|
| 455 |
-
f"Acquired Tier 1 key
|
| 456 |
f"(selection: {selection_method}, usage: {usage})"
|
| 457 |
)
|
| 458 |
return key
|
|
@@ -465,7 +465,7 @@ class UsageManager:
|
|
| 465 |
if current_count < max_concurrent:
|
| 466 |
state["models_in_use"][model] = current_count + 1
|
| 467 |
lib_logger.info(
|
| 468 |
-
f"Acquired Tier 2 key
|
| 469 |
f"(selection: {selection_method}, concurrent: {state['models_in_use'][model]}/{max_concurrent}, usage: {usage})"
|
| 470 |
)
|
| 471 |
return key
|
|
@@ -521,12 +521,12 @@ class UsageManager:
|
|
| 521 |
if remaining <= 0:
|
| 522 |
del state["models_in_use"][model] # Clean up when count reaches 0
|
| 523 |
lib_logger.info(
|
| 524 |
-
f"Released credential
|
| 525 |
f"(remaining concurrent: {max(0, remaining)})"
|
| 526 |
)
|
| 527 |
else:
|
| 528 |
lib_logger.warning(
|
| 529 |
-
f"Attempted to release credential
|
| 530 |
)
|
| 531 |
|
| 532 |
# Notify all tasks waiting on this key's condition
|
|
@@ -589,7 +589,7 @@ class UsageManager:
|
|
| 589 |
usage, "completion_tokens", 0
|
| 590 |
) # Not present in embedding responses
|
| 591 |
lib_logger.info(
|
| 592 |
-
f"Recorded usage from response object for key
|
| 593 |
)
|
| 594 |
try:
|
| 595 |
provider_name = model.split("/")[0]
|
|
@@ -681,14 +681,14 @@ class UsageManager:
|
|
| 681 |
# Rate limit errors: use retry_after if available, otherwise default to 60s
|
| 682 |
cooldown_seconds = classified_error.retry_after or 60
|
| 683 |
lib_logger.info(
|
| 684 |
-
f"Rate limit error on key
|
| 685 |
f"Using {'provided' if classified_error.retry_after else 'default'} retry_after: {cooldown_seconds}s"
|
| 686 |
)
|
| 687 |
elif classified_error.error_type == "authentication":
|
| 688 |
# Apply a 5-minute key-level lockout for auth errors
|
| 689 |
key_data["key_cooldown_until"] = time.time() + 300
|
| 690 |
lib_logger.warning(
|
| 691 |
-
f"Authentication error on key
|
| 692 |
)
|
| 693 |
# Auth errors still use escalating backoff for the specific model
|
| 694 |
cooldown_seconds = 300 # 5 minutes for model cooldown
|
|
@@ -707,7 +707,7 @@ class UsageManager:
|
|
| 707 |
backoff_tiers = {1: 10, 2: 30, 3: 60, 4: 120}
|
| 708 |
cooldown_seconds = backoff_tiers.get(count, 7200) # Default to 2 hours for "spent" keys
|
| 709 |
lib_logger.warning(
|
| 710 |
-
f"Failure #{count} for key
|
| 711 |
f"Error type: {classified_error.error_type}"
|
| 712 |
)
|
| 713 |
else:
|
|
@@ -715,7 +715,7 @@ class UsageManager:
|
|
| 715 |
if cooldown_seconds is None:
|
| 716 |
cooldown_seconds = 30 # 30s cooldown for provider issues
|
| 717 |
lib_logger.info(
|
| 718 |
-
f"Provider-level error ({classified_error.error_type}) for key
|
| 719 |
f"NOT incrementing consecutive failures. Applying {cooldown_seconds}s cooldown."
|
| 720 |
)
|
| 721 |
|
|
@@ -723,7 +723,7 @@ class UsageManager:
|
|
| 723 |
model_cooldowns = key_data.setdefault("model_cooldowns", {})
|
| 724 |
model_cooldowns[model] = time.time() + cooldown_seconds
|
| 725 |
lib_logger.warning(
|
| 726 |
-
f"Cooldown applied for key
|
| 727 |
f"Error type: {classified_error.error_type}"
|
| 728 |
)
|
| 729 |
|
|
@@ -750,5 +750,5 @@ class UsageManager:
|
|
| 750 |
if long_term_lockout_models >= 3:
|
| 751 |
key_data["key_cooldown_until"] = now + 300 # 5-minute key lockout
|
| 752 |
lib_logger.error(
|
| 753 |
-
f"Key
|
| 754 |
)
|
|
|
|
| 9 |
import aiofiles
|
| 10 |
import litellm
|
| 11 |
|
| 12 |
+
from .error_handler import ClassifiedError, NoAvailableKeysError, mask_credential
|
| 13 |
from .providers import PROVIDER_PLUGINS
|
| 14 |
|
| 15 |
lib_logger = logging.getLogger("rotator_library")
|
|
|
|
| 139 |
last_reset_dt is None
|
| 140 |
or last_reset_dt < reset_threshold_today <= now_utc
|
| 141 |
):
|
| 142 |
+
lib_logger.debug(f"Performing daily reset for key {mask_credential(key)}")
|
| 143 |
needs_saving = True
|
| 144 |
|
| 145 |
# Reset cooldowns
|
|
|
|
| 237 |
if lib_logger.isEnabledFor(logging.DEBUG):
|
| 238 |
total_weight = sum(weights)
|
| 239 |
weight_info = ", ".join(
|
| 240 |
+
f"{mask_credential(cred)}: w={w:.1f} ({w/total_weight*100:.1f}%)"
|
| 241 |
for (cred, _), w in zip(candidates, weights)
|
| 242 |
)
|
| 243 |
#lib_logger.debug(f"Weighted selection candidates: {weight_info}")
|
|
|
|
| 358 |
if not state["models_in_use"]:
|
| 359 |
state["models_in_use"][model] = 1
|
| 360 |
lib_logger.info(
|
| 361 |
+
f"Acquired Priority-{priority_level} Tier-1 key {mask_credential(key)} for model {model} "
|
| 362 |
f"(selection: {selection_method}, usage: {usage})"
|
| 363 |
)
|
| 364 |
return key
|
|
|
|
| 371 |
if current_count < max_concurrent:
|
| 372 |
state["models_in_use"][model] = current_count + 1
|
| 373 |
lib_logger.info(
|
| 374 |
+
f"Acquired Priority-{priority_level} Tier-2 key {mask_credential(key)} for model {model} "
|
| 375 |
f"(selection: {selection_method}, concurrent: {state['models_in_use'][model]}/{max_concurrent}, usage: {usage})"
|
| 376 |
)
|
| 377 |
return key
|
|
|
|
| 452 |
if not state["models_in_use"]:
|
| 453 |
state["models_in_use"][model] = 1
|
| 454 |
lib_logger.info(
|
| 455 |
+
f"Acquired Tier 1 key {mask_credential(key)} for model {model} "
|
| 456 |
f"(selection: {selection_method}, usage: {usage})"
|
| 457 |
)
|
| 458 |
return key
|
|
|
|
| 465 |
if current_count < max_concurrent:
|
| 466 |
state["models_in_use"][model] = current_count + 1
|
| 467 |
lib_logger.info(
|
| 468 |
+
f"Acquired Tier 2 key {mask_credential(key)} for model {model} "
|
| 469 |
f"(selection: {selection_method}, concurrent: {state['models_in_use'][model]}/{max_concurrent}, usage: {usage})"
|
| 470 |
)
|
| 471 |
return key
|
|
|
|
| 521 |
if remaining <= 0:
|
| 522 |
del state["models_in_use"][model] # Clean up when count reaches 0
|
| 523 |
lib_logger.info(
|
| 524 |
+
f"Released credential {mask_credential(key)} from model {model} "
|
| 525 |
f"(remaining concurrent: {max(0, remaining)})"
|
| 526 |
)
|
| 527 |
else:
|
| 528 |
lib_logger.warning(
|
| 529 |
+
f"Attempted to release credential {mask_credential(key)} for model {model}, but it was not in use."
|
| 530 |
)
|
| 531 |
|
| 532 |
# Notify all tasks waiting on this key's condition
|
|
|
|
| 589 |
usage, "completion_tokens", 0
|
| 590 |
) # Not present in embedding responses
|
| 591 |
lib_logger.info(
|
| 592 |
+
f"Recorded usage from response object for key {mask_credential(key)}"
|
| 593 |
)
|
| 594 |
try:
|
| 595 |
provider_name = model.split("/")[0]
|
|
|
|
| 681 |
# Rate limit errors: use retry_after if available, otherwise default to 60s
|
| 682 |
cooldown_seconds = classified_error.retry_after or 60
|
| 683 |
lib_logger.info(
|
| 684 |
+
f"Rate limit error on key {mask_credential(key)} for model {model}. "
|
| 685 |
f"Using {'provided' if classified_error.retry_after else 'default'} retry_after: {cooldown_seconds}s"
|
| 686 |
)
|
| 687 |
elif classified_error.error_type == "authentication":
|
| 688 |
# Apply a 5-minute key-level lockout for auth errors
|
| 689 |
key_data["key_cooldown_until"] = time.time() + 300
|
| 690 |
lib_logger.warning(
|
| 691 |
+
f"Authentication error on key {mask_credential(key)}. Applying 5-minute key-level lockout."
|
| 692 |
)
|
| 693 |
# Auth errors still use escalating backoff for the specific model
|
| 694 |
cooldown_seconds = 300 # 5 minutes for model cooldown
|
|
|
|
| 707 |
backoff_tiers = {1: 10, 2: 30, 3: 60, 4: 120}
|
| 708 |
cooldown_seconds = backoff_tiers.get(count, 7200) # Default to 2 hours for "spent" keys
|
| 709 |
lib_logger.warning(
|
| 710 |
+
f"Failure #{count} for key {mask_credential(key)} with model {model}. "
|
| 711 |
f"Error type: {classified_error.error_type}"
|
| 712 |
)
|
| 713 |
else:
|
|
|
|
| 715 |
if cooldown_seconds is None:
|
| 716 |
cooldown_seconds = 30 # 30s cooldown for provider issues
|
| 717 |
lib_logger.info(
|
| 718 |
+
f"Provider-level error ({classified_error.error_type}) for key {mask_credential(key)} with model {model}. "
|
| 719 |
f"NOT incrementing consecutive failures. Applying {cooldown_seconds}s cooldown."
|
| 720 |
)
|
| 721 |
|
|
|
|
| 723 |
model_cooldowns = key_data.setdefault("model_cooldowns", {})
|
| 724 |
model_cooldowns[model] = time.time() + cooldown_seconds
|
| 725 |
lib_logger.warning(
|
| 726 |
+
f"Cooldown applied for key {mask_credential(key)} with model {model}: {cooldown_seconds}s. "
|
| 727 |
f"Error type: {classified_error.error_type}"
|
| 728 |
)
|
| 729 |
|
|
|
|
| 750 |
if long_term_lockout_models >= 3:
|
| 751 |
key_data["key_cooldown_until"] = now + 300 # 5-minute key lockout
|
| 752 |
lib_logger.error(
|
| 753 |
+
f"Key {mask_credential(key)} has {long_term_lockout_models} models in long-term lockout. Applying 5-minute key-level lockout."
|
| 754 |
)
|