Spaces:

elmerzole
/

llm-api-proxy

Paused

Mirrowel committed on Nov 18, 2025

Commit

e2c300f

1 Parent(s): dea215f

refactor(providers): enhance model discovery and deduplication logic

Restructures model loading logic across `gemini_cli`, `iflow`, and `qwen_code` providers to handle prioritized model sources more reliably.

- Introduced `env_var_ids` tracking to record model IDs defined via environment variables.
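- Environment variable models are now always included and are never deduplicated against each other, so several entries may share the same model ID (e.g. to carry different configs such as temperature).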
- Dynamic and hardcoded models are only added if their base model ID does not conflict with an ID already defined via environment variables.
- Added a helper function `extract_model_id` to standardize model ID parsing across different API response formats.
- Corrected the Qwen Code provider to strip the provider prefix from the model name (e.g. `qwen_code/qwen3-coder-plus` -> `qwen3-coder-plus`) before sending it in the chat completion API payload.

Files changed (3) hide show

src/rotator_library/providers/gemini_cli_provider.py +42 -24
src/rotator_library/providers/iflow_provider.py +37 -15
src/rotator_library/providers/qwen_code_provider.py +42 -16

src/rotator_library/providers/gemini_cli_provider.py CHANGED Viewed

@@ -722,25 +722,53 @@ class GeminiCliProvider(GeminiAuthBase, ProviderInterface):
     async def get_models(self, credential: str, client: httpx.AsyncClient) -> List[str]:
         """
         Returns a merged list of Gemini CLI models from three sources:
-        1. Environment variable models (via GEMINI_CLI_MODELS)
-        2. Hardcoded models (fallback list)
-        3. Dynamic discovery from Gemini API (if supported)
         """
         models = []
-        # Source 1: Load environment variable models
         static_models = self.model_definitions.get_all_provider_models("gemini_cli")
         if static_models:
-            models.extend(static_models)
             lib_logger.info(f"Loaded {len(static_models)} static models for gemini_cli from environment variables")
-        # Source 2: Add hardcoded models (avoiding duplicates)
-        existing_ids = [m.split("/")[-1] for m in models]
         for model_id in HARDCODED_MODELS:
-            if model_id not in existing_ids:
                 models.append(f"gemini_cli/{model_id}")
-        # Source 3: Try dynamic discovery from Gemini API
         try:
             # Get access token for API calls
             access_token = await self.get_access_token(credential)
@@ -756,27 +784,17 @@ class GeminiCliProvider(GeminiAuthBase, ProviderInterface):
             )
             response.raise_for_status()
-            # Parse dynamic models and avoid duplicates
-            existing_ids = [m.split("/")[-1] for m in models]
             dynamic_data = response.json()
             # Handle various response formats
             model_list = dynamic_data.get("models", dynamic_data.get("data", []))
             dynamic_count = 0
             for model in model_list:
-                # Extract model ID (may be in 'name' or 'id' field)
-                model_id = None
-                if isinstance(model, dict):
-                    model_id = model.get("name", model.get("id"))
-                    # Gemini models often have format "models/gemini-pro", extract just the model name
-                    if model_id and "/" in model_id:
-                        model_id = model_id.split("/")[-1]
-                else:
-                    model_id = model
-                if model_id and model_id not in existing_ids and model_id.startswith("gemini"):
                     models.append(f"gemini_cli/{model_id}")
                     dynamic_count += 1
             if dynamic_count > 0:

     async def get_models(self, credential: str, client: httpx.AsyncClient) -> List[str]:
         """
         Returns a merged list of Gemini CLI models from three sources:
+        1. Environment variable models (via GEMINI_CLI_MODELS) - ALWAYS included, take priority
+        2. Hardcoded models (fallback list) - added only if ID not in env vars
+        3. Dynamic discovery from Gemini API (if supported) - added only if ID not in env vars
+        Environment variable models always win and are never deduplicated, even if they
+        share the same ID (to support different configs like temperature, etc.)
         """
         models = []
+        env_var_ids = set()  # Track IDs from env vars to prevent hardcoded/dynamic duplicates
+        def extract_model_id(item) -> str:
+            """Extract model ID from various formats (dict, string with/without provider prefix)."""
+            if isinstance(item, dict):
+                # Dict format: extract 'name' or 'id' field
+                model_id = item.get("name") or item.get("id", "")
+                # Gemini models often have format "models/gemini-pro", extract just the model name
+                if model_id and "/" in model_id:
+                    model_id = model_id.split("/")[-1]
+                return model_id
+            elif isinstance(item, str):
+                # String format: extract ID from "provider/id" or "models/id" or just "id"
+                return item.split("/")[-1] if "/" in item else item
+            return str(item)
+        # Source 1: Load environment variable models (ALWAYS include ALL of them)
         static_models = self.model_definitions.get_all_provider_models("gemini_cli")
         if static_models:
+            for model in static_models:
+                # Extract model name from "gemini_cli/ModelName" format
+                model_name = model.split("/")[-1] if "/" in model else model
+                # Get the actual model ID from definitions (which may differ from the name)
+                model_id = self.model_definitions.get_model_id("gemini_cli", model_name)
+                # ALWAYS add env var models (no deduplication)
+                models.append(model)
+                # Track the ID to prevent hardcoded/dynamic duplicates
+                if model_id:
+                    env_var_ids.add(model_id)
             lib_logger.info(f"Loaded {len(static_models)} static models for gemini_cli from environment variables")
+        # Source 2: Add hardcoded models (only if ID not already in env vars)
         for model_id in HARDCODED_MODELS:
+            if model_id not in env_var_ids:
                 models.append(f"gemini_cli/{model_id}")
+                env_var_ids.add(model_id)
+        # Source 3: Try dynamic discovery from Gemini API (only if ID not already in env vars)
         try:
             # Get access token for API calls
             access_token = await self.get_access_token(credential)
             )
             response.raise_for_status()
             dynamic_data = response.json()
             # Handle various response formats
             model_list = dynamic_data.get("models", dynamic_data.get("data", []))
             dynamic_count = 0
             for model in model_list:
+                model_id = extract_model_id(model)
+                # Only include Gemini models that aren't already in env vars
+                if model_id and model_id not in env_var_ids and model_id.startswith("gemini"):
                     models.append(f"gemini_cli/{model_id}")
+                    env_var_ids.add(model_id)
                     dynamic_count += 1
             if dynamic_count > 0:

src/rotator_library/providers/iflow_provider.py CHANGED Viewed

@@ -57,27 +57,51 @@ class IFlowProvider(IFlowAuthBase, ProviderInterface):
     async def get_models(self, credential: str, client: httpx.AsyncClient) -> List[str]:
         """
         Returns a merged list of iFlow models from three sources:
-        1. Environment variable models (via IFLOW_MODELS)
-        2. Hardcoded models (fallback list)
-        3. Dynamic discovery from iFlow API (if supported)
         Validates OAuth credentials if applicable.
         """
         models = []
-        # Source 1: Load environment variable models
         static_models = self.model_definitions.get_all_provider_models("iflow")
         if static_models:
-            models.extend(static_models)
             lib_logger.info(f"Loaded {len(static_models)} static models for iflow from environment variables")
-        # Source 2: Add hardcoded models (avoiding duplicates)
-        existing_ids = [m.split("/")[-1] for m in models]
         for model_id in HARDCODED_MODELS:
-            if model_id not in existing_ids:
                 models.append(f"iflow/{model_id}")
-        # Source 3: Try dynamic discovery from iFlow API
         try:
             # Validate OAuth credentials and get API details
             if os.path.isfile(credential):
@@ -92,18 +116,16 @@ class IFlowProvider(IFlowAuthBase, ProviderInterface):
             )
             response.raise_for_status()
-            # Parse dynamic models and avoid duplicates
-            existing_ids = [m.split("/")[-1] for m in models]
             dynamic_data = response.json()
             # Handle both {data: [...]} and direct [...] formats
             model_list = dynamic_data.get("data", dynamic_data) if isinstance(dynamic_data, dict) else dynamic_data
             dynamic_count = 0
             for model in model_list:
-                model_id = model.get("id") if isinstance(model, dict) else model
-                if model_id and model_id not in existing_ids:
                     models.append(f"iflow/{model_id}")
                     dynamic_count += 1
             if dynamic_count > 0:

     async def get_models(self, credential: str, client: httpx.AsyncClient) -> List[str]:
         """
         Returns a merged list of iFlow models from three sources:
+        1. Environment variable models (via IFLOW_MODELS) - ALWAYS included, take priority
+        2. Hardcoded models (fallback list) - added only if ID not in env vars
+        3. Dynamic discovery from iFlow API (if supported) - added only if ID not in env vars
+        Environment variable models always win and are never deduplicated, even if they
+        share the same ID (to support different configs like temperature, etc.)
         Validates OAuth credentials if applicable.
         """
         models = []
+        env_var_ids = set()  # Track IDs from env vars to prevent hardcoded/dynamic duplicates
+        def extract_model_id(item) -> str:
+            """Extract model ID from various formats (dict, string with/without provider prefix)."""
+            if isinstance(item, dict):
+                # Dict format: extract 'id' or 'name' field
+                return item.get("id") or item.get("name", "")
+            elif isinstance(item, str):
+                # String format: extract ID from "provider/id" or just "id"
+                return item.split("/")[-1] if "/" in item else item
+            return str(item)
+        # Source 1: Load environment variable models (ALWAYS include ALL of them)
         static_models = self.model_definitions.get_all_provider_models("iflow")
         if static_models:
+            for model in static_models:
+                # Extract model name from "iflow/ModelName" format
+                model_name = model.split("/")[-1] if "/" in model else model
+                # Get the actual model ID from definitions (which may differ from the name)
+                model_id = self.model_definitions.get_model_id("iflow", model_name)
+                # ALWAYS add env var models (no deduplication)
+                models.append(model)
+                # Track the ID to prevent hardcoded/dynamic duplicates
+                if model_id:
+                    env_var_ids.add(model_id)
             lib_logger.info(f"Loaded {len(static_models)} static models for iflow from environment variables")
+        # Source 2: Add hardcoded models (only if ID not already in env vars)
         for model_id in HARDCODED_MODELS:
+            if model_id not in env_var_ids:
                 models.append(f"iflow/{model_id}")
+                env_var_ids.add(model_id)
+        # Source 3: Try dynamic discovery from iFlow API (only if ID not already in env vars)
         try:
             # Validate OAuth credentials and get API details
             if os.path.isfile(credential):
             )
             response.raise_for_status()
             dynamic_data = response.json()
             # Handle both {data: [...]} and direct [...] formats
             model_list = dynamic_data.get("data", dynamic_data) if isinstance(dynamic_data, dict) else dynamic_data
             dynamic_count = 0
             for model in model_list:
+                model_id = extract_model_id(model)
+                if model_id and model_id not in env_var_ids:
                     models.append(f"iflow/{model_id}")
+                    env_var_ids.add(model_id)
                     dynamic_count += 1
             if dynamic_count > 0:

src/rotator_library/providers/qwen_code_provider.py CHANGED Viewed

@@ -40,27 +40,51 @@ class QwenCodeProvider(QwenAuthBase, ProviderInterface):
     async def get_models(self, credential: str, client: httpx.AsyncClient) -> List[str]:
         """
         Returns a merged list of Qwen Code models from three sources:
-        1. Environment variable models (via QWEN_CODE_MODELS)
-        2. Hardcoded models (fallback list)
-        3. Dynamic discovery from Qwen API (if supported)
         Validates OAuth credentials if applicable.
         """
         models = []
-        # Source 1: Load environment variable models
         static_models = self.model_definitions.get_all_provider_models("qwen_code")
         if static_models:
-            models.extend(static_models)
             lib_logger.info(f"Loaded {len(static_models)} static models for qwen_code from environment variables")
-        # Source 2: Add hardcoded models (avoiding duplicates)
-        existing_ids = [m.split("/")[-1] for m in models]
         for model_id in HARDCODED_MODELS:
-            if model_id not in existing_ids:
                 models.append(f"qwen_code/{model_id}")
-        # Source 3: Try dynamic discovery from Qwen Code API
         try:
             # Validate OAuth credentials and get API details
             if os.path.isfile(credential):
@@ -75,18 +99,16 @@ class QwenCodeProvider(QwenAuthBase, ProviderInterface):
             )
             response.raise_for_status()
-            # Parse dynamic models and avoid duplicates
-            existing_ids = [m.split("/")[-1] for m in models]
             dynamic_data = response.json()
             # Handle both {data: [...]} and direct [...] formats
             model_list = dynamic_data.get("data", dynamic_data) if isinstance(dynamic_data, dict) else dynamic_data
             dynamic_count = 0
             for model in model_list:
-                model_id = model.get("id") if isinstance(model, dict) else model
-                if model_id and model_id not in existing_ids:
                     models.append(f"qwen_code/{model_id}")
                     dynamic_count += 1
             if dynamic_count > 0:
@@ -342,8 +364,12 @@ class QwenCodeProvider(QwenAuthBase, ProviderInterface):
             """Prepares and makes the actual API call."""
             api_base, access_token = await self.get_api_details(credential_path)
             # Build clean payload with only supported parameters
-            payload = self._build_request_payload(**kwargs)
             headers = {
                 "Authorization": f"Bearer {access_token}",

     async def get_models(self, credential: str, client: httpx.AsyncClient) -> List[str]:
         """
         Returns a merged list of Qwen Code models from three sources:
+        1. Environment variable models (via QWEN_CODE_MODELS) - ALWAYS included, take priority
+        2. Hardcoded models (fallback list) - added only if ID not in env vars
+        3. Dynamic discovery from Qwen API (if supported) - added only if ID not in env vars
+        Environment variable models always win and are never deduplicated, even if they
+        share the same ID (to support different configs like temperature, etc.)
         Validates OAuth credentials if applicable.
         """
         models = []
+        env_var_ids = set()  # Track IDs from env vars to prevent hardcoded/dynamic duplicates
+        def extract_model_id(item) -> str:
+            """Extract model ID from various formats (dict, string with/without provider prefix)."""
+            if isinstance(item, dict):
+                # Dict format: extract 'id' or 'name' field
+                return item.get("id") or item.get("name", "")
+            elif isinstance(item, str):
+                # String format: extract ID from "provider/id" or just "id"
+                return item.split("/")[-1] if "/" in item else item
+            return str(item)
+        # Source 1: Load environment variable models (ALWAYS include ALL of them)
         static_models = self.model_definitions.get_all_provider_models("qwen_code")
         if static_models:
+            for model in static_models:
+                # Extract model name from "qwen_code/ModelName" format
+                model_name = model.split("/")[-1] if "/" in model else model
+                # Get the actual model ID from definitions (which may differ from the name)
+                model_id = self.model_definitions.get_model_id("qwen_code", model_name)
+                # ALWAYS add env var models (no deduplication)
+                models.append(model)
+                # Track the ID to prevent hardcoded/dynamic duplicates
+                if model_id:
+                    env_var_ids.add(model_id)
             lib_logger.info(f"Loaded {len(static_models)} static models for qwen_code from environment variables")
+        # Source 2: Add hardcoded models (only if ID not already in env vars)
         for model_id in HARDCODED_MODELS:
+            if model_id not in env_var_ids:
                 models.append(f"qwen_code/{model_id}")
+                env_var_ids.add(model_id)
+        # Source 3: Try dynamic discovery from Qwen Code API (only if ID not already in env vars)
         try:
             # Validate OAuth credentials and get API details
             if os.path.isfile(credential):
             )
             response.raise_for_status()
             dynamic_data = response.json()
             # Handle both {data: [...]} and direct [...] formats
             model_list = dynamic_data.get("data", dynamic_data) if isinstance(dynamic_data, dict) else dynamic_data
             dynamic_count = 0
             for model in model_list:
+                model_id = extract_model_id(model)
+                if model_id and model_id not in env_var_ids:
                     models.append(f"qwen_code/{model_id}")
+                    env_var_ids.add(model_id)
                     dynamic_count += 1
             if dynamic_count > 0:
             """Prepares and makes the actual API call."""
             api_base, access_token = await self.get_api_details(credential_path)
+            # Strip provider prefix from model name (e.g., "qwen_code/qwen3-coder-plus" -> "qwen3-coder-plus")
+            model_name = model.split('/')[-1]
+            kwargs_with_stripped_model = {**kwargs, 'model': model_name}
             # Build clean payload with only supported parameters
+            payload = self._build_request_payload(**kwargs_with_stripped_model)
             headers = {
                 "Authorization": f"Bearer {access_token}",