import os import time from typing import Dict, List, Optional, Union import requests from loguru import logger as eval_logger from ..protocol import Request, Response, ServerConfig from .openai import OpenAIProvider # Import OpenAIJudge for shared methods class AzureOpenAIProvider(OpenAIProvider): """Azure OpenAI implementation of the Judge interface""" def __init__(self, config: Optional[ServerConfig] = None): super().__init__(config) self.api_key = os.getenv("AZURE_API_KEY", "") self.api_endpoint = os.getenv("AZURE_ENDPOINT", "") self.api_version = os.getenv("API_VERSION", "2024-02-15-preview") # Initialize Azure OpenAI client try: from openai import AzureOpenAI self.client = AzureOpenAI(api_key=self.api_key, azure_endpoint=self.api_endpoint, api_version=self.api_version) self.use_client = True except ImportError: eval_logger.warning("Azure OpenAI client not available, falling back to requests") self.use_client = False def is_available(self) -> bool: return bool(self.api_key and self.api_endpoint) def evaluate(self, request: Request) -> Response: """Evaluate using Azure OpenAI API""" if not self.is_available(): raise ValueError("Azure OpenAI API credentials not configured") config = request.config or self.config messages = self.prepare_messages(request) # Handle images if present if request.images: messages = self._add_images_to_messages(messages, request.images) # Prepare payload payload = { "model": config.model_name, "messages": messages, "temperature": config.temperature, "max_tokens": config.max_tokens, } if config.top_p is not None: payload["top_p"] = config.top_p if config.response_format == "json": payload["response_format"] = {"type": "json_object"} # Make API call with retries for attempt in range(config.num_retries): try: if self.use_client: response = self.client.chat.completions.create(**payload) content = response.choices[0].message.content model_used = response.model usage = response.usage.model_dump() if hasattr(response.usage, "model_dump") else None raw_response = response else: response = self._make_request(payload, config.timeout) content = response["choices"][0]["message"]["content"] model_used = response["model"] usage = response.get("usage") raw_response = response return Response(content=content.strip(), model_used=model_used, usage=usage, raw_response=raw_response) except Exception as e: eval_logger.warning(f"Attempt {attempt + 1}/{config.num_retries} failed: {str(e)}") if attempt < config.num_retries - 1: time.sleep(config.retry_delay) else: eval_logger.error(f"All {config.num_retries} attempts failed") raise def _make_request(self, payload: Dict, timeout: int) -> Dict: """Make HTTP request to Azure OpenAI API""" headers = { "api-key": self.api_key, "Content-Type": "application/json", } # Construct the full URL deployment_name = payload["model"] url = f"{self.api_endpoint}/openai/deployments/{deployment_name}/chat/completions?api-version={self.api_version}" response = requests.post(url, headers=headers, json=payload, timeout=timeout) response.raise_for_status() return response.json()