| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| |
|
| | import os |
| | import logging |
| | import json |
| | from pathlib import Path |
| | import gradio as gr |
| | from PIL import Image |
| | import google.generativeai as genai |
| | import re |
| | from typing import List, Union, Any |
| |
|
| | logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s') |
| | logger = logging.getLogger(__name__) |
| |
|
| | def robust_json_parser(raw_text: str) -> dict: |
| | """ |
| | Parses a JSON object from a string that might contain extra text, |
| | such as Markdown code blocks from an LLM's response. |
| | """ |
| | clean_text = raw_text.strip() |
| | try: |
| | match = re.search(r'```json\s*(\{.*?\})\s*```', clean_text, re.DOTALL) |
| | if match: |
| | json_str = match.group(1) |
| | return json.loads(json_str) |
| | |
| | start_index = clean_text.find('{') |
| | end_index = clean_text.rfind('}') |
| | if start_index != -1 and end_index != -1 and end_index > start_index: |
| | json_str = clean_text[start_index : end_index + 1] |
| | return json.loads(json_str) |
| | else: |
| | raise ValueError("No valid JSON object could be found in the AI's response.") |
| | except json.JSONDecodeError as e: |
| | logger.error(f"Failed to decode JSON. The AI returned the following text:\n---\n{raw_text}\n---") |
| | raise ValueError(f"The AI returned an invalid JSON format: {e}") |
| |
|
| | class GeminiManager: |
| | """ |
| | Manages raw interactions with the Google Gemini API. |
| | """ |
| | def __init__(self): |
| | self.api_key = os.environ.get("GEMINI_API_KEY") |
| | if self.api_key: |
| | genai.configure(api_key=self.api_key) |
| | self.model = genai.GenerativeModel('gemini-2.0-flash') |
| | logger.info("GeminiManager (Communication Layer) initialized successfully.") |
| | else: |
| | self.model = None |
| | logger.warning("Gemini API key not found. GeminiManager disabled.") |
| | |
| | def _check_model(self): |
| | """Raises an error if the Gemini API is not configured.""" |
| | if not self.model: |
| | raise gr.Error("The Google Gemini API key is not configured (GEMINI_API_KEY).") |
| |
|
| | def _generate_content(self, prompt_parts: List[Any]) -> str: |
| | """Internal method to make the API call.""" |
| | self._check_model() |
| | logger.info("Calling Gemini API...") |
| | response = self.model.generate_content(prompt_parts) |
| | logger.info(f"Gemini responded with raw text: {response.text}") |
| | return response.text |
| |
|
| | def get_raw_text(self, prompt_parts: List[Any]) -> str: |
| | """ |
| | Sends a prompt to the Gemini API and returns the raw text response. |
| | |
| | Args: |
| | prompt_parts (List[Any]): A list containing strings and/or PIL.Image objects. |
| | |
| | Returns: |
| | str: The raw string response from the API. |
| | """ |
| | try: |
| | return self._generate_content(prompt_parts) |
| | except Exception as e: |
| | logger.error(f"Gemini API call failed: {e}", exc_info=True) |
| | raise gr.Error(f"Gemini API communication failed: {e}") |
| |
|
| | def get_json_object(self, prompt_parts: List[Any]) -> dict: |
| | """ |
| | Sends a prompt to the Gemini API, expects a JSON response, parses it, and returns a dictionary. |
| | |
| | Args: |
| | prompt_parts (List[Any]): A list containing strings and/or PIL.Image objects. |
| | |
| | Returns: |
| | dict: The parsed JSON object from the API response. |
| | """ |
| | try: |
| | raw_response = self._generate_content(prompt_parts) |
| | return robust_json_parser(raw_response) |
| | except Exception as e: |
| | logger.error(f"Gemini API call or JSON parsing failed: {e}", exc_info=True) |
| | raise gr.Error(f"Gemini API communication or response parsing failed: {e}") |
| |
|
| | |
| | gemini_manager_singleton = GeminiManager() |