Spaces:

cdpearlman
/

LLMVis

Sleeping

App Files Files Community

cdpearlman Cursor committed on Feb 3

Commit

ddd91a5

1 Parent(s): 689669f

Migrate from google-generativeai to google-genai SDK

Browse files

Co-authored-by: Cursor <cursoragent@cursor.com>

Files changed (4) hide show

requirements.txt +1 -1
tests/test_gemini_connection.py +25 -8
todo.md +13 -0
utils/gemini_client.py +35 -24

requirements.txt CHANGED Viewed

@@ -18,4 +18,4 @@ numpy>=1.24.0
 pytest>=7.0.0
 # AI Chatbot dependencies
-google-generativeai>=0.8.0

 pytest>=7.0.0
 # AI Chatbot dependencies
+google-genai>=1.0.0

tests/test_gemini_connection.py CHANGED Viewed

@@ -4,8 +4,7 @@ Tests for Gemini API connection.
 Verifies that the API key is configured correctly and can connect
 to the Gemini API without consuming generation tokens.
-Note: These tests avoid importing utils.gemini_client where possible
-to prevent slow tensorflow/jax imports from the google-generativeai package.
 """
 import os
@@ -33,13 +32,13 @@ class TestGeminiConnection:
         Test API connectivity by listing available models.
         This verifies the API key is valid without consuming generation tokens.
         """
-        import google.generativeai as genai
         api_key = os.environ.get("GEMINI_API_KEY")
-        genai.configure(api_key=api_key)
         # List models - this is a read-only API call that validates the key
-        models = list(genai.list_models())
         assert len(models) > 0, "No models returned - API key may be invalid"
@@ -51,12 +50,12 @@ class TestGeminiConnection:
     @pytest.mark.timeout(30)
     def test_flash_model_available(self):
         """Verify a Gemini Flash model (used by default) is available."""
-        import google.generativeai as genai
         api_key = os.environ.get("GEMINI_API_KEY")
-        genai.configure(api_key=api_key)
-        models = list(genai.list_models())
         model_names = [m.name for m in models]
         # Check for flash model variants (our default is gemini-2.0-flash)
@@ -65,3 +64,21 @@ class TestGeminiConnection:
             f"No Gemini Flash models available. "
             f"Available models: {model_names[:10]}..."
         )

 Verifies that the API key is configured correctly and can connect
 to the Gemini API without consuming generation tokens.
+Uses the new google-genai SDK.
 """
 import os
         Test API connectivity by listing available models.
         This verifies the API key is valid without consuming generation tokens.
         """
+        from google import genai
         api_key = os.environ.get("GEMINI_API_KEY")
+        client = genai.Client(api_key=api_key)
         # List models - this is a read-only API call that validates the key
+        models = list(client.models.list())
         assert len(models) > 0, "No models returned - API key may be invalid"
     @pytest.mark.timeout(30)
     def test_flash_model_available(self):
         """Verify a Gemini Flash model (used by default) is available."""
+        from google import genai
         api_key = os.environ.get("GEMINI_API_KEY")
+        client = genai.Client(api_key=api_key)
+        models = list(client.models.list())
         model_names = [m.name for m in models]
         # Check for flash model variants (our default is gemini-2.0-flash)
             f"No Gemini Flash models available. "
             f"Available models: {model_names[:10]}..."
         )
+    @pytest.mark.timeout(30)
+    def test_embedding_model_available(self):
+        """Verify the embedding model is available."""
+        from google import genai
+        api_key = os.environ.get("GEMINI_API_KEY")
+        client = genai.Client(api_key=api_key)
+        models = list(client.models.list())
+        model_names = [m.name for m in models]
+        # Check for embedding model (gemini-embedding-001)
+        has_embedding_model = any("embedding" in name.lower() for name in model_names)
+        assert has_embedding_model, (
+            f"No embedding models available. "
+            f"Available models: {model_names[:10]}..."
+        )

todo.md CHANGED Viewed

@@ -150,3 +150,16 @@
 - [x] Create `tests/test_gemini_connection.py` to verify API key connectivity
 - [x] Tests verify: API key is set, can list models, flash model available
 - Note: On Hugging Face Spaces, set `GEMINI_API_KEY` in Repository Secrets

 - [x] Create `tests/test_gemini_connection.py` to verify API key connectivity
 - [x] Tests verify: API key is set, can list models, flash model available
 - Note: On Hugging Face Spaces, set `GEMINI_API_KEY` in Repository Secrets
+## Completed: Migrate to New Google GenAI SDK
+- [x] Update `requirements.txt`: `google-generativeai` → `google-genai>=1.0.0`
+- [x] Rewrite `utils/gemini_client.py` using new centralized Client architecture
+  - New import: `from google import genai` and `from google.genai import types`
+  - Client-based API: `client = genai.Client(api_key=...)`
+  - Chat via: `client.chats.create(model=..., config=..., history=...)`
+  - Embeddings via: `client.models.embed_content(model=..., contents=..., config=...)`
+- [x] Update embedding model: `models/text-embedding-004` → `gemini-embedding-001`
+- [x] Update `tests/test_gemini_connection.py` to use new SDK
+- [x] All 4 connection tests pass
+- [x] Verified: embeddings work (3072 dimensions), chat generation works

utils/gemini_client.py CHANGED Viewed

@@ -3,16 +3,19 @@ Gemini API Client
 Wrapper for Google Gemini API providing text generation and embedding capabilities
 for the AI chatbot feature.
 """
 import os
 from typing import List, Dict, Optional
-import google.generativeai as genai
 # Default model configuration
 DEFAULT_GENERATION_MODEL = "gemini-2.0-flash"
-DEFAULT_EMBEDDING_MODEL = "models/text-embedding-004"
 # System prompt for the chatbot
 SYSTEM_PROMPT = """You are a helpful AI assistant integrated into a Transformer Explanation Dashboard.
@@ -45,23 +48,19 @@ class GeminiClient:
         """
         self.api_key = api_key or os.environ.get("GEMINI_API_KEY")
         self._initialized = False
-        self._generation_model = None
-        self._embedding_model = None
         if self.api_key:
             self._initialize()
     def _initialize(self):
-        """Initialize the Gemini API with the API key."""
         if not self.api_key:
             return
         try:
-            genai.configure(api_key=self.api_key)
-            self._generation_model = genai.GenerativeModel(
-                model_name=DEFAULT_GENERATION_MODEL,
-                system_instruction=SYSTEM_PROMPT
-            )
             self._initialized = True
         except Exception as e:
             print(f"Error initializing Gemini client: {e}")
@@ -98,26 +97,32 @@ class GeminiClient:
             # Build the full prompt with context
             full_message = self._build_prompt(user_message, rag_context, dashboard_context)
-            # Convert chat history to Gemini format
             history = []
             if chat_history:
                 for msg in chat_history[-10:]:  # Keep last 10 messages for context
                     role = "user" if msg.get("role") == "user" else "model"
                     history.append({
                         "role": role,
-                        "parts": [msg.get("content", "")]
                     })
-            # Create chat session and send message
-            chat = self._generation_model.start_chat(history=history)
-            response = chat.send_message(full_message)
             return response.text
         except Exception as e:
             error_msg = str(e)
             if "quota" in error_msg.lower() or "rate" in error_msg.lower():
-                return "The AI service is currently rate limited. Please try again in a moment."
             elif "invalid" in error_msg.lower() and "key" in error_msg.lower():
                 return "Invalid API key. Please check your GEMINI_API_KEY configuration."
             else:
@@ -187,12 +192,15 @@ class GeminiClient:
             return None
         try:
-            result = genai.embed_content(
                 model=DEFAULT_EMBEDDING_MODEL,
-                content=text,
-                task_type="retrieval_document"
             )
-            return result['embedding']
         except Exception as e:
             print(f"Embedding error: {e}")
             return None
@@ -211,12 +219,15 @@ class GeminiClient:
             return None
         try:
-            result = genai.embed_content(
                 model=DEFAULT_EMBEDDING_MODEL,
-                content=query,
-                task_type="retrieval_query"
             )
-            return result['embedding']
         except Exception as e:
             print(f"Query embedding error: {e}")
             return None

 Wrapper for Google Gemini API providing text generation and embedding capabilities
 for the AI chatbot feature.
+Uses the new google-genai SDK (migrated from deprecated google-generativeai).
 """
 import os
 from typing import List, Dict, Optional
+from google import genai
+from google.genai import types
 # Default model configuration
 DEFAULT_GENERATION_MODEL = "gemini-2.0-flash"
+DEFAULT_EMBEDDING_MODEL = "gemini-embedding-001"
 # System prompt for the chatbot
 SYSTEM_PROMPT = """You are a helpful AI assistant integrated into a Transformer Explanation Dashboard.
         """
         self.api_key = api_key or os.environ.get("GEMINI_API_KEY")
         self._initialized = False
+        self._client = None
         if self.api_key:
             self._initialize()
     def _initialize(self):
+        """Initialize the Gemini API client."""
         if not self.api_key:
             return
         try:
+            # Create the centralized client object (new SDK architecture)
+            self._client = genai.Client(api_key=self.api_key)
             self._initialized = True
         except Exception as e:
             print(f"Error initializing Gemini client: {e}")
             # Build the full prompt with context
             full_message = self._build_prompt(user_message, rag_context, dashboard_context)
+            # Convert chat history to new SDK format
             history = []
             if chat_history:
                 for msg in chat_history[-10:]:  # Keep last 10 messages for context
                     role = "user" if msg.get("role") == "user" else "model"
                     history.append({
                         "role": role,
+                        "parts": [{"text": msg.get("content", "")}]
                     })
+            # Create chat session with system instruction and send message
+            chat = self._client.chats.create(
+                model=DEFAULT_GENERATION_MODEL,
+                config=types.GenerateContentConfig(
+                    system_instruction=SYSTEM_PROMPT,
+                ),
+                history=history
+            )
+            response = chat.send_message(message=full_message)
             return response.text
         except Exception as e:
             error_msg = str(e)
             if "quota" in error_msg.lower() or "rate" in error_msg.lower():
+                return f"The AI service is currently rate limited. Please try again in a moment. {error_msg}"
             elif "invalid" in error_msg.lower() and "key" in error_msg.lower():
                 return "Invalid API key. Please check your GEMINI_API_KEY configuration."
             else:
             return None
         try:
+            result = self._client.models.embed_content(
                 model=DEFAULT_EMBEDDING_MODEL,
+                contents=text,
+                config=types.EmbedContentConfig(
+                    task_type="RETRIEVAL_DOCUMENT"
+                )
             )
+            # New SDK returns embeddings as a list, get the first one
+            return result.embeddings[0].values
         except Exception as e:
             print(f"Embedding error: {e}")
             return None
             return None
         try:
+            result = self._client.models.embed_content(
                 model=DEFAULT_EMBEDDING_MODEL,
+                contents=query,
+                config=types.EmbedContentConfig(
+                    task_type="RETRIEVAL_QUERY"
+                )
             )
+            # New SDK returns embeddings as a list, get the first one
+            return result.embeddings[0].values
         except Exception as e:
             print(f"Query embedding error: {e}")
             return None