Spaces:

jeremierostan
/

Real-Time-Experts

Sleeping

App Files Community

jeremierostan committed on Mar 5, 2025

Commit

a64ea5d

verified ·

1 Parent(s): 4cd60b2

Update app.py

Browse files

Files changed (1) hide show

app.py +45 -34

app.py CHANGED Viewed

@@ -62,7 +62,6 @@ class GeminiHandler(AsyncStreamHandler):
         self.input_queue: asyncio.Queue = asyncio.Queue()
         self.output_queue: asyncio.Queue = asyncio.Queue()
         self.quit: asyncio.Event = asyncio.Event()
-        self.system_prompt = None
     def copy(self) -> "GeminiHandler":
         return GeminiHandler(
@@ -77,55 +76,68 @@ class GeminiHandler(AsyncStreamHandler):
             api_key, voice_name, prompt_key, custom_prompt = self.latest_args[1:]
             # Determine which prompt to use
             if prompt_key and prompt_key in SYSTEM_PROMPTS:
-                self.system_prompt = SYSTEM_PROMPTS[prompt_key]
             elif custom_prompt:
-                self.system_prompt = custom_prompt
         else:
             api_key, voice_name = None, "Puck"
-            self.system_prompt = None
         client = genai.Client(
             api_key=api_key or os.getenv("GEMINI_API_KEY"),
             http_options={"api_version": "v1alpha"},
         )
-        # Create basic config
-        config = LiveConnectConfig(
-            response_modalities=["AUDIO"],  # type: ignore
-            speech_config=SpeechConfig(
-                voice_config=VoiceConfig(
-                    prebuilt_voice_config=PrebuiltVoiceConfig(
-                        voice_name=voice_name,
-                    )
-                )
-            ),
-        )
-        # Get model reference
-        model = client.get_model("gemini-2.0-flash-exp")
-        # Apply system prompt if available
-        if self.system_prompt:
             try:
-                # First try with system_instruction method (newer API versions)
-                model = model.with_system_instructions(self.system_prompt)
-                print(f"Using system prompt via with_system_instructions: {self.system_prompt[:50]}...")
             except Exception as e:
-                print(f"Could not apply system prompt via with_system_instructions: {e}")
-                # If that fails, we'll handle it in the session
-                pass
-        # Create session
         async with client.aio.live.connect(
             model="gemini-2.0-flash-exp", config=config
         ) as session:
-            # If we couldn't set the system prompt earlier and we have one,
-            # try to send it as the first message
-            if self.system_prompt:
                 try:
-                    # Try to send system prompt as first message
-                    await session.send_message(f"SYSTEM: {self.system_prompt}\n\nPlease acknowledge this system instruction.")
                     # Wait for a response
                     async for response in session.stream_response():
                         # Just need one response to confirm it was received
@@ -134,7 +146,6 @@ class GeminiHandler(AsyncStreamHandler):
                 except Exception as e:
                     print(f"Could not send system prompt as message: {e}")
-            # Now start the audio stream
             async for audio in session.start_stream(
                 stream=self.stream(), mime_type="audio/pcm"
             ):

         self.input_queue: asyncio.Queue = asyncio.Queue()
         self.output_queue: asyncio.Queue = asyncio.Queue()
         self.quit: asyncio.Event = asyncio.Event()
     def copy(self) -> "GeminiHandler":
         return GeminiHandler(
             api_key, voice_name, prompt_key, custom_prompt = self.latest_args[1:]
             # Determine which prompt to use
+            system_prompt = None
             if prompt_key and prompt_key in SYSTEM_PROMPTS:
+                system_prompt = SYSTEM_PROMPTS[prompt_key]
             elif custom_prompt:
+                system_prompt = custom_prompt
         else:
             api_key, voice_name = None, "Puck"
+            system_prompt = None
         client = genai.Client(
             api_key=api_key or os.getenv("GEMINI_API_KEY"),
             http_options={"api_version": "v1alpha"},
         )
+        # Create config with system instructions if available
+        if system_prompt:
             try:
+                # Try with system_instruction as a list
+                config = LiveConnectConfig(
+                    response_modalities=["AUDIO"],  # type: ignore
+                    speech_config=SpeechConfig(
+                        voice_config=VoiceConfig(
+                            prebuilt_voice_config=PrebuiltVoiceConfig(
+                                voice_name=voice_name,
+                            )
+                        )
+                    ),
+                    system_instruction=[system_prompt],
+                )
             except Exception as e:
+                print(f"Error with system_instruction: {e}")
+                # Fall back to basic config without system instruction
+                config = LiveConnectConfig(
+                    response_modalities=["AUDIO"],  # type: ignore
+                    speech_config=SpeechConfig(
+                        voice_config=VoiceConfig(
+                            prebuilt_voice_config=PrebuiltVoiceConfig(
+                                voice_name=voice_name,
+                            )
+                        )
+                    ),
+                )
+        else:
+            # Basic config without system instruction
+            config = LiveConnectConfig(
+                response_modalities=["AUDIO"],  # type: ignore
+                speech_config=SpeechConfig(
+                    voice_config=VoiceConfig(
+                        prebuilt_voice_config=PrebuiltVoiceConfig(
+                            voice_name=voice_name,
+                        )
+                    )
+                ),
+            )
         async with client.aio.live.connect(
             model="gemini-2.0-flash-exp", config=config
         ) as session:
+            # If we have a system prompt but couldn't set it in the config, try sending it as a message
+            if system_prompt and 'system_instruction' not in str(config):
                 try:
+                    await session.send_message(f"SYSTEM: {system_prompt}\n\nPlease acknowledge this system instruction.")
                     # Wait for a response
                     async for response in session.stream_response():
                         # Just need one response to confirm it was received
                 except Exception as e:
                     print(f"Could not send system prompt as message: {e}")
             async for audio in session.start_stream(
                 stream=self.stream(), mime_type="audio/pcm"
             ):