Izzak

Sleeping

App Files Files Community

caarleexx committed on Dec 9, 2025

Commit

5d0198d

verified ·

1 Parent(s): 4cc493f

Update app.py

Browse files

Files changed (1) hide show

app.py +76 -13

app.py CHANGED Viewed

@@ -1,16 +1,79 @@
 import gradio as gr
-import groq_gradio
 import os
-# Initialize Groq client
-client = Groq(
-    api_key=os.environ.get("GROQ_API_KEY")
-)
-gr.load(
-    name='llama-3.3-70b-versatile', # The specific model powered by Groq to use
-    src=groq_gradio.registry, # Tells Gradio to use our custom interface registry as the source
-    title='Groq-Gradio Integration', # The title shown at the top of our UI
-    description="Chat with the Llama 3.3 70B model powered by Groq.", # Subtitle
-    examples=["Explain quantum gravity to a 5-year old.", "How many R are there in the word Strawberry?"] # Pre-written prompts users can click to try
-).launch() # Creates and starts the web server!

 import gradio as gr
+from openai import OpenAI
 import os
+from groq import Groq
+# Configure the API keys. Using Hugging Face secrets is strongly recommended;
+# when running locally, make sure the environment variables are set.
+# If GROQ_API_KEY is not set, the placeholder below is used instead. Pasting a
+# real key there is possible but not recommended for security reasons.
+groq_api_key = os.environ.get('GROQ_API_KEY', "SUA_CHAVE_DE_API_DA_GROQ_AQUI")
+client = Groq(api_key=groq_api_key)
+# The openai library is used for the Whisper transcription.
+openai_client = OpenAI()
+def transcribe_audio(audio_path):
+    """Transcribe an audio file using OpenAI's Whisper API.
+
+    Args:
+        audio_path: Path of the audio file to transcribe, or None.
+
+    Returns:
+        The transcribed text, or an empty string when audio_path is None.
+    """
+    if audio_path is not None:
+        # Binary mode: the raw file handle is passed to the transcription call.
+        with open(audio_path, "rb") as recording:
+            result = openai_client.audio.transcriptions.create(
+                file=recording,
+                model="whisper-1",
+            )
+        return result.text
+    # Nothing to transcribe.
+    return ""
+def get_llm_response(user_input):
+    """Get an answer to the user's text from a chat model via the Groq API.
+
+    Args:
+        user_input: The user's question as text (here, the transcription).
+
+    Returns:
+        The content of the first completion choice, or a fixed prompt asking
+        for a question when the input is None, empty, or only whitespace.
+    """
+    # Strip before testing so a whitespace-only transcription is treated like
+    # an empty one instead of being sent to the model as a blank prompt.
+    if not user_input or not user_input.strip():
+        return "Por favor, faça uma pergunta."
+    chat_completion = client.chat.completions.create(
+        messages=[
+            {
+                "role": "system",
+                "content": "Você é um assistente prestativo."
+            },
+            {
+                "role": "user",
+                "content": user_input,
+            }
+        ],
+        # "llama3-8b-8192" has been retired by Groq; "llama-3.1-8b-instant" is
+        # its suggested replacement.
+        # NOTE(review): confirm against Groq's current model/deprecation list.
+        model="llama-3.1-8b-instant",
+    )
+    return chat_completion.choices[0].message.content
+# Build the Gradio interface.
+with gr.Blocks() as demo:
+    gr.Markdown("# Detecção Automática de Voz com Gradio e Groq")
+    gr.Markdown("Fale no microfone e o aplicativo irá transcrever e responder automaticamente.")
+    with gr.Row():
+        audio_input = gr.Audio(
+            sources=["microphone"],
+            type="filepath",
+            label="Entrada de Áudio",
+        )
+        transcribed_text = gr.Textbox(label="Texto Transcrito")
+    with gr.Row():
+        llm_response = gr.Textbox(label="Resposta do LLM")
+    # Wire up the events: when a recording stops, transcribe it into the
+    # transcription box, then feed that text to the LLM and show its answer.
+    transcription_done = audio_input.stop_recording(
+        fn=transcribe_audio,
+        inputs=audio_input,
+        outputs=transcribed_text,
+    )
+    transcription_done.then(
+        fn=get_llm_response,
+        inputs=transcribed_text,
+        outputs=llm_response,
+    )
+# Launch the Gradio interface.
+demo.launch()