quentinbch committed on
Commit
17036d1
·
verified ·
1 Parent(s): 7975ec5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -4
app.py CHANGED
@@ -23,7 +23,6 @@ transcriber = pipeline(
23
 
24
  # --- 2. Client LLM ---
25
  client = InferenceClient(
26
- provider="fireworks-ai",
27
  token=HF_TOKEN
28
  )
29
 
@@ -51,16 +50,15 @@ def query_llm(text):
51
  return "Je n'ai rien entendu."
52
 
53
  try:
54
- # Prompt système pour guider le modèle à être concis (mieux pour le TTS)
55
  messages = [
56
  {"role": "system", "content": "You are a helpful vocal assistant. Keep your answers short and concise suitable for speech synthesis."},
57
  {"role": "user", "content": text}
58
  ]
59
 
60
  completion = client.chat.completions.create(
61
- model="meta-llama/Meta-Llama-3.1-8B-Instruct",
62
  messages=messages,
63
- max_tokens=150 # Limite pour éviter une synthèse trop longue
64
  )
65
  return completion.choices[0].message.content
66
  except Exception as e:
 
23
 
24
  # --- 2. Client LLM ---
25
  client = InferenceClient(
 
26
  token=HF_TOKEN
27
  )
28
 
 
50
  return "Je n'ai rien entendu."
51
 
52
  try:
 
53
  messages = [
54
  {"role": "system", "content": "You are a helpful vocal assistant. Keep your answers short and concise suitable for speech synthesis."},
55
  {"role": "user", "content": text}
56
  ]
57
 
58
  completion = client.chat.completions.create(
59
+ model="meta-llama/Meta-Llama-3.1-8B-Instruct",
60
  messages=messages,
61
+ max_tokens=150
62
  )
63
  return completion.choices[0].message.content
64
  except Exception as e: