Spaces:

HaveAI
/

Flare_alpha

Sleeping

App Files Community

HaveAI committed on Apr 14

Commit

0396547

verified ·

1 Parent(s): 7eb0bc1

Update app.py

Browse files

Files changed (1) hide show

app.py +33 -21

app.py CHANGED Viewed

@@ -1,8 +1,10 @@
 import gradio as gr
-# Инициализируем модель один раз вне функции
-# Это исправит ошибку при генерации ответа
-model_client = gr.load("models/moonshotai/Kimi-K2-Thinking", provider="novita")
 custom_theme = gr.themes.Soft(
     primary_hue="yellow",
@@ -13,36 +15,46 @@ custom_theme = gr.themes.Soft(
 )
 css = """
-#side-bar {
-    background-color: #ffdd00 !important;
-    padding: 15px;
-}
-.gradio-container {
-    color: white;
-}
 """
 def predict(message, history):
-    # Системная инструкция
-    system_prompt = "Тебя зовут Gemini."
-    # Объединяем системную инструкцию и сообщение
-    full_query = f"{system_prompt}\n\nПользователь: {message}"
-    # Вызываем уже созданный клиент
     try:
-        response = model_client(full_query)
-        return response
     except Exception as e:
-        return f"Ошибка связи с моделью: {str(e)}"
 with gr.Blocks(theme=custom_theme, css=css, fill_height=True) as demo:
     with gr.Sidebar(elem_id="side-bar"):
         gr.Markdown("# **FlareAI**")
         gr.Markdown("Flare — твой персональный ассистент")
-        # Кнопка входа важна, если Space требует авторизации для доступа к API
-        button = gr.LoginButton("Войти")
     gr.ChatInterface(fn=predict)
 demo.launch()

 import gradio as gr
+from huggingface_hub import InferenceClient
+import os
+# Используем InferenceClient для прямой работы с моделью
+# Он автоматически подтянет ваш токен из настроек Space
+client = InferenceClient("moonshotai/Kimi-K2-Thinking")
 custom_theme = gr.themes.Soft(
     primary_hue="yellow",
 )
 css = """
+#side-bar { background-color: #ffdd00 !important; padding: 15px; }
+.gradio-container { color: white; }
 """
 def predict(message, history):
+    # Формируем сообщения для чата
+    messages = [
+        {"role": "system", "content": "Тебя зовут Gemini."},
+    ]
+    # Добавляем историю сообщений (чтобы бот помнил контекст)
+    for human, assistant in history:
+        messages.append({"role": "user", "content": human})
+        messages.append({"role": "assistant", "content": assistant})
+    # Добавляем текущее сообщение
+    messages.append({"role": "user", "content": message})
+    response = ""
     try:
+        # Стриминг ответа (текст будет появляться постепенно)
+        for message_chunk in client.chat_completion(
+            messages,
+            max_tokens=512,
+            stream=True,
+        ):
+            token = message_chunk.choices[0].delta.content
+            if token:
+                response += token
+            yield response
     except Exception as e:
+        yield f"Произошла ошибка: {str(e)}"
 with gr.Blocks(theme=custom_theme, css=css, fill_height=True) as demo:
     with gr.Sidebar(elem_id="side-bar"):
         gr.Markdown("# **FlareAI**")
         gr.Markdown("Flare — твой персональный ассистент")
+        gr.LoginButton("Войти")
+    # Используем ChatInterface с поддержкой истории
     gr.ChatInterface(fn=predict)
 demo.launch()