Spaces:

HaveAI
/

Flare_alpha

Sleeping

App Files Community

HaveAI committed on Apr 14

Commit

809c7df

verified ·

1 Parent(s): 0396547

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -31

app.py CHANGED Viewed

@@ -1,10 +1,8 @@
 import gradio as gr
-from huggingface_hub import InferenceClient
-import os
-# Используем InferenceClient для прямой работы с моделью
-# Он автоматически подтянет ваш токен из настроек Space
-client = InferenceClient("moonshotai/Kimi-K2-Thinking")
 custom_theme = gr.themes.Soft(
     primary_hue="yellow",
@@ -20,41 +18,31 @@ css = """
 """
 def predict(message, history):
-    # Формируем сообщения для чата
-    messages = [
-        {"role": "system", "content": "Тебя зовут Gemini."},
-    ]
-    # Добавляем историю сообщений (чтобы бот помнил контекст)
-    for human, assistant in history:
-        messages.append({"role": "user", "content": human})
-        messages.append({"role": "assistant", "content": assistant})
-    # Добавляем текущее сообщение
-    messages.append({"role": "user", "content": message})
-    response = ""
     try:
-        # Стриминг ответа (текст будет появляться постепенно)
-        for message_chunk in client.chat_completion(
-            messages,
-            max_tokens=512,
-            stream=True,
-        ):
-            token = message_chunk.choices[0].delta.content
-            if token:
-                response += token
-            yield response
     except Exception as e:
-        yield f"Произошла ошибка: {str(e)}"
-with gr.Blocks(theme=custom_theme, css=css, fill_height=True) as demo:
     with gr.Sidebar(elem_id="side-bar"):
         gr.Markdown("# **FlareAI**")
         gr.Markdown("Flare — твой персональный ассистент")
         gr.LoginButton("Войти")
-    # Используем ChatInterface с поддержкой истории
     gr.ChatInterface(fn=predict)
 demo.launch()

 import gradio as gr
+# Загружаем модель один раз
+# Это самый стабильный способ для бесплатных Space
+model = gr.load("models/moonshotai/Kimi-K2-Thinking", provider="novita")
 custom_theme = gr.themes.Soft(
     primary_hue="yellow",
 """
 def predict(message, history):
+    # Системный промпт
+    system_instr = "Тебя зовут Gemini. "
+    full_prompt = system_instr + message
     try:
+        # Вызываем модель
+        response = model(full_prompt)
+        # Проверка: если пришел список, берем первый элемент
+        if isinstance(response, list):
+            return response[0]
+        # Если пришел словарь (бывает в некоторых API)
+        elif isinstance(response, dict):
+            return response.get("generated_text", str(response))
+        return response
     except Exception as e:
+        return f"Ошибка: {str(e)}. Попробуй подождать 10 секунд и отправить снова."
+with gr.Blocks(theme=custom_theme, css=css) as demo:
     with gr.Sidebar(elem_id="side-bar"):
         gr.Markdown("# **FlareAI**")
         gr.Markdown("Flare — твой персональный ассистент")
         gr.LoginButton("Войти")
     gr.ChatInterface(fn=predict)
 demo.launch()