Spaces:

Yermek68
/

eroha-agentapi

Sleeping

App Files Files Community

Yermek68 committed on 2 days ago

Commit

c487e9b

verified ·

1 Parent(s): b4ca792

Update app.py

Browse files

Files changed (1) hide show

app.py +48 -37

app.py CHANGED Viewed

@@ -3,9 +3,9 @@ import time
 import gradio as gr
 import pandas as pd
 import matplotlib.pyplot as plt
-from io import BytesIO
 import base64
-from huggingface_hub import InferenceClient
 from core.dashboard import ErohaDashboard
 from core.intelligence import update_memory, summarize_context
@@ -19,46 +19,59 @@ from core.model_selector import choose_model
 HF_TOKEN = os.getenv("HF_TOKEN", "")
 LOG_FILE = "logs/history.csv"
 os.makedirs("logs", exist_ok=True)
 dashboard = ErohaDashboard()
 # ==============================
-# 🔍 Определение типа подключения
 # ==============================
-def create_inference_client(model_id):
     """
-    Автоматически выбирает нужный тип API (Router / Direct / Local)
     """
-    # Router API
-    if "router.huggingface.co" in model_id or model_id.lower() == "router":
-        print("🔁 Router API Mode активирован")
-        return InferenceClient(base_url="https://router.huggingface.co", token=HF_TOKEN)
-    # Local API
-    elif model_id.startswith("http://") or model_id.startswith("https://"):
-        print("🖥️ Local/Custom API Mode активирован:", model_id)
-        return InferenceClient(base_url=model_id, token=HF_TOKEN)
-    # Direct Model
-    else:
-        print("⚙️ Direct Model Mode активирован:", model_id)
-        return InferenceClient(model=model_id, token=HF_TOKEN)
 # ==============================
-# 🧠 Генерация ответа
 # ==============================
 def generate_response(user_input):
     try:
         start = time.time()
         prefs = analyze_user_input(user_input)
         model_id = choose_model(user_input)
-        client = create_inference_client(model_id)
-        result = client.text_generation(
-            user_input,
-            max_new_tokens=600,
-            temperature=0.7,
-        )
         check = evaluate_answer(result)
         improved = improve_answer(result)
@@ -82,7 +95,7 @@ def generate_response(user_input):
         summary = (
             f"🧠 **Модель:** `{model_id}`\n"
             f"⚡ **Время отклика:** {response_time} сек\n"
-            f"🔍 **Качество:** {check['result']}\n"
             f"{'; '.join(check['feedback']) if check['feedback'] else '✅ Всё отлично'}\n\n"
             f"{context}"
         )
@@ -97,11 +110,10 @@ def generate_response(user_input):
 # ==============================
 def generate_chart():
     if not os.path.exists(LOG_FILE):
-        return "⚠️ Нет данных для отображения."
     df = pd.read_csv(LOG_FILE)
     if df.empty:
         return "⚠️ История пуста."
     df["time"] = pd.to_datetime(df["time"])
     df = df.tail(50)
@@ -109,9 +121,8 @@ def generate_chart():
     plt.plot(df["time"], df["response_time"], marker="o", linewidth=1.5)
     plt.title("⚡ Скорость отклика моделей (последние 50 запросов)")
     plt.xlabel("Время")
-    plt.ylabel("Время отклика (сек)")
     plt.grid(True)
     buffer = BytesIO()
     plt.savefig(buffer, format="png", bbox_inches="tight")
     buffer.seek(0)
@@ -125,14 +136,14 @@ def show_dashboard():
     return metrics_text, df, chart_html
 # ==============================
-# 🎨 Gradio Interface
 # ==============================
-with gr.Blocks(title="Eroha AgentAPI v5.5 — Adaptive AutoRouter", theme="soft") as app:
-    gr.Markdown("# 🤖 Eroha AgentAPI v5.5 — Guru Edition (AutoRouter Adaptive Core)")
-    gr.Markdown("**Интеллект + самообучение + аналитика + автоопределение API** 🧩")
     with gr.Tab("💬 Agent Chat"):
-        user_input = gr.Textbox(label="Введите запрос", placeholder="Например: объясни, как работает нейронная сеть, используя метафоры.")
         output_box = gr.Textbox(label="Ответ", lines=15)
         submit_btn = gr.Button("🚀 Отправить")
         submit_btn.click(fn=generate_response, inputs=user_input, outputs=output_box)

 import gradio as gr
 import pandas as pd
 import matplotlib.pyplot as plt
 import base64
+from io import BytesIO
+import requests
 from core.dashboard import ErohaDashboard
 from core.intelligence import update_memory, summarize_context
 HF_TOKEN = os.getenv("HF_TOKEN", "")
 LOG_FILE = "logs/history.csv"
 os.makedirs("logs", exist_ok=True)
 dashboard = ErohaDashboard()
 # ==============================
+# 🔁 Автоматический Router с Failover
 # ==============================
def _extract_generated_text(payload):
    """Return the ``generated_text`` field from a decoded inference response.

    Accepts the list-of-dicts shape (``[{"generated_text": ...}]``) as well as
    a bare dict carrying the same key.

    Raises:
        RuntimeError: if the payload has any other shape. Raising a readable
            error here keeps an opaque ``KeyError``/``IndexError`` text (for
            example just ``0``) from being shown to the user.
    """
    candidate = payload[0] if isinstance(payload, list) and payload else payload
    if isinstance(candidate, dict) and "generated_text" in candidate:
        return candidate["generated_text"]
    raise RuntimeError(f"Unexpected response payload: {payload!r:.200}")


def _request_generated_text(url, headers, payload, error_label, gone_message=None):
    """POST *payload* to *url* and return the generated text.

    Args:
        url: Endpoint to send the request to.
        headers: HTTP headers for the request.
        payload: JSON-serialisable request body.
        error_label: Prefix used in the error raised for non-200 statuses.
        gone_message: Optional dedicated error text for HTTP 410.

    Raises:
        RuntimeError: on any non-200 status or an unexpected response shape.
        requests.RequestException: on network failures or timeouts.
    """
    response = requests.post(url, headers=headers, json=payload, timeout=30)
    if response.status_code == 200:
        return _extract_generated_text(response.json())
    if response.status_code == 410 and gone_message is not None:
        raise RuntimeError(gone_message)
    raise RuntimeError(f"{error_label} error: {response.status_code}")


def query_huggingface_router(prompt, model_id):
    """Query the Router API for *model_id*, falling back to a second endpoint.

    Args:
        prompt: Text sent as the ``inputs`` field of the request.
        model_id: Model identifier appended to both endpoint URLs.

    Returns:
        The generated text on success. If both attempts fail, a
        human-readable error string describing the fallback failure is
        returned instead; request errors are never raised to the caller.
    """
    # HF_TOKEN defaults to "", which would yield a malformed "Bearer " header;
    # send no Authorization header at all in that case.
    headers = {"Authorization": f"Bearer {HF_TOKEN}"} if HF_TOKEN else {}
    payload = {
        "inputs": prompt,
        "parameters": {"max_new_tokens": 600, "temperature": 0.7},
    }

    # 1) Primary attempt: Router API.
    # NOTE(review): confirm this router path is the currently supported one.
    router_url = "https://router.huggingface.co/models/" + model_id
    try:
        return _request_generated_text(
            router_url,
            headers,
            payload,
            "Router",
            gone_message="Old endpoint rejected (410)",
        )
    except Exception as router_error:
        # Best-effort boundary: any failure of the first attempt triggers the fallback.
        print("⚠️ Router недоступен, выполняется fallback:", str(router_error))

    # 2) Fallback attempt: direct request for the specific model.
    # NOTE(review): this URL looks like the Hub model-metadata endpoint rather
    # than an inference endpoint - confirm it accepts POSTed generation payloads.
    fallback_url = f"https://huggingface.co/api/models/{model_id}"
    try:
        return _request_generated_text(fallback_url, headers, payload, "Fallback")
    except Exception as fallback_error:
        # Callers expect a string result, so report the failure as text.
        return f"❌ Ошибка при обращении к API: {str(fallback_error)}"
 # ==============================
+# 🧠 Основная логика
 # ==============================
 def generate_response(user_input):
     try:
         start = time.time()
         prefs = analyze_user_input(user_input)
         model_id = choose_model(user_input)
+        result = query_huggingface_router(user_input, model_id)
         check = evaluate_answer(result)
         improved = improve_answer(result)
         summary = (
             f"🧠 **Модель:** `{model_id}`\n"
             f"⚡ **Время отклика:** {response_time} сек\n"
+            f"🔍 **Проверка качества:** {check['result']}\n"
             f"{'; '.join(check['feedback']) if check['feedback'] else '✅ Всё отлично'}\n\n"
             f"{context}"
         )
 # ==============================
 def generate_chart():
     if not os.path.exists(LOG_FILE):
+        return "⚠️ Нет данных для графика."
     df = pd.read_csv(LOG_FILE)
     if df.empty:
         return "⚠️ История пуста."
     df["time"] = pd.to_datetime(df["time"])
     df = df.tail(50)
     plt.plot(df["time"], df["response_time"], marker="o", linewidth=1.5)
     plt.title("⚡ Скорость отклика моделей (последние 50 запросов)")
     plt.xlabel("Время")
+    plt.ylabel("Секунды")
     plt.grid(True)
     buffer = BytesIO()
     plt.savefig(buffer, format="png", bbox_inches="tight")
     buffer.seek(0)
     return metrics_text, df, chart_html
 # ==============================
+# 🎨 Интерфейс Gradio
 # ==============================
+with gr.Blocks(title="Eroha AgentAPI v5.6 — AutoRouter Failover Core", theme="soft") as app:
+    gr.Markdown("# 🤖 Eroha AgentAPI v5.6 — Guru Edition (AutoRouter + Failover Core)")
+    gr.Markdown("**Автоматический Router + fallback + визуальная аналитика** ⚙️")
     with gr.Tab("💬 Agent Chat"):
+        user_input = gr.Textbox(label="Введите запрос", placeholder="Например: придумай философскую сказку об ИИ.")
         output_box = gr.Textbox(label="Ответ", lines=15)
         submit_btn = gr.Button("🚀 Отправить")
         submit_btn.click(fn=generate_response, inputs=user_input, outputs=output_box)