FECUOY committed on
Commit
63957d1
·
verified ·
1 Parent(s): 94045d9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +18 -62
app.py CHANGED
@@ -1,67 +1,23 @@
1
- import gradio as gr
2
- from huggingface_hub import InferenceClient
3
 
4
def respond(
    message,
    history: list[dict[str, str]],
    system_message,
    max_tokens,
    temperature,
    top_p,
    hf_token: gr.OAuthToken,
):
    """Stream a chat completion from moonshotai/Kimi-K2-Instruct.

    Yields the accumulated response text after each streamed token so the
    Gradio UI can render it incrementally; on any failure, yields a single
    error message instead.
    """
    # Authenticate against the HF Inference API with the user's OAuth token.
    client = InferenceClient(
        model="moonshotai/Kimi-K2-Instruct",
        token=hf_token.token,
    )

    # Conversation = system prompt, prior turns, then the new user message.
    # With ChatInterface(type="messages") the history entries are already
    # {"role": ..., "content": ...} dicts, so they can be spliced in as-is.
    conversation = [{"role": "system", "content": system_message}]
    conversation.extend(history)
    conversation.append({"role": "user", "content": message})

    partial = ""
    try:
        stream = client.chat_completion(
            conversation,
            max_tokens=max_tokens,
            stream=True,
            temperature=temperature,
            top_p=top_p,
        )
        for chunk in stream:
            # Guard clause: skip chunks with an empty choices list before
            # indexing [0].
            if not chunk.choices:
                continue
            piece = chunk.choices[0].delta.content
            if piece:
                partial += piece
                yield partial
    except Exception as e:
        yield f"⚠️ حدث خطأ: {str(e)}"
47
-
48
# Gradio chat UI wired to the streaming `respond` generator.
chatbot = gr.ChatInterface(
    respond,
    type="messages",  # ensures history is delivered as role/content dicts
    additional_inputs=[
        gr.Textbox(value="أنت مساعد ذكي ومفيد.", label="System message"),
        gr.Slider(minimum=1, maximum=4096, value=1024, step=1, label="Max tokens"),
        gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature"),
        gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p"),
    ],
    # Fix: the title previously said "Qwen 2.5 72B Chatbot", but the handler
    # calls moonshotai/Kimi-K2-Instruct — label the app after the real model.
    title="Kimi K2 Chatbot",
)
60
-
61
# Top-level layout: a sidebar holding the Hugging Face login button (which
# supplies the gr.OAuthToken the chat handler receives) next to the rendered
# chat interface.
with gr.Blocks() as demo:
    with gr.Sidebar():
        gr.LoginButton()
    chatbot.render()

# Launch the server only when executed as a script, not on import.
if __name__ == "__main__":
    demo.launch()
 
 
 
 
 
 
1
// Minimal streaming demo: ask Kimi-K2 one question and print tokens as they
// arrive, while accumulating the full answer in `out`.
import { InferenceClient } from "@huggingface/inference";

const client = new InferenceClient(process.env.HF_TOKEN);

let out = "";

const stream = client.chatCompletionStream({
  model: "moonshotai/Kimi-K2-Instruct-0905",
  messages: [
    {
      role: "user",
      content: "What is the capital of France?",
    },
  ],
});

for await (const chunk of stream) {
  if (chunk.choices && chunk.choices.length > 0) {
    const newContent = chunk.choices[0].delta.content;
    // Fix: delta.content is undefined on role-only/terminal chunks; the
    // unguarded `out += newContent` spliced the literal string "undefined"
    // into the accumulated answer (and logged it). Append only real text.
    if (newContent) {
      out += newContent;
      console.log(newContent);
    }
  }
}