Spaces:

anaspro
/

chatbox

Runtime error

App Files Files Community

anaspro committed on Oct 26

Commit

e2196c4

1 Parent(s): 51d3416

updatE

Browse files

Files changed (3) hide show

README.md +9 -9
app.py +9 -46
test_iraqi_model.py +35 -51

README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-title: Iraqi AI Assistant - ذكاء عراقي
 emoji: 🤖
 colorFrom: blue
 colorTo: green
@@ -10,23 +10,23 @@ pinned: false
 models:
 - inceptionai/jais-family-13b-chat
 tags:
-- customer-support
 - arabic
 - chatbot
-- iraqi-dialect
-- tech-support
 - multilingual
 ---
-ذكاء صناعي متقدم يدعم اللغتين العربية والإنجليزية - Jais AI.
 🚀 **المميزات:**
-- 🌐 دعم ثنائي اللغة (عربي وإنجليزي)
-- 🧠 موديل Jais المتقدم من Inception
 - 💬 إجابات ذكية واحترافية
-- 🎯 مدعوم بـ موديل 13B مع تحسينات الأداء
-📞 احجي مع الذكاء الاصطناعي باللهجة العراقية في أي موضوع تريده.
 ## 🚀 كيفية النشر على Hugging Face Spaces ZeroGPU

 ---
+title: Jais AI - ذكاء جيس
 emoji: 🤖
 colorFrom: blue
 colorTo: green
 models:
 - inceptionai/jais-family-13b-chat
 tags:
 - arabic
+- english
 - chatbot
+- jais
+- inception
 - multilingual
 ---
+ذكاء اصطناعي متقدم يدعم اللغة العربية - موديل Jais من Inception.
 🚀 **المميزات:**
+- 🇸🇦 التركيز على اللغة العربية
+- 🧠 موديل Jais 13B المتقدم من Inception
 - 💬 إجابات ذكية واحترافية
+- 🎯 سهل الاستخدام بدون إعدادات معقدة
+📞 احجي مع ذكاء Jais الاصطناعي بالعربية.
 ## 🚀 كيفية النشر على Hugging Face Spaces ZeroGPU

app.py CHANGED Viewed

@@ -59,41 +59,11 @@ def get_response(text, tokenizer=tokenizer, model=model):
     response = response.split("### Response :")[-1]
     return response
-def format_conversation_history(chat_history):
-    messages = []
-    for item in chat_history:
-        role = item["role"]
-        content = item["content"]
-        if isinstance(content, list):
-            content = content[0]["text"] if content and "text" in content[0] else str(content)
-        messages.append({"role": role, "content": content})
-    return messages
-def detect_language(text):
-    """Simple language detection - Arabic vs English"""
-    arabic_chars = sum(1 for char in text if '\u0600' <= char <= '\u06FF')
-    total_chars = len(text.replace(' ', ''))
-    if total_chars == 0:
-        return 'ar'  # default to Arabic
-    arabic_ratio = arabic_chars / total_chars
-    return 'ar' if arabic_ratio > 0.3 else 'en'
 @spaces.GPU()
-def generate_response(input_data, chat_history, max_new_tokens, temperature, top_p, top_k, repetition_penalty):
-    # Detect language of the current question (مثل الكود الأصلي)
-    def detect_language(text):
-        arabic_chars = sum(1 for char in text if '\u0600' <= char <= '\u06FF')
-        total_chars = len(text.replace(' ', ''))
-        if total_chars == 0:
-            return 'ar'
-        arabic_ratio = arabic_chars / total_chars
-        return 'ar' if arabic_ratio > 0.3 else 'en'
-    lang = detect_language(input_data)
     ques = input_data
-    text = prompt_ar.format_map({'Question': ques}) if lang == 'ar' else prompt_eng.format_map({'Question': ques})
     try:
         response = get_response(text)
@@ -107,32 +77,25 @@ def generate_response(input_data, chat_history, max_new_tokens, temperature, top
 demo = gr.ChatInterface(
     fn=generate_response,
-    additional_inputs=[
-        gr.Slider(label="الحد الأقصى للكلمات الجديدة", minimum=64, maximum=4096, step=1, value=2048),
-        gr.Slider(label="درجة الحرارة", minimum=0.1, maximum=2.0, step=0.1, value=0.7),
-        gr.Slider(label="Top-p", minimum=0.05, maximum=1.0, step=0.05, value=0.9),
-        gr.Slider(label="Top-k", minimum=1, maximum=100, step=1, value=50),
-        gr.Slider(label="عقوبة التكرار", minimum=1.0, maximum=2.0, step=0.05, value=1.0)
-    ],
     examples=[
         [{"text": "ما هي عاصمة الامارات؟"}],
         [{"text": "شرح لي الذكاء الاصطناعي"}],
         [{"text": "أخبرني قصة قصيرة"}],
         [{"text": "كيف أتعلم البرمجة؟"}],
-        [{"text": "What is the capital of UAE?"}],
     ],
     cache_examples=False,
     type="messages",
-    title="Jais AI - ذكاء صناعي متقدم",
-    description="""🤖 ذكاء صناعي متقدم يدعم اللغتين العربية والإنجليزية
 ✨ المميزات:
-- 🌐 دعم ثنائي اللغة (عربي وإنجليزي)
 - 🧠 موديل Jais المتقدم من Inception
 - 💬 إجابات ذكية واحترافية
-- 🎯 مدعوم بـ موديل 13B مع تحسينات الأداء
-احجي مع ذكاء Jais الاصطناعي في أي موضوع تريده.""",
     fill_height=True,
     textbox=gr.Textbox(
         label="اكتب رسالتك هنا",

     response = response.split("### Response :")[-1]
     return response
 @spaces.GPU()
+def generate_response(input_data, chat_history):
+    # Use Arabic prompt for all responses (simplified approach)
     ques = input_data
+    text = prompt_ar.format_map({'Question': ques})
     try:
         response = get_response(text)
 demo = gr.ChatInterface(
     fn=generate_response,
     examples=[
         [{"text": "ما هي عاصمة الامارات؟"}],
         [{"text": "شرح لي الذكاء الاصطناعي"}],
         [{"text": "أخبرني قصة قصيرة"}],
         [{"text": "كيف أتعلم البرمجة؟"}],
+        [{"text": "ما هو الفرق بين الذكاء الاصطناعي والتعلم الآلي؟"}],
     ],
     cache_examples=False,
     type="messages",
+    title="Jais AI - ذكاء جيس العربي",
+    description="""🤖 ذكاء صناعي متقدم يدعم اللغة العربية
 ✨ المميزات:
+- 🇸🇦 التركيز على اللغة العربية
 - 🧠 موديل Jais المتقدم من Inception
 - 💬 إجابات ذكية واحترافية
+- 🎯 سهل الاستخدام بدون إعدادات معقدة
+احجي مع ذكاء Jais الاصطناعي بالعربية.""",
     fill_height=True,
     textbox=gr.Textbox(
         label="اكتب رسالتك هنا",

test_iraqi_model.py CHANGED Viewed

@@ -1,69 +1,53 @@
 #!/usr/bin/env python3
 """
-اختبار الموديل العراقي 4-bit
 """
 import os
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM
-def test_model():
     model_path = "inceptionai/jais-family-13b-chat"
-    hf_token = os.getenv("HF_TOKEN")
-    print("جاري تحميل مودل Jais...")
-    tokenizer = AutoTokenizer.from_pretrained(
-        model_path,
-        token=hf_token,
-        trust_remote_code=True
-    )
-    model = AutoModelForCausalLM.from_pretrained(
-        model_path,
-        device_map="auto",
-        trust_remote_code=True,
-        token=hf_token,
-        torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
-        low_cpu_mem_usage=True
-    )
-    if tokenizer.pad_token is None:
-        tokenizer.pad_token = tokenizer.eos_token
-    # اختبار الـ prompt الجديد
-    prompt = """### Instruction:أنت ذكاء صناعي يتحدث باللهجة العراقية ويجيب باحترافية وذكاء. الإجابات دائما تستخدم اللهجة العراقية.
-### Input:[|Human|] مرحبا كيفك؟
-[|AI|]
-### Response :"""
-    inputs = tokenizer(prompt, return_tensors="pt")
-    input_ids = inputs['input_ids'].to('cuda' if torch.cuda.is_available() else 'cpu')
-    attention_mask = inputs['attention_mask'].to('cuda' if torch.cuda.is_available() else 'cpu')
-    print("جاري توليد الرد...")
-    outputs = model.generate(
-        input_ids,
-        attention_mask=attention_mask,
-        max_length=input_ids.shape[-1] + 100,
-        temperature=0.3,
-        top_p=0.8,
-        do_sample=True,
-        pad_token_id=tokenizer.pad_token_id,
-        eos_token_id=tokenizer.eos_token_id
-    )
-    response = tokenizer.decode(outputs[0], skip_special_tokens=True)
-    # استخراج الرد الجديد فقط
-    if "### Response :" in response:
-        response = response.split("### Response :")[-1].strip()
     print("=" * 50)
     print("الاختبار نجح! ✅")
     print(f"الموديل: {model_path}")
-    print("الـ prompt: ذكاء صناعي باللهجة العراقية (مع التأكيد على استخدام اللهجة دائماً)"
     print(f"الرد: {response}")
     print("=" * 50)
 if __name__ == "__main__":
-    test_model()

 #!/usr/bin/env python3
 """
+اختبار مودل Jais - مثل الكود الأصلي
 """
 import os
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM
+def test_jais():
     model_path = "inceptionai/jais-family-13b-chat"
+    # تحميل المودل مثل الكود الأصلي
+    tokenizer = AutoTokenizer.from_pretrained(model_path)
+    model = AutoModelForCausalLM.from_pretrained(model_path, device_map="auto", trust_remote_code=True)
+    # الـ prompts الأصلية
+    prompt_eng = "### Instruction:Your name is 'Jais', and you are named after Jebel Jais, the highest mountain in UAE. You were made by 'Inception' in the UAE. You are a helpful, respectful, and honest assistant. Always answer as helpfully as possible, while being safe. Complete the conversation between [|Human|] and [|AI|]:\n### Input: [|Human|] {Question}\n[|AI|]\n### Response :"
+    prompt_ar = "### Instruction:اسمك \"جيس\" وسميت على اسم جبل جيس اعلى جبل في الامارات. تم بنائك بواسطة Inception في الإمارات. أنت مساعد مفيد ومحترم وصادق. أجب دائمًا بأكبر قدر ممكن من المساعدة، مع الحفاظ على البقاء أمناً. أكمل المحادثة بين [|Human|] و[|AI|] :\n### Input:[|Human|] {Question}\n[|AI|]\n### Response :"
+    def get_response(text):
+        input_ids = tokenizer(text, return_tensors="pt").input_ids
+        inputs = input_ids.to("cuda" if torch.cuda.is_available() else "cpu")
+        input_len = inputs.shape[-1]
+        generate_ids = model.generate(
+            inputs,
+            top_p=0.9,
+            temperature=0.3,
+            max_length=2048,
+            min_length=input_len + 4,
+            repetition_penalty=1.2,
+            do_sample=True,
+        )
+        response = tokenizer.batch_decode(
+            generate_ids, skip_special_tokens=True, clean_up_tokenization_spaces=True
+        )[0]
+        response = response.split("### Response :")[-1]
+        return response
+    # اختبار عربي فقط (التركيز على العربية)
+    ques = "ما هي عاصمة الامارات؟"
+    text = prompt_ar.format_map({'Question': ques})
+    response = get_response(text)
     print("=" * 50)
     print("الاختبار نجح! ✅")
     print(f"الموديل: {model_path}")
+    print("السؤال: ما هي عاصمة الامارات؟")
     print(f"الرد: {response}")
     print("=" * 50)
 if __name__ == "__main__":
+    test_jais()