"""Centralized Arabic retrieval normalization replacements."""

# Maps Arabic (and a few transliterated / Latin) surface forms found in user
# queries to the English terms they should be normalized to for retrieval.
# Spelling variants (ة/ه, ى/ي, hamza forms) are listed as separate keys.
#
# NOTE(review): insertion order is preserved exactly as authored. Several
# longer phrases are listed AFTER one of their sub-phrases (e.g.
# "تقديم اونلاين" after "تقديم"). If the consumer applies replacements
# sequentially in insertion order, those longer phrases can never match;
# confirm the consumer sorts keys longest-first before substituting.
ARABIC_REPLACEMENTS = {
    "الفرق بين": "difference between",
    "ايه الفرق بين": "difference between",
    "ما الفرق بين": "difference between",
    "المعدل التراكمي العام": "cgpa cumulative gpa overall gpa",
    "المعدل التراكمي": "cgpa cumulative gpa",
    "معدل تراكمي": "cgpa cumulative gpa",
    "التراكمي": "cgpa cumulative gpa",
    "المعدل الفصلي": "gpa semester gpa",
    "معدل فصلي": "gpa semester gpa",
    "الفصلي": "semester gpa",
    "ادفيزور": "advisor",
    "مشرف": "advisor",
    "مرشد": "advisor",
    "ارشاد": "advising",
    "مقررات": "courses",
    "كورسات": "courses",
    "تسجيل": "registration",
    "جدول": "schedule",
    "جداول": "schedule",
    "خطة": "study plan",
    "خطه": "study plan",
    "تراك": "track",
    "تخصص": "major",
    "جامعة النيل": "nile university",
    "جامعه النيل": "nile university",
    "النيل": "nile university",
    "الساعه": "credit hour",
    "الساعة": "credit hour",
    "ساعه": "credit hour",
    "ساعة": "credit hour",
    "كريدت": "credit",
    "بكام": "price",
    "سعر": "price",
    "رسوم": "fees",
    "تكلفة": "cost",
    "تكلفه": "cost",
    "مصاريف": "tuition fees",
    "قسط": "installment",
    "منحه": "scholarship",
    "منح": "scholarship",
    "تقديم": "application",
    "قبول": "admission",
    "التحاق": "enrollment",
    "شروط": "requirements",
    "مستندات": "documents",
    "اوراق": "documents",
    "تحويل": "transfer",
    "معادله": "equivalency",
    "مكتبه": "library",
    "مكتبة": "library",
    "مواصلات": "transportation",
    "باص": "bus",
    "سكن": "housing",
    "عياده": "clinic",
    "عيادة": "clinic",
    "جيم": "gym",
    "انشطة": "activities",
    "انشطه": "activities",
    "مشكلة": "issue",
    "مشكله": "issue",
    "شكوى": "complaint",
    "شكوي": "complaint",
    "مفقود": "lost",
    "مفقوده": "lost",
    "مفقودات": "lost found items",
    "ضايع": "lost",
    "ضائع": "lost",
    "معثور": "found",
    "العثور": "found",
    "الاشياء": "items",
    "الأشياء": "items",
    "اشياء": "items",
    "الامن": "security office",
    "أمن": "security office",
    "مكتب الامن": "security office",
    "مكتب الأمن": "security office",
    "سيكيورتي": "security office",
    "تدريب": "internship",
    "موقع": "website",
    "ايميل": "email",
    "بريد": "email",
    "اوتلوك": "outlook",
    "مودل": "moodle",
    "المودل": "moodle",
    "بوابه": "portal",
    "بوابة": "portal",
    "سيلف سيرفس": "self service",
    "الخدمه الذاتيه": "self service",
    "الخدمة الذاتية": "self service",
    "الخدمه": "service",
    "الخدمة": "service",
    "طلب": "request",
    "طلبات": "requests",
    "نموذج": "form",
    "نماذج": "forms",
    "نموذح": "form",
    "تواصل": "contact",
    "التواصل": "contact",
    "رقم": "phone",
    "تليفون": "phone",
    "موبايل": "phone",
    "واتساب": "whatsapp",
    "لينك": "link",
    "رابط": "link",
    "ويب": "website",
    "اونلاين": "online",
    "أونلاين": "online",
    "الكتروني": "online",
    "إلكتروني": "online",
    "ابلكيشن": "application",
    "ابليكيشن": "application",
    "ابليكشن": "application",
    "ابلاي": "apply",
    "تقديم اونلاين": "online application",
    "التقديم اونلاين": "online application",
    "مصروف": "tuition",
    "المصروف": "tuition",
    "مصاريف الجامعة": "tuition fees",
    "رسوم الجامعة": "tuition fees",
    "فلوس": "fees",
    "تكاليف": "cost",
    "الاسعار": "price",
    "الأسعار": "price",
    "زيادة": "increase",
    "زياده": "increase",
    "استرداد": "refund",
    "استرجاع": "refund",
    "مرتجع": "refund",
    "دفع": "payment",
    "سداد": "payment",
    "اقساط": "installments",
    "أقساط": "installments",
    "قسط اول": "first installment",
    "قسط اولى": "first installment",
    "القسط الاول": "first installment",
    "خصم": "discount",
    "تخفيض": "discount",
    "اعفاء": "waiver",
    "إعفاء": "waiver",
    "مساعده ماليه": "financial aid",
    "مساعدة مالية": "financial aid",
    "دعم مالي": "financial aid",
    "منح دراسية": "scholarships",
    "المنح": "scholarship",
    "تفوق": "merit",
    "امتياز": "excellence",
    "القبول": "admission",
    "الالتحاق": "enrollment",
    "المتطلبات": "requirements",
    "المطلوب": "requirements",
    "اوراق التقديم": "application documents",
    "الاوراق": "documents",
    "الأوراق": "documents",
    "اثبات": "proof",
    "إثبات": "proof",
    "معادلة": "equivalency",
    "تحويلات": "transfer",
    "ترانسفير": "transfer",
    "ثانويه": "high school",
    "ثانوية": "high school",
    "انجليزي": "english",
    "إنجليزي": "english",
    "توفل": "toefl",
    "ايلتس": "ielts",
    "ايلس": "ielts",
    "اختبار تحديد مستوى": "placement test",
    "تحديد مستوى": "placement test",
    "نتيجة": "result",
    "نتايج": "results",
    "نتائج": "results",
    "موعد": "deadline",
    "مواعيد": "deadlines",
    "ميعاد": "date",
    "تواريخ": "dates",
    "ترم": "semester",
    "سمستر": "semester",
    "الفصل": "semester",
    "صيفي": "summer",
    "سمر": "summer",
    "خريفي": "fall",
    "ربيعي": "spring",
    "تسجيل مواد": "course registration",
    "تسجيل المقررات": "course registration",
    "حذف": "drop",
    "اضافة": "add",
    "إضافة": "add",
    "انسحاب": "withdrawal",
    "سحب": "withdrawal",
    "تأجيل": "defer",
    "تجميد": "freeze",
    "اكتف": "activate",
    "تفعيل": "activate",
    "اعتذار": "medical excuse",
    "عذر": "excuse",
    "مرضي": "medical",
    "غياب": "absence",
    "حضور": "attendance",
    "حرمان": "debarred",
    "امتحان": "exam",
    "اختبار": "exam",
    "فاينال": "final exam",
    "ميدترم": "midterm",
    "تقييم": "evaluation",
    "درجات": "grades",
    "درجة": "grade",
    "تقدير": "grade",
    "معدل": "gpa",
    "جي بي ايه": "gpa",
    "سي جي بي ايه": "cgpa",
    "انذار": "probation",
    "إنذار": "probation",
    "فصل": "dismissal",
    "ايقاف": "suspension",
    "إيقاف": "suspension",
    "تخرج": "graduation",
    "خريج": "graduate",
    "شهاده": "certificate",
    "شهادة": "certificate",
    "بيان درجات": "transcript",
    "ترانسكربت": "transcript",
    "خطاب قيد": "enrollment letter",
    "id": "student id",
    "بطاقه": "id card",
    "بطاقة": "id card",
    "كارنيه": "id card",
    "حساب": "account",
    "حسابي": "account",
    "باسورد": "password",
    "كلمه السر": "password",
    "كلمة السر": "password",
    "نسيت الباسورد": "reset password",
    "تسجيل دخول": "login",
    "لوجن": "login",
    "خروج": "logout",
    "البورتال": "portal",
    "بوابة الطالب": "student portal",
    "موديل": "moodle",
    "ميل": "email",
    "بريد جامعي": "university email",
    "ايميل الجامعة": "university email",
    "اوت لوك": "outlook",
    "الرجسترار": "registrar",
    "ريجستار": "registrar",
    "الدعم الفني": "technical support",
    "الدعم التقني": "technical support",
    "اي تي": "it support",
    "it": "it support",
    "نادي": "club",
    "نوادي": "clubs",
    "اتحاد الطلبة": "student union",
    "اتحاد الطلاب": "student union",
    "su": "student union",
    "نشاط": "activity",
    "فعاليات": "events",
    "فعاليه": "event",
    "فعالية": "event",
    "seec": "student activities",
    "تطوع": "volunteering",
    "تطوعي": "volunteering",
    "سفر": "exchange",
    "تبادل": "exchange",
    "exchange": "exchange",
    "تدريب صيفي": "summer internship",
    "وظيفه": "job",
    "وظيفة": "job",
    "وظايف": "jobs",
    "وظائف": "jobs",
    "career": "careers",
    "كارير": "careers",
    "مكتبة الجامعة": "library",
    "استعارة": "borrow",
    "ارجاع": "return",
    "إرجاع": "return",
    "باصات": "buses",
    "موقف": "parking",
    "جراج": "garage",
    "باركينج": "parking",
    "مبيت": "housing",
    "سكن طلاب": "student housing",
    "عيادة الجامعة": "clinic",
    "تأمين طبي": "medical insurance",
    "تامين": "insurance",
    "تامين طبي": "medical insurance",
    "تأمين": "insurance",
    "صالة": "gym",
    "ملاعب": "courts",
    "الملعب": "court",
    "امن": "security office",
    "السكرتاريه": "administration office",
    "سكرتارية": "administration office",
    "مكتب القبول": "admissions office",
    "شؤون الطلبة": "student affairs",
    "الشؤون": "student affairs",
    "مفقودات ومعثورات": "lost and found",
    "المفقودات": "lost and found",
    "المعثورات": "found items",
}

# Regex source (not compiled here) matching Arabic / Egyptian-dialect
# stopwords and politeness phrases as whole words.
#
# The multi-word phrases are listed first on purpose: regex alternation is
# tried left to right and stops at the first alternative that succeeds, so a
# phrase placed after its own first word ("لو" before "لو سمحت", "من" before
# "من فضلك") would never be matched as a unit.
ARABIC_STOPWORDS_PATTERN = (
    r"\b(لو سمحت|من فضلك|"
    r"من|في|على|عن|الى|إلى|مع|او|أو|هل|ما|ماذا|كيف|كم|ليه|انا|هو|هي|هم|ده|دي|دا|"
    r"لو|بس|يعني|عندي|عندكم|اي|ايه|كل|بعد|قبل|هناك|يوجد|توجد|فيه|فيها|ممكن|عايز|عاوزه|"
    r"عاوز|اريد|أريد|فضلا|فضلًا|متى|فين|وين|ليش|لماذا)\b"
)