# AdmissionOfficer / src / replacements.py
# Rwan Ashraf
# Improving Arabic Language
# 548e4d8
"""Centralized Arabic retrieval normalization replacements."""
# Lookup table from Arabic query terms (formal and colloquial spellings, plus
# a few Latin-script abbreviations) to the English keywords used for retrieval.
# Common spelling variants (ة/ه, أ/إ/ا, ى/ي) are listed as separate keys.
# Every key must be unique: a repeated key in a dict literal silently
# overrides the earlier entry.
# NOTE(review): entry order is kept exactly as authored because consumers that
# iterate this dict may depend on it; some multi-word phrases appear after
# their sub-phrases -- confirm how the consumer applies the replacements.
ARABIC_REPLACEMENTS = {
    "الفرق بين": "difference between",
    "ايه الفرق بين": "difference between",
    "ما الفرق بين": "difference between",
    "المعدل التراكمي العام": "cgpa cumulative gpa overall gpa",
    "المعدل التراكمي": "cgpa cumulative gpa",
    "معدل تراكمي": "cgpa cumulative gpa",
    "التراكمي": "cgpa cumulative gpa",
    "المعدل الفصلي": "gpa semester gpa",
    "معدل فصلي": "gpa semester gpa",
    "الفصلي": "semester gpa",
    "ادفيزور": "advisor",
    "مشرف": "advisor",
    "مرشد": "advisor",
    "ارشاد": "advising",
    "مقررات": "courses",
    "كورسات": "courses",
    "تسجيل": "registration",
    "جدول": "schedule",
    "جداول": "schedule",
    "خطة": "study plan",
    "خطه": "study plan",
    "تراك": "track",
    "تخصص": "major",
    "جامعة النيل": "nile university",
    "جامعه النيل": "nile university",
    "النيل": "nile university",
    "الساعه": "credit hour",
    "الساعة": "credit hour",
    "ساعه": "credit hour",
    "ساعة": "credit hour",
    "كريدت": "credit",
    "بكام": "price",
    "سعر": "price",
    "رسوم": "fees",
    "تكلفة": "cost",
    "تكلفه": "cost",
    "مصاريف": "tuition fees",
    "قسط": "installment",
    "منحه": "scholarship",
    "منح": "scholarship",
    "تقديم": "application",
    "قبول": "admission",
    "التحاق": "enrollment",
    "شروط": "requirements",
    "مستندات": "documents",
    "اوراق": "documents",
    "تحويل": "transfer",
    "معادله": "equivalency",
    "مكتبه": "library",
    "مكتبة": "library",
    "مواصلات": "transportation",
    "باص": "bus",
    "سكن": "housing",
    "عياده": "clinic",
    "عيادة": "clinic",
    "جيم": "gym",
    "انشطة": "activities",
    "انشطه": "activities",
    "مشكلة": "issue",
    "مشكله": "issue",
    "شكوى": "complaint",
    "شكوي": "complaint",
    "مفقود": "lost",
    "مفقوده": "lost",
    "مفقودات": "lost found items",
    "ضايع": "lost",
    "ضائع": "lost",
    "معثور": "found",
    "العثور": "found",
    "الاشياء": "items",
    "الأشياء": "items",
    "اشياء": "items",
    "الامن": "security office",
    "أمن": "security office",
    "مكتب الامن": "security office",
    "مكتب الأمن": "security office",
    "سيكيورتي": "security office",
    "تدريب": "internship",
    "موقع": "website",
    "ايميل": "email",
    "بريد": "email",
    "اوتلوك": "outlook",
    "مودل": "moodle",
    "المودل": "moodle",
    "بوابه": "portal",
    "بوابة": "portal",
    "سيلف سيرفس": "self service",
    "الخدمه الذاتيه": "self service",
    "الخدمة الذاتية": "self service",
    "الخدمه": "service",
    "الخدمة": "service",
    "طلب": "request",
    "طلبات": "requests",
    "نموذج": "form",
    "نماذج": "forms",
    "نموذح": "form",
    "تواصل": "contact",
    "التواصل": "contact",
    "رقم": "phone",
    "تليفون": "phone",
    "موبايل": "phone",
    "واتساب": "whatsapp",
    "لينك": "link",
    "رابط": "link",
    "ويب": "website",
    "اونلاين": "online",
    "أونلاين": "online",
    "الكتروني": "online",
    "إلكتروني": "online",
    "ابلكيشن": "application",
    "ابليكيشن": "application",
    "ابليكشن": "application",
    "ابلاي": "apply",
    "تقديم اونلاين": "online application",
    "التقديم اونلاين": "online application",
    "مصروف": "tuition",
    "المصروف": "tuition",
    "مصاريف الجامعة": "tuition fees",
    "رسوم الجامعة": "tuition fees",
    "فلوس": "fees",
    "تكاليف": "cost",
    "الاسعار": "price",
    "الأسعار": "price",
    "زيادة": "increase",
    "زياده": "increase",
    "استرداد": "refund",
    "استرجاع": "refund",
    "مرتجع": "refund",
    "دفع": "payment",
    "سداد": "payment",
    "اقساط": "installments",
    "أقساط": "installments",
    "قسط اول": "first installment",
    "قسط اولى": "first installment",
    "القسط الاول": "first installment",
    "خصم": "discount",
    "تخفيض": "discount",
    "اعفاء": "waiver",
    "إعفاء": "waiver",
    "مساعده ماليه": "financial aid",
    "مساعدة مالية": "financial aid",
    "دعم مالي": "financial aid",
    "منح دراسية": "scholarships",
    "المنح": "scholarship",
    "تفوق": "merit",
    "امتياز": "excellence",
    "القبول": "admission",
    "الالتحاق": "enrollment",
    "المتطلبات": "requirements",
    "المطلوب": "requirements",
    "اوراق التقديم": "application documents",
    "الاوراق": "documents",
    "الأوراق": "documents",
    "اثبات": "proof",
    "إثبات": "proof",
    "معادلة": "equivalency",
    "تحويلات": "transfer",
    "ترانسفير": "transfer",
    "ثانويه": "high school",
    "ثانوية": "high school",
    "انجليزي": "english",
    "إنجليزي": "english",
    "توفل": "toefl",
    "ايلتس": "ielts",
    "ايلس": "ielts",
    "اختبار تحديد مستوى": "placement test",
    "تحديد مستوى": "placement test",
    "نتيجة": "result",
    "نتايج": "results",
    "نتائج": "results",
    "موعد": "deadline",
    "مواعيد": "deadlines",
    "ميعاد": "date",
    "تواريخ": "dates",
    "ترم": "semester",
    "سمستر": "semester",
    "الفصل": "semester",
    "صيفي": "summer",
    "سمر": "summer",
    "خريفي": "fall",
    "ربيعي": "spring",
    "تسجيل مواد": "course registration",
    "تسجيل المقررات": "course registration",
    "حذف": "drop",
    "اضافة": "add",
    "إضافة": "add",
    "انسحاب": "withdrawal",
    "سحب": "withdrawal",
    "تأجيل": "defer",
    "تجميد": "freeze",
    "اكتف": "activate",
    "تفعيل": "activate",
    "اعتذار": "medical excuse",
    "عذر": "excuse",
    "مرضي": "medical",
    "غياب": "absence",
    "حضور": "attendance",
    "حرمان": "debarred",
    "امتحان": "exam",
    "اختبار": "exam",
    "فاينال": "final exam",
    "ميدترم": "midterm",
    "تقييم": "evaluation",
    "درجات": "grades",
    "درجة": "grade",
    "تقدير": "grade",
    "معدل": "gpa",
    "جي بي ايه": "gpa",
    "سي جي بي ايه": "cgpa",
    "انذار": "probation",
    "إنذار": "probation",
    "فصل": "dismissal",
    "ايقاف": "suspension",
    "إيقاف": "suspension",
    "تخرج": "graduation",
    "خريج": "graduate",
    "شهاده": "certificate",
    "شهادة": "certificate",
    "بيان درجات": "transcript",
    "ترانسكربت": "transcript",
    "خطاب قيد": "enrollment letter",
    "id": "student id",
    "بطاقه": "id card",
    "بطاقة": "id card",
    "كارنيه": "id card",
    "حساب": "account",
    "حسابي": "account",
    "باسورد": "password",
    "كلمه السر": "password",
    "كلمة السر": "password",
    "نسيت الباسورد": "reset password",
    "تسجيل دخول": "login",
    "لوجن": "login",
    "خروج": "logout",
    "البورتال": "portal",
    "بوابة الطالب": "student portal",
    "موديل": "moodle",
    "ميل": "email",
    "بريد جامعي": "university email",
    "ايميل الجامعة": "university email",
    "اوت لوك": "outlook",
    "الرجسترار": "registrar",
    "ريجستار": "registrar",
    "الدعم الفني": "technical support",
    "الدعم التقني": "technical support",
    "اي تي": "it support",
    "it": "it support",
    "نادي": "club",
    "نوادي": "clubs",
    "اتحاد الطلبة": "student union",
    "اتحاد الطلاب": "student union",
    "su": "student union",
    "نشاط": "activity",
    "فعاليات": "events",
    "فعاليه": "event",
    "فعالية": "event",
    "seec": "student activities",
    "تطوع": "volunteering",
    "تطوعي": "volunteering",
    "سفر": "exchange",
    "تبادل": "exchange",
    "exchange": "exchange",
    "تدريب صيفي": "summer internship",
    "وظيفه": "job",
    "وظيفة": "job",
    "وظايف": "jobs",
    "وظائف": "jobs",
    "career": "careers",
    "كارير": "careers",
    "مكتبة الجامعة": "library",
    "استعارة": "borrow",
    "ارجاع": "return",
    "إرجاع": "return",
    "باصات": "buses",
    "موقف": "parking",
    "جراج": "garage",
    "باركينج": "parking",
    "مبيت": "housing",
    "سكن طلاب": "student housing",
    "عيادة الجامعة": "clinic",
    "تأمين طبي": "medical insurance",
    "تامين": "insurance",
    "تامين طبي": "medical insurance",
    "تأمين": "insurance",
    "صالة": "gym",
    "ملاعب": "courts",
    "الملعب": "court",
    "امن": "security office",
    "السكرتاريه": "administration office",
    "سكرتارية": "administration office",
    "مكتب القبول": "admissions office",
    "شؤون الطلبة": "student affairs",
    "الشؤون": "student affairs",
    "مفقودات ومعثورات": "lost and found",
    "المفقودات": "lost and found",
    "المعثورات": "found items",
}
# Regex source (not compiled here) matching Arabic filler and function words
# as whole words, for use with the `re` module. All alternatives sit in a
# single capturing group delimited by \b word boundaries.
ARABIC_STOPWORDS_PATTERN = (
    # Multi-word phrases come first: alternation is tried left to right, so a
    # one-word prefix such as "لو" or "من" listed earlier would match on its
    # own and leave the rest of the phrase ("سمحت" / "فضلك") in the text.
    r"\b(لو سمحت|من فضلك|"
    r"من|في|على|عن|الى|إلى|مع|او|أو|هل|ما|ماذا|كيف|كم|ليه|انا|هو|هي|هم|ده|دي|دا|"
    r"لو|بس|يعني|عندي|عندكم|اي|ايه|كل|بعد|قبل|هناك|يوجد|توجد|فيه|فيها|ممكن|عايز|عاوزه|"
    r"عاوز|اريد|أريد|فضلا|فضلًا|متى|فين|وين|ليش|لماذا)\b"
)