Spaces:

MarioMamdouh121
/

Arabic-qa

Sleeping

MarioMamdouh121 committed on May 6, 2025

Commit

9c8d6cc

verified ·

1 Parent(s): e0793b2

Update src/streamlit_app.py

Files changed (1) hide show

src/streamlit_app.py CHANGED Viewed

@@ -1,14 +1,14 @@
 from transformers import AutoModelForQuestionAnswering, AutoTokenizer
-from arabert.preprocess import ArabertPreprocessor
 import streamlit as st
 import torch
 import os
 # Load model
-model = AutoModelForQuestionAnswering.from_pretrained("MarioMamdouh121/arabic-qa-model")
-tokenizer = AutoTokenizer.from_pretrained("MarioMamdouh121/arabic-qa-model")
-arabert_prep = ArabertPreprocessor(model_name="aubmindlab/bert-base-arabertv2")
 # Streamlit interface
 st.title("Arabic Question Answering")
@@ -19,8 +19,8 @@ question = st.text_input("السؤال")
 if st.button("احصل على الجواب") and context and question:
     # Preprocess
-    context_proc = arabert_prep.preprocess(context)
-    question_proc = arabert_prep.preprocess(question)
     # Tokenize
     inputs = tokenizer(

 from transformers import AutoModelForQuestionAnswering, AutoTokenizer
+from farasa.segmenter import FarasaSegmenter
 import streamlit as st
 import torch
 import os
 # Load model
+model = AutoModelForQuestionAnswering.from_pretrained("checkpoint-2817")
+tokenizer = AutoTokenizer.from_pretrained("checkpoint-2817")
+segmenter = FarasaSegmenter(interactive=False)
 # Streamlit interface
 st.title("Arabic Question Answering")
 if st.button("احصل على الجواب") and context and question:
     # Preprocess
+    context_proc = segmenter.segment(context)
+    question_proc = segmenter.segment(question)
     # Tokenize
     inputs = tokenizer(