Spaces:

flax-community
/

roberta-base-mr

Runtime error

hassiahk committed on Jul 17, 2021

Commit

97275be

1 Parent(s): 0bc5c62

Added model hub links

Files changed (2) hide show

apps/classifier.py CHANGED Viewed

@@ -20,17 +20,30 @@ def load_model(input_text, model_name_or_path):
 def app():
     st.title("RoBERTa Marathi")
     classifier = st.sidebar.selectbox("Select a Model", index=0, options=["Indic NLP", "iNLTK"])
     sample_texts = [
-        "दानिश सिद्दीकीच्या मृत्यूला आम्ही जबाबदार नाही",
         "अध्यक्ष शरद पवार आणि उपमुख्यमंत्री अजित पवार यांची भेट घेतली.",
         "मोठी बातमी! उद्या दुपारी १ वाजता जाहीर होणार दहावीचा निकाल",
     ]
     model_name_or_path = cfg["models"][classifier]
-    input_text = st.sidebar.selectbox("Select a Text", options=sample_texts)
-    text_to_classify = st.text_input("Text:", input_text)
     predict_button = st.button("Predict")

 def app():
     st.title("RoBERTa Marathi")
+    st.markdown(
+        "This demo uses [RoBERTa for Marathi](https://huggingface.co/flax-community/roberta-base-mr) model "
+        "trained on [mC4](https://huggingface.co/datasets/mc4)."
+    )
+    st.markdown(
+        "Can't figure out where to get a sample text? Visit this "
+        "[link](https://maharashtratimes.com/entertainment/articlelist/19359255.cms), copy any headline and see if "
+        "the model is predicting it as `entertainment` or not."
+    )
     classifier = st.sidebar.selectbox("Select a Model", index=0, options=["Indic NLP", "iNLTK"])
     sample_texts = [
         "अध्यक्ष शरद पवार आणि उपमुख्यमंत्री अजित पवार यांची भेट घेतली.",
         "मोठी बातमी! उद्या दुपारी १ वाजता जाहीर होणार दहावीचा निकाल",
+        "Custom",
     ]
     model_name_or_path = cfg["models"][classifier]
+    text_to_classify = st.selectbox("Select a Text", options=sample_texts, index=len(sample_texts) - 1)
+    if text_to_classify == "Custom":
+        text_to_classify = st.text_input("Enter custom text:")
     predict_button = st.button("Predict")

apps/mlm.py CHANGED Viewed

@@ -15,12 +15,22 @@ def load_model(input_text, model_name_or_path):
     nlp = pipeline("fill-mask", model=model, tokenizer=tokenizer)
     result = nlp(input_text)
     sentence, mask = result[0]["sequence"], result[0]["token_str"]
-    return sentence, mask
 def app():
     st.title("RoBERTa Marathi")
     masked_texts = [
         "मोठी बातमी! उद्या दुपारी <mask> वाजता जाहीर होणार दहावीचा निकाल",
         "अध्यक्ष <mask> पवार आणि उपमुख्यमंत्री अजित पवार यांची भेट घेतली.",
@@ -33,7 +43,9 @@ def app():
     if fill_button:
         with st.spinner("Filling the Mask..."):
-            filled_sentence, mask = load_model(masked_text, cfg["models"]["RoBERTa"])
             st.markdown(f"**Filled sentence: **{filled_sentence}")
             st.markdown(f"**Predicted masked token: **{mask}")

     nlp = pipeline("fill-mask", model=model, tokenizer=tokenizer)
     result = nlp(input_text)
     sentence, mask = result[0]["sequence"], result[0]["token_str"]
+    return sentence, mask, result
 def app():
     st.title("RoBERTa Marathi")
+    st.markdown(
+        "This demo uses [RoBERTa for Marathi](https://huggingface.co/flax-community/roberta-base-mr) model "
+        "trained on [mC4](https://huggingface.co/datasets/mc4)."
+    )
+    st.markdown(
+        "Can't figure out where to get a sample text? Visit this "
+        "[link](https://maharashtratimes.com/entertainment/articlelist/19359255.cms), copy any headline and mask a word."
+    )
     masked_texts = [
         "मोठी बातमी! उद्या दुपारी <mask> वाजता जाहीर होणार दहावीचा निकाल",
         "अध्यक्ष <mask> पवार आणि उपमुख्यमंत्री अजित पवार यांची भेट घेतली.",
     if fill_button:
         with st.spinner("Filling the Mask..."):
+            filled_sentence, mask, raw_json = load_model(masked_text, cfg["models"]["RoBERTa"])
             st.markdown(f"**Filled sentence: **{filled_sentence}")
             st.markdown(f"**Predicted masked token: **{mask}")
+            st.write(raw_json)