deeppunct-gr

Runtime error

App Files Community

wldmr committed on Apr 1, 2023

Commit

22e7a05

1 Parent(s): 25e3dec

added measures

Browse files

Files changed (1) hide show

app.py +13 -3

app.py CHANGED Viewed

@@ -1,6 +1,7 @@
 from deepmultilingualpunctuation import PunctuationModel
 import gradio as gr
 import re
 # https://stackoverflow.com/questions/22800401/how-to-capitalize-the-first-letter-of-every-sentence
 def cap(match):
@@ -73,7 +74,12 @@ def predict(brakes, transcript):
     regex3 = r"^\w"
     pcnt_file_cr_cap = re.sub(regex3, lambda x: x.group().upper(), re.sub(regex2, lambda x: x.group().upper(), re.sub(regex1, "I", pcnt_file_cr)))
-    return pcnt_file_cr_cap
 if __name__ == "__main__":
@@ -85,9 +91,13 @@ Model restores punctuation and case i.e. of the following punctuations -- [! ? .
     examples = [['sentences', "my name is clara i live in berkeley california"]]
     interface = gr.Interface(fn = predict,
-                         inputs = [gr.Radio(["no brakes","sentences", "textlines"], value="no brakes", label="line brakes"),
                                    "text"],
-                         outputs = ["text"],
                          title = title,
                          description = description,
                          examples=examples,

 from deepmultilingualpunctuation import PunctuationModel
 import gradio as gr
 import re
+import metrics
 # https://stackoverflow.com/questions/22800401/how-to-capitalize-the-first-letter-of-every-sentence
 def cap(match):
     regex3 = r"^\w"
     pcnt_file_cr_cap = re.sub(regex3, lambda x: x.group().upper(), re.sub(regex2, lambda x: x.group().upper(), re.sub(regex1, "I", pcnt_file_cr)))
+    n_tokens= metrics.num_tokens(pcnt_file_cr_cap)
+    n_sents = metrics.num_sentences(pcnt_file_cr_cap)
+    n_words = metrics.num_words(pcnt_file_cr_cap)
+    n_chars = metrics.num_chars(pcnt_file_cr_cap)
+    return pcnt_file_cr_cap, n_words, n_sents, n_chars, n_tokens
 if __name__ == "__main__":
     examples = [['sentences', "my name is clara i live in berkeley california"]]
     interface = gr.Interface(fn = predict,
+                         inputs = [gr.Radio(["no brakes","sentences", "textlines"], value="no brakes", label="preserve line brakes"),
                                    "text"],
+                         outputs=[gr.Textbox(label="Punctuated Transcript"),
+                                    gr.Number(label="Number of Words"),
+                                    gr.Number(label="Number of Sentences"),
+                                    gr.Number(label="Number of Characters"),
+                                    gr.Number(label="Number of Tokens")],
                          title = title,
                          description = description,
                          examples=examples,