Spaces:
Runtime error
Runtime error
added measures
Browse files
app.py
CHANGED
|
@@ -1,6 +1,7 @@
|
|
| 1 |
from deepmultilingualpunctuation import PunctuationModel
|
| 2 |
import gradio as gr
|
| 3 |
import re
|
|
|
|
| 4 |
|
| 5 |
# https://stackoverflow.com/questions/22800401/how-to-capitalize-the-first-letter-of-every-sentence
|
| 6 |
def cap(match):
|
|
@@ -73,7 +74,12 @@ def predict(brakes, transcript):
|
|
| 73 |
regex3 = r"^\w"
|
| 74 |
pcnt_file_cr_cap = re.sub(regex3, lambda x: x.group().upper(), re.sub(regex2, lambda x: x.group().upper(), re.sub(regex1, "I", pcnt_file_cr)))
|
| 75 |
|
| 76 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 77 |
|
| 78 |
if __name__ == "__main__":
|
| 79 |
|
|
@@ -85,9 +91,13 @@ Model restores punctuation and case i.e. of the following punctuations -- [! ? .
|
|
| 85 |
examples = [['sentences', "my name is clara i live in berkeley california"]]
|
| 86 |
|
| 87 |
interface = gr.Interface(fn = predict,
|
| 88 |
-
inputs = [gr.Radio(["no brakes","sentences", "textlines"], value="no brakes", label="line brakes"),
|
| 89 |
"text"],
|
| 90 |
-
outputs
|
|
|
|
|
|
|
|
|
|
|
|
|
| 91 |
title = title,
|
| 92 |
description = description,
|
| 93 |
examples=examples,
|
|
|
|
| 1 |
from deepmultilingualpunctuation import PunctuationModel
|
| 2 |
import gradio as gr
|
| 3 |
import re
|
| 4 |
+
import metrics
|
| 5 |
|
| 6 |
# https://stackoverflow.com/questions/22800401/how-to-capitalize-the-first-letter-of-every-sentence
|
| 7 |
def cap(match):
|
|
|
|
| 74 |
regex3 = r"^\w"
|
| 75 |
pcnt_file_cr_cap = re.sub(regex3, lambda x: x.group().upper(), re.sub(regex2, lambda x: x.group().upper(), re.sub(regex1, "I", pcnt_file_cr)))
|
| 76 |
|
| 77 |
+
n_tokens= metrics.num_tokens(pcnt_file_cr_cap)
|
| 78 |
+
n_sents = metrics.num_sentences(pcnt_file_cr_cap)
|
| 79 |
+
n_words = metrics.num_words(pcnt_file_cr_cap)
|
| 80 |
+
n_chars = metrics.num_chars(pcnt_file_cr_cap)
|
| 81 |
+
|
| 82 |
+
return pcnt_file_cr_cap, n_words, n_sents, n_chars, n_tokens
|
| 83 |
|
| 84 |
if __name__ == "__main__":
|
| 85 |
|
|
|
|
| 91 |
examples = [['sentences', "my name is clara i live in berkeley california"]]
|
| 92 |
|
| 93 |
interface = gr.Interface(fn = predict,
|
| 94 |
+
inputs = [gr.Radio(["no brakes","sentences", "textlines"], value="no brakes", label="preserve line brakes"),
|
| 95 |
"text"],
|
| 96 |
+
outputs=[gr.Textbox(label="Punctuated Transcript"),
|
| 97 |
+
gr.Number(label="Number of Words"),
|
| 98 |
+
gr.Number(label="Number of Sentences"),
|
| 99 |
+
gr.Number(label="Number of Characters"),
|
| 100 |
+
gr.Number(label="Number of Tokens")],
|
| 101 |
title = title,
|
| 102 |
description = description,
|
| 103 |
examples=examples,
|