Spaces:
Sleeping
Sleeping
Hynek Kydlíček
commited on
Commit
·
861d5e9
1
Parent(s):
5259ca7
freeze version
Browse files- app.py +16 -14
- requirements.txt +3 -3
app.py
CHANGED
|
@@ -1,13 +1,19 @@
|
|
| 1 |
from html import unescape
|
| 2 |
from unicodedata import normalize
|
| 3 |
import gradio as gr
|
| 4 |
-
from transformers import pipeline
|
| 5 |
import re
|
| 6 |
|
| 7 |
re_multispace = re.compile(r"\s+")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8 |
|
| 9 |
def normalize_text(text):
|
| 10 |
-
if text
|
| 11 |
return None
|
| 12 |
|
| 13 |
text = text.strip()
|
|
@@ -20,28 +26,24 @@ def normalize_text(text):
|
|
| 20 |
return text
|
| 21 |
|
| 22 |
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
]
|
| 26 |
-
|
| 27 |
-
pipelines = {model: pipeline(task="text-classification",
|
| 28 |
-
model=f"hynky/{model.replace(' ', '_')}", tokenizer="ufal/robeczech-base",
|
| 29 |
truncation=True, max_length=512,
|
| 30 |
top_k=5
|
| 31 |
-
) for model in
|
| 32 |
|
| 33 |
|
| 34 |
def predict(article):
|
| 35 |
article = normalize_text(article)
|
| 36 |
-
predictions = [pipelines[model](article)[0] for model in
|
| 37 |
predictions = [{pred["label"]: round(pred["score"], 3) for pred in task_preds} for task_preds in predictions]
|
| 38 |
-
return
|
| 39 |
|
| 40 |
gr.Interface(
|
| 41 |
predict,
|
| 42 |
-
inputs=gr.
|
| 43 |
# multioutput of gradio text
|
| 44 |
-
outputs=[gr.
|
| 45 |
-
for
|
| 46 |
title="News Article Classifier",
|
| 47 |
).launch()
|
|
|
|
| 1 |
from html import unescape
|
| 2 |
from unicodedata import normalize
|
| 3 |
import gradio as gr
|
| 4 |
+
from transformers import pipeline, AutoModel
|
| 5 |
import re
|
| 6 |
|
| 7 |
re_multispace = re.compile(r"\s+")
|
| 8 |
+
model_task_mapping = {
|
| 9 |
+
"Server": "Server",
|
| 10 |
+
"Category": "Category",
|
| 11 |
+
"Gender": "Gender",
|
| 12 |
+
"Day Of Week": "Day_of_week"
|
| 13 |
+
}
|
| 14 |
|
| 15 |
def normalize_text(text):
|
| 16 |
+
if text is None:
|
| 17 |
return None
|
| 18 |
|
| 19 |
text = text.strip()
|
|
|
|
| 26 |
return text
|
| 27 |
|
| 28 |
|
| 29 |
+
pipelines = {task: pipeline(task="text-classification",
|
| 30 |
+
model=f"hynky/{model}", tokenizer="ufal/robeczech-base",
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
truncation=True, max_length=512,
|
| 32 |
top_k=5
|
| 33 |
+
) for task, model in model_task_mapping.items()}
|
| 34 |
|
| 35 |
|
| 36 |
def predict(article):
|
| 37 |
article = normalize_text(article)
|
| 38 |
+
predictions = [pipelines[model](article)[0] for model in model_task_mapping.keys()]
|
| 39 |
predictions = [{pred["label"]: round(pred["score"], 3) for pred in task_preds} for task_preds in predictions]
|
| 40 |
+
return predictions
|
| 41 |
|
| 42 |
gr.Interface(
|
| 43 |
predict,
|
| 44 |
+
inputs=gr.Textbox(lines=4, placeholder="Paste a news article here..."),
|
| 45 |
# multioutput of gradio text
|
| 46 |
+
outputs=[gr.Label(num_top_classes=5, label=task)
|
| 47 |
+
for task in model_task_mapping.keys()],
|
| 48 |
title="News Article Classifier",
|
| 49 |
).launch()
|
requirements.txt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
-
transformers
|
| 2 |
-
torch
|
| 3 |
-
gradio==3.26
|
|
|
|
| 1 |
+
transformers==0.1.1
|
| 2 |
+
torch==2.1.0
|
| 3 |
+
gradio==0.3.26
|