Spaces:

darkproger
/

propaganda

Build error

App Files Files Community

darkproger committed on Nov 4, 2021

Commit

efb23c9

1 Parent(s): 766dac7

use st.metric for sequence logits

Browse files

Files changed (1) hide show

app.py +22 -15

app.py CHANGED Viewed

@@ -7,7 +7,8 @@ import streamlit as st
 import torch
 from transformers import BertTokenizerFast
-from model import BertForTokenAndSequenceJointClassification, TOKEN_TAGS
 @st.cache(allow_output_mutation=True)
 def load_model():
@@ -16,22 +17,28 @@ def load_model():
             "QCRI/PropagandaTechniquesAnalysis-en-BERT",
              revision="v0.1.0")
     return tokenizer, model
-tokenizer, model = load_model()
-st.write("[Propaganda Techniques Analysis BERT](https://huggingface.co/QCRI/PropagandaTechniquesAnalysis-en-BERT) Tagger")
-input = st.text_area('Input', """\
-In some instances, it can be highly dangerous to use a medicine for the prevention or treatment of COVID-19 that has not been approved by or has not received emergency use authorization from the FDA.
-""")
-inputs = tokenizer.encode_plus(input, return_tensors="pt")
-outputs = model(**inputs)
-sequence_class_index = torch.argmax(outputs.sequence_logits, dim=-1)
-sequence_class = model.sequence_tags[sequence_class_index[0]]
-token_class_index = torch.argmax(outputs.token_logits, dim=-1)
-tokens = tokenizer.convert_ids_to_tokens(inputs.input_ids[0][1:-1])
-tags = [model.token_tags[i] for i in token_class_index[0].tolist()[1:-1]]
 spaces = [not tok.startswith('##') for tok in tokens][1:] + [False]
@@ -40,7 +47,7 @@ doc = Doc(Vocab(strings=set(tokens)),
           spaces=spaces,
           ents=[tag if tag == "O" else f"B-{tag}" for tag in tags])
-labels = TOKEN_TAGS[2:]
 label_select = st.multiselect(
     "Tags",

 import torch
 from transformers import BertTokenizerFast
+from model import BertForTokenAndSequenceJointClassification
 @st.cache(allow_output_mutation=True)
 def load_model():
             "QCRI/PropagandaTechniquesAnalysis-en-BERT",
              revision="v0.1.0")
     return tokenizer, model
+with torch.inference_mode(True):
+    tokenizer, model = load_model()
+    st.write("[Propaganda Techniques Analysis BERT](https://huggingface.co/QCRI/PropagandaTechniquesAnalysis-en-BERT) Tagger")
+    input = st.text_area('Input', """\
+    In some instances, it can be highly dangerous to use a medicine for the prevention or treatment of COVID-19 that has not been approved by or has not received emergency use authorization from the FDA.
+    """)
+    inputs = tokenizer.encode_plus(input, return_tensors="pt")
+    outputs = model(**inputs)
+    sequence_class_index = torch.argmax(outputs.sequence_logits, dim=-1)
+    sequence_class = model.sequence_tags[sequence_class_index[0]]
+    token_class_index = torch.argmax(outputs.token_logits, dim=-1)
+    tokens = tokenizer.convert_ids_to_tokens(inputs.input_ids[0][1:-1])
+    tags = [model.token_tags[i] for i in token_class_index[0].tolist()[1:-1]]
+columns = st.columns(len(outputs.sequence_logits.flatten()))
+for col, sequence_tag, logit in zip(columns, model.sequence_tags, outputs.sequence_logits.flatten()):
+    col.metric(sequence_tag, '%.2f' % logit.item())
 spaces = [not tok.startswith('##') for tok in tokens][1:] + [False]
           spaces=spaces,
           ents=[tag if tag == "O" else f"B-{tag}" for tag in tags])
+labels = model.token_tags[2:]
 label_select = st.multiselect(
     "Tags",