Spaces:
Sleeping
Sleeping
Commit
·
43e2fd9
1
Parent(s):
a188b38
Add other datasets
Browse files
app.py
CHANGED
|
@@ -4,9 +4,6 @@ import streamlit as st
|
|
| 4 |
from datasets import load_dataset
|
| 5 |
from annotated_text import annotated_text
|
| 6 |
|
| 7 |
-
# Load data
|
| 8 |
-
ds = load_dataset("hs-knowledge/hateval_enriched")
|
| 9 |
-
|
| 10 |
|
| 11 |
# Show highlighted ner entities in a tweet
|
| 12 |
def display_ner(example):
|
|
@@ -69,9 +66,9 @@ def display_ner(example):
|
|
| 69 |
annotated_text(*chunks)
|
| 70 |
|
| 71 |
|
| 72 |
-
def display_text(example):
|
| 73 |
# Use annotated_text to show entities
|
| 74 |
-
text = example["text"]
|
| 75 |
|
| 76 |
# Sort entities by start
|
| 77 |
entities = sorted(example["entities"], key=lambda x: x["start"])
|
|
@@ -110,7 +107,20 @@ def display_text(example):
|
|
| 110 |
annotated_text(*chunks)
|
| 111 |
|
| 112 |
|
| 113 |
-
#
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 114 |
|
| 115 |
elements = random.choices(range(len(ds["train"])), k=50)
|
| 116 |
ds["train"] = ds["train"].select(elements)
|
|
|
|
| 4 |
from datasets import load_dataset
|
| 5 |
from annotated_text import annotated_text
|
| 6 |
|
|
|
|
|
|
|
|
|
|
| 7 |
|
| 8 |
# Show highlighted ner entities in a tweet
|
| 9 |
def display_ner(example):
|
|
|
|
| 66 |
annotated_text(*chunks)
|
| 67 |
|
| 68 |
|
| 69 |
+
def display_text(example, text_column):
|
| 70 |
# Use annotated_text to show entities
|
| 71 |
+
text = example[text_column]
|
| 72 |
|
| 73 |
# Sort entities by start
|
| 74 |
entities = sorted(example["entities"], key=lambda x: x["start"])
|
|
|
|
| 107 |
annotated_text(*chunks)
|
| 108 |
|
| 109 |
|
| 110 |
+
# selectbox to choose dataset
|
| 111 |
+
|
| 112 |
+
selected_dataset = st.sidebar.selectbox(
|
| 113 |
+
"Select dataset", ["hateval_enriched", "sbf-enriched", "hatecheck-enriched"]
|
| 114 |
+
)
|
| 115 |
+
|
| 116 |
+
# Load data
|
| 117 |
+
ds = load_dataset(f"hs-knowledge/{selected_dataset}")
|
| 118 |
+
|
| 119 |
+
text_column = {
|
| 120 |
+
"hateval_enriched": "text",
|
| 121 |
+
"sbf-enriched": "post",
|
| 122 |
+
"hatecheck-enriched": "test_case",
|
| 123 |
+
}
|
| 124 |
|
| 125 |
elements = random.choices(range(len(ds["train"])), k=50)
|
| 126 |
ds["train"] = ds["train"].select(elements)
|