Spaces:
Sleeping
Sleeping
Create stats_data.py
Browse files- stats_data.py +34 -0
stats_data.py
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import pandas as pd
|
| 2 |
+
|
| 3 |
+
# Metadata for speakers available in the demo
|
| 4 |
+
SPEAKER_META = {
|
| 5 |
+
"M05": {"Gender": "Male", "Severity": "Severe", "Dataset": "Torgo"},
|
| 6 |
+
"F01": {"Gender": "Female", "Severity": "Severe", "Dataset": "Torgo"},
|
| 7 |
+
"M01": {"Gender": "Male", "Severity": "Moderate", "Dataset": "Torgo"},
|
| 8 |
+
"M04": {"Gender": "Male", "Severity": "Moderate", "Dataset": "Torgo"},
|
| 9 |
+
"M02": {"Gender": "Male", "Severity": "Mild", "Dataset": "Torgo"},
|
| 10 |
+
"M03": {"Gender": "Male", "Severity": "Mild", "Dataset": "Torgo"},
|
| 11 |
+
"F03": {"Gender": "Female", "Severity": "Mild", "Dataset": "Torgo"},
|
| 12 |
+
"F04": {"Gender": "Female", "Severity": "Mild", "Dataset": "Torgo"},
|
| 13 |
+
"F02 (UA)": {"Gender": "Female", "Severity": "Severe (Isolated)", "Dataset": "UA-Speech"}
|
| 14 |
+
}
|
| 15 |
+
|
| 16 |
+
def get_indomain_breakdown():
|
| 17 |
+
data = {
|
| 18 |
+
"Speaker": ["M05", "F01", "M01", "M04", "M02", "M03", "F03", "F04"],
|
| 19 |
+
"Severity": ["Severe", "Severe", "Moderate", "Moderate", "Mild", "Mild", "Mild", "Mild"],
|
| 20 |
+
"Whisper Tiny": ["12.1%", "12.6%", "32.7%", "31.8%", "62.1%", "58.4%", "61.2%", "59.1%"],
|
| 21 |
+
"5K Model (Ours)": ["33.1%", "34.2%", "47.2%", "45.6%", "84.5%", "81.8%", "83.5%", "82.8%"],
|
| 22 |
+
"10K Model (Ours)": ["25.4%", "24.1%", "44.1%", "41.2%", "79.1%", "77.5%", "79.0%", "78.2%"]
|
| 23 |
+
}
|
| 24 |
+
return pd.DataFrame(data)
|
| 25 |
+
|
| 26 |
+
def get_experimental_summary():
|
| 27 |
+
data = {
|
| 28 |
+
"Experiment Condition": ["In-Domain (Seen Torgo)", "LOSO (Unseen Torgo F01)", "Zero-Shot (UA-Speech F02)"],
|
| 29 |
+
"Whisper Tiny (Baseline)": ["41.50%", "12.38%", "4.33%"],
|
| 30 |
+
"5K Pure Model Score": ["58.77%", "N/A", "6.19%"],
|
| 31 |
+
"10K Triple-Mix Score": ["54.67%", "24.76%", "5.98%"],
|
| 32 |
+
"Relative Gain (Best vs Baseline)": ["+41.6%", "+100.0%", "+42.9%"]
|
| 33 |
+
}
|
| 34 |
+
return pd.DataFrame(data)
|