陈俊杰
committed on
Commit
·
1fd8f1d
1
Parent(s):
819591b
cjj-leaderboard
Browse files
app.py
CHANGED
|
@@ -219,7 +219,7 @@ This leaderboard is used to show the performance of the <strong>automatic evalua
|
|
| 219 |
data = {
|
| 220 |
('', 'teamId'): ['baseline', 'baseline', 'baseline', 'baseline'],
|
| 221 |
('', 'methods'): ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o-mini"],
|
| 222 |
-
('', 'overall'): [],
|
| 223 |
('Dialogue Generation', 'accuracy'): [0.5806, 0.5483, 0.6001, 0.6472],
|
| 224 |
('Dialogue Generation', "kendall's tau"): [0.3243, 0.1739, 0.3042, 0.4167],
|
| 225 |
('Dialogue Generation', 'spearman'): [0.3505, 0.1857, 0.3264, 0.4512],
|
|
@@ -233,17 +233,18 @@ This leaderboard is used to show the performance of the <strong>automatic evalua
|
|
| 233 |
('Non-Factoid QA', "kendall's tau"): [0.2332, 0.2389, 0.4440, 0.4235],
|
| 234 |
('Non-Factoid QA', 'spearman'): [0.2443, 0.2492, 0.4630, 0.4511]
|
| 235 |
}
|
| 236 |
-
overall = [0, 0, 0, 0]
|
| 237 |
-
for d in data:
|
| 238 |
-
|
| 239 |
-
|
| 240 |
-
|
| 241 |
-
overall = [i / (3*4) for i in overall]
|
| 242 |
-
data[('', 'overall')] = overall
|
| 243 |
-
for d in data:
|
| 244 |
-
|
| 245 |
-
|
| 246 |
-
|
|
|
|
| 247 |
st.dataframe(data, use_container_width=True)
|
| 248 |
# # teamId 唯一标识码
|
| 249 |
# DG = {
|
|
|
|
| 219 |
data = {
|
| 220 |
('', 'teamId'): ['baseline', 'baseline', 'baseline', 'baseline'],
|
| 221 |
('', 'methods'): ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o-mini"],
|
| 222 |
+
('', 'overall'): [0,0,0,0],
|
| 223 |
('Dialogue Generation', 'accuracy'): [0.5806, 0.5483, 0.6001, 0.6472],
|
| 224 |
('Dialogue Generation', "kendall's tau"): [0.3243, 0.1739, 0.3042, 0.4167],
|
| 225 |
('Dialogue Generation', 'spearman'): [0.3505, 0.1857, 0.3264, 0.4512],
|
|
|
|
| 233 |
('Non-Factoid QA', "kendall's tau"): [0.2332, 0.2389, 0.4440, 0.4235],
|
| 234 |
('Non-Factoid QA', 'spearman'): [0.2443, 0.2492, 0.4630, 0.4511]
|
| 235 |
}
|
| 236 |
+
# overall = [0, 0, 0, 0]
|
| 237 |
+
# for d in data:
|
| 238 |
+
# if d != ('', 'teamId') and d != ('', 'methods') and d != ('', 'overall'):
|
| 239 |
+
# for i in range(4):
|
| 240 |
+
# overall[i] += data[d][i]
|
| 241 |
+
# overall = [i / (3*4) for i in overall]
|
| 242 |
+
# data[('', 'overall')] = overall
|
| 243 |
+
# for d in data:
|
| 244 |
+
# if d != ('', 'teamId') and d != ('', 'methods'):
|
| 245 |
+
# for col in range(len(data[d])):
|
| 246 |
+
# data[d][col] = "{:.4f}".format(data[d][col])
|
| 247 |
+
# print(data)
|
| 248 |
st.dataframe(data, use_container_width=True)
|
| 249 |
# # teamId 唯一标识码
|
| 250 |
# DG = {
|
test.py
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
data = {
|
| 2 |
('', 'teamId'): ['baseline', 'baseline', 'baseline', 'baseline'],
|
| 3 |
('', 'methods'): ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o-mini"],
|
| 4 |
-
('', 'overall'): [],
|
| 5 |
('Dialogue Generation', 'accuracy'): [0.5806, 0.5483, 0.6001, 0.6472],
|
| 6 |
('Dialogue Generation', "kendall's tau"): [0.3243, 0.1739, 0.3042, 0.4167],
|
| 7 |
('Dialogue Generation', 'spearman'): [0.3505, 0.1857, 0.3264, 0.4512],
|
|
@@ -17,11 +17,14 @@ data = {
|
|
| 17 |
}
|
| 18 |
|
| 19 |
overall = [0, 0, 0, 0]
|
| 20 |
-
|
| 21 |
for d in data:
|
| 22 |
if d != ('', 'teamId') and d != ('', 'methods') and d != ('', 'overall'):
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
|
| 26 |
overall = [i / (3*4) for i in overall]
|
| 27 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
data = {
|
| 2 |
('', 'teamId'): ['baseline', 'baseline', 'baseline', 'baseline'],
|
| 3 |
('', 'methods'): ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o-mini"],
|
| 4 |
+
('', 'overall'): [0,0,0,0],
|
| 5 |
('Dialogue Generation', 'accuracy'): [0.5806, 0.5483, 0.6001, 0.6472],
|
| 6 |
('Dialogue Generation', "kendall's tau"): [0.3243, 0.1739, 0.3042, 0.4167],
|
| 7 |
('Dialogue Generation', 'spearman'): [0.3505, 0.1857, 0.3264, 0.4512],
|
|
|
|
| 17 |
}
|
| 18 |
|
| 19 |
overall = [0, 0, 0, 0]
|
|
|
|
| 20 |
for d in data:
|
| 21 |
if d != ('', 'teamId') and d != ('', 'methods') and d != ('', 'overall'):
|
| 22 |
+
for i in range(4):
|
| 23 |
+
overall[i] += data[d][i]
|
|
|
|
| 24 |
overall = [i / (3*4) for i in overall]
|
| 25 |
+
data[('', 'overall')] = overall
|
| 26 |
+
for d in data:
|
| 27 |
+
if d != ('', 'teamId') and d != ('', 'methods'):
|
| 28 |
+
for col in range(len(data[d])):
|
| 29 |
+
data[d][col] = "{:.4f}".format(data[d][col])
|
| 30 |
+
print(data)
|