Upload ablation summaries
Browse files
mbert_paper_metrics/docs/ablation_results.csv
CHANGED
|
@@ -90,6 +90,7 @@ result_ablation_mbert_paper,vsfc,mBERT,mha_attention,42,eval_accuracy,0.93303853
|
|
| 90 |
result_ablation_mbert_paper,vsfc,mBERT,mha_attention,43,eval_accuracy,0.9330385344283006,0.21815043687820435,0.22466682554124953,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_43/all_results.json
|
| 91 |
result_ablation_mbert_paper,vsfc,mBERT,mha_attention,44,eval_accuracy,0.934301958307012,0.21530689299106598,0.22445858664168067,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_44/all_results.json
|
| 92 |
result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,42,eval_accuracy,0.9355653821857233,0.2141973078250885,0.21831525011218234,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_42/all_results.json
|
|
|
|
| 93 |
result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,44,eval_accuracy,0.9317751105495894,0.21137550473213196,0.2217927779351081,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_44/all_results.json
|
| 94 |
result_ablation_mbert_paper,vsfc,mBERT,gated_multi_branch,42,eval_accuracy,0.9374605180037903,0.22037982940673828,0.2221188189544322,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_42/all_results.json
|
| 95 |
result_ablation_mbert_paper,vsfc,mBERT,gated_multi_branch,43,eval_accuracy,0.932406822488945,0.2144102156162262,0.22194261373061955,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_43/all_results.json
|
|
|
|
| 90 |
result_ablation_mbert_paper,vsfc,mBERT,mha_attention,43,eval_accuracy,0.9330385344283006,0.21815043687820435,0.22466682554124953,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_43/all_results.json
|
| 91 |
result_ablation_mbert_paper,vsfc,mBERT,mha_attention,44,eval_accuracy,0.934301958307012,0.21530689299106598,0.22445858664168067,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_44/all_results.json
|
| 92 |
result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,42,eval_accuracy,0.9355653821857233,0.2141973078250885,0.21831525011218234,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_42/all_results.json
|
| 93 |
+
result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,43,eval_accuracy,0.9317751105495894,0.20609119534492493,0.2264852445998114,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_43/all_results.json
|
| 94 |
result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,44,eval_accuracy,0.9317751105495894,0.21137550473213196,0.2217927779351081,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_44/all_results.json
|
| 95 |
result_ablation_mbert_paper,vsfc,mBERT,gated_multi_branch,42,eval_accuracy,0.9374605180037903,0.22037982940673828,0.2221188189544322,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_42/all_results.json
|
| 96 |
result_ablation_mbert_paper,vsfc,mBERT,gated_multi_branch,43,eval_accuracy,0.932406822488945,0.2144102156162262,0.22194261373061955,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_43/all_results.json
|
mbert_paper_metrics/docs/ablation_results_aggregate.csv
CHANGED
|
@@ -30,4 +30,4 @@ result_ablation_mbert_paper,vsfc,mBERT,hf_sequence_classifier,eval_accuracy,3,0.
|
|
| 30 |
result_ablation_mbert_paper,vsfc,mBERT,max,eval_accuracy,3,0.9340913876605601,0.0007294381164745449,0.9336702463676564,0.9349336702463676
|
| 31 |
result_ablation_mbert_paper,vsfc,mBERT,mean,eval_accuracy,3,0.9334596757212045,0.0013150132656134848,0.932406822488945,0.9349336702463676
|
| 32 |
result_ablation_mbert_paper,vsfc,mBERT,mha_attention,eval_accuracy,3,0.9334596757212045,0.0007294381164746089,0.9330385344283006,0.934301958307012
|
| 33 |
-
result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,eval_accuracy,
|
|
|
|
| 30 |
result_ablation_mbert_paper,vsfc,mBERT,max,eval_accuracy,3,0.9340913876605601,0.0007294381164745449,0.9336702463676564,0.9349336702463676
|
| 31 |
result_ablation_mbert_paper,vsfc,mBERT,mean,eval_accuracy,3,0.9334596757212045,0.0013150132656134848,0.932406822488945,0.9349336702463676
|
| 32 |
result_ablation_mbert_paper,vsfc,mBERT,mha_attention,eval_accuracy,3,0.9334596757212045,0.0007294381164746089,0.9330385344283006,0.934301958307012
|
| 33 |
+
result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,eval_accuracy,3,0.9330385344283006,0.0021883143494236985,0.9317751105495894,0.9355653821857233
|
mbert_paper_metrics/docs/ablation_summary.md
CHANGED
|
@@ -36,7 +36,7 @@ Main metric is selected per task: CoLA uses Matthews correlation; MRPC/QQP/STSB
|
|
| 36 |
| result_ablation_mbert_paper | vsfc | mBERT | max | eval_accuracy | 3 | 0.9341 | 0.0007 | 0.9337 | 0.9349 |
|
| 37 |
| result_ablation_mbert_paper | vsfc | mBERT | mean | eval_accuracy | 3 | 0.9335 | 0.0013 | 0.9324 | 0.9349 |
|
| 38 |
| result_ablation_mbert_paper | vsfc | mBERT | mha_attention | eval_accuracy | 3 | 0.9335 | 0.0007 | 0.9330 | 0.9343 |
|
| 39 |
-
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | eval_accuracy |
|
| 40 |
|
| 41 |
## Gated Multi-Branch Deltas
|
| 42 |
| source | task | model | baseline | gated_mean | baseline_mean | delta |
|
|
@@ -55,7 +55,7 @@ Main metric is selected per task: CoLA uses Matthews correlation; MRPC/QQP/STSB
|
|
| 55 |
| result_ablation_mbert_paper | sst2 | mBERT | hf_sequence_classifier | 0.8758 | 0.8788 | -0.0031 |
|
| 56 |
| result_ablation_mbert_paper | vsfc | mBERT | attention | 0.9326 | 0.9337 | -0.0011 |
|
| 57 |
| result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 0.9326 | 0.9335 | -0.0008 |
|
| 58 |
-
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 0.9326 | 0.
|
| 59 |
| result_ablation_mbert_paper | vsfc | mBERT | hf_sequence_classifier | 0.9326 | 0.9318 | 0.0008 |
|
| 60 |
|
| 61 |
## Raw Runs
|
|
@@ -152,6 +152,7 @@ Main metric is selected per task: CoLA uses Matthews correlation; MRPC/QQP/STSB
|
|
| 152 |
| result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 43.0000 | eval_accuracy | 0.9330 | 0.2182 | 0.2247 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_43/all_results.json |
|
| 153 |
| result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 44.0000 | eval_accuracy | 0.9343 | 0.2153 | 0.2245 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_44/all_results.json |
|
| 154 |
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 42.0000 | eval_accuracy | 0.9356 | 0.2142 | 0.2183 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_42/all_results.json |
|
|
|
|
| 155 |
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 44.0000 | eval_accuracy | 0.9318 | 0.2114 | 0.2218 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_44/all_results.json |
|
| 156 |
| result_ablation_mbert_paper | vsfc | mBERT | gated_multi_branch | 42.0000 | eval_accuracy | 0.9375 | 0.2204 | 0.2221 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_42/all_results.json |
|
| 157 |
| result_ablation_mbert_paper | vsfc | mBERT | gated_multi_branch | 43.0000 | eval_accuracy | 0.9324 | 0.2144 | 0.2219 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_43/all_results.json |
|
|
|
|
| 36 |
| result_ablation_mbert_paper | vsfc | mBERT | max | eval_accuracy | 3 | 0.9341 | 0.0007 | 0.9337 | 0.9349 |
|
| 37 |
| result_ablation_mbert_paper | vsfc | mBERT | mean | eval_accuracy | 3 | 0.9335 | 0.0013 | 0.9324 | 0.9349 |
|
| 38 |
| result_ablation_mbert_paper | vsfc | mBERT | mha_attention | eval_accuracy | 3 | 0.9335 | 0.0007 | 0.9330 | 0.9343 |
|
| 39 |
+
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | eval_accuracy | 3 | 0.9330 | 0.0022 | 0.9318 | 0.9356 |
|
| 40 |
|
| 41 |
## Gated Multi-Branch Deltas
|
| 42 |
| source | task | model | baseline | gated_mean | baseline_mean | delta |
|
|
|
|
| 55 |
| result_ablation_mbert_paper | sst2 | mBERT | hf_sequence_classifier | 0.8758 | 0.8788 | -0.0031 |
|
| 56 |
| result_ablation_mbert_paper | vsfc | mBERT | attention | 0.9326 | 0.9337 | -0.0011 |
|
| 57 |
| result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 0.9326 | 0.9335 | -0.0008 |
|
| 58 |
+
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 0.9326 | 0.9330 | -0.0004 |
|
| 59 |
| result_ablation_mbert_paper | vsfc | mBERT | hf_sequence_classifier | 0.9326 | 0.9318 | 0.0008 |
|
| 60 |
|
| 61 |
## Raw Runs
|
|
|
|
| 152 |
| result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 43.0000 | eval_accuracy | 0.9330 | 0.2182 | 0.2247 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_43/all_results.json |
|
| 153 |
| result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 44.0000 | eval_accuracy | 0.9343 | 0.2153 | 0.2245 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_44/all_results.json |
|
| 154 |
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 42.0000 | eval_accuracy | 0.9356 | 0.2142 | 0.2183 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_42/all_results.json |
|
| 155 |
+
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 43.0000 | eval_accuracy | 0.9318 | 0.2061 | 0.2265 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_43/all_results.json |
|
| 156 |
| result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 44.0000 | eval_accuracy | 0.9318 | 0.2114 | 0.2218 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_44/all_results.json |
|
| 157 |
| result_ablation_mbert_paper | vsfc | mBERT | gated_multi_branch | 42.0000 | eval_accuracy | 0.9375 | 0.2204 | 0.2221 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_42/all_results.json |
|
| 158 |
| result_ablation_mbert_paper | vsfc | mBERT | gated_multi_branch | 43.0000 | eval_accuracy | 0.9324 | 0.2144 | 0.2219 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_43/all_results.json |
|