PuxAI committed on
Commit
4a0de40
·
verified ·
1 Parent(s): 9479697

Upload ablation summaries

Browse files
mbert_paper_metrics/docs/ablation_results.csv CHANGED
@@ -90,6 +90,7 @@ result_ablation_mbert_paper,vsfc,mBERT,mha_attention,42,eval_accuracy,0.93303853
90
  result_ablation_mbert_paper,vsfc,mBERT,mha_attention,43,eval_accuracy,0.9330385344283006,0.21815043687820435,0.22466682554124953,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_43/all_results.json
91
  result_ablation_mbert_paper,vsfc,mBERT,mha_attention,44,eval_accuracy,0.934301958307012,0.21530689299106598,0.22445858664168067,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_44/all_results.json
92
  result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,42,eval_accuracy,0.9355653821857233,0.2141973078250885,0.21831525011218234,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_42/all_results.json
 
93
  result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,44,eval_accuracy,0.9317751105495894,0.21137550473213196,0.2217927779351081,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_44/all_results.json
94
  result_ablation_mbert_paper,vsfc,mBERT,gated_multi_branch,42,eval_accuracy,0.9374605180037903,0.22037982940673828,0.2221188189544322,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_42/all_results.json
95
  result_ablation_mbert_paper,vsfc,mBERT,gated_multi_branch,43,eval_accuracy,0.932406822488945,0.2144102156162262,0.22194261373061955,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_43/all_results.json
 
90
  result_ablation_mbert_paper,vsfc,mBERT,mha_attention,43,eval_accuracy,0.9330385344283006,0.21815043687820435,0.22466682554124953,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_43/all_results.json
91
  result_ablation_mbert_paper,vsfc,mBERT,mha_attention,44,eval_accuracy,0.934301958307012,0.21530689299106598,0.22445858664168067,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_44/all_results.json
92
  result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,42,eval_accuracy,0.9355653821857233,0.2141973078250885,0.21831525011218234,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_42/all_results.json
93
+ result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,43,eval_accuracy,0.9317751105495894,0.20609119534492493,0.2264852445998114,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_43/all_results.json
94
  result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,44,eval_accuracy,0.9317751105495894,0.21137550473213196,0.2217927779351081,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_44/all_results.json
95
  result_ablation_mbert_paper,vsfc,mBERT,gated_multi_branch,42,eval_accuracy,0.9374605180037903,0.22037982940673828,0.2221188189544322,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_42/all_results.json
96
  result_ablation_mbert_paper,vsfc,mBERT,gated_multi_branch,43,eval_accuracy,0.932406822488945,0.2144102156162262,0.22194261373061955,3.0,1583,/workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_43/all_results.json
mbert_paper_metrics/docs/ablation_results_aggregate.csv CHANGED
@@ -30,4 +30,4 @@ result_ablation_mbert_paper,vsfc,mBERT,hf_sequence_classifier,eval_accuracy,3,0.
30
  result_ablation_mbert_paper,vsfc,mBERT,max,eval_accuracy,3,0.9340913876605601,0.0007294381164745449,0.9336702463676564,0.9349336702463676
31
  result_ablation_mbert_paper,vsfc,mBERT,mean,eval_accuracy,3,0.9334596757212045,0.0013150132656134848,0.932406822488945,0.9349336702463676
32
  result_ablation_mbert_paper,vsfc,mBERT,mha_attention,eval_accuracy,3,0.9334596757212045,0.0007294381164746089,0.9330385344283006,0.934301958307012
33
- result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,eval_accuracy,2,0.9336702463676563,0.0026801267764492965,0.9317751105495894,0.9355653821857233
 
30
  result_ablation_mbert_paper,vsfc,mBERT,max,eval_accuracy,3,0.9340913876605601,0.0007294381164745449,0.9336702463676564,0.9349336702463676
31
  result_ablation_mbert_paper,vsfc,mBERT,mean,eval_accuracy,3,0.9334596757212045,0.0013150132656134848,0.932406822488945,0.9349336702463676
32
  result_ablation_mbert_paper,vsfc,mBERT,mha_attention,eval_accuracy,3,0.9334596757212045,0.0007294381164746089,0.9330385344283006,0.934301958307012
33
+ result_ablation_mbert_paper,vsfc,mBERT,multi_branch_average,eval_accuracy,3,0.9330385344283006,0.0021883143494236985,0.9317751105495894,0.9355653821857233
mbert_paper_metrics/docs/ablation_summary.md CHANGED
@@ -36,7 +36,7 @@ Main metric is selected per task: CoLA uses Matthews correlation; MRPC/QQP/STSB
36
  | result_ablation_mbert_paper | vsfc | mBERT | max | eval_accuracy | 3 | 0.9341 | 0.0007 | 0.9337 | 0.9349 |
37
  | result_ablation_mbert_paper | vsfc | mBERT | mean | eval_accuracy | 3 | 0.9335 | 0.0013 | 0.9324 | 0.9349 |
38
  | result_ablation_mbert_paper | vsfc | mBERT | mha_attention | eval_accuracy | 3 | 0.9335 | 0.0007 | 0.9330 | 0.9343 |
39
- | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | eval_accuracy | 2 | 0.9337 | 0.0027 | 0.9318 | 0.9356 |
40
 
41
  ## Gated Multi-Branch Deltas
42
  | source | task | model | baseline | gated_mean | baseline_mean | delta |
@@ -55,7 +55,7 @@ Main metric is selected per task: CoLA uses Matthews correlation; MRPC/QQP/STSB
55
  | result_ablation_mbert_paper | sst2 | mBERT | hf_sequence_classifier | 0.8758 | 0.8788 | -0.0031 |
56
  | result_ablation_mbert_paper | vsfc | mBERT | attention | 0.9326 | 0.9337 | -0.0011 |
57
  | result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 0.9326 | 0.9335 | -0.0008 |
58
- | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 0.9326 | 0.9337 | -0.0011 |
59
  | result_ablation_mbert_paper | vsfc | mBERT | hf_sequence_classifier | 0.9326 | 0.9318 | 0.0008 |
60
 
61
  ## Raw Runs
@@ -152,6 +152,7 @@ Main metric is selected per task: CoLA uses Matthews correlation; MRPC/QQP/STSB
152
  | result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 43.0000 | eval_accuracy | 0.9330 | 0.2182 | 0.2247 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_43/all_results.json |
153
  | result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 44.0000 | eval_accuracy | 0.9343 | 0.2153 | 0.2245 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_44/all_results.json |
154
  | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 42.0000 | eval_accuracy | 0.9356 | 0.2142 | 0.2183 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_42/all_results.json |
 
155
  | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 44.0000 | eval_accuracy | 0.9318 | 0.2114 | 0.2218 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_44/all_results.json |
156
  | result_ablation_mbert_paper | vsfc | mBERT | gated_multi_branch | 42.0000 | eval_accuracy | 0.9375 | 0.2204 | 0.2221 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_42/all_results.json |
157
  | result_ablation_mbert_paper | vsfc | mBERT | gated_multi_branch | 43.0000 | eval_accuracy | 0.9324 | 0.2144 | 0.2219 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_43/all_results.json |
 
36
  | result_ablation_mbert_paper | vsfc | mBERT | max | eval_accuracy | 3 | 0.9341 | 0.0007 | 0.9337 | 0.9349 |
37
  | result_ablation_mbert_paper | vsfc | mBERT | mean | eval_accuracy | 3 | 0.9335 | 0.0013 | 0.9324 | 0.9349 |
38
  | result_ablation_mbert_paper | vsfc | mBERT | mha_attention | eval_accuracy | 3 | 0.9335 | 0.0007 | 0.9330 | 0.9343 |
39
+ | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | eval_accuracy | 3 | 0.9330 | 0.0022 | 0.9318 | 0.9356 |
40
 
41
  ## Gated Multi-Branch Deltas
42
  | source | task | model | baseline | gated_mean | baseline_mean | delta |
 
55
  | result_ablation_mbert_paper | sst2 | mBERT | hf_sequence_classifier | 0.8758 | 0.8788 | -0.0031 |
56
  | result_ablation_mbert_paper | vsfc | mBERT | attention | 0.9326 | 0.9337 | -0.0011 |
57
  | result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 0.9326 | 0.9335 | -0.0008 |
58
+ | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 0.9326 | 0.9330 | -0.0004 |
59
  | result_ablation_mbert_paper | vsfc | mBERT | hf_sequence_classifier | 0.9326 | 0.9318 | 0.0008 |
60
 
61
  ## Raw Runs
 
152
  | result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 43.0000 | eval_accuracy | 0.9330 | 0.2182 | 0.2247 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_43/all_results.json |
153
  | result_ablation_mbert_paper | vsfc | mBERT | mha_attention | 44.0000 | eval_accuracy | 0.9343 | 0.2153 | 0.2245 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/mha_attention/seed_44/all_results.json |
154
  | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 42.0000 | eval_accuracy | 0.9356 | 0.2142 | 0.2183 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_42/all_results.json |
155
+ | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 43.0000 | eval_accuracy | 0.9318 | 0.2061 | 0.2265 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_43/all_results.json |
156
  | result_ablation_mbert_paper | vsfc | mBERT | multi_branch_average | 44.0000 | eval_accuracy | 0.9318 | 0.2114 | 0.2218 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/multi_branch_average/seed_44/all_results.json |
157
  | result_ablation_mbert_paper | vsfc | mBERT | gated_multi_branch | 42.0000 | eval_accuracy | 0.9375 | 0.2204 | 0.2221 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_42/all_results.json |
158
  | result_ablation_mbert_paper | vsfc | mBERT | gated_multi_branch | 43.0000 | eval_accuracy | 0.9324 | 0.2144 | 0.2219 | 3.0000 | 1583 | /workspace/result_ablation_mbert_paper/vsfc/mBERT/gated_multi_branch/seed_43/all_results.json |