Hartunka committed on
Commit
7a3fbae
·
verified ·
1 Parent(s): d20ada5

End of training

Browse files
README.md CHANGED
@@ -1,14 +1,32 @@
1
  ---
2
  library_name: transformers
 
 
3
  base_model: Hartunka/tiny_bert_rand_10_v2
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - accuracy
8
  - f1
9
  model-index:
10
  - name: tiny_bert_rand_10_v2_mrpc
11
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,12 +34,12 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # tiny_bert_rand_10_v2_mrpc
18
 
19
- This model is a fine-tuned version of [Hartunka/tiny_bert_rand_10_v2](https://huggingface.co/Hartunka/tiny_bert_rand_10_v2) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.9016
22
- - Accuracy: 0.6569
23
- - F1: 0.7578
24
- - Combined Score: 0.7073
25
 
26
  ## Model description
27
 
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - en
5
  base_model: Hartunka/tiny_bert_rand_10_v2
6
  tags:
7
  - generated_from_trainer
8
+ datasets:
9
+ - glue
10
  metrics:
11
  - accuracy
12
  - f1
13
  model-index:
14
  - name: tiny_bert_rand_10_v2_mrpc
15
+ results:
16
+ - task:
17
+ name: Text Classification
18
+ type: text-classification
19
+ dataset:
20
+ name: GLUE MRPC
21
+ type: glue
22
+ args: mrpc
23
+ metrics:
24
+ - name: Accuracy
25
+ type: accuracy
26
+ value: 0.6936274509803921
27
+ - name: F1
28
+ type: f1
29
+ value: 0.8049921996879875
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  # tiny_bert_rand_10_v2_mrpc
36
 
37
+ This model is a fine-tuned version of [Hartunka/tiny_bert_rand_10_v2](https://huggingface.co/Hartunka/tiny_bert_rand_10_v2) on the GLUE MRPC dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.5925
40
+ - Accuracy: 0.6936
41
+ - F1: 0.8050
42
+ - Combined Score: 0.7493
43
 
44
  ## Model description
45
 
all_results.json CHANGED
@@ -4,14 +4,14 @@
4
  "eval_combined_score": 0.7493098253341899,
5
  "eval_f1": 0.8049921996879875,
6
  "eval_loss": 0.5925148725509644,
7
- "eval_runtime": 0.1712,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 2382.616,
10
- "eval_steps_per_second": 11.679,
11
  "total_flos": 673316591603712.0,
12
  "train_loss": 0.4811921028863816,
13
- "train_runtime": 19.5808,
14
  "train_samples": 3668,
15
- "train_samples_per_second": 9366.303,
16
- "train_steps_per_second": 38.303
17
  }
 
4
  "eval_combined_score": 0.7493098253341899,
5
  "eval_f1": 0.8049921996879875,
6
  "eval_loss": 0.5925148725509644,
7
+ "eval_runtime": 0.1461,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 2792.58,
10
+ "eval_steps_per_second": 13.689,
11
  "total_flos": 673316591603712.0,
12
  "train_loss": 0.4811921028863816,
13
+ "train_runtime": 20.9726,
14
  "train_samples": 3668,
15
+ "train_samples_per_second": 8744.756,
16
+ "train_steps_per_second": 35.761
17
  }
eval_results.json CHANGED
@@ -4,8 +4,8 @@
4
  "eval_combined_score": 0.7493098253341899,
5
  "eval_f1": 0.8049921996879875,
6
  "eval_loss": 0.5925148725509644,
7
- "eval_runtime": 0.1712,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 2382.616,
10
- "eval_steps_per_second": 11.679
11
  }
 
4
  "eval_combined_score": 0.7493098253341899,
5
  "eval_f1": 0.8049921996879875,
6
  "eval_loss": 0.5925148725509644,
7
+ "eval_runtime": 0.1461,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 2792.58,
10
+ "eval_steps_per_second": 13.689
11
  }
logs/events.out.tfevents.1745307409.s_005_m.2850172.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93f8e1845e846303041d3c4ab5f2c2d9b411902b258ece206573e2422b895bac
3
+ size 459
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 7.0,
3
  "total_flos": 673316591603712.0,
4
  "train_loss": 0.4811921028863816,
5
- "train_runtime": 19.5808,
6
  "train_samples": 3668,
7
- "train_samples_per_second": 9366.303,
8
- "train_steps_per_second": 38.303
9
  }
 
2
  "epoch": 7.0,
3
  "total_flos": 673316591603712.0,
4
  "train_loss": 0.4811921028863816,
5
+ "train_runtime": 20.9726,
6
  "train_samples": 3668,
7
+ "train_samples_per_second": 8744.756,
8
+ "train_steps_per_second": 35.761
9
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_combined_score": 0.7493098253341899,
23
  "eval_f1": 0.8049921996879875,
24
  "eval_loss": 0.6069743037223816,
25
- "eval_runtime": 0.1365,
26
- "eval_samples_per_second": 2988.638,
27
- "eval_steps_per_second": 14.65,
28
  "step": 15
29
  },
30
  {
@@ -40,9 +40,9 @@
40
  "eval_combined_score": 0.7493098253341899,
41
  "eval_f1": 0.8049921996879875,
42
  "eval_loss": 0.5925148725509644,
43
- "eval_runtime": 0.1403,
44
- "eval_samples_per_second": 2908.483,
45
- "eval_steps_per_second": 14.257,
46
  "step": 30
47
  },
48
  {
@@ -58,9 +58,9 @@
58
  "eval_combined_score": 0.7553715761113606,
59
  "eval_f1": 0.8122137404580153,
60
  "eval_loss": 0.6044036746025085,
61
- "eval_runtime": 0.1319,
62
- "eval_samples_per_second": 3093.061,
63
- "eval_steps_per_second": 15.162,
64
  "step": 45
65
  },
66
  {
@@ -76,9 +76,9 @@
76
  "eval_combined_score": 0.7210159380207779,
77
  "eval_f1": 0.7631103074141049,
78
  "eval_loss": 0.6260837316513062,
79
- "eval_runtime": 0.1669,
80
- "eval_samples_per_second": 2444.296,
81
- "eval_steps_per_second": 11.982,
82
  "step": 60
83
  },
84
  {
@@ -94,9 +94,9 @@
94
  "eval_combined_score": 0.6964081086980247,
95
  "eval_f1": 0.738404452690167,
96
  "eval_loss": 0.6786839962005615,
97
- "eval_runtime": 0.1589,
98
- "eval_samples_per_second": 2567.194,
99
- "eval_steps_per_second": 12.584,
100
  "step": 75
101
  },
102
  {
@@ -112,9 +112,9 @@
112
  "eval_combined_score": 0.7001788553259142,
113
  "eval_f1": 0.745945945945946,
114
  "eval_loss": 0.7894179224967957,
115
- "eval_runtime": 0.1302,
116
- "eval_samples_per_second": 3132.822,
117
- "eval_steps_per_second": 15.357,
118
  "step": 90
119
  },
120
  {
@@ -130,9 +130,9 @@
130
  "eval_combined_score": 0.7073241061130334,
131
  "eval_f1": 0.7577854671280276,
132
  "eval_loss": 0.9015735387802124,
133
- "eval_runtime": 0.1374,
134
- "eval_samples_per_second": 2970.145,
135
- "eval_steps_per_second": 14.56,
136
  "step": 105
137
  },
138
  {
@@ -140,9 +140,9 @@
140
  "step": 105,
141
  "total_flos": 673316591603712.0,
142
  "train_loss": 0.4811921028863816,
143
- "train_runtime": 19.5808,
144
- "train_samples_per_second": 9366.303,
145
- "train_steps_per_second": 38.303
146
  }
147
  ],
148
  "logging_steps": 1,
 
22
  "eval_combined_score": 0.7493098253341899,
23
  "eval_f1": 0.8049921996879875,
24
  "eval_loss": 0.6069743037223816,
25
+ "eval_runtime": 0.2253,
26
+ "eval_samples_per_second": 1810.799,
27
+ "eval_steps_per_second": 8.876,
28
  "step": 15
29
  },
30
  {
 
40
  "eval_combined_score": 0.7493098253341899,
41
  "eval_f1": 0.8049921996879875,
42
  "eval_loss": 0.5925148725509644,
43
+ "eval_runtime": 0.1646,
44
+ "eval_samples_per_second": 2479.406,
45
+ "eval_steps_per_second": 12.154,
46
  "step": 30
47
  },
48
  {
 
58
  "eval_combined_score": 0.7553715761113606,
59
  "eval_f1": 0.8122137404580153,
60
  "eval_loss": 0.6044036746025085,
61
+ "eval_runtime": 0.1362,
62
+ "eval_samples_per_second": 2995.695,
63
+ "eval_steps_per_second": 14.685,
64
  "step": 45
65
  },
66
  {
 
76
  "eval_combined_score": 0.7210159380207779,
77
  "eval_f1": 0.7631103074141049,
78
  "eval_loss": 0.6260837316513062,
79
+ "eval_runtime": 0.1534,
80
+ "eval_samples_per_second": 2659.28,
81
+ "eval_steps_per_second": 13.036,
82
  "step": 60
83
  },
84
  {
 
94
  "eval_combined_score": 0.6964081086980247,
95
  "eval_f1": 0.738404452690167,
96
  "eval_loss": 0.6786839962005615,
97
+ "eval_runtime": 0.1384,
98
+ "eval_samples_per_second": 2947.056,
99
+ "eval_steps_per_second": 14.446,
100
  "step": 75
101
  },
102
  {
 
112
  "eval_combined_score": 0.7001788553259142,
113
  "eval_f1": 0.745945945945946,
114
  "eval_loss": 0.7894179224967957,
115
+ "eval_runtime": 0.1647,
116
+ "eval_samples_per_second": 2477.03,
117
+ "eval_steps_per_second": 12.142,
118
  "step": 90
119
  },
120
  {
 
130
  "eval_combined_score": 0.7073241061130334,
131
  "eval_f1": 0.7577854671280276,
132
  "eval_loss": 0.9015735387802124,
133
+ "eval_runtime": 0.1697,
134
+ "eval_samples_per_second": 2404.916,
135
+ "eval_steps_per_second": 11.789,
136
  "step": 105
137
  },
138
  {
 
140
  "step": 105,
141
  "total_flos": 673316591603712.0,
142
  "train_loss": 0.4811921028863816,
143
+ "train_runtime": 20.9726,
144
+ "train_samples_per_second": 8744.756,
145
+ "train_steps_per_second": 35.761
146
  }
147
  ],
148
  "logging_steps": 1,