Hartunka committed on
Commit
4da292b
·
verified ·
1 Parent(s): 8d6f8f7

End of training

Browse files
README.md CHANGED
@@ -1,14 +1,32 @@
1
  ---
2
  library_name: transformers
 
 
3
  base_model: Hartunka/bert_base_rand_100_v1
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - accuracy
8
  - f1
9
  model-index:
10
  - name: bert_base_rand_100_v1_mrpc
11
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,12 +34,12 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # bert_base_rand_100_v1_mrpc
18
 
19
- This model is a fine-tuned version of [Hartunka/bert_base_rand_100_v1](https://huggingface.co/Hartunka/bert_base_rand_100_v1) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.4011
22
- - Accuracy: 0.6495
23
- - F1: 0.7357
24
- - Combined Score: 0.6926
25
 
26
  ## Model description
27
 
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - en
5
  base_model: Hartunka/bert_base_rand_100_v1
6
  tags:
7
  - generated_from_trainer
8
+ datasets:
9
+ - glue
10
  metrics:
11
  - accuracy
12
  - f1
13
  model-index:
14
  - name: bert_base_rand_100_v1_mrpc
15
+ results:
16
+ - task:
17
+ name: Text Classification
18
+ type: text-classification
19
+ dataset:
20
+ name: GLUE MRPC
21
+ type: glue
22
+ args: mrpc
23
+ metrics:
24
+ - name: Accuracy
25
+ type: accuracy
26
+ value: 0.7107843137254902
27
+ - name: F1
28
+ type: f1
29
+ value: 0.8033333333333333
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  # bert_base_rand_100_v1_mrpc
36
 
37
+ This model is a fine-tuned version of [Hartunka/bert_base_rand_100_v1](https://huggingface.co/Hartunka/bert_base_rand_100_v1) on the GLUE MRPC dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.5808
40
+ - Accuracy: 0.7108
41
+ - F1: 0.8033
42
+ - Combined Score: 0.7571
43
 
44
  ## Model description
45
 
all_results.json CHANGED
@@ -4,14 +4,14 @@
4
  "eval_combined_score": 0.7570588235294118,
5
  "eval_f1": 0.8033333333333333,
6
  "eval_loss": 0.5807782411575317,
7
- "eval_runtime": 0.3002,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 1359.097,
10
- "eval_steps_per_second": 6.662,
11
  "total_flos": 3377819728711680.0,
12
  "train_loss": 0.3727283318837484,
13
- "train_runtime": 58.1176,
14
  "train_samples": 3668,
15
- "train_samples_per_second": 3155.67,
16
- "train_steps_per_second": 12.905
17
  }
 
4
  "eval_combined_score": 0.7570588235294118,
5
  "eval_f1": 0.8033333333333333,
6
  "eval_loss": 0.5807782411575317,
7
+ "eval_runtime": 0.3042,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 1341.2,
10
+ "eval_steps_per_second": 6.575,
11
  "total_flos": 3377819728711680.0,
12
  "train_loss": 0.3727283318837484,
13
+ "train_runtime": 60.2116,
14
  "train_samples": 3668,
15
+ "train_samples_per_second": 3045.927,
16
+ "train_steps_per_second": 12.456
17
  }
eval_results.json CHANGED
@@ -4,8 +4,8 @@
4
  "eval_combined_score": 0.7570588235294118,
5
  "eval_f1": 0.8033333333333333,
6
  "eval_loss": 0.5807782411575317,
7
- "eval_runtime": 0.3002,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 1359.097,
10
- "eval_steps_per_second": 6.662
11
  }
 
4
  "eval_combined_score": 0.7570588235294118,
5
  "eval_f1": 0.8033333333333333,
6
  "eval_loss": 0.5807782411575317,
7
+ "eval_runtime": 0.3042,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 1341.2,
10
+ "eval_steps_per_second": 6.575
11
  }
logs/events.out.tfevents.1745183177.s_005_m.2815556.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fddd66f86acf8c7487dbc3b185d7b2c9dcb0a384e77f2717ea0c297d612014bb
3
+ size 459
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 7.0,
3
  "total_flos": 3377819728711680.0,
4
  "train_loss": 0.3727283318837484,
5
- "train_runtime": 58.1176,
6
  "train_samples": 3668,
7
- "train_samples_per_second": 3155.67,
8
- "train_steps_per_second": 12.905
9
  }
 
2
  "epoch": 7.0,
3
  "total_flos": 3377819728711680.0,
4
  "train_loss": 0.3727283318837484,
5
+ "train_runtime": 60.2116,
6
  "train_samples": 3668,
7
+ "train_samples_per_second": 3045.927,
8
+ "train_steps_per_second": 12.456
9
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_combined_score": 0.7513938781619518,
23
  "eval_f1": 0.8091603053435115,
24
  "eval_loss": 0.5958898067474365,
25
- "eval_runtime": 0.2694,
26
- "eval_samples_per_second": 1514.258,
27
- "eval_steps_per_second": 7.423,
28
  "step": 15
29
  },
30
  {
@@ -40,9 +40,9 @@
40
  "eval_combined_score": 0.7570588235294118,
41
  "eval_f1": 0.8033333333333333,
42
  "eval_loss": 0.5807782411575317,
43
- "eval_runtime": 0.2724,
44
- "eval_samples_per_second": 1497.92,
45
- "eval_steps_per_second": 7.343,
46
  "step": 30
47
  },
48
  {
@@ -58,9 +58,9 @@
58
  "eval_combined_score": 0.7586610486891385,
59
  "eval_f1": 0.8089887640449438,
60
  "eval_loss": 0.5847347974777222,
61
- "eval_runtime": 0.3261,
62
- "eval_samples_per_second": 1251.324,
63
- "eval_steps_per_second": 6.134,
64
  "step": 45
65
  },
66
  {
@@ -76,9 +76,9 @@
76
  "eval_combined_score": 0.7443602859203882,
77
  "eval_f1": 0.7926421404682275,
78
  "eval_loss": 0.7103803753852844,
79
- "eval_runtime": 0.2922,
80
- "eval_samples_per_second": 1396.208,
81
- "eval_steps_per_second": 6.844,
82
  "step": 60
83
  },
84
  {
@@ -94,9 +94,9 @@
94
  "eval_combined_score": 0.7373566326705814,
95
  "eval_f1": 0.7810858143607706,
96
  "eval_loss": 0.9412671327590942,
97
- "eval_runtime": 0.2711,
98
- "eval_samples_per_second": 1505.075,
99
- "eval_steps_per_second": 7.378,
100
  "step": 75
101
  },
102
  {
@@ -112,9 +112,9 @@
112
  "eval_combined_score": 0.7117102396514161,
113
  "eval_f1": 0.7518518518518519,
114
  "eval_loss": 1.1874147653579712,
115
- "eval_runtime": 0.2829,
116
- "eval_samples_per_second": 1441.989,
117
- "eval_steps_per_second": 7.069,
118
  "step": 90
119
  },
120
  {
@@ -130,9 +130,9 @@
130
  "eval_combined_score": 0.6925922402232612,
131
  "eval_f1": 0.7356746765249538,
132
  "eval_loss": 1.4011175632476807,
133
- "eval_runtime": 0.2802,
134
- "eval_samples_per_second": 1456.129,
135
- "eval_steps_per_second": 7.138,
136
  "step": 105
137
  },
138
  {
@@ -140,9 +140,9 @@
140
  "step": 105,
141
  "total_flos": 3377819728711680.0,
142
  "train_loss": 0.3727283318837484,
143
- "train_runtime": 58.1176,
144
- "train_samples_per_second": 3155.67,
145
- "train_steps_per_second": 12.905
146
  }
147
  ],
148
  "logging_steps": 1,
 
22
  "eval_combined_score": 0.7513938781619518,
23
  "eval_f1": 0.8091603053435115,
24
  "eval_loss": 0.5958898067474365,
25
+ "eval_runtime": 0.2695,
26
+ "eval_samples_per_second": 1513.971,
27
+ "eval_steps_per_second": 7.421,
28
  "step": 15
29
  },
30
  {
 
40
  "eval_combined_score": 0.7570588235294118,
41
  "eval_f1": 0.8033333333333333,
42
  "eval_loss": 0.5807782411575317,
43
+ "eval_runtime": 0.2883,
44
+ "eval_samples_per_second": 1415.329,
45
+ "eval_steps_per_second": 6.938,
46
  "step": 30
47
  },
48
  {
 
58
  "eval_combined_score": 0.7586610486891385,
59
  "eval_f1": 0.8089887640449438,
60
  "eval_loss": 0.5847347974777222,
61
+ "eval_runtime": 0.2696,
62
+ "eval_samples_per_second": 1513.304,
63
+ "eval_steps_per_second": 7.418,
64
  "step": 45
65
  },
66
  {
 
76
  "eval_combined_score": 0.7443602859203882,
77
  "eval_f1": 0.7926421404682275,
78
  "eval_loss": 0.7103803753852844,
79
+ "eval_runtime": 0.285,
80
+ "eval_samples_per_second": 1431.679,
81
+ "eval_steps_per_second": 7.018,
82
  "step": 60
83
  },
84
  {
 
94
  "eval_combined_score": 0.7373566326705814,
95
  "eval_f1": 0.7810858143607706,
96
  "eval_loss": 0.9412671327590942,
97
+ "eval_runtime": 0.2734,
98
+ "eval_samples_per_second": 1492.486,
99
+ "eval_steps_per_second": 7.316,
100
  "step": 75
101
  },
102
  {
 
112
  "eval_combined_score": 0.7117102396514161,
113
  "eval_f1": 0.7518518518518519,
114
  "eval_loss": 1.1874147653579712,
115
+ "eval_runtime": 0.2693,
116
+ "eval_samples_per_second": 1515.172,
117
+ "eval_steps_per_second": 7.427,
118
  "step": 90
119
  },
120
  {
 
130
  "eval_combined_score": 0.6925922402232612,
131
  "eval_f1": 0.7356746765249538,
132
  "eval_loss": 1.4011175632476807,
133
+ "eval_runtime": 0.2886,
134
+ "eval_samples_per_second": 1413.947,
135
+ "eval_steps_per_second": 6.931,
136
  "step": 105
137
  },
138
  {
 
140
  "step": 105,
141
  "total_flos": 3377819728711680.0,
142
  "train_loss": 0.3727283318837484,
143
+ "train_runtime": 60.2116,
144
+ "train_samples_per_second": 3045.927,
145
+ "train_steps_per_second": 12.456
146
  }
147
  ],
148
  "logging_steps": 1,