Hartunka committed on
Commit
710962a
·
verified ·
1 Parent(s): 61176e6

End of training

Browse files
README.md CHANGED
@@ -1,14 +1,32 @@
1
  ---
2
  library_name: transformers
 
 
3
  base_model: Hartunka/bert_base_km_50_v1
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - accuracy
8
  - f1
9
  model-index:
10
  - name: bert_base_km_50_v1_mrpc
11
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,12 +34,12 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # bert_base_km_50_v1_mrpc
18
 
19
- This model is a fine-tuned version of [Hartunka/bert_base_km_50_v1](https://huggingface.co/Hartunka/bert_base_km_50_v1) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.1340
22
- - Accuracy: 0.6593
23
- - F1: 0.7531
24
- - Combined Score: 0.7062
25
 
26
  ## Model description
27
 
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - en
5
  base_model: Hartunka/bert_base_km_50_v1
6
  tags:
7
  - generated_from_trainer
8
+ datasets:
9
+ - glue
10
  metrics:
11
  - accuracy
12
  - f1
13
  model-index:
14
  - name: bert_base_km_50_v1_mrpc
15
+ results:
16
+ - task:
17
+ name: Text Classification
18
+ type: text-classification
19
+ dataset:
20
+ name: GLUE MRPC
21
+ type: glue
22
+ args: mrpc
23
+ metrics:
24
+ - name: Accuracy
25
+ type: accuracy
26
+ value: 0.7034313725490197
27
+ - name: F1
28
+ type: f1
29
+ value: 0.8141321044546851
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  # bert_base_km_50_v1_mrpc
36
 
37
+ This model is a fine-tuned version of [Hartunka/bert_base_km_50_v1](https://huggingface.co/Hartunka/bert_base_km_50_v1) on the GLUE MRPC dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.5894
40
+ - Accuracy: 0.7034
41
+ - F1: 0.8141
42
+ - Combined Score: 0.7588
43
 
44
  ## Model description
45
 
all_results.json CHANGED
@@ -4,14 +4,14 @@
4
  "eval_combined_score": 0.7587817385018524,
5
  "eval_f1": 0.8141321044546851,
6
  "eval_loss": 0.5893518924713135,
7
- "eval_runtime": 0.3351,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 1217.397,
10
- "eval_steps_per_second": 5.968,
11
  "total_flos": 3377819728711680.0,
12
  "train_loss": 0.37630167575109574,
13
- "train_runtime": 57.9107,
14
  "train_samples": 3668,
15
- "train_samples_per_second": 3166.945,
16
- "train_steps_per_second": 12.951
17
  }
 
4
  "eval_combined_score": 0.7587817385018524,
5
  "eval_f1": 0.8141321044546851,
6
  "eval_loss": 0.5893518924713135,
7
+ "eval_runtime": 0.2812,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 1450.71,
10
+ "eval_steps_per_second": 7.111,
11
  "total_flos": 3377819728711680.0,
12
  "train_loss": 0.37630167575109574,
13
+ "train_runtime": 59.1897,
14
  "train_samples": 3668,
15
+ "train_samples_per_second": 3098.514,
16
+ "train_steps_per_second": 12.671
17
  }
eval_results.json CHANGED
@@ -4,8 +4,8 @@
4
  "eval_combined_score": 0.7587817385018524,
5
  "eval_f1": 0.8141321044546851,
6
  "eval_loss": 0.5893518924713135,
7
- "eval_runtime": 0.3351,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 1217.397,
10
- "eval_steps_per_second": 5.968
11
  }
 
4
  "eval_combined_score": 0.7587817385018524,
5
  "eval_f1": 0.8141321044546851,
6
  "eval_loss": 0.5893518924713135,
7
+ "eval_runtime": 0.2812,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 1450.71,
10
+ "eval_steps_per_second": 7.111
11
  }
logs/events.out.tfevents.1745080139.s_005_m.2793776.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44220412ad73cbe3e83ab521deda94ba749ef4b328479a63f55ce4e777284268
3
+ size 459
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 7.0,
3
  "total_flos": 3377819728711680.0,
4
  "train_loss": 0.37630167575109574,
5
- "train_runtime": 57.9107,
6
  "train_samples": 3668,
7
- "train_samples_per_second": 3166.945,
8
- "train_steps_per_second": 12.951
9
  }
 
2
  "epoch": 7.0,
3
  "total_flos": 3377819728711680.0,
4
  "train_loss": 0.37630167575109574,
5
+ "train_runtime": 59.1897,
6
  "train_samples": 3668,
7
+ "train_samples_per_second": 3098.514,
8
+ "train_steps_per_second": 12.671
9
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_combined_score": 0.7452987825395369,
23
  "eval_f1": 0.8018720748829953,
24
  "eval_loss": 0.5977591872215271,
25
- "eval_runtime": 0.2702,
26
- "eval_samples_per_second": 1509.746,
27
- "eval_steps_per_second": 7.401,
28
  "step": 15
29
  },
30
  {
@@ -40,9 +40,9 @@
40
  "eval_combined_score": 0.7587817385018524,
41
  "eval_f1": 0.8141321044546851,
42
  "eval_loss": 0.5893518924713135,
43
- "eval_runtime": 0.2724,
44
- "eval_samples_per_second": 1497.989,
45
- "eval_steps_per_second": 7.343,
46
  "step": 30
47
  },
48
  {
@@ -58,9 +58,9 @@
58
  "eval_combined_score": 0.7552244582043344,
59
  "eval_f1": 0.8070175438596491,
60
  "eval_loss": 0.6016624569892883,
61
- "eval_runtime": 0.2763,
62
- "eval_samples_per_second": 1476.67,
63
- "eval_steps_per_second": 7.239,
64
  "step": 45
65
  },
66
  {
@@ -76,9 +76,9 @@
76
  "eval_combined_score": 0.737373677185623,
77
  "eval_f1": 0.7909238249594813,
78
  "eval_loss": 0.6796642541885376,
79
- "eval_runtime": 0.2698,
80
- "eval_samples_per_second": 1512.03,
81
- "eval_steps_per_second": 7.412,
82
  "step": 60
83
  },
84
  {
@@ -94,9 +94,9 @@
94
  "eval_combined_score": 0.6872946105816629,
95
  "eval_f1": 0.7299813780260708,
96
  "eval_loss": 0.8248001337051392,
97
- "eval_runtime": 0.3065,
98
- "eval_samples_per_second": 1331.354,
99
- "eval_steps_per_second": 6.526,
100
  "step": 75
101
  },
102
  {
@@ -112,9 +112,9 @@
112
  "eval_combined_score": 0.6659663865546219,
113
  "eval_f1": 0.7142857142857143,
114
  "eval_loss": 1.088710904121399,
115
- "eval_runtime": 0.2777,
116
- "eval_samples_per_second": 1469.065,
117
- "eval_steps_per_second": 7.201,
118
  "step": 90
119
  },
120
  {
@@ -130,9 +130,9 @@
130
  "eval_combined_score": 0.7062110368125936,
131
  "eval_f1": 0.7531083481349912,
132
  "eval_loss": 1.1340426206588745,
133
- "eval_runtime": 0.2695,
134
- "eval_samples_per_second": 1514.054,
135
- "eval_steps_per_second": 7.422,
136
  "step": 105
137
  },
138
  {
@@ -140,9 +140,9 @@
140
  "step": 105,
141
  "total_flos": 3377819728711680.0,
142
  "train_loss": 0.37630167575109574,
143
- "train_runtime": 57.9107,
144
- "train_samples_per_second": 3166.945,
145
- "train_steps_per_second": 12.951
146
  }
147
  ],
148
  "logging_steps": 1,
 
22
  "eval_combined_score": 0.7452987825395369,
23
  "eval_f1": 0.8018720748829953,
24
  "eval_loss": 0.5977591872215271,
25
+ "eval_runtime": 0.2815,
26
+ "eval_samples_per_second": 1449.507,
27
+ "eval_steps_per_second": 7.105,
28
  "step": 15
29
  },
30
  {
 
40
  "eval_combined_score": 0.7587817385018524,
41
  "eval_f1": 0.8141321044546851,
42
  "eval_loss": 0.5893518924713135,
43
+ "eval_runtime": 0.2759,
44
+ "eval_samples_per_second": 1478.916,
45
+ "eval_steps_per_second": 7.25,
46
  "step": 30
47
  },
48
  {
 
58
  "eval_combined_score": 0.7552244582043344,
59
  "eval_f1": 0.8070175438596491,
60
  "eval_loss": 0.6016624569892883,
61
+ "eval_runtime": 0.2708,
62
+ "eval_samples_per_second": 1506.861,
63
+ "eval_steps_per_second": 7.387,
64
  "step": 45
65
  },
66
  {
 
76
  "eval_combined_score": 0.737373677185623,
77
  "eval_f1": 0.7909238249594813,
78
  "eval_loss": 0.6796642541885376,
79
+ "eval_runtime": 0.2782,
80
+ "eval_samples_per_second": 1466.576,
81
+ "eval_steps_per_second": 7.189,
82
  "step": 60
83
  },
84
  {
 
94
  "eval_combined_score": 0.6872946105816629,
95
  "eval_f1": 0.7299813780260708,
96
  "eval_loss": 0.8248001337051392,
97
+ "eval_runtime": 0.2776,
98
+ "eval_samples_per_second": 1469.566,
99
+ "eval_steps_per_second": 7.204,
100
  "step": 75
101
  },
102
  {
 
112
  "eval_combined_score": 0.6659663865546219,
113
  "eval_f1": 0.7142857142857143,
114
  "eval_loss": 1.088710904121399,
115
+ "eval_runtime": 0.2704,
116
+ "eval_samples_per_second": 1509.018,
117
+ "eval_steps_per_second": 7.397,
118
  "step": 90
119
  },
120
  {
 
130
  "eval_combined_score": 0.7062110368125936,
131
  "eval_f1": 0.7531083481349912,
132
  "eval_loss": 1.1340426206588745,
133
+ "eval_runtime": 0.2846,
134
+ "eval_samples_per_second": 1433.362,
135
+ "eval_steps_per_second": 7.026,
136
  "step": 105
137
  },
138
  {
 
140
  "step": 105,
141
  "total_flos": 3377819728711680.0,
142
  "train_loss": 0.37630167575109574,
143
+ "train_runtime": 59.1897,
144
+ "train_samples_per_second": 3098.514,
145
+ "train_steps_per_second": 12.671
146
  }
147
  ],
148
  "logging_steps": 1,