Hartunka committed on
Commit
b6c3453
·
verified ·
1 Parent(s): 983aa64

End of training

Browse files
README.md CHANGED
@@ -1,13 +1,28 @@
1
  ---
2
  library_name: transformers
 
 
3
  base_model: Hartunka/bert_base_km_20_v1
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - accuracy
8
  model-index:
9
  - name: bert_base_km_20_v1_wnli
10
- results: []
 
 
 
 
 
 
 
 
 
 
 
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -15,10 +30,10 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # bert_base_km_20_v1_wnli
17
 
18
- This model is a fine-tuned version of [Hartunka/bert_base_km_20_v1](https://huggingface.co/Hartunka/bert_base_km_20_v1) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.8994
21
- - Accuracy: 0.1690
22
 
23
  ## Model description
24
 
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - en
5
  base_model: Hartunka/bert_base_km_20_v1
6
  tags:
7
  - generated_from_trainer
8
+ datasets:
9
+ - glue
10
  metrics:
11
  - accuracy
12
  model-index:
13
  - name: bert_base_km_20_v1_wnli
14
+ results:
15
+ - task:
16
+ name: Text Classification
17
+ type: text-classification
18
+ dataset:
19
+ name: GLUE WNLI
20
+ type: glue
21
+ args: wnli
22
+ metrics:
23
+ - name: Accuracy
24
+ type: accuracy
25
+ value: 0.39436619718309857
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
30
 
31
  # bert_base_km_20_v1_wnli
32
 
33
+ This model is a fine-tuned version of [Hartunka/bert_base_km_20_v1](https://huggingface.co/Hartunka/bert_base_km_20_v1) on the GLUE WNLI dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.7542
36
+ - Accuracy: 0.3944
37
 
38
  ## Model description
39
 
all_results.json CHANGED
@@ -2,14 +2,14 @@
2
  "epoch": 6.0,
3
  "eval_accuracy": 0.39436619718309857,
4
  "eval_loss": 0.7541812658309937,
5
- "eval_runtime": 0.0745,
6
  "eval_samples": 71,
7
- "eval_samples_per_second": 953.089,
8
- "eval_steps_per_second": 13.424,
9
  "total_flos": 501226560460800.0,
10
  "train_loss": 0.6963877810372247,
11
- "train_runtime": 18.5769,
12
  "train_samples": 635,
13
- "train_samples_per_second": 1709.111,
14
- "train_steps_per_second": 8.075
15
  }
 
2
  "epoch": 6.0,
3
  "eval_accuracy": 0.39436619718309857,
4
  "eval_loss": 0.7541812658309937,
5
+ "eval_runtime": 0.0757,
6
  "eval_samples": 71,
7
+ "eval_samples_per_second": 938.137,
8
+ "eval_steps_per_second": 13.213,
9
  "total_flos": 501226560460800.0,
10
  "train_loss": 0.6963877810372247,
11
+ "train_runtime": 19.3347,
12
  "train_samples": 635,
13
+ "train_samples_per_second": 1642.129,
14
+ "train_steps_per_second": 7.758
15
  }
eval_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 6.0,
3
  "eval_accuracy": 0.39436619718309857,
4
  "eval_loss": 0.7541812658309937,
5
- "eval_runtime": 0.0745,
6
  "eval_samples": 71,
7
- "eval_samples_per_second": 953.089,
8
- "eval_steps_per_second": 13.424
9
  }
 
2
  "epoch": 6.0,
3
  "eval_accuracy": 0.39436619718309857,
4
  "eval_loss": 0.7541812658309937,
5
+ "eval_runtime": 0.0757,
6
  "eval_samples": 71,
7
+ "eval_samples_per_second": 938.137,
8
+ "eval_steps_per_second": 13.213
9
  }
logs/events.out.tfevents.1745050805.s_005_m.2788007.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a6aa7cd78e589c0e2a2b7d8bd2b2c4e4e0143bf9fb8ddc83757ce0da5f0cf40
3
+ size 357
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 6.0,
3
  "total_flos": 501226560460800.0,
4
  "train_loss": 0.6963877810372247,
5
- "train_runtime": 18.5769,
6
  "train_samples": 635,
7
- "train_samples_per_second": 1709.111,
8
- "train_steps_per_second": 8.075
9
  }
 
2
  "epoch": 6.0,
3
  "total_flos": 501226560460800.0,
4
  "train_loss": 0.6963877810372247,
5
+ "train_runtime": 19.3347,
6
  "train_samples": 635,
7
+ "train_samples_per_second": 1642.129,
8
+ "train_steps_per_second": 7.758
9
  }
trainer_state.json CHANGED
@@ -20,9 +20,9 @@
20
  "epoch": 1.0,
21
  "eval_accuracy": 0.39436619718309857,
22
  "eval_loss": 0.7541812658309937,
23
- "eval_runtime": 0.0584,
24
- "eval_samples_per_second": 1215.398,
25
- "eval_steps_per_second": 17.118,
26
  "step": 3
27
  },
28
  {
@@ -36,9 +36,9 @@
36
  "epoch": 2.0,
37
  "eval_accuracy": 0.2112676056338028,
38
  "eval_loss": 0.7640296220779419,
39
- "eval_runtime": 0.0644,
40
- "eval_samples_per_second": 1101.727,
41
- "eval_steps_per_second": 15.517,
42
  "step": 6
43
  },
44
  {
@@ -52,9 +52,9 @@
52
  "epoch": 3.0,
53
  "eval_accuracy": 0.22535211267605634,
54
  "eval_loss": 0.7914281487464905,
55
- "eval_runtime": 0.0545,
56
- "eval_samples_per_second": 1303.617,
57
- "eval_steps_per_second": 18.361,
58
  "step": 9
59
  },
60
  {
@@ -68,9 +68,9 @@
68
  "epoch": 4.0,
69
  "eval_accuracy": 0.2676056338028169,
70
  "eval_loss": 0.814260721206665,
71
- "eval_runtime": 0.0691,
72
- "eval_samples_per_second": 1028.222,
73
- "eval_steps_per_second": 14.482,
74
  "step": 12
75
  },
76
  {
@@ -84,9 +84,9 @@
84
  "epoch": 5.0,
85
  "eval_accuracy": 0.2112676056338028,
86
  "eval_loss": 0.8581647872924805,
87
- "eval_runtime": 0.0555,
88
- "eval_samples_per_second": 1279.597,
89
- "eval_steps_per_second": 18.022,
90
  "step": 15
91
  },
92
  {
@@ -100,9 +100,9 @@
100
  "epoch": 6.0,
101
  "eval_accuracy": 0.16901408450704225,
102
  "eval_loss": 0.8994279503822327,
103
- "eval_runtime": 0.0558,
104
- "eval_samples_per_second": 1272.37,
105
- "eval_steps_per_second": 17.921,
106
  "step": 18
107
  },
108
  {
@@ -110,9 +110,9 @@
110
  "step": 18,
111
  "total_flos": 501226560460800.0,
112
  "train_loss": 0.6963877810372247,
113
- "train_runtime": 18.5769,
114
- "train_samples_per_second": 1709.111,
115
- "train_steps_per_second": 8.075
116
  }
117
  ],
118
  "logging_steps": 1,
 
20
  "epoch": 1.0,
21
  "eval_accuracy": 0.39436619718309857,
22
  "eval_loss": 0.7541812658309937,
23
+ "eval_runtime": 0.0818,
24
+ "eval_samples_per_second": 868.221,
25
+ "eval_steps_per_second": 12.228,
26
  "step": 3
27
  },
28
  {
 
36
  "epoch": 2.0,
37
  "eval_accuracy": 0.2112676056338028,
38
  "eval_loss": 0.7640296220779419,
39
+ "eval_runtime": 0.0608,
40
+ "eval_samples_per_second": 1166.879,
41
+ "eval_steps_per_second": 16.435,
42
  "step": 6
43
  },
44
  {
 
52
  "epoch": 3.0,
53
  "eval_accuracy": 0.22535211267605634,
54
  "eval_loss": 0.7914281487464905,
55
+ "eval_runtime": 0.0568,
56
+ "eval_samples_per_second": 1250.685,
57
+ "eval_steps_per_second": 17.615,
58
  "step": 9
59
  },
60
  {
 
68
  "epoch": 4.0,
69
  "eval_accuracy": 0.2676056338028169,
70
  "eval_loss": 0.814260721206665,
71
+ "eval_runtime": 0.0573,
72
+ "eval_samples_per_second": 1238.364,
73
+ "eval_steps_per_second": 17.442,
74
  "step": 12
75
  },
76
  {
 
84
  "epoch": 5.0,
85
  "eval_accuracy": 0.2112676056338028,
86
  "eval_loss": 0.8581647872924805,
87
+ "eval_runtime": 0.0598,
88
+ "eval_samples_per_second": 1187.52,
89
+ "eval_steps_per_second": 16.726,
90
  "step": 15
91
  },
92
  {
 
100
  "epoch": 6.0,
101
  "eval_accuracy": 0.16901408450704225,
102
  "eval_loss": 0.8994279503822327,
103
+ "eval_runtime": 0.0623,
104
+ "eval_samples_per_second": 1138.876,
105
+ "eval_steps_per_second": 16.041,
106
  "step": 18
107
  },
108
  {
 
110
  "step": 18,
111
  "total_flos": 501226560460800.0,
112
  "train_loss": 0.6963877810372247,
113
+ "train_runtime": 19.3347,
114
+ "train_samples_per_second": 1642.129,
115
+ "train_steps_per_second": 7.758
116
  }
117
  ],
118
  "logging_steps": 1,