MHGanainy committed on
Commit
5c7f4eb
·
verified ·
1 Parent(s): 9d32b06

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +3 -3
  2. train_results.json +3 -3
  3. trainer_state.json +35 -31
all_results.json CHANGED
@@ -20,8 +20,8 @@
20
  "predict_steps_per_second": 4.098,
21
  "total_flos": 6.343227643160166e+17,
22
  "train_loss": 0.6829259282291525,
23
- "train_runtime": 2716.1998,
24
  "train_samples": 32305,
25
- "train_samples_per_second": 237.869,
26
- "train_steps_per_second": 7.437
27
  }
 
20
  "predict_steps_per_second": 4.098,
21
  "total_flos": 6.343227643160166e+17,
22
  "train_loss": 0.6829259282291525,
23
+ "train_runtime": 2722.2879,
24
  "train_samples": 32305,
25
+ "train_samples_per_second": 237.337,
26
+ "train_steps_per_second": 7.42
27
  }
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 4.0,
3
  "total_flos": 6.343227643160166e+17,
4
  "train_loss": 0.6829259282291525,
5
- "train_runtime": 2716.1998,
6
  "train_samples": 32305,
7
- "train_samples_per_second": 237.869,
8
- "train_steps_per_second": 7.437
9
  }
 
2
  "epoch": 4.0,
3
  "total_flos": 6.343227643160166e+17,
4
  "train_loss": 0.6829259282291525,
5
+ "train_runtime": 2722.2879,
6
  "train_samples": 32305,
7
+ "train_samples_per_second": 237.337,
8
+ "train_steps_per_second": 7.42
9
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.0,
3
  "best_model_checkpoint": "logs/ildc/roberta-base/seed_1/checkpoint-1010",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
@@ -24,14 +24,15 @@
24
  },
25
  {
26
  "epoch": 1.0,
27
- "eval_accuracy": 0.5,
28
- "eval_f1": 0.0,
 
29
  "eval_loss": 0.7003927230834961,
30
- "eval_precision": 0.0,
31
- "eval_recall": 0.0,
32
- "eval_runtime": 9.0772,
33
- "eval_samples_per_second": 109.505,
34
- "eval_steps_per_second": 3.525,
35
  "step": 1010
36
  },
37
  {
@@ -50,13 +51,14 @@
50
  },
51
  {
52
  "epoch": 2.0,
53
- "eval_accuracy": 0.5,
54
- "eval_f1": 0.0,
 
55
  "eval_loss": 0.699403703212738,
56
- "eval_precision": 0.0,
57
- "eval_recall": 0.0,
58
- "eval_runtime": 8.2465,
59
- "eval_samples_per_second": 120.536,
60
  "eval_steps_per_second": 3.88,
61
  "step": 2020
62
  },
@@ -76,14 +78,15 @@
76
  },
77
  {
78
  "epoch": 3.0,
79
- "eval_accuracy": 0.5,
80
- "eval_f1": 0.0,
 
81
  "eval_loss": 0.751548707485199,
82
- "eval_precision": 0.0,
83
- "eval_recall": 0.0,
84
- "eval_runtime": 8.2525,
85
- "eval_samples_per_second": 120.448,
86
- "eval_steps_per_second": 3.878,
87
  "step": 3030
88
  },
89
  {
@@ -102,14 +105,15 @@
102
  },
103
  {
104
  "epoch": 4.0,
105
- "eval_accuracy": 0.5,
106
- "eval_f1": 0.0,
 
107
  "eval_loss": 0.7038925290107727,
108
- "eval_precision": 0.0,
109
- "eval_recall": 0.0,
110
- "eval_runtime": 8.2406,
111
- "eval_samples_per_second": 120.622,
112
- "eval_steps_per_second": 3.883,
113
  "step": 4040
114
  },
115
  {
@@ -117,9 +121,9 @@
117
  "step": 4040,
118
  "total_flos": 6.343227643160166e+17,
119
  "train_loss": 0.6829259282291525,
120
- "train_runtime": 2716.1998,
121
- "train_samples_per_second": 237.869,
122
- "train_steps_per_second": 7.437
123
  }
124
  ],
125
  "logging_steps": 500,
 
1
  {
2
+ "best_metric": 0.6684856753069577,
3
  "best_model_checkpoint": "logs/ildc/roberta-base/seed_1/checkpoint-1010",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
 
24
  },
25
  {
26
  "epoch": 1.0,
27
+ "eval_accuracy": 0.5110663983903421,
28
+ "eval_best_threshold": 0.43776339292526245,
29
+ "eval_f1": 0.6684856753069577,
30
  "eval_loss": 0.7003927230834961,
31
+ "eval_precision": 0.5056759545923633,
32
+ "eval_recall": 0.9859154929577465,
33
+ "eval_runtime": 8.3061,
34
+ "eval_samples_per_second": 119.671,
35
+ "eval_steps_per_second": 3.853,
36
  "step": 1010
37
  },
38
  {
 
51
  },
52
  {
53
  "epoch": 2.0,
54
+ "eval_accuracy": 0.5030181086519114,
55
+ "eval_best_threshold": 0.43332192301750183,
56
+ "eval_f1": 0.6671159029649596,
57
  "eval_loss": 0.699403703212738,
58
+ "eval_precision": 0.5015197568389058,
59
+ "eval_recall": 0.9959758551307847,
60
+ "eval_runtime": 8.2485,
61
+ "eval_samples_per_second": 120.507,
62
  "eval_steps_per_second": 3.88,
63
  "step": 2020
64
  },
 
78
  },
79
  {
80
  "epoch": 3.0,
81
+ "eval_accuracy": 0.5030181086519114,
82
+ "eval_best_threshold": 0.332852303981781,
83
+ "eval_f1": 0.6644021739130435,
84
  "eval_loss": 0.751548707485199,
85
+ "eval_precision": 0.5015384615384615,
86
+ "eval_recall": 0.9839034205231388,
87
+ "eval_runtime": 8.2689,
88
+ "eval_samples_per_second": 120.21,
89
+ "eval_steps_per_second": 3.87,
90
  "step": 3030
91
  },
92
  {
 
105
  },
106
  {
107
  "epoch": 4.0,
108
+ "eval_accuracy": 0.5030181086519114,
109
+ "eval_best_threshold": 0.4006907343864441,
110
+ "eval_f1": 0.6671159029649596,
111
  "eval_loss": 0.7038925290107727,
112
+ "eval_precision": 0.5015197568389058,
113
+ "eval_recall": 0.9959758551307847,
114
+ "eval_runtime": 8.2224,
115
+ "eval_samples_per_second": 120.89,
116
+ "eval_steps_per_second": 3.892,
117
  "step": 4040
118
  },
119
  {
 
121
  "step": 4040,
122
  "total_flos": 6.343227643160166e+17,
123
  "train_loss": 0.6829259282291525,
124
+ "train_runtime": 2722.2879,
125
+ "train_samples_per_second": 237.337,
126
+ "train_steps_per_second": 7.42
127
  }
128
  ],
129
  "logging_steps": 500,