MHGanainy commited on
Commit
7ec67d5
·
verified ·
1 Parent(s): 572942b

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +3 -3
  2. train_results.json +3 -3
  3. trainer_state.json +15 -15
all_results.json CHANGED
@@ -16,8 +16,8 @@
16
  "predict_steps_per_second": 4.179,
17
  "total_flos": 2512343535714304.0,
18
  "train_loss": 0.3421715199947357,
19
- "train_runtime": 21.295,
20
  "train_samples": 100,
21
- "train_samples_per_second": 93.919,
22
- "train_steps_per_second": 3.757
23
  }
 
16
  "predict_steps_per_second": 4.179,
17
  "total_flos": 2512343535714304.0,
18
  "train_loss": 0.3421715199947357,
19
+ "train_runtime": 21.559,
20
  "train_samples": 100,
21
+ "train_samples_per_second": 92.769,
22
+ "train_steps_per_second": 3.711
23
  }
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 4.0,
3
  "total_flos": 2512343535714304.0,
4
  "train_loss": 0.3421715199947357,
5
- "train_runtime": 21.295,
6
  "train_samples": 100,
7
- "train_samples_per_second": 93.919,
8
- "train_steps_per_second": 3.757
9
  }
 
2
  "epoch": 4.0,
3
  "total_flos": 2512343535714304.0,
4
  "train_loss": 0.3421715199947357,
5
+ "train_runtime": 21.559,
6
  "train_samples": 100,
7
+ "train_samples_per_second": 92.769,
8
+ "train_steps_per_second": 3.711
9
  }
trainer_state.json CHANGED
@@ -13,9 +13,9 @@
13
  "eval_loss": 0.41245660185813904,
14
  "eval_macro-f1": 0.029029793735676088,
15
  "eval_micro-f1": 0.16521739130434782,
16
- "eval_runtime": 1.0746,
17
- "eval_samples_per_second": 93.059,
18
- "eval_steps_per_second": 3.722,
19
  "step": 4
20
  },
21
  {
@@ -23,9 +23,9 @@
23
  "eval_loss": 0.3445906341075897,
24
  "eval_macro-f1": 0.029029793735676088,
25
  "eval_micro-f1": 0.16521739130434782,
26
- "eval_runtime": 1.4551,
27
- "eval_samples_per_second": 68.726,
28
- "eval_steps_per_second": 2.749,
29
  "step": 8
30
  },
31
  {
@@ -33,9 +33,9 @@
33
  "eval_loss": 0.3343995213508606,
34
  "eval_macro-f1": 0.029029793735676088,
35
  "eval_micro-f1": 0.16521739130434782,
36
- "eval_runtime": 1.1868,
37
- "eval_samples_per_second": 84.263,
38
- "eval_steps_per_second": 3.371,
39
  "step": 12
40
  },
41
  {
@@ -43,9 +43,9 @@
43
  "eval_loss": 0.333324134349823,
44
  "eval_macro-f1": 0.029029793735676088,
45
  "eval_micro-f1": 0.16521739130434782,
46
- "eval_runtime": 1.0777,
47
- "eval_samples_per_second": 92.789,
48
- "eval_steps_per_second": 3.712,
49
  "step": 16
50
  },
51
  {
@@ -53,9 +53,9 @@
53
  "step": 16,
54
  "total_flos": 2512343535714304.0,
55
  "train_loss": 0.3421715199947357,
56
- "train_runtime": 21.295,
57
- "train_samples_per_second": 93.919,
58
- "train_steps_per_second": 3.757
59
  }
60
  ],
61
  "logging_steps": 500,
 
13
  "eval_loss": 0.41245660185813904,
14
  "eval_macro-f1": 0.029029793735676088,
15
  "eval_micro-f1": 0.16521739130434782,
16
+ "eval_runtime": 1.0722,
17
+ "eval_samples_per_second": 93.268,
18
+ "eval_steps_per_second": 3.731,
19
  "step": 4
20
  },
21
  {
 
23
  "eval_loss": 0.3445906341075897,
24
  "eval_macro-f1": 0.029029793735676088,
25
  "eval_micro-f1": 0.16521739130434782,
26
+ "eval_runtime": 1.4747,
27
+ "eval_samples_per_second": 67.809,
28
+ "eval_steps_per_second": 2.712,
29
  "step": 8
30
  },
31
  {
 
33
  "eval_loss": 0.3343995213508606,
34
  "eval_macro-f1": 0.029029793735676088,
35
  "eval_micro-f1": 0.16521739130434782,
36
+ "eval_runtime": 1.6766,
37
+ "eval_samples_per_second": 59.646,
38
+ "eval_steps_per_second": 2.386,
39
  "step": 12
40
  },
41
  {
 
43
  "eval_loss": 0.333324134349823,
44
  "eval_macro-f1": 0.029029793735676088,
45
  "eval_micro-f1": 0.16521739130434782,
46
+ "eval_runtime": 1.0723,
47
+ "eval_samples_per_second": 93.253,
48
+ "eval_steps_per_second": 3.73,
49
  "step": 16
50
  },
51
  {
 
53
  "step": 16,
54
  "total_flos": 2512343535714304.0,
55
  "train_loss": 0.3421715199947357,
56
+ "train_runtime": 21.559,
57
+ "train_samples_per_second": 92.769,
58
+ "train_steps_per_second": 3.711
59
  }
60
  ],
61
  "logging_steps": 500,