gokuls committed on
Commit
13ae8e9
·
1 Parent(s): 2a9607f

End of training

Browse files
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_accuracy": 0.33660520215315354,
4
- "eval_loss": 4.140918254852295,
5
- "eval_runtime": 346.5619,
6
  "eval_samples": 308356,
7
- "eval_samples_per_second": 889.757,
8
- "eval_steps_per_second": 18.539,
9
- "perplexity": 62.8605169302589,
10
- "train_loss": 4.73325779911465,
11
- "train_runtime": 51385.934,
12
  "train_samples": 5858758,
13
- "train_samples_per_second": 570.074,
14
- "train_steps_per_second": 11.877
15
  }
 
1
  {
2
+ "epoch": 21.79,
3
+ "eval_accuracy": 0.3896253594872046,
4
+ "eval_loss": 3.6499946117401123,
5
+ "eval_runtime": 404.9308,
6
  "eval_samples": 308356,
7
+ "eval_samples_per_second": 761.503,
8
+ "eval_steps_per_second": 11.901,
9
+ "perplexity": 38.47445873809088,
10
+ "train_loss": 4.1639687691688305,
11
+ "train_runtime": 215975.8067,
12
  "train_samples": 5858758,
13
+ "train_samples_per_second": 1356.346,
14
+ "train_steps_per_second": 21.193
15
  }
eval_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_accuracy": 0.33660520215315354,
4
- "eval_loss": 4.140918254852295,
5
- "eval_runtime": 346.5619,
6
  "eval_samples": 308356,
7
- "eval_samples_per_second": 889.757,
8
- "eval_steps_per_second": 18.539,
9
- "perplexity": 62.8605169302589
10
  }
 
1
  {
2
+ "epoch": 21.79,
3
+ "eval_accuracy": 0.3896253594872046,
4
+ "eval_loss": 3.6499946117401123,
5
+ "eval_runtime": 404.9308,
6
  "eval_samples": 308356,
7
+ "eval_samples_per_second": 761.503,
8
+ "eval_steps_per_second": 11.901,
9
+ "perplexity": 38.47445873809088
10
  }
logs/events.out.tfevents.1687535517.serv-3331.2657420.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1c713be261466591886aa1987fc1623bb15d07630bc68d4c72ed824454ed705
3
+ size 369
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 5.0,
3
- "train_loss": 4.73325779911465,
4
- "train_runtime": 51385.934,
5
  "train_samples": 5858758,
6
- "train_samples_per_second": 570.074,
7
- "train_steps_per_second": 11.877
8
  }
 
1
  {
2
+ "epoch": 21.79,
3
+ "train_loss": 4.1639687691688305,
4
+ "train_runtime": 215975.8067,
5
  "train_samples": 5858758,
6
+ "train_samples_per_second": 1356.346,
7
+ "train_steps_per_second": 21.193
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff