SystemAdmin123 commited on
Commit
ed91321
·
verified ·
1 Parent(s): fff288a

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0266669328e80e3461a10118de44cff8735079c14f427660e06289fa00132dd
3
  size 723674912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89da288ea916bc87e2dc309ae736f2a5f22442c411406161ba1505c8cd18f6fd
3
  size 723674912
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69823c3e1cc379e7cde9fa82cf2a2c9e87827da47e5463701880ad9a8a85e3b4
3
  size 735625370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8853aff753532a2e2c9adad78d54da494e7b9ff2ed1f437edd469bc5ab58565e
3
  size 735625370
last-checkpoint/trainer_state.json CHANGED
@@ -11,31 +11,31 @@
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 3.067882776260376,
14
- "eval_runtime": 5.0136,
15
- "eval_samples_per_second": 299.584,
16
- "eval_steps_per_second": 18.749,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
  "grad_norm": 4.40625,
22
  "learning_rate": 1.6000000000000003e-05,
23
- "loss": 2.778,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
- "grad_norm": 1.640625,
29
  "learning_rate": 3.2000000000000005e-05,
30
- "loss": 2.8954,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
- "eval_loss": 3.0601139068603516,
36
- "eval_runtime": 5.1989,
37
- "eval_samples_per_second": 288.907,
38
- "eval_steps_per_second": 18.081,
39
  "step": 20
40
  },
41
  {
@@ -49,15 +49,15 @@
49
  "epoch": 0.047337278106508875,
50
  "grad_norm": 1.7578125,
51
  "learning_rate": 6.400000000000001e-05,
52
- "loss": 2.8826,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
- "eval_loss": 2.956596851348877,
58
- "eval_runtime": 5.2535,
59
- "eval_samples_per_second": 285.902,
60
- "eval_steps_per_second": 17.893,
61
  "step": 40
62
  }
63
  ],
 
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 3.067882776260376,
14
+ "eval_runtime": 5.0635,
15
+ "eval_samples_per_second": 296.633,
16
+ "eval_steps_per_second": 18.564,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
  "grad_norm": 4.40625,
22
  "learning_rate": 1.6000000000000003e-05,
23
+ "loss": 2.7782,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
+ "grad_norm": 1.6328125,
29
  "learning_rate": 3.2000000000000005e-05,
30
+ "loss": 2.8956,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
+ "eval_loss": 3.0602526664733887,
36
+ "eval_runtime": 5.3059,
37
+ "eval_samples_per_second": 283.082,
38
+ "eval_steps_per_second": 17.716,
39
  "step": 20
40
  },
41
  {
 
49
  "epoch": 0.047337278106508875,
50
  "grad_norm": 1.7578125,
51
  "learning_rate": 6.400000000000001e-05,
52
+ "loss": 2.8821,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
+ "eval_loss": 2.9565436840057373,
58
+ "eval_runtime": 5.3075,
59
+ "eval_samples_per_second": 282.998,
60
+ "eval_steps_per_second": 17.711,
61
  "step": 40
62
  }
63
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e88807ca1f23b8b745e9faf9e15e3cc183acee05b7a930af2c8542a4cad292cc
3
  size 6712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff2d010d71ffe14af88bc9959221d3983bd2a3f394734b7d7b835d485397643f
3
  size 6712