SystemAdmin123 commited on
Commit
738d345
·
verified ·
1 Parent(s): 914525c

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:296d3c11b549378809925dc5abeb8f0a62cd642b0dd4f1e0fe503271668e5fc2
3
  size 723674912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0266669328e80e3461a10118de44cff8735079c14f427660e06289fa00132dd
3
  size 723674912
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:367d828c50db3ed18885e248d3bf5cab302f7bbff0a88bfb288efcaaa6d12bcd
3
  size 735625370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69823c3e1cc379e7cde9fa82cf2a2c9e87827da47e5463701880ad9a8a85e3b4
3
  size 735625370
last-checkpoint/trainer_state.json CHANGED
@@ -11,53 +11,53 @@
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 3.067882776260376,
14
- "eval_runtime": 5.1514,
15
- "eval_samples_per_second": 291.572,
16
- "eval_steps_per_second": 18.248,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
  "grad_norm": 4.40625,
22
  "learning_rate": 1.6000000000000003e-05,
23
- "loss": 2.7777,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
  "grad_norm": 1.640625,
29
  "learning_rate": 3.2000000000000005e-05,
30
- "loss": 2.894,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
- "eval_loss": 3.0597116947174072,
36
- "eval_runtime": 5.678,
37
- "eval_samples_per_second": 264.528,
38
- "eval_steps_per_second": 16.555,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 0.03550295857988166,
43
  "grad_norm": 6.0625,
44
  "learning_rate": 4.8e-05,
45
- "loss": 3.02,
46
  "step": 30
47
  },
48
  {
49
  "epoch": 0.047337278106508875,
50
  "grad_norm": 1.7578125,
51
  "learning_rate": 6.400000000000001e-05,
52
- "loss": 2.8817,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
- "eval_loss": 2.9575068950653076,
58
- "eval_runtime": 5.5448,
59
- "eval_samples_per_second": 270.884,
60
- "eval_steps_per_second": 16.953,
61
  "step": 40
62
  }
63
  ],
 
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 3.067882776260376,
14
+ "eval_runtime": 5.0136,
15
+ "eval_samples_per_second": 299.584,
16
+ "eval_steps_per_second": 18.749,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
  "grad_norm": 4.40625,
22
  "learning_rate": 1.6000000000000003e-05,
23
+ "loss": 2.778,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
  "grad_norm": 1.640625,
29
  "learning_rate": 3.2000000000000005e-05,
30
+ "loss": 2.8954,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
+ "eval_loss": 3.0601139068603516,
36
+ "eval_runtime": 5.1989,
37
+ "eval_samples_per_second": 288.907,
38
+ "eval_steps_per_second": 18.081,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 0.03550295857988166,
43
  "grad_norm": 6.0625,
44
  "learning_rate": 4.8e-05,
45
+ "loss": 3.0194,
46
  "step": 30
47
  },
48
  {
49
  "epoch": 0.047337278106508875,
50
  "grad_norm": 1.7578125,
51
  "learning_rate": 6.400000000000001e-05,
52
+ "loss": 2.8826,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
+ "eval_loss": 2.956596851348877,
58
+ "eval_runtime": 5.2535,
59
+ "eval_samples_per_second": 285.902,
60
+ "eval_steps_per_second": 17.893,
61
  "step": 40
62
  }
63
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c13eb177f9a4df885b8c30c848aa7cef22c2095d626ae8c593587f9a5d8892d1
3
  size 6712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e88807ca1f23b8b745e9faf9e15e3cc183acee05b7a930af2c8542a4cad292cc
3
  size 6712