SystemAdmin123 commited on
Commit
c6d11b0
·
verified ·
1 Parent(s): 2ada648

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a660381d79264a17d2550ea5e5a429959f0b9c28eb96332197a2a8a9c4f6fb3
3
  size 723676832
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:356e77737e1ae57c572cefec580a243ff3bf580fbabb7d8184cf96c4dc8f3524
3
  size 723676832
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17e06f5b51db696407df34b9e2582d449c160e769f799d7cfe185bcb41183b88
3
  size 735627290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceb1e871d2adeb06e378f9b3dd9f505b3cc3347052040d028a70c5698d6ed5f4
3
  size 735627290
last-checkpoint/trainer_state.json CHANGED
@@ -11,53 +11,53 @@
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 2.9618937969207764,
14
- "eval_runtime": 5.1254,
15
- "eval_samples_per_second": 293.049,
16
- "eval_steps_per_second": 18.34,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
  "grad_norm": 4.4375,
22
  "learning_rate": 1.6000000000000003e-05,
23
- "loss": 2.655,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
  "grad_norm": 1.6328125,
29
  "learning_rate": 3.2000000000000005e-05,
30
- "loss": 2.7917,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
- "eval_loss": 2.933722734451294,
36
- "eval_runtime": 5.4063,
37
- "eval_samples_per_second": 277.826,
38
- "eval_steps_per_second": 17.387,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 0.03550295857988166,
43
- "grad_norm": 6.3125,
44
  "learning_rate": 4.8e-05,
45
- "loss": 2.8946,
46
  "step": 30
47
  },
48
  {
49
  "epoch": 0.047337278106508875,
50
- "grad_norm": 2.15625,
51
  "learning_rate": 6.400000000000001e-05,
52
- "loss": 2.7579,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
- "eval_loss": 2.718113899230957,
58
- "eval_runtime": 5.4545,
59
- "eval_samples_per_second": 275.368,
60
- "eval_steps_per_second": 17.233,
61
  "step": 40
62
  }
63
  ],
 
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 2.9618937969207764,
14
+ "eval_runtime": 5.2129,
15
+ "eval_samples_per_second": 288.133,
16
+ "eval_steps_per_second": 18.032,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
  "grad_norm": 4.4375,
22
  "learning_rate": 1.6000000000000003e-05,
23
+ "loss": 2.6559,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
  "grad_norm": 1.6328125,
29
  "learning_rate": 3.2000000000000005e-05,
30
+ "loss": 2.7912,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
+ "eval_loss": 2.9339327812194824,
36
+ "eval_runtime": 5.5967,
37
+ "eval_samples_per_second": 268.371,
38
+ "eval_steps_per_second": 16.796,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 0.03550295857988166,
43
+ "grad_norm": 6.34375,
44
  "learning_rate": 4.8e-05,
45
+ "loss": 2.8945,
46
  "step": 30
47
  },
48
  {
49
  "epoch": 0.047337278106508875,
50
+ "grad_norm": 2.1875,
51
  "learning_rate": 6.400000000000001e-05,
52
+ "loss": 2.7552,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
+ "eval_loss": 2.7184391021728516,
58
+ "eval_runtime": 5.6084,
59
+ "eval_samples_per_second": 267.814,
60
+ "eval_steps_per_second": 16.761,
61
  "step": 40
62
  }
63
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbe03fc40c2f60afb467f9fe9d85c4aa58d6394a9d6b88eb6bbad1750f4faa0d
3
  size 6840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7337b093c5d7d6a10f8669867e0be91b7b9af804f42fa136237f8529e7181224
3
  size 6840