SystemAdmin123 commited on
Commit
7210ab5
·
verified ·
1 Parent(s): 932f804

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74fd01a8bae891e64aa1a626cc333858550e0cb6e36fcb7777c30999ee762d5e
3
  size 723674912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea2ad4c7c610b5e4ef126bc494685c8d4930ad390366ab2e84a4faeb7d420766
3
  size 723674912
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbf48b20262fa5e0455f8bf8dec46b89425e9f2d27bcf272b7ece12dbc3f48cb
3
  size 735625370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c39f051c45f03d6dcadc277c1454a36b0adc05bc85d9ce17d6a180588b3cad4
3
  size 735625370
last-checkpoint/trainer_state.json CHANGED
@@ -11,53 +11,53 @@
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 2.6000850200653076,
14
- "eval_runtime": 5.1412,
15
- "eval_samples_per_second": 292.148,
16
- "eval_steps_per_second": 18.284,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
- "grad_norm": 4.21875,
22
  "learning_rate": 1.6000000000000003e-05,
23
- "loss": 2.4519,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
  "grad_norm": 1.15625,
29
  "learning_rate": 3.2000000000000005e-05,
30
- "loss": 2.4462,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
- "eval_loss": 2.592799425125122,
36
- "eval_runtime": 5.3446,
37
- "eval_samples_per_second": 281.033,
38
- "eval_steps_per_second": 17.588,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 0.03550295857988166,
43
- "grad_norm": 3.9375,
44
  "learning_rate": 4.8e-05,
45
- "loss": 2.5891,
46
  "step": 30
47
  },
48
  {
49
  "epoch": 0.047337278106508875,
50
  "grad_norm": 1.5,
51
  "learning_rate": 6.400000000000001e-05,
52
- "loss": 2.4169,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
- "eval_loss": 2.5311338901519775,
58
- "eval_runtime": 5.3509,
59
- "eval_samples_per_second": 280.702,
60
- "eval_steps_per_second": 17.567,
61
  "step": 40
62
  }
63
  ],
 
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 2.6000850200653076,
14
+ "eval_runtime": 4.9168,
15
+ "eval_samples_per_second": 305.481,
16
+ "eval_steps_per_second": 19.118,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
+ "grad_norm": 4.3125,
22
  "learning_rate": 1.6000000000000003e-05,
23
+ "loss": 2.4524,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
  "grad_norm": 1.15625,
29
  "learning_rate": 3.2000000000000005e-05,
30
+ "loss": 2.4454,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
+ "eval_loss": 2.5929689407348633,
36
+ "eval_runtime": 5.1638,
37
+ "eval_samples_per_second": 290.869,
38
+ "eval_steps_per_second": 18.204,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 0.03550295857988166,
43
+ "grad_norm": 4.0,
44
  "learning_rate": 4.8e-05,
45
+ "loss": 2.5904,
46
  "step": 30
47
  },
48
  {
49
  "epoch": 0.047337278106508875,
50
  "grad_norm": 1.5,
51
  "learning_rate": 6.400000000000001e-05,
52
+ "loss": 2.4156,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
+ "eval_loss": 2.5310535430908203,
58
+ "eval_runtime": 5.1508,
59
+ "eval_samples_per_second": 291.604,
60
+ "eval_steps_per_second": 18.249,
61
  "step": 40
62
  }
63
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56abc2533c0578396c842febb0d8251535aeccfdad6e84eb864bab834fbe822f
3
  size 6712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f671da996f9974e01b0bb6a782a1b157ff77bf2c5559d84c73598d7fc8d1f978
3
  size 6712