Sela223 commited on
Commit
0868695
·
verified ·
1 Parent(s): 7bce46e

Upload checkpoint checkpoint-50

Browse files
checkpoint-50/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b84dffa4f79bec060fcb8dd5f305478965ff574aaaa9dd339e749bfcd8b8d383
3
  size 614801160
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebca23c43e2da93412879287d3ecb22ba143e75a2600955a24c9739b83be1507
3
  size 614801160
checkpoint-50/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:409682af3c024d58e5d006b75e3f34fa18bc169d0018977e97bab189b743732d
3
  size 312742204
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfa314ed8ffe2040322876ac873f864979ab880ac758867620937ebd26730858
3
  size 312742204
checkpoint-50/trainer_state.json CHANGED
@@ -13,35 +13,35 @@
13
  "epoch": 0.05235602094240838,
14
  "grad_norm": NaN,
15
  "learning_rate": 0.0,
16
- "loss": 9.7678,
17
  "step": 10
18
  },
19
  {
20
  "epoch": 0.10471204188481675,
21
- "grad_norm": 204575.09375,
22
  "learning_rate": 3.1413612565445024e-08,
23
- "loss": 9.1803,
24
  "step": 20
25
  },
26
  {
27
  "epoch": 0.15706806282722513,
28
- "grad_norm": 26470.66015625,
29
  "learning_rate": 1.3612565445026178e-07,
30
- "loss": 3.8501,
31
  "step": 30
32
  },
33
  {
34
  "epoch": 0.2094240837696335,
35
- "grad_norm": 10531.1064453125,
36
  "learning_rate": 2.4083769633507854e-07,
37
- "loss": 3.2742,
38
  "step": 40
39
  },
40
  {
41
  "epoch": 0.2617801047120419,
42
- "grad_norm": 8319.623046875,
43
  "learning_rate": 3.4554973821989523e-07,
44
- "loss": 3.096,
45
  "step": 50
46
  }
47
  ],
 
13
  "epoch": 0.05235602094240838,
14
  "grad_norm": NaN,
15
  "learning_rate": 0.0,
16
+ "loss": 9.7408,
17
  "step": 10
18
  },
19
  {
20
  "epoch": 0.10471204188481675,
21
+ "grad_norm": 202209.765625,
22
  "learning_rate": 3.1413612565445024e-08,
23
+ "loss": 9.1548,
24
  "step": 20
25
  },
26
  {
27
  "epoch": 0.15706806282722513,
28
+ "grad_norm": 27189.787109375,
29
  "learning_rate": 1.3612565445026178e-07,
30
+ "loss": 3.8451,
31
  "step": 30
32
  },
33
  {
34
  "epoch": 0.2094240837696335,
35
+ "grad_norm": 10457.34765625,
36
  "learning_rate": 2.4083769633507854e-07,
37
+ "loss": 3.267,
38
  "step": 40
39
  },
40
  {
41
  "epoch": 0.2617801047120419,
42
+ "grad_norm": 8087.2939453125,
43
  "learning_rate": 3.4554973821989523e-07,
44
+ "loss": 3.0939,
45
  "step": 50
46
  }
47
  ],