nour4286 commited on
Commit
004e91a
·
verified ·
1 Parent(s): d99d6f6

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e165614c217b762f552934561d88155cf0e7cc4d5a5298b404fd39e3d22d5e08
3
  size 557116312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c2a8d90aa234ac44475d39409dfbfa4fdb26f65d52a62de6861c428091b8ec8
3
  size 557116312
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e911663be690fcc16c588d5b34cf04dda3344d52a411d30cb50207ba0266d71
3
  size 1113991930
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e24858682d1d6129b19e305ab6bb61cdca3709f8c6b2b91eaf6b426db53a7515
3
  size 1113991930
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59624509e89bbc9b94c591ed4735982e33caa7e6875690c4ff16d1a97717d87c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef2b170a520baa1ce18377bdacbbdccab7978596a4a772af3bdbdf4cfda617a7
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ac9643ef164647dd74d17c68b79347a9f51627588cd7ec3dd1a18bf83f7e68f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be41d27c52015159c12ea1a39d342a8acabee4a3e8b9b9a41f77607cbb01aef6
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 2.6116,
3
- "best_model_checkpoint": "my-model/checkpoint-1528",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 1528,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -40,6 +40,39 @@
40
  "eval_samples_per_second": 5.2,
41
  "eval_steps_per_second": 0.521,
42
  "step": 1528
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
43
  }
44
  ],
45
  "logging_steps": 500,
@@ -59,7 +92,7 @@
59
  "attributes": {}
60
  }
61
  },
62
- "total_flos": 7327420304523264.0,
63
  "train_batch_size": 10,
64
  "trial_name": null,
65
  "trial_params": null
 
1
  {
2
+ "best_metric": 3.0744,
3
+ "best_model_checkpoint": "my-model/checkpoint-3056",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 3056,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
40
  "eval_samples_per_second": 5.2,
41
  "eval_steps_per_second": 0.521,
42
  "step": 1528
43
+ },
44
+ {
45
+ "epoch": 1.3089005235602094,
46
+ "grad_norm": 3.5784597396850586,
47
+ "learning_rate": 2.8184991273996508e-05,
48
+ "loss": 0.0605,
49
+ "step": 2000
50
+ },
51
+ {
52
+ "epoch": 1.6361256544502618,
53
+ "grad_norm": 3.948634624481201,
54
+ "learning_rate": 2.273123909249564e-05,
55
+ "loss": 0.1013,
56
+ "step": 2500
57
+ },
58
+ {
59
+ "epoch": 1.9633507853403143,
60
+ "grad_norm": 5.947019577026367,
61
+ "learning_rate": 1.7277486910994763e-05,
62
+ "loss": 0.2594,
63
+ "step": 3000
64
+ },
65
+ {
66
+ "epoch": 2.0,
67
+ "eval_loss": 4.7294816970825195,
68
+ "eval_rouge1": 3.0744,
69
+ "eval_rouge2": 0.2582,
70
+ "eval_rougeL": 3.0319,
71
+ "eval_rougeLsum": 3.0448,
72
+ "eval_runtime": 416.9983,
73
+ "eval_samples_per_second": 5.264,
74
+ "eval_steps_per_second": 0.528,
75
+ "step": 3056
76
  }
77
  ],
78
  "logging_steps": 500,
 
92
  "attributes": {}
93
  }
94
  },
95
+ "total_flos": 1.4662889498529792e+16,
96
  "train_batch_size": 10,
97
  "trial_name": null,
98
  "trial_params": null