bhuvanmdev commited on
Commit
d73d3b4
·
verified ·
1 Parent(s): 652230a

Training in progress, step 720, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50e6594b364a0fbb854abb5d965c726e8f15fa01c9001b41d915e779549b2215
3
  size 1316913776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fea491b3b1391cebeed659bd3578d064da132e8ae050b25368833ae5a10ca588
3
  size 1316913776
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9629f232980735b2c724e023cd63526e09d46d3ef9ec65dbafa2e8570647df4b
3
  size 8908124
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04ed2b24885e7eebc909afa04e3fc3dcc986e27c10b7a80cc077f1a38645d3a8
3
  size 8908124
last-checkpoint/rng_state.pth CHANGED
Binary files a/last-checkpoint/rng_state.pth and b/last-checkpoint/rng_state.pth differ
 
last-checkpoint/scheduler.pt CHANGED
Binary files a/last-checkpoint/scheduler.pt and b/last-checkpoint/scheduler.pt differ
 
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.15242593387720052,
5
  "eval_steps": 500,
6
- "global_step": 710,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -504,6 +504,13 @@
504
  "learning_rate": 0.00042378703306139977,
505
  "loss": 0.8205,
506
  "step": 710
 
 
 
 
 
 
 
507
  }
508
  ],
509
  "logging_steps": 10,
@@ -511,7 +518,7 @@
511
  "num_input_tokens_seen": 0,
512
  "num_train_epochs": 1,
513
  "save_steps": 10,
514
- "total_flos": 5.317746260637773e+16,
515
  "train_batch_size": 3,
516
  "trial_name": null,
517
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.15457277801631603,
5
  "eval_steps": 500,
6
+ "global_step": 720,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
504
  "learning_rate": 0.00042378703306139977,
505
  "loss": 0.8205,
506
  "step": 710
507
+ },
508
+ {
509
+ "epoch": 0.15457277801631603,
510
+ "grad_norm": 1.7332643270492554,
511
+ "learning_rate": 0.00042271361099184204,
512
+ "loss": 0.845,
513
+ "step": 720
514
  }
515
  ],
516
  "logging_steps": 10,
 
518
  "num_input_tokens_seen": 0,
519
  "num_train_epochs": 1,
520
  "save_steps": 10,
521
+ "total_flos": 5.413961972677248e+16,
522
  "train_batch_size": 3,
523
  "trial_name": null,
524
  "trial_params": null