youssefedweqd commited on
Commit
da137e0
·
verified ·
1 Parent(s): 27bfe90

Training in progress, step 300, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -23,13 +23,13 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "up_proj",
27
- "o_proj",
28
  "k_proj",
 
29
  "down_proj",
30
- "q_proj",
31
  "gate_proj",
32
- "v_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "q_proj",
27
+ "v_proj",
28
  "k_proj",
29
+ "up_proj",
30
  "down_proj",
 
31
  "gate_proj",
32
+ "o_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:374da347622d668269859b72eea6f2d0b4a91b341a780d5b61734db381dfaa05
3
  size 161533160
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbb4f2a54acdd2dc060e3f9b839392093f0072bde87714829f2c22879be8a83b
3
  size 161533160
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e87be9e7a373870535fef2fa6152f10c18656b3e076faafdcd2eb3a7235ee483
3
  size 323292202
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9692d49a09a3c2f840030cbb28ca611ed0b3e2db87ed53e29bafb9a9ff2c6c81
3
  size 323292202
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f8f252de09a4793e5f13e772318938c884d18658b3687d3f2f6915920086464
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:061821e3d04852eeae52afa7567aad700ed25cb9e80039e019f6142953cc33e4
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.033112582781456956,
6
  "eval_steps": 100,
7
- "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -52,6 +52,20 @@
52
  "eval_samples_per_second": 3.185,
53
  "eval_steps_per_second": 3.185,
54
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  }
56
  ],
57
  "logging_steps": 50,
@@ -71,7 +85,7 @@
71
  "attributes": {}
72
  }
73
  },
74
- "total_flos": 1563083893899264.0,
75
  "train_batch_size": 1,
76
  "trial_name": null,
77
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.04966887417218543,
6
  "eval_steps": 100,
7
+ "global_step": 300,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
52
  "eval_samples_per_second": 3.185,
53
  "eval_steps_per_second": 3.185,
54
  "step": 200
55
+ },
56
+ {
57
+ "epoch": 0.041390728476821195,
58
+ "grad_norm": 3.0053958892822266,
59
+ "learning_rate": 1.3741721854304637e-05,
60
+ "loss": 0.9816,
61
+ "step": 250
62
+ },
63
+ {
64
+ "epoch": 0.04966887417218543,
65
+ "grad_norm": 3.028010368347168,
66
+ "learning_rate": 1.6501103752759385e-05,
67
+ "loss": 0.9372,
68
+ "step": 300
69
  }
70
  ],
71
  "logging_steps": 50,
 
85
  "attributes": {}
86
  }
87
  },
88
+ "total_flos": 2342017777532928.0,
89
  "train_batch_size": 1,
90
  "trial_name": null,
91
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a2edd0949861cb7badd527f7095b9c2224394d2fdbe771dec750a5cdb83b3f5
3
- size 5688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dd2ef96eff028fc6db83c8627ce2e789cafe652a25ea367c040819bc392f916
3
+ size 5752