KritiBanka1204 commited on
Commit
f5a96f6
·
verified ·
1 Parent(s): 3a74465

Upload fine-tuned checkpoint

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90ded5363c2db97ff3750527e380a2c1f5ec45ea549c35b83e8fc41c24e45755
3
  size 27297032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0539a36e6a74f2a3406db8fa6dca951caa7964905378b7db1054dcf33f2eb9db
3
  size 27297032
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b03510e887c64ac3a15f4caa9a6b07fa75481aedaca8cf441644a811a5addb9e
3
  size 54741195
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46b2ca18f46519ce107b56d52f4fbfd44ce18c555787d3803f48d182d4ed3fe0
3
  size 54741195
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd779a83acd3715c3d89d4b2113b579f25c288a6885c23419474a59b3d94b13a
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56aaeecdd7e946f32ea405fcbda9013bb4265f7535e6c1c8a57deda409eecc43
3
  size 14645
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31c8db2337dd529c4305ba9ec942095fa6efc6b665b33070cf7956020c7f5bb6
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73418fb68e188969c98f7ed1c862c2617299d539423cbbbbdd8d7bf13c2ac383
3
  size 1465
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 600,
3
- "best_metric": 0.5126457214355469,
4
  "best_model_checkpoint": "./opencoder8b_finetuned/checkpoint-400",
5
- "epoch": 3.0,
6
  "eval_steps": 200,
7
- "global_step": 732,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -52,35 +52,6 @@
52
  "eval_samples_per_second": 4.328,
53
  "eval_steps_per_second": 0.544,
54
  "step": 400
55
- },
56
- {
57
- "epoch": 2.0491803278688523,
58
- "grad_norm": 0.17177526652812958,
59
- "learning_rate": 7.3625016623302155e-06,
60
- "loss": 0.5556,
61
- "step": 500
62
- },
63
- {
64
- "epoch": 2.459016393442623,
65
- "grad_norm": 0.26423564553260803,
66
- "learning_rate": 6.022760330631006e-06,
67
- "loss": 0.5291,
68
- "step": 600
69
- },
70
- {
71
- "epoch": 2.459016393442623,
72
- "eval_loss": 0.5126457214355469,
73
- "eval_runtime": 199.6781,
74
- "eval_samples_per_second": 4.347,
75
- "eval_steps_per_second": 0.546,
76
- "step": 600
77
- },
78
- {
79
- "epoch": 2.8688524590163933,
80
- "grad_norm": 0.23801229894161224,
81
- "learning_rate": 4.599860978031383e-06,
82
- "loss": 0.5239,
83
- "step": 700
84
  }
85
  ],
86
  "logging_steps": 100,
@@ -109,7 +80,7 @@
109
  "attributes": {}
110
  }
111
  },
112
- "total_flos": 1.34827040065536e+18,
113
  "train_batch_size": 8,
114
  "trial_name": null,
115
  "trial_params": null
 
1
  {
2
+ "best_global_step": 400,
3
+ "best_metric": 0.5587947964668274,
4
  "best_model_checkpoint": "./opencoder8b_finetuned/checkpoint-400",
5
+ "epoch": 1.639344262295082,
6
  "eval_steps": 200,
7
+ "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
52
  "eval_samples_per_second": 4.328,
53
  "eval_steps_per_second": 0.544,
54
  "step": 400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  }
56
  ],
57
  "logging_steps": 100,
 
80
  "attributes": {}
81
  }
82
  },
83
+ "total_flos": 7.36870224949248e+17,
84
  "train_batch_size": 8,
85
  "trial_name": null,
86
  "trial_params": null