pminervini committed on
Commit
91832e8
·
verified ·
1 Parent(s): 905623e

Training in progress, step 32

Browse files
adapter_config.json CHANGED
@@ -15,17 +15,17 @@
15
  "megatron_core": "megatron.core",
16
  "modules_to_save": null,
17
  "peft_type": "LORA",
18
- "r": 32,
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "o_proj",
23
  "down_proj",
24
- "v_proj",
25
- "gate_proj",
26
- "up_proj",
27
  "k_proj",
28
- "q_proj"
 
 
 
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_dora": false,
 
15
  "megatron_core": "megatron.core",
16
  "modules_to_save": null,
17
  "peft_type": "LORA",
18
+ "r": 64,
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
22
  "down_proj",
23
+ "q_proj",
 
 
24
  "k_proj",
25
+ "o_proj",
26
+ "gate_proj",
27
+ "v_proj",
28
+ "up_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f15e14cba9365f8220a4850b3bcdf9846b3c6c047ddbe878ffb858472058d67
3
- size 78480320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9247a99e657eee355845eca8d6a4c8760786b13dcb8efce91889a93c62b9b25b
3
+ size 156927136
all_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 24.04,
3
- "train_loss": 0.24291648308280855,
4
- "train_runtime": 18372.1559,
5
- "train_samples_per_second": 3.567,
6
- "train_steps_per_second": 0.223
7
  }
 
1
  {
2
+ "epoch": 3.0,
3
+ "train_loss": 0.5746448771096766,
4
+ "train_runtime": 1124.5772,
5
+ "train_samples_per_second": 7.285,
6
+ "train_steps_per_second": 0.455
7
  }
best_metrics.json CHANGED
@@ -1 +1 @@
1
- {"eval_loss": 0.3460787236690521}
 
1
+ {"eval_loss": 0.43469348549842834}
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 24.04,
3
- "train_loss": 0.24291648308280855,
4
- "train_runtime": 18372.1559,
5
- "train_samples_per_second": 3.567,
6
- "train_steps_per_second": 0.223
7
  }
 
1
  {
2
+ "epoch": 3.0,
3
+ "train_loss": 0.5746448771096766,
4
+ "train_runtime": 1124.5772,
5
+ "train_samples_per_second": 7.285,
6
+ "train_steps_per_second": 0.455
7
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1b7377c91947b1cb0e5aef3bd1f8996d27a4271b83c0b7ab8ebcd5796a7a15e
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6ec9b9f5f072535b9595e9544338e214bf19768c7fa12b3894f9ba7b868bfbc
3
  size 4920