ExplosionNuclear committed on
Commit
5be5061
·
verified ·
1 Parent(s): d3ef8a4

Training in progress, step 15

Browse files
adapter_config.json CHANGED
@@ -3,7 +3,6 @@
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "ExplosionNuclear/Llama-2.3-3B-Instruct-special",
5
  "bias": "lora_only",
6
- "corda_config": null,
7
  "eva_config": null,
8
  "exclude_modules": null,
9
  "fan_in_fan_out": false,
@@ -20,22 +19,19 @@
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
- "qalora_group_size": 16,
24
  "r": 2,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "v_proj",
29
- "k_proj",
30
- "up_proj",
31
  "down_proj",
 
 
 
32
  "o_proj",
33
- "q_proj",
34
- "gate_proj"
35
  ],
36
  "task_type": "CAUSAL_LM",
37
- "trainable_token_indices": null,
38
  "use_dora": false,
39
- "use_qalora": false,
40
  "use_rslora": false
41
  }
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "ExplosionNuclear/Llama-2.3-3B-Instruct-special",
5
  "bias": "lora_only",
 
6
  "eva_config": null,
7
  "exclude_modules": null,
8
  "fan_in_fan_out": false,
 
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": null,
21
  "peft_type": "LORA",
 
22
  "r": 2,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "q_proj",
 
 
27
  "down_proj",
28
+ "gate_proj",
29
+ "k_proj",
30
+ "v_proj",
31
  "o_proj",
32
+ "up_proj"
 
33
  ],
34
  "task_type": "CAUSAL_LM",
 
35
  "use_dora": false,
 
36
  "use_rslora": false
37
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f9088699c7de898863be4a0ac3afce54378ef66fa50e665fbd3a4337d19daec
3
  size 12208024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccdeb117b5321cf3e23865ef2f2c13211bb3324e92c66f1382ac3ea1830d0d4d
3
  size 12208024
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5ea7cd63307494abcbf6ce5ffe37692631cd23cfa2dc6e50c08f465d3115335
3
- size 14520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec95a8c46bcb2a0d603ebb4f2931ba97a766a3794b3ccf712b7d4cbdaf37e41b
3
+ size 18936