Tfloow committed on
Commit
25f441e
·
verified ·
1 Parent(s): 1ce6cf9

Training in progress, step 50

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: Meta-Llama-3.1-8B-Instruct-AWQ-INT4_simulated_3-bits_lora
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
  - sft
 
9
  licence: license
10
  ---
11
 
 
4
  model_name: Meta-Llama-3.1-8B-Instruct-AWQ-INT4_simulated_3-bits_lora
5
  tags:
6
  - generated_from_trainer
 
7
  - sft
8
+ - trl
9
  licence: license
10
  ---
11
 
adapter_config.json CHANGED
@@ -4,11 +4,18 @@
4
  "base_model_name_or_path": "hugging-quants/Meta-Llama-3.1-8B-Instruct-AWQ-INT4",
5
  "bias": "none",
6
  "corda_config": null,
7
- "eva_config": null,
 
 
 
 
 
 
 
8
  "exclude_modules": null,
9
  "fan_in_fan_out": false,
10
  "inference_mode": true,
11
- "init_lora_weights": true,
12
  "layer_replication": null,
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
@@ -25,13 +32,13 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
 
28
  "q_proj",
29
- "k_proj",
30
- "v_proj",
31
  "o_proj",
32
- "down_proj",
33
  "up_proj",
34
- "gate_proj"
 
35
  ],
36
  "target_parameters": null,
37
  "task_type": "CAUSAL_LM",
 
4
  "base_model_name_or_path": "hugging-quants/Meta-Llama-3.1-8B-Instruct-AWQ-INT4",
5
  "bias": "none",
6
  "corda_config": null,
7
+ "eva_config": {
8
+ "adjust_scaling_factors": true,
9
+ "label_mask_value": -100,
10
+ "rho": 2.0,
11
+ "tau": 0.99,
12
+ "use_label_mask": true,
13
+ "whiten": false
14
+ },
15
  "exclude_modules": null,
16
  "fan_in_fan_out": false,
17
  "inference_mode": true,
18
+ "init_lora_weights": "eva",
19
  "layer_replication": null,
20
  "layers_pattern": null,
21
  "layers_to_transform": null,
 
32
  "rank_pattern": {},
33
  "revision": null,
34
  "target_modules": [
35
+ "gate_proj",
36
+ "down_proj",
37
  "q_proj",
 
 
38
  "o_proj",
 
39
  "up_proj",
40
+ "v_proj",
41
+ "k_proj"
42
  ],
43
  "target_parameters": null,
44
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89f30b36ab8d7e5c1e5f4027b8ac379dbdd1de5ef263b5b3cbecfff24e2f9fbe
3
  size 167832240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba592187ad1db5c29bfd421685286492d45aff68d43da373e12478269271931a
3
  size 167832240
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4dc31dcae6cf45b6b6d0e1b303a9c79d420a81854e22e52c896c154cab23fd68
3
  size 6353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f5e1440bca299a2a502cfdba638e3636a16a2da6db41726ecc709c0ef6e3388
3
  size 6353