soroushheidary committed on
Commit
bd4488a
·
verified ·
1 Parent(s): 84cf1a5

Training in progress, step 33

Browse files
adapter_config.json CHANGED
@@ -2,32 +2,41 @@
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "tiiuae/falcon-11B",
 
 
5
  "bias": "none",
 
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
 
9
  "layer_replication": null,
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
- "lora_alpha": 2,
14
- "lora_dropout": 0.05,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": [
18
  "classifier",
19
  "score"
20
  ],
21
- "peft_type": "LORA",
22
- "r": 8,
23
- "rank_pattern": {},
 
24
  "revision": null,
25
  "target_modules": [
26
- "dense_4h_to_h",
27
  "query_key_value",
 
28
  "dense_h_to_4h"
29
  ],
 
30
  "task_type": "SEQ_CLS",
 
 
 
31
  "use_dora": false,
32
  "use_rslora": false
33
  }
 
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "tiiuae/falcon-11B",
5
+ "beta1": 0.85,
6
+ "beta2": 0.85,
7
  "bias": "none",
8
+ "deltaT": 1,
9
  "fan_in_fan_out": false,
10
  "inference_mode": true,
11
  "init_lora_weights": true,
12
+ "init_r": 12,
13
  "layer_replication": null,
14
  "layers_pattern": null,
15
  "layers_to_transform": null,
16
  "loftq_config": {},
17
+ "lora_alpha": 16,
18
+ "lora_dropout": 0.01,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": [
22
  "classifier",
23
  "score"
24
  ],
25
+ "orth_reg_weight": 0.5,
26
+ "peft_type": "ADALORA",
27
+ "r": 2,
28
+ "rank_pattern": null,
29
  "revision": null,
30
  "target_modules": [
 
31
  "query_key_value",
32
+ "dense_4h_to_h",
33
  "dense_h_to_4h"
34
  ],
35
+ "target_r": 8,
36
  "task_type": "SEQ_CLS",
37
+ "tfinal": 0,
38
+ "tinit": 0,
39
+ "total_step": null,
40
  "use_dora": false,
41
  "use_rslora": false
42
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bdcb2229f86a200df1a5b7b24ac6f1bf46f59a5d0dd00d1e7057bce1cb0ea42d
3
- size 98387400
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15ac6b82791562199642e0730017c4857315128aec43aa4540e84e6e2c9ff714
3
+ size 147569848
runs/Sep29_12-59-11_e3d96b08e858/events.out.tfevents.1727614752.e3d96b08e858.1297.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6df2452b3857f7786d47dba6b2e318e5d1ce42bb9f7084fe12b90f0869b31ee7
3
+ size 13368
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f58392b55571c43a95e5831930510cf8aca4553d7bea5991a6c8325b026b59d
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6d37eb0148f1a37a83c9bef028ee9f98438987c56bdf8023e635dbf864e7910
3
  size 5176