weathon committed on
Commit
4fd48f6
·
verified ·
1 Parent(s): 9539c80

Training in progress, step 200

Browse files
adapter_config.json CHANGED
@@ -16,7 +16,7 @@
16
  "layers_pattern": null,
17
  "layers_to_transform": null,
18
  "loftq_config": {},
19
- "lora_alpha": 32,
20
  "lora_bias": false,
21
  "lora_dropout": 0.0,
22
  "megatron_config": null,
@@ -24,39 +24,39 @@
24
  "modules_to_save": null,
25
  "peft_type": "LORA",
26
  "qalora_group_size": 16,
27
- "r": 32,
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
- "projections.1",
32
- "projections.4",
33
- "fc1",
34
- "projection",
35
- "query",
36
- "projections.10",
37
- "itm_head",
38
- "projections.12",
39
  "fc2",
 
 
 
 
40
  "projections.8",
 
 
 
 
41
  "value",
42
- "projections.0",
43
- "projections.16",
44
- "projections.3",
45
  "vision_projection",
 
 
46
  "projections.7",
47
- "qkv",
48
- "projections.9",
49
- "text_projection",
50
- "projections.11",
51
- "projections.17",
52
- "key",
53
  "projections.13",
54
- "projections.6",
55
- "dense",
 
 
56
  "projections.15",
 
 
 
 
57
  "projections.5",
58
- "projections.14",
59
- "projections.2"
60
  ],
61
  "target_parameters": null,
62
  "task_type": null,
 
16
  "layers_pattern": null,
17
  "layers_to_transform": null,
18
  "loftq_config": {},
19
+ "lora_alpha": 64,
20
  "lora_bias": false,
21
  "lora_dropout": 0.0,
22
  "megatron_config": null,
 
24
  "modules_to_save": null,
25
  "peft_type": "LORA",
26
  "qalora_group_size": 16,
27
+ "r": 64,
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
+ "projections.16",
 
 
 
 
 
 
 
32
  "fc2",
33
+ "projections.10",
34
+ "projections.3",
35
+ "projections.14",
36
+ "projections.4",
37
  "projections.8",
38
+ "projections.1",
39
+ "projections.17",
40
+ "projections.9",
41
+ "projections.6",
42
  "value",
 
 
 
43
  "vision_projection",
44
+ "dense",
45
+ "query",
46
  "projections.7",
 
 
 
 
 
 
47
  "projections.13",
48
+ "key",
49
+ "projection",
50
+ "text_projection",
51
+ "projections.0",
52
  "projections.15",
53
+ "projections.11",
54
+ "projections.12",
55
+ "qkv",
56
+ "itm_head",
57
  "projections.5",
58
+ "projections.2",
59
+ "fc1"
60
  ],
61
  "target_parameters": null,
62
  "task_type": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ea07561893b40da0e74760e3e05b48effecec53c4075af3b189d2ea37595943
3
- size 157934960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efe22196619394984462a449a57d5f4e05e9b83dd6618964b479c8e620a21a06
3
+ size 315779008
runs/Oct08_02-36-25_e41bbb0dd69c/events.out.tfevents.1759890986.e41bbb0dd69c.19881.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e36be2b8de33472d053e20c565f9153091a22582c9e9daedb7ebc900f6c16975
3
+ size 8885
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a285df2580f8deb2fb52d6b92c8381ec9089f886f7cb7b83162af42771ac5544
3
  size 5777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7fb6989cd71af6446aaa7bbd135f1650d8a343e3c2323bad4ded21895b574d9
3
  size 5777