AIsumit123 committed on
Commit
15cf3bc
·
verified ·
1 Parent(s): 94c749f

Training in progress, step 10

Browse files
adapter_config.json CHANGED
@@ -3,7 +3,7 @@
3
  "alpha_pattern": {},
4
  "arrow_config": null,
5
  "auto_mapping": null,
6
- "base_model_name_or_path": "google/mt5-small",
7
  "bias": "none",
8
  "corda_config": null,
9
  "ensure_weight_tying": false,
@@ -16,23 +16,27 @@
16
  "layers_pattern": null,
17
  "layers_to_transform": null,
18
  "loftq_config": {},
19
- "lora_alpha": 32,
20
  "lora_bias": false,
21
  "lora_dropout": 0.05,
22
  "megatron_config": null,
23
  "megatron_core": "megatron.core",
24
- "modules_to_save": null,
 
 
25
  "peft_type": "LORA",
26
  "peft_version": "0.18.0",
27
  "qalora_group_size": 16,
28
- "r": 16,
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
  "q",
33
- "o",
34
  "k",
35
- "v"
 
 
36
  ],
37
  "target_parameters": null,
38
  "task_type": "SEQ_2_SEQ_LM",
 
3
  "alpha_pattern": {},
4
  "arrow_config": null,
5
  "auto_mapping": null,
6
+ "base_model_name_or_path": "google/mt5-base",
7
  "bias": "none",
8
  "corda_config": null,
9
  "ensure_weight_tying": false,
 
16
  "layers_pattern": null,
17
  "layers_to_transform": null,
18
  "loftq_config": {},
19
+ "lora_alpha": 64,
20
  "lora_bias": false,
21
  "lora_dropout": 0.05,
22
  "megatron_config": null,
23
  "megatron_core": "megatron.core",
24
+ "modules_to_save": [
25
+ "lm_head"
26
+ ],
27
  "peft_type": "LORA",
28
  "peft_version": "0.18.0",
29
  "qalora_group_size": 16,
30
+ "r": 32,
31
  "rank_pattern": {},
32
  "revision": null,
33
  "target_modules": [
34
  "q",
35
+ "v",
36
  "k",
37
+ "wi_1",
38
+ "wi_0",
39
+ "wo"
40
  ],
41
  "target_parameters": null,
42
  "task_type": "SEQ_2_SEQ_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:773536de88447595b67a1d37ffb7c112d6c9a139a54bf929540bde4d49c877f8
3
- size 5531800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:008544ce963eb3d5056775af96004ba688d133021d742a107ceafe07070e4ccf
3
+ size 815581456
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a522bc2d1d1079fb198e48926a65db109911f8c0fe54c0a30d01e91079a1687d
3
- size 6097
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa3522c0523845f65b29d7fd5f1f6653fe6516b7bdbd22510a99199b6e2e1ef6
3
+ size 5688