Buura committed on
Commit
7600d4c
·
verified ·
1 Parent(s): 732aa81

Upload folder using huggingface_hub

Browse files
checkpoints/checkpoint-1800/README.md CHANGED
@@ -1,6 +1,11 @@
1
  ---
2
  base_model: Qwen/Qwen2.5-Coder-1.5B
3
  library_name: peft
 
 
 
 
 
4
  ---
5
 
6
  # Model Card for Model ID
@@ -199,4 +204,4 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
199
  [More Information Needed]
200
  ### Framework versions
201
 
202
- - PEFT 0.15.2
 
1
  ---
2
  base_model: Qwen/Qwen2.5-Coder-1.5B
3
  library_name: peft
4
+ pipeline_tag: text-generation
5
+ tags:
6
+ - base_model:adapter:Qwen/Qwen2.5-Coder-1.5B
7
+ - lora
8
+ - transformers
9
  ---
10
 
11
  # Model Card for Model ID
 
204
  [More Information Needed]
205
  ### Framework versions
206
 
207
+ - PEFT 0.17.0
checkpoints/checkpoint-1800/adapter_config.json CHANGED
@@ -20,17 +20,20 @@
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
- "r": 8,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
 
27
  "q_proj",
28
  "v_proj",
29
- "o_proj",
30
- "k_proj"
31
  ],
 
32
  "task_type": "CAUSAL_LM",
33
  "trainable_token_indices": null,
34
  "use_dora": false,
 
35
  "use_rslora": false
36
  }
 
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
+ "qalora_group_size": 16,
24
+ "r": 16,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
+ "k_proj",
29
  "q_proj",
30
  "v_proj",
31
+ "o_proj"
 
32
  ],
33
+ "target_parameters": null,
34
  "task_type": "CAUSAL_LM",
35
  "trainable_token_indices": null,
36
  "use_dora": false,
37
+ "use_qalora": false,
38
  "use_rslora": false
39
  }
checkpoints/checkpoint-1800/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1033f30fe198c963ab4adb761d769603e4bb2d0f472a486c62db933d02500cd8
3
- size 8745704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73c47728d651268e06825556e0863e2c90727bcff62056689679ea9e6aa5f2ef
3
+ size 17462432