ABrain-One committed on
Commit
718d621
·
verified ·
1 Parent(s): fabe28c

Upload model

Browse files
Files changed (3) hide show
  1. README.md +19 -0
  2. adapter_config.json +34 -0
  3. adapter_model.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: deepseek-ai/deepseek-coder-1.3b-instruct_raw
3
+ library_name: peft
4
+ ---
5
+
6
+ # Model Card for Model ID
7
+
8
+ This model is trained to produce modified computer-vision (CV) model implementations for the LEMUR dataset project, in order to extend the dataset.
9
+
10
+ ## Model Details
11
+
12
+ ### Model Description
13
+
14
+ The model can change parameters or layers when asked to improve the implementation of code provided from the LEMUR project. Its answer should contain only code, without explanations, even when the prompt does not explicitly require this. The model should respond with code whose methods meet the requirements of the LEMUR dataset. For most code of average implementation complexity, at least one change should be guaranteed.
15
+
16
+ - **Model type:** PEFT adapter (LoRA with DoRA enabled)
17
+ - **Language(s):** English
18
+ - **License:** MIT
19
+ - **Finetuned from model:** deepseek-ai/deepseek-coder-1.3b-instruct_raw
adapter_config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "deepseek-ai/deepseek-coder-1.3b-instruct_raw",
5
+ "bias": "none",
6
+ "fan_in_fan_out": false,
7
+ "inference_mode": true,
8
+ "init_lora_weights": true,
9
+ "layer_replication": null,
10
+ "layers_pattern": null,
11
+ "layers_to_transform": null,
12
+ "loftq_config": {},
13
+ "lora_alpha": 64,
14
+ "lora_dropout": 0.1,
15
+ "megatron_config": null,
16
+ "megatron_core": "megatron.core",
17
+ "modules_to_save": null,
18
+ "peft_type": "LORA",
19
+ "r": 64,
20
+ "rank_pattern": {},
21
+ "revision": null,
22
+ "target_modules": [
23
+ "v_proj",
24
+ "o_proj",
25
+ "k_proj",
26
+ "up_proj",
27
+ "gate_proj",
28
+ "down_proj",
29
+ "q_proj"
30
+ ],
31
+ "task_type": "CAUSAL_LM",
32
+ "use_dora": true,
33
+ "use_rslora": false
34
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8a29fc297e9903d6eac45df051eea0f83fa8f801874076f986f8fdfa0765688
3
+ size 241970040