VyDat committed on
Commit
8e99680
·
verified ·
1 Parent(s): 7cb8b4a

Upload model trained with Unsloth

Browse files

Upload model trained with Unsloth 2x faster

Files changed (2) hide show
  1. adapter_config.json +6 -11
  2. adapter_model.safetensors +2 -2
adapter_config.json CHANGED
@@ -1,16 +1,13 @@
1
  {
2
- "alora_invocation_tokens": null,
3
  "alpha_pattern": {},
4
- "arrow_config": null,
5
  "auto_mapping": {
6
  "base_model_class": "LlamaForCausalLM",
7
  "parent_library": "transformers.models.llama.modeling_llama",
8
  "unsloth_fixed": true
9
  },
10
- "base_model_name_or_path": "unsloth/Llama-3.2-1B-Instruct",
11
  "bias": "none",
12
  "corda_config": null,
13
- "ensure_weight_tying": false,
14
  "eva_config": null,
15
  "exclude_modules": null,
16
  "fan_in_fan_out": false,
@@ -20,28 +17,26 @@
20
  "layers_pattern": null,
21
  "layers_to_transform": null,
22
  "loftq_config": {},
23
- "lora_alpha": 128,
24
  "lora_bias": false,
25
- "lora_dropout": 0.05,
26
  "megatron_config": null,
27
  "megatron_core": "megatron.core",
28
  "modules_to_save": null,
29
  "peft_type": "LORA",
30
- "peft_version": "0.18.0",
31
  "qalora_group_size": 16,
32
- "r": 64,
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
- "down_proj",
37
  "up_proj",
38
- "v_proj",
39
  "o_proj",
40
  "gate_proj",
 
41
  "q_proj",
42
  "k_proj"
43
  ],
44
- "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
46
  "trainable_token_indices": null,
47
  "use_dora": false,
 
1
  {
 
2
  "alpha_pattern": {},
 
3
  "auto_mapping": {
4
  "base_model_class": "LlamaForCausalLM",
5
  "parent_library": "transformers.models.llama.modeling_llama",
6
  "unsloth_fixed": true
7
  },
8
+ "base_model_name_or_path": "unsloth/llama-3.2-1b-instruct-unsloth-bnb-4bit",
9
  "bias": "none",
10
  "corda_config": null,
 
11
  "eva_config": null,
12
  "exclude_modules": null,
13
  "fan_in_fan_out": false,
 
17
  "layers_pattern": null,
18
  "layers_to_transform": null,
19
  "loftq_config": {},
20
+ "lora_alpha": 16,
21
  "lora_bias": false,
22
+ "lora_dropout": 0,
23
  "megatron_config": null,
24
  "megatron_core": "megatron.core",
25
  "modules_to_save": null,
26
  "peft_type": "LORA",
 
27
  "qalora_group_size": 16,
28
+ "r": 16,
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
 
32
  "up_proj",
33
+ "down_proj",
34
  "o_proj",
35
  "gate_proj",
36
+ "v_proj",
37
  "q_proj",
38
  "k_proj"
39
  ],
 
40
  "task_type": "CAUSAL_LM",
41
  "trainable_token_indices": null,
42
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9619e6452d6ed71e55d161ffff90da152359c4d856ee93a74e43494118f1717
3
- size 180385008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c819383131287784820d5ad14a2a6b0267e03d2b3e190e4d8fa7ab6cd948a12
3
+ size 45118424