codegood committed on
Commit
4a24086
·
verified ·
1 Parent(s): 769aeaa

Upload model trained with Unsloth

Browse files

Upload model trained with Unsloth 2x faster

Files changed (2) hide show
  1. adapter_config.json +0 -5
  2. adapter_model.safetensors +1 -1
adapter_config.json CHANGED
@@ -1,7 +1,5 @@
1
  {
2
- "alora_invocation_tokens": null,
3
  "alpha_pattern": {},
4
- "arrow_config": null,
5
  "auto_mapping": {
6
  "base_model_class": "Gemma3ForConditionalGeneration",
7
  "parent_library": "transformers.models.gemma3.modeling_gemma3",
@@ -10,7 +8,6 @@
10
  "base_model_name_or_path": "unsloth/gemma-3-4b-pt-unsloth-bnb-4bit",
11
  "bias": "none",
12
  "corda_config": null,
13
- "ensure_weight_tying": false,
14
  "eva_config": null,
15
  "exclude_modules": null,
16
  "fan_in_fan_out": false,
@@ -27,13 +24,11 @@
27
  "megatron_core": "megatron.core",
28
  "modules_to_save": null,
29
  "peft_type": "LORA",
30
- "peft_version": "0.18.0",
31
  "qalora_group_size": 16,
32
  "r": 16,
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": "(?:.*?(?:vision|image|visual|patch|language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:k_proj|v_proj|q_proj|out_proj|fc1|fc2|o_proj|gate_proj|up_proj|down_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:k_proj|v_proj|q_proj|out_proj|fc1|fc2|o_proj|gate_proj|up_proj|down_proj)))",
36
- "target_parameters": null,
37
  "task_type": "CAUSAL_LM",
38
  "trainable_token_indices": null,
39
  "use_dora": false,
 
1
  {
 
2
  "alpha_pattern": {},
 
3
  "auto_mapping": {
4
  "base_model_class": "Gemma3ForConditionalGeneration",
5
  "parent_library": "transformers.models.gemma3.modeling_gemma3",
 
8
  "base_model_name_or_path": "unsloth/gemma-3-4b-pt-unsloth-bnb-4bit",
9
  "bias": "none",
10
  "corda_config": null,
 
11
  "eva_config": null,
12
  "exclude_modules": null,
13
  "fan_in_fan_out": false,
 
24
  "megatron_core": "megatron.core",
25
  "modules_to_save": null,
26
  "peft_type": "LORA",
 
27
  "qalora_group_size": 16,
28
  "r": 16,
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": "(?:.*?(?:vision|image|visual|patch|language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:k_proj|v_proj|q_proj|out_proj|fc1|fc2|o_proj|gate_proj|up_proj|down_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:k_proj|v_proj|q_proj|out_proj|fc1|fc2|o_proj|gate_proj|up_proj|down_proj)))",
 
32
  "task_type": "CAUSAL_LM",
33
  "trainable_token_indices": null,
34
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:466935ebb2625b641e2e2e1dd5d64f94f89d5b797efb8282c63fcf65256fb381
3
  size 154116312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cd7ad46ae4dd8e47169ce11ac701ab414ec1a85f4b6b80d208936233d5bfe91
3
  size 154116312