Piyu12 committed
Commit 1d52dce · verified · 1 Parent(s): d115813

Upload model trained with Unsloth 2x faster

Files changed (2):
  1. adapter_config.json +10 -6
  2. adapter_model.safetensors +2 -2
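For context, these two files together form a PEFT LoRA adapter: adapter_config.json records where the low-rank layers attach and with what hyperparameters, while adapter_model.safetensors holds their weights. A minimal loading sketch, assuming a transformers version that ships the Mistral3 classes named in the config diff below; the adapter's own repo id is not shown on this page, so the id in the sketch is a placeholder:

    from transformers import AutoProcessor, Mistral3ForConditionalGeneration
    from peft import PeftModel

    base_id = "unsloth/Ministral-3-3B-Instruct-2512"  # base_model_name_or_path from the config
    adapter_id = "Piyu12/..."                         # placeholder: adapter repo id not shown on this page

    # Load the base model, then attach the adapter; PeftModel.from_pretrained
    # reads both changed files (adapter_config.json + adapter_model.safetensors).
    base = Mistral3ForConditionalGeneration.from_pretrained(base_id)
    model = PeftModel.from_pretrained(base, adapter_id)
    processor = AutoProcessor.from_pretrained(base_id)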
adapter_config.json CHANGED

@@ -1,13 +1,16 @@
 {
+  "alora_invocation_tokens": null,
   "alpha_pattern": {},
+  "arrow_config": null,
   "auto_mapping": {
-    "base_model_class": "Qwen3VLForConditionalGeneration",
-    "parent_library": "transformers.models.qwen3_vl.modeling_qwen3_vl",
+    "base_model_class": "Mistral3ForConditionalGeneration",
+    "parent_library": "transformers.models.mistral3.modeling_mistral3",
     "unsloth_fixed": true
   },
-  "base_model_name_or_path": "unsloth/qwen3-vl-8b-instruct-unsloth-bnb-4bit",
+  "base_model_name_or_path": "unsloth/Ministral-3-3B-Instruct-2512",
   "bias": "none",
   "corda_config": null,
+  "ensure_weight_tying": false,
   "eva_config": null,
   "exclude_modules": null,
   "fan_in_fan_out": false,
@@ -17,18 +20,19 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 16,
+  "lora_alpha": 32,
   "lora_bias": false,
   "lora_dropout": 0,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "peft_version": "0.18.0",
   "qalora_group_size": 16,
-  "r": 16,
+  "r": 32,
   "rank_pattern": {},
   "revision": null,
-  "target_modules": "(?:.*?(?:vision|image|visual|patch|language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:qkv|proj|linear_fc1|linear_fc2|q_proj|k_proj|v_proj|o_proj|gate_proj|up_proj|down_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:qkv|proj|linear_fc1|linear_fc2|q_proj|k_proj|v_proj|o_proj|gate_proj|up_proj|down_proj)))",
+  "target_modules": "(?:.*?(?:vision|image|visual|patch|language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:gate_proj|up_proj|down_proj|k_proj|v_proj|q_proj|o_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:gate_proj|up_proj|down_proj|k_proj|v_proj|q_proj|o_proj)))",
   "target_parameters": null,
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,
adapter_model.safetensors CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4ebc8e7f0ebbb4b96d07491f6c2e99dcb0ce26632cbabf92f9a51d8c2718723d
-size 205492968
+oid sha256:540cabd278419a0633ea5598b9e261ee394d4db3f7989b1dda1f3f146514191a
+size 270117632
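The weights file is stored as a Git LFS pointer, so the oid and size above identify the actual blob (~258 MiB, up from ~196 MiB). A minimal sketch for checking a downloaded copy against this pointer; the local filename is an assumption:

    import hashlib
    from pathlib import Path

    # Values copied from the new LFS pointer above.
    EXPECTED_SHA256 = "540cabd278419a0633ea5598b9e261ee394d4db3f7989b1dda1f3f146514191a"
    EXPECTED_SIZE = 270_117_632  # bytes, ~258 MiB

    def verify_lfs_object(path: str) -> None:
        """Compare a local file's size and sha256 against the LFS pointer."""
        p = Path(path)
        size = p.stat().st_size
        if size != EXPECTED_SIZE:
            raise ValueError(f"size mismatch: {size} != {EXPECTED_SIZE}")
        digest = hashlib.sha256()
        with p.open("rb") as f:
            for chunk in iter(lambda: f.read(1 << 20), b""):  # hash in 1 MiB chunks
                digest.update(chunk)
        if digest.hexdigest() != EXPECTED_SHA256:
            raise ValueError(f"sha256 mismatch: {digest.hexdigest()}")
        print("OK: file matches the LFS pointer")

    verify_lfs_object("adapter_model.safetensors")  # local path is an assumption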