PtRain committed · verified
Commit d35a579 · 1 Parent(s): dd3ab3f

Upload folder using huggingface_hub
README.md ADDED
@@ -0,0 +1,51 @@
+ ---
+ base_model: Qwen2-VL-7B-Instruct
+ library_name: peft
+ ---
+
+ # Model Card
+
+ ## Model Details
+ - **Finetuned from model:** Qwen2-VL-7B-Instruct
+ - **Finetuning datasets:** VAR, YouCookII
+ - **Paper:** AbductiveMLLM: Boosting Visual Abductive Reasoning Within MLLMs
+
+ ## How to Get Started with the Model
+
+ Use the code below to get started with the model.
+
+ ```python
+ from peft import PeftModel
+ from transformers import Qwen2VLForConditionalGeneration
+
+ # load the base model
+ model = Qwen2VLForConditionalGeneration.from_pretrained(
+     'path/to/your/Qwen2-VL-7B-Instruct',
+     torch_dtype='auto',
+     attn_implementation="flash_attention_2"
+ )
+
+ # merge the LoRA adapter from Training Stage-1 into the base weights
+ lora_model_dir = 'qwen2vl_7b_var_lora1'
+ model = PeftModel.from_pretrained(model, model_id=lora_model_dir)
+ model = model.merge_and_unload()
+
+ # merge the LoRA adapter from Training Stage-2 on top of the Stage-1 weights
+ lora2_dir = 'qwen2vl_7b_var_select3_lora2'
+ model = PeftModel.from_pretrained(model, model_id=lora2_dir)
+ model = model.merge_and_unload()
+
+ # run inference as usual; see the sketch below for preparing `inputs`
+ # model.generate(**inputs)
+ ```
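The snippet above stops after merging the adapters. A minimal inference sketch follows, assuming the standard `transformers` processor API for Qwen2-VL; the image path and prompt are illustrative placeholders, not part of the original card:

```python
from PIL import Image
from transformers import AutoProcessor

# the processor comes from the same base checkpoint as the model
processor = AutoProcessor.from_pretrained('path/to/your/Qwen2-VL-7B-Instruct')

# illustrative single-image prompt in the Qwen2-VL chat format
messages = [{
    "role": "user",
    "content": [
        {"type": "image"},
        {"type": "text", "text": "What likely happened just before this scene?"},
    ],
}]
text = processor.apply_chat_template(messages, add_generation_prompt=True)

image = Image.open('example.jpg')  # placeholder image
inputs = processor(text=[text], images=[image], return_tensors='pt').to(model.device)

output_ids = model.generate(**inputs, max_new_tokens=128)
print(processor.batch_decode(output_ids, skip_special_tokens=True)[0])
```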
+
+ ## Citation
+ ```
+ @article{chang2026abductivemllm,
+   title={AbductiveMLLM: Boosting Visual Abductive Reasoning Within MLLMs},
+   author={Chang, Boyu and Wang, Qi and Guo, Xi and Nan, Zhixiong and Yao, Yazhou and Zhou, Tianfei},
+   journal={arXiv preprint arXiv:2601.02771},
+   year={2026}
+ }
+ ```
qwen2vl_7b_var_lora1/adapter_config.json ADDED
@@ -0,0 +1,37 @@
+ {
+   "alpha_pattern": {},
+   "auto_mapping": null,
+   "base_model_name_or_path": "dVAR/LLM_Weights/Qwen2-VL-7B-Instruct",
+   "bias": "none",
+   "eva_config": null,
+   "exclude_modules": null,
+   "fan_in_fan_out": false,
+   "inference_mode": true,
+   "init_lora_weights": true,
+   "layer_replication": null,
+   "layers_pattern": null,
+   "layers_to_transform": null,
+   "loftq_config": {},
+   "lora_alpha": 32,
+   "lora_bias": false,
+   "lora_dropout": 0.05,
+   "megatron_config": null,
+   "megatron_core": "megatron.core",
+   "modules_to_save": null,
+   "peft_type": "LORA",
+   "r": 16,
+   "rank_pattern": {},
+   "revision": null,
+   "target_modules": [
+     "k_proj",
+     "o_proj",
+     "up_proj",
+     "gate_proj",
+     "down_proj",
+     "q_proj",
+     "v_proj"
+   ],
+   "task_type": "CAUSAL_LM",
+   "use_dora": false,
+   "use_rslora": false
+ }
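The Stage-1 adapter is a rank-16 LoRA with `lora_alpha` 32 (effective scaling 32 / 16 = 2.0), injected into the attention and MLP projections. A small sketch, assuming only the `peft` package, of inspecting this config programmatically:

```python
from peft import PeftConfig

# reads adapter_config.json from the adapter directory
config = PeftConfig.from_pretrained('qwen2vl_7b_var_lora1')

print(config.peft_type)               # PeftType.LORA
print(config.r, config.lora_alpha)    # 16 32 -> effective scaling of 2.0
print(sorted(config.target_modules))  # q/k/v/o_proj plus gate/up/down_proj
```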
qwen2vl_7b_var_lora1/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:5d0a12fca5b399467581381ef926a5a33ed9a0c8b17def9957e1c5f0aa6bb8ed
+ size 80792880
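Each `adapter_model.safetensors` entry is a Git LFS pointer: the repo stores only the object's sha256 and byte size, while the weights themselves live in LFS storage. A minimal sketch (the local path is illustrative) of verifying a downloaded file against this pointer:

```python
import hashlib
import os

# hypothetical local path to the downloaded adapter weights
path = 'qwen2vl_7b_var_lora1/adapter_model.safetensors'

# values copied from the LFS pointer above
expected_oid = '5d0a12fca5b399467581381ef926a5a33ed9a0c8b17def9957e1c5f0aa6bb8ed'
expected_size = 80792880

# stream the file through sha256 in 1 MiB chunks
h = hashlib.sha256()
with open(path, 'rb') as f:
    for chunk in iter(lambda: f.read(1 << 20), b''):
        h.update(chunk)

assert os.path.getsize(path) == expected_size, 'size mismatch'
assert h.hexdigest() == expected_oid, 'sha256 mismatch'
```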
qwen2vl_7b_var_select3_lora2/adapter_config.json ADDED
@@ -0,0 +1,99 @@
+ {
+   "alpha_pattern": {},
+   "auto_mapping": null,
+   "base_model_name_or_path": "dVAR/LLM_Weights/Qwen2-VL-7B-Instruct",
+   "bias": "none",
+   "eva_config": null,
+   "exclude_modules": [
+     "text_projection",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn.v_proj"
+   ],
+   "fan_in_fan_out": false,
+   "inference_mode": true,
+   "init_lora_weights": true,
+   "layer_replication": null,
+   "layers_pattern": null,
+   "layers_to_transform": null,
+   "loftq_config": {},
+   "lora_alpha": 32,
+   "lora_bias": false,
+   "lora_dropout": 0.05,
+   "megatron_config": null,
+   "megatron_core": "megatron.core",
+   "modules_to_save": null,
+   "peft_type": "LORA",
+   "r": 16,
+   "rank_pattern": {},
+   "revision": null,
+   "target_modules": [
+     "down_proj",
+     "v_proj",
+     "o_proj",
+     "up_proj",
+     "k_proj",
+     "gate_proj",
+     "q_proj"
+   ],
+   "task_type": "CAUSAL_LM",
+   "use_dora": false,
+   "use_rslora": false
+ }
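Relative to Stage-1, this Stage-2 config adds an `exclude_modules` list that keeps LoRA out of a CLIP text encoder (`clip_text_encoder`, 12 layers) and its `text_projection` head: each layer's `self_attn` block and its q/k/v/out projections are enumerated. A hypothetical sketch of generating the same set:

```python
# hypothetical generator for the exclude_modules list above: the
# text_projection head plus, for each of the 12 CLIP text encoder layers,
# the self_attn block and its four projection submodules
exclude_modules = {"text_projection"}
for layer in range(12):
    attn = f"clip_text_encoder.text_model.encoder.layers.{layer}.self_attn"
    exclude_modules.add(attn)
    exclude_modules.update(
        f"{attn}.{proj}" for proj in ("q_proj", "k_proj", "v_proj", "out_proj")
    )

assert len(exclude_modules) == 61  # matches the 61 entries in the config
```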
qwen2vl_7b_var_select3_lora2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:759802f9cc8c1ede48c21f0aaed0a133667d90724e4a8ca770a9d687a736a103
+ size 161533192
qwen2vl_7b_youcookii_lora1/adapter_config.json ADDED
@@ -0,0 +1,37 @@
+ {
+   "alpha_pattern": {},
+   "auto_mapping": null,
+   "base_model_name_or_path": "dVAR/LLM_Weights/Qwen2-VL-7B-Instruct",
+   "bias": "none",
+   "eva_config": null,
+   "exclude_modules": null,
+   "fan_in_fan_out": false,
+   "inference_mode": true,
+   "init_lora_weights": true,
+   "layer_replication": null,
+   "layers_pattern": null,
+   "layers_to_transform": null,
+   "loftq_config": {},
+   "lora_alpha": 32,
+   "lora_bias": false,
+   "lora_dropout": 0.05,
+   "megatron_config": null,
+   "megatron_core": "megatron.core",
+   "modules_to_save": null,
+   "peft_type": "LORA",
+   "r": 16,
+   "rank_pattern": {},
+   "revision": null,
+   "target_modules": [
+     "k_proj",
+     "q_proj",
+     "up_proj",
+     "o_proj",
+     "down_proj",
+     "v_proj",
+     "gate_proj"
+   ],
+   "task_type": "CAUSAL_LM",
+   "use_dora": false,
+   "use_rslora": false
+ }
qwen2vl_7b_youcookii_lora1/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:47153c635282573c65397d3f253a5a29e4c2d1d25707baaee62e2076f383f05a
+ size 80792880
qwen2vl_7b_youcookii_select3_lora2/adapter_config.json ADDED
@@ -0,0 +1,99 @@
+ {
+   "alpha_pattern": {},
+   "auto_mapping": null,
+   "base_model_name_or_path": "dVAR/LLM_Weights/Qwen2-VL-7B-Instruct",
+   "bias": "none",
+   "eva_config": null,
+   "exclude_modules": [
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn.out_proj",
+     "text_projection",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.4.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.0.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.7.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.10.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.3.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.9.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.5.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn.q_proj",
+     "clip_text_encoder.text_model.encoder.layers.2.self_attn.out_proj",
+     "clip_text_encoder.text_model.encoder.layers.8.self_attn.k_proj",
+     "clip_text_encoder.text_model.encoder.layers.1.self_attn.v_proj",
+     "clip_text_encoder.text_model.encoder.layers.11.self_attn",
+     "clip_text_encoder.text_model.encoder.layers.6.self_attn.out_proj"
+   ],
+   "fan_in_fan_out": false,
+   "inference_mode": true,
+   "init_lora_weights": true,
+   "layer_replication": null,
+   "layers_pattern": null,
+   "layers_to_transform": null,
+   "loftq_config": {},
+   "lora_alpha": 32,
+   "lora_bias": false,
+   "lora_dropout": 0.05,
+   "megatron_config": null,
+   "megatron_core": "megatron.core",
+   "modules_to_save": null,
+   "peft_type": "LORA",
+   "r": 16,
+   "rank_pattern": {},
+   "revision": null,
+   "target_modules": [
+     "down_proj",
+     "gate_proj",
+     "k_proj",
+     "v_proj",
+     "o_proj",
+     "q_proj",
+     "up_proj"
+   ],
+   "task_type": "CAUSAL_LM",
+   "use_dora": false,
+   "use_rslora": false
+ }
qwen2vl_7b_youcookii_select3_lora2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:5205f2327872201d2827fde4a8ad1c170b9efd4b6fb986b41c06b477eede8fe5
+ size 161533192
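The YouCookII adapters mirror the VAR pair (same rank, alpha, and target modules). Assuming the same two-stage merge procedure shown in the README, and with `model` already holding the base Qwen2-VL checkpoint, loading them only swaps the directory names:

```python
from peft import PeftModel

# apply the Stage-1 and Stage-2 YouCookII adapters in training order,
# merging each into the weights before loading the next
for adapter_dir in ('qwen2vl_7b_youcookii_lora1',
                    'qwen2vl_7b_youcookii_select3_lora2'):
    model = PeftModel.from_pretrained(model, model_id=adapter_dir)
    model = model.merge_and_unload()
```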