weathon committed on
Commit
afd7526
·
verified ·
1 Parent(s): 2481270

Training in progress, step 300

Browse files
README.md CHANGED
@@ -1,17 +1,17 @@
1
  ---
2
- base_model: Qwen/Qwen2.5-VL-32B-Instruct
3
  library_name: transformers
4
  model_name: anti_aesthetics_captioning
5
  tags:
6
  - generated_from_trainer
7
- - sft
8
  - trl
 
9
  licence: license
10
  ---
11
 
12
  # Model Card for anti_aesthetics_captioning
13
 
14
- This model is a fine-tuned version of [Qwen/Qwen2.5-VL-32B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-32B-Instruct).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
@@ -27,7 +27,7 @@ print(output["generated_text"])
27
 
28
  ## Training procedure
29
 
30
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/3dsmile/huggingface/runs/epb6vhi4)
31
 
32
 
33
  This model was trained with SFT.
 
1
  ---
2
+ base_model: Qwen/Qwen2.5-VL-7B-Instruct
3
  library_name: transformers
4
  model_name: anti_aesthetics_captioning
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - sft
9
  licence: license
10
  ---
11
 
12
  # Model Card for anti_aesthetics_captioning
13
 
14
+ This model is a fine-tuned version of [Qwen/Qwen2.5-VL-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-7B-Instruct).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
 
27
 
28
  ## Training procedure
29
 
30
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/3dsmile/huggingface/runs/4n52rfyh)
31
 
32
 
33
  This model was trained with SFT.
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "Qwen/Qwen2.5-VL-32B-Instruct",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
@@ -13,7 +13,7 @@
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
- "lora_alpha": 32,
17
  "lora_bias": false,
18
  "lora_dropout": 0.0,
19
  "megatron_config": null,
@@ -21,14 +21,15 @@
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
  "qalora_group_size": 16,
24
- "r": 32,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "q_proj",
29
- "v_proj",
30
  "o_proj",
31
- "k_proj"
 
 
32
  ],
33
  "target_parameters": null,
34
  "task_type": "CAUSAL_LM",
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "Qwen/Qwen2.5-VL-7B-Instruct",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
 
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
+ "lora_alpha": 64,
17
  "lora_bias": false,
18
  "lora_dropout": 0.0,
19
  "megatron_config": null,
 
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
  "qalora_group_size": 16,
24
+ "r": 64,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
+ "k_proj",
 
29
  "o_proj",
30
+ "qkv",
31
+ "v_proj",
32
+ "q_proj"
33
  ],
34
  "target_parameters": null,
35
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0d5da870d48a8f905b015d6e2efcd452a686163e847df272b3d891f39157a97
3
- size 268512816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d4c646c251e57b1c0db2d3dd76a524ed1dece3cc8d2031eedd7abcf5375836c
3
+ size 203466072
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db86ecd266c79166b251c06cf57c50214857fa4fe82b2bedb895efeb20ee9014
3
  size 5777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed701b2b37e1bca68597c2d604aee0f225b006e0ed7e46fcbd34bee44b9a8e60
3
  size 5777