RetrO21 committed on
Commit
3e4596e
·
verified ·
1 Parent(s): fd06e4d

Training in progress, epoch 1

Browse files
README.md CHANGED
@@ -35,9 +35,9 @@ This model was trained with SFT.
35
  ### Framework versions
36
 
37
  - TRL: 0.25.1
38
- - Transformers: 4.57.1
39
- - Pytorch: 2.8.0+cu126
40
- - Datasets: 4.0.0
41
  - Tokenizers: 0.22.1
42
 
43
  ## Citations
 
35
  ### Framework versions
36
 
37
  - TRL: 0.25.1
38
+ - Transformers: 4.57.3
39
+ - Pytorch: 2.9.1
40
+ - Datasets: 4.4.1
41
  - Tokenizers: 0.22.1
42
 
43
  ## Citations
adapter_config.json CHANGED
@@ -1,9 +1,12 @@
1
  {
 
2
  "alpha_pattern": {},
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "Qwen/Qwen2-VL-2B-Instruct",
5
  "bias": "none",
6
  "corda_config": null,
 
7
  "eva_config": null,
8
  "exclude_modules": null,
9
  "fan_in_fan_out": false,
@@ -13,20 +16,23 @@
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
- "lora_alpha": 16,
17
  "lora_bias": false,
18
  "lora_dropout": 0.1,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
 
23
  "qalora_group_size": 16,
24
  "r": 8,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
 
28
  "q_proj",
29
- "v_proj"
30
  ],
31
  "target_parameters": null,
32
  "task_type": "CAUSAL_LM",
 
1
  {
2
+ "alora_invocation_tokens": null,
3
  "alpha_pattern": {},
4
+ "arrow_config": null,
5
  "auto_mapping": null,
6
  "base_model_name_or_path": "Qwen/Qwen2-VL-2B-Instruct",
7
  "bias": "none",
8
  "corda_config": null,
9
+ "ensure_weight_tying": false,
10
  "eva_config": null,
11
  "exclude_modules": null,
12
  "fan_in_fan_out": false,
 
16
  "layers_pattern": null,
17
  "layers_to_transform": null,
18
  "loftq_config": {},
19
+ "lora_alpha": 32,
20
  "lora_bias": false,
21
  "lora_dropout": 0.1,
22
  "megatron_config": null,
23
  "megatron_core": "megatron.core",
24
  "modules_to_save": null,
25
  "peft_type": "LORA",
26
+ "peft_version": "0.18.0",
27
  "qalora_group_size": 16,
28
  "r": 8,
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
+ "k_proj",
33
+ "v_proj",
34
  "q_proj",
35
+ "o_proj"
36
  ],
37
  "target_parameters": null,
38
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c61e6c26341379c2e665c23fbce3359df5e996d418ef431e723615acb1eae63
3
- size 4374520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:740c85a1250aac945091b2cfb960cfcd7fd3003f1f4c6e4ca13bcd9337e543f3
3
+ size 8749064
preprocessor_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": null,
3
+ "data_format": "channels_first",
4
+ "default_to_square": true,
5
+ "device": null,
6
+ "disable_grouping": null,
7
+ "do_center_crop": null,
8
+ "do_convert_rgb": true,
9
+ "do_normalize": true,
10
+ "do_pad": null,
11
+ "do_rescale": true,
12
+ "do_resize": true,
13
+ "image_mean": [
14
+ 0.48145466,
15
+ 0.4578275,
16
+ 0.40821073
17
+ ],
18
+ "image_processor_type": "Qwen2VLImageProcessorFast",
19
+ "image_std": [
20
+ 0.26862954,
21
+ 0.26130258,
22
+ 0.27577711
23
+ ],
24
+ "input_data_format": null,
25
+ "max_pixels": 12845056,
26
+ "merge_size": 2,
27
+ "min_pixels": 3136,
28
+ "pad_size": null,
29
+ "patch_size": 14,
30
+ "processor_class": "Qwen2VLProcessor",
31
+ "resample": 3,
32
+ "rescale_factor": 0.00392156862745098,
33
+ "return_tensors": null,
34
+ "size": {
35
+ "longest_edge": 12845056,
36
+ "shortest_edge": 3136
37
+ },
38
+ "temporal_patch_size": 2
39
+ }
runs/Dec01_04-29-02_132-145-133-63/events.out.tfevents.1764563546.132-145-133-63.4719.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5819686e8311fb87d76a330e9f3cbd7cb0e04deb1ec5f7edfea1d7ea14edaf73
3
+ size 12568
runs/Nov27_09-05-25_158-101-122-208/events.out.tfevents.1764234417.158-101-122-208.1760.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:934a3c1a698a294a75a7fdd6e047500c42e3d5721783295080e999c7b412e51e
3
+ size 77720
runs/Nov28_05-39-54_129-213-22-251/events.out.tfevents.1764308482.129-213-22-251.1635.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb92b31906b59c0acd32f14c586f7164f067b2b5da4da7016fe51f881ecc820d
3
+ size 20208
runs/Nov28_05-59-12_129-213-22-251/events.out.tfevents.1764309630.129-213-22-251.1635.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f6e595faf6b87acdd921963a4c3346a24399621c9ccd5e9fee4c12d1cc72afb
3
+ size 36116
runs/Nov28_07-06-58_129-213-22-251/events.out.tfevents.1764313877.129-213-22-251.1635.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3699e4ad00e96f64f617f41c1c3f903e3bfea725a00546aec43c18e2514ccb8
3
+ size 8331
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ecce47d18bf4423b0687b472437a5fa1c72cae786aabf42ba0600354efbcca9e
3
  size 6225
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1adcf89e2ce7be508f245e87af0fd5d93d0d2e7562c07049b800c8d5a6b1822e
3
  size 6225
video_preprocessor_config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": null,
3
+ "data_format": "channels_first",
4
+ "default_to_square": true,
5
+ "device": null,
6
+ "do_center_crop": null,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "do_sample_frames": false,
12
+ "fps": null,
13
+ "image_mean": [
14
+ 0.48145466,
15
+ 0.4578275,
16
+ 0.40821073
17
+ ],
18
+ "image_std": [
19
+ 0.26862954,
20
+ 0.26130258,
21
+ 0.27577711
22
+ ],
23
+ "input_data_format": null,
24
+ "max_frames": 768,
25
+ "max_pixels": 12845056,
26
+ "merge_size": 2,
27
+ "min_frames": 4,
28
+ "min_pixels": 3136,
29
+ "num_frames": null,
30
+ "pad_size": null,
31
+ "patch_size": 14,
32
+ "processor_class": "Qwen2VLProcessor",
33
+ "resample": 3,
34
+ "rescale_factor": 0.00392156862745098,
35
+ "return_metadata": false,
36
+ "size": {
37
+ "longest_edge": 12845056,
38
+ "shortest_edge": 3136
39
+ },
40
+ "temporal_patch_size": 2,
41
+ "video_metadata": null,
42
+ "video_processor_type": "Qwen2VLVideoProcessor"
43
+ }