Add lora_tuned_stage2

Browse files

Files changed (15) hide show

lora_tuned_stage2/checkpoint-15000/adapter_config.json +128 -0
lora_tuned_stage2/checkpoint-15000/adapter_model.safetensors +3 -0
lora_tuned_stage2/checkpoint-15000/generation_config.json +12 -0
lora_tuned_stage2/checkpoint-15000/optimizer.pt +3 -0
lora_tuned_stage2/checkpoint-15000/rng_state_0.pth +3 -0
lora_tuned_stage2/checkpoint-15000/rng_state_1.pth +3 -0
lora_tuned_stage2/checkpoint-15000/rng_state_2.pth +3 -0
lora_tuned_stage2/checkpoint-15000/rng_state_3.pth +3 -0
lora_tuned_stage2/checkpoint-15000/rng_state_4.pth +3 -0
lora_tuned_stage2/checkpoint-15000/rng_state_5.pth +3 -0
lora_tuned_stage2/checkpoint-15000/rng_state_6.pth +3 -0
lora_tuned_stage2/checkpoint-15000/rng_state_7.pth +3 -0
lora_tuned_stage2/checkpoint-15000/scheduler.pt +3 -0
lora_tuned_stage2/checkpoint-15000/trainer_state.json +0 -0
lora_tuned_stage2/checkpoint-15000/training_args.bin +3 -0

lora_tuned_stage2/checkpoint-15000/adapter_config.json ADDED Viewed

	@@ -0,0 +1,128 @@

+{
+  "alpha_pattern": {},
+  "auto_mapping": null,
+  "base_model_name_or_path": "/leonardo_scratch/large/userexternal/dbucciar/hf-cache/hf-cache/image_first_after15k_after_lvis_idefics",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": false,
+  "init_lora_weights": "gaussian",
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 16,
+  "lora_dropout": 0.1,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 64,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "text_model.layers.15.self_attn.k_proj",
+    "text_model.layers.19.self_attn.v_proj",
+    "text_model.layers.10.self_attn.k_proj",
+    "text_model.layers.7.self_attn.k_proj",
+    "text_model.layers.16.self_attn.q_proj",
+    "text_model.layers.16.self_attn.v_proj",
+    "30.self_attn.v_proj",
+    "text_model.layers.25.self_attn.q_proj",
+    "27.self_attn.k_proj",
+    "text_model.layers.26.self_attn.q_proj",
+    "text_model.layers.11.self_attn.v_proj",
+    "text_model.layers.20.self_attn.k_proj",
+    "text_model.layers.21.self_attn.v_proj",
+    "31.self_attn.v_proj",
+    "text_model.layers.0.self_attn.k_proj",
+    "gate_proj",
+    "text_model.layers.16.self_attn.k_proj",
+    "27.self_attn.v_proj",
+    "up_proj",
+    "text_model.layers.25.self_attn.v_proj",
+    "text_model.layers.23.self_attn.k_proj",
+    "text_model.layers.13.self_attn.v_proj",
+    "down_proj",
+    "text_model.layers.5.self_attn.k_proj",
+    "text_model.layers.24.self_attn.k_proj",
+    "text_model.layers.0.self_attn.v_proj",
+    "text_model.layers.14.self_attn.q_proj",
+    "text_model.layers.1.self_attn.k_proj",
+    "text_model.layers.15.self_attn.v_proj",
+    "text_model.layers.14.self_attn.k_proj",
+    "text_model.layers.17.self_attn.k_proj",
+    "text_model.layers.7.self_attn.q_proj",
+    "text_model.layers.8.self_attn.q_proj",
+    "text_model.layers.11.self_attn.k_proj",
+    "text_model.layers.3.self_attn.q_proj",
+    "text_model.layers.18.self_attn.v_proj",
+    "text_model.layers.19.self_attn.k_proj",
+    "28.self_attn.v_proj",
+    "text_model.layers.15.self_attn.q_proj",
+    "text_model.layers.9.self_attn.k_proj",
+    "text_model.layers.13.self_attn.k_proj",
+    "text_model.layers.20.self_attn.v_proj",
+    "text_model.layers.2.self_attn.q_proj",
+    "28.self_attn.k_proj",
+    "text_model.layers.1.self_attn.v_proj",
+    "29.self_attn.k_proj",
+    "text_model.layers.4.self_attn.k_proj",
+    "text_model.layers.9.self_attn.v_proj",
+    "text_model.layers.12.self_attn.v_proj",
+    "text_model.layers.17.self_attn.v_proj",
+    "text_model.layers.10.self_attn.q_proj",
+    "text_model.layers.22.self_attn.k_proj",
+    "text_model.layers.20.self_attn.q_proj",
+    "lm_head",
+    "text_model.layers.2.self_attn.v_proj",
+    "text_model.layers.1.self_attn.q_proj",
+    "text_model.layers.18.self_attn.q_proj",
+    "31.self_attn.q_proj",
+    "text_model.layers.6.self_attn.q_proj",
+    "text_model.layers.21.self_attn.k_proj",
+    "text_model.layers.4.self_attn.v_proj",
+    "text_model.layers.25.self_attn.k_proj",
+    "text_model.layers.19.self_attn.q_proj",
+    "text_model.layers.26.self_attn.k_proj",
+    "text_model.layers.8.self_attn.k_proj",
+    "30.self_attn.k_proj",
+    "text_model.layers.5.self_attn.v_proj",
+    "text_model.layers.8.self_attn.v_proj",
+    "27.self_attn.q_proj",
+    "text_model.layers.22.self_attn.v_proj",
+    "text_model.layers.0.self_attn.q_proj",
+    "text_model.layers.5.self_attn.q_proj",
+    "text_model.layers.3.self_attn.v_proj",
+    "text_model.layers.12.self_attn.q_proj",
+    "28.self_attn.q_proj",
+    "text_model.layers.10.self_attn.v_proj",
+    "text_model.layers.13.self_attn.q_proj",
+    "text_model.layers.6.self_attn.k_proj",
+    "31.self_attn.k_proj",
+    "text_model.layers.26.self_attn.v_proj",
+    "text_model.layers.7.self_attn.v_proj",
+    "text_model.layers.2.self_attn.k_proj",
+    "text_model.layers.11.self_attn.q_proj",
+    "text_model.layers.4.self_attn.q_proj",
+    "29.self_attn.v_proj",
+    "text_model.layers.6.self_attn.v_proj",
+    "30.self_attn.q_proj",
+    "text_model.layers.18.self_attn.k_proj",
+    "text_model.layers.23.self_attn.q_proj",
+    "text_model.layers.14.self_attn.v_proj",
+    "text_model.layers.23.self_attn.v_proj",
+    "text_model.layers.17.self_attn.q_proj",
+    "text_model.layers.22.self_attn.q_proj",
+    "29.self_attn.q_proj",
+    "o_proj",
+    "text_model.layers.21.self_attn.q_proj",
+    "text_model.layers.3.self_attn.k_proj",
+    "text_model.layers.9.self_attn.q_proj",
+    "text_model.layers.24.self_attn.v_proj",
+    "text_model.layers.12.self_attn.k_proj",
+    "text_model.layers.24.self_attn.q_proj"
+  ],
+  "task_type": null,
+  "use_dora": false,
+  "use_rslora": false
+}

lora_tuned_stage2/checkpoint-15000/adapter_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7728e2b6c308713c11c7329f6e349b2ef0acf5b00c3240924a4a6da40b855cd
+size 2806433816

lora_tuned_stage2/checkpoint-15000/generation_config.json ADDED Viewed

	@@ -0,0 +1,12 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 128000,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009,
+    128258
+  ],
+  "pad_token_id": 128002,
+  "transformers_version": "4.45.0.dev0"
+}

lora_tuned_stage2/checkpoint-15000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05fbd830c8460e35b06447efb5612286675b39ed7ee287f180a624fd728ffb6b
+size 358532508

lora_tuned_stage2/checkpoint-15000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a2280c4383b1248c16c14176cd46d34d73a0622be747d55a6c0513e3a602257
+size 14960

lora_tuned_stage2/checkpoint-15000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ce150bcd7185431ddc00a7d0e4fae3ce9876bb1fbcdacabac55cb1846ef6ea5
+size 14960

lora_tuned_stage2/checkpoint-15000/rng_state_2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1272852f12f33fd5ef0c2b9941732f49b8cbf938da3ea6369c52dc9c117148b5
+size 14960

lora_tuned_stage2/checkpoint-15000/rng_state_3.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:32a479173eac6fc419d1753d9a150fe9441bdc89e5fa687467cec12818bfbee4
+size 14960

lora_tuned_stage2/checkpoint-15000/rng_state_4.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9c1acd83f2ae1643b2ae86dee0266b9705b2988ede4f2fc770a10cd595c98ad4
+size 14960

lora_tuned_stage2/checkpoint-15000/rng_state_5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6406a687bc2bf0f1ddd4651fad2ca5a34e59249e3ac2c73e869a0bf93d98e490
+size 14960

lora_tuned_stage2/checkpoint-15000/rng_state_6.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:01de3fbea9accef82ed56957e195bf93c4028e5a1f28965a90ad69daf8be5784
+size 14960

lora_tuned_stage2/checkpoint-15000/rng_state_7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:044f815af22c4f30dd5b273290103876b269d4b80108b2a962b9aa096039f361
+size 14960

lora_tuned_stage2/checkpoint-15000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b122911694009e78ed7d779c4ad2f11d25db15e7f2ef6b691ef70915ee429ee3
+size 1064

lora_tuned_stage2/checkpoint-15000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

lora_tuned_stage2/checkpoint-15000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66db180e50c8e137b1bba960fbb542970431ee7e8a18d4bc45074381235c9e9e
+size 6072