mazesmazes committed on
Commit
d0f55fa
·
verified ·
1 Parent(s): fb9a105

Training in progress, step 500

Browse files
adapter_config.json CHANGED
@@ -29,8 +29,8 @@
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
- "v_proj",
33
- "q_proj"
34
  ],
35
  "target_parameters": null,
36
  "task_type": "CAUSAL_LM",
 
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
+ "q_proj",
33
+ "v_proj"
34
  ],
35
  "target_parameters": null,
36
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a56130d6532b2b6b1a599abd432ca717602cbd16355136d12768dbf5f21692ea
3
  size 36715216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d18a0b9c1a132992b5942c61c13e41c96c52fc3a5f135f8589cc2f6c35b22fd
3
  size 36715216
config.json CHANGED
@@ -156,12 +156,12 @@
156
  ]
157
  ],
158
  "encoder_dim": 1280,
159
- "freeze_projector": true,
160
  "inference_warmup_tokens": 10,
161
  "label_smoothing": 0.0,
162
  "length_penalty": 1.0,
163
  "llm_dim": 1024,
164
- "lora_alpha": 128,
165
  "lora_dropout": 0.0,
166
  "lora_rank": 64,
167
  "lora_target_modules": [
 
156
  ]
157
  ],
158
  "encoder_dim": 1280,
159
+ "freeze_projector": false,
160
  "inference_warmup_tokens": 10,
161
  "label_smoothing": 0.0,
162
  "length_penalty": 1.0,
163
  "llm_dim": 1024,
164
+ "lora_alpha": 32,
165
  "lora_dropout": 0.0,
166
  "lora_rank": 64,
167
  "lora_target_modules": [
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc863480c4f2381e8cd274660102146566c7f2e38bde8a8f3e267c9361b62856
3
  size 25172384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c6e83c3b9a3fd36727fc676cbae32a1a386efad5f24cc085500fabd26eca7cf
3
  size 25172384
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50389fcf6939a2d04fa7fb7e239f98f27e46ad21c06f320b15fb023f3550c88d
3
  size 5201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57e9882a79d3171d1aeea43287b622c738071f7c789fce0847f6c51496e3e3e6
3
  size 5201