Syclus committed on
Commit
6b27366
·
verified ·
1 Parent(s): fc5800e

Add model weights and config

Browse files
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "EncoderTuningModel"
4
+ ],
5
+ "audio_encoder_name": "models/flamingo_qwen/flamingo_qwen2_moe.py",
6
+ "audio_encoder_params": {
7
+ "adapter_dropout": 0.1,
8
+ "adapter_type": "adapter",
9
+ "cls_task_ids": "None",
10
+ "fusion_mode": "moe_swiglu",
11
+ "num_tasks": 12,
12
+ "qformer_d_model": 1024,
13
+ "qformer_drop_path": 0.05,
14
+ "qformer_dropout": 0.1,
15
+ "qformer_heads": 16,
16
+ "qformer_layers": 6,
17
+ "qformer_num_global_queries": 32,
18
+ "qformer_num_local_queries": 96,
19
+ "qformer_pool_stride": 4,
20
+ "task_cond": false
21
+ },
22
+ "decoder_type": "/private/models/SmolLM2-135M",
23
+ "dtype": "float32",
24
+ "lora_alpha": 32,
25
+ "lora_dropout": 0.1,
26
+ "lora_r": 8,
27
+ "lora_target_modules": "all-linear",
28
+ "model_type": "encoder_tuning_model",
29
+ "train_encoder_stage1": false,
30
+ "train_encoder_stage2": false,
31
+ "transformers_version": "5.0.0"
32
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58cdba58cbbb433638636d7ee285a5817a0eb1e8a2c326bcf72ab78128a61a01
3
+ size 4566938804
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6f4285566aa7fa8879e9e57ac989a653a0ee250ae77da7ad12e6cd41e9d6da2
3
+ size 952076899
rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3e19c3173ea0077e9906f713dfb1f845339ff71c9670e1da2d21de174358fef
3
+ size 15173
rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65f46c0156c915214baa7c2a9bb36ada5ccdf9b1477ec1302ed4c5478a263d48
3
+ size 15173
rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72f93b7d7bb9f4f091ad327548e1298a81a5b522ed043bafc49ef1878d38103f
3
+ size 15173
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f806da08112492605f4d8e7d6e09bb187437a32aede91141195cb859f425e5cc
3
+ size 1465
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:380b270c309cf5ec685afd1c3fffef0d6cd29ad88905df124818dd47324245bc
3
+ size 5329
training_stage.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"training_stage": "stage2"}