Alexhu1999 committed on
Commit
7d7a284
·
verified ·
1 Parent(s): f19ea7d

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -1,53 +1,7 @@
1
  {
2
  "architectures": [
3
- "Gemma3nForConditionalGeneration"
4
  ],
5
- "audio_config": {
6
- "conf_attention_chunk_size": 12,
7
- "conf_attention_context_left": 13,
8
- "conf_attention_context_right": 0,
9
- "conf_attention_logit_cap": 50.0,
10
- "conf_conv_kernel_size": 5,
11
- "conf_num_attention_heads": 8,
12
- "conf_num_hidden_layers": 12,
13
- "conf_reduction_factor": 4,
14
- "conf_residual_weight": 0.5,
15
- "gradient_clipping": 10000000000.0,
16
- "hidden_size": 1536,
17
- "input_feat_size": 128,
18
- "model_type": "gemma3n_audio",
19
- "rms_norm_eps": 1e-06,
20
- "sscp_conv_channel_size": [
21
- 128,
22
- 32
23
- ],
24
- "sscp_conv_group_norm_eps": 0.001,
25
- "sscp_conv_kernel_size": [
26
- [
27
- 3,
28
- 3
29
- ],
30
- [
31
- 3,
32
- 3
33
- ]
34
- ],
35
- "sscp_conv_stride_size": [
36
- [
37
- 2,
38
- 2
39
- ],
40
- [
41
- 2,
42
- 2
43
- ]
44
- ],
45
- "torch_dtype": "float32",
46
- "vocab_offset": 262272,
47
- "vocab_size": 128
48
- },
49
- "audio_soft_tokens_per_image": 188,
50
- "audio_token_id": 262273,
51
  "boa_token_id": 256000,
52
  "boi_token": "<start_of_image>",
53
  "boi_token_id": 64401,
@@ -111,13 +65,13 @@
111
  "num_hidden_layers": 16,
112
  "num_key_value_heads": 8,
113
  "rope_theta": 1000000.0,
114
- "torch_dtype": "float32",
115
  "use_cache": true,
116
  "use_pos_enc": true,
117
  "vocab_size": 64403
118
  },
119
- "torch_dtype": "float32",
120
- "transformers_version": "4.54.1",
121
  "use_cache": true,
122
  "vision_config": {
123
  "architecture": "mobilenetv5_300m_enc",
@@ -129,10 +83,10 @@
129
  "LABEL_1"
130
  ],
131
  "model_args": null,
132
- "model_type": "gemma3n_vision",
133
  "num_classes": 2,
134
  "rms_norm_eps": 1e-06,
135
- "torch_dtype": "float32",
136
  "vocab_offset": 262144,
137
  "vocab_size": 128
138
  },
 
1
  {
2
  "architectures": [
3
+ "Lfm2vlForConditionalGeneration"
4
  ],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "boa_token_id": 256000,
6
  "boi_token": "<start_of_image>",
7
  "boi_token_id": 64401,
 
65
  "num_hidden_layers": 16,
66
  "num_key_value_heads": 8,
67
  "rope_theta": 1000000.0,
68
+ "torch_dtype": "bfloat16",
69
  "use_cache": true,
70
  "use_pos_enc": true,
71
  "vocab_size": 64403
72
  },
73
+ "torch_dtype": "bfloat16",
74
+ "transformers_version": "4.54.0",
75
  "use_cache": true,
76
  "vision_config": {
77
  "architecture": "mobilenetv5_300m_enc",
 
83
  "LABEL_1"
84
  ],
85
  "model_args": null,
86
+ "model_type": "lfm2_vision",
87
  "num_classes": 2,
88
  "rms_norm_eps": 1e-06,
89
+ "torch_dtype": "bfloat16",
90
  "vocab_offset": 262144,
91
  "vocab_size": 128
92
  },
generation_config.json CHANGED
@@ -9,5 +9,5 @@
9
  "pad_token_id": 0,
10
  "top_k": 64,
11
  "top_p": 0.95,
12
- "transformers_version": "4.54.1"
13
  }
 
9
  "pad_token_id": 0,
10
  "top_k": 64,
11
  "top_p": 0.95,
12
+ "transformers_version": "4.54.0"
13
  }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b0db5e62e2880b680572af2894587b8c059f7e08199735e420ca2f34ce294fc
3
+ size 2933310216
preprocessor_config.json CHANGED
@@ -39,7 +39,6 @@
39
  "preemphasis": 0.97,
40
  "preemphasis_htk_flavor": true,
41
  "processor_class": "Lfm2vlProcessor",
42
- "feature_extractor_type": "Lfm2vlAudioFeatureExtractor",
43
  "resample": 2,
44
  "rescale_factor": 0.00392156862745098,
45
  "return_attention_mask": true,
 
39
  "preemphasis": 0.97,
40
  "preemphasis_htk_flavor": true,
41
  "processor_class": "Lfm2vlProcessor",
 
42
  "resample": 2,
43
  "rescale_factor": 0.00392156862745098,
44
  "return_attention_mask": true,
special_tokens_map.json CHANGED
@@ -1,26 +1,8 @@
1
  {
2
  "additional_special_tokens": [
3
- {
4
- "content": "<image_soft_token>",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false
9
- },
10
- {
11
- "content": "<start_of_image>",
12
- "lstrip": false,
13
- "normalized": false,
14
- "rstrip": false,
15
- "single_word": false
16
- },
17
- {
18
- "content": "<end_of_image>",
19
- "lstrip": false,
20
- "normalized": false,
21
- "rstrip": false,
22
- "single_word": false
23
- }
24
  ],
25
  "bos_token": {
26
  "content": "<|startoftext|>",
 
1
  {
2
  "additional_special_tokens": [
3
+ "<image_soft_token>",
4
+ "<start_of_image>",
5
+ "<end_of_image>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  ],
7
  "bos_token": {
8
  "content": "<|startoftext|>",
tokenizer_config.json CHANGED
@@ -4092,6 +4092,7 @@
4092
  "clean_up_tokenization_spaces": true,
4093
  "eos_token": "<|im_end|>",
4094
  "extra_special_tokens": {},
 
4095
  "legacy": false,
4096
  "model_max_length": 1000000000000000019884624838656,
4097
  "pad_token": "<|pad|>",
@@ -4102,6 +4103,5 @@
4102
  "tokenizer_class": "PreTrainedTokenizerFast",
4103
  "truncation": "do_not_truncate",
4104
  "use_default_system_prompt": false,
4105
- "use_fast": true,
4106
- "image_token_id": "64400"
4107
  }
 
4092
  "clean_up_tokenization_spaces": true,
4093
  "eos_token": "<|im_end|>",
4094
  "extra_special_tokens": {},
4095
+ "image_token_id": 64400,
4096
  "legacy": false,
4097
  "model_max_length": 1000000000000000019884624838656,
4098
  "pad_token": "<|pad|>",
 
4103
  "tokenizer_class": "PreTrainedTokenizerFast",
4104
  "truncation": "do_not_truncate",
4105
  "use_default_system_prompt": false,
4106
+ "use_fast": true
 
4107
  }