Update config.json
Browse files- config.json +4 -5
config.json
CHANGED
|
@@ -67,7 +67,6 @@
|
|
| 67 |
"top_p": 1.0,
|
| 68 |
"torch_dtype": null,
|
| 69 |
"torchscript": false,
|
| 70 |
-
"transformers_version": "4.16.0.dev0",
|
| 71 |
"use_bfloat16": false,
|
| 72 |
"vocab_size": 256,
|
| 73 |
"use_attention_bias": false,
|
|
@@ -82,7 +81,7 @@
|
|
| 82 |
},
|
| 83 |
"text_config_dict": null,
|
| 84 |
"transformers_version": null,
|
| 85 |
-
"
|
| 86 |
"use_attention_bias": false,
|
| 87 |
"_name_or_path": "",
|
| 88 |
"add_cross_attention": false,
|
|
@@ -104,7 +103,7 @@
|
|
| 104 |
"forced_eos_token_id": null,
|
| 105 |
"hidden_act": "gelu",
|
| 106 |
"hidden_size": 768,
|
| 107 |
-
"
|
| 108 |
"initializer_factor": 1.0,
|
| 109 |
"initializer_range": 0.02,
|
| 110 |
"intermediate_size": 1536,
|
|
@@ -114,7 +113,7 @@
|
|
| 114 |
"length_penalty": 1.0,
|
| 115 |
"max_length": 20,
|
| 116 |
"min_length": 0,
|
| 117 |
-
"model_type": "
|
| 118 |
"no_repeat_ngram_size": 0,
|
| 119 |
"num_attention_heads": 12,
|
| 120 |
"num_beam_groups": 1,
|
|
@@ -154,5 +153,5 @@
|
|
| 154 |
"use_rotary_embedding": true,
|
| 155 |
"summary_type": "mean"
|
| 156 |
},
|
| 157 |
-
"
|
| 158 |
}
|
|
|
|
| 67 |
"top_p": 1.0,
|
| 68 |
"torch_dtype": null,
|
| 69 |
"torchscript": false,
|
|
|
|
| 70 |
"use_bfloat16": false,
|
| 71 |
"vocab_size": 256,
|
| 72 |
"use_attention_bias": false,
|
|
|
|
| 81 |
},
|
| 82 |
"text_config_dict": null,
|
| 83 |
"transformers_version": null,
|
| 84 |
+
"speech_config": {
|
| 85 |
"use_attention_bias": false,
|
| 86 |
"_name_or_path": "",
|
| 87 |
"add_cross_attention": false,
|
|
|
|
| 103 |
"forced_eos_token_id": null,
|
| 104 |
"hidden_act": "gelu",
|
| 105 |
"hidden_size": 768,
|
| 106 |
+
"vocab_size": 8192,
|
| 107 |
"initializer_factor": 1.0,
|
| 108 |
"initializer_range": 0.02,
|
| 109 |
"intermediate_size": 1536,
|
|
|
|
| 113 |
"length_penalty": 1.0,
|
| 114 |
"max_length": 20,
|
| 115 |
"min_length": 0,
|
| 116 |
+
"model_type": "clip_speech_model",
|
| 117 |
"no_repeat_ngram_size": 0,
|
| 118 |
"num_attention_heads": 12,
|
| 119 |
"num_beam_groups": 1,
|
|
|
|
| 153 |
"use_rotary_embedding": true,
|
| 154 |
"summary_type": "mean"
|
| 155 |
},
|
| 156 |
+
"speech_config_dict": null
|
| 157 |
}
|