Update config.json
Browse files
Rename clip -> clip_vip and Clip to ClipViP
- config.json +4 -4
config.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
| 2 |
"architectures": [
|
| 3 |
-
"CLIPModel"
|
| 4 |
],
|
| 5 |
"initializer_factor": 1.0,
|
| 6 |
"logit_scale_init_value": 2.6592,
|
| 7 |
-
"model_type": "clip",
|
| 8 |
"projection_dim": 512,
|
| 9 |
"text_config": {
|
| 10 |
"_name_or_path": "",
|
|
@@ -44,7 +44,7 @@
|
|
| 44 |
"max_length": 20,
|
| 45 |
"max_position_embeddings": 77,
|
| 46 |
"min_length": 0,
|
| 47 |
-
"model_type": "clip_text_model",
|
| 48 |
"no_repeat_ngram_size": 0,
|
| 49 |
"num_attention_heads": 8,
|
| 50 |
"num_beam_groups": 1,
|
|
@@ -120,7 +120,7 @@
|
|
| 120 |
"logit_scale_init_value": 4.60,
|
| 121 |
"max_length": 20,
|
| 122 |
"min_length": 0,
|
| 123 |
-
"model_type": "clip_vision_model",
|
| 124 |
"no_repeat_ngram_size": 0,
|
| 125 |
"num_attention_heads": 12,
|
| 126 |
"num_beam_groups": 1,
|
|
|
|
| 1 |
{
|
| 2 |
"architectures": [
|
| 3 |
+
"CLIPViPModel"
|
| 4 |
],
|
| 5 |
"initializer_factor": 1.0,
|
| 6 |
"logit_scale_init_value": 2.6592,
|
| 7 |
+
"model_type": "clip_vip",
|
| 8 |
"projection_dim": 512,
|
| 9 |
"text_config": {
|
| 10 |
"_name_or_path": "",
|
|
|
|
| 44 |
"max_length": 20,
|
| 45 |
"max_position_embeddings": 77,
|
| 46 |
"min_length": 0,
|
| 47 |
+
"model_type": "clip_vip_text_model",
|
| 48 |
"no_repeat_ngram_size": 0,
|
| 49 |
"num_attention_heads": 8,
|
| 50 |
"num_beam_groups": 1,
|
|
|
|
| 120 |
"logit_scale_init_value": 4.60,
|
| 121 |
"max_length": 20,
|
| 122 |
"min_length": 0,
|
| 123 |
+
"model_type": "clip_vip_vision_model",
|
| 124 |
"no_repeat_ngram_size": 0,
|
| 125 |
"num_attention_heads": 12,
|
| 126 |
"num_beam_groups": 1,
|