Bingsu committed on
Commit
be19eec
·
verified ·
1 Parent(s): f60e610

Delete configuration_hyperclovax.py

Browse files
Files changed (1) hide show
  1. configuration_hyperclovax.py +0 -60
configuration_hyperclovax.py DELETED
@@ -1,60 +0,0 @@
1
- from transformers.configuration_utils import PretrainedConfig
2
- from transformers.utils import logging
3
-
4
- logger = logging.get_logger(__name__)
5
-
6
-
7
- class HCXVisionConfig(PretrainedConfig):
8
- model_type = "hyperclovax_vlm"
9
- keys_to_ignore_at_inference = ["past_key_values"]
10
-
11
- # GPT-2-style language configs use different attribute names, so map them to the standard names.
12
- language_config_attribute_map = {
13
- "n_embd": "hidden_size",
14
- "n_positions": "max_position_embeddings",
15
- "n_head": "num_attention_heads",
16
- "n_layer": "num_hidden_layers",
17
- }
18
-
19
- def __init__(
20
- self,
21
- language_config=None,
22
- vision_config=None,
23
- use_nth_layer=-2,
24
- img_start_id=100009, # <|dummy3|>
25
- decoder_max_length=4096,
26
- anyres=False,
27
- unpad=False,
28
- max_num_grids=-1,
29
- num_queries_vis_abstractor=-1,
30
- ignore_index=-100,
31
- proj_pos_emb=True,
32
- proj_prenorm=False,
33
- use_1x1_grid=False,
34
- **kwargs,
35
- ):
36
- for key, val in self.language_config_attribute_map.items():
37
- if language_config is not None and key in language_config:
38
- language_config[val] = language_config.pop(key)
39
-
40
- self.language_config = language_config
41
- self.vision_config = vision_config
42
-
43
- if language_config is not None:
44
- # In DeepSpeed ZeRO-3, the memory size is automatically determined based on the `hidden_size` specified in the config.
45
- self.hidden_size = (
46
- language_config["hidden_size"] if "hidden_size" in language_config else language_config["n_embd"]
47
- )
48
- # add VLM configs
49
- self.use_nth_layer = use_nth_layer
50
- self.decoder_max_length = decoder_max_length
51
- self.anyres = anyres
52
- self.unpad = unpad
53
- self.max_num_grids = max_num_grids
54
- self.num_queries_vis_abstractor = num_queries_vis_abstractor
55
- self.img_start_id = img_start_id
56
- self.ignore_index = ignore_index
57
- self.proj_pos_emb = proj_pos_emb
58
- self.proj_prenorm = proj_prenorm
59
- self.use_1x1_grid = use_1x1_grid
60
- super().__init__(**kwargs)