| | |
| | from transformers import PretrainedConfig |
| |
|
| |
|
class DownsamplerConfig(PretrainedConfig):
    """Configuration container for the ``'downsampler'`` model type.

    The constructor records its named arguments as instance attributes
    and hands every remaining keyword argument to
    ``PretrainedConfig.__init__``.

    Args:
        kernel_size: Stored as ``self.kernel_size``. Presumably the
            kernel size of the downsampling layer -- confirm against
            the model implementation.
        stride: Stored as ``self.stride``. Presumably the stride of the
            downsampling layer -- confirm against the model
            implementation.
        visual_hidden_size: Stored as ``self.visual_hidden_size``.
            Presumably the feature width on the vision side -- TODO
            confirm.
        llm_hidden_size: Stored as ``self.llm_hidden_size``. Presumably
            the feature width expected by the language model -- TODO
            confirm.
        depth: Stored as ``self.depth``. Presumably the number of
            stacked layers -- TODO confirm.
        hidden_act: Stored as ``self.hidden_act``. Presumably the name
            of the activation function -- TODO confirm.
        bias: Stored as ``self.bias``. Presumably toggles bias terms in
            the model's layers -- TODO confirm.
        **kwargs: Forwarded unchanged to ``PretrainedConfig.__init__``.
    """

    # Class-level identifiers; their exact use is defined by
    # `PretrainedConfig`, not by this file.
    model_type = 'downsampler'
    _auto_class = 'AutoConfig'

    def __init__(
        self,
        kernel_size=1,
        stride=1,
        visual_hidden_size=4096,
        llm_hidden_size=4096,
        depth=2,
        hidden_act='gelu',
        bias=False,
        **kwargs,
    ):
        # Feature widths on either side of the module.
        self.visual_hidden_size = visual_hidden_size
        self.llm_hidden_size = llm_hidden_size

        # Layer-stack settings.
        self.depth = depth
        self.hidden_act = hidden_act
        self.bias = bias

        # Downsampling window settings.
        self.kernel_size = kernel_size
        self.stride = stride

        # The parent initializer runs last, after the attributes above
        # have been set, and consumes whatever keyword arguments remain.
        super().__init__(**kwargs)
| |
|