| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| """HyperCLOVAX-SEED Audio Encoder configuration.""" |
|
|
| from transformers import AutoConfig, PretrainedConfig |
|
|
|
|
class HyperCLOVAXSeedAudioEncoderConfig(PretrainedConfig):
    """Configuration for HyperCLOVAXSeedAudioEncoder wrapped as PreTrainedModel.

    Every constructor argument is stored verbatim as an attribute of the same
    name; ``d_model`` is additionally exposed as ``hidden_size``. The
    parameter descriptions below are inferred from the argument names only --
    the encoder that consumes them is not defined in this file, so confirm
    them against the model implementation.

    Args:
        d_model: Presumably the encoder hidden width. Defaults to 768.
        encoder_layers: Presumably the number of encoder layers.
            Defaults to 12.
        encoder_attention_heads: Presumably the number of attention heads
            per encoder layer. Defaults to 12.
        encoder_ffn_dim: Presumably the feed-forward inner dimension.
            Defaults to 3072.
        num_mel_bins: Presumably the number of mel bins in the input
            features. Defaults to 128.
        max_source_positions: Presumably the maximum number of input
            positions. Defaults to 1500.
        dropout: Presumably the general dropout probability.
            Defaults to 0.1.
        attention_dropout: Presumably the dropout probability applied to
            attention weights. Defaults to 0.1.
        pool_kernel_size: Presumably the kernel size of an output pooling
            step. Defaults to 5.
        pool_stride: Presumably the stride of that pooling step.
            Defaults to 5.
        **kwargs: Forwarded unchanged to ``PretrainedConfig.__init__``.
    """

    model_type = "hyperclovax_seed_audio_encoder"

    def __init__(
        self,
        d_model: int = 768,
        encoder_layers: int = 12,
        encoder_attention_heads: int = 12,
        encoder_ffn_dim: int = 3072,
        num_mel_bins: int = 128,
        max_source_positions: int = 1500,
        dropout: float = 0.1,
        attention_dropout: float = 0.1,
        pool_kernel_size: int = 5,
        pool_stride: int = 5,
        **kwargs,
    ) -> None:
        # Base-class initialisation runs first, so the explicit assignments
        # below take precedence over anything it sets from ``kwargs``.
        super().__init__(**kwargs)

        # Width: the same value is published under both names
        # (``d_model`` is assigned first, then ``hidden_size``).
        self.d_model = self.hidden_size = d_model

        # Encoder stack geometry.
        self.encoder_layers = encoder_layers
        self.encoder_attention_heads = encoder_attention_heads
        self.encoder_ffn_dim = encoder_ffn_dim

        # Input feature settings.
        self.num_mel_bins = num_mel_bins
        self.max_source_positions = max_source_positions

        # Regularisation.
        self.dropout = dropout
        self.attention_dropout = attention_dropout

        # Pooling settings.
        self.pool_kernel_size = pool_kernel_size
        self.pool_stride = pool_stride
|
|
|
|
# Register the config with AutoConfig under the class's own ``model_type``
# string, so the key and the class attribute cannot drift apart.
AutoConfig.register(
    HyperCLOVAXSeedAudioEncoderConfig.model_type,
    HyperCLOVAXSeedAudioEncoderConfig,
)


# Names exported by ``from <module> import *``.
__all__ = ["HyperCLOVAXSeedAudioEncoderConfig"]
|
|