# omar-rq-multicodebook / config.gin
# p-alonso's picture
# Update config.gin to keep required params only with explicit names
# cbdcbab verified
# Parameters for build_module:
# ==============================================================================
# Top-level wiring: names the checkpoint file and the three configurables
# (module, net, representation) handed to omar_rq.utils.build_module.
# Values prefixed with `@` are gin configurable references; without a trailing
# `()` the reference itself is passed rather than the result of calling it.
# NOTE(review): 'model.ckpt' is a relative path; which directory it is resolved
# against is decided by the loading code, not by this file -- confirm.
omar_rq.utils.build_module.ckpt_path = 'model.ckpt'
omar_rq.utils.build_module.module = @omar_rq.modules.maskingmodel.MaskingModel
omar_rq.utils.build_module.net = @omar_rq.nets.conformer.Conformer
omar_rq.utils.build_module.representation = @omar_rq.nets.melspectrogram.MelSpectrogram
# Parameters for omar_rq.nets.conformer.Conformer:
# ==============================================================================
# Constructor bindings for the Conformer configurable, which is the class
# referenced by omar_rq.utils.build_module.net in this file.
# NOTE(review): these values presumably have to match the architecture stored in
# the checkpoint named by build_module.ckpt_path -- confirm before editing any.
# NOTE(review): alpha_deepnorm equals (2 * depth) ** 0.25 for depth = 24, so it
# was presumably derived from depth and should change together with it -- confirm.
omar_rq.nets.conformer.Conformer.alpha_deepnorm = 2.6321480259049848
omar_rq.nets.conformer.Conformer.beta_deepnorm = 0.022386873579657126
omar_rq.nets.conformer.Conformer.conv_kernel_size = 5
omar_rq.nets.conformer.Conformer.depth = 24
omar_rq.nets.conformer.Conformer.dropout = 0.2
omar_rq.nets.conformer.Conformer.embed_dim = 1024
omar_rq.nets.conformer.Conformer.input_dropout = 0.0
omar_rq.nets.conformer.Conformer.mlp_ratio = 4.0
omar_rq.nets.conformer.Conformer.mlp_residual_factor = 4.0
omar_rq.nets.conformer.Conformer.num_heads = 8
# NOTE(review): patch_size is None while num_patches is fixed at 460; how the
# network treats an unset patch size is not visible from this file -- confirm.
omar_rq.nets.conformer.Conformer.num_patches = 460
omar_rq.nets.conformer.Conformer.patch_size = None
omar_rq.nets.conformer.Conformer.use_deepnorm = True
omar_rq.nets.conformer.Conformer.use_rope = True
# Parameters for omar_rq.modules.maskingmodel.MaskingModel:
# ==============================================================================
# Constructor bindings for the MaskingModel configurable, which is the class
# referenced by omar_rq.utils.build_module.module in this file.
# Quantizer setup: 4 codebooks ('random_codebook' type), each bound to
# codebook_size = 8192 and codebook_dim = 16.
omar_rq.modules.maskingmodel.MaskingModel.codebook_dim = 16
omar_rq.modules.maskingmodel.MaskingModel.codebook_size = 8192
omar_rq.modules.maskingmodel.MaskingModel.diff_input = False
# NOTE(review): input_representation is None here although
# build_module.representation is bound to MelSpectrogram; presumably
# build_module supplies the representation itself -- confirm.
omar_rq.modules.maskingmodel.MaskingModel.input_representation = None
# NOTE(review): lr and weight_decay look like optimizer settings that only
# matter when training, not when loading the checkpoint for inference -- confirm.
omar_rq.modules.maskingmodel.MaskingModel.lr = 0.0001
# NOTE(review): presumably mask_prob is a masking probability and mask_seconds a
# mask span length in seconds; units are not stated in this file -- confirm.
omar_rq.modules.maskingmodel.MaskingModel.mask_prob = 0.6
omar_rq.modules.maskingmodel.MaskingModel.mask_seconds = 0.4
omar_rq.modules.maskingmodel.MaskingModel.masking_noise_type = 'random_normal'
omar_rq.modules.maskingmodel.MaskingModel.num_codebooks = 4
omar_rq.modules.maskingmodel.MaskingModel.plot_tokens = False
omar_rq.modules.maskingmodel.MaskingModel.quantizer_type = 'random_codebook'
# NOTE(review): with quantizer_type = 'random_codebook' the seed presumably
# fixes the randomly initialised codebooks, so changing it would change the
# token targets -- confirm.
omar_rq.modules.maskingmodel.MaskingModel.seed = 0
omar_rq.modules.maskingmodel.MaskingModel.weight_decay = 0.01
# Parameters for omar_rq.nets.melspectrogram.MelSpectrogram:
# ==============================================================================
# Constructor bindings for the MelSpectrogram configurable, which is the class
# referenced by omar_rq.utils.build_module.representation in this file.
# NOTE(review): freq_mask_param = 0 and time_mask_param = 0 presumably disable
# frequency/time masking augmentation -- confirm.
omar_rq.nets.melspectrogram.MelSpectrogram.freq_mask_param = 0
# NOTE(review): assuming sr is in Hz and hop_len / win_len are in samples,
# hop_len = 256 at sr = 16000 gives 62.5 frames per second and win_len = 512
# is a 32 ms window -- confirm units.
omar_rq.nets.melspectrogram.MelSpectrogram.hop_len = 256
omar_rq.nets.melspectrogram.MelSpectrogram.mel_scale = 'slaney'
omar_rq.nets.melspectrogram.MelSpectrogram.n_mel = 96
omar_rq.nets.melspectrogram.MelSpectrogram.norm = 'slaney'
# NOTE(review): norm_mean / norm_std look like precomputed dataset statistics
# used to standardise the spectrogram; where they are applied is not visible
# from this file -- confirm.
omar_rq.nets.melspectrogram.MelSpectrogram.norm_mean = 2.06755686098554
omar_rq.nets.melspectrogram.MelSpectrogram.norm_std = 1.268292820667291
omar_rq.nets.melspectrogram.MelSpectrogram.power = 2
omar_rq.nets.melspectrogram.MelSpectrogram.sr = 16000
# NOTE(review): stretch_factor = 1 presumably means no time stretching -- confirm.
omar_rq.nets.melspectrogram.MelSpectrogram.stretch_factor = 1
omar_rq.nets.melspectrogram.MelSpectrogram.time_mask_param = 0
omar_rq.nets.melspectrogram.MelSpectrogram.win_len = 512