vqprot-tiny / config.json
khairi's picture
Training checkpoint — step 500
4cbc0e0 verified
{
"architectures": [
"VQProtV1"
],
"batch_size": 8,
"beta": 2.1,
"bucket_size": 16,
"d_model": 256,
"debug": true,
"dropout_rate": 0.1,
"esm_d_model": 320,
"esm_model_name": "facebook/esm2_t6_8M_UR50D",
"hidden_size": 256,
"intermediate_size": 768,
"mask_token_id": 32,
"max_seq_len": 258,
"model_type": "vqprot",
"n_decoder_layers": 4,
"n_encoder_layers": 6,
"name": "vqprot_v1",
"norm_eps": 1e-06,
"num_codes": 64,
"num_codes_min_usage": 0.5,
"num_codes_reset_interval": 100,
"num_heads": 4,
"num_kv_heads": 4,
"position_emb_theta": 10000.0,
"torch_dtype": "float32",
"transformers_version": "4.48.3",
"vocab_size": 33
}