{ "vocab_size": 10303, "pad_token_id": 0, "mf_start_token_id": 1, "mf_end_token_id": 2, "bp_start_token_id": 3, "bp_end_token_id": 4, "cc_start_token_id": 5, "cc_end_token_id": 6, "organism_vocab_size": 201, "embed_model_type": "esm2", "max_protein_length": 1024, "vocab_config": { "MF": { "method": "min_freq", "value": 20 }, "BP": { "method": "min_freq", "value": 20 }, "CC": { "method": "min_freq", "value": 20 } }, "vocab_stats": { "MF": { "method": "min_freq", "threshold": 20, "selected": 1537, "freq_range": [ 20, 73296 ], "total_terms": 7183 }, "BP": { "method": "min_freq", "threshold": 20, "selected": 7720, "freq_range": [ 20, 81287 ], "total_terms": 21200 }, "CC": { "method": "min_freq", "threshold": 20, "selected": 1039, "freq_range": [ 20, 84240 ], "total_terms": 2939 } } }