nav2tex-decoder / config.json
harryrobert's picture
Upload config.json with huggingface_hub
ee72508 verified
raw
history blame contribute delete
829 Bytes
{
"tokenizer_dir": "/workspace/nav2tex-decoder/tokenizer",
"vocab_size": 50000,
"pad_token_id": 1,
"bos_token_id": 0,
"eos_token_id": 2,
"data_glob": "/workspace/data/data/*.parquet",
"max_seq_len": 1024,
"cpe_score_threshold": 400,
"cpe_ratio": 0.25,
"d_model": 1024,
"n_heads": 16,
"n_layers": 8,
"d_ff": 4096,
"dropout": 0.1,
"squeeze_ratio": 4,
"lam_lambda": 0.1,
"batch_size": 16,
"grad_accum": 8,
"max_epochs": 10,
"warmup_steps": 2000,
"lr": 0.0001,
"weight_decay": 0.01,
"max_grad_norm": 1.0,
"label_smoothing": 0.1,
"save_dir": "/workspace/checkpoints",
"save_every_n_steps": 2000,
"log_every_n_steps": 100,
"num_workers": 8,
"prefetch_factor": 4,
"persistent_workers": true,
"cuda_benchmark": true,
"bf16": true,
"compile": true,
"flash_attn": false
}