{
  "tokenizer_dir": "/workspace/nav2tex-decoder/tokenizer",
  "vocab_size": 50000,
  "pad_token_id": 1,
  "bos_token_id": 0,
  "eos_token_id": 2,
  "data_glob": "/workspace/data/data/*.parquet",
  "max_seq_len": 1024,
  "cpe_score_threshold": 400,
  "cpe_ratio": 0.25,
  "d_model": 1024,
  "n_heads": 16,
  "n_layers": 8,
  "d_ff": 4096,
  "dropout": 0.1,
  "squeeze_ratio": 4,
  "lam_lambda": 0.1,
  "batch_size": 16,
  "grad_accum": 8,
  "max_epochs": 10,
  "warmup_steps": 2000,
  "lr": 0.0001,
  "weight_decay": 0.01,
  "max_grad_norm": 1.0,
  "label_smoothing": 0.1,
  "save_dir": "/workspace/checkpoints",
  "save_every_n_steps": 2000,
  "log_every_n_steps": 100,
  "num_workers": 8,
  "prefetch_factor": 4,
  "persistent_workers": true,
  "cuda_benchmark": true,
  "bf16": true,
  "compile": true,
  "flash_attn": false
}