harryrobert committed on
Commit
ee72508
·
verified ·
1 Parent(s): f045894

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +36 -20
config.json CHANGED
@@ -1,20 +1,36 @@
1
- {
2
- "architectures": [
3
- "Nav2TexDecoderModel"
4
- ],
5
- "bos_token_id": 0,
6
- "d_ff": 4096,
7
- "d_model": 1024,
8
- "dropout": 0.1,
9
- "dtype": "float32",
10
- "eos_token_id": 2,
11
- "lam_lambda": 0.1,
12
- "max_seq_len": 1024,
13
- "model_type": "nav2tex_decoder",
14
- "n_heads": 16,
15
- "n_layers": 8,
16
- "pad_token_id": 1,
17
- "squeeze_ratio": 4,
18
- "transformers_version": "4.57.3",
19
- "vocab_size": 50000
20
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "tokenizer_dir": "/workspace/nav2tex-decoder/tokenizer",
3
+ "vocab_size": 50000,
4
+ "pad_token_id": 1,
5
+ "bos_token_id": 0,
6
+ "eos_token_id": 2,
7
+ "data_glob": "/workspace/data/data/*.parquet",
8
+ "max_seq_len": 1024,
9
+ "cpe_score_threshold": 400,
10
+ "cpe_ratio": 0.25,
11
+ "d_model": 1024,
12
+ "n_heads": 16,
13
+ "n_layers": 8,
14
+ "d_ff": 4096,
15
+ "dropout": 0.1,
16
+ "squeeze_ratio": 4,
17
+ "lam_lambda": 0.1,
18
+ "batch_size": 16,
19
+ "grad_accum": 8,
20
+ "max_epochs": 10,
21
+ "warmup_steps": 2000,
22
+ "lr": 0.0001,
23
+ "weight_decay": 0.01,
24
+ "max_grad_norm": 1.0,
25
+ "label_smoothing": 0.1,
26
+ "save_dir": "/workspace/checkpoints",
27
+ "save_every_n_steps": 2000,
28
+ "log_every_n_steps": 100,
29
+ "num_workers": 8,
30
+ "prefetch_factor": 4,
31
+ "persistent_workers": true,
32
+ "cuda_benchmark": true,
33
+ "bf16": true,
34
+ "compile": true,
35
+ "flash_attn": false
36
+ }