levossadtchi committed on
Commit
3f6fdf8
·
verified ·
1 Parent(s): 7f06cc6

Delete configs/.ipynb_checkpoints

Browse files
configs/.ipynb_checkpoints/pretrain_5090_stage1-checkpoint.json DELETED
@@ -1,27 +0,0 @@
1
- {
2
- "seed": 42,
3
- "train_dir": "data/pretokenized/train",
4
- "val_dir": "data/pretokenized/val",
5
- "output_dir": "outputs/pretrain_stage1",
6
- "checkpoint_dir": "checkpoints/pretrain_stage1",
7
- "init_from": null,
8
- "resume_from": null,
9
- "seq_len": 2048,
10
- "micro_batch_size": 8,
11
- "grad_accum_steps": 32,
12
- "max_steps": 20000,
13
- "warmup_steps": 2000,
14
- "learning_rate": 0.003,
15
- "min_lr": 0.0003,
16
- "weight_decay": 0.1,
17
- "beta1": 0.9,
18
- "beta2": 0.95,
19
- "grad_clip": 1.0,
20
- "precision": "bf16",
21
- "num_workers": 0,
22
- "log_interval": 10,
23
- "eval_interval": 250,
24
- "eval_batches": 50,
25
- "save_interval": 100,
26
- "compile_model": false
27
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
configs/.ipynb_checkpoints/pretrain_5090_stage2_anneal-checkpoint.json DELETED
@@ -1,27 +0,0 @@
1
- {
2
- "seed": 42,
3
- "train_dir": "data/pretokenized/train",
4
- "val_dir": "data/pretokenized/val",
5
- "output_dir": "outputs/pretrain_stage2",
6
- "checkpoint_dir": "checkpoints/pretrain_stage2",
7
- "init_from": "checkpoints/pretrain_stage1/last.pt",
8
- "resume_from": null,
9
- "seq_len": 8192,
10
- "micro_batch_size": 2,
11
- "grad_accum_steps": 16,
12
- "max_steps": 1000,
13
- "warmup_steps": 100,
14
- "learning_rate": 0.001,
15
- "min_lr": 0.0001,
16
- "weight_decay": 0.1,
17
- "beta1": 0.9,
18
- "beta2": 0.95,
19
- "grad_clip": 1.0,
20
- "precision": "bf16",
21
- "num_workers": 0,
22
- "log_interval": 5,
23
- "eval_interval": 100,
24
- "eval_batches": 20,
25
- "save_interval": 50,
26
- "compile_model": false
27
- }