louaaron committed on
Commit
52eed37
·
verified ·
1 Parent(s): b83c234

Create config.json

Browse files
Files changed (1) hide show
  1. config.json +62 -0
config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ngpus": 8,
3
+ "tokens": 50257,
4
+ "training": {
5
+ "batch_size": 512,
6
+ "accum": 2,
7
+ "n_iters": 1300001,
8
+ "snapshot_freq": 50000,
9
+ "log_freq": 50,
10
+ "eval_freq": 100,
11
+ "snapshot_freq_for_preemption": 10000,
12
+ "weight": "standard",
13
+ "snapshot_sampling": true,
14
+ "ema": 0.9999
15
+ },
16
+ "data": {
17
+ "train": "openwebtext",
18
+ "valid": "wikitext103",
19
+ "cache_dir": "data"
20
+ },
21
+ "graph": {
22
+ "type": "absorb"
23
+ },
24
+ "noise": {
25
+ "type": "loglinear",
26
+ "sigma_min": 0.0001,
27
+ "sigma_max": 20
28
+ },
29
+ "sampling": {
30
+ "predictor": "euler",
31
+ "steps": 128,
32
+ "noise_removal": true
33
+ },
34
+ "eval": {
35
+ "batch_size": 512,
36
+ "perplexity": true,
37
+ "perplexity_batch_size": 32
38
+ },
39
+ "optim": {
40
+ "weight_decay": 0,
41
+ "optimizer": "AdamW",
42
+ "lr": 0.0003,
43
+ "beta1": 0.9,
44
+ "beta2": 0.999,
45
+ "eps": 1e-08,
46
+ "warmup": 2500,
47
+ "grad_clip": 1.0
48
+ },
49
+ "model": {
50
+ "name": "medium",
51
+ "type": "ddit",
52
+ "hidden_size": 1024,
53
+ "cond_dim": 128,
54
+ "length": 1024,
55
+ "n_blocks": 24,
56
+ "n_heads": 16,
57
+ "scale_by_sigma": true,
58
+ "dropout": 0.1,
59
+ "score_strategy": 0
60
+ },
61
+ "work_dir": "absorb_medium"
62
+ }