AlienKevin committed on
Commit
0398ac1
·
verified ·
1 Parent(s): 91541a2

Upload CIFAR-10 checkpoint and config (2025-09-13T16:23:39.476367Z)

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ ckpt-150000.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
ckpt-150000.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca88d7fd9f9e32d5d52e171c2b57aeef05262866ed29bebed957969f0daf19ff
3
+ size 495423956
ckpt-150000.index ADDED
Binary file (64 kB). View file
 
config.json ADDED
@@ -0,0 +1,124 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": {
3
+ "batch_duplicates": 1,
4
+ "cache_dataset": true,
5
+ "cropping": "none",
6
+ "eval_split": "test",
7
+ "flipping": "left_right",
8
+ "image_size": 32,
9
+ "name": "object_recognition",
10
+ "num_classes": 10,
11
+ "tfds_name": "cifar10",
12
+ "train_split": "train"
13
+ },
14
+ "datasets": [
15
+ {
16
+ "batch_duplicates": 1,
17
+ "cache_dataset": true,
18
+ "cropping": "none",
19
+ "eval_split": "test",
20
+ "flipping": "left_right",
21
+ "image_size": 32,
22
+ "name": "object_recognition",
23
+ "num_classes": 10,
24
+ "tfds_name": "cifar10",
25
+ "train_split": "train"
26
+ }
27
+ ],
28
+ "eval": {
29
+ "batch_size": 64,
30
+ "checkpoint_dir": "",
31
+ "steps": 2,
32
+ "tag": "eval",
33
+ "write_images_to_file": true
34
+ },
35
+ "model": {
36
+ "arch_name": "tape",
37
+ "b_scale": 1.0,
38
+ "b_type": "uint8",
39
+ "cond_decoupled_read": false,
40
+ "cond_dim": 0,
41
+ "cond_dropout": 0.0,
42
+ "cond_on_latent": true,
43
+ "cond_proj": true,
44
+ "cond_tape_writable": false,
45
+ "conditional": "class",
46
+ "conv_drop_units": 0.0,
47
+ "conv_kernel_size": 0,
48
+ "drop_att": 0.0,
49
+ "drop_path": 0.1,
50
+ "drop_sc": 0.0,
51
+ "drop_units": 0.1,
52
+ "flip_rate": 0.0,
53
+ "guidance": 0.0,
54
+ "infer_iterations": 100,
55
+ "infer_schedule": "cosine",
56
+ "latent_dim": 512,
57
+ "latent_mlp_ratio": 4,
58
+ "latent_num_heads": 16,
59
+ "latent_pos_encoding": "learned",
60
+ "latent_slots": 128,
61
+ "loss_type": "eps",
62
+ "name": "image_diffusion_model",
63
+ "normalize_noisy_input": false,
64
+ "num_layers": "2,2,2",
65
+ "patch_size": 2,
66
+ "pos_encoding": "sin_cos",
67
+ "pred_type": "eps",
68
+ "pretrained_ckpt": "",
69
+ "rw_num_heads": 8,
70
+ "sampler_name": "ddpm",
71
+ "self_cond": "latent",
72
+ "self_cond_by_masking": true,
73
+ "self_cond_rate": 0.9,
74
+ "tape_dim": 256,
75
+ "tape_mlp_ratio": 2,
76
+ "tape_pos_encoding": "learned",
77
+ "td": 0.0,
78
+ "time_on_latent": true,
79
+ "time_scaling": 1000,
80
+ "train_schedule": "sigmoid@-3,3,0.9",
81
+ "use_cls_token": false,
82
+ "x0_clip": "auto",
83
+ "xattn_enc_ln": false
84
+ },
85
+ "model_dir": "results/cifar10",
86
+ "optimization": {
87
+ "beta1": 0.9,
88
+ "beta2": 0.999,
89
+ "ema_decay": 0.9999,
90
+ "ema_name_exact_match": true,
91
+ "end_lr_factor": 0.0,
92
+ "eps": 1e-08,
93
+ "exclude_from_weight_decay": "bias,beta,gamma",
94
+ "global_clipnorm": 1.0,
95
+ "learning_rate": 0.003,
96
+ "learning_rate_scaling": "none",
97
+ "learning_rate_schedule": "cosine@0.8",
98
+ "momentum": 0.9,
99
+ "optimizer": "lamb",
100
+ "tail_steps": 0,
101
+ "warmup_epochs": 0,
102
+ "warmup_steps": 10000,
103
+ "weight_decay": 0.01
104
+ },
105
+ "task": {
106
+ "name": "image_generation",
107
+ "weight": 1.0
108
+ },
109
+ "tasks": [
110
+ {
111
+ "name": "image_generation",
112
+ "weight": 1.0
113
+ }
114
+ ],
115
+ "train": {
116
+ "batch_size": 256,
117
+ "checkpoint_epochs": 40,
118
+ "checkpoint_steps": 1000,
119
+ "epochs": 100,
120
+ "keep_checkpoint_max": 10,
121
+ "label_smoothing": 0.0,
122
+ "steps": 150000
123
+ }
124
+ }
events.out.tfevents.1757712604.viscam-hgx-2.stanford.edu.2124946.0.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7836654b71b5840b1dcf6d1a68de9331ae80313d9d6f3f39c1723138f62465dd
3
+ size 84116