McNu1ty committed on
Commit
b37c8a1
·
verified ·
1 Parent(s): cbe6228

Upload 2 files

Browse files
cifar-gqgan-gs64-cb1024/checkpoints/last.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70945089febc5f99c8ce821da6f0b7e0e994fe55e73e993cadc282ea925cd4ca
3
+ size 498383136
cifar-gqgan-gs64-cb1024/config.yaml ADDED
@@ -0,0 +1,270 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # lightning.pytorch==2.2.0
2
+ seed_everything: 0
3
+ trainer:
4
+ accelerator: gpu
5
+ strategy: ddp_find_unused_parameters_true
6
+ devices: 6
7
+ num_nodes: 1
8
+ precision: 16-mixed
9
+ logger:
10
+ class_path: lightning.pytorch.loggers.TensorBoardLogger
11
+ init_args:
12
+ save_dir: ./logs/gqgan/
13
+ name: null
14
+ version: cifar-test1
15
+ log_graph: false
16
+ default_hp_metric: true
17
+ prefix: ''
18
+ sub_dir: null
19
+ comment: ''
20
+ purge_step: null
21
+ max_queue: 10
22
+ flush_secs: 120
23
+ filename_suffix: ''
24
+ callbacks:
25
+ - class_path: lightning.pytorch.callbacks.ModelCheckpoint
26
+ init_args:
27
+ dirpath: ./logs/gqgan/cifar-test1/checkpoints/
28
+ filename: null
29
+ monitor: null
30
+ verbose: false
31
+ save_last: null
32
+ save_top_k: 1
33
+ save_weights_only: false
34
+ mode: min
35
+ auto_insert_metric_name: true
36
+ every_n_train_steps: null
37
+ train_time_interval: null
38
+ every_n_epochs: null
39
+ save_on_train_epoch_end: null
40
+ enable_version_counter: true
41
+ - class_path: lightning.pytorch.callbacks.LearningRateMonitor
42
+ init_args:
43
+ logging_interval: step
44
+ log_momentum: false
45
+ log_weight_decay: false
46
+ fast_dev_run: false
47
+ max_epochs: 30
48
+ min_epochs: null
49
+ max_steps: -1
50
+ min_steps: null
51
+ max_time: null
52
+ limit_train_batches: null
53
+ limit_val_batches: null
54
+ limit_test_batches: null
55
+ limit_predict_batches: null
56
+ overfit_batches: 0.0
57
+ val_check_interval: null
58
+ check_val_every_n_epoch: 1
59
+ num_sanity_val_steps: -1
60
+ log_every_n_steps: 100
61
+ enable_checkpointing: null
62
+ enable_progress_bar: null
63
+ enable_model_summary: null
64
+ accumulate_grad_batches: 1
65
+ gradient_clip_val: null
66
+ gradient_clip_algorithm: null
67
+ deterministic: null
68
+ benchmark: null
69
+ inference_mode: true
70
+ use_distributed_sampler: true
71
+ profiler: null
72
+ detect_anomaly: false
73
+ barebones: false
74
+ plugins: null
75
+ sync_batchnorm: false
76
+ reload_dataloaders_every_n_epochs: 0
77
+ default_root_dir: null
78
+ model:
79
+ class_path: gstk.models.gqgan_vq_v1.GQGAN
80
+ init_args:
81
+ fm_shape:
82
+ - 16
83
+ - 16
84
+ img_encoder_cfg:
85
+ double_z: false
86
+ z_channels: 64
87
+ resolution: 128
88
+ in_channels: 3
89
+ out_ch: 3
90
+ ch: 128
91
+ ch_mult:
92
+ - 1
93
+ - 2
94
+ num_res_blocks: 4
95
+ img_decoder_cfg:
96
+ double_z: false
97
+ z_channels: 3
98
+ resolution: 128
99
+ in_channels: 3
100
+ out_ch: 3
101
+ ch: 128
102
+ ch_mult:
103
+ - 1
104
+ - 2
105
+ num_res_blocks: 4
106
+ z_channels: 3
107
+ vq_cfg:
108
+ learnable_codebook: false
109
+ ema_update: true
110
+ sync_codebook: true
111
+ dim: 3
112
+ codebook_size: 1024
113
+ accept_image_fmap: false
114
+ decay: 0.8
115
+ commitment_weight: 1.0
116
+ threshold_ema_dead_code: 2
117
+ kmeans_init: true
118
+ kmeans_iters: 10
119
+ gs_embed_cfg:
120
+ fm_lifter_cfg:
121
+ in_dim: 64
122
+ pe_version: sine
123
+ out_dim: 64
124
+ gaussian_lifter_cfg:
125
+ num_anchor: 64
126
+ embed_dim: 64
127
+ anchor_grad: true
128
+ ins_feat_grad: false
129
+ feature_dim: 64
130
+ include_opa: false
131
+ anchor_encoder_cfg:
132
+ embed_dim: 64
133
+ include_opa: false
134
+ feature_dim: 64
135
+ attn_encoder_cfg:
136
+ fm_shape:
137
+ - 16
138
+ - 16
139
+ encoder_layer_cfg:
140
+ embed_dim: 64
141
+ dropout: 0.1
142
+ activation: relu
143
+ n_levels: 1
144
+ num_heads: 4
145
+ n_points: 4
146
+ num_layers: 2
147
+ attn_decoder_cfg:
148
+ fm_shape:
149
+ - 16
150
+ - 16
151
+ decoder_layer_cfg:
152
+ embed_dim: 64
153
+ dropout: 0.1
154
+ activation: relu
155
+ n_levels: 1
156
+ num_heads: 4
157
+ n_points: 4
158
+ num_layers: 2
159
+ proj_drop: 0.1
160
+ residual_mode: cat
161
+ ffn_cfg:
162
+ in_channels: 128
163
+ pre_norm: true
164
+ out_norm: false
165
+ embed_dim: 64
166
+ num_fcs: 2
167
+ ffn_drop: 0.0
168
+ add_identity: true
169
+ refine_cfg:
170
+ embed_dim: 64
171
+ xy_range:
172
+ - -1
173
+ - 1
174
+ initial_scale_range:
175
+ - 0.1
176
+ - 4.0
177
+ final_scale_range:
178
+ - 0.1
179
+ - 3.0
180
+ refine_state:
181
+ - 0
182
+ - 1
183
+ include_opa: false
184
+ dim_feature: 64
185
+ z_channels: 3
186
+ spconv_cfg:
187
+ in_channels: 64
188
+ out_channels: 64
189
+ kernel_size: 5
190
+ fm_shape:
191
+ - 16
192
+ - 16
193
+ use_out_proj: false
194
+ operation_order:
195
+ - cross_attn
196
+ - ffn
197
+ - refine
198
+ - cross_attn
199
+ - ffn
200
+ - refine
201
+ - cross_attn
202
+ - ffn
203
+ - refine
204
+ op_param_share: false
205
+ image_key: image
206
+ use_ema: true
207
+ loss_cfg:
208
+ disc_conditional: false
209
+ disc_in_channels: 3
210
+ disc_start_epoch: 0
211
+ gan_start_epoch: 5
212
+ disc_weight: 0.8
213
+ gen_loss_weight: 0.1
214
+ lecam_loss_weight: 0.05
215
+ commit_weight: 0.25
216
+ optim_gen_cfg:
217
+ opt: adamw
218
+ lr: 0.0002
219
+ betas:
220
+ - 0.9
221
+ - 0.999
222
+ weight_decay: 0.01
223
+ optim_disc_cfg:
224
+ opt: adamw
225
+ lr: 0.0002
226
+ betas:
227
+ - 0.9
228
+ - 0.999
229
+ weight_decay: 0.01
230
+ lr_scheduler_cfg:
231
+ sched: cosine
232
+ warmup_lr: 1.0e-06
233
+ min_lr: 0.0
234
+ warmup_epochs: 1
235
+ step_on_epochs: false
236
+ num_epochs: null
237
+ updates_per_epoch: null
238
+ embed_dim: 64
239
+ num_gs: 64
240
+ xy_range:
241
+ - -1
242
+ - 1
243
+ initial_scale_range:
244
+ - 0.1
245
+ - 4.0
246
+ final_scale_range:
247
+ - 0.1
248
+ - 3.0
249
+ include_opa: false
250
+ data:
251
+ class_path: gstk.data.from_config.DataModuleFromConfig
252
+ init_args:
253
+ batch_size: 64
254
+ train:
255
+ target: gstk.data.dataset.MyCIFAR
256
+ params:
257
+ train: true
258
+ validation:
259
+ target: gstk.data.dataset.MyCIFAR
260
+ params:
261
+ train: false
262
+ test:
263
+ target: gstk.data.dataset.MyCIFAR
264
+ params:
265
+ train: false
266
+ wrap: false
267
+ num_workers: 8
268
+ optimizer: null
269
+ lr_scheduler: null
270
+ ckpt_path: null