20051216
Browse files
- diffusion_test.py +1 -1
- perlmutter_diffusion.sbatch +2 -2
- quantify_results.ipynb +2 -2
diffusion_test.py
CHANGED
|
@@ -495,7 +495,7 @@ class DDPM21CM:
|
|
| 495 |
pbar_train = tqdm(total=len(self.dataloader), file=sys.stderr, disable=True)#, mininterval=self.config.pbar_update_step)#, disable=True)#not self.accelerator.is_local_main_process)
|
| 496 |
pbar_train.set_description(f"{socket.gethostbyname(socket.gethostname())} cuda:{torch.cuda.current_device()}/{self.config.global_rank} Epoch {ep}")
|
| 497 |
epoch_start = time()
|
| 498 |
-
print(f"epoch = {ep}")
|
| 499 |
for i, (x, c) in enumerate(self.dataloader):
|
| 500 |
x = self.transform(x)
|
| 501 |
x = x.to(self.config.device)#.to(self.config.dtype)
|
|
|
|
| 495 |
pbar_train = tqdm(total=len(self.dataloader), file=sys.stderr, disable=True)#, mininterval=self.config.pbar_update_step)#, disable=True)#not self.accelerator.is_local_main_process)
|
| 496 |
pbar_train.set_description(f"{socket.gethostbyname(socket.gethostname())} cuda:{torch.cuda.current_device()}/{self.config.global_rank} Epoch {ep}")
|
| 497 |
epoch_start = time()
|
| 498 |
+
#print(f"epoch = {ep}")
|
| 499 |
for i, (x, c) in enumerate(self.dataloader):
|
| 500 |
x = self.transform(x)
|
| 501 |
x = x.to(self.config.device)#.to(self.config.dtype)
|
perlmutter_diffusion.sbatch
CHANGED
|
@@ -35,10 +35,10 @@ srun python diffusion.py \
|
|
| 35 |
--num_new_img_per_gpu 4 \
|
| 36 |
--max_num_img_per_gpu 2 \
|
| 37 |
--gradient_accumulation_steps 1 \
|
| 38 |
-
--autocast
|
| 39 |
--use_checkpoint 1 \
|
| 40 |
--dropout 0.1 \
|
| 41 |
-
--resume ./outputs/model-N1600-device_count4-node4-
|
| 42 |
#--train "$SCRATCH/LEN128-DIM64-CUB16-Tvir[4, 6]-zeta[10, 250]-0809-123640.h5" \
|
| 43 |
|
| 44 |
date
|
|
|
|
| 35 |
--num_new_img_per_gpu 4 \
|
| 36 |
--max_num_img_per_gpu 2 \
|
| 37 |
--gradient_accumulation_steps 1 \
|
| 38 |
+
--autocast 0 \
|
| 39 |
--use_checkpoint 1 \
|
| 40 |
--dropout 0.1 \
|
| 41 |
+
--resume ./outputs/model-N1600-device_count4-node4-epoch29-20051216 \
|
| 42 |
#--train "$SCRATCH/LEN128-DIM64-CUB16-Tvir[4, 6]-zeta[10, 250]-0809-123640.h5" \
|
| 43 |
|
| 44 |
date
|
quantify_results.ipynb
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0c13ff1f79531d58b80a67cf6ae9141685d85483eac6006d7fc90f33d55283e
|
| 3 |
+
size 28539850
|