Xsmos committed on
Commit
19a0366
·
verified ·
1 Parent(s): 77c1fc3
diffusion_test.py CHANGED
@@ -495,7 +495,7 @@ class DDPM21CM:
495
  pbar_train = tqdm(total=len(self.dataloader), file=sys.stderr, disable=True)#, mininterval=self.config.pbar_update_step)#, disable=True)#not self.accelerator.is_local_main_process)
496
  pbar_train.set_description(f"{socket.gethostbyname(socket.gethostname())} cuda:{torch.cuda.current_device()}/{self.config.global_rank} Epoch {ep}")
497
  epoch_start = time()
498
- print(f"epoch = {ep}")
499
  for i, (x, c) in enumerate(self.dataloader):
500
  x = self.transform(x)
501
  x = x.to(self.config.device)#.to(self.config.dtype)
 
495
  pbar_train = tqdm(total=len(self.dataloader), file=sys.stderr, disable=True)#, mininterval=self.config.pbar_update_step)#, disable=True)#not self.accelerator.is_local_main_process)
496
  pbar_train.set_description(f"{socket.gethostbyname(socket.gethostname())} cuda:{torch.cuda.current_device()}/{self.config.global_rank} Epoch {ep}")
497
  epoch_start = time()
498
+ #print(f"epoch = {ep}")
499
  for i, (x, c) in enumerate(self.dataloader):
500
  x = self.transform(x)
501
  x = x.to(self.config.device)#.to(self.config.dtype)
perlmutter_diffusion.sbatch CHANGED
@@ -35,10 +35,10 @@ srun python diffusion.py \
35
  --num_new_img_per_gpu 4 \
36
  --max_num_img_per_gpu 2 \
37
  --gradient_accumulation_steps 1 \
38
- --autocast 1 \
39
  --use_checkpoint 1 \
40
  --dropout 0.1 \
41
- --resume ./outputs/model-N1600-device_count4-node4-epoch9-20051216 \
42
  #--train "$SCRATCH/LEN128-DIM64-CUB16-Tvir[4, 6]-zeta[10, 250]-0809-123640.h5" \
43
 
44
  date
 
35
  --num_new_img_per_gpu 4 \
36
  --max_num_img_per_gpu 2 \
37
  --gradient_accumulation_steps 1 \
38
+ --autocast 0 \
39
  --use_checkpoint 1 \
40
  --dropout 0.1 \
41
+ --resume ./outputs/model-N1600-device_count4-node4-epoch29-20051216 \
42
  #--train "$SCRATCH/LEN128-DIM64-CUB16-Tvir[4, 6]-zeta[10, 250]-0809-123640.h5" \
43
 
44
  date
quantify_results.ipynb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4959c36d99047fc29ed5ded2317a3f74e5fbca497e8848778ed4e86c41e5f56
3
- size 12046825
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0c13ff1f79531d58b80a67cf6ae9141685d85483eac6006d7fc90f33d55283e
3
+ size 28539850