recoilme committed on
Commit
d016c5e
·
1 Parent(s): 37f77d5
samples/unet_320x576_0.jpg CHANGED

Git LFS Details

  • SHA256: 53d5c579c2ae2ce32d33da94086d1f1895b74b2c13fe5b43d8acadc31b69f061
  • Pointer size: 130 Bytes
  • Size of remote file: 88.1 kB

Git LFS Details

  • SHA256: eed0d246e8bdfed17954d0297fea5454e5c34d2a575beca2990c190b53f52b81
  • Pointer size: 130 Bytes
  • Size of remote file: 72.3 kB
samples/unet_384x576_0.jpg CHANGED

Git LFS Details

  • SHA256: ad5a62380302159303d196b4d7485bcdfae708e2581137facf32c812fb137ea3
  • Pointer size: 130 Bytes
  • Size of remote file: 66.4 kB

Git LFS Details

  • SHA256: 3cf732a24718890a14c01042039e7f518d3759b5e96e76d3f6f630242ba76043
  • Pointer size: 130 Bytes
  • Size of remote file: 84.7 kB
samples/unet_448x576_0.jpg CHANGED

Git LFS Details

  • SHA256: efe165b199ae5812519ff3bce19b3f7cf179577f10ed819da3cbb34e7e957a16
  • Pointer size: 130 Bytes
  • Size of remote file: 70.3 kB

Git LFS Details

  • SHA256: cf263b79b00a6b24af3707e40d5fc4f2155327d37d39bee7b96750966a676515
  • Pointer size: 130 Bytes
  • Size of remote file: 70.7 kB
samples/unet_512x576_0.jpg CHANGED

Git LFS Details

  • SHA256: b606ed102d90ecbe6a9f1f603ce4b8d6c2aa50be42cbe2b54e4a69e603262c71
  • Pointer size: 131 Bytes
  • Size of remote file: 135 kB

Git LFS Details

  • SHA256: b2253da9aebbea17fb23d63061a64a43c66b53c297ed7caee6c142fa6c091427
  • Pointer size: 131 Bytes
  • Size of remote file: 101 kB
samples/unet_576x320_0.jpg CHANGED

Git LFS Details

  • SHA256: 1523b417c12130766aef934b3602b2eb9b74de05393aa12482bc6cb6c5776ab6
  • Pointer size: 130 Bytes
  • Size of remote file: 62.6 kB

Git LFS Details

  • SHA256: 948a46962a49b7ad1c503f3b1bae6e06cd00e097e8e24de307bf4173de69089d
  • Pointer size: 130 Bytes
  • Size of remote file: 32.8 kB
samples/unet_576x384_0.jpg CHANGED

Git LFS Details

  • SHA256: 1fc415802e367557b6748491c574d164074ab96b84144894b722066773e2dff4
  • Pointer size: 130 Bytes
  • Size of remote file: 57.9 kB

Git LFS Details

  • SHA256: fcea4e4dd33bc40e7f33145d1e0e433701ba0bcca3af242bd35a328250e611d6
  • Pointer size: 130 Bytes
  • Size of remote file: 96.1 kB
samples/unet_576x448_0.jpg CHANGED

Git LFS Details

  • SHA256: 706adfb5a07ef0b2ba85ed08d02ff376b743db266b231c25a91a3981568468b4
  • Pointer size: 130 Bytes
  • Size of remote file: 74.7 kB

Git LFS Details

  • SHA256: 6621334078214223cef6a53cf8d2012d70abbf8b79dbd1b3475cc82c1293aebd
  • Pointer size: 130 Bytes
  • Size of remote file: 73 kB
samples/unet_576x512_0.jpg CHANGED

Git LFS Details

  • SHA256: 4bcbeaed34f56ce59d68452e221571b93f27fc80b35433efea9c1ef392004578
  • Pointer size: 131 Bytes
  • Size of remote file: 162 kB

Git LFS Details

  • SHA256: a99a72655016630a58c2916813c199e1e2e48c57560489093e80adde7b40fdfb
  • Pointer size: 130 Bytes
  • Size of remote file: 68.4 kB
samples/unet_576x576_0.jpg CHANGED

Git LFS Details

  • SHA256: 995385b7a6bf76c3f4cf9732700b5d11fc631d5afe791867de14e6cc0200c471
  • Pointer size: 131 Bytes
  • Size of remote file: 150 kB

Git LFS Details

  • SHA256: cc8d71d65f12421eb13f7ef20cb67397c50a3586a9a4d27db88fa3ddd85be551
  • Pointer size: 131 Bytes
  • Size of remote file: 251 kB
src/cherrypick.ipynb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3bc29d6c8ede5a64c8ae9b2f8f824d4edfe91209bc6a6363a43ab66ec01d68f
3
- size 44788
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a7a1a0affd76326768c9aa37d032b8c0156a10f06f3fe53b98ca695a9dac57f
3
+ size 44433
train.py CHANGED
@@ -28,9 +28,9 @@ import torch.nn.functional as F
28
  ds_path = "datasets/576"
29
  project = "unet"
30
  batch_size = 40
31
- base_learning_rate = 2e-5
32
- min_learning_rate = 9e-6
33
- num_epochs = 16
34
  # samples/save per epoch
35
  sample_interval_share = 5
36
  use_wandb = True
@@ -51,7 +51,7 @@ dtype = torch.float32
51
  save_barrier = 1.03
52
  dispersive_temperature=0.5
53
  dispersive_weight=0.05
54
- percentile_clipping = 97 # 8bit optim
55
  steps_offset = 1 # Scheduler
56
  limit = 0
57
  checkpoints_folder = ""
@@ -880,7 +880,6 @@ for epoch in range(start_epoch, start_epoch + num_epochs):
880
  dispersive_loss = dispersive_hook.weight * dispersive_hook.compute_dispersive_loss()
881
  if torch.isnan(dispersive_loss) or torch.isinf(dispersive_loss):
882
  print(f"Rank {accelerator.process_index}: Found nan/inf in dispersive_loss: {total_loss}")
883
- #break
884
 
885
  # Итоговый loss
886
  # dispersive_loss должен падать и тотал падать - поэтому плюс
@@ -905,7 +904,7 @@ for epoch in range(start_epoch, start_epoch + num_epochs):
905
  if not fbp:
906
  if accelerator.sync_gradients:
907
  with torch.amp.autocast('cuda', enabled=False):
908
- grad = accelerator.clip_grad_norm_(unet.parameters(), 1.)
909
  optimizer.step()
910
  lr_scheduler.step()
911
  optimizer.zero_grad(set_to_none=True)
 
28
  ds_path = "datasets/576"
29
  project = "unet"
30
  batch_size = 40
31
+ base_learning_rate = 9e-6
32
+ min_learning_rate = 8e-6
33
+ num_epochs = 6
34
  # samples/save per epoch
35
  sample_interval_share = 5
36
  use_wandb = True
 
51
  save_barrier = 1.03
52
  dispersive_temperature=0.5
53
  dispersive_weight=0.05
54
+ percentile_clipping = 95 # 8bit optim
55
  steps_offset = 1 # Scheduler
56
  limit = 0
57
  checkpoints_folder = ""
 
880
  dispersive_loss = dispersive_hook.weight * dispersive_hook.compute_dispersive_loss()
881
  if torch.isnan(dispersive_loss) or torch.isinf(dispersive_loss):
882
  print(f"Rank {accelerator.process_index}: Found nan/inf in dispersive_loss: {total_loss}")
 
883
 
884
  # Итоговый loss
885
  # dispersive_loss должен падать и тотал падать - поэтому плюс
 
904
  if not fbp:
905
  if accelerator.sync_gradients:
906
  with torch.amp.autocast('cuda', enabled=False):
907
+ grad = accelerator.clip_grad_norm_(unet.parameters(), 0.5)
908
  optimizer.step()
909
  lr_scheduler.step()
910
  optimizer.zero_grad(set_to_none=True)
unet/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07a685bcb8f3815c8b00c3d72f767a0f5cee548614bf2ed03c9cee89e4523681
3
  size 7014306128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3991dd208c9c94d95c5c2465e0dc11197da00f0b30aebb53d89b3e9bc9392ae4
3
  size 7014306128