LamTNguyen commited on
Commit
d877cbe
·
verified ·
1 Parent(s): 2ebde61

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165/log.txt +25 -0
  2. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165/progress.csv +2 -0
  3. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/ema_0.995_090000.pt +3 -0
  4. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/log.txt +2053 -0
  5. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/model090000.pt +3 -0
  6. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_indistro_terms.npz +3 -0
  7. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_outdistro_terms.npz +3 -0
  8. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_indistro_terms.npz +3 -0
  9. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_outdistro_terms.npz +3 -0
  10. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_indistro_terms.npz +3 -0
  11. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_outdistro_terms.npz +3 -0
  12. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_indistro_terms.npz +3 -0
  13. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_outdistro_terms.npz +3 -0
  14. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_indistro_terms.npz +3 -0
  15. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_outdistro_terms.npz +3 -0
  16. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_indistro_terms.npz +3 -0
  17. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_outdistro_terms.npz +3 -0
  18. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_indistro_terms.npz +3 -0
  19. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_outdistro_terms.npz +3 -0
  20. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_indistro_terms.npz +3 -0
  21. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_outdistro_terms.npz +3 -0
  22. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/progress.csv +92 -0
  23. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_indistro_terms.npz +3 -0
  24. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_outdistro_terms.npz +3 -0
  25. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_indistro_terms.npz +3 -0
  26. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_outdistro_terms.npz +3 -0
  27. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_indistro_terms.npz +3 -0
  28. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_outdistro_terms.npz +3 -0
  29. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_indistro_terms.npz +3 -0
  30. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_outdistro_terms.npz +3 -0
  31. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_indistro_terms.npz +3 -0
  32. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_outdistro_terms.npz +3 -0
  33. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_indistro_terms.npz +3 -0
  34. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_outdistro_terms.npz +3 -0
  35. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_indistro_terms.npz +3 -0
  36. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_outdistro_terms.npz +3 -0
  37. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_indistro_terms.npz +3 -0
  38. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_outdistro_terms.npz +3 -0
  39. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_indistro_terms.npz +3 -0
  40. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_outdistro_terms.npz +3 -0
  41. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_indistro_terms.npz +3 -0
  42. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_outdistro_terms.npz +3 -0
  43. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_indistro_terms.npz +3 -0
  44. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_outdistro_terms.npz +3 -0
  45. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_indistro_terms.npz +3 -0
  46. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_outdistro_terms.npz +3 -0
  47. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_indistro_terms.npz +3 -0
  48. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_outdistro_terms.npz +3 -0
  49. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_indistro_terms.npz +3 -0
  50. cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_outdistro_terms.npz +3 -0
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165/log.txt ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Logging to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165
2
+ creating model and diffusion...
3
+ creating data loader...
4
+ training...
5
+ -------------------------
6
+ | grad_norm | 2.54 |
7
+ | loss | 1.01 |
8
+ | loss_q0 | 1.01 |
9
+ | loss_q1 | 1.01 |
10
+ | loss_q2 | 1.01 |
11
+ | loss_q3 | 1.01 |
12
+ | mse | 0.999 |
13
+ | mse_q0 | 1 |
14
+ | mse_q1 | 1.01 |
15
+ | mse_q2 | 0.996 |
16
+ | mse_q3 | 1 |
17
+ | param_norm | 180 |
18
+ | samples | 16 |
19
+ | step | 0 |
20
+ | vb | 0.00969 |
21
+ | vb_q0 | 0.00814 |
22
+ | vb_q1 | 0.00726 |
23
+ | vb_q2 | 0.00917 |
24
+ | vb_q3 | 0.0122 |
25
+ -------------------------
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165/progress.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ grad_norm,loss,loss_q0,loss_q1,loss_q2,loss_q3,mse,mse_q0,mse_q1,mse_q2,mse_q3,param_norm,samples,step,vb,vb_q0,vb_q1,vb_q2,vb_q3
2
+ 2.5351430912370003,1.0083870887756348,1.0080348,1.0147415,1.0054059,1.0136827,0.998694896697998,0.99989533,1.0074818,0.9962311,1.0014414,180.41246248133166,16,0,0.009692199528217316,0.008139333,0.0072596963,0.009174611,0.012241336
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/ema_0.995_090000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31fd61b64d5548d00967160f3b4b7c1a29760cd6ea3de1c6a5a326de34201688
3
+ size 118795331
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/log.txt ADDED
@@ -0,0 +1,2053 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Logging to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947
2
+ creating model and diffusion...
3
+ creating data loader...
4
+ training...
5
+ -------------------------
6
+ | grad_norm | 2.54 |
7
+ | loss | 1.01 |
8
+ | loss_q0 | 1.01 |
9
+ | loss_q1 | 1.01 |
10
+ | loss_q2 | 1.01 |
11
+ | loss_q3 | 1.01 |
12
+ | mse | 0.999 |
13
+ | mse_q0 | 1 |
14
+ | mse_q1 | 1.01 |
15
+ | mse_q2 | 0.996 |
16
+ | mse_q3 | 1 |
17
+ | param_norm | 180 |
18
+ | samples | 16 |
19
+ | step | 0 |
20
+ | vb | 0.00969 |
21
+ | vb_q0 | 0.00814 |
22
+ | vb_q1 | 0.00726 |
23
+ | vb_q2 | 0.00917 |
24
+ | vb_q3 | 0.0122 |
25
+ -------------------------
26
+ -------------------------
27
+ | grad_norm | 0.387 |
28
+ | loss | 0.119 |
29
+ | loss_q0 | 0.231 |
30
+ | loss_q1 | 0.0923 |
31
+ | loss_q2 | 0.0775 |
32
+ | loss_q3 | 0.0703 |
33
+ | mse | 0.112 |
34
+ | mse_q0 | 0.208 |
35
+ | mse_q1 | 0.0916 |
36
+ | mse_q2 | 0.0767 |
37
+ | mse_q3 | 0.0694 |
38
+ | param_norm | 181 |
39
+ | samples | 1.6e+04 |
40
+ | step | 1e+03 |
41
+ | vb | 0.00636 |
42
+ | vb_q0 | 0.0225 |
43
+ | vb_q1 | 0.000681 |
44
+ | vb_q2 | 0.00072 |
45
+ | vb_q3 | 0.000888 |
46
+ -------------------------
47
+ -------------------------
48
+ | grad_norm | 0.123 |
49
+ | loss | 0.0423 |
50
+ | loss_q0 | 0.138 |
51
+ | loss_q1 | 0.0212 |
52
+ | loss_q2 | 0.00602 |
53
+ | loss_q3 | 0.003 |
54
+ | mse | 0.0386 |
55
+ | mse_q0 | 0.124 |
56
+ | mse_q1 | 0.0211 |
57
+ | mse_q2 | 0.00597 |
58
+ | mse_q3 | 0.00296 |
59
+ | param_norm | 181 |
60
+ | samples | 3.2e+04 |
61
+ | step | 2e+03 |
62
+ | vb | 0.00371 |
63
+ | vb_q0 | 0.0145 |
64
+ | vb_q1 | 0.000156 |
65
+ | vb_q2 | 5.42e-05 |
66
+ | vb_q3 | 3.8e-05 |
67
+ -------------------------
68
+ -------------------------
69
+ | grad_norm | 0.109 |
70
+ | loss | 0.0398 |
71
+ | loss_q0 | 0.132 |
72
+ | loss_q1 | 0.02 |
73
+ | loss_q2 | 0.00499 |
74
+ | loss_q3 | 0.00191 |
75
+ | mse | 0.0359 |
76
+ | mse_q0 | 0.116 |
77
+ | mse_q1 | 0.0198 |
78
+ | mse_q2 | 0.00495 |
79
+ | mse_q3 | 0.00188 |
80
+ | param_norm | 181 |
81
+ | samples | 4.8e+04 |
82
+ | step | 3e+03 |
83
+ | vb | 0.00389 |
84
+ | vb_q0 | 0.0153 |
85
+ | vb_q1 | 0.000147 |
86
+ | vb_q2 | 4.46e-05 |
87
+ | vb_q3 | 2.41e-05 |
88
+ -------------------------
89
+ -------------------------
90
+ | grad_norm | 0.0996 |
91
+ | loss | 0.039 |
92
+ | loss_q0 | 0.13 |
93
+ | loss_q1 | 0.0193 |
94
+ | loss_q2 | 0.00441 |
95
+ | loss_q3 | 0.00145 |
96
+ | mse | 0.0342 |
97
+ | mse_q0 | 0.111 |
98
+ | mse_q1 | 0.0192 |
99
+ | mse_q2 | 0.00437 |
100
+ | mse_q3 | 0.00143 |
101
+ | param_norm | 182 |
102
+ | samples | 6.4e+04 |
103
+ | step | 4e+03 |
104
+ | vb | 0.00478 |
105
+ | vb_q0 | 0.0188 |
106
+ | vb_q1 | 0.000142 |
107
+ | vb_q2 | 3.95e-05 |
108
+ | vb_q3 | 1.83e-05 |
109
+ -------------------------
110
+ -------------------------
111
+ | grad_norm | 0.0932 |
112
+ | loss | 0.0376 |
113
+ | loss_q0 | 0.125 |
114
+ | loss_q1 | 0.0189 |
115
+ | loss_q2 | 0.00411 |
116
+ | loss_q3 | 0.00115 |
117
+ | mse | 0.0337 |
118
+ | mse_q0 | 0.109 |
119
+ | mse_q1 | 0.0188 |
120
+ | mse_q2 | 0.00408 |
121
+ | mse_q3 | 0.00114 |
122
+ | param_norm | 182 |
123
+ | samples | 8e+04 |
124
+ | step | 5e+03 |
125
+ | vb | 0.00392 |
126
+ | vb_q0 | 0.0153 |
127
+ | vb_q1 | 0.000139 |
128
+ | vb_q2 | 3.67e-05 |
129
+ | vb_q3 | 1.45e-05 |
130
+ -------------------------
131
+ -------------------------
132
+ | grad_norm | 0.0887 |
133
+ | loss | 0.0355 |
134
+ | loss_q0 | 0.121 |
135
+ | loss_q1 | 0.0185 |
136
+ | loss_q2 | 0.00402 |
137
+ | loss_q3 | 0.000991 |
138
+ | mse | 0.0322 |
139
+ | mse_q0 | 0.107 |
140
+ | mse_q1 | 0.0184 |
141
+ | mse_q2 | 0.00398 |
142
+ | mse_q3 | 0.000978 |
143
+ | param_norm | 182 |
144
+ | samples | 9.6e+04 |
145
+ | step | 6e+03 |
146
+ | vb | 0.00333 |
147
+ | vb_q0 | 0.0134 |
148
+ | vb_q1 | 0.000136 |
149
+ | vb_q2 | 3.57e-05 |
150
+ | vb_q3 | 1.24e-05 |
151
+ -------------------------
152
+ -------------------------
153
+ | grad_norm | 0.0888 |
154
+ | loss | 0.0371 |
155
+ | loss_q0 | 0.126 |
156
+ | loss_q1 | 0.0184 |
157
+ | loss_q2 | 0.00386 |
158
+ | loss_q3 | 0.000895 |
159
+ | mse | 0.0326 |
160
+ | mse_q0 | 0.108 |
161
+ | mse_q1 | 0.0183 |
162
+ | mse_q2 | 0.00383 |
163
+ | mse_q3 | 0.000884 |
164
+ | param_norm | 183 |
165
+ | samples | 1.12e+05 |
166
+ | step | 7e+03 |
167
+ | vb | 0.00445 |
168
+ | vb_q0 | 0.0177 |
169
+ | vb_q1 | 0.000135 |
170
+ | vb_q2 | 3.43e-05 |
171
+ | vb_q3 | 1.12e-05 |
172
+ -------------------------
173
+ -------------------------
174
+ | grad_norm | 0.0858 |
175
+ | loss | 0.0357 |
176
+ | loss_q0 | 0.12 |
177
+ | loss_q1 | 0.0183 |
178
+ | loss_q2 | 0.0038 |
179
+ | loss_q3 | 0.000822 |
180
+ | mse | 0.0324 |
181
+ | mse_q0 | 0.107 |
182
+ | mse_q1 | 0.0181 |
183
+ | mse_q2 | 0.00377 |
184
+ | mse_q3 | 0.000812 |
185
+ | param_norm | 183 |
186
+ | samples | 1.28e+05 |
187
+ | step | 8e+03 |
188
+ | vb | 0.00332 |
189
+ | vb_q0 | 0.013 |
190
+ | vb_q1 | 0.000134 |
191
+ | vb_q2 | 3.38e-05 |
192
+ | vb_q3 | 1.03e-05 |
193
+ -------------------------
194
+ -------------------------
195
+ | grad_norm | 0.0835 |
196
+ | loss | 0.0363 |
197
+ | loss_q0 | 0.123 |
198
+ | loss_q1 | 0.0183 |
199
+ | loss_q2 | 0.00378 |
200
+ | loss_q3 | 0.000763 |
201
+ | mse | 0.0322 |
202
+ | mse_q0 | 0.107 |
203
+ | mse_q1 | 0.0181 |
204
+ | mse_q2 | 0.00375 |
205
+ | mse_q3 | 0.000754 |
206
+ | param_norm | 184 |
207
+ | samples | 1.44e+05 |
208
+ | step | 9e+03 |
209
+ | vb | 0.00412 |
210
+ | vb_q0 | 0.0164 |
211
+ | vb_q1 | 0.000134 |
212
+ | vb_q2 | 3.34e-05 |
213
+ | vb_q3 | 9.54e-06 |
214
+ -------------------------
215
+ -------------------------
216
+ | grad_norm | 0.0782 |
217
+ | loss | 0.0356 |
218
+ | loss_q0 | 0.121 |
219
+ | loss_q1 | 0.018 |
220
+ | loss_q2 | 0.00372 |
221
+ | loss_q3 | 0.000705 |
222
+ | mse | 0.0315 |
223
+ | mse_q0 | 0.105 |
224
+ | mse_q1 | 0.0179 |
225
+ | mse_q2 | 0.00369 |
226
+ | mse_q3 | 0.000696 |
227
+ | param_norm | 184 |
228
+ | samples | 1.6e+05 |
229
+ | step | 1e+04 |
230
+ | vb | 0.00407 |
231
+ | vb_q0 | 0.0163 |
232
+ | vb_q1 | 0.000132 |
233
+ | vb_q2 | 3.29e-05 |
234
+ | vb_q3 | 8.77e-06 |
235
+ -------------------------
236
+ saving model 0...
237
+ saving model 0.995...
238
+ evaluation indistro starting...
239
+ done 96 samples: bpd=3.809229850769043
240
+ done 192 samples: bpd=3.8889626264572144
241
+ done 288 samples: bpd=3.8427980740865073
242
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_indistro_terms.npz
243
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_indistro_terms.npz
244
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_indistro_terms.npz
245
+ evaluation nll complete
246
+ evaluation outdistro starting...
247
+ done 192 samples: bpd=4.073406219482422
248
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_outdistro_terms.npz
249
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_outdistro_terms.npz
250
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_outdistro_terms.npz
251
+ evaluation nll complete
252
+ sampling starting...
253
+ -------------------------
254
+ | grad_norm | 0.0793 |
255
+ | loss | 0.0355 |
256
+ | loss_q0 | 0.119 |
257
+ | loss_q1 | 0.0179 |
258
+ | loss_q2 | 0.00367 |
259
+ | loss_q3 | 0.000674 |
260
+ | mse | 0.0318 |
261
+ | mse_q0 | 0.104 |
262
+ | mse_q1 | 0.0178 |
263
+ | mse_q2 | 0.00364 |
264
+ | mse_q3 | 0.000666 |
265
+ | param_norm | 185 |
266
+ | samples | 1.76e+05 |
267
+ | step | 1.1e+04 |
268
+ | vb | 0.00371 |
269
+ | vb_q0 | 0.0145 |
270
+ | vb_q1 | 0.000131 |
271
+ | vb_q2 | 3.25e-05 |
272
+ | vb_q3 | 8.42e-06 |
273
+ -------------------------
274
+ -------------------------
275
+ | grad_norm | 0.0761 |
276
+ | loss | 0.0362 |
277
+ | loss_q0 | 0.119 |
278
+ | loss_q1 | 0.0177 |
279
+ | loss_q2 | 0.00357 |
280
+ | loss_q3 | 0.000631 |
281
+ | mse | 0.0321 |
282
+ | mse_q0 | 0.103 |
283
+ | mse_q1 | 0.0175 |
284
+ | mse_q2 | 0.00354 |
285
+ | mse_q3 | 0.000623 |
286
+ | param_norm | 185 |
287
+ | samples | 1.92e+05 |
288
+ | step | 1.2e+04 |
289
+ | vb | 0.00416 |
290
+ | vb_q0 | 0.016 |
291
+ | vb_q1 | 0.00013 |
292
+ | vb_q2 | 3.16e-05 |
293
+ | vb_q3 | 7.87e-06 |
294
+ -------------------------
295
+ -------------------------
296
+ | grad_norm | 0.0758 |
297
+ | loss | 0.0354 |
298
+ | loss_q0 | 0.12 |
299
+ | loss_q1 | 0.018 |
300
+ | loss_q2 | 0.0036 |
301
+ | loss_q3 | 0.00061 |
302
+ | mse | 0.0314 |
303
+ | mse_q0 | 0.104 |
304
+ | mse_q1 | 0.0178 |
305
+ | mse_q2 | 0.00356 |
306
+ | mse_q3 | 0.000603 |
307
+ | param_norm | 185 |
308
+ | samples | 2.08e+05 |
309
+ | step | 1.3e+04 |
310
+ | vb | 0.004 |
311
+ | vb_q0 | 0.0159 |
312
+ | vb_q1 | 0.000132 |
313
+ | vb_q2 | 3.18e-05 |
314
+ | vb_q3 | 7.59e-06 |
315
+ -------------------------
316
+ -------------------------
317
+ | grad_norm | 0.0745 |
318
+ | loss | 0.0341 |
319
+ | loss_q0 | 0.114 |
320
+ | loss_q1 | 0.0178 |
321
+ | loss_q2 | 0.00351 |
322
+ | loss_q3 | 0.000586 |
323
+ | mse | 0.031 |
324
+ | mse_q0 | 0.102 |
325
+ | mse_q1 | 0.0177 |
326
+ | mse_q2 | 0.00348 |
327
+ | mse_q3 | 0.000579 |
328
+ | param_norm | 186 |
329
+ | samples | 2.24e+05 |
330
+ | step | 1.4e+04 |
331
+ | vb | 0.00309 |
332
+ | vb_q0 | 0.0122 |
333
+ | vb_q1 | 0.000131 |
334
+ | vb_q2 | 3.11e-05 |
335
+ | vb_q3 | 7.29e-06 |
336
+ -------------------------
337
+ -------------------------
338
+ | grad_norm | 0.0728 |
339
+ | loss | 0.034 |
340
+ | loss_q0 | 0.116 |
341
+ | loss_q1 | 0.0177 |
342
+ | loss_q2 | 0.00353 |
343
+ | loss_q3 | 0.000564 |
344
+ | mse | 0.0308 |
345
+ | mse_q0 | 0.103 |
346
+ | mse_q1 | 0.0176 |
347
+ | mse_q2 | 0.0035 |
348
+ | mse_q3 | 0.000557 |
349
+ | param_norm | 186 |
350
+ | samples | 2.4e+05 |
351
+ | step | 1.5e+04 |
352
+ | vb | 0.00324 |
353
+ | vb_q0 | 0.013 |
354
+ | vb_q1 | 0.00013 |
355
+ | vb_q2 | 3.12e-05 |
356
+ | vb_q3 | 6.99e-06 |
357
+ -------------------------
358
+ -------------------------
359
+ | grad_norm | 0.0736 |
360
+ | loss | 0.036 |
361
+ | loss_q0 | 0.121 |
362
+ | loss_q1 | 0.0177 |
363
+ | loss_q2 | 0.00358 |
364
+ | loss_q3 | 0.00056 |
365
+ | mse | 0.0315 |
366
+ | mse_q0 | 0.104 |
367
+ | mse_q1 | 0.0175 |
368
+ | mse_q2 | 0.00354 |
369
+ | mse_q3 | 0.000553 |
370
+ | param_norm | 187 |
371
+ | samples | 2.56e+05 |
372
+ | step | 1.6e+04 |
373
+ | vb | 0.00452 |
374
+ | vb_q0 | 0.0177 |
375
+ | vb_q1 | 0.00013 |
376
+ | vb_q2 | 3.15e-05 |
377
+ | vb_q3 | 6.93e-06 |
378
+ -------------------------
379
+ -------------------------
380
+ | grad_norm | 0.07 |
381
+ | loss | 0.0347 |
382
+ | loss_q0 | 0.116 |
383
+ | loss_q1 | 0.0177 |
384
+ | loss_q2 | 0.00352 |
385
+ | loss_q3 | 0.000523 |
386
+ | mse | 0.0309 |
387
+ | mse_q0 | 0.101 |
388
+ | mse_q1 | 0.0175 |
389
+ | mse_q2 | 0.00349 |
390
+ | mse_q3 | 0.000516 |
391
+ | param_norm | 187 |
392
+ | samples | 2.72e+05 |
393
+ | step | 1.7e+04 |
394
+ | vb | 0.00377 |
395
+ | vb_q0 | 0.0147 |
396
+ | vb_q1 | 0.00013 |
397
+ | vb_q2 | 3.1e-05 |
398
+ | vb_q3 | 6.47e-06 |
399
+ -------------------------
400
+ -------------------------
401
+ | grad_norm | 0.0702 |
402
+ | loss | 0.0339 |
403
+ | loss_q0 | 0.115 |
404
+ | loss_q1 | 0.0174 |
405
+ | loss_q2 | 0.00347 |
406
+ | loss_q3 | 0.000516 |
407
+ | mse | 0.0303 |
408
+ | mse_q0 | 0.101 |
409
+ | mse_q1 | 0.0173 |
410
+ | mse_q2 | 0.00344 |
411
+ | mse_q3 | 0.000509 |
412
+ | param_norm | 188 |
413
+ | samples | 2.88e+05 |
414
+ | step | 1.8e+04 |
415
+ | vb | 0.00366 |
416
+ | vb_q0 | 0.0146 |
417
+ | vb_q1 | 0.000128 |
418
+ | vb_q2 | 3.06e-05 |
419
+ | vb_q3 | 6.4e-06 |
420
+ -------------------------
421
+ -------------------------
422
+ | grad_norm | 0.0676 |
423
+ | loss | 0.0331 |
424
+ | loss_q0 | 0.112 |
425
+ | loss_q1 | 0.0174 |
426
+ | loss_q2 | 0.00344 |
427
+ | loss_q3 | 0.000507 |
428
+ | mse | 0.0304 |
429
+ | mse_q0 | 0.101 |
430
+ | mse_q1 | 0.0173 |
431
+ | mse_q2 | 0.0034 |
432
+ | mse_q3 | 0.000501 |
433
+ | param_norm | 188 |
434
+ | samples | 3.04e+05 |
435
+ | step | 1.9e+04 |
436
+ | vb | 0.00274 |
437
+ | vb_q0 | 0.0109 |
438
+ | vb_q1 | 0.000128 |
439
+ | vb_q2 | 3.04e-05 |
440
+ | vb_q3 | 6.26e-06 |
441
+ -------------------------
442
+ -------------------------
443
+ | grad_norm | 0.0685 |
444
+ | loss | 0.0337 |
445
+ | loss_q0 | 0.114 |
446
+ | loss_q1 | 0.0175 |
447
+ | loss_q2 | 0.00345 |
448
+ | loss_q3 | 0.000495 |
449
+ | mse | 0.03 |
450
+ | mse_q0 | 0.0991 |
451
+ | mse_q1 | 0.0174 |
452
+ | mse_q2 | 0.00342 |
453
+ | mse_q3 | 0.000489 |
454
+ | param_norm | 189 |
455
+ | samples | 3.2e+05 |
456
+ | step | 2e+04 |
457
+ | vb | 0.00368 |
458
+ | vb_q0 | 0.0146 |
459
+ | vb_q1 | 0.000128 |
460
+ | vb_q2 | 3.05e-05 |
461
+ | vb_q3 | 6.13e-06 |
462
+ -------------------------
463
+ saving model 0...
464
+ saving model 0.995...
465
+ evaluation indistro starting...
466
+ done 96 samples: bpd=3.86189341545105
467
+ done 192 samples: bpd=3.769935965538025
468
+ done 288 samples: bpd=3.756619850794474
469
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_indistro_terms.npz
470
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_indistro_terms.npz
471
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_indistro_terms.npz
472
+ evaluation nll complete
473
+ evaluation outdistro starting...
474
+ done 192 samples: bpd=3.8321585655212402
475
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_outdistro_terms.npz
476
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_outdistro_terms.npz
477
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_outdistro_terms.npz
478
+ evaluation nll complete
479
+ sampling starting...
480
+ -------------------------
481
+ | grad_norm | 0.0657 |
482
+ | loss | 0.0348 |
483
+ | loss_q0 | 0.118 |
484
+ | loss_q1 | 0.0175 |
485
+ | loss_q2 | 0.00344 |
486
+ | loss_q3 | 0.000478 |
487
+ | mse | 0.0307 |
488
+ | mse_q0 | 0.101 |
489
+ | mse_q1 | 0.0174 |
490
+ | mse_q2 | 0.00341 |
491
+ | mse_q3 | 0.000472 |
492
+ | param_norm | 189 |
493
+ | samples | 3.36e+05 |
494
+ | step | 2.1e+04 |
495
+ | vb | 0.00408 |
496
+ | vb_q0 | 0.0161 |
497
+ | vb_q1 | 0.000128 |
498
+ | vb_q2 | 3.03e-05 |
499
+ | vb_q3 | 5.9e-06 |
500
+ -------------------------
501
+ -------------------------
502
+ | grad_norm | 0.065 |
503
+ | loss | 0.0331 |
504
+ | loss_q0 | 0.114 |
505
+ | loss_q1 | 0.0175 |
506
+ | loss_q2 | 0.0034 |
507
+ | loss_q3 | 0.000467 |
508
+ | mse | 0.0295 |
509
+ | mse_q0 | 0.0992 |
510
+ | mse_q1 | 0.0174 |
511
+ | mse_q2 | 0.00337 |
512
+ | mse_q3 | 0.000462 |
513
+ | param_norm | 190 |
514
+ | samples | 3.52e+05 |
515
+ | step | 2.2e+04 |
516
+ | vb | 0.00366 |
517
+ | vb_q0 | 0.0149 |
518
+ | vb_q1 | 0.000129 |
519
+ | vb_q2 | 3.01e-05 |
520
+ | vb_q3 | 5.77e-06 |
521
+ -------------------------
522
+ -------------------------
523
+ | grad_norm | 0.0658 |
524
+ | loss | 0.0332 |
525
+ | loss_q0 | 0.111 |
526
+ | loss_q1 | 0.0173 |
527
+ | loss_q2 | 0.00337 |
528
+ | loss_q3 | 0.00046 |
529
+ | mse | 0.0298 |
530
+ | mse_q0 | 0.0979 |
531
+ | mse_q1 | 0.0171 |
532
+ | mse_q2 | 0.00334 |
533
+ | mse_q3 | 0.000454 |
534
+ | param_norm | 190 |
535
+ | samples | 3.68e+05 |
536
+ | step | 2.3e+04 |
537
+ | vb | 0.00346 |
538
+ | vb_q0 | 0.0136 |
539
+ | vb_q1 | 0.000127 |
540
+ | vb_q2 | 2.98e-05 |
541
+ | vb_q3 | 5.69e-06 |
542
+ -------------------------
543
+ -------------------------
544
+ | grad_norm | 0.0645 |
545
+ | loss | 0.0335 |
546
+ | loss_q0 | 0.116 |
547
+ | loss_q1 | 0.0171 |
548
+ | loss_q2 | 0.00335 |
549
+ | loss_q3 | 0.000448 |
550
+ | mse | 0.0293 |
551
+ | mse_q0 | 0.0987 |
552
+ | mse_q1 | 0.017 |
553
+ | mse_q2 | 0.00332 |
554
+ | mse_q3 | 0.000443 |
555
+ | param_norm | 191 |
556
+ | samples | 3.84e+05 |
557
+ | step | 2.4e+04 |
558
+ | vb | 0.00421 |
559
+ | vb_q0 | 0.0171 |
560
+ | vb_q1 | 0.000126 |
561
+ | vb_q2 | 2.96e-05 |
562
+ | vb_q3 | 5.52e-06 |
563
+ -------------------------
564
+ -------------------------
565
+ | grad_norm | 0.0657 |
566
+ | loss | 0.0336 |
567
+ | loss_q0 | 0.111 |
568
+ | loss_q1 | 0.0171 |
569
+ | loss_q2 | 0.00337 |
570
+ | loss_q3 | 0.000451 |
571
+ | mse | 0.0301 |
572
+ | mse_q0 | 0.098 |
573
+ | mse_q1 | 0.017 |
574
+ | mse_q2 | 0.00334 |
575
+ | mse_q3 | 0.000445 |
576
+ | param_norm | 191 |
577
+ | samples | 4e+05 |
578
+ | step | 2.5e+04 |
579
+ | vb | 0.00348 |
580
+ | vb_q0 | 0.0135 |
581
+ | vb_q1 | 0.000125 |
582
+ | vb_q2 | 2.98e-05 |
583
+ | vb_q3 | 5.57e-06 |
584
+ -------------------------
585
+ -------------------------
586
+ | grad_norm | 0.0639 |
587
+ | loss | 0.0331 |
588
+ | loss_q0 | 0.111 |
589
+ | loss_q1 | 0.0173 |
590
+ | loss_q2 | 0.00337 |
591
+ | loss_q3 | 0.000437 |
592
+ | mse | 0.03 |
593
+ | mse_q0 | 0.0991 |
594
+ | mse_q1 | 0.0172 |
595
+ | mse_q2 | 0.00334 |
596
+ | mse_q3 | 0.000432 |
597
+ | param_norm | 192 |
598
+ | samples | 4.16e+05 |
599
+ | step | 2.6e+04 |
600
+ | vb | 0.00305 |
601
+ | vb_q0 | 0.012 |
602
+ | vb_q1 | 0.000127 |
603
+ | vb_q2 | 2.97e-05 |
604
+ | vb_q3 | 5.39e-06 |
605
+ -------------------------
606
+ -------------------------
607
+ | grad_norm | 0.062 |
608
+ | loss | 0.0319 |
609
+ | loss_q0 | 0.109 |
610
+ | loss_q1 | 0.0174 |
611
+ | loss_q2 | 0.00339 |
612
+ | loss_q3 | 0.000424 |
613
+ | mse | 0.0294 |
614
+ | mse_q0 | 0.0989 |
615
+ | mse_q1 | 0.0172 |
616
+ | mse_q2 | 0.00336 |
617
+ | mse_q3 | 0.000419 |
618
+ | param_norm | 192 |
619
+ | samples | 4.32e+05 |
620
+ | step | 2.7e+04 |
621
+ | vb | 0.00251 |
622
+ | vb_q0 | 0.0101 |
623
+ | vb_q1 | 0.000127 |
624
+ | vb_q2 | 2.99e-05 |
625
+ | vb_q3 | 5.22e-06 |
626
+ -------------------------
627
+ -------------------------
628
+ | grad_norm | 0.0651 |
629
+ | loss | 0.0327 |
630
+ | loss_q0 | 0.109 |
631
+ | loss_q1 | 0.0171 |
632
+ | loss_q2 | 0.00341 |
633
+ | loss_q3 | 0.000435 |
634
+ | mse | 0.0294 |
635
+ | mse_q0 | 0.0958 |
636
+ | mse_q1 | 0.017 |
637
+ | mse_q2 | 0.00338 |
638
+ | mse_q3 | 0.00043 |
639
+ | param_norm | 193 |
640
+ | samples | 4.48e+05 |
641
+ | step | 2.8e+04 |
642
+ | vb | 0.00326 |
643
+ | vb_q0 | 0.0127 |
644
+ | vb_q1 | 0.000126 |
645
+ | vb_q2 | 3.01e-05 |
646
+ | vb_q3 | 5.34e-06 |
647
+ -------------------------
648
+ -------------------------
649
+ | grad_norm | 0.0617 |
650
+ | loss | 0.0335 |
651
+ | loss_q0 | 0.114 |
652
+ | loss_q1 | 0.0172 |
653
+ | loss_q2 | 0.00339 |
654
+ | loss_q3 | 0.000421 |
655
+ | mse | 0.03 |
656
+ | mse_q0 | 0.1 |
657
+ | mse_q1 | 0.0171 |
658
+ | mse_q2 | 0.00336 |
659
+ | mse_q3 | 0.000416 |
660
+ | param_norm | 193 |
661
+ | samples | 4.64e+05 |
662
+ | step | 2.9e+04 |
663
+ | vb | 0.00346 |
664
+ | vb_q0 | 0.0139 |
665
+ | vb_q1 | 0.000126 |
666
+ | vb_q2 | 2.99e-05 |
667
+ | vb_q3 | 5.18e-06 |
668
+ -------------------------
669
+ -------------------------
670
+ | grad_norm | 0.0625 |
671
+ | loss | 0.0341 |
672
+ | loss_q0 | 0.117 |
673
+ | loss_q1 | 0.0173 |
674
+ | loss_q2 | 0.00336 |
675
+ | loss_q3 | 0.000427 |
676
+ | mse | 0.0297 |
677
+ | mse_q0 | 0.0996 |
678
+ | mse_q1 | 0.0172 |
679
+ | mse_q2 | 0.00333 |
680
+ | mse_q3 | 0.000422 |
681
+ | param_norm | 194 |
682
+ | samples | 4.8e+05 |
683
+ | step | 3e+04 |
684
+ | vb | 0.00441 |
685
+ | vb_q0 | 0.0178 |
686
+ | vb_q1 | 0.000127 |
687
+ | vb_q2 | 2.96e-05 |
688
+ | vb_q3 | 5.26e-06 |
689
+ -------------------------
690
+ saving model 0...
691
+ saving model 0.995...
692
+ evaluation indistro starting...
693
+ done 96 samples: bpd=3.642620086669922
694
+ done 192 samples: bpd=3.8054873943328857
695
+ done 288 samples: bpd=3.7644495169321694
696
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_indistro_terms.npz
697
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_indistro_terms.npz
698
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_indistro_terms.npz
699
+ evaluation nll complete
700
+ evaluation outdistro starting...
701
+ done 192 samples: bpd=3.8840670585632324
702
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_outdistro_terms.npz
703
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_outdistro_terms.npz
704
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_outdistro_terms.npz
705
+ evaluation nll complete
706
+ sampling starting...
707
+ -------------------------
708
+ | grad_norm | 0.0625 |
709
+ | loss | 0.0347 |
710
+ | loss_q0 | 0.117 |
711
+ | loss_q1 | 0.0174 |
712
+ | loss_q2 | 0.00327 |
713
+ | loss_q3 | 0.000413 |
714
+ | mse | 0.0306 |
715
+ | mse_q0 | 0.101 |
716
+ | mse_q1 | 0.0172 |
717
+ | mse_q2 | 0.00324 |
718
+ | mse_q3 | 0.000408 |
719
+ | param_norm | 194 |
720
+ | samples | 4.96e+05 |
721
+ | step | 3.1e+04 |
722
+ | vb | 0.00405 |
723
+ | vb_q0 | 0.0159 |
724
+ | vb_q1 | 0.000127 |
725
+ | vb_q2 | 2.89e-05 |
726
+ | vb_q3 | 5.09e-06 |
727
+ -------------------------
728
+ -------------------------
729
+ | grad_norm | 0.0595 |
730
+ | loss | 0.0319 |
731
+ | loss_q0 | 0.107 |
732
+ | loss_q1 | 0.0169 |
733
+ | loss_q2 | 0.00331 |
734
+ | loss_q3 | 0.000398 |
735
+ | mse | 0.0293 |
736
+ | mse_q0 | 0.0967 |
737
+ | mse_q1 | 0.0168 |
738
+ | mse_q2 | 0.00328 |
739
+ | mse_q3 | 0.000393 |
740
+ | param_norm | 195 |
741
+ | samples | 5.12e+05 |
742
+ | step | 3.2e+04 |
743
+ | vb | 0.00266 |
744
+ | vb_q0 | 0.0105 |
745
+ | vb_q1 | 0.000124 |
746
+ | vb_q2 | 2.92e-05 |
747
+ | vb_q3 | 4.88e-06 |
748
+ -------------------------
749
+ -------------------------
750
+ | grad_norm | 0.0619 |
751
+ | loss | 0.033 |
752
+ | loss_q0 | 0.113 |
753
+ | loss_q1 | 0.0172 |
754
+ | loss_q2 | 0.00329 |
755
+ | loss_q3 | 0.0004 |
756
+ | mse | 0.0296 |
757
+ | mse_q0 | 0.0996 |
758
+ | mse_q1 | 0.0171 |
759
+ | mse_q2 | 0.00326 |
760
+ | mse_q3 | 0.000395 |
761
+ | param_norm | 195 |
762
+ | samples | 5.28e+05 |
763
+ | step | 3.3e+04 |
764
+ | vb | 0.00338 |
765
+ | vb_q0 | 0.0137 |
766
+ | vb_q1 | 0.000126 |
767
+ | vb_q2 | 2.9e-05 |
768
+ | vb_q3 | 4.93e-06 |
769
+ -------------------------
770
+ -------------------------
771
+ | grad_norm | 0.0606 |
772
+ | loss | 0.0351 |
773
+ | loss_q0 | 0.119 |
774
+ | loss_q1 | 0.017 |
775
+ | loss_q2 | 0.00336 |
776
+ | loss_q3 | 0.000399 |
777
+ | mse | 0.0304 |
778
+ | mse_q0 | 0.1 |
779
+ | mse_q1 | 0.0169 |
780
+ | mse_q2 | 0.00333 |
781
+ | mse_q3 | 0.000394 |
782
+ | param_norm | 196 |
783
+ | samples | 5.44e+05 |
784
+ | step | 3.4e+04 |
785
+ | vb | 0.00465 |
786
+ | vb_q0 | 0.0183 |
787
+ | vb_q1 | 0.000125 |
788
+ | vb_q2 | 2.96e-05 |
789
+ | vb_q3 | 4.89e-06 |
790
+ -------------------------
791
+ -------------------------
792
+ | grad_norm | 0.0636 |
793
+ | loss | 0.0342 |
794
+ | loss_q0 | 0.114 |
795
+ | loss_q1 | 0.017 |
796
+ | loss_q2 | 0.00332 |
797
+ | loss_q3 | 0.000391 |
798
+ | mse | 0.0303 |
799
+ | mse_q0 | 0.0985 |
800
+ | mse_q1 | 0.0169 |
801
+ | mse_q2 | 0.00329 |
802
+ | mse_q3 | 0.000386 |
803
+ | param_norm | 196 |
804
+ | samples | 5.6e+05 |
805
+ | step | 3.5e+04 |
806
+ | vb | 0.00394 |
807
+ | vb_q0 | 0.0153 |
808
+ | vb_q1 | 0.000125 |
809
+ | vb_q2 | 2.92e-05 |
810
+ | vb_q3 | 4.82e-06 |
811
+ -------------------------
812
+ -------------------------
813
+ | grad_norm | 0.0611 |
814
+ | loss | 0.034 |
815
+ | loss_q0 | 0.114 |
816
+ | loss_q1 | 0.017 |
817
+ | loss_q2 | 0.00334 |
818
+ | loss_q3 | 0.000391 |
819
+ | mse | 0.03 |
820
+ | mse_q0 | 0.0984 |
821
+ | mse_q1 | 0.0169 |
822
+ | mse_q2 | 0.00331 |
823
+ | mse_q3 | 0.000387 |
824
+ | param_norm | 197 |
825
+ | samples | 5.76e+05 |
826
+ | step | 3.6e+04 |
827
+ | vb | 0.00397 |
828
+ | vb_q0 | 0.0155 |
829
+ | vb_q1 | 0.000125 |
830
+ | vb_q2 | 2.95e-05 |
831
+ | vb_q3 | 4.81e-06 |
832
+ -------------------------
833
+ -------------------------
834
+ | grad_norm | 0.0599 |
835
+ | loss | 0.0318 |
836
+ | loss_q0 | 0.11 |
837
+ | loss_q1 | 0.017 |
838
+ | loss_q2 | 0.00335 |
839
+ | loss_q3 | 0.000387 |
840
+ | mse | 0.0285 |
841
+ | mse_q0 | 0.0965 |
842
+ | mse_q1 | 0.0169 |
843
+ | mse_q2 | 0.00332 |
844
+ | mse_q3 | 0.000383 |
845
+ | param_norm | 197 |
846
+ | samples | 5.92e+05 |
847
+ | step | 3.7e+04 |
848
+ | vb | 0.00331 |
849
+ | vb_q0 | 0.0136 |
850
+ | vb_q1 | 0.000125 |
851
+ | vb_q2 | 2.95e-05 |
852
+ | vb_q3 | 4.76e-06 |
853
+ -------------------------
854
+ -------------------------
855
+ | grad_norm | 0.0596 |
856
+ | loss | 0.0342 |
857
+ | loss_q0 | 0.116 |
858
+ | loss_q1 | 0.017 |
859
+ | loss_q2 | 0.00336 |
860
+ | loss_q3 | 0.000383 |
861
+ | mse | 0.03 |
862
+ | mse_q0 | 0.0993 |
863
+ | mse_q1 | 0.0168 |
864
+ | mse_q2 | 0.00333 |
865
+ | mse_q3 | 0.000379 |
866
+ | param_norm | 198 |
867
+ | samples | 6.08e+05 |
868
+ | step | 3.8e+04 |
869
+ | vb | 0.00417 |
870
+ | vb_q0 | 0.0165 |
871
+ | vb_q1 | 0.000124 |
872
+ | vb_q2 | 2.95e-05 |
873
+ | vb_q3 | 4.7e-06 |
874
+ -------------------------
875
+ -------------------------
876
+ | grad_norm | 0.062 |
877
+ | loss | 0.0346 |
878
+ | loss_q0 | 0.117 |
879
+ | loss_q1 | 0.0169 |
880
+ | loss_q2 | 0.00327 |
881
+ | loss_q3 | 0.000388 |
882
+ | mse | 0.0298 |
883
+ | mse_q0 | 0.0984 |
884
+ | mse_q1 | 0.0168 |
885
+ | mse_q2 | 0.00325 |
886
+ | mse_q3 | 0.000384 |
887
+ | param_norm | 198 |
888
+ | samples | 6.24e+05 |
889
+ | step | 3.9e+04 |
890
+ | vb | 0.00484 |
891
+ | vb_q0 | 0.0191 |
892
+ | vb_q1 | 0.000124 |
893
+ | vb_q2 | 2.89e-05 |
894
+ | vb_q3 | 4.77e-06 |
895
+ -------------------------
896
+ -------------------------
897
+ | grad_norm | 0.0562 |
898
+ | loss | 0.0336 |
899
+ | loss_q0 | 0.113 |
900
+ | loss_q1 | 0.0167 |
901
+ | loss_q2 | 0.00331 |
902
+ | loss_q3 | 0.000371 |
903
+ | mse | 0.0296 |
904
+ | mse_q0 | 0.0974 |
905
+ | mse_q1 | 0.0166 |
906
+ | mse_q2 | 0.00328 |
907
+ | mse_q3 | 0.000367 |
908
+ | param_norm | 199 |
909
+ | samples | 6.4e+05 |
910
+ | step | 4e+04 |
911
+ | vb | 0.00396 |
912
+ | vb_q0 | 0.0155 |
913
+ | vb_q1 | 0.000123 |
914
+ | vb_q2 | 2.92e-05 |
915
+ | vb_q3 | 4.55e-06 |
916
+ -------------------------
917
+ saving model 0...
918
+ saving model 0.995...
919
+ evaluation indistro starting...
920
+ done 96 samples: bpd=3.5080957412719727
921
+ done 192 samples: bpd=3.5733258724212646
922
+ done 288 samples: bpd=3.587653636932373
923
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_indistro_terms.npz
924
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_indistro_terms.npz
925
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_indistro_terms.npz
926
+ evaluation nll complete
927
+ evaluation outdistro starting...
928
+ done 192 samples: bpd=3.791849136352539
929
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_outdistro_terms.npz
930
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_outdistro_terms.npz
931
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_outdistro_terms.npz
932
+ evaluation nll complete
933
+ sampling starting...
934
+ -------------------------
935
+ | grad_norm | 0.0596 |
936
+ | loss | 0.0344 |
937
+ | loss_q0 | 0.115 |
938
+ | loss_q1 | 0.0168 |
939
+ | loss_q2 | 0.00325 |
940
+ | loss_q3 | 0.000377 |
941
+ | mse | 0.0306 |
942
+ | mse_q0 | 0.1 |
943
+ | mse_q1 | 0.0167 |
944
+ | mse_q2 | 0.00322 |
945
+ | mse_q3 | 0.000372 |
946
+ | param_norm | 199 |
947
+ | samples | 6.56e+05 |
948
+ | step | 4.1e+04 |
949
+ | vb | 0.00381 |
950
+ | vb_q0 | 0.0148 |
951
+ | vb_q1 | 0.000123 |
952
+ | vb_q2 | 2.87e-05 |
953
+ | vb_q3 | 4.62e-06 |
954
+ -------------------------
955
+ -------------------------
956
+ | grad_norm | 0.0589 |
957
+ | loss | 0.0328 |
958
+ | loss_q0 | 0.113 |
959
+ | loss_q1 | 0.017 |
960
+ | loss_q2 | 0.00331 |
961
+ | loss_q3 | 0.00037 |
962
+ | mse | 0.0286 |
963
+ | mse_q0 | 0.0962 |
964
+ | mse_q1 | 0.0168 |
965
+ | mse_q2 | 0.00328 |
966
+ | mse_q3 | 0.000365 |
967
+ | param_norm | 200 |
968
+ | samples | 6.72e+05 |
969
+ | step | 4.2e+04 |
970
+ | vb | 0.00413 |
971
+ | vb_q0 | 0.0168 |
972
+ | vb_q1 | 0.000124 |
973
+ | vb_q2 | 2.92e-05 |
974
+ | vb_q3 | 4.52e-06 |
975
+ -------------------------
976
+ -------------------------
977
+ | grad_norm | 0.0587 |
978
+ | loss | 0.0329 |
979
+ | loss_q0 | 0.111 |
980
+ | loss_q1 | 0.017 |
981
+ | loss_q2 | 0.00332 |
982
+ | loss_q3 | 0.000369 |
983
+ | mse | 0.0295 |
984
+ | mse_q0 | 0.0973 |
985
+ | mse_q1 | 0.0168 |
986
+ | mse_q2 | 0.00329 |
987
+ | mse_q3 | 0.000364 |
988
+ | param_norm | 200 |
989
+ | samples | 6.88e+05 |
990
+ | step | 4.3e+04 |
991
+ | vb | 0.00348 |
992
+ | vb_q0 | 0.0137 |
993
+ | vb_q1 | 0.000125 |
994
+ | vb_q2 | 2.92e-05 |
995
+ | vb_q3 | 4.51e-06 |
996
+ -------------------------
997
+ -------------------------
998
+ | grad_norm | 0.0571 |
999
+ | loss | 0.0338 |
1000
+ | loss_q0 | 0.117 |
1001
+ | loss_q1 | 0.0168 |
1002
+ | loss_q2 | 0.00322 |
1003
+ | loss_q3 | 0.000364 |
1004
+ | mse | 0.0294 |
1005
+ | mse_q0 | 0.0992 |
1006
+ | mse_q1 | 0.0167 |
1007
+ | mse_q2 | 0.00319 |
1008
+ | mse_q3 | 0.000359 |
1009
+ | param_norm | 201 |
1010
+ | samples | 7.04e+05 |
1011
+ | step | 4.4e+04 |
1012
+ | vb | 0.00437 |
1013
+ | vb_q0 | 0.0177 |
1014
+ | vb_q1 | 0.000123 |
1015
+ | vb_q2 | 2.84e-05 |
1016
+ | vb_q3 | 4.45e-06 |
1017
+ -------------------------
1018
+ -------------------------
1019
+ | grad_norm | 0.0587 |
1020
+ | loss | 0.034 |
1021
+ | loss_q0 | 0.114 |
1022
+ | loss_q1 | 0.0171 |
1023
+ | loss_q2 | 0.00331 |
1024
+ | loss_q3 | 0.00037 |
1025
+ | mse | 0.0301 |
1026
+ | mse_q0 | 0.0988 |
1027
+ | mse_q1 | 0.017 |
1028
+ | mse_q2 | 0.00328 |
1029
+ | mse_q3 | 0.000365 |
1030
+ | param_norm | 201 |
1031
+ | samples | 7.2e+05 |
1032
+ | step | 4.5e+04 |
1033
+ | vb | 0.00387 |
1034
+ | vb_q0 | 0.0152 |
1035
+ | vb_q1 | 0.000126 |
1036
+ | vb_q2 | 2.91e-05 |
1037
+ | vb_q3 | 4.52e-06 |
1038
+ -------------------------
1039
+ -------------------------
1040
+ | grad_norm | 0.061 |
1041
+ | loss | 0.0329 |
1042
+ | loss_q0 | 0.11 |
1043
+ | loss_q1 | 0.0169 |
1044
+ | loss_q2 | 0.00329 |
1045
+ | loss_q3 | 0.000368 |
1046
+ | mse | 0.0299 |
1047
+ | mse_q0 | 0.0983 |
1048
+ | mse_q1 | 0.0167 |
1049
+ | mse_q2 | 0.00326 |
1050
+ | mse_q3 | 0.000364 |
1051
+ | param_norm | 202 |
1052
+ | samples | 7.36e+05 |
1053
+ | step | 4.6e+04 |
1054
+ | vb | 0.0031 |
1055
+ | vb_q0 | 0.0121 |
1056
+ | vb_q1 | 0.000124 |
1057
+ | vb_q2 | 2.89e-05 |
1058
+ | vb_q3 | 4.5e-06 |
1059
+ -------------------------
1060
+ -------------------------
1061
+ | grad_norm | 0.0566 |
1062
+ | loss | 0.0328 |
1063
+ | loss_q0 | 0.111 |
1064
+ | loss_q1 | 0.0171 |
1065
+ | loss_q2 | 0.00327 |
1066
+ | loss_q3 | 0.000357 |
1067
+ | mse | 0.0294 |
1068
+ | mse_q0 | 0.0976 |
1069
+ | mse_q1 | 0.017 |
1070
+ | mse_q2 | 0.00324 |
1071
+ | mse_q3 | 0.000353 |
1072
+ | param_norm | 202 |
1073
+ | samples | 7.52e+05 |
1074
+ | step | 4.7e+04 |
1075
+ | vb | 0.00339 |
1076
+ | vb_q0 | 0.0135 |
1077
+ | vb_q1 | 0.000126 |
1078
+ | vb_q2 | 2.88e-05 |
1079
+ | vb_q3 | 4.39e-06 |
1080
+ -------------------------
1081
+ -------------------------
1082
+ | grad_norm | 0.0606 |
1083
+ | loss | 0.0344 |
1084
+ | loss_q0 | 0.114 |
1085
+ | loss_q1 | 0.0168 |
1086
+ | loss_q2 | 0.00333 |
1087
+ | loss_q3 | 0.000357 |
1088
+ | mse | 0.0305 |
1089
+ | mse_q0 | 0.0991 |
1090
+ | mse_q1 | 0.0167 |
1091
+ | mse_q2 | 0.0033 |
1092
+ | mse_q3 | 0.000352 |
1093
+ | param_norm | 203 |
1094
+ | samples | 7.68e+05 |
1095
+ | step | 4.8e+04 |
1096
+ | vb | 0.00387 |
1097
+ | vb_q0 | 0.0149 |
1098
+ | vb_q1 | 0.000123 |
1099
+ | vb_q2 | 2.93e-05 |
1100
+ | vb_q3 | 4.37e-06 |
1101
+ -------------------------
1102
+ -------------------------
1103
+ | grad_norm | 0.0559 |
1104
+ | loss | 0.0327 |
1105
+ | loss_q0 | 0.108 |
1106
+ | loss_q1 | 0.0166 |
1107
+ | loss_q2 | 0.00329 |
1108
+ | loss_q3 | 0.000351 |
1109
+ | mse | 0.0292 |
1110
+ | mse_q0 | 0.0947 |
1111
+ | mse_q1 | 0.0165 |
1112
+ | mse_q2 | 0.00326 |
1113
+ | mse_q3 | 0.000347 |
1114
+ | param_norm | 203 |
1115
+ | samples | 7.84e+05 |
1116
+ | step | 4.9e+04 |
1117
+ | vb | 0.00349 |
1118
+ | vb_q0 | 0.0135 |
1119
+ | vb_q1 | 0.000122 |
1120
+ | vb_q2 | 2.9e-05 |
1121
+ | vb_q3 | 4.29e-06 |
1122
+ -------------------------
1123
+ -------------------------
1124
+ | grad_norm | 0.0589 |
1125
+ | loss | 0.0338 |
1126
+ | loss_q0 | 0.116 |
1127
+ | loss_q1 | 0.0169 |
1128
+ | loss_q2 | 0.00327 |
1129
+ | loss_q3 | 0.00035 |
1130
+ | mse | 0.029 |
1131
+ | mse_q0 | 0.0968 |
1132
+ | mse_q1 | 0.0168 |
1133
+ | mse_q2 | 0.00325 |
1134
+ | mse_q3 | 0.000346 |
1135
+ | param_norm | 204 |
1136
+ | samples | 8e+05 |
1137
+ | step | 5e+04 |
1138
+ | vb | 0.00479 |
1139
+ | vb_q0 | 0.0193 |
1140
+ | vb_q1 | 0.000124 |
1141
+ | vb_q2 | 2.88e-05 |
1142
+ | vb_q3 | 4.29e-06 |
1143
+ -------------------------
1144
+ saving model 0...
1145
+ saving model 0.995...
1146
+ evaluation indistro starting...
1147
+ done 96 samples: bpd=3.513167142868042
1148
+ done 192 samples: bpd=3.5448752641677856
1149
+ done 288 samples: bpd=3.5497219562530518
1150
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_indistro_terms.npz
1151
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_indistro_terms.npz
1152
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_indistro_terms.npz
1153
+ evaluation nll complete
1154
+ evaluation outdistro starting...
1155
+ done 192 samples: bpd=3.7412848472595215
1156
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_outdistro_terms.npz
1157
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_outdistro_terms.npz
1158
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_outdistro_terms.npz
1159
+ evaluation nll complete
1160
+ sampling starting...
1161
+ -------------------------
1162
+ | grad_norm | 0.0547 |
1163
+ | loss | 0.0326 |
1164
+ | loss_q0 | 0.11 |
1165
+ | loss_q1 | 0.0167 |
1166
+ | loss_q2 | 0.00326 |
1167
+ | loss_q3 | 0.000349 |
1168
+ | mse | 0.0291 |
1169
+ | mse_q0 | 0.0965 |
1170
+ | mse_q1 | 0.0166 |
1171
+ | mse_q2 | 0.00323 |
1172
+ | mse_q3 | 0.000345 |
1173
+ | param_norm | 204 |
1174
+ | samples | 8.16e+05 |
1175
+ | step | 5.1e+04 |
1176
+ | vb | 0.00349 |
1177
+ | vb_q0 | 0.0138 |
1178
+ | vb_q1 | 0.000123 |
1179
+ | vb_q2 | 2.87e-05 |
1180
+ | vb_q3 | 4.27e-06 |
1181
+ -------------------------
1182
+ -------------------------
1183
+ | grad_norm | 0.0582 |
1184
+ | loss | 0.0324 |
1185
+ | loss_q0 | 0.109 |
1186
+ | loss_q1 | 0.0168 |
1187
+ | loss_q2 | 0.00319 |
1188
+ | loss_q3 | 0.000349 |
1189
+ | mse | 0.0292 |
1190
+ | mse_q0 | 0.0969 |
1191
+ | mse_q1 | 0.0166 |
1192
+ | mse_q2 | 0.00316 |
1193
+ | mse_q3 | 0.000345 |
1194
+ | param_norm | 205 |
1195
+ | samples | 8.32e+05 |
1196
+ | step | 5.2e+04 |
1197
+ | vb | 0.00317 |
1198
+ | vb_q0 | 0.0126 |
1199
+ | vb_q1 | 0.000123 |
1200
+ | vb_q2 | 2.82e-05 |
1201
+ | vb_q3 | 4.27e-06 |
1202
+ -------------------------
1203
+ -------------------------
1204
+ | grad_norm | 0.0565 |
1205
+ | loss | 0.0328 |
1206
+ | loss_q0 | 0.111 |
1207
+ | loss_q1 | 0.0168 |
1208
+ | loss_q2 | 0.00324 |
1209
+ | loss_q3 | 0.000347 |
1210
+ | mse | 0.0291 |
1211
+ | mse_q0 | 0.0964 |
1212
+ | mse_q1 | 0.0167 |
1213
+ | mse_q2 | 0.00321 |
1214
+ | mse_q3 | 0.000343 |
1215
+ | param_norm | 205 |
1216
+ | samples | 8.48e+05 |
1217
+ | step | 5.3e+04 |
1218
+ | vb | 0.00373 |
1219
+ | vb_q0 | 0.0148 |
1220
+ | vb_q1 | 0.000123 |
1221
+ | vb_q2 | 2.85e-05 |
1222
+ | vb_q3 | 4.23e-06 |
1223
+ -------------------------
1224
+ -------------------------
1225
+ | grad_norm | 0.0586 |
1226
+ | loss | 0.0338 |
1227
+ | loss_q0 | 0.117 |
1228
+ | loss_q1 | 0.0168 |
1229
+ | loss_q2 | 0.00323 |
1230
+ | loss_q3 | 0.000341 |
1231
+ | mse | 0.0297 |
1232
+ | mse_q0 | 0.1 |
1233
+ | mse_q1 | 0.0167 |
1234
+ | mse_q2 | 0.00321 |
1235
+ | mse_q3 | 0.000337 |
1236
+ | param_norm | 206 |
1237
+ | samples | 8.64e+05 |
1238
+ | step | 5.4e+04 |
1239
+ | vb | 0.00406 |
1240
+ | vb_q0 | 0.0164 |
1241
+ | vb_q1 | 0.000123 |
1242
+ | vb_q2 | 2.85e-05 |
1243
+ | vb_q3 | 4.17e-06 |
1244
+ -------------------------
1245
+ -------------------------
1246
+ | grad_norm | 0.0558 |
1247
+ | loss | 0.0336 |
1248
+ | loss_q0 | 0.115 |
1249
+ | loss_q1 | 0.0165 |
1250
+ | loss_q2 | 0.00326 |
1251
+ | loss_q3 | 0.00034 |
1252
+ | mse | 0.0293 |
1253
+ | mse_q0 | 0.098 |
1254
+ | mse_q1 | 0.0164 |
1255
+ | mse_q2 | 0.00323 |
1256
+ | mse_q3 | 0.000336 |
1257
+ | param_norm | 206 |
1258
+ | samples | 8.8e+05 |
1259
+ | step | 5.5e+04 |
1260
+ | vb | 0.00434 |
1261
+ | vb_q0 | 0.0174 |
1262
+ | vb_q1 | 0.000121 |
1263
+ | vb_q2 | 2.87e-05 |
1264
+ | vb_q3 | 4.16e-06 |
1265
+ -------------------------
1266
+ -------------------------
1267
+ | grad_norm | 0.0578 |
1268
+ | loss | 0.0329 |
1269
+ | loss_q0 | 0.112 |
1270
+ | loss_q1 | 0.0164 |
1271
+ | loss_q2 | 0.00319 |
1272
+ | loss_q3 | 0.000341 |
1273
+ | mse | 0.029 |
1274
+ | mse_q0 | 0.0971 |
1275
+ | mse_q1 | 0.0163 |
1276
+ | mse_q2 | 0.00316 |
1277
+ | mse_q3 | 0.000337 |
1278
+ | param_norm | 207 |
1279
+ | samples | 8.96e+05 |
1280
+ | step | 5.6e+04 |
1281
+ | vb | 0.00385 |
1282
+ | vb_q0 | 0.0153 |
1283
+ | vb_q1 | 0.000121 |
1284
+ | vb_q2 | 2.82e-05 |
1285
+ | vb_q3 | 4.18e-06 |
1286
+ -------------------------
1287
+ -------------------------
1288
+ | grad_norm | 0.055 |
1289
+ | loss | 0.0329 |
1290
+ | loss_q0 | 0.112 |
1291
+ | loss_q1 | 0.0165 |
1292
+ | loss_q2 | 0.00321 |
1293
+ | loss_q3 | 0.00033 |
1294
+ | mse | 0.029 |
1295
+ | mse_q0 | 0.0964 |
1296
+ | mse_q1 | 0.0164 |
1297
+ | mse_q2 | 0.00319 |
1298
+ | mse_q3 | 0.000326 |
1299
+ | param_norm | 207 |
1300
+ | samples | 9.12e+05 |
1301
+ | step | 5.7e+04 |
1302
+ | vb | 0.00392 |
1303
+ | vb_q0 | 0.0156 |
1304
+ | vb_q1 | 0.000121 |
1305
+ | vb_q2 | 2.83e-05 |
1306
+ | vb_q3 | 4.04e-06 |
1307
+ -------------------------
1308
+ -------------------------
1309
+ | grad_norm | 0.0567 |
1310
+ | loss | 0.0338 |
1311
+ | loss_q0 | 0.113 |
1312
+ | loss_q1 | 0.0168 |
1313
+ | loss_q2 | 0.00327 |
1314
+ | loss_q3 | 0.000333 |
1315
+ | mse | 0.0295 |
1316
+ | mse_q0 | 0.0965 |
1317
+ | mse_q1 | 0.0167 |
1318
+ | mse_q2 | 0.00324 |
1319
+ | mse_q3 | 0.000329 |
1320
+ | param_norm | 208 |
1321
+ | samples | 9.28e+05 |
1322
+ | step | 5.8e+04 |
1323
+ | vb | 0.00423 |
1324
+ | vb_q0 | 0.0165 |
1325
+ | vb_q1 | 0.000123 |
1326
+ | vb_q2 | 2.88e-05 |
1327
+ | vb_q3 | 4.06e-06 |
1328
+ -------------------------
1329
+ -------------------------
1330
+ | grad_norm | 0.0562 |
1331
+ | loss | 0.0341 |
1332
+ | loss_q0 | 0.115 |
1333
+ | loss_q1 | 0.0166 |
1334
+ | loss_q2 | 0.00321 |
1335
+ | loss_q3 | 0.00033 |
1336
+ | mse | 0.0295 |
1337
+ | mse_q0 | 0.0972 |
1338
+ | mse_q1 | 0.0165 |
1339
+ | mse_q2 | 0.00318 |
1340
+ | mse_q3 | 0.000326 |
1341
+ | param_norm | 209 |
1342
+ | samples | 9.44e+05 |
1343
+ | step | 5.9e+04 |
1344
+ | vb | 0.00459 |
1345
+ | vb_q0 | 0.018 |
1346
+ | vb_q1 | 0.000122 |
1347
+ | vb_q2 | 2.83e-05 |
1348
+ | vb_q3 | 4.03e-06 |
1349
+ -------------------------
1350
+ -------------------------
1351
+ | grad_norm | 0.0591 |
1352
+ | loss | 0.0323 |
1353
+ | loss_q0 | 0.109 |
1354
+ | loss_q1 | 0.0167 |
1355
+ | loss_q2 | 0.00328 |
1356
+ | loss_q3 | 0.000334 |
1357
+ | mse | 0.0289 |
1358
+ | mse_q0 | 0.0958 |
1359
+ | mse_q1 | 0.0166 |
1360
+ | mse_q2 | 0.00325 |
1361
+ | mse_q3 | 0.00033 |
1362
+ | param_norm | 209 |
1363
+ | samples | 9.6e+05 |
1364
+ | step | 6e+04 |
1365
+ | vb | 0.00337 |
1366
+ | vb_q0 | 0.0134 |
1367
+ | vb_q1 | 0.000123 |
1368
+ | vb_q2 | 2.88e-05 |
1369
+ | vb_q3 | 4.07e-06 |
1370
+ -------------------------
1371
+ saving model 0...
1372
+ saving model 0.995...
1373
+ evaluation indistro starting...
1374
+ done 96 samples: bpd=3.7332992553710938
1375
+ done 192 samples: bpd=3.742550849914551
1376
+ done 288 samples: bpd=3.750394821166992
1377
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_indistro_terms.npz
1378
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_indistro_terms.npz
1379
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_indistro_terms.npz
1380
+ evaluation nll complete
1381
+ evaluation outdistro starting...
1382
+ done 192 samples: bpd=3.7803030014038086
1383
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_outdistro_terms.npz
1384
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_outdistro_terms.npz
1385
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_outdistro_terms.npz
1386
+ evaluation nll complete
1387
+ sampling starting...
1388
+ -------------------------
1389
+ | grad_norm | 0.0561 |
1390
+ | loss | 0.0328 |
1391
+ | loss_q0 | 0.11 |
1392
+ | loss_q1 | 0.0166 |
1393
+ | loss_q2 | 0.00324 |
1394
+ | loss_q3 | 0.000332 |
1395
+ | mse | 0.0294 |
1396
+ | mse_q0 | 0.0963 |
1397
+ | mse_q1 | 0.0165 |
1398
+ | mse_q2 | 0.00321 |
1399
+ | mse_q3 | 0.000328 |
1400
+ | param_norm | 210 |
1401
+ | samples | 9.76e+05 |
1402
+ | step | 6.1e+04 |
1403
+ | vb | 0.00346 |
1404
+ | vb_q0 | 0.0135 |
1405
+ | vb_q1 | 0.000122 |
1406
+ | vb_q2 | 2.85e-05 |
1407
+ | vb_q3 | 4.05e-06 |
1408
+ -------------------------
1409
+ -------------------------
1410
+ | grad_norm | 0.055 |
1411
+ | loss | 0.033 |
1412
+ | loss_q0 | 0.113 |
1413
+ | loss_q1 | 0.0167 |
1414
+ | loss_q2 | 0.00321 |
1415
+ | loss_q3 | 0.000327 |
1416
+ | mse | 0.0291 |
1417
+ | mse_q0 | 0.0971 |
1418
+ | mse_q1 | 0.0166 |
1419
+ | mse_q2 | 0.00318 |
1420
+ | mse_q3 | 0.000323 |
1421
+ | param_norm | 210 |
1422
+ | samples | 9.92e+05 |
1423
+ | step | 6.2e+04 |
1424
+ | vb | 0.00388 |
1425
+ | vb_q0 | 0.0155 |
1426
+ | vb_q1 | 0.000122 |
1427
+ | vb_q2 | 2.82e-05 |
1428
+ | vb_q3 | 3.99e-06 |
1429
+ -------------------------
1430
+ -------------------------
1431
+ | grad_norm | 0.0522 |
1432
+ | loss | 0.0327 |
1433
+ | loss_q0 | 0.112 |
1434
+ | loss_q1 | 0.0166 |
1435
+ | loss_q2 | 0.00317 |
1436
+ | loss_q3 | 0.000321 |
1437
+ | mse | 0.0291 |
1438
+ | mse_q0 | 0.0975 |
1439
+ | mse_q1 | 0.0165 |
1440
+ | mse_q2 | 0.00314 |
1441
+ | mse_q3 | 0.000317 |
1442
+ | param_norm | 211 |
1443
+ | samples | 1.01e+06 |
1444
+ | step | 6.3e+04 |
1445
+ | vb | 0.00364 |
1446
+ | vb_q0 | 0.0146 |
1447
+ | vb_q1 | 0.000122 |
1448
+ | vb_q2 | 2.8e-05 |
1449
+ | vb_q3 | 3.91e-06 |
1450
+ -------------------------
1451
+ -------------------------
1452
+ | grad_norm | 0.0563 |
1453
+ | loss | 0.0326 |
1454
+ | loss_q0 | 0.11 |
1455
+ | loss_q1 | 0.0167 |
1456
+ | loss_q2 | 0.00322 |
1457
+ | loss_q3 | 0.000333 |
1458
+ | mse | 0.0287 |
1459
+ | mse_q0 | 0.0949 |
1460
+ | mse_q1 | 0.0165 |
1461
+ | mse_q2 | 0.0032 |
1462
+ | mse_q3 | 0.000329 |
1463
+ | param_norm | 211 |
1464
+ | samples | 1.02e+06 |
1465
+ | step | 6.4e+04 |
1466
+ | vb | 0.00392 |
1467
+ | vb_q0 | 0.0155 |
1468
+ | vb_q1 | 0.000122 |
1469
+ | vb_q2 | 2.84e-05 |
1470
+ | vb_q3 | 4.06e-06 |
1471
+ -------------------------
1472
+ -------------------------
1473
+ | grad_norm | 0.0557 |
1474
+ | loss | 0.0327 |
1475
+ | loss_q0 | 0.111 |
1476
+ | loss_q1 | 0.0167 |
1477
+ | loss_q2 | 0.00317 |
1478
+ | loss_q3 | 0.000325 |
1479
+ | mse | 0.0288 |
1480
+ | mse_q0 | 0.0954 |
1481
+ | mse_q1 | 0.0166 |
1482
+ | mse_q2 | 0.00314 |
1483
+ | mse_q3 | 0.000321 |
1484
+ | param_norm | 212 |
1485
+ | samples | 1.04e+06 |
1486
+ | step | 6.5e+04 |
1487
+ | vb | 0.00387 |
1488
+ | vb_q0 | 0.0154 |
1489
+ | vb_q1 | 0.000122 |
1490
+ | vb_q2 | 2.8e-05 |
1491
+ | vb_q3 | 3.95e-06 |
1492
+ -------------------------
1493
+ -------------------------
1494
+ | grad_norm | 0.0545 |
1495
+ | loss | 0.032 |
1496
+ | loss_q0 | 0.11 |
1497
+ | loss_q1 | 0.0167 |
1498
+ | loss_q2 | 0.00324 |
1499
+ | loss_q3 | 0.000323 |
1500
+ | mse | 0.0282 |
1501
+ | mse_q0 | 0.0944 |
1502
+ | mse_q1 | 0.0165 |
1503
+ | mse_q2 | 0.00321 |
1504
+ | mse_q3 | 0.00032 |
1505
+ | param_norm | 212 |
1506
+ | samples | 1.06e+06 |
1507
+ | step | 6.6e+04 |
1508
+ | vb | 0.00382 |
1509
+ | vb_q0 | 0.0154 |
1510
+ | vb_q1 | 0.000122 |
1511
+ | vb_q2 | 2.85e-05 |
1512
+ | vb_q3 | 3.94e-06 |
1513
+ -------------------------
1514
+ -------------------------
1515
+ | grad_norm | 0.0545 |
1516
+ | loss | 0.0326 |
1517
+ | loss_q0 | 0.111 |
1518
+ | loss_q1 | 0.0166 |
1519
+ | loss_q2 | 0.00322 |
1520
+ | loss_q3 | 0.00032 |
1521
+ | mse | 0.0288 |
1522
+ | mse_q0 | 0.0955 |
1523
+ | mse_q1 | 0.0164 |
1524
+ | mse_q2 | 0.00319 |
1525
+ | mse_q3 | 0.000316 |
1526
+ | param_norm | 213 |
1527
+ | samples | 1.07e+06 |
1528
+ | step | 6.7e+04 |
1529
+ | vb | 0.00382 |
1530
+ | vb_q0 | 0.0152 |
1531
+ | vb_q1 | 0.000121 |
1532
+ | vb_q2 | 2.83e-05 |
1533
+ | vb_q3 | 3.89e-06 |
1534
+ -------------------------
1535
+ -------------------------
1536
+ | grad_norm | 0.0563 |
1537
+ | loss | 0.0335 |
1538
+ | loss_q0 | 0.114 |
1539
+ | loss_q1 | 0.0165 |
1540
+ | loss_q2 | 0.0032 |
1541
+ | loss_q3 | 0.000325 |
1542
+ | mse | 0.0294 |
1543
+ | mse_q0 | 0.098 |
1544
+ | mse_q1 | 0.0164 |
1545
+ | mse_q2 | 0.00317 |
1546
+ | mse_q3 | 0.000321 |
1547
+ | param_norm | 213 |
1548
+ | samples | 1.09e+06 |
1549
+ | step | 6.8e+04 |
1550
+ | vb | 0.00401 |
1551
+ | vb_q0 | 0.0159 |
1552
+ | vb_q1 | 0.000121 |
1553
+ | vb_q2 | 2.81e-05 |
1554
+ | vb_q3 | 3.96e-06 |
1555
+ -------------------------
1556
+ -------------------------
1557
+ | grad_norm | 0.055 |
1558
+ | loss | 0.0318 |
1559
+ | loss_q0 | 0.107 |
1560
+ | loss_q1 | 0.0168 |
1561
+ | loss_q2 | 0.00323 |
1562
+ | loss_q3 | 0.000317 |
1563
+ | mse | 0.0287 |
1564
+ | mse_q0 | 0.0942 |
1565
+ | mse_q1 | 0.0166 |
1566
+ | mse_q2 | 0.00321 |
1567
+ | mse_q3 | 0.000313 |
1568
+ | param_norm | 214 |
1569
+ | samples | 1.1e+06 |
1570
+ | step | 6.9e+04 |
1571
+ | vb | 0.00313 |
1572
+ | vb_q0 | 0.0124 |
1573
+ | vb_q1 | 0.000123 |
1574
+ | vb_q2 | 2.84e-05 |
1575
+ | vb_q3 | 3.86e-06 |
1576
+ -------------------------
1577
+ -------------------------
1578
+ | grad_norm | 0.0537 |
1579
+ | loss | 0.0316 |
1580
+ | loss_q0 | 0.105 |
1581
+ | loss_q1 | 0.0166 |
1582
+ | loss_q2 | 0.00318 |
1583
+ | loss_q3 | 0.000318 |
1584
+ | mse | 0.0286 |
1585
+ | mse_q0 | 0.0936 |
1586
+ | mse_q1 | 0.0165 |
1587
+ | mse_q2 | 0.00315 |
1588
+ | mse_q3 | 0.000314 |
1589
+ | param_norm | 215 |
1590
+ | samples | 1.12e+06 |
1591
+ | step | 7e+04 |
1592
+ | vb | 0.00302 |
1593
+ | vb_q0 | 0.0118 |
1594
+ | vb_q1 | 0.000122 |
1595
+ | vb_q2 | 2.8e-05 |
1596
+ | vb_q3 | 3.87e-06 |
1597
+ -------------------------
1598
+ saving model 0...
1599
+ saving model 0.995...
1600
+ evaluation indistro starting...
1601
+ done 96 samples: bpd=3.8689794540405273
1602
+ done 192 samples: bpd=3.703700542449951
1603
+ done 288 samples: bpd=3.6549039681752524
1604
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_indistro_terms.npz
1605
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_indistro_terms.npz
1606
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model70000_indistro_terms.npz
1607
+ evaluation nll complete
1608
+ evaluation outdistro starting...
1609
+ done 192 samples: bpd=3.788196086883545
1610
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_outdistro_terms.npz
1611
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_outdistro_terms.npz
1612
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model70000_outdistro_terms.npz
1613
+ evaluation nll complete
1614
+ sampling starting...
1615
+ -------------------------
1616
+ | grad_norm | 0.0552 |
1617
+ | loss | 0.0336 |
1618
+ | loss_q0 | 0.112 |
1619
+ | loss_q1 | 0.0168 |
1620
+ | loss_q2 | 0.00322 |
1621
+ | loss_q3 | 0.00032 |
1622
+ | mse | 0.0297 |
1623
+ | mse_q0 | 0.0973 |
1624
+ | mse_q1 | 0.0166 |
1625
+ | mse_q2 | 0.00319 |
1626
+ | mse_q3 | 0.000316 |
1627
+ | param_norm | 215 |
1628
+ | samples | 1.14e+06 |
1629
+ | step | 7.1e+04 |
1630
+ | vb | 0.00389 |
1631
+ | vb_q0 | 0.0152 |
1632
+ | vb_q1 | 0.000123 |
1633
+ | vb_q2 | 2.83e-05 |
1634
+ | vb_q3 | 3.9e-06 |
1635
+ -------------------------
1636
+ -------------------------
1637
+ | grad_norm | 0.0521 |
1638
+ | loss | 0.0323 |
1639
+ | loss_q0 | 0.109 |
1640
+ | loss_q1 | 0.0167 |
1641
+ | loss_q2 | 0.00316 |
1642
+ | loss_q3 | 0.000313 |
1643
+ | mse | 0.0285 |
1644
+ | mse_q0 | 0.0942 |
1645
+ | mse_q1 | 0.0166 |
1646
+ | mse_q2 | 0.00313 |
1647
+ | mse_q3 | 0.00031 |
1648
+ | param_norm | 216 |
1649
+ | samples | 1.15e+06 |
1650
+ | step | 7.2e+04 |
1651
+ | vb | 0.00381 |
1652
+ | vb_q0 | 0.0151 |
1653
+ | vb_q1 | 0.000123 |
1654
+ | vb_q2 | 2.78e-05 |
1655
+ | vb_q3 | 3.81e-06 |
1656
+ -------------------------
1657
+ -------------------------
1658
+ | grad_norm | 0.056 |
1659
+ | loss | 0.0321 |
1660
+ | loss_q0 | 0.109 |
1661
+ | loss_q1 | 0.0165 |
1662
+ | loss_q2 | 0.00314 |
1663
+ | loss_q3 | 0.000315 |
1664
+ | mse | 0.029 |
1665
+ | mse_q0 | 0.0965 |
1666
+ | mse_q1 | 0.0164 |
1667
+ | mse_q2 | 0.00312 |
1668
+ | mse_q3 | 0.000311 |
1669
+ | param_norm | 216 |
1670
+ | samples | 1.17e+06 |
1671
+ | step | 7.3e+04 |
1672
+ | vb | 0.00309 |
1673
+ | vb_q0 | 0.0123 |
1674
+ | vb_q1 | 0.000121 |
1675
+ | vb_q2 | 2.78e-05 |
1676
+ | vb_q3 | 3.84e-06 |
1677
+ -------------------------
1678
+ -------------------------
1679
+ | grad_norm | 0.0551 |
1680
+ | loss | 0.0329 |
1681
+ | loss_q0 | 0.11 |
1682
+ | loss_q1 | 0.0163 |
1683
+ | loss_q2 | 0.00321 |
1684
+ | loss_q3 | 0.00032 |
1685
+ | mse | 0.029 |
1686
+ | mse_q0 | 0.0948 |
1687
+ | mse_q1 | 0.0162 |
1688
+ | mse_q2 | 0.00318 |
1689
+ | mse_q3 | 0.000316 |
1690
+ | param_norm | 217 |
1691
+ | samples | 1.18e+06 |
1692
+ | step | 7.4e+04 |
1693
+ | vb | 0.0039 |
1694
+ | vb_q0 | 0.0152 |
1695
+ | vb_q1 | 0.00012 |
1696
+ | vb_q2 | 2.82e-05 |
1697
+ | vb_q3 | 3.88e-06 |
1698
+ -------------------------
1699
+ -------------------------
1700
+ | grad_norm | 0.0539 |
1701
+ | loss | 0.0323 |
1702
+ | loss_q0 | 0.112 |
1703
+ | loss_q1 | 0.0163 |
1704
+ | loss_q2 | 0.00319 |
1705
+ | loss_q3 | 0.000316 |
1706
+ | mse | 0.0286 |
1707
+ | mse_q0 | 0.0974 |
1708
+ | mse_q1 | 0.0162 |
1709
+ | mse_q2 | 0.00316 |
1710
+ | mse_q3 | 0.000313 |
1711
+ | param_norm | 217 |
1712
+ | samples | 1.2e+06 |
1713
+ | step | 7.5e+04 |
1714
+ | vb | 0.00365 |
1715
+ | vb_q0 | 0.0148 |
1716
+ | vb_q1 | 0.00012 |
1717
+ | vb_q2 | 2.81e-05 |
1718
+ | vb_q3 | 3.85e-06 |
1719
+ -------------------------
1720
+ -------------------------
1721
+ | grad_norm | 0.053 |
1722
+ | loss | 0.0342 |
1723
+ | loss_q0 | 0.116 |
1724
+ | loss_q1 | 0.0166 |
1725
+ | loss_q2 | 0.00318 |
1726
+ | loss_q3 | 0.000306 |
1727
+ | mse | 0.0296 |
1728
+ | mse_q0 | 0.0982 |
1729
+ | mse_q1 | 0.0164 |
1730
+ | mse_q2 | 0.00315 |
1731
+ | mse_q3 | 0.000303 |
1732
+ | param_norm | 218 |
1733
+ | samples | 1.22e+06 |
1734
+ | step | 7.6e+04 |
1735
+ | vb | 0.00462 |
1736
+ | vb_q0 | 0.0183 |
1737
+ | vb_q1 | 0.000122 |
1738
+ | vb_q2 | 2.8e-05 |
1739
+ | vb_q3 | 3.73e-06 |
1740
+ -------------------------
1741
+ -------------------------
1742
+ | grad_norm | 0.0529 |
1743
+ | loss | 0.0316 |
1744
+ | loss_q0 | 0.107 |
1745
+ | loss_q1 | 0.0164 |
1746
+ | loss_q2 | 0.00313 |
1747
+ | loss_q3 | 0.000315 |
1748
+ | mse | 0.0285 |
1749
+ | mse_q0 | 0.0946 |
1750
+ | mse_q1 | 0.0163 |
1751
+ | mse_q2 | 0.00311 |
1752
+ | mse_q3 | 0.000311 |
1753
+ | param_norm | 218 |
1754
+ | samples | 1.23e+06 |
1755
+ | step | 7.7e+04 |
1756
+ | vb | 0.00309 |
1757
+ | vb_q0 | 0.0122 |
1758
+ | vb_q1 | 0.00012 |
1759
+ | vb_q2 | 2.77e-05 |
1760
+ | vb_q3 | 3.82e-06 |
1761
+ -------------------------
1762
+ -------------------------
1763
+ | grad_norm | 0.0518 |
1764
+ | loss | 0.0333 |
1765
+ | loss_q0 | 0.117 |
1766
+ | loss_q1 | 0.0163 |
1767
+ | loss_q2 | 0.00321 |
1768
+ | loss_q3 | 0.000305 |
1769
+ | mse | 0.0287 |
1770
+ | mse_q0 | 0.098 |
1771
+ | mse_q1 | 0.0162 |
1772
+ | mse_q2 | 0.00319 |
1773
+ | mse_q3 | 0.000301 |
1774
+ | param_norm | 219 |
1775
+ | samples | 1.25e+06 |
1776
+ | step | 7.8e+04 |
1777
+ | vb | 0.00466 |
1778
+ | vb_q0 | 0.0191 |
1779
+ | vb_q1 | 0.00012 |
1780
+ | vb_q2 | 2.83e-05 |
1781
+ | vb_q3 | 3.71e-06 |
1782
+ -------------------------
1783
+ -------------------------
1784
+ | grad_norm | 0.0557 |
1785
+ | loss | 0.0322 |
1786
+ | loss_q0 | 0.11 |
1787
+ | loss_q1 | 0.0166 |
1788
+ | loss_q2 | 0.00322 |
1789
+ | loss_q3 | 0.000315 |
1790
+ | mse | 0.0285 |
1791
+ | mse_q0 | 0.0949 |
1792
+ | mse_q1 | 0.0165 |
1793
+ | mse_q2 | 0.00319 |
1794
+ | mse_q3 | 0.000312 |
1795
+ | param_norm | 219 |
1796
+ | samples | 1.26e+06 |
1797
+ | step | 7.9e+04 |
1798
+ | vb | 0.00366 |
1799
+ | vb_q0 | 0.0146 |
1800
+ | vb_q1 | 0.000122 |
1801
+ | vb_q2 | 2.83e-05 |
1802
+ | vb_q3 | 3.83e-06 |
1803
+ -------------------------
1804
+ -------------------------
1805
+ | grad_norm | 0.0526 |
1806
+ | loss | 0.031 |
1807
+ | loss_q0 | 0.107 |
1808
+ | loss_q1 | 0.0165 |
1809
+ | loss_q2 | 0.00321 |
1810
+ | loss_q3 | 0.000306 |
1811
+ | mse | 0.0276 |
1812
+ | mse_q0 | 0.0935 |
1813
+ | mse_q1 | 0.0164 |
1814
+ | mse_q2 | 0.00319 |
1815
+ | mse_q3 | 0.000303 |
1816
+ | param_norm | 220 |
1817
+ | samples | 1.28e+06 |
1818
+ | step | 8e+04 |
1819
+ | vb | 0.00343 |
1820
+ | vb_q0 | 0.014 |
1821
+ | vb_q1 | 0.000121 |
1822
+ | vb_q2 | 2.83e-05 |
1823
+ | vb_q3 | 3.73e-06 |
1824
+ -------------------------
1825
+ saving model 0...
1826
+ saving model 0.995...
1827
+ evaluation indistro starting...
1828
+ done 96 samples: bpd=3.589547634124756
1829
+ done 192 samples: bpd=3.518894910812378
1830
+ done 288 samples: bpd=3.5158642133076987
1831
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_indistro_terms.npz
1832
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_indistro_terms.npz
1833
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model80000_indistro_terms.npz
1834
+ evaluation nll complete
1835
+ evaluation outdistro starting...
1836
+ done 192 samples: bpd=3.783998489379883
1837
+ saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_outdistro_terms.npz
1838
+ saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_outdistro_terms.npz
1839
+ saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model80000_outdistro_terms.npz
1840
+ evaluation nll complete
1841
+ sampling starting...
1842
+ -------------------------
1843
+ | grad_norm | 0.0541 |
1844
+ | loss | 0.0329 |
1845
+ | loss_q0 | 0.111 |
1846
+ | loss_q1 | 0.0166 |
1847
+ | loss_q2 | 0.00321 |
1848
+ | loss_q3 | 0.000311 |
1849
+ | mse | 0.0292 |
1850
+ | mse_q0 | 0.0963 |
1851
+ | mse_q1 | 0.0165 |
1852
+ | mse_q2 | 0.00318 |
1853
+ | mse_q3 | 0.000308 |
1854
+ | param_norm | 221 |
1855
+ | samples | 1.3e+06 |
1856
+ | step | 8.1e+04 |
1857
+ | vb | 0.00363 |
1858
+ | vb_q0 | 0.0143 |
1859
+ | vb_q1 | 0.000122 |
1860
+ | vb_q2 | 2.82e-05 |
1861
+ | vb_q3 | 3.79e-06 |
1862
+ -------------------------
1863
+ -------------------------
1864
+ | grad_norm | 0.0519 |
1865
+ | loss | 0.034 |
1866
+ | loss_q0 | 0.116 |
1867
+ | loss_q1 | 0.0167 |
1868
+ | loss_q2 | 0.0032 |
1869
+ | loss_q3 | 0.000307 |
1870
+ | mse | 0.0295 |
1871
+ | mse_q0 | 0.0981 |
1872
+ | mse_q1 | 0.0166 |
1873
+ | mse_q2 | 0.00317 |
1874
+ | mse_q3 | 0.000303 |
1875
+ | param_norm | 221 |
1876
+ | samples | 1.31e+06 |
1877
+ | step | 8.2e+04 |
1878
+ | vb | 0.0045 |
1879
+ | vb_q0 | 0.0179 |
1880
+ | vb_q1 | 0.000122 |
1881
+ | vb_q2 | 2.82e-05 |
1882
+ | vb_q3 | 3.73e-06 |
1883
+ -------------------------
1884
+ -------------------------
1885
+ | grad_norm | 0.0539 |
1886
+ | loss | 0.032 |
1887
+ | loss_q0 | 0.107 |
1888
+ | loss_q1 | 0.0165 |
1889
+ | loss_q2 | 0.00318 |
1890
+ | loss_q3 | 0.000305 |
1891
+ | mse | 0.0288 |
1892
+ | mse_q0 | 0.0941 |
1893
+ | mse_q1 | 0.0164 |
1894
+ | mse_q2 | 0.00315 |
1895
+ | mse_q3 | 0.000301 |
1896
+ | param_norm | 222 |
1897
+ | samples | 1.33e+06 |
1898
+ | step | 8.3e+04 |
1899
+ | vb | 0.00327 |
1900
+ | vb_q0 | 0.0127 |
1901
+ | vb_q1 | 0.000121 |
1902
+ | vb_q2 | 2.8e-05 |
1903
+ | vb_q3 | 3.71e-06 |
1904
+ -------------------------
1905
+ -------------------------
1906
+ | grad_norm | 0.0548 |
1907
+ | loss | 0.0326 |
1908
+ | loss_q0 | 0.111 |
1909
+ | loss_q1 | 0.0164 |
1910
+ | loss_q2 | 0.00321 |
1911
+ | loss_q3 | 0.000306 |
1912
+ | mse | 0.0289 |
1913
+ | mse_q0 | 0.0961 |
1914
+ | mse_q1 | 0.0163 |
1915
+ | mse_q2 | 0.00318 |
1916
+ | mse_q3 | 0.000302 |
1917
+ | param_norm | 222 |
1918
+ | samples | 1.34e+06 |
1919
+ | step | 8.4e+04 |
1920
+ | vb | 0.00375 |
1921
+ | vb_q0 | 0.0149 |
1922
+ | vb_q1 | 0.000121 |
1923
+ | vb_q2 | 2.82e-05 |
1924
+ | vb_q3 | 3.72e-06 |
1925
+ -------------------------
1926
+ -------------------------
1927
+ | grad_norm | 0.0538 |
1928
+ | loss | 0.033 |
1929
+ | loss_q0 | 0.112 |
1930
+ | loss_q1 | 0.0164 |
1931
+ | loss_q2 | 0.00319 |
1932
+ | loss_q3 | 0.000304 |
1933
+ | mse | 0.0287 |
1934
+ | mse_q0 | 0.0949 |
1935
+ | mse_q1 | 0.0163 |
1936
+ | mse_q2 | 0.00317 |
1937
+ | mse_q3 | 0.0003 |
1938
+ | param_norm | 223 |
1939
+ | samples | 1.36e+06 |
1940
+ | step | 8.5e+04 |
1941
+ | vb | 0.00431 |
1942
+ | vb_q0 | 0.0171 |
1943
+ | vb_q1 | 0.00012 |
1944
+ | vb_q2 | 2.81e-05 |
1945
+ | vb_q3 | 3.69e-06 |
1946
+ -------------------------
1947
+ -------------------------
1948
+ | grad_norm | 0.0539 |
1949
+ | loss | 0.0326 |
1950
+ | loss_q0 | 0.112 |
1951
+ | loss_q1 | 0.0162 |
1952
+ | loss_q2 | 0.00316 |
1953
+ | loss_q3 | 0.000305 |
1954
+ | mse | 0.0285 |
1955
+ | mse_q0 | 0.0951 |
1956
+ | mse_q1 | 0.0161 |
1957
+ | mse_q2 | 0.00313 |
1958
+ | mse_q3 | 0.000301 |
1959
+ | param_norm | 223 |
1960
+ | samples | 1.38e+06 |
1961
+ | step | 8.6e+04 |
1962
+ | vb | 0.00417 |
1963
+ | vb_q0 | 0.0167 |
1964
+ | vb_q1 | 0.000119 |
1965
+ | vb_q2 | 2.78e-05 |
1966
+ | vb_q3 | 3.7e-06 |
1967
+ -------------------------
1968
+ -------------------------
1969
+ | grad_norm | 0.0528 |
1970
+ | loss | 0.0334 |
1971
+ | loss_q0 | 0.112 |
1972
+ | loss_q1 | 0.0162 |
1973
+ | loss_q2 | 0.00315 |
1974
+ | loss_q3 | 0.000298 |
1975
+ | mse | 0.0294 |
1976
+ | mse_q0 | 0.0967 |
1977
+ | mse_q1 | 0.0161 |
1978
+ | mse_q2 | 0.00312 |
1979
+ | mse_q3 | 0.000294 |
1980
+ | param_norm | 224 |
1981
+ | samples | 1.39e+06 |
1982
+ | step | 8.7e+04 |
1983
+ | vb | 0.00398 |
1984
+ | vb_q0 | 0.0155 |
1985
+ | vb_q1 | 0.000119 |
1986
+ | vb_q2 | 2.78e-05 |
1987
+ | vb_q3 | 3.62e-06 |
1988
+ -------------------------
1989
+ -------------------------
1990
+ | grad_norm | 0.0519 |
1991
+ | loss | 0.0328 |
1992
+ | loss_q0 | 0.112 |
1993
+ | loss_q1 | 0.0163 |
1994
+ | loss_q2 | 0.00322 |
1995
+ | loss_q3 | 0.000293 |
1996
+ | mse | 0.0285 |
1997
+ | mse_q0 | 0.095 |
1998
+ | mse_q1 | 0.0162 |
1999
+ | mse_q2 | 0.00319 |
2000
+ | mse_q3 | 0.00029 |
2001
+ | param_norm | 224 |
2002
+ | samples | 1.41e+06 |
2003
+ | step | 8.8e+04 |
2004
+ | vb | 0.00427 |
2005
+ | vb_q0 | 0.017 |
2006
+ | vb_q1 | 0.00012 |
2007
+ | vb_q2 | 2.83e-05 |
2008
+ | vb_q3 | 3.58e-06 |
2009
+ -------------------------
2010
+ -------------------------
2011
+ | grad_norm | 0.0527 |
2012
+ | loss | 0.0333 |
2013
+ | loss_q0 | 0.113 |
2014
+ | loss_q1 | 0.0163 |
2015
+ | loss_q2 | 0.00317 |
2016
+ | loss_q3 | 0.000296 |
2017
+ | mse | 0.0293 |
2018
+ | mse_q0 | 0.0969 |
2019
+ | mse_q1 | 0.0162 |
2020
+ | mse_q2 | 0.00315 |
2021
+ | mse_q3 | 0.000293 |
2022
+ | param_norm | 225 |
2023
+ | samples | 1.42e+06 |
2024
+ | step | 8.9e+04 |
2025
+ | vb | 0.00403 |
2026
+ | vb_q0 | 0.0158 |
2027
+ | vb_q1 | 0.00012 |
2028
+ | vb_q2 | 2.79e-05 |
2029
+ | vb_q3 | 3.61e-06 |
2030
+ -------------------------
2031
+ -------------------------
2032
+ | grad_norm | 0.0531 |
2033
+ | loss | 0.0321 |
2034
+ | loss_q0 | 0.109 |
2035
+ | loss_q1 | 0.0163 |
2036
+ | loss_q2 | 0.00314 |
2037
+ | loss_q3 | 0.000301 |
2038
+ | mse | 0.0281 |
2039
+ | mse_q0 | 0.0931 |
2040
+ | mse_q1 | 0.0162 |
2041
+ | mse_q2 | 0.00311 |
2042
+ | mse_q3 | 0.000297 |
2043
+ | param_norm | 225 |
2044
+ | samples | 1.44e+06 |
2045
+ | step | 9e+04 |
2046
+ | vb | 0.00403 |
2047
+ | vb_q0 | 0.0161 |
2048
+ | vb_q1 | 0.00012 |
2049
+ | vb_q2 | 2.77e-05 |
2050
+ | vb_q3 | 3.65e-06 |
2051
+ -------------------------
2052
+ saving model 0...
2053
+ saving model 0.995...
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/model090000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faa39741934e7290b8c99be648286a526d52da84b83913d8c5fc1d2eda742d3e
3
+ size 118795331
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2d9b7055a02de22f4bf1194021fe75f719aed183afa631bf91ddfc96e92950b
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d2abf9b2d1212b81e1898946fd6b71b7750dc186e48b1967989fd1f592ef1b7
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f680d6299d5a8bea5679596fa5c17907c3e9305b8824b155a0991ff82da708be
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab566effd6f15e249d3035436290cf4e8f31b794df613b0be0f513aef26c04af
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3fca8434fd5d5cef29f3dcaa57f04aff6fe174803759c1d25a177bdf1c3fe71
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47eda96e0d93f907ef270723ece66b2a3f58eff338f76860224e9b96feb69672
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98df3087270472019c5ab8615f297b5269042339aaf2c4a3fb3d2e0db459c6df
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e798a4fb4501bcdaf45f8ba89b5816e3fc7f56bf06ec09313f2d1d5a3a8591
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0662f34dcda129eaade97d62bb7f0948541a3e3766e36bd2ba9e8c56e61aae1
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98742f94747784171671e123b6888d7b5c637b49092cc59a94cfa309f8a0681a
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beda7d927cf4200f1277b3c54d745cfa72b10475ac7ab5ac9b6ec7244ca2e21f
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a04bebd68bd06c37a5e7b950aff6a0bfc3fbab35a1fd6e2417db3a1bcee3915
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b72fe3fdc5d8f9bc46ce994ad50024562ead5deb8e254be8cbd8ffbbdd37e1f9
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93ecad13c3f357059a05c94a281553263823029fda7f3a74044264a68d8f0457
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48b234bca5e10af6780f168a2c9607be1b7512264d74acd91b045d282a8ad381
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c37c2f003b3fbd8696b86b6c6a27d0370efe75d4f9fa14cdfa95076ecf7cd0d4
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/progress.csv ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ grad_norm,loss,loss_q0,loss_q1,loss_q2,loss_q3,mse,mse_q0,mse_q1,mse_q2,mse_q3,param_norm,samples,step,vb,vb_q0,vb_q1,vb_q2,vb_q3
2
+ 2.5351430912370003,1.0083870887756348,1.0080348,1.0147415,1.0054059,1.0136827,0.998694896697998,0.99989533,1.0074818,0.9962311,1.0014414,180.41246248133166,16,0,0.009692199528217316,0.008139333,0.0072596963,0.009174611,0.012241336
3
+ 0.38749177888836006,0.1188441446544604,0.23050378,0.09230976,0.07746425,0.07026056,0.11248564948420937,0.20805381,0.091629766,0.07674303,0.069372825,180.66343956539816,16016,1000,0.006358495749438592,0.02245115,0.0006805919,0.0007197115,0.00088763604
4
+ 0.12307880156062548,0.04229613807797427,0.1380176,0.02121456,0.006024488,0.002998885,0.03858366940822451,0.1235378,0.021058422,0.005970266,0.0029609331,180.98630945099032,32016,2000,0.0037124686531751676,0.014480295,0.00015607383,5.4194606e-05,3.7959086e-05
5
+ 0.10861653979302052,0.039761583946645196,0.13161595,0.019968102,0.004992695,0.0019074993,0.03586718766624112,0.116353765,0.01982141,0.0049480926,0.0018834297,181.3068163062271,48016,3000,0.003894396077477716,0.015261498,0.00014671894,4.4623197e-05,2.4088806e-05
6
+ 0.09964214955218444,0.03897652612999087,0.13006906,0.019326078,0.0044136457,0.0014531624,0.034191709961276504,0.111236505,0.019184364,0.004374178,0.0014348875,181.6596103300142,64016,4000,0.004784816259354556,0.018831875,0.00014192188,3.9468487e-05,1.8275206e-05
7
+ 0.09317443470311265,0.037605101859662635,0.12454447,0.018902501,0.0041123107,0.001154012,0.03368547698156907,0.109276615,0.018763695,0.004075592,0.0011394793,182.04426555810963,80016,5000,0.0039196247911386295,0.015267931,0.0001387761,3.6689344e-05,1.4532697e-05
8
+ 0.0886957447274456,0.035527612912002925,0.120667055,0.01854412,0.0040197615,0.0009905453,0.03219566396577278,0.107276805,0.018407892,0.00398406,0.0009781083,182.46636837398046,96016,6000,0.0033319491002730484,0.01339026,0.00013620706,3.5672114e-05,1.2439021e-05
9
+ 0.08884252483390416,0.037085171052720405,0.12610608,0.018420853,0.0038603789,0.00089521776,0.03263257407117637,0.10839811,0.018285641,0.0038261223,0.0008839919,182.8893104605321,112016,7000,0.004452596903582152,0.017707948,0.00013522441,3.426993e-05,1.122406e-05
10
+ 0.0857711745360411,0.03572559505654495,0.11959203,0.018250594,0.0038038292,0.0008218667,0.03240766271762553,0.10657379,0.018116733,0.0037700704,0.0008115997,183.31371071363583,128016,8000,0.0033179325486016676,0.013017683,0.00013396822,3.3756118e-05,1.0269199e-05
11
+ 0.08352209011027495,0.03627534082811327,0.122893825,0.018271394,0.0037806442,0.00076336414,0.032151561991777225,0.10650192,0.018137224,0.0037471913,0.0007538211,183.72409575601273,144016,9000,0.004123778771936488,0.016392084,0.00013416508,3.3446035e-05,9.537006e-06
12
+ 0.07819607665340927,0.03558732673386118,0.12148027,0.01801353,0.0037238055,0.0007050081,0.03151981560187414,0.10513709,0.017881062,0.003690869,0.0006962378,184.14608868604898,160016,10000,0.004067511171997459,0.016343135,0.00013240371,3.294034e-05,8.767597e-06
13
+ 0.07929677300921607,0.035510201264638455,0.118732445,0.017892234,0.0036725905,0.0006744754,0.0318000881602056,0.10418824,0.017760986,0.0036401371,0.00066605385,184.56062210642554,176016,11000,0.003710113193408687,0.0145442765,0.00013128045,3.245605e-05,8.422207e-06
14
+ 0.07606976359003007,0.036228113402612394,0.11915751,0.01767679,0.003570582,0.0006312284,0.03206723391730331,0.1031912,0.017547045,0.0035389613,0.00062336045,184.98705663130787,192016,12000,0.004160879494367684,0.01596667,0.00012979291,3.1647447e-05,7.869366e-06
15
+ 0.07580516411874072,0.035391651648562346,0.11950631,0.01797185,0.0035955356,0.00061021117,0.0313885395638644,0.10364518,0.017839914,0.0035637391,0.00060262426,185.4279781777233,208016,13000,0.004003112132235403,0.015860839,0.00013189905,3.1765376e-05,7.586633e-06
16
+ 0.07445083135354322,0.03409526038984763,0.11401415,0.017829452,0.003512294,0.0005860707,0.031001788998255484,0.101847194,0.017698564,0.0034811932,0.00057878107,185.87382808638486,224016,14000,0.003093471366293667,0.012167456,0.00013081093,3.108762e-05,7.2855028e-06
17
+ 0.07279939663843127,0.034026893349597354,0.11569134,0.01771187,0.0035322888,0.0005639997,0.03078441938618196,0.102721766,0.017581943,0.0035010688,0.000557,186.32704342058275,240016,15000,0.003242473963002344,0.012969432,0.00013002187,3.120578e-05,6.992426e-06
18
+ 0.0736225762665543,0.03601916115265344,0.12135752,0.017668933,0.0035753683,0.00055964786,0.031502397187519876,0.10361251,0.017539231,0.0035438044,0.00055272045,186.78717955530357,256016,16000,0.004516764026866449,0.01774468,0.00012970669,3.1536758e-05,6.9295943e-06
19
+ 0.07003611841770217,0.03470956698013467,0.115704976,0.017651262,0.003517309,0.00052276324,0.030937781215412487,0.10103667,0.017521774,0.0034862761,0.0005162885,187.2523824098204,272016,17000,0.003771785830802405,0.014667533,0.00012964712,3.101094e-05,6.4721166e-06
20
+ 0.07022596794148567,0.033926365358289357,0.11516196,0.01744049,0.0034680655,0.00051565305,0.03027114991284904,0.10055869,0.01731255,0.0034374394,0.00050925295,187.71733501280244,288016,18000,0.0036552153062184476,0.014603293,0.000128011,3.0635038e-05,6.398486e-06
21
+ 0.06760526681911644,0.03312311216723178,0.11218125,0.0174029,0.0034353957,0.00050708477,0.030387418352998782,0.101301864,0.017275268,0.0034049859,0.000500825,188.18610723568634,304016,19000,0.0027356939040691984,0.010879083,0.0001276402,3.0393301e-05,6.259092e-06
22
+ 0.06846573576417096,0.033713404638692775,0.11369722,0.017500442,0.0034515406,0.00049525604,0.03003398319613185,0.0990803,0.017371753,0.003421087,0.00048912317,188.66174008771435,320016,20000,0.003679421486311178,0.014616791,0.00012848775,3.0460027e-05,6.1334135e-06
23
+ 0.06570787989823366,0.034831443264149116,0.117571786,0.017496178,0.003436851,0.00047775477,0.030749482037965188,0.10144187,0.01736774,0.0034065326,0.0004718528,189.14313822414698,336016,21000,0.0040819612771483636,0.016130125,0.00012842721,3.0319676e-05,5.9043014e-06
24
+ 0.06500338504391671,0.03312428622506552,0.11410628,0.017498154,0.0034039908,0.00046727248,0.02946588172530758,0.09922673,0.017369624,0.0033738937,0.00046150686,189.61774857027513,352016,22000,0.0036584045571617105,0.01488075,0.00012852503,3.00793e-05,5.7660286e-06
25
+ 0.0657523784396333,0.033238833872135755,0.11149831,0.017255954,0.0033713912,0.00046014483,0.02977588848094456,0.097882025,0.017129181,0.003341607,0.0004544512,190.09695096125114,368016,23000,0.003462945427370877,0.013616501,0.00012662949,2.9804314e-05,5.6928247e-06
26
+ 0.06446878267604217,0.033497490535024495,0.11571708,0.017133031,0.0033476737,0.00044819817,0.029288049949798722,0.09865497,0.017007345,0.003318086,0.0004426727,190.5726351798022,384016,24000,0.0042094407337172025,0.017061219,0.00012562412,2.9606575e-05,5.524605e-06
27
+ 0.06572510668094186,0.033606036777375274,0.1114288,0.01708275,0.0033722003,0.00045098146,0.030121052097296368,0.09795004,0.01695719,0.0033424366,0.00044541157,191.0554391573781,400016,25000,0.003484984657028679,0.013479048,0.0001253517,2.978108e-05,5.5673586e-06
28
+ 0.06389940770783689,0.033072616680990874,0.11113418,0.0173054,0.0033691847,0.000437037,0.030025266982149308,0.09912062,0.017178273,0.0033394808,0.00043164505,191.53368998022734,416016,26000,0.003047349801403475,0.012013028,0.00012700053,2.9700044e-05,5.3882854e-06
29
+ 0.06202980238335346,0.03186704055382874,0.108990036,0.017358135,0.0033885366,0.0004237423,0.029358124582795436,0.09887371,0.017230764,0.0033586454,0.00041852126,192.02005145146225,432016,27000,0.0025089161274409006,0.010116346,0.00012742964,2.9885457e-05,5.2215532e-06
30
+ 0.06507318903432624,0.032704058849951215,0.108584546,0.017107127,0.0034131126,0.00043490744,0.0294432620073203,0.09584253,0.016981384,0.0033830807,0.000429563,192.50872719285462,448016,28000,0.0032607969519249415,0.012741454,0.00012558771,3.006147e-05,5.342524e-06
31
+ 0.061742087373785295,0.03350174230337143,0.11429626,0.017215947,0.0033885192,0.00042082704,0.030044486049562672,0.100424126,0.017089764,0.0033586456,0.00041564347,193.0169310468928,464016,29000,0.0034572562404355297,0.013872838,0.00012633206,2.9865563e-05,5.183321e-06
32
+ 0.0624551814011085,0.034128661675378626,0.1173962,0.017290827,0.0033605401,0.00042712872,0.029716186567675287,0.09962314,0.01716392,0.0033309173,0.00042187105,193.51515518296767,480016,30000,0.0044124749983238815,0.01777282,0.00012695667,2.9622672e-05,5.256742e-06
33
+ 0.062481250851292316,0.03467470299592233,0.116738975,0.017357923,0.0032680791,0.0004129323,0.030620100070722408,0.10083595,0.01723062,0.003239176,0.00040784662,194.01625004377158,496016,31000,0.004054602820269786,0.015903743,0.00012738437,2.8881595e-05,5.0861936e-06
34
+ 0.059544816249945745,0.03191653931303892,0.107237056,0.01688988,0.003309901,0.00039750466,0.029257788867224,0.09673227,0.01676584,0.0032806557,0.0003926191,194.50789803887457,512016,32000,0.0026587504843319045,0.010504916,0.00012396519,2.921592e-05,4.88355e-06
35
+ 0.06191545396159866,0.032959418754558954,0.11320956,0.017212626,0.0032893242,0.00040001184,0.029583945242222402,0.099553026,0.017086314,0.0032603175,0.00039507487,195.00805649699484,528016,33000,0.003375473534042611,0.013656557,0.00012623,2.9024919e-05,4.931894e-06
36
+ 0.06062383562139264,0.03507452268223289,0.1186602,0.017035112,0.003361485,0.00039891747,0.03042809375678185,0.10035401,0.016909963,0.0033318624,0.0003940254,195.51581487298773,544016,34000,0.00464642891728909,0.01830657,0.0001249956,2.9623676e-05,4.8945435e-06
37
+ 0.0635884625233498,0.03421822762326342,0.11376807,0.016997557,0.0033168655,0.0003910728,0.03027863175328823,0.098510556,0.016872844,0.0032876404,0.0003862558,196.01952616591777,560016,35000,0.0039395957740707655,0.015257463,0.00012484925,2.9230518e-05,4.8173247e-06
38
+ 0.06107008070458716,0.03400131588359365,0.11395261,0.017034004,0.0033417647,0.000391365,0.030032761705573632,0.09844176,0.01690923,0.0033122944,0.00038655792,196.53440023057288,576016,36000,0.0039685542472416195,0.015511259,0.00012491264,2.9460234e-05,4.8053867e-06
39
+ 0.05990060420544789,0.031796633830294026,0.110115506,0.017024536,0.0033530544,0.0003873284,0.028481805210001782,0.09654104,0.016899774,0.0033235375,0.00038257174,197.055504963234,592016,37000,0.00331482850082466,0.013573966,0.00012494644,2.9503595e-05,4.7565004e-06
40
+ 0.05964728175132119,0.03421506795426823,0.11576267,0.01695003,0.003358747,0.00038322265,0.030042259609093937,0.09927248,0.016825961,0.0033292135,0.00037852148,197.55391341669232,608016,38000,0.004172808433513642,0.016490666,0.00012431541,2.9531342e-05,4.70193e-06
41
+ 0.06199229772136795,0.03464131498523055,0.1174464,0.016948694,0.0032748824,0.0003883894,0.02980534010659902,0.09836048,0.016824186,0.0032459898,0.00038362487,198.06088791144228,624016,39000,0.004835974949110094,0.019086318,0.00012441786,2.888706e-05,4.7685703e-06
42
+ 0.056173037045499453,0.03355109516414816,0.11292371,0.016729953,0.0033132827,0.00037121255,0.029589416386792435,0.0973765,0.01660693,0.003284098,0.0003666663,198.56081043473,640016,40000,0.00396167884672832,0.015547644,0.00012284327,2.9201183e-05,4.5452493e-06
43
+ 0.059586109913723165,0.03439353797165681,0.11501123,0.016799184,0.0032522487,0.00037694137,0.03058620501356197,0.10024245,0.01667592,0.0032235205,0.00037231977,199.07202000917638,656016,41000,0.003807332962431243,0.0147682,0.00012321919,2.872436e-05,4.6212567e-06
44
+ 0.05894077335415071,0.032751620854716786,0.11300882,0.016963845,0.003307908,0.00036955116,0.028623223698232256,0.09623524,0.016839366,0.0032787365,0.00036502533,199.58008478395695,672016,42000,0.0041283972965175135,0.016773384,0.00012447062,2.9154508e-05,4.5238708e-06
45
+ 0.05868386952980761,0.03294618712179362,0.11097262,0.016964072,0.0033232172,0.00036870345,0.02946679911063989,0.09728215,0.016839681,0.0032939932,0.00036419198,200.0846214186139,688016,43000,0.0034793879719672975,0.013690477,0.00012450444,2.9235018e-05,4.511798e-06
46
+ 0.05712984254316217,0.03381405721371992,0.11685681,0.016791698,0.0032206727,0.00036353475,0.02944247466232629,0.09920453,0.016668713,0.003192205,0.00035909005,200.59420255540854,704016,44000,0.004371582545412817,0.017651275,0.00012318294,2.8447348e-05,4.445859e-06
47
+ 0.05872447042537553,0.03396594162192185,0.114005156,0.01711849,0.0033121896,0.00036989406,0.030093214575201265,0.09881455,0.016992783,0.0032830366,0.00036537353,201.11641888427923,720016,45000,0.003872727055175347,0.015191066,0.00012560641,2.9149056e-05,4.5206743e-06
48
+ 0.06097992962216492,0.03294634878612119,0.110426016,0.016868757,0.0032893084,0.00036801185,0.029851069680182304,0.09827576,0.016744858,0.0032603466,0.00036351025,201.64697269969358,736016,46000,0.00309527928518946,0.0121497195,0.00012382239,2.8945595e-05,4.5013194e-06
49
+ 0.05663350393527339,0.03281864472618324,0.11114136,0.017104618,0.003268149,0.00035735714,0.029430219083558716,0.09762698,0.01697898,0.0032393266,0.0003529712,202.18138340129346,752016,47000,0.0033884257052377476,0.013513711,0.00012554179,2.880804e-05,4.385141e-06
50
+ 0.06063569568036176,0.03437269755802121,0.113925785,0.016789563,0.0033288866,0.00035659614,0.030504634066950503,0.09906795,0.01666624,0.0032996624,0.00035222422,202.7109620764582,768016,48000,0.0038680633639451042,0.01485805,0.00012322138,2.9250343e-05,4.3697933e-06
51
+ 0.05590325931445254,0.032708261736202934,0.108219825,0.016645735,0.003290488,0.0003511349,0.029215563801117245,0.09470438,0.016523577,0.0032615233,0.00034684205,203.2325454028811,784016,49000,0.0034926978458897744,0.013515289,0.00012212881,2.8963383e-05,4.2930833e-06
52
+ 0.05887933848793965,0.03376324380328875,0.116158925,0.016920695,0.0032746454,0.00034992793,0.02897768413065938,0.096828245,0.016796345,0.0032458303,0.0003456357,203.76202215823727,800016,50000,0.004785559726273274,0.019329714,0.00012416193,2.8846493e-05,4.291475e-06
53
+ 0.05469590156811721,0.032565321495523644,0.11032303,0.016709045,0.0032559878,0.00034908004,0.02907934553176169,0.096488744,0.016586395,0.0032273156,0.00034481476,204.2916254382747,816016,51000,0.0034859760021263273,0.0138334455,0.00012255994,2.866468e-05,4.2657607e-06
54
+ 0.05821708565069131,0.03239636913407592,0.109414965,0.016752806,0.0031915545,0.00034925115,0.02922611857857558,0.09686192,0.016630068,0.003163346,0.00034498065,204.81139891476724,832016,52000,0.003170250439259681,0.0125530595,0.00012287298,2.8185024e-05,4.2722245e-06
55
+ 0.056472664837151174,0.032827345147263286,0.11111243,0.016775163,0.0032373543,0.0003468643,0.029102278060745435,0.09635251,0.016651995,0.0032088135,0.00034263523,205.34224746566233,848016,53000,0.0037250671177025646,0.014759482,0.00012308097,2.8527791e-05,4.2316706e-06
56
+ 0.058580288619056245,0.03378580757998857,0.116668485,0.01680422,0.0032340037,0.00034146922,0.029724239581264543,0.10026108,0.0166807,0.0032055054,0.0003372957,205.87049279340533,864016,54000,0.0040615680630035084,0.01640741,0.00012337447,2.8509008e-05,4.1713724e-06
57
+ 0.05577092016550799,0.03361079018889,0.115389265,0.01653975,0.0032588867,0.00034043673,0.029271172700449793,0.098015465,0.016418306,0.0032301627,0.00033628094,206.39883776488094,880016,55000,0.0043396173334149255,0.01737308,0.000121398225,2.8703816e-05,4.1555404e-06
58
+ 0.05777157335551956,0.032890599876409285,0.11236597,0.016426073,0.003189053,0.0003412673,0.029044150866800924,0.09706599,0.016305484,0.0031608941,0.00033709285,206.93104066460336,896016,56000,0.0038464491756367383,0.015299772,0.000120635515,2.8174678e-05,4.1754015e-06
59
+ 0.0549993421713471,0.032922283426858504,0.11200538,0.01651029,0.003214448,0.00033035304,0.029002052478957843,0.096423775,0.01638919,0.0031861567,0.0003263155,207.46522256001313,912016,57000,0.003920230926469228,0.01558186,0.00012120526,2.8303351e-05,4.0363334e-06
60
+ 0.05667900257998245,0.033775523173855654,0.11304036,0.016811568,0.0032695837,0.00033267093,0.029541628846433042,0.0965043,0.016688148,0.0032408198,0.00032860908,208.0033349397023,928016,58000,0.0042338941080270216,0.016535679,0.00012338899,2.8753026e-05,4.060786e-06
61
+ 0.056156006808770274,0.03412930240388957,0.11518897,0.016638665,0.0032071744,0.00032965813,0.029538585802540176,0.09722457,0.016516583,0.0031789169,0.0003256278,208.54892494879786,944016,59000,0.0045907166081415205,0.017964583,0.00012210695,2.8254328e-05,4.029121e-06
62
+ 0.05911564312284267,0.03229978877119724,0.10923988,0.016702617,0.0032797777,0.000333632,0.028932071614079128,0.095846295,0.0165801,0.0032509386,0.000329559,209.09054022985416,960016,60000,0.003367717187837117,0.013393664,0.00012255066,2.8840614e-05,4.07416e-06
63
+ 0.05608525544731012,0.03283120975131181,0.10976717,0.016605306,0.0032396517,0.0003319304,0.029373283780645538,0.096258745,0.016483575,0.0032111153,0.00032788492,209.62571191879317,976016,61000,0.003457925954358867,0.013508584,0.00012169345,2.8519622e-05,4.046387e-06
64
+ 0.05501877534166442,0.03297481621825135,0.11257801,0.016683873,0.0032061664,0.00032656046,0.02909935219865291,0.09710706,0.016561648,0.0031779374,0.0003225721,210.16177222075467,992016,62000,0.0038754640472434404,0.015470902,0.00012244807,2.823787e-05,3.9868305e-06
65
+ 0.05219062805249584,0.03271656697243452,0.11215093,0.01660635,0.0031688388,0.00032076152,0.029074916717596305,0.0975485,0.016484628,0.00314089,0.00031685104,210.69716152923755,1008016,63000,0.003641650405934349,0.014602079,0.00012182051,2.796042e-05,3.910809e-06
66
+ 0.0563183546792654,0.032633363903267196,0.110403255,0.016650705,0.0032242872,0.00033333438,0.028713572517503037,0.094859675,0.016528629,0.0031959028,0.00032927687,211.23255039549332,1024016,64000,0.003919791538915892,0.01554351,0.00012214162,2.8378483e-05,4.059327e-06
67
+ 0.05567153185097883,0.03271436781599188,0.11082813,0.016680101,0.003167083,0.0003245076,0.028839432608569044,0.0954411,0.016557798,0.003139104,0.0003205526,211.7938454092672,1040016,65000,0.0038749351028000024,0.015386748,0.00012239139,2.7955537e-05,3.9548736e-06
68
+ 0.054521421907489855,0.03198573151091111,0.10981132,0.016658057,0.0032372614,0.00032345607,0.028164957368280685,0.09436482,0.016535752,0.0032087525,0.0003195153,212.34134123745378,1056016,66000,0.0038207741568548935,0.015447455,0.00012225585,2.8481953e-05,3.9391934e-06
69
+ 0.05447587863110852,0.03257946248212834,0.110619865,0.016562264,0.00321832,0.00032014225,0.028763761436566723,0.095464736,0.016440779,0.0031900178,0.00031624868,212.88179851937997,1072016,67000,0.0038157009625974718,0.015155151,0.000121496254,2.830203e-05,3.892867e-06
70
+ 0.05625929957161441,0.03345432130480183,0.11385384,0.016502324,0.0031968574,0.00032535195,0.02944285704940558,0.09799432,0.016381111,0.0031687305,0.00032139668,213.43198783288094,1088016,68000,0.004011464272607544,0.015859297,0.000121060184,2.8142187e-05,3.955854e-06
71
+ 0.055004896501871965,0.03179665893525817,0.106536396,0.016759587,0.003234906,0.0003170966,0.02866484727500941,0.09416932,0.016636532,0.0032064856,0.00031323388,213.97716156854878,1104016,69000,0.003131811674247735,0.012366518,0.0001230559,2.8449249e-05,3.8646804e-06
72
+ 0.0536967586134085,0.031609297288116074,0.10543689,0.016608428,0.0031813001,0.00031804832,0.02858661183598451,0.09358934,0.01648658,0.0031532515,0.0003141802,214.52275669607016,1120016,70000,0.003022685538349841,0.011847356,0.00012193782,2.802256e-05,3.869898e-06
73
+ 0.055160000674791175,0.03359202911099426,0.11249393,0.016765459,0.003218583,0.0003199129,0.029701160784345104,0.097294256,0.016642336,0.0031902415,0.0003160156,215.0794749861993,1136016,71000,0.0038908681614521056,0.015199085,0.00012300705,2.8343668e-05,3.8999674e-06
74
+ 0.052124493352076494,0.032299238147214054,0.10922959,0.016720576,0.0031599372,0.00031348807,0.028491226778831348,0.09415393,0.016597822,0.0031320874,0.00030967535,215.6190056423105,1152016,72000,0.0038080114894764867,0.015075754,0.00012270373,2.7840493e-05,3.8117723e-06
75
+ 0.05602791396815743,0.03207306618290028,0.10878707,0.01654309,0.0031445029,0.00031522085,0.028986355684697665,0.09652405,0.016421627,0.0031167322,0.0003113774,216.16338349037008,1168016,73000,0.0030867105857832968,0.012263436,0.000121361336,2.7754784e-05,3.842977e-06
76
+ 0.05514118943080267,0.03291953222267334,0.11000037,0.016335782,0.0032078905,0.00031993998,0.02901805261312983,0.094825625,0.016215825,0.003179649,0.0003160567,216.7088737915842,1184016,74000,0.003901479640284375,0.015174718,0.00011994187,2.8248303e-05,3.8848984e-06
77
+ 0.053917622368786805,0.03229256081348279,0.112196766,0.016277803,0.0031891218,0.00031636583,0.028643552313558786,0.097388506,0.016158126,0.0031610357,0.00031251617,217.2531572944162,1200016,75000,0.003649008465410592,0.014807831,0.00011950541,2.8058577e-05,3.8494427e-06
78
+ 0.052981417029987224,0.0341953547678421,0.116435856,0.016571032,0.0031762663,0.00030623708,0.029571750625269504,0.09816321,0.016449459,0.00314827,0.00030250393,217.80283299053247,1216016,76000,0.004623604139531382,0.018273614,0.00012165095,2.7984212e-05,3.7342302e-06
79
+ 0.05289038967522982,0.03162145696440708,0.10671775,0.01638042,0.0031340923,0.0003145785,0.028533928525866923,0.09455053,0.016260015,0.0031064413,0.00031076107,218.34727276351896,1232016,77000,0.0030875285836682413,0.012167565,0.00012020506,2.765851e-05,3.81587e-06
80
+ 0.05182882786087654,0.03334044235898181,0.11710279,0.01634992,0.0032149598,0.00030519342,0.028676871411036683,0.097971424,0.016230054,0.0031866871,0.00030148242,218.8977723329652,1248016,78000,0.004663570980301311,0.01913189,0.00011996337,2.8270782e-05,3.7112736e-06
81
+ 0.05568380582659867,0.03217754939687437,0.1095662,0.016602147,0.003222337,0.00031537103,0.028514700887724783,0.0949204,0.01648014,0.0031939843,0.00031153962,219.43789728445705,1264016,79000,0.003662848463267439,0.014646563,0.00012193552,2.8328419e-05,3.8329854e-06
82
+ 0.052589483680058065,0.031027754681417816,0.10749624,0.016473018,0.0032142357,0.00030646118,0.027600207204464804,0.093507364,0.016352147,0.0031859952,0.00030273027,219.98566685717032,1280016,80000,0.003427547564009729,0.013987808,0.000120873076,2.8261276e-05,3.7290972e-06
83
+ 0.05408931870586312,0.03287746825115753,0.11066489,0.016582951,0.0032121951,0.000311349,0.029243982360698296,0.0963409,0.01646148,0.0031839686,0.00030756238,220.53661458609324,1296016,81000,0.0036334858180962267,0.014324212,0.00012168298,2.8221206e-05,3.7859606e-06
84
+ 0.05193936758525872,0.034012925043702125,0.11597945,0.016673468,0.0031951754,0.00030703977,0.029514113441342527,0.098124385,0.016551005,0.0031670453,0.00030331008,221.09667476906426,1312016,82000,0.0044988117457196485,0.017854406,0.00012236196,2.815449e-05,3.7301634e-06
85
+ 0.05394444767229505,0.032036127452272856,0.1068324,0.016482735,0.0031777814,0.00030481693,0.028769741350319226,0.0940962,0.016361859,0.0031498182,0.00030111158,221.6284145809641,1328016,83000,0.003266386073872127,0.012735808,0.000120988894,2.7968386e-05,3.7091543e-06
86
+ 0.05476221005534034,0.0326294223433361,0.11096678,0.01644256,0.0032055858,0.0003057367,0.028880953270941985,0.09606332,0.016321775,0.0031773986,0.0003020142,222.18229749069903,1344016,84000,0.0037484689268530926,0.014904034,0.00012073276,2.8205677e-05,3.7231591e-06
87
+ 0.053805872175713636,0.03300966645451257,0.11195825,0.016388921,0.0031943046,0.00030365036,0.028699940414168,0.094897486,0.016268652,0.003166191,0.00029995653,222.72849472724013,1360016,85000,0.004309725956492912,0.017060978,0.000120299104,2.8126971e-05,3.694623e-06
88
+ 0.05389630719102992,0.03263209202885624,0.111721896,0.016232198,0.003155762,0.00030469702,0.02846119845774958,0.095052056,0.016112978,0.0031279782,0.00030099525,223.27321970421107,1376016,86000,0.0041708936295944965,0.016670404,0.000119065,2.778399e-05,3.7022885e-06
89
+ 0.052768324952189964,0.03336872462159945,0.11223782,0.016193166,0.0031470296,0.00029771673,0.02939277546736413,0.096720085,0.01607432,0.0031192529,0.00029409528,223.82831639236488,1392016,87000,0.003975949179493906,0.015517785,0.00011882389,2.7750488e-05,3.623136e-06
90
+ 0.051911611603562696,0.032762888428755056,0.112017736,0.016323732,0.0032191554,0.00029317968,0.02849486762052399,0.09496883,0.016203977,0.0031908704,0.00028960145,224.36776144545254,1408016,88000,0.004268020885701837,0.017048156,0.000119667515,2.8295772e-05,3.5797157e-06
91
+ 0.05270384717706044,0.03329609772935519,0.11268163,0.016314829,0.0031742973,0.0002963548,0.029269737612456045,0.09687495,0.016195076,0.0031463364,0.00029274338,224.9106097117001,1424016,89000,0.0040263602071318,0.015806448,0.00011976254,2.794944e-05,3.6102422e-06
92
+ 0.05311616907660258,0.03209496235847477,0.10914376,0.016326811,0.0031423385,0.0003005712,0.028060743806883687,0.09305488,0.016206853,0.003114658,0.00029692045,225.45843791482633,1440016,90000,0.004034218460048576,0.016089164,0.000119740245,2.7677215e-05,3.6494046e-06
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb0488329e5e7a4f16c7265d77818bff83125f16e186d03b91211028af455c85
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d2040c72d075350bc8a4a03728fcc9e55922d1b4ee3bc61d136e5b57882e13a
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d702e8e25f876edd23ae0a331c45037916d8d9c126c20da8e24d6ddbd8ecaef1
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da10e3c5d24ec7d4e96a0cccc4288a99b32a91d0419173113379c34cebb75731
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:608f40578e49974a7c24abd8f4614150490c7bc075d135e41c5a6302ddf39343
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7946119a72301e1a1942646ab6cedc426a664219ffade5ce6b4cce7005cb3e6
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c181760e23bc89a3d148f24ed5ff97ef5c6beb93d90613a792c6a37bd8d971ad
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:649eabfaedbd9b674647dd4cd198867d548aec8505abe9704566bf265a29ec51
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3e8b60c1887915efbe2269a1e0a83f497ff9202ae9333804116d4823d55c8fd
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:304aa7488bd234365fbed535049492bf714cc7b29d078a62c61d75f256465097
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d88506c55c4433fbaf3048b562d1968f420a8bb9469fbd1914e528b13ef31dd
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c6d78f2677a88c633a3cdd7de0112af82132153180957f2c6918aec649ae49d
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48191b3527894041c309ba6d1cb07ffa40c9e0569f783c90330f337572c8e73b
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:865c44b1954ea89629977a6ffb27ae9521c258127b524e8c392ac3dd37245754
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0431935e48e0758773987b33e2412063afe5e6cdb12221988d9f4d6c6d2e8d7d
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c782b97d5ea8910de24497f5b30f6487f01eb8d12a384fc723f8639189c90135
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:325e539489c907a4fba19b8dc77839b48ee1f933bc6870fd24686188ae4c67eb
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a21fdf727a30b3f77a37bcbd836d8324391082da5f89396a92f99a1ae6a8b2bf
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f7a57d3d8156e6e01e397ca2d7883435b6a5bda71a612658945b55c2c1b15fb
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e62fa8f3e4680b217857c8fe6a589babf8e8efa26ff69e0359d959503130e055
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de8cb0f654d7525729b210d3ca1b89878112dd243a3712f3473bb6345ab51809
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48e1a3badf5dfcaac116fbf5403c1e1fde1104e291ec70e2d762b94ab1af5edf
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:608192783cc9fc8aa3a4f6a8dbf55d2c0ba46ba50aefaf256dfd30c471c10b90
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c552e5b68c30b1e0cf62558869408bb00e9db6b15bdd87c1c6c271c581577a09
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90a7f2f517b6cfb13919e493cf2f2216b90587ca38626c9ebcecd5b08558c75e
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b9c1e33e3996310692e85fb970bd0c0f6f55c60289412dce8c64cfefa24aca2
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_indistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfaa6a6ec8da1851c85dd78abe110fb19fed87128d46819bf6cbe5f82db4a31d
3
+ size 4264
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_outdistro_terms.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e010e2655fbf8810873c761fde1eb1f62a773c57447b4668ab3bfbe7789ca92
3
+ size 4264