Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165/log.txt +25 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165/progress.csv +2 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/ema_0.995_090000.pt +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/log.txt +2053 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/model090000.pt +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/progress.csv +92 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_outdistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_indistro_terms.npz +3 -0
- cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_outdistro_terms.npz +3 -0
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165/log.txt
ADDED
|
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Logging to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165
|
| 2 |
+
creating model and diffusion...
|
| 3 |
+
creating data loader...
|
| 4 |
+
training...
|
| 5 |
+
-------------------------
|
| 6 |
+
| grad_norm | 2.54 |
|
| 7 |
+
| loss | 1.01 |
|
| 8 |
+
| loss_q0 | 1.01 |
|
| 9 |
+
| loss_q1 | 1.01 |
|
| 10 |
+
| loss_q2 | 1.01 |
|
| 11 |
+
| loss_q3 | 1.01 |
|
| 12 |
+
| mse | 0.999 |
|
| 13 |
+
| mse_q0 | 1 |
|
| 14 |
+
| mse_q1 | 1.01 |
|
| 15 |
+
| mse_q2 | 0.996 |
|
| 16 |
+
| mse_q3 | 1 |
|
| 17 |
+
| param_norm | 180 |
|
| 18 |
+
| samples | 16 |
|
| 19 |
+
| step | 0 |
|
| 20 |
+
| vb | 0.00969 |
|
| 21 |
+
| vb_q0 | 0.00814 |
|
| 22 |
+
| vb_q1 | 0.00726 |
|
| 23 |
+
| vb_q2 | 0.00917 |
|
| 24 |
+
| vb_q3 | 0.0122 |
|
| 25 |
+
-------------------------
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-13-37-566165/progress.csv
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
grad_norm,loss,loss_q0,loss_q1,loss_q2,loss_q3,mse,mse_q0,mse_q1,mse_q2,mse_q3,param_norm,samples,step,vb,vb_q0,vb_q1,vb_q2,vb_q3
|
| 2 |
+
2.5351430912370003,1.0083870887756348,1.0080348,1.0147415,1.0054059,1.0136827,0.998694896697998,0.99989533,1.0074818,0.9962311,1.0014414,180.41246248133166,16,0,0.009692199528217316,0.008139333,0.0072596963,0.009174611,0.012241336
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/ema_0.995_090000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31fd61b64d5548d00967160f3b4b7c1a29760cd6ea3de1c6a5a326de34201688
|
| 3 |
+
size 118795331
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/log.txt
ADDED
|
@@ -0,0 +1,2053 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Logging to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947
|
| 2 |
+
creating model and diffusion...
|
| 3 |
+
creating data loader...
|
| 4 |
+
training...
|
| 5 |
+
-------------------------
|
| 6 |
+
| grad_norm | 2.54 |
|
| 7 |
+
| loss | 1.01 |
|
| 8 |
+
| loss_q0 | 1.01 |
|
| 9 |
+
| loss_q1 | 1.01 |
|
| 10 |
+
| loss_q2 | 1.01 |
|
| 11 |
+
| loss_q3 | 1.01 |
|
| 12 |
+
| mse | 0.999 |
|
| 13 |
+
| mse_q0 | 1 |
|
| 14 |
+
| mse_q1 | 1.01 |
|
| 15 |
+
| mse_q2 | 0.996 |
|
| 16 |
+
| mse_q3 | 1 |
|
| 17 |
+
| param_norm | 180 |
|
| 18 |
+
| samples | 16 |
|
| 19 |
+
| step | 0 |
|
| 20 |
+
| vb | 0.00969 |
|
| 21 |
+
| vb_q0 | 0.00814 |
|
| 22 |
+
| vb_q1 | 0.00726 |
|
| 23 |
+
| vb_q2 | 0.00917 |
|
| 24 |
+
| vb_q3 | 0.0122 |
|
| 25 |
+
-------------------------
|
| 26 |
+
-------------------------
|
| 27 |
+
| grad_norm | 0.387 |
|
| 28 |
+
| loss | 0.119 |
|
| 29 |
+
| loss_q0 | 0.231 |
|
| 30 |
+
| loss_q1 | 0.0923 |
|
| 31 |
+
| loss_q2 | 0.0775 |
|
| 32 |
+
| loss_q3 | 0.0703 |
|
| 33 |
+
| mse | 0.112 |
|
| 34 |
+
| mse_q0 | 0.208 |
|
| 35 |
+
| mse_q1 | 0.0916 |
|
| 36 |
+
| mse_q2 | 0.0767 |
|
| 37 |
+
| mse_q3 | 0.0694 |
|
| 38 |
+
| param_norm | 181 |
|
| 39 |
+
| samples | 1.6e+04 |
|
| 40 |
+
| step | 1e+03 |
|
| 41 |
+
| vb | 0.00636 |
|
| 42 |
+
| vb_q0 | 0.0225 |
|
| 43 |
+
| vb_q1 | 0.000681 |
|
| 44 |
+
| vb_q2 | 0.00072 |
|
| 45 |
+
| vb_q3 | 0.000888 |
|
| 46 |
+
-------------------------
|
| 47 |
+
-------------------------
|
| 48 |
+
| grad_norm | 0.123 |
|
| 49 |
+
| loss | 0.0423 |
|
| 50 |
+
| loss_q0 | 0.138 |
|
| 51 |
+
| loss_q1 | 0.0212 |
|
| 52 |
+
| loss_q2 | 0.00602 |
|
| 53 |
+
| loss_q3 | 0.003 |
|
| 54 |
+
| mse | 0.0386 |
|
| 55 |
+
| mse_q0 | 0.124 |
|
| 56 |
+
| mse_q1 | 0.0211 |
|
| 57 |
+
| mse_q2 | 0.00597 |
|
| 58 |
+
| mse_q3 | 0.00296 |
|
| 59 |
+
| param_norm | 181 |
|
| 60 |
+
| samples | 3.2e+04 |
|
| 61 |
+
| step | 2e+03 |
|
| 62 |
+
| vb | 0.00371 |
|
| 63 |
+
| vb_q0 | 0.0145 |
|
| 64 |
+
| vb_q1 | 0.000156 |
|
| 65 |
+
| vb_q2 | 5.42e-05 |
|
| 66 |
+
| vb_q3 | 3.8e-05 |
|
| 67 |
+
-------------------------
|
| 68 |
+
-------------------------
|
| 69 |
+
| grad_norm | 0.109 |
|
| 70 |
+
| loss | 0.0398 |
|
| 71 |
+
| loss_q0 | 0.132 |
|
| 72 |
+
| loss_q1 | 0.02 |
|
| 73 |
+
| loss_q2 | 0.00499 |
|
| 74 |
+
| loss_q3 | 0.00191 |
|
| 75 |
+
| mse | 0.0359 |
|
| 76 |
+
| mse_q0 | 0.116 |
|
| 77 |
+
| mse_q1 | 0.0198 |
|
| 78 |
+
| mse_q2 | 0.00495 |
|
| 79 |
+
| mse_q3 | 0.00188 |
|
| 80 |
+
| param_norm | 181 |
|
| 81 |
+
| samples | 4.8e+04 |
|
| 82 |
+
| step | 3e+03 |
|
| 83 |
+
| vb | 0.00389 |
|
| 84 |
+
| vb_q0 | 0.0153 |
|
| 85 |
+
| vb_q1 | 0.000147 |
|
| 86 |
+
| vb_q2 | 4.46e-05 |
|
| 87 |
+
| vb_q3 | 2.41e-05 |
|
| 88 |
+
-------------------------
|
| 89 |
+
-------------------------
|
| 90 |
+
| grad_norm | 0.0996 |
|
| 91 |
+
| loss | 0.039 |
|
| 92 |
+
| loss_q0 | 0.13 |
|
| 93 |
+
| loss_q1 | 0.0193 |
|
| 94 |
+
| loss_q2 | 0.00441 |
|
| 95 |
+
| loss_q3 | 0.00145 |
|
| 96 |
+
| mse | 0.0342 |
|
| 97 |
+
| mse_q0 | 0.111 |
|
| 98 |
+
| mse_q1 | 0.0192 |
|
| 99 |
+
| mse_q2 | 0.00437 |
|
| 100 |
+
| mse_q3 | 0.00143 |
|
| 101 |
+
| param_norm | 182 |
|
| 102 |
+
| samples | 6.4e+04 |
|
| 103 |
+
| step | 4e+03 |
|
| 104 |
+
| vb | 0.00478 |
|
| 105 |
+
| vb_q0 | 0.0188 |
|
| 106 |
+
| vb_q1 | 0.000142 |
|
| 107 |
+
| vb_q2 | 3.95e-05 |
|
| 108 |
+
| vb_q3 | 1.83e-05 |
|
| 109 |
+
-------------------------
|
| 110 |
+
-------------------------
|
| 111 |
+
| grad_norm | 0.0932 |
|
| 112 |
+
| loss | 0.0376 |
|
| 113 |
+
| loss_q0 | 0.125 |
|
| 114 |
+
| loss_q1 | 0.0189 |
|
| 115 |
+
| loss_q2 | 0.00411 |
|
| 116 |
+
| loss_q3 | 0.00115 |
|
| 117 |
+
| mse | 0.0337 |
|
| 118 |
+
| mse_q0 | 0.109 |
|
| 119 |
+
| mse_q1 | 0.0188 |
|
| 120 |
+
| mse_q2 | 0.00408 |
|
| 121 |
+
| mse_q3 | 0.00114 |
|
| 122 |
+
| param_norm | 182 |
|
| 123 |
+
| samples | 8e+04 |
|
| 124 |
+
| step | 5e+03 |
|
| 125 |
+
| vb | 0.00392 |
|
| 126 |
+
| vb_q0 | 0.0153 |
|
| 127 |
+
| vb_q1 | 0.000139 |
|
| 128 |
+
| vb_q2 | 3.67e-05 |
|
| 129 |
+
| vb_q3 | 1.45e-05 |
|
| 130 |
+
-------------------------
|
| 131 |
+
-------------------------
|
| 132 |
+
| grad_norm | 0.0887 |
|
| 133 |
+
| loss | 0.0355 |
|
| 134 |
+
| loss_q0 | 0.121 |
|
| 135 |
+
| loss_q1 | 0.0185 |
|
| 136 |
+
| loss_q2 | 0.00402 |
|
| 137 |
+
| loss_q3 | 0.000991 |
|
| 138 |
+
| mse | 0.0322 |
|
| 139 |
+
| mse_q0 | 0.107 |
|
| 140 |
+
| mse_q1 | 0.0184 |
|
| 141 |
+
| mse_q2 | 0.00398 |
|
| 142 |
+
| mse_q3 | 0.000978 |
|
| 143 |
+
| param_norm | 182 |
|
| 144 |
+
| samples | 9.6e+04 |
|
| 145 |
+
| step | 6e+03 |
|
| 146 |
+
| vb | 0.00333 |
|
| 147 |
+
| vb_q0 | 0.0134 |
|
| 148 |
+
| vb_q1 | 0.000136 |
|
| 149 |
+
| vb_q2 | 3.57e-05 |
|
| 150 |
+
| vb_q3 | 1.24e-05 |
|
| 151 |
+
-------------------------
|
| 152 |
+
-------------------------
|
| 153 |
+
| grad_norm | 0.0888 |
|
| 154 |
+
| loss | 0.0371 |
|
| 155 |
+
| loss_q0 | 0.126 |
|
| 156 |
+
| loss_q1 | 0.0184 |
|
| 157 |
+
| loss_q2 | 0.00386 |
|
| 158 |
+
| loss_q3 | 0.000895 |
|
| 159 |
+
| mse | 0.0326 |
|
| 160 |
+
| mse_q0 | 0.108 |
|
| 161 |
+
| mse_q1 | 0.0183 |
|
| 162 |
+
| mse_q2 | 0.00383 |
|
| 163 |
+
| mse_q3 | 0.000884 |
|
| 164 |
+
| param_norm | 183 |
|
| 165 |
+
| samples | 1.12e+05 |
|
| 166 |
+
| step | 7e+03 |
|
| 167 |
+
| vb | 0.00445 |
|
| 168 |
+
| vb_q0 | 0.0177 |
|
| 169 |
+
| vb_q1 | 0.000135 |
|
| 170 |
+
| vb_q2 | 3.43e-05 |
|
| 171 |
+
| vb_q3 | 1.12e-05 |
|
| 172 |
+
-------------------------
|
| 173 |
+
-------------------------
|
| 174 |
+
| grad_norm | 0.0858 |
|
| 175 |
+
| loss | 0.0357 |
|
| 176 |
+
| loss_q0 | 0.12 |
|
| 177 |
+
| loss_q1 | 0.0183 |
|
| 178 |
+
| loss_q2 | 0.0038 |
|
| 179 |
+
| loss_q3 | 0.000822 |
|
| 180 |
+
| mse | 0.0324 |
|
| 181 |
+
| mse_q0 | 0.107 |
|
| 182 |
+
| mse_q1 | 0.0181 |
|
| 183 |
+
| mse_q2 | 0.00377 |
|
| 184 |
+
| mse_q3 | 0.000812 |
|
| 185 |
+
| param_norm | 183 |
|
| 186 |
+
| samples | 1.28e+05 |
|
| 187 |
+
| step | 8e+03 |
|
| 188 |
+
| vb | 0.00332 |
|
| 189 |
+
| vb_q0 | 0.013 |
|
| 190 |
+
| vb_q1 | 0.000134 |
|
| 191 |
+
| vb_q2 | 3.38e-05 |
|
| 192 |
+
| vb_q3 | 1.03e-05 |
|
| 193 |
+
-------------------------
|
| 194 |
+
-------------------------
|
| 195 |
+
| grad_norm | 0.0835 |
|
| 196 |
+
| loss | 0.0363 |
|
| 197 |
+
| loss_q0 | 0.123 |
|
| 198 |
+
| loss_q1 | 0.0183 |
|
| 199 |
+
| loss_q2 | 0.00378 |
|
| 200 |
+
| loss_q3 | 0.000763 |
|
| 201 |
+
| mse | 0.0322 |
|
| 202 |
+
| mse_q0 | 0.107 |
|
| 203 |
+
| mse_q1 | 0.0181 |
|
| 204 |
+
| mse_q2 | 0.00375 |
|
| 205 |
+
| mse_q3 | 0.000754 |
|
| 206 |
+
| param_norm | 184 |
|
| 207 |
+
| samples | 1.44e+05 |
|
| 208 |
+
| step | 9e+03 |
|
| 209 |
+
| vb | 0.00412 |
|
| 210 |
+
| vb_q0 | 0.0164 |
|
| 211 |
+
| vb_q1 | 0.000134 |
|
| 212 |
+
| vb_q2 | 3.34e-05 |
|
| 213 |
+
| vb_q3 | 9.54e-06 |
|
| 214 |
+
-------------------------
|
| 215 |
+
-------------------------
|
| 216 |
+
| grad_norm | 0.0782 |
|
| 217 |
+
| loss | 0.0356 |
|
| 218 |
+
| loss_q0 | 0.121 |
|
| 219 |
+
| loss_q1 | 0.018 |
|
| 220 |
+
| loss_q2 | 0.00372 |
|
| 221 |
+
| loss_q3 | 0.000705 |
|
| 222 |
+
| mse | 0.0315 |
|
| 223 |
+
| mse_q0 | 0.105 |
|
| 224 |
+
| mse_q1 | 0.0179 |
|
| 225 |
+
| mse_q2 | 0.00369 |
|
| 226 |
+
| mse_q3 | 0.000696 |
|
| 227 |
+
| param_norm | 184 |
|
| 228 |
+
| samples | 1.6e+05 |
|
| 229 |
+
| step | 1e+04 |
|
| 230 |
+
| vb | 0.00407 |
|
| 231 |
+
| vb_q0 | 0.0163 |
|
| 232 |
+
| vb_q1 | 0.000132 |
|
| 233 |
+
| vb_q2 | 3.29e-05 |
|
| 234 |
+
| vb_q3 | 8.77e-06 |
|
| 235 |
+
-------------------------
|
| 236 |
+
saving model 0...
|
| 237 |
+
saving model 0.995...
|
| 238 |
+
evaluation indistro starting...
|
| 239 |
+
done 96 samples: bpd=3.809229850769043
|
| 240 |
+
done 192 samples: bpd=3.8889626264572144
|
| 241 |
+
done 288 samples: bpd=3.8427980740865073
|
| 242 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_indistro_terms.npz
|
| 243 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_indistro_terms.npz
|
| 244 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_indistro_terms.npz
|
| 245 |
+
evaluation nll complete
|
| 246 |
+
evaluation outdistro starting...
|
| 247 |
+
done 192 samples: bpd=4.073406219482422
|
| 248 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_outdistro_terms.npz
|
| 249 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_outdistro_terms.npz
|
| 250 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_outdistro_terms.npz
|
| 251 |
+
evaluation nll complete
|
| 252 |
+
sampling starting...
|
| 253 |
+
-------------------------
|
| 254 |
+
| grad_norm | 0.0793 |
|
| 255 |
+
| loss | 0.0355 |
|
| 256 |
+
| loss_q0 | 0.119 |
|
| 257 |
+
| loss_q1 | 0.0179 |
|
| 258 |
+
| loss_q2 | 0.00367 |
|
| 259 |
+
| loss_q3 | 0.000674 |
|
| 260 |
+
| mse | 0.0318 |
|
| 261 |
+
| mse_q0 | 0.104 |
|
| 262 |
+
| mse_q1 | 0.0178 |
|
| 263 |
+
| mse_q2 | 0.00364 |
|
| 264 |
+
| mse_q3 | 0.000666 |
|
| 265 |
+
| param_norm | 185 |
|
| 266 |
+
| samples | 1.76e+05 |
|
| 267 |
+
| step | 1.1e+04 |
|
| 268 |
+
| vb | 0.00371 |
|
| 269 |
+
| vb_q0 | 0.0145 |
|
| 270 |
+
| vb_q1 | 0.000131 |
|
| 271 |
+
| vb_q2 | 3.25e-05 |
|
| 272 |
+
| vb_q3 | 8.42e-06 |
|
| 273 |
+
-------------------------
|
| 274 |
+
-------------------------
|
| 275 |
+
| grad_norm | 0.0761 |
|
| 276 |
+
| loss | 0.0362 |
|
| 277 |
+
| loss_q0 | 0.119 |
|
| 278 |
+
| loss_q1 | 0.0177 |
|
| 279 |
+
| loss_q2 | 0.00357 |
|
| 280 |
+
| loss_q3 | 0.000631 |
|
| 281 |
+
| mse | 0.0321 |
|
| 282 |
+
| mse_q0 | 0.103 |
|
| 283 |
+
| mse_q1 | 0.0175 |
|
| 284 |
+
| mse_q2 | 0.00354 |
|
| 285 |
+
| mse_q3 | 0.000623 |
|
| 286 |
+
| param_norm | 185 |
|
| 287 |
+
| samples | 1.92e+05 |
|
| 288 |
+
| step | 1.2e+04 |
|
| 289 |
+
| vb | 0.00416 |
|
| 290 |
+
| vb_q0 | 0.016 |
|
| 291 |
+
| vb_q1 | 0.00013 |
|
| 292 |
+
| vb_q2 | 3.16e-05 |
|
| 293 |
+
| vb_q3 | 7.87e-06 |
|
| 294 |
+
-------------------------
|
| 295 |
+
-------------------------
|
| 296 |
+
| grad_norm | 0.0758 |
|
| 297 |
+
| loss | 0.0354 |
|
| 298 |
+
| loss_q0 | 0.12 |
|
| 299 |
+
| loss_q1 | 0.018 |
|
| 300 |
+
| loss_q2 | 0.0036 |
|
| 301 |
+
| loss_q3 | 0.00061 |
|
| 302 |
+
| mse | 0.0314 |
|
| 303 |
+
| mse_q0 | 0.104 |
|
| 304 |
+
| mse_q1 | 0.0178 |
|
| 305 |
+
| mse_q2 | 0.00356 |
|
| 306 |
+
| mse_q3 | 0.000603 |
|
| 307 |
+
| param_norm | 185 |
|
| 308 |
+
| samples | 2.08e+05 |
|
| 309 |
+
| step | 1.3e+04 |
|
| 310 |
+
| vb | 0.004 |
|
| 311 |
+
| vb_q0 | 0.0159 |
|
| 312 |
+
| vb_q1 | 0.000132 |
|
| 313 |
+
| vb_q2 | 3.18e-05 |
|
| 314 |
+
| vb_q3 | 7.59e-06 |
|
| 315 |
+
-------------------------
|
| 316 |
+
-------------------------
|
| 317 |
+
| grad_norm | 0.0745 |
|
| 318 |
+
| loss | 0.0341 |
|
| 319 |
+
| loss_q0 | 0.114 |
|
| 320 |
+
| loss_q1 | 0.0178 |
|
| 321 |
+
| loss_q2 | 0.00351 |
|
| 322 |
+
| loss_q3 | 0.000586 |
|
| 323 |
+
| mse | 0.031 |
|
| 324 |
+
| mse_q0 | 0.102 |
|
| 325 |
+
| mse_q1 | 0.0177 |
|
| 326 |
+
| mse_q2 | 0.00348 |
|
| 327 |
+
| mse_q3 | 0.000579 |
|
| 328 |
+
| param_norm | 186 |
|
| 329 |
+
| samples | 2.24e+05 |
|
| 330 |
+
| step | 1.4e+04 |
|
| 331 |
+
| vb | 0.00309 |
|
| 332 |
+
| vb_q0 | 0.0122 |
|
| 333 |
+
| vb_q1 | 0.000131 |
|
| 334 |
+
| vb_q2 | 3.11e-05 |
|
| 335 |
+
| vb_q3 | 7.29e-06 |
|
| 336 |
+
-------------------------
|
| 337 |
+
-------------------------
|
| 338 |
+
| grad_norm | 0.0728 |
|
| 339 |
+
| loss | 0.034 |
|
| 340 |
+
| loss_q0 | 0.116 |
|
| 341 |
+
| loss_q1 | 0.0177 |
|
| 342 |
+
| loss_q2 | 0.00353 |
|
| 343 |
+
| loss_q3 | 0.000564 |
|
| 344 |
+
| mse | 0.0308 |
|
| 345 |
+
| mse_q0 | 0.103 |
|
| 346 |
+
| mse_q1 | 0.0176 |
|
| 347 |
+
| mse_q2 | 0.0035 |
|
| 348 |
+
| mse_q3 | 0.000557 |
|
| 349 |
+
| param_norm | 186 |
|
| 350 |
+
| samples | 2.4e+05 |
|
| 351 |
+
| step | 1.5e+04 |
|
| 352 |
+
| vb | 0.00324 |
|
| 353 |
+
| vb_q0 | 0.013 |
|
| 354 |
+
| vb_q1 | 0.00013 |
|
| 355 |
+
| vb_q2 | 3.12e-05 |
|
| 356 |
+
| vb_q3 | 6.99e-06 |
|
| 357 |
+
-------------------------
|
| 358 |
+
-------------------------
|
| 359 |
+
| grad_norm | 0.0736 |
|
| 360 |
+
| loss | 0.036 |
|
| 361 |
+
| loss_q0 | 0.121 |
|
| 362 |
+
| loss_q1 | 0.0177 |
|
| 363 |
+
| loss_q2 | 0.00358 |
|
| 364 |
+
| loss_q3 | 0.00056 |
|
| 365 |
+
| mse | 0.0315 |
|
| 366 |
+
| mse_q0 | 0.104 |
|
| 367 |
+
| mse_q1 | 0.0175 |
|
| 368 |
+
| mse_q2 | 0.00354 |
|
| 369 |
+
| mse_q3 | 0.000553 |
|
| 370 |
+
| param_norm | 187 |
|
| 371 |
+
| samples | 2.56e+05 |
|
| 372 |
+
| step | 1.6e+04 |
|
| 373 |
+
| vb | 0.00452 |
|
| 374 |
+
| vb_q0 | 0.0177 |
|
| 375 |
+
| vb_q1 | 0.00013 |
|
| 376 |
+
| vb_q2 | 3.15e-05 |
|
| 377 |
+
| vb_q3 | 6.93e-06 |
|
| 378 |
+
-------------------------
|
| 379 |
+
-------------------------
|
| 380 |
+
| grad_norm | 0.07 |
|
| 381 |
+
| loss | 0.0347 |
|
| 382 |
+
| loss_q0 | 0.116 |
|
| 383 |
+
| loss_q1 | 0.0177 |
|
| 384 |
+
| loss_q2 | 0.00352 |
|
| 385 |
+
| loss_q3 | 0.000523 |
|
| 386 |
+
| mse | 0.0309 |
|
| 387 |
+
| mse_q0 | 0.101 |
|
| 388 |
+
| mse_q1 | 0.0175 |
|
| 389 |
+
| mse_q2 | 0.00349 |
|
| 390 |
+
| mse_q3 | 0.000516 |
|
| 391 |
+
| param_norm | 187 |
|
| 392 |
+
| samples | 2.72e+05 |
|
| 393 |
+
| step | 1.7e+04 |
|
| 394 |
+
| vb | 0.00377 |
|
| 395 |
+
| vb_q0 | 0.0147 |
|
| 396 |
+
| vb_q1 | 0.00013 |
|
| 397 |
+
| vb_q2 | 3.1e-05 |
|
| 398 |
+
| vb_q3 | 6.47e-06 |
|
| 399 |
+
-------------------------
|
| 400 |
+
-------------------------
|
| 401 |
+
| grad_norm | 0.0702 |
|
| 402 |
+
| loss | 0.0339 |
|
| 403 |
+
| loss_q0 | 0.115 |
|
| 404 |
+
| loss_q1 | 0.0174 |
|
| 405 |
+
| loss_q2 | 0.00347 |
|
| 406 |
+
| loss_q3 | 0.000516 |
|
| 407 |
+
| mse | 0.0303 |
|
| 408 |
+
| mse_q0 | 0.101 |
|
| 409 |
+
| mse_q1 | 0.0173 |
|
| 410 |
+
| mse_q2 | 0.00344 |
|
| 411 |
+
| mse_q3 | 0.000509 |
|
| 412 |
+
| param_norm | 188 |
|
| 413 |
+
| samples | 2.88e+05 |
|
| 414 |
+
| step | 1.8e+04 |
|
| 415 |
+
| vb | 0.00366 |
|
| 416 |
+
| vb_q0 | 0.0146 |
|
| 417 |
+
| vb_q1 | 0.000128 |
|
| 418 |
+
| vb_q2 | 3.06e-05 |
|
| 419 |
+
| vb_q3 | 6.4e-06 |
|
| 420 |
+
-------------------------
|
| 421 |
+
-------------------------
|
| 422 |
+
| grad_norm | 0.0676 |
|
| 423 |
+
| loss | 0.0331 |
|
| 424 |
+
| loss_q0 | 0.112 |
|
| 425 |
+
| loss_q1 | 0.0174 |
|
| 426 |
+
| loss_q2 | 0.00344 |
|
| 427 |
+
| loss_q3 | 0.000507 |
|
| 428 |
+
| mse | 0.0304 |
|
| 429 |
+
| mse_q0 | 0.101 |
|
| 430 |
+
| mse_q1 | 0.0173 |
|
| 431 |
+
| mse_q2 | 0.0034 |
|
| 432 |
+
| mse_q3 | 0.000501 |
|
| 433 |
+
| param_norm | 188 |
|
| 434 |
+
| samples | 3.04e+05 |
|
| 435 |
+
| step | 1.9e+04 |
|
| 436 |
+
| vb | 0.00274 |
|
| 437 |
+
| vb_q0 | 0.0109 |
|
| 438 |
+
| vb_q1 | 0.000128 |
|
| 439 |
+
| vb_q2 | 3.04e-05 |
|
| 440 |
+
| vb_q3 | 6.26e-06 |
|
| 441 |
+
-------------------------
|
| 442 |
+
-------------------------
|
| 443 |
+
| grad_norm | 0.0685 |
|
| 444 |
+
| loss | 0.0337 |
|
| 445 |
+
| loss_q0 | 0.114 |
|
| 446 |
+
| loss_q1 | 0.0175 |
|
| 447 |
+
| loss_q2 | 0.00345 |
|
| 448 |
+
| loss_q3 | 0.000495 |
|
| 449 |
+
| mse | 0.03 |
|
| 450 |
+
| mse_q0 | 0.0991 |
|
| 451 |
+
| mse_q1 | 0.0174 |
|
| 452 |
+
| mse_q2 | 0.00342 |
|
| 453 |
+
| mse_q3 | 0.000489 |
|
| 454 |
+
| param_norm | 189 |
|
| 455 |
+
| samples | 3.2e+05 |
|
| 456 |
+
| step | 2e+04 |
|
| 457 |
+
| vb | 0.00368 |
|
| 458 |
+
| vb_q0 | 0.0146 |
|
| 459 |
+
| vb_q1 | 0.000128 |
|
| 460 |
+
| vb_q2 | 3.05e-05 |
|
| 461 |
+
| vb_q3 | 6.13e-06 |
|
| 462 |
+
-------------------------
|
| 463 |
+
saving model 0...
|
| 464 |
+
saving model 0.995...
|
| 465 |
+
evaluation indistro starting...
|
| 466 |
+
done 96 samples: bpd=3.86189341545105
|
| 467 |
+
done 192 samples: bpd=3.769935965538025
|
| 468 |
+
done 288 samples: bpd=3.756619850794474
|
| 469 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_indistro_terms.npz
|
| 470 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_indistro_terms.npz
|
| 471 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_indistro_terms.npz
|
| 472 |
+
evaluation nll complete
|
| 473 |
+
evaluation outdistro starting...
|
| 474 |
+
done 192 samples: bpd=3.8321585655212402
|
| 475 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_outdistro_terms.npz
|
| 476 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_outdistro_terms.npz
|
| 477 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_outdistro_terms.npz
|
| 478 |
+
evaluation nll complete
|
| 479 |
+
sampling starting...
|
| 480 |
+
-------------------------
|
| 481 |
+
| grad_norm | 0.0657 |
|
| 482 |
+
| loss | 0.0348 |
|
| 483 |
+
| loss_q0 | 0.118 |
|
| 484 |
+
| loss_q1 | 0.0175 |
|
| 485 |
+
| loss_q2 | 0.00344 |
|
| 486 |
+
| loss_q3 | 0.000478 |
|
| 487 |
+
| mse | 0.0307 |
|
| 488 |
+
| mse_q0 | 0.101 |
|
| 489 |
+
| mse_q1 | 0.0174 |
|
| 490 |
+
| mse_q2 | 0.00341 |
|
| 491 |
+
| mse_q3 | 0.000472 |
|
| 492 |
+
| param_norm | 189 |
|
| 493 |
+
| samples | 3.36e+05 |
|
| 494 |
+
| step | 2.1e+04 |
|
| 495 |
+
| vb | 0.00408 |
|
| 496 |
+
| vb_q0 | 0.0161 |
|
| 497 |
+
| vb_q1 | 0.000128 |
|
| 498 |
+
| vb_q2 | 3.03e-05 |
|
| 499 |
+
| vb_q3 | 5.9e-06 |
|
| 500 |
+
-------------------------
|
| 501 |
+
-------------------------
|
| 502 |
+
| grad_norm | 0.065 |
|
| 503 |
+
| loss | 0.0331 |
|
| 504 |
+
| loss_q0 | 0.114 |
|
| 505 |
+
| loss_q1 | 0.0175 |
|
| 506 |
+
| loss_q2 | 0.0034 |
|
| 507 |
+
| loss_q3 | 0.000467 |
|
| 508 |
+
| mse | 0.0295 |
|
| 509 |
+
| mse_q0 | 0.0992 |
|
| 510 |
+
| mse_q1 | 0.0174 |
|
| 511 |
+
| mse_q2 | 0.00337 |
|
| 512 |
+
| mse_q3 | 0.000462 |
|
| 513 |
+
| param_norm | 190 |
|
| 514 |
+
| samples | 3.52e+05 |
|
| 515 |
+
| step | 2.2e+04 |
|
| 516 |
+
| vb | 0.00366 |
|
| 517 |
+
| vb_q0 | 0.0149 |
|
| 518 |
+
| vb_q1 | 0.000129 |
|
| 519 |
+
| vb_q2 | 3.01e-05 |
|
| 520 |
+
| vb_q3 | 5.77e-06 |
|
| 521 |
+
-------------------------
|
| 522 |
+
-------------------------
|
| 523 |
+
| grad_norm | 0.0658 |
|
| 524 |
+
| loss | 0.0332 |
|
| 525 |
+
| loss_q0 | 0.111 |
|
| 526 |
+
| loss_q1 | 0.0173 |
|
| 527 |
+
| loss_q2 | 0.00337 |
|
| 528 |
+
| loss_q3 | 0.00046 |
|
| 529 |
+
| mse | 0.0298 |
|
| 530 |
+
| mse_q0 | 0.0979 |
|
| 531 |
+
| mse_q1 | 0.0171 |
|
| 532 |
+
| mse_q2 | 0.00334 |
|
| 533 |
+
| mse_q3 | 0.000454 |
|
| 534 |
+
| param_norm | 190 |
|
| 535 |
+
| samples | 3.68e+05 |
|
| 536 |
+
| step | 2.3e+04 |
|
| 537 |
+
| vb | 0.00346 |
|
| 538 |
+
| vb_q0 | 0.0136 |
|
| 539 |
+
| vb_q1 | 0.000127 |
|
| 540 |
+
| vb_q2 | 2.98e-05 |
|
| 541 |
+
| vb_q3 | 5.69e-06 |
|
| 542 |
+
-------------------------
|
| 543 |
+
-------------------------
|
| 544 |
+
| grad_norm | 0.0645 |
|
| 545 |
+
| loss | 0.0335 |
|
| 546 |
+
| loss_q0 | 0.116 |
|
| 547 |
+
| loss_q1 | 0.0171 |
|
| 548 |
+
| loss_q2 | 0.00335 |
|
| 549 |
+
| loss_q3 | 0.000448 |
|
| 550 |
+
| mse | 0.0293 |
|
| 551 |
+
| mse_q0 | 0.0987 |
|
| 552 |
+
| mse_q1 | 0.017 |
|
| 553 |
+
| mse_q2 | 0.00332 |
|
| 554 |
+
| mse_q3 | 0.000443 |
|
| 555 |
+
| param_norm | 191 |
|
| 556 |
+
| samples | 3.84e+05 |
|
| 557 |
+
| step | 2.4e+04 |
|
| 558 |
+
| vb | 0.00421 |
|
| 559 |
+
| vb_q0 | 0.0171 |
|
| 560 |
+
| vb_q1 | 0.000126 |
|
| 561 |
+
| vb_q2 | 2.96e-05 |
|
| 562 |
+
| vb_q3 | 5.52e-06 |
|
| 563 |
+
-------------------------
|
| 564 |
+
-------------------------
|
| 565 |
+
| grad_norm | 0.0657 |
|
| 566 |
+
| loss | 0.0336 |
|
| 567 |
+
| loss_q0 | 0.111 |
|
| 568 |
+
| loss_q1 | 0.0171 |
|
| 569 |
+
| loss_q2 | 0.00337 |
|
| 570 |
+
| loss_q3 | 0.000451 |
|
| 571 |
+
| mse | 0.0301 |
|
| 572 |
+
| mse_q0 | 0.098 |
|
| 573 |
+
| mse_q1 | 0.017 |
|
| 574 |
+
| mse_q2 | 0.00334 |
|
| 575 |
+
| mse_q3 | 0.000445 |
|
| 576 |
+
| param_norm | 191 |
|
| 577 |
+
| samples | 4e+05 |
|
| 578 |
+
| step | 2.5e+04 |
|
| 579 |
+
| vb | 0.00348 |
|
| 580 |
+
| vb_q0 | 0.0135 |
|
| 581 |
+
| vb_q1 | 0.000125 |
|
| 582 |
+
| vb_q2 | 2.98e-05 |
|
| 583 |
+
| vb_q3 | 5.57e-06 |
|
| 584 |
+
-------------------------
|
| 585 |
+
-------------------------
|
| 586 |
+
| grad_norm | 0.0639 |
|
| 587 |
+
| loss | 0.0331 |
|
| 588 |
+
| loss_q0 | 0.111 |
|
| 589 |
+
| loss_q1 | 0.0173 |
|
| 590 |
+
| loss_q2 | 0.00337 |
|
| 591 |
+
| loss_q3 | 0.000437 |
|
| 592 |
+
| mse | 0.03 |
|
| 593 |
+
| mse_q0 | 0.0991 |
|
| 594 |
+
| mse_q1 | 0.0172 |
|
| 595 |
+
| mse_q2 | 0.00334 |
|
| 596 |
+
| mse_q3 | 0.000432 |
|
| 597 |
+
| param_norm | 192 |
|
| 598 |
+
| samples | 4.16e+05 |
|
| 599 |
+
| step | 2.6e+04 |
|
| 600 |
+
| vb | 0.00305 |
|
| 601 |
+
| vb_q0 | 0.012 |
|
| 602 |
+
| vb_q1 | 0.000127 |
|
| 603 |
+
| vb_q2 | 2.97e-05 |
|
| 604 |
+
| vb_q3 | 5.39e-06 |
|
| 605 |
+
-------------------------
|
| 606 |
+
-------------------------
|
| 607 |
+
| grad_norm | 0.062 |
|
| 608 |
+
| loss | 0.0319 |
|
| 609 |
+
| loss_q0 | 0.109 |
|
| 610 |
+
| loss_q1 | 0.0174 |
|
| 611 |
+
| loss_q2 | 0.00339 |
|
| 612 |
+
| loss_q3 | 0.000424 |
|
| 613 |
+
| mse | 0.0294 |
|
| 614 |
+
| mse_q0 | 0.0989 |
|
| 615 |
+
| mse_q1 | 0.0172 |
|
| 616 |
+
| mse_q2 | 0.00336 |
|
| 617 |
+
| mse_q3 | 0.000419 |
|
| 618 |
+
| param_norm | 192 |
|
| 619 |
+
| samples | 4.32e+05 |
|
| 620 |
+
| step | 2.7e+04 |
|
| 621 |
+
| vb | 0.00251 |
|
| 622 |
+
| vb_q0 | 0.0101 |
|
| 623 |
+
| vb_q1 | 0.000127 |
|
| 624 |
+
| vb_q2 | 2.99e-05 |
|
| 625 |
+
| vb_q3 | 5.22e-06 |
|
| 626 |
+
-------------------------
|
| 627 |
+
-------------------------
|
| 628 |
+
| grad_norm | 0.0651 |
|
| 629 |
+
| loss | 0.0327 |
|
| 630 |
+
| loss_q0 | 0.109 |
|
| 631 |
+
| loss_q1 | 0.0171 |
|
| 632 |
+
| loss_q2 | 0.00341 |
|
| 633 |
+
| loss_q3 | 0.000435 |
|
| 634 |
+
| mse | 0.0294 |
|
| 635 |
+
| mse_q0 | 0.0958 |
|
| 636 |
+
| mse_q1 | 0.017 |
|
| 637 |
+
| mse_q2 | 0.00338 |
|
| 638 |
+
| mse_q3 | 0.00043 |
|
| 639 |
+
| param_norm | 193 |
|
| 640 |
+
| samples | 4.48e+05 |
|
| 641 |
+
| step | 2.8e+04 |
|
| 642 |
+
| vb | 0.00326 |
|
| 643 |
+
| vb_q0 | 0.0127 |
|
| 644 |
+
| vb_q1 | 0.000126 |
|
| 645 |
+
| vb_q2 | 3.01e-05 |
|
| 646 |
+
| vb_q3 | 5.34e-06 |
|
| 647 |
+
-------------------------
|
| 648 |
+
-------------------------
|
| 649 |
+
| grad_norm | 0.0617 |
|
| 650 |
+
| loss | 0.0335 |
|
| 651 |
+
| loss_q0 | 0.114 |
|
| 652 |
+
| loss_q1 | 0.0172 |
|
| 653 |
+
| loss_q2 | 0.00339 |
|
| 654 |
+
| loss_q3 | 0.000421 |
|
| 655 |
+
| mse | 0.03 |
|
| 656 |
+
| mse_q0 | 0.1 |
|
| 657 |
+
| mse_q1 | 0.0171 |
|
| 658 |
+
| mse_q2 | 0.00336 |
|
| 659 |
+
| mse_q3 | 0.000416 |
|
| 660 |
+
| param_norm | 193 |
|
| 661 |
+
| samples | 4.64e+05 |
|
| 662 |
+
| step | 2.9e+04 |
|
| 663 |
+
| vb | 0.00346 |
|
| 664 |
+
| vb_q0 | 0.0139 |
|
| 665 |
+
| vb_q1 | 0.000126 |
|
| 666 |
+
| vb_q2 | 2.99e-05 |
|
| 667 |
+
| vb_q3 | 5.18e-06 |
|
| 668 |
+
-------------------------
|
| 669 |
+
-------------------------
|
| 670 |
+
| grad_norm | 0.0625 |
|
| 671 |
+
| loss | 0.0341 |
|
| 672 |
+
| loss_q0 | 0.117 |
|
| 673 |
+
| loss_q1 | 0.0173 |
|
| 674 |
+
| loss_q2 | 0.00336 |
|
| 675 |
+
| loss_q3 | 0.000427 |
|
| 676 |
+
| mse | 0.0297 |
|
| 677 |
+
| mse_q0 | 0.0996 |
|
| 678 |
+
| mse_q1 | 0.0172 |
|
| 679 |
+
| mse_q2 | 0.00333 |
|
| 680 |
+
| mse_q3 | 0.000422 |
|
| 681 |
+
| param_norm | 194 |
|
| 682 |
+
| samples | 4.8e+05 |
|
| 683 |
+
| step | 3e+04 |
|
| 684 |
+
| vb | 0.00441 |
|
| 685 |
+
| vb_q0 | 0.0178 |
|
| 686 |
+
| vb_q1 | 0.000127 |
|
| 687 |
+
| vb_q2 | 2.96e-05 |
|
| 688 |
+
| vb_q3 | 5.26e-06 |
|
| 689 |
+
-------------------------
|
| 690 |
+
saving model 0...
|
| 691 |
+
saving model 0.995...
|
| 692 |
+
evaluation indistro starting...
|
| 693 |
+
done 96 samples: bpd=3.642620086669922
|
| 694 |
+
done 192 samples: bpd=3.8054873943328857
|
| 695 |
+
done 288 samples: bpd=3.7644495169321694
|
| 696 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_indistro_terms.npz
|
| 697 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_indistro_terms.npz
|
| 698 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_indistro_terms.npz
|
| 699 |
+
evaluation nll complete
|
| 700 |
+
evaluation outdistro starting...
|
| 701 |
+
done 192 samples: bpd=3.8840670585632324
|
| 702 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_outdistro_terms.npz
|
| 703 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_outdistro_terms.npz
|
| 704 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_outdistro_terms.npz
|
| 705 |
+
evaluation nll complete
|
| 706 |
+
sampling starting...
|
| 707 |
+
-------------------------
|
| 708 |
+
| grad_norm | 0.0625 |
|
| 709 |
+
| loss | 0.0347 |
|
| 710 |
+
| loss_q0 | 0.117 |
|
| 711 |
+
| loss_q1 | 0.0174 |
|
| 712 |
+
| loss_q2 | 0.00327 |
|
| 713 |
+
| loss_q3 | 0.000413 |
|
| 714 |
+
| mse | 0.0306 |
|
| 715 |
+
| mse_q0 | 0.101 |
|
| 716 |
+
| mse_q1 | 0.0172 |
|
| 717 |
+
| mse_q2 | 0.00324 |
|
| 718 |
+
| mse_q3 | 0.000408 |
|
| 719 |
+
| param_norm | 194 |
|
| 720 |
+
| samples | 4.96e+05 |
|
| 721 |
+
| step | 3.1e+04 |
|
| 722 |
+
| vb | 0.00405 |
|
| 723 |
+
| vb_q0 | 0.0159 |
|
| 724 |
+
| vb_q1 | 0.000127 |
|
| 725 |
+
| vb_q2 | 2.89e-05 |
|
| 726 |
+
| vb_q3 | 5.09e-06 |
|
| 727 |
+
-------------------------
|
| 728 |
+
-------------------------
|
| 729 |
+
| grad_norm | 0.0595 |
|
| 730 |
+
| loss | 0.0319 |
|
| 731 |
+
| loss_q0 | 0.107 |
|
| 732 |
+
| loss_q1 | 0.0169 |
|
| 733 |
+
| loss_q2 | 0.00331 |
|
| 734 |
+
| loss_q3 | 0.000398 |
|
| 735 |
+
| mse | 0.0293 |
|
| 736 |
+
| mse_q0 | 0.0967 |
|
| 737 |
+
| mse_q1 | 0.0168 |
|
| 738 |
+
| mse_q2 | 0.00328 |
|
| 739 |
+
| mse_q3 | 0.000393 |
|
| 740 |
+
| param_norm | 195 |
|
| 741 |
+
| samples | 5.12e+05 |
|
| 742 |
+
| step | 3.2e+04 |
|
| 743 |
+
| vb | 0.00266 |
|
| 744 |
+
| vb_q0 | 0.0105 |
|
| 745 |
+
| vb_q1 | 0.000124 |
|
| 746 |
+
| vb_q2 | 2.92e-05 |
|
| 747 |
+
| vb_q3 | 4.88e-06 |
|
| 748 |
+
-------------------------
|
| 749 |
+
-------------------------
|
| 750 |
+
| grad_norm | 0.0619 |
|
| 751 |
+
| loss | 0.033 |
|
| 752 |
+
| loss_q0 | 0.113 |
|
| 753 |
+
| loss_q1 | 0.0172 |
|
| 754 |
+
| loss_q2 | 0.00329 |
|
| 755 |
+
| loss_q3 | 0.0004 |
|
| 756 |
+
| mse | 0.0296 |
|
| 757 |
+
| mse_q0 | 0.0996 |
|
| 758 |
+
| mse_q1 | 0.0171 |
|
| 759 |
+
| mse_q2 | 0.00326 |
|
| 760 |
+
| mse_q3 | 0.000395 |
|
| 761 |
+
| param_norm | 195 |
|
| 762 |
+
| samples | 5.28e+05 |
|
| 763 |
+
| step | 3.3e+04 |
|
| 764 |
+
| vb | 0.00338 |
|
| 765 |
+
| vb_q0 | 0.0137 |
|
| 766 |
+
| vb_q1 | 0.000126 |
|
| 767 |
+
| vb_q2 | 2.9e-05 |
|
| 768 |
+
| vb_q3 | 4.93e-06 |
|
| 769 |
+
-------------------------
|
| 770 |
+
-------------------------
|
| 771 |
+
| grad_norm | 0.0606 |
|
| 772 |
+
| loss | 0.0351 |
|
| 773 |
+
| loss_q0 | 0.119 |
|
| 774 |
+
| loss_q1 | 0.017 |
|
| 775 |
+
| loss_q2 | 0.00336 |
|
| 776 |
+
| loss_q3 | 0.000399 |
|
| 777 |
+
| mse | 0.0304 |
|
| 778 |
+
| mse_q0 | 0.1 |
|
| 779 |
+
| mse_q1 | 0.0169 |
|
| 780 |
+
| mse_q2 | 0.00333 |
|
| 781 |
+
| mse_q3 | 0.000394 |
|
| 782 |
+
| param_norm | 196 |
|
| 783 |
+
| samples | 5.44e+05 |
|
| 784 |
+
| step | 3.4e+04 |
|
| 785 |
+
| vb | 0.00465 |
|
| 786 |
+
| vb_q0 | 0.0183 |
|
| 787 |
+
| vb_q1 | 0.000125 |
|
| 788 |
+
| vb_q2 | 2.96e-05 |
|
| 789 |
+
| vb_q3 | 4.89e-06 |
|
| 790 |
+
-------------------------
|
| 791 |
+
-------------------------
|
| 792 |
+
| grad_norm | 0.0636 |
|
| 793 |
+
| loss | 0.0342 |
|
| 794 |
+
| loss_q0 | 0.114 |
|
| 795 |
+
| loss_q1 | 0.017 |
|
| 796 |
+
| loss_q2 | 0.00332 |
|
| 797 |
+
| loss_q3 | 0.000391 |
|
| 798 |
+
| mse | 0.0303 |
|
| 799 |
+
| mse_q0 | 0.0985 |
|
| 800 |
+
| mse_q1 | 0.0169 |
|
| 801 |
+
| mse_q2 | 0.00329 |
|
| 802 |
+
| mse_q3 | 0.000386 |
|
| 803 |
+
| param_norm | 196 |
|
| 804 |
+
| samples | 5.6e+05 |
|
| 805 |
+
| step | 3.5e+04 |
|
| 806 |
+
| vb | 0.00394 |
|
| 807 |
+
| vb_q0 | 0.0153 |
|
| 808 |
+
| vb_q1 | 0.000125 |
|
| 809 |
+
| vb_q2 | 2.92e-05 |
|
| 810 |
+
| vb_q3 | 4.82e-06 |
|
| 811 |
+
-------------------------
|
| 812 |
+
-------------------------
|
| 813 |
+
| grad_norm | 0.0611 |
|
| 814 |
+
| loss | 0.034 |
|
| 815 |
+
| loss_q0 | 0.114 |
|
| 816 |
+
| loss_q1 | 0.017 |
|
| 817 |
+
| loss_q2 | 0.00334 |
|
| 818 |
+
| loss_q3 | 0.000391 |
|
| 819 |
+
| mse | 0.03 |
|
| 820 |
+
| mse_q0 | 0.0984 |
|
| 821 |
+
| mse_q1 | 0.0169 |
|
| 822 |
+
| mse_q2 | 0.00331 |
|
| 823 |
+
| mse_q3 | 0.000387 |
|
| 824 |
+
| param_norm | 197 |
|
| 825 |
+
| samples | 5.76e+05 |
|
| 826 |
+
| step | 3.6e+04 |
|
| 827 |
+
| vb | 0.00397 |
|
| 828 |
+
| vb_q0 | 0.0155 |
|
| 829 |
+
| vb_q1 | 0.000125 |
|
| 830 |
+
| vb_q2 | 2.95e-05 |
|
| 831 |
+
| vb_q3 | 4.81e-06 |
|
| 832 |
+
-------------------------
|
| 833 |
+
-------------------------
|
| 834 |
+
| grad_norm | 0.0599 |
|
| 835 |
+
| loss | 0.0318 |
|
| 836 |
+
| loss_q0 | 0.11 |
|
| 837 |
+
| loss_q1 | 0.017 |
|
| 838 |
+
| loss_q2 | 0.00335 |
|
| 839 |
+
| loss_q3 | 0.000387 |
|
| 840 |
+
| mse | 0.0285 |
|
| 841 |
+
| mse_q0 | 0.0965 |
|
| 842 |
+
| mse_q1 | 0.0169 |
|
| 843 |
+
| mse_q2 | 0.00332 |
|
| 844 |
+
| mse_q3 | 0.000383 |
|
| 845 |
+
| param_norm | 197 |
|
| 846 |
+
| samples | 5.92e+05 |
|
| 847 |
+
| step | 3.7e+04 |
|
| 848 |
+
| vb | 0.00331 |
|
| 849 |
+
| vb_q0 | 0.0136 |
|
| 850 |
+
| vb_q1 | 0.000125 |
|
| 851 |
+
| vb_q2 | 2.95e-05 |
|
| 852 |
+
| vb_q3 | 4.76e-06 |
|
| 853 |
+
-------------------------
|
| 854 |
+
-------------------------
|
| 855 |
+
| grad_norm | 0.0596 |
|
| 856 |
+
| loss | 0.0342 |
|
| 857 |
+
| loss_q0 | 0.116 |
|
| 858 |
+
| loss_q1 | 0.017 |
|
| 859 |
+
| loss_q2 | 0.00336 |
|
| 860 |
+
| loss_q3 | 0.000383 |
|
| 861 |
+
| mse | 0.03 |
|
| 862 |
+
| mse_q0 | 0.0993 |
|
| 863 |
+
| mse_q1 | 0.0168 |
|
| 864 |
+
| mse_q2 | 0.00333 |
|
| 865 |
+
| mse_q3 | 0.000379 |
|
| 866 |
+
| param_norm | 198 |
|
| 867 |
+
| samples | 6.08e+05 |
|
| 868 |
+
| step | 3.8e+04 |
|
| 869 |
+
| vb | 0.00417 |
|
| 870 |
+
| vb_q0 | 0.0165 |
|
| 871 |
+
| vb_q1 | 0.000124 |
|
| 872 |
+
| vb_q2 | 2.95e-05 |
|
| 873 |
+
| vb_q3 | 4.7e-06 |
|
| 874 |
+
-------------------------
|
| 875 |
+
-------------------------
|
| 876 |
+
| grad_norm | 0.062 |
|
| 877 |
+
| loss | 0.0346 |
|
| 878 |
+
| loss_q0 | 0.117 |
|
| 879 |
+
| loss_q1 | 0.0169 |
|
| 880 |
+
| loss_q2 | 0.00327 |
|
| 881 |
+
| loss_q3 | 0.000388 |
|
| 882 |
+
| mse | 0.0298 |
|
| 883 |
+
| mse_q0 | 0.0984 |
|
| 884 |
+
| mse_q1 | 0.0168 |
|
| 885 |
+
| mse_q2 | 0.00325 |
|
| 886 |
+
| mse_q3 | 0.000384 |
|
| 887 |
+
| param_norm | 198 |
|
| 888 |
+
| samples | 6.24e+05 |
|
| 889 |
+
| step | 3.9e+04 |
|
| 890 |
+
| vb | 0.00484 |
|
| 891 |
+
| vb_q0 | 0.0191 |
|
| 892 |
+
| vb_q1 | 0.000124 |
|
| 893 |
+
| vb_q2 | 2.89e-05 |
|
| 894 |
+
| vb_q3 | 4.77e-06 |
|
| 895 |
+
-------------------------
|
| 896 |
+
-------------------------
|
| 897 |
+
| grad_norm | 0.0562 |
|
| 898 |
+
| loss | 0.0336 |
|
| 899 |
+
| loss_q0 | 0.113 |
|
| 900 |
+
| loss_q1 | 0.0167 |
|
| 901 |
+
| loss_q2 | 0.00331 |
|
| 902 |
+
| loss_q3 | 0.000371 |
|
| 903 |
+
| mse | 0.0296 |
|
| 904 |
+
| mse_q0 | 0.0974 |
|
| 905 |
+
| mse_q1 | 0.0166 |
|
| 906 |
+
| mse_q2 | 0.00328 |
|
| 907 |
+
| mse_q3 | 0.000367 |
|
| 908 |
+
| param_norm | 199 |
|
| 909 |
+
| samples | 6.4e+05 |
|
| 910 |
+
| step | 4e+04 |
|
| 911 |
+
| vb | 0.00396 |
|
| 912 |
+
| vb_q0 | 0.0155 |
|
| 913 |
+
| vb_q1 | 0.000123 |
|
| 914 |
+
| vb_q2 | 2.92e-05 |
|
| 915 |
+
| vb_q3 | 4.55e-06 |
|
| 916 |
+
-------------------------
|
| 917 |
+
saving model 0...
|
| 918 |
+
saving model 0.995...
|
| 919 |
+
evaluation indistro starting...
|
| 920 |
+
done 96 samples: bpd=3.5080957412719727
|
| 921 |
+
done 192 samples: bpd=3.5733258724212646
|
| 922 |
+
done 288 samples: bpd=3.587653636932373
|
| 923 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_indistro_terms.npz
|
| 924 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_indistro_terms.npz
|
| 925 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_indistro_terms.npz
|
| 926 |
+
evaluation nll complete
|
| 927 |
+
evaluation outdistro starting...
|
| 928 |
+
done 192 samples: bpd=3.791849136352539
|
| 929 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_outdistro_terms.npz
|
| 930 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_outdistro_terms.npz
|
| 931 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_outdistro_terms.npz
|
| 932 |
+
evaluation nll complete
|
| 933 |
+
sampling starting...
|
| 934 |
+
-------------------------
|
| 935 |
+
| grad_norm | 0.0596 |
|
| 936 |
+
| loss | 0.0344 |
|
| 937 |
+
| loss_q0 | 0.115 |
|
| 938 |
+
| loss_q1 | 0.0168 |
|
| 939 |
+
| loss_q2 | 0.00325 |
|
| 940 |
+
| loss_q3 | 0.000377 |
|
| 941 |
+
| mse | 0.0306 |
|
| 942 |
+
| mse_q0 | 0.1 |
|
| 943 |
+
| mse_q1 | 0.0167 |
|
| 944 |
+
| mse_q2 | 0.00322 |
|
| 945 |
+
| mse_q3 | 0.000372 |
|
| 946 |
+
| param_norm | 199 |
|
| 947 |
+
| samples | 6.56e+05 |
|
| 948 |
+
| step | 4.1e+04 |
|
| 949 |
+
| vb | 0.00381 |
|
| 950 |
+
| vb_q0 | 0.0148 |
|
| 951 |
+
| vb_q1 | 0.000123 |
|
| 952 |
+
| vb_q2 | 2.87e-05 |
|
| 953 |
+
| vb_q3 | 4.62e-06 |
|
| 954 |
+
-------------------------
|
| 955 |
+
-------------------------
|
| 956 |
+
| grad_norm | 0.0589 |
|
| 957 |
+
| loss | 0.0328 |
|
| 958 |
+
| loss_q0 | 0.113 |
|
| 959 |
+
| loss_q1 | 0.017 |
|
| 960 |
+
| loss_q2 | 0.00331 |
|
| 961 |
+
| loss_q3 | 0.00037 |
|
| 962 |
+
| mse | 0.0286 |
|
| 963 |
+
| mse_q0 | 0.0962 |
|
| 964 |
+
| mse_q1 | 0.0168 |
|
| 965 |
+
| mse_q2 | 0.00328 |
|
| 966 |
+
| mse_q3 | 0.000365 |
|
| 967 |
+
| param_norm | 200 |
|
| 968 |
+
| samples | 6.72e+05 |
|
| 969 |
+
| step | 4.2e+04 |
|
| 970 |
+
| vb | 0.00413 |
|
| 971 |
+
| vb_q0 | 0.0168 |
|
| 972 |
+
| vb_q1 | 0.000124 |
|
| 973 |
+
| vb_q2 | 2.92e-05 |
|
| 974 |
+
| vb_q3 | 4.52e-06 |
|
| 975 |
+
-------------------------
|
| 976 |
+
-------------------------
|
| 977 |
+
| grad_norm | 0.0587 |
|
| 978 |
+
| loss | 0.0329 |
|
| 979 |
+
| loss_q0 | 0.111 |
|
| 980 |
+
| loss_q1 | 0.017 |
|
| 981 |
+
| loss_q2 | 0.00332 |
|
| 982 |
+
| loss_q3 | 0.000369 |
|
| 983 |
+
| mse | 0.0295 |
|
| 984 |
+
| mse_q0 | 0.0973 |
|
| 985 |
+
| mse_q1 | 0.0168 |
|
| 986 |
+
| mse_q2 | 0.00329 |
|
| 987 |
+
| mse_q3 | 0.000364 |
|
| 988 |
+
| param_norm | 200 |
|
| 989 |
+
| samples | 6.88e+05 |
|
| 990 |
+
| step | 4.3e+04 |
|
| 991 |
+
| vb | 0.00348 |
|
| 992 |
+
| vb_q0 | 0.0137 |
|
| 993 |
+
| vb_q1 | 0.000125 |
|
| 994 |
+
| vb_q2 | 2.92e-05 |
|
| 995 |
+
| vb_q3 | 4.51e-06 |
|
| 996 |
+
-------------------------
|
| 997 |
+
-------------------------
|
| 998 |
+
| grad_norm | 0.0571 |
|
| 999 |
+
| loss | 0.0338 |
|
| 1000 |
+
| loss_q0 | 0.117 |
|
| 1001 |
+
| loss_q1 | 0.0168 |
|
| 1002 |
+
| loss_q2 | 0.00322 |
|
| 1003 |
+
| loss_q3 | 0.000364 |
|
| 1004 |
+
| mse | 0.0294 |
|
| 1005 |
+
| mse_q0 | 0.0992 |
|
| 1006 |
+
| mse_q1 | 0.0167 |
|
| 1007 |
+
| mse_q2 | 0.00319 |
|
| 1008 |
+
| mse_q3 | 0.000359 |
|
| 1009 |
+
| param_norm | 201 |
|
| 1010 |
+
| samples | 7.04e+05 |
|
| 1011 |
+
| step | 4.4e+04 |
|
| 1012 |
+
| vb | 0.00437 |
|
| 1013 |
+
| vb_q0 | 0.0177 |
|
| 1014 |
+
| vb_q1 | 0.000123 |
|
| 1015 |
+
| vb_q2 | 2.84e-05 |
|
| 1016 |
+
| vb_q3 | 4.45e-06 |
|
| 1017 |
+
-------------------------
|
| 1018 |
+
-------------------------
|
| 1019 |
+
| grad_norm | 0.0587 |
|
| 1020 |
+
| loss | 0.034 |
|
| 1021 |
+
| loss_q0 | 0.114 |
|
| 1022 |
+
| loss_q1 | 0.0171 |
|
| 1023 |
+
| loss_q2 | 0.00331 |
|
| 1024 |
+
| loss_q3 | 0.00037 |
|
| 1025 |
+
| mse | 0.0301 |
|
| 1026 |
+
| mse_q0 | 0.0988 |
|
| 1027 |
+
| mse_q1 | 0.017 |
|
| 1028 |
+
| mse_q2 | 0.00328 |
|
| 1029 |
+
| mse_q3 | 0.000365 |
|
| 1030 |
+
| param_norm | 201 |
|
| 1031 |
+
| samples | 7.2e+05 |
|
| 1032 |
+
| step | 4.5e+04 |
|
| 1033 |
+
| vb | 0.00387 |
|
| 1034 |
+
| vb_q0 | 0.0152 |
|
| 1035 |
+
| vb_q1 | 0.000126 |
|
| 1036 |
+
| vb_q2 | 2.91e-05 |
|
| 1037 |
+
| vb_q3 | 4.52e-06 |
|
| 1038 |
+
-------------------------
|
| 1039 |
+
-------------------------
|
| 1040 |
+
| grad_norm | 0.061 |
|
| 1041 |
+
| loss | 0.0329 |
|
| 1042 |
+
| loss_q0 | 0.11 |
|
| 1043 |
+
| loss_q1 | 0.0169 |
|
| 1044 |
+
| loss_q2 | 0.00329 |
|
| 1045 |
+
| loss_q3 | 0.000368 |
|
| 1046 |
+
| mse | 0.0299 |
|
| 1047 |
+
| mse_q0 | 0.0983 |
|
| 1048 |
+
| mse_q1 | 0.0167 |
|
| 1049 |
+
| mse_q2 | 0.00326 |
|
| 1050 |
+
| mse_q3 | 0.000364 |
|
| 1051 |
+
| param_norm | 202 |
|
| 1052 |
+
| samples | 7.36e+05 |
|
| 1053 |
+
| step | 4.6e+04 |
|
| 1054 |
+
| vb | 0.0031 |
|
| 1055 |
+
| vb_q0 | 0.0121 |
|
| 1056 |
+
| vb_q1 | 0.000124 |
|
| 1057 |
+
| vb_q2 | 2.89e-05 |
|
| 1058 |
+
| vb_q3 | 4.5e-06 |
|
| 1059 |
+
-------------------------
|
| 1060 |
+
-------------------------
|
| 1061 |
+
| grad_norm | 0.0566 |
|
| 1062 |
+
| loss | 0.0328 |
|
| 1063 |
+
| loss_q0 | 0.111 |
|
| 1064 |
+
| loss_q1 | 0.0171 |
|
| 1065 |
+
| loss_q2 | 0.00327 |
|
| 1066 |
+
| loss_q3 | 0.000357 |
|
| 1067 |
+
| mse | 0.0294 |
|
| 1068 |
+
| mse_q0 | 0.0976 |
|
| 1069 |
+
| mse_q1 | 0.017 |
|
| 1070 |
+
| mse_q2 | 0.00324 |
|
| 1071 |
+
| mse_q3 | 0.000353 |
|
| 1072 |
+
| param_norm | 202 |
|
| 1073 |
+
| samples | 7.52e+05 |
|
| 1074 |
+
| step | 4.7e+04 |
|
| 1075 |
+
| vb | 0.00339 |
|
| 1076 |
+
| vb_q0 | 0.0135 |
|
| 1077 |
+
| vb_q1 | 0.000126 |
|
| 1078 |
+
| vb_q2 | 2.88e-05 |
|
| 1079 |
+
| vb_q3 | 4.39e-06 |
|
| 1080 |
+
-------------------------
|
| 1081 |
+
-------------------------
|
| 1082 |
+
| grad_norm | 0.0606 |
|
| 1083 |
+
| loss | 0.0344 |
|
| 1084 |
+
| loss_q0 | 0.114 |
|
| 1085 |
+
| loss_q1 | 0.0168 |
|
| 1086 |
+
| loss_q2 | 0.00333 |
|
| 1087 |
+
| loss_q3 | 0.000357 |
|
| 1088 |
+
| mse | 0.0305 |
|
| 1089 |
+
| mse_q0 | 0.0991 |
|
| 1090 |
+
| mse_q1 | 0.0167 |
|
| 1091 |
+
| mse_q2 | 0.0033 |
|
| 1092 |
+
| mse_q3 | 0.000352 |
|
| 1093 |
+
| param_norm | 203 |
|
| 1094 |
+
| samples | 7.68e+05 |
|
| 1095 |
+
| step | 4.8e+04 |
|
| 1096 |
+
| vb | 0.00387 |
|
| 1097 |
+
| vb_q0 | 0.0149 |
|
| 1098 |
+
| vb_q1 | 0.000123 |
|
| 1099 |
+
| vb_q2 | 2.93e-05 |
|
| 1100 |
+
| vb_q3 | 4.37e-06 |
|
| 1101 |
+
-------------------------
|
| 1102 |
+
-------------------------
|
| 1103 |
+
| grad_norm | 0.0559 |
|
| 1104 |
+
| loss | 0.0327 |
|
| 1105 |
+
| loss_q0 | 0.108 |
|
| 1106 |
+
| loss_q1 | 0.0166 |
|
| 1107 |
+
| loss_q2 | 0.00329 |
|
| 1108 |
+
| loss_q3 | 0.000351 |
|
| 1109 |
+
| mse | 0.0292 |
|
| 1110 |
+
| mse_q0 | 0.0947 |
|
| 1111 |
+
| mse_q1 | 0.0165 |
|
| 1112 |
+
| mse_q2 | 0.00326 |
|
| 1113 |
+
| mse_q3 | 0.000347 |
|
| 1114 |
+
| param_norm | 203 |
|
| 1115 |
+
| samples | 7.84e+05 |
|
| 1116 |
+
| step | 4.9e+04 |
|
| 1117 |
+
| vb | 0.00349 |
|
| 1118 |
+
| vb_q0 | 0.0135 |
|
| 1119 |
+
| vb_q1 | 0.000122 |
|
| 1120 |
+
| vb_q2 | 2.9e-05 |
|
| 1121 |
+
| vb_q3 | 4.29e-06 |
|
| 1122 |
+
-------------------------
|
| 1123 |
+
-------------------------
|
| 1124 |
+
| grad_norm | 0.0589 |
|
| 1125 |
+
| loss | 0.0338 |
|
| 1126 |
+
| loss_q0 | 0.116 |
|
| 1127 |
+
| loss_q1 | 0.0169 |
|
| 1128 |
+
| loss_q2 | 0.00327 |
|
| 1129 |
+
| loss_q3 | 0.00035 |
|
| 1130 |
+
| mse | 0.029 |
|
| 1131 |
+
| mse_q0 | 0.0968 |
|
| 1132 |
+
| mse_q1 | 0.0168 |
|
| 1133 |
+
| mse_q2 | 0.00325 |
|
| 1134 |
+
| mse_q3 | 0.000346 |
|
| 1135 |
+
| param_norm | 204 |
|
| 1136 |
+
| samples | 8e+05 |
|
| 1137 |
+
| step | 5e+04 |
|
| 1138 |
+
| vb | 0.00479 |
|
| 1139 |
+
| vb_q0 | 0.0193 |
|
| 1140 |
+
| vb_q1 | 0.000124 |
|
| 1141 |
+
| vb_q2 | 2.88e-05 |
|
| 1142 |
+
| vb_q3 | 4.29e-06 |
|
| 1143 |
+
-------------------------
|
| 1144 |
+
saving model 0...
|
| 1145 |
+
saving model 0.995...
|
| 1146 |
+
evaluation indistro starting...
|
| 1147 |
+
done 96 samples: bpd=3.513167142868042
|
| 1148 |
+
done 192 samples: bpd=3.5448752641677856
|
| 1149 |
+
done 288 samples: bpd=3.5497219562530518
|
| 1150 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_indistro_terms.npz
|
| 1151 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_indistro_terms.npz
|
| 1152 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_indistro_terms.npz
|
| 1153 |
+
evaluation nll complete
|
| 1154 |
+
evaluation outdistro starting...
|
| 1155 |
+
done 192 samples: bpd=3.7412848472595215
|
| 1156 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_outdistro_terms.npz
|
| 1157 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_outdistro_terms.npz
|
| 1158 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_outdistro_terms.npz
|
| 1159 |
+
evaluation nll complete
|
| 1160 |
+
sampling starting...
|
| 1161 |
+
-------------------------
|
| 1162 |
+
| grad_norm | 0.0547 |
|
| 1163 |
+
| loss | 0.0326 |
|
| 1164 |
+
| loss_q0 | 0.11 |
|
| 1165 |
+
| loss_q1 | 0.0167 |
|
| 1166 |
+
| loss_q2 | 0.00326 |
|
| 1167 |
+
| loss_q3 | 0.000349 |
|
| 1168 |
+
| mse | 0.0291 |
|
| 1169 |
+
| mse_q0 | 0.0965 |
|
| 1170 |
+
| mse_q1 | 0.0166 |
|
| 1171 |
+
| mse_q2 | 0.00323 |
|
| 1172 |
+
| mse_q3 | 0.000345 |
|
| 1173 |
+
| param_norm | 204 |
|
| 1174 |
+
| samples | 8.16e+05 |
|
| 1175 |
+
| step | 5.1e+04 |
|
| 1176 |
+
| vb | 0.00349 |
|
| 1177 |
+
| vb_q0 | 0.0138 |
|
| 1178 |
+
| vb_q1 | 0.000123 |
|
| 1179 |
+
| vb_q2 | 2.87e-05 |
|
| 1180 |
+
| vb_q3 | 4.27e-06 |
|
| 1181 |
+
-------------------------
|
| 1182 |
+
-------------------------
|
| 1183 |
+
| grad_norm | 0.0582 |
|
| 1184 |
+
| loss | 0.0324 |
|
| 1185 |
+
| loss_q0 | 0.109 |
|
| 1186 |
+
| loss_q1 | 0.0168 |
|
| 1187 |
+
| loss_q2 | 0.00319 |
|
| 1188 |
+
| loss_q3 | 0.000349 |
|
| 1189 |
+
| mse | 0.0292 |
|
| 1190 |
+
| mse_q0 | 0.0969 |
|
| 1191 |
+
| mse_q1 | 0.0166 |
|
| 1192 |
+
| mse_q2 | 0.00316 |
|
| 1193 |
+
| mse_q3 | 0.000345 |
|
| 1194 |
+
| param_norm | 205 |
|
| 1195 |
+
| samples | 8.32e+05 |
|
| 1196 |
+
| step | 5.2e+04 |
|
| 1197 |
+
| vb | 0.00317 |
|
| 1198 |
+
| vb_q0 | 0.0126 |
|
| 1199 |
+
| vb_q1 | 0.000123 |
|
| 1200 |
+
| vb_q2 | 2.82e-05 |
|
| 1201 |
+
| vb_q3 | 4.27e-06 |
|
| 1202 |
+
-------------------------
|
| 1203 |
+
-------------------------
|
| 1204 |
+
| grad_norm | 0.0565 |
|
| 1205 |
+
| loss | 0.0328 |
|
| 1206 |
+
| loss_q0 | 0.111 |
|
| 1207 |
+
| loss_q1 | 0.0168 |
|
| 1208 |
+
| loss_q2 | 0.00324 |
|
| 1209 |
+
| loss_q3 | 0.000347 |
|
| 1210 |
+
| mse | 0.0291 |
|
| 1211 |
+
| mse_q0 | 0.0964 |
|
| 1212 |
+
| mse_q1 | 0.0167 |
|
| 1213 |
+
| mse_q2 | 0.00321 |
|
| 1214 |
+
| mse_q3 | 0.000343 |
|
| 1215 |
+
| param_norm | 205 |
|
| 1216 |
+
| samples | 8.48e+05 |
|
| 1217 |
+
| step | 5.3e+04 |
|
| 1218 |
+
| vb | 0.00373 |
|
| 1219 |
+
| vb_q0 | 0.0148 |
|
| 1220 |
+
| vb_q1 | 0.000123 |
|
| 1221 |
+
| vb_q2 | 2.85e-05 |
|
| 1222 |
+
| vb_q3 | 4.23e-06 |
|
| 1223 |
+
-------------------------
|
| 1224 |
+
-------------------------
|
| 1225 |
+
| grad_norm | 0.0586 |
|
| 1226 |
+
| loss | 0.0338 |
|
| 1227 |
+
| loss_q0 | 0.117 |
|
| 1228 |
+
| loss_q1 | 0.0168 |
|
| 1229 |
+
| loss_q2 | 0.00323 |
|
| 1230 |
+
| loss_q3 | 0.000341 |
|
| 1231 |
+
| mse | 0.0297 |
|
| 1232 |
+
| mse_q0 | 0.1 |
|
| 1233 |
+
| mse_q1 | 0.0167 |
|
| 1234 |
+
| mse_q2 | 0.00321 |
|
| 1235 |
+
| mse_q3 | 0.000337 |
|
| 1236 |
+
| param_norm | 206 |
|
| 1237 |
+
| samples | 8.64e+05 |
|
| 1238 |
+
| step | 5.4e+04 |
|
| 1239 |
+
| vb | 0.00406 |
|
| 1240 |
+
| vb_q0 | 0.0164 |
|
| 1241 |
+
| vb_q1 | 0.000123 |
|
| 1242 |
+
| vb_q2 | 2.85e-05 |
|
| 1243 |
+
| vb_q3 | 4.17e-06 |
|
| 1244 |
+
-------------------------
|
| 1245 |
+
-------------------------
|
| 1246 |
+
| grad_norm | 0.0558 |
|
| 1247 |
+
| loss | 0.0336 |
|
| 1248 |
+
| loss_q0 | 0.115 |
|
| 1249 |
+
| loss_q1 | 0.0165 |
|
| 1250 |
+
| loss_q2 | 0.00326 |
|
| 1251 |
+
| loss_q3 | 0.00034 |
|
| 1252 |
+
| mse | 0.0293 |
|
| 1253 |
+
| mse_q0 | 0.098 |
|
| 1254 |
+
| mse_q1 | 0.0164 |
|
| 1255 |
+
| mse_q2 | 0.00323 |
|
| 1256 |
+
| mse_q3 | 0.000336 |
|
| 1257 |
+
| param_norm | 206 |
|
| 1258 |
+
| samples | 8.8e+05 |
|
| 1259 |
+
| step | 5.5e+04 |
|
| 1260 |
+
| vb | 0.00434 |
|
| 1261 |
+
| vb_q0 | 0.0174 |
|
| 1262 |
+
| vb_q1 | 0.000121 |
|
| 1263 |
+
| vb_q2 | 2.87e-05 |
|
| 1264 |
+
| vb_q3 | 4.16e-06 |
|
| 1265 |
+
-------------------------
|
| 1266 |
+
-------------------------
|
| 1267 |
+
| grad_norm | 0.0578 |
|
| 1268 |
+
| loss | 0.0329 |
|
| 1269 |
+
| loss_q0 | 0.112 |
|
| 1270 |
+
| loss_q1 | 0.0164 |
|
| 1271 |
+
| loss_q2 | 0.00319 |
|
| 1272 |
+
| loss_q3 | 0.000341 |
|
| 1273 |
+
| mse | 0.029 |
|
| 1274 |
+
| mse_q0 | 0.0971 |
|
| 1275 |
+
| mse_q1 | 0.0163 |
|
| 1276 |
+
| mse_q2 | 0.00316 |
|
| 1277 |
+
| mse_q3 | 0.000337 |
|
| 1278 |
+
| param_norm | 207 |
|
| 1279 |
+
| samples | 8.96e+05 |
|
| 1280 |
+
| step | 5.6e+04 |
|
| 1281 |
+
| vb | 0.00385 |
|
| 1282 |
+
| vb_q0 | 0.0153 |
|
| 1283 |
+
| vb_q1 | 0.000121 |
|
| 1284 |
+
| vb_q2 | 2.82e-05 |
|
| 1285 |
+
| vb_q3 | 4.18e-06 |
|
| 1286 |
+
-------------------------
|
| 1287 |
+
-------------------------
|
| 1288 |
+
| grad_norm | 0.055 |
|
| 1289 |
+
| loss | 0.0329 |
|
| 1290 |
+
| loss_q0 | 0.112 |
|
| 1291 |
+
| loss_q1 | 0.0165 |
|
| 1292 |
+
| loss_q2 | 0.00321 |
|
| 1293 |
+
| loss_q3 | 0.00033 |
|
| 1294 |
+
| mse | 0.029 |
|
| 1295 |
+
| mse_q0 | 0.0964 |
|
| 1296 |
+
| mse_q1 | 0.0164 |
|
| 1297 |
+
| mse_q2 | 0.00319 |
|
| 1298 |
+
| mse_q3 | 0.000326 |
|
| 1299 |
+
| param_norm | 207 |
|
| 1300 |
+
| samples | 9.12e+05 |
|
| 1301 |
+
| step | 5.7e+04 |
|
| 1302 |
+
| vb | 0.00392 |
|
| 1303 |
+
| vb_q0 | 0.0156 |
|
| 1304 |
+
| vb_q1 | 0.000121 |
|
| 1305 |
+
| vb_q2 | 2.83e-05 |
|
| 1306 |
+
| vb_q3 | 4.04e-06 |
|
| 1307 |
+
-------------------------
|
| 1308 |
+
-------------------------
|
| 1309 |
+
| grad_norm | 0.0567 |
|
| 1310 |
+
| loss | 0.0338 |
|
| 1311 |
+
| loss_q0 | 0.113 |
|
| 1312 |
+
| loss_q1 | 0.0168 |
|
| 1313 |
+
| loss_q2 | 0.00327 |
|
| 1314 |
+
| loss_q3 | 0.000333 |
|
| 1315 |
+
| mse | 0.0295 |
|
| 1316 |
+
| mse_q0 | 0.0965 |
|
| 1317 |
+
| mse_q1 | 0.0167 |
|
| 1318 |
+
| mse_q2 | 0.00324 |
|
| 1319 |
+
| mse_q3 | 0.000329 |
|
| 1320 |
+
| param_norm | 208 |
|
| 1321 |
+
| samples | 9.28e+05 |
|
| 1322 |
+
| step | 5.8e+04 |
|
| 1323 |
+
| vb | 0.00423 |
|
| 1324 |
+
| vb_q0 | 0.0165 |
|
| 1325 |
+
| vb_q1 | 0.000123 |
|
| 1326 |
+
| vb_q2 | 2.88e-05 |
|
| 1327 |
+
| vb_q3 | 4.06e-06 |
|
| 1328 |
+
-------------------------
|
| 1329 |
+
-------------------------
|
| 1330 |
+
| grad_norm | 0.0562 |
|
| 1331 |
+
| loss | 0.0341 |
|
| 1332 |
+
| loss_q0 | 0.115 |
|
| 1333 |
+
| loss_q1 | 0.0166 |
|
| 1334 |
+
| loss_q2 | 0.00321 |
|
| 1335 |
+
| loss_q3 | 0.00033 |
|
| 1336 |
+
| mse | 0.0295 |
|
| 1337 |
+
| mse_q0 | 0.0972 |
|
| 1338 |
+
| mse_q1 | 0.0165 |
|
| 1339 |
+
| mse_q2 | 0.00318 |
|
| 1340 |
+
| mse_q3 | 0.000326 |
|
| 1341 |
+
| param_norm | 209 |
|
| 1342 |
+
| samples | 9.44e+05 |
|
| 1343 |
+
| step | 5.9e+04 |
|
| 1344 |
+
| vb | 0.00459 |
|
| 1345 |
+
| vb_q0 | 0.018 |
|
| 1346 |
+
| vb_q1 | 0.000122 |
|
| 1347 |
+
| vb_q2 | 2.83e-05 |
|
| 1348 |
+
| vb_q3 | 4.03e-06 |
|
| 1349 |
+
-------------------------
|
| 1350 |
+
-------------------------
|
| 1351 |
+
| grad_norm | 0.0591 |
|
| 1352 |
+
| loss | 0.0323 |
|
| 1353 |
+
| loss_q0 | 0.109 |
|
| 1354 |
+
| loss_q1 | 0.0167 |
|
| 1355 |
+
| loss_q2 | 0.00328 |
|
| 1356 |
+
| loss_q3 | 0.000334 |
|
| 1357 |
+
| mse | 0.0289 |
|
| 1358 |
+
| mse_q0 | 0.0958 |
|
| 1359 |
+
| mse_q1 | 0.0166 |
|
| 1360 |
+
| mse_q2 | 0.00325 |
|
| 1361 |
+
| mse_q3 | 0.00033 |
|
| 1362 |
+
| param_norm | 209 |
|
| 1363 |
+
| samples | 9.6e+05 |
|
| 1364 |
+
| step | 6e+04 |
|
| 1365 |
+
| vb | 0.00337 |
|
| 1366 |
+
| vb_q0 | 0.0134 |
|
| 1367 |
+
| vb_q1 | 0.000123 |
|
| 1368 |
+
| vb_q2 | 2.88e-05 |
|
| 1369 |
+
| vb_q3 | 4.07e-06 |
|
| 1370 |
+
-------------------------
|
| 1371 |
+
saving model 0...
|
| 1372 |
+
saving model 0.995...
|
| 1373 |
+
evaluation indistro starting...
|
| 1374 |
+
done 96 samples: bpd=3.7332992553710938
|
| 1375 |
+
done 192 samples: bpd=3.742550849914551
|
| 1376 |
+
done 288 samples: bpd=3.750394821166992
|
| 1377 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_indistro_terms.npz
|
| 1378 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_indistro_terms.npz
|
| 1379 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_indistro_terms.npz
|
| 1380 |
+
evaluation nll complete
|
| 1381 |
+
evaluation outdistro starting...
|
| 1382 |
+
done 192 samples: bpd=3.7803030014038086
|
| 1383 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_outdistro_terms.npz
|
| 1384 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_outdistro_terms.npz
|
| 1385 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_outdistro_terms.npz
|
| 1386 |
+
evaluation nll complete
|
| 1387 |
+
sampling starting...
|
| 1388 |
+
-------------------------
|
| 1389 |
+
| grad_norm | 0.0561 |
|
| 1390 |
+
| loss | 0.0328 |
|
| 1391 |
+
| loss_q0 | 0.11 |
|
| 1392 |
+
| loss_q1 | 0.0166 |
|
| 1393 |
+
| loss_q2 | 0.00324 |
|
| 1394 |
+
| loss_q3 | 0.000332 |
|
| 1395 |
+
| mse | 0.0294 |
|
| 1396 |
+
| mse_q0 | 0.0963 |
|
| 1397 |
+
| mse_q1 | 0.0165 |
|
| 1398 |
+
| mse_q2 | 0.00321 |
|
| 1399 |
+
| mse_q3 | 0.000328 |
|
| 1400 |
+
| param_norm | 210 |
|
| 1401 |
+
| samples | 9.76e+05 |
|
| 1402 |
+
| step | 6.1e+04 |
|
| 1403 |
+
| vb | 0.00346 |
|
| 1404 |
+
| vb_q0 | 0.0135 |
|
| 1405 |
+
| vb_q1 | 0.000122 |
|
| 1406 |
+
| vb_q2 | 2.85e-05 |
|
| 1407 |
+
| vb_q3 | 4.05e-06 |
|
| 1408 |
+
-------------------------
|
| 1409 |
+
-------------------------
|
| 1410 |
+
| grad_norm | 0.055 |
|
| 1411 |
+
| loss | 0.033 |
|
| 1412 |
+
| loss_q0 | 0.113 |
|
| 1413 |
+
| loss_q1 | 0.0167 |
|
| 1414 |
+
| loss_q2 | 0.00321 |
|
| 1415 |
+
| loss_q3 | 0.000327 |
|
| 1416 |
+
| mse | 0.0291 |
|
| 1417 |
+
| mse_q0 | 0.0971 |
|
| 1418 |
+
| mse_q1 | 0.0166 |
|
| 1419 |
+
| mse_q2 | 0.00318 |
|
| 1420 |
+
| mse_q3 | 0.000323 |
|
| 1421 |
+
| param_norm | 210 |
|
| 1422 |
+
| samples | 9.92e+05 |
|
| 1423 |
+
| step | 6.2e+04 |
|
| 1424 |
+
| vb | 0.00388 |
|
| 1425 |
+
| vb_q0 | 0.0155 |
|
| 1426 |
+
| vb_q1 | 0.000122 |
|
| 1427 |
+
| vb_q2 | 2.82e-05 |
|
| 1428 |
+
| vb_q3 | 3.99e-06 |
|
| 1429 |
+
-------------------------
|
| 1430 |
+
-------------------------
|
| 1431 |
+
| grad_norm | 0.0522 |
|
| 1432 |
+
| loss | 0.0327 |
|
| 1433 |
+
| loss_q0 | 0.112 |
|
| 1434 |
+
| loss_q1 | 0.0166 |
|
| 1435 |
+
| loss_q2 | 0.00317 |
|
| 1436 |
+
| loss_q3 | 0.000321 |
|
| 1437 |
+
| mse | 0.0291 |
|
| 1438 |
+
| mse_q0 | 0.0975 |
|
| 1439 |
+
| mse_q1 | 0.0165 |
|
| 1440 |
+
| mse_q2 | 0.00314 |
|
| 1441 |
+
| mse_q3 | 0.000317 |
|
| 1442 |
+
| param_norm | 211 |
|
| 1443 |
+
| samples | 1.01e+06 |
|
| 1444 |
+
| step | 6.3e+04 |
|
| 1445 |
+
| vb | 0.00364 |
|
| 1446 |
+
| vb_q0 | 0.0146 |
|
| 1447 |
+
| vb_q1 | 0.000122 |
|
| 1448 |
+
| vb_q2 | 2.8e-05 |
|
| 1449 |
+
| vb_q3 | 3.91e-06 |
|
| 1450 |
+
-------------------------
|
| 1451 |
+
-------------------------
|
| 1452 |
+
| grad_norm | 0.0563 |
|
| 1453 |
+
| loss | 0.0326 |
|
| 1454 |
+
| loss_q0 | 0.11 |
|
| 1455 |
+
| loss_q1 | 0.0167 |
|
| 1456 |
+
| loss_q2 | 0.00322 |
|
| 1457 |
+
| loss_q3 | 0.000333 |
|
| 1458 |
+
| mse | 0.0287 |
|
| 1459 |
+
| mse_q0 | 0.0949 |
|
| 1460 |
+
| mse_q1 | 0.0165 |
|
| 1461 |
+
| mse_q2 | 0.0032 |
|
| 1462 |
+
| mse_q3 | 0.000329 |
|
| 1463 |
+
| param_norm | 211 |
|
| 1464 |
+
| samples | 1.02e+06 |
|
| 1465 |
+
| step | 6.4e+04 |
|
| 1466 |
+
| vb | 0.00392 |
|
| 1467 |
+
| vb_q0 | 0.0155 |
|
| 1468 |
+
| vb_q1 | 0.000122 |
|
| 1469 |
+
| vb_q2 | 2.84e-05 |
|
| 1470 |
+
| vb_q3 | 4.06e-06 |
|
| 1471 |
+
-------------------------
|
| 1472 |
+
-------------------------
|
| 1473 |
+
| grad_norm | 0.0557 |
|
| 1474 |
+
| loss | 0.0327 |
|
| 1475 |
+
| loss_q0 | 0.111 |
|
| 1476 |
+
| loss_q1 | 0.0167 |
|
| 1477 |
+
| loss_q2 | 0.00317 |
|
| 1478 |
+
| loss_q3 | 0.000325 |
|
| 1479 |
+
| mse | 0.0288 |
|
| 1480 |
+
| mse_q0 | 0.0954 |
|
| 1481 |
+
| mse_q1 | 0.0166 |
|
| 1482 |
+
| mse_q2 | 0.00314 |
|
| 1483 |
+
| mse_q3 | 0.000321 |
|
| 1484 |
+
| param_norm | 212 |
|
| 1485 |
+
| samples | 1.04e+06 |
|
| 1486 |
+
| step | 6.5e+04 |
|
| 1487 |
+
| vb | 0.00387 |
|
| 1488 |
+
| vb_q0 | 0.0154 |
|
| 1489 |
+
| vb_q1 | 0.000122 |
|
| 1490 |
+
| vb_q2 | 2.8e-05 |
|
| 1491 |
+
| vb_q3 | 3.95e-06 |
|
| 1492 |
+
-------------------------
|
| 1493 |
+
-------------------------
|
| 1494 |
+
| grad_norm | 0.0545 |
|
| 1495 |
+
| loss | 0.032 |
|
| 1496 |
+
| loss_q0 | 0.11 |
|
| 1497 |
+
| loss_q1 | 0.0167 |
|
| 1498 |
+
| loss_q2 | 0.00324 |
|
| 1499 |
+
| loss_q3 | 0.000323 |
|
| 1500 |
+
| mse | 0.0282 |
|
| 1501 |
+
| mse_q0 | 0.0944 |
|
| 1502 |
+
| mse_q1 | 0.0165 |
|
| 1503 |
+
| mse_q2 | 0.00321 |
|
| 1504 |
+
| mse_q3 | 0.00032 |
|
| 1505 |
+
| param_norm | 212 |
|
| 1506 |
+
| samples | 1.06e+06 |
|
| 1507 |
+
| step | 6.6e+04 |
|
| 1508 |
+
| vb | 0.00382 |
|
| 1509 |
+
| vb_q0 | 0.0154 |
|
| 1510 |
+
| vb_q1 | 0.000122 |
|
| 1511 |
+
| vb_q2 | 2.85e-05 |
|
| 1512 |
+
| vb_q3 | 3.94e-06 |
|
| 1513 |
+
-------------------------
|
| 1514 |
+
-------------------------
|
| 1515 |
+
| grad_norm | 0.0545 |
|
| 1516 |
+
| loss | 0.0326 |
|
| 1517 |
+
| loss_q0 | 0.111 |
|
| 1518 |
+
| loss_q1 | 0.0166 |
|
| 1519 |
+
| loss_q2 | 0.00322 |
|
| 1520 |
+
| loss_q3 | 0.00032 |
|
| 1521 |
+
| mse | 0.0288 |
|
| 1522 |
+
| mse_q0 | 0.0955 |
|
| 1523 |
+
| mse_q1 | 0.0164 |
|
| 1524 |
+
| mse_q2 | 0.00319 |
|
| 1525 |
+
| mse_q3 | 0.000316 |
|
| 1526 |
+
| param_norm | 213 |
|
| 1527 |
+
| samples | 1.07e+06 |
|
| 1528 |
+
| step | 6.7e+04 |
|
| 1529 |
+
| vb | 0.00382 |
|
| 1530 |
+
| vb_q0 | 0.0152 |
|
| 1531 |
+
| vb_q1 | 0.000121 |
|
| 1532 |
+
| vb_q2 | 2.83e-05 |
|
| 1533 |
+
| vb_q3 | 3.89e-06 |
|
| 1534 |
+
-------------------------
|
| 1535 |
+
-------------------------
|
| 1536 |
+
| grad_norm | 0.0563 |
|
| 1537 |
+
| loss | 0.0335 |
|
| 1538 |
+
| loss_q0 | 0.114 |
|
| 1539 |
+
| loss_q1 | 0.0165 |
|
| 1540 |
+
| loss_q2 | 0.0032 |
|
| 1541 |
+
| loss_q3 | 0.000325 |
|
| 1542 |
+
| mse | 0.0294 |
|
| 1543 |
+
| mse_q0 | 0.098 |
|
| 1544 |
+
| mse_q1 | 0.0164 |
|
| 1545 |
+
| mse_q2 | 0.00317 |
|
| 1546 |
+
| mse_q3 | 0.000321 |
|
| 1547 |
+
| param_norm | 213 |
|
| 1548 |
+
| samples | 1.09e+06 |
|
| 1549 |
+
| step | 6.8e+04 |
|
| 1550 |
+
| vb | 0.00401 |
|
| 1551 |
+
| vb_q0 | 0.0159 |
|
| 1552 |
+
| vb_q1 | 0.000121 |
|
| 1553 |
+
| vb_q2 | 2.81e-05 |
|
| 1554 |
+
| vb_q3 | 3.96e-06 |
|
| 1555 |
+
-------------------------
|
| 1556 |
+
-------------------------
|
| 1557 |
+
| grad_norm | 0.055 |
|
| 1558 |
+
| loss | 0.0318 |
|
| 1559 |
+
| loss_q0 | 0.107 |
|
| 1560 |
+
| loss_q1 | 0.0168 |
|
| 1561 |
+
| loss_q2 | 0.00323 |
|
| 1562 |
+
| loss_q3 | 0.000317 |
|
| 1563 |
+
| mse | 0.0287 |
|
| 1564 |
+
| mse_q0 | 0.0942 |
|
| 1565 |
+
| mse_q1 | 0.0166 |
|
| 1566 |
+
| mse_q2 | 0.00321 |
|
| 1567 |
+
| mse_q3 | 0.000313 |
|
| 1568 |
+
| param_norm | 214 |
|
| 1569 |
+
| samples | 1.1e+06 |
|
| 1570 |
+
| step | 6.9e+04 |
|
| 1571 |
+
| vb | 0.00313 |
|
| 1572 |
+
| vb_q0 | 0.0124 |
|
| 1573 |
+
| vb_q1 | 0.000123 |
|
| 1574 |
+
| vb_q2 | 2.84e-05 |
|
| 1575 |
+
| vb_q3 | 3.86e-06 |
|
| 1576 |
+
-------------------------
|
| 1577 |
+
-------------------------
|
| 1578 |
+
| grad_norm | 0.0537 |
|
| 1579 |
+
| loss | 0.0316 |
|
| 1580 |
+
| loss_q0 | 0.105 |
|
| 1581 |
+
| loss_q1 | 0.0166 |
|
| 1582 |
+
| loss_q2 | 0.00318 |
|
| 1583 |
+
| loss_q3 | 0.000318 |
|
| 1584 |
+
| mse | 0.0286 |
|
| 1585 |
+
| mse_q0 | 0.0936 |
|
| 1586 |
+
| mse_q1 | 0.0165 |
|
| 1587 |
+
| mse_q2 | 0.00315 |
|
| 1588 |
+
| mse_q3 | 0.000314 |
|
| 1589 |
+
| param_norm | 215 |
|
| 1590 |
+
| samples | 1.12e+06 |
|
| 1591 |
+
| step | 7e+04 |
|
| 1592 |
+
| vb | 0.00302 |
|
| 1593 |
+
| vb_q0 | 0.0118 |
|
| 1594 |
+
| vb_q1 | 0.000122 |
|
| 1595 |
+
| vb_q2 | 2.8e-05 |
|
| 1596 |
+
| vb_q3 | 3.87e-06 |
|
| 1597 |
+
-------------------------
|
| 1598 |
+
saving model 0...
|
| 1599 |
+
saving model 0.995...
|
| 1600 |
+
evaluation indistro starting...
|
| 1601 |
+
done 96 samples: bpd=3.8689794540405273
|
| 1602 |
+
done 192 samples: bpd=3.703700542449951
|
| 1603 |
+
done 288 samples: bpd=3.6549039681752524
|
| 1604 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_indistro_terms.npz
|
| 1605 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_indistro_terms.npz
|
| 1606 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model70000_indistro_terms.npz
|
| 1607 |
+
evaluation nll complete
|
| 1608 |
+
evaluation outdistro starting...
|
| 1609 |
+
done 192 samples: bpd=3.788196086883545
|
| 1610 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_outdistro_terms.npz
|
| 1611 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_outdistro_terms.npz
|
| 1612 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model70000_outdistro_terms.npz
|
| 1613 |
+
evaluation nll complete
|
| 1614 |
+
sampling starting...
|
| 1615 |
+
-------------------------
|
| 1616 |
+
| grad_norm | 0.0552 |
|
| 1617 |
+
| loss | 0.0336 |
|
| 1618 |
+
| loss_q0 | 0.112 |
|
| 1619 |
+
| loss_q1 | 0.0168 |
|
| 1620 |
+
| loss_q2 | 0.00322 |
|
| 1621 |
+
| loss_q3 | 0.00032 |
|
| 1622 |
+
| mse | 0.0297 |
|
| 1623 |
+
| mse_q0 | 0.0973 |
|
| 1624 |
+
| mse_q1 | 0.0166 |
|
| 1625 |
+
| mse_q2 | 0.00319 |
|
| 1626 |
+
| mse_q3 | 0.000316 |
|
| 1627 |
+
| param_norm | 215 |
|
| 1628 |
+
| samples | 1.14e+06 |
|
| 1629 |
+
| step | 7.1e+04 |
|
| 1630 |
+
| vb | 0.00389 |
|
| 1631 |
+
| vb_q0 | 0.0152 |
|
| 1632 |
+
| vb_q1 | 0.000123 |
|
| 1633 |
+
| vb_q2 | 2.83e-05 |
|
| 1634 |
+
| vb_q3 | 3.9e-06 |
|
| 1635 |
+
-------------------------
|
| 1636 |
+
-------------------------
|
| 1637 |
+
| grad_norm | 0.0521 |
|
| 1638 |
+
| loss | 0.0323 |
|
| 1639 |
+
| loss_q0 | 0.109 |
|
| 1640 |
+
| loss_q1 | 0.0167 |
|
| 1641 |
+
| loss_q2 | 0.00316 |
|
| 1642 |
+
| loss_q3 | 0.000313 |
|
| 1643 |
+
| mse | 0.0285 |
|
| 1644 |
+
| mse_q0 | 0.0942 |
|
| 1645 |
+
| mse_q1 | 0.0166 |
|
| 1646 |
+
| mse_q2 | 0.00313 |
|
| 1647 |
+
| mse_q3 | 0.00031 |
|
| 1648 |
+
| param_norm | 216 |
|
| 1649 |
+
| samples | 1.15e+06 |
|
| 1650 |
+
| step | 7.2e+04 |
|
| 1651 |
+
| vb | 0.00381 |
|
| 1652 |
+
| vb_q0 | 0.0151 |
|
| 1653 |
+
| vb_q1 | 0.000123 |
|
| 1654 |
+
| vb_q2 | 2.78e-05 |
|
| 1655 |
+
| vb_q3 | 3.81e-06 |
|
| 1656 |
+
-------------------------
|
| 1657 |
+
-------------------------
|
| 1658 |
+
| grad_norm | 0.056 |
|
| 1659 |
+
| loss | 0.0321 |
|
| 1660 |
+
| loss_q0 | 0.109 |
|
| 1661 |
+
| loss_q1 | 0.0165 |
|
| 1662 |
+
| loss_q2 | 0.00314 |
|
| 1663 |
+
| loss_q3 | 0.000315 |
|
| 1664 |
+
| mse | 0.029 |
|
| 1665 |
+
| mse_q0 | 0.0965 |
|
| 1666 |
+
| mse_q1 | 0.0164 |
|
| 1667 |
+
| mse_q2 | 0.00312 |
|
| 1668 |
+
| mse_q3 | 0.000311 |
|
| 1669 |
+
| param_norm | 216 |
|
| 1670 |
+
| samples | 1.17e+06 |
|
| 1671 |
+
| step | 7.3e+04 |
|
| 1672 |
+
| vb | 0.00309 |
|
| 1673 |
+
| vb_q0 | 0.0123 |
|
| 1674 |
+
| vb_q1 | 0.000121 |
|
| 1675 |
+
| vb_q2 | 2.78e-05 |
|
| 1676 |
+
| vb_q3 | 3.84e-06 |
|
| 1677 |
+
-------------------------
|
| 1678 |
+
-------------------------
|
| 1679 |
+
| grad_norm | 0.0551 |
|
| 1680 |
+
| loss | 0.0329 |
|
| 1681 |
+
| loss_q0 | 0.11 |
|
| 1682 |
+
| loss_q1 | 0.0163 |
|
| 1683 |
+
| loss_q2 | 0.00321 |
|
| 1684 |
+
| loss_q3 | 0.00032 |
|
| 1685 |
+
| mse | 0.029 |
|
| 1686 |
+
| mse_q0 | 0.0948 |
|
| 1687 |
+
| mse_q1 | 0.0162 |
|
| 1688 |
+
| mse_q2 | 0.00318 |
|
| 1689 |
+
| mse_q3 | 0.000316 |
|
| 1690 |
+
| param_norm | 217 |
|
| 1691 |
+
| samples | 1.18e+06 |
|
| 1692 |
+
| step | 7.4e+04 |
|
| 1693 |
+
| vb | 0.0039 |
|
| 1694 |
+
| vb_q0 | 0.0152 |
|
| 1695 |
+
| vb_q1 | 0.00012 |
|
| 1696 |
+
| vb_q2 | 2.82e-05 |
|
| 1697 |
+
| vb_q3 | 3.88e-06 |
|
| 1698 |
+
-------------------------
|
| 1699 |
+
-------------------------
|
| 1700 |
+
| grad_norm | 0.0539 |
|
| 1701 |
+
| loss | 0.0323 |
|
| 1702 |
+
| loss_q0 | 0.112 |
|
| 1703 |
+
| loss_q1 | 0.0163 |
|
| 1704 |
+
| loss_q2 | 0.00319 |
|
| 1705 |
+
| loss_q3 | 0.000316 |
|
| 1706 |
+
| mse | 0.0286 |
|
| 1707 |
+
| mse_q0 | 0.0974 |
|
| 1708 |
+
| mse_q1 | 0.0162 |
|
| 1709 |
+
| mse_q2 | 0.00316 |
|
| 1710 |
+
| mse_q3 | 0.000313 |
|
| 1711 |
+
| param_norm | 217 |
|
| 1712 |
+
| samples | 1.2e+06 |
|
| 1713 |
+
| step | 7.5e+04 |
|
| 1714 |
+
| vb | 0.00365 |
|
| 1715 |
+
| vb_q0 | 0.0148 |
|
| 1716 |
+
| vb_q1 | 0.00012 |
|
| 1717 |
+
| vb_q2 | 2.81e-05 |
|
| 1718 |
+
| vb_q3 | 3.85e-06 |
|
| 1719 |
+
-------------------------
|
| 1720 |
+
-------------------------
|
| 1721 |
+
| grad_norm | 0.053 |
|
| 1722 |
+
| loss | 0.0342 |
|
| 1723 |
+
| loss_q0 | 0.116 |
|
| 1724 |
+
| loss_q1 | 0.0166 |
|
| 1725 |
+
| loss_q2 | 0.00318 |
|
| 1726 |
+
| loss_q3 | 0.000306 |
|
| 1727 |
+
| mse | 0.0296 |
|
| 1728 |
+
| mse_q0 | 0.0982 |
|
| 1729 |
+
| mse_q1 | 0.0164 |
|
| 1730 |
+
| mse_q2 | 0.00315 |
|
| 1731 |
+
| mse_q3 | 0.000303 |
|
| 1732 |
+
| param_norm | 218 |
|
| 1733 |
+
| samples | 1.22e+06 |
|
| 1734 |
+
| step | 7.6e+04 |
|
| 1735 |
+
| vb | 0.00462 |
|
| 1736 |
+
| vb_q0 | 0.0183 |
|
| 1737 |
+
| vb_q1 | 0.000122 |
|
| 1738 |
+
| vb_q2 | 2.8e-05 |
|
| 1739 |
+
| vb_q3 | 3.73e-06 |
|
| 1740 |
+
-------------------------
|
| 1741 |
+
-------------------------
|
| 1742 |
+
| grad_norm | 0.0529 |
|
| 1743 |
+
| loss | 0.0316 |
|
| 1744 |
+
| loss_q0 | 0.107 |
|
| 1745 |
+
| loss_q1 | 0.0164 |
|
| 1746 |
+
| loss_q2 | 0.00313 |
|
| 1747 |
+
| loss_q3 | 0.000315 |
|
| 1748 |
+
| mse | 0.0285 |
|
| 1749 |
+
| mse_q0 | 0.0946 |
|
| 1750 |
+
| mse_q1 | 0.0163 |
|
| 1751 |
+
| mse_q2 | 0.00311 |
|
| 1752 |
+
| mse_q3 | 0.000311 |
|
| 1753 |
+
| param_norm | 218 |
|
| 1754 |
+
| samples | 1.23e+06 |
|
| 1755 |
+
| step | 7.7e+04 |
|
| 1756 |
+
| vb | 0.00309 |
|
| 1757 |
+
| vb_q0 | 0.0122 |
|
| 1758 |
+
| vb_q1 | 0.00012 |
|
| 1759 |
+
| vb_q2 | 2.77e-05 |
|
| 1760 |
+
| vb_q3 | 3.82e-06 |
|
| 1761 |
+
-------------------------
|
| 1762 |
+
-------------------------
|
| 1763 |
+
| grad_norm | 0.0518 |
|
| 1764 |
+
| loss | 0.0333 |
|
| 1765 |
+
| loss_q0 | 0.117 |
|
| 1766 |
+
| loss_q1 | 0.0163 |
|
| 1767 |
+
| loss_q2 | 0.00321 |
|
| 1768 |
+
| loss_q3 | 0.000305 |
|
| 1769 |
+
| mse | 0.0287 |
|
| 1770 |
+
| mse_q0 | 0.098 |
|
| 1771 |
+
| mse_q1 | 0.0162 |
|
| 1772 |
+
| mse_q2 | 0.00319 |
|
| 1773 |
+
| mse_q3 | 0.000301 |
|
| 1774 |
+
| param_norm | 219 |
|
| 1775 |
+
| samples | 1.25e+06 |
|
| 1776 |
+
| step | 7.8e+04 |
|
| 1777 |
+
| vb | 0.00466 |
|
| 1778 |
+
| vb_q0 | 0.0191 |
|
| 1779 |
+
| vb_q1 | 0.00012 |
|
| 1780 |
+
| vb_q2 | 2.83e-05 |
|
| 1781 |
+
| vb_q3 | 3.71e-06 |
|
| 1782 |
+
-------------------------
|
| 1783 |
+
-------------------------
|
| 1784 |
+
| grad_norm | 0.0557 |
|
| 1785 |
+
| loss | 0.0322 |
|
| 1786 |
+
| loss_q0 | 0.11 |
|
| 1787 |
+
| loss_q1 | 0.0166 |
|
| 1788 |
+
| loss_q2 | 0.00322 |
|
| 1789 |
+
| loss_q3 | 0.000315 |
|
| 1790 |
+
| mse | 0.0285 |
|
| 1791 |
+
| mse_q0 | 0.0949 |
|
| 1792 |
+
| mse_q1 | 0.0165 |
|
| 1793 |
+
| mse_q2 | 0.00319 |
|
| 1794 |
+
| mse_q3 | 0.000312 |
|
| 1795 |
+
| param_norm | 219 |
|
| 1796 |
+
| samples | 1.26e+06 |
|
| 1797 |
+
| step | 7.9e+04 |
|
| 1798 |
+
| vb | 0.00366 |
|
| 1799 |
+
| vb_q0 | 0.0146 |
|
| 1800 |
+
| vb_q1 | 0.000122 |
|
| 1801 |
+
| vb_q2 | 2.83e-05 |
|
| 1802 |
+
| vb_q3 | 3.83e-06 |
|
| 1803 |
+
-------------------------
|
| 1804 |
+
-------------------------
|
| 1805 |
+
| grad_norm | 0.0526 |
|
| 1806 |
+
| loss | 0.031 |
|
| 1807 |
+
| loss_q0 | 0.107 |
|
| 1808 |
+
| loss_q1 | 0.0165 |
|
| 1809 |
+
| loss_q2 | 0.00321 |
|
| 1810 |
+
| loss_q3 | 0.000306 |
|
| 1811 |
+
| mse | 0.0276 |
|
| 1812 |
+
| mse_q0 | 0.0935 |
|
| 1813 |
+
| mse_q1 | 0.0164 |
|
| 1814 |
+
| mse_q2 | 0.00319 |
|
| 1815 |
+
| mse_q3 | 0.000303 |
|
| 1816 |
+
| param_norm | 220 |
|
| 1817 |
+
| samples | 1.28e+06 |
|
| 1818 |
+
| step | 8e+04 |
|
| 1819 |
+
| vb | 0.00343 |
|
| 1820 |
+
| vb_q0 | 0.014 |
|
| 1821 |
+
| vb_q1 | 0.000121 |
|
| 1822 |
+
| vb_q2 | 2.83e-05 |
|
| 1823 |
+
| vb_q3 | 3.73e-06 |
|
| 1824 |
+
-------------------------
|
| 1825 |
+
saving model 0...
|
| 1826 |
+
saving model 0.995...
|
| 1827 |
+
evaluation indistro starting...
|
| 1828 |
+
done 96 samples: bpd=3.589547634124756
|
| 1829 |
+
done 192 samples: bpd=3.518894910812378
|
| 1830 |
+
done 288 samples: bpd=3.5158642133076987
|
| 1831 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_indistro_terms.npz
|
| 1832 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_indistro_terms.npz
|
| 1833 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model80000_indistro_terms.npz
|
| 1834 |
+
evaluation nll complete
|
| 1835 |
+
evaluation outdistro starting...
|
| 1836 |
+
done 192 samples: bpd=3.783998489379883
|
| 1837 |
+
saving vb terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_outdistro_terms.npz
|
| 1838 |
+
saving mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_outdistro_terms.npz
|
| 1839 |
+
saving xstart_mse terms to /scratch/gigi/fsddpm/cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model80000_outdistro_terms.npz
|
| 1840 |
+
evaluation nll complete
|
| 1841 |
+
sampling starting...
|
| 1842 |
+
-------------------------
|
| 1843 |
+
| grad_norm | 0.0541 |
|
| 1844 |
+
| loss | 0.0329 |
|
| 1845 |
+
| loss_q0 | 0.111 |
|
| 1846 |
+
| loss_q1 | 0.0166 |
|
| 1847 |
+
| loss_q2 | 0.00321 |
|
| 1848 |
+
| loss_q3 | 0.000311 |
|
| 1849 |
+
| mse | 0.0292 |
|
| 1850 |
+
| mse_q0 | 0.0963 |
|
| 1851 |
+
| mse_q1 | 0.0165 |
|
| 1852 |
+
| mse_q2 | 0.00318 |
|
| 1853 |
+
| mse_q3 | 0.000308 |
|
| 1854 |
+
| param_norm | 221 |
|
| 1855 |
+
| samples | 1.3e+06 |
|
| 1856 |
+
| step | 8.1e+04 |
|
| 1857 |
+
| vb | 0.00363 |
|
| 1858 |
+
| vb_q0 | 0.0143 |
|
| 1859 |
+
| vb_q1 | 0.000122 |
|
| 1860 |
+
| vb_q2 | 2.82e-05 |
|
| 1861 |
+
| vb_q3 | 3.79e-06 |
|
| 1862 |
+
-------------------------
|
| 1863 |
+
-------------------------
|
| 1864 |
+
| grad_norm | 0.0519 |
|
| 1865 |
+
| loss | 0.034 |
|
| 1866 |
+
| loss_q0 | 0.116 |
|
| 1867 |
+
| loss_q1 | 0.0167 |
|
| 1868 |
+
| loss_q2 | 0.0032 |
|
| 1869 |
+
| loss_q3 | 0.000307 |
|
| 1870 |
+
| mse | 0.0295 |
|
| 1871 |
+
| mse_q0 | 0.0981 |
|
| 1872 |
+
| mse_q1 | 0.0166 |
|
| 1873 |
+
| mse_q2 | 0.00317 |
|
| 1874 |
+
| mse_q3 | 0.000303 |
|
| 1875 |
+
| param_norm | 221 |
|
| 1876 |
+
| samples | 1.31e+06 |
|
| 1877 |
+
| step | 8.2e+04 |
|
| 1878 |
+
| vb | 0.0045 |
|
| 1879 |
+
| vb_q0 | 0.0179 |
|
| 1880 |
+
| vb_q1 | 0.000122 |
|
| 1881 |
+
| vb_q2 | 2.82e-05 |
|
| 1882 |
+
| vb_q3 | 3.73e-06 |
|
| 1883 |
+
-------------------------
|
| 1884 |
+
-------------------------
|
| 1885 |
+
| grad_norm | 0.0539 |
|
| 1886 |
+
| loss | 0.032 |
|
| 1887 |
+
| loss_q0 | 0.107 |
|
| 1888 |
+
| loss_q1 | 0.0165 |
|
| 1889 |
+
| loss_q2 | 0.00318 |
|
| 1890 |
+
| loss_q3 | 0.000305 |
|
| 1891 |
+
| mse | 0.0288 |
|
| 1892 |
+
| mse_q0 | 0.0941 |
|
| 1893 |
+
| mse_q1 | 0.0164 |
|
| 1894 |
+
| mse_q2 | 0.00315 |
|
| 1895 |
+
| mse_q3 | 0.000301 |
|
| 1896 |
+
| param_norm | 222 |
|
| 1897 |
+
| samples | 1.33e+06 |
|
| 1898 |
+
| step | 8.3e+04 |
|
| 1899 |
+
| vb | 0.00327 |
|
| 1900 |
+
| vb_q0 | 0.0127 |
|
| 1901 |
+
| vb_q1 | 0.000121 |
|
| 1902 |
+
| vb_q2 | 2.8e-05 |
|
| 1903 |
+
| vb_q3 | 3.71e-06 |
|
| 1904 |
+
-------------------------
|
| 1905 |
+
-------------------------
|
| 1906 |
+
| grad_norm | 0.0548 |
|
| 1907 |
+
| loss | 0.0326 |
|
| 1908 |
+
| loss_q0 | 0.111 |
|
| 1909 |
+
| loss_q1 | 0.0164 |
|
| 1910 |
+
| loss_q2 | 0.00321 |
|
| 1911 |
+
| loss_q3 | 0.000306 |
|
| 1912 |
+
| mse | 0.0289 |
|
| 1913 |
+
| mse_q0 | 0.0961 |
|
| 1914 |
+
| mse_q1 | 0.0163 |
|
| 1915 |
+
| mse_q2 | 0.00318 |
|
| 1916 |
+
| mse_q3 | 0.000302 |
|
| 1917 |
+
| param_norm | 222 |
|
| 1918 |
+
| samples | 1.34e+06 |
|
| 1919 |
+
| step | 8.4e+04 |
|
| 1920 |
+
| vb | 0.00375 |
|
| 1921 |
+
| vb_q0 | 0.0149 |
|
| 1922 |
+
| vb_q1 | 0.000121 |
|
| 1923 |
+
| vb_q2 | 2.82e-05 |
|
| 1924 |
+
| vb_q3 | 3.72e-06 |
|
| 1925 |
+
-------------------------
|
| 1926 |
+
-------------------------
|
| 1927 |
+
| grad_norm | 0.0538 |
|
| 1928 |
+
| loss | 0.033 |
|
| 1929 |
+
| loss_q0 | 0.112 |
|
| 1930 |
+
| loss_q1 | 0.0164 |
|
| 1931 |
+
| loss_q2 | 0.00319 |
|
| 1932 |
+
| loss_q3 | 0.000304 |
|
| 1933 |
+
| mse | 0.0287 |
|
| 1934 |
+
| mse_q0 | 0.0949 |
|
| 1935 |
+
| mse_q1 | 0.0163 |
|
| 1936 |
+
| mse_q2 | 0.00317 |
|
| 1937 |
+
| mse_q3 | 0.0003 |
|
| 1938 |
+
| param_norm | 223 |
|
| 1939 |
+
| samples | 1.36e+06 |
|
| 1940 |
+
| step | 8.5e+04 |
|
| 1941 |
+
| vb | 0.00431 |
|
| 1942 |
+
| vb_q0 | 0.0171 |
|
| 1943 |
+
| vb_q1 | 0.00012 |
|
| 1944 |
+
| vb_q2 | 2.81e-05 |
|
| 1945 |
+
| vb_q3 | 3.69e-06 |
|
| 1946 |
+
-------------------------
|
| 1947 |
+
-------------------------
|
| 1948 |
+
| grad_norm | 0.0539 |
|
| 1949 |
+
| loss | 0.0326 |
|
| 1950 |
+
| loss_q0 | 0.112 |
|
| 1951 |
+
| loss_q1 | 0.0162 |
|
| 1952 |
+
| loss_q2 | 0.00316 |
|
| 1953 |
+
| loss_q3 | 0.000305 |
|
| 1954 |
+
| mse | 0.0285 |
|
| 1955 |
+
| mse_q0 | 0.0951 |
|
| 1956 |
+
| mse_q1 | 0.0161 |
|
| 1957 |
+
| mse_q2 | 0.00313 |
|
| 1958 |
+
| mse_q3 | 0.000301 |
|
| 1959 |
+
| param_norm | 223 |
|
| 1960 |
+
| samples | 1.38e+06 |
|
| 1961 |
+
| step | 8.6e+04 |
|
| 1962 |
+
| vb | 0.00417 |
|
| 1963 |
+
| vb_q0 | 0.0167 |
|
| 1964 |
+
| vb_q1 | 0.000119 |
|
| 1965 |
+
| vb_q2 | 2.78e-05 |
|
| 1966 |
+
| vb_q3 | 3.7e-06 |
|
| 1967 |
+
-------------------------
|
| 1968 |
+
-------------------------
|
| 1969 |
+
| grad_norm | 0.0528 |
|
| 1970 |
+
| loss | 0.0334 |
|
| 1971 |
+
| loss_q0 | 0.112 |
|
| 1972 |
+
| loss_q1 | 0.0162 |
|
| 1973 |
+
| loss_q2 | 0.00315 |
|
| 1974 |
+
| loss_q3 | 0.000298 |
|
| 1975 |
+
| mse | 0.0294 |
|
| 1976 |
+
| mse_q0 | 0.0967 |
|
| 1977 |
+
| mse_q1 | 0.0161 |
|
| 1978 |
+
| mse_q2 | 0.00312 |
|
| 1979 |
+
| mse_q3 | 0.000294 |
|
| 1980 |
+
| param_norm | 224 |
|
| 1981 |
+
| samples | 1.39e+06 |
|
| 1982 |
+
| step | 8.7e+04 |
|
| 1983 |
+
| vb | 0.00398 |
|
| 1984 |
+
| vb_q0 | 0.0155 |
|
| 1985 |
+
| vb_q1 | 0.000119 |
|
| 1986 |
+
| vb_q2 | 2.78e-05 |
|
| 1987 |
+
| vb_q3 | 3.62e-06 |
|
| 1988 |
+
-------------------------
|
| 1989 |
+
-------------------------
|
| 1990 |
+
| grad_norm | 0.0519 |
|
| 1991 |
+
| loss | 0.0328 |
|
| 1992 |
+
| loss_q0 | 0.112 |
|
| 1993 |
+
| loss_q1 | 0.0163 |
|
| 1994 |
+
| loss_q2 | 0.00322 |
|
| 1995 |
+
| loss_q3 | 0.000293 |
|
| 1996 |
+
| mse | 0.0285 |
|
| 1997 |
+
| mse_q0 | 0.095 |
|
| 1998 |
+
| mse_q1 | 0.0162 |
|
| 1999 |
+
| mse_q2 | 0.00319 |
|
| 2000 |
+
| mse_q3 | 0.00029 |
|
| 2001 |
+
| param_norm | 224 |
|
| 2002 |
+
| samples | 1.41e+06 |
|
| 2003 |
+
| step | 8.8e+04 |
|
| 2004 |
+
| vb | 0.00427 |
|
| 2005 |
+
| vb_q0 | 0.017 |
|
| 2006 |
+
| vb_q1 | 0.00012 |
|
| 2007 |
+
| vb_q2 | 2.83e-05 |
|
| 2008 |
+
| vb_q3 | 3.58e-06 |
|
| 2009 |
+
-------------------------
|
| 2010 |
+
-------------------------
|
| 2011 |
+
| grad_norm | 0.0527 |
|
| 2012 |
+
| loss | 0.0333 |
|
| 2013 |
+
| loss_q0 | 0.113 |
|
| 2014 |
+
| loss_q1 | 0.0163 |
|
| 2015 |
+
| loss_q2 | 0.00317 |
|
| 2016 |
+
| loss_q3 | 0.000296 |
|
| 2017 |
+
| mse | 0.0293 |
|
| 2018 |
+
| mse_q0 | 0.0969 |
|
| 2019 |
+
| mse_q1 | 0.0162 |
|
| 2020 |
+
| mse_q2 | 0.00315 |
|
| 2021 |
+
| mse_q3 | 0.000293 |
|
| 2022 |
+
| param_norm | 225 |
|
| 2023 |
+
| samples | 1.42e+06 |
|
| 2024 |
+
| step | 8.9e+04 |
|
| 2025 |
+
| vb | 0.00403 |
|
| 2026 |
+
| vb_q0 | 0.0158 |
|
| 2027 |
+
| vb_q1 | 0.00012 |
|
| 2028 |
+
| vb_q2 | 2.79e-05 |
|
| 2029 |
+
| vb_q3 | 3.61e-06 |
|
| 2030 |
+
-------------------------
|
| 2031 |
+
-------------------------
|
| 2032 |
+
| grad_norm | 0.0531 |
|
| 2033 |
+
| loss | 0.0321 |
|
| 2034 |
+
| loss_q0 | 0.109 |
|
| 2035 |
+
| loss_q1 | 0.0163 |
|
| 2036 |
+
| loss_q2 | 0.00314 |
|
| 2037 |
+
| loss_q3 | 0.000301 |
|
| 2038 |
+
| mse | 0.0281 |
|
| 2039 |
+
| mse_q0 | 0.0931 |
|
| 2040 |
+
| mse_q1 | 0.0162 |
|
| 2041 |
+
| mse_q2 | 0.00311 |
|
| 2042 |
+
| mse_q3 | 0.000297 |
|
| 2043 |
+
| param_norm | 225 |
|
| 2044 |
+
| samples | 1.44e+06 |
|
| 2045 |
+
| step | 9e+04 |
|
| 2046 |
+
| vb | 0.00403 |
|
| 2047 |
+
| vb_q0 | 0.0161 |
|
| 2048 |
+
| vb_q1 | 0.00012 |
|
| 2049 |
+
| vb_q2 | 2.77e-05 |
|
| 2050 |
+
| vb_q3 | 3.65e-06 |
|
| 2051 |
+
-------------------------
|
| 2052 |
+
saving model 0...
|
| 2053 |
+
saving model 0.995...
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/model090000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:faa39741934e7290b8c99be648286a526d52da84b83913d8c5fc1d2eda742d3e
|
| 3 |
+
size 118795331
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2d9b7055a02de22f4bf1194021fe75f719aed183afa631bf91ddfc96e92950b
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model10000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d2abf9b2d1212b81e1898946fd6b71b7750dc186e48b1967989fd1f592ef1b7
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f680d6299d5a8bea5679596fa5c17907c3e9305b8824b155a0991ff82da708be
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model20000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab566effd6f15e249d3035436290cf4e8f31b794df613b0be0f513aef26c04af
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3fca8434fd5d5cef29f3dcaa57f04aff6fe174803759c1d25a177bdf1c3fe71
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model30000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47eda96e0d93f907ef270723ece66b2a3f58eff338f76860224e9b96feb69672
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98df3087270472019c5ab8615f297b5269042339aaf2c4a3fb3d2e0db459c6df
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model40000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70e798a4fb4501bcdaf45f8ba89b5816e3fc7f56bf06ec09313f2d1d5a3a8591
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0662f34dcda129eaade97d62bb7f0948541a3e3766e36bd2ba9e8c56e61aae1
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model50000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98742f94747784171671e123b6888d7b5c637b49092cc59a94cfa309f8a0681a
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:beda7d927cf4200f1277b3c54d745cfa72b10475ac7ab5ac9b6ec7244ca2e21f
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model60000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a04bebd68bd06c37a5e7b950aff6a0bfc3fbab35a1fd6e2417db3a1bcee3915
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b72fe3fdc5d8f9bc46ce994ad50024562ead5deb8e254be8cbd8ffbbdd37e1f9
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model70000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93ecad13c3f357059a05c94a281553263823029fda7f3a74044264a68d8f0457
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48b234bca5e10af6780f168a2c9607be1b7512264d74acd91b045d282a8ad381
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/mse_model80000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c37c2f003b3fbd8696b86b6c6a27d0370efe75d4f9fa14cdfa95076ecf7cd0d4
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/progress.csv
ADDED
|
@@ -0,0 +1,92 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
grad_norm,loss,loss_q0,loss_q1,loss_q2,loss_q3,mse,mse_q0,mse_q1,mse_q2,mse_q3,param_norm,samples,step,vb,vb_q0,vb_q1,vb_q2,vb_q3
|
| 2 |
+
2.5351430912370003,1.0083870887756348,1.0080348,1.0147415,1.0054059,1.0136827,0.998694896697998,0.99989533,1.0074818,0.9962311,1.0014414,180.41246248133166,16,0,0.009692199528217316,0.008139333,0.0072596963,0.009174611,0.012241336
|
| 3 |
+
0.38749177888836006,0.1188441446544604,0.23050378,0.09230976,0.07746425,0.07026056,0.11248564948420937,0.20805381,0.091629766,0.07674303,0.069372825,180.66343956539816,16016,1000,0.006358495749438592,0.02245115,0.0006805919,0.0007197115,0.00088763604
|
| 4 |
+
0.12307880156062548,0.04229613807797427,0.1380176,0.02121456,0.006024488,0.002998885,0.03858366940822451,0.1235378,0.021058422,0.005970266,0.0029609331,180.98630945099032,32016,2000,0.0037124686531751676,0.014480295,0.00015607383,5.4194606e-05,3.7959086e-05
|
| 5 |
+
0.10861653979302052,0.039761583946645196,0.13161595,0.019968102,0.004992695,0.0019074993,0.03586718766624112,0.116353765,0.01982141,0.0049480926,0.0018834297,181.3068163062271,48016,3000,0.003894396077477716,0.015261498,0.00014671894,4.4623197e-05,2.4088806e-05
|
| 6 |
+
0.09964214955218444,0.03897652612999087,0.13006906,0.019326078,0.0044136457,0.0014531624,0.034191709961276504,0.111236505,0.019184364,0.004374178,0.0014348875,181.6596103300142,64016,4000,0.004784816259354556,0.018831875,0.00014192188,3.9468487e-05,1.8275206e-05
|
| 7 |
+
0.09317443470311265,0.037605101859662635,0.12454447,0.018902501,0.0041123107,0.001154012,0.03368547698156907,0.109276615,0.018763695,0.004075592,0.0011394793,182.04426555810963,80016,5000,0.0039196247911386295,0.015267931,0.0001387761,3.6689344e-05,1.4532697e-05
|
| 8 |
+
0.0886957447274456,0.035527612912002925,0.120667055,0.01854412,0.0040197615,0.0009905453,0.03219566396577278,0.107276805,0.018407892,0.00398406,0.0009781083,182.46636837398046,96016,6000,0.0033319491002730484,0.01339026,0.00013620706,3.5672114e-05,1.2439021e-05
|
| 9 |
+
0.08884252483390416,0.037085171052720405,0.12610608,0.018420853,0.0038603789,0.00089521776,0.03263257407117637,0.10839811,0.018285641,0.0038261223,0.0008839919,182.8893104605321,112016,7000,0.004452596903582152,0.017707948,0.00013522441,3.426993e-05,1.122406e-05
|
| 10 |
+
0.0857711745360411,0.03572559505654495,0.11959203,0.018250594,0.0038038292,0.0008218667,0.03240766271762553,0.10657379,0.018116733,0.0037700704,0.0008115997,183.31371071363583,128016,8000,0.0033179325486016676,0.013017683,0.00013396822,3.3756118e-05,1.0269199e-05
|
| 11 |
+
0.08352209011027495,0.03627534082811327,0.122893825,0.018271394,0.0037806442,0.00076336414,0.032151561991777225,0.10650192,0.018137224,0.0037471913,0.0007538211,183.72409575601273,144016,9000,0.004123778771936488,0.016392084,0.00013416508,3.3446035e-05,9.537006e-06
|
| 12 |
+
0.07819607665340927,0.03558732673386118,0.12148027,0.01801353,0.0037238055,0.0007050081,0.03151981560187414,0.10513709,0.017881062,0.003690869,0.0006962378,184.14608868604898,160016,10000,0.004067511171997459,0.016343135,0.00013240371,3.294034e-05,8.767597e-06
|
| 13 |
+
0.07929677300921607,0.035510201264638455,0.118732445,0.017892234,0.0036725905,0.0006744754,0.0318000881602056,0.10418824,0.017760986,0.0036401371,0.00066605385,184.56062210642554,176016,11000,0.003710113193408687,0.0145442765,0.00013128045,3.245605e-05,8.422207e-06
|
| 14 |
+
0.07606976359003007,0.036228113402612394,0.11915751,0.01767679,0.003570582,0.0006312284,0.03206723391730331,0.1031912,0.017547045,0.0035389613,0.00062336045,184.98705663130787,192016,12000,0.004160879494367684,0.01596667,0.00012979291,3.1647447e-05,7.869366e-06
|
| 15 |
+
0.07580516411874072,0.035391651648562346,0.11950631,0.01797185,0.0035955356,0.00061021117,0.0313885395638644,0.10364518,0.017839914,0.0035637391,0.00060262426,185.4279781777233,208016,13000,0.004003112132235403,0.015860839,0.00013189905,3.1765376e-05,7.586633e-06
|
| 16 |
+
0.07445083135354322,0.03409526038984763,0.11401415,0.017829452,0.003512294,0.0005860707,0.031001788998255484,0.101847194,0.017698564,0.0034811932,0.00057878107,185.87382808638486,224016,14000,0.003093471366293667,0.012167456,0.00013081093,3.108762e-05,7.2855028e-06
|
| 17 |
+
0.07279939663843127,0.034026893349597354,0.11569134,0.01771187,0.0035322888,0.0005639997,0.03078441938618196,0.102721766,0.017581943,0.0035010688,0.000557,186.32704342058275,240016,15000,0.003242473963002344,0.012969432,0.00013002187,3.120578e-05,6.992426e-06
|
| 18 |
+
0.0736225762665543,0.03601916115265344,0.12135752,0.017668933,0.0035753683,0.00055964786,0.031502397187519876,0.10361251,0.017539231,0.0035438044,0.00055272045,186.78717955530357,256016,16000,0.004516764026866449,0.01774468,0.00012970669,3.1536758e-05,6.9295943e-06
|
| 19 |
+
0.07003611841770217,0.03470956698013467,0.115704976,0.017651262,0.003517309,0.00052276324,0.030937781215412487,0.10103667,0.017521774,0.0034862761,0.0005162885,187.2523824098204,272016,17000,0.003771785830802405,0.014667533,0.00012964712,3.101094e-05,6.4721166e-06
|
| 20 |
+
0.07022596794148567,0.033926365358289357,0.11516196,0.01744049,0.0034680655,0.00051565305,0.03027114991284904,0.10055869,0.01731255,0.0034374394,0.00050925295,187.71733501280244,288016,18000,0.0036552153062184476,0.014603293,0.000128011,3.0635038e-05,6.398486e-06
|
| 21 |
+
0.06760526681911644,0.03312311216723178,0.11218125,0.0174029,0.0034353957,0.00050708477,0.030387418352998782,0.101301864,0.017275268,0.0034049859,0.000500825,188.18610723568634,304016,19000,0.0027356939040691984,0.010879083,0.0001276402,3.0393301e-05,6.259092e-06
|
| 22 |
+
0.06846573576417096,0.033713404638692775,0.11369722,0.017500442,0.0034515406,0.00049525604,0.03003398319613185,0.0990803,0.017371753,0.003421087,0.00048912317,188.66174008771435,320016,20000,0.003679421486311178,0.014616791,0.00012848775,3.0460027e-05,6.1334135e-06
|
| 23 |
+
0.06570787989823366,0.034831443264149116,0.117571786,0.017496178,0.003436851,0.00047775477,0.030749482037965188,0.10144187,0.01736774,0.0034065326,0.0004718528,189.14313822414698,336016,21000,0.0040819612771483636,0.016130125,0.00012842721,3.0319676e-05,5.9043014e-06
|
| 24 |
+
0.06500338504391671,0.03312428622506552,0.11410628,0.017498154,0.0034039908,0.00046727248,0.02946588172530758,0.09922673,0.017369624,0.0033738937,0.00046150686,189.61774857027513,352016,22000,0.0036584045571617105,0.01488075,0.00012852503,3.00793e-05,5.7660286e-06
|
| 25 |
+
0.0657523784396333,0.033238833872135755,0.11149831,0.017255954,0.0033713912,0.00046014483,0.02977588848094456,0.097882025,0.017129181,0.003341607,0.0004544512,190.09695096125114,368016,23000,0.003462945427370877,0.013616501,0.00012662949,2.9804314e-05,5.6928247e-06
|
| 26 |
+
0.06446878267604217,0.033497490535024495,0.11571708,0.017133031,0.0033476737,0.00044819817,0.029288049949798722,0.09865497,0.017007345,0.003318086,0.0004426727,190.5726351798022,384016,24000,0.0042094407337172025,0.017061219,0.00012562412,2.9606575e-05,5.524605e-06
|
| 27 |
+
0.06572510668094186,0.033606036777375274,0.1114288,0.01708275,0.0033722003,0.00045098146,0.030121052097296368,0.09795004,0.01695719,0.0033424366,0.00044541157,191.0554391573781,400016,25000,0.003484984657028679,0.013479048,0.0001253517,2.978108e-05,5.5673586e-06
|
| 28 |
+
0.06389940770783689,0.033072616680990874,0.11113418,0.0173054,0.0033691847,0.000437037,0.030025266982149308,0.09912062,0.017178273,0.0033394808,0.00043164505,191.53368998022734,416016,26000,0.003047349801403475,0.012013028,0.00012700053,2.9700044e-05,5.3882854e-06
|
| 29 |
+
0.06202980238335346,0.03186704055382874,0.108990036,0.017358135,0.0033885366,0.0004237423,0.029358124582795436,0.09887371,0.017230764,0.0033586454,0.00041852126,192.02005145146225,432016,27000,0.0025089161274409006,0.010116346,0.00012742964,2.9885457e-05,5.2215532e-06
|
| 30 |
+
0.06507318903432624,0.032704058849951215,0.108584546,0.017107127,0.0034131126,0.00043490744,0.0294432620073203,0.09584253,0.016981384,0.0033830807,0.000429563,192.50872719285462,448016,28000,0.0032607969519249415,0.012741454,0.00012558771,3.006147e-05,5.342524e-06
|
| 31 |
+
0.061742087373785295,0.03350174230337143,0.11429626,0.017215947,0.0033885192,0.00042082704,0.030044486049562672,0.100424126,0.017089764,0.0033586456,0.00041564347,193.0169310468928,464016,29000,0.0034572562404355297,0.013872838,0.00012633206,2.9865563e-05,5.183321e-06
|
| 32 |
+
0.0624551814011085,0.034128661675378626,0.1173962,0.017290827,0.0033605401,0.00042712872,0.029716186567675287,0.09962314,0.01716392,0.0033309173,0.00042187105,193.51515518296767,480016,30000,0.0044124749983238815,0.01777282,0.00012695667,2.9622672e-05,5.256742e-06
|
| 33 |
+
0.062481250851292316,0.03467470299592233,0.116738975,0.017357923,0.0032680791,0.0004129323,0.030620100070722408,0.10083595,0.01723062,0.003239176,0.00040784662,194.01625004377158,496016,31000,0.004054602820269786,0.015903743,0.00012738437,2.8881595e-05,5.0861936e-06
|
| 34 |
+
0.059544816249945745,0.03191653931303892,0.107237056,0.01688988,0.003309901,0.00039750466,0.029257788867224,0.09673227,0.01676584,0.0032806557,0.0003926191,194.50789803887457,512016,32000,0.0026587504843319045,0.010504916,0.00012396519,2.921592e-05,4.88355e-06
|
| 35 |
+
0.06191545396159866,0.032959418754558954,0.11320956,0.017212626,0.0032893242,0.00040001184,0.029583945242222402,0.099553026,0.017086314,0.0032603175,0.00039507487,195.00805649699484,528016,33000,0.003375473534042611,0.013656557,0.00012623,2.9024919e-05,4.931894e-06
|
| 36 |
+
0.06062383562139264,0.03507452268223289,0.1186602,0.017035112,0.003361485,0.00039891747,0.03042809375678185,0.10035401,0.016909963,0.0033318624,0.0003940254,195.51581487298773,544016,34000,0.00464642891728909,0.01830657,0.0001249956,2.9623676e-05,4.8945435e-06
|
| 37 |
+
0.0635884625233498,0.03421822762326342,0.11376807,0.016997557,0.0033168655,0.0003910728,0.03027863175328823,0.098510556,0.016872844,0.0032876404,0.0003862558,196.01952616591777,560016,35000,0.0039395957740707655,0.015257463,0.00012484925,2.9230518e-05,4.8173247e-06
|
| 38 |
+
0.06107008070458716,0.03400131588359365,0.11395261,0.017034004,0.0033417647,0.000391365,0.030032761705573632,0.09844176,0.01690923,0.0033122944,0.00038655792,196.53440023057288,576016,36000,0.0039685542472416195,0.015511259,0.00012491264,2.9460234e-05,4.8053867e-06
|
| 39 |
+
0.05990060420544789,0.031796633830294026,0.110115506,0.017024536,0.0033530544,0.0003873284,0.028481805210001782,0.09654104,0.016899774,0.0033235375,0.00038257174,197.055504963234,592016,37000,0.00331482850082466,0.013573966,0.00012494644,2.9503595e-05,4.7565004e-06
|
| 40 |
+
0.05964728175132119,0.03421506795426823,0.11576267,0.01695003,0.003358747,0.00038322265,0.030042259609093937,0.09927248,0.016825961,0.0033292135,0.00037852148,197.55391341669232,608016,38000,0.004172808433513642,0.016490666,0.00012431541,2.9531342e-05,4.70193e-06
|
| 41 |
+
0.06199229772136795,0.03464131498523055,0.1174464,0.016948694,0.0032748824,0.0003883894,0.02980534010659902,0.09836048,0.016824186,0.0032459898,0.00038362487,198.06088791144228,624016,39000,0.004835974949110094,0.019086318,0.00012441786,2.888706e-05,4.7685703e-06
|
| 42 |
+
0.056173037045499453,0.03355109516414816,0.11292371,0.016729953,0.0033132827,0.00037121255,0.029589416386792435,0.0973765,0.01660693,0.003284098,0.0003666663,198.56081043473,640016,40000,0.00396167884672832,0.015547644,0.00012284327,2.9201183e-05,4.5452493e-06
|
| 43 |
+
0.059586109913723165,0.03439353797165681,0.11501123,0.016799184,0.0032522487,0.00037694137,0.03058620501356197,0.10024245,0.01667592,0.0032235205,0.00037231977,199.07202000917638,656016,41000,0.003807332962431243,0.0147682,0.00012321919,2.872436e-05,4.6212567e-06
|
| 44 |
+
0.05894077335415071,0.032751620854716786,0.11300882,0.016963845,0.003307908,0.00036955116,0.028623223698232256,0.09623524,0.016839366,0.0032787365,0.00036502533,199.58008478395695,672016,42000,0.0041283972965175135,0.016773384,0.00012447062,2.9154508e-05,4.5238708e-06
|
| 45 |
+
0.05868386952980761,0.03294618712179362,0.11097262,0.016964072,0.0033232172,0.00036870345,0.02946679911063989,0.09728215,0.016839681,0.0032939932,0.00036419198,200.0846214186139,688016,43000,0.0034793879719672975,0.013690477,0.00012450444,2.9235018e-05,4.511798e-06
|
| 46 |
+
0.05712984254316217,0.03381405721371992,0.11685681,0.016791698,0.0032206727,0.00036353475,0.02944247466232629,0.09920453,0.016668713,0.003192205,0.00035909005,200.59420255540854,704016,44000,0.004371582545412817,0.017651275,0.00012318294,2.8447348e-05,4.445859e-06
|
| 47 |
+
0.05872447042537553,0.03396594162192185,0.114005156,0.01711849,0.0033121896,0.00036989406,0.030093214575201265,0.09881455,0.016992783,0.0032830366,0.00036537353,201.11641888427923,720016,45000,0.003872727055175347,0.015191066,0.00012560641,2.9149056e-05,4.5206743e-06
|
| 48 |
+
0.06097992962216492,0.03294634878612119,0.110426016,0.016868757,0.0032893084,0.00036801185,0.029851069680182304,0.09827576,0.016744858,0.0032603466,0.00036351025,201.64697269969358,736016,46000,0.00309527928518946,0.0121497195,0.00012382239,2.8945595e-05,4.5013194e-06
|
| 49 |
+
0.05663350393527339,0.03281864472618324,0.11114136,0.017104618,0.003268149,0.00035735714,0.029430219083558716,0.09762698,0.01697898,0.0032393266,0.0003529712,202.18138340129346,752016,47000,0.0033884257052377476,0.013513711,0.00012554179,2.880804e-05,4.385141e-06
|
| 50 |
+
0.06063569568036176,0.03437269755802121,0.113925785,0.016789563,0.0033288866,0.00035659614,0.030504634066950503,0.09906795,0.01666624,0.0032996624,0.00035222422,202.7109620764582,768016,48000,0.0038680633639451042,0.01485805,0.00012322138,2.9250343e-05,4.3697933e-06
|
| 51 |
+
0.05590325931445254,0.032708261736202934,0.108219825,0.016645735,0.003290488,0.0003511349,0.029215563801117245,0.09470438,0.016523577,0.0032615233,0.00034684205,203.2325454028811,784016,49000,0.0034926978458897744,0.013515289,0.00012212881,2.8963383e-05,4.2930833e-06
|
| 52 |
+
0.05887933848793965,0.03376324380328875,0.116158925,0.016920695,0.0032746454,0.00034992793,0.02897768413065938,0.096828245,0.016796345,0.0032458303,0.0003456357,203.76202215823727,800016,50000,0.004785559726273274,0.019329714,0.00012416193,2.8846493e-05,4.291475e-06
|
| 53 |
+
0.05469590156811721,0.032565321495523644,0.11032303,0.016709045,0.0032559878,0.00034908004,0.02907934553176169,0.096488744,0.016586395,0.0032273156,0.00034481476,204.2916254382747,816016,51000,0.0034859760021263273,0.0138334455,0.00012255994,2.866468e-05,4.2657607e-06
|
| 54 |
+
0.05821708565069131,0.03239636913407592,0.109414965,0.016752806,0.0031915545,0.00034925115,0.02922611857857558,0.09686192,0.016630068,0.003163346,0.00034498065,204.81139891476724,832016,52000,0.003170250439259681,0.0125530595,0.00012287298,2.8185024e-05,4.2722245e-06
|
| 55 |
+
0.056472664837151174,0.032827345147263286,0.11111243,0.016775163,0.0032373543,0.0003468643,0.029102278060745435,0.09635251,0.016651995,0.0032088135,0.00034263523,205.34224746566233,848016,53000,0.0037250671177025646,0.014759482,0.00012308097,2.8527791e-05,4.2316706e-06
|
| 56 |
+
0.058580288619056245,0.03378580757998857,0.116668485,0.01680422,0.0032340037,0.00034146922,0.029724239581264543,0.10026108,0.0166807,0.0032055054,0.0003372957,205.87049279340533,864016,54000,0.0040615680630035084,0.01640741,0.00012337447,2.8509008e-05,4.1713724e-06
|
| 57 |
+
0.05577092016550799,0.03361079018889,0.115389265,0.01653975,0.0032588867,0.00034043673,0.029271172700449793,0.098015465,0.016418306,0.0032301627,0.00033628094,206.39883776488094,880016,55000,0.0043396173334149255,0.01737308,0.000121398225,2.8703816e-05,4.1555404e-06
|
| 58 |
+
0.05777157335551956,0.032890599876409285,0.11236597,0.016426073,0.003189053,0.0003412673,0.029044150866800924,0.09706599,0.016305484,0.0031608941,0.00033709285,206.93104066460336,896016,56000,0.0038464491756367383,0.015299772,0.000120635515,2.8174678e-05,4.1754015e-06
|
| 59 |
+
0.0549993421713471,0.032922283426858504,0.11200538,0.01651029,0.003214448,0.00033035304,0.029002052478957843,0.096423775,0.01638919,0.0031861567,0.0003263155,207.46522256001313,912016,57000,0.003920230926469228,0.01558186,0.00012120526,2.8303351e-05,4.0363334e-06
|
| 60 |
+
0.05667900257998245,0.033775523173855654,0.11304036,0.016811568,0.0032695837,0.00033267093,0.029541628846433042,0.0965043,0.016688148,0.0032408198,0.00032860908,208.0033349397023,928016,58000,0.0042338941080270216,0.016535679,0.00012338899,2.8753026e-05,4.060786e-06
|
| 61 |
+
0.056156006808770274,0.03412930240388957,0.11518897,0.016638665,0.0032071744,0.00032965813,0.029538585802540176,0.09722457,0.016516583,0.0031789169,0.0003256278,208.54892494879786,944016,59000,0.0045907166081415205,0.017964583,0.00012210695,2.8254328e-05,4.029121e-06
|
| 62 |
+
0.05911564312284267,0.03229978877119724,0.10923988,0.016702617,0.0032797777,0.000333632,0.028932071614079128,0.095846295,0.0165801,0.0032509386,0.000329559,209.09054022985416,960016,60000,0.003367717187837117,0.013393664,0.00012255066,2.8840614e-05,4.07416e-06
|
| 63 |
+
0.05608525544731012,0.03283120975131181,0.10976717,0.016605306,0.0032396517,0.0003319304,0.029373283780645538,0.096258745,0.016483575,0.0032111153,0.00032788492,209.62571191879317,976016,61000,0.003457925954358867,0.013508584,0.00012169345,2.8519622e-05,4.046387e-06
|
| 64 |
+
0.05501877534166442,0.03297481621825135,0.11257801,0.016683873,0.0032061664,0.00032656046,0.02909935219865291,0.09710706,0.016561648,0.0031779374,0.0003225721,210.16177222075467,992016,62000,0.0038754640472434404,0.015470902,0.00012244807,2.823787e-05,3.9868305e-06
|
| 65 |
+
0.05219062805249584,0.03271656697243452,0.11215093,0.01660635,0.0031688388,0.00032076152,0.029074916717596305,0.0975485,0.016484628,0.00314089,0.00031685104,210.69716152923755,1008016,63000,0.003641650405934349,0.014602079,0.00012182051,2.796042e-05,3.910809e-06
|
| 66 |
+
0.0563183546792654,0.032633363903267196,0.110403255,0.016650705,0.0032242872,0.00033333438,0.028713572517503037,0.094859675,0.016528629,0.0031959028,0.00032927687,211.23255039549332,1024016,64000,0.003919791538915892,0.01554351,0.00012214162,2.8378483e-05,4.059327e-06
|
| 67 |
+
0.05567153185097883,0.03271436781599188,0.11082813,0.016680101,0.003167083,0.0003245076,0.028839432608569044,0.0954411,0.016557798,0.003139104,0.0003205526,211.7938454092672,1040016,65000,0.0038749351028000024,0.015386748,0.00012239139,2.7955537e-05,3.9548736e-06
|
| 68 |
+
0.054521421907489855,0.03198573151091111,0.10981132,0.016658057,0.0032372614,0.00032345607,0.028164957368280685,0.09436482,0.016535752,0.0032087525,0.0003195153,212.34134123745378,1056016,66000,0.0038207741568548935,0.015447455,0.00012225585,2.8481953e-05,3.9391934e-06
|
| 69 |
+
0.05447587863110852,0.03257946248212834,0.110619865,0.016562264,0.00321832,0.00032014225,0.028763761436566723,0.095464736,0.016440779,0.0031900178,0.00031624868,212.88179851937997,1072016,67000,0.0038157009625974718,0.015155151,0.000121496254,2.830203e-05,3.892867e-06
|
| 70 |
+
0.05625929957161441,0.03345432130480183,0.11385384,0.016502324,0.0031968574,0.00032535195,0.02944285704940558,0.09799432,0.016381111,0.0031687305,0.00032139668,213.43198783288094,1088016,68000,0.004011464272607544,0.015859297,0.000121060184,2.8142187e-05,3.955854e-06
|
| 71 |
+
0.055004896501871965,0.03179665893525817,0.106536396,0.016759587,0.003234906,0.0003170966,0.02866484727500941,0.09416932,0.016636532,0.0032064856,0.00031323388,213.97716156854878,1104016,69000,0.003131811674247735,0.012366518,0.0001230559,2.8449249e-05,3.8646804e-06
|
| 72 |
+
0.0536967586134085,0.031609297288116074,0.10543689,0.016608428,0.0031813001,0.00031804832,0.02858661183598451,0.09358934,0.01648658,0.0031532515,0.0003141802,214.52275669607016,1120016,70000,0.003022685538349841,0.011847356,0.00012193782,2.802256e-05,3.869898e-06
|
| 73 |
+
0.055160000674791175,0.03359202911099426,0.11249393,0.016765459,0.003218583,0.0003199129,0.029701160784345104,0.097294256,0.016642336,0.0031902415,0.0003160156,215.0794749861993,1136016,71000,0.0038908681614521056,0.015199085,0.00012300705,2.8343668e-05,3.8999674e-06
|
| 74 |
+
0.052124493352076494,0.032299238147214054,0.10922959,0.016720576,0.0031599372,0.00031348807,0.028491226778831348,0.09415393,0.016597822,0.0031320874,0.00030967535,215.6190056423105,1152016,72000,0.0038080114894764867,0.015075754,0.00012270373,2.7840493e-05,3.8117723e-06
|
| 75 |
+
0.05602791396815743,0.03207306618290028,0.10878707,0.01654309,0.0031445029,0.00031522085,0.028986355684697665,0.09652405,0.016421627,0.0031167322,0.0003113774,216.16338349037008,1168016,73000,0.0030867105857832968,0.012263436,0.000121361336,2.7754784e-05,3.842977e-06
|
| 76 |
+
0.05514118943080267,0.03291953222267334,0.11000037,0.016335782,0.0032078905,0.00031993998,0.02901805261312983,0.094825625,0.016215825,0.003179649,0.0003160567,216.7088737915842,1184016,74000,0.003901479640284375,0.015174718,0.00011994187,2.8248303e-05,3.8848984e-06
|
| 77 |
+
0.053917622368786805,0.03229256081348279,0.112196766,0.016277803,0.0031891218,0.00031636583,0.028643552313558786,0.097388506,0.016158126,0.0031610357,0.00031251617,217.2531572944162,1200016,75000,0.003649008465410592,0.014807831,0.00011950541,2.8058577e-05,3.8494427e-06
|
| 78 |
+
0.052981417029987224,0.0341953547678421,0.116435856,0.016571032,0.0031762663,0.00030623708,0.029571750625269504,0.09816321,0.016449459,0.00314827,0.00030250393,217.80283299053247,1216016,76000,0.004623604139531382,0.018273614,0.00012165095,2.7984212e-05,3.7342302e-06
|
| 79 |
+
0.05289038967522982,0.03162145696440708,0.10671775,0.01638042,0.0031340923,0.0003145785,0.028533928525866923,0.09455053,0.016260015,0.0031064413,0.00031076107,218.34727276351896,1232016,77000,0.0030875285836682413,0.012167565,0.00012020506,2.765851e-05,3.81587e-06
|
| 80 |
+
0.05182882786087654,0.03334044235898181,0.11710279,0.01634992,0.0032149598,0.00030519342,0.028676871411036683,0.097971424,0.016230054,0.0031866871,0.00030148242,218.8977723329652,1248016,78000,0.004663570980301311,0.01913189,0.00011996337,2.8270782e-05,3.7112736e-06
|
| 81 |
+
0.05568380582659867,0.03217754939687437,0.1095662,0.016602147,0.003222337,0.00031537103,0.028514700887724783,0.0949204,0.01648014,0.0031939843,0.00031153962,219.43789728445705,1264016,79000,0.003662848463267439,0.014646563,0.00012193552,2.8328419e-05,3.8329854e-06
|
| 82 |
+
0.052589483680058065,0.031027754681417816,0.10749624,0.016473018,0.0032142357,0.00030646118,0.027600207204464804,0.093507364,0.016352147,0.0031859952,0.00030273027,219.98566685717032,1280016,80000,0.003427547564009729,0.013987808,0.000120873076,2.8261276e-05,3.7290972e-06
|
| 83 |
+
0.05408931870586312,0.03287746825115753,0.11066489,0.016582951,0.0032121951,0.000311349,0.029243982360698296,0.0963409,0.01646148,0.0031839686,0.00030756238,220.53661458609324,1296016,81000,0.0036334858180962267,0.014324212,0.00012168298,2.8221206e-05,3.7859606e-06
|
| 84 |
+
0.05193936758525872,0.034012925043702125,0.11597945,0.016673468,0.0031951754,0.00030703977,0.029514113441342527,0.098124385,0.016551005,0.0031670453,0.00030331008,221.09667476906426,1312016,82000,0.0044988117457196485,0.017854406,0.00012236196,2.815449e-05,3.7301634e-06
|
| 85 |
+
0.05394444767229505,0.032036127452272856,0.1068324,0.016482735,0.0031777814,0.00030481693,0.028769741350319226,0.0940962,0.016361859,0.0031498182,0.00030111158,221.6284145809641,1328016,83000,0.003266386073872127,0.012735808,0.000120988894,2.7968386e-05,3.7091543e-06
|
| 86 |
+
0.05476221005534034,0.0326294223433361,0.11096678,0.01644256,0.0032055858,0.0003057367,0.028880953270941985,0.09606332,0.016321775,0.0031773986,0.0003020142,222.18229749069903,1344016,84000,0.0037484689268530926,0.014904034,0.00012073276,2.8205677e-05,3.7231591e-06
|
| 87 |
+
0.053805872175713636,0.03300966645451257,0.11195825,0.016388921,0.0031943046,0.00030365036,0.028699940414168,0.094897486,0.016268652,0.003166191,0.00029995653,222.72849472724013,1360016,85000,0.004309725956492912,0.017060978,0.000120299104,2.8126971e-05,3.694623e-06
|
| 88 |
+
0.05389630719102992,0.03263209202885624,0.111721896,0.016232198,0.003155762,0.00030469702,0.02846119845774958,0.095052056,0.016112978,0.0031279782,0.00030099525,223.27321970421107,1376016,86000,0.0041708936295944965,0.016670404,0.000119065,2.778399e-05,3.7022885e-06
|
| 89 |
+
0.052768324952189964,0.03336872462159945,0.11223782,0.016193166,0.0031470296,0.00029771673,0.02939277546736413,0.096720085,0.01607432,0.0031192529,0.00029409528,223.82831639236488,1392016,87000,0.003975949179493906,0.015517785,0.00011882389,2.7750488e-05,3.623136e-06
|
| 90 |
+
0.051911611603562696,0.032762888428755056,0.112017736,0.016323732,0.0032191554,0.00029317968,0.02849486762052399,0.09496883,0.016203977,0.0031908704,0.00028960145,224.36776144545254,1408016,88000,0.004268020885701837,0.017048156,0.000119667515,2.8295772e-05,3.5797157e-06
|
| 91 |
+
0.05270384717706044,0.03329609772935519,0.11268163,0.016314829,0.0031742973,0.0002963548,0.029269737612456045,0.09687495,0.016195076,0.0031463364,0.00029274338,224.9106097117001,1424016,89000,0.0040263602071318,0.015806448,0.00011976254,2.794944e-05,3.6102422e-06
|
| 92 |
+
0.05311616907660258,0.03209496235847477,0.10914376,0.016326811,0.0031423385,0.0003005712,0.028060743806883687,0.09305488,0.016206853,0.003114658,0.00029692045,225.45843791482633,1440016,90000,0.004034218460048576,0.016089164,0.000119740245,2.7677215e-05,3.6494046e-06
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb0488329e5e7a4f16c7265d77818bff83125f16e186d03b91211028af455c85
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model10000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d2040c72d075350bc8a4a03728fcc9e55922d1b4ee3bc61d136e5b57882e13a
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d702e8e25f876edd23ae0a331c45037916d8d9c126c20da8e24d6ddbd8ecaef1
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model20000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da10e3c5d24ec7d4e96a0cccc4288a99b32a91d0419173113379c34cebb75731
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:608f40578e49974a7c24abd8f4614150490c7bc075d135e41c5a6302ddf39343
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model30000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7946119a72301e1a1942646ab6cedc426a664219ffade5ce6b4cce7005cb3e6
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c181760e23bc89a3d148f24ed5ff97ef5c6beb93d90613a792c6a37bd8d971ad
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model40000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:649eabfaedbd9b674647dd4cd198867d548aec8505abe9704566bf265a29ec51
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3e8b60c1887915efbe2269a1e0a83f497ff9202ae9333804116d4823d55c8fd
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model50000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:304aa7488bd234365fbed535049492bf714cc7b29d078a62c61d75f256465097
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d88506c55c4433fbaf3048b562d1968f420a8bb9469fbd1914e528b13ef31dd
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model60000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c6d78f2677a88c633a3cdd7de0112af82132153180957f2c6918aec649ae49d
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48191b3527894041c309ba6d1cb07ffa40c9e0569f783c90330f337572c8e73b
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model70000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:865c44b1954ea89629977a6ffb27ae9521c258127b524e8c392ac3dd37245754
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0431935e48e0758773987b33e2412063afe5e6cdb12221988d9f4d6c6d2e8d7d
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/vb_model80000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c782b97d5ea8910de24497f5b30f6487f01eb8d12a384fc723f8639189c90135
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:325e539489c907a4fba19b8dc77839b48ee1f933bc6870fd24686188ae4c67eb
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model10000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a21fdf727a30b3f77a37bcbd836d8324391082da5f89396a92f99a1ae6a8b2bf
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f7a57d3d8156e6e01e397ca2d7883435b6a5bda71a612658945b55c2c1b15fb
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model20000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e62fa8f3e4680b217857c8fe6a589babf8e8efa26ff69e0359d959503130e055
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de8cb0f654d7525729b210d3ca1b89878112dd243a3712f3473bb6345ab51809
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model30000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48e1a3badf5dfcaac116fbf5403c1e1fde1104e291ec70e2d762b94ab1af5edf
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:608192783cc9fc8aa3a4f6a8dbf55d2c0ba46ba50aefaf256dfd30c471c10b90
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model40000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c552e5b68c30b1e0cf62558869408bb00e9db6b15bdd87c1c6c271c581577a09
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90a7f2f517b6cfb13919e493cf2f2216b90587ca38626c9ebcecd5b08558c75e
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model50000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b9c1e33e3996310692e85fb970bd0c0f6f55c60289412dce8c64cfefa24aca2
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_indistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfaa6a6ec8da1851c85dd78abe110fb19fed87128d46819bf6cbe5f82db4a31d
|
| 3 |
+
size 4264
|
cifar100_vfsddpm_vit_film_mean_sigma_deterministic/run-2026-01-02-02-23-04-976947/xstart_mse_model60000_outdistro_terms.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e010e2655fbf8810873c761fde1eb1f62a773c57447b4668ab3bfbe7789ca92
|
| 3 |
+
size 4264
|