best quick_fid_4096=374.217712 step=50000 at 20260310-062035-UTC
Browse files- .gitattributes +2 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/_CHECKPOINT_METADATA +1 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/_METADATA +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/_sharding +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/array_metadatas/process_0 +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/config.json +63 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/d/937d29a5a60a5543e84aa1aa02cfa807 +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/manifest.ocdbt +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/144ee7fe81bd3ab92294ecfa31efb382 +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/26f1fa3374f1612480c7e27a492db91c +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/830c0a5c887e795245b090591abf552a +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/a17078b8be935a05c83428e6852d6aae +3 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/afe541b66772ee7a58ce753ae165bcfc +0 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/c389380db73fde17b77dd7b18a0f287e +3 -0
- baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/manifest.ocdbt +0 -0
.gitattributes
CHANGED
|
@@ -61,3 +61,5 @@ jepa2_run/best/step_200000_20260310-021538-UTC/ocdbt.process_0/d/41a74029bb23086
|
|
| 61 |
jepa2_run/best/step_200000_20260310-021538-UTC/ocdbt.process_0/d/5fada07f92c5f470a4c0f793c5eca5fa filter=lfs diff=lfs merge=lfs -text
|
| 62 |
jepa2_run/best/step_200000_20260310-021538-UTC/ocdbt.process_0/d/a3d111d1524ecb78cd4159c4c9b72734 filter=lfs diff=lfs merge=lfs -text
|
| 63 |
jepa2_run/best/step_200000_20260310-021538-UTC/ocdbt.process_0/d/db2450ebf4b361a8fea4f0a983237b6f filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
| 61 |
jepa2_run/best/step_200000_20260310-021538-UTC/ocdbt.process_0/d/5fada07f92c5f470a4c0f793c5eca5fa filter=lfs diff=lfs merge=lfs -text
|
| 62 |
jepa2_run/best/step_200000_20260310-021538-UTC/ocdbt.process_0/d/a3d111d1524ecb78cd4159c4c9b72734 filter=lfs diff=lfs merge=lfs -text
|
| 63 |
jepa2_run/best/step_200000_20260310-021538-UTC/ocdbt.process_0/d/db2450ebf4b361a8fea4f0a983237b6f filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/a17078b8be935a05c83428e6852d6aae filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/c389380db73fde17b77dd7b18a0f287e filter=lfs diff=lfs merge=lfs -text
|
baseline_run_final/best/step_50000_20260310-062035-UTC/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1773123618233733681, "commit_timestamp_nsecs": 1773123635777248032, "custom_metadata": {}}
|
baseline_run_final/best/step_50000_20260310-062035-UTC/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/_sharding
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/array_metadatas/process_0
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"mode": "baseline",
|
| 3 |
+
"data_dir": "/kaggle/input/datasets/bangchi/miniimagenet256-latents-arrayrecord-sdvae",
|
| 4 |
+
"num_classes": 100,
|
| 5 |
+
"patch_size": 2,
|
| 6 |
+
"hidden_size": 768,
|
| 7 |
+
"depth": 12,
|
| 8 |
+
"num_heads": 12,
|
| 9 |
+
"mlp_ratio": 4.0,
|
| 10 |
+
"opt": "adamw",
|
| 11 |
+
"lr": 0.0001,
|
| 12 |
+
"beta1": 0.9,
|
| 13 |
+
"beta2": 0.99,
|
| 14 |
+
"weight_decay": 0.0,
|
| 15 |
+
"global_batch": 256,
|
| 16 |
+
"steps": 300000,
|
| 17 |
+
"seed": 42,
|
| 18 |
+
"class_dropout_prob": 0.2,
|
| 19 |
+
"aug_flip_p": 0.5,
|
| 20 |
+
"aug_jitter_eps": 0.01,
|
| 21 |
+
"t_schedule": "lognormal",
|
| 22 |
+
"t_lognorm_mean": -0.4,
|
| 23 |
+
"t_lognorm_std": 1.0,
|
| 24 |
+
"lambda_jepa": 0.1,
|
| 25 |
+
"ema_decay": 0.999,
|
| 26 |
+
"mask_ratio": 0.25,
|
| 27 |
+
"student_layer": 3,
|
| 28 |
+
"teacher_layer": 7,
|
| 29 |
+
"lambda_jepa2": 1,
|
| 30 |
+
"jepa2_split_layer": 4,
|
| 31 |
+
"jepa2_mask_lo": 0.2,
|
| 32 |
+
"jepa2_mask_hi": 0.4,
|
| 33 |
+
"jepa2_t_shift": 1,
|
| 34 |
+
"jepa2_alpha_lo": 1.4,
|
| 35 |
+
"jepa2_alpha_hi": 2.0,
|
| 36 |
+
"jepa2_sigreg_slices": 512,
|
| 37 |
+
"jepa2_sigreg_sigma": 1.0,
|
| 38 |
+
"jepa2_sigreg_num_points": 17,
|
| 39 |
+
"jepa2_sigreg_domain_lo": -5.0,
|
| 40 |
+
"jepa2_sigreg_domain_hi": 5.0,
|
| 41 |
+
"cfg_scale": 2.0,
|
| 42 |
+
"sample_steps": 128,
|
| 43 |
+
"num_sample_images": 16,
|
| 44 |
+
"fid_n": 4096,
|
| 45 |
+
"fid_cache_path": "checkpoints/fid_real_stats_4096.npz",
|
| 46 |
+
"fid_decode_batch": 128,
|
| 47 |
+
"fid_inception_batch": 128,
|
| 48 |
+
"log_every": 1000,
|
| 49 |
+
"eval_every": 5000,
|
| 50 |
+
"sample_every": 10000,
|
| 51 |
+
"fid_every": 50000,
|
| 52 |
+
"ckpt_every": 100000,
|
| 53 |
+
"run_name": "baseline_run_final",
|
| 54 |
+
"ckpt_dir": "/kaggle/working/checkpoints_jepa2",
|
| 55 |
+
"best_metric": "quick_fid_4096",
|
| 56 |
+
"hf_repo_id": "",
|
| 57 |
+
"hf_username": "Bangchis",
|
| 58 |
+
"hf_repo_name": "soft-jepa-flow",
|
| 59 |
+
"hf_private": false,
|
| 60 |
+
"latent_size": 32,
|
| 61 |
+
"latent_channels": 4,
|
| 62 |
+
"vae_scaling_factor": 0.18215
|
| 63 |
+
}
|
baseline_run_final/best/step_50000_20260310-062035-UTC/d/937d29a5a60a5543e84aa1aa02cfa807
ADDED
|
Binary file (7.23 kB). View file
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/manifest.ocdbt
ADDED
|
Binary file (118 Bytes). View file
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/144ee7fe81bd3ab92294ecfa31efb382
ADDED
|
Binary file (198 Bytes). View file
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/26f1fa3374f1612480c7e27a492db91c
ADDED
|
Binary file (885 Bytes). View file
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/830c0a5c887e795245b090591abf552a
ADDED
|
Binary file (532 Bytes). View file
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/a17078b8be935a05c83428e6852d6aae
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33b457da0e5fa15c0ef96cbbbaa329c2ddb502095125b3bfe8946503ef05c899
|
| 3 |
+
size 1452556288
|
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/afe541b66772ee7a58ce753ae165bcfc
ADDED
|
Binary file (1.08 kB). View file
|
|
|
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/d/c389380db73fde17b77dd7b18a0f287e
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de92c576a0edb94ffada339631b8a32d1e3a32cc25498da05edb716a449d19d1
|
| 3 |
+
size 320159744
|
baseline_run_final/best/step_50000_20260310-062035-UTC/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (345 Bytes). View file
|
|
|