best quick_fid_4096=48.418213 step=150000 at 20260306-013603-UTC
Browse files- .gitattributes +4 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/_CHECKPOINT_METADATA +1 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/_METADATA +0 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/_sharding +0 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/array_metadatas/process_0 +0 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/config.json +51 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/d/3fc88f86120e8eefa61b1d9365a0bb6b +0 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/manifest.ocdbt +0 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/185f8e1627726b8615e6668d22f38117 +3 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/2a987fd68fb1ad99987498ef8b09cc68 +3 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/4c49a96d1a93b413bb569ca87828100f +3 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/9a631f30dccd467b0cd2898fca1d98e6 +0 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/b73d6cab7365f8a17fa4819f214d603d +0 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/c8e8ac49a896dc7fcb82f7373cb11d33 +3 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/d0ded284ed0cdebe52431daddbc532ba +0 -0
- jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/manifest.ocdbt +0 -0
.gitattributes
CHANGED
|
@@ -42,3 +42,7 @@ jepa_full_final/best/step_100000_20260305-235157-UTC/ocdbt.process_0/d/791a5a64e
|
|
| 42 |
jepa_full_final/best/step_100000_20260305-235157-UTC/ocdbt.process_0/d/aaf3588a581047468ad21486c9bd8c54 filter=lfs diff=lfs merge=lfs -text
|
| 43 |
jepa_full_final/best/step_100000_20260305-235157-UTC/ocdbt.process_0/d/c7756d4de2dfd76cf0bdfcb184da596e filter=lfs diff=lfs merge=lfs -text
|
| 44 |
jepa_full_final/best/step_100000_20260305-235157-UTC/ocdbt.process_0/d/df1ad2e6d4e530e4504c482c8bffb276 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 42 |
jepa_full_final/best/step_100000_20260305-235157-UTC/ocdbt.process_0/d/aaf3588a581047468ad21486c9bd8c54 filter=lfs diff=lfs merge=lfs -text
|
| 43 |
jepa_full_final/best/step_100000_20260305-235157-UTC/ocdbt.process_0/d/c7756d4de2dfd76cf0bdfcb184da596e filter=lfs diff=lfs merge=lfs -text
|
| 44 |
jepa_full_final/best/step_100000_20260305-235157-UTC/ocdbt.process_0/d/df1ad2e6d4e530e4504c482c8bffb276 filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/185f8e1627726b8615e6668d22f38117 filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/2a987fd68fb1ad99987498ef8b09cc68 filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/4c49a96d1a93b413bb569ca87828100f filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/c8e8ac49a896dc7fcb82f7373cb11d33 filter=lfs diff=lfs merge=lfs -text
|
jepa_full_final/best/step_150000_20260306-013603-UTC/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1772760944098882186, "commit_timestamp_nsecs": 1772760962871519522, "custom_metadata": {}}
|
jepa_full_final/best/step_150000_20260306-013603-UTC/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa_full_final/best/step_150000_20260306-013603-UTC/_sharding
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa_full_final/best/step_150000_20260306-013603-UTC/array_metadatas/process_0
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa_full_final/best/step_150000_20260306-013603-UTC/config.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"mode": "jepa",
|
| 3 |
+
"data_dir": "/kaggle/input/datasets/bangchi/miniimagenet256-latents-arrayrecord-sdvae",
|
| 4 |
+
"num_classes": 100,
|
| 5 |
+
"patch_size": 2,
|
| 6 |
+
"hidden_size": 768,
|
| 7 |
+
"depth": 12,
|
| 8 |
+
"num_heads": 12,
|
| 9 |
+
"mlp_ratio": 4.0,
|
| 10 |
+
"opt": "adamw",
|
| 11 |
+
"lr": 0.0001,
|
| 12 |
+
"beta1": 0.9,
|
| 13 |
+
"beta2": 0.99,
|
| 14 |
+
"weight_decay": 0.02,
|
| 15 |
+
"global_batch": 256,
|
| 16 |
+
"steps": 300000,
|
| 17 |
+
"seed": 42,
|
| 18 |
+
"class_dropout_prob": 0.1,
|
| 19 |
+
"aug_flip_p": 0.5,
|
| 20 |
+
"aug_jitter_eps": 0.01,
|
| 21 |
+
"t_schedule": "lognormal",
|
| 22 |
+
"t_lognorm_mean": -0.4,
|
| 23 |
+
"t_lognorm_std": 1.0,
|
| 24 |
+
"lambda_jepa": 0.15,
|
| 25 |
+
"ema_decay": 0.995,
|
| 26 |
+
"mask_ratio": 0.3,
|
| 27 |
+
"student_layer": 3,
|
| 28 |
+
"teacher_layer": 7,
|
| 29 |
+
"cfg_scale": 2.0,
|
| 30 |
+
"sample_steps": 128,
|
| 31 |
+
"num_sample_images": 16,
|
| 32 |
+
"fid_n": 4096,
|
| 33 |
+
"fid_cache_path": "/kaggle/working/checkpoints_jepa/fid_real_stats_4096.npz",
|
| 34 |
+
"fid_decode_batch": 128,
|
| 35 |
+
"fid_inception_batch": 128,
|
| 36 |
+
"log_every": 500,
|
| 37 |
+
"eval_every": 5000,
|
| 38 |
+
"sample_every": 10000,
|
| 39 |
+
"fid_every": 50000,
|
| 40 |
+
"ckpt_every": 50000,
|
| 41 |
+
"run_name": "jepa_full_final",
|
| 42 |
+
"ckpt_dir": "/kaggle/working/checkpoints_jepa",
|
| 43 |
+
"best_metric": "quick_fid_4096",
|
| 44 |
+
"hf_repo_id": "",
|
| 45 |
+
"hf_username": "Bangchis",
|
| 46 |
+
"hf_repo_name": "soft-jepa-flow",
|
| 47 |
+
"hf_private": false,
|
| 48 |
+
"latent_size": 32,
|
| 49 |
+
"latent_channels": 4,
|
| 50 |
+
"vae_scaling_factor": 0.18215
|
| 51 |
+
}
|
jepa_full_final/best/step_150000_20260306-013603-UTC/d/3fc88f86120e8eefa61b1d9365a0bb6b
ADDED
|
Binary file (7.8 kB). View file
|
|
|
jepa_full_final/best/step_150000_20260306-013603-UTC/manifest.ocdbt
ADDED
|
Binary file (118 Bytes). View file
|
|
|
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/185f8e1627726b8615e6668d22f38117
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fdfba224456f45b40326e1ea9f2c98182efbf6d66b6db22f740692e20eacdeaa
|
| 3 |
+
size 953565184
|
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/2a987fd68fb1ad99987498ef8b09cc68
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3247b02b4fa75f45f644fc304edee7264bc64bb8b507e93c2ea34d4cd9e903c6
|
| 3 |
+
size 160329728
|
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/4c49a96d1a93b413bb569ca87828100f
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e82d4ae125f6f0395fb41119cedaaf2502525f76bd820fc434af956ff2345a62
|
| 3 |
+
size 617082880
|
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/9a631f30dccd467b0cd2898fca1d98e6
ADDED
|
Binary file (850 Bytes). View file
|
|
|
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/b73d6cab7365f8a17fa4819f214d603d
ADDED
|
Binary file (937 Bytes). View file
|
|
|
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/c8e8ac49a896dc7fcb82f7373cb11d33
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:beeb88f2c810afa26e7c68e6ff1409e04457e7143f8bc01ae6f1580dd17d647f
|
| 3 |
+
size 224653312
|
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/d/d0ded284ed0cdebe52431daddbc532ba
ADDED
|
Binary file (198 Bytes). View file
|
|
|
jepa_full_final/best/step_150000_20260306-013603-UTC/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (408 Bytes). View file
|
|
|