best quick_fid_4096=66.906830 step=150000 at 20260310-150207-UTC
Browse files- .gitattributes +2 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/_CHECKPOINT_METADATA +1 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/_METADATA +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/_sharding +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/array_metadatas/process_0 +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/config.json +63 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/d/04c525a1ccccf771d9be43ceb822411b +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/manifest.ocdbt +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/225eaefc2b60c97f537e55e27d61b833 +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/2f1dd57d4934a9f170b7c91961731bcf +3 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/4c815373c9cabfa264637c7db6423857 +3 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/5f6666a182e67ca3c7d364e2c7c41171 +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/98aae8f44070e5e8b096195141329ed0 +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/f9c5c157ce9da85f15c97e64ddb0252f +0 -0
- jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/manifest.ocdbt +0 -0
.gitattributes
CHANGED
|
@@ -79,3 +79,5 @@ baseline_run_5/best/step_150000_20260310-130557-UTC/ocdbt.process_0/d/0722d44421
|
|
| 79 |
baseline_run_5/best/step_150000_20260310-130557-UTC/ocdbt.process_0/d/5f85f80d8957722c3e3b45b51af2f6d1 filter=lfs diff=lfs merge=lfs -text
|
| 80 |
baseline_run_5/best/step_150000_20260310-130557-UTC/ocdbt.process_0/d/9a17087add80ac960097ad02934a5bad filter=lfs diff=lfs merge=lfs -text
|
| 81 |
baseline_run_5/best/step_150000_20260310-130557-UTC/ocdbt.process_0/d/badfab0f4995d2b56bb143323c05e9ca filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
| 79 |
baseline_run_5/best/step_150000_20260310-130557-UTC/ocdbt.process_0/d/5f85f80d8957722c3e3b45b51af2f6d1 filter=lfs diff=lfs merge=lfs -text
|
| 80 |
baseline_run_5/best/step_150000_20260310-130557-UTC/ocdbt.process_0/d/9a17087add80ac960097ad02934a5bad filter=lfs diff=lfs merge=lfs -text
|
| 81 |
baseline_run_5/best/step_150000_20260310-130557-UTC/ocdbt.process_0/d/badfab0f4995d2b56bb143323c05e9ca filter=lfs diff=lfs merge=lfs -text
|
| 82 |
+
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/2f1dd57d4934a9f170b7c91961731bcf filter=lfs diff=lfs merge=lfs -text
|
| 83 |
+
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/4c815373c9cabfa264637c7db6423857 filter=lfs diff=lfs merge=lfs -text
|
jepa2_run/best/step_150000_20260310-150207-UTC/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1773154908818880547, "commit_timestamp_nsecs": 1773154927678365662, "custom_metadata": {}}
|
jepa2_run/best/step_150000_20260310-150207-UTC/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/_sharding
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/array_metadatas/process_0
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"mode": "jepa2",
|
| 3 |
+
"data_dir": "/kaggle/input/datasets/bangchi/miniimagenet256-latents-arrayrecord-sdvae",
|
| 4 |
+
"num_classes": 100,
|
| 5 |
+
"patch_size": 2,
|
| 6 |
+
"hidden_size": 768,
|
| 7 |
+
"depth": 12,
|
| 8 |
+
"num_heads": 12,
|
| 9 |
+
"mlp_ratio": 4.0,
|
| 10 |
+
"opt": "adam",
|
| 11 |
+
"lr": 0.0001,
|
| 12 |
+
"beta1": 0.9,
|
| 13 |
+
"beta2": 0.99,
|
| 14 |
+
"weight_decay": 0.06,
|
| 15 |
+
"global_batch": 128,
|
| 16 |
+
"steps": 200000,
|
| 17 |
+
"seed": 42,
|
| 18 |
+
"class_dropout_prob": 0.2,
|
| 19 |
+
"aug_flip_p": 0.5,
|
| 20 |
+
"aug_jitter_eps": 0.01,
|
| 21 |
+
"t_schedule": "uniform",
|
| 22 |
+
"t_lognorm_mean": -0.4,
|
| 23 |
+
"t_lognorm_std": 1.0,
|
| 24 |
+
"lambda_jepa": 0.1,
|
| 25 |
+
"ema_decay": 0.999,
|
| 26 |
+
"mask_ratio": 0.25,
|
| 27 |
+
"student_layer": 3,
|
| 28 |
+
"teacher_layer": 7,
|
| 29 |
+
"lambda_jepa2": 1.0,
|
| 30 |
+
"jepa2_split_layer": 4,
|
| 31 |
+
"jepa2_mask_lo": 0.2,
|
| 32 |
+
"jepa2_mask_hi": 0.4,
|
| 33 |
+
"jepa2_t_shift": 1.0,
|
| 34 |
+
"jepa2_alpha_lo": 1.4,
|
| 35 |
+
"jepa2_alpha_hi": 2.0,
|
| 36 |
+
"jepa2_sigreg_slices": 512,
|
| 37 |
+
"jepa2_sigreg_sigma": 1.0,
|
| 38 |
+
"jepa2_sigreg_num_points": 17,
|
| 39 |
+
"jepa2_sigreg_domain_lo": -5.0,
|
| 40 |
+
"jepa2_sigreg_domain_hi": 5.0,
|
| 41 |
+
"cfg_scale": 2.0,
|
| 42 |
+
"sample_steps": 128,
|
| 43 |
+
"num_sample_images": 16,
|
| 44 |
+
"fid_n": 4096,
|
| 45 |
+
"fid_cache_path": "checkpoints/fid_real_stats_4096.npz",
|
| 46 |
+
"fid_decode_batch": 128,
|
| 47 |
+
"fid_inception_batch": 128,
|
| 48 |
+
"log_every": 1000,
|
| 49 |
+
"eval_every": 5000,
|
| 50 |
+
"sample_every": 10000,
|
| 51 |
+
"fid_every": 50000,
|
| 52 |
+
"ckpt_every": 100000,
|
| 53 |
+
"run_name": "jepa2_run",
|
| 54 |
+
"ckpt_dir": "/kaggle/working/checkpoints_jepa2",
|
| 55 |
+
"best_metric": "quick_fid_4096",
|
| 56 |
+
"hf_repo_id": "",
|
| 57 |
+
"hf_username": "Bangchis",
|
| 58 |
+
"hf_repo_name": "soft-jepa-flow",
|
| 59 |
+
"hf_private": false,
|
| 60 |
+
"latent_size": 32,
|
| 61 |
+
"latent_channels": 4,
|
| 62 |
+
"vae_scaling_factor": 0.18215
|
| 63 |
+
}
|
jepa2_run/best/step_150000_20260310-150207-UTC/d/04c525a1ccccf771d9be43ceb822411b
ADDED
|
Binary file (7.4 kB). View file
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/manifest.ocdbt
ADDED
|
Binary file (118 Bytes). View file
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/225eaefc2b60c97f537e55e27d61b833
ADDED
|
Binary file (18.3 kB). View file
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/2f1dd57d4934a9f170b7c91961731bcf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ad93d64ca7666c719ce9a18b29785358054100e78c60e5b13f7a184638049e39
|
| 3 |
+
size 366288896
|
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/4c815373c9cabfa264637c7db6423857
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a332050e129c1d7115719836f86eb162fa0deca1eef6c99565f75f9772ce8800
|
| 3 |
+
size 1551015936
|
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/5f6666a182e67ca3c7d364e2c7c41171
ADDED
|
Binary file (560 Bytes). View file
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/98aae8f44070e5e8b096195141329ed0
ADDED
|
Binary file (198 Bytes). View file
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/d/f9c5c157ce9da85f15c97e64ddb0252f
ADDED
|
Binary file (776 Bytes). View file
|
|
|
jepa2_run/best/step_150000_20260310-150207-UTC/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (356 Bytes). View file
|
|
|