Checkpoint: danbooru-50k-v1-512-20251117_055745/step116

Browse files

Files changed (3) hide show

danbooru-50k-v1-512-20251117_055745/step116/config.json +121 -0
danbooru-50k-v1-512-20251117_055745/step116/model.safetensors +3 -0
danbooru-50k-v1-512-20251117_055745/step116/training_state.pt +3 -0

danbooru-50k-v1-512-20251117_055745/step116/config.json ADDED Viewed

	@@ -0,0 +1,121 @@

+{
+  "sub_name": "danbooru-50k-v1-512",
+  "num_opinion_anchors": 225,
+  "pentachoron_dim": 512,
+  "scales": [
+    128,
+    256,
+    512,
+    1024
+  ],
+  "scale_hidden_dims": {
+    "128": 128,
+    "256": 512,
+    "512": 1024,
+    "1024": 2048
+  },
+  "alpha_init": 0.1,
+  "alpha_learnable": true,
+  "alpha_per_scale": true,
+  "beta_init": 0.5,
+  "beta_learnable": true,
+  "beta_per_scale": true,
+  "gamma_learnable": true,
+  "learn_layer_weights": true,
+  "siglip_model": "google/siglip-so400m-patch14-384",
+  "clip_tokenizer": "openai/clip-vit-large-patch14",
+  "illustrious_clip_path": "./models/NAI-11-epsilon_clip_l.safetensors",
+  "clip_skip": 0,
+  "siglip_layer_indices": [
+    3,
+    6,
+    9,
+    12,
+    21,
+    23,
+    24,
+    25,
+    26
+  ],
+  "clip_layer_indices": null,
+  "use_gradient_checkpointing": false,
+  "share_scale_embeddings": false,
+  "dataset_name": "animetimm/danbooru-wdtagger-v4-w640-ws-50k",
+  "image_size": 384,
+  "max_tag_length": 77,
+  "batch_size": 16,
+  "num_epochs": 3,
+  "learning_rate": 0.0001,
+  "weight_decay": 0.01,
+  "warmup_steps": 1000,
+  "gradient_clip": 1.0,
+  "gradient_accumulation_steps": 1,
+  "token_loss_weight": 1.0,
+  "geometric_weight": 0.1,
+  "fusion_strategy": "learned_weighted",
+  "text_dropout_prob": 0.3,
+  "text_noise_std": 0.1,
+  "text_noise_prob": 0.5,
+  "vision_only_text": "general: blank_image",
+  "text_dropout_schedule": "linear",
+  "text_dropout_start": 0.1,
+  "text_dropout_end": 0.5,
+  "checkpoint_dir": "./checkpoints/liminal_staircase_danbooru",
+  "save_every": 500,
+  "hf_repo_id": "AbstractPhil/liminal-staircase-v2",
+  "hf_upload_every": 1000,
+  "hf_private": false,
+  "resume": true,
+  "log_dir": "./logs/liminal_staircase_danbooru",
+  "log_every": 5,
+  "device": "cuda",
+  "timestamp": "2025-11-17T06:00:46.795492",
+  "step": 116,
+  "epoch": 0,
+  "val_loss": null,
+  "fusion_diagnostics": {
+    "layer_weights": [
+      0.04763081297278404,
+      0.04762101545929909,
+      0.04759393259882927,
+      0.04762202873826027,
+      0.047565292567014694,
+      0.047590624541044235,
+      0.047599051147699356,
+      0.047562386840581894,
+      0.04760372266173363,
+      0.047676656395196915,
+      0.04768342152237892,
+      0.04765501245856285,
+      0.047600556164979935,
+      0.047637615352869034,
+      0.047645460814237595,
+      0.04759979993104935,
+      0.047738682478666306,
+      0.04763513430953026,
+      0.04761926084756851,
+      0.04758467897772789,
+      0.04753493145108223
+    ],
+    "scale_weights": [
+      0.2466253936290741,
+      0.24661938846111298,
+      0.2533079981803894,
+      0.2534472644329071
+    ],
+    "alpha_per_scale": [
+      0.2630360424518585,
+      0.2630360424518585,
+      0.2630360424518585,
+      0.2630360424518585
+    ],
+    "beta_per_scale": [
+      0.6198403835296631,
+      0.6200416088104248,
+      0.6200869679450989,
+      0.6201481819152832
+    ],
+    "scale_statistics": {}
+  },
+  "is_best": false
+}

danbooru-50k-v1-512-20251117_055745/step116/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e7d479fbc8da77d5bf92d67ca27278dc6798b2ed23104034ff0e0589217fc04d
+size 985442620

danbooru-50k-v1-512-20251117_055745/step116/training_state.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68c82e3bcd4e35bb88b0528c29d9d5d6596be0d957be62715d158ba124cddcda
+size 1855182563