AbstractPhil committed on
Commit
7f99c7b
·
verified ·
1 Parent(s): 34412c8

Checkpoint: danbooru-50k-v1-512-2-20251117_060553/step9874

Browse files
danbooru-50k-v1-512-2-20251117_060553/step9874/config.json ADDED
@@ -0,0 +1,130 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sub_name": "danbooru-50k-v1-512-2",
3
+ "num_opinion_anchors": 225,
4
+ "pentachoron_dim": 512,
5
+ "scales": [
6
+ 128,
7
+ 256,
8
+ 512,
9
+ 1024
10
+ ],
11
+ "scale_hidden_dims": {
12
+ "128": 256,
13
+ "256": 512,
14
+ "512": 1024,
15
+ "1024": 2048
16
+ },
17
+ "alpha_init": 0.125,
18
+ "alpha_learnable": true,
19
+ "alpha_per_scale": true,
20
+ "beta_init": 0.5,
21
+ "beta_learnable": true,
22
+ "beta_per_scale": true,
23
+ "gamma_learnable": true,
24
+ "learn_layer_weights": true,
25
+ "siglip_model": "google/siglip-so400m-patch14-384",
26
+ "clip_tokenizer": "openai/clip-vit-large-patch14",
27
+ "illustrious_clip_path": "./models/NAI-11-epsilon_clip_l.safetensors",
28
+ "clip_skip": 1,
29
+ "siglip_layer_indices": [
30
+ 1,
31
+ 2,
32
+ 3,
33
+ 4,
34
+ 5,
35
+ 6,
36
+ 9,
37
+ 12,
38
+ 18,
39
+ 21,
40
+ 23,
41
+ 24,
42
+ 25,
43
+ 26
44
+ ],
45
+ "clip_layer_indices": null,
46
+ "use_gradient_checkpointing": false,
47
+ "share_scale_embeddings": false,
48
+ "dataset_name": "animetimm/danbooru-wdtagger-v4-w640-ws-50k",
49
+ "image_size": 384,
50
+ "max_tag_length": 77,
51
+ "batch_size": 24,
52
+ "num_epochs": 20,
53
+ "learning_rate": 0.0001,
54
+ "weight_decay": 0.01,
55
+ "warmup_steps": 1000,
56
+ "gradient_clip": 1.0,
57
+ "gradient_accumulation_steps": 1,
58
+ "token_loss_weight": 1.0,
59
+ "geometric_weight": 0.1,
60
+ "fusion_strategy": "learned_weighted",
61
+ "text_dropout_prob": 0.3,
62
+ "text_noise_std": 0.1,
63
+ "text_noise_prob": 0.5,
64
+ "vision_only_text": "general: blank_image",
65
+ "text_dropout_schedule": "linear",
66
+ "text_dropout_start": 0.1,
67
+ "text_dropout_end": 0.5,
68
+ "checkpoint_dir": "./checkpoints/liminal_staircase_danbooru",
69
+ "save_every": 500,
70
+ "hf_repo_id": "AbstractPhil/liminal-staircase-v2",
71
+ "hf_upload_every": 1000,
72
+ "hf_private": false,
73
+ "resume": false,
74
+ "log_dir": "./logs/liminal_staircase_danbooru",
75
+ "log_every": 5,
76
+ "device": "cuda",
77
+ "timestamp": "2025-11-17T14:10:35.698828",
78
+ "step": 9874,
79
+ "epoch": 5,
80
+ "val_loss": Infinity,
81
+ "fusion_diagnostics": {
82
+ "layer_weights": [
83
+ 0.04135271906852722,
84
+ 0.040869709104299545,
85
+ 0.042614471167325974,
86
+ 0.041568122804164886,
87
+ 0.04186437278985977,
88
+ 0.04223686456680298,
89
+ 0.03997607156634331,
90
+ 0.04222464561462402,
91
+ 0.03964937850832939,
92
+ 0.038747575134038925,
93
+ 0.03888710215687752,
94
+ 0.03851398453116417,
95
+ 0.0383797213435173,
96
+ 0.03842699155211449,
97
+ 0.038952481001615524,
98
+ 0.038612887263298035,
99
+ 0.03840705752372742,
100
+ 0.03818415477871895,
101
+ 0.03945833817124367,
102
+ 0.040741387754678726,
103
+ 0.040348730981349945,
104
+ 0.04126262664794922,
105
+ 0.04083728790283203,
106
+ 0.03929390013217926,
107
+ 0.03858938068151474
108
+ ],
109
+ "scale_weights": [
110
+ 0.19150905311107635,
111
+ 0.2122136950492859,
112
+ 0.2983412742614746,
113
+ 0.29793596267700195
114
+ ],
115
+ "alpha_per_scale": [
116
+ 0.24941794574260712,
117
+ 0.24941794574260712,
118
+ 0.24941794574260712,
119
+ 0.24941794574260712
120
+ ],
121
+ "beta_per_scale": [
122
+ 0.569037139415741,
123
+ 0.5981298089027405,
124
+ 0.5593996047973633,
125
+ 0.58758544921875
126
+ ],
127
+ "scale_statistics": {}
128
+ },
129
+ "is_best": false
130
+ }
danbooru-50k-v1-512-2-20251117_060553/step9874/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6edaf73851e28edcc9a5cfcb470323a0576ba252de3ef43cb49041c2ca4f4a8
3
+ size 1106728220
danbooru-50k-v1-512-2-20251117_060553/step9874/training_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e93b5d3a5352a989af83b384bcb370ba08cdd0bb2a2872f2a0403ca57e742a5b
3
+ size 2075709603