Add files using upload-large-folder tool
Browse files- trainer_0/ae.pt +3 -0
- trainer_0/checkpoints/ae_0.pt +3 -0
- trainer_0/checkpoints/ae_13.pt +3 -0
- trainer_0/checkpoints/ae_138.pt +3 -0
- trainer_0/checkpoints/ae_1389.pt +3 -0
- trainer_0/checkpoints/ae_4.pt +3 -0
- trainer_0/checkpoints/ae_43.pt +3 -0
- trainer_0/checkpoints/ae_439.pt +3 -0
- trainer_0/config.json +63 -0
- trainer_1/ae.pt +3 -0
- trainer_1/checkpoints/ae_0.pt +3 -0
- trainer_1/checkpoints/ae_13.pt +3 -0
- trainer_1/checkpoints/ae_138.pt +3 -0
- trainer_1/checkpoints/ae_1389.pt +3 -0
- trainer_1/checkpoints/ae_4.pt +3 -0
- trainer_1/checkpoints/ae_43.pt +3 -0
- trainer_1/checkpoints/ae_439.pt +3 -0
- trainer_1/config.json +63 -0
- trainer_2/ae.pt +3 -0
- trainer_2/checkpoints/ae_0.pt +3 -0
- trainer_2/checkpoints/ae_13.pt +3 -0
- trainer_2/checkpoints/ae_138.pt +3 -0
- trainer_2/checkpoints/ae_1389.pt +3 -0
- trainer_2/checkpoints/ae_4.pt +3 -0
- trainer_2/checkpoints/ae_43.pt +3 -0
- trainer_2/checkpoints/ae_439.pt +3 -0
- trainer_2/config.json +63 -0
- trainer_3/ae.pt +3 -0
- trainer_3/checkpoints/ae_0.pt +3 -0
- trainer_3/checkpoints/ae_13.pt +3 -0
- trainer_3/checkpoints/ae_138.pt +3 -0
- trainer_3/checkpoints/ae_1389.pt +3 -0
- trainer_3/checkpoints/ae_4.pt +3 -0
- trainer_3/checkpoints/ae_43.pt +3 -0
- trainer_3/checkpoints/ae_439.pt +3 -0
- trainer_3/config.json +63 -0
trainer_0/ae.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93ad1dc5e4b31d3b7b6a14f5562ee5008c4706c7bd8cfa02e14715b0c8d96175
|
| 3 |
+
size 4213453
|
trainer_0/checkpoints/ae_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9c3f9911d2bd6e34ebfd5c0519fd6ccb8bac61e88d160abb6d1a12a4efa12b22
|
| 3 |
+
size 4213667
|
trainer_0/checkpoints/ae_13.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f384ea83bec4cf5112301f593a87808b18870f2cd828c2ae9d86b82a2edfeef
|
| 3 |
+
size 4213678
|
trainer_0/checkpoints/ae_138.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:404e51502cf4bc94100320fae36b6ab1955fb2a9ea58fb14120ad061925bfd7a
|
| 3 |
+
size 4213689
|
trainer_0/checkpoints/ae_1389.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e18cbda6e3f98c8dbd9e6b6ed4057d3bf8e12ed5b6022876d67b10a6e3d834cb
|
| 3 |
+
size 4213700
|
trainer_0/checkpoints/ae_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe6a301789ca1ef6cf346dcbf988c2d37d6742b9ca843ca55fc216ebf5435c40
|
| 3 |
+
size 4213667
|
trainer_0/checkpoints/ae_43.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:352bbd7e608d43d238ec94d41ae258783111f1a3425f425ed9dd53d747f6e18f
|
| 3 |
+
size 4213678
|
trainer_0/checkpoints/ae_439.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:923f4053939f42e6b3549476a0239df5ea19eae601bc1cba2c464c2e9b60910a
|
| 3 |
+
size 4213689
|
trainer_0/config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"trainer": {
|
| 3 |
+
"trainer_class": "MatryoshkaBatchTopKTrainer",
|
| 4 |
+
"dict_class": "MatryoshkaBatchTopKSAE",
|
| 5 |
+
"lr": 5e-05,
|
| 6 |
+
"steps": 4394,
|
| 7 |
+
"auxk_alpha": 0.03125,
|
| 8 |
+
"warmup_steps": 1000,
|
| 9 |
+
"decay_start": 3515,
|
| 10 |
+
"threshold_beta": 0.999,
|
| 11 |
+
"threshold_start_step": 1000,
|
| 12 |
+
"top_k_aux": 64,
|
| 13 |
+
"seed": 0,
|
| 14 |
+
"activation_dim": 128,
|
| 15 |
+
"dict_size": 4096,
|
| 16 |
+
"group_fractions": [
|
| 17 |
+
0.03125,
|
| 18 |
+
0.0625,
|
| 19 |
+
0.125,
|
| 20 |
+
0.25,
|
| 21 |
+
0.53125
|
| 22 |
+
],
|
| 23 |
+
"group_weights": [
|
| 24 |
+
0.2,
|
| 25 |
+
0.2,
|
| 26 |
+
0.2,
|
| 27 |
+
0.2,
|
| 28 |
+
0.2
|
| 29 |
+
],
|
| 30 |
+
"group_sizes": [
|
| 31 |
+
128,
|
| 32 |
+
256,
|
| 33 |
+
512,
|
| 34 |
+
1024,
|
| 35 |
+
2176
|
| 36 |
+
],
|
| 37 |
+
"k": 10,
|
| 38 |
+
"device": "cuda:0",
|
| 39 |
+
"layer": "unknown",
|
| 40 |
+
"lm_name": "Lightricks/LTX-Video-0.9.5",
|
| 41 |
+
"wandb_name": "MatryoshkaBatchTopKTrainer-Lightricks/LTX-Video-0.9.5-resid_post_layer_unknown_trainer_0",
|
| 42 |
+
"submodule_name": "resid_post_layer_unknown"
|
| 43 |
+
},
|
| 44 |
+
"buffer": {
|
| 45 |
+
"activation_dir": "/mnt/nw/home/m.yu/repos/dictionary_learning_demo/ltx_activations_vae",
|
| 46 |
+
"d_submodule": 128,
|
| 47 |
+
"out_batch_size": 2048,
|
| 48 |
+
"num_shards": 70,
|
| 49 |
+
"metadata": {
|
| 50 |
+
"model_name": "Lightricks/LTX-Video-0.9.5",
|
| 51 |
+
"hook_target": "vae_latent_mean",
|
| 52 |
+
"d_model": 128,
|
| 53 |
+
"num_frames": 321,
|
| 54 |
+
"height": 256,
|
| 55 |
+
"width": 256,
|
| 56 |
+
"max_norm_multiple": 10,
|
| 57 |
+
"total_tokens": 9063296,
|
| 58 |
+
"num_shards": 70,
|
| 59 |
+
"num_videos": 3454,
|
| 60 |
+
"save_dtype": "float32"
|
| 61 |
+
}
|
| 62 |
+
}
|
| 63 |
+
}
|
trainer_1/ae.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd173b74925893f241c30425b0d5c5bb84609a59ab5446ade384812470d22e61
|
| 3 |
+
size 4213453
|
trainer_1/checkpoints/ae_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6793f04e7b3b6ee42fc869f22457c6bc023b0644a50109f3b403abdb692edef5
|
| 3 |
+
size 4213667
|
trainer_1/checkpoints/ae_13.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59763218433ca21223c434dcc306b2603f713d6b8c633fb90487f82f443d145d
|
| 3 |
+
size 4213678
|
trainer_1/checkpoints/ae_138.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56f498015d7ceaf9c161c01e9c6a7d84be712516266cf100a94dee0de0902927
|
| 3 |
+
size 4213689
|
trainer_1/checkpoints/ae_1389.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9f49f48d3b65bb393a190c2b4013332fed8fb81933080602ec55be0e05b47bf
|
| 3 |
+
size 4213700
|
trainer_1/checkpoints/ae_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bedfdd803b00727035fa04c59fbb450d1866574ce1aa4ff04c87fe50de5dab76
|
| 3 |
+
size 4213667
|
trainer_1/checkpoints/ae_43.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8ef6d2de274bf8838f6a5cf1ac6cd90f338e57af5916a192e6a697f468b9b86
|
| 3 |
+
size 4213678
|
trainer_1/checkpoints/ae_439.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9fe153f90237596a2fc6c1d3fbe0a8db2d42936cf63cf7b6f6f7345137afe5b4
|
| 3 |
+
size 4213689
|
trainer_1/config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"trainer": {
|
| 3 |
+
"trainer_class": "MatryoshkaBatchTopKTrainer",
|
| 4 |
+
"dict_class": "MatryoshkaBatchTopKSAE",
|
| 5 |
+
"lr": 5e-05,
|
| 6 |
+
"steps": 4394,
|
| 7 |
+
"auxk_alpha": 0.03125,
|
| 8 |
+
"warmup_steps": 1000,
|
| 9 |
+
"decay_start": 3515,
|
| 10 |
+
"threshold_beta": 0.999,
|
| 11 |
+
"threshold_start_step": 1000,
|
| 12 |
+
"top_k_aux": 64,
|
| 13 |
+
"seed": 0,
|
| 14 |
+
"activation_dim": 128,
|
| 15 |
+
"dict_size": 4096,
|
| 16 |
+
"group_fractions": [
|
| 17 |
+
0.03125,
|
| 18 |
+
0.0625,
|
| 19 |
+
0.125,
|
| 20 |
+
0.25,
|
| 21 |
+
0.53125
|
| 22 |
+
],
|
| 23 |
+
"group_weights": [
|
| 24 |
+
0.2,
|
| 25 |
+
0.2,
|
| 26 |
+
0.2,
|
| 27 |
+
0.2,
|
| 28 |
+
0.2
|
| 29 |
+
],
|
| 30 |
+
"group_sizes": [
|
| 31 |
+
128,
|
| 32 |
+
256,
|
| 33 |
+
512,
|
| 34 |
+
1024,
|
| 35 |
+
2176
|
| 36 |
+
],
|
| 37 |
+
"k": 20,
|
| 38 |
+
"device": "cuda:0",
|
| 39 |
+
"layer": "unknown",
|
| 40 |
+
"lm_name": "Lightricks/LTX-Video-0.9.5",
|
| 41 |
+
"wandb_name": "MatryoshkaBatchTopKTrainer-Lightricks/LTX-Video-0.9.5-resid_post_layer_unknown_trainer_1",
|
| 42 |
+
"submodule_name": "resid_post_layer_unknown"
|
| 43 |
+
},
|
| 44 |
+
"buffer": {
|
| 45 |
+
"activation_dir": "/mnt/nw/home/m.yu/repos/dictionary_learning_demo/ltx_activations_vae",
|
| 46 |
+
"d_submodule": 128,
|
| 47 |
+
"out_batch_size": 2048,
|
| 48 |
+
"num_shards": 70,
|
| 49 |
+
"metadata": {
|
| 50 |
+
"model_name": "Lightricks/LTX-Video-0.9.5",
|
| 51 |
+
"hook_target": "vae_latent_mean",
|
| 52 |
+
"d_model": 128,
|
| 53 |
+
"num_frames": 321,
|
| 54 |
+
"height": 256,
|
| 55 |
+
"width": 256,
|
| 56 |
+
"max_norm_multiple": 10,
|
| 57 |
+
"total_tokens": 9063296,
|
| 58 |
+
"num_shards": 70,
|
| 59 |
+
"num_videos": 3454,
|
| 60 |
+
"save_dtype": "float32"
|
| 61 |
+
}
|
| 62 |
+
}
|
| 63 |
+
}
|
trainer_2/ae.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5453a7c93906bc3d8be124a0531b27b2ce3156b1e3ca8cc1da3cf60ea50d6a8d
|
| 3 |
+
size 8424141
|
trainer_2/checkpoints/ae_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bfaa361c6795a19c551cf0dbb3413fe396661dca22d2bab2316cded22d4cadeb
|
| 3 |
+
size 8424355
|
trainer_2/checkpoints/ae_13.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd86bf18519df6c43da415300c3851042aa2c3eaa23d78f1e643f132bb33d9c7
|
| 3 |
+
size 8424366
|
trainer_2/checkpoints/ae_138.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:343bfb39b3b2ac0a9fd8bca21dcdd828f5741ae09b2582f66879b592c97b67a6
|
| 3 |
+
size 8424377
|
trainer_2/checkpoints/ae_1389.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:818aa7a5d4d696ef351d2357956b657106c08750551a143dccfb87a5f2595b9c
|
| 3 |
+
size 8424388
|
trainer_2/checkpoints/ae_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d393eb0f14733a7daeac25f4fdbcc3a5c6d7d2eb0ce71e3eece1b635fdb5c4c
|
| 3 |
+
size 8424355
|
trainer_2/checkpoints/ae_43.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e5984b64c4c44c73504b736e4bb724fb3b3857665a586eaea9233e13116c33a
|
| 3 |
+
size 8424366
|
trainer_2/checkpoints/ae_439.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c721d367067b74a4ce07a1069b047483a9c86e737ea554c76327a3e40b6a03e
|
| 3 |
+
size 8424377
|
trainer_2/config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"trainer": {
|
| 3 |
+
"trainer_class": "MatryoshkaBatchTopKTrainer",
|
| 4 |
+
"dict_class": "MatryoshkaBatchTopKSAE",
|
| 5 |
+
"lr": 5e-05,
|
| 6 |
+
"steps": 4394,
|
| 7 |
+
"auxk_alpha": 0.03125,
|
| 8 |
+
"warmup_steps": 1000,
|
| 9 |
+
"decay_start": 3515,
|
| 10 |
+
"threshold_beta": 0.999,
|
| 11 |
+
"threshold_start_step": 1000,
|
| 12 |
+
"top_k_aux": 64,
|
| 13 |
+
"seed": 0,
|
| 14 |
+
"activation_dim": 128,
|
| 15 |
+
"dict_size": 8192,
|
| 16 |
+
"group_fractions": [
|
| 17 |
+
0.03125,
|
| 18 |
+
0.0625,
|
| 19 |
+
0.125,
|
| 20 |
+
0.25,
|
| 21 |
+
0.53125
|
| 22 |
+
],
|
| 23 |
+
"group_weights": [
|
| 24 |
+
0.2,
|
| 25 |
+
0.2,
|
| 26 |
+
0.2,
|
| 27 |
+
0.2,
|
| 28 |
+
0.2
|
| 29 |
+
],
|
| 30 |
+
"group_sizes": [
|
| 31 |
+
256,
|
| 32 |
+
512,
|
| 33 |
+
1024,
|
| 34 |
+
2048,
|
| 35 |
+
4352
|
| 36 |
+
],
|
| 37 |
+
"k": 10,
|
| 38 |
+
"device": "cuda:0",
|
| 39 |
+
"layer": "unknown",
|
| 40 |
+
"lm_name": "Lightricks/LTX-Video-0.9.5",
|
| 41 |
+
"wandb_name": "MatryoshkaBatchTopKTrainer-Lightricks/LTX-Video-0.9.5-resid_post_layer_unknown_trainer_2",
|
| 42 |
+
"submodule_name": "resid_post_layer_unknown"
|
| 43 |
+
},
|
| 44 |
+
"buffer": {
|
| 45 |
+
"activation_dir": "/mnt/nw/home/m.yu/repos/dictionary_learning_demo/ltx_activations_vae",
|
| 46 |
+
"d_submodule": 128,
|
| 47 |
+
"out_batch_size": 2048,
|
| 48 |
+
"num_shards": 70,
|
| 49 |
+
"metadata": {
|
| 50 |
+
"model_name": "Lightricks/LTX-Video-0.9.5",
|
| 51 |
+
"hook_target": "vae_latent_mean",
|
| 52 |
+
"d_model": 128,
|
| 53 |
+
"num_frames": 321,
|
| 54 |
+
"height": 256,
|
| 55 |
+
"width": 256,
|
| 56 |
+
"max_norm_multiple": 10,
|
| 57 |
+
"total_tokens": 9063296,
|
| 58 |
+
"num_shards": 70,
|
| 59 |
+
"num_videos": 3454,
|
| 60 |
+
"save_dtype": "float32"
|
| 61 |
+
}
|
| 62 |
+
}
|
| 63 |
+
}
|
trainer_3/ae.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f8f96af28609223c63e8dd9520c5fd234c1bb00d08f4e846e9178b7e696fc83
|
| 3 |
+
size 8424141
|
trainer_3/checkpoints/ae_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:936d3333563d0e0d3a78c862db897082cd33df2ec60c2d234d99baa6dd55b416
|
| 3 |
+
size 8424355
|
trainer_3/checkpoints/ae_13.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1dbea5e5e6c9c25a37ad7231337a14bf91d77d6ff269ceef17edd41ecf7716d6
|
| 3 |
+
size 8424366
|
trainer_3/checkpoints/ae_138.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b5f92a0be68012879ed57faafa25b43db0c1beba2edd1f6be25b4895f3ad703
|
| 3 |
+
size 8424377
|
trainer_3/checkpoints/ae_1389.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d0855599905d920cdb856d676170cb71b0a3a8baf58f2f8df20ca8c9a19e5bed
|
| 3 |
+
size 8424388
|
trainer_3/checkpoints/ae_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1a05416929c5f67c4a5e182f41e7c85d070837dceb31d953b40d20ff9029875
|
| 3 |
+
size 8424355
|
trainer_3/checkpoints/ae_43.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:084986932c0818ef2a6d521b372ebea22a0f768bf8dfb02cf937ed6fd9a2560b
|
| 3 |
+
size 8424366
|
trainer_3/checkpoints/ae_439.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a6010433687e100669133555d0c62c8479b0d9387e39d2e5360b2b4036f3201
|
| 3 |
+
size 8424377
|
trainer_3/config.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"trainer": {
|
| 3 |
+
"trainer_class": "MatryoshkaBatchTopKTrainer",
|
| 4 |
+
"dict_class": "MatryoshkaBatchTopKSAE",
|
| 5 |
+
"lr": 5e-05,
|
| 6 |
+
"steps": 4394,
|
| 7 |
+
"auxk_alpha": 0.03125,
|
| 8 |
+
"warmup_steps": 1000,
|
| 9 |
+
"decay_start": 3515,
|
| 10 |
+
"threshold_beta": 0.999,
|
| 11 |
+
"threshold_start_step": 1000,
|
| 12 |
+
"top_k_aux": 64,
|
| 13 |
+
"seed": 0,
|
| 14 |
+
"activation_dim": 128,
|
| 15 |
+
"dict_size": 8192,
|
| 16 |
+
"group_fractions": [
|
| 17 |
+
0.03125,
|
| 18 |
+
0.0625,
|
| 19 |
+
0.125,
|
| 20 |
+
0.25,
|
| 21 |
+
0.53125
|
| 22 |
+
],
|
| 23 |
+
"group_weights": [
|
| 24 |
+
0.2,
|
| 25 |
+
0.2,
|
| 26 |
+
0.2,
|
| 27 |
+
0.2,
|
| 28 |
+
0.2
|
| 29 |
+
],
|
| 30 |
+
"group_sizes": [
|
| 31 |
+
256,
|
| 32 |
+
512,
|
| 33 |
+
1024,
|
| 34 |
+
2048,
|
| 35 |
+
4352
|
| 36 |
+
],
|
| 37 |
+
"k": 20,
|
| 38 |
+
"device": "cuda:0",
|
| 39 |
+
"layer": "unknown",
|
| 40 |
+
"lm_name": "Lightricks/LTX-Video-0.9.5",
|
| 41 |
+
"wandb_name": "MatryoshkaBatchTopKTrainer-Lightricks/LTX-Video-0.9.5-resid_post_layer_unknown_trainer_3",
|
| 42 |
+
"submodule_name": "resid_post_layer_unknown"
|
| 43 |
+
},
|
| 44 |
+
"buffer": {
|
| 45 |
+
"activation_dir": "/mnt/nw/home/m.yu/repos/dictionary_learning_demo/ltx_activations_vae",
|
| 46 |
+
"d_submodule": 128,
|
| 47 |
+
"out_batch_size": 2048,
|
| 48 |
+
"num_shards": 70,
|
| 49 |
+
"metadata": {
|
| 50 |
+
"model_name": "Lightricks/LTX-Video-0.9.5",
|
| 51 |
+
"hook_target": "vae_latent_mean",
|
| 52 |
+
"d_model": 128,
|
| 53 |
+
"num_frames": 321,
|
| 54 |
+
"height": 256,
|
| 55 |
+
"width": 256,
|
| 56 |
+
"max_norm_multiple": 10,
|
| 57 |
+
"total_tokens": 9063296,
|
| 58 |
+
"num_shards": 70,
|
| 59 |
+
"num_videos": 3454,
|
| 60 |
+
"save_dtype": "float32"
|
| 61 |
+
}
|
| 62 |
+
}
|
| 63 |
+
}
|