File size: 1,733 Bytes
{
"trainer": {
"trainer_class": "MatryoshkaBatchTopKTrainer",
"dict_class": "MatryoshkaBatchTopKSAE",
"lr": 5e-05,
"steps": 4394,
"auxk_alpha": 0.03125,
"warmup_steps": 1000,
"decay_start": 3515,
"threshold_beta": 0.999,
"threshold_start_step": 1000,
"top_k_aux": 64,
"seed": 0,
"activation_dim": 128,
"dict_size": 8192,
"group_fractions": [
0.03125,
0.0625,
0.125,
0.25,
0.53125
],
"group_weights": [
0.2,
0.2,
0.2,
0.2,
0.2
],
"group_sizes": [
256,
512,
1024,
2048,
4352
],
"k": 10,
"device": "cuda:0",
"layer": "unknown",
"lm_name": "Lightricks/LTX-Video-0.9.5",
"wandb_name": "MatryoshkaBatchTopKTrainer-Lightricks/LTX-Video-0.9.5-resid_post_layer_unknown_trainer_2",
"submodule_name": "resid_post_layer_unknown"
},
"buffer": {
"activation_dir": "/mnt/nw/home/m.yu/repos/dictionary_learning_demo/ltx_activations_vae",
"d_submodule": 128,
"out_batch_size": 2048,
"num_shards": 70,
"metadata": {
"model_name": "Lightricks/LTX-Video-0.9.5",
"hook_target": "vae_latent_mean",
"d_model": 128,
"num_frames": 321,
"height": 256,
"width": 256,
"max_norm_multiple": 10,
"total_tokens": 9063296,
"num_shards": 70,
"num_videos": 3454,
"save_dtype": "float32"
}
}
}