{
  "architectures": [
    "GPTNeoCodebookModel"
  ],
  "codebook_at": [
    "attn_preproj"
  ],
  "codebook_kwargs": {},
  "codebook_type": [
    "group"
  ],
  "k_codebook": [
    8
  ],
  "kmeans_init": false,
  "kmeans_init_examples": 1000,
  "kmeans_kwargs": {
    "batch_size": 24576,
    "n_init": "auto"
  },
  "kmeans_path": "/.cache/cb_volume/huggingface/kmeans_embeddings.pt",
  "layers_to_snap": [
    0
  ],
  "loss": "aeloss",
  "model_type": "codebook",
  "num_codebooks": [
    16
  ],
  "num_codes": 25000,
  "replace_codes": false,
  "similarity_metric": "inner_product",
  "torch_dtype": "float32",
  "transformers_version": "4.29.2"
}