Tofu-full / head_config.json
BBigBear's picture
Upload model
64e07f0 verified
raw
history blame contribute delete
452 Bytes
{
"config": {
"activation_function": "gelu",
"bias": true,
"dropout_prob": null,
"embedding_size": 2048,
"head_type": "causal_lm",
"label2id": null,
"layer_norm": true,
"layers": 2,
"shift_labels": true,
"vocab_size": 128256
},
"hidden_size": 2048,
"model_class": "LlamaAdapterModel",
"model_name": "NousResearch/Llama-3.2-1B",
"model_type": "llama",
"name": "Tofu",
"version": "adapters.1.0.1"
}