ts-medium-swiglu / config.json
tdooms's picture
Upload Transformer
942097c verified
raw
history blame contribute delete
276 Bytes
{
"architectures": [
"Transformer"
],
"bias": false,
"bilinear": true,
"d_hidden": 2048,
"d_model": 512,
"gate": "silu",
"n_ctx": 256,
"n_head": 8,
"n_layer": 8,
"normalization": true,
"torch_dtype": "float32",
"transformers_version": "4.45.1"
}