Text Generation
Transformers
PyTorch
Safetensors
English
i3
i3-architecture
hybrid-model
rwkv-mamba
custom_code
i3-80m / config.json
FlameF0X's picture
Upload config.json
9befdad verified
raw
history blame contribute delete
481 Bytes
{
  "architectures": [
    "i3Model"
  ],
  "model_type": "i3",
  "vocab_size": 41320,
  "d_model": 512,
  "n_layers": 16,
  "n_heads": 16,
  "max_seq_len": 256,
  "conv_layers": 10,
  "attn_layers": 6,
  "d_state": 64,
  "tokenizer_type": "chunk",
  "chunk_strategy": "variable_2_3",
  "dataset_sources": [
    "agentlans/high-quality-english-sentences",
    "roneneldan/TinyStories",
    "starhopp3r/TinyChat"
  ],
  "torch_dtype": "float32",
  "transformers_version": "4.36.0"
}