{
  "model_type": "AuriStreamParallel",
  "architectures": [
    "AuriStreamModel"
  ],
  "auto_map": {
    "AutoConfig": "TuKoResearch/AuriStreamParallel-base--configuration_auristream_parallel.AuriStreamParallelConfig",
    "AutoModel": "TuKoResearch/AuriStreamParallel-base--modeling_auristream_parallel.AuriStreamModel",
    "AutoModelForCausalLM": "TuKoResearch/AuriStreamParallel-base--modeling_auristream_parallel.AuriStreamModel"
  },
  "torch_dtype": "bfloat16",
  "transformers_version": "4.40.0",
  "vocab_size": 8193,
  "base_vocab_size": 8192,
  "mask_token_id": 8192,
  "ignore_index": -100,
  "n_embd": 768,
  "n_layer": 12,
  "n_head": 12,
  "dropout": 0.0,
  "bias": false,
  "use_rope": true,
  "group_size": 16,
  "seq_len": 4096,
  "skip_connections": false,
  "mask_schedule": "linear_text_prime"
}