{
  "_name_or_path": "JonusNattapong/wilai-2.0",
  "model_type": "wilai",
  "vocab_size": 1000,
  "hidden_size": 512,
  "num_hidden_layers": 6,
  "num_attention_heads": 8,
  "max_position_embeddings": 128,
  "initializer_range": 0.02,
  "layer_norm_epsilon": 1e-5,
  "embd_pdrop": 0.1,
  "attn_pdrop": 0.1,
  "resid_pdrop": 0.1,
  "activation_function": "gelu",
  "n_inner": null,
  "use_cache": true,
  "bos_token_id": 1,
  "eos_token_id": 2,
  "pad_token_id": 0,
  "tie_word_embeddings": false,
  "use_gradient_checkpointing": true,
  "use_mixed_precision": false,
  "gradient_clip_norm": 1.0,
  "model_name": "wilai-2.0",
  "model_version": "1.0.0",
  "description": "Thai-specific GPT-like language model",
  "created_at": "2025-10-27T11:44:35.229069",
  "training_completed": true,
  "total_steps": 16600,
  "best_val_loss": 2.707622994680773,
  "training_time": 58012.46856427193
}