TaoNet-mini-T2 / artifacts /model_card.json
StarMist0012's picture
Add files using upload-large-folder tool
e2bfccc verified
{
"state": "completed",
"architecture": "taonet_ssm",
"candidate": "pure_ssm_196m_branch_rms_only",
"pretrain_checkpoint": "/home/student/YouZheng/jobs/taotern/taotern-200m-branch-only-chat-20260514/checkpoints/pretrain/final_model.pt",
"sft_checkpoint": "/home/student/YouZheng/jobs/taotern/taotern-200m-branch-only-chat-20260514/checkpoints/sft/final_model.pt",
"tokenizer_path": "/home/student/YouZheng/tokenizers/taodata_pilot_8k/tokenizer.model",
"pretrain_config": "/home/student/YouZheng/jobs/taotern/taotern-200m-branch-only-chat-20260514/outputs/configs/pretrain.yaml",
"sft_config": "/home/student/YouZheng/jobs/taotern/taotern-200m-branch-only-chat-20260514/outputs/configs/sft.yaml",
"activation_probe": "/home/student/YouZheng/jobs/taotern/taotern-200m-branch-only-chat-20260514/outputs/diagnostics/activation_probe_pretrain_final.json",
"pretrain_samples": "/home/student/YouZheng/jobs/taotern/taotern-200m-branch-only-chat-20260514/outputs/diagnostics/generation_samples_pretrain_final.json",
"sft_samples": "/home/student/YouZheng/jobs/taotern/taotern-200m-branch-only-chat-20260514/outputs/diagnostics/generation_samples_sft_final.json"
}