{
  "package": "tmcra-token-graph-llm-v1-relation-finetune-3k",
  "date": "2026-05-30",
  "checkpoint": "token_graph_llm_v1_relation_finetune_3k.pt",
  "tokenizer": "tokenizer.json",
  "checkpoint_size_bytes": 82681830,
  "sha256": "0F32BD7105825EF78EEEF509940D51E2BA9AC7F7E9E34C41F46E3442CF9A7057",
  "architecture": {
    "dim": 384,
    "graph_layers": 6,
    "decoder_layers": 8,
    "untied_embeddings": true,
    "max_sequence_tokens": 160,
    "transformer_self_attention": false,
    "external_llm_inference": false
  },
  "training_data": {
    "train_samples": 920048,
    "validation_samples": 80004,
    "vocab_size": 1012
  },
  "finetune": {
    "steps": 3000,
    "objectives": [
      "next_token_prediction",
      "token_path_loss",
      "transition_path_loss",
      "relation_transition_loss",
      "causal_path_consistency_loss"
    ]
  },
  "final_validation": {
    "val_loss": 1.88428,
    "lm_loss": 1.816859,
    "token_path_loss": 0.984824,
    "transition_path_loss": 0.39309,
    "relation_transition_loss": 1.208215,
    "causal_path_loss": 1.56985
  },
  "status": "research_prototype"
}