aam-diffusion-v1 / training_config.json
Wolfvin's picture
AAM Diffusion LLM v1.0 — The Body of Aphantasic Abstraction Model
2d7e335 verified
raw
history blame contribute delete
642 Bytes
{
  "model_name": "aam-diffusion-v1.0",
  "aam_mind_source": "rsvs_graph",
  "aam_body_type": "specialized_diffusion",
  "architecture": {
    "type": "diffusion_transformer",
    "d_model": 64,
    "n_layers": 2,
    "n_heads": 4,
    "d_ff": 128,
    "vocab_size": 500,
    "max_seq_len": 32,
    "pos_encoding_type": "learned"
  },
  "diffusion": {
    "n_timesteps": 50,
    "n_inference_steps": 5,
    "schedule_type": "cosine",
    "prediction_type": "epsilon",
    "sampling_method": "ddim"
  },
  "graph_encoder": {
    "d_graph": 32,
    "n_graph_layers": 1,
    "conditioning_method": "cross_attention"
  },
  "parameters": 311670
}