armenjeddi's picture
Add base-loop model with 3 layers - max 8 iterations
04e086e verified
{
"architectures": [
"Base_Loop_GPTForCausalLM"
],
"auto_map": {
"AutoConfig": "modeling_base_loop.GPTConfig",
"AutoModelForCausalLM": "modeling_base_loop.Base_Loop_GPTForCausalLM"
},
"dtype": "bfloat16",
"model_type": "base_loop",
"transformers_version": "4.57.0"
}