{ "architectures": [ "LLaMAModel" ], "d_model": 128, "model_type": "llama", "num_heads": 4, "num_layers": 2, "torch_dtype": "float32", "transformers_version": "4.41.2", "vocab_size": 50257 }