from dataclasses import dataclass


@dataclass
class Model:
    """Plain record of model-level settings.

    All fields are required and have no defaults; they are accepted by the
    generated ``__init__`` in the order declared below.
    """

    # Field meanings below are inferred from the names only -- TODO confirm
    # against the code that consumes this config.
    vocab_size: int  # presumably the number of entries in the vocabulary
    num_layers: int  # presumably the count of stacked layers
    hidden_dim: int  # presumably the width of the hidden representation
    intermediate_size: int  # presumably the inner feed-forward width
    weight_tied_embeddings: bool  # presumably: input/output embeddings shared


@dataclass
class Parallelism:
    """Plain record of per-strategy parallelism degrees.

    All fields are required integers with no defaults. No validation is
    performed here (e.g. nothing checks that values are >= 1).
    """

    # NOTE(review): each value looks like the group size for that strategy;
    # verify against the launcher that reads this config.
    tensor_parallelism: int
    pipeline_parallelism: int
    context_parallelism: int
    expert_parallelism: int


@dataclass
class Training:
    """Plain record of training-run settings.

    Both fields are required integers with no defaults.
    """

    sequence_length: int  # presumably measured in tokens -- TODO confirm
    # NOTE(review): unclear whether this is global or per-device; confirm.
    batch_size: int