TinyLlama_v1.1-mars-peft-benchmark
/
TinyLlama_v1.1-mars-opt0-q8
/TinyLlama_v1.1-mars-arc_c-r2-a2
/training_configuration.json
{
  "model_id": "TinyLlama/TinyLlama_v1.1",
  "dataset": {
    "name": "ARC_C",
    "dataset_id": "allenai/ai2_arc",
    "preprocess_id": "arc_train_deepeval"
  },
  "peft_config": {
    "method": "mars",
    "rank": 2,
    "alpha": 4,
    "dropout": 0.0,
    "bias": "none",
    "target_modules": [
      "q_proj",
      "k_proj",
      "v_proj",
      "o_proj",
      "gate_proj",
      "down_proj",
      "up_proj"
    ],
    "trainable_parameter_count": 1307064
  },
  "training_config": {
    "max_dataset_length": null,
    "batch_size": 64,
    "per_device_batch_size": 32,
    "gradient_accumulation_steps": 2,
    "learning_rate": 0.0003,
    "num_epochs": 4,
    "warmup_ratio": 0.1
  },
  "model_name": "TinyLlama_v1.1-mars-arc_c-r2-a2",
  "output_dir": "./experiment_results/TinyLlama_v1.1-mars-opt3-q8/TinyLlama_v1.1-mars-arc_c-r2-a2",
  "seed": 42,
  "timestamp": "2025-09-02T01:26:53.248869"
}