{
  "name": "MTA-DeepCode-r32-a32-epoch20",
  "base_model": "Qwen/Qwen2.5-Coder-3B-Instruct",
  "context_length": 8192,
  "model_type": "finetuned",
  "finetune_steps": [
    {
      "base_model": "Qwen/Qwen2.5-Coder-3B-Instruct",
      "step": 1,
      "data": "MTA-project",
      "epochs": 20,
      "batch_size": 16,
      "dataset_size": 5420,
      "num_tests": ""
    }
  ],
  "project": "MTA",
  "prompt_template": {
    "user_tag": "<|start_header_id|>user<|end_header_id|>",
    "end_tag": "<|eot_id|>",
    "assistant_tag": "<|start_header_id|>assistant<|end_header_id|>"
  }
}