| { |
| "started_at_utc": "2026-03-19T11:54:34.606942+00:00", |
| "ended_at_utc": "2026-03-19T13:30:48.781371+00:00", |
| "train_elapsed_sec": 5774.174, |
| "stopped_by_time_limit": false, |
| "global_step": 43, |
| "train_metrics": { |
| "train_runtime": 5773.5801, |
| "train_samples_per_second": 0.118, |
| "train_steps_per_second": 0.007, |
| "total_flos": 2.771601971163955e+16, |
| "train_loss": 0.9663696178170138, |
| "epoch": 1.0 |
| }, |
| "args": { |
| "model_name": "vodkaslime/codellama-7b-hf", |
| "train_file": "/kaggle/working/python-llm-grpo-new-techniques/training/data/train.jsonl", |
| "val_file": "/kaggle/working/python-llm-grpo-new-techniques/training/data/val.jsonl", |
| "output_dir": "/kaggle/working/python-llm-grpo-new-techniques/training/output/phase2-codellama-7b-lora-kaggle-1h", |
| "block_size": 1024, |
| "num_train_epochs": 1, |
| "max_steps": -1, |
| "max_runtime_minutes": 55.0, |
| "max_runtime_seconds": 7200.0, |
| "effective_max_runtime_seconds": 7200.0, |
| "per_device_train_batch_size": 1, |
| "per_device_eval_batch_size": 1, |
| "gradient_accumulation_steps": 16, |
| "learning_rate": 0.0002, |
| "save_steps": 100, |
| "eval_steps": 100, |
| "save_total_limit": 2, |
| "warmup_steps": 50, |
| "use_4bit": true, |
| "bf16": true, |
| "fp16": false, |
| "gradient_checkpointing": true, |
| "seed": 42, |
| "artifact_mode": "adapter_only" |
| } |
| } |