| { | |
| "experiment": "exp_single_fast", | |
| "model_name": "deepseek-ai/DeepSeek-OCR", | |
| "train_size": 1368, | |
| "val_size": 152, | |
| "prompt": "<image>\nFree OCR.", | |
| "hyperparameters": { | |
| "name": "exp_single_fast", | |
| "num_train_epochs": 1, | |
| "learning_rate": 0.0002, | |
| "gradient_accumulation_steps": 8, | |
| "lora_r": 32, | |
| "lora_alpha": 64, | |
| "lora_dropout": 0.1, | |
| "per_device_train_batch_size": 1, | |
| "per_device_eval_batch_size": 1, | |
| "weight_decay": 0.01, | |
| "warmup_ratio": 0.03 | |
| }, | |
| "eval_metrics": { | |
| "eval_runtime": 278.9663, | |
| "eval_samples_per_second": 0.545, | |
| "eval_steps_per_second": 0.545, | |
| "epoch": 1.0 | |
| }, | |
| "log_summary": { | |
| "best_eval_loss": null, | |
| "last_train_loss": 0.4609, | |
| "last_learning_rate": 2.4242424242424244e-06 | |
| }, | |
| "text_metrics": { | |
| "subset_size": 20, | |
| "wer": 0.46787479406919275, | |
| "cer": 0.4147754249359035 | |
| } | |
| } |