| { | |
| "model_name": "xlm-roberta-large", | |
| "model_id": "M4_4.2_XLM_RoBERTa", | |
| "member": 4, | |
| "spec_compliance": { | |
| "seed": 42, | |
| "max_length": 128, | |
| "batch_size": 8, | |
| "gradient_accumulation_steps": 2, | |
| "effective_batch_size": 16, | |
| "learning_rate": 1e-05, | |
| "epochs_trained": 3, | |
| "total_epochs_limit": 5, | |
| "early_stopping_patience": 5, | |
| "primary_metric": "val_macro_f1", | |
| "data_augmentation": true, | |
| "target_minority_size": 0.05 | |
| }, | |
| "training_results": { | |
| "best_epoch": 3, | |
| "best_val_macro_f1": 0.6920319606014477, | |
| "best_val_macro_precision": 0.6935400158042497, | |
| "best_val_macro_recall": 0.6959520837420035, | |
| "best_val_weighted_f1": 0.7889787090902882, | |
| "best_val_accuracy": 0.7843488649940262, | |
| "training_loss": 0.531401620691845 | |
| }, | |
| "test_results": { | |
| "test_loss": 0.8419096413437215, | |
| "test_accuracy": 0.7831937799043063, | |
| "test_macro_precision": 0.7109259717505931, | |
| "test_macro_recall": 0.6740476446561174, | |
| "test_macro_f1": 0.682211638723438, | |
| "test_weighted_precision": 0.7917048623914406, | |
| "test_weighted_recall": 0.7831937799043063, | |
| "test_weighted_f1": 0.78430327538584, | |
| "per_class_f1": { | |
| "F": 0.8503589177250138, | |
| "R": 0.804436660828955, | |
| "N": 0.8322618351841029, | |
| "M": 0.6457399103139013, | |
| "S": 0.2782608695652174 | |
| } | |
| }, | |
| "data_augmentation": { | |
| "original_train_size": 15699, | |
| "augmented_train_size": 16156, | |
| "augmented_samples": 457, | |
| "target_minority_percentage": 5.0 | |
| }, | |
| "hardware": { | |
| "device": "cuda", | |
| "cuda_available": true, | |
| "python_version": "3.11.11", | |
| "platform": "Linux-6.8.0-87-generic-x86_64-with-glibc2.35", | |
| "cpu_count": 128, | |
| "ram_gb": 754.5698852539062, | |
| "gpu_device": "NVIDIA H100 NVL MIG 1g.24gb", | |
| "gpu_memory_gb": 23.219666944 | |
| }, | |
| "training_time": { | |
| "total_seconds": 4912.679862, | |
| "total_minutes": 81.8779977, | |
| "average_per_epoch": 982.5344182000001, | |
| "timestamp_start": "2025-12-25T13:51:24.634125", | |
| "timestamp_end": "2025-12-25T16:18:05.909736" | |
| }, | |
| "library_versions": { | |
| "pytorch": "2.7.1+cu118", | |
| "transformers": "4.57.3", | |
| "numpy": "1.26.4", | |
| "pandas": "2.2.3", | |
| "scikit-learn": "1.6.1", | |
| "python": "3.11.11" | |
| }, | |
| "data": { | |
| "train_samples_original": 15699, | |
| "train_samples_augmented": 16156, | |
| "val_samples": 3348, | |
| "test_samples": 3344, | |
| "num_classes": 5, | |
| "class_names": [ | |
| "F", | |
| "R", | |
| "N", | |
| "M", | |
| "S" | |
| ] | |
| } | |
| } |