{ "model_name": "xlm-roberta-large", "model_id": "M4_4.2_XLM_RoBERTa", "member": 4, "spec_compliance": { "seed": 42, "max_length": 128, "batch_size": 8, "gradient_accumulation_steps": 2, "effective_batch_size": 16, "learning_rate": 1e-05, "epochs_trained": 3, "total_epochs_limit": 5, "early_stopping_patience": 5, "primary_metric": "val_macro_f1", "data_augmentation": true, "target_minority_size": 0.05 }, "training_results": { "best_epoch": 3, "best_val_macro_f1": 0.6920319606014477, "best_val_macro_precision": 0.6935400158042497, "best_val_macro_recall": 0.6959520837420035, "best_val_weighted_f1": 0.7889787090902882, "best_val_accuracy": 0.7843488649940262, "training_loss": 0.531401620691845 }, "test_results": { "test_loss": 0.8419096413437215, "test_accuracy": 0.7831937799043063, "test_macro_precision": 0.7109259717505931, "test_macro_recall": 0.6740476446561174, "test_macro_f1": 0.682211638723438, "test_weighted_precision": 0.7917048623914406, "test_weighted_recall": 0.7831937799043063, "test_weighted_f1": 0.78430327538584, "per_class_f1": { "F": 0.8503589177250138, "R": 0.804436660828955, "N": 0.8322618351841029, "M": 0.6457399103139013, "S": 0.2782608695652174 } }, "data_augmentation": { "original_train_size": 15699, "augmented_train_size": 16156, "augmented_samples": 457, "target_minority_percentage": 5.0 }, "hardware": { "device": "cuda", "cuda_available": true, "python_version": "3.11.11", "platform": "Linux-6.8.0-87-generic-x86_64-with-glibc2.35", "cpu_count": 128, "ram_gb": 754.5698852539062, "gpu_device": "NVIDIA H100 NVL MIG 1g.24gb", "gpu_memory_gb": 23.219666944 }, "training_time": { "total_seconds": 4912.679862, "total_minutes": 81.8779977, "average_per_epoch": 982.5344182000001, "timestamp_start": "2025-12-25T13:51:24.634125", "timestamp_end": "2025-12-25T16:18:05.909736" }, "library_versions": { "pytorch": "2.7.1+cu118", "transformers": "4.57.3", "numpy": "1.26.4", "pandas": "2.2.3", "scikit-learn": "1.6.1", "python": "3.11.11" }, "data": { "train_samples_original": 15699, "train_samples_augmented": 16156, "val_samples": 3348, "test_samples": 3344, "num_classes": 5, "class_names": [ "F", "R", "N", "M", "S" ] } }