{ "model_name": "DeepFake Detector V13", "version": "13.0", "architecture": "3-Model Ensemble", "total_parameters": "699M", "description": "Large-scale ensemble with ConvNeXt-Large (198M), ViT-Large (304M), and Swin-Large (197M)", "models": [ { "id": 1, "name": "Model 13.1", "backbone": "convnext_large", "parameters": "198M", "dropout": 0.3, "batch_size": 32, "best_f1": 0.8971, "file": "model_1.safetensors" }, { "id": 2, "name": "Model 13.2", "backbone": "vit_large_patch16_224", "parameters": "304M", "dropout": 0.35, "batch_size": 24, "best_f1": 0.9382, "file": "model_2.safetensors" }, { "id": 3, "name": "Model 13.3", "backbone": "swin_large_patch4_window7_224", "parameters": "197M", "dropout": 0.3, "batch_size": 32, "best_f1": 0.9586, "file": "model_3.safetensors" } ], "ensemble_performance": { "average_f1": 0.9313, "best_individual_f1": 0.9586, "total_training_time_hours": 6.1 }, "training": { "epochs_per_model": 10, "learning_rates": [ 2e-05, 1.5e-05, 1.8e-05 ], "weight_decay": 0.0003, "label_smoothing": 0.12, "gradient_accumulation": 4, "mixed_precision": true, "criterion": "FocalLossSmooth (alpha=0.25, gamma=2.5)", "optimizer": "AdamW", "scheduler": "CosineAnnealingWarmRestarts" }, "preprocessing": { "image_size": 224, "normalization": { "mean": [ 0.485, 0.456, 0.406 ], "std": [ 0.229, 0.224, 0.225 ] }, "augmentations": [ "RandomHorizontalFlip(p=0.5)", "RandomRotation(degrees=12)", "ColorJitter(brightness=0.15, contrast=0.15, saturation=0.15)" ] }, "inference": { "ensemble_method": "average", "threshold": 0.5, "description": "Average predictions from all 3 models for final classification" }, "requirements": [ "torch>=2.0.0", "timm>=0.9.0", "torchvision>=0.15.0", "numpy", "pillow", "safetensors" ], "dataset": "ash12321/deepfake-v13-dataset", "predecessor": "ash12321/deepfake-detector-v12" }