{ "repo_id": "BDRC/gyuyig-tsugdri-binary-script-classifier", "train_dataset_id": "BDRC/gyuyig-tsugdri-binary-balanced-script-classification-dataset", "warmstart_repo": "BDRC/4-class-balanced-script-classifier", "task": "gyuyig_tsugdri_binary_classification", "experiment": "dinov3_gyuyig_tsugdri_binary", "classes": [ "Gyuyig", "Tsugdri" ], "pooling": "cls_token", "preprocess": { "train": "center_crop", "val": "center_crop", "test": "center_crop", "size": 224 }, "warmstart": { "warmstart_repo": "BDRC/4-class-balanced-script-classifier", "warmstart_checkpoint": null, "warmstart_checkpoint_file": "final_model.pt", "checkpoint_test_metrics": { "loss": 0.42663901050885517, "accuracy": 0.9208333333333333, "macro_f1": 0.9208489161207983, "weighted_f1": 0.9208489161207983 }, "warmstart_pooling": "cls_token" }, "training_config": { "lr_head_a": 0.0005, "lr_backbone_b": 1e-05, "lr_head_b": 0.0001, "lr_backbone_c": 1.5e-05, "lr_head_c": 5e-05, "epochs_a": 7, "epochs_b": 10, "epochs_c": 12, "unfreeze_blocks_b": 4, "unfreeze_blocks_c": 8, "skip_stage_c": false, "scheduler": "cosine_warmup", "warmup_epochs_a": 0, "warmup_epochs_b": 1, "warmup_epochs_c": 1, "warmup_start_factor": 0.01, "min_lr_ratio": 0.01, "weight_decay": 0.02, "grad_clip_norm": 1.0, "class_weight_mode": "custom", "class_weights": [ 1.0, 1.0 ], "label_smoothing": 0.05, "dropout": 0.1, "early_stop_patience": 6, "early_stop_min_delta": 0.001, "resolved_class_weights": [ 1.0, 1.0 ], "pooling": "cls_token", "lambda_consistency": 0.0, "flip_op": "rot180" }, "best_checkpoint": { "path": "best_stage_c_last_blocks.pt", "epoch": 1, "val_macro_f1": 0.9164578111946533 }, "val_metrics": { "loss": 0.3914561231931051, "accuracy": 0.9166666666666666, "macro_f1": 0.9164578111946533, "weighted_f1": 0.9164578111946533, "auc_roc": 0.9311111111111111 }, "test_metrics": { "loss": 0.40474860469500223, "accuracy": 0.85, "macro_f1": 0.847930160518164, "weighted_f1": 0.847930160518164, "auc_roc": 0.9297222222222223 } }