roberta-MeSH-lora / training_args.json
maxbeettww's picture
Upload LoRA adapter + logs (2026-02-02 10:25:51)
3f1d8d1 verified
raw
history blame contribute delete
556 Bytes
{
"base_model": "roberta-base",
"data": {
"csv_path": "https://github.com/Heng1222/Ohsumed_classification/blob/main/MeSH_data/mesh_dataset.csv?raw=true",
"split": "train=0.9, val=0.1",
"random_state": 42
},
"hyperparams": {
"batch_size": 32,
"lr": 5e-05,
"num_epochs_max": 8,
"patience": 3,
"min_delta": 0.0001,
"lora_r": 16,
"lora_alpha": 32,
"lora_dropout": 0.1,
"target_modules": [
"query",
"key",
"value",
"output.dense"
]
},
"best_val_loss": 0.00934141071531148
}