UDHOV's picture
Add training configuration
340f7cd verified
{
"model_name": "Rajan/NepaliBERT",
"training_strategy": "discriminative",
"hyperparameters": {
"batch_size": 32,
"gradient_accumulation_steps": 1,
"learning_rate": 3e-05,
"num_epochs": 6,
"max_length": 256,
"dropout": 0.3,
"weight_decay": 0.01,
"label_smoothing": 0.05,
"warmup_ratio": 0.1
},
"class_weights": [
0.5,
0.7944444444444444,
3.0,
3.0
],
"label_names": [
"NO",
"OO",
"OR",
"OS"
],
"test_metrics": {
"model": "NepaliBERT",
"version": "improved_v2",
"preprocessing": "Translation + Emoji to Devanagari",
"strategy": "discriminative",
"hyperparameters": {
"batch_size": 32,
"learning_rate": 3e-05,
"epochs": 6,
"dropout": 0.3,
"weight_decay": 0.01,
"label_smoothing": 0.05,
"warmup_ratio": 0.1
},
"test_metrics": {
"accuracy": 0.6972413793103448,
"precision": 0.493269056413594,
"recall": 0.5412612321975574,
"f1": 0.5125857580723172
},
"per_class_f1": {
"NO": 0.7752808988764045,
"OO": 0.6012526096033403,
"OR": 0.48333333333333334,
"OS": 0.19047619047619047
},
"overfitting_gap": 0.0659809267044067
}
}