thejosango
/

nuha-binary

@@ -24,13 +24,13 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: 0.6902334758303189
     - name: Precision
       type: precision
-      value: 0.6218338023996445
     - name: Recall
       type: recall
-      value: 0.7755403657860706
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -40,10 +40,10 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.5773
-- F1: 0.6902
-- Precision: 0.6218
-- Recall: 0.7755
 - Support: None
 ## Model description
@@ -68,7 +68,7 @@ The following hyperparameters were used during training:
 - eval_batch_size: 64
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
-- lr_scheduler_type: constant
 - num_epochs: 5
 - label_smoothing_factor: 0.1
@@ -76,14 +76,15 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | F1     | Precision | Recall | Support |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
-| 0.5531        | 0.37  | 500  | 0.5324          | 0.6866 | 0.6190    | 0.7707 | None    |
-| 0.5346        | 0.74  | 1000 | 0.5675          | 0.6920 | 0.5862    | 0.8444 | None    |
-| 0.5142        | 1.11  | 1500 | 0.5444          | 0.6980 | 0.6032    | 0.8280 | None    |
-| 0.472         | 1.48  | 2000 | 0.5466          | 0.6993 | 0.6165    | 0.8079 | None    |
-| 0.4704        | 1.85  | 2500 | 0.5346          | 0.7020 | 0.6274    | 0.7968 | None    |
-| 0.3858        | 2.22  | 3000 | 0.5762          | 0.6989 | 0.6292    | 0.7861 | None    |
-| 0.3912        | 2.58  | 3500 | 0.5676          | 0.6929 | 0.6372    | 0.7593 | None    |
-| 0.3966        | 2.95  | 4000 | 0.5773          | 0.6902 | 0.6218    | 0.7755 | None    |
 ### Framework versions

     metrics:
     - name: F1
       type: f1
+      value: 0.6926479178836685
     - name: Precision
       type: precision
+      value: 0.6316590563165906
     - name: Recall
       type: recall
+      value: 0.7666728246813227
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.6119
+- F1: 0.6926
+- Precision: 0.6317
+- Recall: 0.7667
 - Support: None
 ## Model description
 - eval_batch_size: 64
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
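 - num_epochs: 5 (configured maximum; the results table below ends at epoch 3.32, step 4500, which is consistent with early stopping)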
 - label_smoothing_factor: 0.1
 | Training Loss | Epoch | Step | Validation Loss | F1     | Precision | Recall | Support |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
+| 0.553         | 0.37  | 500  | 0.5378          | 0.6847 | 0.6064    | 0.7863 | None    |
+| 0.5345        | 0.74  | 1000 | 0.5667          | 0.6915 | 0.5856    | 0.8443 | None    |
+| 0.5144        | 1.11  | 1500 | 0.5550          | 0.6968 | 0.5950    | 0.8406 | None    |
+| 0.4725        | 1.48  | 2000 | 0.5309          | 0.7020 | 0.6443    | 0.7711 | None    |
+| 0.468         | 1.85  | 2500 | 0.5317          | 0.7020 | 0.6252    | 0.8003 | None    |
+| 0.3986        | 2.22  | 3000 | 0.5538          | 0.6995 | 0.6443    | 0.7650 | None    |
+| 0.3967        | 2.58  | 3500 | 0.5581          | 0.6948 | 0.6466    | 0.7508 | None    |
+| 0.3971        | 2.95  | 4000 | 0.5643          | 0.6975 | 0.6290    | 0.7826 | None    |
+| 0.342         | 3.32  | 4500 | 0.6119          | 0.6926 | 0.6317    | 0.7667 | None    |
 ### Framework versions

config.toml CHANGED Viewed

@@ -1,5 +1,5 @@
 [experiment]
-name = "binary-52"
 type = "binary"
@@ -19,13 +19,13 @@ classifier_dropout = 0.25
 [training]
 num_train_epochs = 5
 warmup_steps = 0
-lr_scheduler_type = "constant"
 learning_rate = 5e-5
 per_device_train_batch_size = 64
 per_device_eval_batch_size = 64
 gradient_accumulation_steps = 1
 weight_decay = 1e-3
 label_smoothing_factor = 0.1
-weighted_loss = false
 early_stopping_patience = 5
 early_stopping_threshold = 0.005

 [experiment]
+name = "binary-53"
 type = "binary"
 [training]
 num_train_epochs = 5
 warmup_steps = 0
+lr_scheduler_type = "linear"
 learning_rate = 5e-5
 per_device_train_batch_size = 64
 per_device_eval_batch_size = 64
 gradient_accumulation_steps = 1
 weight_decay = 1e-3
 label_smoothing_factor = 0.1
+weighted_loss = true
 early_stopping_patience = 5
 early_stopping_threshold = 0.005

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77854de095531e646b72ad7d6a9d3323b85a5652cee4d8a587558eaf19f4b5f4
 size 370706033

 version https://git-lfs.github.com/spec/v1
+oid sha256:0a6c22f6383637027556d78ffec12f58f1d678a4d7f46de11664073c36d1d86d
 size 370706033

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:21f5bef3aca0c3c13753416b32c9243167e3d497cac8c70cb0b7b3354d422cb3
 size 4091

 version https://git-lfs.github.com/spec/v1
+oid sha256:c05259d62d10144d73bd28aed57f9da0ce390e5520f5caf1e30a66e33baa68d2
 size 4091