thejosango
/

nuha-binary

@@ -23,13 +23,13 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: 0.6928497604059006
     - name: Precision
       type: precision
-      value: 0.7049713193116635
     - name: Recall
       type: recall
-      value: 0.6811380011084427
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -39,10 +39,10 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.4966
-- F1: 0.6928
-- Precision: 0.7050
-- Recall: 0.6811
 - Support: None
 ## Model description
@@ -63,31 +63,21 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 1e-05
-- train_batch_size: 32
-- eval_batch_size: 32
 - seed: 42
-- gradient_accumulation_steps: 2
-- total_train_batch_size: 64
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: constant
-- num_epochs: 5
 - label_smoothing_factor: 0.1
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | F1     | Precision | Recall | Support |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
-| 0.5537        | 0.25  | 500  | 0.5298          | 0.6135 | 0.6830    | 0.5568 | None    |
-| 0.5294        | 0.5   | 1000 | 0.5174          | 0.6260 | 0.7106    | 0.5594 | None    |
-| 0.5236        | 0.75  | 1500 | 0.5129          | 0.6751 | 0.6752    | 0.6750 | None    |
-| 0.5211        | 1.0   | 2000 | 0.5038          | 0.6656 | 0.7084    | 0.6277 | None    |
-| 0.4972        | 1.26  | 2500 | 0.5034          | 0.6486 | 0.7288    | 0.5843 | None    |
-| 0.4926        | 1.51  | 3000 | 0.5058          | 0.6944 | 0.6755    | 0.7144 | None    |
-| 0.4914        | 1.76  | 3500 | 0.5006          | 0.6936 | 0.6901    | 0.6970 | None    |
-| 0.4899        | 2.01  | 4000 | 0.5019          | 0.6881 | 0.7036    | 0.6732 | None    |
-| 0.4715        | 2.26  | 4500 | 0.4987          | 0.6949 | 0.6977    | 0.6920 | None    |
-| 0.474         | 2.51  | 5000 | 0.4990          | 0.6998 | 0.6922    | 0.7076 | None    |
-| 0.4729        | 2.76  | 5500 | 0.4966          | 0.6928 | 0.7050    | 0.6811 | None    |
 ### Framework versions

     metrics:
     - name: F1
       type: f1
+      value: 0.592617830777967
     - name: Precision
       type: precision
+      value: 0.7691627358490566
     - name: Recall
       type: recall
+      value: 0.481987807130981
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.4196
+- F1: 0.5926
+- Precision: 0.7692
+- Recall: 0.4820
 - Support: None
 ## Model description
 The following hyperparameters were used during training:
 - learning_rate: 1e-05
+- train_batch_size: 64
+- eval_batch_size: 64
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: constant
+- num_epochs: 1
 - label_smoothing_factor: 0.1
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | F1     | Precision | Recall | Support |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
+| 0.4508        | 0.25  | 500  | 0.4341          | 0.4407 | 0.7864    | 0.3061 | None    |
+| 0.4317        | 0.5   | 1000 | 0.4229          | 0.4936 | 0.8037    | 0.3562 | None    |
+| 0.4289        | 0.75  | 1500 | 0.4196          | 0.5926 | 0.7692    | 0.4820 | None    |
 ### Framework versions

config.toml CHANGED Viewed

@@ -1,5 +1,5 @@
 [experiment]
-name = "binary-38"
 type = "binary"
@@ -16,15 +16,15 @@ revision = "ce20f497544665775129f9ff5b3cd2a3e350dce8"
 [training]
-num_train_epochs = 5
 warmup_steps = 0
 lr_scheduler_type = "constant"
 learning_rate = 1e-5
-per_device_train_batch_size = 32
-per_device_eval_batch_size = 32
-gradient_accumulation_steps = 2
 weight_decay = 0.00
 label_smoothing_factor = 0.1
-weighted_loss = false
 early_stopping_patience = 5
 early_stopping_threshold = 0.005

 [experiment]
+name = "binary-39"
 type = "binary"
 [training]
+num_train_epochs = 1
 warmup_steps = 0
 lr_scheduler_type = "constant"
 learning_rate = 1e-5
+per_device_train_batch_size = 64
+per_device_eval_batch_size = 64
+gradient_accumulation_steps = 1
 weight_decay = 0.00
 label_smoothing_factor = 0.1
+weighted_loss = true
 early_stopping_patience = 5
 early_stopping_threshold = 0.005

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c3eceddd77e5a00819ab30f4f9f90180c97198b12fefd284d24ecf49c2b80ce5
 size 540847921

 version https://git-lfs.github.com/spec/v1
+oid sha256:99972b963c59dacfc2e2c98109726ef6bbffac594bb8e422cdb7bc65758e593c
 size 540847921

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:08daaa9929d5ac6d9774c9e26f13cc06d212873de4e3172ec8b81ea97d9d5d6b
 size 4091

 version https://git-lfs.github.com/spec/v1
+oid sha256:b50e314607e1472325db96b6790c30fded1af537fb57a1e3c4cacc16a62b2d08
 size 4091