thejosango
/

nuha-ajp-binary

@@ -23,13 +23,13 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: 0.6929572707312953
     - name: Precision
       type: precision
-      value: 0.6382018976512677
     - name: Recall
       type: recall
-      value: 0.7579900240162571
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -39,10 +39,10 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.5309
-- F1: 0.6930
-- Precision: 0.6382
-- Recall: 0.7580
 - Support: None
 ## Model description
@@ -62,7 +62,7 @@ More information needed
 ### Training hyperparameters
 The following hyperparameters were used during training:
-- learning_rate: 1e-05
 - train_batch_size: 32
 - eval_batch_size: 32
 - seed: 42
@@ -77,16 +77,13 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | F1     | Precision | Recall | Support |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
-| 0.5819        | 0.37  | 500  | 0.6020          | 0.6493 | 0.5311    | 0.8352 | None    |
-| 0.5611        | 0.74  | 1000 | 0.5814          | 0.6648 | 0.5561    | 0.8263 | None    |
-| 0.5467        | 1.11  | 1500 | 0.5570          | 0.6744 | 0.5878    | 0.7911 | None    |
-| 0.5345        | 1.48  | 2000 | 0.5228          | 0.6756 | 0.6470    | 0.7068 | None    |
-| 0.5299        | 1.85  | 2500 | 0.5283          | 0.6853 | 0.6291    | 0.7526 | None    |
-| 0.5054        | 2.22  | 3000 | 0.5395          | 0.6850 | 0.6159    | 0.7717 | None    |
-| 0.5052        | 2.59  | 3500 | 0.5236          | 0.6876 | 0.6450    | 0.7362 | None    |
-| 0.5033        | 2.96  | 4000 | 0.5338          | 0.6899 | 0.6202    | 0.7774 | None    |
-| 0.4839        | 3.32  | 4500 | 0.5339          | 0.6922 | 0.6292    | 0.7691 | None    |
-| 0.4846        | 3.69  | 5000 | 0.5309          | 0.6930 | 0.6382    | 0.7580 | None    |
 ### Framework versions

     metrics:
     - name: F1
       type: f1
+      value: 0.6829268292682927
     - name: Precision
       type: precision
+      value: 0.6481911715897777
     - name: Recall
       type: recall
+      value: 0.7215961573988546
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.5679
+- F1: 0.6829
+- Precision: 0.6482
+- Recall: 0.7216
 - Support: None
 ## Model description
 ### Training hyperparameters
 The following hyperparameters were used during training:
+- learning_rate: 5e-05
 - train_batch_size: 32
 - eval_batch_size: 32
 - seed: 42
 | Training Loss | Epoch | Step | Validation Loss | F1     | Precision | Recall | Support |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
+| 0.5606        | 0.37  | 500  | 0.5393          | 0.6786 | 0.6092    | 0.7659 | None    |
+| 0.5414        | 0.74  | 1000 | 0.5770          | 0.6845 | 0.5747    | 0.8463 | None    |
+| 0.5178        | 1.11  | 1500 | 0.5384          | 0.6888 | 0.6069    | 0.7962 | None    |
+| 0.4777        | 1.48  | 2000 | 0.5407          | 0.6926 | 0.6266    | 0.7742 | None    |
+| 0.4752        | 1.85  | 2500 | 0.5372          | 0.6960 | 0.6138    | 0.8036 | None    |
+| 0.3952        | 2.22  | 3000 | 0.5873          | 0.6892 | 0.6155    | 0.7829 | None    |
+| 0.4008        | 2.59  | 3500 | 0.5679          | 0.6829 | 0.6482    | 0.7216 | None    |
 ### Framework versions

config.toml CHANGED Viewed

@@ -1,5 +1,5 @@
 [experiment]
-name = "binary-32"
 type = "binary"
@@ -19,7 +19,7 @@ revision = "2caf9ebc5b275737c95f8bb16953288107a7131c"
 num_train_epochs = 30
 warmup_steps = 0
 lr_scheduler_type = "linear"
-learning_rate = 1e-5
 per_device_train_batch_size = 32
 per_device_eval_batch_size = 32
 gradient_accumulation_steps = 2

 [experiment]
+name = "binary-33"
 type = "binary"
 num_train_epochs = 30
 warmup_steps = 0
 lr_scheduler_type = "linear"
+learning_rate = 5e-5
 per_device_train_batch_size = 32
 per_device_eval_batch_size = 32
 gradient_accumulation_steps = 2

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ffa9b265fc5a19baa463bee60e9074ec131fe038226868e561b81b1be06a3607
 size 313992076

 version https://git-lfs.github.com/spec/v1
+oid sha256:9220848386970aac9b2da72bbb5578de2bb93048fe6f3526b02d7e634df83bca
 size 313992076

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc6a77945690f1f63f16259eb40d607f54a53c733180aa51a00d74f6362b8f6f
 size 4091

 version https://git-lfs.github.com/spec/v1
+oid sha256:75405e81cc63a82a054f4fcfa9912126203b652f08c0eabc3a7dfac51214aa66
 size 4091