yazansh committed on
Commit
12eae77
·
verified ·
1 Parent(s): c79de0c

binary-33

Browse files
Files changed (4) hide show
  1. README.md +15 -18
  2. config.toml +2 -2
  3. pytorch_model.bin +1 -1
  4. training_args.bin +1 -1
README.md CHANGED
@@ -23,13 +23,13 @@ model-index:
23
  metrics:
24
  - name: F1
25
  type: f1
26
- value: 0.6929572707312953
27
  - name: Precision
28
  type: precision
29
- value: 0.6382018976512677
30
  - name: Recall
31
  type: recall
32
- value: 0.7579900240162571
33
  ---
34
 
35
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -39,10 +39,10 @@ should probably proofread and complete it, then remove this comment. -->
39
 
40
  This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
41
  It achieves the following results on the evaluation set:
42
- - Loss: 0.5309
43
- - F1: 0.6930
44
- - Precision: 0.6382
45
- - Recall: 0.7580
46
  - Support: None
47
 
48
  ## Model description
@@ -62,7 +62,7 @@ More information needed
62
  ### Training hyperparameters
63
 
64
  The following hyperparameters were used during training:
65
- - learning_rate: 1e-05
66
  - train_batch_size: 32
67
  - eval_batch_size: 32
68
  - seed: 42
@@ -77,16 +77,13 @@ The following hyperparameters were used during training:
77
 
78
  | Training Loss | Epoch | Step | Validation Loss | F1 | Precision | Recall | Support |
79
  |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
80
- | 0.5819 | 0.37 | 500 | 0.6020 | 0.6493 | 0.5311 | 0.8352 | None |
81
- | 0.5611 | 0.74 | 1000 | 0.5814 | 0.6648 | 0.5561 | 0.8263 | None |
82
- | 0.5467 | 1.11 | 1500 | 0.5570 | 0.6744 | 0.5878 | 0.7911 | None |
83
- | 0.5345 | 1.48 | 2000 | 0.5228 | 0.6756 | 0.6470 | 0.7068 | None |
84
- | 0.5299 | 1.85 | 2500 | 0.5283 | 0.6853 | 0.6291 | 0.7526 | None |
85
- | 0.5054 | 2.22 | 3000 | 0.5395 | 0.6850 | 0.6159 | 0.7717 | None |
86
- | 0.5052 | 2.59 | 3500 | 0.5236 | 0.6876 | 0.6450 | 0.7362 | None |
87
- | 0.5033 | 2.96 | 4000 | 0.5338 | 0.6899 | 0.6202 | 0.7774 | None |
88
- | 0.4839 | 3.32 | 4500 | 0.5339 | 0.6922 | 0.6292 | 0.7691 | None |
89
- | 0.4846 | 3.69 | 5000 | 0.5309 | 0.6930 | 0.6382 | 0.7580 | None |
90
 
91
 
92
  ### Framework versions
 
23
  metrics:
24
  - name: F1
25
  type: f1
26
+ value: 0.6829268292682927
27
  - name: Precision
28
  type: precision
29
+ value: 0.6481911715897777
30
  - name: Recall
31
  type: recall
32
+ value: 0.7215961573988546
33
  ---
34
 
35
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
39
 
40
  This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
41
  It achieves the following results on the evaluation set:
42
+ - Loss: 0.5679
43
+ - F1: 0.6829
44
+ - Precision: 0.6482
45
+ - Recall: 0.7216
46
  - Support: None
47
 
48
  ## Model description
 
62
  ### Training hyperparameters
63
 
64
  The following hyperparameters were used during training:
65
+ - learning_rate: 5e-05
66
  - train_batch_size: 32
67
  - eval_batch_size: 32
68
  - seed: 42
 
77
 
78
  | Training Loss | Epoch | Step | Validation Loss | F1 | Precision | Recall | Support |
79
  |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
80
+ | 0.5606 | 0.37 | 500 | 0.5393 | 0.6786 | 0.6092 | 0.7659 | None |
81
+ | 0.5414 | 0.74 | 1000 | 0.5770 | 0.6845 | 0.5747 | 0.8463 | None |
82
+ | 0.5178 | 1.11 | 1500 | 0.5384 | 0.6888 | 0.6069 | 0.7962 | None |
83
+ | 0.4777 | 1.48 | 2000 | 0.5407 | 0.6926 | 0.6266 | 0.7742 | None |
84
+ | 0.4752 | 1.85 | 2500 | 0.5372 | 0.6960 | 0.6138 | 0.8036 | None |
85
+ | 0.3952 | 2.22 | 3000 | 0.5873 | 0.6892 | 0.6155 | 0.7829 | None |
86
+ | 0.4008 | 2.59 | 3500 | 0.5679 | 0.6829 | 0.6482 | 0.7216 | None |
 
 
 
87
 
88
 
89
  ### Framework versions
config.toml CHANGED
@@ -1,5 +1,5 @@
1
  [experiment]
2
- name = "binary-32"
3
  type = "binary"
4
 
5
 
@@ -19,7 +19,7 @@ revision = "2caf9ebc5b275737c95f8bb16953288107a7131c"
19
  num_train_epochs = 30
20
  warmup_steps = 0
21
  lr_scheduler_type = "linear"
22
- learning_rate = 1e-5
23
  per_device_train_batch_size = 32
24
  per_device_eval_batch_size = 32
25
  gradient_accumulation_steps = 2
 
1
  [experiment]
2
+ name = "binary-33"
3
  type = "binary"
4
 
5
 
 
19
  num_train_epochs = 30
20
  warmup_steps = 0
21
  lr_scheduler_type = "linear"
22
+ learning_rate = 5e-5
23
  per_device_train_batch_size = 32
24
  per_device_eval_batch_size = 32
25
  gradient_accumulation_steps = 2
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffa9b265fc5a19baa463bee60e9074ec131fe038226868e561b81b1be06a3607
3
  size 313992076
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9220848386970aac9b2da72bbb5578de2bb93048fe6f3526b02d7e634df83bca
3
  size 313992076
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc6a77945690f1f63f16259eb40d607f54a53c733180aa51a00d74f6362b8f6f
3
  size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75405e81cc63a82a054f4fcfa9912126203b652f08c0eabc3a7dfac51214aa66
3
  size 4091