devagonal committed on
Commit
39bb026
·
verified ·
1 Parent(s): bd42fb7

End of training

Browse files
Files changed (4) hide show
  1. README.md +7 -7
  2. config.json +9 -4
  3. model.safetensors +2 -2
  4. training_args.bin +2 -2
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
  library_name: transformers
3
  license: apache-2.0
4
- base_model: bert-base-uncased
5
  tags:
6
  - generated_from_trainer
7
  metrics:
@@ -19,9 +19,9 @@ should probably proofread and complete it, then remove this comment. -->
19
 
20
  # bert-f1-durga-muhammad
21
 
22
- This model is a fine-tuned version of [bert-base-uncased](https://huggingface.co/bert-base-uncased) on the None dataset.
23
  It achieves the following results on the evaluation set:
24
- - Loss: 0.0313
25
  - Accuracy: 0.995
26
  - Precision: 0.995
27
  - Recall: 0.995
@@ -56,13 +56,13 @@ The following hyperparameters were used during training:
56
 
57
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
58
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:---------:|:------:|:-----:|
59
- | 0.3962 | 1.2 | 60 | 0.0549 | 0.995 | 0.995 | 0.995 | 0.995 |
60
- | 0.0345 | 2.4 | 120 | 0.0314 | 0.995 | 0.995 | 0.995 | 0.995 |
61
 
62
 
63
  ### Framework versions
64
 
65
- - Transformers 4.45.2
66
  - Pytorch 2.5.0+cu121
67
  - Datasets 3.0.2
68
- - Tokenizers 0.20.1
 
1
  ---
2
  library_name: transformers
3
  license: apache-2.0
4
+ base_model: google-bert/bert-base-multilingual-cased
5
  tags:
6
  - generated_from_trainer
7
  metrics:
 
19
 
20
  # bert-f1-durga-muhammad
21
 
22
+ This model is a fine-tuned version of [google-bert/bert-base-multilingual-cased](https://huggingface.co/google-bert/bert-base-multilingual-cased) on the None dataset.
23
  It achieves the following results on the evaluation set:
24
+ - Loss: 0.0281
25
  - Accuracy: 0.995
26
  - Precision: 0.995
27
  - Recall: 0.995
 
56
 
57
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
58
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:---------:|:------:|:-----:|
59
+ | 0.4433 | 1.2 | 60 | 0.2100 | 0.945 | 0.945 | 0.945 | 0.945 |
60
+ | 0.0858 | 2.4 | 120 | 0.0321 | 0.995 | 0.995 | 0.995 | 0.995 |
61
 
62
 
63
  ### Framework versions
64
 
65
+ - Transformers 4.44.2
66
  - Pytorch 2.5.0+cu121
67
  - Datasets 3.0.2
68
+ - Tokenizers 0.19.1
config.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
- "_name_or_path": "bert-base-uncased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
- "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
@@ -17,11 +17,16 @@
17
  "num_attention_heads": 12,
18
  "num_hidden_layers": 12,
19
  "pad_token_id": 0,
 
 
 
 
 
20
  "position_embedding_type": "absolute",
21
  "problem_type": "single_label_classification",
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.45.2",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
- "vocab_size": 30522
27
  }
 
1
  {
2
+ "_name_or_path": "google-bert/bert-base-multilingual-cased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
+ "directionality": "bidi",
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
 
17
  "num_attention_heads": 12,
18
  "num_hidden_layers": 12,
19
  "pad_token_id": 0,
20
+ "pooler_fc_size": 768,
21
+ "pooler_num_attention_heads": 12,
22
+ "pooler_num_fc_layers": 3,
23
+ "pooler_size_per_head": 128,
24
+ "pooler_type": "first_token_transform",
25
  "position_embedding_type": "absolute",
26
  "problem_type": "single_label_classification",
27
  "torch_dtype": "float32",
28
+ "transformers_version": "4.44.2",
29
  "type_vocab_size": 2,
30
  "use_cache": true,
31
+ "vocab_size": 119547
32
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20382e9b8b6cc41d647b8e8ea58f8e6bc9db532718d69ec5989098c66ed5f0af
3
- size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daf381230470913999b9ddfca697ab1e0b1fc50db21850d3823e13d9774ad328
3
+ size 711443456
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07aebc5b3d196d036f02f131a1e7cd14e28652993094a0c1e6adce5a9da77c09
3
- size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f754167c4e13a0f6c12429afaaa74def00ddf249463e3d7446cd3d413998da12
3
+ size 5176