AnonymousCS
/

bert-chinese-weibo-90p-v3

@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [google-bert/bert-base-chinese](https://huggingface.co/google-bert/bert-base-chinese) on an unspecified dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.3019
-- Accuracy: 0.9429
 ## Model description
@@ -50,15 +50,15 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
-| No log        | 1.0   | 61   | 0.2961          | 0.9398   |
-| 0.0152        | 2.0   | 122  | 0.3069          | 0.9398   |
-| 0.0152        | 3.0   | 183  | 0.2982          | 0.9450   |
-| 0.0174        | 4.0   | 244  | 0.3019          | 0.9429   |
 ### Framework versions
-- Transformers 4.57.1
-- Pytorch 2.8.0+cu126
 - Datasets 4.0.0
-- Tokenizers 0.22.1

 This model is a fine-tuned version of [google-bert/bert-base-chinese](https://huggingface.co/google-bert/bert-base-chinese) on an unspecified dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.3092
+- Accuracy: 0.9450
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
+| No log        | 1.0   | 61   | 0.2739          | 0.9356   |
+| 0.0214        | 2.0   | 122  | 0.2764          | 0.9377   |
+| 0.0214        | 3.0   | 183  | 0.2956          | 0.9470   |
+| 0.0163        | 4.0   | 244  | 0.3092          | 0.9450   |
 ### Framework versions
+- Transformers 5.0.0
+- Pytorch 2.9.0+cu126
 - Datasets 4.0.0
+- Tokenizers 0.22.2

config.json CHANGED Viewed

@@ -1,16 +1,20 @@
 {
   "architectures": [
     "BertForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
   "classifier_dropout": null,
   "directionality": "bidi",
   "dtype": "float32",
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "model_type": "bert",
@@ -22,10 +26,10 @@
   "pooler_num_fc_layers": 3,
   "pooler_size_per_head": 128,
   "pooler_type": "first_token_transform",
-  "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
-  "transformers_version": "4.57.1",
   "type_vocab_size": 2,
-  "use_cache": true,
   "vocab_size": 21128
 }

 {
+  "add_cross_attention": false,
   "architectures": [
     "BertForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": null,
   "classifier_dropout": null,
   "directionality": "bidi",
   "dtype": "float32",
+  "eos_token_id": null,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "initializer_range": 0.02,
   "intermediate_size": 3072,
+  "is_decoder": false,
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "model_type": "bert",
   "pooler_num_fc_layers": 3,
   "pooler_size_per_head": 128,
   "pooler_type": "first_token_transform",
   "problem_type": "single_label_classification",
+  "tie_word_embeddings": true,
+  "transformers_version": "5.0.0",
   "type_vocab_size": 2,
+  "use_cache": false,
   "vocab_size": 21128
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1f78983d7d9660ebb41a6ba2a189c7ca5df06b8d6bd66793b20dd7e7ea8fdcf4
-size 409100240

 version https://git-lfs.github.com/spec/v1
+oid sha256:e921c91ce95aab04e2c52610903d8de0956e30385cce3f841a40b756c8ba7a51
+size 409100216

tokenizer_config.json CHANGED Viewed

@@ -1,50 +1,8 @@
 {
-  "added_tokens_decoder": {
-    "0": {
-      "content": "[PAD]",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "100": {
-      "content": "[UNK]",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "101": {
-      "content": "[CLS]",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "102": {
-      "content": "[SEP]",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "103": {
-      "content": "[MASK]",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    }
-  },
-  "clean_up_tokenization_spaces": false,
   "cls_token": "[CLS]",
   "do_lower_case": false,
-  "extra_special_tokens": {},
   "mask_token": "[MASK]",
   "model_max_length": 512,
   "pad_token": "[PAD]",

 {
+  "backend": "tokenizers",
   "cls_token": "[CLS]",
   "do_lower_case": false,
+  "is_local": false,
   "mask_token": "[MASK]",
   "model_max_length": 512,
   "pad_token": "[PAD]",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a2b700fe428a7228137401f4f80420d0a94361075a970e148a88778565878c2c
-size 5841

 version https://git-lfs.github.com/spec/v1
+oid sha256:88cdeda8b8fd59ab3632f21a883f1c0d78ba345e7b466489e9fbcc4af4ec98c7
+size 5201