Upload 9 files

Browse files

Files changed (9) hide show

models/o3-mini_20250218/README.md +199 -0
models/o3-mini_20250218/added_tokens.json +3 -0
models/o3-mini_20250218/config.json +150 -0
models/o3-mini_20250218/model.safetensors +3 -0
models/o3-mini_20250218/special_tokens_map.json +15 -0
models/o3-mini_20250218/spm.model +3 -0
models/o3-mini_20250218/tokenizer.json +0 -0
models/o3-mini_20250218/tokenizer_config.json +60 -0
models/o3-mini_20250218/training_args.bin +3 -0

models/o3-mini_20250218/README.md ADDED Viewed

	@@ -0,0 +1,199 @@

+---
+license: bsd-2-clause
+---
+### Dataset: o3-mini_20250218
+```text
+DatasetDict({
+    test: Dataset({
+        features: ['text', 'tokens', 'adj', 'adv', 'det', 'enc', 'func', 'misc', 'ner1', 'ner2', 'noun', 'pronoun', 'punct', 'verb', 'wh'],
+        num_rows: 2571
+    })
+    train: Dataset({
+        features: ['text', 'tokens', 'adj', 'adv', 'det', 'enc', 'func', 'misc', 'ner1', 'ner2', 'noun', 'pronoun', 'punct', 'verb', 'wh'],
+        num_rows: 23389
+    })
+    validation: Dataset({
+        features: ['text', 'tokens', 'adj', 'adv', 'det', 'enc', 'func', 'misc', 'ner1', 'ner2', 'noun', 'pronoun', 'punct', 'verb', 'wh'],
+        num_rows: 2599
+    })
+})
+```
+### Classification Reports
+```text
+----- adj classification report -----
+              precision    recall  f1-score   support
+          JJ       0.90      0.87      0.88      3187
+         JJR       0.95      0.88      0.91       162
+         JJS       0.88      0.84      0.86       102
+           O       0.99      0.99      0.99     29414
+    accuracy                           0.98     32865
+   macro avg       0.93      0.89      0.91     32865
+weighted avg       0.98      0.98      0.98     32865
+----- adv classification report -----
+              precision    recall  f1-score   support
+           O       0.99      0.99      0.99     30468
+          RB       0.91      0.91      0.91      2157
+         RBR       0.89      0.90      0.89       146
+         RBS       0.80      0.79      0.79        94
+    accuracy                           0.99     32865
+   macro avg       0.90      0.90      0.90     32865
+weighted avg       0.99      0.99      0.99     32865
+----- det classification report -----
+              precision    recall  f1-score   support
+          DT       0.96      0.95      0.96      4447
+          EX       0.96      0.90      0.93        82
+           O       0.99      0.99      0.99     28163
+         PDT       0.63      0.55      0.59       173
+    accuracy                           0.99     32865
+   macro avg       0.89      0.85      0.87     32865
+weighted avg       0.99      0.99      0.99     32865
+----- enc classification report -----
+              precision    recall  f1-score   support
+     BRACKET       0.79      0.89      0.84       385
+           O       0.99      0.99      0.99     31944
+       QUOTE       0.75      0.76      0.76       536
+    accuracy                           0.99     32865
+   macro avg       0.85      0.88      0.86     32865
+weighted avg       0.99      0.99      0.99     32865
+----- func classification report -----
+              precision    recall  f1-score   support
+          CC       0.98      0.99      0.98      1153
+          IN       0.97      0.98      0.97      3805
+           O       0.99      0.99      0.99     26444
+          RP       0.87      0.77      0.82       373
+          TO       1.00      0.99      0.99       871
+          UH       0.77      0.68      0.72       219
+    accuracy                           0.99     32865
+   macro avg       0.93      0.90      0.91     32865
+weighted avg       0.99      0.99      0.99     32865
+----- misc classification report -----
+              precision    recall  f1-score   support
+           $       0.92      0.86      0.89        64
+         ADD       0.77      0.71      0.74       719
+          CD       0.89      0.89      0.89       558
+       EMOJI       1.00      0.73      0.85        15
+           O       0.99      0.99      0.99     30608
+        TIME       0.88      0.90      0.89       901
+    accuracy                           0.98     32865
+   macro avg       0.91      0.85      0.87     32865
+weighted avg       0.98      0.98      0.98     32865
+----- ner1 classification report -----
+              precision    recall  f1-score   support
+       B-GPE       0.87      0.90      0.89       473
+       B-ORG       0.86      0.82      0.84       424
+       B-PER       0.95      0.93      0.94       649
+       I-GPE       0.85      0.90      0.87       147
+       I-ORG       0.85      0.82      0.83       310
+       I-PER       0.96      0.96      0.96       261
+           O       0.99      0.99      0.99     30601
+    accuracy                           0.99     32865
+   macro avg       0.90      0.90      0.90     32865
+weighted avg       0.99      0.99      0.99     32865
+----- ner2 classification report -----
+              precision    recall  f1-score   support
+     B-EVENT       0.62      0.52      0.56       621
+       B-LOC       0.78      0.78      0.78       909
+     I-EVENT       0.54      0.32      0.40      1033
+       I-LOC       0.73      0.66      0.70       597
+           O       0.96      0.98      0.97     29705
+    accuracy                           0.94     32865
+   macro avg       0.73      0.65      0.68     32865
+weighted avg       0.93      0.94      0.93     32865
+----- noun classification report -----
+              precision    recall  f1-score   support
+          NN       0.96      0.96      0.96      4400
+         NNP       0.94      0.96      0.95      2410
+        NNPS       0.67      0.72      0.69        61
+         NNS       0.97      0.97      0.97      1698
+           O       0.99      0.99      0.99     24296
+    accuracy                           0.98     32865
+   macro avg       0.91      0.92      0.91     32865
+weighted avg       0.98      0.98      0.98     32865
+----- pronoun classification report -----
+              precision    recall  f1-score   support
+           O       1.00      1.00      1.00     29952
+         POS       0.97      0.97      0.97       154
+         PRP       0.97      0.97      0.97      2139
+        PRP$       0.99      0.98      0.99       620
+    accuracy                           1.00     32865
+   macro avg       0.98      0.98      0.98     32865
+weighted avg       1.00      1.00      1.00     32865
+----- punct classification report -----
+              precision    recall  f1-score   support
+       COLON       0.99      0.95      0.97       201
+       COMMA       0.99      1.00      0.99      1454
+     EXCLAIM       0.99      0.97      0.98       107
+        HYPH       0.96      0.95      0.95       321
+          LS       0.57      0.53      0.55        15
+           O       1.00      1.00      1.00     28545
+      PERIOD       0.98      0.99      0.99      2022
+    QUESTION       0.99      0.99      0.99       156
+         SEP       0.75      0.41      0.53        44
+    accuracy                           1.00     32865
+   macro avg       0.91      0.87      0.88     32865
+weighted avg       1.00      1.00      1.00     32865
+----- verb classification report -----
+              precision    recall  f1-score   support
+          MD       1.00      0.98      0.99       527
+           O       1.00      0.99      0.99     26452
+          VB       0.95      0.94      0.94      1540
+         VBD       0.96      0.96      0.96      1330
+         VBG       0.94      0.96      0.95       625
+         VBN       0.88      0.93      0.90       766
+         VBP       0.88      0.92      0.90       766
+         VBZ       0.99      0.98      0.98       859
+    accuracy                           0.98     32865
+   macro avg       0.95      0.96      0.95     32865
+weighted avg       0.99      0.98      0.98     32865
+----- wh classification report -----
+              precision    recall  f1-score   support
+           O       0.99      1.00      0.99     32019
+         WDT       0.75      0.57      0.65       186
+          WP       0.84      0.71      0.77       164
+         WP$       0.62      0.58      0.60       238
+         WRB       0.94      0.72      0.81       258
+    accuracy                           0.99     32865
+   macro avg       0.83      0.72      0.77     32865
+weighted avg       0.99      0.99      0.99     32865
+```

models/o3-mini_20250218/added_tokens.json ADDED Viewed

	@@ -0,0 +1,3 @@

+{
+  "[MASK]": 128000
+}

models/o3-mini_20250218/config.json ADDED Viewed

	@@ -0,0 +1,150 @@

+{
+  "_name_or_path": "microsoft/deberta-v3-base",
+  "architectures": [
+    "MultiHeadModel"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label_maps": {
+    "adj": [
+      "JJ",
+      "JJS",
+      "JJR",
+      "O"
+    ],
+    "adv": [
+      "RBR",
+      "RB",
+      "RBS",
+      "O"
+    ],
+    "det": [
+      "PDT",
+      "DT",
+      "EX",
+      "O"
+    ],
+    "enc": [
+      "QUOTE",
+      "TICK",
+      "BRACKET",
+      "O"
+    ],
+    "func": [
+      "UH",
+      "RP",
+      "TO",
+      "O",
+      "IN",
+      "CC"
+    ],
+    "misc": [
+      "EMOJI",
+      "TIME",
+      "ADD",
+      "CD",
+      "O",
+      "$"
+    ],
+    "ner1": [
+      "I-ORG",
+      "B-ORG",
+      "I-GPE",
+      "B-PER",
+      "O",
+      "B-GPE",
+      "I-PER"
+    ],
+    "ner2": [
+      "I-LOC",
+      "B-LOC",
+      "I-EVENT",
+      "O",
+      "B-EVENT"
+    ],
+    "noun": [
+      "NNS",
+      "O",
+      "NNP",
+      "NN",
+      "NNPS"
+    ],
+    "pronoun": [
+      "PRP$",
+      "PRP",
+      "POS",
+      "O"
+    ],
+    "punct": [
+      "QUESTION",
+      "LS",
+      "COMMA",
+      "EXCLAIM",
+      "COLON",
+      "PERIOD",
+      "SEP",
+      "O",
+      "HYPH"
+    ],
+    "verb": [
+      "MD",
+      "VBG",
+      "O",
+      "VB",
+      "VBP",
+      "VBZ",
+      "VBN",
+      "VBD"
+    ],
+    "wh": [
+      "WP$",
+      "O",
+      "WP",
+      "WRB",
+      "WDT"
+    ]
+  },
+  "layer_norm_eps": 1e-07,
+  "legacy": true,
+  "max_position_embeddings": 512,
+  "max_relative_positions": -1,
+  "model_type": "deberta-v2",
+  "norm_rel_ebd": "layer_norm",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "num_labels_dict": {
+    "adj": 4,
+    "adv": 4,
+    "det": 4,
+    "enc": 4,
+    "func": 6,
+    "misc": 6,
+    "ner1": 7,
+    "ner2": 5,
+    "noun": 5,
+    "pronoun": 4,
+    "punct": 9,
+    "verb": 8,
+    "wh": 5
+  },
+  "pad_token_id": 0,
+  "pooler_dropout": 0,
+  "pooler_hidden_act": "gelu",
+  "pooler_hidden_size": 768,
+  "pos_att_type": [
+    "p2c",
+    "c2p"
+  ],
+  "position_biased_input": false,
+  "position_buckets": 256,
+  "relative_attention": true,
+  "share_att_key": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.2",
+  "type_vocab_size": 0,
+  "vocab_size": 128100
+}

models/o3-mini_20250218/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7fc80d3a8526faa41c3c79c97c87d72ca6f01fb6ef3812cd3a7764787b9949f
+size 735571028

models/o3-mini_20250218/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "bos_token": "[CLS]",
+  "cls_token": "[CLS]",
+  "eos_token": "[SEP]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

models/o3-mini_20250218/spm.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
+size 2464616

models/o3-mini_20250218/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

models/o3-mini_20250218/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,60 @@

+{
+  "add_prefix_space": true,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "128000": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "[CLS]",
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "eos_token": "[SEP]",
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "sp_model_kwargs": {},
+  "split_by_punct": false,
+  "tokenizer_class": "DebertaV2Tokenizer",
+  "unk_token": "[UNK]",
+  "vocab_type": "spm"
+}

models/o3-mini_20250218/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:393cbff7e2678a2b8c4e3190f5be4af291a4d8e9e2ca5376460939e460fa5ce5
+size 5304