Training in progress, epoch 1
Browse files
- config.json +32 -0
- model.safetensors +3 -0
- runs/Jul09_12-52-58_DESKTOP-T04P4ED/events.out.tfevents.1720518779.DESKTOP-T04P4ED.19964.0 +3 -0
- runs/Jul09_12-53-49_DESKTOP-T04P4ED/events.out.tfevents.1720518830.DESKTOP-T04P4ED.19964.1 +3 -0
- runs/Jul09_12-57-12_DESKTOP-T04P4ED/events.out.tfevents.1720519032.DESKTOP-T04P4ED.19964.2 +3 -0
- runs/Jul09_13-15-27_DESKTOP-T04P4ED/events.out.tfevents.1720520127.DESKTOP-T04P4ED.19964.3 +3 -0
- runs/Jul09_13-25-30_DESKTOP-T04P4ED/events.out.tfevents.1720520731.DESKTOP-T04P4ED.19964.4 +3 -0
- runs/Jul09_13-38-05_DESKTOP-T04P4ED/events.out.tfevents.1720521486.DESKTOP-T04P4ED.19964.5 +3 -0
- runs/Jul09_13-42-04_DESKTOP-T04P4ED/events.out.tfevents.1720521725.DESKTOP-T04P4ED.19964.6 +3 -0
- runs/Jul09_13-43-03_DESKTOP-T04P4ED/events.out.tfevents.1720521783.DESKTOP-T04P4ED.19964.7 +3 -0
- runs/Jul09_13-47-10_DESKTOP-T04P4ED/events.out.tfevents.1720522031.DESKTOP-T04P4ED.19964.8 +3 -0
- runs/Jul09_13-48-57_DESKTOP-T04P4ED/events.out.tfevents.1720522138.DESKTOP-T04P4ED.19964.9 +3 -0
- runs/Jul09_13-54-07_DESKTOP-T04P4ED/events.out.tfevents.1720522448.DESKTOP-T04P4ED.19964.10 +3 -0
- runs/Jul09_14-55-56_DESKTOP-T04P4ED/events.out.tfevents.1720526157.DESKTOP-T04P4ED.19964.11 +3 -0
- runs/Jul09_15-12-14_DESKTOP-T04P4ED/events.out.tfevents.1720527135.DESKTOP-T04P4ED.19964.12 +3 -0
- runs/Jul09_15-14-40_DESKTOP-T04P4ED/events.out.tfevents.1720527280.DESKTOP-T04P4ED.13344.0 +3 -0
- runs/Jul09_15-17-35_DESKTOP-T04P4ED/events.out.tfevents.1720527456.DESKTOP-T04P4ED.13344.1 +3 -0
- special_tokens_map.json +7 -0
- tokenizer.json +0 -0
- tokenizer_config.json +57 -0
- training_args.bin +3 -0
- vocab.txt +0 -0
config.json
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "ai-forever/ruElectra-medium",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"ElectraForSequenceClassification"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"classifier_dropout": null,
|
| 8 |
+
"embedding_size": 576,
|
| 9 |
+
"generator_size": "0.25",
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 576,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 2304,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "electra",
|
| 18 |
+
"num_attention_heads": 9,
|
| 19 |
+
"num_hidden_layers": 12,
|
| 20 |
+
"pad_token_id": 0,
|
| 21 |
+
"position_embedding_type": "absolute",
|
| 22 |
+
"problem_type": "single_label_classification",
|
| 23 |
+
"summary_activation": "gelu",
|
| 24 |
+
"summary_last_dropout": 0.1,
|
| 25 |
+
"summary_type": "first",
|
| 26 |
+
"summary_use_proj": true,
|
| 27 |
+
"torch_dtype": "float32",
|
| 28 |
+
"transformers_version": "4.42.3",
|
| 29 |
+
"type_vocab_size": 2,
|
| 30 |
+
"use_cache": true,
|
| 31 |
+
"vocab_size": 64000
|
| 32 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a974f91186cce7ed440db927e10511c27d9a18adaee3ad1c64555adef8c4e8a
|
| 3 |
+
size 341465432
|
runs/Jul09_12-52-58_DESKTOP-T04P4ED/events.out.tfevents.1720518779.DESKTOP-T04P4ED.19964.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4444210f2d7a225410ea1c54f7bab2c718433e8582c4fd680c77b3ba02dd56fb
|
| 3 |
+
size 5578
|
runs/Jul09_12-53-49_DESKTOP-T04P4ED/events.out.tfevents.1720518830.DESKTOP-T04P4ED.19964.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:103adcd9c19505f7fe558273358e7c3fa1aa9d775fe02281633735f4c4032b19
|
| 3 |
+
size 5578
|
runs/Jul09_12-57-12_DESKTOP-T04P4ED/events.out.tfevents.1720519032.DESKTOP-T04P4ED.19964.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab8d34fcea1bed4244558f847ddd513521a1a1fe5ed14bf89cd1bc3d84494b8a
|
| 3 |
+
size 5578
|
runs/Jul09_13-15-27_DESKTOP-T04P4ED/events.out.tfevents.1720520127.DESKTOP-T04P4ED.19964.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b1ebef7c43cd778129893783ff8c5c94d95a518badd6cf866e33a1ffd974f497
|
| 3 |
+
size 5578
|
runs/Jul09_13-25-30_DESKTOP-T04P4ED/events.out.tfevents.1720520731.DESKTOP-T04P4ED.19964.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97981115834d5d71a169e3a42da09369f7e6bb10a165cfc0505df0c57d5406ff
|
| 3 |
+
size 5578
|
runs/Jul09_13-38-05_DESKTOP-T04P4ED/events.out.tfevents.1720521486.DESKTOP-T04P4ED.19964.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2459e8d177383ab1a80e6cf44c6ace52787719bd344416b89d435b0902587ce
|
| 3 |
+
size 5578
|
runs/Jul09_13-42-04_DESKTOP-T04P4ED/events.out.tfevents.1720521725.DESKTOP-T04P4ED.19964.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b745ea00fb92af27d56a884dc694b5eeda2dbcd64639d50f6746318e3404f70
|
| 3 |
+
size 5576
|
runs/Jul09_13-43-03_DESKTOP-T04P4ED/events.out.tfevents.1720521783.DESKTOP-T04P4ED.19964.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6fb5b01ed57e86c63fff4d9c3080ab4554d539948fffec02de0a8d81e5d611eb
|
| 3 |
+
size 5576
|
runs/Jul09_13-47-10_DESKTOP-T04P4ED/events.out.tfevents.1720522031.DESKTOP-T04P4ED.19964.8
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99044a5255b18623d69d6a9da04a3c594e565903e5d3f88be0e69c6a423b351f
|
| 3 |
+
size 5576
|
runs/Jul09_13-48-57_DESKTOP-T04P4ED/events.out.tfevents.1720522138.DESKTOP-T04P4ED.19964.9
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb84f5f920dcebbd396f2a7a60c5f268e943b5b492b3b61d98d3a1d55cc757f3
|
| 3 |
+
size 5627
|
runs/Jul09_13-54-07_DESKTOP-T04P4ED/events.out.tfevents.1720522448.DESKTOP-T04P4ED.19964.10
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca46ad4b89eeeeeeb71f21a52ac7ff16605c1ec93bfa80ef4b24cee18b37d16a
|
| 3 |
+
size 5573
|
runs/Jul09_14-55-56_DESKTOP-T04P4ED/events.out.tfevents.1720526157.DESKTOP-T04P4ED.19964.11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45354202f38b3460008480849e93f1815112de18fc8718dabfaaa953146a37eb
|
| 3 |
+
size 6917
|
runs/Jul09_15-12-14_DESKTOP-T04P4ED/events.out.tfevents.1720527135.DESKTOP-T04P4ED.19964.12
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2d32070d383b51110e4409381200a1ec1296b9df10b8419ce13fa62d8c5713e
|
| 3 |
+
size 4961
|
runs/Jul09_15-14-40_DESKTOP-T04P4ED/events.out.tfevents.1720527280.DESKTOP-T04P4ED.13344.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1dbea41b855005053c6d1bbdd20ac06e822bcb2ddafaf80a899d0b15ce16879a
|
| 3 |
+
size 4961
|
runs/Jul09_15-17-35_DESKTOP-T04P4ED/events.out.tfevents.1720527456.DESKTOP-T04P4ED.13344.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d6b70e64c50f3802d538a08d6b56ef3011ae1eda258d884de519f5901b73d8d
|
| 3 |
+
size 5755
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": "[CLS]",
|
| 3 |
+
"mask_token": "[MASK]",
|
| 4 |
+
"pad_token": "[PAD]",
|
| 5 |
+
"sep_token": "[SEP]",
|
| 6 |
+
"unk_token": "[UNK]"
|
| 7 |
+
}
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "[PAD]",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "[UNK]",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "[CLS]",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "[SEP]",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"4": {
|
| 36 |
+
"content": "[MASK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"clean_up_tokenization_spaces": true,
|
| 45 |
+
"cls_token": "[CLS]",
|
| 46 |
+
"do_basic_tokenize": true,
|
| 47 |
+
"do_lower_case": true,
|
| 48 |
+
"mask_token": "[MASK]",
|
| 49 |
+
"model_max_length": 1000000000000000019884624838656,
|
| 50 |
+
"never_split": null,
|
| 51 |
+
"pad_token": "[PAD]",
|
| 52 |
+
"sep_token": "[SEP]",
|
| 53 |
+
"strip_accents": null,
|
| 54 |
+
"tokenize_chinese_chars": true,
|
| 55 |
+
"tokenizer_class": "ElectraTokenizer",
|
| 56 |
+
"unk_token": "[UNK]"
|
| 57 |
+
}
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a273abd72d75a68ce3eb477bdb403d82331c89162e5e0543dc066bdb420fa7ca
|
| 3 |
+
size 5112
|
vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|