Sandrro committed on
Commit
2770f0a
·
1 Parent(s): add8058

Training in progress, epoch 1

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "cointegrated/rubert-tiny2",
3
+ "architectures": [
4
+ "BertForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "emb_size": 312,
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 312,
13
+ "id2label": {
14
+ "0": "\u0414\u043e\u043c",
15
+ "1": "\u0422\u0435\u0440\u0440\u0438\u0442\u043e\u0440\u0438\u044f \u0421\u0430\u043d\u043a\u0442-\u041f\u0435\u0442\u0435\u0440\u0431\u0443\u0440\u0433\u0430",
16
+ "10": "\u041a\u043e\u043c\u043c\u0435\u0440\u0447\u0435\u0441\u043a\u043e\u0435 \u0441\u0442\u0440\u043e\u0438\u0442\u0435\u043b\u044c\u0441\u0442\u0432\u043e",
17
+ "11": "\u041e\u0431\u0449\u0435\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0442\u0440\u0430\u043d\u0441\u043f\u043e\u0440\u0442",
18
+ "12": "\u041e\u0441\u0442\u0430\u043d\u043e\u0432\u043a\u0430 \u043e\u0431\u0449\u0435\u0441\u0442\u0432\u0435\u043d\u043d\u043e\u0433\u043e \u0442\u0440\u0430\u043d\u0441\u043f\u043e\u0440\u0442\u0430",
19
+ "13": "\u041c\u043e\u0441\u0442",
20
+ "14": "\u0421\u0442\u0440\u043e\u0438\u0442\u0435\u043b\u044c\u043d\u0430\u044f \u043f\u043b\u043e\u0449\u0430\u0434\u043a\u0430",
21
+ "2": "\u0414\u0432\u043e\u0440",
22
+ "3": "\u0423\u043b\u0438\u0446\u0430",
23
+ "4": "\u041f\u0430\u0440\u043a, \u0441\u0430\u0434, \u0431\u0443\u043b\u044c\u0432\u0430\u0440, \u0441\u043a\u0432\u0435\u0440",
24
+ "5": "\u0420\u0435\u043a\u043b\u0430\u043c\u043d\u044b\u0435 \u0438\u043b\u0438 \u0438\u043d\u0444\u043e\u0440\u043c\u0430\u0446\u0438\u043e\u043d\u043d\u044b\u0435 \u043a\u043e\u043d\u0441\u0442\u0440\u0443\u043a\u0446\u0438\u0438",
25
+ "6": "\u0421\u043e\u043e\u0440\u0443\u0436\u0435\u043d\u0438\u0435",
26
+ "7": "\u041a\u0432\u0430\u0440\u0442\u0438\u0440\u0430",
27
+ "8": "\u0412\u043e\u0434\u043d\u044b\u0439 \u043e\u0431\u044a\u0435\u043a\u0442",
28
+ "9": "\u0411\u044e\u0434\u0436\u0435\u0442\u043d\u043e\u0435 \u0443\u0447\u0440\u0435\u0436\u0434\u0435\u043d\u0438\u0435"
29
+ },
30
+ "initializer_range": 0.02,
31
+ "intermediate_size": 600,
32
+ "label2id": {
33
+ "\u0411\u044e\u0434\u0436\u0435\u0442\u043d\u043e\u0435 \u0443\u0447\u0440\u0435\u0436\u0434\u0435\u043d\u0438\u0435": "9",
34
+ "\u0412\u043e\u0434\u043d\u044b\u0439 \u043e\u0431\u044a\u0435\u043a\u0442": "8",
35
+ "\u0414\u0432\u043e\u0440": "2",
36
+ "\u0414\u043e\u043c": "0",
37
+ "\u041a\u0432\u0430\u0440\u0442\u0438\u0440\u0430": "7",
38
+ "\u041a\u043e\u043c\u043c\u0435\u0440\u0447\u0435\u0441\u043a\u043e\u0435 \u0441\u0442\u0440\u043e\u0438\u0442\u0435\u043b\u044c\u0441\u0442\u0432\u043e": "10",
39
+ "\u041c\u043e\u0441\u0442": "13",
40
+ "\u041e\u0431\u0449\u0435\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0442\u0440\u0430\u043d\u0441\u043f\u043e\u0440\u0442": "11",
41
+ "\u041e\u0441\u0442\u0430\u043d\u043e\u0432\u043a\u0430 \u043e\u0431\u0449\u0435\u0441\u0442\u0432\u0435\u043d\u043d\u043e\u0433\u043e \u0442\u0440\u0430\u043d\u0441\u043f\u043e\u0440\u0442\u0430": "12",
42
+ "\u041f\u0430\u0440\u043a, \u0441\u0430\u0434, \u0431\u0443\u043b\u044c\u0432\u0430\u0440, \u0441\u043a\u0432\u0435\u0440": "4",
43
+ "\u0420\u0435\u043a\u043b\u0430\u043c\u043d\u044b\u0435 \u0438\u043b\u0438 \u0438\u043d\u0444\u043e\u0440\u043c\u0430\u0446\u0438\u043e\u043d\u043d\u044b\u0435 \u043a\u043e\u043d\u0441\u0442\u0440\u0443\u043a\u0446\u0438\u0438": "5",
44
+ "\u0421\u043e\u043e\u0440\u0443\u0436\u0435\u043d\u0438\u0435": "6",
45
+ "\u0421\u0442\u0440\u043e\u0438\u0442\u0435\u043b\u044c\u043d\u0430\u044f \u043f\u043b\u043e\u0449\u0430\u0434\u043a\u0430": "14",
46
+ "\u0422\u0435\u0440\u0440\u0438\u0442\u043e\u0440\u0438\u044f \u0421\u0430\u043d\u043a\u0442-\u041f\u0435\u0442\u0435\u0440\u0431\u0443\u0440\u0433\u0430": "1",
47
+ "\u0423\u043b\u0438\u0446\u0430": "3"
48
+ },
49
+ "layer_norm_eps": 1e-12,
50
+ "max_position_embeddings": 2048,
51
+ "model_type": "bert",
52
+ "num_attention_heads": 12,
53
+ "num_hidden_layers": 3,
54
+ "pad_token_id": 0,
55
+ "position_embedding_type": "absolute",
56
+ "problem_type": "single_label_classification",
57
+ "torch_dtype": "float32",
58
+ "transformers_version": "4.27.1",
59
+ "type_vocab_size": 2,
60
+ "use_cache": true,
61
+ "vocab_size": 83828
62
+ }
logs/1693485558.788028/events.out.tfevents.1693485558.SERVER-509.10992.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb6cb7b09aaf06e4c8bfdf7ed7cde1361a082db979947403dcbb64d16cd00986
3
+ size 5763
logs/events.out.tfevents.1693485558.SERVER-509.10992.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1559af92734d39f422d7f9cb82957e9da7fa1b9c5df4b6bd1ebb2df024b85e5d
3
+ size 8456
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d0ca3452867c8545b5c06308e22c677726d3ffceabdba774e6545cb5ddf0b46
3
+ size 116828511
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7db7a83e0b3f56c5cca1280caa2cf9b46ed93e369f84ba644d49a85a45e8e092
3
+ size 3579