martin0925 committed on
Commit
0399686
·
verified ·
1 Parent(s): 4d0c9bc

experiment_16 RobeCzech fine-tune

Browse files
config.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "gradient_checkpointing": false,
12
+ "hidden_act": "gelu",
13
+ "hidden_dropout_prob": 0.1,
14
+ "hidden_size": 768,
15
+ "id2label": {
16
+ "0": "majetek",
17
+ "1": "doprava",
18
+ "2": "finance_rozpocet",
19
+ "3": "skolstvi",
20
+ "4": "sport",
21
+ "5": "kultura_cestovni_ruch",
22
+ "6": "zivotni_prostredi",
23
+ "7": "socialni_oblast",
24
+ "8": "zdravotnictvi",
25
+ "9": "bydleni",
26
+ "10": "bezpecnost",
27
+ "11": "komunalni_sluzby",
28
+ "12": "uzemni_planovani",
29
+ "13": "rozvoj_verejneho_prostranstvi",
30
+ "14": "informacni_technologie",
31
+ "15": "mezinarodni_spoluprace",
32
+ "16": "legislativa_vnitrni_predpisy"
33
+ },
34
+ "initializer_range": 0.02,
35
+ "intermediate_size": 3072,
36
+ "is_decoder": false,
37
+ "label2id": {
38
+ "bezpecnost": 10,
39
+ "bydleni": 9,
40
+ "doprava": 1,
41
+ "finance_rozpocet": 2,
42
+ "informacni_technologie": 14,
43
+ "komunalni_sluzby": 11,
44
+ "kultura_cestovni_ruch": 5,
45
+ "legislativa_vnitrni_predpisy": 16,
46
+ "majetek": 0,
47
+ "mezinarodni_spoluprace": 15,
48
+ "rozvoj_verejneho_prostranstvi": 13,
49
+ "skolstvi": 3,
50
+ "socialni_oblast": 7,
51
+ "sport": 4,
52
+ "uzemni_planovani": 12,
53
+ "zdravotnictvi": 8,
54
+ "zivotni_prostredi": 6
55
+ },
56
+ "layer_norm_eps": 1e-05,
57
+ "max_position_embeddings": 514,
58
+ "model_type": "roberta",
59
+ "num_attention_heads": 12,
60
+ "num_hidden_layers": 12,
61
+ "pad_token_id": 1,
62
+ "problem_type": "multi_label_classification",
63
+ "tie_word_embeddings": true,
64
+ "transformers_version": "5.0.0",
65
+ "type_vocab_size": 1,
66
+ "use_cache": true,
67
+ "vocab_size": 51997
68
+ }
inference_config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "threshold": 0.65,
3
+ "per_class_thresholds": {
4
+ "majetek": 0.75,
5
+ "doprava": 0.8,
6
+ "finance_rozpocet": 0.7,
7
+ "skolstvi": 0.9,
8
+ "sport": 0.4,
9
+ "kultura_cestovni_ruch": 0.6,
10
+ "zivotni_prostredi": 0.6,
11
+ "socialni_oblast": 0.55,
12
+ "zdravotnictvi": 0.45,
13
+ "bydleni": 0.85,
14
+ "bezpecnost": 0.45,
15
+ "komunalni_sluzby": 0.4,
16
+ "uzemni_planovani": 0.9,
17
+ "rozvoj_verejneho_prostranstvi": 0.5,
18
+ "informacni_technologie": 0.5,
19
+ "mezinarodni_spoluprace": 0.7,
20
+ "legislativa_vnitrni_predpisy": 0.75
21
+ },
22
+ "max_length": 512,
23
+ "labels": [
24
+ "majetek",
25
+ "doprava",
26
+ "finance_rozpocet",
27
+ "skolstvi",
28
+ "sport",
29
+ "kultura_cestovni_ruch",
30
+ "zivotni_prostredi",
31
+ "socialni_oblast",
32
+ "zdravotnictvi",
33
+ "bydleni",
34
+ "bezpecnost",
35
+ "komunalni_sluzby",
36
+ "uzemni_planovani",
37
+ "rozvoj_verejneho_prostranstvi",
38
+ "informacni_technologie",
39
+ "mezinarodni_spoluprace",
40
+ "legislativa_vnitrni_predpisy"
41
+ ],
42
+ "model_name": "ufal/robeczech-base"
43
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7f733d5a08ebe032de6436fb50d18b27a9cc15cc2fb9980fd790a610719e03c
3
+ size 503979644
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": "[CLS]",
5
+ "cls_token": "[CLS]",
6
+ "eos_token": "[SEP]",
7
+ "errors": "replace",
8
+ "is_local": false,
9
+ "mask_token": "[MASK]",
10
+ "model_max_length": 512,
11
+ "pad_token": "[PAD]",
12
+ "sep_token": "[SEP]",
13
+ "tokenizer_class": "RobertaTokenizer",
14
+ "trim_offsets": true,
15
+ "unk_token": "[UNK]"
16
+ }