teru00801 commited on
Commit
47a5778
·
verified ·
1 Parent(s): 2ac5bca

Upload folder using huggingface_hub

Browse files
base_model/.DS_Store ADDED
Binary file (6.15 kB). View file
 
base_model/.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
base_model/config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DebertaV2ForMaskedLM"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "bos_token_id": 96871,
7
+ "dtype": "float32",
8
+ "eos_token_id": 96868,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-07,
15
+ "legacy": true,
16
+ "max_position_embeddings": 512,
17
+ "max_relative_positions": -1,
18
+ "model_type": "deberta-v2",
19
+ "norm_rel_ebd": "layer_norm",
20
+ "num_attention_heads": 12,
21
+ "num_hidden_layers": 12,
22
+ "pad_token_id": 96869,
23
+ "pooler_dropout": 0,
24
+ "pooler_hidden_act": "gelu",
25
+ "pooler_hidden_size": 768,
26
+ "pos_att_type": [
27
+ "p2c",
28
+ "c2p"
29
+ ],
30
+ "position_biased_input": false,
31
+ "position_buckets": 256,
32
+ "relative_attention": true,
33
+ "share_att_key": true,
34
+ "transformers_version": "4.57.3",
35
+ "type_vocab_size": 0,
36
+ "use_cache": false,
37
+ "vocab_size": 96900
38
+ }
base_model/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7405eb902f13104f959d441ab69dfdef44dd761cb7afa7e1f68c33cfeebdeca3
3
+ size 642260656
base_model/special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "[CLS]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "[SEP]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "[MASK]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "[PAD]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "[SEP]",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "[UNK]",
46
+ "lstrip": false,
47
+ "normalized": true,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
base_model/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
base_model/tokenizer_config.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "96867": {
4
+ "content": "[MASK]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "96868": {
12
+ "content": "[SEP]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "96869": {
20
+ "content": "[PAD]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "96870": {
28
+ "content": "[UNK]",
29
+ "lstrip": false,
30
+ "normalized": true,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "96871": {
36
+ "content": "[CLS]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "bos_token": "[CLS]",
45
+ "clean_up_tokenization_spaces": false,
46
+ "cls_token": "[CLS]",
47
+ "do_lower_case": false,
48
+ "eos_token": "[SEP]",
49
+ "extra_special_tokens": {},
50
+ "keep_accents": true,
51
+ "mask_token": "[MASK]",
52
+ "model_max_length": 1000000000000000019884624838656,
53
+ "pad_token": "[PAD]",
54
+ "sep_token": "[SEP]",
55
+ "sp_model_kwargs": {},
56
+ "split_by_punct": false,
57
+ "tokenizer_class": "DebertaV2Tokenizer",
58
+ "unk_token": "[UNK]"
59
+ }
base_model/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61f62848675760897c3d02bd6e8686ab5e4e122e4fa061eeaf3cc74f603b3ef0
3
+ size 5905
best_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:513c713b88290668d27bed3f705e1b95f9c26c0446a81dd3acb53ef47b38a779
3
+ size 639695148
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_dir": "models/deberta_v3_mlm",
3
+ "task1_csv": "Data_for_deberta/processed/task1_ready/train.csv",
4
+ "task2_csv": "Data_for_deberta/processed/task2_ready/train.csv",
5
+ "output_dir": "outputs/train_runs",
6
+ "max_length": 384,
7
+ "val_ratio": 0.1,
8
+ "seed": 42,
9
+ "batch_size": 16,
10
+ "max_epochs": 10,
11
+ "min_epochs": 3,
12
+ "early_stop_patience": 2,
13
+ "learning_rate": 1.5e-05,
14
+ "weight_decay": 0.01,
15
+ "warmup_ratio": 0.06,
16
+ "boost_mult": 1.0,
17
+ "focal_gamma_task1": 0.0,
18
+ "rdrop_alpha_task2": 0.7,
19
+ "lambda_task1": 1.0,
20
+ "lambda_task2": 1.0,
21
+ "label_smoothing_task1": 0.02,
22
+ "label_smoothing_task2": 0.05,
23
+ "task2_balance_power": 0.5,
24
+ "task2_balance_min": 0.2,
25
+ "task2_balance_max": 5.0,
26
+ "title_empty_token": "[TITLE_EMPTY]",
27
+ "use_amp": true,
28
+ "cartography": true,
29
+ "cartography_lowmean_q": 0.005,
30
+ "cartography_task2_per_category_cap": 30
31
+ }
label_map.json ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "CSR活動": 0,
3
+ "DX": 1,
4
+ "M&A": 2,
5
+ "イベント": 3,
6
+ "サイバー攻撃": 4,
7
+ "システム障害": 5,
8
+ "ダイバーシティ": 6,
9
+ "ハラスメント問題": 7,
10
+ "リニューアルオープン": 8,
11
+ "不法就労": 9,
12
+ "不適切広告": 10,
13
+ "不適切発言": 11,
14
+ "事故": 12,
15
+ "事業効率化": 13,
16
+ "事業縮小": 14,
17
+ "人事異動": 15,
18
+ "人材育成": 16,
19
+ "代表者死亡": 17,
20
+ "企業間トラブル": 18,
21
+ "企業間取引解消": 19,
22
+ "価格変更": 20,
23
+ "債務超過": 21,
24
+ "債権回収不能": 22,
25
+ "債権譲渡": 23,
26
+ "公害": 24,
27
+ "再建型倒産": 25,
28
+ "労働争議": 26,
29
+ "労働災害": 27,
30
+ "労働者の自殺・失踪": 28,
31
+ "反社会的勢力関与": 29,
32
+ "受賞": 30,
33
+ "品質管理不正": 31,
34
+ "商品表示の不備": 32,
35
+ "広報活動": 33,
36
+ "役員変更": 34,
37
+ "従業員の不祥事": 35,
38
+ "従業員数減少": 36,
39
+ "情報漏洩": 37,
40
+ "批判的投稿": 38,
41
+ "提携": 39,
42
+ "新商品の展開": 40,
43
+ "新工場竣工": 41,
44
+ "新店舗開店": 42,
45
+ "新施設開設": 43,
46
+ "新規事業参入": 44,
47
+ "新規採用": 45,
48
+ "新設備導入": 46,
49
+ "本社住所移転": 47,
50
+ "株主変更": 48,
51
+ "株主総会開催": 49,
52
+ "株式保有率変更": 50,
53
+ "株式公開": 51,
54
+ "業績悪化": 52,
55
+ "業績改善": 53,
56
+ "横領": 54,
57
+ "海外進出": 55,
58
+ "清算型倒産": 56,
59
+ "特許取得": 57,
60
+ "生産停止": 58,
61
+ "生産再開": 59,
62
+ "生産拡大": 60,
63
+ "異物混入": 61,
64
+ "知的財産権の侵害": 62,
65
+ "研究開発": 63,
66
+ "社名変更": 64,
67
+ "税務違反": 65,
68
+ "粉飾決算": 66,
69
+ "組織体制変更": 67,
70
+ "経営計画": 68,
71
+ "職場環境改善": 69,
72
+ "行政処分": 70,
73
+ "補助金獲得": 71,
74
+ "設備投資": 72,
75
+ "訴訟": 73,
76
+ "詐欺": 74,
77
+ "認定取得": 75,
78
+ "談合": 76,
79
+ "販路拡大": 77,
80
+ "賃上げ": 78,
81
+ "賃金未払い": 79,
82
+ "資本金の変更": 80,
83
+ "資金調達": 81,
84
+ "贈収賄": 82,
85
+ "通信障害": 83,
86
+ "逮捕": 84,
87
+ "違法残業": 85,
88
+ "顧客トラブル": 86
89
+ }
selected_b_trial.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sweep_dir": "outputs/train_runs/sweep_20260207_073651",
3
+ "best_trial_dir": "outputs/train_runs/sweep_20260207_073651/trial_02_B_gamma0.0_rdrop0.7",
4
+ "model_path": "outputs/train_runs/sweep_20260207_073651/best_model.pt",
5
+ "config_path": "outputs/train_runs/sweep_20260207_073651/best_config.json",
6
+ "label_map_path": "outputs/train_runs/sweep_20260207_073651/trial_02_B_gamma0.0_rdrop0.7/label_map.json",
7
+ "selected": {
8
+ "source": "summary.csv",
9
+ "row": {
10
+ "stage": "B",
11
+ "trial": "2",
12
+ "learning_rate": "1.5e-05",
13
+ "boost_mult": "1.0",
14
+ "focal_gamma_task1": "0.0",
15
+ "rdrop_alpha_task2": "0.7",
16
+ "task1_acc_task1only": "0.8830057070386811",
17
+ "task1_acc": "0.8830057070386811",
18
+ "task2_acc": "0.865073787772312",
19
+ "score": "1.7480794948109932",
20
+ "epoch": "4"
21
+ }
22
+ }
23
+ }
summary.csv ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ stage,trial,learning_rate,boost_mult,focal_gamma_task1,rdrop_alpha_task2,task1_acc_task1only,task1_acc,task2_acc,score,epoch
2
+ B,1,1.5e-05,1.0,0.0,0.3,0.8880786303107165,0.8880786303107165,0.8531271960646521,1.7412058263753687,2
3
+ B,2,1.5e-05,1.0,0.0,0.7,0.8830057070386811,0.8830057070386811,0.865073787772312,1.7480794948109932,4
4
+ B,3,1.5e-05,1.0,1.0,0.3,0.8822130627774255,0.8822130627774255,0.8657765284609978,1.7479895912384233,2
5
+ B,4,1.5e-05,1.0,1.0,0.7,0.8836398224476855,0.8836398224476855,0.8636683063949403,1.7473081288426258,2
6
+ B,5,1.5e-05,1.0,2.0,0.3,0.8731769181991123,0.8731769181991123,0.8699929725931131,1.7431698907922253,4
7
+ B,6,1.5e-05,1.0,2.0,0.7,0.8746036778693722,0.8746036778693722,0.8552354181307098,1.729839096000082,2