mk9165 committed on
Commit
7648eac
·
1 Parent(s): e1ba831

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,11 +1,12 @@
1
  {
2
- "_name_or_path": "skt/kobert-base-v1",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
- "author": "Heewon Jeon(madjakarta@gmail.com)",
8
  "classifier_dropout": null,
 
 
9
  "gradient_checkpointing": false,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
@@ -18,7 +19,6 @@
18
  },
19
  "initializer_range": 0.02,
20
  "intermediate_size": 3072,
21
- "kobert_version": 1.0,
22
  "label2id": {
23
  "LABEL_0": 0,
24
  "LABEL_1": 1,
@@ -30,12 +30,17 @@
30
  "model_type": "bert",
31
  "num_attention_heads": 12,
32
  "num_hidden_layers": 12,
33
- "pad_token_id": 1,
 
 
 
 
 
34
  "position_embedding_type": "absolute",
35
  "problem_type": "single_label_classification",
36
  "torch_dtype": "float32",
37
  "transformers_version": "4.26.1",
38
  "type_vocab_size": 2,
39
  "use_cache": true,
40
- "vocab_size": 8002
41
  }
 
1
  {
2
+ "_name_or_path": "kykim/bert-kor-base",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
 
7
  "classifier_dropout": null,
8
+ "directionality": "bidi",
9
+ "embedding_size": 768,
10
  "gradient_checkpointing": false,
11
  "hidden_act": "gelu",
12
  "hidden_dropout_prob": 0.1,
 
19
  },
20
  "initializer_range": 0.02,
21
  "intermediate_size": 3072,
 
22
  "label2id": {
23
  "LABEL_0": 0,
24
  "LABEL_1": 1,
 
30
  "model_type": "bert",
31
  "num_attention_heads": 12,
32
  "num_hidden_layers": 12,
33
+ "pad_token_id": 0,
34
+ "pooler_fc_size": 768,
35
+ "pooler_num_attention_heads": 12,
36
+ "pooler_num_fc_layers": 3,
37
+ "pooler_size_per_head": 128,
38
+ "pooler_type": "first_token_transform",
39
  "position_embedding_type": "absolute",
40
  "problem_type": "single_label_classification",
41
  "torch_dtype": "float32",
42
  "transformers_version": "4.26.1",
43
  "type_vocab_size": 2,
44
  "use_cache": true,
45
+ "vocab_size": 42000
46
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c77ff64ab58f7c25ee5d56de2d97f8140cc98f8063451e10220324f48b6918d1
3
- size 368832629
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ee21002121deb86cb70c57c00663836b9449c691660f1ac546eabf5ed3a5f5b
3
+ size 473274485
runs/Feb15_03-23-13_b575e53afbdf/1676431496.033246/events.out.tfevents.1676431496.b575e53afbdf.353.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76ddd2dc5d42573583312276204d9f6fd2043306e86e9f927f77e9c9fbbf6d31
3
+ size 5736
runs/Feb15_03-23-13_b575e53afbdf/events.out.tfevents.1676431496.b575e53afbdf.353.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aced1a9872d9cef2beee4928eceb73e6a5ae5b5c1cf8a6ad720f10e43dc9dbac
3
+ size 4136
special_tokens_map.json CHANGED
@@ -1,14 +1,6 @@
1
  {
2
- "bos_token": "[CLS]",
3
  "cls_token": "[CLS]",
4
- "eos_token": "[SEP]",
5
- "mask_token": {
6
- "content": "[MASK]",
7
- "lstrip": true,
8
- "normalized": true,
9
- "rstrip": false,
10
- "single_word": false
11
- },
12
  "pad_token": "[PAD]",
13
  "sep_token": "[SEP]",
14
  "unk_token": "[UNK]"
 
1
  {
 
2
  "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
 
 
 
 
 
 
 
4
  "pad_token": "[PAD]",
5
  "sep_token": "[SEP]",
6
  "unk_token": "[UNK]"
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,25 +1,16 @@
1
  {
2
- "additional_special_tokens": null,
3
- "bos_token": "[CLS]",
4
  "cls_token": "[CLS]",
5
- "do_lower_case": false,
6
- "eos_token": "[SEP]",
7
- "keep_accents": false,
8
- "mask_token": {
9
- "__type": "AddedToken",
10
- "content": "[MASK]",
11
- "lstrip": true,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "model_max_length": 1000000000000000019884624838656,
17
- "name_or_path": "skt/kobert-base-v1",
18
  "pad_token": "[PAD]",
19
- "remove_space": true,
20
  "sep_token": "[SEP]",
21
- "sp_model_kwargs": {},
22
- "special_tokens_map_file": "/root/.cache/huggingface/hub/models--skt--kobert-base-v1/snapshots/a9f5849fce18fb088f0cd0f9b29ec3f756958464/special_tokens_map.json",
23
- "tokenizer_class": "KoBERTTokenizer",
 
24
  "unk_token": "[UNK]"
25
  }
 
1
  {
 
 
2
  "cls_token": "[CLS]",
3
+ "do_basic_tokenize": true,
4
+ "do_lower_case": true,
5
+ "mask_token": "[MASK]",
6
+ "model_max_length": 512,
7
+ "name_or_path": "kykim/bert-kor-base",
8
+ "never_split": null,
 
 
 
 
 
 
 
9
  "pad_token": "[PAD]",
 
10
  "sep_token": "[SEP]",
11
+ "special_tokens_map_file": null,
12
+ "strip_accents": false,
13
+ "tokenize_chinese_chars": true,
14
+ "tokenizer_class": "BertTokenizer",
15
  "unk_token": "[UNK]"
16
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:797d791fe18cf9a081593e58d3ded7a5f2b7b7feb414a9d2566510a0d6ab48e7
3
  size 3515
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:600a3ef1dce93da4a1978d5696118a7a5110b6593a70a2f81bc5e0e1cfe7526c
3
  size 3515
vocab.txt ADDED
The diff for this file is too large to render. See raw diff