5cean committed on
Commit
bacc8bb
·
verified ·
1 Parent(s): 7fdceaa

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "_name_or_path": "FacebookAI/xlm-roberta-large",
3
  "architectures": [
4
- "XLMRobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": 0,
@@ -9,23 +9,22 @@
9
  "eos_token_id": 2,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
- "hidden_size": 1024,
13
  "id2label": {
14
  "0": "hall",
15
  "1": "business"
16
  },
17
  "initializer_range": 0.02,
18
- "intermediate_size": 4096,
19
  "label2id": {
20
  "business": 1,
21
  "hall": 0
22
  },
23
  "layer_norm_eps": 1e-05,
24
  "max_position_embeddings": 514,
25
- "model_type": "xlm-roberta",
26
- "num_attention_heads": 16,
27
- "num_hidden_layers": 24,
28
- "output_past": true,
29
  "pad_token_id": 1,
30
  "position_embedding_type": "absolute",
31
  "problem_type": "single_label_classification",
@@ -33,5 +32,5 @@
33
  "transformers_version": "4.43.2",
34
  "type_vocab_size": 1,
35
  "use_cache": true,
36
- "vocab_size": 250002
37
  }
 
1
  {
2
+ "_name_or_path": "distilbert/distilroberta-base",
3
  "architectures": [
4
+ "RobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": 0,
 
9
  "eos_token_id": 2,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
  "id2label": {
14
  "0": "hall",
15
  "1": "business"
16
  },
17
  "initializer_range": 0.02,
18
+ "intermediate_size": 3072,
19
  "label2id": {
20
  "business": 1,
21
  "hall": 0
22
  },
23
  "layer_norm_eps": 1e-05,
24
  "max_position_embeddings": 514,
25
+ "model_type": "roberta",
26
+ "num_attention_heads": 12,
27
+ "num_hidden_layers": 6,
 
28
  "pad_token_id": 1,
29
  "position_embedding_type": "absolute",
30
  "problem_type": "single_label_classification",
 
32
  "transformers_version": "4.43.2",
33
  "type_vocab_size": 1,
34
  "use_cache": true,
35
+ "vocab_size": 50265
36
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c2678b4f9212e27289a940b561106d3a93bba9686853ca536d78aefff55afde
3
- size 2239618672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77508accc1699218c917154379967adff870374d50dd8abd8bcad78ec04d66ff
3
+ size 328492280
runs/Jul26_16-57-31_gpu-1/events.out.tfevents.1721980652.gpu-1.291149.12 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72e8ac1eefda7f93e8e9d166471cd56affffb7958002ea7c33acad3253dd64a4
3
- size 6425
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a8381b614d39c6ed2ab34e81804027f21c1d95b630b510324ff7959cfea8b29
3
+ size 6636
runs/Jul26_17-11-56_gpu-1/events.out.tfevents.1721981518.gpu-1.291149.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7361988305c1a803a6d584a34067d4f5c191aff6c9424d99a6b616626a3306cf
3
+ size 6394
runs/Jul26_17-13-53_gpu-1/events.out.tfevents.1721981634.gpu-1.291149.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f90b38023f8578f3fe07aee8b9a3b24db627d2c8f882b70a53d002afc2f52cfa
3
+ size 6486
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:883b037111086fd4dfebbbc9b7cee11e1517b5e0c0514879478661440f137085
3
- size 17082987
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8d6b8f1c0016535793387df8c2f39ab70e15a00237af3dae658fe7e0ce2378c
3
+ size 2108896
tokenizer_config.json CHANGED
@@ -1,9 +1,10 @@
1
  {
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<s>",
5
  "lstrip": false,
6
- "normalized": false,
7
  "rstrip": false,
8
  "single_word": false,
9
  "special": true
@@ -11,7 +12,7 @@
11
  "1": {
12
  "content": "<pad>",
13
  "lstrip": false,
14
- "normalized": false,
15
  "rstrip": false,
16
  "single_word": false,
17
  "special": true
@@ -19,7 +20,7 @@
19
  "2": {
20
  "content": "</s>",
21
  "lstrip": false,
22
- "normalized": false,
23
  "rstrip": false,
24
  "single_word": false,
25
  "special": true
@@ -27,12 +28,12 @@
27
  "3": {
28
  "content": "<unk>",
29
  "lstrip": false,
30
- "normalized": false,
31
  "rstrip": false,
32
  "single_word": false,
33
  "special": true
34
  },
35
- "250001": {
36
  "content": "<mask>",
37
  "lstrip": true,
38
  "normalized": false,
@@ -45,10 +46,12 @@
45
  "clean_up_tokenization_spaces": true,
46
  "cls_token": "<s>",
47
  "eos_token": "</s>",
 
48
  "mask_token": "<mask>",
49
  "model_max_length": 512,
50
  "pad_token": "<pad>",
51
  "sep_token": "</s>",
52
- "tokenizer_class": "XLMRobertaTokenizer",
 
53
  "unk_token": "<unk>"
54
  }
 
1
  {
2
+ "add_prefix_space": false,
3
  "added_tokens_decoder": {
4
  "0": {
5
  "content": "<s>",
6
  "lstrip": false,
7
+ "normalized": true,
8
  "rstrip": false,
9
  "single_word": false,
10
  "special": true
 
12
  "1": {
13
  "content": "<pad>",
14
  "lstrip": false,
15
+ "normalized": true,
16
  "rstrip": false,
17
  "single_word": false,
18
  "special": true
 
20
  "2": {
21
  "content": "</s>",
22
  "lstrip": false,
23
+ "normalized": true,
24
  "rstrip": false,
25
  "single_word": false,
26
  "special": true
 
28
  "3": {
29
  "content": "<unk>",
30
  "lstrip": false,
31
+ "normalized": true,
32
  "rstrip": false,
33
  "single_word": false,
34
  "special": true
35
  },
36
+ "50264": {
37
  "content": "<mask>",
38
  "lstrip": true,
39
  "normalized": false,
 
46
  "clean_up_tokenization_spaces": true,
47
  "cls_token": "<s>",
48
  "eos_token": "</s>",
49
+ "errors": "replace",
50
  "mask_token": "<mask>",
51
  "model_max_length": 512,
52
  "pad_token": "<pad>",
53
  "sep_token": "</s>",
54
+ "tokenizer_class": "RobertaTokenizer",
55
+ "trim_offsets": true,
56
  "unk_token": "<unk>"
57
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed320209ba66f70704744e48d436e6770776deb8fe3b24459964229ae7724e76
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b13e0db57b5c8808139a4348604775e5765a0607f454b6c66d0b2b83e74e191
3
  size 5176