Commit 7fdceaa · verified · 1 Parent(s): 6f9a5be · committed by 5cean

Training in progress, epoch 1

.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
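This new rule tells Git LFS to store tokenizer.json as a pointer file, which matters here because the XLM-R tokenizer.json is too large for plain git (its diff below is even too large to render). For reference, a sketch of how such an entry is usually added, assuming Git LFS is installed:

git lfs track "tokenizer.json"    # appends the filter=lfs rule to .gitattributes
git add .gitattributes tokenizer.json
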
config.json CHANGED
@@ -1,7 +1,7 @@
 {
-  "_name_or_path": "openai-community/roberta-large-openai-detector",
+  "_name_or_path": "FacebookAI/xlm-roberta-large",
   "architectures": [
-    "RobertaForSequenceClassification"
+    "XLMRobertaForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
   "bos_token_id": 0,
@@ -22,7 +22,7 @@
   },
   "layer_norm_eps": 1e-05,
   "max_position_embeddings": 514,
-  "model_type": "roberta",
+  "model_type": "xlm-roberta",
   "num_attention_heads": 16,
   "num_hidden_layers": 24,
   "output_past": true,
@@ -33,5 +33,5 @@
   "transformers_version": "4.43.2",
   "type_vocab_size": 1,
   "use_cache": true,
-  "vocab_size": 50265
+  "vocab_size": 250002
 }
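
The config diff swaps the base checkpoint from the monolingual openai-community/roberta-large-openai-detector to the multilingual FacebookAI/xlm-roberta-large; the vocab_size jump from 50265 to 250002 follows directly from XLM-R's larger SentencePiece vocabulary. A minimal sketch of how a config like the new one is produced with transformers (num_labels and the output path are assumptions, not recorded in this commit):

from transformers import AutoModelForSequenceClassification, AutoTokenizer

# Loading the new base checkpoint yields "model_type": "xlm-roberta" and
# "vocab_size": 250002 in the saved config.json.
model = AutoModelForSequenceClassification.from_pretrained(
    "FacebookAI/xlm-roberta-large",
    num_labels=2,  # assumed binary classification head; the label map isn't in this diff
)
tokenizer = AutoTokenizer.from_pretrained("FacebookAI/xlm-roberta-large")

model.save_pretrained("checkpoint")      # writes config.json + model.safetensors
tokenizer.save_pretrained("checkpoint")  # writes tokenizer.json, tokenizer_config.json,
                                         # and sentencepiece.bpe.model
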
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d855d2746523a2c7026633446b5ebdf9cee3fabee761823f84cddfbc884c39bf
-size 1421495416
+oid sha256:2c2678b4f9212e27289a940b561106d3a93bba9686853ca536d78aefff55afde
+size 2239618672
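
Only this pointer lives in the git history; the actual weights (about 2.2 GB now, up from 1.4 GB, consistent with the much larger embedding matrix) sit in LFS storage. A sketch for verifying a downloaded file against the pointer's oid (the local path is an assumption):

import hashlib

def sha256_of(path: str, chunk_size: int = 1 << 20) -> str:
    # Stream in 1 MiB chunks so a multi-GB checkpoint never has to fit in memory.
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(chunk_size), b""):
            h.update(chunk)
    return h.hexdigest()

expected = "2c2678b4f9212e27289a940b561106d3a93bba9686853ca536d78aefff55afde"
assert sha256_of("model.safetensors") == expected
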
runs/Jul26_16-08-17_gpu-1/events.out.tfevents.1721977699.gpu-1.291149.10 CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1266a8e5ae6fafd7f5595549c7d29a5f5d7294c50e09d1d90d8305f378525a30
-size 14274
+oid sha256:bfb977544072b9358b9b812b1c8ebb6d52a3a59b64c56b15940dff7215120844
+size 14489
runs/Jul26_16-50-11_gpu-1/events.out.tfevents.1721980212.gpu-1.291149.11 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b139d68272594a4eaaf9c0b1a151a5c4caadf12c0659819a307cf55329dc6eb7
+size 6526
runs/Jul26_16-57-31_gpu-1/events.out.tfevents.1721980652.gpu-1.291149.12 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72e8ac1eefda7f93e8e9d166471cd56affffb7958002ea7c33acad3253dd64a4
+size 6425
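
The tfevents files under runs/ are TensorBoard event logs, one per Trainer run (the three entries in this commit correspond to the three run timestamps above). A sketch for reading the logged scalars with TensorBoard's Python API, assuming the LFS content has been pulled (the exact tag names depend on the Trainer version):

from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

acc = EventAccumulator("runs/Jul26_16-57-31_gpu-1")  # point at one run directory
acc.Reload()                                         # parse the tfevents file(s)
for tag in acc.Tags()["scalars"]:                    # e.g. train/loss, eval/loss
    for event in acc.Scalars(tag):
        print(tag, event.step, event.value)
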
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
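
sentencepiece.bpe.model is the raw SentencePiece model that the XLM-RoBERTa (slow) tokenizer wraps; it is new in this commit because the previous RoBERTa tokenizer used byte-level BPE and had no SentencePiece model. A sketch of loading it directly, assuming the sentencepiece package and a pulled LFS file:

import sentencepiece as spm

sp = spm.SentencePieceProcessor(model_file="sentencepiece.bpe.model")
print(sp.get_piece_size())                     # raw piece count; transformers layers
                                               # <mask> etc. on top to reach 250002
print(sp.encode("Hello world", out_type=str))  # subword pieces for a sample string
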
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,10 +1,9 @@
 {
-  "add_prefix_space": false,
   "added_tokens_decoder": {
     "0": {
       "content": "<s>",
       "lstrip": false,
-      "normalized": true,
+      "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -12,7 +11,7 @@
     "1": {
       "content": "<pad>",
       "lstrip": false,
-      "normalized": true,
+      "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -20,7 +19,7 @@
     "2": {
       "content": "</s>",
       "lstrip": false,
-      "normalized": true,
+      "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -28,12 +27,12 @@
     "3": {
       "content": "<unk>",
       "lstrip": false,
-      "normalized": true,
+      "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "50264": {
+    "250001": {
       "content": "<mask>",
       "lstrip": true,
       "normalized": false,
@@ -46,12 +45,10 @@
   "clean_up_tokenization_spaces": true,
   "cls_token": "<s>",
   "eos_token": "</s>",
-  "errors": "replace",
   "mask_token": "<mask>",
   "model_max_length": 512,
   "pad_token": "<pad>",
   "sep_token": "</s>",
-  "tokenizer_class": "RobertaTokenizer",
-  "trim_offsets": true,
+  "tokenizer_class": "XLMRobertaTokenizer",
   "unk_token": "<unk>"
 }
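
Besides moving <mask> from id 50264 to 250001, the diff drops RoBERTa-only keys (add_prefix_space, errors, trim_offsets) and switches tokenizer_class to XLMRobertaTokenizer. A sketch for sanity-checking the result after cloning this repo (the local path is an assumption):

from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("path/to/this/repo")
print(type(tok).__name__)                 # XLMRobertaTokenizerFast (tokenizer.json present)
print(tok.mask_token, tok.mask_token_id)  # "<mask>" 250001, matching the new config
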
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e26cb814a19e202afbfef494284645653d4b7b8be778f34870aa056dda4afcfc
+oid sha256:ed320209ba66f70704744e48d436e6770776deb8fe3b24459964229ae7724e76
 size 5176
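
training_args.bin is the pickled TrainingArguments object the Trainer saves alongside checkpoints; the size is unchanged at 5176 bytes while the hash differs, so only field values changed between runs. A sketch of inspecting it, assuming torch and transformers are installed:

import torch

# weights_only=False because this is a pickled Python object, not a tensor
# checkpoint; only unpickle files from sources you trust.
args = torch.load("training_args.bin", weights_only=False)
print(args.learning_rate, args.num_train_epochs, args.per_device_train_batch_size)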