dbaezaj committed on
Commit
e439a36
·
1 Parent(s): 53863c2

Upload folder using huggingface_hub

Browse files
Files changed (4)
  1. config.json +2 -2
  2. model.safetensors +2 -2
  3. tokenizer.json +36 -0
  4. tokenizer_config.json +32 -3
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "pysentimiento/robertuito-base-uncased",
3
  "architectures": [
4
  "RobertaForSequenceClassification"
5
  ],
@@ -47,5 +47,5 @@
47
  "transformers_version": "4.35.0",
48
  "type_vocab_size": 1,
49
  "use_cache": true,
50
- "vocab_size": 30000
51
  }
 
1
  {
2
+ "_name_or_path": "pysentimiento/robertuito-ner",
3
  "architectures": [
4
  "RobertaForSequenceClassification"
5
  ],
 
47
  "transformers_version": "4.35.0",
48
  "type_vocab_size": 1,
49
  "use_cache": true,
50
+ "vocab_size": 30002
51
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6eb56fd098879c2ef9ebec33dc23b7cc234ea24b7ff9dd6fd2882e1842de6e6
3
- size 435200612
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab54d6899b07bd7210c0be351e0eaf19efa6b89c66f257fe644a3763c0009db
3
+ size 435206756
tokenizer.json CHANGED
@@ -52,6 +52,42 @@
52
  "rstrip": false,
53
  "normalized": false,
54
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  }
56
  ],
57
  "normalizer": {
 
52
  "rstrip": false,
53
  "normalized": false,
54
  "special": true
55
+ },
56
+ {
57
+ "id": 430,
58
+ "content": "@usuario",
59
+ "single_word": false,
60
+ "lstrip": false,
61
+ "rstrip": false,
62
+ "normalized": true,
63
+ "special": false
64
+ },
65
+ {
66
+ "id": 27394,
67
+ "content": "url",
68
+ "single_word": false,
69
+ "lstrip": false,
70
+ "rstrip": false,
71
+ "normalized": true,
72
+ "special": false
73
+ },
74
+ {
75
+ "id": 30000,
76
+ "content": "hashtag",
77
+ "single_word": false,
78
+ "lstrip": false,
79
+ "rstrip": false,
80
+ "normalized": true,
81
+ "special": false
82
+ },
83
+ {
84
+ "id": 30001,
85
+ "content": "emoji",
86
+ "single_word": false,
87
+ "lstrip": false,
88
+ "rstrip": false,
89
+ "normalized": true,
90
+ "special": false
91
  }
92
  ],
93
  "normalizer": {
tokenizer_config.json CHANGED
@@ -39,6 +39,38 @@
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  }
43
  },
44
  "bos_token": "<s>",
@@ -48,10 +80,7 @@
48
  "mask_token": "<mask>",
49
  "max_length": 128,
50
  "model_max_length": 128,
51
- "pad_to_multiple_of": null,
52
  "pad_token": "<pad>",
53
- "pad_token_type_id": 0,
54
- "padding_side": "right",
55
  "sep_token": "</s>",
56
  "stride": 0,
57
  "tokenizer_class": "PreTrainedTokenizerFast",
 
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
42
+ },
43
+ "430": {
44
+ "content": "@usuario",
45
+ "lstrip": false,
46
+ "normalized": true,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": false
50
+ },
51
+ "27394": {
52
+ "content": "url",
53
+ "lstrip": false,
54
+ "normalized": true,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": false
58
+ },
59
+ "30000": {
60
+ "content": "hashtag",
61
+ "lstrip": false,
62
+ "normalized": true,
63
+ "rstrip": false,
64
+ "single_word": false,
65
+ "special": false
66
+ },
67
+ "30001": {
68
+ "content": "emoji",
69
+ "lstrip": false,
70
+ "normalized": true,
71
+ "rstrip": false,
72
+ "single_word": false,
73
+ "special": false
74
  }
75
  },
76
  "bos_token": "<s>",
 
80
  "mask_token": "<mask>",
81
  "max_length": 128,
82
  "model_max_length": 128,
 
83
  "pad_token": "<pad>",
 
 
84
  "sep_token": "</s>",
85
  "stride": 0,
86
  "tokenizer_class": "PreTrainedTokenizerFast",