m2im committed on
Commit
822073e
·
1 Parent(s): d8cbe80

uploading tokenizer

Browse files
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ *.json filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -1,42 +1,3 @@
1
- {
2
- "_name_or_path": "setu4993/LaBSE",
3
- "architectures": [
4
- "BertForSequenceClassification"
5
- ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
- "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.1,
10
- "hidden_size": 768,
11
- "id2label": {
12
- "0": "post7geo10",
13
- "1": "post7geo30",
14
- "2": "post7geo50",
15
- "3": "pre7geo10",
16
- "4": "pre7geo30",
17
- "5": "pre7geo50"
18
- },
19
- "initializer_range": 0.02,
20
- "intermediate_size": 3072,
21
- "label2id": {
22
- "post7geo10": 0,
23
- "post7geo30": 1,
24
- "post7geo50": 2,
25
- "pre7geo10": 3,
26
- "pre7geo30": 4,
27
- "pre7geo50": 5
28
- },
29
- "layer_norm_eps": 1e-12,
30
- "max_position_embeddings": 512,
31
- "model_type": "bert",
32
- "num_attention_heads": 12,
33
- "num_hidden_layers": 12,
34
- "pad_token_id": 0,
35
- "position_embedding_type": "absolute",
36
- "problem_type": "multi_label_classification",
37
- "torch_dtype": "float32",
38
- "transformers_version": "4.19.0",
39
- "type_vocab_size": 2,
40
- "use_cache": true,
41
- "vocab_size": 501153
42
- }
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6667bb3551c88cd213f25fd910f1125c93b0c8b1434c0b8747592b5a86263e52
3
+ size 987
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
special_tokens_map.json CHANGED
@@ -1 +1,3 @@
1
- {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:303df45a03609e4ead04bc3dc1536d0ab19b5358db685b6f3da123d05ec200e3
3
+ size 112
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09216b42d2697b7b4a26ac05ff09ba8bf52dc19b896c5ceee8bbff9f39055322
3
+ size 13631919
tokenizer_config.json CHANGED
@@ -1 +1,3 @@
1
- {"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "clean_up_tokenization_spaces": true, "do_basic_tokenize": true, "model_max_length": 32, "never_split": null, "special_tokens_map_file": "/home/mmendieta/.cache/huggingface/transformers/f7976973d6e1d492e81cc7e3f495661fffb63be89dd6889a1f1b32911095fbbc.7da70648c6cb9951e284c9685f9ba7ae083dd59ed1d6d84bdfc0584a4ea94b6d", "name_or_path": "setu4993/LaBSE", "tokenizer_class": "BertTokenizer"}
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccdb87e6f0f8c02e3494fdb8e48f904bf7f73620581a98021e01d20ca1e17e81
3
+ size 579