Upload tokenizer

Files changed (4) hide show

source.spm CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fd4e951487aed00bae6a6c2ee4ef5d8d1db05fd098b19b608046c9334b58d24d
-size 812240

 version https://git-lfs.github.com/spec/v1
+oid sha256:c4a99ea3602b29fbf901ade8b93a45efa3d7c64eab8fc5fa812383efa327a87d
+size 706917

target.spm CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f5529d3a72f8c1d5f7e357f1b6fd30e3cf58f6e1ba0401db135a118ac92f4a76
-size 1067935

 version https://git-lfs.github.com/spec/v1
+oid sha256:c6dce5fa58fcd7dde9e81e279b8c075bf42ee558278f73d6fb48e342029d7f19
+size 791194

tokenizer_config.json CHANGED Viewed

@@ -16,7 +16,7 @@
       "single_word": false,
       "special": true
     },
-    "61949": {
       "content": "<pad>",
       "lstrip": false,
       "normalized": false,
@@ -31,9 +31,9 @@
   "model_max_length": 512,
   "pad_token": "<pad>",
   "separate_vocabs": false,
-  "source_lang": "eng",
   "sp_model_kwargs": {},
-  "target_lang": "hin",
   "tokenizer_class": "MarianTokenizer",
   "unk_token": "<unk>"
 }

       "single_word": false,
       "special": true
     },
+    "64171": {
       "content": "<pad>",
       "lstrip": false,
       "normalized": false,
   "model_max_length": 512,
   "pad_token": "<pad>",
   "separate_vocabs": false,
+  "source_lang": "mul",
   "sp_model_kwargs": {},
+  "target_lang": "eng",
   "tokenizer_class": "MarianTokenizer",
   "unk_token": "<unk>"
 }

vocab.json CHANGED Viewed

The diff for this file is too large to render. See raw diff