MarketBERT_v2 / tokenizer.json
HamidBekam's picture
Upload folder using huggingface_hub
05789b7 verified
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [],
"normalizer": null,
"pre_tokenizer": {
"type": "Whitespace"
},
"post_processor": null,
"decoder": null,
"model": {
"type": "WordLevel",
"vocab": {
"[PAD]": 0,
"[UNK]": 1,
"[CLS]": 2,
"[SEP]": 3,
"[MASK]": 4,
"YEAR_1996": 5,
"YEAR_1997": 6,
"YEAR_1998": 7,
"YEAR_1999": 8,
"YEAR_2000": 9,
"YEAR_2001": 10,
"YEAR_2002": 11,
"YEAR_2003": 12,
"YEAR_2004": 13,
"YEAR_2005": 14,
"YEAR_2006": 15,
"YEAR_2007": 16,
"YEAR_2008": 17,
"YEAR_2009": 18,
"YEAR_2010": 19,
"YEAR_2011": 20,
"YEAR_2012": 21,
"YEAR_2013": 22,
"YEAR_2014": 23,
"YEAR_2015": 24,
"YEAR_2016": 25,
"YEAR_2017": 26,
"YEAR_2018": 27,
"YEAR_2019": 28,
"YEAR_2020": 29,
"YEAR_2021": 30,
"NICE_01": 31,
"NICE_02": 32,
"NICE_03": 33,
"NICE_04": 34,
"NICE_05": 35,
"NICE_06": 36,
"NICE_07": 37,
"NICE_08": 38,
"NICE_09": 39,
"NICE_10": 40,
"NICE_11": 41,
"NICE_12": 42,
"NICE_13": 43,
"NICE_14": 44,
"NICE_15": 45,
"NICE_16": 46,
"NICE_17": 47,
"NICE_18": 48,
"NICE_19": 49,
"NICE_20": 50,
"NICE_21": 51,
"NICE_22": 52,
"NICE_23": 53,
"NICE_24": 54,
"NICE_25": 55,
"NICE_26": 56,
"NICE_27": 57,
"NICE_28": 58,
"NICE_29": 59,
"NICE_30": 60,
"NICE_31": 61,
"NICE_32": 62,
"NICE_33": 63,
"NICE_34": 64,
"NICE_35": 65,
"NICE_36": 66,
"NICE_37": 67,
"NICE_38": 68,
"NICE_39": 69,
"NICE_40": 70,
"NICE_41": 71,
"NICE_42": 72,
"NICE_43": 73,
"NICE_44": 74,
"NICE_45": 75,
"NICE_UNK": 76
},
"unk_token": "[UNK]"
}
}