{ "config": { "bpe_vocab_size": 7987, "max_sentences": 32, "sentence_boundary_token": "", "pad_token": "", "bos_token": "", "eos_token": "", "mask_token": "", "noise_token": "", "min_frequency": 2 }, "vocab": { "": 0, "": 1, "": 2, "": 3, "": 4, "": 5, "": 6, "": 7, "": 8, "": 9, "": 10, "": 11, "": 12, "%": 13, ",": 14, "-": 15, ".": 16, "0": 17, "1": 18, "2": 19, "3": 20, "4": 21, "5": 22, "6": 23, "7": 24, "8": 25, "9": 26, ":": 27, ";": 28, "?": 29, "_": 30, "a": 31, "b": 32, "c": 33, "d": 34, "e": 35, "f": 36, "g": 37, "h": 38, "i": 39, "j": 40, "k": 41, "l": 42, "m": 43, "n": 44, "o": 45, "p": 46, "r": 47, "s": 48, "t": 49, "u": 50, "v": 51, "w": 52, "y": 53, "z": 54, "an": 55, "an": 56, "er": 57, "da": 58, "en": 59, "ti": 60, "il": 61, "si": 62, "si": 63, "di": 64, "ang": 65, "anc": 66, "al": 67, "kan": 68, "ke": 69, "su": 70, "ef": 71, "ang": 72, "ri": 73, "ter": 74, "se": 75, "on": 76, "te": 77, "hef": 78, "hefe": 79, "on": 80, "ng": 81, "po": 82, "sim": 83, "ul": 84, "re": 85, "pa": 86, "ar": 87, "pen": 88, "la": 89, "dari": 90, "bu": 91, "men": 92, "tida": 93, "om": 94, "hefei": 95, "ance": 96, "in": 97, "asi": 98, "ra": 99, "kesim": 100, "kesimp": 101, "kesimpul": 102, "kesimpulan": 103, "eri": 104, "ai": 105, "jang": 106, "al": 107, "ct": 108, "kon": 109, "dianc": 110, "diancang": 111, "ju": 112, "jangm": 113, "jangmo": 114, "jangmok": 115, "li": 116, "or": 117, "fi": 118, "sa": 119, "ta": 120, "meng": 121, "ksi": 122, "ngkan": 123, "pl": 124, "ja": 125, "buk": 126, "bukt": 127, "bukti": 128, "tidak": 129, "ya": 130, "yang": 131, "di": 132, "per": 133, "sn": 134, "sno": 135, "snow": 136, "plu": 137, "plum": 138, "pil": 139, "pill": 140, "ss": 141, "pi": 142, "cu": 143, "ku": 144, "ili": 145, "fiv": 146, "five": 147, "sw": 148, "swor": 149, "sword": 150, "swords": 151, "tion": 152, "enc": 153, "ence": 154, "ran": 155, "ce": 156, "ro": 157, "lo": 158, "mu": 159, "pencu": 160, "com": 161, "pol": 162, "pola": 163, "anom": 164, "anomal": 165, "gy": 166, "gyer": 167, "gyery": 168, "gyeryon": 169, "gyeryong": 170, "mer": 171, "merc": 172, "merch": 173, "merchan": 174, "merchant": 175, "gu": 176, "guil": 177, "guild": 178, "de": 179, "mar": 180, "marti": 181, "martial": 182, "alli": 183, "alliance": 184, "pre": 185, "predi": 186, "tin": 187, "tinda": 188, "tindakan": 189, "beri": 190, "beriku": 191, "berikut": 192, "berikutn": 193, "berikutnya": 194, "simh": 195, "simhy": 196, "simhye": 197, "simhyeon": 198, "pav": 199, "pavili": 200, "pavilion": 201, "jang": 202, "hang": 203, "hangi": 204, "tae": 205, "taeul": 206, "taeul_": 207, "taeul_se": 208, "taeul_sect": 209, "at": 210, "lapo": 211, "laporan": 212, "gu": 213, "ilm": 214, "ilmu": 215, "terk": 216, "terkai": 217, "terkait": 218, "le": 219, "dar": 220, "dark": 221, "dark_": 222, "dark_f": 223, "dark_fa": 224, "dark_fac": 225, "dark_faction": 226, "sum": 227, "blo": 228, "bloo": 229, "blood": 230, "ser": 231, "serpen": 232, "serpent": 233, "dance": 234, "ste": 235, "step": 236, "anal": 237, "anali": 238, "analisi": 239, "analisis": 240, "cro": 241, "cross": 242, "ref": 243, "refer": 244, "reference": 245, "keja": 246, "kejadi": 247, "kejadian": 248, "mengh": 249, "menghil": 250, "menghilang": 251, "me": 252, "ha": 253, "pat": 254, "patter": 255, "pattern": 256, "terpi": 257, "terpisa": 258, "terpisah": 259, "hefei": 260, "hefei_": 261, "hefei_b": 262, "hefei_br": 263, "hefei_branc": 264, "hefei_branch": 265, "hu": 266, "hubu": 267, "compo": 268, "compos": 269, "compose": 270, "susu": 271, "susun": 272, "dete": 273, "deteksi": 274, "ketida": 275, "ketidak": 276, "ketidakse": 277, "ketidaksesu": 278, "ketidaksesuai": 279, "ketidaksesuaian": 280, "rec": 281, "recal": 282, "recall": 283, "ing": 284, "ingat": 285, "semu": 286, "semua": 287, "predict": 288, "perk": 289, "perki": 290, "perkira": 291, "perkirakan": 292, "veri": 293, "verif": 294, "verify": 295, "cek": 296, "konsi": 297, "konsis": 298, "konsist": 299, "konsisten": 300, "konsistensi": 301, "anomaly": 302, "ban": 303, "bandi": 304, "bandingkan": 305, "tang": 306, "tangg": 307, "tanggal": 308, "hubungkan": 309, "fra": 310, "frag": 311, "fragme": 312, "fragmen": 313, "as": 314, "den": 315, "deng": 316, "dengan": 317, "ad": 318, "ada": 319, "bar": 320, "baru": 321, "bi": 322, "fil": 323, "filte": 324, "filter": 325, "eli": 326, "elim": 327, "elimin": 328, "eliminasi": 329, "rele": 330, "relev": 331, "relevan": 332, "masi": 333, "pencuri": 334, "ber": 335, "dala": 336, "dalam": 337, "konsum": 338, "konsumsi": 339, "ting": 340, "pa": 341, "pencur": 342, "pencuri": 343, "pencurian": 344, "ca": 345, "sumb": 346, "sumbe": 347, "sumber": 348, "inf": 349, "infor": 350, "informasi": 351, "ke": 352, "ka": 353, "inv": 354, "inve": 355, "inves": 356, "investi": 357, "investig": 358, "investigasi": 359, "ya": 360, "mi": 361, "misi": 362, "assi": 363, "assig": 364, "assign": 365, "sen": 366, "sendi": 367, "sendiri": 368, "ah": 369, "menu": 370, "menun": 371, "menunj": 372, "menunju": 373, "menunjuk": 374, "menunjukkan": 375, "dat": 376, "data": 377, "pil": 378, "pasa": 379, "pasar": 380, "ge": 381, "gela": 382, "gelap": 383, "suc": 384, "succe": 385, "success": 386, "rat": 387, "rate": 388, "pai": 389, "pair": 390, "lebi": 391, "lebih": 392, "tingg": 393, "tinggi": 394, "bias": 395, "biasan": 396, "biasanya": 397, "penal": 398, "penalar": 399, "penalaran": 400, "sete": 401, "setela": 402, "setelah": 403, "hari": 404, "sam": 405, "sama": 406, "tan": 407, "tanpa": 408, "je": 409, "jeja": 410, "jejak": 411, "temu": 412, "anomali": 413, "prediksi": 414, "ters": 415, "tersang": 416, "tersangka": 417, "temuan": 418, "berk": 419, "berko": 420, "berkore": 421, "berkorela": 422, "berkorelasi": 423, "cata": 424, "catat": 425, "catatan": 426, "perg": 427, "perger": 428, "pergera": 429, "pergerakan": 430, "mengkon": 431, "mengkonfi": 432, "mengkonfir": 433, "mengkonfirmasi": 434, "ev": 435, "eval": 436, "evalu": 437, "evaluasi": 438, "keper": 439, "keperca": 440, "kepercaya": 441, "kepercayaan": 442, "mengar": 443, "mengarah": 444, "terse": 445, "tersedi": 446, "tersedia": 447, "mem": 448, "memili": 449, "memilik": 450, "memiliki": 451, "kone": 452, "koneksi": 453, "con": 454, "confi": 455, "confid": 456, "confidence": 457, "menja": 458, "menjadi": 459, "kun": 460, "kunc": 461, "kunci": 462, "hasi": 463, "hasil": 464, "insi": 465, "insid": 466, "inside": 467, "jo": 468, "job": 469, "compl": 470, "comple": 471, "completion": 472, "ran": 473, "ranta": 474, "rantai": 475, "berda": 476, "berdas": 477, "berdasar": 478, "berdasarkan": 479, "terha": 480, "terhada": 481, "terhadap": 482, "tingk": 483, "tingkat": 484, "keya": 485, "keyak": 486, "keyakin": 487, "keyakinan": 488, "pro": 489, "prose": 490, "proses": 491, "ded": 492, "dedu": 493, "deduksi": 494, "ba": 495, "bah": 496, "bahw": 497, "bahwa": 498, "sia": 499, "siapa": 500, "mencu": 501, "mencuri": 502, "berta": 503, "bertaha": 504, "bertahap": 505, "mengin": 506, "mengindi": 507, "mengindik": 508, "mengindika": 509, "mengindikasi": 510, "mengindikasikan": 511, "pene": 512, "penel": 513, "penelu": 514, "penelusu": 515, "penelusuran": 516, "log": 517, "logi": 518, "logika": 519, "lang": 520, "langk": 521, "langkah": 522, "hubung": 523, "hubungan": 524, "ant": 525, "antar": 526, "antara": 527, "dan": 528, "terdeteksi": 529, "perha": 530, "perhati": 531, "perhatian": 532, "terda": 533, "terdapa": 534, "terdapat": 535, "kejang": 536, "kejangg": 537, "kejanggal": 538, "kejanggalan": 539, "laz": 540, "lazi": 541, "lazim": 542, "ditemu": 543, "ditemukan": 544, "68": 545, "62": 546, "73": 547, "67": 548, "74": 549, "66": 550, "69": 551, "70": 552, "65": 553, "59": 554, "71": 555, "63": 556, "61": 557, "64": 558, "81": 559, "58": 560, "54": 561, "76": 562, "75": 563, "46": 564, "49": 565, "82": 566, "57": 567, "53": 568, "48": 569, "52": 570, "44": 571, "72": 572, "56": 573, "93": 574, "55": 575 }, "merges": { "a|||n": 0, "a|||n": 1, "e|||r": 2, "d|||a": 3, "e|||n": 4, "t|||i": 5, "i|||l": 6, "s|||i": 7, "s|||i": 8, "d|||i": 9, "an|||g": 10, "an|||c": 11, "a|||l": 12, "k|||an": 13, "k|||e": 14, "s|||u": 15, "e|||f": 16, "an|||g": 17, "r|||i": 18, "t|||er": 19, "s|||e": 20, "o|||n": 21, "t|||e": 22, "h|||ef": 23, "hef|||e": 24, "o|||n": 25, "n|||g": 26, "p|||o": 27, "si|||m": 28, "u|||l": 29, "r|||e": 30, "p|||a": 31, "a|||r": 32, "p|||en": 33, "l|||a": 34, "da|||ri": 35, "b|||u": 36, "m|||en": 37, "ti|||da": 38, "o|||m": 39, "hefe|||i": 40, "anc|||e": 41, "i|||n": 42, "a|||si": 43, "r|||a": 44, "ke|||sim": 45, "kesim|||p": 46, "kesimp|||ul": 47, "kesimpul|||an": 48, "er|||i": 49, "a|||i": 50, "j|||ang": 51, "a|||l": 52, "c|||t": 53, "k|||on": 54, "di|||anc": 55, "dianc|||ang": 56, "j|||u": 57, "jang|||m": 58, "jangm|||o": 59, "jangmo|||k": 60, "l|||i": 61, "o|||r": 62, "f|||i": 63, "s|||a": 64, "t|||a": 65, "men|||g": 66, "k|||si": 67, "ng|||kan": 68, "p|||l": 69, "j|||a": 70, "bu|||k": 71, "buk|||t": 72, "bukt|||i": 73, "tida|||k": 74, "y|||a": 75, "y|||ang": 76, "d|||i": 77, "p|||er": 78, "s|||n": 79, "sn|||o": 80, "sno|||w": 81, "pl|||u": 82, "plu|||m": 83, "p|||il": 84, "pil|||l": 85, "s|||s": 86, "p|||i": 87, "c|||u": 88, "k|||u": 89, "il|||i": 90, "fi|||v": 91, "fiv|||e": 92, "s|||w": 93, "sw|||or": 94, "swor|||d": 95, "sword|||s": 96, "ti|||on": 97, "en|||c": 98, "enc|||e": 99, "r|||an": 100, "c|||e": 101, "r|||o": 102, "l|||o": 103, "m|||u": 104, "pen|||cu": 105, "c|||om": 106, "po|||l": 107, "pol|||a": 108, "an|||om": 109, "anom|||al": 110, "g|||y": 111, "gy|||er": 112, "gyer|||y": 113, "gyery|||on": 114, "gyeryon|||g": 115, "m|||er": 116, "mer|||c": 117, "merc|||h": 118, "merch|||an": 119, "merchan|||t": 120, "g|||u": 121, "gu|||il": 122, "guil|||d": 123, "d|||e": 124, "m|||ar": 125, "mar|||ti": 126, "marti|||al": 127, "al|||li": 128, "alli|||ance": 129, "p|||re": 130, "pre|||di": 131, "ti|||n": 132, "tin|||da": 133, "tinda|||kan": 134, "b|||eri": 135, "beri|||ku": 136, "beriku|||t": 137, "berikut|||n": 138, "berikutn|||ya": 139, "sim|||h": 140, "simh|||y": 141, "simhy|||e": 142, "simhye|||on": 143, "pa|||v": 144, "pav|||ili": 145, "pavili|||on": 146, "j|||ang": 147, "h|||ang": 148, "hang|||i": 149, "ta|||e": 150, "tae|||ul": 151, "taeul|||_": 152, "taeul_|||se": 153, "taeul_se|||ct": 154, "a|||t": 155, "la|||po": 156, "lapo|||ran": 157, "g|||u": 158, "il|||m": 159, "ilm|||u": 160, "ter|||k": 161, "terk|||ai": 162, "terkai|||t": 163, "l|||e": 164, "da|||r": 165, "dar|||k": 166, "dark|||_": 167, "dark_|||f": 168, "dark_f|||a": 169, "dark_fa|||c": 170, "dark_fac|||tion": 171, "su|||m": 172, "b|||lo": 173, "blo|||o": 174, "bloo|||d": 175, "s|||er": 176, "ser|||pen": 177, "serpen|||t": 178, "d|||ance": 179, "s|||te": 180, "ste|||p": 181, "an|||al": 182, "anal|||i": 183, "anali|||si": 184, "analisi|||s": 185, "c|||ro": 186, "cro|||ss": 187, "r|||ef": 188, "ref|||er": 189, "refer|||ence": 190, "ke|||ja": 191, "keja|||di": 192, "kejadi|||an": 193, "meng|||h": 194, "mengh|||il": 195, "menghil|||ang": 196, "m|||e": 197, "h|||a": 198, "pa|||t": 199, "pat|||ter": 200, "patter|||n": 201, "ter|||pi": 202, "terpi|||sa": 203, "terpisa|||h": 204, "hefe|||i": 205, "hefei|||_": 206, "hefei_|||b": 207, "hefei_b|||r": 208, "hefei_br|||anc": 209, "hefei_branc|||h": 210, "h|||u": 211, "hu|||bu": 212, "com|||po": 213, "compo|||s": 214, "compos|||e": 215, "su|||su": 216, "susu|||n": 217, "de|||te": 218, "dete|||ksi": 219, "ke|||tida": 220, "ketida|||k": 221, "ketidak|||se": 222, "ketidakse|||su": 223, "ketidaksesu|||ai": 224, "ketidaksesuai|||an": 225, "re|||c": 226, "rec|||al": 227, "recal|||l": 228, "i|||ng": 229, "ing|||at": 230, "se|||mu": 231, "semu|||a": 232, "predi|||ct": 233, "per|||k": 234, "perk|||i": 235, "perki|||ra": 236, "perkira|||kan": 237, "v|||eri": 238, "veri|||f": 239, "verif|||y": 240, "ce|||k": 241, "kon|||si": 242, "konsi|||s": 243, "konsis|||t": 244, "konsist|||en": 245, "konsisten|||si": 246, "anomal|||y": 247, "b|||an": 248, "ban|||di": 249, "bandi|||ngkan": 250, "t|||ang": 251, "tang|||g": 252, "tangg|||al": 253, "hubu|||ngkan": 254, "f|||ra": 255, "fra|||g": 256, "frag|||me": 257, "fragme|||n": 258, "a|||s": 259, "d|||en": 260, "den|||g": 261, "deng|||an": 262, "a|||d": 263, "ad|||a": 264, "b|||ar": 265, "bar|||u": 266, "b|||i": 267, "f|||il": 268, "fil|||te": 269, "filte|||r": 270, "e|||li": 271, "eli|||m": 272, "elim|||in": 273, "elimin|||asi": 274, "re|||le": 275, "rele|||v": 276, "relev|||an": 277, "m|||asi": 278, "pencu|||ri": 279, "b|||er": 280, "da|||la": 281, "dala|||m": 282, "kon|||sum": 283, "konsum|||si": 284, "ti|||ng": 285, "p|||a": 286, "pencu|||r": 287, "pencur|||i": 288, "pencuri|||an": 289, "c|||a": 290, "sum|||b": 291, "sumb|||e": 292, "sumbe|||r": 293, "in|||f": 294, "inf|||or": 295, "infor|||masi": 296, "k|||e": 297, "k|||a": 298, "in|||v": 299, "inv|||e": 300, "inve|||s": 301, "inves|||ti": 302, "investi|||g": 303, "investig|||asi": 304, "y|||a": 305, "m|||i": 306, "mi|||si": 307, "as|||si": 308, "assi|||g": 309, "assig|||n": 310, "s|||en": 311, "sen|||di": 312, "sendi|||ri": 313, "a|||h": 314, "men|||u": 315, "menu|||n": 316, "menun|||j": 317, "menunj|||u": 318, "menunju|||k": 319, "menunjuk|||kan": 320, "da|||t": 321, "dat|||a": 322, "pi|||l": 323, "pa|||sa": 324, "pasa|||r": 325, "g|||e": 326, "ge|||la": 327, "gela|||p": 328, "su|||c": 329, "suc|||ce": 330, "succe|||ss": 331, "ra|||t": 332, "rat|||e": 333, "pa|||i": 334, "pai|||r": 335, "le|||bi": 336, "lebi|||h": 337, "ting|||g": 338, "tingg|||i": 339, "bi|||as": 340, "bias|||an": 341, "biasan|||ya": 342, "pen|||al": 343, "penal|||ar": 344, "penalar|||an": 345, "se|||te": 346, "sete|||la": 347, "setela|||h": 348, "ha|||ri": 349, "sa|||m": 350, "sam|||a": 351, "t|||an": 352, "tan|||pa": 353, "j|||e": 354, "je|||ja": 355, "jeja|||k": 356, "te|||mu": 357, "anomal|||i": 358, "predi|||ksi": 359, "ter|||s": 360, "ters|||ang": 361, "tersang|||ka": 362, "temu|||an": 363, "ber|||k": 364, "berk|||o": 365, "berko|||re": 366, "berkore|||la": 367, "berkorela|||si": 368, "ca|||ta": 369, "cata|||t": 370, "catat|||an": 371, "per|||g": 372, "perg|||er": 373, "perger|||a": 374, "pergera|||kan": 375, "meng|||kon": 376, "mengkon|||fi": 377, "mengkonfi|||r": 378, "mengkonfir|||masi": 379, "e|||v": 380, "ev|||al": 381, "eval|||u": 382, "evalu|||asi": 383, "ke|||per": 384, "keper|||ca": 385, "keperca|||ya": 386, "kepercaya|||an": 387, "meng|||ar": 388, "mengar|||ah": 389, "ter|||se": 390, "terse|||di": 391, "tersedi|||a": 392, "me|||m": 393, "mem|||ili": 394, "memili|||k": 395, "memilik|||i": 396, "kon|||e": 397, "kone|||ksi": 398, "c|||on": 399, "con|||fi": 400, "confi|||d": 401, "confid|||ence": 402, "men|||ja": 403, "menja|||di": 404, "ku|||n": 405, "kun|||c": 406, "kunc|||i": 407, "ha|||si": 408, "hasi|||l": 409, "in|||si": 410, "insi|||d": 411, "insid|||e": 412, "j|||o": 413, "jo|||b": 414, "com|||pl": 415, "compl|||e": 416, "comple|||tion": 417, "r|||an": 418, "ran|||ta": 419, "ranta|||i": 420, "ber|||da": 421, "berda|||s": 422, "berdas|||ar": 423, "berdasar|||kan": 424, "ter|||ha": 425, "terha|||da": 426, "terhada|||p": 427, "ting|||k": 428, "tingk|||at": 429, "ke|||ya": 430, "keya|||k": 431, "keyak|||in": 432, "keyakin|||an": 433, "p|||ro": 434, "pro|||se": 435, "prose|||s": 436, "de|||d": 437, "ded|||u": 438, "dedu|||ksi": 439, "b|||a": 440, "ba|||h": 441, "bah|||w": 442, "bahw|||a": 443, "si|||a": 444, "sia|||pa": 445, "men|||cu": 446, "mencu|||ri": 447, "ber|||ta": 448, "berta|||ha": 449, "bertaha|||p": 450, "meng|||in": 451, "mengin|||di": 452, "mengindi|||k": 453, "mengindik|||a": 454, "mengindika|||si": 455, "mengindikasi|||kan": 456, "pen|||e": 457, "pene|||l": 458, "penel|||u": 459, "penelu|||su": 460, "penelusu|||ran": 461, "lo|||g": 462, "log|||i": 463, "logi|||ka": 464, "l|||ang": 465, "lang|||k": 466, "langk|||ah": 467, "hubu|||ng": 468, "hubung|||an": 469, "an|||t": 470, "ant|||ar": 471, "antar|||a": 472, "d|||an": 473, "ter|||deteksi": 474, "per|||ha": 475, "perha|||ti": 476, "perhati|||an": 477, "ter|||da": 478, "terda|||pa": 479, "terdapa|||t": 480, "ke|||jang": 481, "kejang|||g": 482, "kejangg|||al": 483, "kejanggal|||an": 484, "la|||z": 485, "laz|||i": 486, "lazi|||m": 487, "di|||temu": 488, "ditemu|||kan": 489, "6|||8": 490, "6|||2": 491, "7|||3": 492, "6|||7": 493, "7|||4": 494, "6|||6": 495, "6|||9": 496, "7|||0": 497, "6|||5": 498, "5|||9": 499, "7|||1": 500, "6|||3": 501, "6|||1": 502, "6|||4": 503, "8|||1": 504, "5|||8": 505, "5|||4": 506, "7|||6": 507, "7|||5": 508, "4|||6": 509, "4|||9": 510, "8|||2": 511, "5|||7": 512, "5|||3": 513, "4|||8": 514, "5|||2": 515, "4|||4": 516, "7|||2": 517, "5|||6": 518, "9|||3": 519, "5|||5": 520 }, "is_trained": true }