wuuuuuuuk committed on
Commit
f4d2c11
·
1 Parent(s): ade5bcf

Test model

Browse files
README.md CHANGED
@@ -1,3 +1,5 @@
1
  ---
2
  license: apache-2.0
3
  ---
 
 
 
1
  ---
2
  license: apache-2.0
3
  ---
4
+
5
+ This is a test model for `transformers/tests/models/lasr/test_modeling_lasr.py`. It is not suitable for non-testing use.
added_tokens.json ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<extra_id_0>": 611,
3
+ "<extra_id_10>": 601,
4
+ "<extra_id_11>": 600,
5
+ "<extra_id_12>": 599,
6
+ "<extra_id_13>": 598,
7
+ "<extra_id_14>": 597,
8
+ "<extra_id_15>": 596,
9
+ "<extra_id_16>": 595,
10
+ "<extra_id_17>": 594,
11
+ "<extra_id_18>": 593,
12
+ "<extra_id_19>": 592,
13
+ "<extra_id_1>": 610,
14
+ "<extra_id_20>": 591,
15
+ "<extra_id_21>": 590,
16
+ "<extra_id_22>": 589,
17
+ "<extra_id_23>": 588,
18
+ "<extra_id_24>": 587,
19
+ "<extra_id_25>": 586,
20
+ "<extra_id_26>": 585,
21
+ "<extra_id_27>": 584,
22
+ "<extra_id_28>": 583,
23
+ "<extra_id_29>": 582,
24
+ "<extra_id_2>": 609,
25
+ "<extra_id_30>": 581,
26
+ "<extra_id_31>": 580,
27
+ "<extra_id_32>": 579,
28
+ "<extra_id_33>": 578,
29
+ "<extra_id_34>": 577,
30
+ "<extra_id_35>": 576,
31
+ "<extra_id_36>": 575,
32
+ "<extra_id_37>": 574,
33
+ "<extra_id_38>": 573,
34
+ "<extra_id_39>": 572,
35
+ "<extra_id_3>": 608,
36
+ "<extra_id_40>": 571,
37
+ "<extra_id_41>": 570,
38
+ "<extra_id_42>": 569,
39
+ "<extra_id_43>": 568,
40
+ "<extra_id_44>": 567,
41
+ "<extra_id_45>": 566,
42
+ "<extra_id_46>": 565,
43
+ "<extra_id_47>": 564,
44
+ "<extra_id_48>": 563,
45
+ "<extra_id_49>": 562,
46
+ "<extra_id_4>": 607,
47
+ "<extra_id_50>": 561,
48
+ "<extra_id_51>": 560,
49
+ "<extra_id_52>": 559,
50
+ "<extra_id_53>": 558,
51
+ "<extra_id_54>": 557,
52
+ "<extra_id_55>": 556,
53
+ "<extra_id_56>": 555,
54
+ "<extra_id_57>": 554,
55
+ "<extra_id_58>": 553,
56
+ "<extra_id_59>": 552,
57
+ "<extra_id_5>": 606,
58
+ "<extra_id_60>": 551,
59
+ "<extra_id_61>": 550,
60
+ "<extra_id_62>": 549,
61
+ "<extra_id_63>": 548,
62
+ "<extra_id_64>": 547,
63
+ "<extra_id_65>": 546,
64
+ "<extra_id_66>": 545,
65
+ "<extra_id_67>": 544,
66
+ "<extra_id_68>": 543,
67
+ "<extra_id_69>": 542,
68
+ "<extra_id_6>": 605,
69
+ "<extra_id_70>": 541,
70
+ "<extra_id_71>": 540,
71
+ "<extra_id_72>": 539,
72
+ "<extra_id_73>": 538,
73
+ "<extra_id_74>": 537,
74
+ "<extra_id_75>": 536,
75
+ "<extra_id_76>": 535,
76
+ "<extra_id_77>": 534,
77
+ "<extra_id_78>": 533,
78
+ "<extra_id_79>": 532,
79
+ "<extra_id_7>": 604,
80
+ "<extra_id_80>": 531,
81
+ "<extra_id_81>": 530,
82
+ "<extra_id_82>": 529,
83
+ "<extra_id_83>": 528,
84
+ "<extra_id_84>": 527,
85
+ "<extra_id_85>": 526,
86
+ "<extra_id_86>": 525,
87
+ "<extra_id_87>": 524,
88
+ "<extra_id_88>": 523,
89
+ "<extra_id_89>": 522,
90
+ "<extra_id_8>": 603,
91
+ "<extra_id_90>": 521,
92
+ "<extra_id_91>": 520,
93
+ "<extra_id_92>": 519,
94
+ "<extra_id_93>": 518,
95
+ "<extra_id_94>": 517,
96
+ "<extra_id_95>": 516,
97
+ "<extra_id_96>": 515,
98
+ "<extra_id_97>": 514,
99
+ "<extra_id_98>": 513,
100
+ "<extra_id_99>": 512,
101
+ "<extra_id_9>": 602,
102
+ "<pad>": 612
103
+ }
config.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ctc_loss_reduction": "mean",
3
+ "ctc_zero_infinity": true,
4
+ "encoder_config": {
5
+ "activation_dropout": 0.1,
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.1,
8
+ "batch_norm_momentum": 0.01,
9
+ "conv_kernel_size": 32,
10
+ "conv_residual_weights": [
11
+ 2.0,
12
+ 1.0
13
+ ],
14
+ "convolution_bias": false,
15
+ "dropout": 0.1,
16
+ "dropout_positions": 0.0,
17
+ "feed_forward_residual_weights": [
18
+ 1.5,
19
+ 0.5
20
+ ],
21
+ "hidden_act": "silu",
22
+ "hidden_size": 512,
23
+ "initializer_range": 0.02,
24
+ "intermediate_size": 2048,
25
+ "layer_norm_eps": 1e-06,
26
+ "layerdrop": 0.1,
27
+ "max_position_embeddings": 10000,
28
+ "model_type": "lasr_encoder",
29
+ "num_attention_heads": 8,
30
+ "num_hidden_layers": 17,
31
+ "num_key_value_heads": 8,
32
+ "num_mel_bins": 128,
33
+ "rope_parameters": {
34
+ "rope_theta": 10000.0,
35
+ "rope_type": "default"
36
+ },
37
+ "subsampling_conv_channels": 256,
38
+ "subsampling_conv_kernel_size": 5,
39
+ "subsampling_conv_stride": 2
40
+ },
41
+ "initializer_range": 0.02,
42
+ "model_type": "lasr_ctc",
43
+ "pad_token_id": 0,
44
+ "transformers_version": "5.0.0.dev0",
45
+ "vocab_size": 512
46
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf03cb9c3b710ea4ee8134940bb4b0906f69cb3d54954bf6c84e2b3d0323b739
3
+ size 421172424
preprocessor_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "feature_extractor_type": "LasrFeatureExtractor",
3
+ "feature_size": 128,
4
+ "hop_length": 160,
5
+ "n_fft": 512,
6
+ "padding_side": "right",
7
+ "padding_value": 0.0,
8
+ "processor_class": "LasrProcessor",
9
+ "return_attention_mask": true,
10
+ "sampling_rate": 16000,
11
+ "win_length": 400
12
+ }
processor_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "feature_extractor": {
3
+ "feature_extractor_type": "LasrFeatureExtractor",
4
+ "feature_size": 128,
5
+ "hop_length": 160,
6
+ "n_fft": 512,
7
+ "padding_side": "right",
8
+ "padding_value": 0.0,
9
+ "processor_class": "LasrProcessor",
10
+ "return_attention_mask": true,
11
+ "sampling_rate": 16000,
12
+ "win_length": 400
13
+ },
14
+ "processor_class": "LasrProcessor"
15
+ }
tokenizer.json ADDED
@@ -0,0 +1,3054 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "<epsilon>",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": "<s>",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 2,
26
+ "content": "</s>",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ },
33
+ {
34
+ "id": 3,
35
+ "content": "<unk>",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": false,
40
+ "special": true
41
+ },
42
+ {
43
+ "id": 512,
44
+ "content": "<pad>",
45
+ "single_word": false,
46
+ "lstrip": false,
47
+ "rstrip": false,
48
+ "normalized": false,
49
+ "special": true
50
+ },
51
+ {
52
+ "id": 513,
53
+ "content": "<extra_id_0>",
54
+ "single_word": false,
55
+ "lstrip": false,
56
+ "rstrip": false,
57
+ "normalized": false,
58
+ "special": true
59
+ },
60
+ {
61
+ "id": 514,
62
+ "content": "<extra_id_1>",
63
+ "single_word": false,
64
+ "lstrip": false,
65
+ "rstrip": false,
66
+ "normalized": false,
67
+ "special": true
68
+ },
69
+ {
70
+ "id": 515,
71
+ "content": "<extra_id_2>",
72
+ "single_word": false,
73
+ "lstrip": false,
74
+ "rstrip": false,
75
+ "normalized": false,
76
+ "special": true
77
+ },
78
+ {
79
+ "id": 516,
80
+ "content": "<extra_id_3>",
81
+ "single_word": false,
82
+ "lstrip": false,
83
+ "rstrip": false,
84
+ "normalized": false,
85
+ "special": true
86
+ },
87
+ {
88
+ "id": 517,
89
+ "content": "<extra_id_4>",
90
+ "single_word": false,
91
+ "lstrip": false,
92
+ "rstrip": false,
93
+ "normalized": false,
94
+ "special": true
95
+ },
96
+ {
97
+ "id": 518,
98
+ "content": "<extra_id_5>",
99
+ "single_word": false,
100
+ "lstrip": false,
101
+ "rstrip": false,
102
+ "normalized": false,
103
+ "special": true
104
+ },
105
+ {
106
+ "id": 519,
107
+ "content": "<extra_id_6>",
108
+ "single_word": false,
109
+ "lstrip": false,
110
+ "rstrip": false,
111
+ "normalized": false,
112
+ "special": true
113
+ },
114
+ {
115
+ "id": 520,
116
+ "content": "<extra_id_7>",
117
+ "single_word": false,
118
+ "lstrip": false,
119
+ "rstrip": false,
120
+ "normalized": false,
121
+ "special": true
122
+ },
123
+ {
124
+ "id": 521,
125
+ "content": "<extra_id_8>",
126
+ "single_word": false,
127
+ "lstrip": false,
128
+ "rstrip": false,
129
+ "normalized": false,
130
+ "special": true
131
+ },
132
+ {
133
+ "id": 522,
134
+ "content": "<extra_id_9>",
135
+ "single_word": false,
136
+ "lstrip": false,
137
+ "rstrip": false,
138
+ "normalized": false,
139
+ "special": true
140
+ },
141
+ {
142
+ "id": 523,
143
+ "content": "<extra_id_10>",
144
+ "single_word": false,
145
+ "lstrip": false,
146
+ "rstrip": false,
147
+ "normalized": false,
148
+ "special": true
149
+ },
150
+ {
151
+ "id": 524,
152
+ "content": "<extra_id_11>",
153
+ "single_word": false,
154
+ "lstrip": false,
155
+ "rstrip": false,
156
+ "normalized": false,
157
+ "special": true
158
+ },
159
+ {
160
+ "id": 525,
161
+ "content": "<extra_id_12>",
162
+ "single_word": false,
163
+ "lstrip": false,
164
+ "rstrip": false,
165
+ "normalized": false,
166
+ "special": true
167
+ },
168
+ {
169
+ "id": 526,
170
+ "content": "<extra_id_13>",
171
+ "single_word": false,
172
+ "lstrip": false,
173
+ "rstrip": false,
174
+ "normalized": false,
175
+ "special": true
176
+ },
177
+ {
178
+ "id": 527,
179
+ "content": "<extra_id_14>",
180
+ "single_word": false,
181
+ "lstrip": false,
182
+ "rstrip": false,
183
+ "normalized": false,
184
+ "special": true
185
+ },
186
+ {
187
+ "id": 528,
188
+ "content": "<extra_id_15>",
189
+ "single_word": false,
190
+ "lstrip": false,
191
+ "rstrip": false,
192
+ "normalized": false,
193
+ "special": true
194
+ },
195
+ {
196
+ "id": 529,
197
+ "content": "<extra_id_16>",
198
+ "single_word": false,
199
+ "lstrip": false,
200
+ "rstrip": false,
201
+ "normalized": false,
202
+ "special": true
203
+ },
204
+ {
205
+ "id": 530,
206
+ "content": "<extra_id_17>",
207
+ "single_word": false,
208
+ "lstrip": false,
209
+ "rstrip": false,
210
+ "normalized": false,
211
+ "special": true
212
+ },
213
+ {
214
+ "id": 531,
215
+ "content": "<extra_id_18>",
216
+ "single_word": false,
217
+ "lstrip": false,
218
+ "rstrip": false,
219
+ "normalized": false,
220
+ "special": true
221
+ },
222
+ {
223
+ "id": 532,
224
+ "content": "<extra_id_19>",
225
+ "single_word": false,
226
+ "lstrip": false,
227
+ "rstrip": false,
228
+ "normalized": false,
229
+ "special": true
230
+ },
231
+ {
232
+ "id": 533,
233
+ "content": "<extra_id_20>",
234
+ "single_word": false,
235
+ "lstrip": false,
236
+ "rstrip": false,
237
+ "normalized": false,
238
+ "special": true
239
+ },
240
+ {
241
+ "id": 534,
242
+ "content": "<extra_id_21>",
243
+ "single_word": false,
244
+ "lstrip": false,
245
+ "rstrip": false,
246
+ "normalized": false,
247
+ "special": true
248
+ },
249
+ {
250
+ "id": 535,
251
+ "content": "<extra_id_22>",
252
+ "single_word": false,
253
+ "lstrip": false,
254
+ "rstrip": false,
255
+ "normalized": false,
256
+ "special": true
257
+ },
258
+ {
259
+ "id": 536,
260
+ "content": "<extra_id_23>",
261
+ "single_word": false,
262
+ "lstrip": false,
263
+ "rstrip": false,
264
+ "normalized": false,
265
+ "special": true
266
+ },
267
+ {
268
+ "id": 537,
269
+ "content": "<extra_id_24>",
270
+ "single_word": false,
271
+ "lstrip": false,
272
+ "rstrip": false,
273
+ "normalized": false,
274
+ "special": true
275
+ },
276
+ {
277
+ "id": 538,
278
+ "content": "<extra_id_25>",
279
+ "single_word": false,
280
+ "lstrip": false,
281
+ "rstrip": false,
282
+ "normalized": false,
283
+ "special": true
284
+ },
285
+ {
286
+ "id": 539,
287
+ "content": "<extra_id_26>",
288
+ "single_word": false,
289
+ "lstrip": false,
290
+ "rstrip": false,
291
+ "normalized": false,
292
+ "special": true
293
+ },
294
+ {
295
+ "id": 540,
296
+ "content": "<extra_id_27>",
297
+ "single_word": false,
298
+ "lstrip": false,
299
+ "rstrip": false,
300
+ "normalized": false,
301
+ "special": true
302
+ },
303
+ {
304
+ "id": 541,
305
+ "content": "<extra_id_28>",
306
+ "single_word": false,
307
+ "lstrip": false,
308
+ "rstrip": false,
309
+ "normalized": false,
310
+ "special": true
311
+ },
312
+ {
313
+ "id": 542,
314
+ "content": "<extra_id_29>",
315
+ "single_word": false,
316
+ "lstrip": false,
317
+ "rstrip": false,
318
+ "normalized": false,
319
+ "special": true
320
+ },
321
+ {
322
+ "id": 543,
323
+ "content": "<extra_id_30>",
324
+ "single_word": false,
325
+ "lstrip": false,
326
+ "rstrip": false,
327
+ "normalized": false,
328
+ "special": true
329
+ },
330
+ {
331
+ "id": 544,
332
+ "content": "<extra_id_31>",
333
+ "single_word": false,
334
+ "lstrip": false,
335
+ "rstrip": false,
336
+ "normalized": false,
337
+ "special": true
338
+ },
339
+ {
340
+ "id": 545,
341
+ "content": "<extra_id_32>",
342
+ "single_word": false,
343
+ "lstrip": false,
344
+ "rstrip": false,
345
+ "normalized": false,
346
+ "special": true
347
+ },
348
+ {
349
+ "id": 546,
350
+ "content": "<extra_id_33>",
351
+ "single_word": false,
352
+ "lstrip": false,
353
+ "rstrip": false,
354
+ "normalized": false,
355
+ "special": true
356
+ },
357
+ {
358
+ "id": 547,
359
+ "content": "<extra_id_34>",
360
+ "single_word": false,
361
+ "lstrip": false,
362
+ "rstrip": false,
363
+ "normalized": false,
364
+ "special": true
365
+ },
366
+ {
367
+ "id": 548,
368
+ "content": "<extra_id_35>",
369
+ "single_word": false,
370
+ "lstrip": false,
371
+ "rstrip": false,
372
+ "normalized": false,
373
+ "special": true
374
+ },
375
+ {
376
+ "id": 549,
377
+ "content": "<extra_id_36>",
378
+ "single_word": false,
379
+ "lstrip": false,
380
+ "rstrip": false,
381
+ "normalized": false,
382
+ "special": true
383
+ },
384
+ {
385
+ "id": 550,
386
+ "content": "<extra_id_37>",
387
+ "single_word": false,
388
+ "lstrip": false,
389
+ "rstrip": false,
390
+ "normalized": false,
391
+ "special": true
392
+ },
393
+ {
394
+ "id": 551,
395
+ "content": "<extra_id_38>",
396
+ "single_word": false,
397
+ "lstrip": false,
398
+ "rstrip": false,
399
+ "normalized": false,
400
+ "special": true
401
+ },
402
+ {
403
+ "id": 552,
404
+ "content": "<extra_id_39>",
405
+ "single_word": false,
406
+ "lstrip": false,
407
+ "rstrip": false,
408
+ "normalized": false,
409
+ "special": true
410
+ },
411
+ {
412
+ "id": 553,
413
+ "content": "<extra_id_40>",
414
+ "single_word": false,
415
+ "lstrip": false,
416
+ "rstrip": false,
417
+ "normalized": false,
418
+ "special": true
419
+ },
420
+ {
421
+ "id": 554,
422
+ "content": "<extra_id_41>",
423
+ "single_word": false,
424
+ "lstrip": false,
425
+ "rstrip": false,
426
+ "normalized": false,
427
+ "special": true
428
+ },
429
+ {
430
+ "id": 555,
431
+ "content": "<extra_id_42>",
432
+ "single_word": false,
433
+ "lstrip": false,
434
+ "rstrip": false,
435
+ "normalized": false,
436
+ "special": true
437
+ },
438
+ {
439
+ "id": 556,
440
+ "content": "<extra_id_43>",
441
+ "single_word": false,
442
+ "lstrip": false,
443
+ "rstrip": false,
444
+ "normalized": false,
445
+ "special": true
446
+ },
447
+ {
448
+ "id": 557,
449
+ "content": "<extra_id_44>",
450
+ "single_word": false,
451
+ "lstrip": false,
452
+ "rstrip": false,
453
+ "normalized": false,
454
+ "special": true
455
+ },
456
+ {
457
+ "id": 558,
458
+ "content": "<extra_id_45>",
459
+ "single_word": false,
460
+ "lstrip": false,
461
+ "rstrip": false,
462
+ "normalized": false,
463
+ "special": true
464
+ },
465
+ {
466
+ "id": 559,
467
+ "content": "<extra_id_46>",
468
+ "single_word": false,
469
+ "lstrip": false,
470
+ "rstrip": false,
471
+ "normalized": false,
472
+ "special": true
473
+ },
474
+ {
475
+ "id": 560,
476
+ "content": "<extra_id_47>",
477
+ "single_word": false,
478
+ "lstrip": false,
479
+ "rstrip": false,
480
+ "normalized": false,
481
+ "special": true
482
+ },
483
+ {
484
+ "id": 561,
485
+ "content": "<extra_id_48>",
486
+ "single_word": false,
487
+ "lstrip": false,
488
+ "rstrip": false,
489
+ "normalized": false,
490
+ "special": true
491
+ },
492
+ {
493
+ "id": 562,
494
+ "content": "<extra_id_49>",
495
+ "single_word": false,
496
+ "lstrip": false,
497
+ "rstrip": false,
498
+ "normalized": false,
499
+ "special": true
500
+ },
501
+ {
502
+ "id": 563,
503
+ "content": "<extra_id_50>",
504
+ "single_word": false,
505
+ "lstrip": false,
506
+ "rstrip": false,
507
+ "normalized": false,
508
+ "special": true
509
+ },
510
+ {
511
+ "id": 564,
512
+ "content": "<extra_id_51>",
513
+ "single_word": false,
514
+ "lstrip": false,
515
+ "rstrip": false,
516
+ "normalized": false,
517
+ "special": true
518
+ },
519
+ {
520
+ "id": 565,
521
+ "content": "<extra_id_52>",
522
+ "single_word": false,
523
+ "lstrip": false,
524
+ "rstrip": false,
525
+ "normalized": false,
526
+ "special": true
527
+ },
528
+ {
529
+ "id": 566,
530
+ "content": "<extra_id_53>",
531
+ "single_word": false,
532
+ "lstrip": false,
533
+ "rstrip": false,
534
+ "normalized": false,
535
+ "special": true
536
+ },
537
+ {
538
+ "id": 567,
539
+ "content": "<extra_id_54>",
540
+ "single_word": false,
541
+ "lstrip": false,
542
+ "rstrip": false,
543
+ "normalized": false,
544
+ "special": true
545
+ },
546
+ {
547
+ "id": 568,
548
+ "content": "<extra_id_55>",
549
+ "single_word": false,
550
+ "lstrip": false,
551
+ "rstrip": false,
552
+ "normalized": false,
553
+ "special": true
554
+ },
555
+ {
556
+ "id": 569,
557
+ "content": "<extra_id_56>",
558
+ "single_word": false,
559
+ "lstrip": false,
560
+ "rstrip": false,
561
+ "normalized": false,
562
+ "special": true
563
+ },
564
+ {
565
+ "id": 570,
566
+ "content": "<extra_id_57>",
567
+ "single_word": false,
568
+ "lstrip": false,
569
+ "rstrip": false,
570
+ "normalized": false,
571
+ "special": true
572
+ },
573
+ {
574
+ "id": 571,
575
+ "content": "<extra_id_58>",
576
+ "single_word": false,
577
+ "lstrip": false,
578
+ "rstrip": false,
579
+ "normalized": false,
580
+ "special": true
581
+ },
582
+ {
583
+ "id": 572,
584
+ "content": "<extra_id_59>",
585
+ "single_word": false,
586
+ "lstrip": false,
587
+ "rstrip": false,
588
+ "normalized": false,
589
+ "special": true
590
+ },
591
+ {
592
+ "id": 573,
593
+ "content": "<extra_id_60>",
594
+ "single_word": false,
595
+ "lstrip": false,
596
+ "rstrip": false,
597
+ "normalized": false,
598
+ "special": true
599
+ },
600
+ {
601
+ "id": 574,
602
+ "content": "<extra_id_61>",
603
+ "single_word": false,
604
+ "lstrip": false,
605
+ "rstrip": false,
606
+ "normalized": false,
607
+ "special": true
608
+ },
609
+ {
610
+ "id": 575,
611
+ "content": "<extra_id_62>",
612
+ "single_word": false,
613
+ "lstrip": false,
614
+ "rstrip": false,
615
+ "normalized": false,
616
+ "special": true
617
+ },
618
+ {
619
+ "id": 576,
620
+ "content": "<extra_id_63>",
621
+ "single_word": false,
622
+ "lstrip": false,
623
+ "rstrip": false,
624
+ "normalized": false,
625
+ "special": true
626
+ },
627
+ {
628
+ "id": 577,
629
+ "content": "<extra_id_64>",
630
+ "single_word": false,
631
+ "lstrip": false,
632
+ "rstrip": false,
633
+ "normalized": false,
634
+ "special": true
635
+ },
636
+ {
637
+ "id": 578,
638
+ "content": "<extra_id_65>",
639
+ "single_word": false,
640
+ "lstrip": false,
641
+ "rstrip": false,
642
+ "normalized": false,
643
+ "special": true
644
+ },
645
+ {
646
+ "id": 579,
647
+ "content": "<extra_id_66>",
648
+ "single_word": false,
649
+ "lstrip": false,
650
+ "rstrip": false,
651
+ "normalized": false,
652
+ "special": true
653
+ },
654
+ {
655
+ "id": 580,
656
+ "content": "<extra_id_67>",
657
+ "single_word": false,
658
+ "lstrip": false,
659
+ "rstrip": false,
660
+ "normalized": false,
661
+ "special": true
662
+ },
663
+ {
664
+ "id": 581,
665
+ "content": "<extra_id_68>",
666
+ "single_word": false,
667
+ "lstrip": false,
668
+ "rstrip": false,
669
+ "normalized": false,
670
+ "special": true
671
+ },
672
+ {
673
+ "id": 582,
674
+ "content": "<extra_id_69>",
675
+ "single_word": false,
676
+ "lstrip": false,
677
+ "rstrip": false,
678
+ "normalized": false,
679
+ "special": true
680
+ },
681
+ {
682
+ "id": 583,
683
+ "content": "<extra_id_70>",
684
+ "single_word": false,
685
+ "lstrip": false,
686
+ "rstrip": false,
687
+ "normalized": false,
688
+ "special": true
689
+ },
690
+ {
691
+ "id": 584,
692
+ "content": "<extra_id_71>",
693
+ "single_word": false,
694
+ "lstrip": false,
695
+ "rstrip": false,
696
+ "normalized": false,
697
+ "special": true
698
+ },
699
+ {
700
+ "id": 585,
701
+ "content": "<extra_id_72>",
702
+ "single_word": false,
703
+ "lstrip": false,
704
+ "rstrip": false,
705
+ "normalized": false,
706
+ "special": true
707
+ },
708
+ {
709
+ "id": 586,
710
+ "content": "<extra_id_73>",
711
+ "single_word": false,
712
+ "lstrip": false,
713
+ "rstrip": false,
714
+ "normalized": false,
715
+ "special": true
716
+ },
717
+ {
718
+ "id": 587,
719
+ "content": "<extra_id_74>",
720
+ "single_word": false,
721
+ "lstrip": false,
722
+ "rstrip": false,
723
+ "normalized": false,
724
+ "special": true
725
+ },
726
+ {
727
+ "id": 588,
728
+ "content": "<extra_id_75>",
729
+ "single_word": false,
730
+ "lstrip": false,
731
+ "rstrip": false,
732
+ "normalized": false,
733
+ "special": true
734
+ },
735
+ {
736
+ "id": 589,
737
+ "content": "<extra_id_76>",
738
+ "single_word": false,
739
+ "lstrip": false,
740
+ "rstrip": false,
741
+ "normalized": false,
742
+ "special": true
743
+ },
744
+ {
745
+ "id": 590,
746
+ "content": "<extra_id_77>",
747
+ "single_word": false,
748
+ "lstrip": false,
749
+ "rstrip": false,
750
+ "normalized": false,
751
+ "special": true
752
+ },
753
+ {
754
+ "id": 591,
755
+ "content": "<extra_id_78>",
756
+ "single_word": false,
757
+ "lstrip": false,
758
+ "rstrip": false,
759
+ "normalized": false,
760
+ "special": true
761
+ },
762
+ {
763
+ "id": 592,
764
+ "content": "<extra_id_79>",
765
+ "single_word": false,
766
+ "lstrip": false,
767
+ "rstrip": false,
768
+ "normalized": false,
769
+ "special": true
770
+ },
771
+ {
772
+ "id": 593,
773
+ "content": "<extra_id_80>",
774
+ "single_word": false,
775
+ "lstrip": false,
776
+ "rstrip": false,
777
+ "normalized": false,
778
+ "special": true
779
+ },
780
+ {
781
+ "id": 594,
782
+ "content": "<extra_id_81>",
783
+ "single_word": false,
784
+ "lstrip": false,
785
+ "rstrip": false,
786
+ "normalized": false,
787
+ "special": true
788
+ },
789
+ {
790
+ "id": 595,
791
+ "content": "<extra_id_82>",
792
+ "single_word": false,
793
+ "lstrip": false,
794
+ "rstrip": false,
795
+ "normalized": false,
796
+ "special": true
797
+ },
798
+ {
799
+ "id": 596,
800
+ "content": "<extra_id_83>",
801
+ "single_word": false,
802
+ "lstrip": false,
803
+ "rstrip": false,
804
+ "normalized": false,
805
+ "special": true
806
+ },
807
+ {
808
+ "id": 597,
809
+ "content": "<extra_id_84>",
810
+ "single_word": false,
811
+ "lstrip": false,
812
+ "rstrip": false,
813
+ "normalized": false,
814
+ "special": true
815
+ },
816
+ {
817
+ "id": 598,
818
+ "content": "<extra_id_85>",
819
+ "single_word": false,
820
+ "lstrip": false,
821
+ "rstrip": false,
822
+ "normalized": false,
823
+ "special": true
824
+ },
825
+ {
826
+ "id": 599,
827
+ "content": "<extra_id_86>",
828
+ "single_word": false,
829
+ "lstrip": false,
830
+ "rstrip": false,
831
+ "normalized": false,
832
+ "special": true
833
+ },
834
+ {
835
+ "id": 600,
836
+ "content": "<extra_id_87>",
837
+ "single_word": false,
838
+ "lstrip": false,
839
+ "rstrip": false,
840
+ "normalized": false,
841
+ "special": true
842
+ },
843
+ {
844
+ "id": 601,
845
+ "content": "<extra_id_88>",
846
+ "single_word": false,
847
+ "lstrip": false,
848
+ "rstrip": false,
849
+ "normalized": false,
850
+ "special": true
851
+ },
852
+ {
853
+ "id": 602,
854
+ "content": "<extra_id_89>",
855
+ "single_word": false,
856
+ "lstrip": false,
857
+ "rstrip": false,
858
+ "normalized": false,
859
+ "special": true
860
+ },
861
+ {
862
+ "id": 603,
863
+ "content": "<extra_id_90>",
864
+ "single_word": false,
865
+ "lstrip": false,
866
+ "rstrip": false,
867
+ "normalized": false,
868
+ "special": true
869
+ },
870
+ {
871
+ "id": 604,
872
+ "content": "<extra_id_91>",
873
+ "single_word": false,
874
+ "lstrip": false,
875
+ "rstrip": false,
876
+ "normalized": false,
877
+ "special": true
878
+ },
879
+ {
880
+ "id": 605,
881
+ "content": "<extra_id_92>",
882
+ "single_word": false,
883
+ "lstrip": false,
884
+ "rstrip": false,
885
+ "normalized": false,
886
+ "special": true
887
+ },
888
+ {
889
+ "id": 606,
890
+ "content": "<extra_id_93>",
891
+ "single_word": false,
892
+ "lstrip": false,
893
+ "rstrip": false,
894
+ "normalized": false,
895
+ "special": true
896
+ },
897
+ {
898
+ "id": 607,
899
+ "content": "<extra_id_94>",
900
+ "single_word": false,
901
+ "lstrip": false,
902
+ "rstrip": false,
903
+ "normalized": false,
904
+ "special": true
905
+ },
906
+ {
907
+ "id": 608,
908
+ "content": "<extra_id_95>",
909
+ "single_word": false,
910
+ "lstrip": false,
911
+ "rstrip": false,
912
+ "normalized": false,
913
+ "special": true
914
+ },
915
+ {
916
+ "id": 609,
917
+ "content": "<extra_id_96>",
918
+ "single_word": false,
919
+ "lstrip": false,
920
+ "rstrip": false,
921
+ "normalized": false,
922
+ "special": true
923
+ },
924
+ {
925
+ "id": 610,
926
+ "content": "<extra_id_97>",
927
+ "single_word": false,
928
+ "lstrip": false,
929
+ "rstrip": false,
930
+ "normalized": false,
931
+ "special": true
932
+ },
933
+ {
934
+ "id": 611,
935
+ "content": "<extra_id_98>",
936
+ "single_word": false,
937
+ "lstrip": false,
938
+ "rstrip": false,
939
+ "normalized": false,
940
+ "special": true
941
+ },
942
+ {
943
+ "id": 612,
944
+ "content": "<extra_id_99>",
945
+ "single_word": false,
946
+ "lstrip": false,
947
+ "rstrip": false,
948
+ "normalized": false,
949
+ "special": true
950
+ }
951
+ ],
952
+ "normalizer": null,
953
+ "pre_tokenizer": {
954
+ "type": "Sequence",
955
+ "pretokenizers": [
956
+ {
957
+ "type": "WhitespaceSplit"
958
+ },
959
+ {
960
+ "type": "Metaspace",
961
+ "replacement": "▁",
962
+ "prepend_scheme": "always",
963
+ "split": true
964
+ }
965
+ ]
966
+ },
967
+ "post_processor": {
968
+ "type": "TemplateProcessing",
969
+ "single": [
970
+ {
971
+ "Sequence": {
972
+ "id": "A",
973
+ "type_id": 0
974
+ }
975
+ }
976
+ ],
977
+ "pair": [
978
+ {
979
+ "Sequence": {
980
+ "id": "A",
981
+ "type_id": 0
982
+ }
983
+ },
984
+ {
985
+ "Sequence": {
986
+ "id": "B",
987
+ "type_id": 1
988
+ }
989
+ }
990
+ ],
991
+ "special_tokens": {}
992
+ },
993
+ "decoder": {
994
+ "type": "Metaspace",
995
+ "replacement": "▁",
996
+ "prepend_scheme": "always",
997
+ "split": true
998
+ },
999
+ "model": {
1000
+ "type": "Unigram",
1001
+ "unk_id": 3,
1002
+ "vocab": [
1003
+ [
1004
+ "<epsilon>",
1005
+ 0.0
1006
+ ],
1007
+ [
1008
+ "<s>",
1009
+ 0.0
1010
+ ],
1011
+ [
1012
+ "</s>",
1013
+ 0.0
1014
+ ],
1015
+ [
1016
+ "<unk>",
1017
+ 0.0
1018
+ ],
1019
+ [
1020
+ "▁",
1021
+ -3.1446692943573
1022
+ ],
1023
+ [
1024
+ "s",
1025
+ -3.203380823135376
1026
+ ],
1027
+ [
1028
+ ",",
1029
+ -3.58845591545105
1030
+ ],
1031
+ [
1032
+ "▁the",
1033
+ -3.7101337909698486
1034
+ ],
1035
+ [
1036
+ "t",
1037
+ -3.804173231124878
1038
+ ],
1039
+ [
1040
+ ".",
1041
+ -3.901777982711792
1042
+ ],
1043
+ [
1044
+ "e",
1045
+ -3.9562227725982666
1046
+ ],
1047
+ [
1048
+ "a",
1049
+ -4.208385944366455
1050
+ ],
1051
+ [
1052
+ "ed",
1053
+ -4.236613750457764
1054
+ ],
1055
+ [
1056
+ "o",
1057
+ -4.267106533050537
1058
+ ],
1059
+ [
1060
+ "▁a",
1061
+ -4.278589725494385
1062
+ ],
1063
+ [
1064
+ "d",
1065
+ -4.31550931930542
1066
+ ],
1067
+ [
1068
+ "▁of",
1069
+ -4.320993900299072
1070
+ ],
1071
+ [
1072
+ "n",
1073
+ -4.32736349105835
1074
+ ],
1075
+ [
1076
+ "▁to",
1077
+ -4.410154819488525
1078
+ ],
1079
+ [
1080
+ "▁and",
1081
+ -4.412942886352539
1082
+ ],
1083
+ [
1084
+ "y",
1085
+ -4.42034387588501
1086
+ ],
1087
+ [
1088
+ "m",
1089
+ -4.563985347747803
1090
+ ],
1091
+ [
1092
+ "ing",
1093
+ -4.623386859893799
1094
+ ],
1095
+ [
1096
+ "i",
1097
+ -4.663941860198975
1098
+ ],
1099
+ [
1100
+ "▁in",
1101
+ -4.729295253753662
1102
+ ],
1103
+ [
1104
+ "r",
1105
+ -4.746771335601807
1106
+ ],
1107
+ [
1108
+ "ar",
1109
+ -4.864534854888916
1110
+ ],
1111
+ [
1112
+ "p",
1113
+ -4.92025089263916
1114
+ ],
1115
+ [
1116
+ "u",
1117
+ -4.934468746185303
1118
+ ],
1119
+ [
1120
+ "al",
1121
+ -5.0213141441345215
1122
+ ],
1123
+ [
1124
+ "c",
1125
+ -5.054973602294922
1126
+ ],
1127
+ [
1128
+ "er",
1129
+ -5.077834606170654
1130
+ ],
1131
+ [
1132
+ "▁I",
1133
+ -5.0813212394714355
1134
+ ],
1135
+ [
1136
+ "re",
1137
+ -5.087508201599121
1138
+ ],
1139
+ [
1140
+ "'",
1141
+ -5.108129024505615
1142
+ ],
1143
+ [
1144
+ "st",
1145
+ -5.111265659332275
1146
+ ],
1147
+ [
1148
+ "in",
1149
+ -5.128320693969727
1150
+ ],
1151
+ [
1152
+ "▁he",
1153
+ -5.188534259796143
1154
+ ],
1155
+ [
1156
+ "▁\"",
1157
+ -5.191742897033691
1158
+ ],
1159
+ [
1160
+ "f",
1161
+ -5.197833061218262
1162
+ ],
1163
+ [
1164
+ "or",
1165
+ -5.202470779418945
1166
+ ],
1167
+ [
1168
+ "ly",
1169
+ -5.220283031463623
1170
+ ],
1171
+ [
1172
+ "l",
1173
+ -5.239860534667969
1174
+ ],
1175
+ [
1176
+ "g",
1177
+ -5.254385948181152
1178
+ ],
1179
+ [
1180
+ "b",
1181
+ -5.298688888549805
1182
+ ],
1183
+ [
1184
+ "▁was",
1185
+ -5.323605060577393
1186
+ ],
1187
+ [
1188
+ "le",
1189
+ -5.332465648651123
1190
+ ],
1191
+ [
1192
+ "▁f",
1193
+ -5.342121601104736
1194
+ ],
1195
+ [
1196
+ "▁that",
1197
+ -5.370957851409912
1198
+ ],
1199
+ [
1200
+ "▁be",
1201
+ -5.396873950958252
1202
+ ],
1203
+ [
1204
+ "▁w",
1205
+ -5.398232460021973
1206
+ ],
1207
+ [
1208
+ "▁b",
1209
+ -5.408049583435059
1210
+ ],
1211
+ [
1212
+ "k",
1213
+ -5.498411178588867
1214
+ ],
1215
+ [
1216
+ "▁it",
1217
+ -5.498649597167969
1218
+ ],
1219
+ [
1220
+ "▁c",
1221
+ -5.5201802253723145
1222
+ ],
1223
+ [
1224
+ "▁for",
1225
+ -5.558920860290527
1226
+ ],
1227
+ [
1228
+ "on",
1229
+ -5.5722246170043945
1230
+ ],
1231
+ [
1232
+ "▁is",
1233
+ -5.581616401672363
1234
+ ],
1235
+ [
1236
+ "▁re",
1237
+ -5.58840274810791
1238
+ ],
1239
+ [
1240
+ "▁p",
1241
+ -5.6148576736450195
1242
+ ],
1243
+ [
1244
+ "th",
1245
+ -5.620391845703125
1246
+ ],
1247
+ [
1248
+ "ur",
1249
+ -5.627001762390137
1250
+ ],
1251
+ [
1252
+ "w",
1253
+ -5.631758213043213
1254
+ ],
1255
+ [
1256
+ "▁his",
1257
+ -5.649014949798584
1258
+ ],
1259
+ [
1260
+ "▁with",
1261
+ -5.651855945587158
1262
+ ],
1263
+ [
1264
+ "ter",
1265
+ -5.65963077545166
1266
+ ],
1267
+ [
1268
+ "ce",
1269
+ -5.678774356842041
1270
+ ],
1271
+ [
1272
+ "an",
1273
+ -5.687518119812012
1274
+ ],
1275
+ [
1276
+ "ri",
1277
+ -5.712653636932373
1278
+ ],
1279
+ [
1280
+ "▁you",
1281
+ -5.749940395355225
1282
+ ],
1283
+ [
1284
+ "h",
1285
+ -5.7766032218933105
1286
+ ],
1287
+ [
1288
+ "es",
1289
+ -5.78245735168457
1290
+ ],
1291
+ [
1292
+ "▁me",
1293
+ -5.794474124908447
1294
+ ],
1295
+ [
1296
+ "it",
1297
+ -5.82189416885376
1298
+ ],
1299
+ [
1300
+ "ro",
1301
+ -5.838681221008301
1302
+ ],
1303
+ [
1304
+ "ent",
1305
+ -5.841847896575928
1306
+ ],
1307
+ [
1308
+ "v",
1309
+ -5.853638648986816
1310
+ ],
1311
+ [
1312
+ "▁had",
1313
+ -5.862800121307373
1314
+ ],
1315
+ [
1316
+ "▁The",
1317
+ -5.867185115814209
1318
+ ],
1319
+ [
1320
+ "en",
1321
+ -5.879556655883789
1322
+ ],
1323
+ [
1324
+ "▁as",
1325
+ -5.892141819000244
1326
+ ],
1327
+ [
1328
+ "▁de",
1329
+ -5.9042229652404785
1330
+ ],
1331
+ [
1332
+ "nd",
1333
+ -5.907679080963135
1334
+ ],
1335
+ [
1336
+ "▁her",
1337
+ -5.914851665496826
1338
+ ],
1339
+ [
1340
+ "ic",
1341
+ -5.9341912269592285
1342
+ ],
1343
+ [
1344
+ "▁not",
1345
+ -5.934748649597168
1346
+ ],
1347
+ [
1348
+ "se",
1349
+ -5.941751480102539
1350
+ ],
1351
+ [
1352
+ ";",
1353
+ -5.961045265197754
1354
+ ],
1355
+ [
1356
+ "te",
1357
+ -5.971425533294678
1358
+ ],
1359
+ [
1360
+ "▁e",
1361
+ -6.0015764236450195
1362
+ ],
1363
+ [
1364
+ "ch",
1365
+ -6.004841327667236
1366
+ ],
1367
+ [
1368
+ "ve",
1369
+ -6.012419700622559
1370
+ ],
1371
+ [
1372
+ "ne",
1373
+ -6.013899803161621
1374
+ ],
1375
+ [
1376
+ "▁A",
1377
+ -6.0221428871154785
1378
+ ],
1379
+ [
1380
+ "▁on",
1381
+ -6.028809070587158
1382
+ ],
1383
+ [
1384
+ "il",
1385
+ -6.041737079620361
1386
+ ],
1387
+ [
1388
+ "is",
1389
+ -6.04183292388916
1390
+ ],
1391
+ [
1392
+ "▁so",
1393
+ -6.059542179107666
1394
+ ],
1395
+ [
1396
+ "▁S",
1397
+ -6.070916652679443
1398
+ ],
1399
+ [
1400
+ "at",
1401
+ -6.07675838470459
1402
+ ],
1403
+ [
1404
+ "la",
1405
+ -6.0870466232299805
1406
+ ],
1407
+ [
1408
+ "ad",
1409
+ -6.092111110687256
1410
+ ],
1411
+ [
1412
+ "▁at",
1413
+ -6.0932087898254395
1414
+ ],
1415
+ [
1416
+ "ir",
1417
+ -6.123541355133057
1418
+ ],
1419
+ [
1420
+ "▁do",
1421
+ -6.126033782958984
1422
+ ],
1423
+ [
1424
+ "ng",
1425
+ -6.177332401275635
1426
+ ],
1427
+ [
1428
+ "▁g",
1429
+ -6.208189487457275
1430
+ ],
1431
+ [
1432
+ "}",
1433
+ -6.218713760375977
1434
+ ],
1435
+ [
1436
+ "ra",
1437
+ -6.221874237060547
1438
+ ],
1439
+ [
1440
+ "▁{",
1441
+ -6.222105979919434
1442
+ ],
1443
+ [
1444
+ "▁mo",
1445
+ -6.245700359344482
1446
+ ],
1447
+ [
1448
+ ".\"",
1449
+ -6.260274410247803
1450
+ ],
1451
+ [
1452
+ "ver",
1453
+ -6.260942459106445
1454
+ ],
1455
+ [
1456
+ "▁ma",
1457
+ -6.267685890197754
1458
+ ],
1459
+ [
1460
+ "▁she",
1461
+ -6.298584938049316
1462
+ ],
1463
+ [
1464
+ "▁con",
1465
+ -6.302234649658203
1466
+ ],
1467
+ [
1468
+ "▁have",
1469
+ -6.305024147033691
1470
+ ],
1471
+ [
1472
+ "▁no",
1473
+ -6.305781364440918
1474
+ ],
1475
+ [
1476
+ "I",
1477
+ -6.324380397796631
1478
+ ],
1479
+ [
1480
+ "▁him",
1481
+ -6.327845573425293
1482
+ ],
1483
+ [
1484
+ "H",
1485
+ -6.332118034362793
1486
+ ],
1487
+ [
1488
+ "el",
1489
+ -6.335691928863525
1490
+ ],
1491
+ [
1492
+ "ll",
1493
+ -6.3703484535217285
1494
+ ],
1495
+ [
1496
+ "ation",
1497
+ -6.3807830810546875
1498
+ ],
1499
+ [
1500
+ "▁fa",
1501
+ -6.381678581237793
1502
+ ],
1503
+ [
1504
+ "▁th",
1505
+ -6.384618282318115
1506
+ ],
1507
+ [
1508
+ "▁su",
1509
+ -6.388561248779297
1510
+ ],
1511
+ [
1512
+ "▁but",
1513
+ -6.402822971343994
1514
+ ],
1515
+ [
1516
+ "lo",
1517
+ -6.411969184875488
1518
+ ],
1519
+ [
1520
+ "li",
1521
+ -6.413236141204834
1522
+ ],
1523
+ [
1524
+ "ther",
1525
+ -6.416365623474121
1526
+ ],
1527
+ [
1528
+ "▁by",
1529
+ -6.421297073364258
1530
+ ],
1531
+ [
1532
+ "▁C",
1533
+ -6.428677558898926
1534
+ ],
1535
+ [
1536
+ "▁which",
1537
+ -6.430390357971191
1538
+ ],
1539
+ [
1540
+ "▁all",
1541
+ -6.434648513793945
1542
+ ],
1543
+ [
1544
+ "id",
1545
+ -6.451933860778809
1546
+ ],
1547
+ [
1548
+ "▁se",
1549
+ -6.453425884246826
1550
+ ],
1551
+ [
1552
+ "▁from",
1553
+ -6.4639363288879395
1554
+ ],
1555
+ [
1556
+ "▁la",
1557
+ -6.464136123657227
1558
+ ],
1559
+ [
1560
+ "▁ex",
1561
+ -6.46722412109375
1562
+ ],
1563
+ [
1564
+ "▁or",
1565
+ -6.478571891784668
1566
+ ],
1567
+ [
1568
+ "▁B",
1569
+ -6.484975337982178
1570
+ ],
1571
+ [
1572
+ "▁are",
1573
+ -6.488126277923584
1574
+ ],
1575
+ [
1576
+ "▁M",
1577
+ -6.489441871643066
1578
+ ],
1579
+ [
1580
+ "▁He",
1581
+ -6.494318008422852
1582
+ ],
1583
+ [
1584
+ "R",
1585
+ -6.496219158172607
1586
+ ],
1587
+ [
1588
+ "▁my",
1589
+ -6.501786708831787
1590
+ ],
1591
+ [
1592
+ "ul",
1593
+ -6.503665447235107
1594
+ ],
1595
+ [
1596
+ "un",
1597
+ -6.507981300354004
1598
+ ],
1599
+ [
1600
+ "▁this",
1601
+ -6.509151458740234
1602
+ ],
1603
+ [
1604
+ "▁we",
1605
+ -6.509461402893066
1606
+ ],
1607
+ [
1608
+ "▁were",
1609
+ -6.515420913696289
1610
+ ],
1611
+ [
1612
+ ",\"",
1613
+ -6.516303539276123
1614
+ ],
1615
+ [
1616
+ "ck",
1617
+ -6.536041736602783
1618
+ ],
1619
+ [
1620
+ "▁who",
1621
+ -6.560507297515869
1622
+ ],
1623
+ [
1624
+ "▁sh",
1625
+ -6.560885429382324
1626
+ ],
1627
+ [
1628
+ "▁[",
1629
+ -6.566647529602051
1630
+ ],
1631
+ [
1632
+ "ow",
1633
+ -6.567778587341309
1634
+ ],
1635
+ [
1636
+ "▁said",
1637
+ -6.572078227996826
1638
+ ],
1639
+ [
1640
+ "▁P",
1641
+ -6.572185516357422
1642
+ ],
1643
+ [
1644
+ "D",
1645
+ -6.575502872467041
1646
+ ],
1647
+ [
1648
+ "et",
1649
+ -6.59080696105957
1650
+ ],
1651
+ [
1652
+ "ion",
1653
+ -6.602999687194824
1654
+ ],
1655
+ [
1656
+ "▁L",
1657
+ -6.604433536529541
1658
+ ],
1659
+ [
1660
+ "ant",
1661
+ -6.60852575302124
1662
+ ],
1663
+ [
1664
+ "ment",
1665
+ -6.609012603759766
1666
+ ],
1667
+ [
1668
+ "▁W",
1669
+ -6.60936975479126
1670
+ ],
1671
+ [
1672
+ "▁po",
1673
+ -6.6191205978393555
1674
+ ],
1675
+ [
1676
+ "am",
1677
+ -6.623525142669678
1678
+ ],
1679
+ [
1680
+ "vi",
1681
+ -6.627021789550781
1682
+ ],
1683
+ [
1684
+ "▁]",
1685
+ -6.630141258239746
1686
+ ],
1687
+ [
1688
+ "▁one",
1689
+ -6.639581203460693
1690
+ ],
1691
+ [
1692
+ "x",
1693
+ -6.648676872253418
1694
+ ],
1695
+ [
1696
+ "ct",
1697
+ -6.654047012329102
1698
+ ],
1699
+ [
1700
+ "▁an",
1701
+ -6.659359931945801
1702
+ ],
1703
+ [
1704
+ "period",
1705
+ -6.661555290222168
1706
+ ],
1707
+ [
1708
+ "us",
1709
+ -6.667537689208984
1710
+ ],
1711
+ [
1712
+ "pp",
1713
+ -6.67457389831543
1714
+ ],
1715
+ [
1716
+ "im",
1717
+ -6.682270526885986
1718
+ ],
1719
+ [
1720
+ "▁man",
1721
+ -6.685298442840576
1722
+ ],
1723
+ [
1724
+ "▁pro",
1725
+ -6.695033073425293
1726
+ ],
1727
+ [
1728
+ "ut",
1729
+ -6.69868803024292
1730
+ ],
1731
+ [
1732
+ "▁sp",
1733
+ -6.702606201171875
1734
+ ],
1735
+ [
1736
+ "▁ho",
1737
+ -6.7108588218688965
1738
+ ],
1739
+ [
1740
+ "▁le",
1741
+ -6.717572212219238
1742
+ ],
1743
+ [
1744
+ "▁ca",
1745
+ -6.721408367156982
1746
+ ],
1747
+ [
1748
+ "j",
1749
+ -6.72599983215332
1750
+ ],
1751
+ [
1752
+ "ough",
1753
+ -6.729132175445557
1754
+ ],
1755
+ [
1756
+ "▁go",
1757
+ -6.737214088439941
1758
+ ],
1759
+ [
1760
+ "ge",
1761
+ -6.741745471954346
1762
+ ],
1763
+ [
1764
+ "▁ha",
1765
+ -6.7515549659729
1766
+ ],
1767
+ [
1768
+ "▁F",
1769
+ -6.754391670227051
1770
+ ],
1771
+ [
1772
+ "▁mi",
1773
+ -6.762367248535156
1774
+ ],
1775
+ [
1776
+ "ound",
1777
+ -6.773167610168457
1778
+ ],
1779
+ [
1780
+ "▁they",
1781
+ -6.787041664123535
1782
+ ],
1783
+ [
1784
+ "▁would",
1785
+ -6.787123203277588
1786
+ ],
1787
+ [
1788
+ "hi",
1789
+ -6.79250955581665
1790
+ ],
1791
+ [
1792
+ "ke",
1793
+ -6.795114040374756
1794
+ ],
1795
+ [
1796
+ "ive",
1797
+ -6.7967634201049805
1798
+ ],
1799
+ [
1800
+ "ate",
1801
+ -6.804977893829346
1802
+ ],
1803
+ [
1804
+ "▁T",
1805
+ -6.80813455581665
1806
+ ],
1807
+ [
1808
+ "z",
1809
+ -6.812094211578369
1810
+ ],
1811
+ [
1812
+ "per",
1813
+ -6.8176069259643555
1814
+ ],
1815
+ [
1816
+ "▁sa",
1817
+ -6.819145679473877
1818
+ ],
1819
+ [
1820
+ "▁out",
1821
+ -6.826883316040039
1822
+ ],
1823
+ [
1824
+ "ol",
1825
+ -6.833821773529053
1826
+ ],
1827
+ [
1828
+ "▁up",
1829
+ -6.834559440612793
1830
+ ],
1831
+ [
1832
+ "co",
1833
+ -6.844675540924072
1834
+ ],
1835
+ [
1836
+ "▁pa",
1837
+ -6.855184078216553
1838
+ ],
1839
+ [
1840
+ "A",
1841
+ -6.858541965484619
1842
+ ],
1843
+ [
1844
+ "old",
1845
+ -6.860659599304199
1846
+ ],
1847
+ [
1848
+ "!",
1849
+ -6.876157760620117
1850
+ ],
1851
+ [
1852
+ "▁dis",
1853
+ -6.8776350021362305
1854
+ ],
1855
+ [
1856
+ "▁see",
1857
+ -6.881742000579834
1858
+ ],
1859
+ [
1860
+ "ry",
1861
+ -6.883233547210693
1862
+ ],
1863
+ [
1864
+ "ff",
1865
+ -6.894794940948486
1866
+ ],
1867
+ [
1868
+ "N",
1869
+ -6.899501800537109
1870
+ ],
1871
+ [
1872
+ "▁un",
1873
+ -6.9004364013671875
1874
+ ],
1875
+ [
1876
+ "▁co",
1877
+ -6.9032673835754395
1878
+ ],
1879
+ [
1880
+ "▁O",
1881
+ -6.907948017120361
1882
+ ],
1883
+ [
1884
+ "▁been",
1885
+ -6.916658878326416
1886
+ ],
1887
+ [
1888
+ "ity",
1889
+ -6.9181389808654785
1890
+ ],
1891
+ [
1892
+ "he",
1893
+ -6.921543121337891
1894
+ ],
1895
+ [
1896
+ "▁di",
1897
+ -6.923122882843018
1898
+ ],
1899
+ [
1900
+ "lu",
1901
+ -6.931999206542969
1902
+ ],
1903
+ [
1904
+ "▁there",
1905
+ -6.934426784515381
1906
+ ],
1907
+ [
1908
+ "▁their",
1909
+ -6.934463977813721
1910
+ ],
1911
+ [
1912
+ "der",
1913
+ -6.935543537139893
1914
+ ],
1915
+ [
1916
+ "est",
1917
+ -6.940905570983887
1918
+ ],
1919
+ [
1920
+ "E",
1921
+ -6.9548492431640625
1922
+ ],
1923
+ [
1924
+ "▁will",
1925
+ -6.958393096923828
1926
+ ],
1927
+ [
1928
+ "ight",
1929
+ -6.965392112731934
1930
+ ],
1931
+ [
1932
+ "_",
1933
+ -6.966725826263428
1934
+ ],
1935
+ [
1936
+ "mp",
1937
+ -6.967768669128418
1938
+ ],
1939
+ [
1940
+ "▁fi",
1941
+ -6.972559452056885
1942
+ ],
1943
+ [
1944
+ "ish",
1945
+ -6.979668617248535
1946
+ ],
1947
+ [
1948
+ "ance",
1949
+ -6.982175827026367
1950
+ ],
1951
+ [
1952
+ "ci",
1953
+ -6.984276294708252
1954
+ ],
1955
+ [
1956
+ "▁E",
1957
+ -6.989256381988525
1958
+ ],
1959
+ [
1960
+ "▁tr",
1961
+ -6.989500999450684
1962
+ ],
1963
+ [
1964
+ "▁G",
1965
+ -6.999267578125
1966
+ ],
1967
+ [
1968
+ "▁li",
1969
+ -7.00178861618042
1970
+ ],
1971
+ [
1972
+ "pe",
1973
+ -7.007822513580322
1974
+ ],
1975
+ [
1976
+ "▁bo",
1977
+ -7.010932922363281
1978
+ ],
1979
+ [
1980
+ "▁No",
1981
+ -7.014448642730713
1982
+ ],
1983
+ [
1984
+ "1",
1985
+ -7.014896392822266
1986
+ ],
1987
+ [
1988
+ "qu",
1989
+ -7.022171974182129
1990
+ ],
1991
+ [
1992
+ "ill",
1993
+ -7.023817539215088
1994
+ ],
1995
+ [
1996
+ "ard",
1997
+ -7.024126052856445
1998
+ ],
1999
+ [
2000
+ "?",
2001
+ -7.025038242340088
2002
+ ],
2003
+ [
2004
+ "able",
2005
+ -7.033109188079834
2006
+ ],
2007
+ [
2008
+ "▁when",
2009
+ -7.038402080535889
2010
+ ],
2011
+ [
2012
+ "ten",
2013
+ -7.03859806060791
2014
+ ],
2015
+ [
2016
+ "age",
2017
+ -7.041808605194092
2018
+ ],
2019
+ [
2020
+ "?\"",
2021
+ -7.047811508178711
2022
+ ],
2023
+ [
2024
+ "▁en",
2025
+ -7.050681114196777
2026
+ ],
2027
+ [
2028
+ "ous",
2029
+ -7.060575008392334
2030
+ ],
2031
+ [
2032
+ "tra",
2033
+ -7.063107490539551
2034
+ ],
2035
+ [
2036
+ "ence",
2037
+ -7.072290420532227
2038
+ ],
2039
+ [
2040
+ "ect",
2041
+ -7.075937271118164
2042
+ ],
2043
+ [
2044
+ "J",
2045
+ -7.077571868896484
2046
+ ],
2047
+ [
2048
+ "▁some",
2049
+ -7.081721782684326
2050
+ ],
2051
+ [
2052
+ "▁them",
2053
+ -7.1001973152160645
2054
+ ],
2055
+ [
2056
+ "▁ne",
2057
+ -7.104800701141357
2058
+ ],
2059
+ [
2060
+ "▁could",
2061
+ -7.107924938201904
2062
+ ],
2063
+ [
2064
+ "▁can",
2065
+ -7.113558292388916
2066
+ ],
2067
+ [
2068
+ "▁if",
2069
+ -7.1193528175354
2070
+ ],
2071
+ [
2072
+ "▁what",
2073
+ -7.127973556518555
2074
+ ],
2075
+ [
2076
+ "▁know",
2077
+ -7.130826473236084
2078
+ ],
2079
+ [
2080
+ "ful",
2081
+ -7.136860370635986
2082
+ ],
2083
+ [
2084
+ "O",
2085
+ -7.163638114929199
2086
+ ],
2087
+ [
2088
+ "ru",
2089
+ -7.164709091186523
2090
+ ],
2091
+ [
2092
+ "ell",
2093
+ -7.16968297958374
2094
+ ],
2095
+ [
2096
+ "▁sta",
2097
+ -7.1711201667785645
2098
+ ],
2099
+ [
2100
+ "▁time",
2101
+ -7.173023700714111
2102
+ ],
2103
+ [
2104
+ "▁any",
2105
+ -7.18028450012207
2106
+ ],
2107
+ [
2108
+ "▁ra",
2109
+ -7.186168193817139
2110
+ ],
2111
+ [
2112
+ "▁more",
2113
+ -7.186279296875
2114
+ ],
2115
+ [
2116
+ "▁into",
2117
+ -7.190565586090088
2118
+ ],
2119
+ [
2120
+ "ome",
2121
+ -7.193604469299316
2122
+ ],
2123
+ [
2124
+ "T",
2125
+ -7.196429252624512
2126
+ ],
2127
+ [
2128
+ "▁other",
2129
+ -7.204713344573975
2130
+ ],
2131
+ [
2132
+ ":",
2133
+ -7.209097862243652
2134
+ ],
2135
+ [
2136
+ "ies",
2137
+ -7.218936920166016
2138
+ ],
2139
+ [
2140
+ "▁your",
2141
+ -7.223606109619141
2142
+ ],
2143
+ [
2144
+ "▁And",
2145
+ -7.229339122772217
2146
+ ],
2147
+ [
2148
+ "▁ye",
2149
+ -7.232705116271973
2150
+ ],
2151
+ [
2152
+ "S",
2153
+ -7.234437942504883
2154
+ ],
2155
+ [
2156
+ "▁like",
2157
+ -7.235995769500732
2158
+ ],
2159
+ [
2160
+ "ness",
2161
+ -7.239752292633057
2162
+ ],
2163
+ [
2164
+ "▁dr",
2165
+ -7.25142765045166
2166
+ ],
2167
+ [
2168
+ "low",
2169
+ -7.2691826820373535
2170
+ ],
2171
+ [
2172
+ "▁It",
2173
+ -7.270310878753662
2174
+ ],
2175
+ [
2176
+ "▁sto",
2177
+ -7.2738118171691895
2178
+ ],
2179
+ [
2180
+ "▁us",
2181
+ -7.2769670486450195
2182
+ ],
2183
+ [
2184
+ "▁But",
2185
+ -7.279003620147705
2186
+ ],
2187
+ [
2188
+ "▁pre",
2189
+ -7.3001484870910645
2190
+ ],
2191
+ [
2192
+ "mb",
2193
+ -7.302000522613525
2194
+ ],
2195
+ [
2196
+ "side",
2197
+ -7.3103156089782715
2198
+ ],
2199
+ [
2200
+ "▁has",
2201
+ -7.317553520202637
2202
+ ],
2203
+ [
2204
+ "row",
2205
+ -7.317798137664795
2206
+ ],
2207
+ [
2208
+ "▁There",
2209
+ -7.321875095367432
2210
+ ],
2211
+ [
2212
+ "cu",
2213
+ -7.324193000793457
2214
+ ],
2215
+ [
2216
+ "▁very",
2217
+ -7.333028793334961
2218
+ ],
2219
+ [
2220
+ "▁than",
2221
+ -7.334202289581299
2222
+ ],
2223
+ [
2224
+ "▁lo",
2225
+ -7.334221363067627
2226
+ ],
2227
+ [
2228
+ "▁did",
2229
+ -7.338522911071777
2230
+ ],
2231
+ [
2232
+ "ach",
2233
+ -7.3409504890441895
2234
+ ],
2235
+ [
2236
+ "▁about",
2237
+ -7.341108322143555
2238
+ ],
2239
+ [
2240
+ "▁day",
2241
+ -7.3574066162109375
2242
+ ],
2243
+ [
2244
+ "▁over",
2245
+ -7.358343601226807
2246
+ ],
2247
+ [
2248
+ "▁look",
2249
+ -7.359866142272949
2250
+ ],
2251
+ [
2252
+ "-",
2253
+ -7.369490146636963
2254
+ ],
2255
+ [
2256
+ "tion",
2257
+ -7.372918605804443
2258
+ ],
2259
+ [
2260
+ "ture",
2261
+ -7.383158206939697
2262
+ ],
2263
+ [
2264
+ "▁Mr",
2265
+ -7.389575958251953
2266
+ ],
2267
+ [
2268
+ "ph",
2269
+ -7.394842147827148
2270
+ ],
2271
+ [
2272
+ "▁little",
2273
+ -7.395269393920898
2274
+ ],
2275
+ [
2276
+ "ho",
2277
+ -7.403622627258301
2278
+ ],
2279
+ [
2280
+ "▁again",
2281
+ -7.425952911376953
2282
+ ],
2283
+ [
2284
+ "ction",
2285
+ -7.430576801300049
2286
+ ],
2287
+ [
2288
+ "ig",
2289
+ -7.438838958740234
2290
+ ],
2291
+ [
2292
+ "▁hand",
2293
+ -7.44147253036499
2294
+ ],
2295
+ [
2296
+ "▁now",
2297
+ -7.445526123046875
2298
+ ],
2299
+ [
2300
+ "qui",
2301
+ -7.446432590484619
2302
+ ],
2303
+ [
2304
+ "▁sc",
2305
+ -7.450597763061523
2306
+ ],
2307
+ [
2308
+ "▁should",
2309
+ -7.453698635101318
2310
+ ],
2311
+ [
2312
+ "▁great",
2313
+ -7.463414669036865
2314
+ ],
2315
+ [
2316
+ "▁two",
2317
+ -7.470479965209961
2318
+ ],
2319
+ [
2320
+ "!\"",
2321
+ -7.471007347106934
2322
+ ],
2323
+ [
2324
+ "▁right",
2325
+ -7.472324371337891
2326
+ ],
2327
+ [
2328
+ "ious",
2329
+ -7.481609344482422
2330
+ ],
2331
+ [
2332
+ "man",
2333
+ -7.48414945602417
2334
+ ],
2335
+ [
2336
+ "—",
2337
+ -7.484794616699219
2338
+ ],
2339
+ [
2340
+ "▁our",
2341
+ -7.485799789428711
2342
+ ],
2343
+ [
2344
+ "You",
2345
+ -7.504610538482666
2346
+ ],
2347
+ [
2348
+ "▁say",
2349
+ -7.508391380310059
2350
+ ],
2351
+ [
2352
+ "▁upon",
2353
+ -7.5086517333984375
2354
+ ],
2355
+ [
2356
+ "▁hu",
2357
+ -7.517370223999023
2358
+ ],
2359
+ [
2360
+ "▁comp",
2361
+ -7.519069194793701
2362
+ ],
2363
+ [
2364
+ "ress",
2365
+ -7.519094467163086
2366
+ ],
2367
+ [
2368
+ "▁only",
2369
+ -7.524586200714111
2370
+ ],
2371
+ [
2372
+ "▁She",
2373
+ -7.52614164352417
2374
+ ],
2375
+ [
2376
+ "less",
2377
+ -7.530499458312988
2378
+ ],
2379
+ [
2380
+ "ated",
2381
+ -7.53152322769165
2382
+ ],
2383
+ [
2384
+ "2",
2385
+ -7.5379862785339355
2386
+ ],
2387
+ [
2388
+ "▁left",
2389
+ -7.551514625549316
2390
+ ],
2391
+ [
2392
+ "▁down",
2393
+ -7.5532917976379395
2394
+ ],
2395
+ [
2396
+ "▁ga",
2397
+ -7.558096885681152
2398
+ ],
2399
+ [
2400
+ "0",
2401
+ -7.565780162811279
2402
+ ],
2403
+ [
2404
+ "▁da",
2405
+ -7.566195487976074
2406
+ ],
2407
+ [
2408
+ "▁after",
2409
+ -7.572922706604004
2410
+ ],
2411
+ [
2412
+ "▁made",
2413
+ -7.585012912750244
2414
+ ],
2415
+ [
2416
+ "tain",
2417
+ -7.588871002197266
2418
+ ],
2419
+ [
2420
+ "ick",
2421
+ -7.591251850128174
2422
+ ],
2423
+ [
2424
+ "new",
2425
+ -7.592978000640869
2426
+ ],
2427
+ [
2428
+ "▁com",
2429
+ -7.594455718994141
2430
+ ],
2431
+ [
2432
+ "ving",
2433
+ -7.599806308746338
2434
+ ],
2435
+ [
2436
+ "▁Ma",
2437
+ -7.607027053833008
2438
+ ],
2439
+ [
2440
+ "ward",
2441
+ -7.620022296905518
2442
+ ],
2443
+ [
2444
+ "▁before",
2445
+ -7.6242265701293945
2446
+ ],
2447
+ [
2448
+ "W",
2449
+ -7.633222579956055
2450
+ ],
2451
+ [
2452
+ "U",
2453
+ -7.636125087738037
2454
+ ],
2455
+ [
2456
+ "ven",
2457
+ -7.636752605438232
2458
+ ],
2459
+ [
2460
+ "▁good",
2461
+ -7.638261795043945
2462
+ ],
2463
+ [
2464
+ "ign",
2465
+ -7.644953727722168
2466
+ ],
2467
+ [
2468
+ "tru",
2469
+ -7.648081302642822
2470
+ ],
2471
+ [
2472
+ "▁cha",
2473
+ -7.657571315765381
2474
+ ],
2475
+ [
2476
+ "▁long",
2477
+ -7.658087253570557
2478
+ ],
2479
+ [
2480
+ "▁how",
2481
+ -7.661345958709717
2482
+ ],
2483
+ [
2484
+ "Y",
2485
+ -7.661816120147705
2486
+ ],
2487
+ [
2488
+ "paragraph",
2489
+ -7.664102554321289
2490
+ ],
2491
+ [
2492
+ "▁come",
2493
+ -7.672017574310303
2494
+ ],
2495
+ [
2496
+ "▁part",
2497
+ -7.674316883087158
2498
+ ],
2499
+ [
2500
+ "V",
2501
+ -7.675340175628662
2502
+ ],
2503
+ [
2504
+ "▁ob",
2505
+ -7.680867671966553
2506
+ ],
2507
+ [
2508
+ "▁thing",
2509
+ -7.68093729019165
2510
+ ],
2511
+ [
2512
+ "▁must",
2513
+ -7.683284759521484
2514
+ ],
2515
+ [
2516
+ "ha",
2517
+ -7.684486389160156
2518
+ ],
2519
+ [
2520
+ "▁even",
2521
+ -7.699027061462402
2522
+ ],
2523
+ [
2524
+ "▁way",
2525
+ -7.6992669105529785
2526
+ ],
2527
+ [
2528
+ "▁take",
2529
+ -7.7000508308410645
2530
+ ],
2531
+ [
2532
+ "K",
2533
+ -7.707818984985352
2534
+ ],
2535
+ [
2536
+ "▁back",
2537
+ -7.712675094604492
2538
+ ],
2539
+ [
2540
+ "▁under",
2541
+ -7.713348865509033
2542
+ ],
2543
+ [
2544
+ "▁came",
2545
+ -7.716226577758789
2546
+ ],
2547
+ [
2548
+ "L",
2549
+ -7.728263854980469
2550
+ ],
2551
+ [
2552
+ "▁well",
2553
+ -7.731564521789551
2554
+ ],
2555
+ [
2556
+ "▁think",
2557
+ -7.732664108276367
2558
+ ],
2559
+ [
2560
+ "▁never",
2561
+ -7.760746479034424
2562
+ ],
2563
+ [
2564
+ "▁much",
2565
+ -7.763637542724609
2566
+ ],
2567
+ [
2568
+ "▁gra",
2569
+ -7.766099452972412
2570
+ ],
2571
+ [
2572
+ "▁first",
2573
+ -7.774232387542725
2574
+ ],
2575
+ [
2576
+ "▁every",
2577
+ -7.776756286621094
2578
+ ],
2579
+ [
2580
+ "ugh",
2581
+ -7.790675640106201
2582
+ ],
2583
+ [
2584
+ "▁such",
2585
+ -7.791811466217041
2586
+ ],
2587
+ [
2588
+ "▁where",
2589
+ -7.792065620422363
2590
+ ],
2591
+ [
2592
+ "land",
2593
+ -7.801862716674805
2594
+ ],
2595
+ [
2596
+ "▁Ch",
2597
+ -7.81598424911499
2598
+ ],
2599
+ [
2600
+ "▁imp",
2601
+ -7.82216739654541
2602
+ ],
2603
+ [
2604
+ "▁through",
2605
+ -7.82563591003418
2606
+ ],
2607
+ [
2608
+ "▁own",
2609
+ -7.836172103881836
2610
+ ],
2611
+ [
2612
+ "M",
2613
+ -7.846076011657715
2614
+ ],
2615
+ [
2616
+ "▁make",
2617
+ -7.847618579864502
2618
+ ],
2619
+ [
2620
+ "ook",
2621
+ -7.852067947387695
2622
+ ],
2623
+ [
2624
+ "3",
2625
+ -7.856833457946777
2626
+ ],
2627
+ [
2628
+ "use",
2629
+ -7.864173412322998
2630
+ ],
2631
+ [
2632
+ "C",
2633
+ -7.868447780609131
2634
+ ],
2635
+ [
2636
+ "▁place",
2637
+ -7.8706769943237305
2638
+ ],
2639
+ [
2640
+ "ition",
2641
+ -7.872597694396973
2642
+ ],
2643
+ [
2644
+ "serv",
2645
+ -7.8729166984558105
2646
+ ],
2647
+ [
2648
+ "pri",
2649
+ -7.888969421386719
2650
+ ],
2651
+ [
2652
+ "▁Th",
2653
+ -7.891221046447754
2654
+ ],
2655
+ [
2656
+ "▁give",
2657
+ -7.896949291229248
2658
+ ],
2659
+ [
2660
+ "▁just",
2661
+ -7.907407283782959
2662
+ ],
2663
+ [
2664
+ "5",
2665
+ -7.91018009185791
2666
+ ],
2667
+ [
2668
+ "ible",
2669
+ -7.912111759185791
2670
+ ],
2671
+ [
2672
+ "▁himself",
2673
+ -7.912140846252441
2674
+ ],
2675
+ [
2676
+ "▁might",
2677
+ -7.9202799797058105
2678
+ ],
2679
+ [
2680
+ "4",
2681
+ -7.932826995849609
2682
+ ],
2683
+ [
2684
+ "▁sw",
2685
+ -7.935232639312744
2686
+ ],
2687
+ [
2688
+ "▁life",
2689
+ -7.939643859863281
2690
+ ],
2691
+ [
2692
+ "▁without",
2693
+ -7.945864200592041
2694
+ ],
2695
+ [
2696
+ "▁get",
2697
+ -7.974736213684082
2698
+ ],
2699
+ [
2700
+ "▁work",
2701
+ -7.981810092926025
2702
+ ],
2703
+ [
2704
+ "▁du",
2705
+ -7.989681243896484
2706
+ ],
2707
+ [
2708
+ "▁pass",
2709
+ -7.998128414154053
2710
+ ],
2711
+ [
2712
+ "▁appear",
2713
+ -7.999986171722412
2714
+ ],
2715
+ [
2716
+ "▁house",
2717
+ -8.005838394165039
2718
+ ],
2719
+ [
2720
+ "What",
2721
+ -8.007867813110352
2722
+ ],
2723
+ [
2724
+ "▁away",
2725
+ -8.007869720458984
2726
+ ],
2727
+ [
2728
+ "▁love",
2729
+ -8.025405883789062
2730
+ ],
2731
+ [
2732
+ "▁call",
2733
+ -8.0332670211792
2734
+ ],
2735
+ [
2736
+ "line",
2737
+ -8.03477668762207
2738
+ ],
2739
+ [
2740
+ "▁turn",
2741
+ -8.039846420288086
2742
+ ],
2743
+ [
2744
+ "▁shall",
2745
+ -8.04392147064209
2746
+ ],
2747
+ [
2748
+ "▁This",
2749
+ -8.048504829406738
2750
+ ],
2751
+ [
2752
+ "▁mu",
2753
+ -8.054326057434082
2754
+ ],
2755
+ [
2756
+ "\"",
2757
+ -8.055206298828125
2758
+ ],
2759
+ [
2760
+ "▁those",
2761
+ -8.07278060913086
2762
+ ],
2763
+ [
2764
+ "▁night",
2765
+ -8.08027458190918
2766
+ ],
2767
+ [
2768
+ "The",
2769
+ -8.095630645751953
2770
+ ],
2771
+ [
2772
+ "port",
2773
+ -8.105117797851562
2774
+ ],
2775
+ [
2776
+ "▁word",
2777
+ -8.1146240234375
2778
+ ],
2779
+ [
2780
+ "B",
2781
+ -8.122001647949219
2782
+ ],
2783
+ [
2784
+ "P",
2785
+ -8.130742073059082
2786
+ ],
2787
+ [
2788
+ "*",
2789
+ -8.130934715270996
2790
+ ],
2791
+ [
2792
+ "▁heart",
2793
+ -8.131942749023438
2794
+ ],
2795
+ [
2796
+ "▁still",
2797
+ -8.140876770019531
2798
+ ],
2799
+ [
2800
+ "▁next",
2801
+ -8.142328262329102
2802
+ ],
2803
+ [
2804
+ "▁tell",
2805
+ -8.165434837341309
2806
+ ],
2807
+ [
2808
+ "▁room",
2809
+ -8.168549537658691
2810
+ ],
2811
+ [
2812
+ "8",
2813
+ -8.179108619689941
2814
+ ],
2815
+ [
2816
+ "6",
2817
+ -8.192533493041992
2818
+ ],
2819
+ [
2820
+ "▁three",
2821
+ -8.194826126098633
2822
+ ],
2823
+ [
2824
+ "▁friend",
2825
+ -8.195451736450195
2826
+ ],
2827
+ [
2828
+ "▁people",
2829
+ -8.210062026977539
2830
+ ],
2831
+ [
2832
+ ")",
2833
+ -8.219422340393066
2834
+ ],
2835
+ [
2836
+ "▁same",
2837
+ -8.228056907653809
2838
+ ],
2839
+ [
2840
+ "▁change",
2841
+ -8.232505798339844
2842
+ ],
2843
+ [
2844
+ "▁Do",
2845
+ -8.238903045654297
2846
+ ],
2847
+ [
2848
+ "▁follow",
2849
+ -8.242085456848145
2850
+ ],
2851
+ [
2852
+ "▁while",
2853
+ -8.25542163848877
2854
+ ],
2855
+ [
2856
+ "▁nothing",
2857
+ -8.257135391235352
2858
+ ],
2859
+ [
2860
+ "▁child",
2861
+ -8.258654594421387
2862
+ ],
2863
+ [
2864
+ "7",
2865
+ -8.28925895690918
2866
+ ],
2867
+ [
2868
+ "body",
2869
+ -8.293252944946289
2870
+ ],
2871
+ [
2872
+ "▁Ne",
2873
+ -8.295580863952637
2874
+ ],
2875
+ [
2876
+ "That",
2877
+ -8.300972938537598
2878
+ ],
2879
+ [
2880
+ "comma",
2881
+ -8.305874824523926
2882
+ ],
2883
+ [
2884
+ "▁light",
2885
+ -8.315401077270508
2886
+ ],
2887
+ [
2888
+ "▁another",
2889
+ -8.327678680419922
2890
+ ],
2891
+ [
2892
+ "▁God",
2893
+ -8.32773208618164
2894
+ ],
2895
+ [
2896
+ "▁name",
2897
+ -8.329839706420898
2898
+ ],
2899
+ [
2900
+ "▁asked",
2901
+ -8.341205596923828
2902
+ ],
2903
+ [
2904
+ "▁small",
2905
+ -8.341238975524902
2906
+ ],
2907
+ [
2908
+ "colon",
2909
+ -8.343833923339844
2910
+ ],
2911
+ [
2912
+ "▁open",
2913
+ -8.344965934753418
2914
+ ],
2915
+ [
2916
+ "G",
2917
+ -8.348701477050781
2918
+ ],
2919
+ [
2920
+ "▁IMPRESSION",
2921
+ -8.353904724121094
2922
+ ],
2923
+ [
2924
+ "▁normal",
2925
+ -8.35440444946289
2926
+ ],
2927
+ [
2928
+ "▁present",
2929
+ -8.373336791992188
2930
+ ],
2931
+ [
2932
+ "▁When",
2933
+ -8.376485824584961
2934
+ ],
2935
+ [
2936
+ "ific",
2937
+ -8.377349853515625
2938
+ ],
2939
+ [
2940
+ "▁world",
2941
+ -8.383152961730957
2942
+ ],
2943
+ [
2944
+ "▁answer",
2945
+ -8.385011672973633
2946
+ ],
2947
+ [
2948
+ "▁also",
2949
+ -8.393239974975586
2950
+ ],
2951
+ [
2952
+ "▁view",
2953
+ -8.396413803100586
2954
+ ],
2955
+ [
2956
+ "▁seemed",
2957
+ -8.415339469909668
2958
+ ],
2959
+ [
2960
+ "spect",
2961
+ -8.4177827835083
2962
+ ],
2963
+ [
2964
+ "▁always",
2965
+ -8.420531272888184
2966
+ ],
2967
+ [
2968
+ "F",
2969
+ -8.425969123840332
2970
+ ],
2971
+ [
2972
+ "9",
2973
+ -8.447197914123535
2974
+ ],
2975
+ [
2976
+ "▁knew",
2977
+ -8.451355934143066
2978
+ ],
2979
+ [
2980
+ "▁feel",
2981
+ -8.478418350219727
2982
+ ],
2983
+ [
2984
+ "▁girl",
2985
+ -8.489920616149902
2986
+ ],
2987
+ [
2988
+ "▁woman",
2989
+ -8.507888793945312
2990
+ ],
2991
+ [
2992
+ "▁something",
2993
+ -8.509052276611328
2994
+ ],
2995
+ [
2996
+ "▁return",
2997
+ -8.517931938171387
2998
+ ],
2999
+ [
3000
+ "▁kind",
3001
+ -8.522177696228027
3002
+ ],
3003
+ [
3004
+ "▁high",
3005
+ -8.52599048614502
3006
+ ],
3007
+ [
3008
+ "▁because",
3009
+ -8.552063941955566
3010
+ ],
3011
+ [
3012
+ "]",
3013
+ -8.968759536743164
3014
+ ],
3015
+ [
3016
+ "Q",
3017
+ -9.035648345947266
3018
+ ],
3019
+ [
3020
+ "X",
3021
+ -9.060090065002441
3022
+ ],
3023
+ [
3024
+ "/",
3025
+ -9.441831588745117
3026
+ ],
3027
+ [
3028
+ "Z",
3029
+ -9.746284484863281
3030
+ ],
3031
+ [
3032
+ "[",
3033
+ -10.22707748413086
3034
+ ],
3035
+ [
3036
+ "%",
3037
+ -10.805520057678223
3038
+ ],
3039
+ [
3040
+ "q",
3041
+ -11.41718578338623
3042
+ ],
3043
+ [
3044
+ "+",
3045
+ -12.179898262023926
3046
+ ],
3047
+ [
3048
+ "{",
3049
+ -12.902261734008789
3050
+ ]
3051
+ ],
3052
+ "byte_fallback": false
3053
+ }
3054
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,245 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ {
4
+ "__type": "AddedToken",
5
+ "content": "<epsilon>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ {
13
+ "__type": "AddedToken",
14
+ "content": "<s>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ {
22
+ "__type": "AddedToken",
23
+ "content": "</s>",
24
+ "lstrip": false,
25
+ "normalized": false,
26
+ "rstrip": false,
27
+ "single_word": false,
28
+ "special": true
29
+ },
30
+ "<extra_id_0>",
31
+ "<extra_id_1>",
32
+ "<extra_id_2>",
33
+ "<extra_id_3>",
34
+ "<extra_id_4>",
35
+ "<extra_id_5>",
36
+ "<extra_id_6>",
37
+ "<extra_id_7>",
38
+ "<extra_id_8>",
39
+ "<extra_id_9>",
40
+ "<extra_id_10>",
41
+ "<extra_id_11>",
42
+ "<extra_id_12>",
43
+ "<extra_id_13>",
44
+ "<extra_id_14>",
45
+ "<extra_id_15>",
46
+ "<extra_id_16>",
47
+ "<extra_id_17>",
48
+ "<extra_id_18>",
49
+ "<extra_id_19>",
50
+ "<extra_id_20>",
51
+ "<extra_id_21>",
52
+ "<extra_id_22>",
53
+ "<extra_id_23>",
54
+ "<extra_id_24>",
55
+ "<extra_id_25>",
56
+ "<extra_id_26>",
57
+ "<extra_id_27>",
58
+ "<extra_id_28>",
59
+ "<extra_id_29>",
60
+ "<extra_id_30>",
61
+ "<extra_id_31>",
62
+ "<extra_id_32>",
63
+ "<extra_id_33>",
64
+ "<extra_id_34>",
65
+ "<extra_id_35>",
66
+ "<extra_id_36>",
67
+ "<extra_id_37>",
68
+ "<extra_id_38>",
69
+ "<extra_id_39>",
70
+ "<extra_id_40>",
71
+ "<extra_id_41>",
72
+ "<extra_id_42>",
73
+ "<extra_id_43>",
74
+ "<extra_id_44>",
75
+ "<extra_id_45>",
76
+ "<extra_id_46>",
77
+ "<extra_id_47>",
78
+ "<extra_id_48>",
79
+ "<extra_id_49>",
80
+ "<extra_id_50>",
81
+ "<extra_id_51>",
82
+ "<extra_id_52>",
83
+ "<extra_id_53>",
84
+ "<extra_id_54>",
85
+ "<extra_id_55>",
86
+ "<extra_id_56>",
87
+ "<extra_id_57>",
88
+ "<extra_id_58>",
89
+ "<extra_id_59>",
90
+ "<extra_id_60>",
91
+ "<extra_id_61>",
92
+ "<extra_id_62>",
93
+ "<extra_id_63>",
94
+ "<extra_id_64>",
95
+ "<extra_id_65>",
96
+ "<extra_id_66>",
97
+ "<extra_id_67>",
98
+ "<extra_id_68>",
99
+ "<extra_id_69>",
100
+ "<extra_id_70>",
101
+ "<extra_id_71>",
102
+ "<extra_id_72>",
103
+ "<extra_id_73>",
104
+ "<extra_id_74>",
105
+ "<extra_id_75>",
106
+ "<extra_id_76>",
107
+ "<extra_id_77>",
108
+ "<extra_id_78>",
109
+ "<extra_id_79>",
110
+ "<extra_id_80>",
111
+ "<extra_id_81>",
112
+ "<extra_id_82>",
113
+ "<extra_id_83>",
114
+ "<extra_id_84>",
115
+ "<extra_id_85>",
116
+ "<extra_id_86>",
117
+ "<extra_id_87>",
118
+ "<extra_id_88>",
119
+ "<extra_id_89>",
120
+ "<extra_id_90>",
121
+ "<extra_id_91>",
122
+ "<extra_id_92>",
123
+ "<extra_id_93>",
124
+ "<extra_id_94>",
125
+ "<extra_id_95>",
126
+ "<extra_id_96>",
127
+ "<extra_id_97>",
128
+ "<extra_id_98>",
129
+ "<extra_id_99>"
130
+ ],
131
+ "backend": "tokenizers",
132
+ "eos_token": "</s>",
133
+ "extra_ids": 100,
134
+ "extra_special_tokens": [
135
+ "<epsilon>",
136
+ "<s>",
137
+ "</s>",
138
+ "<extra_id_0>",
139
+ "<extra_id_1>",
140
+ "<extra_id_2>",
141
+ "<extra_id_3>",
142
+ "<extra_id_4>",
143
+ "<extra_id_5>",
144
+ "<extra_id_6>",
145
+ "<extra_id_7>",
146
+ "<extra_id_8>",
147
+ "<extra_id_9>",
148
+ "<extra_id_10>",
149
+ "<extra_id_11>",
150
+ "<extra_id_12>",
151
+ "<extra_id_13>",
152
+ "<extra_id_14>",
153
+ "<extra_id_15>",
154
+ "<extra_id_16>",
155
+ "<extra_id_17>",
156
+ "<extra_id_18>",
157
+ "<extra_id_19>",
158
+ "<extra_id_20>",
159
+ "<extra_id_21>",
160
+ "<extra_id_22>",
161
+ "<extra_id_23>",
162
+ "<extra_id_24>",
163
+ "<extra_id_25>",
164
+ "<extra_id_26>",
165
+ "<extra_id_27>",
166
+ "<extra_id_28>",
167
+ "<extra_id_29>",
168
+ "<extra_id_30>",
169
+ "<extra_id_31>",
170
+ "<extra_id_32>",
171
+ "<extra_id_33>",
172
+ "<extra_id_34>",
173
+ "<extra_id_35>",
174
+ "<extra_id_36>",
175
+ "<extra_id_37>",
176
+ "<extra_id_38>",
177
+ "<extra_id_39>",
178
+ "<extra_id_40>",
179
+ "<extra_id_41>",
180
+ "<extra_id_42>",
181
+ "<extra_id_43>",
182
+ "<extra_id_44>",
183
+ "<extra_id_45>",
184
+ "<extra_id_46>",
185
+ "<extra_id_47>",
186
+ "<extra_id_48>",
187
+ "<extra_id_49>",
188
+ "<extra_id_50>",
189
+ "<extra_id_51>",
190
+ "<extra_id_52>",
191
+ "<extra_id_53>",
192
+ "<extra_id_54>",
193
+ "<extra_id_55>",
194
+ "<extra_id_56>",
195
+ "<extra_id_57>",
196
+ "<extra_id_58>",
197
+ "<extra_id_59>",
198
+ "<extra_id_60>",
199
+ "<extra_id_61>",
200
+ "<extra_id_62>",
201
+ "<extra_id_63>",
202
+ "<extra_id_64>",
203
+ "<extra_id_65>",
204
+ "<extra_id_66>",
205
+ "<extra_id_67>",
206
+ "<extra_id_68>",
207
+ "<extra_id_69>",
208
+ "<extra_id_70>",
209
+ "<extra_id_71>",
210
+ "<extra_id_72>",
211
+ "<extra_id_73>",
212
+ "<extra_id_74>",
213
+ "<extra_id_75>",
214
+ "<extra_id_76>",
215
+ "<extra_id_77>",
216
+ "<extra_id_78>",
217
+ "<extra_id_79>",
218
+ "<extra_id_80>",
219
+ "<extra_id_81>",
220
+ "<extra_id_82>",
221
+ "<extra_id_83>",
222
+ "<extra_id_84>",
223
+ "<extra_id_85>",
224
+ "<extra_id_86>",
225
+ "<extra_id_87>",
226
+ "<extra_id_88>",
227
+ "<extra_id_89>",
228
+ "<extra_id_90>",
229
+ "<extra_id_91>",
230
+ "<extra_id_92>",
231
+ "<extra_id_93>",
232
+ "<extra_id_94>",
233
+ "<extra_id_95>",
234
+ "<extra_id_96>",
235
+ "<extra_id_97>",
236
+ "<extra_id_98>",
237
+ "<extra_id_99>"
238
+ ],
239
+ "is_local": false,
240
+ "model_max_length": 1000000000000000019884624838656,
241
+ "pad_token": "<epsilon>",
242
+ "tokenizer_class": "LasrTokenizer",
243
+ "unk_id": 3,
244
+ "unk_token": "<unk>"
245
+ }