JinghuiLuAstronaut commited on
Commit
907970e
·
verified ·
1 Parent(s): 1a34294

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. LTA_openwebtext_dualt/logs/decode/owt_wd0p1_step64k_lm1b_normal_steps_n32.log +11 -0
  2. LTA_openwebtext_dualt/logs/lm1b_ablate_lr_only/latest_run_name.txt +1 -0
  3. LTA_openwebtext_dualt/logs/lm1b_ablate_lr_only/lta_lm1b_v8192_mask0p1_1p0_lr3e4_constwarmup_only_len128_gbs512_2gpu_1m_20260521_120019.nohup.log +0 -0
  4. LTA_openwebtext_dualt/logs/maskfloor_smoke/lta_owt_maskfloor_oneminust_c1024_4gpu_smoke_20260513_180117.log +103 -0
  5. LTA_openwebtext_dualt/logs/noise_geometry_pilots_4gpu/20260517_163805.log +4134 -0
  6. LTA_openwebtext_dualt/logs/noise_geometry_pilots_4gpu/current.nohup +0 -0
  7. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/__init__.py +115 -0
  8. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/big5freq.py +386 -0
  9. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/big5prober.py +47 -0
  10. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/chardistribution.py +261 -0
  11. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/charsetgroupprober.py +106 -0
  12. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/codingstatemachine.py +90 -0
  13. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/cp949prober.py +49 -0
  14. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/escprober.py +102 -0
  15. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/escsm.py +261 -0
  16. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/eucjpprober.py +102 -0
  17. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/euckrfreq.py +196 -0
  18. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/euctwfreq.py +388 -0
  19. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/euctwprober.py +47 -0
  20. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/gb2312prober.py +47 -0
  21. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/johabfreq.py +2382 -0
  22. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/johabprober.py +47 -0
  23. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/jpcntx.py +238 -0
  24. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langgreekmodel.py +0 -0
  25. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langhebrewmodel.py +0 -0
  26. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langhungarianmodel.py +0 -0
  27. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langrussianmodel.py +0 -0
  28. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langthaimodel.py +0 -0
  29. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langturkishmodel.py +4380 -0
  30. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/latin1prober.py +147 -0
  31. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/macromanprober.py +162 -0
  32. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/mbcharsetprober.py +95 -0
  33. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/mbcsgroupprober.py +57 -0
  34. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/mbcssm.py +661 -0
  35. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/metadata/__init__.py +0 -0
  36. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/metadata/languages.py +352 -0
  37. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/sbcsgroupprober.py +88 -0
  38. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/universaldetector.py +362 -0
  39. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/utf1632prober.py +225 -0
  40. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/version.py +9 -0
  41. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/__init__.py +566 -0
  42. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/__main__.py +53 -0
  43. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/android.py +210 -0
  44. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/api.py +223 -0
  45. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/macos.py +91 -0
  46. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/unix.py +223 -0
  47. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/version.py +4 -0
  48. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/windows.py +255 -0
  49. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/pyproject_hooks/_in_process/__init__.py +18 -0
  50. LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/pyproject_hooks/_in_process/_in_process.py +353 -0
LTA_openwebtext_dualt/logs/decode/owt_wd0p1_step64k_lm1b_normal_steps_n32.log ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [ckpt] runs/lta_owt_gpt2cached_len1024_fullycoupled_rmsnorm_nobias_adamw_wd0p1_nanogpt_fp32_ddit768x12_gbs512_8gpu_1m_20260514_191807/latest.pt step=64000
2
+ [decode] steps128_c16_t1p45 generated 4/32
3
+ [decode] steps128_c16_t1p45 generated 8/32
4
+ [decode] steps128_c16_t1p45 generated 12/32
5
+ [decode] steps128_c16_t1p45 generated 16/32
6
+ [decode] steps128_c16_t1p45 generated 20/32
7
+ [decode] steps128_c16_t1p45 generated 24/32
8
+ [decode] steps128_c16_t1p45 generated 28/32
9
+ [decode] steps128_c16_t1p45 generated 32/32
10
+ [decode] steps128_c256_t1p45 generated 4/32
11
+ [decode] steps128_c256_t1p45 generated 8/32
LTA_openwebtext_dualt/logs/lm1b_ablate_lr_only/latest_run_name.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ lta_lm1b_v8192_mask0p1_1p0_lr3e4_constwarmup_only_len128_gbs512_2gpu_1m_20260521_120019
LTA_openwebtext_dualt/logs/lm1b_ablate_lr_only/lta_lm1b_v8192_mask0p1_1p0_lr3e4_constwarmup_only_len128_gbs512_2gpu_1m_20260521_120019.nohup.log ADDED
The diff for this file is too large to render. See raw diff
 
LTA_openwebtext_dualt/logs/maskfloor_smoke/lta_owt_maskfloor_oneminust_c1024_4gpu_smoke_20260513_180117.log ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "device": "cuda:0",
3
+ "rank": 0,
4
+ "world_size": 4,
5
+ "samples": "owt_cached_chunks:8734897",
6
+ "vocab_size": 50257,
7
+ "tokenizer_vocab_size": 50257,
8
+ "save_dir": "runs/lta_owt_maskfloor_oneminust_c1024_4gpu_smoke_20260513_180117",
9
+ "batch_size": 2,
10
+ "grad_accum": 1,
11
+ "effective_batch_size": 8,
12
+ "global_batch_size": 8,
13
+ "lr_schedule": "constant_warmup",
14
+ "optimizer": "muon",
15
+ "warmup_steps": 1,
16
+ "min_lr": 0.0,
17
+ "weight_decay": 0.0,
18
+ "adamw_param_groups": "nanogpt",
19
+ "adam_beta1": 0.9,
20
+ "adam_beta2": 0.95,
21
+ "adam_eps": 1e-08,
22
+ "muon_momentum": 0.95,
23
+ "muon_ns_steps": 5,
24
+ "muon_update_scale": 1.0,
25
+ "ema_decay": 0.0,
26
+ "ema_start_step": 0,
27
+ "model_type": "ddit",
28
+ "dual_t": true,
29
+ "corrupt_t_mode": "same",
30
+ "corrupt_min_t": 0.0,
31
+ "corrupt_max_t": 1.0,
32
+ "prefix_block_prob": 0.0,
33
+ "prefix_block_len": 128,
34
+ "mask_ratio_floor_schedule": "one_minus_t",
35
+ "dirichlet_endpoint_mode": "categorical_dual_t",
36
+ "dirichlet_semantic_t_mode": "same",
37
+ "dirichlet_semantic_t_value": 0.0,
38
+ "categorical_wrong_from_full_vocab": true,
39
+ "categorical_wrong_from_batch_valid_tokens": false,
40
+ "mask_mixture_original_prob": 0.0,
41
+ "mask_mixture_lowk_prob": 0.0,
42
+ "mask_mixture_lowcorrupt_prob": 0.0,
43
+ "mask_mixture_block_prob": 0.0,
44
+ "mask_mixture_all_prob": 0.0,
45
+ "mask_mixture_lowk_clean_tokens": "1,2,4,8,16,32,64",
46
+ "mask_mixture_lowcorrupt_tokens": "1,2,4,8,16,32,64",
47
+ "mask_mixture_block_tokens": "64,128",
48
+ "simplex_bridge_sampler": "dirichlet",
49
+ "logistic_normal_sigma_min": 0.18,
50
+ "logistic_normal_sigma_max": 2.2,
51
+ "logistic_normal_tau_min": 0.65,
52
+ "logistic_normal_tau_max": 1.15,
53
+ "torch_compile": false,
54
+ "compile_mode": "max-autotune",
55
+ "state_format": "prob",
56
+ "target_loss": "hard_ce",
57
+ "meanflow_weight": 0.0,
58
+ "rollout_train_prob": 0.0,
59
+ "rollout_train_steps": 1,
60
+ "rollout_train_infer_steps": 64,
61
+ "rollout_train_temp": 1.45,
62
+ "rollout_train_max_gamma": 1.0,
63
+ "rollout_train_corrupt_only": true,
64
+ "rollout_train_samplewise": false,
65
+ "rollout_train_compute_always": false,
66
+ "bridge_noise_init": "logistic_normal",
67
+ "noise_sigma": -1.0,
68
+ "allow_tf32": true,
69
+ "activation_checkpointing": false,
70
+ "activation_checkpoint_interval": 1,
71
+ "activation_checkpoint_scope": "block",
72
+ "ddp_static_graph": false,
73
+ "ddp_gradient_as_bucket_view": true,
74
+ "blocking_data_transfer": false,
75
+ "dataloader_prefetch_factor": 2,
76
+ "full_train_stats": false,
77
+ "record_pad_truncate": false,
78
+ "record_add_eos": false,
79
+ "record_add_special_tokens": false,
80
+ "record_pad_token": "pad",
81
+ "record_shuffle_buffer": 10000,
82
+ "wrap": true,
83
+ "wrap_mode": "stream",
84
+ "wrap_record_buffer_size": 200,
85
+ "owt_cached_chunks": true,
86
+ "owt_chunk_cache_dir": "/e2e-data/evad-tech-vla/wanghan58/data/small_benchmarks/langflow_2604_11748/openwebtext_lta_cached_chunks/gpt2_len1024_train_minus_100k",
87
+ "owt_chunk_cache_rebuild": false,
88
+ "owt_chunk_cache_write_batch": 4096,
89
+ "owt_exact_repeat_per_chunk": 0,
90
+ "online_chunk_shuffle": false,
91
+ "online_chunk_shuffle_buffer": 10000,
92
+ "openwebtext_split": "train_minus_100k",
93
+ "detokenizer": "auto",
94
+ "resolved_detokenizer": null,
95
+ "num_workers": 0,
96
+ "latest_every": 1000000,
97
+ "resume_path": ""
98
+ }
99
+ step=1 micro_steps=1 elapsed=1.5s lr=2.000000e-03 loss=10.8125 loss_recon=10.8125 loss_meanflow=0.0000 mean_model_t=0.3115 mean_corrupt_t=0.3115 mean_loss_t_weight=1.0000 prior_center_loss_beta=0.0000 rollout_train_applied=0.0000 acc_all=0.0015 acc_corrupt=0.0015 corrupt_frac=0.9883 loss_all=10.8125 loss_corrupt=10.8125 acc_corrupt_t_0p0_0p2=0.0020 corrupt_frac_t_0p0_0p2=0.5000 acc_corrupt_t_0p6_0p8=0.0010 corrupt_frac_t_0p6_0p8=0.5000 wrong_frac=0.6848 init_acc_corrupt=0.3083 init_gold_top10=0.3093 init_gold_top100=0.3612
100
+ step=2 micro_steps=2 elapsed=0.1s lr=2.000000e-03 loss=10.8117 loss_recon=10.8117 loss_meanflow=0.0000 mean_model_t=0.1709 mean_corrupt_t=0.1709 mean_loss_t_weight=1.0000 prior_center_loss_beta=0.0000 rollout_train_applied=0.0000 acc_all=0.0991 acc_corrupt=0.0644 corrupt_frac=0.9180 loss_all=10.8103 loss_corrupt=10.8117 acc_corrupt_t_0p0_0p2=0.0133 corrupt_frac_t_0p0_0p2=0.5186 acc_corrupt_t_0p2_0p4=0.1193 corrupt_frac_t_0p2_0p4=0.4814 wrong_frac=0.8266 init_acc_corrupt=0.0761 init_gold_top10=0.1527 init_gold_top100=0.2356
101
+ step=3 micro_steps=3 elapsed=0.1s lr=2.000000e-03 loss=10.7823 loss_recon=10.7823 loss_meanflow=0.0000 mean_model_t=0.7285 mean_corrupt_t=0.7285 mean_loss_t_weight=1.0000 prior_center_loss_beta=0.0000 rollout_train_applied=0.0000 acc_all=0.4878 acc_corrupt=0.4099 corrupt_frac=0.5991 loss_all=10.7764 loss_corrupt=10.7823 acc_corrupt_t_0p6_0p8=0.4099 corrupt_frac_t_0p6_0p8=1.0000 wrong_frac=0.2649 init_acc_corrupt=0.7351 init_gold_top10=0.7351 init_gold_top100=0.7359
102
+ step=4 micro_steps=4 elapsed=0.1s lr=2.000000e-03 loss=10.7879 loss_recon=10.7879 loss_meanflow=0.0000 mean_model_t=0.4350 mean_corrupt_t=0.4350 mean_loss_t_weight=1.0000 prior_center_loss_beta=0.0000 rollout_train_applied=0.0000 acc_all=0.3228 acc_corrupt=0.2264 corrupt_frac=0.7700 loss_all=10.7760 loss_corrupt=10.7879 acc_corrupt_t_0p0_0p2=0.0720 corrupt_frac_t_0p0_0p2=0.6075 acc_corrupt_t_0p6_0p8=0.4653 corrupt_frac_t_0p6_0p8=0.3925 wrong_frac=0.6119 init_acc_corrupt=0.3075 init_gold_top10=0.3786 init_gold_top100=0.4331
103
+ step=5 micro_steps=5 elapsed=0.1s lr=2.000000e-03 loss=10.7372 loss_recon=10.7372 loss_meanflow=0.0000 mean_model_t=0.6984 mean_corrupt_t=0.6984 mean_loss_t_weight=1.0000 prior_center_loss_beta=0.0000 rollout_train_applied=0.0000 acc_all=0.5400 acc_corrupt=0.4406 corrupt_frac=0.5264 loss_all=10.7200 loss_corrupt=10.7372 acc_corrupt_t_0p6_0p8=0.4406 corrupt_frac_t_0p6_0p8=1.0000 wrong_frac=0.3089 init_acc_corrupt=0.6911 init_gold_top10=0.6911 init_gold_top100=0.6911
LTA_openwebtext_dualt/logs/noise_geometry_pilots_4gpu/20260517_163805.log ADDED
@@ -0,0 +1,4134 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [noise-pilot] start stamp=20260517_163805 len=256 vocab=969 out=docs/lta_samples/metrics_20260517/noise_geometry_pilots_len256_bs512_ode128_20260517_163805
2
+ [noise-pilot] round=1 Sun May 17 16:38:05 UTC 2026
3
+ [noise-pilot] train config=allcorrupt_fullvocab_dirC1_1024 from=0 to=1000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
4
+ [noise-pilot] eval config=allcorrupt_fullvocab_dirC1_1024 step=1000
5
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805 step=1000 soft=none
6
+ [decode] max_len=256 generated=64/64
7
+ {
8
+ "num_rows": 1,
9
+ "best_by_run": {
10
+ "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805::none": {
11
+ "run": "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805",
12
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805/step_0001000.pt",
13
+ "ckpt_step": 1000,
14
+ "endpoint_softening": "none",
15
+ "decode_rule": "flowmap",
16
+ "steps": 128,
17
+ "time_schedule": "logit_normal",
18
+ "model_t_mode": "post",
19
+ "final_from": "state",
20
+ "n_gen": 64,
21
+ "n_refs": 8,
22
+ "token_acc_mean": 0.0267333984375,
23
+ "token_acc_min": 0.0078125,
24
+ "token_acc_max": 0.05859375,
25
+ "exact_acc": 0.0,
26
+ "exact_count": 0,
27
+ "exact_ref_coverage": 0.0,
28
+ "exact_ref_count": 0,
29
+ "exact_ref_hits": [],
30
+ "best_ref_idx": [
31
+ 0,
32
+ 7,
33
+ 5,
34
+ 0,
35
+ 7,
36
+ 7,
37
+ 2,
38
+ 7,
39
+ 7,
40
+ 7,
41
+ 0,
42
+ 7,
43
+ 0,
44
+ 5,
45
+ 6,
46
+ 5,
47
+ 4,
48
+ 5,
49
+ 4,
50
+ 7,
51
+ 6,
52
+ 7,
53
+ 6,
54
+ 0,
55
+ 6,
56
+ 7,
57
+ 7,
58
+ 7,
59
+ 6,
60
+ 0,
61
+ 5,
62
+ 6,
63
+ 0,
64
+ 7,
65
+ 7,
66
+ 7,
67
+ 7,
68
+ 6,
69
+ 0,
70
+ 7,
71
+ 6,
72
+ 0,
73
+ 5,
74
+ 0,
75
+ 1,
76
+ 7,
77
+ 7,
78
+ 0,
79
+ 5,
80
+ 7,
81
+ 0,
82
+ 7,
83
+ 6,
84
+ 5,
85
+ 4,
86
+ 6,
87
+ 7,
88
+ 7,
89
+ 4,
90
+ 5,
91
+ 7,
92
+ 0,
93
+ 6,
94
+ 4
95
+ ],
96
+ "best_token_acc": [
97
+ 0.01171875,
98
+ 0.0546875,
99
+ 0.0078125,
100
+ 0.01953125,
101
+ 0.05859375,
102
+ 0.01171875,
103
+ 0.03125,
104
+ 0.02734375,
105
+ 0.0390625,
106
+ 0.015625,
107
+ 0.0078125,
108
+ 0.01171875,
109
+ 0.02734375,
110
+ 0.046875,
111
+ 0.0078125,
112
+ 0.05078125,
113
+ 0.05078125,
114
+ 0.0078125,
115
+ 0.02734375,
116
+ 0.03125,
117
+ 0.01171875,
118
+ 0.015625,
119
+ 0.0078125,
120
+ 0.015625,
121
+ 0.015625,
122
+ 0.0546875,
123
+ 0.01171875,
124
+ 0.03515625,
125
+ 0.015625,
126
+ 0.01171875,
127
+ 0.05859375,
128
+ 0.01171875,
129
+ 0.01171875,
130
+ 0.02734375,
131
+ 0.0390625,
132
+ 0.01953125,
133
+ 0.01171875,
134
+ 0.01953125,
135
+ 0.0234375,
136
+ 0.04296875,
137
+ 0.01171875,
138
+ 0.046875,
139
+ 0.046875,
140
+ 0.0234375,
141
+ 0.0078125,
142
+ 0.01953125,
143
+ 0.05078125,
144
+ 0.03515625,
145
+ 0.015625,
146
+ 0.04296875,
147
+ 0.01171875,
148
+ 0.01953125,
149
+ 0.01171875,
150
+ 0.0546875,
151
+ 0.0390625,
152
+ 0.01171875,
153
+ 0.0546875,
154
+ 0.03125,
155
+ 0.01171875,
156
+ 0.05859375,
157
+ 0.01953125,
158
+ 0.01171875,
159
+ 0.01953125,
160
+ 0.046875
161
+ ]
162
+ }
163
+ },
164
+ "first_exact_by_run": {}
165
+ }
166
+ RESULT config=allcorrupt_fullvocab_dirC1_1024 ckpt_step=1000 views=512000 token_acc=0.0267 exact=0/64 exact_refs=0 hits=[]
167
+ [noise-pilot] continue config=allcorrupt_fullvocab_dirC1_1024 step=1000
168
+ [noise-pilot] train config=allcorrupt_seqrand1_dirC1_1024 from=0 to=1000 C=1.0->1024 seq_alpha=1.0 sampler=dirichlet
169
+ [noise-pilot] eval config=allcorrupt_seqrand1_dirC1_1024 step=1000
170
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805 step=1000 soft=none
171
+ [decode] max_len=256 generated=64/64
172
+ {
173
+ "num_rows": 1,
174
+ "best_by_run": {
175
+ "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805::none": {
176
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805",
177
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805/step_0001000.pt",
178
+ "ckpt_step": 1000,
179
+ "endpoint_softening": "none",
180
+ "decode_rule": "flowmap",
181
+ "steps": 128,
182
+ "time_schedule": "logit_normal",
183
+ "model_t_mode": "post",
184
+ "final_from": "state",
185
+ "n_gen": 64,
186
+ "n_refs": 8,
187
+ "token_acc_mean": 0.03125,
188
+ "token_acc_min": 0.0234375,
189
+ "token_acc_max": 0.0703125,
190
+ "exact_acc": 0.0,
191
+ "exact_count": 0,
192
+ "exact_ref_coverage": 0.0,
193
+ "exact_ref_count": 0,
194
+ "exact_ref_hits": [],
195
+ "best_ref_idx": [
196
+ 5,
197
+ 5,
198
+ 0,
199
+ 5,
200
+ 5,
201
+ 0,
202
+ 7,
203
+ 0,
204
+ 5,
205
+ 5,
206
+ 0,
207
+ 5,
208
+ 5,
209
+ 5,
210
+ 5,
211
+ 5,
212
+ 5,
213
+ 5,
214
+ 5,
215
+ 5,
216
+ 5,
217
+ 5,
218
+ 0,
219
+ 5,
220
+ 0,
221
+ 5,
222
+ 5,
223
+ 5,
224
+ 5,
225
+ 5,
226
+ 5,
227
+ 5,
228
+ 5,
229
+ 5,
230
+ 5,
231
+ 5,
232
+ 5,
233
+ 5,
234
+ 5,
235
+ 5,
236
+ 5,
237
+ 5,
238
+ 5,
239
+ 5,
240
+ 1,
241
+ 5,
242
+ 5,
243
+ 5,
244
+ 5,
245
+ 5,
246
+ 5,
247
+ 5,
248
+ 5,
249
+ 5,
250
+ 5,
251
+ 0,
252
+ 5,
253
+ 5,
254
+ 3,
255
+ 5,
256
+ 5,
257
+ 5,
258
+ 5,
259
+ 5
260
+ ],
261
+ "best_token_acc": [
262
+ 0.02734375,
263
+ 0.0234375,
264
+ 0.0703125,
265
+ 0.04296875,
266
+ 0.02734375,
267
+ 0.05859375,
268
+ 0.05859375,
269
+ 0.0703125,
270
+ 0.02734375,
271
+ 0.02734375,
272
+ 0.0546875,
273
+ 0.03515625,
274
+ 0.03125,
275
+ 0.02734375,
276
+ 0.0234375,
277
+ 0.02734375,
278
+ 0.02734375,
279
+ 0.02734375,
280
+ 0.02734375,
281
+ 0.02734375,
282
+ 0.02734375,
283
+ 0.02734375,
284
+ 0.02734375,
285
+ 0.02734375,
286
+ 0.05859375,
287
+ 0.02734375,
288
+ 0.02734375,
289
+ 0.03125,
290
+ 0.03125,
291
+ 0.03125,
292
+ 0.02734375,
293
+ 0.02734375,
294
+ 0.03125,
295
+ 0.02734375,
296
+ 0.02734375,
297
+ 0.02734375,
298
+ 0.02734375,
299
+ 0.02734375,
300
+ 0.02734375,
301
+ 0.02734375,
302
+ 0.02734375,
303
+ 0.0234375,
304
+ 0.02734375,
305
+ 0.03125,
306
+ 0.0234375,
307
+ 0.02734375,
308
+ 0.03125,
309
+ 0.02734375,
310
+ 0.03125,
311
+ 0.02734375,
312
+ 0.02734375,
313
+ 0.02734375,
314
+ 0.02734375,
315
+ 0.02734375,
316
+ 0.02734375,
317
+ 0.02734375,
318
+ 0.02734375,
319
+ 0.02734375,
320
+ 0.02734375,
321
+ 0.03125,
322
+ 0.02734375,
323
+ 0.02734375,
324
+ 0.02734375,
325
+ 0.02734375
326
+ ]
327
+ }
328
+ },
329
+ "first_exact_by_run": {}
330
+ }
331
+ RESULT config=allcorrupt_seqrand1_dirC1_1024 ckpt_step=1000 views=512000 token_acc=0.0312 exact=0/64 exact_refs=0 hits=[]
332
+ [noise-pilot] continue config=allcorrupt_seqrand1_dirC1_1024 step=1000
333
+ [noise-pilot] train config=allcorrupt_highC64_4096 from=0 to=1000 C=64->4096 seq_alpha=0.0 sampler=dirichlet
334
+ [noise-pilot] eval config=allcorrupt_highC64_4096 step=1000
335
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805 step=1000 soft=none
336
+ [decode] max_len=256 generated=64/64
337
+ {
338
+ "num_rows": 1,
339
+ "best_by_run": {
340
+ "train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805::none": {
341
+ "run": "train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805",
342
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805/step_0001000.pt",
343
+ "ckpt_step": 1000,
344
+ "endpoint_softening": "none",
345
+ "decode_rule": "flowmap",
346
+ "steps": 128,
347
+ "time_schedule": "logit_normal",
348
+ "model_t_mode": "post",
349
+ "final_from": "state",
350
+ "n_gen": 64,
351
+ "n_refs": 8,
352
+ "token_acc_mean": 0.03472900390625,
353
+ "token_acc_min": 0.015625,
354
+ "token_acc_max": 0.0703125,
355
+ "exact_acc": 0.0,
356
+ "exact_count": 0,
357
+ "exact_ref_coverage": 0.0,
358
+ "exact_ref_count": 0,
359
+ "exact_ref_hits": [],
360
+ "best_ref_idx": [
361
+ 1,
362
+ 4,
363
+ 7,
364
+ 1,
365
+ 5,
366
+ 1,
367
+ 1,
368
+ 4,
369
+ 4,
370
+ 1,
371
+ 3,
372
+ 4,
373
+ 0,
374
+ 4,
375
+ 1,
376
+ 7,
377
+ 6,
378
+ 4,
379
+ 0,
380
+ 1,
381
+ 1,
382
+ 4,
383
+ 1,
384
+ 5,
385
+ 6,
386
+ 1,
387
+ 1,
388
+ 2,
389
+ 1,
390
+ 0,
391
+ 5,
392
+ 2,
393
+ 1,
394
+ 1,
395
+ 5,
396
+ 5,
397
+ 1,
398
+ 5,
399
+ 6,
400
+ 1,
401
+ 1,
402
+ 4,
403
+ 0,
404
+ 0,
405
+ 1,
406
+ 4,
407
+ 1,
408
+ 7,
409
+ 0,
410
+ 4,
411
+ 1,
412
+ 1,
413
+ 4,
414
+ 3,
415
+ 4,
416
+ 2,
417
+ 1,
418
+ 5,
419
+ 1,
420
+ 1,
421
+ 4,
422
+ 5,
423
+ 1,
424
+ 6
425
+ ],
426
+ "best_token_acc": [
427
+ 0.0234375,
428
+ 0.03125,
429
+ 0.03125,
430
+ 0.046875,
431
+ 0.03125,
432
+ 0.046875,
433
+ 0.02734375,
434
+ 0.05859375,
435
+ 0.04296875,
436
+ 0.03515625,
437
+ 0.03515625,
438
+ 0.01953125,
439
+ 0.02734375,
440
+ 0.03515625,
441
+ 0.03515625,
442
+ 0.03515625,
443
+ 0.015625,
444
+ 0.05078125,
445
+ 0.01953125,
446
+ 0.04296875,
447
+ 0.04296875,
448
+ 0.0390625,
449
+ 0.02734375,
450
+ 0.0234375,
451
+ 0.0234375,
452
+ 0.04296875,
453
+ 0.046875,
454
+ 0.04296875,
455
+ 0.02734375,
456
+ 0.03125,
457
+ 0.0546875,
458
+ 0.0234375,
459
+ 0.06640625,
460
+ 0.03515625,
461
+ 0.0234375,
462
+ 0.04296875,
463
+ 0.015625,
464
+ 0.04296875,
465
+ 0.03125,
466
+ 0.0390625,
467
+ 0.05859375,
468
+ 0.03125,
469
+ 0.0234375,
470
+ 0.0234375,
471
+ 0.01953125,
472
+ 0.0390625,
473
+ 0.0703125,
474
+ 0.03515625,
475
+ 0.0234375,
476
+ 0.03125,
477
+ 0.0234375,
478
+ 0.03515625,
479
+ 0.03125,
480
+ 0.02734375,
481
+ 0.02734375,
482
+ 0.03125,
483
+ 0.04296875,
484
+ 0.03125,
485
+ 0.0390625,
486
+ 0.04296875,
487
+ 0.015625,
488
+ 0.04296875,
489
+ 0.03515625,
490
+ 0.02734375
491
+ ]
492
+ }
493
+ },
494
+ "first_exact_by_run": {}
495
+ }
496
+ RESULT config=allcorrupt_highC64_4096 ckpt_step=1000 views=512000 token_acc=0.0347 exact=0/64 exact_refs=0 hits=[]
497
+ [noise-pilot] continue config=allcorrupt_highC64_4096 step=1000
498
+ [noise-pilot] train config=allcorrupt_logistic_sig0p05_0p5 from=0 to=1000 C=1.0->1024 seq_alpha=0.0 sampler=logistic_normal_linear_mean
499
+ [noise-pilot] eval config=allcorrupt_logistic_sig0p05_0p5 step=1000
500
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805 step=1000 soft=none
501
+ [decode] max_len=256 generated=64/64
502
+ {
503
+ "num_rows": 1,
504
+ "best_by_run": {
505
+ "train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805::none": {
506
+ "run": "train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805",
507
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805/step_0001000.pt",
508
+ "ckpt_step": 1000,
509
+ "endpoint_softening": "none",
510
+ "decode_rule": "flowmap",
511
+ "steps": 128,
512
+ "time_schedule": "logit_normal",
513
+ "model_t_mode": "post",
514
+ "final_from": "state",
515
+ "n_gen": 64,
516
+ "n_refs": 8,
517
+ "token_acc_mean": 0.1112060546875,
518
+ "token_acc_min": 0.03125,
519
+ "token_acc_max": 0.4296875,
520
+ "exact_acc": 0.0,
521
+ "exact_count": 0,
522
+ "exact_ref_coverage": 0.0,
523
+ "exact_ref_count": 0,
524
+ "exact_ref_hits": [],
525
+ "best_ref_idx": [
526
+ 2,
527
+ 7,
528
+ 2,
529
+ 1,
530
+ 7,
531
+ 2,
532
+ 2,
533
+ 2,
534
+ 7,
535
+ 1,
536
+ 1,
537
+ 2,
538
+ 2,
539
+ 7,
540
+ 0,
541
+ 5,
542
+ 7,
543
+ 2,
544
+ 3,
545
+ 2,
546
+ 7,
547
+ 2,
548
+ 5,
549
+ 2,
550
+ 2,
551
+ 3,
552
+ 2,
553
+ 2,
554
+ 2,
555
+ 2,
556
+ 2,
557
+ 2,
558
+ 2,
559
+ 7,
560
+ 7,
561
+ 2,
562
+ 2,
563
+ 7,
564
+ 2,
565
+ 2,
566
+ 2,
567
+ 2,
568
+ 2,
569
+ 2,
570
+ 2,
571
+ 7,
572
+ 1,
573
+ 2,
574
+ 2,
575
+ 3,
576
+ 2,
577
+ 2,
578
+ 2,
579
+ 2,
580
+ 2,
581
+ 0,
582
+ 1,
583
+ 2,
584
+ 2,
585
+ 2,
586
+ 7,
587
+ 2,
588
+ 2,
589
+ 2
590
+ ],
591
+ "best_token_acc": [
592
+ 0.09765625,
593
+ 0.1015625,
594
+ 0.21875,
595
+ 0.05859375,
596
+ 0.140625,
597
+ 0.0703125,
598
+ 0.04296875,
599
+ 0.078125,
600
+ 0.06640625,
601
+ 0.03125,
602
+ 0.03515625,
603
+ 0.046875,
604
+ 0.078125,
605
+ 0.30859375,
606
+ 0.046875,
607
+ 0.0390625,
608
+ 0.10546875,
609
+ 0.0859375,
610
+ 0.04296875,
611
+ 0.26953125,
612
+ 0.06640625,
613
+ 0.06640625,
614
+ 0.03515625,
615
+ 0.20703125,
616
+ 0.1953125,
617
+ 0.04296875,
618
+ 0.4296875,
619
+ 0.37109375,
620
+ 0.05859375,
621
+ 0.1015625,
622
+ 0.12109375,
623
+ 0.05859375,
624
+ 0.11328125,
625
+ 0.37109375,
626
+ 0.0859375,
627
+ 0.1875,
628
+ 0.0703125,
629
+ 0.0390625,
630
+ 0.140625,
631
+ 0.06640625,
632
+ 0.0703125,
633
+ 0.04296875,
634
+ 0.03515625,
635
+ 0.1015625,
636
+ 0.08984375,
637
+ 0.0390625,
638
+ 0.0390625,
639
+ 0.046875,
640
+ 0.140625,
641
+ 0.0703125,
642
+ 0.12890625,
643
+ 0.05078125,
644
+ 0.046875,
645
+ 0.10546875,
646
+ 0.37109375,
647
+ 0.0625,
648
+ 0.09375,
649
+ 0.234375,
650
+ 0.0546875,
651
+ 0.1953125,
652
+ 0.0625,
653
+ 0.0859375,
654
+ 0.0390625,
655
+ 0.1171875
656
+ ]
657
+ }
658
+ },
659
+ "first_exact_by_run": {}
660
+ }
661
+ RESULT config=allcorrupt_logistic_sig0p05_0p5 ckpt_step=1000 views=512000 token_acc=0.1112 exact=0/64 exact_refs=0 hits=[]
662
+ [noise-pilot] continue config=allcorrupt_logistic_sig0p05_0p5 step=1000
663
+ [noise-pilot] train config=allcorrupt_seqrand1_highC64_4096 from=0 to=1000 C=64->4096 seq_alpha=1.0 sampler=dirichlet
664
+ [noise-pilot] eval config=allcorrupt_seqrand1_highC64_4096 step=1000
665
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805 step=1000 soft=none
666
+ [decode] max_len=256 generated=64/64
667
+ {
668
+ "num_rows": 1,
669
+ "best_by_run": {
670
+ "train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805::none": {
671
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805",
672
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805/step_0001000.pt",
673
+ "ckpt_step": 1000,
674
+ "endpoint_softening": "none",
675
+ "decode_rule": "flowmap",
676
+ "steps": 128,
677
+ "time_schedule": "logit_normal",
678
+ "model_t_mode": "post",
679
+ "final_from": "state",
680
+ "n_gen": 64,
681
+ "n_refs": 8,
682
+ "token_acc_mean": 0.067626953125,
683
+ "token_acc_min": 0.05078125,
684
+ "token_acc_max": 0.1875,
685
+ "exact_acc": 0.0,
686
+ "exact_count": 0,
687
+ "exact_ref_coverage": 0.0,
688
+ "exact_ref_count": 0,
689
+ "exact_ref_hits": [],
690
+ "best_ref_idx": [
691
+ 0,
692
+ 0,
693
+ 5,
694
+ 5,
695
+ 7,
696
+ 0,
697
+ 5,
698
+ 2,
699
+ 5,
700
+ 5,
701
+ 5,
702
+ 5,
703
+ 0,
704
+ 5,
705
+ 0,
706
+ 7,
707
+ 5,
708
+ 0,
709
+ 5,
710
+ 5,
711
+ 5,
712
+ 0,
713
+ 5,
714
+ 5,
715
+ 2,
716
+ 0,
717
+ 5,
718
+ 0,
719
+ 5,
720
+ 5,
721
+ 2,
722
+ 0,
723
+ 5,
724
+ 0,
725
+ 0,
726
+ 0,
727
+ 0,
728
+ 5,
729
+ 5,
730
+ 5,
731
+ 5,
732
+ 0,
733
+ 5,
734
+ 5,
735
+ 5,
736
+ 5,
737
+ 0,
738
+ 7,
739
+ 0,
740
+ 5,
741
+ 0,
742
+ 0,
743
+ 5,
744
+ 0,
745
+ 5,
746
+ 0,
747
+ 5,
748
+ 0,
749
+ 5,
750
+ 5,
751
+ 0,
752
+ 5,
753
+ 5,
754
+ 0
755
+ ],
756
+ "best_token_acc": [
757
+ 0.0703125,
758
+ 0.05859375,
759
+ 0.0625,
760
+ 0.05859375,
761
+ 0.1328125,
762
+ 0.06640625,
763
+ 0.0703125,
764
+ 0.0703125,
765
+ 0.05859375,
766
+ 0.05078125,
767
+ 0.0625,
768
+ 0.0703125,
769
+ 0.0625,
770
+ 0.0625,
771
+ 0.05859375,
772
+ 0.1484375,
773
+ 0.06640625,
774
+ 0.05078125,
775
+ 0.05859375,
776
+ 0.06640625,
777
+ 0.0703125,
778
+ 0.0625,
779
+ 0.07421875,
780
+ 0.06640625,
781
+ 0.0625,
782
+ 0.07421875,
783
+ 0.06640625,
784
+ 0.0625,
785
+ 0.0703125,
786
+ 0.0625,
787
+ 0.05078125,
788
+ 0.0703125,
789
+ 0.05078125,
790
+ 0.078125,
791
+ 0.0625,
792
+ 0.07421875,
793
+ 0.0625,
794
+ 0.0625,
795
+ 0.0546875,
796
+ 0.05859375,
797
+ 0.0625,
798
+ 0.0625,
799
+ 0.06640625,
800
+ 0.05859375,
801
+ 0.0625,
802
+ 0.05859375,
803
+ 0.0625,
804
+ 0.1875,
805
+ 0.07421875,
806
+ 0.06640625,
807
+ 0.0625,
808
+ 0.05859375,
809
+ 0.0625,
810
+ 0.05859375,
811
+ 0.05078125,
812
+ 0.0625,
813
+ 0.0546875,
814
+ 0.06640625,
815
+ 0.0703125,
816
+ 0.05859375,
817
+ 0.06640625,
818
+ 0.0546875,
819
+ 0.06640625,
820
+ 0.0703125
821
+ ]
822
+ }
823
+ },
824
+ "first_exact_by_run": {}
825
+ }
826
+ RESULT config=allcorrupt_seqrand1_highC64_4096 ckpt_step=1000 views=512000 token_acc=0.0676 exact=0/64 exact_refs=0 hits=[]
827
+ [noise-pilot] continue config=allcorrupt_seqrand1_highC64_4096 step=1000
828
+ [noise-pilot] train config=allcorrupt_unigram_shared0p5 from=0 to=1000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
829
+ [noise-pilot] eval config=allcorrupt_unigram_shared0p5 step=1000
830
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805 step=1000 soft=none
831
+ [decode] max_len=256 generated=64/64
832
+ {
833
+ "num_rows": 1,
834
+ "best_by_run": {
835
+ "train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805::none": {
836
+ "run": "train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805",
837
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805/step_0001000.pt",
838
+ "ckpt_step": 1000,
839
+ "endpoint_softening": "none",
840
+ "decode_rule": "flowmap",
841
+ "steps": 128,
842
+ "time_schedule": "logit_normal",
843
+ "model_t_mode": "post",
844
+ "final_from": "state",
845
+ "n_gen": 64,
846
+ "n_refs": 8,
847
+ "token_acc_mean": 0.12799072265625,
848
+ "token_acc_min": 0.05078125,
849
+ "token_acc_max": 0.40234375,
850
+ "exact_acc": 0.0,
851
+ "exact_count": 0,
852
+ "exact_ref_coverage": 0.0,
853
+ "exact_ref_count": 0,
854
+ "exact_ref_hits": [],
855
+ "best_ref_idx": [
856
+ 2,
857
+ 7,
858
+ 6,
859
+ 2,
860
+ 5,
861
+ 3,
862
+ 5,
863
+ 2,
864
+ 3,
865
+ 6,
866
+ 1,
867
+ 3,
868
+ 6,
869
+ 5,
870
+ 0,
871
+ 7,
872
+ 5,
873
+ 4,
874
+ 5,
875
+ 7,
876
+ 3,
877
+ 4,
878
+ 5,
879
+ 4,
880
+ 5,
881
+ 5,
882
+ 5,
883
+ 4,
884
+ 6,
885
+ 4,
886
+ 5,
887
+ 7,
888
+ 1,
889
+ 0,
890
+ 5,
891
+ 3,
892
+ 5,
893
+ 6,
894
+ 3,
895
+ 1,
896
+ 6,
897
+ 5,
898
+ 0,
899
+ 5,
900
+ 6,
901
+ 5,
902
+ 1,
903
+ 5,
904
+ 5,
905
+ 4,
906
+ 6,
907
+ 4,
908
+ 6,
909
+ 1,
910
+ 4,
911
+ 6,
912
+ 1,
913
+ 4,
914
+ 0,
915
+ 7,
916
+ 7,
917
+ 7,
918
+ 5,
919
+ 1
920
+ ],
921
+ "best_token_acc": [
922
+ 0.125,
923
+ 0.06640625,
924
+ 0.34765625,
925
+ 0.078125,
926
+ 0.1328125,
927
+ 0.0546875,
928
+ 0.078125,
929
+ 0.19921875,
930
+ 0.06640625,
931
+ 0.40234375,
932
+ 0.109375,
933
+ 0.09765625,
934
+ 0.08203125,
935
+ 0.18359375,
936
+ 0.08203125,
937
+ 0.06640625,
938
+ 0.109375,
939
+ 0.12890625,
940
+ 0.109375,
941
+ 0.0703125,
942
+ 0.08203125,
943
+ 0.11328125,
944
+ 0.16796875,
945
+ 0.07421875,
946
+ 0.1328125,
947
+ 0.15234375,
948
+ 0.06640625,
949
+ 0.1484375,
950
+ 0.12890625,
951
+ 0.14453125,
952
+ 0.14453125,
953
+ 0.0703125,
954
+ 0.1796875,
955
+ 0.0625,
956
+ 0.11328125,
957
+ 0.078125,
958
+ 0.12109375,
959
+ 0.20703125,
960
+ 0.1953125,
961
+ 0.14453125,
962
+ 0.12109375,
963
+ 0.10546875,
964
+ 0.15625,
965
+ 0.15625,
966
+ 0.3671875,
967
+ 0.16015625,
968
+ 0.140625,
969
+ 0.06640625,
970
+ 0.13671875,
971
+ 0.09765625,
972
+ 0.1171875,
973
+ 0.09765625,
974
+ 0.32421875,
975
+ 0.0625,
976
+ 0.09765625,
977
+ 0.05078125,
978
+ 0.15625,
979
+ 0.0703125,
980
+ 0.15625,
981
+ 0.0859375,
982
+ 0.0703125,
983
+ 0.08984375,
984
+ 0.1171875,
985
+ 0.0703125
986
+ ]
987
+ }
988
+ },
989
+ "first_exact_by_run": {}
990
+ }
991
+ RESULT config=allcorrupt_unigram_shared0p5 ckpt_step=1000 views=512000 token_acc=0.1280 exact=0/64 exact_refs=0 hits=[]
992
+ [noise-pilot] continue config=allcorrupt_unigram_shared0p5 step=1000
993
+ [noise-pilot] round=2 Sun May 17 16:43:11 UTC 2026
994
+ [noise-pilot] train config=allcorrupt_fullvocab_dirC1_1024 from=1000 to=2000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
995
+ [noise-pilot] eval config=allcorrupt_fullvocab_dirC1_1024 step=2000
996
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805 step=2000 soft=none
997
+ [decode] max_len=256 generated=64/64
998
+ {
999
+ "num_rows": 1,
1000
+ "best_by_run": {
1001
+ "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805::none": {
1002
+ "run": "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805",
1003
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805/step_0002000.pt",
1004
+ "ckpt_step": 2000,
1005
+ "endpoint_softening": "none",
1006
+ "decode_rule": "flowmap",
1007
+ "steps": 128,
1008
+ "time_schedule": "logit_normal",
1009
+ "model_t_mode": "post",
1010
+ "final_from": "state",
1011
+ "n_gen": 64,
1012
+ "n_refs": 8,
1013
+ "token_acc_mean": 0.06768798828125,
1014
+ "token_acc_min": 0.046875,
1015
+ "token_acc_max": 0.1171875,
1016
+ "exact_acc": 0.0,
1017
+ "exact_count": 0,
1018
+ "exact_ref_coverage": 0.0,
1019
+ "exact_ref_count": 0,
1020
+ "exact_ref_hits": [],
1021
+ "best_ref_idx": [
1022
+ 7,
1023
+ 0,
1024
+ 0,
1025
+ 0,
1026
+ 0,
1027
+ 5,
1028
+ 0,
1029
+ 0,
1030
+ 0,
1031
+ 0,
1032
+ 0,
1033
+ 5,
1034
+ 0,
1035
+ 0,
1036
+ 5,
1037
+ 5,
1038
+ 0,
1039
+ 0,
1040
+ 0,
1041
+ 0,
1042
+ 0,
1043
+ 0,
1044
+ 7,
1045
+ 5,
1046
+ 0,
1047
+ 0,
1048
+ 5,
1049
+ 0,
1050
+ 5,
1051
+ 0,
1052
+ 0,
1053
+ 0,
1054
+ 0,
1055
+ 0,
1056
+ 0,
1057
+ 0,
1058
+ 0,
1059
+ 5,
1060
+ 0,
1061
+ 0,
1062
+ 0,
1063
+ 0,
1064
+ 0,
1065
+ 0,
1066
+ 0,
1067
+ 0,
1068
+ 0,
1069
+ 0,
1070
+ 0,
1071
+ 0,
1072
+ 0,
1073
+ 0,
1074
+ 0,
1075
+ 0,
1076
+ 0,
1077
+ 0,
1078
+ 0,
1079
+ 0,
1080
+ 1,
1081
+ 0,
1082
+ 0,
1083
+ 7,
1084
+ 0,
1085
+ 1
1086
+ ],
1087
+ "best_token_acc": [
1088
+ 0.05859375,
1089
+ 0.08203125,
1090
+ 0.06640625,
1091
+ 0.0703125,
1092
+ 0.078125,
1093
+ 0.078125,
1094
+ 0.0546875,
1095
+ 0.046875,
1096
+ 0.1015625,
1097
+ 0.05078125,
1098
+ 0.08984375,
1099
+ 0.0625,
1100
+ 0.05078125,
1101
+ 0.0625,
1102
+ 0.09375,
1103
+ 0.06640625,
1104
+ 0.05859375,
1105
+ 0.05078125,
1106
+ 0.05078125,
1107
+ 0.046875,
1108
+ 0.05859375,
1109
+ 0.0546875,
1110
+ 0.05078125,
1111
+ 0.06640625,
1112
+ 0.0625,
1113
+ 0.05859375,
1114
+ 0.05859375,
1115
+ 0.0859375,
1116
+ 0.0625,
1117
+ 0.05078125,
1118
+ 0.0703125,
1119
+ 0.07421875,
1120
+ 0.0546875,
1121
+ 0.08203125,
1122
+ 0.078125,
1123
+ 0.05859375,
1124
+ 0.1171875,
1125
+ 0.0703125,
1126
+ 0.06640625,
1127
+ 0.0546875,
1128
+ 0.1015625,
1129
+ 0.0625,
1130
+ 0.05859375,
1131
+ 0.05078125,
1132
+ 0.0546875,
1133
+ 0.0546875,
1134
+ 0.0625,
1135
+ 0.0546875,
1136
+ 0.1015625,
1137
+ 0.09375,
1138
+ 0.06640625,
1139
+ 0.09375,
1140
+ 0.09375,
1141
+ 0.0625,
1142
+ 0.05078125,
1143
+ 0.05859375,
1144
+ 0.08203125,
1145
+ 0.05078125,
1146
+ 0.09375,
1147
+ 0.0703125,
1148
+ 0.0546875,
1149
+ 0.07421875,
1150
+ 0.0625,
1151
+ 0.06640625
1152
+ ]
1153
+ }
1154
+ },
1155
+ "first_exact_by_run": {}
1156
+ }
1157
+ RESULT config=allcorrupt_fullvocab_dirC1_1024 ckpt_step=2000 views=1024000 token_acc=0.0677 exact=0/64 exact_refs=0 hits=[]
1158
+ [noise-pilot] continue config=allcorrupt_fullvocab_dirC1_1024 step=2000
1159
+ [noise-pilot] train config=allcorrupt_seqrand1_dirC1_1024 from=1000 to=2000 C=1.0->1024 seq_alpha=1.0 sampler=dirichlet
1160
+ [noise-pilot] eval config=allcorrupt_seqrand1_dirC1_1024 step=2000
1161
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805 step=2000 soft=none
1162
+ [decode] max_len=256 generated=64/64
1163
+ {
1164
+ "num_rows": 1,
1165
+ "best_by_run": {
1166
+ "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805::none": {
1167
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805",
1168
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805/step_0002000.pt",
1169
+ "ckpt_step": 2000,
1170
+ "endpoint_softening": "none",
1171
+ "decode_rule": "flowmap",
1172
+ "steps": 128,
1173
+ "time_schedule": "logit_normal",
1174
+ "model_t_mode": "post",
1175
+ "final_from": "state",
1176
+ "n_gen": 64,
1177
+ "n_refs": 8,
1178
+ "token_acc_mean": 0.046875,
1179
+ "token_acc_min": 0.046875,
1180
+ "token_acc_max": 0.046875,
1181
+ "exact_acc": 0.0,
1182
+ "exact_count": 0,
1183
+ "exact_ref_coverage": 0.0,
1184
+ "exact_ref_count": 0,
1185
+ "exact_ref_hits": [],
1186
+ "best_ref_idx": [
1187
+ 1,
1188
+ 1,
1189
+ 1,
1190
+ 1,
1191
+ 1,
1192
+ 1,
1193
+ 1,
1194
+ 1,
1195
+ 1,
1196
+ 1,
1197
+ 1,
1198
+ 1,
1199
+ 1,
1200
+ 1,
1201
+ 1,
1202
+ 1,
1203
+ 1,
1204
+ 1,
1205
+ 1,
1206
+ 1,
1207
+ 1,
1208
+ 1,
1209
+ 1,
1210
+ 1,
1211
+ 1,
1212
+ 1,
1213
+ 1,
1214
+ 1,
1215
+ 1,
1216
+ 1,
1217
+ 1,
1218
+ 1,
1219
+ 1,
1220
+ 1,
1221
+ 1,
1222
+ 1,
1223
+ 1,
1224
+ 1,
1225
+ 1,
1226
+ 1,
1227
+ 1,
1228
+ 1,
1229
+ 1,
1230
+ 1,
1231
+ 1,
1232
+ 1,
1233
+ 1,
1234
+ 1,
1235
+ 1,
1236
+ 1,
1237
+ 1,
1238
+ 1,
1239
+ 1,
1240
+ 1,
1241
+ 1,
1242
+ 1,
1243
+ 1,
1244
+ 1,
1245
+ 1,
1246
+ 1,
1247
+ 1,
1248
+ 1,
1249
+ 1,
1250
+ 1
1251
+ ],
1252
+ "best_token_acc": [
1253
+ 0.046875,
1254
+ 0.046875,
1255
+ 0.046875,
1256
+ 0.046875,
1257
+ 0.046875,
1258
+ 0.046875,
1259
+ 0.046875,
1260
+ 0.046875,
1261
+ 0.046875,
1262
+ 0.046875,
1263
+ 0.046875,
1264
+ 0.046875,
1265
+ 0.046875,
1266
+ 0.046875,
1267
+ 0.046875,
1268
+ 0.046875,
1269
+ 0.046875,
1270
+ 0.046875,
1271
+ 0.046875,
1272
+ 0.046875,
1273
+ 0.046875,
1274
+ 0.046875,
1275
+ 0.046875,
1276
+ 0.046875,
1277
+ 0.046875,
1278
+ 0.046875,
1279
+ 0.046875,
1280
+ 0.046875,
1281
+ 0.046875,
1282
+ 0.046875,
1283
+ 0.046875,
1284
+ 0.046875,
1285
+ 0.046875,
1286
+ 0.046875,
1287
+ 0.046875,
1288
+ 0.046875,
1289
+ 0.046875,
1290
+ 0.046875,
1291
+ 0.046875,
1292
+ 0.046875,
1293
+ 0.046875,
1294
+ 0.046875,
1295
+ 0.046875,
1296
+ 0.046875,
1297
+ 0.046875,
1298
+ 0.046875,
1299
+ 0.046875,
1300
+ 0.046875,
1301
+ 0.046875,
1302
+ 0.046875,
1303
+ 0.046875,
1304
+ 0.046875,
1305
+ 0.046875,
1306
+ 0.046875,
1307
+ 0.046875,
1308
+ 0.046875,
1309
+ 0.046875,
1310
+ 0.046875,
1311
+ 0.046875,
1312
+ 0.046875,
1313
+ 0.046875,
1314
+ 0.046875,
1315
+ 0.046875,
1316
+ 0.046875
1317
+ ]
1318
+ }
1319
+ },
1320
+ "first_exact_by_run": {}
1321
+ }
1322
+ RESULT config=allcorrupt_seqrand1_dirC1_1024 ckpt_step=2000 views=1024000 token_acc=0.0469 exact=0/64 exact_refs=0 hits=[]
1323
+ [noise-pilot] continue config=allcorrupt_seqrand1_dirC1_1024 step=2000
1324
+ [noise-pilot] train config=allcorrupt_highC64_4096 from=1000 to=2000 C=64->4096 seq_alpha=0.0 sampler=dirichlet
1325
+ [noise-pilot] eval config=allcorrupt_highC64_4096 step=2000
1326
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805 step=2000 soft=none
1327
+ [decode] max_len=256 generated=64/64
1328
+ {
1329
+ "num_rows": 1,
1330
+ "best_by_run": {
1331
+ "train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805::none": {
1332
+ "run": "train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805",
1333
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805/step_0002000.pt",
1334
+ "ckpt_step": 2000,
1335
+ "endpoint_softening": "none",
1336
+ "decode_rule": "flowmap",
1337
+ "steps": 128,
1338
+ "time_schedule": "logit_normal",
1339
+ "model_t_mode": "post",
1340
+ "final_from": "state",
1341
+ "n_gen": 64,
1342
+ "n_refs": 8,
1343
+ "token_acc_mean": 0.05987548828125,
1344
+ "token_acc_min": 0.046875,
1345
+ "token_acc_max": 0.07421875,
1346
+ "exact_acc": 0.0,
1347
+ "exact_count": 0,
1348
+ "exact_ref_coverage": 0.0,
1349
+ "exact_ref_count": 0,
1350
+ "exact_ref_hits": [],
1351
+ "best_ref_idx": [
1352
+ 5,
1353
+ 5,
1354
+ 5,
1355
+ 5,
1356
+ 5,
1357
+ 5,
1358
+ 5,
1359
+ 5,
1360
+ 5,
1361
+ 5,
1362
+ 5,
1363
+ 5,
1364
+ 5,
1365
+ 5,
1366
+ 5,
1367
+ 5,
1368
+ 3,
1369
+ 5,
1370
+ 5,
1371
+ 5,
1372
+ 3,
1373
+ 5,
1374
+ 5,
1375
+ 5,
1376
+ 5,
1377
+ 5,
1378
+ 5,
1379
+ 5,
1380
+ 5,
1381
+ 3,
1382
+ 5,
1383
+ 5,
1384
+ 5,
1385
+ 5,
1386
+ 5,
1387
+ 4,
1388
+ 5,
1389
+ 5,
1390
+ 5,
1391
+ 5,
1392
+ 4,
1393
+ 5,
1394
+ 5,
1395
+ 5,
1396
+ 5,
1397
+ 4,
1398
+ 5,
1399
+ 5,
1400
+ 5,
1401
+ 3,
1402
+ 5,
1403
+ 5,
1404
+ 5,
1405
+ 5,
1406
+ 5,
1407
+ 5,
1408
+ 5,
1409
+ 5,
1410
+ 5,
1411
+ 5,
1412
+ 5,
1413
+ 5,
1414
+ 5,
1415
+ 5
1416
+ ],
1417
+ "best_token_acc": [
1418
+ 0.0546875,
1419
+ 0.0625,
1420
+ 0.0703125,
1421
+ 0.0546875,
1422
+ 0.0546875,
1423
+ 0.0546875,
1424
+ 0.0625,
1425
+ 0.06640625,
1426
+ 0.0546875,
1427
+ 0.05859375,
1428
+ 0.0546875,
1429
+ 0.0625,
1430
+ 0.0625,
1431
+ 0.0625,
1432
+ 0.06640625,
1433
+ 0.05859375,
1434
+ 0.0546875,
1435
+ 0.0625,
1436
+ 0.0546875,
1437
+ 0.05859375,
1438
+ 0.0546875,
1439
+ 0.07421875,
1440
+ 0.05859375,
1441
+ 0.05859375,
1442
+ 0.0625,
1443
+ 0.0703125,
1444
+ 0.06640625,
1445
+ 0.06640625,
1446
+ 0.0703125,
1447
+ 0.05078125,
1448
+ 0.0546875,
1449
+ 0.0546875,
1450
+ 0.0625,
1451
+ 0.0625,
1452
+ 0.07421875,
1453
+ 0.0546875,
1454
+ 0.0546875,
1455
+ 0.06640625,
1456
+ 0.0546875,
1457
+ 0.0546875,
1458
+ 0.05078125,
1459
+ 0.0546875,
1460
+ 0.05859375,
1461
+ 0.0625,
1462
+ 0.0546875,
1463
+ 0.05859375,
1464
+ 0.05859375,
1465
+ 0.0703125,
1466
+ 0.0546875,
1467
+ 0.05859375,
1468
+ 0.06640625,
1469
+ 0.05859375,
1470
+ 0.07421875,
1471
+ 0.0625,
1472
+ 0.046875,
1473
+ 0.05859375,
1474
+ 0.05859375,
1475
+ 0.0625,
1476
+ 0.05859375,
1477
+ 0.05859375,
1478
+ 0.0625,
1479
+ 0.0546875,
1480
+ 0.0546875,
1481
+ 0.0546875
1482
+ ]
1483
+ }
1484
+ },
1485
+ "first_exact_by_run": {}
1486
+ }
1487
+ RESULT config=allcorrupt_highC64_4096 ckpt_step=2000 views=1024000 token_acc=0.0599 exact=0/64 exact_refs=0 hits=[]
1488
+ [noise-pilot] continue config=allcorrupt_highC64_4096 step=2000
1489
+ [noise-pilot] train config=allcorrupt_logistic_sig0p05_0p5 from=1000 to=2000 C=1.0->1024 seq_alpha=0.0 sampler=logistic_normal_linear_mean
1490
+ [noise-pilot] eval config=allcorrupt_logistic_sig0p05_0p5 step=2000
1491
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805 step=2000 soft=none
1492
+ [decode] max_len=256 generated=64/64
1493
+ {
1494
+ "num_rows": 1,
1495
+ "best_by_run": {
1496
+ "train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805::none": {
1497
+ "run": "train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805",
1498
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805/step_0002000.pt",
1499
+ "ckpt_step": 2000,
1500
+ "endpoint_softening": "none",
1501
+ "decode_rule": "flowmap",
1502
+ "steps": 128,
1503
+ "time_schedule": "logit_normal",
1504
+ "model_t_mode": "post",
1505
+ "final_from": "state",
1506
+ "n_gen": 64,
1507
+ "n_refs": 8,
1508
+ "token_acc_mean": 0.07275390625,
1509
+ "token_acc_min": 0.046875,
1510
+ "token_acc_max": 0.140625,
1511
+ "exact_acc": 0.0,
1512
+ "exact_count": 0,
1513
+ "exact_ref_coverage": 0.0,
1514
+ "exact_ref_count": 0,
1515
+ "exact_ref_hits": [],
1516
+ "best_ref_idx": [
1517
+ 3,
1518
+ 7,
1519
+ 3,
1520
+ 2,
1521
+ 2,
1522
+ 2,
1523
+ 2,
1524
+ 2,
1525
+ 7,
1526
+ 3,
1527
+ 7,
1528
+ 3,
1529
+ 3,
1530
+ 2,
1531
+ 0,
1532
+ 0,
1533
+ 0,
1534
+ 7,
1535
+ 3,
1536
+ 2,
1537
+ 0,
1538
+ 0,
1539
+ 0,
1540
+ 2,
1541
+ 7,
1542
+ 0,
1543
+ 2,
1544
+ 3,
1545
+ 2,
1546
+ 5,
1547
+ 3,
1548
+ 3,
1549
+ 3,
1550
+ 5,
1551
+ 0,
1552
+ 7,
1553
+ 0,
1554
+ 3,
1555
+ 0,
1556
+ 2,
1557
+ 0,
1558
+ 3,
1559
+ 2,
1560
+ 7,
1561
+ 7,
1562
+ 0,
1563
+ 2,
1564
+ 7,
1565
+ 3,
1566
+ 0,
1567
+ 3,
1568
+ 0,
1569
+ 0,
1570
+ 3,
1571
+ 0,
1572
+ 0,
1573
+ 0,
1574
+ 2,
1575
+ 2,
1576
+ 3,
1577
+ 3,
1578
+ 7,
1579
+ 3,
1580
+ 3
1581
+ ],
1582
+ "best_token_acc": [
1583
+ 0.05859375,
1584
+ 0.05859375,
1585
+ 0.06640625,
1586
+ 0.0625,
1587
+ 0.10546875,
1588
+ 0.08203125,
1589
+ 0.078125,
1590
+ 0.140625,
1591
+ 0.05859375,
1592
+ 0.07421875,
1593
+ 0.0703125,
1594
+ 0.0625,
1595
+ 0.08984375,
1596
+ 0.0703125,
1597
+ 0.046875,
1598
+ 0.0546875,
1599
+ 0.07421875,
1600
+ 0.06640625,
1601
+ 0.0625,
1602
+ 0.0546875,
1603
+ 0.05859375,
1604
+ 0.0703125,
1605
+ 0.0703125,
1606
+ 0.0703125,
1607
+ 0.0546875,
1608
+ 0.0625,
1609
+ 0.1015625,
1610
+ 0.0625,
1611
+ 0.07421875,
1612
+ 0.08203125,
1613
+ 0.12109375,
1614
+ 0.0625,
1615
+ 0.06640625,
1616
+ 0.06640625,
1617
+ 0.0546875,
1618
+ 0.0703125,
1619
+ 0.0625,
1620
+ 0.0703125,
1621
+ 0.0546875,
1622
+ 0.0703125,
1623
+ 0.0703125,
1624
+ 0.12109375,
1625
+ 0.08984375,
1626
+ 0.06640625,
1627
+ 0.06640625,
1628
+ 0.078125,
1629
+ 0.125,
1630
+ 0.0703125,
1631
+ 0.08203125,
1632
+ 0.05859375,
1633
+ 0.0703125,
1634
+ 0.08984375,
1635
+ 0.09765625,
1636
+ 0.0625,
1637
+ 0.0625,
1638
+ 0.05859375,
1639
+ 0.06640625,
1640
+ 0.06640625,
1641
+ 0.0859375,
1642
+ 0.06640625,
1643
+ 0.078125,
1644
+ 0.07421875,
1645
+ 0.05078125,
1646
+ 0.0546875
1647
+ ]
1648
+ }
1649
+ },
1650
+ "first_exact_by_run": {}
1651
+ }
1652
+ RESULT config=allcorrupt_logistic_sig0p05_0p5 ckpt_step=2000 views=1024000 token_acc=0.0728 exact=0/64 exact_refs=0 hits=[]
1653
+ [noise-pilot] continue config=allcorrupt_logistic_sig0p05_0p5 step=2000
1654
+ [noise-pilot] train config=allcorrupt_seqrand1_highC64_4096 from=1000 to=2000 C=64->4096 seq_alpha=1.0 sampler=dirichlet
1655
+ [noise-pilot] eval config=allcorrupt_seqrand1_highC64_4096 step=2000
1656
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805 step=2000 soft=none
1657
+ [decode] max_len=256 generated=64/64
1658
+ {
1659
+ "num_rows": 1,
1660
+ "best_by_run": {
1661
+ "train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805::none": {
1662
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805",
1663
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805/step_0002000.pt",
1664
+ "ckpt_step": 2000,
1665
+ "endpoint_softening": "none",
1666
+ "decode_rule": "flowmap",
1667
+ "steps": 128,
1668
+ "time_schedule": "logit_normal",
1669
+ "model_t_mode": "post",
1670
+ "final_from": "state",
1671
+ "n_gen": 64,
1672
+ "n_refs": 8,
1673
+ "token_acc_mean": 0.07476806640625,
1674
+ "token_acc_min": 0.0234375,
1675
+ "token_acc_max": 0.26171875,
1676
+ "exact_acc": 0.0,
1677
+ "exact_count": 0,
1678
+ "exact_ref_coverage": 0.0,
1679
+ "exact_ref_count": 0,
1680
+ "exact_ref_hits": [],
1681
+ "best_ref_idx": [
1682
+ 7,
1683
+ 7,
1684
+ 0,
1685
+ 7,
1686
+ 7,
1687
+ 3,
1688
+ 7,
1689
+ 7,
1690
+ 0,
1691
+ 3,
1692
+ 4,
1693
+ 5,
1694
+ 7,
1695
+ 0,
1696
+ 7,
1697
+ 0,
1698
+ 7,
1699
+ 0,
1700
+ 5,
1701
+ 3,
1702
+ 7,
1703
+ 7,
1704
+ 7,
1705
+ 7,
1706
+ 7,
1707
+ 3,
1708
+ 5,
1709
+ 5,
1710
+ 5,
1711
+ 0,
1712
+ 7,
1713
+ 7,
1714
+ 5,
1715
+ 5,
1716
+ 4,
1717
+ 7,
1718
+ 0,
1719
+ 3,
1720
+ 0,
1721
+ 7,
1722
+ 5,
1723
+ 0,
1724
+ 3,
1725
+ 5,
1726
+ 7,
1727
+ 0,
1728
+ 5,
1729
+ 7,
1730
+ 0,
1731
+ 5,
1732
+ 5,
1733
+ 5,
1734
+ 4,
1735
+ 7,
1736
+ 4,
1737
+ 7,
1738
+ 3,
1739
+ 7,
1740
+ 3,
1741
+ 7,
1742
+ 5,
1743
+ 7,
1744
+ 3,
1745
+ 4
1746
+ ],
1747
+ "best_token_acc": [
1748
+ 0.234375,
1749
+ 0.03515625,
1750
+ 0.0390625,
1751
+ 0.046875,
1752
+ 0.08203125,
1753
+ 0.03515625,
1754
+ 0.05859375,
1755
+ 0.17578125,
1756
+ 0.03515625,
1757
+ 0.03125,
1758
+ 0.02734375,
1759
+ 0.03125,
1760
+ 0.05078125,
1761
+ 0.03515625,
1762
+ 0.234375,
1763
+ 0.03515625,
1764
+ 0.234375,
1765
+ 0.02734375,
1766
+ 0.05078125,
1767
+ 0.0390625,
1768
+ 0.04296875,
1769
+ 0.21875,
1770
+ 0.04296875,
1771
+ 0.03125,
1772
+ 0.26171875,
1773
+ 0.03515625,
1774
+ 0.046875,
1775
+ 0.04296875,
1776
+ 0.03515625,
1777
+ 0.03515625,
1778
+ 0.23046875,
1779
+ 0.03125,
1780
+ 0.0390625,
1781
+ 0.0390625,
1782
+ 0.03125,
1783
+ 0.0703125,
1784
+ 0.0703125,
1785
+ 0.046875,
1786
+ 0.0625,
1787
+ 0.25,
1788
+ 0.03515625,
1789
+ 0.03515625,
1790
+ 0.03515625,
1791
+ 0.0390625,
1792
+ 0.16796875,
1793
+ 0.02734375,
1794
+ 0.03515625,
1795
+ 0.21875,
1796
+ 0.05859375,
1797
+ 0.03125,
1798
+ 0.03515625,
1799
+ 0.046875,
1800
+ 0.03125,
1801
+ 0.0390625,
1802
+ 0.03125,
1803
+ 0.04296875,
1804
+ 0.03515625,
1805
+ 0.234375,
1806
+ 0.03125,
1807
+ 0.0546875,
1808
+ 0.03515625,
1809
+ 0.21875,
1810
+ 0.0390625,
1811
+ 0.0234375
1812
+ ]
1813
+ }
1814
+ },
1815
+ "first_exact_by_run": {}
1816
+ }
1817
+ RESULT config=allcorrupt_seqrand1_highC64_4096 ckpt_step=2000 views=1024000 token_acc=0.0748 exact=0/64 exact_refs=0 hits=[]
1818
+ [noise-pilot] continue config=allcorrupt_seqrand1_highC64_4096 step=2000
1819
+ [noise-pilot] train config=allcorrupt_unigram_shared0p5 from=1000 to=2000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
1820
+ [noise-pilot] start stamp=20260517_163805 len=256 vocab=969 out=docs/lta_samples/metrics_20260517/noise_geometry_pilots_len256_bs512_ode128_20260517_163805
1821
+ [noise-pilot] round=1 Sun May 17 16:50:07 UTC 2026
1822
+ [noise-pilot] train config=allcorrupt_fullvocab_dirC1_1024 from=2000 to=3000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
1823
+ [noise-pilot] eval config=allcorrupt_fullvocab_dirC1_1024 step=3000
1824
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805 step=3000 soft=none
1825
+ [decode] max_len=256 generated=64/64
1826
+ {
1827
+ "num_rows": 1,
1828
+ "best_by_run": {
1829
+ "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805::none": {
1830
+ "run": "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805",
1831
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805/step_0003000.pt",
1832
+ "ckpt_step": 3000,
1833
+ "endpoint_softening": "none",
1834
+ "decode_rule": "flowmap",
1835
+ "steps": 128,
1836
+ "time_schedule": "logit_normal",
1837
+ "model_t_mode": "post",
1838
+ "final_from": "state",
1839
+ "n_gen": 64,
1840
+ "n_refs": 8,
1841
+ "token_acc_mean": 0.1204833984375,
1842
+ "token_acc_min": 0.05859375,
1843
+ "token_acc_max": 0.26953125,
1844
+ "exact_acc": 0.0,
1845
+ "exact_count": 0,
1846
+ "exact_ref_coverage": 0.0,
1847
+ "exact_ref_count": 0,
1848
+ "exact_ref_hits": [],
1849
+ "best_ref_idx": [
1850
+ 1,
1851
+ 4,
1852
+ 4,
1853
+ 7,
1854
+ 5,
1855
+ 7,
1856
+ 4,
1857
+ 5,
1858
+ 7,
1859
+ 0,
1860
+ 5,
1861
+ 3,
1862
+ 3,
1863
+ 4,
1864
+ 7,
1865
+ 7,
1866
+ 5,
1867
+ 5,
1868
+ 7,
1869
+ 7,
1870
+ 1,
1871
+ 2,
1872
+ 3,
1873
+ 5,
1874
+ 2,
1875
+ 3,
1876
+ 7,
1877
+ 2,
1878
+ 5,
1879
+ 5,
1880
+ 2,
1881
+ 5,
1882
+ 1,
1883
+ 2,
1884
+ 7,
1885
+ 5,
1886
+ 5,
1887
+ 7,
1888
+ 3,
1889
+ 5,
1890
+ 5,
1891
+ 7,
1892
+ 5,
1893
+ 5,
1894
+ 3,
1895
+ 5,
1896
+ 5,
1897
+ 7,
1898
+ 2,
1899
+ 4,
1900
+ 2,
1901
+ 7,
1902
+ 5,
1903
+ 2,
1904
+ 3,
1905
+ 4,
1906
+ 1,
1907
+ 5,
1908
+ 5,
1909
+ 2,
1910
+ 5,
1911
+ 5,
1912
+ 5,
1913
+ 5
1914
+ ],
1915
+ "best_token_acc": [
1916
+ 0.08203125,
1917
+ 0.07421875,
1918
+ 0.0703125,
1919
+ 0.125,
1920
+ 0.07421875,
1921
+ 0.078125,
1922
+ 0.0703125,
1923
+ 0.1875,
1924
+ 0.05859375,
1925
+ 0.08984375,
1926
+ 0.14453125,
1927
+ 0.078125,
1928
+ 0.14453125,
1929
+ 0.07421875,
1930
+ 0.11328125,
1931
+ 0.08203125,
1932
+ 0.12109375,
1933
+ 0.19140625,
1934
+ 0.08984375,
1935
+ 0.0703125,
1936
+ 0.2421875,
1937
+ 0.14453125,
1938
+ 0.08203125,
1939
+ 0.05859375,
1940
+ 0.0859375,
1941
+ 0.1015625,
1942
+ 0.1015625,
1943
+ 0.26953125,
1944
+ 0.1875,
1945
+ 0.171875,
1946
+ 0.07421875,
1947
+ 0.1640625,
1948
+ 0.0625,
1949
+ 0.06640625,
1950
+ 0.125,
1951
+ 0.16015625,
1952
+ 0.08984375,
1953
+ 0.09375,
1954
+ 0.09375,
1955
+ 0.08984375,
1956
+ 0.09375,
1957
+ 0.15625,
1958
+ 0.12890625,
1959
+ 0.2578125,
1960
+ 0.0625,
1961
+ 0.109375,
1962
+ 0.16796875,
1963
+ 0.21875,
1964
+ 0.07421875,
1965
+ 0.0703125,
1966
+ 0.15234375,
1967
+ 0.08984375,
1968
+ 0.17578125,
1969
+ 0.1484375,
1970
+ 0.1328125,
1971
+ 0.06640625,
1972
+ 0.0625,
1973
+ 0.109375,
1974
+ 0.109375,
1975
+ 0.15234375,
1976
+ 0.171875,
1977
+ 0.20703125,
1978
+ 0.10546875,
1979
+ 0.203125
1980
+ ]
1981
+ }
1982
+ },
1983
+ "first_exact_by_run": {}
1984
+ }
1985
+ RESULT config=allcorrupt_fullvocab_dirC1_1024 ckpt_step=3000 views=1536000 token_acc=0.1205 exact=0/64 exact_refs=0 hits=[]
1986
+ [noise-pilot] continue config=allcorrupt_fullvocab_dirC1_1024 step=3000
1987
+ [noise-pilot] train config=allcorrupt_seqrand1_dirC1_1024 from=2000 to=3000 C=1.0->1024 seq_alpha=1.0 sampler=dirichlet
1988
+ [noise-pilot] eval config=allcorrupt_seqrand1_dirC1_1024 step=3000
1989
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805 step=3000 soft=none
1990
+ [decode] max_len=256 generated=64/64
1991
+ {
1992
+ "num_rows": 1,
1993
+ "best_by_run": {
1994
+ "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805::none": {
1995
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805",
1996
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805/step_0003000.pt",
1997
+ "ckpt_step": 3000,
1998
+ "endpoint_softening": "none",
1999
+ "decode_rule": "flowmap",
2000
+ "steps": 128,
2001
+ "time_schedule": "logit_normal",
2002
+ "model_t_mode": "post",
2003
+ "final_from": "state",
2004
+ "n_gen": 64,
2005
+ "n_refs": 8,
2006
+ "token_acc_mean": 0.0350341796875,
2007
+ "token_acc_min": 0.02734375,
2008
+ "token_acc_max": 0.03515625,
2009
+ "exact_acc": 0.0,
2010
+ "exact_count": 0,
2011
+ "exact_ref_coverage": 0.0,
2012
+ "exact_ref_count": 0,
2013
+ "exact_ref_hits": [],
2014
+ "best_ref_idx": [
2015
+ 2,
2016
+ 2,
2017
+ 2,
2018
+ 2,
2019
+ 2,
2020
+ 2,
2021
+ 2,
2022
+ 2,
2023
+ 2,
2024
+ 2,
2025
+ 2,
2026
+ 2,
2027
+ 2,
2028
+ 2,
2029
+ 2,
2030
+ 2,
2031
+ 2,
2032
+ 2,
2033
+ 2,
2034
+ 2,
2035
+ 2,
2036
+ 2,
2037
+ 2,
2038
+ 2,
2039
+ 2,
2040
+ 2,
2041
+ 2,
2042
+ 2,
2043
+ 2,
2044
+ 2,
2045
+ 2,
2046
+ 2,
2047
+ 2,
2048
+ 2,
2049
+ 2,
2050
+ 2,
2051
+ 2,
2052
+ 2,
2053
+ 2,
2054
+ 2,
2055
+ 2,
2056
+ 2,
2057
+ 2,
2058
+ 2,
2059
+ 2,
2060
+ 2,
2061
+ 2,
2062
+ 2,
2063
+ 2,
2064
+ 2,
2065
+ 2,
2066
+ 2,
2067
+ 2,
2068
+ 2,
2069
+ 2,
2070
+ 2,
2071
+ 2,
2072
+ 2,
2073
+ 2,
2074
+ 2,
2075
+ 2,
2076
+ 2,
2077
+ 4,
2078
+ 2
2079
+ ],
2080
+ "best_token_acc": [
2081
+ 0.03515625,
2082
+ 0.03515625,
2083
+ 0.03515625,
2084
+ 0.03515625,
2085
+ 0.03515625,
2086
+ 0.03515625,
2087
+ 0.03515625,
2088
+ 0.03515625,
2089
+ 0.03515625,
2090
+ 0.03515625,
2091
+ 0.03515625,
2092
+ 0.03515625,
2093
+ 0.03515625,
2094
+ 0.03515625,
2095
+ 0.03515625,
2096
+ 0.03515625,
2097
+ 0.03515625,
2098
+ 0.03515625,
2099
+ 0.03515625,
2100
+ 0.03515625,
2101
+ 0.03515625,
2102
+ 0.03515625,
2103
+ 0.03515625,
2104
+ 0.03515625,
2105
+ 0.03515625,
2106
+ 0.03515625,
2107
+ 0.03515625,
2108
+ 0.03515625,
2109
+ 0.03515625,
2110
+ 0.03515625,
2111
+ 0.03515625,
2112
+ 0.03515625,
2113
+ 0.03515625,
2114
+ 0.03515625,
2115
+ 0.03515625,
2116
+ 0.03515625,
2117
+ 0.03515625,
2118
+ 0.03515625,
2119
+ 0.03515625,
2120
+ 0.03515625,
2121
+ 0.03515625,
2122
+ 0.03515625,
2123
+ 0.03515625,
2124
+ 0.03515625,
2125
+ 0.03515625,
2126
+ 0.03515625,
2127
+ 0.03515625,
2128
+ 0.03515625,
2129
+ 0.03515625,
2130
+ 0.03515625,
2131
+ 0.03515625,
2132
+ 0.03515625,
2133
+ 0.03515625,
2134
+ 0.03515625,
2135
+ 0.03515625,
2136
+ 0.03515625,
2137
+ 0.03515625,
2138
+ 0.03515625,
2139
+ 0.03515625,
2140
+ 0.03515625,
2141
+ 0.03515625,
2142
+ 0.03515625,
2143
+ 0.02734375,
2144
+ 0.03515625
2145
+ ]
2146
+ }
2147
+ },
2148
+ "first_exact_by_run": {}
2149
+ }
2150
+ RESULT config=allcorrupt_seqrand1_dirC1_1024 ckpt_step=3000 views=1536000 token_acc=0.0350 exact=0/64 exact_refs=0 hits=[]
2151
+ [noise-pilot] continue config=allcorrupt_seqrand1_dirC1_1024 step=3000
2152
+ [noise-pilot] train config=allcorrupt_highC64_4096 from=2000 to=3000 C=64->4096 seq_alpha=0.0 sampler=dirichlet
2153
+ [noise-pilot] eval config=allcorrupt_highC64_4096 step=3000
2154
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805 step=3000 soft=none
2155
+ [decode] max_len=256 generated=64/64
2156
+ {
2157
+ "num_rows": 1,
2158
+ "best_by_run": {
2159
+ "train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805::none": {
2160
+ "run": "train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805",
2161
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805/step_0003000.pt",
2162
+ "ckpt_step": 3000,
2163
+ "endpoint_softening": "none",
2164
+ "decode_rule": "flowmap",
2165
+ "steps": 128,
2166
+ "time_schedule": "logit_normal",
2167
+ "model_t_mode": "post",
2168
+ "final_from": "state",
2169
+ "n_gen": 64,
2170
+ "n_refs": 8,
2171
+ "token_acc_mean": 0.0899658203125,
2172
+ "token_acc_min": 0.05078125,
2173
+ "token_acc_max": 0.14453125,
2174
+ "exact_acc": 0.0,
2175
+ "exact_count": 0,
2176
+ "exact_ref_coverage": 0.0,
2177
+ "exact_ref_count": 0,
2178
+ "exact_ref_hits": [],
2179
+ "best_ref_idx": [
2180
+ 6,
2181
+ 6,
2182
+ 7,
2183
+ 5,
2184
+ 5,
2185
+ 6,
2186
+ 6,
2187
+ 6,
2188
+ 6,
2189
+ 6,
2190
+ 6,
2191
+ 6,
2192
+ 6,
2193
+ 6,
2194
+ 6,
2195
+ 6,
2196
+ 5,
2197
+ 5,
2198
+ 6,
2199
+ 6,
2200
+ 5,
2201
+ 5,
2202
+ 0,
2203
+ 6,
2204
+ 6,
2205
+ 5,
2206
+ 6,
2207
+ 6,
2208
+ 5,
2209
+ 6,
2210
+ 5,
2211
+ 4,
2212
+ 6,
2213
+ 6,
2214
+ 6,
2215
+ 6,
2216
+ 6,
2217
+ 6,
2218
+ 7,
2219
+ 5,
2220
+ 6,
2221
+ 6,
2222
+ 4,
2223
+ 5,
2224
+ 5,
2225
+ 5,
2226
+ 0,
2227
+ 6,
2228
+ 6,
2229
+ 5,
2230
+ 5,
2231
+ 6,
2232
+ 5,
2233
+ 5,
2234
+ 5,
2235
+ 6,
2236
+ 6,
2237
+ 6,
2238
+ 5,
2239
+ 5,
2240
+ 6,
2241
+ 6,
2242
+ 5,
2243
+ 6
2244
+ ],
2245
+ "best_token_acc": [
2246
+ 0.0703125,
2247
+ 0.08203125,
2248
+ 0.08203125,
2249
+ 0.06640625,
2250
+ 0.078125,
2251
+ 0.0859375,
2252
+ 0.09375,
2253
+ 0.11328125,
2254
+ 0.0859375,
2255
+ 0.10546875,
2256
+ 0.09375,
2257
+ 0.10546875,
2258
+ 0.08984375,
2259
+ 0.09765625,
2260
+ 0.0859375,
2261
+ 0.10546875,
2262
+ 0.06640625,
2263
+ 0.0703125,
2264
+ 0.14453125,
2265
+ 0.11328125,
2266
+ 0.078125,
2267
+ 0.08203125,
2268
+ 0.05078125,
2269
+ 0.08984375,
2270
+ 0.109375,
2271
+ 0.09375,
2272
+ 0.10546875,
2273
+ 0.125,
2274
+ 0.07421875,
2275
+ 0.1015625,
2276
+ 0.078125,
2277
+ 0.0625,
2278
+ 0.12109375,
2279
+ 0.09375,
2280
+ 0.08203125,
2281
+ 0.08984375,
2282
+ 0.109375,
2283
+ 0.078125,
2284
+ 0.078125,
2285
+ 0.08203125,
2286
+ 0.08203125,
2287
+ 0.1015625,
2288
+ 0.0625,
2289
+ 0.05859375,
2290
+ 0.078125,
2291
+ 0.0703125,
2292
+ 0.07421875,
2293
+ 0.08984375,
2294
+ 0.10546875,
2295
+ 0.078125,
2296
+ 0.0625,
2297
+ 0.12890625,
2298
+ 0.06640625,
2299
+ 0.08203125,
2300
+ 0.0859375,
2301
+ 0.12890625,
2302
+ 0.09375,
2303
+ 0.09375,
2304
+ 0.0859375,
2305
+ 0.0859375,
2306
+ 0.1171875,
2307
+ 0.12109375,
2308
+ 0.078125,
2309
+ 0.10546875
2310
+ ]
2311
+ }
2312
+ },
2313
+ "first_exact_by_run": {}
2314
+ }
2315
+ RESULT config=allcorrupt_highC64_4096 ckpt_step=3000 views=1536000 token_acc=0.0900 exact=0/64 exact_refs=0 hits=[]
2316
+ [noise-pilot] continue config=allcorrupt_highC64_4096 step=3000
2317
+ [noise-pilot] train config=allcorrupt_logistic_sig0p05_0p5 from=2000 to=3000 C=1.0->1024 seq_alpha=0.0 sampler=logistic_normal_linear_mean
2318
+ [noise-pilot] eval config=allcorrupt_logistic_sig0p05_0p5 step=3000
2319
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805 step=3000 soft=none
2320
+ [decode] max_len=256 generated=64/64
2321
+ {
2322
+ "num_rows": 1,
2323
+ "best_by_run": {
2324
+ "train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805::none": {
2325
+ "run": "train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805",
2326
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805/step_0003000.pt",
2327
+ "ckpt_step": 3000,
2328
+ "endpoint_softening": "none",
2329
+ "decode_rule": "flowmap",
2330
+ "steps": 128,
2331
+ "time_schedule": "logit_normal",
2332
+ "model_t_mode": "post",
2333
+ "final_from": "state",
2334
+ "n_gen": 64,
2335
+ "n_refs": 8,
2336
+ "token_acc_mean": 0.07470703125,
2337
+ "token_acc_min": 0.046875,
2338
+ "token_acc_max": 0.1875,
2339
+ "exact_acc": 0.0,
2340
+ "exact_count": 0,
2341
+ "exact_ref_coverage": 0.0,
2342
+ "exact_ref_count": 0,
2343
+ "exact_ref_hits": [],
2344
+ "best_ref_idx": [
2345
+ 2,
2346
+ 3,
2347
+ 5,
2348
+ 5,
2349
+ 5,
2350
+ 2,
2351
+ 7,
2352
+ 2,
2353
+ 2,
2354
+ 3,
2355
+ 5,
2356
+ 3,
2357
+ 5,
2358
+ 3,
2359
+ 7,
2360
+ 7,
2361
+ 5,
2362
+ 7,
2363
+ 7,
2364
+ 2,
2365
+ 2,
2366
+ 1,
2367
+ 3,
2368
+ 5,
2369
+ 7,
2370
+ 3,
2371
+ 5,
2372
+ 3,
2373
+ 7,
2374
+ 5,
2375
+ 3,
2376
+ 5,
2377
+ 3,
2378
+ 5,
2379
+ 2,
2380
+ 2,
2381
+ 5,
2382
+ 3,
2383
+ 5,
2384
+ 7,
2385
+ 3,
2386
+ 7,
2387
+ 5,
2388
+ 5,
2389
+ 7,
2390
+ 7,
2391
+ 7,
2392
+ 3,
2393
+ 7,
2394
+ 2,
2395
+ 5,
2396
+ 7,
2397
+ 3,
2398
+ 7,
2399
+ 5,
2400
+ 3,
2401
+ 7,
2402
+ 3,
2403
+ 5,
2404
+ 5,
2405
+ 7,
2406
+ 5,
2407
+ 5,
2408
+ 5
2409
+ ],
2410
+ "best_token_acc": [
2411
+ 0.0703125,
2412
+ 0.06640625,
2413
+ 0.07421875,
2414
+ 0.10546875,
2415
+ 0.09765625,
2416
+ 0.0703125,
2417
+ 0.08203125,
2418
+ 0.05078125,
2419
+ 0.06640625,
2420
+ 0.0703125,
2421
+ 0.07421875,
2422
+ 0.0625,
2423
+ 0.08984375,
2424
+ 0.05859375,
2425
+ 0.12109375,
2426
+ 0.1875,
2427
+ 0.0703125,
2428
+ 0.0703125,
2429
+ 0.05859375,
2430
+ 0.0625,
2431
+ 0.046875,
2432
+ 0.05859375,
2433
+ 0.046875,
2434
+ 0.07421875,
2435
+ 0.08203125,
2436
+ 0.0703125,
2437
+ 0.0625,
2438
+ 0.05078125,
2439
+ 0.09765625,
2440
+ 0.0703125,
2441
+ 0.0625,
2442
+ 0.078125,
2443
+ 0.06640625,
2444
+ 0.08203125,
2445
+ 0.05859375,
2446
+ 0.05859375,
2447
+ 0.09765625,
2448
+ 0.0625,
2449
+ 0.08984375,
2450
+ 0.1015625,
2451
+ 0.0625,
2452
+ 0.078125,
2453
+ 0.109375,
2454
+ 0.078125,
2455
+ 0.0859375,
2456
+ 0.11328125,
2457
+ 0.0703125,
2458
+ 0.0625,
2459
+ 0.05078125,
2460
+ 0.06640625,
2461
+ 0.078125,
2462
+ 0.07421875,
2463
+ 0.06640625,
2464
+ 0.06640625,
2465
+ 0.0703125,
2466
+ 0.0546875,
2467
+ 0.05859375,
2468
+ 0.06640625,
2469
+ 0.078125,
2470
+ 0.0703125,
2471
+ 0.06640625,
2472
+ 0.07421875,
2473
+ 0.078125,
2474
+ 0.07421875
2475
+ ]
2476
+ }
2477
+ },
2478
+ "first_exact_by_run": {}
2479
+ }
2480
+ RESULT config=allcorrupt_logistic_sig0p05_0p5 ckpt_step=3000 views=1536000 token_acc=0.0747 exact=0/64 exact_refs=0 hits=[]
2481
+ [noise-pilot] continue config=allcorrupt_logistic_sig0p05_0p5 step=3000
2482
+ [noise-pilot] train config=allcorrupt_seqrand1_highC64_4096 from=2000 to=3000 C=64->4096 seq_alpha=1.0 sampler=dirichlet
2483
+ [noise-pilot] eval config=allcorrupt_seqrand1_highC64_4096 step=3000
2484
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805 step=3000 soft=none
2485
+ [decode] max_len=256 generated=64/64
2486
+ {
2487
+ "num_rows": 1,
2488
+ "best_by_run": {
2489
+ "train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805::none": {
2490
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805",
2491
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805/step_0003000.pt",
2492
+ "ckpt_step": 3000,
2493
+ "endpoint_softening": "none",
2494
+ "decode_rule": "flowmap",
2495
+ "steps": 128,
2496
+ "time_schedule": "logit_normal",
2497
+ "model_t_mode": "post",
2498
+ "final_from": "state",
2499
+ "n_gen": 64,
2500
+ "n_refs": 8,
2501
+ "token_acc_mean": 0.207763671875,
2502
+ "token_acc_min": 0.046875,
2503
+ "token_acc_max": 0.28125,
2504
+ "exact_acc": 0.0,
2505
+ "exact_count": 0,
2506
+ "exact_ref_coverage": 0.0,
2507
+ "exact_ref_count": 0,
2508
+ "exact_ref_hits": [],
2509
+ "best_ref_idx": [
2510
+ 0,
2511
+ 0,
2512
+ 0,
2513
+ 0,
2514
+ 0,
2515
+ 0,
2516
+ 0,
2517
+ 0,
2518
+ 0,
2519
+ 0,
2520
+ 0,
2521
+ 0,
2522
+ 0,
2523
+ 0,
2524
+ 0,
2525
+ 0,
2526
+ 0,
2527
+ 0,
2528
+ 0,
2529
+ 0,
2530
+ 0,
2531
+ 0,
2532
+ 0,
2533
+ 0,
2534
+ 0,
2535
+ 0,
2536
+ 0,
2537
+ 1,
2538
+ 0,
2539
+ 0,
2540
+ 0,
2541
+ 0,
2542
+ 0,
2543
+ 0,
2544
+ 0,
2545
+ 0,
2546
+ 0,
2547
+ 0,
2548
+ 0,
2549
+ 0,
2550
+ 0,
2551
+ 0,
2552
+ 0,
2553
+ 0,
2554
+ 0,
2555
+ 0,
2556
+ 0,
2557
+ 0,
2558
+ 0,
2559
+ 0,
2560
+ 0,
2561
+ 0,
2562
+ 0,
2563
+ 0,
2564
+ 0,
2565
+ 0,
2566
+ 0,
2567
+ 0,
2568
+ 0,
2569
+ 0,
2570
+ 0,
2571
+ 0,
2572
+ 0,
2573
+ 0
2574
+ ],
2575
+ "best_token_acc": [
2576
+ 0.234375,
2577
+ 0.10546875,
2578
+ 0.2578125,
2579
+ 0.2265625,
2580
+ 0.2578125,
2581
+ 0.171875,
2582
+ 0.11328125,
2583
+ 0.25390625,
2584
+ 0.16015625,
2585
+ 0.234375,
2586
+ 0.28125,
2587
+ 0.23828125,
2588
+ 0.18359375,
2589
+ 0.26953125,
2590
+ 0.2578125,
2591
+ 0.23828125,
2592
+ 0.0546875,
2593
+ 0.23828125,
2594
+ 0.26171875,
2595
+ 0.23046875,
2596
+ 0.23828125,
2597
+ 0.14453125,
2598
+ 0.234375,
2599
+ 0.1953125,
2600
+ 0.1875,
2601
+ 0.1328125,
2602
+ 0.25390625,
2603
+ 0.046875,
2604
+ 0.25,
2605
+ 0.234375,
2606
+ 0.19140625,
2607
+ 0.27734375,
2608
+ 0.24609375,
2609
+ 0.1171875,
2610
+ 0.23046875,
2611
+ 0.24609375,
2612
+ 0.2578125,
2613
+ 0.05859375,
2614
+ 0.26171875,
2615
+ 0.23046875,
2616
+ 0.26171875,
2617
+ 0.0859375,
2618
+ 0.25390625,
2619
+ 0.24609375,
2620
+ 0.08984375,
2621
+ 0.26171875,
2622
+ 0.2578125,
2623
+ 0.25390625,
2624
+ 0.21484375,
2625
+ 0.234375,
2626
+ 0.21484375,
2627
+ 0.2578125,
2628
+ 0.25,
2629
+ 0.234375,
2630
+ 0.234375,
2631
+ 0.0859375,
2632
+ 0.19140625,
2633
+ 0.234375,
2634
+ 0.1171875,
2635
+ 0.26171875,
2636
+ 0.2265625,
2637
+ 0.203125,
2638
+ 0.0546875,
2639
+ 0.265625
2640
+ ]
2641
+ }
2642
+ },
2643
+ "first_exact_by_run": {}
2644
+ }
2645
+ RESULT config=allcorrupt_seqrand1_highC64_4096 ckpt_step=3000 views=1536000 token_acc=0.2078 exact=0/64 exact_refs=0 hits=[]
2646
+ [noise-pilot] continue config=allcorrupt_seqrand1_highC64_4096 step=3000
2647
+ [noise-pilot] train config=allcorrupt_unigram_shared0p5 from=1000 to=2000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
2648
+ [noise-pilot] eval config=allcorrupt_unigram_shared0p5 step=2000
2649
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805 step=2000 soft=none
2650
+ [decode] max_len=256 generated=64/64
2651
+ {
2652
+ "num_rows": 1,
2653
+ "best_by_run": {
2654
+ "train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805::none": {
2655
+ "run": "train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805",
2656
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805/step_0002000.pt",
2657
+ "ckpt_step": 2000,
2658
+ "endpoint_softening": "none",
2659
+ "decode_rule": "flowmap",
2660
+ "steps": 128,
2661
+ "time_schedule": "logit_normal",
2662
+ "model_t_mode": "post",
2663
+ "final_from": "state",
2664
+ "n_gen": 64,
2665
+ "n_refs": 8,
2666
+ "token_acc_mean": 0.05218505859375,
2667
+ "token_acc_min": 0.0390625,
2668
+ "token_acc_max": 0.08984375,
2669
+ "exact_acc": 0.0,
2670
+ "exact_count": 0,
2671
+ "exact_ref_coverage": 0.0,
2672
+ "exact_ref_count": 0,
2673
+ "exact_ref_hits": [],
2674
+ "best_ref_idx": [
2675
+ 2,
2676
+ 7,
2677
+ 3,
2678
+ 2,
2679
+ 7,
2680
+ 7,
2681
+ 3,
2682
+ 7,
2683
+ 2,
2684
+ 3,
2685
+ 1,
2686
+ 3,
2687
+ 5,
2688
+ 2,
2689
+ 6,
2690
+ 2,
2691
+ 3,
2692
+ 1,
2693
+ 2,
2694
+ 0,
2695
+ 3,
2696
+ 7,
2697
+ 3,
2698
+ 3,
2699
+ 2,
2700
+ 0,
2701
+ 7,
2702
+ 2,
2703
+ 1,
2704
+ 1,
2705
+ 2,
2706
+ 1,
2707
+ 2,
2708
+ 7,
2709
+ 7,
2710
+ 2,
2711
+ 1,
2712
+ 3,
2713
+ 3,
2714
+ 0,
2715
+ 3,
2716
+ 2,
2717
+ 5,
2718
+ 5,
2719
+ 7,
2720
+ 3,
2721
+ 7,
2722
+ 1,
2723
+ 3,
2724
+ 5,
2725
+ 3,
2726
+ 3,
2727
+ 3,
2728
+ 2,
2729
+ 5,
2730
+ 2,
2731
+ 2,
2732
+ 7,
2733
+ 1,
2734
+ 3,
2735
+ 5,
2736
+ 7,
2737
+ 2,
2738
+ 3
2739
+ ],
2740
+ "best_token_acc": [
2741
+ 0.05078125,
2742
+ 0.0625,
2743
+ 0.0390625,
2744
+ 0.0390625,
2745
+ 0.046875,
2746
+ 0.0546875,
2747
+ 0.046875,
2748
+ 0.0625,
2749
+ 0.05078125,
2750
+ 0.05078125,
2751
+ 0.06640625,
2752
+ 0.05078125,
2753
+ 0.05859375,
2754
+ 0.05078125,
2755
+ 0.0625,
2756
+ 0.04296875,
2757
+ 0.04296875,
2758
+ 0.0625,
2759
+ 0.0390625,
2760
+ 0.0390625,
2761
+ 0.05078125,
2762
+ 0.05859375,
2763
+ 0.0546875,
2764
+ 0.04296875,
2765
+ 0.04296875,
2766
+ 0.05078125,
2767
+ 0.0390625,
2768
+ 0.05859375,
2769
+ 0.06640625,
2770
+ 0.05859375,
2771
+ 0.046875,
2772
+ 0.05859375,
2773
+ 0.04296875,
2774
+ 0.0546875,
2775
+ 0.04296875,
2776
+ 0.05078125,
2777
+ 0.0625,
2778
+ 0.046875,
2779
+ 0.046875,
2780
+ 0.05078125,
2781
+ 0.0546875,
2782
+ 0.046875,
2783
+ 0.0546875,
2784
+ 0.05859375,
2785
+ 0.0625,
2786
+ 0.05078125,
2787
+ 0.05078125,
2788
+ 0.0390625,
2789
+ 0.05078125,
2790
+ 0.06640625,
2791
+ 0.04296875,
2792
+ 0.046875,
2793
+ 0.0546875,
2794
+ 0.04296875,
2795
+ 0.05859375,
2796
+ 0.0546875,
2797
+ 0.05078125,
2798
+ 0.0703125,
2799
+ 0.08984375,
2800
+ 0.04296875,
2801
+ 0.05859375,
2802
+ 0.0546875,
2803
+ 0.04296875,
2804
+ 0.046875
2805
+ ]
2806
+ }
2807
+ },
2808
+ "first_exact_by_run": {}
2809
+ }
2810
+ RESULT config=allcorrupt_unigram_shared0p5 ckpt_step=2000 views=1024000 token_acc=0.0522 exact=0/64 exact_refs=0 hits=[]
2811
+ [noise-pilot] continue config=allcorrupt_unigram_shared0p5 step=2000
2812
+ [noise-pilot] round=2 Sun May 17 16:55:15 UTC 2026
2813
+ [noise-pilot] train config=allcorrupt_fullvocab_dirC1_1024 from=3000 to=4000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
2814
+ [noise-pilot] eval config=allcorrupt_fullvocab_dirC1_1024 step=4000
2815
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805 step=4000 soft=none
2816
+ [decode] max_len=256 generated=64/64
2817
+ {
2818
+ "num_rows": 1,
2819
+ "best_by_run": {
2820
+ "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805::none": {
2821
+ "run": "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805",
2822
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805/step_0004000.pt",
2823
+ "ckpt_step": 4000,
2824
+ "endpoint_softening": "none",
2825
+ "decode_rule": "flowmap",
2826
+ "steps": 128,
2827
+ "time_schedule": "logit_normal",
2828
+ "model_t_mode": "post",
2829
+ "final_from": "state",
2830
+ "n_gen": 64,
2831
+ "n_refs": 8,
2832
+ "token_acc_mean": 0.1051025390625,
2833
+ "token_acc_min": 0.04296875,
2834
+ "token_acc_max": 0.2890625,
2835
+ "exact_acc": 0.0,
2836
+ "exact_count": 0,
2837
+ "exact_ref_coverage": 0.0,
2838
+ "exact_ref_count": 0,
2839
+ "exact_ref_hits": [],
2840
+ "best_ref_idx": [
2841
+ 2,
2842
+ 5,
2843
+ 7,
2844
+ 1,
2845
+ 5,
2846
+ 3,
2847
+ 0,
2848
+ 1,
2849
+ 5,
2850
+ 7,
2851
+ 1,
2852
+ 7,
2853
+ 7,
2854
+ 7,
2855
+ 7,
2856
+ 7,
2857
+ 7,
2858
+ 7,
2859
+ 7,
2860
+ 5,
2861
+ 1,
2862
+ 7,
2863
+ 5,
2864
+ 7,
2865
+ 7,
2866
+ 1,
2867
+ 7,
2868
+ 7,
2869
+ 7,
2870
+ 7,
2871
+ 1,
2872
+ 7,
2873
+ 5,
2874
+ 0,
2875
+ 5,
2876
+ 2,
2877
+ 1,
2878
+ 7,
2879
+ 5,
2880
+ 1,
2881
+ 7,
2882
+ 0,
2883
+ 7,
2884
+ 7,
2885
+ 3,
2886
+ 7,
2887
+ 0,
2888
+ 2,
2889
+ 7,
2890
+ 7,
2891
+ 1,
2892
+ 5,
2893
+ 7,
2894
+ 2,
2895
+ 5,
2896
+ 5,
2897
+ 5,
2898
+ 7,
2899
+ 7,
2900
+ 1,
2901
+ 1,
2902
+ 1,
2903
+ 7,
2904
+ 7
2905
+ ],
2906
+ "best_token_acc": [
2907
+ 0.078125,
2908
+ 0.10546875,
2909
+ 0.0703125,
2910
+ 0.046875,
2911
+ 0.08203125,
2912
+ 0.1015625,
2913
+ 0.0625,
2914
+ 0.125,
2915
+ 0.1171875,
2916
+ 0.1015625,
2917
+ 0.0859375,
2918
+ 0.10546875,
2919
+ 0.08984375,
2920
+ 0.06640625,
2921
+ 0.0703125,
2922
+ 0.0703125,
2923
+ 0.078125,
2924
+ 0.08984375,
2925
+ 0.09375,
2926
+ 0.1875,
2927
+ 0.0703125,
2928
+ 0.09375,
2929
+ 0.09375,
2930
+ 0.0625,
2931
+ 0.109375,
2932
+ 0.23046875,
2933
+ 0.0859375,
2934
+ 0.2734375,
2935
+ 0.0859375,
2936
+ 0.07421875,
2937
+ 0.09375,
2938
+ 0.05859375,
2939
+ 0.1875,
2940
+ 0.109375,
2941
+ 0.04296875,
2942
+ 0.046875,
2943
+ 0.12890625,
2944
+ 0.0703125,
2945
+ 0.109375,
2946
+ 0.1015625,
2947
+ 0.08203125,
2948
+ 0.06640625,
2949
+ 0.078125,
2950
+ 0.078125,
2951
+ 0.0625,
2952
+ 0.140625,
2953
+ 0.08984375,
2954
+ 0.25390625,
2955
+ 0.06640625,
2956
+ 0.09765625,
2957
+ 0.26953125,
2958
+ 0.1875,
2959
+ 0.078125,
2960
+ 0.2890625,
2961
+ 0.06640625,
2962
+ 0.10546875,
2963
+ 0.18359375,
2964
+ 0.046875,
2965
+ 0.07421875,
2966
+ 0.05078125,
2967
+ 0.16796875,
2968
+ 0.1015625,
2969
+ 0.06640625,
2970
+ 0.06640625
2971
+ ]
2972
+ }
2973
+ },
2974
+ "first_exact_by_run": {}
2975
+ }
2976
+ RESULT config=allcorrupt_fullvocab_dirC1_1024 ckpt_step=4000 views=2048000 token_acc=0.1051 exact=0/64 exact_refs=0 hits=[]
2977
+ [noise-pilot] continue config=allcorrupt_fullvocab_dirC1_1024 step=4000
2978
+ [noise-pilot] train config=allcorrupt_seqrand1_dirC1_1024 from=3000 to=4000 C=1.0->1024 seq_alpha=1.0 sampler=dirichlet
2979
+ [noise-pilot] eval config=allcorrupt_seqrand1_dirC1_1024 step=4000
2980
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805 step=4000 soft=none
2981
+ [decode] max_len=256 generated=64/64
2982
+ {
2983
+ "num_rows": 1,
2984
+ "best_by_run": {
2985
+ "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805::none": {
2986
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805",
2987
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805/step_0004000.pt",
2988
+ "ckpt_step": 4000,
2989
+ "endpoint_softening": "none",
2990
+ "decode_rule": "flowmap",
2991
+ "steps": 128,
2992
+ "time_schedule": "logit_normal",
2993
+ "model_t_mode": "post",
2994
+ "final_from": "state",
2995
+ "n_gen": 64,
2996
+ "n_refs": 8,
2997
+ "token_acc_mean": 0.01953125,
2998
+ "token_acc_min": 0.01953125,
2999
+ "token_acc_max": 0.01953125,
3000
+ "exact_acc": 0.0,
3001
+ "exact_count": 0,
3002
+ "exact_ref_coverage": 0.0,
3003
+ "exact_ref_count": 0,
3004
+ "exact_ref_hits": [],
3005
+ "best_ref_idx": [
3006
+ 0,
3007
+ 0,
3008
+ 0,
3009
+ 0,
3010
+ 0,
3011
+ 0,
3012
+ 0,
3013
+ 0,
3014
+ 0,
3015
+ 0,
3016
+ 0,
3017
+ 0,
3018
+ 0,
3019
+ 0,
3020
+ 0,
3021
+ 0,
3022
+ 0,
3023
+ 0,
3024
+ 0,
3025
+ 0,
3026
+ 0,
3027
+ 0,
3028
+ 0,
3029
+ 0,
3030
+ 0,
3031
+ 0,
3032
+ 0,
3033
+ 0,
3034
+ 0,
3035
+ 0,
3036
+ 0,
3037
+ 0,
3038
+ 0,
3039
+ 0,
3040
+ 0,
3041
+ 0,
3042
+ 0,
3043
+ 0,
3044
+ 0,
3045
+ 0,
3046
+ 0,
3047
+ 0,
3048
+ 0,
3049
+ 0,
3050
+ 0,
3051
+ 0,
3052
+ 0,
3053
+ 0,
3054
+ 0,
3055
+ 0,
3056
+ 0,
3057
+ 0,
3058
+ 0,
3059
+ 0,
3060
+ 0,
3061
+ 0,
3062
+ 0,
3063
+ 0,
3064
+ 0,
3065
+ 0,
3066
+ 0,
3067
+ 0,
3068
+ 0,
3069
+ 0
3070
+ ],
3071
+ "best_token_acc": [
3072
+ 0.01953125,
3073
+ 0.01953125,
3074
+ 0.01953125,
3075
+ 0.01953125,
3076
+ 0.01953125,
3077
+ 0.01953125,
3078
+ 0.01953125,
3079
+ 0.01953125,
3080
+ 0.01953125,
3081
+ 0.01953125,
3082
+ 0.01953125,
3083
+ 0.01953125,
3084
+ 0.01953125,
3085
+ 0.01953125,
3086
+ 0.01953125,
3087
+ 0.01953125,
3088
+ 0.01953125,
3089
+ 0.01953125,
3090
+ 0.01953125,
3091
+ 0.01953125,
3092
+ 0.01953125,
3093
+ 0.01953125,
3094
+ 0.01953125,
3095
+ 0.01953125,
3096
+ 0.01953125,
3097
+ 0.01953125,
3098
+ 0.01953125,
3099
+ 0.01953125,
3100
+ 0.01953125,
3101
+ 0.01953125,
3102
+ 0.01953125,
3103
+ 0.01953125,
3104
+ 0.01953125,
3105
+ 0.01953125,
3106
+ 0.01953125,
3107
+ 0.01953125,
3108
+ 0.01953125,
3109
+ 0.01953125,
3110
+ 0.01953125,
3111
+ 0.01953125,
3112
+ 0.01953125,
3113
+ 0.01953125,
3114
+ 0.01953125,
3115
+ 0.01953125,
3116
+ 0.01953125,
3117
+ 0.01953125,
3118
+ 0.01953125,
3119
+ 0.01953125,
3120
+ 0.01953125,
3121
+ 0.01953125,
3122
+ 0.01953125,
3123
+ 0.01953125,
3124
+ 0.01953125,
3125
+ 0.01953125,
3126
+ 0.01953125,
3127
+ 0.01953125,
3128
+ 0.01953125,
3129
+ 0.01953125,
3130
+ 0.01953125,
3131
+ 0.01953125,
3132
+ 0.01953125,
3133
+ 0.01953125,
3134
+ 0.01953125,
3135
+ 0.01953125
3136
+ ]
3137
+ }
3138
+ },
3139
+ "first_exact_by_run": {}
3140
+ }
3141
+ RESULT config=allcorrupt_seqrand1_dirC1_1024 ckpt_step=4000 views=2048000 token_acc=0.0195 exact=0/64 exact_refs=0 hits=[]
3142
+ [noise-pilot] continue config=allcorrupt_seqrand1_dirC1_1024 step=4000
3143
+ [noise-pilot] train config=allcorrupt_highC64_4096 from=3000 to=4000 C=64->4096 seq_alpha=0.0 sampler=dirichlet
3144
+ [noise-pilot] eval config=allcorrupt_highC64_4096 step=4000
3145
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805 step=4000 soft=none
3146
+ [decode] max_len=256 generated=64/64
3147
+ {
3148
+ "num_rows": 1,
3149
+ "best_by_run": {
3150
+ "train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805::none": {
3151
+ "run": "train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805",
3152
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_highC64_4096_20260517_163805/step_0004000.pt",
3153
+ "ckpt_step": 4000,
3154
+ "endpoint_softening": "none",
3155
+ "decode_rule": "flowmap",
3156
+ "steps": 128,
3157
+ "time_schedule": "logit_normal",
3158
+ "model_t_mode": "post",
3159
+ "final_from": "state",
3160
+ "n_gen": 64,
3161
+ "n_refs": 8,
3162
+ "token_acc_mean": 0.0806884765625,
3163
+ "token_acc_min": 0.046875,
3164
+ "token_acc_max": 0.48828125,
3165
+ "exact_acc": 0.0,
3166
+ "exact_count": 0,
3167
+ "exact_ref_coverage": 0.0,
3168
+ "exact_ref_count": 0,
3169
+ "exact_ref_hits": [],
3170
+ "best_ref_idx": [
3171
+ 4,
3172
+ 5,
3173
+ 5,
3174
+ 0,
3175
+ 5,
3176
+ 0,
3177
+ 0,
3178
+ 7,
3179
+ 7,
3180
+ 7,
3181
+ 0,
3182
+ 0,
3183
+ 2,
3184
+ 6,
3185
+ 7,
3186
+ 7,
3187
+ 7,
3188
+ 0,
3189
+ 7,
3190
+ 0,
3191
+ 7,
3192
+ 5,
3193
+ 0,
3194
+ 7,
3195
+ 7,
3196
+ 5,
3197
+ 0,
3198
+ 0,
3199
+ 7,
3200
+ 0,
3201
+ 5,
3202
+ 0,
3203
+ 0,
3204
+ 0,
3205
+ 2,
3206
+ 0,
3207
+ 2,
3208
+ 0,
3209
+ 0,
3210
+ 5,
3211
+ 0,
3212
+ 5,
3213
+ 3,
3214
+ 5,
3215
+ 0,
3216
+ 5,
3217
+ 7,
3218
+ 0,
3219
+ 3,
3220
+ 7,
3221
+ 5,
3222
+ 6,
3223
+ 0,
3224
+ 5,
3225
+ 7,
3226
+ 5,
3227
+ 7,
3228
+ 0,
3229
+ 3,
3230
+ 0,
3231
+ 0,
3232
+ 0,
3233
+ 0,
3234
+ 3
3235
+ ],
3236
+ "best_token_acc": [
3237
+ 0.05078125,
3238
+ 0.05859375,
3239
+ 0.05859375,
3240
+ 0.0546875,
3241
+ 0.0625,
3242
+ 0.05859375,
3243
+ 0.0546875,
3244
+ 0.0546875,
3245
+ 0.05859375,
3246
+ 0.078125,
3247
+ 0.0546875,
3248
+ 0.0546875,
3249
+ 0.08203125,
3250
+ 0.48828125,
3251
+ 0.0625,
3252
+ 0.05078125,
3253
+ 0.0703125,
3254
+ 0.0546875,
3255
+ 0.109375,
3256
+ 0.0546875,
3257
+ 0.046875,
3258
+ 0.0625,
3259
+ 0.046875,
3260
+ 0.05078125,
3261
+ 0.05859375,
3262
+ 0.0625,
3263
+ 0.0546875,
3264
+ 0.05078125,
3265
+ 0.0703125,
3266
+ 0.05859375,
3267
+ 0.0625,
3268
+ 0.05859375,
3269
+ 0.05078125,
3270
+ 0.0546875,
3271
+ 0.1015625,
3272
+ 0.0546875,
3273
+ 0.23828125,
3274
+ 0.046875,
3275
+ 0.05859375,
3276
+ 0.05859375,
3277
+ 0.0546875,
3278
+ 0.0625,
3279
+ 0.08984375,
3280
+ 0.0546875,
3281
+ 0.0546875,
3282
+ 0.05859375,
3283
+ 0.23046875,
3284
+ 0.0625,
3285
+ 0.31640625,
3286
+ 0.1484375,
3287
+ 0.0703125,
3288
+ 0.171875,
3289
+ 0.0546875,
3290
+ 0.06640625,
3291
+ 0.0625,
3292
+ 0.0546875,
3293
+ 0.0546875,
3294
+ 0.0546875,
3295
+ 0.08984375,
3296
+ 0.09375,
3297
+ 0.05859375,
3298
+ 0.0546875,
3299
+ 0.0625,
3300
+ 0.0625
3301
+ ]
3302
+ }
3303
+ },
3304
+ "first_exact_by_run": {}
3305
+ }
3306
+ RESULT config=allcorrupt_highC64_4096 ckpt_step=4000 views=2048000 token_acc=0.0807 exact=0/64 exact_refs=0 hits=[]
3307
+ [noise-pilot] continue config=allcorrupt_highC64_4096 step=4000
3308
+ [noise-pilot] train config=allcorrupt_logistic_sig0p05_0p5 from=3000 to=4000 C=1.0->1024 seq_alpha=0.0 sampler=logistic_normal_linear_mean
3309
+ [noise-pilot] eval config=allcorrupt_logistic_sig0p05_0p5 step=4000
3310
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805 step=4000 soft=none
3311
+ [decode] max_len=256 generated=64/64
3312
+ {
3313
+ "num_rows": 1,
3314
+ "best_by_run": {
3315
+ "train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805::none": {
3316
+ "run": "train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805",
3317
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_logistic_sig0p05_0p5_20260517_163805/step_0004000.pt",
3318
+ "ckpt_step": 4000,
3319
+ "endpoint_softening": "none",
3320
+ "decode_rule": "flowmap",
3321
+ "steps": 128,
3322
+ "time_schedule": "logit_normal",
3323
+ "model_t_mode": "post",
3324
+ "final_from": "state",
3325
+ "n_gen": 64,
3326
+ "n_refs": 8,
3327
+ "token_acc_mean": 0.091552734375,
3328
+ "token_acc_min": 0.046875,
3329
+ "token_acc_max": 0.328125,
3330
+ "exact_acc": 0.0,
3331
+ "exact_count": 0,
3332
+ "exact_ref_coverage": 0.0,
3333
+ "exact_ref_count": 0,
3334
+ "exact_ref_hits": [],
3335
+ "best_ref_idx": [
3336
+ 3,
3337
+ 3,
3338
+ 3,
3339
+ 0,
3340
+ 0,
3341
+ 2,
3342
+ 3,
3343
+ 3,
3344
+ 0,
3345
+ 0,
3346
+ 4,
3347
+ 3,
3348
+ 3,
3349
+ 0,
3350
+ 0,
3351
+ 0,
3352
+ 3,
3353
+ 0,
3354
+ 3,
3355
+ 0,
3356
+ 0,
3357
+ 0,
3358
+ 3,
3359
+ 3,
3360
+ 3,
3361
+ 0,
3362
+ 3,
3363
+ 3,
3364
+ 0,
3365
+ 3,
3366
+ 3,
3367
+ 0,
3368
+ 0,
3369
+ 0,
3370
+ 3,
3371
+ 3,
3372
+ 0,
3373
+ 0,
3374
+ 3,
3375
+ 3,
3376
+ 3,
3377
+ 0,
3378
+ 3,
3379
+ 3,
3380
+ 0,
3381
+ 3,
3382
+ 2,
3383
+ 3,
3384
+ 4,
3385
+ 0,
3386
+ 3,
3387
+ 4,
3388
+ 3,
3389
+ 3,
3390
+ 3,
3391
+ 3,
3392
+ 0,
3393
+ 3,
3394
+ 3,
3395
+ 0,
3396
+ 0,
3397
+ 3,
3398
+ 0,
3399
+ 0
3400
+ ],
3401
+ "best_token_acc": [
3402
+ 0.07421875,
3403
+ 0.06640625,
3404
+ 0.08984375,
3405
+ 0.08203125,
3406
+ 0.0859375,
3407
+ 0.0546875,
3408
+ 0.0703125,
3409
+ 0.06640625,
3410
+ 0.1484375,
3411
+ 0.1953125,
3412
+ 0.0703125,
3413
+ 0.06640625,
3414
+ 0.0703125,
3415
+ 0.046875,
3416
+ 0.26171875,
3417
+ 0.1015625,
3418
+ 0.1015625,
3419
+ 0.328125,
3420
+ 0.05859375,
3421
+ 0.14453125,
3422
+ 0.0859375,
3423
+ 0.21875,
3424
+ 0.07421875,
3425
+ 0.05078125,
3426
+ 0.06640625,
3427
+ 0.0703125,
3428
+ 0.0703125,
3429
+ 0.078125,
3430
+ 0.12109375,
3431
+ 0.0703125,
3432
+ 0.0703125,
3433
+ 0.078125,
3434
+ 0.08203125,
3435
+ 0.24609375,
3436
+ 0.0546875,
3437
+ 0.0703125,
3438
+ 0.15234375,
3439
+ 0.0703125,
3440
+ 0.05859375,
3441
+ 0.07421875,
3442
+ 0.06640625,
3443
+ 0.08203125,
3444
+ 0.1015625,
3445
+ 0.08984375,
3446
+ 0.0859375,
3447
+ 0.05859375,
3448
+ 0.05078125,
3449
+ 0.0625,
3450
+ 0.046875,
3451
+ 0.08984375,
3452
+ 0.07421875,
3453
+ 0.05859375,
3454
+ 0.06640625,
3455
+ 0.0703125,
3456
+ 0.07421875,
3457
+ 0.05078125,
3458
+ 0.07421875,
3459
+ 0.05859375,
3460
+ 0.05859375,
3461
+ 0.0625,
3462
+ 0.078125,
3463
+ 0.08203125,
3464
+ 0.07421875,
3465
+ 0.1953125
3466
+ ]
3467
+ }
3468
+ },
3469
+ "first_exact_by_run": {}
3470
+ }
3471
+ RESULT config=allcorrupt_logistic_sig0p05_0p5 ckpt_step=4000 views=2048000 token_acc=0.0916 exact=0/64 exact_refs=0 hits=[]
3472
+ [noise-pilot] continue config=allcorrupt_logistic_sig0p05_0p5 step=4000
3473
+ [noise-pilot] train config=allcorrupt_seqrand1_highC64_4096 from=3000 to=4000 C=64->4096 seq_alpha=1.0 sampler=dirichlet
3474
+ [noise-pilot] eval config=allcorrupt_seqrand1_highC64_4096 step=4000
3475
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805 step=4000 soft=none
3476
+ [decode] max_len=256 generated=64/64
3477
+ {
3478
+ "num_rows": 1,
3479
+ "best_by_run": {
3480
+ "train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805::none": {
3481
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805",
3482
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_highC64_4096_20260517_163805/step_0004000.pt",
3483
+ "ckpt_step": 4000,
3484
+ "endpoint_softening": "none",
3485
+ "decode_rule": "flowmap",
3486
+ "steps": 128,
3487
+ "time_schedule": "logit_normal",
3488
+ "model_t_mode": "post",
3489
+ "final_from": "state",
3490
+ "n_gen": 64,
3491
+ "n_refs": 8,
3492
+ "token_acc_mean": 0.0458984375,
3493
+ "token_acc_min": 0.01953125,
3494
+ "token_acc_max": 0.2265625,
3495
+ "exact_acc": 0.0,
3496
+ "exact_count": 0,
3497
+ "exact_ref_coverage": 0.0,
3498
+ "exact_ref_count": 0,
3499
+ "exact_ref_hits": [],
3500
+ "best_ref_idx": [
3501
+ 0,
3502
+ 1,
3503
+ 0,
3504
+ 0,
3505
+ 0,
3506
+ 0,
3507
+ 1,
3508
+ 0,
3509
+ 0,
3510
+ 0,
3511
+ 5,
3512
+ 5,
3513
+ 0,
3514
+ 0,
3515
+ 0,
3516
+ 0,
3517
+ 0,
3518
+ 0,
3519
+ 1,
3520
+ 5,
3521
+ 3,
3522
+ 0,
3523
+ 5,
3524
+ 5,
3525
+ 1,
3526
+ 5,
3527
+ 0,
3528
+ 1,
3529
+ 5,
3530
+ 0,
3531
+ 0,
3532
+ 1,
3533
+ 5,
3534
+ 5,
3535
+ 5,
3536
+ 0,
3537
+ 0,
3538
+ 5,
3539
+ 7,
3540
+ 0,
3541
+ 0,
3542
+ 0,
3543
+ 1,
3544
+ 7,
3545
+ 0,
3546
+ 5,
3547
+ 5,
3548
+ 7,
3549
+ 0,
3550
+ 0,
3551
+ 0,
3552
+ 0,
3553
+ 1,
3554
+ 1,
3555
+ 4,
3556
+ 0,
3557
+ 7,
3558
+ 0,
3559
+ 1,
3560
+ 0,
3561
+ 0,
3562
+ 0,
3563
+ 0,
3564
+ 4
3565
+ ],
3566
+ "best_token_acc": [
3567
+ 0.0390625,
3568
+ 0.03125,
3569
+ 0.05859375,
3570
+ 0.02734375,
3571
+ 0.03515625,
3572
+ 0.0625,
3573
+ 0.03515625,
3574
+ 0.03125,
3575
+ 0.05078125,
3576
+ 0.0625,
3577
+ 0.0390625,
3578
+ 0.03515625,
3579
+ 0.0390625,
3580
+ 0.03515625,
3581
+ 0.04296875,
3582
+ 0.03515625,
3583
+ 0.0546875,
3584
+ 0.03515625,
3585
+ 0.03125,
3586
+ 0.03125,
3587
+ 0.03125,
3588
+ 0.08203125,
3589
+ 0.03515625,
3590
+ 0.03125,
3591
+ 0.03515625,
3592
+ 0.05078125,
3593
+ 0.0390625,
3594
+ 0.046875,
3595
+ 0.03515625,
3596
+ 0.1015625,
3597
+ 0.08203125,
3598
+ 0.02734375,
3599
+ 0.046875,
3600
+ 0.03125,
3601
+ 0.03125,
3602
+ 0.08984375,
3603
+ 0.05859375,
3604
+ 0.03515625,
3605
+ 0.0390625,
3606
+ 0.04296875,
3607
+ 0.03515625,
3608
+ 0.05859375,
3609
+ 0.03515625,
3610
+ 0.03125,
3611
+ 0.01953125,
3612
+ 0.0390625,
3613
+ 0.0390625,
3614
+ 0.046875,
3615
+ 0.03125,
3616
+ 0.0390625,
3617
+ 0.0390625,
3618
+ 0.03125,
3619
+ 0.03515625,
3620
+ 0.02734375,
3621
+ 0.0625,
3622
+ 0.02734375,
3623
+ 0.05078125,
3624
+ 0.05078125,
3625
+ 0.03125,
3626
+ 0.0390625,
3627
+ 0.0390625,
3628
+ 0.03125,
3629
+ 0.0859375,
3630
+ 0.2265625
3631
+ ]
3632
+ }
3633
+ },
3634
+ "first_exact_by_run": {}
3635
+ }
3636
+ RESULT config=allcorrupt_seqrand1_highC64_4096 ckpt_step=4000 views=2048000 token_acc=0.0459 exact=0/64 exact_refs=0 hits=[]
3637
+ [noise-pilot] continue config=allcorrupt_seqrand1_highC64_4096 step=4000
3638
+ [noise-pilot] train config=allcorrupt_unigram_shared0p5 from=2000 to=3000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
3639
+ [noise-pilot] eval config=allcorrupt_unigram_shared0p5 step=3000
3640
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805 step=3000 soft=none
3641
+ [decode] max_len=256 generated=64/64
3642
+ {
3643
+ "num_rows": 1,
3644
+ "best_by_run": {
3645
+ "train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805::none": {
3646
+ "run": "train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805",
3647
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_unigram_shared0p5_20260517_163805/step_0003000.pt",
3648
+ "ckpt_step": 3000,
3649
+ "endpoint_softening": "none",
3650
+ "decode_rule": "flowmap",
3651
+ "steps": 128,
3652
+ "time_schedule": "logit_normal",
3653
+ "model_t_mode": "post",
3654
+ "final_from": "state",
3655
+ "n_gen": 64,
3656
+ "n_refs": 8,
3657
+ "token_acc_mean": 0.21197509765625,
3658
+ "token_acc_min": 0.01953125,
3659
+ "token_acc_max": 0.5703125,
3660
+ "exact_acc": 0.0,
3661
+ "exact_count": 0,
3662
+ "exact_ref_coverage": 0.0,
3663
+ "exact_ref_count": 0,
3664
+ "exact_ref_hits": [],
3665
+ "best_ref_idx": [
3666
+ 6,
3667
+ 3,
3668
+ 5,
3669
+ 3,
3670
+ 5,
3671
+ 7,
3672
+ 5,
3673
+ 2,
3674
+ 2,
3675
+ 6,
3676
+ 1,
3677
+ 1,
3678
+ 6,
3679
+ 3,
3680
+ 2,
3681
+ 6,
3682
+ 6,
3683
+ 6,
3684
+ 2,
3685
+ 2,
3686
+ 3,
3687
+ 1,
3688
+ 3,
3689
+ 6,
3690
+ 6,
3691
+ 4,
3692
+ 1,
3693
+ 5,
3694
+ 2,
3695
+ 1,
3696
+ 1,
3697
+ 6,
3698
+ 3,
3699
+ 2,
3700
+ 2,
3701
+ 5,
3702
+ 2,
3703
+ 2,
3704
+ 2,
3705
+ 6,
3706
+ 5,
3707
+ 1,
3708
+ 5,
3709
+ 6,
3710
+ 6,
3711
+ 3,
3712
+ 7,
3713
+ 6,
3714
+ 6,
3715
+ 1,
3716
+ 5,
3717
+ 6,
3718
+ 6,
3719
+ 2,
3720
+ 2,
3721
+ 5,
3722
+ 5,
3723
+ 4,
3724
+ 3,
3725
+ 3,
3726
+ 2,
3727
+ 2,
3728
+ 6,
3729
+ 4
3730
+ ],
3731
+ "best_token_acc": [
3732
+ 0.44921875,
3733
+ 0.33984375,
3734
+ 0.12890625,
3735
+ 0.44140625,
3736
+ 0.15234375,
3737
+ 0.01953125,
3738
+ 0.1015625,
3739
+ 0.0859375,
3740
+ 0.09765625,
3741
+ 0.04296875,
3742
+ 0.0546875,
3743
+ 0.23828125,
3744
+ 0.08203125,
3745
+ 0.33203125,
3746
+ 0.16796875,
3747
+ 0.375,
3748
+ 0.0546875,
3749
+ 0.5078125,
3750
+ 0.171875,
3751
+ 0.1875,
3752
+ 0.46484375,
3753
+ 0.40625,
3754
+ 0.2109375,
3755
+ 0.04296875,
3756
+ 0.44140625,
3757
+ 0.1953125,
3758
+ 0.359375,
3759
+ 0.1640625,
3760
+ 0.25,
3761
+ 0.296875,
3762
+ 0.05078125,
3763
+ 0.5703125,
3764
+ 0.42578125,
3765
+ 0.1640625,
3766
+ 0.01953125,
3767
+ 0.12890625,
3768
+ 0.2109375,
3769
+ 0.125,
3770
+ 0.15625,
3771
+ 0.5390625,
3772
+ 0.125,
3773
+ 0.06640625,
3774
+ 0.125,
3775
+ 0.546875,
3776
+ 0.22265625,
3777
+ 0.38671875,
3778
+ 0.2265625,
3779
+ 0.06640625,
3780
+ 0.125,
3781
+ 0.203125,
3782
+ 0.140625,
3783
+ 0.0859375,
3784
+ 0.16015625,
3785
+ 0.0390625,
3786
+ 0.1328125,
3787
+ 0.04296875,
3788
+ 0.1484375,
3789
+ 0.09375,
3790
+ 0.24609375,
3791
+ 0.34765625,
3792
+ 0.11328125,
3793
+ 0.078125,
3794
+ 0.30078125,
3795
+ 0.2890625
3796
+ ]
3797
+ }
3798
+ },
3799
+ "first_exact_by_run": {}
3800
+ }
3801
+ RESULT config=allcorrupt_unigram_shared0p5 ckpt_step=3000 views=1536000 token_acc=0.2120 exact=0/64 exact_refs=0 hits=[]
3802
+ [noise-pilot] continue config=allcorrupt_unigram_shared0p5 step=3000
3803
+ [noise-pilot] round=3 Sun May 17 17:00:16 UTC 2026
3804
+ [noise-pilot] train config=allcorrupt_fullvocab_dirC1_1024 from=4000 to=5000 C=1.0->1024 seq_alpha=0.0 sampler=dirichlet
3805
+ [noise-pilot] eval config=allcorrupt_fullvocab_dirC1_1024 step=5000
3806
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805 step=5000 soft=none
3807
+ [decode] max_len=256 generated=64/64
3808
+ {
3809
+ "num_rows": 1,
3810
+ "best_by_run": {
3811
+ "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805::none": {
3812
+ "run": "train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805",
3813
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_fullvocab_dirC1_1024_20260517_163805/step_0005000.pt",
3814
+ "ckpt_step": 5000,
3815
+ "endpoint_softening": "none",
3816
+ "decode_rule": "flowmap",
3817
+ "steps": 128,
3818
+ "time_schedule": "logit_normal",
3819
+ "model_t_mode": "post",
3820
+ "final_from": "state",
3821
+ "n_gen": 64,
3822
+ "n_refs": 8,
3823
+ "token_acc_mean": 0.16851806640625,
3824
+ "token_acc_min": 0.05859375,
3825
+ "token_acc_max": 0.40625,
3826
+ "exact_acc": 0.0,
3827
+ "exact_count": 0,
3828
+ "exact_ref_coverage": 0.0,
3829
+ "exact_ref_count": 0,
3830
+ "exact_ref_hits": [],
3831
+ "best_ref_idx": [
3832
+ 3,
3833
+ 5,
3834
+ 3,
3835
+ 2,
3836
+ 5,
3837
+ 0,
3838
+ 5,
3839
+ 1,
3840
+ 5,
3841
+ 5,
3842
+ 1,
3843
+ 0,
3844
+ 5,
3845
+ 4,
3846
+ 7,
3847
+ 5,
3848
+ 2,
3849
+ 5,
3850
+ 5,
3851
+ 5,
3852
+ 3,
3853
+ 5,
3854
+ 7,
3855
+ 3,
3856
+ 5,
3857
+ 1,
3858
+ 1,
3859
+ 5,
3860
+ 5,
3861
+ 4,
3862
+ 3,
3863
+ 5,
3864
+ 5,
3865
+ 7,
3866
+ 5,
3867
+ 4,
3868
+ 1,
3869
+ 3,
3870
+ 2,
3871
+ 5,
3872
+ 5,
3873
+ 5,
3874
+ 5,
3875
+ 5,
3876
+ 5,
3877
+ 5,
3878
+ 5,
3879
+ 7,
3880
+ 1,
3881
+ 7,
3882
+ 0,
3883
+ 2,
3884
+ 7,
3885
+ 0,
3886
+ 7,
3887
+ 5,
3888
+ 5,
3889
+ 3,
3890
+ 0,
3891
+ 5,
3892
+ 5,
3893
+ 4,
3894
+ 5,
3895
+ 1
3896
+ ],
3897
+ "best_token_acc": [
3898
+ 0.0625,
3899
+ 0.1953125,
3900
+ 0.18359375,
3901
+ 0.140625,
3902
+ 0.15234375,
3903
+ 0.234375,
3904
+ 0.07421875,
3905
+ 0.25390625,
3906
+ 0.23828125,
3907
+ 0.08984375,
3908
+ 0.0859375,
3909
+ 0.22265625,
3910
+ 0.23046875,
3911
+ 0.078125,
3912
+ 0.0859375,
3913
+ 0.1484375,
3914
+ 0.32421875,
3915
+ 0.10546875,
3916
+ 0.0859375,
3917
+ 0.11328125,
3918
+ 0.1796875,
3919
+ 0.11328125,
3920
+ 0.07421875,
3921
+ 0.21484375,
3922
+ 0.078125,
3923
+ 0.16796875,
3924
+ 0.15625,
3925
+ 0.09375,
3926
+ 0.05859375,
3927
+ 0.40625,
3928
+ 0.1015625,
3929
+ 0.2421875,
3930
+ 0.12109375,
3931
+ 0.08984375,
3932
+ 0.08984375,
3933
+ 0.3984375,
3934
+ 0.34765625,
3935
+ 0.20703125,
3936
+ 0.2421875,
3937
+ 0.203125,
3938
+ 0.26171875,
3939
+ 0.1875,
3940
+ 0.09375,
3941
+ 0.11328125,
3942
+ 0.21484375,
3943
+ 0.1640625,
3944
+ 0.14453125,
3945
+ 0.0625,
3946
+ 0.19921875,
3947
+ 0.07421875,
3948
+ 0.23828125,
3949
+ 0.3046875,
3950
+ 0.08203125,
3951
+ 0.265625,
3952
+ 0.09765625,
3953
+ 0.06640625,
3954
+ 0.09375,
3955
+ 0.3125,
3956
+ 0.21875,
3957
+ 0.28515625,
3958
+ 0.0859375,
3959
+ 0.23046875,
3960
+ 0.16015625,
3961
+ 0.13671875
3962
+ ]
3963
+ }
3964
+ },
3965
+ "first_exact_by_run": {}
3966
+ }
3967
+ RESULT config=allcorrupt_fullvocab_dirC1_1024 ckpt_step=5000 views=2560000 token_acc=0.1685 exact=0/64 exact_refs=0 hits=[]
3968
+ [noise-pilot] continue config=allcorrupt_fullvocab_dirC1_1024 step=5000
3969
+ [noise-pilot] train config=allcorrupt_seqrand1_dirC1_1024 from=4000 to=5000 C=1.0->1024 seq_alpha=1.0 sampler=dirichlet
3970
+ [noise-pilot] eval config=allcorrupt_seqrand1_dirC1_1024 step=5000
3971
+ [eval-decode-acc] train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805 step=5000 soft=none
3972
+ [decode] max_len=256 generated=64/64
3973
+ {
3974
+ "num_rows": 1,
3975
+ "best_by_run": {
3976
+ "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805::none": {
3977
+ "run": "train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805",
3978
+ "checkpoint": "runs/train8_noisegeo_len256_allcorrupt_seqrand1_dirC1_1024_20260517_163805/step_0005000.pt",
3979
+ "ckpt_step": 5000,
3980
+ "endpoint_softening": "none",
3981
+ "decode_rule": "flowmap",
3982
+ "steps": 128,
3983
+ "time_schedule": "logit_normal",
3984
+ "model_t_mode": "post",
3985
+ "final_from": "state",
3986
+ "n_gen": 64,
3987
+ "n_refs": 8,
3988
+ "token_acc_mean": 0.0152587890625,
3989
+ "token_acc_min": 0.0078125,
3990
+ "token_acc_max": 0.0625,
3991
+ "exact_acc": 0.0,
3992
+ "exact_count": 0,
3993
+ "exact_ref_coverage": 0.0,
3994
+ "exact_ref_count": 0,
3995
+ "exact_ref_hits": [],
3996
+ "best_ref_idx": [
3997
+ 0,
3998
+ 1,
3999
+ 1,
4000
+ 1,
4001
+ 1,
4002
+ 1,
4003
+ 1,
4004
+ 5,
4005
+ 0,
4006
+ 1,
4007
+ 1,
4008
+ 1,
4009
+ 0,
4010
+ 1,
4011
+ 0,
4012
+ 0,
4013
+ 1,
4014
+ 0,
4015
+ 7,
4016
+ 1,
4017
+ 0,
4018
+ 1,
4019
+ 0,
4020
+ 0,
4021
+ 1,
4022
+ 1,
4023
+ 0,
4024
+ 1,
4025
+ 1,
4026
+ 1,
4027
+ 1,
4028
+ 0,
4029
+ 1,
4030
+ 1,
4031
+ 0,
4032
+ 0,
4033
+ 1,
4034
+ 1,
4035
+ 0,
4036
+ 1,
4037
+ 1,
4038
+ 0,
4039
+ 0,
4040
+ 1,
4041
+ 0,
4042
+ 0,
4043
+ 1,
4044
+ 0,
4045
+ 1,
4046
+ 1,
4047
+ 0,
4048
+ 0,
4049
+ 7,
4050
+ 1,
4051
+ 0,
4052
+ 1,
4053
+ 1,
4054
+ 1,
4055
+ 1,
4056
+ 1,
4057
+ 7,
4058
+ 1,
4059
+ 1,
4060
+ 1
4061
+ ],
4062
+ "best_token_acc": [
4063
+ 0.05078125,
4064
+ 0.0078125,
4065
+ 0.0078125,
4066
+ 0.0078125,
4067
+ 0.0078125,
4068
+ 0.0078125,
4069
+ 0.0078125,
4070
+ 0.01953125,
4071
+ 0.0078125,
4072
+ 0.0078125,
4073
+ 0.0078125,
4074
+ 0.0078125,
4075
+ 0.01171875,
4076
+ 0.0078125,
4077
+ 0.02734375,
4078
+ 0.046875,
4079
+ 0.0078125,
4080
+ 0.015625,
4081
+ 0.03125,
4082
+ 0.0078125,
4083
+ 0.0078125,
4084
+ 0.0078125,
4085
+ 0.0625,
4086
+ 0.0078125,
4087
+ 0.0078125,
4088
+ 0.0078125,
4089
+ 0.046875,
4090
+ 0.0078125,
4091
+ 0.0078125,
4092
+ 0.0078125,
4093
+ 0.0078125,
4094
+ 0.03125,
4095
+ 0.0078125,
4096
+ 0.0078125,
4097
+ 0.01953125,
4098
+ 0.01171875,
4099
+ 0.0078125,
4100
+ 0.0078125,
4101
+ 0.0078125,
4102
+ 0.0078125,
4103
+ 0.0078125,
4104
+ 0.0546875,
4105
+ 0.0078125,
4106
+ 0.0078125,
4107
+ 0.0078125,
4108
+ 0.01171875,
4109
+ 0.01171875,
4110
+ 0.0078125,
4111
+ 0.0078125,
4112
+ 0.01953125,
4113
+ 0.05078125,
4114
+ 0.01171875,
4115
+ 0.05859375,
4116
+ 0.01171875,
4117
+ 0.0078125,
4118
+ 0.0078125,
4119
+ 0.0078125,
4120
+ 0.01171875,
4121
+ 0.0078125,
4122
+ 0.0078125,
4123
+ 0.02734375,
4124
+ 0.0078125,
4125
+ 0.01171875,
4126
+ 0.0078125
4127
+ ]
4128
+ }
4129
+ },
4130
+ "first_exact_by_run": {}
4131
+ }
4132
+ RESULT config=allcorrupt_seqrand1_dirC1_1024 ckpt_step=5000 views=2560000 token_acc=0.0153 exact=0/64 exact_refs=0 hits=[]
4133
+ [noise-pilot] continue config=allcorrupt_seqrand1_dirC1_1024 step=5000
4134
+ [noise-pilot] train config=allcorrupt_highC64_4096 from=4000 to=5000 C=64->4096 seq_alpha=0.0 sampler=dirichlet
LTA_openwebtext_dualt/logs/noise_geometry_pilots_4gpu/current.nohup ADDED
The diff for this file is too large to render. See raw diff
 
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/__init__.py ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # This library is free software; you can redistribute it and/or
3
+ # modify it under the terms of the GNU Lesser General Public
4
+ # License as published by the Free Software Foundation; either
5
+ # version 2.1 of the License, or (at your option) any later version.
6
+ #
7
+ # This library is distributed in the hope that it will be useful,
8
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
9
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
10
+ # Lesser General Public License for more details.
11
+ #
12
+ # You should have received a copy of the GNU Lesser General Public
13
+ # License along with this library; if not, write to the Free Software
14
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
15
+ # 02110-1301 USA
16
+ ######################### END LICENSE BLOCK #########################
17
+
18
+ from typing import List, Union
19
+
20
+ from .charsetgroupprober import CharSetGroupProber
21
+ from .charsetprober import CharSetProber
22
+ from .enums import InputState
23
+ from .resultdict import ResultDict
24
+ from .universaldetector import UniversalDetector
25
+ from .version import VERSION, __version__
26
+
27
+ __all__ = ["UniversalDetector", "detect", "detect_all", "__version__", "VERSION"]
28
+
29
+
30
+ def detect(
31
+ byte_str: Union[bytes, bytearray], should_rename_legacy: bool = False
32
+ ) -> ResultDict:
33
+ """
34
+ Detect the encoding of the given byte string.
35
+
36
+ :param byte_str: The byte sequence to examine.
37
+ :type byte_str: ``bytes`` or ``bytearray``
38
+ :param should_rename_legacy: Should we rename legacy encodings
39
+ to their more modern equivalents?
40
+ :type should_rename_legacy: ``bool``
41
+ """
42
+ if not isinstance(byte_str, bytearray):
43
+ if not isinstance(byte_str, bytes):
44
+ raise TypeError(
45
+ f"Expected object of type bytes or bytearray, got: {type(byte_str)}"
46
+ )
47
+ byte_str = bytearray(byte_str)
48
+ detector = UniversalDetector(should_rename_legacy=should_rename_legacy)
49
+ detector.feed(byte_str)
50
+ return detector.close()
51
+
52
+
53
+ def detect_all(
54
+ byte_str: Union[bytes, bytearray],
55
+ ignore_threshold: bool = False,
56
+ should_rename_legacy: bool = False,
57
+ ) -> List[ResultDict]:
58
+ """
59
+ Detect all the possible encodings of the given byte string.
60
+
61
+ :param byte_str: The byte sequence to examine.
62
+ :type byte_str: ``bytes`` or ``bytearray``
63
+ :param ignore_threshold: Include encodings that are below
64
+ ``UniversalDetector.MINIMUM_THRESHOLD``
65
+ in results.
66
+ :type ignore_threshold: ``bool``
67
+ :param should_rename_legacy: Should we rename legacy encodings
68
+ to their more modern equivalents?
69
+ :type should_rename_legacy: ``bool``
70
+ """
71
+ if not isinstance(byte_str, bytearray):
72
+ if not isinstance(byte_str, bytes):
73
+ raise TypeError(
74
+ f"Expected object of type bytes or bytearray, got: {type(byte_str)}"
75
+ )
76
+ byte_str = bytearray(byte_str)
77
+
78
+ detector = UniversalDetector(should_rename_legacy=should_rename_legacy)
79
+ detector.feed(byte_str)
80
+ detector.close()
81
+
82
+ if detector.input_state == InputState.HIGH_BYTE:
83
+ results: List[ResultDict] = []
84
+ probers: List[CharSetProber] = []
85
+ for prober in detector.charset_probers:
86
+ if isinstance(prober, CharSetGroupProber):
87
+ probers.extend(p for p in prober.probers)
88
+ else:
89
+ probers.append(prober)
90
+ for prober in probers:
91
+ if ignore_threshold or prober.get_confidence() > detector.MINIMUM_THRESHOLD:
92
+ charset_name = prober.charset_name or ""
93
+ lower_charset_name = charset_name.lower()
94
+ # Use Windows encoding name instead of ISO-8859 if we saw any
95
+ # extra Windows-specific bytes
96
+ if lower_charset_name.startswith("iso-8859") and detector.has_win_bytes:
97
+ charset_name = detector.ISO_WIN_MAP.get(
98
+ lower_charset_name, charset_name
99
+ )
100
+ # Rename legacy encodings with superset encodings if asked
101
+ if should_rename_legacy:
102
+ charset_name = detector.LEGACY_MAP.get(
103
+ charset_name.lower(), charset_name
104
+ )
105
+ results.append(
106
+ {
107
+ "encoding": charset_name,
108
+ "confidence": prober.get_confidence(),
109
+ "language": prober.language,
110
+ }
111
+ )
112
+ if len(results) > 0:
113
+ return sorted(results, key=lambda result: -result["confidence"])
114
+
115
+ return [detector.result]
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/big5freq.py ADDED
@@ -0,0 +1,386 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Communicator client code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ # Big5 frequency table
29
+ # by Taiwan's Mandarin Promotion Council
30
+ # <http://www.edu.tw:81/mandr/>
31
+ #
32
+ # 128 --> 0.42261
33
+ # 256 --> 0.57851
34
+ # 512 --> 0.74851
35
+ # 1024 --> 0.89384
36
+ # 2048 --> 0.97583
37
+ #
38
+ # Ideal Distribution Ratio = 0.74851/(1-0.74851) =2.98
39
+ # Random Distribution Ration = 512/(5401-512)=0.105
40
+ #
41
+ # Typical Distribution Ratio about 25% of Ideal one, still much higher than RDR
42
+
43
+ BIG5_TYPICAL_DISTRIBUTION_RATIO = 0.75
44
+
45
+ # Char to FreqOrder table
46
+ BIG5_TABLE_SIZE = 5376
47
+ # fmt: off
48
+ BIG5_CHAR_TO_FREQ_ORDER = (
49
+ 1,1801,1506, 255,1431, 198, 9, 82, 6,5008, 177, 202,3681,1256,2821, 110, # 16
50
+ 3814, 33,3274, 261, 76, 44,2114, 16,2946,2187,1176, 659,3971, 26,3451,2653, # 32
51
+ 1198,3972,3350,4202, 410,2215, 302, 590, 361,1964, 8, 204, 58,4510,5009,1932, # 48
52
+ 63,5010,5011, 317,1614, 75, 222, 159,4203,2417,1480,5012,3555,3091, 224,2822, # 64
53
+ 3682, 3, 10,3973,1471, 29,2787,1135,2866,1940, 873, 130,3275,1123, 312,5013, # 80
54
+ 4511,2052, 507, 252, 682,5014, 142,1915, 124, 206,2947, 34,3556,3204, 64, 604, # 96
55
+ 5015,2501,1977,1978, 155,1991, 645, 641,1606,5016,3452, 337, 72, 406,5017, 80, # 112
56
+ 630, 238,3205,1509, 263, 939,1092,2654, 756,1440,1094,3453, 449, 69,2987, 591, # 128
57
+ 179,2096, 471, 115,2035,1844, 60, 50,2988, 134, 806,1869, 734,2036,3454, 180, # 144
58
+ 995,1607, 156, 537,2907, 688,5018, 319,1305, 779,2145, 514,2379, 298,4512, 359, # 160
59
+ 2502, 90,2716,1338, 663, 11, 906,1099,2553, 20,2441, 182, 532,1716,5019, 732, # 176
60
+ 1376,4204,1311,1420,3206, 25,2317,1056, 113, 399, 382,1950, 242,3455,2474, 529, # 192
61
+ 3276, 475,1447,3683,5020, 117, 21, 656, 810,1297,2300,2334,3557,5021, 126,4205, # 208
62
+ 706, 456, 150, 613,4513, 71,1118,2037,4206, 145,3092, 85, 835, 486,2115,1246, # 224
63
+ 1426, 428, 727,1285,1015, 800, 106, 623, 303,1281,5022,2128,2359, 347,3815, 221, # 240
64
+ 3558,3135,5023,1956,1153,4207, 83, 296,1199,3093, 192, 624, 93,5024, 822,1898, # 256
65
+ 2823,3136, 795,2065, 991,1554,1542,1592, 27, 43,2867, 859, 139,1456, 860,4514, # 272
66
+ 437, 712,3974, 164,2397,3137, 695, 211,3037,2097, 195,3975,1608,3559,3560,3684, # 288
67
+ 3976, 234, 811,2989,2098,3977,2233,1441,3561,1615,2380, 668,2077,1638, 305, 228, # 304
68
+ 1664,4515, 467, 415,5025, 262,2099,1593, 239, 108, 300, 200,1033, 512,1247,2078, # 320
69
+ 5026,5027,2176,3207,3685,2682, 593, 845,1062,3277, 88,1723,2038,3978,1951, 212, # 336
70
+ 266, 152, 149, 468,1899,4208,4516, 77, 187,5028,3038, 37, 5,2990,5029,3979, # 352
71
+ 5030,5031, 39,2524,4517,2908,3208,2079, 55, 148, 74,4518, 545, 483,1474,1029, # 368
72
+ 1665, 217,1870,1531,3138,1104,2655,4209, 24, 172,3562, 900,3980,3563,3564,4519, # 384
73
+ 32,1408,2824,1312, 329, 487,2360,2251,2717, 784,2683, 4,3039,3351,1427,1789, # 400
74
+ 188, 109, 499,5032,3686,1717,1790, 888,1217,3040,4520,5033,3565,5034,3352,1520, # 416
75
+ 3687,3981, 196,1034, 775,5035,5036, 929,1816, 249, 439, 38,5037,1063,5038, 794, # 432
76
+ 3982,1435,2301, 46, 178,3278,2066,5039,2381,5040, 214,1709,4521, 804, 35, 707, # 448
77
+ 324,3688,1601,2554, 140, 459,4210,5041,5042,1365, 839, 272, 978,2262,2580,3456, # 464
78
+ 2129,1363,3689,1423, 697, 100,3094, 48, 70,1231, 495,3139,2196,5043,1294,5044, # 480
79
+ 2080, 462, 586,1042,3279, 853, 256, 988, 185,2382,3457,1698, 434,1084,5045,3458, # 496
80
+ 314,2625,2788,4522,2335,2336, 569,2285, 637,1817,2525, 757,1162,1879,1616,3459, # 512
81
+ 287,1577,2116, 768,4523,1671,2868,3566,2526,1321,3816, 909,2418,5046,4211, 933, # 528
82
+ 3817,4212,2053,2361,1222,4524, 765,2419,1322, 786,4525,5047,1920,1462,1677,2909, # 544
83
+ 1699,5048,4526,1424,2442,3140,3690,2600,3353,1775,1941,3460,3983,4213, 309,1369, # 560
84
+ 1130,2825, 364,2234,1653,1299,3984,3567,3985,3986,2656, 525,1085,3041, 902,2001, # 576
85
+ 1475, 964,4527, 421,1845,1415,1057,2286, 940,1364,3141, 376,4528,4529,1381, 7, # 592
86
+ 2527, 983,2383, 336,1710,2684,1846, 321,3461, 559,1131,3042,2752,1809,1132,1313, # 608
87
+ 265,1481,1858,5049, 352,1203,2826,3280, 167,1089, 420,2827, 776, 792,1724,3568, # 624
88
+ 4214,2443,3281,5050,4215,5051, 446, 229, 333,2753, 901,3818,1200,1557,4530,2657, # 640
89
+ 1921, 395,2754,2685,3819,4216,1836, 125, 916,3209,2626,4531,5052,5053,3820,5054, # 656
90
+ 5055,5056,4532,3142,3691,1133,2555,1757,3462,1510,2318,1409,3569,5057,2146, 438, # 672
91
+ 2601,2910,2384,3354,1068, 958,3043, 461, 311,2869,2686,4217,1916,3210,4218,1979, # 688
92
+ 383, 750,2755,2627,4219, 274, 539, 385,1278,1442,5058,1154,1965, 384, 561, 210, # 704
93
+ 98,1295,2556,3570,5059,1711,2420,1482,3463,3987,2911,1257, 129,5060,3821, 642, # 720
94
+ 523,2789,2790,2658,5061, 141,2235,1333, 68, 176, 441, 876, 907,4220, 603,2602, # 736
95
+ 710, 171,3464, 404, 549, 18,3143,2398,1410,3692,1666,5062,3571,4533,2912,4534, # 752
96
+ 5063,2991, 368,5064, 146, 366, 99, 871,3693,1543, 748, 807,1586,1185, 22,2263, # 768
97
+ 379,3822,3211,5065,3212, 505,1942,2628,1992,1382,2319,5066, 380,2362, 218, 702, # 784
98
+ 1818,1248,3465,3044,3572,3355,3282,5067,2992,3694, 930,3283,3823,5068, 59,5069, # 800
99
+ 585, 601,4221, 497,3466,1112,1314,4535,1802,5070,1223,1472,2177,5071, 749,1837, # 816
100
+ 690,1900,3824,1773,3988,1476, 429,1043,1791,2236,2117, 917,4222, 447,1086,1629, # 832
101
+ 5072, 556,5073,5074,2021,1654, 844,1090, 105, 550, 966,1758,2828,1008,1783, 686, # 848
102
+ 1095,5075,2287, 793,1602,5076,3573,2603,4536,4223,2948,2302,4537,3825, 980,2503, # 864
103
+ 544, 353, 527,4538, 908,2687,2913,5077, 381,2629,1943,1348,5078,1341,1252, 560, # 880
104
+ 3095,5079,3467,2870,5080,2054, 973, 886,2081, 143,4539,5081,5082, 157,3989, 496, # 896
105
+ 4224, 57, 840, 540,2039,4540,4541,3468,2118,1445, 970,2264,1748,1966,2082,4225, # 912
106
+ 3144,1234,1776,3284,2829,3695, 773,1206,2130,1066,2040,1326,3990,1738,1725,4226, # 928
107
+ 279,3145, 51,1544,2604, 423,1578,2131,2067, 173,4542,1880,5083,5084,1583, 264, # 944
108
+ 610,3696,4543,2444, 280, 154,5085,5086,5087,1739, 338,1282,3096, 693,2871,1411, # 960
109
+ 1074,3826,2445,5088,4544,5089,5090,1240, 952,2399,5091,2914,1538,2688, 685,1483, # 976
110
+ 4227,2475,1436, 953,4228,2055,4545, 671,2400, 79,4229,2446,3285, 608, 567,2689, # 992
111
+ 3469,4230,4231,1691, 393,1261,1792,2401,5092,4546,5093,5094,5095,5096,1383,1672, # 1008
112
+ 3827,3213,1464, 522,1119, 661,1150, 216, 675,4547,3991,1432,3574, 609,4548,2690, # 1024
113
+ 2402,5097,5098,5099,4232,3045, 0,5100,2476, 315, 231,2447, 301,3356,4549,2385, # 1040
114
+ 5101, 233,4233,3697,1819,4550,4551,5102, 96,1777,1315,2083,5103, 257,5104,1810, # 1056
115
+ 3698,2718,1139,1820,4234,2022,1124,2164,2791,1778,2659,5105,3097, 363,1655,3214, # 1072
116
+ 5106,2993,5107,5108,5109,3992,1567,3993, 718, 103,3215, 849,1443, 341,3357,2949, # 1088
117
+ 1484,5110,1712, 127, 67, 339,4235,2403, 679,1412, 821,5111,5112, 834, 738, 351, # 1104
118
+ 2994,2147, 846, 235,1497,1881, 418,1993,3828,2719, 186,1100,2148,2756,3575,1545, # 1120
119
+ 1355,2950,2872,1377, 583,3994,4236,2581,2995,5113,1298,3699,1078,2557,3700,2363, # 1136
120
+ 78,3829,3830, 267,1289,2100,2002,1594,4237, 348, 369,1274,2197,2178,1838,4552, # 1152
121
+ 1821,2830,3701,2757,2288,2003,4553,2951,2758, 144,3358, 882,4554,3995,2759,3470, # 1168
122
+ 4555,2915,5114,4238,1726, 320,5115,3996,3046, 788,2996,5116,2831,1774,1327,2873, # 1184
123
+ 3997,2832,5117,1306,4556,2004,1700,3831,3576,2364,2660, 787,2023, 506, 824,3702, # 1200
124
+ 534, 323,4557,1044,3359,2024,1901, 946,3471,5118,1779,1500,1678,5119,1882,4558, # 1216
125
+ 165, 243,4559,3703,2528, 123, 683,4239, 764,4560, 36,3998,1793, 589,2916, 816, # 1232
126
+ 626,1667,3047,2237,1639,1555,1622,3832,3999,5120,4000,2874,1370,1228,1933, 891, # 1248
127
+ 2084,2917, 304,4240,5121, 292,2997,2720,3577, 691,2101,4241,1115,4561, 118, 662, # 1264
128
+ 5122, 611,1156, 854,2386,1316,2875, 2, 386, 515,2918,5123,5124,3286, 868,2238, # 1280
129
+ 1486, 855,2661, 785,2216,3048,5125,1040,3216,3578,5126,3146, 448,5127,1525,5128, # 1296
130
+ 2165,4562,5129,3833,5130,4242,2833,3579,3147, 503, 818,4001,3148,1568, 814, 676, # 1312
131
+ 1444, 306,1749,5131,3834,1416,1030, 197,1428, 805,2834,1501,4563,5132,5133,5134, # 1328
132
+ 1994,5135,4564,5136,5137,2198, 13,2792,3704,2998,3149,1229,1917,5138,3835,2132, # 1344
133
+ 5139,4243,4565,2404,3580,5140,2217,1511,1727,1120,5141,5142, 646,3836,2448, 307, # 1360
134
+ 5143,5144,1595,3217,5145,5146,5147,3705,1113,1356,4002,1465,2529,2530,5148, 519, # 1376
135
+ 5149, 128,2133, 92,2289,1980,5150,4003,1512, 342,3150,2199,5151,2793,2218,1981, # 1392
136
+ 3360,4244, 290,1656,1317, 789, 827,2365,5152,3837,4566, 562, 581,4004,5153, 401, # 1408
137
+ 4567,2252, 94,4568,5154,1399,2794,5155,1463,2025,4569,3218,1944,5156, 828,1105, # 1424
138
+ 4245,1262,1394,5157,4246, 605,4570,5158,1784,2876,5159,2835, 819,2102, 578,2200, # 1440
139
+ 2952,5160,1502, 436,3287,4247,3288,2836,4005,2919,3472,3473,5161,2721,2320,5162, # 1456
140
+ 5163,2337,2068, 23,4571, 193, 826,3838,2103, 699,1630,4248,3098, 390,1794,1064, # 1472
141
+ 3581,5164,1579,3099,3100,1400,5165,4249,1839,1640,2877,5166,4572,4573, 137,4250, # 1488
142
+ 598,3101,1967, 780, 104, 974,2953,5167, 278, 899, 253, 402, 572, 504, 493,1339, # 1504
143
+ 5168,4006,1275,4574,2582,2558,5169,3706,3049,3102,2253, 565,1334,2722, 863, 41, # 1520
144
+ 5170,5171,4575,5172,1657,2338, 19, 463,2760,4251, 606,5173,2999,3289,1087,2085, # 1536
145
+ 1323,2662,3000,5174,1631,1623,1750,4252,2691,5175,2878, 791,2723,2663,2339, 232, # 1552
146
+ 2421,5176,3001,1498,5177,2664,2630, 755,1366,3707,3290,3151,2026,1609, 119,1918, # 1568
147
+ 3474, 862,1026,4253,5178,4007,3839,4576,4008,4577,2265,1952,2477,5179,1125, 817, # 1584
148
+ 4254,4255,4009,1513,1766,2041,1487,4256,3050,3291,2837,3840,3152,5180,5181,1507, # 1600
149
+ 5182,2692, 733, 40,1632,1106,2879, 345,4257, 841,2531, 230,4578,3002,1847,3292, # 1616
150
+ 3475,5183,1263, 986,3476,5184, 735, 879, 254,1137, 857, 622,1300,1180,1388,1562, # 1632
151
+ 4010,4011,2954, 967,2761,2665,1349, 592,2134,1692,3361,3003,1995,4258,1679,4012, # 1648
152
+ 1902,2188,5185, 739,3708,2724,1296,1290,5186,4259,2201,2202,1922,1563,2605,2559, # 1664
153
+ 1871,2762,3004,5187, 435,5188, 343,1108, 596, 17,1751,4579,2239,3477,3709,5189, # 1680
154
+ 4580, 294,3582,2955,1693, 477, 979, 281,2042,3583, 643,2043,3710,2631,2795,2266, # 1696
155
+ 1031,2340,2135,2303,3584,4581, 367,1249,2560,5190,3585,5191,4582,1283,3362,2005, # 1712
156
+ 240,1762,3363,4583,4584, 836,1069,3153, 474,5192,2149,2532, 268,3586,5193,3219, # 1728
157
+ 1521,1284,5194,1658,1546,4260,5195,3587,3588,5196,4261,3364,2693,1685,4262, 961, # 1744
158
+ 1673,2632, 190,2006,2203,3841,4585,4586,5197, 570,2504,3711,1490,5198,4587,2633, # 1760
159
+ 3293,1957,4588, 584,1514, 396,1045,1945,5199,4589,1968,2449,5200,5201,4590,4013, # 1776
160
+ 619,5202,3154,3294, 215,2007,2796,2561,3220,4591,3221,4592, 763,4263,3842,4593, # 1792
161
+ 5203,5204,1958,1767,2956,3365,3712,1174, 452,1477,4594,3366,3155,5205,2838,1253, # 1808
162
+ 2387,2189,1091,2290,4264, 492,5206, 638,1169,1825,2136,1752,4014, 648, 926,1021, # 1824
163
+ 1324,4595, 520,4596, 997, 847,1007, 892,4597,3843,2267,1872,3713,2405,1785,4598, # 1840
164
+ 1953,2957,3103,3222,1728,4265,2044,3714,4599,2008,1701,3156,1551, 30,2268,4266, # 1856
165
+ 5207,2027,4600,3589,5208, 501,5209,4267, 594,3478,2166,1822,3590,3479,3591,3223, # 1872
166
+ 829,2839,4268,5210,1680,3157,1225,4269,5211,3295,4601,4270,3158,2341,5212,4602, # 1888
167
+ 4271,5213,4015,4016,5214,1848,2388,2606,3367,5215,4603, 374,4017, 652,4272,4273, # 1904
168
+ 375,1140, 798,5216,5217,5218,2366,4604,2269, 546,1659, 138,3051,2450,4605,5219, # 1920
169
+ 2254, 612,1849, 910, 796,3844,1740,1371, 825,3845,3846,5220,2920,2562,5221, 692, # 1936
170
+ 444,3052,2634, 801,4606,4274,5222,1491, 244,1053,3053,4275,4276, 340,5223,4018, # 1952
171
+ 1041,3005, 293,1168, 87,1357,5224,1539, 959,5225,2240, 721, 694,4277,3847, 219, # 1968
172
+ 1478, 644,1417,3368,2666,1413,1401,1335,1389,4019,5226,5227,3006,2367,3159,1826, # 1984
173
+ 730,1515, 184,2840, 66,4607,5228,1660,2958, 246,3369, 378,1457, 226,3480, 975, # 2000
174
+ 4020,2959,1264,3592, 674, 696,5229, 163,5230,1141,2422,2167, 713,3593,3370,4608, # 2016
175
+ 4021,5231,5232,1186, 15,5233,1079,1070,5234,1522,3224,3594, 276,1050,2725, 758, # 2032
176
+ 1126, 653,2960,3296,5235,2342, 889,3595,4022,3104,3007, 903,1250,4609,4023,3481, # 2048
177
+ 3596,1342,1681,1718, 766,3297, 286, 89,2961,3715,5236,1713,5237,2607,3371,3008, # 2064
178
+ 5238,2962,2219,3225,2880,5239,4610,2505,2533, 181, 387,1075,4024, 731,2190,3372, # 2080
179
+ 5240,3298, 310, 313,3482,2304, 770,4278, 54,3054, 189,4611,3105,3848,4025,5241, # 2096
180
+ 1230,1617,1850, 355,3597,4279,4612,3373, 111,4280,3716,1350,3160,3483,3055,4281, # 2112
181
+ 2150,3299,3598,5242,2797,4026,4027,3009, 722,2009,5243,1071, 247,1207,2343,2478, # 2128
182
+ 1378,4613,2010, 864,1437,1214,4614, 373,3849,1142,2220, 667,4615, 442,2763,2563, # 2144
183
+ 3850,4028,1969,4282,3300,1840, 837, 170,1107, 934,1336,1883,5244,5245,2119,4283, # 2160
184
+ 2841, 743,1569,5246,4616,4284, 582,2389,1418,3484,5247,1803,5248, 357,1395,1729, # 2176
185
+ 3717,3301,2423,1564,2241,5249,3106,3851,1633,4617,1114,2086,4285,1532,5250, 482, # 2192
186
+ 2451,4618,5251,5252,1492, 833,1466,5253,2726,3599,1641,2842,5254,1526,1272,3718, # 2208
187
+ 4286,1686,1795, 416,2564,1903,1954,1804,5255,3852,2798,3853,1159,2321,5256,2881, # 2224
188
+ 4619,1610,1584,3056,2424,2764, 443,3302,1163,3161,5257,5258,4029,5259,4287,2506, # 2240
189
+ 3057,4620,4030,3162,2104,1647,3600,2011,1873,4288,5260,4289, 431,3485,5261, 250, # 2256
190
+ 97, 81,4290,5262,1648,1851,1558, 160, 848,5263, 866, 740,1694,5264,2204,2843, # 2272
191
+ 3226,4291,4621,3719,1687, 950,2479, 426, 469,3227,3720,3721,4031,5265,5266,1188, # 2288
192
+ 424,1996, 861,3601,4292,3854,2205,2694, 168,1235,3602,4293,5267,2087,1674,4622, # 2304
193
+ 3374,3303, 220,2565,1009,5268,3855, 670,3010, 332,1208, 717,5269,5270,3603,2452, # 2320
194
+ 4032,3375,5271, 513,5272,1209,2882,3376,3163,4623,1080,5273,5274,5275,5276,2534, # 2336
195
+ 3722,3604, 815,1587,4033,4034,5277,3605,3486,3856,1254,4624,1328,3058,1390,4035, # 2352
196
+ 1741,4036,3857,4037,5278, 236,3858,2453,3304,5279,5280,3723,3859,1273,3860,4625, # 2368
197
+ 5281, 308,5282,4626, 245,4627,1852,2480,1307,2583, 430, 715,2137,2454,5283, 270, # 2384
198
+ 199,2883,4038,5284,3606,2727,1753, 761,1754, 725,1661,1841,4628,3487,3724,5285, # 2400
199
+ 5286, 587, 14,3305, 227,2608, 326, 480,2270, 943,2765,3607, 291, 650,1884,5287, # 2416
200
+ 1702,1226, 102,1547, 62,3488, 904,4629,3489,1164,4294,5288,5289,1224,1548,2766, # 2432
201
+ 391, 498,1493,5290,1386,1419,5291,2056,1177,4630, 813, 880,1081,2368, 566,1145, # 2448
202
+ 4631,2291,1001,1035,2566,2609,2242, 394,1286,5292,5293,2069,5294, 86,1494,1730, # 2464
203
+ 4039, 491,1588, 745, 897,2963, 843,3377,4040,2767,2884,3306,1768, 998,2221,2070, # 2480
204
+ 397,1827,1195,1970,3725,3011,3378, 284,5295,3861,2507,2138,2120,1904,5296,4041, # 2496
205
+ 2151,4042,4295,1036,3490,1905, 114,2567,4296, 209,1527,5297,5298,2964,2844,2635, # 2512
206
+ 2390,2728,3164, 812,2568,5299,3307,5300,1559, 737,1885,3726,1210, 885, 28,2695, # 2528
207
+ 3608,3862,5301,4297,1004,1780,4632,5302, 346,1982,2222,2696,4633,3863,1742, 797, # 2544
208
+ 1642,4043,1934,1072,1384,2152, 896,4044,3308,3727,3228,2885,3609,5303,2569,1959, # 2560
209
+ 4634,2455,1786,5304,5305,5306,4045,4298,1005,1308,3728,4299,2729,4635,4636,1528, # 2576
210
+ 2610, 161,1178,4300,1983, 987,4637,1101,4301, 631,4046,1157,3229,2425,1343,1241, # 2592
211
+ 1016,2243,2570, 372, 877,2344,2508,1160, 555,1935, 911,4047,5307, 466,1170, 169, # 2608
212
+ 1051,2921,2697,3729,2481,3012,1182,2012,2571,1251,2636,5308, 992,2345,3491,1540, # 2624
213
+ 2730,1201,2071,2406,1997,2482,5309,4638, 528,1923,2191,1503,1874,1570,2369,3379, # 2640
214
+ 3309,5310, 557,1073,5311,1828,3492,2088,2271,3165,3059,3107, 767,3108,2799,4639, # 2656
215
+ 1006,4302,4640,2346,1267,2179,3730,3230, 778,4048,3231,2731,1597,2667,5312,4641, # 2672
216
+ 5313,3493,5314,5315,5316,3310,2698,1433,3311, 131, 95,1504,4049, 723,4303,3166, # 2688
217
+ 1842,3610,2768,2192,4050,2028,2105,3731,5317,3013,4051,1218,5318,3380,3232,4052, # 2704
218
+ 4304,2584, 248,1634,3864, 912,5319,2845,3732,3060,3865, 654, 53,5320,3014,5321, # 2720
219
+ 1688,4642, 777,3494,1032,4053,1425,5322, 191, 820,2121,2846, 971,4643, 931,3233, # 2736
220
+ 135, 664, 783,3866,1998, 772,2922,1936,4054,3867,4644,2923,3234, 282,2732, 640, # 2752
221
+ 1372,3495,1127, 922, 325,3381,5323,5324, 711,2045,5325,5326,4055,2223,2800,1937, # 2768
222
+ 4056,3382,2224,2255,3868,2305,5327,4645,3869,1258,3312,4057,3235,2139,2965,4058, # 2784
223
+ 4059,5328,2225, 258,3236,4646, 101,1227,5329,3313,1755,5330,1391,3314,5331,2924, # 2800
224
+ 2057, 893,5332,5333,5334,1402,4305,2347,5335,5336,3237,3611,5337,5338, 878,1325, # 2816
225
+ 1781,2801,4647, 259,1385,2585, 744,1183,2272,4648,5339,4060,2509,5340, 684,1024, # 2832
226
+ 4306,5341, 472,3612,3496,1165,3315,4061,4062, 322,2153, 881, 455,1695,1152,1340, # 2848
227
+ 660, 554,2154,4649,1058,4650,4307, 830,1065,3383,4063,4651,1924,5342,1703,1919, # 2864
228
+ 5343, 932,2273, 122,5344,4652, 947, 677,5345,3870,2637, 297,1906,1925,2274,4653, # 2880
229
+ 2322,3316,5346,5347,4308,5348,4309, 84,4310, 112, 989,5349, 547,1059,4064, 701, # 2896
230
+ 3613,1019,5350,4311,5351,3497, 942, 639, 457,2306,2456, 993,2966, 407, 851, 494, # 2912
231
+ 4654,3384, 927,5352,1237,5353,2426,3385, 573,4312, 680, 921,2925,1279,1875, 285, # 2928
232
+ 790,1448,1984, 719,2168,5354,5355,4655,4065,4066,1649,5356,1541, 563,5357,1077, # 2944
233
+ 5358,3386,3061,3498, 511,3015,4067,4068,3733,4069,1268,2572,3387,3238,4656,4657, # 2960
234
+ 5359, 535,1048,1276,1189,2926,2029,3167,1438,1373,2847,2967,1134,2013,5360,4313, # 2976
235
+ 1238,2586,3109,1259,5361, 700,5362,2968,3168,3734,4314,5363,4315,1146,1876,1907, # 2992
236
+ 4658,2611,4070, 781,2427, 132,1589, 203, 147, 273,2802,2407, 898,1787,2155,4071, # 3008
237
+ 4072,5364,3871,2803,5365,5366,4659,4660,5367,3239,5368,1635,3872, 965,5369,1805, # 3024
238
+ 2699,1516,3614,1121,1082,1329,3317,4073,1449,3873, 65,1128,2848,2927,2769,1590, # 3040
239
+ 3874,5370,5371, 12,2668, 45, 976,2587,3169,4661, 517,2535,1013,1037,3240,5372, # 3056
240
+ 3875,2849,5373,3876,5374,3499,5375,2612, 614,1999,2323,3877,3110,2733,2638,5376, # 3072
241
+ 2588,4316, 599,1269,5377,1811,3735,5378,2700,3111, 759,1060, 489,1806,3388,3318, # 3088
242
+ 1358,5379,5380,2391,1387,1215,2639,2256, 490,5381,5382,4317,1759,2392,2348,5383, # 3104
243
+ 4662,3878,1908,4074,2640,1807,3241,4663,3500,3319,2770,2349, 874,5384,5385,3501, # 3120
244
+ 3736,1859, 91,2928,3737,3062,3879,4664,5386,3170,4075,2669,5387,3502,1202,1403, # 3136
245
+ 3880,2969,2536,1517,2510,4665,3503,2511,5388,4666,5389,2701,1886,1495,1731,4076, # 3152
246
+ 2370,4667,5390,2030,5391,5392,4077,2702,1216, 237,2589,4318,2324,4078,3881,4668, # 3168
247
+ 4669,2703,3615,3504, 445,4670,5393,5394,5395,5396,2771, 61,4079,3738,1823,4080, # 3184
248
+ 5397, 687,2046, 935, 925, 405,2670, 703,1096,1860,2734,4671,4081,1877,1367,2704, # 3200
249
+ 3389, 918,2106,1782,2483, 334,3320,1611,1093,4672, 564,3171,3505,3739,3390, 945, # 3216
250
+ 2641,2058,4673,5398,1926, 872,4319,5399,3506,2705,3112, 349,4320,3740,4082,4674, # 3232
251
+ 3882,4321,3741,2156,4083,4675,4676,4322,4677,2408,2047, 782,4084, 400, 251,4323, # 3248
252
+ 1624,5400,5401, 277,3742, 299,1265, 476,1191,3883,2122,4324,4325,1109, 205,5402, # 3264
253
+ 2590,1000,2157,3616,1861,5403,5404,5405,4678,5406,4679,2573, 107,2484,2158,4085, # 3280
254
+ 3507,3172,5407,1533, 541,1301, 158, 753,4326,2886,3617,5408,1696, 370,1088,4327, # 3296
255
+ 4680,3618, 579, 327, 440, 162,2244, 269,1938,1374,3508, 968,3063, 56,1396,3113, # 3312
256
+ 2107,3321,3391,5409,1927,2159,4681,3016,5410,3619,5411,5412,3743,4682,2485,5413, # 3328
257
+ 2804,5414,1650,4683,5415,2613,5416,5417,4086,2671,3392,1149,3393,4087,3884,4088, # 3344
258
+ 5418,1076, 49,5419, 951,3242,3322,3323, 450,2850, 920,5420,1812,2805,2371,4328, # 3360
259
+ 1909,1138,2372,3885,3509,5421,3243,4684,1910,1147,1518,2428,4685,3886,5422,4686, # 3376
260
+ 2393,2614, 260,1796,3244,5423,5424,3887,3324, 708,5425,3620,1704,5426,3621,1351, # 3392
261
+ 1618,3394,3017,1887, 944,4329,3395,4330,3064,3396,4331,5427,3744, 422, 413,1714, # 3408
262
+ 3325, 500,2059,2350,4332,2486,5428,1344,1911, 954,5429,1668,5430,5431,4089,2409, # 3424
263
+ 4333,3622,3888,4334,5432,2307,1318,2512,3114, 133,3115,2887,4687, 629, 31,2851, # 3440
264
+ 2706,3889,4688, 850, 949,4689,4090,2970,1732,2089,4335,1496,1853,5433,4091, 620, # 3456
265
+ 3245, 981,1242,3745,3397,1619,3746,1643,3326,2140,2457,1971,1719,3510,2169,5434, # 3472
266
+ 3246,5435,5436,3398,1829,5437,1277,4690,1565,2048,5438,1636,3623,3116,5439, 869, # 3488
267
+ 2852, 655,3890,3891,3117,4092,3018,3892,1310,3624,4691,5440,5441,5442,1733, 558, # 3504
268
+ 4692,3747, 335,1549,3065,1756,4336,3748,1946,3511,1830,1291,1192, 470,2735,2108, # 3520
269
+ 2806, 913,1054,4093,5443,1027,5444,3066,4094,4693, 982,2672,3399,3173,3512,3247, # 3536
270
+ 3248,1947,2807,5445, 571,4694,5446,1831,5447,3625,2591,1523,2429,5448,2090, 984, # 3552
271
+ 4695,3749,1960,5449,3750, 852, 923,2808,3513,3751, 969,1519, 999,2049,2325,1705, # 3568
272
+ 5450,3118, 615,1662, 151, 597,4095,2410,2326,1049, 275,4696,3752,4337, 568,3753, # 3584
273
+ 3626,2487,4338,3754,5451,2430,2275, 409,3249,5452,1566,2888,3514,1002, 769,2853, # 3600
274
+ 194,2091,3174,3755,2226,3327,4339, 628,1505,5453,5454,1763,2180,3019,4096, 521, # 3616
275
+ 1161,2592,1788,2206,2411,4697,4097,1625,4340,4341, 412, 42,3119, 464,5455,2642, # 3632
276
+ 4698,3400,1760,1571,2889,3515,2537,1219,2207,3893,2643,2141,2373,4699,4700,3328, # 3648
277
+ 1651,3401,3627,5456,5457,3628,2488,3516,5458,3756,5459,5460,2276,2092, 460,5461, # 3664
278
+ 4701,5462,3020, 962, 588,3629, 289,3250,2644,1116, 52,5463,3067,1797,5464,5465, # 3680
279
+ 5466,1467,5467,1598,1143,3757,4342,1985,1734,1067,4702,1280,3402, 465,4703,1572, # 3696
280
+ 510,5468,1928,2245,1813,1644,3630,5469,4704,3758,5470,5471,2673,1573,1534,5472, # 3712
281
+ 5473, 536,1808,1761,3517,3894,3175,2645,5474,5475,5476,4705,3518,2929,1912,2809, # 3728
282
+ 5477,3329,1122, 377,3251,5478, 360,5479,5480,4343,1529, 551,5481,2060,3759,1769, # 3744
283
+ 2431,5482,2930,4344,3330,3120,2327,2109,2031,4706,1404, 136,1468,1479, 672,1171, # 3760
284
+ 3252,2308, 271,3176,5483,2772,5484,2050, 678,2736, 865,1948,4707,5485,2014,4098, # 3776
285
+ 2971,5486,2737,2227,1397,3068,3760,4708,4709,1735,2931,3403,3631,5487,3895, 509, # 3792
286
+ 2854,2458,2890,3896,5488,5489,3177,3178,4710,4345,2538,4711,2309,1166,1010, 552, # 3808
287
+ 681,1888,5490,5491,2972,2973,4099,1287,1596,1862,3179, 358, 453, 736, 175, 478, # 3824
288
+ 1117, 905,1167,1097,5492,1854,1530,5493,1706,5494,2181,3519,2292,3761,3520,3632, # 3840
289
+ 4346,2093,4347,5495,3404,1193,2489,4348,1458,2193,2208,1863,1889,1421,3331,2932, # 3856
290
+ 3069,2182,3521, 595,2123,5496,4100,5497,5498,4349,1707,2646, 223,3762,1359, 751, # 3872
291
+ 3121, 183,3522,5499,2810,3021, 419,2374, 633, 704,3897,2394, 241,5500,5501,5502, # 3888
292
+ 838,3022,3763,2277,2773,2459,3898,1939,2051,4101,1309,3122,2246,1181,5503,1136, # 3904
293
+ 2209,3899,2375,1446,4350,2310,4712,5504,5505,4351,1055,2615, 484,3764,5506,4102, # 3920
294
+ 625,4352,2278,3405,1499,4353,4103,5507,4104,4354,3253,2279,2280,3523,5508,5509, # 3936
295
+ 2774, 808,2616,3765,3406,4105,4355,3123,2539, 526,3407,3900,4356, 955,5510,1620, # 3952
296
+ 4357,2647,2432,5511,1429,3766,1669,1832, 994, 928,5512,3633,1260,5513,5514,5515, # 3968
297
+ 1949,2293, 741,2933,1626,4358,2738,2460, 867,1184, 362,3408,1392,5516,5517,4106, # 3984
298
+ 4359,1770,1736,3254,2934,4713,4714,1929,2707,1459,1158,5518,3070,3409,2891,1292, # 4000
299
+ 1930,2513,2855,3767,1986,1187,2072,2015,2617,4360,5519,2574,2514,2170,3768,2490, # 4016
300
+ 3332,5520,3769,4715,5521,5522, 666,1003,3023,1022,3634,4361,5523,4716,1814,2257, # 4032
301
+ 574,3901,1603, 295,1535, 705,3902,4362, 283, 858, 417,5524,5525,3255,4717,4718, # 4048
302
+ 3071,1220,1890,1046,2281,2461,4107,1393,1599, 689,2575, 388,4363,5526,2491, 802, # 4064
303
+ 5527,2811,3903,2061,1405,2258,5528,4719,3904,2110,1052,1345,3256,1585,5529, 809, # 4080
304
+ 5530,5531,5532, 575,2739,3524, 956,1552,1469,1144,2328,5533,2329,1560,2462,3635, # 4096
305
+ 3257,4108, 616,2210,4364,3180,2183,2294,5534,1833,5535,3525,4720,5536,1319,3770, # 4112
306
+ 3771,1211,3636,1023,3258,1293,2812,5537,5538,5539,3905, 607,2311,3906, 762,2892, # 4128
307
+ 1439,4365,1360,4721,1485,3072,5540,4722,1038,4366,1450,2062,2648,4367,1379,4723, # 4144
308
+ 2593,5541,5542,4368,1352,1414,2330,2935,1172,5543,5544,3907,3908,4724,1798,1451, # 4160
309
+ 5545,5546,5547,5548,2936,4109,4110,2492,2351, 411,4111,4112,3637,3333,3124,4725, # 4176
310
+ 1561,2674,1452,4113,1375,5549,5550, 47,2974, 316,5551,1406,1591,2937,3181,5552, # 4192
311
+ 1025,2142,3125,3182, 354,2740, 884,2228,4369,2412, 508,3772, 726,3638, 996,2433, # 4208
312
+ 3639, 729,5553, 392,2194,1453,4114,4726,3773,5554,5555,2463,3640,2618,1675,2813, # 4224
313
+ 919,2352,2975,2353,1270,4727,4115, 73,5556,5557, 647,5558,3259,2856,2259,1550, # 4240
314
+ 1346,3024,5559,1332, 883,3526,5560,5561,5562,5563,3334,2775,5564,1212, 831,1347, # 4256
315
+ 4370,4728,2331,3909,1864,3073, 720,3910,4729,4730,3911,5565,4371,5566,5567,4731, # 4272
316
+ 5568,5569,1799,4732,3774,2619,4733,3641,1645,2376,4734,5570,2938, 669,2211,2675, # 4288
317
+ 2434,5571,2893,5572,5573,1028,3260,5574,4372,2413,5575,2260,1353,5576,5577,4735, # 4304
318
+ 3183, 518,5578,4116,5579,4373,1961,5580,2143,4374,5581,5582,3025,2354,2355,3912, # 4320
319
+ 516,1834,1454,4117,2708,4375,4736,2229,2620,1972,1129,3642,5583,2776,5584,2976, # 4336
320
+ 1422, 577,1470,3026,1524,3410,5585,5586, 432,4376,3074,3527,5587,2594,1455,2515, # 4352
321
+ 2230,1973,1175,5588,1020,2741,4118,3528,4737,5589,2742,5590,1743,1361,3075,3529, # 4368
322
+ 2649,4119,4377,4738,2295, 895, 924,4378,2171, 331,2247,3076, 166,1627,3077,1098, # 4384
323
+ 5591,1232,2894,2231,3411,4739, 657, 403,1196,2377, 542,3775,3412,1600,4379,3530, # 4400
324
+ 5592,4740,2777,3261, 576, 530,1362,4741,4742,2540,2676,3776,4120,5593, 842,3913, # 4416
325
+ 5594,2814,2032,1014,4121, 213,2709,3413, 665, 621,4380,5595,3777,2939,2435,5596, # 4432
326
+ 2436,3335,3643,3414,4743,4381,2541,4382,4744,3644,1682,4383,3531,1380,5597, 724, # 4448
327
+ 2282, 600,1670,5598,1337,1233,4745,3126,2248,5599,1621,4746,5600, 651,4384,5601, # 4464
328
+ 1612,4385,2621,5602,2857,5603,2743,2312,3078,5604, 716,2464,3079, 174,1255,2710, # 4480
329
+ 4122,3645, 548,1320,1398, 728,4123,1574,5605,1891,1197,3080,4124,5606,3081,3082, # 4496
330
+ 3778,3646,3779, 747,5607, 635,4386,4747,5608,5609,5610,4387,5611,5612,4748,5613, # 4512
331
+ 3415,4749,2437, 451,5614,3780,2542,2073,4388,2744,4389,4125,5615,1764,4750,5616, # 4528
332
+ 4390, 350,4751,2283,2395,2493,5617,4391,4126,2249,1434,4127, 488,4752, 458,4392, # 4544
333
+ 4128,3781, 771,1330,2396,3914,2576,3184,2160,2414,1553,2677,3185,4393,5618,2494, # 4560
334
+ 2895,2622,1720,2711,4394,3416,4753,5619,2543,4395,5620,3262,4396,2778,5621,2016, # 4576
335
+ 2745,5622,1155,1017,3782,3915,5623,3336,2313, 201,1865,4397,1430,5624,4129,5625, # 4592
336
+ 5626,5627,5628,5629,4398,1604,5630, 414,1866, 371,2595,4754,4755,3532,2017,3127, # 4608
337
+ 4756,1708, 960,4399, 887, 389,2172,1536,1663,1721,5631,2232,4130,2356,2940,1580, # 4624
338
+ 5632,5633,1744,4757,2544,4758,4759,5634,4760,5635,2074,5636,4761,3647,3417,2896, # 4640
339
+ 4400,5637,4401,2650,3418,2815, 673,2712,2465, 709,3533,4131,3648,4402,5638,1148, # 4656
340
+ 502, 634,5639,5640,1204,4762,3649,1575,4763,2623,3783,5641,3784,3128, 948,3263, # 4672
341
+ 121,1745,3916,1110,5642,4403,3083,2516,3027,4132,3785,1151,1771,3917,1488,4133, # 4688
342
+ 1987,5643,2438,3534,5644,5645,2094,5646,4404,3918,1213,1407,2816, 531,2746,2545, # 4704
343
+ 3264,1011,1537,4764,2779,4405,3129,1061,5647,3786,3787,1867,2897,5648,2018, 120, # 4720
344
+ 4406,4407,2063,3650,3265,2314,3919,2678,3419,1955,4765,4134,5649,3535,1047,2713, # 4736
345
+ 1266,5650,1368,4766,2858, 649,3420,3920,2546,2747,1102,2859,2679,5651,5652,2000, # 4752
346
+ 5653,1111,3651,2977,5654,2495,3921,3652,2817,1855,3421,3788,5655,5656,3422,2415, # 4768
347
+ 2898,3337,3266,3653,5657,2577,5658,3654,2818,4135,1460, 856,5659,3655,5660,2899, # 4784
348
+ 2978,5661,2900,3922,5662,4408, 632,2517, 875,3923,1697,3924,2296,5663,5664,4767, # 4800
349
+ 3028,1239, 580,4768,4409,5665, 914, 936,2075,1190,4136,1039,2124,5666,5667,5668, # 4816
350
+ 5669,3423,1473,5670,1354,4410,3925,4769,2173,3084,4137, 915,3338,4411,4412,3339, # 4832
351
+ 1605,1835,5671,2748, 398,3656,4413,3926,4138, 328,1913,2860,4139,3927,1331,4414, # 4848
352
+ 3029, 937,4415,5672,3657,4140,4141,3424,2161,4770,3425, 524, 742, 538,3085,1012, # 4864
353
+ 5673,5674,3928,2466,5675, 658,1103, 225,3929,5676,5677,4771,5678,4772,5679,3267, # 4880
354
+ 1243,5680,4142, 963,2250,4773,5681,2714,3658,3186,5682,5683,2596,2332,5684,4774, # 4896
355
+ 5685,5686,5687,3536, 957,3426,2547,2033,1931,2941,2467, 870,2019,3659,1746,2780, # 4912
356
+ 2781,2439,2468,5688,3930,5689,3789,3130,3790,3537,3427,3791,5690,1179,3086,5691, # 4928
357
+ 3187,2378,4416,3792,2548,3188,3131,2749,4143,5692,3428,1556,2549,2297, 977,2901, # 4944
358
+ 2034,4144,1205,3429,5693,1765,3430,3189,2125,1271, 714,1689,4775,3538,5694,2333, # 4960
359
+ 3931, 533,4417,3660,2184, 617,5695,2469,3340,3539,2315,5696,5697,3190,5698,5699, # 4976
360
+ 3932,1988, 618, 427,2651,3540,3431,5700,5701,1244,1690,5702,2819,4418,4776,5703, # 4992
361
+ 3541,4777,5704,2284,1576, 473,3661,4419,3432, 972,5705,3662,5706,3087,5707,5708, # 5008
362
+ 4778,4779,5709,3793,4145,4146,5710, 153,4780, 356,5711,1892,2902,4420,2144, 408, # 5024
363
+ 803,2357,5712,3933,5713,4421,1646,2578,2518,4781,4782,3934,5714,3935,4422,5715, # 5040
364
+ 2416,3433, 752,5716,5717,1962,3341,2979,5718, 746,3030,2470,4783,4423,3794, 698, # 5056
365
+ 4784,1893,4424,3663,2550,4785,3664,3936,5719,3191,3434,5720,1824,1302,4147,2715, # 5072
366
+ 3937,1974,4425,5721,4426,3192, 823,1303,1288,1236,2861,3542,4148,3435, 774,3938, # 5088
367
+ 5722,1581,4786,1304,2862,3939,4787,5723,2440,2162,1083,3268,4427,4149,4428, 344, # 5104
368
+ 1173, 288,2316, 454,1683,5724,5725,1461,4788,4150,2597,5726,5727,4789, 985, 894, # 5120
369
+ 5728,3436,3193,5729,1914,2942,3795,1989,5730,2111,1975,5731,4151,5732,2579,1194, # 5136
370
+ 425,5733,4790,3194,1245,3796,4429,5734,5735,2863,5736, 636,4791,1856,3940, 760, # 5152
371
+ 1800,5737,4430,2212,1508,4792,4152,1894,1684,2298,5738,5739,4793,4431,4432,2213, # 5168
372
+ 479,5740,5741, 832,5742,4153,2496,5743,2980,2497,3797, 990,3132, 627,1815,2652, # 5184
373
+ 4433,1582,4434,2126,2112,3543,4794,5744, 799,4435,3195,5745,4795,2113,1737,3031, # 5200
374
+ 1018, 543, 754,4436,3342,1676,4796,4797,4154,4798,1489,5746,3544,5747,2624,2903, # 5216
375
+ 4155,5748,5749,2981,5750,5751,5752,5753,3196,4799,4800,2185,1722,5754,3269,3270, # 5232
376
+ 1843,3665,1715, 481, 365,1976,1857,5755,5756,1963,2498,4801,5757,2127,3666,3271, # 5248
377
+ 433,1895,2064,2076,5758, 602,2750,5759,5760,5761,5762,5763,3032,1628,3437,5764, # 5264
378
+ 3197,4802,4156,2904,4803,2519,5765,2551,2782,5766,5767,5768,3343,4804,2905,5769, # 5280
379
+ 4805,5770,2864,4806,4807,1221,2982,4157,2520,5771,5772,5773,1868,1990,5774,5775, # 5296
380
+ 5776,1896,5777,5778,4808,1897,4158, 318,5779,2095,4159,4437,5780,5781, 485,5782, # 5312
381
+ 938,3941, 553,2680, 116,5783,3942,3667,5784,3545,2681,2783,3438,3344,2820,5785, # 5328
382
+ 3668,2943,4160,1747,2944,2983,5786,5787, 207,5788,4809,5789,4810,2521,5790,3033, # 5344
383
+ 890,3669,3943,5791,1878,3798,3439,5792,2186,2358,3440,1652,5793,5794,5795, 941, # 5360
384
+ 2299, 208,3546,4161,2020, 330,4438,3944,2906,2499,3799,4439,4811,5796,5797,5798, # 5376
385
+ )
386
+ # fmt: on
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/big5prober.py ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Communicator client code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from .chardistribution import Big5DistributionAnalysis
29
+ from .codingstatemachine import CodingStateMachine
30
+ from .mbcharsetprober import MultiByteCharSetProber
31
+ from .mbcssm import BIG5_SM_MODEL
32
+
33
+
34
+ class Big5Prober(MultiByteCharSetProber):
35
+ def __init__(self) -> None:
36
+ super().__init__()
37
+ self.coding_sm = CodingStateMachine(BIG5_SM_MODEL)
38
+ self.distribution_analyzer = Big5DistributionAnalysis()
39
+ self.reset()
40
+
41
+ @property
42
+ def charset_name(self) -> str:
43
+ return "Big5"
44
+
45
+ @property
46
+ def language(self) -> str:
47
+ return "Chinese"
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/chardistribution.py ADDED
@@ -0,0 +1,261 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Communicator client code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from typing import Tuple, Union
29
+
30
+ from .big5freq import (
31
+ BIG5_CHAR_TO_FREQ_ORDER,
32
+ BIG5_TABLE_SIZE,
33
+ BIG5_TYPICAL_DISTRIBUTION_RATIO,
34
+ )
35
+ from .euckrfreq import (
36
+ EUCKR_CHAR_TO_FREQ_ORDER,
37
+ EUCKR_TABLE_SIZE,
38
+ EUCKR_TYPICAL_DISTRIBUTION_RATIO,
39
+ )
40
+ from .euctwfreq import (
41
+ EUCTW_CHAR_TO_FREQ_ORDER,
42
+ EUCTW_TABLE_SIZE,
43
+ EUCTW_TYPICAL_DISTRIBUTION_RATIO,
44
+ )
45
+ from .gb2312freq import (
46
+ GB2312_CHAR_TO_FREQ_ORDER,
47
+ GB2312_TABLE_SIZE,
48
+ GB2312_TYPICAL_DISTRIBUTION_RATIO,
49
+ )
50
+ from .jisfreq import (
51
+ JIS_CHAR_TO_FREQ_ORDER,
52
+ JIS_TABLE_SIZE,
53
+ JIS_TYPICAL_DISTRIBUTION_RATIO,
54
+ )
55
+ from .johabfreq import JOHAB_TO_EUCKR_ORDER_TABLE
56
+
57
+
58
+ class CharDistributionAnalysis:
59
+ ENOUGH_DATA_THRESHOLD = 1024
60
+ SURE_YES = 0.99
61
+ SURE_NO = 0.01
62
+ MINIMUM_DATA_THRESHOLD = 3
63
+
64
+ def __init__(self) -> None:
65
+ # Mapping table to get frequency order from char order (get from
66
+ # GetOrder())
67
+ self._char_to_freq_order: Tuple[int, ...] = tuple()
68
+ self._table_size = 0 # Size of above table
69
+ # This is a constant value which varies from language to language,
70
+ # used in calculating confidence. See
71
+ # http://www.mozilla.org/projects/intl/UniversalCharsetDetection.html
72
+ # for further detail.
73
+ self.typical_distribution_ratio = 0.0
74
+ self._done = False
75
+ self._total_chars = 0
76
+ self._freq_chars = 0
77
+ self.reset()
78
+
79
+ def reset(self) -> None:
80
+ """reset analyser, clear any state"""
81
+ # If this flag is set to True, detection is done and conclusion has
82
+ # been made
83
+ self._done = False
84
+ self._total_chars = 0 # Total characters encountered
85
+ # The number of characters whose frequency order is less than 512
86
+ self._freq_chars = 0
87
+
88
+ def feed(self, char: Union[bytes, bytearray], char_len: int) -> None:
89
+ """feed a character with known length"""
90
+ if char_len == 2:
91
+ # we only care about 2-bytes character in our distribution analysis
92
+ order = self.get_order(char)
93
+ else:
94
+ order = -1
95
+ if order >= 0:
96
+ self._total_chars += 1
97
+ # order is valid
98
+ if order < self._table_size:
99
+ if 512 > self._char_to_freq_order[order]:
100
+ self._freq_chars += 1
101
+
102
+ def get_confidence(self) -> float:
103
+ """return confidence based on existing data"""
104
+ # if we didn't receive any character in our consideration range,
105
+ # return negative answer
106
+ if self._total_chars <= 0 or self._freq_chars <= self.MINIMUM_DATA_THRESHOLD:
107
+ return self.SURE_NO
108
+
109
+ if self._total_chars != self._freq_chars:
110
+ r = self._freq_chars / (
111
+ (self._total_chars - self._freq_chars) * self.typical_distribution_ratio
112
+ )
113
+ if r < self.SURE_YES:
114
+ return r
115
+
116
+ # normalize confidence (we don't want to be 100% sure)
117
+ return self.SURE_YES
118
+
119
+ def got_enough_data(self) -> bool:
120
+ # It is not necessary to receive all data to draw conclusion.
121
+ # For charset detection, certain amount of data is enough
122
+ return self._total_chars > self.ENOUGH_DATA_THRESHOLD
123
+
124
+ def get_order(self, _: Union[bytes, bytearray]) -> int:
125
+ # We do not handle characters based on the original encoding string,
126
+ # but convert this encoding string to a number, here called order.
127
+ # This allows multiple encodings of a language to share one frequency
128
+ # table.
129
+ return -1
130
+
131
+
132
+ class EUCTWDistributionAnalysis(CharDistributionAnalysis):
133
+ def __init__(self) -> None:
134
+ super().__init__()
135
+ self._char_to_freq_order = EUCTW_CHAR_TO_FREQ_ORDER
136
+ self._table_size = EUCTW_TABLE_SIZE
137
+ self.typical_distribution_ratio = EUCTW_TYPICAL_DISTRIBUTION_RATIO
138
+
139
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> int:
140
+ # for euc-TW encoding, we are interested
141
+ # first byte range: 0xc4 -- 0xfe
142
+ # second byte range: 0xa1 -- 0xfe
143
+ # no validation needed here. State machine has done that
144
+ first_char = byte_str[0]
145
+ if first_char >= 0xC4:
146
+ return 94 * (first_char - 0xC4) + byte_str[1] - 0xA1
147
+ return -1
148
+
149
+
150
+ class EUCKRDistributionAnalysis(CharDistributionAnalysis):
151
+ def __init__(self) -> None:
152
+ super().__init__()
153
+ self._char_to_freq_order = EUCKR_CHAR_TO_FREQ_ORDER
154
+ self._table_size = EUCKR_TABLE_SIZE
155
+ self.typical_distribution_ratio = EUCKR_TYPICAL_DISTRIBUTION_RATIO
156
+
157
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> int:
158
+ # for euc-KR encoding, we are interested
159
+ # first byte range: 0xb0 -- 0xfe
160
+ # second byte range: 0xa1 -- 0xfe
161
+ # no validation needed here. State machine has done that
162
+ first_char = byte_str[0]
163
+ if first_char >= 0xB0:
164
+ return 94 * (first_char - 0xB0) + byte_str[1] - 0xA1
165
+ return -1
166
+
167
+
168
+ class JOHABDistributionAnalysis(CharDistributionAnalysis):
169
+ def __init__(self) -> None:
170
+ super().__init__()
171
+ self._char_to_freq_order = EUCKR_CHAR_TO_FREQ_ORDER
172
+ self._table_size = EUCKR_TABLE_SIZE
173
+ self.typical_distribution_ratio = EUCKR_TYPICAL_DISTRIBUTION_RATIO
174
+
175
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> int:
176
+ first_char = byte_str[0]
177
+ if 0x88 <= first_char < 0xD4:
178
+ code = first_char * 256 + byte_str[1]
179
+ return JOHAB_TO_EUCKR_ORDER_TABLE.get(code, -1)
180
+ return -1
181
+
182
+
183
+ class GB2312DistributionAnalysis(CharDistributionAnalysis):
184
+ def __init__(self) -> None:
185
+ super().__init__()
186
+ self._char_to_freq_order = GB2312_CHAR_TO_FREQ_ORDER
187
+ self._table_size = GB2312_TABLE_SIZE
188
+ self.typical_distribution_ratio = GB2312_TYPICAL_DISTRIBUTION_RATIO
189
+
190
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> int:
191
+ # for GB2312 encoding, we are interested
192
+ # first byte range: 0xb0 -- 0xfe
193
+ # second byte range: 0xa1 -- 0xfe
194
+ # no validation needed here. State machine has done that
195
+ first_char, second_char = byte_str[0], byte_str[1]
196
+ if (first_char >= 0xB0) and (second_char >= 0xA1):
197
+ return 94 * (first_char - 0xB0) + second_char - 0xA1
198
+ return -1
199
+
200
+
201
+ class Big5DistributionAnalysis(CharDistributionAnalysis):
202
+ def __init__(self) -> None:
203
+ super().__init__()
204
+ self._char_to_freq_order = BIG5_CHAR_TO_FREQ_ORDER
205
+ self._table_size = BIG5_TABLE_SIZE
206
+ self.typical_distribution_ratio = BIG5_TYPICAL_DISTRIBUTION_RATIO
207
+
208
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> int:
209
+ # for big5 encoding, we are interested
210
+ # first byte range: 0xa4 -- 0xfe
211
+ # second byte range: 0x40 -- 0x7e , 0xa1 -- 0xfe
212
+ # no validation needed here. State machine has done that
213
+ first_char, second_char = byte_str[0], byte_str[1]
214
+ if first_char >= 0xA4:
215
+ if second_char >= 0xA1:
216
+ return 157 * (first_char - 0xA4) + second_char - 0xA1 + 63
217
+ return 157 * (first_char - 0xA4) + second_char - 0x40
218
+ return -1
219
+
220
+
221
+ class SJISDistributionAnalysis(CharDistributionAnalysis):
222
+ def __init__(self) -> None:
223
+ super().__init__()
224
+ self._char_to_freq_order = JIS_CHAR_TO_FREQ_ORDER
225
+ self._table_size = JIS_TABLE_SIZE
226
+ self.typical_distribution_ratio = JIS_TYPICAL_DISTRIBUTION_RATIO
227
+
228
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> int:
229
+ # for sjis encoding, we are interested
230
+ # first byte range: 0x81 -- 0x9f , 0xe0 -- 0xfe
231
+ # second byte range: 0x40 -- 0x7e, 0x81 -- oxfe
232
+ # no validation needed here. State machine has done that
233
+ first_char, second_char = byte_str[0], byte_str[1]
234
+ if 0x81 <= first_char <= 0x9F:
235
+ order = 188 * (first_char - 0x81)
236
+ elif 0xE0 <= first_char <= 0xEF:
237
+ order = 188 * (first_char - 0xE0 + 31)
238
+ else:
239
+ return -1
240
+ order = order + second_char - 0x40
241
+ if second_char > 0x7F:
242
+ order = -1
243
+ return order
244
+
245
+
246
+ class EUCJPDistributionAnalysis(CharDistributionAnalysis):
247
+ def __init__(self) -> None:
248
+ super().__init__()
249
+ self._char_to_freq_order = JIS_CHAR_TO_FREQ_ORDER
250
+ self._table_size = JIS_TABLE_SIZE
251
+ self.typical_distribution_ratio = JIS_TYPICAL_DISTRIBUTION_RATIO
252
+
253
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> int:
254
+ # for euc-JP encoding, we are interested
255
+ # first byte range: 0xa0 -- 0xfe
256
+ # second byte range: 0xa1 -- 0xfe
257
+ # no validation needed here. State machine has done that
258
+ char = byte_str[0]
259
+ if char >= 0xA0:
260
+ return 94 * (char - 0xA1) + byte_str[1] - 0xA1
261
+ return -1
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/charsetgroupprober.py ADDED
@@ -0,0 +1,106 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Communicator client code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from typing import List, Optional, Union
29
+
30
+ from .charsetprober import CharSetProber
31
+ from .enums import LanguageFilter, ProbingState
32
+
33
+
34
+ class CharSetGroupProber(CharSetProber):
35
+ def __init__(self, lang_filter: LanguageFilter = LanguageFilter.NONE) -> None:
36
+ super().__init__(lang_filter=lang_filter)
37
+ self._active_num = 0
38
+ self.probers: List[CharSetProber] = []
39
+ self._best_guess_prober: Optional[CharSetProber] = None
40
+
41
+ def reset(self) -> None:
42
+ super().reset()
43
+ self._active_num = 0
44
+ for prober in self.probers:
45
+ prober.reset()
46
+ prober.active = True
47
+ self._active_num += 1
48
+ self._best_guess_prober = None
49
+
50
+ @property
51
+ def charset_name(self) -> Optional[str]:
52
+ if not self._best_guess_prober:
53
+ self.get_confidence()
54
+ if not self._best_guess_prober:
55
+ return None
56
+ return self._best_guess_prober.charset_name
57
+
58
+ @property
59
+ def language(self) -> Optional[str]:
60
+ if not self._best_guess_prober:
61
+ self.get_confidence()
62
+ if not self._best_guess_prober:
63
+ return None
64
+ return self._best_guess_prober.language
65
+
66
+ def feed(self, byte_str: Union[bytes, bytearray]) -> ProbingState:
67
+ for prober in self.probers:
68
+ if not prober.active:
69
+ continue
70
+ state = prober.feed(byte_str)
71
+ if not state:
72
+ continue
73
+ if state == ProbingState.FOUND_IT:
74
+ self._best_guess_prober = prober
75
+ self._state = ProbingState.FOUND_IT
76
+ return self.state
77
+ if state == ProbingState.NOT_ME:
78
+ prober.active = False
79
+ self._active_num -= 1
80
+ if self._active_num <= 0:
81
+ self._state = ProbingState.NOT_ME
82
+ return self.state
83
+ return self.state
84
+
85
+ def get_confidence(self) -> float:
86
+ state = self.state
87
+ if state == ProbingState.FOUND_IT:
88
+ return 0.99
89
+ if state == ProbingState.NOT_ME:
90
+ return 0.01
91
+ best_conf = 0.0
92
+ self._best_guess_prober = None
93
+ for prober in self.probers:
94
+ if not prober.active:
95
+ self.logger.debug("%s not active", prober.charset_name)
96
+ continue
97
+ conf = prober.get_confidence()
98
+ self.logger.debug(
99
+ "%s %s confidence = %s", prober.charset_name, prober.language, conf
100
+ )
101
+ if best_conf < conf:
102
+ best_conf = conf
103
+ self._best_guess_prober = prober
104
+ if not self._best_guess_prober:
105
+ return 0.0
106
+ return best_conf
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/codingstatemachine.py ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ import logging
29
+
30
+ from .codingstatemachinedict import CodingStateMachineDict
31
+ from .enums import MachineState
32
+
33
+
34
+ class CodingStateMachine:
35
+ """
36
+ A state machine to verify a byte sequence for a particular encoding. For
37
+ each byte the detector receives, it will feed that byte to every active
38
+ state machine available, one byte at a time. The state machine changes its
39
+ state based on its previous state and the byte it receives. There are 3
40
+ states in a state machine that are of interest to an auto-detector:
41
+
42
+ START state: This is the state to start with, or a legal byte sequence
43
+ (i.e. a valid code point) for character has been identified.
44
+
45
+ ME state: This indicates that the state machine identified a byte sequence
46
+ that is specific to the charset it is designed for and that
47
+ there is no other possible encoding which can contain this byte
48
+ sequence. This will to lead to an immediate positive answer for
49
+ the detector.
50
+
51
+ ERROR state: This indicates the state machine identified an illegal byte
52
+ sequence for that encoding. This will lead to an immediate
53
+ negative answer for this encoding. Detector will exclude this
54
+ encoding from consideration from here on.
55
+ """
56
+
57
+ def __init__(self, sm: CodingStateMachineDict) -> None:
58
+ self._model = sm
59
+ self._curr_byte_pos = 0
60
+ self._curr_char_len = 0
61
+ self._curr_state = MachineState.START
62
+ self.active = True
63
+ self.logger = logging.getLogger(__name__)
64
+ self.reset()
65
+
66
+ def reset(self) -> None:
67
+ self._curr_state = MachineState.START
68
+
69
+ def next_state(self, c: int) -> int:
70
+ # for each byte we get its class
71
+ # if it is first byte, we also get byte length
72
+ byte_class = self._model["class_table"][c]
73
+ if self._curr_state == MachineState.START:
74
+ self._curr_byte_pos = 0
75
+ self._curr_char_len = self._model["char_len_table"][byte_class]
76
+ # from byte's class and state_table, we get its next state
77
+ curr_state = self._curr_state * self._model["class_factor"] + byte_class
78
+ self._curr_state = self._model["state_table"][curr_state]
79
+ self._curr_byte_pos += 1
80
+ return self._curr_state
81
+
82
+ def get_current_charlen(self) -> int:
83
+ return self._curr_char_len
84
+
85
+ def get_coding_state_machine(self) -> str:
86
+ return self._model["name"]
87
+
88
+ @property
89
+ def language(self) -> str:
90
+ return self._model["language"]
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/cp949prober.py ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from .chardistribution import EUCKRDistributionAnalysis
29
+ from .codingstatemachine import CodingStateMachine
30
+ from .mbcharsetprober import MultiByteCharSetProber
31
+ from .mbcssm import CP949_SM_MODEL
32
+
33
+
34
+ class CP949Prober(MultiByteCharSetProber):
35
+ def __init__(self) -> None:
36
+ super().__init__()
37
+ self.coding_sm = CodingStateMachine(CP949_SM_MODEL)
38
+ # NOTE: CP949 is a superset of EUC-KR, so the distribution should be
39
+ # not different.
40
+ self.distribution_analyzer = EUCKRDistributionAnalysis()
41
+ self.reset()
42
+
43
+ @property
44
+ def charset_name(self) -> str:
45
+ return "CP949"
46
+
47
+ @property
48
+ def language(self) -> str:
49
+ return "Korean"
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/escprober.py ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from typing import Optional, Union
29
+
30
+ from .charsetprober import CharSetProber
31
+ from .codingstatemachine import CodingStateMachine
32
+ from .enums import LanguageFilter, MachineState, ProbingState
33
+ from .escsm import (
34
+ HZ_SM_MODEL,
35
+ ISO2022CN_SM_MODEL,
36
+ ISO2022JP_SM_MODEL,
37
+ ISO2022KR_SM_MODEL,
38
+ )
39
+
40
+
41
+ class EscCharSetProber(CharSetProber):
42
+ """
43
+ This CharSetProber uses a "code scheme" approach for detecting encodings,
44
+ whereby easily recognizable escape or shift sequences are relied on to
45
+ identify these encodings.
46
+ """
47
+
48
+ def __init__(self, lang_filter: LanguageFilter = LanguageFilter.NONE) -> None:
49
+ super().__init__(lang_filter=lang_filter)
50
+ self.coding_sm = []
51
+ if self.lang_filter & LanguageFilter.CHINESE_SIMPLIFIED:
52
+ self.coding_sm.append(CodingStateMachine(HZ_SM_MODEL))
53
+ self.coding_sm.append(CodingStateMachine(ISO2022CN_SM_MODEL))
54
+ if self.lang_filter & LanguageFilter.JAPANESE:
55
+ self.coding_sm.append(CodingStateMachine(ISO2022JP_SM_MODEL))
56
+ if self.lang_filter & LanguageFilter.KOREAN:
57
+ self.coding_sm.append(CodingStateMachine(ISO2022KR_SM_MODEL))
58
+ self.active_sm_count = 0
59
+ self._detected_charset: Optional[str] = None
60
+ self._detected_language: Optional[str] = None
61
+ self._state = ProbingState.DETECTING
62
+ self.reset()
63
+
64
+ def reset(self) -> None:
65
+ super().reset()
66
+ for coding_sm in self.coding_sm:
67
+ coding_sm.active = True
68
+ coding_sm.reset()
69
+ self.active_sm_count = len(self.coding_sm)
70
+ self._detected_charset = None
71
+ self._detected_language = None
72
+
73
+ @property
74
+ def charset_name(self) -> Optional[str]:
75
+ return self._detected_charset
76
+
77
+ @property
78
+ def language(self) -> Optional[str]:
79
+ return self._detected_language
80
+
81
+ def get_confidence(self) -> float:
82
+ return 0.99 if self._detected_charset else 0.00
83
+
84
+ def feed(self, byte_str: Union[bytes, bytearray]) -> ProbingState:
85
+ for c in byte_str:
86
+ for coding_sm in self.coding_sm:
87
+ if not coding_sm.active:
88
+ continue
89
+ coding_state = coding_sm.next_state(c)
90
+ if coding_state == MachineState.ERROR:
91
+ coding_sm.active = False
92
+ self.active_sm_count -= 1
93
+ if self.active_sm_count <= 0:
94
+ self._state = ProbingState.NOT_ME
95
+ return self.state
96
+ elif coding_state == MachineState.ITS_ME:
97
+ self._state = ProbingState.FOUND_IT
98
+ self._detected_charset = coding_sm.get_coding_state_machine()
99
+ self._detected_language = coding_sm.language
100
+ return self.state
101
+
102
+ return self.state
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/escsm.py ADDED
@@ -0,0 +1,261 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from .codingstatemachinedict import CodingStateMachineDict
29
+ from .enums import MachineState
30
+
31
+ # fmt: off
32
+ HZ_CLS = (
33
+ 1, 0, 0, 0, 0, 0, 0, 0, # 00 - 07
34
+ 0, 0, 0, 0, 0, 0, 0, 0, # 08 - 0f
35
+ 0, 0, 0, 0, 0, 0, 0, 0, # 10 - 17
36
+ 0, 0, 0, 1, 0, 0, 0, 0, # 18 - 1f
37
+ 0, 0, 0, 0, 0, 0, 0, 0, # 20 - 27
38
+ 0, 0, 0, 0, 0, 0, 0, 0, # 28 - 2f
39
+ 0, 0, 0, 0, 0, 0, 0, 0, # 30 - 37
40
+ 0, 0, 0, 0, 0, 0, 0, 0, # 38 - 3f
41
+ 0, 0, 0, 0, 0, 0, 0, 0, # 40 - 47
42
+ 0, 0, 0, 0, 0, 0, 0, 0, # 48 - 4f
43
+ 0, 0, 0, 0, 0, 0, 0, 0, # 50 - 57
44
+ 0, 0, 0, 0, 0, 0, 0, 0, # 58 - 5f
45
+ 0, 0, 0, 0, 0, 0, 0, 0, # 60 - 67
46
+ 0, 0, 0, 0, 0, 0, 0, 0, # 68 - 6f
47
+ 0, 0, 0, 0, 0, 0, 0, 0, # 70 - 77
48
+ 0, 0, 0, 4, 0, 5, 2, 0, # 78 - 7f
49
+ 1, 1, 1, 1, 1, 1, 1, 1, # 80 - 87
50
+ 1, 1, 1, 1, 1, 1, 1, 1, # 88 - 8f
51
+ 1, 1, 1, 1, 1, 1, 1, 1, # 90 - 97
52
+ 1, 1, 1, 1, 1, 1, 1, 1, # 98 - 9f
53
+ 1, 1, 1, 1, 1, 1, 1, 1, # a0 - a7
54
+ 1, 1, 1, 1, 1, 1, 1, 1, # a8 - af
55
+ 1, 1, 1, 1, 1, 1, 1, 1, # b0 - b7
56
+ 1, 1, 1, 1, 1, 1, 1, 1, # b8 - bf
57
+ 1, 1, 1, 1, 1, 1, 1, 1, # c0 - c7
58
+ 1, 1, 1, 1, 1, 1, 1, 1, # c8 - cf
59
+ 1, 1, 1, 1, 1, 1, 1, 1, # d0 - d7
60
+ 1, 1, 1, 1, 1, 1, 1, 1, # d8 - df
61
+ 1, 1, 1, 1, 1, 1, 1, 1, # e0 - e7
62
+ 1, 1, 1, 1, 1, 1, 1, 1, # e8 - ef
63
+ 1, 1, 1, 1, 1, 1, 1, 1, # f0 - f7
64
+ 1, 1, 1, 1, 1, 1, 1, 1, # f8 - ff
65
+ )
66
+
67
+ HZ_ST = (
68
+ MachineState.START, MachineState.ERROR, 3, MachineState.START, MachineState.START, MachineState.START, MachineState.ERROR, MachineState.ERROR, # 00-07
69
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, # 08-0f
70
+ MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ERROR, MachineState.ERROR, MachineState.START, MachineState.START, 4, MachineState.ERROR, # 10-17
71
+ 5, MachineState.ERROR, 6, MachineState.ERROR, 5, 5, 4, MachineState.ERROR, # 18-1f
72
+ 4, MachineState.ERROR, 4, 4, 4, MachineState.ERROR, 4, MachineState.ERROR, # 20-27
73
+ 4, MachineState.ITS_ME, MachineState.START, MachineState.START, MachineState.START, MachineState.START, MachineState.START, MachineState.START, # 28-2f
74
+ )
75
+ # fmt: on
76
+
77
+ HZ_CHAR_LEN_TABLE = (0, 0, 0, 0, 0, 0)
78
+
79
+ HZ_SM_MODEL: CodingStateMachineDict = {
80
+ "class_table": HZ_CLS,
81
+ "class_factor": 6,
82
+ "state_table": HZ_ST,
83
+ "char_len_table": HZ_CHAR_LEN_TABLE,
84
+ "name": "HZ-GB-2312",
85
+ "language": "Chinese",
86
+ }
87
+
88
+ # fmt: off
89
+ ISO2022CN_CLS = (
90
+ 2, 0, 0, 0, 0, 0, 0, 0, # 00 - 07
91
+ 0, 0, 0, 0, 0, 0, 0, 0, # 08 - 0f
92
+ 0, 0, 0, 0, 0, 0, 0, 0, # 10 - 17
93
+ 0, 0, 0, 1, 0, 0, 0, 0, # 18 - 1f
94
+ 0, 0, 0, 0, 0, 0, 0, 0, # 20 - 27
95
+ 0, 3, 0, 0, 0, 0, 0, 0, # 28 - 2f
96
+ 0, 0, 0, 0, 0, 0, 0, 0, # 30 - 37
97
+ 0, 0, 0, 0, 0, 0, 0, 0, # 38 - 3f
98
+ 0, 0, 0, 4, 0, 0, 0, 0, # 40 - 47
99
+ 0, 0, 0, 0, 0, 0, 0, 0, # 48 - 4f
100
+ 0, 0, 0, 0, 0, 0, 0, 0, # 50 - 57
101
+ 0, 0, 0, 0, 0, 0, 0, 0, # 58 - 5f
102
+ 0, 0, 0, 0, 0, 0, 0, 0, # 60 - 67
103
+ 0, 0, 0, 0, 0, 0, 0, 0, # 68 - 6f
104
+ 0, 0, 0, 0, 0, 0, 0, 0, # 70 - 77
105
+ 0, 0, 0, 0, 0, 0, 0, 0, # 78 - 7f
106
+ 2, 2, 2, 2, 2, 2, 2, 2, # 80 - 87
107
+ 2, 2, 2, 2, 2, 2, 2, 2, # 88 - 8f
108
+ 2, 2, 2, 2, 2, 2, 2, 2, # 90 - 97
109
+ 2, 2, 2, 2, 2, 2, 2, 2, # 98 - 9f
110
+ 2, 2, 2, 2, 2, 2, 2, 2, # a0 - a7
111
+ 2, 2, 2, 2, 2, 2, 2, 2, # a8 - af
112
+ 2, 2, 2, 2, 2, 2, 2, 2, # b0 - b7
113
+ 2, 2, 2, 2, 2, 2, 2, 2, # b8 - bf
114
+ 2, 2, 2, 2, 2, 2, 2, 2, # c0 - c7
115
+ 2, 2, 2, 2, 2, 2, 2, 2, # c8 - cf
116
+ 2, 2, 2, 2, 2, 2, 2, 2, # d0 - d7
117
+ 2, 2, 2, 2, 2, 2, 2, 2, # d8 - df
118
+ 2, 2, 2, 2, 2, 2, 2, 2, # e0 - e7
119
+ 2, 2, 2, 2, 2, 2, 2, 2, # e8 - ef
120
+ 2, 2, 2, 2, 2, 2, 2, 2, # f0 - f7
121
+ 2, 2, 2, 2, 2, 2, 2, 2, # f8 - ff
122
+ )
123
+
124
+ ISO2022CN_ST = (
125
+ MachineState.START, 3, MachineState.ERROR, MachineState.START, MachineState.START, MachineState.START, MachineState.START, MachineState.START, # 00-07
126
+ MachineState.START, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, # 08-0f
127
+ MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, # 10-17
128
+ MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, 4, MachineState.ERROR, # 18-1f
129
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, # 20-27
130
+ 5, 6, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, # 28-2f
131
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, # 30-37
132
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ERROR, MachineState.START, # 38-3f
133
+ )
134
+ # fmt: on
135
+
136
+ ISO2022CN_CHAR_LEN_TABLE = (0, 0, 0, 0, 0, 0, 0, 0, 0)
137
+
138
+ ISO2022CN_SM_MODEL: CodingStateMachineDict = {
139
+ "class_table": ISO2022CN_CLS,
140
+ "class_factor": 9,
141
+ "state_table": ISO2022CN_ST,
142
+ "char_len_table": ISO2022CN_CHAR_LEN_TABLE,
143
+ "name": "ISO-2022-CN",
144
+ "language": "Chinese",
145
+ }
146
+
147
+ # fmt: off
148
+ ISO2022JP_CLS = (
149
+ 2, 0, 0, 0, 0, 0, 0, 0, # 00 - 07
150
+ 0, 0, 0, 0, 0, 0, 2, 2, # 08 - 0f
151
+ 0, 0, 0, 0, 0, 0, 0, 0, # 10 - 17
152
+ 0, 0, 0, 1, 0, 0, 0, 0, # 18 - 1f
153
+ 0, 0, 0, 0, 7, 0, 0, 0, # 20 - 27
154
+ 3, 0, 0, 0, 0, 0, 0, 0, # 28 - 2f
155
+ 0, 0, 0, 0, 0, 0, 0, 0, # 30 - 37
156
+ 0, 0, 0, 0, 0, 0, 0, 0, # 38 - 3f
157
+ 6, 0, 4, 0, 8, 0, 0, 0, # 40 - 47
158
+ 0, 9, 5, 0, 0, 0, 0, 0, # 48 - 4f
159
+ 0, 0, 0, 0, 0, 0, 0, 0, # 50 - 57
160
+ 0, 0, 0, 0, 0, 0, 0, 0, # 58 - 5f
161
+ 0, 0, 0, 0, 0, 0, 0, 0, # 60 - 67
162
+ 0, 0, 0, 0, 0, 0, 0, 0, # 68 - 6f
163
+ 0, 0, 0, 0, 0, 0, 0, 0, # 70 - 77
164
+ 0, 0, 0, 0, 0, 0, 0, 0, # 78 - 7f
165
+ 2, 2, 2, 2, 2, 2, 2, 2, # 80 - 87
166
+ 2, 2, 2, 2, 2, 2, 2, 2, # 88 - 8f
167
+ 2, 2, 2, 2, 2, 2, 2, 2, # 90 - 97
168
+ 2, 2, 2, 2, 2, 2, 2, 2, # 98 - 9f
169
+ 2, 2, 2, 2, 2, 2, 2, 2, # a0 - a7
170
+ 2, 2, 2, 2, 2, 2, 2, 2, # a8 - af
171
+ 2, 2, 2, 2, 2, 2, 2, 2, # b0 - b7
172
+ 2, 2, 2, 2, 2, 2, 2, 2, # b8 - bf
173
+ 2, 2, 2, 2, 2, 2, 2, 2, # c0 - c7
174
+ 2, 2, 2, 2, 2, 2, 2, 2, # c8 - cf
175
+ 2, 2, 2, 2, 2, 2, 2, 2, # d0 - d7
176
+ 2, 2, 2, 2, 2, 2, 2, 2, # d8 - df
177
+ 2, 2, 2, 2, 2, 2, 2, 2, # e0 - e7
178
+ 2, 2, 2, 2, 2, 2, 2, 2, # e8 - ef
179
+ 2, 2, 2, 2, 2, 2, 2, 2, # f0 - f7
180
+ 2, 2, 2, 2, 2, 2, 2, 2, # f8 - ff
181
+ )
182
+
183
+ ISO2022JP_ST = (
184
+ MachineState.START, 3, MachineState.ERROR, MachineState.START, MachineState.START, MachineState.START, MachineState.START, MachineState.START, # 00-07
185
+ MachineState.START, MachineState.START, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, # 08-0f
186
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, # 10-17
187
+ MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ERROR, MachineState.ERROR, # 18-1f
188
+ MachineState.ERROR, 5, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, 4, MachineState.ERROR, MachineState.ERROR, # 20-27
189
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, 6, MachineState.ITS_ME, MachineState.ERROR, MachineState.ITS_ME, MachineState.ERROR, # 28-2f
190
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ITS_ME, # 30-37
191
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, # 38-3f
192
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ERROR, MachineState.START, MachineState.START, # 40-47
193
+ )
194
+ # fmt: on
195
+
196
+ ISO2022JP_CHAR_LEN_TABLE = (0, 0, 0, 0, 0, 0, 0, 0, 0, 0)
197
+
198
+ ISO2022JP_SM_MODEL: CodingStateMachineDict = {
199
+ "class_table": ISO2022JP_CLS,
200
+ "class_factor": 10,
201
+ "state_table": ISO2022JP_ST,
202
+ "char_len_table": ISO2022JP_CHAR_LEN_TABLE,
203
+ "name": "ISO-2022-JP",
204
+ "language": "Japanese",
205
+ }
206
+
207
+ # fmt: off
208
+ ISO2022KR_CLS = (
209
+ 2, 0, 0, 0, 0, 0, 0, 0, # 00 - 07
210
+ 0, 0, 0, 0, 0, 0, 0, 0, # 08 - 0f
211
+ 0, 0, 0, 0, 0, 0, 0, 0, # 10 - 17
212
+ 0, 0, 0, 1, 0, 0, 0, 0, # 18 - 1f
213
+ 0, 0, 0, 0, 3, 0, 0, 0, # 20 - 27
214
+ 0, 4, 0, 0, 0, 0, 0, 0, # 28 - 2f
215
+ 0, 0, 0, 0, 0, 0, 0, 0, # 30 - 37
216
+ 0, 0, 0, 0, 0, 0, 0, 0, # 38 - 3f
217
+ 0, 0, 0, 5, 0, 0, 0, 0, # 40 - 47
218
+ 0, 0, 0, 0, 0, 0, 0, 0, # 48 - 4f
219
+ 0, 0, 0, 0, 0, 0, 0, 0, # 50 - 57
220
+ 0, 0, 0, 0, 0, 0, 0, 0, # 58 - 5f
221
+ 0, 0, 0, 0, 0, 0, 0, 0, # 60 - 67
222
+ 0, 0, 0, 0, 0, 0, 0, 0, # 68 - 6f
223
+ 0, 0, 0, 0, 0, 0, 0, 0, # 70 - 77
224
+ 0, 0, 0, 0, 0, 0, 0, 0, # 78 - 7f
225
+ 2, 2, 2, 2, 2, 2, 2, 2, # 80 - 87
226
+ 2, 2, 2, 2, 2, 2, 2, 2, # 88 - 8f
227
+ 2, 2, 2, 2, 2, 2, 2, 2, # 90 - 97
228
+ 2, 2, 2, 2, 2, 2, 2, 2, # 98 - 9f
229
+ 2, 2, 2, 2, 2, 2, 2, 2, # a0 - a7
230
+ 2, 2, 2, 2, 2, 2, 2, 2, # a8 - af
231
+ 2, 2, 2, 2, 2, 2, 2, 2, # b0 - b7
232
+ 2, 2, 2, 2, 2, 2, 2, 2, # b8 - bf
233
+ 2, 2, 2, 2, 2, 2, 2, 2, # c0 - c7
234
+ 2, 2, 2, 2, 2, 2, 2, 2, # c8 - cf
235
+ 2, 2, 2, 2, 2, 2, 2, 2, # d0 - d7
236
+ 2, 2, 2, 2, 2, 2, 2, 2, # d8 - df
237
+ 2, 2, 2, 2, 2, 2, 2, 2, # e0 - e7
238
+ 2, 2, 2, 2, 2, 2, 2, 2, # e8 - ef
239
+ 2, 2, 2, 2, 2, 2, 2, 2, # f0 - f7
240
+ 2, 2, 2, 2, 2, 2, 2, 2, # f8 - ff
241
+ )
242
+
243
+ ISO2022KR_ST = (
244
+ MachineState.START, 3, MachineState.ERROR, MachineState.START, MachineState.START, MachineState.START, MachineState.ERROR, MachineState.ERROR, # 00-07
245
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ITS_ME, # 08-0f
246
+ MachineState.ITS_ME, MachineState.ITS_ME, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, 4, MachineState.ERROR, MachineState.ERROR, # 10-17
247
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, 5, MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, # 18-1f
248
+ MachineState.ERROR, MachineState.ERROR, MachineState.ERROR, MachineState.ITS_ME, MachineState.START, MachineState.START, MachineState.START, MachineState.START, # 20-27
249
+ )
250
+ # fmt: on
251
+
252
+ ISO2022KR_CHAR_LEN_TABLE = (0, 0, 0, 0, 0, 0)
253
+
254
+ ISO2022KR_SM_MODEL: CodingStateMachineDict = {
255
+ "class_table": ISO2022KR_CLS,
256
+ "class_factor": 6,
257
+ "state_table": ISO2022KR_ST,
258
+ "char_len_table": ISO2022KR_CHAR_LEN_TABLE,
259
+ "name": "ISO-2022-KR",
260
+ "language": "Korean",
261
+ }
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/eucjpprober.py ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from typing import Union
29
+
30
+ from .chardistribution import EUCJPDistributionAnalysis
31
+ from .codingstatemachine import CodingStateMachine
32
+ from .enums import MachineState, ProbingState
33
+ from .jpcntx import EUCJPContextAnalysis
34
+ from .mbcharsetprober import MultiByteCharSetProber
35
+ from .mbcssm import EUCJP_SM_MODEL
36
+
37
+
38
+ class EUCJPProber(MultiByteCharSetProber):
39
+ def __init__(self) -> None:
40
+ super().__init__()
41
+ self.coding_sm = CodingStateMachine(EUCJP_SM_MODEL)
42
+ self.distribution_analyzer = EUCJPDistributionAnalysis()
43
+ self.context_analyzer = EUCJPContextAnalysis()
44
+ self.reset()
45
+
46
+ def reset(self) -> None:
47
+ super().reset()
48
+ self.context_analyzer.reset()
49
+
50
+ @property
51
+ def charset_name(self) -> str:
52
+ return "EUC-JP"
53
+
54
+ @property
55
+ def language(self) -> str:
56
+ return "Japanese"
57
+
58
+ def feed(self, byte_str: Union[bytes, bytearray]) -> ProbingState:
59
+ assert self.coding_sm is not None
60
+ assert self.distribution_analyzer is not None
61
+
62
+ for i, byte in enumerate(byte_str):
63
+ # PY3K: byte_str is a byte array, so byte is an int, not a byte
64
+ coding_state = self.coding_sm.next_state(byte)
65
+ if coding_state == MachineState.ERROR:
66
+ self.logger.debug(
67
+ "%s %s prober hit error at byte %s",
68
+ self.charset_name,
69
+ self.language,
70
+ i,
71
+ )
72
+ self._state = ProbingState.NOT_ME
73
+ break
74
+ if coding_state == MachineState.ITS_ME:
75
+ self._state = ProbingState.FOUND_IT
76
+ break
77
+ if coding_state == MachineState.START:
78
+ char_len = self.coding_sm.get_current_charlen()
79
+ if i == 0:
80
+ self._last_char[1] = byte
81
+ self.context_analyzer.feed(self._last_char, char_len)
82
+ self.distribution_analyzer.feed(self._last_char, char_len)
83
+ else:
84
+ self.context_analyzer.feed(byte_str[i - 1 : i + 1], char_len)
85
+ self.distribution_analyzer.feed(byte_str[i - 1 : i + 1], char_len)
86
+
87
+ self._last_char[0] = byte_str[-1]
88
+
89
+ if self.state == ProbingState.DETECTING:
90
+ if self.context_analyzer.got_enough_data() and (
91
+ self.get_confidence() > self.SHORTCUT_THRESHOLD
92
+ ):
93
+ self._state = ProbingState.FOUND_IT
94
+
95
+ return self.state
96
+
97
+ def get_confidence(self) -> float:
98
+ assert self.distribution_analyzer is not None
99
+
100
+ context_conf = self.context_analyzer.get_confidence()
101
+ distrib_conf = self.distribution_analyzer.get_confidence()
102
+ return max(context_conf, distrib_conf)
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/euckrfreq.py ADDED
@@ -0,0 +1,196 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Communicator client code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ # Sampling from about 20M text materials include literature and computer technology
29
+
30
+ # 128 --> 0.79
31
+ # 256 --> 0.92
32
+ # 512 --> 0.986
33
+ # 1024 --> 0.99944
34
+ # 2048 --> 0.99999
35
+ #
36
+ # Idea Distribution Ratio = 0.98653 / (1-0.98653) = 73.24
37
+ # Random Distribution Ration = 512 / (2350-512) = 0.279.
38
+ #
39
+ # Typical Distribution Ratio
40
+
41
+ EUCKR_TYPICAL_DISTRIBUTION_RATIO = 6.0
42
+
43
+ EUCKR_TABLE_SIZE = 2352
44
+
45
+ # Char to FreqOrder table ,
46
+ # fmt: off
47
+ EUCKR_CHAR_TO_FREQ_ORDER = (
48
+ 13, 130, 120,1396, 481,1719,1720, 328, 609, 212,1721, 707, 400, 299,1722, 87,
49
+ 1397,1723, 104, 536,1117,1203,1724,1267, 685,1268, 508,1725,1726,1727,1728,1398,
50
+ 1399,1729,1730,1731, 141, 621, 326,1057, 368,1732, 267, 488, 20,1733,1269,1734,
51
+ 945,1400,1735, 47, 904,1270,1736,1737, 773, 248,1738, 409, 313, 786, 429,1739,
52
+ 116, 987, 813,1401, 683, 75,1204, 145,1740,1741,1742,1743, 16, 847, 667, 622,
53
+ 708,1744,1745,1746, 966, 787, 304, 129,1747, 60, 820, 123, 676,1748,1749,1750,
54
+ 1751, 617,1752, 626,1753,1754,1755,1756, 653,1757,1758,1759,1760,1761,1762, 856,
55
+ 344,1763,1764,1765,1766, 89, 401, 418, 806, 905, 848,1767,1768,1769, 946,1205,
56
+ 709,1770,1118,1771, 241,1772,1773,1774,1271,1775, 569,1776, 999,1777,1778,1779,
57
+ 1780, 337, 751,1058, 28, 628, 254,1781, 177, 906, 270, 349, 891,1079,1782, 19,
58
+ 1783, 379,1784, 315,1785, 629, 754,1402, 559,1786, 636, 203,1206,1787, 710, 567,
59
+ 1788, 935, 814,1789,1790,1207, 766, 528,1791,1792,1208,1793,1794,1795,1796,1797,
60
+ 1403,1798,1799, 533,1059,1404,1405,1156,1406, 936, 884,1080,1800, 351,1801,1802,
61
+ 1803,1804,1805, 801,1806,1807,1808,1119,1809,1157, 714, 474,1407,1810, 298, 899,
62
+ 885,1811,1120, 802,1158,1812, 892,1813,1814,1408, 659,1815,1816,1121,1817,1818,
63
+ 1819,1820,1821,1822, 319,1823, 594, 545,1824, 815, 937,1209,1825,1826, 573,1409,
64
+ 1022,1827,1210,1828,1829,1830,1831,1832,1833, 556, 722, 807,1122,1060,1834, 697,
65
+ 1835, 900, 557, 715,1836,1410, 540,1411, 752,1159, 294, 597,1211, 976, 803, 770,
66
+ 1412,1837,1838, 39, 794,1413, 358,1839, 371, 925,1840, 453, 661, 788, 531, 723,
67
+ 544,1023,1081, 869, 91,1841, 392, 430, 790, 602,1414, 677,1082, 457,1415,1416,
68
+ 1842,1843, 475, 327,1024,1417, 795, 121,1844, 733, 403,1418,1845,1846,1847, 300,
69
+ 119, 711,1212, 627,1848,1272, 207,1849,1850, 796,1213, 382,1851, 519,1852,1083,
70
+ 893,1853,1854,1855, 367, 809, 487, 671,1856, 663,1857,1858, 956, 471, 306, 857,
71
+ 1859,1860,1160,1084,1861,1862,1863,1864,1865,1061,1866,1867,1868,1869,1870,1871,
72
+ 282, 96, 574,1872, 502,1085,1873,1214,1874, 907,1875,1876, 827, 977,1419,1420,
73
+ 1421, 268,1877,1422,1878,1879,1880, 308,1881, 2, 537,1882,1883,1215,1884,1885,
74
+ 127, 791,1886,1273,1423,1887, 34, 336, 404, 643,1888, 571, 654, 894, 840,1889,
75
+ 0, 886,1274, 122, 575, 260, 908, 938,1890,1275, 410, 316,1891,1892, 100,1893,
76
+ 1894,1123, 48,1161,1124,1025,1895, 633, 901,1276,1896,1897, 115, 816,1898, 317,
77
+ 1899, 694,1900, 909, 734,1424, 572, 866,1425, 691, 85, 524,1010, 543, 394, 841,
78
+ 1901,1902,1903,1026,1904,1905,1906,1907,1908,1909, 30, 451, 651, 988, 310,1910,
79
+ 1911,1426, 810,1216, 93,1912,1913,1277,1217,1914, 858, 759, 45, 58, 181, 610,
80
+ 269,1915,1916, 131,1062, 551, 443,1000, 821,1427, 957, 895,1086,1917,1918, 375,
81
+ 1919, 359,1920, 687,1921, 822,1922, 293,1923,1924, 40, 662, 118, 692, 29, 939,
82
+ 887, 640, 482, 174,1925, 69,1162, 728,1428, 910,1926,1278,1218,1279, 386, 870,
83
+ 217, 854,1163, 823,1927,1928,1929,1930, 834,1931, 78,1932, 859,1933,1063,1934,
84
+ 1935,1936,1937, 438,1164, 208, 595,1938,1939,1940,1941,1219,1125,1942, 280, 888,
85
+ 1429,1430,1220,1431,1943,1944,1945,1946,1947,1280, 150, 510,1432,1948,1949,1950,
86
+ 1951,1952,1953,1954,1011,1087,1955,1433,1043,1956, 881,1957, 614, 958,1064,1065,
87
+ 1221,1958, 638,1001, 860, 967, 896,1434, 989, 492, 553,1281,1165,1959,1282,1002,
88
+ 1283,1222,1960,1961,1962,1963, 36, 383, 228, 753, 247, 454,1964, 876, 678,1965,
89
+ 1966,1284, 126, 464, 490, 835, 136, 672, 529, 940,1088,1435, 473,1967,1968, 467,
90
+ 50, 390, 227, 587, 279, 378, 598, 792, 968, 240, 151, 160, 849, 882,1126,1285,
91
+ 639,1044, 133, 140, 288, 360, 811, 563,1027, 561, 142, 523,1969,1970,1971, 7,
92
+ 103, 296, 439, 407, 506, 634, 990,1972,1973,1974,1975, 645,1976,1977,1978,1979,
93
+ 1980,1981, 236,1982,1436,1983,1984,1089, 192, 828, 618, 518,1166, 333,1127,1985,
94
+ 818,1223,1986,1987,1988,1989,1990,1991,1992,1993, 342,1128,1286, 746, 842,1994,
95
+ 1995, 560, 223,1287, 98, 8, 189, 650, 978,1288,1996,1437,1997, 17, 345, 250,
96
+ 423, 277, 234, 512, 226, 97, 289, 42, 167,1998, 201,1999,2000, 843, 836, 824,
97
+ 532, 338, 783,1090, 182, 576, 436,1438,1439, 527, 500,2001, 947, 889,2002,2003,
98
+ 2004,2005, 262, 600, 314, 447,2006, 547,2007, 693, 738,1129,2008, 71,1440, 745,
99
+ 619, 688,2009, 829,2010,2011, 147,2012, 33, 948,2013,2014, 74, 224,2015, 61,
100
+ 191, 918, 399, 637,2016,1028,1130, 257, 902,2017,2018,2019,2020,2021,2022,2023,
101
+ 2024,2025,2026, 837,2027,2028,2029,2030, 179, 874, 591, 52, 724, 246,2031,2032,
102
+ 2033,2034,1167, 969,2035,1289, 630, 605, 911,1091,1168,2036,2037,2038,1441, 912,
103
+ 2039, 623,2040,2041, 253,1169,1290,2042,1442, 146, 620, 611, 577, 433,2043,1224,
104
+ 719,1170, 959, 440, 437, 534, 84, 388, 480,1131, 159, 220, 198, 679,2044,1012,
105
+ 819,1066,1443, 113,1225, 194, 318,1003,1029,2045,2046,2047,2048,1067,2049,2050,
106
+ 2051,2052,2053, 59, 913, 112,2054, 632,2055, 455, 144, 739,1291,2056, 273, 681,
107
+ 499,2057, 448,2058,2059, 760,2060,2061, 970, 384, 169, 245,1132,2062,2063, 414,
108
+ 1444,2064,2065, 41, 235,2066, 157, 252, 877, 568, 919, 789, 580,2067, 725,2068,
109
+ 2069,1292,2070,2071,1445,2072,1446,2073,2074, 55, 588, 66,1447, 271,1092,2075,
110
+ 1226,2076, 960,1013, 372,2077,2078,2079,2080,2081,1293,2082,2083,2084,2085, 850,
111
+ 2086,2087,2088,2089,2090, 186,2091,1068, 180,2092,2093,2094, 109,1227, 522, 606,
112
+ 2095, 867,1448,1093, 991,1171, 926, 353,1133,2096, 581,2097,2098,2099,1294,1449,
113
+ 1450,2100, 596,1172,1014,1228,2101,1451,1295,1173,1229,2102,2103,1296,1134,1452,
114
+ 949,1135,2104,2105,1094,1453,1454,1455,2106,1095,2107,2108,2109,2110,2111,2112,
115
+ 2113,2114,2115,2116,2117, 804,2118,2119,1230,1231, 805,1456, 405,1136,2120,2121,
116
+ 2122,2123,2124, 720, 701,1297, 992,1457, 927,1004,2125,2126,2127,2128,2129,2130,
117
+ 22, 417,2131, 303,2132, 385,2133, 971, 520, 513,2134,1174, 73,1096, 231, 274,
118
+ 962,1458, 673,2135,1459,2136, 152,1137,2137,2138,2139,2140,1005,1138,1460,1139,
119
+ 2141,2142,2143,2144, 11, 374, 844,2145, 154,1232, 46,1461,2146, 838, 830, 721,
120
+ 1233, 106,2147, 90, 428, 462, 578, 566,1175, 352,2148,2149, 538,1234, 124,1298,
121
+ 2150,1462, 761, 565,2151, 686,2152, 649,2153, 72, 173,2154, 460, 415,2155,1463,
122
+ 2156,1235, 305,2157,2158,2159,2160,2161,2162, 579,2163,2164,2165,2166,2167, 747,
123
+ 2168,2169,2170,2171,1464, 669,2172,2173,2174,2175,2176,1465,2177, 23, 530, 285,
124
+ 2178, 335, 729,2179, 397,2180,2181,2182,1030,2183,2184, 698,2185,2186, 325,2187,
125
+ 2188, 369,2189, 799,1097,1015, 348,2190,1069, 680,2191, 851,1466,2192,2193, 10,
126
+ 2194, 613, 424,2195, 979, 108, 449, 589, 27, 172, 81,1031, 80, 774, 281, 350,
127
+ 1032, 525, 301, 582,1176,2196, 674,1045,2197,2198,1467, 730, 762,2199,2200,2201,
128
+ 2202,1468,2203, 993,2204,2205, 266,1070, 963,1140,2206,2207,2208, 664,1098, 972,
129
+ 2209,2210,2211,1177,1469,1470, 871,2212,2213,2214,2215,2216,1471,2217,2218,2219,
130
+ 2220,2221,2222,2223,2224,2225,2226,2227,1472,1236,2228,2229,2230,2231,2232,2233,
131
+ 2234,2235,1299,2236,2237, 200,2238, 477, 373,2239,2240, 731, 825, 777,2241,2242,
132
+ 2243, 521, 486, 548,2244,2245,2246,1473,1300, 53, 549, 137, 875, 76, 158,2247,
133
+ 1301,1474, 469, 396,1016, 278, 712,2248, 321, 442, 503, 767, 744, 941,1237,1178,
134
+ 1475,2249, 82, 178,1141,1179, 973,2250,1302,2251, 297,2252,2253, 570,2254,2255,
135
+ 2256, 18, 450, 206,2257, 290, 292,1142,2258, 511, 162, 99, 346, 164, 735,2259,
136
+ 1476,1477, 4, 554, 343, 798,1099,2260,1100,2261, 43, 171,1303, 139, 215,2262,
137
+ 2263, 717, 775,2264,1033, 322, 216,2265, 831,2266, 149,2267,1304,2268,2269, 702,
138
+ 1238, 135, 845, 347, 309,2270, 484,2271, 878, 655, 238,1006,1478,2272, 67,2273,
139
+ 295,2274,2275, 461,2276, 478, 942, 412,2277,1034,2278,2279,2280, 265,2281, 541,
140
+ 2282,2283,2284,2285,2286, 70, 852,1071,2287,2288,2289,2290, 21, 56, 509, 117,
141
+ 432,2291,2292, 331, 980, 552,1101, 148, 284, 105, 393,1180,1239, 755,2293, 187,
142
+ 2294,1046,1479,2295, 340,2296, 63,1047, 230,2297,2298,1305, 763,1306, 101, 800,
143
+ 808, 494,2299,2300,2301, 903,2302, 37,1072, 14, 5,2303, 79, 675,2304, 312,
144
+ 2305,2306,2307,2308,2309,1480, 6,1307,2310,2311,2312, 1, 470, 35, 24, 229,
145
+ 2313, 695, 210, 86, 778, 15, 784, 592, 779, 32, 77, 855, 964,2314, 259,2315,
146
+ 501, 380,2316,2317, 83, 981, 153, 689,1308,1481,1482,1483,2318,2319, 716,1484,
147
+ 2320,2321,2322,2323,2324,2325,1485,2326,2327, 128, 57, 68, 261,1048, 211, 170,
148
+ 1240, 31,2328, 51, 435, 742,2329,2330,2331, 635,2332, 264, 456,2333,2334,2335,
149
+ 425,2336,1486, 143, 507, 263, 943,2337, 363, 920,1487, 256,1488,1102, 243, 601,
150
+ 1489,2338,2339,2340,2341,2342,2343,2344, 861,2345,2346,2347,2348,2349,2350, 395,
151
+ 2351,1490,1491, 62, 535, 166, 225,2352,2353, 668, 419,1241, 138, 604, 928,2354,
152
+ 1181,2355,1492,1493,2356,2357,2358,1143,2359, 696,2360, 387, 307,1309, 682, 476,
153
+ 2361,2362, 332, 12, 222, 156,2363, 232,2364, 641, 276, 656, 517,1494,1495,1035,
154
+ 416, 736,1496,2365,1017, 586,2366,2367,2368,1497,2369, 242,2370,2371,2372,1498,
155
+ 2373, 965, 713,2374,2375,2376,2377, 740, 982,1499, 944,1500,1007,2378,2379,1310,
156
+ 1501,2380,2381,2382, 785, 329,2383,2384,1502,2385,2386,2387, 932,2388,1503,2389,
157
+ 2390,2391,2392,1242,2393,2394,2395,2396,2397, 994, 950,2398,2399,2400,2401,1504,
158
+ 1311,2402,2403,2404,2405,1049, 749,2406,2407, 853, 718,1144,1312,2408,1182,1505,
159
+ 2409,2410, 255, 516, 479, 564, 550, 214,1506,1507,1313, 413, 239, 444, 339,1145,
160
+ 1036,1508,1509,1314,1037,1510,1315,2411,1511,2412,2413,2414, 176, 703, 497, 624,
161
+ 593, 921, 302,2415, 341, 165,1103,1512,2416,1513,2417,2418,2419, 376,2420, 700,
162
+ 2421,2422,2423, 258, 768,1316,2424,1183,2425, 995, 608,2426,2427,2428,2429, 221,
163
+ 2430,2431,2432,2433,2434,2435,2436,2437, 195, 323, 726, 188, 897, 983,1317, 377,
164
+ 644,1050, 879,2438, 452,2439,2440,2441,2442,2443,2444, 914,2445,2446,2447,2448,
165
+ 915, 489,2449,1514,1184,2450,2451, 515, 64, 427, 495,2452, 583,2453, 483, 485,
166
+ 1038, 562, 213,1515, 748, 666,2454,2455,2456,2457, 334,2458, 780, 996,1008, 705,
167
+ 1243,2459,2460,2461,2462,2463, 114,2464, 493,1146, 366, 163,1516, 961,1104,2465,
168
+ 291,2466,1318,1105,2467,1517, 365,2468, 355, 951,1244,2469,1319,2470, 631,2471,
169
+ 2472, 218,1320, 364, 320, 756,1518,1519,1321,1520,1322,2473,2474,2475,2476, 997,
170
+ 2477,2478,2479,2480, 665,1185,2481, 916,1521,2482,2483,2484, 584, 684,2485,2486,
171
+ 797,2487,1051,1186,2488,2489,2490,1522,2491,2492, 370,2493,1039,1187, 65,2494,
172
+ 434, 205, 463,1188,2495, 125, 812, 391, 402, 826, 699, 286, 398, 155, 781, 771,
173
+ 585,2496, 590, 505,1073,2497, 599, 244, 219, 917,1018, 952, 646,1523,2498,1323,
174
+ 2499,2500, 49, 984, 354, 741,2501, 625,2502,1324,2503,1019, 190, 357, 757, 491,
175
+ 95, 782, 868,2504,2505,2506,2507,2508,2509, 134,1524,1074, 422,1525, 898,2510,
176
+ 161,2511,2512,2513,2514, 769,2515,1526,2516,2517, 411,1325,2518, 472,1527,2519,
177
+ 2520,2521,2522,2523,2524, 985,2525,2526,2527,2528,2529,2530, 764,2531,1245,2532,
178
+ 2533, 25, 204, 311,2534, 496,2535,1052,2536,2537,2538,2539,2540,2541,2542, 199,
179
+ 704, 504, 468, 758, 657,1528, 196, 44, 839,1246, 272, 750,2543, 765, 862,2544,
180
+ 2545,1326,2546, 132, 615, 933,2547, 732,2548,2549,2550,1189,1529,2551, 283,1247,
181
+ 1053, 607, 929,2552,2553,2554, 930, 183, 872, 616,1040,1147,2555,1148,1020, 441,
182
+ 249,1075,2556,2557,2558, 466, 743,2559,2560,2561, 92, 514, 426, 420, 526,2562,
183
+ 2563,2564,2565,2566,2567,2568, 185,2569,2570,2571,2572, 776,1530, 658,2573, 362,
184
+ 2574, 361, 922,1076, 793,2575,2576,2577,2578,2579,2580,1531, 251,2581,2582,2583,
185
+ 2584,1532, 54, 612, 237,1327,2585,2586, 275, 408, 647, 111,2587,1533,1106, 465,
186
+ 3, 458, 9, 38,2588, 107, 110, 890, 209, 26, 737, 498,2589,1534,2590, 431,
187
+ 202, 88,1535, 356, 287,1107, 660,1149,2591, 381,1536, 986,1150, 445,1248,1151,
188
+ 974,2592,2593, 846,2594, 446, 953, 184,1249,1250, 727,2595, 923, 193, 883,2596,
189
+ 2597,2598, 102, 324, 539, 817,2599, 421,1041,2600, 832,2601, 94, 175, 197, 406,
190
+ 2602, 459,2603,2604,2605,2606,2607, 330, 555,2608,2609,2610, 706,1108, 389,2611,
191
+ 2612,2613,2614, 233,2615, 833, 558, 931, 954,1251,2616,2617,1537, 546,2618,2619,
192
+ 1009,2620,2621,2622,1538, 690,1328,2623, 955,2624,1539,2625,2626, 772,2627,2628,
193
+ 2629,2630,2631, 924, 648, 863, 603,2632,2633, 934,1540, 864, 865,2634, 642,1042,
194
+ 670,1190,2635,2636,2637,2638, 168,2639, 652, 873, 542,1054,1541,2640,2641,2642, # 512, 256
195
+ )
196
+ # fmt: on
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/euctwfreq.py ADDED
@@ -0,0 +1,388 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Communicator client code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ # EUCTW frequency table
29
+ # Converted from big5 work
30
+ # by Taiwan's Mandarin Promotion Council
31
+ # <http:#www.edu.tw:81/mandr/>
32
+
33
+ # 128 --> 0.42261
34
+ # 256 --> 0.57851
35
+ # 512 --> 0.74851
36
+ # 1024 --> 0.89384
37
+ # 2048 --> 0.97583
38
+ #
39
+ # Idea Distribution Ratio = 0.74851/(1-0.74851) =2.98
40
+ # Random Distribution Ration = 512/(5401-512)=0.105
41
+ #
42
+ # Typical Distribution Ratio about 25% of Ideal one, still much higher than RDR
43
+
44
+ EUCTW_TYPICAL_DISTRIBUTION_RATIO = 0.75
45
+
46
+ # Char to FreqOrder table
47
+ EUCTW_TABLE_SIZE = 5376
48
+
49
+ # fmt: off
50
+ EUCTW_CHAR_TO_FREQ_ORDER = (
51
+ 1, 1800, 1506, 255, 1431, 198, 9, 82, 6, 7310, 177, 202, 3615, 1256, 2808, 110, # 2742
52
+ 3735, 33, 3241, 261, 76, 44, 2113, 16, 2931, 2184, 1176, 659, 3868, 26, 3404, 2643, # 2758
53
+ 1198, 3869, 3313, 4060, 410, 2211, 302, 590, 361, 1963, 8, 204, 58, 4296, 7311, 1931, # 2774
54
+ 63, 7312, 7313, 317, 1614, 75, 222, 159, 4061, 2412, 1480, 7314, 3500, 3068, 224, 2809, # 2790
55
+ 3616, 3, 10, 3870, 1471, 29, 2774, 1135, 2852, 1939, 873, 130, 3242, 1123, 312, 7315, # 2806
56
+ 4297, 2051, 507, 252, 682, 7316, 142, 1914, 124, 206, 2932, 34, 3501, 3173, 64, 604, # 2822
57
+ 7317, 2494, 1976, 1977, 155, 1990, 645, 641, 1606, 7318, 3405, 337, 72, 406, 7319, 80, # 2838
58
+ 630, 238, 3174, 1509, 263, 939, 1092, 2644, 756, 1440, 1094, 3406, 449, 69, 2969, 591, # 2854
59
+ 179, 2095, 471, 115, 2034, 1843, 60, 50, 2970, 134, 806, 1868, 734, 2035, 3407, 180, # 2870
60
+ 995, 1607, 156, 537, 2893, 688, 7320, 319, 1305, 779, 2144, 514, 2374, 298, 4298, 359, # 2886
61
+ 2495, 90, 2707, 1338, 663, 11, 906, 1099, 2545, 20, 2436, 182, 532, 1716, 7321, 732, # 2902
62
+ 1376, 4062, 1311, 1420, 3175, 25, 2312, 1056, 113, 399, 382, 1949, 242, 3408, 2467, 529, # 2918
63
+ 3243, 475, 1447, 3617, 7322, 117, 21, 656, 810, 1297, 2295, 2329, 3502, 7323, 126, 4063, # 2934
64
+ 706, 456, 150, 613, 4299, 71, 1118, 2036, 4064, 145, 3069, 85, 835, 486, 2114, 1246, # 2950
65
+ 1426, 428, 727, 1285, 1015, 800, 106, 623, 303, 1281, 7324, 2127, 2354, 347, 3736, 221, # 2966
66
+ 3503, 3110, 7325, 1955, 1153, 4065, 83, 296, 1199, 3070, 192, 624, 93, 7326, 822, 1897, # 2982
67
+ 2810, 3111, 795, 2064, 991, 1554, 1542, 1592, 27, 43, 2853, 859, 139, 1456, 860, 4300, # 2998
68
+ 437, 712, 3871, 164, 2392, 3112, 695, 211, 3017, 2096, 195, 3872, 1608, 3504, 3505, 3618, # 3014
69
+ 3873, 234, 811, 2971, 2097, 3874, 2229, 1441, 3506, 1615, 2375, 668, 2076, 1638, 305, 228, # 3030
70
+ 1664, 4301, 467, 415, 7327, 262, 2098, 1593, 239, 108, 300, 200, 1033, 512, 1247, 2077, # 3046
71
+ 7328, 7329, 2173, 3176, 3619, 2673, 593, 845, 1062, 3244, 88, 1723, 2037, 3875, 1950, 212, # 3062
72
+ 266, 152, 149, 468, 1898, 4066, 4302, 77, 187, 7330, 3018, 37, 5, 2972, 7331, 3876, # 3078
73
+ 7332, 7333, 39, 2517, 4303, 2894, 3177, 2078, 55, 148, 74, 4304, 545, 483, 1474, 1029, # 3094
74
+ 1665, 217, 1869, 1531, 3113, 1104, 2645, 4067, 24, 172, 3507, 900, 3877, 3508, 3509, 4305, # 3110
75
+ 32, 1408, 2811, 1312, 329, 487, 2355, 2247, 2708, 784, 2674, 4, 3019, 3314, 1427, 1788, # 3126
76
+ 188, 109, 499, 7334, 3620, 1717, 1789, 888, 1217, 3020, 4306, 7335, 3510, 7336, 3315, 1520, # 3142
77
+ 3621, 3878, 196, 1034, 775, 7337, 7338, 929, 1815, 249, 439, 38, 7339, 1063, 7340, 794, # 3158
78
+ 3879, 1435, 2296, 46, 178, 3245, 2065, 7341, 2376, 7342, 214, 1709, 4307, 804, 35, 707, # 3174
79
+ 324, 3622, 1601, 2546, 140, 459, 4068, 7343, 7344, 1365, 839, 272, 978, 2257, 2572, 3409, # 3190
80
+ 2128, 1363, 3623, 1423, 697, 100, 3071, 48, 70, 1231, 495, 3114, 2193, 7345, 1294, 7346, # 3206
81
+ 2079, 462, 586, 1042, 3246, 853, 256, 988, 185, 2377, 3410, 1698, 434, 1084, 7347, 3411, # 3222
82
+ 314, 2615, 2775, 4308, 2330, 2331, 569, 2280, 637, 1816, 2518, 757, 1162, 1878, 1616, 3412, # 3238
83
+ 287, 1577, 2115, 768, 4309, 1671, 2854, 3511, 2519, 1321, 3737, 909, 2413, 7348, 4069, 933, # 3254
84
+ 3738, 7349, 2052, 2356, 1222, 4310, 765, 2414, 1322, 786, 4311, 7350, 1919, 1462, 1677, 2895, # 3270
85
+ 1699, 7351, 4312, 1424, 2437, 3115, 3624, 2590, 3316, 1774, 1940, 3413, 3880, 4070, 309, 1369, # 3286
86
+ 1130, 2812, 364, 2230, 1653, 1299, 3881, 3512, 3882, 3883, 2646, 525, 1085, 3021, 902, 2000, # 3302
87
+ 1475, 964, 4313, 421, 1844, 1415, 1057, 2281, 940, 1364, 3116, 376, 4314, 4315, 1381, 7, # 3318
88
+ 2520, 983, 2378, 336, 1710, 2675, 1845, 321, 3414, 559, 1131, 3022, 2742, 1808, 1132, 1313, # 3334
89
+ 265, 1481, 1857, 7352, 352, 1203, 2813, 3247, 167, 1089, 420, 2814, 776, 792, 1724, 3513, # 3350
90
+ 4071, 2438, 3248, 7353, 4072, 7354, 446, 229, 333, 2743, 901, 3739, 1200, 1557, 4316, 2647, # 3366
91
+ 1920, 395, 2744, 2676, 3740, 4073, 1835, 125, 916, 3178, 2616, 4317, 7355, 7356, 3741, 7357, # 3382
92
+ 7358, 7359, 4318, 3117, 3625, 1133, 2547, 1757, 3415, 1510, 2313, 1409, 3514, 7360, 2145, 438, # 3398
93
+ 2591, 2896, 2379, 3317, 1068, 958, 3023, 461, 311, 2855, 2677, 4074, 1915, 3179, 4075, 1978, # 3414
94
+ 383, 750, 2745, 2617, 4076, 274, 539, 385, 1278, 1442, 7361, 1154, 1964, 384, 561, 210, # 3430
95
+ 98, 1295, 2548, 3515, 7362, 1711, 2415, 1482, 3416, 3884, 2897, 1257, 129, 7363, 3742, 642, # 3446
96
+ 523, 2776, 2777, 2648, 7364, 141, 2231, 1333, 68, 176, 441, 876, 907, 4077, 603, 2592, # 3462
97
+ 710, 171, 3417, 404, 549, 18, 3118, 2393, 1410, 3626, 1666, 7365, 3516, 4319, 2898, 4320, # 3478
98
+ 7366, 2973, 368, 7367, 146, 366, 99, 871, 3627, 1543, 748, 807, 1586, 1185, 22, 2258, # 3494
99
+ 379, 3743, 3180, 7368, 3181, 505, 1941, 2618, 1991, 1382, 2314, 7369, 380, 2357, 218, 702, # 3510
100
+ 1817, 1248, 3418, 3024, 3517, 3318, 3249, 7370, 2974, 3628, 930, 3250, 3744, 7371, 59, 7372, # 3526
101
+ 585, 601, 4078, 497, 3419, 1112, 1314, 4321, 1801, 7373, 1223, 1472, 2174, 7374, 749, 1836, # 3542
102
+ 690, 1899, 3745, 1772, 3885, 1476, 429, 1043, 1790, 2232, 2116, 917, 4079, 447, 1086, 1629, # 3558
103
+ 7375, 556, 7376, 7377, 2020, 1654, 844, 1090, 105, 550, 966, 1758, 2815, 1008, 1782, 686, # 3574
104
+ 1095, 7378, 2282, 793, 1602, 7379, 3518, 2593, 4322, 4080, 2933, 2297, 4323, 3746, 980, 2496, # 3590
105
+ 544, 353, 527, 4324, 908, 2678, 2899, 7380, 381, 2619, 1942, 1348, 7381, 1341, 1252, 560, # 3606
106
+ 3072, 7382, 3420, 2856, 7383, 2053, 973, 886, 2080, 143, 4325, 7384, 7385, 157, 3886, 496, # 3622
107
+ 4081, 57, 840, 540, 2038, 4326, 4327, 3421, 2117, 1445, 970, 2259, 1748, 1965, 2081, 4082, # 3638
108
+ 3119, 1234, 1775, 3251, 2816, 3629, 773, 1206, 2129, 1066, 2039, 1326, 3887, 1738, 1725, 4083, # 3654
109
+ 279, 3120, 51, 1544, 2594, 423, 1578, 2130, 2066, 173, 4328, 1879, 7386, 7387, 1583, 264, # 3670
110
+ 610, 3630, 4329, 2439, 280, 154, 7388, 7389, 7390, 1739, 338, 1282, 3073, 693, 2857, 1411, # 3686
111
+ 1074, 3747, 2440, 7391, 4330, 7392, 7393, 1240, 952, 2394, 7394, 2900, 1538, 2679, 685, 1483, # 3702
112
+ 4084, 2468, 1436, 953, 4085, 2054, 4331, 671, 2395, 79, 4086, 2441, 3252, 608, 567, 2680, # 3718
113
+ 3422, 4087, 4088, 1691, 393, 1261, 1791, 2396, 7395, 4332, 7396, 7397, 7398, 7399, 1383, 1672, # 3734
114
+ 3748, 3182, 1464, 522, 1119, 661, 1150, 216, 675, 4333, 3888, 1432, 3519, 609, 4334, 2681, # 3750
115
+ 2397, 7400, 7401, 7402, 4089, 3025, 0, 7403, 2469, 315, 231, 2442, 301, 3319, 4335, 2380, # 3766
116
+ 7404, 233, 4090, 3631, 1818, 4336, 4337, 7405, 96, 1776, 1315, 2082, 7406, 257, 7407, 1809, # 3782
117
+ 3632, 2709, 1139, 1819, 4091, 2021, 1124, 2163, 2778, 1777, 2649, 7408, 3074, 363, 1655, 3183, # 3798
118
+ 7409, 2975, 7410, 7411, 7412, 3889, 1567, 3890, 718, 103, 3184, 849, 1443, 341, 3320, 2934, # 3814
119
+ 1484, 7413, 1712, 127, 67, 339, 4092, 2398, 679, 1412, 821, 7414, 7415, 834, 738, 351, # 3830
120
+ 2976, 2146, 846, 235, 1497, 1880, 418, 1992, 3749, 2710, 186, 1100, 2147, 2746, 3520, 1545, # 3846
121
+ 1355, 2935, 2858, 1377, 583, 3891, 4093, 2573, 2977, 7416, 1298, 3633, 1078, 2549, 3634, 2358, # 3862
122
+ 78, 3750, 3751, 267, 1289, 2099, 2001, 1594, 4094, 348, 369, 1274, 2194, 2175, 1837, 4338, # 3878
123
+ 1820, 2817, 3635, 2747, 2283, 2002, 4339, 2936, 2748, 144, 3321, 882, 4340, 3892, 2749, 3423, # 3894
124
+ 4341, 2901, 7417, 4095, 1726, 320, 7418, 3893, 3026, 788, 2978, 7419, 2818, 1773, 1327, 2859, # 3910
125
+ 3894, 2819, 7420, 1306, 4342, 2003, 1700, 3752, 3521, 2359, 2650, 787, 2022, 506, 824, 3636, # 3926
126
+ 534, 323, 4343, 1044, 3322, 2023, 1900, 946, 3424, 7421, 1778, 1500, 1678, 7422, 1881, 4344, # 3942
127
+ 165, 243, 4345, 3637, 2521, 123, 683, 4096, 764, 4346, 36, 3895, 1792, 589, 2902, 816, # 3958
128
+ 626, 1667, 3027, 2233, 1639, 1555, 1622, 3753, 3896, 7423, 3897, 2860, 1370, 1228, 1932, 891, # 3974
129
+ 2083, 2903, 304, 4097, 7424, 292, 2979, 2711, 3522, 691, 2100, 4098, 1115, 4347, 118, 662, # 3990
130
+ 7425, 611, 1156, 854, 2381, 1316, 2861, 2, 386, 515, 2904, 7426, 7427, 3253, 868, 2234, # 4006
131
+ 1486, 855, 2651, 785, 2212, 3028, 7428, 1040, 3185, 3523, 7429, 3121, 448, 7430, 1525, 7431, # 4022
132
+ 2164, 4348, 7432, 3754, 7433, 4099, 2820, 3524, 3122, 503, 818, 3898, 3123, 1568, 814, 676, # 4038
133
+ 1444, 306, 1749, 7434, 3755, 1416, 1030, 197, 1428, 805, 2821, 1501, 4349, 7435, 7436, 7437, # 4054
134
+ 1993, 7438, 4350, 7439, 7440, 2195, 13, 2779, 3638, 2980, 3124, 1229, 1916, 7441, 3756, 2131, # 4070
135
+ 7442, 4100, 4351, 2399, 3525, 7443, 2213, 1511, 1727, 1120, 7444, 7445, 646, 3757, 2443, 307, # 4086
136
+ 7446, 7447, 1595, 3186, 7448, 7449, 7450, 3639, 1113, 1356, 3899, 1465, 2522, 2523, 7451, 519, # 4102
137
+ 7452, 128, 2132, 92, 2284, 1979, 7453, 3900, 1512, 342, 3125, 2196, 7454, 2780, 2214, 1980, # 4118
138
+ 3323, 7455, 290, 1656, 1317, 789, 827, 2360, 7456, 3758, 4352, 562, 581, 3901, 7457, 401, # 4134
139
+ 4353, 2248, 94, 4354, 1399, 2781, 7458, 1463, 2024, 4355, 3187, 1943, 7459, 828, 1105, 4101, # 4150
140
+ 1262, 1394, 7460, 4102, 605, 4356, 7461, 1783, 2862, 7462, 2822, 819, 2101, 578, 2197, 2937, # 4166
141
+ 7463, 1502, 436, 3254, 4103, 3255, 2823, 3902, 2905, 3425, 3426, 7464, 2712, 2315, 7465, 7466, # 4182
142
+ 2332, 2067, 23, 4357, 193, 826, 3759, 2102, 699, 1630, 4104, 3075, 390, 1793, 1064, 3526, # 4198
143
+ 7467, 1579, 3076, 3077, 1400, 7468, 4105, 1838, 1640, 2863, 7469, 4358, 4359, 137, 4106, 598, # 4214
144
+ 3078, 1966, 780, 104, 974, 2938, 7470, 278, 899, 253, 402, 572, 504, 493, 1339, 7471, # 4230
145
+ 3903, 1275, 4360, 2574, 2550, 7472, 3640, 3029, 3079, 2249, 565, 1334, 2713, 863, 41, 7473, # 4246
146
+ 7474, 4361, 7475, 1657, 2333, 19, 463, 2750, 4107, 606, 7476, 2981, 3256, 1087, 2084, 1323, # 4262
147
+ 2652, 2982, 7477, 1631, 1623, 1750, 4108, 2682, 7478, 2864, 791, 2714, 2653, 2334, 232, 2416, # 4278
148
+ 7479, 2983, 1498, 7480, 2654, 2620, 755, 1366, 3641, 3257, 3126, 2025, 1609, 119, 1917, 3427, # 4294
149
+ 862, 1026, 4109, 7481, 3904, 3760, 4362, 3905, 4363, 2260, 1951, 2470, 7482, 1125, 817, 4110, # 4310
150
+ 4111, 3906, 1513, 1766, 2040, 1487, 4112, 3030, 3258, 2824, 3761, 3127, 7483, 7484, 1507, 7485, # 4326
151
+ 2683, 733, 40, 1632, 1106, 2865, 345, 4113, 841, 2524, 230, 4364, 2984, 1846, 3259, 3428, # 4342
152
+ 7486, 1263, 986, 3429, 7487, 735, 879, 254, 1137, 857, 622, 1300, 1180, 1388, 1562, 3907, # 4358
153
+ 3908, 2939, 967, 2751, 2655, 1349, 592, 2133, 1692, 3324, 2985, 1994, 4114, 1679, 3909, 1901, # 4374
154
+ 2185, 7488, 739, 3642, 2715, 1296, 1290, 7489, 4115, 2198, 2199, 1921, 1563, 2595, 2551, 1870, # 4390
155
+ 2752, 2986, 7490, 435, 7491, 343, 1108, 596, 17, 1751, 4365, 2235, 3430, 3643, 7492, 4366, # 4406
156
+ 294, 3527, 2940, 1693, 477, 979, 281, 2041, 3528, 643, 2042, 3644, 2621, 2782, 2261, 1031, # 4422
157
+ 2335, 2134, 2298, 3529, 4367, 367, 1249, 2552, 7493, 3530, 7494, 4368, 1283, 3325, 2004, 240, # 4438
158
+ 1762, 3326, 4369, 4370, 836, 1069, 3128, 474, 7495, 2148, 2525, 268, 3531, 7496, 3188, 1521, # 4454
159
+ 1284, 7497, 1658, 1546, 4116, 7498, 3532, 3533, 7499, 4117, 3327, 2684, 1685, 4118, 961, 1673, # 4470
160
+ 2622, 190, 2005, 2200, 3762, 4371, 4372, 7500, 570, 2497, 3645, 1490, 7501, 4373, 2623, 3260, # 4486
161
+ 1956, 4374, 584, 1514, 396, 1045, 1944, 7502, 4375, 1967, 2444, 7503, 7504, 4376, 3910, 619, # 4502
162
+ 7505, 3129, 3261, 215, 2006, 2783, 2553, 3189, 4377, 3190, 4378, 763, 4119, 3763, 4379, 7506, # 4518
163
+ 7507, 1957, 1767, 2941, 3328, 3646, 1174, 452, 1477, 4380, 3329, 3130, 7508, 2825, 1253, 2382, # 4534
164
+ 2186, 1091, 2285, 4120, 492, 7509, 638, 1169, 1824, 2135, 1752, 3911, 648, 926, 1021, 1324, # 4550
165
+ 4381, 520, 4382, 997, 847, 1007, 892, 4383, 3764, 2262, 1871, 3647, 7510, 2400, 1784, 4384, # 4566
166
+ 1952, 2942, 3080, 3191, 1728, 4121, 2043, 3648, 4385, 2007, 1701, 3131, 1551, 30, 2263, 4122, # 4582
167
+ 7511, 2026, 4386, 3534, 7512, 501, 7513, 4123, 594, 3431, 2165, 1821, 3535, 3432, 3536, 3192, # 4598
168
+ 829, 2826, 4124, 7514, 1680, 3132, 1225, 4125, 7515, 3262, 4387, 4126, 3133, 2336, 7516, 4388, # 4614
169
+ 4127, 7517, 3912, 3913, 7518, 1847, 2383, 2596, 3330, 7519, 4389, 374, 3914, 652, 4128, 4129, # 4630
170
+ 375, 1140, 798, 7520, 7521, 7522, 2361, 4390, 2264, 546, 1659, 138, 3031, 2445, 4391, 7523, # 4646
171
+ 2250, 612, 1848, 910, 796, 3765, 1740, 1371, 825, 3766, 3767, 7524, 2906, 2554, 7525, 692, # 4662
172
+ 444, 3032, 2624, 801, 4392, 4130, 7526, 1491, 244, 1053, 3033, 4131, 4132, 340, 7527, 3915, # 4678
173
+ 1041, 2987, 293, 1168, 87, 1357, 7528, 1539, 959, 7529, 2236, 721, 694, 4133, 3768, 219, # 4694
174
+ 1478, 644, 1417, 3331, 2656, 1413, 1401, 1335, 1389, 3916, 7530, 7531, 2988, 2362, 3134, 1825, # 4710
175
+ 730, 1515, 184, 2827, 66, 4393, 7532, 1660, 2943, 246, 3332, 378, 1457, 226, 3433, 975, # 4726
176
+ 3917, 2944, 1264, 3537, 674, 696, 7533, 163, 7534, 1141, 2417, 2166, 713, 3538, 3333, 4394, # 4742
177
+ 3918, 7535, 7536, 1186, 15, 7537, 1079, 1070, 7538, 1522, 3193, 3539, 276, 1050, 2716, 758, # 4758
178
+ 1126, 653, 2945, 3263, 7539, 2337, 889, 3540, 3919, 3081, 2989, 903, 1250, 4395, 3920, 3434, # 4774
179
+ 3541, 1342, 1681, 1718, 766, 3264, 286, 89, 2946, 3649, 7540, 1713, 7541, 2597, 3334, 2990, # 4790
180
+ 7542, 2947, 2215, 3194, 2866, 7543, 4396, 2498, 2526, 181, 387, 1075, 3921, 731, 2187, 3335, # 4806
181
+ 7544, 3265, 310, 313, 3435, 2299, 770, 4134, 54, 3034, 189, 4397, 3082, 3769, 3922, 7545, # 4822
182
+ 1230, 1617, 1849, 355, 3542, 4135, 4398, 3336, 111, 4136, 3650, 1350, 3135, 3436, 3035, 4137, # 4838
183
+ 2149, 3266, 3543, 7546, 2784, 3923, 3924, 2991, 722, 2008, 7547, 1071, 247, 1207, 2338, 2471, # 4854
184
+ 1378, 4399, 2009, 864, 1437, 1214, 4400, 373, 3770, 1142, 2216, 667, 4401, 442, 2753, 2555, # 4870
185
+ 3771, 3925, 1968, 4138, 3267, 1839, 837, 170, 1107, 934, 1336, 1882, 7548, 7549, 2118, 4139, # 4886
186
+ 2828, 743, 1569, 7550, 4402, 4140, 582, 2384, 1418, 3437, 7551, 1802, 7552, 357, 1395, 1729, # 4902
187
+ 3651, 3268, 2418, 1564, 2237, 7553, 3083, 3772, 1633, 4403, 1114, 2085, 4141, 1532, 7554, 482, # 4918
188
+ 2446, 4404, 7555, 7556, 1492, 833, 1466, 7557, 2717, 3544, 1641, 2829, 7558, 1526, 1272, 3652, # 4934
189
+ 4142, 1686, 1794, 416, 2556, 1902, 1953, 1803, 7559, 3773, 2785, 3774, 1159, 2316, 7560, 2867, # 4950
190
+ 4405, 1610, 1584, 3036, 2419, 2754, 443, 3269, 1163, 3136, 7561, 7562, 3926, 7563, 4143, 2499, # 4966
191
+ 3037, 4406, 3927, 3137, 2103, 1647, 3545, 2010, 1872, 4144, 7564, 4145, 431, 3438, 7565, 250, # 4982
192
+ 97, 81, 4146, 7566, 1648, 1850, 1558, 160, 848, 7567, 866, 740, 1694, 7568, 2201, 2830, # 4998
193
+ 3195, 4147, 4407, 3653, 1687, 950, 2472, 426, 469, 3196, 3654, 3655, 3928, 7569, 7570, 1188, # 5014
194
+ 424, 1995, 861, 3546, 4148, 3775, 2202, 2685, 168, 1235, 3547, 4149, 7571, 2086, 1674, 4408, # 5030
195
+ 3337, 3270, 220, 2557, 1009, 7572, 3776, 670, 2992, 332, 1208, 717, 7573, 7574, 3548, 2447, # 5046
196
+ 3929, 3338, 7575, 513, 7576, 1209, 2868, 3339, 3138, 4409, 1080, 7577, 7578, 7579, 7580, 2527, # 5062
197
+ 3656, 3549, 815, 1587, 3930, 3931, 7581, 3550, 3439, 3777, 1254, 4410, 1328, 3038, 1390, 3932, # 5078
198
+ 1741, 3933, 3778, 3934, 7582, 236, 3779, 2448, 3271, 7583, 7584, 3657, 3780, 1273, 3781, 4411, # 5094
199
+ 7585, 308, 7586, 4412, 245, 4413, 1851, 2473, 1307, 2575, 430, 715, 2136, 2449, 7587, 270, # 5110
200
+ 199, 2869, 3935, 7588, 3551, 2718, 1753, 761, 1754, 725, 1661, 1840, 4414, 3440, 3658, 7589, # 5126
201
+ 7590, 587, 14, 3272, 227, 2598, 326, 480, 2265, 943, 2755, 3552, 291, 650, 1883, 7591, # 5142
202
+ 1702, 1226, 102, 1547, 62, 3441, 904, 4415, 3442, 1164, 4150, 7592, 7593, 1224, 1548, 2756, # 5158
203
+ 391, 498, 1493, 7594, 1386, 1419, 7595, 2055, 1177, 4416, 813, 880, 1081, 2363, 566, 1145, # 5174
204
+ 4417, 2286, 1001, 1035, 2558, 2599, 2238, 394, 1286, 7596, 7597, 2068, 7598, 86, 1494, 1730, # 5190
205
+ 3936, 491, 1588, 745, 897, 2948, 843, 3340, 3937, 2757, 2870, 3273, 1768, 998, 2217, 2069, # 5206
206
+ 397, 1826, 1195, 1969, 3659, 2993, 3341, 284, 7599, 3782, 2500, 2137, 2119, 1903, 7600, 3938, # 5222
207
+ 2150, 3939, 4151, 1036, 3443, 1904, 114, 2559, 4152, 209, 1527, 7601, 7602, 2949, 2831, 2625, # 5238
208
+ 2385, 2719, 3139, 812, 2560, 7603, 3274, 7604, 1559, 737, 1884, 3660, 1210, 885, 28, 2686, # 5254
209
+ 3553, 3783, 7605, 4153, 1004, 1779, 4418, 7606, 346, 1981, 2218, 2687, 4419, 3784, 1742, 797, # 5270
210
+ 1642, 3940, 1933, 1072, 1384, 2151, 896, 3941, 3275, 3661, 3197, 2871, 3554, 7607, 2561, 1958, # 5286
211
+ 4420, 2450, 1785, 7608, 7609, 7610, 3942, 4154, 1005, 1308, 3662, 4155, 2720, 4421, 4422, 1528, # 5302
212
+ 2600, 161, 1178, 4156, 1982, 987, 4423, 1101, 4157, 631, 3943, 1157, 3198, 2420, 1343, 1241, # 5318
213
+ 1016, 2239, 2562, 372, 877, 2339, 2501, 1160, 555, 1934, 911, 3944, 7611, 466, 1170, 169, # 5334
214
+ 1051, 2907, 2688, 3663, 2474, 2994, 1182, 2011, 2563, 1251, 2626, 7612, 992, 2340, 3444, 1540, # 5350
215
+ 2721, 1201, 2070, 2401, 1996, 2475, 7613, 4424, 528, 1922, 2188, 1503, 1873, 1570, 2364, 3342, # 5366
216
+ 3276, 7614, 557, 1073, 7615, 1827, 3445, 2087, 2266, 3140, 3039, 3084, 767, 3085, 2786, 4425, # 5382
217
+ 1006, 4158, 4426, 2341, 1267, 2176, 3664, 3199, 778, 3945, 3200, 2722, 1597, 2657, 7616, 4427, # 5398
218
+ 7617, 3446, 7618, 7619, 7620, 3277, 2689, 1433, 3278, 131, 95, 1504, 3946, 723, 4159, 3141, # 5414
219
+ 1841, 3555, 2758, 2189, 3947, 2027, 2104, 3665, 7621, 2995, 3948, 1218, 7622, 3343, 3201, 3949, # 5430
220
+ 4160, 2576, 248, 1634, 3785, 912, 7623, 2832, 3666, 3040, 3786, 654, 53, 7624, 2996, 7625, # 5446
221
+ 1688, 4428, 777, 3447, 1032, 3950, 1425, 7626, 191, 820, 2120, 2833, 971, 4429, 931, 3202, # 5462
222
+ 135, 664, 783, 3787, 1997, 772, 2908, 1935, 3951, 3788, 4430, 2909, 3203, 282, 2723, 640, # 5478
223
+ 1372, 3448, 1127, 922, 325, 3344, 7627, 7628, 711, 2044, 7629, 7630, 3952, 2219, 2787, 1936, # 5494
224
+ 3953, 3345, 2220, 2251, 3789, 2300, 7631, 4431, 3790, 1258, 3279, 3954, 3204, 2138, 2950, 3955, # 5510
225
+ 3956, 7632, 2221, 258, 3205, 4432, 101, 1227, 7633, 3280, 1755, 7634, 1391, 3281, 7635, 2910, # 5526
226
+ 2056, 893, 7636, 7637, 7638, 1402, 4161, 2342, 7639, 7640, 3206, 3556, 7641, 7642, 878, 1325, # 5542
227
+ 1780, 2788, 4433, 259, 1385, 2577, 744, 1183, 2267, 4434, 7643, 3957, 2502, 7644, 684, 1024, # 5558
228
+ 4162, 7645, 472, 3557, 3449, 1165, 3282, 3958, 3959, 322, 2152, 881, 455, 1695, 1152, 1340, # 5574
229
+ 660, 554, 2153, 4435, 1058, 4436, 4163, 830, 1065, 3346, 3960, 4437, 1923, 7646, 1703, 1918, # 5590
230
+ 7647, 932, 2268, 122, 7648, 4438, 947, 677, 7649, 3791, 2627, 297, 1905, 1924, 2269, 4439, # 5606
231
+ 2317, 3283, 7650, 7651, 4164, 7652, 4165, 84, 4166, 112, 989, 7653, 547, 1059, 3961, 701, # 5622
232
+ 3558, 1019, 7654, 4167, 7655, 3450, 942, 639, 457, 2301, 2451, 993, 2951, 407, 851, 494, # 5638
233
+ 4440, 3347, 927, 7656, 1237, 7657, 2421, 3348, 573, 4168, 680, 921, 2911, 1279, 1874, 285, # 5654
234
+ 790, 1448, 1983, 719, 2167, 7658, 7659, 4441, 3962, 3963, 1649, 7660, 1541, 563, 7661, 1077, # 5670
235
+ 7662, 3349, 3041, 3451, 511, 2997, 3964, 3965, 3667, 3966, 1268, 2564, 3350, 3207, 4442, 4443, # 5686
236
+ 7663, 535, 1048, 1276, 1189, 2912, 2028, 3142, 1438, 1373, 2834, 2952, 1134, 2012, 7664, 4169, # 5702
237
+ 1238, 2578, 3086, 1259, 7665, 700, 7666, 2953, 3143, 3668, 4170, 7667, 4171, 1146, 1875, 1906, # 5718
238
+ 4444, 2601, 3967, 781, 2422, 132, 1589, 203, 147, 273, 2789, 2402, 898, 1786, 2154, 3968, # 5734
239
+ 3969, 7668, 3792, 2790, 7669, 7670, 4445, 4446, 7671, 3208, 7672, 1635, 3793, 965, 7673, 1804, # 5750
240
+ 2690, 1516, 3559, 1121, 1082, 1329, 3284, 3970, 1449, 3794, 65, 1128, 2835, 2913, 2759, 1590, # 5766
241
+ 3795, 7674, 7675, 12, 2658, 45, 976, 2579, 3144, 4447, 517, 2528, 1013, 1037, 3209, 7676, # 5782
242
+ 3796, 2836, 7677, 3797, 7678, 3452, 7679, 2602, 614, 1998, 2318, 3798, 3087, 2724, 2628, 7680, # 5798
243
+ 2580, 4172, 599, 1269, 7681, 1810, 3669, 7682, 2691, 3088, 759, 1060, 489, 1805, 3351, 3285, # 5814
244
+ 1358, 7683, 7684, 2386, 1387, 1215, 2629, 2252, 490, 7685, 7686, 4173, 1759, 2387, 2343, 7687, # 5830
245
+ 4448, 3799, 1907, 3971, 2630, 1806, 3210, 4449, 3453, 3286, 2760, 2344, 874, 7688, 7689, 3454, # 5846
246
+ 3670, 1858, 91, 2914, 3671, 3042, 3800, 4450, 7690, 3145, 3972, 2659, 7691, 3455, 1202, 1403, # 5862
247
+ 3801, 2954, 2529, 1517, 2503, 4451, 3456, 2504, 7692, 4452, 7693, 2692, 1885, 1495, 1731, 3973, # 5878
248
+ 2365, 4453, 7694, 2029, 7695, 7696, 3974, 2693, 1216, 237, 2581, 4174, 2319, 3975, 3802, 4454, # 5894
249
+ 4455, 2694, 3560, 3457, 445, 4456, 7697, 7698, 7699, 7700, 2761, 61, 3976, 3672, 1822, 3977, # 5910
250
+ 7701, 687, 2045, 935, 925, 405, 2660, 703, 1096, 1859, 2725, 4457, 3978, 1876, 1367, 2695, # 5926
251
+ 3352, 918, 2105, 1781, 2476, 334, 3287, 1611, 1093, 4458, 564, 3146, 3458, 3673, 3353, 945, # 5942
252
+ 2631, 2057, 4459, 7702, 1925, 872, 4175, 7703, 3459, 2696, 3089, 349, 4176, 3674, 3979, 4460, # 5958
253
+ 3803, 4177, 3675, 2155, 3980, 4461, 4462, 4178, 4463, 2403, 2046, 782, 3981, 400, 251, 4179, # 5974
254
+ 1624, 7704, 7705, 277, 3676, 299, 1265, 476, 1191, 3804, 2121, 4180, 4181, 1109, 205, 7706, # 5990
255
+ 2582, 1000, 2156, 3561, 1860, 7707, 7708, 7709, 4464, 7710, 4465, 2565, 107, 2477, 2157, 3982, # 6006
256
+ 3460, 3147, 7711, 1533, 541, 1301, 158, 753, 4182, 2872, 3562, 7712, 1696, 370, 1088, 4183, # 6022
257
+ 4466, 3563, 579, 327, 440, 162, 2240, 269, 1937, 1374, 3461, 968, 3043, 56, 1396, 3090, # 6038
258
+ 2106, 3288, 3354, 7713, 1926, 2158, 4467, 2998, 7714, 3564, 7715, 7716, 3677, 4468, 2478, 7717, # 6054
259
+ 2791, 7718, 1650, 4469, 7719, 2603, 7720, 7721, 3983, 2661, 3355, 1149, 3356, 3984, 3805, 3985, # 6070
260
+ 7722, 1076, 49, 7723, 951, 3211, 3289, 3290, 450, 2837, 920, 7724, 1811, 2792, 2366, 4184, # 6086
261
+ 1908, 1138, 2367, 3806, 3462, 7725, 3212, 4470, 1909, 1147, 1518, 2423, 4471, 3807, 7726, 4472, # 6102
262
+ 2388, 2604, 260, 1795, 3213, 7727, 7728, 3808, 3291, 708, 7729, 3565, 1704, 7730, 3566, 1351, # 6118
263
+ 1618, 3357, 2999, 1886, 944, 4185, 3358, 4186, 3044, 3359, 4187, 7731, 3678, 422, 413, 1714, # 6134
264
+ 3292, 500, 2058, 2345, 4188, 2479, 7732, 1344, 1910, 954, 7733, 1668, 7734, 7735, 3986, 2404, # 6150
265
+ 4189, 3567, 3809, 4190, 7736, 2302, 1318, 2505, 3091, 133, 3092, 2873, 4473, 629, 31, 2838, # 6166
266
+ 2697, 3810, 4474, 850, 949, 4475, 3987, 2955, 1732, 2088, 4191, 1496, 1852, 7737, 3988, 620, # 6182
267
+ 3214, 981, 1242, 3679, 3360, 1619, 3680, 1643, 3293, 2139, 2452, 1970, 1719, 3463, 2168, 7738, # 6198
268
+ 3215, 7739, 7740, 3361, 1828, 7741, 1277, 4476, 1565, 2047, 7742, 1636, 3568, 3093, 7743, 869, # 6214
269
+ 2839, 655, 3811, 3812, 3094, 3989, 3000, 3813, 1310, 3569, 4477, 7744, 7745, 7746, 1733, 558, # 6230
270
+ 4478, 3681, 335, 1549, 3045, 1756, 4192, 3682, 1945, 3464, 1829, 1291, 1192, 470, 2726, 2107, # 6246
271
+ 2793, 913, 1054, 3990, 7747, 1027, 7748, 3046, 3991, 4479, 982, 2662, 3362, 3148, 3465, 3216, # 6262
272
+ 3217, 1946, 2794, 7749, 571, 4480, 7750, 1830, 7751, 3570, 2583, 1523, 2424, 7752, 2089, 984, # 6278
273
+ 4481, 3683, 1959, 7753, 3684, 852, 923, 2795, 3466, 3685, 969, 1519, 999, 2048, 2320, 1705, # 6294
274
+ 7754, 3095, 615, 1662, 151, 597, 3992, 2405, 2321, 1049, 275, 4482, 3686, 4193, 568, 3687, # 6310
275
+ 3571, 2480, 4194, 3688, 7755, 2425, 2270, 409, 3218, 7756, 1566, 2874, 3467, 1002, 769, 2840, # 6326
276
+ 194, 2090, 3149, 3689, 2222, 3294, 4195, 628, 1505, 7757, 7758, 1763, 2177, 3001, 3993, 521, # 6342
277
+ 1161, 2584, 1787, 2203, 2406, 4483, 3994, 1625, 4196, 4197, 412, 42, 3096, 464, 7759, 2632, # 6358
278
+ 4484, 3363, 1760, 1571, 2875, 3468, 2530, 1219, 2204, 3814, 2633, 2140, 2368, 4485, 4486, 3295, # 6374
279
+ 1651, 3364, 3572, 7760, 7761, 3573, 2481, 3469, 7762, 3690, 7763, 7764, 2271, 2091, 460, 7765, # 6390
280
+ 4487, 7766, 3002, 962, 588, 3574, 289, 3219, 2634, 1116, 52, 7767, 3047, 1796, 7768, 7769, # 6406
281
+ 7770, 1467, 7771, 1598, 1143, 3691, 4198, 1984, 1734, 1067, 4488, 1280, 3365, 465, 4489, 1572, # 6422
282
+ 510, 7772, 1927, 2241, 1812, 1644, 3575, 7773, 4490, 3692, 7774, 7775, 2663, 1573, 1534, 7776, # 6438
283
+ 7777, 4199, 536, 1807, 1761, 3470, 3815, 3150, 2635, 7778, 7779, 7780, 4491, 3471, 2915, 1911, # 6454
284
+ 2796, 7781, 3296, 1122, 377, 3220, 7782, 360, 7783, 7784, 4200, 1529, 551, 7785, 2059, 3693, # 6470
285
+ 1769, 2426, 7786, 2916, 4201, 3297, 3097, 2322, 2108, 2030, 4492, 1404, 136, 1468, 1479, 672, # 6486
286
+ 1171, 3221, 2303, 271, 3151, 7787, 2762, 7788, 2049, 678, 2727, 865, 1947, 4493, 7789, 2013, # 6502
287
+ 3995, 2956, 7790, 2728, 2223, 1397, 3048, 3694, 4494, 4495, 1735, 2917, 3366, 3576, 7791, 3816, # 6518
288
+ 509, 2841, 2453, 2876, 3817, 7792, 7793, 3152, 3153, 4496, 4202, 2531, 4497, 2304, 1166, 1010, # 6534
289
+ 552, 681, 1887, 7794, 7795, 2957, 2958, 3996, 1287, 1596, 1861, 3154, 358, 453, 736, 175, # 6550
290
+ 478, 1117, 905, 1167, 1097, 7796, 1853, 1530, 7797, 1706, 7798, 2178, 3472, 2287, 3695, 3473, # 6566
291
+ 3577, 4203, 2092, 4204, 7799, 3367, 1193, 2482, 4205, 1458, 2190, 2205, 1862, 1888, 1421, 3298, # 6582
292
+ 2918, 3049, 2179, 3474, 595, 2122, 7800, 3997, 7801, 7802, 4206, 1707, 2636, 223, 3696, 1359, # 6598
293
+ 751, 3098, 183, 3475, 7803, 2797, 3003, 419, 2369, 633, 704, 3818, 2389, 241, 7804, 7805, # 6614
294
+ 7806, 838, 3004, 3697, 2272, 2763, 2454, 3819, 1938, 2050, 3998, 1309, 3099, 2242, 1181, 7807, # 6630
295
+ 1136, 2206, 3820, 2370, 1446, 4207, 2305, 4498, 7808, 7809, 4208, 1055, 2605, 484, 3698, 7810, # 6646
296
+ 3999, 625, 4209, 2273, 3368, 1499, 4210, 4000, 7811, 4001, 4211, 3222, 2274, 2275, 3476, 7812, # 6662
297
+ 7813, 2764, 808, 2606, 3699, 3369, 4002, 4212, 3100, 2532, 526, 3370, 3821, 4213, 955, 7814, # 6678
298
+ 1620, 4214, 2637, 2427, 7815, 1429, 3700, 1669, 1831, 994, 928, 7816, 3578, 1260, 7817, 7818, # 6694
299
+ 7819, 1948, 2288, 741, 2919, 1626, 4215, 2729, 2455, 867, 1184, 362, 3371, 1392, 7820, 7821, # 6710
300
+ 4003, 4216, 1770, 1736, 3223, 2920, 4499, 4500, 1928, 2698, 1459, 1158, 7822, 3050, 3372, 2877, # 6726
301
+ 1292, 1929, 2506, 2842, 3701, 1985, 1187, 2071, 2014, 2607, 4217, 7823, 2566, 2507, 2169, 3702, # 6742
302
+ 2483, 3299, 7824, 3703, 4501, 7825, 7826, 666, 1003, 3005, 1022, 3579, 4218, 7827, 4502, 1813, # 6758
303
+ 2253, 574, 3822, 1603, 295, 1535, 705, 3823, 4219, 283, 858, 417, 7828, 7829, 3224, 4503, # 6774
304
+ 4504, 3051, 1220, 1889, 1046, 2276, 2456, 4004, 1393, 1599, 689, 2567, 388, 4220, 7830, 2484, # 6790
305
+ 802, 7831, 2798, 3824, 2060, 1405, 2254, 7832, 4505, 3825, 2109, 1052, 1345, 3225, 1585, 7833, # 6806
306
+ 809, 7834, 7835, 7836, 575, 2730, 3477, 956, 1552, 1469, 1144, 2323, 7837, 2324, 1560, 2457, # 6822
307
+ 3580, 3226, 4005, 616, 2207, 3155, 2180, 2289, 7838, 1832, 7839, 3478, 4506, 7840, 1319, 3704, # 6838
308
+ 3705, 1211, 3581, 1023, 3227, 1293, 2799, 7841, 7842, 7843, 3826, 607, 2306, 3827, 762, 2878, # 6854
309
+ 1439, 4221, 1360, 7844, 1485, 3052, 7845, 4507, 1038, 4222, 1450, 2061, 2638, 4223, 1379, 4508, # 6870
310
+ 2585, 7846, 7847, 4224, 1352, 1414, 2325, 2921, 1172, 7848, 7849, 3828, 3829, 7850, 1797, 1451, # 6886
311
+ 7851, 7852, 7853, 7854, 2922, 4006, 4007, 2485, 2346, 411, 4008, 4009, 3582, 3300, 3101, 4509, # 6902
312
+ 1561, 2664, 1452, 4010, 1375, 7855, 7856, 47, 2959, 316, 7857, 1406, 1591, 2923, 3156, 7858, # 6918
313
+ 1025, 2141, 3102, 3157, 354, 2731, 884, 2224, 4225, 2407, 508, 3706, 726, 3583, 996, 2428, # 6934
314
+ 3584, 729, 7859, 392, 2191, 1453, 4011, 4510, 3707, 7860, 7861, 2458, 3585, 2608, 1675, 2800, # 6950
315
+ 919, 2347, 2960, 2348, 1270, 4511, 4012, 73, 7862, 7863, 647, 7864, 3228, 2843, 2255, 1550, # 6966
316
+ 1346, 3006, 7865, 1332, 883, 3479, 7866, 7867, 7868, 7869, 3301, 2765, 7870, 1212, 831, 1347, # 6982
317
+ 4226, 4512, 2326, 3830, 1863, 3053, 720, 3831, 4513, 4514, 3832, 7871, 4227, 7872, 7873, 4515, # 6998
318
+ 7874, 7875, 1798, 4516, 3708, 2609, 4517, 3586, 1645, 2371, 7876, 7877, 2924, 669, 2208, 2665, # 7014
319
+ 2429, 7878, 2879, 7879, 7880, 1028, 3229, 7881, 4228, 2408, 7882, 2256, 1353, 7883, 7884, 4518, # 7030
320
+ 3158, 518, 7885, 4013, 7886, 4229, 1960, 7887, 2142, 4230, 7888, 7889, 3007, 2349, 2350, 3833, # 7046
321
+ 516, 1833, 1454, 4014, 2699, 4231, 4519, 2225, 2610, 1971, 1129, 3587, 7890, 2766, 7891, 2961, # 7062
322
+ 1422, 577, 1470, 3008, 1524, 3373, 7892, 7893, 432, 4232, 3054, 3480, 7894, 2586, 1455, 2508, # 7078
323
+ 2226, 1972, 1175, 7895, 1020, 2732, 4015, 3481, 4520, 7896, 2733, 7897, 1743, 1361, 3055, 3482, # 7094
324
+ 2639, 4016, 4233, 4521, 2290, 895, 924, 4234, 2170, 331, 2243, 3056, 166, 1627, 3057, 1098, # 7110
325
+ 7898, 1232, 2880, 2227, 3374, 4522, 657, 403, 1196, 2372, 542, 3709, 3375, 1600, 4235, 3483, # 7126
326
+ 7899, 4523, 2767, 3230, 576, 530, 1362, 7900, 4524, 2533, 2666, 3710, 4017, 7901, 842, 3834, # 7142
327
+ 7902, 2801, 2031, 1014, 4018, 213, 2700, 3376, 665, 621, 4236, 7903, 3711, 2925, 2430, 7904, # 7158
328
+ 2431, 3302, 3588, 3377, 7905, 4237, 2534, 4238, 4525, 3589, 1682, 4239, 3484, 1380, 7906, 724, # 7174
329
+ 2277, 600, 1670, 7907, 1337, 1233, 4526, 3103, 2244, 7908, 1621, 4527, 7909, 651, 4240, 7910, # 7190
330
+ 1612, 4241, 2611, 7911, 2844, 7912, 2734, 2307, 3058, 7913, 716, 2459, 3059, 174, 1255, 2701, # 7206
331
+ 4019, 3590, 548, 1320, 1398, 728, 4020, 1574, 7914, 1890, 1197, 3060, 4021, 7915, 3061, 3062, # 7222
332
+ 3712, 3591, 3713, 747, 7916, 635, 4242, 4528, 7917, 7918, 7919, 4243, 7920, 7921, 4529, 7922, # 7238
333
+ 3378, 4530, 2432, 451, 7923, 3714, 2535, 2072, 4244, 2735, 4245, 4022, 7924, 1764, 4531, 7925, # 7254
334
+ 4246, 350, 7926, 2278, 2390, 2486, 7927, 4247, 4023, 2245, 1434, 4024, 488, 4532, 458, 4248, # 7270
335
+ 4025, 3715, 771, 1330, 2391, 3835, 2568, 3159, 2159, 2409, 1553, 2667, 3160, 4249, 7928, 2487, # 7286
336
+ 2881, 2612, 1720, 2702, 4250, 3379, 4533, 7929, 2536, 4251, 7930, 3231, 4252, 2768, 7931, 2015, # 7302
337
+ 2736, 7932, 1155, 1017, 3716, 3836, 7933, 3303, 2308, 201, 1864, 4253, 1430, 7934, 4026, 7935, # 7318
338
+ 7936, 7937, 7938, 7939, 4254, 1604, 7940, 414, 1865, 371, 2587, 4534, 4535, 3485, 2016, 3104, # 7334
339
+ 4536, 1708, 960, 4255, 887, 389, 2171, 1536, 1663, 1721, 7941, 2228, 4027, 2351, 2926, 1580, # 7350
340
+ 7942, 7943, 7944, 1744, 7945, 2537, 4537, 4538, 7946, 4539, 7947, 2073, 7948, 7949, 3592, 3380, # 7366
341
+ 2882, 4256, 7950, 4257, 2640, 3381, 2802, 673, 2703, 2460, 709, 3486, 4028, 3593, 4258, 7951, # 7382
342
+ 1148, 502, 634, 7952, 7953, 1204, 4540, 3594, 1575, 4541, 2613, 3717, 7954, 3718, 3105, 948, # 7398
343
+ 3232, 121, 1745, 3837, 1110, 7955, 4259, 3063, 2509, 3009, 4029, 3719, 1151, 1771, 3838, 1488, # 7414
344
+ 4030, 1986, 7956, 2433, 3487, 7957, 7958, 2093, 7959, 4260, 3839, 1213, 1407, 2803, 531, 2737, # 7430
345
+ 2538, 3233, 1011, 1537, 7960, 2769, 4261, 3106, 1061, 7961, 3720, 3721, 1866, 2883, 7962, 2017, # 7446
346
+ 120, 4262, 4263, 2062, 3595, 3234, 2309, 3840, 2668, 3382, 1954, 4542, 7963, 7964, 3488, 1047, # 7462
347
+ 2704, 1266, 7965, 1368, 4543, 2845, 649, 3383, 3841, 2539, 2738, 1102, 2846, 2669, 7966, 7967, # 7478
348
+ 1999, 7968, 1111, 3596, 2962, 7969, 2488, 3842, 3597, 2804, 1854, 3384, 3722, 7970, 7971, 3385, # 7494
349
+ 2410, 2884, 3304, 3235, 3598, 7972, 2569, 7973, 3599, 2805, 4031, 1460, 856, 7974, 3600, 7975, # 7510
350
+ 2885, 2963, 7976, 2886, 3843, 7977, 4264, 632, 2510, 875, 3844, 1697, 3845, 2291, 7978, 7979, # 7526
351
+ 4544, 3010, 1239, 580, 4545, 4265, 7980, 914, 936, 2074, 1190, 4032, 1039, 2123, 7981, 7982, # 7542
352
+ 7983, 3386, 1473, 7984, 1354, 4266, 3846, 7985, 2172, 3064, 4033, 915, 3305, 4267, 4268, 3306, # 7558
353
+ 1605, 1834, 7986, 2739, 398, 3601, 4269, 3847, 4034, 328, 1912, 2847, 4035, 3848, 1331, 4270, # 7574
354
+ 3011, 937, 4271, 7987, 3602, 4036, 4037, 3387, 2160, 4546, 3388, 524, 742, 538, 3065, 1012, # 7590
355
+ 7988, 7989, 3849, 2461, 7990, 658, 1103, 225, 3850, 7991, 7992, 4547, 7993, 4548, 7994, 3236, # 7606
356
+ 1243, 7995, 4038, 963, 2246, 4549, 7996, 2705, 3603, 3161, 7997, 7998, 2588, 2327, 7999, 4550, # 7622
357
+ 8000, 8001, 8002, 3489, 3307, 957, 3389, 2540, 2032, 1930, 2927, 2462, 870, 2018, 3604, 1746, # 7638
358
+ 2770, 2771, 2434, 2463, 8003, 3851, 8004, 3723, 3107, 3724, 3490, 3390, 3725, 8005, 1179, 3066, # 7654
359
+ 8006, 3162, 2373, 4272, 3726, 2541, 3163, 3108, 2740, 4039, 8007, 3391, 1556, 2542, 2292, 977, # 7670
360
+ 2887, 2033, 4040, 1205, 3392, 8008, 1765, 3393, 3164, 2124, 1271, 1689, 714, 4551, 3491, 8009, # 7686
361
+ 2328, 3852, 533, 4273, 3605, 2181, 617, 8010, 2464, 3308, 3492, 2310, 8011, 8012, 3165, 8013, # 7702
362
+ 8014, 3853, 1987, 618, 427, 2641, 3493, 3394, 8015, 8016, 1244, 1690, 8017, 2806, 4274, 4552, # 7718
363
+ 8018, 3494, 8019, 8020, 2279, 1576, 473, 3606, 4275, 3395, 972, 8021, 3607, 8022, 3067, 8023, # 7734
364
+ 8024, 4553, 4554, 8025, 3727, 4041, 4042, 8026, 153, 4555, 356, 8027, 1891, 2888, 4276, 2143, # 7750
365
+ 408, 803, 2352, 8028, 3854, 8029, 4277, 1646, 2570, 2511, 4556, 4557, 3855, 8030, 3856, 4278, # 7766
366
+ 8031, 2411, 3396, 752, 8032, 8033, 1961, 2964, 8034, 746, 3012, 2465, 8035, 4279, 3728, 698, # 7782
367
+ 4558, 1892, 4280, 3608, 2543, 4559, 3609, 3857, 8036, 3166, 3397, 8037, 1823, 1302, 4043, 2706, # 7798
368
+ 3858, 1973, 4281, 8038, 4282, 3167, 823, 1303, 1288, 1236, 2848, 3495, 4044, 3398, 774, 3859, # 7814
369
+ 8039, 1581, 4560, 1304, 2849, 3860, 4561, 8040, 2435, 2161, 1083, 3237, 4283, 4045, 4284, 344, # 7830
370
+ 1173, 288, 2311, 454, 1683, 8041, 8042, 1461, 4562, 4046, 2589, 8043, 8044, 4563, 985, 894, # 7846
371
+ 8045, 3399, 3168, 8046, 1913, 2928, 3729, 1988, 8047, 2110, 1974, 8048, 4047, 8049, 2571, 1194, # 7862
372
+ 425, 8050, 4564, 3169, 1245, 3730, 4285, 8051, 8052, 2850, 8053, 636, 4565, 1855, 3861, 760, # 7878
373
+ 1799, 8054, 4286, 2209, 1508, 4566, 4048, 1893, 1684, 2293, 8055, 8056, 8057, 4287, 4288, 2210, # 7894
374
+ 479, 8058, 8059, 832, 8060, 4049, 2489, 8061, 2965, 2490, 3731, 990, 3109, 627, 1814, 2642, # 7910
375
+ 4289, 1582, 4290, 2125, 2111, 3496, 4567, 8062, 799, 4291, 3170, 8063, 4568, 2112, 1737, 3013, # 7926
376
+ 1018, 543, 754, 4292, 3309, 1676, 4569, 4570, 4050, 8064, 1489, 8065, 3497, 8066, 2614, 2889, # 7942
377
+ 4051, 8067, 8068, 2966, 8069, 8070, 8071, 8072, 3171, 4571, 4572, 2182, 1722, 8073, 3238, 3239, # 7958
378
+ 1842, 3610, 1715, 481, 365, 1975, 1856, 8074, 8075, 1962, 2491, 4573, 8076, 2126, 3611, 3240, # 7974
379
+ 433, 1894, 2063, 2075, 8077, 602, 2741, 8078, 8079, 8080, 8081, 8082, 3014, 1628, 3400, 8083, # 7990
380
+ 3172, 4574, 4052, 2890, 4575, 2512, 8084, 2544, 2772, 8085, 8086, 8087, 3310, 4576, 2891, 8088, # 8006
381
+ 4577, 8089, 2851, 4578, 4579, 1221, 2967, 4053, 2513, 8090, 8091, 8092, 1867, 1989, 8093, 8094, # 8022
382
+ 8095, 1895, 8096, 8097, 4580, 1896, 4054, 318, 8098, 2094, 4055, 4293, 8099, 8100, 485, 8101, # 8038
383
+ 938, 3862, 553, 2670, 116, 8102, 3863, 3612, 8103, 3498, 2671, 2773, 3401, 3311, 2807, 8104, # 8054
384
+ 3613, 2929, 4056, 1747, 2930, 2968, 8105, 8106, 207, 8107, 8108, 2672, 4581, 2514, 8109, 3015, # 8070
385
+ 890, 3614, 3864, 8110, 1877, 3732, 3402, 8111, 2183, 2353, 3403, 1652, 8112, 8113, 8114, 941, # 8086
386
+ 2294, 208, 3499, 4057, 2019, 330, 4294, 3865, 2892, 2492, 3733, 4295, 8115, 8116, 8117, 8118, # 8102
387
+ )
388
+ # fmt: on
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/euctwprober.py ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from .chardistribution import EUCTWDistributionAnalysis
29
+ from .codingstatemachine import CodingStateMachine
30
+ from .mbcharsetprober import MultiByteCharSetProber
31
+ from .mbcssm import EUCTW_SM_MODEL
32
+
33
+
34
+ class EUCTWProber(MultiByteCharSetProber):
35
+ def __init__(self) -> None:
36
+ super().__init__()
37
+ self.coding_sm = CodingStateMachine(EUCTW_SM_MODEL)
38
+ self.distribution_analyzer = EUCTWDistributionAnalysis()
39
+ self.reset()
40
+
41
+ @property
42
+ def charset_name(self) -> str:
43
+ return "EUC-TW"
44
+
45
+ @property
46
+ def language(self) -> str:
47
+ return "Taiwan"
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/gb2312prober.py ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from .chardistribution import GB2312DistributionAnalysis
29
+ from .codingstatemachine import CodingStateMachine
30
+ from .mbcharsetprober import MultiByteCharSetProber
31
+ from .mbcssm import GB2312_SM_MODEL
32
+
33
+
34
+ class GB2312Prober(MultiByteCharSetProber):
35
+ def __init__(self) -> None:
36
+ super().__init__()
37
+ self.coding_sm = CodingStateMachine(GB2312_SM_MODEL)
38
+ self.distribution_analyzer = GB2312DistributionAnalysis()
39
+ self.reset()
40
+
41
+ @property
42
+ def charset_name(self) -> str:
43
+ return "GB2312"
44
+
45
+ @property
46
+ def language(self) -> str:
47
+ return "Chinese"
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/johabfreq.py ADDED
@@ -0,0 +1,2382 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Communicator client code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ # The frequency data itself is the same as euc-kr.
29
+ # This is just a mapping table to euc-kr.
30
+
31
+ JOHAB_TO_EUCKR_ORDER_TABLE = {
32
+ 0x8861: 0,
33
+ 0x8862: 1,
34
+ 0x8865: 2,
35
+ 0x8868: 3,
36
+ 0x8869: 4,
37
+ 0x886A: 5,
38
+ 0x886B: 6,
39
+ 0x8871: 7,
40
+ 0x8873: 8,
41
+ 0x8874: 9,
42
+ 0x8875: 10,
43
+ 0x8876: 11,
44
+ 0x8877: 12,
45
+ 0x8878: 13,
46
+ 0x8879: 14,
47
+ 0x887B: 15,
48
+ 0x887C: 16,
49
+ 0x887D: 17,
50
+ 0x8881: 18,
51
+ 0x8882: 19,
52
+ 0x8885: 20,
53
+ 0x8889: 21,
54
+ 0x8891: 22,
55
+ 0x8893: 23,
56
+ 0x8895: 24,
57
+ 0x8896: 25,
58
+ 0x8897: 26,
59
+ 0x88A1: 27,
60
+ 0x88A2: 28,
61
+ 0x88A5: 29,
62
+ 0x88A9: 30,
63
+ 0x88B5: 31,
64
+ 0x88B7: 32,
65
+ 0x88C1: 33,
66
+ 0x88C5: 34,
67
+ 0x88C9: 35,
68
+ 0x88E1: 36,
69
+ 0x88E2: 37,
70
+ 0x88E5: 38,
71
+ 0x88E8: 39,
72
+ 0x88E9: 40,
73
+ 0x88EB: 41,
74
+ 0x88F1: 42,
75
+ 0x88F3: 43,
76
+ 0x88F5: 44,
77
+ 0x88F6: 45,
78
+ 0x88F7: 46,
79
+ 0x88F8: 47,
80
+ 0x88FB: 48,
81
+ 0x88FC: 49,
82
+ 0x88FD: 50,
83
+ 0x8941: 51,
84
+ 0x8945: 52,
85
+ 0x8949: 53,
86
+ 0x8951: 54,
87
+ 0x8953: 55,
88
+ 0x8955: 56,
89
+ 0x8956: 57,
90
+ 0x8957: 58,
91
+ 0x8961: 59,
92
+ 0x8962: 60,
93
+ 0x8963: 61,
94
+ 0x8965: 62,
95
+ 0x8968: 63,
96
+ 0x8969: 64,
97
+ 0x8971: 65,
98
+ 0x8973: 66,
99
+ 0x8975: 67,
100
+ 0x8976: 68,
101
+ 0x8977: 69,
102
+ 0x897B: 70,
103
+ 0x8981: 71,
104
+ 0x8985: 72,
105
+ 0x8989: 73,
106
+ 0x8993: 74,
107
+ 0x8995: 75,
108
+ 0x89A1: 76,
109
+ 0x89A2: 77,
110
+ 0x89A5: 78,
111
+ 0x89A8: 79,
112
+ 0x89A9: 80,
113
+ 0x89AB: 81,
114
+ 0x89AD: 82,
115
+ 0x89B0: 83,
116
+ 0x89B1: 84,
117
+ 0x89B3: 85,
118
+ 0x89B5: 86,
119
+ 0x89B7: 87,
120
+ 0x89B8: 88,
121
+ 0x89C1: 89,
122
+ 0x89C2: 90,
123
+ 0x89C5: 91,
124
+ 0x89C9: 92,
125
+ 0x89CB: 93,
126
+ 0x89D1: 94,
127
+ 0x89D3: 95,
128
+ 0x89D5: 96,
129
+ 0x89D7: 97,
130
+ 0x89E1: 98,
131
+ 0x89E5: 99,
132
+ 0x89E9: 100,
133
+ 0x89F3: 101,
134
+ 0x89F6: 102,
135
+ 0x89F7: 103,
136
+ 0x8A41: 104,
137
+ 0x8A42: 105,
138
+ 0x8A45: 106,
139
+ 0x8A49: 107,
140
+ 0x8A51: 108,
141
+ 0x8A53: 109,
142
+ 0x8A55: 110,
143
+ 0x8A57: 111,
144
+ 0x8A61: 112,
145
+ 0x8A65: 113,
146
+ 0x8A69: 114,
147
+ 0x8A73: 115,
148
+ 0x8A75: 116,
149
+ 0x8A81: 117,
150
+ 0x8A82: 118,
151
+ 0x8A85: 119,
152
+ 0x8A88: 120,
153
+ 0x8A89: 121,
154
+ 0x8A8A: 122,
155
+ 0x8A8B: 123,
156
+ 0x8A90: 124,
157
+ 0x8A91: 125,
158
+ 0x8A93: 126,
159
+ 0x8A95: 127,
160
+ 0x8A97: 128,
161
+ 0x8A98: 129,
162
+ 0x8AA1: 130,
163
+ 0x8AA2: 131,
164
+ 0x8AA5: 132,
165
+ 0x8AA9: 133,
166
+ 0x8AB6: 134,
167
+ 0x8AB7: 135,
168
+ 0x8AC1: 136,
169
+ 0x8AD5: 137,
170
+ 0x8AE1: 138,
171
+ 0x8AE2: 139,
172
+ 0x8AE5: 140,
173
+ 0x8AE9: 141,
174
+ 0x8AF1: 142,
175
+ 0x8AF3: 143,
176
+ 0x8AF5: 144,
177
+ 0x8B41: 145,
178
+ 0x8B45: 146,
179
+ 0x8B49: 147,
180
+ 0x8B61: 148,
181
+ 0x8B62: 149,
182
+ 0x8B65: 150,
183
+ 0x8B68: 151,
184
+ 0x8B69: 152,
185
+ 0x8B6A: 153,
186
+ 0x8B71: 154,
187
+ 0x8B73: 155,
188
+ 0x8B75: 156,
189
+ 0x8B77: 157,
190
+ 0x8B81: 158,
191
+ 0x8BA1: 159,
192
+ 0x8BA2: 160,
193
+ 0x8BA5: 161,
194
+ 0x8BA8: 162,
195
+ 0x8BA9: 163,
196
+ 0x8BAB: 164,
197
+ 0x8BB1: 165,
198
+ 0x8BB3: 166,
199
+ 0x8BB5: 167,
200
+ 0x8BB7: 168,
201
+ 0x8BB8: 169,
202
+ 0x8BBC: 170,
203
+ 0x8C61: 171,
204
+ 0x8C62: 172,
205
+ 0x8C63: 173,
206
+ 0x8C65: 174,
207
+ 0x8C69: 175,
208
+ 0x8C6B: 176,
209
+ 0x8C71: 177,
210
+ 0x8C73: 178,
211
+ 0x8C75: 179,
212
+ 0x8C76: 180,
213
+ 0x8C77: 181,
214
+ 0x8C7B: 182,
215
+ 0x8C81: 183,
216
+ 0x8C82: 184,
217
+ 0x8C85: 185,
218
+ 0x8C89: 186,
219
+ 0x8C91: 187,
220
+ 0x8C93: 188,
221
+ 0x8C95: 189,
222
+ 0x8C96: 190,
223
+ 0x8C97: 191,
224
+ 0x8CA1: 192,
225
+ 0x8CA2: 193,
226
+ 0x8CA9: 194,
227
+ 0x8CE1: 195,
228
+ 0x8CE2: 196,
229
+ 0x8CE3: 197,
230
+ 0x8CE5: 198,
231
+ 0x8CE9: 199,
232
+ 0x8CF1: 200,
233
+ 0x8CF3: 201,
234
+ 0x8CF5: 202,
235
+ 0x8CF6: 203,
236
+ 0x8CF7: 204,
237
+ 0x8D41: 205,
238
+ 0x8D42: 206,
239
+ 0x8D45: 207,
240
+ 0x8D51: 208,
241
+ 0x8D55: 209,
242
+ 0x8D57: 210,
243
+ 0x8D61: 211,
244
+ 0x8D65: 212,
245
+ 0x8D69: 213,
246
+ 0x8D75: 214,
247
+ 0x8D76: 215,
248
+ 0x8D7B: 216,
249
+ 0x8D81: 217,
250
+ 0x8DA1: 218,
251
+ 0x8DA2: 219,
252
+ 0x8DA5: 220,
253
+ 0x8DA7: 221,
254
+ 0x8DA9: 222,
255
+ 0x8DB1: 223,
256
+ 0x8DB3: 224,
257
+ 0x8DB5: 225,
258
+ 0x8DB7: 226,
259
+ 0x8DB8: 227,
260
+ 0x8DB9: 228,
261
+ 0x8DC1: 229,
262
+ 0x8DC2: 230,
263
+ 0x8DC9: 231,
264
+ 0x8DD6: 232,
265
+ 0x8DD7: 233,
266
+ 0x8DE1: 234,
267
+ 0x8DE2: 235,
268
+ 0x8DF7: 236,
269
+ 0x8E41: 237,
270
+ 0x8E45: 238,
271
+ 0x8E49: 239,
272
+ 0x8E51: 240,
273
+ 0x8E53: 241,
274
+ 0x8E57: 242,
275
+ 0x8E61: 243,
276
+ 0x8E81: 244,
277
+ 0x8E82: 245,
278
+ 0x8E85: 246,
279
+ 0x8E89: 247,
280
+ 0x8E90: 248,
281
+ 0x8E91: 249,
282
+ 0x8E93: 250,
283
+ 0x8E95: 251,
284
+ 0x8E97: 252,
285
+ 0x8E98: 253,
286
+ 0x8EA1: 254,
287
+ 0x8EA9: 255,
288
+ 0x8EB6: 256,
289
+ 0x8EB7: 257,
290
+ 0x8EC1: 258,
291
+ 0x8EC2: 259,
292
+ 0x8EC5: 260,
293
+ 0x8EC9: 261,
294
+ 0x8ED1: 262,
295
+ 0x8ED3: 263,
296
+ 0x8ED6: 264,
297
+ 0x8EE1: 265,
298
+ 0x8EE5: 266,
299
+ 0x8EE9: 267,
300
+ 0x8EF1: 268,
301
+ 0x8EF3: 269,
302
+ 0x8F41: 270,
303
+ 0x8F61: 271,
304
+ 0x8F62: 272,
305
+ 0x8F65: 273,
306
+ 0x8F67: 274,
307
+ 0x8F69: 275,
308
+ 0x8F6B: 276,
309
+ 0x8F70: 277,
310
+ 0x8F71: 278,
311
+ 0x8F73: 279,
312
+ 0x8F75: 280,
313
+ 0x8F77: 281,
314
+ 0x8F7B: 282,
315
+ 0x8FA1: 283,
316
+ 0x8FA2: 284,
317
+ 0x8FA5: 285,
318
+ 0x8FA9: 286,
319
+ 0x8FB1: 287,
320
+ 0x8FB3: 288,
321
+ 0x8FB5: 289,
322
+ 0x8FB7: 290,
323
+ 0x9061: 291,
324
+ 0x9062: 292,
325
+ 0x9063: 293,
326
+ 0x9065: 294,
327
+ 0x9068: 295,
328
+ 0x9069: 296,
329
+ 0x906A: 297,
330
+ 0x906B: 298,
331
+ 0x9071: 299,
332
+ 0x9073: 300,
333
+ 0x9075: 301,
334
+ 0x9076: 302,
335
+ 0x9077: 303,
336
+ 0x9078: 304,
337
+ 0x9079: 305,
338
+ 0x907B: 306,
339
+ 0x907D: 307,
340
+ 0x9081: 308,
341
+ 0x9082: 309,
342
+ 0x9085: 310,
343
+ 0x9089: 311,
344
+ 0x9091: 312,
345
+ 0x9093: 313,
346
+ 0x9095: 314,
347
+ 0x9096: 315,
348
+ 0x9097: 316,
349
+ 0x90A1: 317,
350
+ 0x90A2: 318,
351
+ 0x90A5: 319,
352
+ 0x90A9: 320,
353
+ 0x90B1: 321,
354
+ 0x90B7: 322,
355
+ 0x90E1: 323,
356
+ 0x90E2: 324,
357
+ 0x90E4: 325,
358
+ 0x90E5: 326,
359
+ 0x90E9: 327,
360
+ 0x90EB: 328,
361
+ 0x90EC: 329,
362
+ 0x90F1: 330,
363
+ 0x90F3: 331,
364
+ 0x90F5: 332,
365
+ 0x90F6: 333,
366
+ 0x90F7: 334,
367
+ 0x90FD: 335,
368
+ 0x9141: 336,
369
+ 0x9142: 337,
370
+ 0x9145: 338,
371
+ 0x9149: 339,
372
+ 0x9151: 340,
373
+ 0x9153: 341,
374
+ 0x9155: 342,
375
+ 0x9156: 343,
376
+ 0x9157: 344,
377
+ 0x9161: 345,
378
+ 0x9162: 346,
379
+ 0x9165: 347,
380
+ 0x9169: 348,
381
+ 0x9171: 349,
382
+ 0x9173: 350,
383
+ 0x9176: 351,
384
+ 0x9177: 352,
385
+ 0x917A: 353,
386
+ 0x9181: 354,
387
+ 0x9185: 355,
388
+ 0x91A1: 356,
389
+ 0x91A2: 357,
390
+ 0x91A5: 358,
391
+ 0x91A9: 359,
392
+ 0x91AB: 360,
393
+ 0x91B1: 361,
394
+ 0x91B3: 362,
395
+ 0x91B5: 363,
396
+ 0x91B7: 364,
397
+ 0x91BC: 365,
398
+ 0x91BD: 366,
399
+ 0x91C1: 367,
400
+ 0x91C5: 368,
401
+ 0x91C9: 369,
402
+ 0x91D6: 370,
403
+ 0x9241: 371,
404
+ 0x9245: 372,
405
+ 0x9249: 373,
406
+ 0x9251: 374,
407
+ 0x9253: 375,
408
+ 0x9255: 376,
409
+ 0x9261: 377,
410
+ 0x9262: 378,
411
+ 0x9265: 379,
412
+ 0x9269: 380,
413
+ 0x9273: 381,
414
+ 0x9275: 382,
415
+ 0x9277: 383,
416
+ 0x9281: 384,
417
+ 0x9282: 385,
418
+ 0x9285: 386,
419
+ 0x9288: 387,
420
+ 0x9289: 388,
421
+ 0x9291: 389,
422
+ 0x9293: 390,
423
+ 0x9295: 391,
424
+ 0x9297: 392,
425
+ 0x92A1: 393,
426
+ 0x92B6: 394,
427
+ 0x92C1: 395,
428
+ 0x92E1: 396,
429
+ 0x92E5: 397,
430
+ 0x92E9: 398,
431
+ 0x92F1: 399,
432
+ 0x92F3: 400,
433
+ 0x9341: 401,
434
+ 0x9342: 402,
435
+ 0x9349: 403,
436
+ 0x9351: 404,
437
+ 0x9353: 405,
438
+ 0x9357: 406,
439
+ 0x9361: 407,
440
+ 0x9362: 408,
441
+ 0x9365: 409,
442
+ 0x9369: 410,
443
+ 0x936A: 411,
444
+ 0x936B: 412,
445
+ 0x9371: 413,
446
+ 0x9373: 414,
447
+ 0x9375: 415,
448
+ 0x9377: 416,
449
+ 0x9378: 417,
450
+ 0x937C: 418,
451
+ 0x9381: 419,
452
+ 0x9385: 420,
453
+ 0x9389: 421,
454
+ 0x93A1: 422,
455
+ 0x93A2: 423,
456
+ 0x93A5: 424,
457
+ 0x93A9: 425,
458
+ 0x93AB: 426,
459
+ 0x93B1: 427,
460
+ 0x93B3: 428,
461
+ 0x93B5: 429,
462
+ 0x93B7: 430,
463
+ 0x93BC: 431,
464
+ 0x9461: 432,
465
+ 0x9462: 433,
466
+ 0x9463: 434,
467
+ 0x9465: 435,
468
+ 0x9468: 436,
469
+ 0x9469: 437,
470
+ 0x946A: 438,
471
+ 0x946B: 439,
472
+ 0x946C: 440,
473
+ 0x9470: 441,
474
+ 0x9471: 442,
475
+ 0x9473: 443,
476
+ 0x9475: 444,
477
+ 0x9476: 445,
478
+ 0x9477: 446,
479
+ 0x9478: 447,
480
+ 0x9479: 448,
481
+ 0x947D: 449,
482
+ 0x9481: 450,
483
+ 0x9482: 451,
484
+ 0x9485: 452,
485
+ 0x9489: 453,
486
+ 0x9491: 454,
487
+ 0x9493: 455,
488
+ 0x9495: 456,
489
+ 0x9496: 457,
490
+ 0x9497: 458,
491
+ 0x94A1: 459,
492
+ 0x94E1: 460,
493
+ 0x94E2: 461,
494
+ 0x94E3: 462,
495
+ 0x94E5: 463,
496
+ 0x94E8: 464,
497
+ 0x94E9: 465,
498
+ 0x94EB: 466,
499
+ 0x94EC: 467,
500
+ 0x94F1: 468,
501
+ 0x94F3: 469,
502
+ 0x94F5: 470,
503
+ 0x94F7: 471,
504
+ 0x94F9: 472,
505
+ 0x94FC: 473,
506
+ 0x9541: 474,
507
+ 0x9542: 475,
508
+ 0x9545: 476,
509
+ 0x9549: 477,
510
+ 0x9551: 478,
511
+ 0x9553: 479,
512
+ 0x9555: 480,
513
+ 0x9556: 481,
514
+ 0x9557: 482,
515
+ 0x9561: 483,
516
+ 0x9565: 484,
517
+ 0x9569: 485,
518
+ 0x9576: 486,
519
+ 0x9577: 487,
520
+ 0x9581: 488,
521
+ 0x9585: 489,
522
+ 0x95A1: 490,
523
+ 0x95A2: 491,
524
+ 0x95A5: 492,
525
+ 0x95A8: 493,
526
+ 0x95A9: 494,
527
+ 0x95AB: 495,
528
+ 0x95AD: 496,
529
+ 0x95B1: 497,
530
+ 0x95B3: 498,
531
+ 0x95B5: 499,
532
+ 0x95B7: 500,
533
+ 0x95B9: 501,
534
+ 0x95BB: 502,
535
+ 0x95C1: 503,
536
+ 0x95C5: 504,
537
+ 0x95C9: 505,
538
+ 0x95E1: 506,
539
+ 0x95F6: 507,
540
+ 0x9641: 508,
541
+ 0x9645: 509,
542
+ 0x9649: 510,
543
+ 0x9651: 511,
544
+ 0x9653: 512,
545
+ 0x9655: 513,
546
+ 0x9661: 514,
547
+ 0x9681: 515,
548
+ 0x9682: 516,
549
+ 0x9685: 517,
550
+ 0x9689: 518,
551
+ 0x9691: 519,
552
+ 0x9693: 520,
553
+ 0x9695: 521,
554
+ 0x9697: 522,
555
+ 0x96A1: 523,
556
+ 0x96B6: 524,
557
+ 0x96C1: 525,
558
+ 0x96D7: 526,
559
+ 0x96E1: 527,
560
+ 0x96E5: 528,
561
+ 0x96E9: 529,
562
+ 0x96F3: 530,
563
+ 0x96F5: 531,
564
+ 0x96F7: 532,
565
+ 0x9741: 533,
566
+ 0x9745: 534,
567
+ 0x9749: 535,
568
+ 0x9751: 536,
569
+ 0x9757: 537,
570
+ 0x9761: 538,
571
+ 0x9762: 539,
572
+ 0x9765: 540,
573
+ 0x9768: 541,
574
+ 0x9769: 542,
575
+ 0x976B: 543,
576
+ 0x9771: 544,
577
+ 0x9773: 545,
578
+ 0x9775: 546,
579
+ 0x9777: 547,
580
+ 0x9781: 548,
581
+ 0x97A1: 549,
582
+ 0x97A2: 550,
583
+ 0x97A5: 551,
584
+ 0x97A8: 552,
585
+ 0x97A9: 553,
586
+ 0x97B1: 554,
587
+ 0x97B3: 555,
588
+ 0x97B5: 556,
589
+ 0x97B6: 557,
590
+ 0x97B7: 558,
591
+ 0x97B8: 559,
592
+ 0x9861: 560,
593
+ 0x9862: 561,
594
+ 0x9865: 562,
595
+ 0x9869: 563,
596
+ 0x9871: 564,
597
+ 0x9873: 565,
598
+ 0x9875: 566,
599
+ 0x9876: 567,
600
+ 0x9877: 568,
601
+ 0x987D: 569,
602
+ 0x9881: 570,
603
+ 0x9882: 571,
604
+ 0x9885: 572,
605
+ 0x9889: 573,
606
+ 0x9891: 574,
607
+ 0x9893: 575,
608
+ 0x9895: 576,
609
+ 0x9896: 577,
610
+ 0x9897: 578,
611
+ 0x98E1: 579,
612
+ 0x98E2: 580,
613
+ 0x98E5: 581,
614
+ 0x98E9: 582,
615
+ 0x98EB: 583,
616
+ 0x98EC: 584,
617
+ 0x98F1: 585,
618
+ 0x98F3: 586,
619
+ 0x98F5: 587,
620
+ 0x98F6: 588,
621
+ 0x98F7: 589,
622
+ 0x98FD: 590,
623
+ 0x9941: 591,
624
+ 0x9942: 592,
625
+ 0x9945: 593,
626
+ 0x9949: 594,
627
+ 0x9951: 595,
628
+ 0x9953: 596,
629
+ 0x9955: 597,
630
+ 0x9956: 598,
631
+ 0x9957: 599,
632
+ 0x9961: 600,
633
+ 0x9976: 601,
634
+ 0x99A1: 602,
635
+ 0x99A2: 603,
636
+ 0x99A5: 604,
637
+ 0x99A9: 605,
638
+ 0x99B7: 606,
639
+ 0x99C1: 607,
640
+ 0x99C9: 608,
641
+ 0x99E1: 609,
642
+ 0x9A41: 610,
643
+ 0x9A45: 611,
644
+ 0x9A81: 612,
645
+ 0x9A82: 613,
646
+ 0x9A85: 614,
647
+ 0x9A89: 615,
648
+ 0x9A90: 616,
649
+ 0x9A91: 617,
650
+ 0x9A97: 618,
651
+ 0x9AC1: 619,
652
+ 0x9AE1: 620,
653
+ 0x9AE5: 621,
654
+ 0x9AE9: 622,
655
+ 0x9AF1: 623,
656
+ 0x9AF3: 624,
657
+ 0x9AF7: 625,
658
+ 0x9B61: 626,
659
+ 0x9B62: 627,
660
+ 0x9B65: 628,
661
+ 0x9B68: 629,
662
+ 0x9B69: 630,
663
+ 0x9B71: 631,
664
+ 0x9B73: 632,
665
+ 0x9B75: 633,
666
+ 0x9B81: 634,
667
+ 0x9B85: 635,
668
+ 0x9B89: 636,
669
+ 0x9B91: 637,
670
+ 0x9B93: 638,
671
+ 0x9BA1: 639,
672
+ 0x9BA5: 640,
673
+ 0x9BA9: 641,
674
+ 0x9BB1: 642,
675
+ 0x9BB3: 643,
676
+ 0x9BB5: 644,
677
+ 0x9BB7: 645,
678
+ 0x9C61: 646,
679
+ 0x9C62: 647,
680
+ 0x9C65: 648,
681
+ 0x9C69: 649,
682
+ 0x9C71: 650,
683
+ 0x9C73: 651,
684
+ 0x9C75: 652,
685
+ 0x9C76: 653,
686
+ 0x9C77: 654,
687
+ 0x9C78: 655,
688
+ 0x9C7C: 656,
689
+ 0x9C7D: 657,
690
+ 0x9C81: 658,
691
+ 0x9C82: 659,
692
+ 0x9C85: 660,
693
+ 0x9C89: 661,
694
+ 0x9C91: 662,
695
+ 0x9C93: 663,
696
+ 0x9C95: 664,
697
+ 0x9C96: 665,
698
+ 0x9C97: 666,
699
+ 0x9CA1: 667,
700
+ 0x9CA2: 668,
701
+ 0x9CA5: 669,
702
+ 0x9CB5: 670,
703
+ 0x9CB7: 671,
704
+ 0x9CE1: 672,
705
+ 0x9CE2: 673,
706
+ 0x9CE5: 674,
707
+ 0x9CE9: 675,
708
+ 0x9CF1: 676,
709
+ 0x9CF3: 677,
710
+ 0x9CF5: 678,
711
+ 0x9CF6: 679,
712
+ 0x9CF7: 680,
713
+ 0x9CFD: 681,
714
+ 0x9D41: 682,
715
+ 0x9D42: 683,
716
+ 0x9D45: 684,
717
+ 0x9D49: 685,
718
+ 0x9D51: 686,
719
+ 0x9D53: 687,
720
+ 0x9D55: 688,
721
+ 0x9D57: 689,
722
+ 0x9D61: 690,
723
+ 0x9D62: 691,
724
+ 0x9D65: 692,
725
+ 0x9D69: 693,
726
+ 0x9D71: 694,
727
+ 0x9D73: 695,
728
+ 0x9D75: 696,
729
+ 0x9D76: 697,
730
+ 0x9D77: 698,
731
+ 0x9D81: 699,
732
+ 0x9D85: 700,
733
+ 0x9D93: 701,
734
+ 0x9D95: 702,
735
+ 0x9DA1: 703,
736
+ 0x9DA2: 704,
737
+ 0x9DA5: 705,
738
+ 0x9DA9: 706,
739
+ 0x9DB1: 707,
740
+ 0x9DB3: 708,
741
+ 0x9DB5: 709,
742
+ 0x9DB7: 710,
743
+ 0x9DC1: 711,
744
+ 0x9DC5: 712,
745
+ 0x9DD7: 713,
746
+ 0x9DF6: 714,
747
+ 0x9E41: 715,
748
+ 0x9E45: 716,
749
+ 0x9E49: 717,
750
+ 0x9E51: 718,
751
+ 0x9E53: 719,
752
+ 0x9E55: 720,
753
+ 0x9E57: 721,
754
+ 0x9E61: 722,
755
+ 0x9E65: 723,
756
+ 0x9E69: 724,
757
+ 0x9E73: 725,
758
+ 0x9E75: 726,
759
+ 0x9E77: 727,
760
+ 0x9E81: 728,
761
+ 0x9E82: 729,
762
+ 0x9E85: 730,
763
+ 0x9E89: 731,
764
+ 0x9E91: 732,
765
+ 0x9E93: 733,
766
+ 0x9E95: 734,
767
+ 0x9E97: 735,
768
+ 0x9EA1: 736,
769
+ 0x9EB6: 737,
770
+ 0x9EC1: 738,
771
+ 0x9EE1: 739,
772
+ 0x9EE2: 740,
773
+ 0x9EE5: 741,
774
+ 0x9EE9: 742,
775
+ 0x9EF1: 743,
776
+ 0x9EF5: 744,
777
+ 0x9EF7: 745,
778
+ 0x9F41: 746,
779
+ 0x9F42: 747,
780
+ 0x9F45: 748,
781
+ 0x9F49: 749,
782
+ 0x9F51: 750,
783
+ 0x9F53: 751,
784
+ 0x9F55: 752,
785
+ 0x9F57: 753,
786
+ 0x9F61: 754,
787
+ 0x9F62: 755,
788
+ 0x9F65: 756,
789
+ 0x9F69: 757,
790
+ 0x9F71: 758,
791
+ 0x9F73: 759,
792
+ 0x9F75: 760,
793
+ 0x9F77: 761,
794
+ 0x9F78: 762,
795
+ 0x9F7B: 763,
796
+ 0x9F7C: 764,
797
+ 0x9FA1: 765,
798
+ 0x9FA2: 766,
799
+ 0x9FA5: 767,
800
+ 0x9FA9: 768,
801
+ 0x9FB1: 769,
802
+ 0x9FB3: 770,
803
+ 0x9FB5: 771,
804
+ 0x9FB7: 772,
805
+ 0xA061: 773,
806
+ 0xA062: 774,
807
+ 0xA065: 775,
808
+ 0xA067: 776,
809
+ 0xA068: 777,
810
+ 0xA069: 778,
811
+ 0xA06A: 779,
812
+ 0xA06B: 780,
813
+ 0xA071: 781,
814
+ 0xA073: 782,
815
+ 0xA075: 783,
816
+ 0xA077: 784,
817
+ 0xA078: 785,
818
+ 0xA07B: 786,
819
+ 0xA07D: 787,
820
+ 0xA081: 788,
821
+ 0xA082: 789,
822
+ 0xA085: 790,
823
+ 0xA089: 791,
824
+ 0xA091: 792,
825
+ 0xA093: 793,
826
+ 0xA095: 794,
827
+ 0xA096: 795,
828
+ 0xA097: 796,
829
+ 0xA098: 797,
830
+ 0xA0A1: 798,
831
+ 0xA0A2: 799,
832
+ 0xA0A9: 800,
833
+ 0xA0B7: 801,
834
+ 0xA0E1: 802,
835
+ 0xA0E2: 803,
836
+ 0xA0E5: 804,
837
+ 0xA0E9: 805,
838
+ 0xA0EB: 806,
839
+ 0xA0F1: 807,
840
+ 0xA0F3: 808,
841
+ 0xA0F5: 809,
842
+ 0xA0F7: 810,
843
+ 0xA0F8: 811,
844
+ 0xA0FD: 812,
845
+ 0xA141: 813,
846
+ 0xA142: 814,
847
+ 0xA145: 815,
848
+ 0xA149: 816,
849
+ 0xA151: 817,
850
+ 0xA153: 818,
851
+ 0xA155: 819,
852
+ 0xA156: 820,
853
+ 0xA157: 821,
854
+ 0xA161: 822,
855
+ 0xA162: 823,
856
+ 0xA165: 824,
857
+ 0xA169: 825,
858
+ 0xA175: 826,
859
+ 0xA176: 827,
860
+ 0xA177: 828,
861
+ 0xA179: 829,
862
+ 0xA181: 830,
863
+ 0xA1A1: 831,
864
+ 0xA1A2: 832,
865
+ 0xA1A4: 833,
866
+ 0xA1A5: 834,
867
+ 0xA1A9: 835,
868
+ 0xA1AB: 836,
869
+ 0xA1B1: 837,
870
+ 0xA1B3: 838,
871
+ 0xA1B5: 839,
872
+ 0xA1B7: 840,
873
+ 0xA1C1: 841,
874
+ 0xA1C5: 842,
875
+ 0xA1D6: 843,
876
+ 0xA1D7: 844,
877
+ 0xA241: 845,
878
+ 0xA245: 846,
879
+ 0xA249: 847,
880
+ 0xA253: 848,
881
+ 0xA255: 849,
882
+ 0xA257: 850,
883
+ 0xA261: 851,
884
+ 0xA265: 852,
885
+ 0xA269: 853,
886
+ 0xA273: 854,
887
+ 0xA275: 855,
888
+ 0xA281: 856,
889
+ 0xA282: 857,
890
+ 0xA283: 858,
891
+ 0xA285: 859,
892
+ 0xA288: 860,
893
+ 0xA289: 861,
894
+ 0xA28A: 862,
895
+ 0xA28B: 863,
896
+ 0xA291: 864,
897
+ 0xA293: 865,
898
+ 0xA295: 866,
899
+ 0xA297: 867,
900
+ 0xA29B: 868,
901
+ 0xA29D: 869,
902
+ 0xA2A1: 870,
903
+ 0xA2A5: 871,
904
+ 0xA2A9: 872,
905
+ 0xA2B3: 873,
906
+ 0xA2B5: 874,
907
+ 0xA2C1: 875,
908
+ 0xA2E1: 876,
909
+ 0xA2E5: 877,
910
+ 0xA2E9: 878,
911
+ 0xA341: 879,
912
+ 0xA345: 880,
913
+ 0xA349: 881,
914
+ 0xA351: 882,
915
+ 0xA355: 883,
916
+ 0xA361: 884,
917
+ 0xA365: 885,
918
+ 0xA369: 886,
919
+ 0xA371: 887,
920
+ 0xA375: 888,
921
+ 0xA3A1: 889,
922
+ 0xA3A2: 890,
923
+ 0xA3A5: 891,
924
+ 0xA3A8: 892,
925
+ 0xA3A9: 893,
926
+ 0xA3AB: 894,
927
+ 0xA3B1: 895,
928
+ 0xA3B3: 896,
929
+ 0xA3B5: 897,
930
+ 0xA3B6: 898,
931
+ 0xA3B7: 899,
932
+ 0xA3B9: 900,
933
+ 0xA3BB: 901,
934
+ 0xA461: 902,
935
+ 0xA462: 903,
936
+ 0xA463: 904,
937
+ 0xA464: 905,
938
+ 0xA465: 906,
939
+ 0xA468: 907,
940
+ 0xA469: 908,
941
+ 0xA46A: 909,
942
+ 0xA46B: 910,
943
+ 0xA46C: 911,
944
+ 0xA471: 912,
945
+ 0xA473: 913,
946
+ 0xA475: 914,
947
+ 0xA477: 915,
948
+ 0xA47B: 916,
949
+ 0xA481: 917,
950
+ 0xA482: 918,
951
+ 0xA485: 919,
952
+ 0xA489: 920,
953
+ 0xA491: 921,
954
+ 0xA493: 922,
955
+ 0xA495: 923,
956
+ 0xA496: 924,
957
+ 0xA497: 925,
958
+ 0xA49B: 926,
959
+ 0xA4A1: 927,
960
+ 0xA4A2: 928,
961
+ 0xA4A5: 929,
962
+ 0xA4B3: 930,
963
+ 0xA4E1: 931,
964
+ 0xA4E2: 932,
965
+ 0xA4E5: 933,
966
+ 0xA4E8: 934,
967
+ 0xA4E9: 935,
968
+ 0xA4EB: 936,
969
+ 0xA4F1: 937,
970
+ 0xA4F3: 938,
971
+ 0xA4F5: 939,
972
+ 0xA4F7: 940,
973
+ 0xA4F8: 941,
974
+ 0xA541: 942,
975
+ 0xA542: 943,
976
+ 0xA545: 944,
977
+ 0xA548: 945,
978
+ 0xA549: 946,
979
+ 0xA551: 947,
980
+ 0xA553: 948,
981
+ 0xA555: 949,
982
+ 0xA556: 950,
983
+ 0xA557: 951,
984
+ 0xA561: 952,
985
+ 0xA562: 953,
986
+ 0xA565: 954,
987
+ 0xA569: 955,
988
+ 0xA573: 956,
989
+ 0xA575: 957,
990
+ 0xA576: 958,
991
+ 0xA577: 959,
992
+ 0xA57B: 960,
993
+ 0xA581: 961,
994
+ 0xA585: 962,
995
+ 0xA5A1: 963,
996
+ 0xA5A2: 964,
997
+ 0xA5A3: 965,
998
+ 0xA5A5: 966,
999
+ 0xA5A9: 967,
1000
+ 0xA5B1: 968,
1001
+ 0xA5B3: 969,
1002
+ 0xA5B5: 970,
1003
+ 0xA5B7: 971,
1004
+ 0xA5C1: 972,
1005
+ 0xA5C5: 973,
1006
+ 0xA5D6: 974,
1007
+ 0xA5E1: 975,
1008
+ 0xA5F6: 976,
1009
+ 0xA641: 977,
1010
+ 0xA642: 978,
1011
+ 0xA645: 979,
1012
+ 0xA649: 980,
1013
+ 0xA651: 981,
1014
+ 0xA653: 982,
1015
+ 0xA661: 983,
1016
+ 0xA665: 984,
1017
+ 0xA681: 985,
1018
+ 0xA682: 986,
1019
+ 0xA685: 987,
1020
+ 0xA688: 988,
1021
+ 0xA689: 989,
1022
+ 0xA68A: 990,
1023
+ 0xA68B: 991,
1024
+ 0xA691: 992,
1025
+ 0xA693: 993,
1026
+ 0xA695: 994,
1027
+ 0xA697: 995,
1028
+ 0xA69B: 996,
1029
+ 0xA69C: 997,
1030
+ 0xA6A1: 998,
1031
+ 0xA6A9: 999,
1032
+ 0xA6B6: 1000,
1033
+ 0xA6C1: 1001,
1034
+ 0xA6E1: 1002,
1035
+ 0xA6E2: 1003,
1036
+ 0xA6E5: 1004,
1037
+ 0xA6E9: 1005,
1038
+ 0xA6F7: 1006,
1039
+ 0xA741: 1007,
1040
+ 0xA745: 1008,
1041
+ 0xA749: 1009,
1042
+ 0xA751: 1010,
1043
+ 0xA755: 1011,
1044
+ 0xA757: 1012,
1045
+ 0xA761: 1013,
1046
+ 0xA762: 1014,
1047
+ 0xA765: 1015,
1048
+ 0xA769: 1016,
1049
+ 0xA771: 1017,
1050
+ 0xA773: 1018,
1051
+ 0xA775: 1019,
1052
+ 0xA7A1: 1020,
1053
+ 0xA7A2: 1021,
1054
+ 0xA7A5: 1022,
1055
+ 0xA7A9: 1023,
1056
+ 0xA7AB: 1024,
1057
+ 0xA7B1: 1025,
1058
+ 0xA7B3: 1026,
1059
+ 0xA7B5: 1027,
1060
+ 0xA7B7: 1028,
1061
+ 0xA7B8: 1029,
1062
+ 0xA7B9: 1030,
1063
+ 0xA861: 1031,
1064
+ 0xA862: 1032,
1065
+ 0xA865: 1033,
1066
+ 0xA869: 1034,
1067
+ 0xA86B: 1035,
1068
+ 0xA871: 1036,
1069
+ 0xA873: 1037,
1070
+ 0xA875: 1038,
1071
+ 0xA876: 1039,
1072
+ 0xA877: 1040,
1073
+ 0xA87D: 1041,
1074
+ 0xA881: 1042,
1075
+ 0xA882: 1043,
1076
+ 0xA885: 1044,
1077
+ 0xA889: 1045,
1078
+ 0xA891: 1046,
1079
+ 0xA893: 1047,
1080
+ 0xA895: 1048,
1081
+ 0xA896: 1049,
1082
+ 0xA897: 1050,
1083
+ 0xA8A1: 1051,
1084
+ 0xA8A2: 1052,
1085
+ 0xA8B1: 1053,
1086
+ 0xA8E1: 1054,
1087
+ 0xA8E2: 1055,
1088
+ 0xA8E5: 1056,
1089
+ 0xA8E8: 1057,
1090
+ 0xA8E9: 1058,
1091
+ 0xA8F1: 1059,
1092
+ 0xA8F5: 1060,
1093
+ 0xA8F6: 1061,
1094
+ 0xA8F7: 1062,
1095
+ 0xA941: 1063,
1096
+ 0xA957: 1064,
1097
+ 0xA961: 1065,
1098
+ 0xA962: 1066,
1099
+ 0xA971: 1067,
1100
+ 0xA973: 1068,
1101
+ 0xA975: 1069,
1102
+ 0xA976: 1070,
1103
+ 0xA977: 1071,
1104
+ 0xA9A1: 1072,
1105
+ 0xA9A2: 1073,
1106
+ 0xA9A5: 1074,
1107
+ 0xA9A9: 1075,
1108
+ 0xA9B1: 1076,
1109
+ 0xA9B3: 1077,
1110
+ 0xA9B7: 1078,
1111
+ 0xAA41: 1079,
1112
+ 0xAA61: 1080,
1113
+ 0xAA77: 1081,
1114
+ 0xAA81: 1082,
1115
+ 0xAA82: 1083,
1116
+ 0xAA85: 1084,
1117
+ 0xAA89: 1085,
1118
+ 0xAA91: 1086,
1119
+ 0xAA95: 1087,
1120
+ 0xAA97: 1088,
1121
+ 0xAB41: 1089,
1122
+ 0xAB57: 1090,
1123
+ 0xAB61: 1091,
1124
+ 0xAB65: 1092,
1125
+ 0xAB69: 1093,
1126
+ 0xAB71: 1094,
1127
+ 0xAB73: 1095,
1128
+ 0xABA1: 1096,
1129
+ 0xABA2: 1097,
1130
+ 0xABA5: 1098,
1131
+ 0xABA9: 1099,
1132
+ 0xABB1: 1100,
1133
+ 0xABB3: 1101,
1134
+ 0xABB5: 1102,
1135
+ 0xABB7: 1103,
1136
+ 0xAC61: 1104,
1137
+ 0xAC62: 1105,
1138
+ 0xAC64: 1106,
1139
+ 0xAC65: 1107,
1140
+ 0xAC68: 1108,
1141
+ 0xAC69: 1109,
1142
+ 0xAC6A: 1110,
1143
+ 0xAC6B: 1111,
1144
+ 0xAC71: 1112,
1145
+ 0xAC73: 1113,
1146
+ 0xAC75: 1114,
1147
+ 0xAC76: 1115,
1148
+ 0xAC77: 1116,
1149
+ 0xAC7B: 1117,
1150
+ 0xAC81: 1118,
1151
+ 0xAC82: 1119,
1152
+ 0xAC85: 1120,
1153
+ 0xAC89: 1121,
1154
+ 0xAC91: 1122,
1155
+ 0xAC93: 1123,
1156
+ 0xAC95: 1124,
1157
+ 0xAC96: 1125,
1158
+ 0xAC97: 1126,
1159
+ 0xACA1: 1127,
1160
+ 0xACA2: 1128,
1161
+ 0xACA5: 1129,
1162
+ 0xACA9: 1130,
1163
+ 0xACB1: 1131,
1164
+ 0xACB3: 1132,
1165
+ 0xACB5: 1133,
1166
+ 0xACB7: 1134,
1167
+ 0xACC1: 1135,
1168
+ 0xACC5: 1136,
1169
+ 0xACC9: 1137,
1170
+ 0xACD1: 1138,
1171
+ 0xACD7: 1139,
1172
+ 0xACE1: 1140,
1173
+ 0xACE2: 1141,
1174
+ 0xACE3: 1142,
1175
+ 0xACE4: 1143,
1176
+ 0xACE5: 1144,
1177
+ 0xACE8: 1145,
1178
+ 0xACE9: 1146,
1179
+ 0xACEB: 1147,
1180
+ 0xACEC: 1148,
1181
+ 0xACF1: 1149,
1182
+ 0xACF3: 1150,
1183
+ 0xACF5: 1151,
1184
+ 0xACF6: 1152,
1185
+ 0xACF7: 1153,
1186
+ 0xACFC: 1154,
1187
+ 0xAD41: 1155,
1188
+ 0xAD42: 1156,
1189
+ 0xAD45: 1157,
1190
+ 0xAD49: 1158,
1191
+ 0xAD51: 1159,
1192
+ 0xAD53: 1160,
1193
+ 0xAD55: 1161,
1194
+ 0xAD56: 1162,
1195
+ 0xAD57: 1163,
1196
+ 0xAD61: 1164,
1197
+ 0xAD62: 1165,
1198
+ 0xAD65: 1166,
1199
+ 0xAD69: 1167,
1200
+ 0xAD71: 1168,
1201
+ 0xAD73: 1169,
1202
+ 0xAD75: 1170,
1203
+ 0xAD76: 1171,
1204
+ 0xAD77: 1172,
1205
+ 0xAD81: 1173,
1206
+ 0xAD85: 1174,
1207
+ 0xAD89: 1175,
1208
+ 0xAD97: 1176,
1209
+ 0xADA1: 1177,
1210
+ 0xADA2: 1178,
1211
+ 0xADA3: 1179,
1212
+ 0xADA5: 1180,
1213
+ 0xADA9: 1181,
1214
+ 0xADAB: 1182,
1215
+ 0xADB1: 1183,
1216
+ 0xADB3: 1184,
1217
+ 0xADB5: 1185,
1218
+ 0xADB7: 1186,
1219
+ 0xADBB: 1187,
1220
+ 0xADC1: 1188,
1221
+ 0xADC2: 1189,
1222
+ 0xADC5: 1190,
1223
+ 0xADC9: 1191,
1224
+ 0xADD7: 1192,
1225
+ 0xADE1: 1193,
1226
+ 0xADE5: 1194,
1227
+ 0xADE9: 1195,
1228
+ 0xADF1: 1196,
1229
+ 0xADF5: 1197,
1230
+ 0xADF6: 1198,
1231
+ 0xAE41: 1199,
1232
+ 0xAE45: 1200,
1233
+ 0xAE49: 1201,
1234
+ 0xAE51: 1202,
1235
+ 0xAE53: 1203,
1236
+ 0xAE55: 1204,
1237
+ 0xAE61: 1205,
1238
+ 0xAE62: 1206,
1239
+ 0xAE65: 1207,
1240
+ 0xAE69: 1208,
1241
+ 0xAE71: 1209,
1242
+ 0xAE73: 1210,
1243
+ 0xAE75: 1211,
1244
+ 0xAE77: 1212,
1245
+ 0xAE81: 1213,
1246
+ 0xAE82: 1214,
1247
+ 0xAE85: 1215,
1248
+ 0xAE88: 1216,
1249
+ 0xAE89: 1217,
1250
+ 0xAE91: 1218,
1251
+ 0xAE93: 1219,
1252
+ 0xAE95: 1220,
1253
+ 0xAE97: 1221,
1254
+ 0xAE99: 1222,
1255
+ 0xAE9B: 1223,
1256
+ 0xAE9C: 1224,
1257
+ 0xAEA1: 1225,
1258
+ 0xAEB6: 1226,
1259
+ 0xAEC1: 1227,
1260
+ 0xAEC2: 1228,
1261
+ 0xAEC5: 1229,
1262
+ 0xAEC9: 1230,
1263
+ 0xAED1: 1231,
1264
+ 0xAED7: 1232,
1265
+ 0xAEE1: 1233,
1266
+ 0xAEE2: 1234,
1267
+ 0xAEE5: 1235,
1268
+ 0xAEE9: 1236,
1269
+ 0xAEF1: 1237,
1270
+ 0xAEF3: 1238,
1271
+ 0xAEF5: 1239,
1272
+ 0xAEF7: 1240,
1273
+ 0xAF41: 1241,
1274
+ 0xAF42: 1242,
1275
+ 0xAF49: 1243,
1276
+ 0xAF51: 1244,
1277
+ 0xAF55: 1245,
1278
+ 0xAF57: 1246,
1279
+ 0xAF61: 1247,
1280
+ 0xAF62: 1248,
1281
+ 0xAF65: 1249,
1282
+ 0xAF69: 1250,
1283
+ 0xAF6A: 1251,
1284
+ 0xAF71: 1252,
1285
+ 0xAF73: 1253,
1286
+ 0xAF75: 1254,
1287
+ 0xAF77: 1255,
1288
+ 0xAFA1: 1256,
1289
+ 0xAFA2: 1257,
1290
+ 0xAFA5: 1258,
1291
+ 0xAFA8: 1259,
1292
+ 0xAFA9: 1260,
1293
+ 0xAFB0: 1261,
1294
+ 0xAFB1: 1262,
1295
+ 0xAFB3: 1263,
1296
+ 0xAFB5: 1264,
1297
+ 0xAFB7: 1265,
1298
+ 0xAFBC: 1266,
1299
+ 0xB061: 1267,
1300
+ 0xB062: 1268,
1301
+ 0xB064: 1269,
1302
+ 0xB065: 1270,
1303
+ 0xB069: 1271,
1304
+ 0xB071: 1272,
1305
+ 0xB073: 1273,
1306
+ 0xB076: 1274,
1307
+ 0xB077: 1275,
1308
+ 0xB07D: 1276,
1309
+ 0xB081: 1277,
1310
+ 0xB082: 1278,
1311
+ 0xB085: 1279,
1312
+ 0xB089: 1280,
1313
+ 0xB091: 1281,
1314
+ 0xB093: 1282,
1315
+ 0xB096: 1283,
1316
+ 0xB097: 1284,
1317
+ 0xB0B7: 1285,
1318
+ 0xB0E1: 1286,
1319
+ 0xB0E2: 1287,
1320
+ 0xB0E5: 1288,
1321
+ 0xB0E9: 1289,
1322
+ 0xB0EB: 1290,
1323
+ 0xB0F1: 1291,
1324
+ 0xB0F3: 1292,
1325
+ 0xB0F6: 1293,
1326
+ 0xB0F7: 1294,
1327
+ 0xB141: 1295,
1328
+ 0xB145: 1296,
1329
+ 0xB149: 1297,
1330
+ 0xB185: 1298,
1331
+ 0xB1A1: 1299,
1332
+ 0xB1A2: 1300,
1333
+ 0xB1A5: 1301,
1334
+ 0xB1A8: 1302,
1335
+ 0xB1A9: 1303,
1336
+ 0xB1AB: 1304,
1337
+ 0xB1B1: 1305,
1338
+ 0xB1B3: 1306,
1339
+ 0xB1B7: 1307,
1340
+ 0xB1C1: 1308,
1341
+ 0xB1C2: 1309,
1342
+ 0xB1C5: 1310,
1343
+ 0xB1D6: 1311,
1344
+ 0xB1E1: 1312,
1345
+ 0xB1F6: 1313,
1346
+ 0xB241: 1314,
1347
+ 0xB245: 1315,
1348
+ 0xB249: 1316,
1349
+ 0xB251: 1317,
1350
+ 0xB253: 1318,
1351
+ 0xB261: 1319,
1352
+ 0xB281: 1320,
1353
+ 0xB282: 1321,
1354
+ 0xB285: 1322,
1355
+ 0xB289: 1323,
1356
+ 0xB291: 1324,
1357
+ 0xB293: 1325,
1358
+ 0xB297: 1326,
1359
+ 0xB2A1: 1327,
1360
+ 0xB2B6: 1328,
1361
+ 0xB2C1: 1329,
1362
+ 0xB2E1: 1330,
1363
+ 0xB2E5: 1331,
1364
+ 0xB357: 1332,
1365
+ 0xB361: 1333,
1366
+ 0xB362: 1334,
1367
+ 0xB365: 1335,
1368
+ 0xB369: 1336,
1369
+ 0xB36B: 1337,
1370
+ 0xB370: 1338,
1371
+ 0xB371: 1339,
1372
+ 0xB373: 1340,
1373
+ 0xB381: 1341,
1374
+ 0xB385: 1342,
1375
+ 0xB389: 1343,
1376
+ 0xB391: 1344,
1377
+ 0xB3A1: 1345,
1378
+ 0xB3A2: 1346,
1379
+ 0xB3A5: 1347,
1380
+ 0xB3A9: 1348,
1381
+ 0xB3B1: 1349,
1382
+ 0xB3B3: 1350,
1383
+ 0xB3B5: 1351,
1384
+ 0xB3B7: 1352,
1385
+ 0xB461: 1353,
1386
+ 0xB462: 1354,
1387
+ 0xB465: 1355,
1388
+ 0xB466: 1356,
1389
+ 0xB467: 1357,
1390
+ 0xB469: 1358,
1391
+ 0xB46A: 1359,
1392
+ 0xB46B: 1360,
1393
+ 0xB470: 1361,
1394
+ 0xB471: 1362,
1395
+ 0xB473: 1363,
1396
+ 0xB475: 1364,
1397
+ 0xB476: 1365,
1398
+ 0xB477: 1366,
1399
+ 0xB47B: 1367,
1400
+ 0xB47C: 1368,
1401
+ 0xB481: 1369,
1402
+ 0xB482: 1370,
1403
+ 0xB485: 1371,
1404
+ 0xB489: 1372,
1405
+ 0xB491: 1373,
1406
+ 0xB493: 1374,
1407
+ 0xB495: 1375,
1408
+ 0xB496: 1376,
1409
+ 0xB497: 1377,
1410
+ 0xB4A1: 1378,
1411
+ 0xB4A2: 1379,
1412
+ 0xB4A5: 1380,
1413
+ 0xB4A9: 1381,
1414
+ 0xB4AC: 1382,
1415
+ 0xB4B1: 1383,
1416
+ 0xB4B3: 1384,
1417
+ 0xB4B5: 1385,
1418
+ 0xB4B7: 1386,
1419
+ 0xB4BB: 1387,
1420
+ 0xB4BD: 1388,
1421
+ 0xB4C1: 1389,
1422
+ 0xB4C5: 1390,
1423
+ 0xB4C9: 1391,
1424
+ 0xB4D3: 1392,
1425
+ 0xB4E1: 1393,
1426
+ 0xB4E2: 1394,
1427
+ 0xB4E5: 1395,
1428
+ 0xB4E6: 1396,
1429
+ 0xB4E8: 1397,
1430
+ 0xB4E9: 1398,
1431
+ 0xB4EA: 1399,
1432
+ 0xB4EB: 1400,
1433
+ 0xB4F1: 1401,
1434
+ 0xB4F3: 1402,
1435
+ 0xB4F4: 1403,
1436
+ 0xB4F5: 1404,
1437
+ 0xB4F6: 1405,
1438
+ 0xB4F7: 1406,
1439
+ 0xB4F8: 1407,
1440
+ 0xB4FA: 1408,
1441
+ 0xB4FC: 1409,
1442
+ 0xB541: 1410,
1443
+ 0xB542: 1411,
1444
+ 0xB545: 1412,
1445
+ 0xB549: 1413,
1446
+ 0xB551: 1414,
1447
+ 0xB553: 1415,
1448
+ 0xB555: 1416,
1449
+ 0xB557: 1417,
1450
+ 0xB561: 1418,
1451
+ 0xB562: 1419,
1452
+ 0xB563: 1420,
1453
+ 0xB565: 1421,
1454
+ 0xB569: 1422,
1455
+ 0xB56B: 1423,
1456
+ 0xB56C: 1424,
1457
+ 0xB571: 1425,
1458
+ 0xB573: 1426,
1459
+ 0xB574: 1427,
1460
+ 0xB575: 1428,
1461
+ 0xB576: 1429,
1462
+ 0xB577: 1430,
1463
+ 0xB57B: 1431,
1464
+ 0xB57C: 1432,
1465
+ 0xB57D: 1433,
1466
+ 0xB581: 1434,
1467
+ 0xB585: 1435,
1468
+ 0xB589: 1436,
1469
+ 0xB591: 1437,
1470
+ 0xB593: 1438,
1471
+ 0xB595: 1439,
1472
+ 0xB596: 1440,
1473
+ 0xB5A1: 1441,
1474
+ 0xB5A2: 1442,
1475
+ 0xB5A5: 1443,
1476
+ 0xB5A9: 1444,
1477
+ 0xB5AA: 1445,
1478
+ 0xB5AB: 1446,
1479
+ 0xB5AD: 1447,
1480
+ 0xB5B0: 1448,
1481
+ 0xB5B1: 1449,
1482
+ 0xB5B3: 1450,
1483
+ 0xB5B5: 1451,
1484
+ 0xB5B7: 1452,
1485
+ 0xB5B9: 1453,
1486
+ 0xB5C1: 1454,
1487
+ 0xB5C2: 1455,
1488
+ 0xB5C5: 1456,
1489
+ 0xB5C9: 1457,
1490
+ 0xB5D1: 1458,
1491
+ 0xB5D3: 1459,
1492
+ 0xB5D5: 1460,
1493
+ 0xB5D6: 1461,
1494
+ 0xB5D7: 1462,
1495
+ 0xB5E1: 1463,
1496
+ 0xB5E2: 1464,
1497
+ 0xB5E5: 1465,
1498
+ 0xB5F1: 1466,
1499
+ 0xB5F5: 1467,
1500
+ 0xB5F7: 1468,
1501
+ 0xB641: 1469,
1502
+ 0xB642: 1470,
1503
+ 0xB645: 1471,
1504
+ 0xB649: 1472,
1505
+ 0xB651: 1473,
1506
+ 0xB653: 1474,
1507
+ 0xB655: 1475,
1508
+ 0xB657: 1476,
1509
+ 0xB661: 1477,
1510
+ 0xB662: 1478,
1511
+ 0xB665: 1479,
1512
+ 0xB669: 1480,
1513
+ 0xB671: 1481,
1514
+ 0xB673: 1482,
1515
+ 0xB675: 1483,
1516
+ 0xB677: 1484,
1517
+ 0xB681: 1485,
1518
+ 0xB682: 1486,
1519
+ 0xB685: 1487,
1520
+ 0xB689: 1488,
1521
+ 0xB68A: 1489,
1522
+ 0xB68B: 1490,
1523
+ 0xB691: 1491,
1524
+ 0xB693: 1492,
1525
+ 0xB695: 1493,
1526
+ 0xB697: 1494,
1527
+ 0xB6A1: 1495,
1528
+ 0xB6A2: 1496,
1529
+ 0xB6A5: 1497,
1530
+ 0xB6A9: 1498,
1531
+ 0xB6B1: 1499,
1532
+ 0xB6B3: 1500,
1533
+ 0xB6B6: 1501,
1534
+ 0xB6B7: 1502,
1535
+ 0xB6C1: 1503,
1536
+ 0xB6C2: 1504,
1537
+ 0xB6C5: 1505,
1538
+ 0xB6C9: 1506,
1539
+ 0xB6D1: 1507,
1540
+ 0xB6D3: 1508,
1541
+ 0xB6D7: 1509,
1542
+ 0xB6E1: 1510,
1543
+ 0xB6E2: 1511,
1544
+ 0xB6E5: 1512,
1545
+ 0xB6E9: 1513,
1546
+ 0xB6F1: 1514,
1547
+ 0xB6F3: 1515,
1548
+ 0xB6F5: 1516,
1549
+ 0xB6F7: 1517,
1550
+ 0xB741: 1518,
1551
+ 0xB742: 1519,
1552
+ 0xB745: 1520,
1553
+ 0xB749: 1521,
1554
+ 0xB751: 1522,
1555
+ 0xB753: 1523,
1556
+ 0xB755: 1524,
1557
+ 0xB757: 1525,
1558
+ 0xB759: 1526,
1559
+ 0xB761: 1527,
1560
+ 0xB762: 1528,
1561
+ 0xB765: 1529,
1562
+ 0xB769: 1530,
1563
+ 0xB76F: 1531,
1564
+ 0xB771: 1532,
1565
+ 0xB773: 1533,
1566
+ 0xB775: 1534,
1567
+ 0xB777: 1535,
1568
+ 0xB778: 1536,
1569
+ 0xB779: 1537,
1570
+ 0xB77A: 1538,
1571
+ 0xB77B: 1539,
1572
+ 0xB77C: 1540,
1573
+ 0xB77D: 1541,
1574
+ 0xB781: 1542,
1575
+ 0xB785: 1543,
1576
+ 0xB789: 1544,
1577
+ 0xB791: 1545,
1578
+ 0xB795: 1546,
1579
+ 0xB7A1: 1547,
1580
+ 0xB7A2: 1548,
1581
+ 0xB7A5: 1549,
1582
+ 0xB7A9: 1550,
1583
+ 0xB7AA: 1551,
1584
+ 0xB7AB: 1552,
1585
+ 0xB7B0: 1553,
1586
+ 0xB7B1: 1554,
1587
+ 0xB7B3: 1555,
1588
+ 0xB7B5: 1556,
1589
+ 0xB7B6: 1557,
1590
+ 0xB7B7: 1558,
1591
+ 0xB7B8: 1559,
1592
+ 0xB7BC: 1560,
1593
+ 0xB861: 1561,
1594
+ 0xB862: 1562,
1595
+ 0xB865: 1563,
1596
+ 0xB867: 1564,
1597
+ 0xB868: 1565,
1598
+ 0xB869: 1566,
1599
+ 0xB86B: 1567,
1600
+ 0xB871: 1568,
1601
+ 0xB873: 1569,
1602
+ 0xB875: 1570,
1603
+ 0xB876: 1571,
1604
+ 0xB877: 1572,
1605
+ 0xB878: 1573,
1606
+ 0xB881: 1574,
1607
+ 0xB882: 1575,
1608
+ 0xB885: 1576,
1609
+ 0xB889: 1577,
1610
+ 0xB891: 1578,
1611
+ 0xB893: 1579,
1612
+ 0xB895: 1580,
1613
+ 0xB896: 1581,
1614
+ 0xB897: 1582,
1615
+ 0xB8A1: 1583,
1616
+ 0xB8A2: 1584,
1617
+ 0xB8A5: 1585,
1618
+ 0xB8A7: 1586,
1619
+ 0xB8A9: 1587,
1620
+ 0xB8B1: 1588,
1621
+ 0xB8B7: 1589,
1622
+ 0xB8C1: 1590,
1623
+ 0xB8C5: 1591,
1624
+ 0xB8C9: 1592,
1625
+ 0xB8E1: 1593,
1626
+ 0xB8E2: 1594,
1627
+ 0xB8E5: 1595,
1628
+ 0xB8E9: 1596,
1629
+ 0xB8EB: 1597,
1630
+ 0xB8F1: 1598,
1631
+ 0xB8F3: 1599,
1632
+ 0xB8F5: 1600,
1633
+ 0xB8F7: 1601,
1634
+ 0xB8F8: 1602,
1635
+ 0xB941: 1603,
1636
+ 0xB942: 1604,
1637
+ 0xB945: 1605,
1638
+ 0xB949: 1606,
1639
+ 0xB951: 1607,
1640
+ 0xB953: 1608,
1641
+ 0xB955: 1609,
1642
+ 0xB957: 1610,
1643
+ 0xB961: 1611,
1644
+ 0xB965: 1612,
1645
+ 0xB969: 1613,
1646
+ 0xB971: 1614,
1647
+ 0xB973: 1615,
1648
+ 0xB976: 1616,
1649
+ 0xB977: 1617,
1650
+ 0xB981: 1618,
1651
+ 0xB9A1: 1619,
1652
+ 0xB9A2: 1620,
1653
+ 0xB9A5: 1621,
1654
+ 0xB9A9: 1622,
1655
+ 0xB9AB: 1623,
1656
+ 0xB9B1: 1624,
1657
+ 0xB9B3: 1625,
1658
+ 0xB9B5: 1626,
1659
+ 0xB9B7: 1627,
1660
+ 0xB9B8: 1628,
1661
+ 0xB9B9: 1629,
1662
+ 0xB9BD: 1630,
1663
+ 0xB9C1: 1631,
1664
+ 0xB9C2: 1632,
1665
+ 0xB9C9: 1633,
1666
+ 0xB9D3: 1634,
1667
+ 0xB9D5: 1635,
1668
+ 0xB9D7: 1636,
1669
+ 0xB9E1: 1637,
1670
+ 0xB9F6: 1638,
1671
+ 0xB9F7: 1639,
1672
+ 0xBA41: 1640,
1673
+ 0xBA45: 1641,
1674
+ 0xBA49: 1642,
1675
+ 0xBA51: 1643,
1676
+ 0xBA53: 1644,
1677
+ 0xBA55: 1645,
1678
+ 0xBA57: 1646,
1679
+ 0xBA61: 1647,
1680
+ 0xBA62: 1648,
1681
+ 0xBA65: 1649,
1682
+ 0xBA77: 1650,
1683
+ 0xBA81: 1651,
1684
+ 0xBA82: 1652,
1685
+ 0xBA85: 1653,
1686
+ 0xBA89: 1654,
1687
+ 0xBA8A: 1655,
1688
+ 0xBA8B: 1656,
1689
+ 0xBA91: 1657,
1690
+ 0xBA93: 1658,
1691
+ 0xBA95: 1659,
1692
+ 0xBA97: 1660,
1693
+ 0xBAA1: 1661,
1694
+ 0xBAB6: 1662,
1695
+ 0xBAC1: 1663,
1696
+ 0xBAE1: 1664,
1697
+ 0xBAE2: 1665,
1698
+ 0xBAE5: 1666,
1699
+ 0xBAE9: 1667,
1700
+ 0xBAF1: 1668,
1701
+ 0xBAF3: 1669,
1702
+ 0xBAF5: 1670,
1703
+ 0xBB41: 1671,
1704
+ 0xBB45: 1672,
1705
+ 0xBB49: 1673,
1706
+ 0xBB51: 1674,
1707
+ 0xBB61: 1675,
1708
+ 0xBB62: 1676,
1709
+ 0xBB65: 1677,
1710
+ 0xBB69: 1678,
1711
+ 0xBB71: 1679,
1712
+ 0xBB73: 1680,
1713
+ 0xBB75: 1681,
1714
+ 0xBB77: 1682,
1715
+ 0xBBA1: 1683,
1716
+ 0xBBA2: 1684,
1717
+ 0xBBA5: 1685,
1718
+ 0xBBA8: 1686,
1719
+ 0xBBA9: 1687,
1720
+ 0xBBAB: 1688,
1721
+ 0xBBB1: 1689,
1722
+ 0xBBB3: 1690,
1723
+ 0xBBB5: 1691,
1724
+ 0xBBB7: 1692,
1725
+ 0xBBB8: 1693,
1726
+ 0xBBBB: 1694,
1727
+ 0xBBBC: 1695,
1728
+ 0xBC61: 1696,
1729
+ 0xBC62: 1697,
1730
+ 0xBC65: 1698,
1731
+ 0xBC67: 1699,
1732
+ 0xBC69: 1700,
1733
+ 0xBC6C: 1701,
1734
+ 0xBC71: 1702,
1735
+ 0xBC73: 1703,
1736
+ 0xBC75: 1704,
1737
+ 0xBC76: 1705,
1738
+ 0xBC77: 1706,
1739
+ 0xBC81: 1707,
1740
+ 0xBC82: 1708,
1741
+ 0xBC85: 1709,
1742
+ 0xBC89: 1710,
1743
+ 0xBC91: 1711,
1744
+ 0xBC93: 1712,
1745
+ 0xBC95: 1713,
1746
+ 0xBC96: 1714,
1747
+ 0xBC97: 1715,
1748
+ 0xBCA1: 1716,
1749
+ 0xBCA5: 1717,
1750
+ 0xBCB7: 1718,
1751
+ 0xBCE1: 1719,
1752
+ 0xBCE2: 1720,
1753
+ 0xBCE5: 1721,
1754
+ 0xBCE9: 1722,
1755
+ 0xBCF1: 1723,
1756
+ 0xBCF3: 1724,
1757
+ 0xBCF5: 1725,
1758
+ 0xBCF6: 1726,
1759
+ 0xBCF7: 1727,
1760
+ 0xBD41: 1728,
1761
+ 0xBD57: 1729,
1762
+ 0xBD61: 1730,
1763
+ 0xBD76: 1731,
1764
+ 0xBDA1: 1732,
1765
+ 0xBDA2: 1733,
1766
+ 0xBDA5: 1734,
1767
+ 0xBDA9: 1735,
1768
+ 0xBDB1: 1736,
1769
+ 0xBDB3: 1737,
1770
+ 0xBDB5: 1738,
1771
+ 0xBDB7: 1739,
1772
+ 0xBDB9: 1740,
1773
+ 0xBDC1: 1741,
1774
+ 0xBDC2: 1742,
1775
+ 0xBDC9: 1743,
1776
+ 0xBDD6: 1744,
1777
+ 0xBDE1: 1745,
1778
+ 0xBDF6: 1746,
1779
+ 0xBE41: 1747,
1780
+ 0xBE45: 1748,
1781
+ 0xBE49: 1749,
1782
+ 0xBE51: 1750,
1783
+ 0xBE53: 1751,
1784
+ 0xBE77: 1752,
1785
+ 0xBE81: 1753,
1786
+ 0xBE82: 1754,
1787
+ 0xBE85: 1755,
1788
+ 0xBE89: 1756,
1789
+ 0xBE91: 1757,
1790
+ 0xBE93: 1758,
1791
+ 0xBE97: 1759,
1792
+ 0xBEA1: 1760,
1793
+ 0xBEB6: 1761,
1794
+ 0xBEB7: 1762,
1795
+ 0xBEE1: 1763,
1796
+ 0xBF41: 1764,
1797
+ 0xBF61: 1765,
1798
+ 0xBF71: 1766,
1799
+ 0xBF75: 1767,
1800
+ 0xBF77: 1768,
1801
+ 0xBFA1: 1769,
1802
+ 0xBFA2: 1770,
1803
+ 0xBFA5: 1771,
1804
+ 0xBFA9: 1772,
1805
+ 0xBFB1: 1773,
1806
+ 0xBFB3: 1774,
1807
+ 0xBFB7: 1775,
1808
+ 0xBFB8: 1776,
1809
+ 0xBFBD: 1777,
1810
+ 0xC061: 1778,
1811
+ 0xC062: 1779,
1812
+ 0xC065: 1780,
1813
+ 0xC067: 1781,
1814
+ 0xC069: 1782,
1815
+ 0xC071: 1783,
1816
+ 0xC073: 1784,
1817
+ 0xC075: 1785,
1818
+ 0xC076: 1786,
1819
+ 0xC077: 1787,
1820
+ 0xC078: 1788,
1821
+ 0xC081: 1789,
1822
+ 0xC082: 1790,
1823
+ 0xC085: 1791,
1824
+ 0xC089: 1792,
1825
+ 0xC091: 1793,
1826
+ 0xC093: 1794,
1827
+ 0xC095: 1795,
1828
+ 0xC096: 1796,
1829
+ 0xC097: 1797,
1830
+ 0xC0A1: 1798,
1831
+ 0xC0A5: 1799,
1832
+ 0xC0A7: 1800,
1833
+ 0xC0A9: 1801,
1834
+ 0xC0B1: 1802,
1835
+ 0xC0B7: 1803,
1836
+ 0xC0E1: 1804,
1837
+ 0xC0E2: 1805,
1838
+ 0xC0E5: 1806,
1839
+ 0xC0E9: 1807,
1840
+ 0xC0F1: 1808,
1841
+ 0xC0F3: 1809,
1842
+ 0xC0F5: 1810,
1843
+ 0xC0F6: 1811,
1844
+ 0xC0F7: 1812,
1845
+ 0xC141: 1813,
1846
+ 0xC142: 1814,
1847
+ 0xC145: 1815,
1848
+ 0xC149: 1816,
1849
+ 0xC151: 1817,
1850
+ 0xC153: 1818,
1851
+ 0xC155: 1819,
1852
+ 0xC157: 1820,
1853
+ 0xC161: 1821,
1854
+ 0xC165: 1822,
1855
+ 0xC176: 1823,
1856
+ 0xC181: 1824,
1857
+ 0xC185: 1825,
1858
+ 0xC197: 1826,
1859
+ 0xC1A1: 1827,
1860
+ 0xC1A2: 1828,
1861
+ 0xC1A5: 1829,
1862
+ 0xC1A9: 1830,
1863
+ 0xC1B1: 1831,
1864
+ 0xC1B3: 1832,
1865
+ 0xC1B5: 1833,
1866
+ 0xC1B7: 1834,
1867
+ 0xC1C1: 1835,
1868
+ 0xC1C5: 1836,
1869
+ 0xC1C9: 1837,
1870
+ 0xC1D7: 1838,
1871
+ 0xC241: 1839,
1872
+ 0xC245: 1840,
1873
+ 0xC249: 1841,
1874
+ 0xC251: 1842,
1875
+ 0xC253: 1843,
1876
+ 0xC255: 1844,
1877
+ 0xC257: 1845,
1878
+ 0xC261: 1846,
1879
+ 0xC271: 1847,
1880
+ 0xC281: 1848,
1881
+ 0xC282: 1849,
1882
+ 0xC285: 1850,
1883
+ 0xC289: 1851,
1884
+ 0xC291: 1852,
1885
+ 0xC293: 1853,
1886
+ 0xC295: 1854,
1887
+ 0xC297: 1855,
1888
+ 0xC2A1: 1856,
1889
+ 0xC2B6: 1857,
1890
+ 0xC2C1: 1858,
1891
+ 0xC2C5: 1859,
1892
+ 0xC2E1: 1860,
1893
+ 0xC2E5: 1861,
1894
+ 0xC2E9: 1862,
1895
+ 0xC2F1: 1863,
1896
+ 0xC2F3: 1864,
1897
+ 0xC2F5: 1865,
1898
+ 0xC2F7: 1866,
1899
+ 0xC341: 1867,
1900
+ 0xC345: 1868,
1901
+ 0xC349: 1869,
1902
+ 0xC351: 1870,
1903
+ 0xC357: 1871,
1904
+ 0xC361: 1872,
1905
+ 0xC362: 1873,
1906
+ 0xC365: 1874,
1907
+ 0xC369: 1875,
1908
+ 0xC371: 1876,
1909
+ 0xC373: 1877,
1910
+ 0xC375: 1878,
1911
+ 0xC377: 1879,
1912
+ 0xC3A1: 1880,
1913
+ 0xC3A2: 1881,
1914
+ 0xC3A5: 1882,
1915
+ 0xC3A8: 1883,
1916
+ 0xC3A9: 1884,
1917
+ 0xC3AA: 1885,
1918
+ 0xC3B1: 1886,
1919
+ 0xC3B3: 1887,
1920
+ 0xC3B5: 1888,
1921
+ 0xC3B7: 1889,
1922
+ 0xC461: 1890,
1923
+ 0xC462: 1891,
1924
+ 0xC465: 1892,
1925
+ 0xC469: 1893,
1926
+ 0xC471: 1894,
1927
+ 0xC473: 1895,
1928
+ 0xC475: 1896,
1929
+ 0xC477: 1897,
1930
+ 0xC481: 1898,
1931
+ 0xC482: 1899,
1932
+ 0xC485: 1900,
1933
+ 0xC489: 1901,
1934
+ 0xC491: 1902,
1935
+ 0xC493: 1903,
1936
+ 0xC495: 1904,
1937
+ 0xC496: 1905,
1938
+ 0xC497: 1906,
1939
+ 0xC4A1: 1907,
1940
+ 0xC4A2: 1908,
1941
+ 0xC4B7: 1909,
1942
+ 0xC4E1: 1910,
1943
+ 0xC4E2: 1911,
1944
+ 0xC4E5: 1912,
1945
+ 0xC4E8: 1913,
1946
+ 0xC4E9: 1914,
1947
+ 0xC4F1: 1915,
1948
+ 0xC4F3: 1916,
1949
+ 0xC4F5: 1917,
1950
+ 0xC4F6: 1918,
1951
+ 0xC4F7: 1919,
1952
+ 0xC541: 1920,
1953
+ 0xC542: 1921,
1954
+ 0xC545: 1922,
1955
+ 0xC549: 1923,
1956
+ 0xC551: 1924,
1957
+ 0xC553: 1925,
1958
+ 0xC555: 1926,
1959
+ 0xC557: 1927,
1960
+ 0xC561: 1928,
1961
+ 0xC565: 1929,
1962
+ 0xC569: 1930,
1963
+ 0xC571: 1931,
1964
+ 0xC573: 1932,
1965
+ 0xC575: 1933,
1966
+ 0xC576: 1934,
1967
+ 0xC577: 1935,
1968
+ 0xC581: 1936,
1969
+ 0xC5A1: 1937,
1970
+ 0xC5A2: 1938,
1971
+ 0xC5A5: 1939,
1972
+ 0xC5A9: 1940,
1973
+ 0xC5B1: 1941,
1974
+ 0xC5B3: 1942,
1975
+ 0xC5B5: 1943,
1976
+ 0xC5B7: 1944,
1977
+ 0xC5C1: 1945,
1978
+ 0xC5C2: 1946,
1979
+ 0xC5C5: 1947,
1980
+ 0xC5C9: 1948,
1981
+ 0xC5D1: 1949,
1982
+ 0xC5D7: 1950,
1983
+ 0xC5E1: 1951,
1984
+ 0xC5F7: 1952,
1985
+ 0xC641: 1953,
1986
+ 0xC649: 1954,
1987
+ 0xC661: 1955,
1988
+ 0xC681: 1956,
1989
+ 0xC682: 1957,
1990
+ 0xC685: 1958,
1991
+ 0xC689: 1959,
1992
+ 0xC691: 1960,
1993
+ 0xC693: 1961,
1994
+ 0xC695: 1962,
1995
+ 0xC697: 1963,
1996
+ 0xC6A1: 1964,
1997
+ 0xC6A5: 1965,
1998
+ 0xC6A9: 1966,
1999
+ 0xC6B7: 1967,
2000
+ 0xC6C1: 1968,
2001
+ 0xC6D7: 1969,
2002
+ 0xC6E1: 1970,
2003
+ 0xC6E2: 1971,
2004
+ 0xC6E5: 1972,
2005
+ 0xC6E9: 1973,
2006
+ 0xC6F1: 1974,
2007
+ 0xC6F3: 1975,
2008
+ 0xC6F5: 1976,
2009
+ 0xC6F7: 1977,
2010
+ 0xC741: 1978,
2011
+ 0xC745: 1979,
2012
+ 0xC749: 1980,
2013
+ 0xC751: 1981,
2014
+ 0xC761: 1982,
2015
+ 0xC762: 1983,
2016
+ 0xC765: 1984,
2017
+ 0xC769: 1985,
2018
+ 0xC771: 1986,
2019
+ 0xC773: 1987,
2020
+ 0xC777: 1988,
2021
+ 0xC7A1: 1989,
2022
+ 0xC7A2: 1990,
2023
+ 0xC7A5: 1991,
2024
+ 0xC7A9: 1992,
2025
+ 0xC7B1: 1993,
2026
+ 0xC7B3: 1994,
2027
+ 0xC7B5: 1995,
2028
+ 0xC7B7: 1996,
2029
+ 0xC861: 1997,
2030
+ 0xC862: 1998,
2031
+ 0xC865: 1999,
2032
+ 0xC869: 2000,
2033
+ 0xC86A: 2001,
2034
+ 0xC871: 2002,
2035
+ 0xC873: 2003,
2036
+ 0xC875: 2004,
2037
+ 0xC876: 2005,
2038
+ 0xC877: 2006,
2039
+ 0xC881: 2007,
2040
+ 0xC882: 2008,
2041
+ 0xC885: 2009,
2042
+ 0xC889: 2010,
2043
+ 0xC891: 2011,
2044
+ 0xC893: 2012,
2045
+ 0xC895: 2013,
2046
+ 0xC896: 2014,
2047
+ 0xC897: 2015,
2048
+ 0xC8A1: 2016,
2049
+ 0xC8B7: 2017,
2050
+ 0xC8E1: 2018,
2051
+ 0xC8E2: 2019,
2052
+ 0xC8E5: 2020,
2053
+ 0xC8E9: 2021,
2054
+ 0xC8EB: 2022,
2055
+ 0xC8F1: 2023,
2056
+ 0xC8F3: 2024,
2057
+ 0xC8F5: 2025,
2058
+ 0xC8F6: 2026,
2059
+ 0xC8F7: 2027,
2060
+ 0xC941: 2028,
2061
+ 0xC942: 2029,
2062
+ 0xC945: 2030,
2063
+ 0xC949: 2031,
2064
+ 0xC951: 2032,
2065
+ 0xC953: 2033,
2066
+ 0xC955: 2034,
2067
+ 0xC957: 2035,
2068
+ 0xC961: 2036,
2069
+ 0xC965: 2037,
2070
+ 0xC976: 2038,
2071
+ 0xC981: 2039,
2072
+ 0xC985: 2040,
2073
+ 0xC9A1: 2041,
2074
+ 0xC9A2: 2042,
2075
+ 0xC9A5: 2043,
2076
+ 0xC9A9: 2044,
2077
+ 0xC9B1: 2045,
2078
+ 0xC9B3: 2046,
2079
+ 0xC9B5: 2047,
2080
+ 0xC9B7: 2048,
2081
+ 0xC9BC: 2049,
2082
+ 0xC9C1: 2050,
2083
+ 0xC9C5: 2051,
2084
+ 0xC9E1: 2052,
2085
+ 0xCA41: 2053,
2086
+ 0xCA45: 2054,
2087
+ 0xCA55: 2055,
2088
+ 0xCA57: 2056,
2089
+ 0xCA61: 2057,
2090
+ 0xCA81: 2058,
2091
+ 0xCA82: 2059,
2092
+ 0xCA85: 2060,
2093
+ 0xCA89: 2061,
2094
+ 0xCA91: 2062,
2095
+ 0xCA93: 2063,
2096
+ 0xCA95: 2064,
2097
+ 0xCA97: 2065,
2098
+ 0xCAA1: 2066,
2099
+ 0xCAB6: 2067,
2100
+ 0xCAC1: 2068,
2101
+ 0xCAE1: 2069,
2102
+ 0xCAE2: 2070,
2103
+ 0xCAE5: 2071,
2104
+ 0xCAE9: 2072,
2105
+ 0xCAF1: 2073,
2106
+ 0xCAF3: 2074,
2107
+ 0xCAF7: 2075,
2108
+ 0xCB41: 2076,
2109
+ 0xCB45: 2077,
2110
+ 0xCB49: 2078,
2111
+ 0xCB51: 2079,
2112
+ 0xCB57: 2080,
2113
+ 0xCB61: 2081,
2114
+ 0xCB62: 2082,
2115
+ 0xCB65: 2083,
2116
+ 0xCB68: 2084,
2117
+ 0xCB69: 2085,
2118
+ 0xCB6B: 2086,
2119
+ 0xCB71: 2087,
2120
+ 0xCB73: 2088,
2121
+ 0xCB75: 2089,
2122
+ 0xCB81: 2090,
2123
+ 0xCB85: 2091,
2124
+ 0xCB89: 2092,
2125
+ 0xCB91: 2093,
2126
+ 0xCB93: 2094,
2127
+ 0xCBA1: 2095,
2128
+ 0xCBA2: 2096,
2129
+ 0xCBA5: 2097,
2130
+ 0xCBA9: 2098,
2131
+ 0xCBB1: 2099,
2132
+ 0xCBB3: 2100,
2133
+ 0xCBB5: 2101,
2134
+ 0xCBB7: 2102,
2135
+ 0xCC61: 2103,
2136
+ 0xCC62: 2104,
2137
+ 0xCC63: 2105,
2138
+ 0xCC65: 2106,
2139
+ 0xCC69: 2107,
2140
+ 0xCC6B: 2108,
2141
+ 0xCC71: 2109,
2142
+ 0xCC73: 2110,
2143
+ 0xCC75: 2111,
2144
+ 0xCC76: 2112,
2145
+ 0xCC77: 2113,
2146
+ 0xCC7B: 2114,
2147
+ 0xCC81: 2115,
2148
+ 0xCC82: 2116,
2149
+ 0xCC85: 2117,
2150
+ 0xCC89: 2118,
2151
+ 0xCC91: 2119,
2152
+ 0xCC93: 2120,
2153
+ 0xCC95: 2121,
2154
+ 0xCC96: 2122,
2155
+ 0xCC97: 2123,
2156
+ 0xCCA1: 2124,
2157
+ 0xCCA2: 2125,
2158
+ 0xCCE1: 2126,
2159
+ 0xCCE2: 2127,
2160
+ 0xCCE5: 2128,
2161
+ 0xCCE9: 2129,
2162
+ 0xCCF1: 2130,
2163
+ 0xCCF3: 2131,
2164
+ 0xCCF5: 2132,
2165
+ 0xCCF6: 2133,
2166
+ 0xCCF7: 2134,
2167
+ 0xCD41: 2135,
2168
+ 0xCD42: 2136,
2169
+ 0xCD45: 2137,
2170
+ 0xCD49: 2138,
2171
+ 0xCD51: 2139,
2172
+ 0xCD53: 2140,
2173
+ 0xCD55: 2141,
2174
+ 0xCD57: 2142,
2175
+ 0xCD61: 2143,
2176
+ 0xCD65: 2144,
2177
+ 0xCD69: 2145,
2178
+ 0xCD71: 2146,
2179
+ 0xCD73: 2147,
2180
+ 0xCD76: 2148,
2181
+ 0xCD77: 2149,
2182
+ 0xCD81: 2150,
2183
+ 0xCD89: 2151,
2184
+ 0xCD93: 2152,
2185
+ 0xCD95: 2153,
2186
+ 0xCDA1: 2154,
2187
+ 0xCDA2: 2155,
2188
+ 0xCDA5: 2156,
2189
+ 0xCDA9: 2157,
2190
+ 0xCDB1: 2158,
2191
+ 0xCDB3: 2159,
2192
+ 0xCDB5: 2160,
2193
+ 0xCDB7: 2161,
2194
+ 0xCDC1: 2162,
2195
+ 0xCDD7: 2163,
2196
+ 0xCE41: 2164,
2197
+ 0xCE45: 2165,
2198
+ 0xCE61: 2166,
2199
+ 0xCE65: 2167,
2200
+ 0xCE69: 2168,
2201
+ 0xCE73: 2169,
2202
+ 0xCE75: 2170,
2203
+ 0xCE81: 2171,
2204
+ 0xCE82: 2172,
2205
+ 0xCE85: 2173,
2206
+ 0xCE88: 2174,
2207
+ 0xCE89: 2175,
2208
+ 0xCE8B: 2176,
2209
+ 0xCE91: 2177,
2210
+ 0xCE93: 2178,
2211
+ 0xCE95: 2179,
2212
+ 0xCE97: 2180,
2213
+ 0xCEA1: 2181,
2214
+ 0xCEB7: 2182,
2215
+ 0xCEE1: 2183,
2216
+ 0xCEE5: 2184,
2217
+ 0xCEE9: 2185,
2218
+ 0xCEF1: 2186,
2219
+ 0xCEF5: 2187,
2220
+ 0xCF41: 2188,
2221
+ 0xCF45: 2189,
2222
+ 0xCF49: 2190,
2223
+ 0xCF51: 2191,
2224
+ 0xCF55: 2192,
2225
+ 0xCF57: 2193,
2226
+ 0xCF61: 2194,
2227
+ 0xCF65: 2195,
2228
+ 0xCF69: 2196,
2229
+ 0xCF71: 2197,
2230
+ 0xCF73: 2198,
2231
+ 0xCF75: 2199,
2232
+ 0xCFA1: 2200,
2233
+ 0xCFA2: 2201,
2234
+ 0xCFA5: 2202,
2235
+ 0xCFA9: 2203,
2236
+ 0xCFB1: 2204,
2237
+ 0xCFB3: 2205,
2238
+ 0xCFB5: 2206,
2239
+ 0xCFB7: 2207,
2240
+ 0xD061: 2208,
2241
+ 0xD062: 2209,
2242
+ 0xD065: 2210,
2243
+ 0xD069: 2211,
2244
+ 0xD06E: 2212,
2245
+ 0xD071: 2213,
2246
+ 0xD073: 2214,
2247
+ 0xD075: 2215,
2248
+ 0xD077: 2216,
2249
+ 0xD081: 2217,
2250
+ 0xD082: 2218,
2251
+ 0xD085: 2219,
2252
+ 0xD089: 2220,
2253
+ 0xD091: 2221,
2254
+ 0xD093: 2222,
2255
+ 0xD095: 2223,
2256
+ 0xD096: 2224,
2257
+ 0xD097: 2225,
2258
+ 0xD0A1: 2226,
2259
+ 0xD0B7: 2227,
2260
+ 0xD0E1: 2228,
2261
+ 0xD0E2: 2229,
2262
+ 0xD0E5: 2230,
2263
+ 0xD0E9: 2231,
2264
+ 0xD0EB: 2232,
2265
+ 0xD0F1: 2233,
2266
+ 0xD0F3: 2234,
2267
+ 0xD0F5: 2235,
2268
+ 0xD0F7: 2236,
2269
+ 0xD141: 2237,
2270
+ 0xD142: 2238,
2271
+ 0xD145: 2239,
2272
+ 0xD149: 2240,
2273
+ 0xD151: 2241,
2274
+ 0xD153: 2242,
2275
+ 0xD155: 2243,
2276
+ 0xD157: 2244,
2277
+ 0xD161: 2245,
2278
+ 0xD162: 2246,
2279
+ 0xD165: 2247,
2280
+ 0xD169: 2248,
2281
+ 0xD171: 2249,
2282
+ 0xD173: 2250,
2283
+ 0xD175: 2251,
2284
+ 0xD176: 2252,
2285
+ 0xD177: 2253,
2286
+ 0xD181: 2254,
2287
+ 0xD185: 2255,
2288
+ 0xD189: 2256,
2289
+ 0xD193: 2257,
2290
+ 0xD1A1: 2258,
2291
+ 0xD1A2: 2259,
2292
+ 0xD1A5: 2260,
2293
+ 0xD1A9: 2261,
2294
+ 0xD1AE: 2262,
2295
+ 0xD1B1: 2263,
2296
+ 0xD1B3: 2264,
2297
+ 0xD1B5: 2265,
2298
+ 0xD1B7: 2266,
2299
+ 0xD1BB: 2267,
2300
+ 0xD1C1: 2268,
2301
+ 0xD1C2: 2269,
2302
+ 0xD1C5: 2270,
2303
+ 0xD1C9: 2271,
2304
+ 0xD1D5: 2272,
2305
+ 0xD1D7: 2273,
2306
+ 0xD1E1: 2274,
2307
+ 0xD1E2: 2275,
2308
+ 0xD1E5: 2276,
2309
+ 0xD1F5: 2277,
2310
+ 0xD1F7: 2278,
2311
+ 0xD241: 2279,
2312
+ 0xD242: 2280,
2313
+ 0xD245: 2281,
2314
+ 0xD249: 2282,
2315
+ 0xD253: 2283,
2316
+ 0xD255: 2284,
2317
+ 0xD257: 2285,
2318
+ 0xD261: 2286,
2319
+ 0xD265: 2287,
2320
+ 0xD269: 2288,
2321
+ 0xD273: 2289,
2322
+ 0xD275: 2290,
2323
+ 0xD281: 2291,
2324
+ 0xD282: 2292,
2325
+ 0xD285: 2293,
2326
+ 0xD289: 2294,
2327
+ 0xD28E: 2295,
2328
+ 0xD291: 2296,
2329
+ 0xD295: 2297,
2330
+ 0xD297: 2298,
2331
+ 0xD2A1: 2299,
2332
+ 0xD2A5: 2300,
2333
+ 0xD2A9: 2301,
2334
+ 0xD2B1: 2302,
2335
+ 0xD2B7: 2303,
2336
+ 0xD2C1: 2304,
2337
+ 0xD2C2: 2305,
2338
+ 0xD2C5: 2306,
2339
+ 0xD2C9: 2307,
2340
+ 0xD2D7: 2308,
2341
+ 0xD2E1: 2309,
2342
+ 0xD2E2: 2310,
2343
+ 0xD2E5: 2311,
2344
+ 0xD2E9: 2312,
2345
+ 0xD2F1: 2313,
2346
+ 0xD2F3: 2314,
2347
+ 0xD2F5: 2315,
2348
+ 0xD2F7: 2316,
2349
+ 0xD341: 2317,
2350
+ 0xD342: 2318,
2351
+ 0xD345: 2319,
2352
+ 0xD349: 2320,
2353
+ 0xD351: 2321,
2354
+ 0xD355: 2322,
2355
+ 0xD357: 2323,
2356
+ 0xD361: 2324,
2357
+ 0xD362: 2325,
2358
+ 0xD365: 2326,
2359
+ 0xD367: 2327,
2360
+ 0xD368: 2328,
2361
+ 0xD369: 2329,
2362
+ 0xD36A: 2330,
2363
+ 0xD371: 2331,
2364
+ 0xD373: 2332,
2365
+ 0xD375: 2333,
2366
+ 0xD377: 2334,
2367
+ 0xD37B: 2335,
2368
+ 0xD381: 2336,
2369
+ 0xD385: 2337,
2370
+ 0xD389: 2338,
2371
+ 0xD391: 2339,
2372
+ 0xD393: 2340,
2373
+ 0xD397: 2341,
2374
+ 0xD3A1: 2342,
2375
+ 0xD3A2: 2343,
2376
+ 0xD3A5: 2344,
2377
+ 0xD3A9: 2345,
2378
+ 0xD3B1: 2346,
2379
+ 0xD3B3: 2347,
2380
+ 0xD3B5: 2348,
2381
+ 0xD3B7: 2349,
2382
+ }
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/johabprober.py ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from .chardistribution import JOHABDistributionAnalysis
29
+ from .codingstatemachine import CodingStateMachine
30
+ from .mbcharsetprober import MultiByteCharSetProber
31
+ from .mbcssm import JOHAB_SM_MODEL
32
+
33
+
34
+ class JOHABProber(MultiByteCharSetProber):
35
+ def __init__(self) -> None:
36
+ super().__init__()
37
+ self.coding_sm = CodingStateMachine(JOHAB_SM_MODEL)
38
+ self.distribution_analyzer = JOHABDistributionAnalysis()
39
+ self.reset()
40
+
41
+ @property
42
+ def charset_name(self) -> str:
43
+ return "Johab"
44
+
45
+ @property
46
+ def language(self) -> str:
47
+ return "Korean"
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/jpcntx.py ADDED
@@ -0,0 +1,238 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Communicator client code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from typing import List, Tuple, Union
29
+
30
+ # This is hiragana 2-char sequence table, the number in each cell represents its frequency category
31
+ # fmt: off
32
+ jp2_char_context = (
33
+ (0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1),
34
+ (2, 4, 0, 4, 0, 3, 0, 4, 0, 3, 4, 4, 4, 2, 4, 3, 3, 4, 3, 2, 3, 3, 4, 2, 3, 3, 3, 2, 4, 1, 4, 3, 3, 1, 5, 4, 3, 4, 3, 4, 3, 5, 3, 0, 3, 5, 4, 2, 0, 3, 1, 0, 3, 3, 0, 3, 3, 0, 1, 1, 0, 4, 3, 0, 3, 3, 0, 4, 0, 2, 0, 3, 5, 5, 5, 5, 4, 0, 4, 1, 0, 3, 4),
35
+ (0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2),
36
+ (0, 4, 0, 5, 0, 5, 0, 4, 0, 4, 5, 4, 4, 3, 5, 3, 5, 1, 5, 3, 4, 3, 4, 4, 3, 4, 3, 3, 4, 3, 5, 4, 4, 3, 5, 5, 3, 5, 5, 5, 3, 5, 5, 3, 4, 5, 5, 3, 1, 3, 2, 0, 3, 4, 0, 4, 2, 0, 4, 2, 1, 5, 3, 2, 3, 5, 0, 4, 0, 2, 0, 5, 4, 4, 5, 4, 5, 0, 4, 0, 0, 4, 4),
37
+ (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0),
38
+ (0, 3, 0, 4, 0, 3, 0, 3, 0, 4, 5, 4, 3, 3, 3, 3, 4, 3, 5, 4, 4, 3, 5, 4, 4, 3, 4, 3, 4, 4, 4, 4, 5, 3, 4, 4, 3, 4, 5, 5, 4, 5, 5, 1, 4, 5, 4, 3, 0, 3, 3, 1, 3, 3, 0, 4, 4, 0, 3, 3, 1, 5, 3, 3, 3, 5, 0, 4, 0, 3, 0, 4, 4, 3, 4, 3, 3, 0, 4, 1, 1, 3, 4),
39
+ (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0),
40
+ (0, 4, 0, 3, 0, 3, 0, 4, 0, 3, 4, 4, 3, 2, 2, 1, 2, 1, 3, 1, 3, 3, 3, 3, 3, 4, 3, 1, 3, 3, 5, 3, 3, 0, 4, 3, 0, 5, 4, 3, 3, 5, 4, 4, 3, 4, 4, 5, 0, 1, 2, 0, 1, 2, 0, 2, 2, 0, 1, 0, 0, 5, 2, 2, 1, 4, 0, 3, 0, 1, 0, 4, 4, 3, 5, 4, 3, 0, 2, 1, 0, 4, 3),
41
+ (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0),
42
+ (0, 3, 0, 5, 0, 4, 0, 2, 1, 4, 4, 2, 4, 1, 4, 2, 4, 2, 4, 3, 3, 3, 4, 3, 3, 3, 3, 1, 4, 2, 3, 3, 3, 1, 4, 4, 1, 1, 1, 4, 3, 3, 2, 0, 2, 4, 3, 2, 0, 3, 3, 0, 3, 1, 1, 0, 0, 0, 3, 3, 0, 4, 2, 2, 3, 4, 0, 4, 0, 3, 0, 4, 4, 5, 3, 4, 4, 0, 3, 0, 0, 1, 4),
43
+ (1, 4, 0, 4, 0, 4, 0, 4, 0, 3, 5, 4, 4, 3, 4, 3, 5, 4, 3, 3, 4, 3, 5, 4, 4, 4, 4, 3, 4, 2, 4, 3, 3, 1, 5, 4, 3, 2, 4, 5, 4, 5, 5, 4, 4, 5, 4, 4, 0, 3, 2, 2, 3, 3, 0, 4, 3, 1, 3, 2, 1, 4, 3, 3, 4, 5, 0, 3, 0, 2, 0, 4, 5, 5, 4, 5, 4, 0, 4, 0, 0, 5, 4),
44
+ (0, 5, 0, 5, 0, 4, 0, 3, 0, 4, 4, 3, 4, 3, 3, 3, 4, 0, 4, 4, 4, 3, 4, 3, 4, 3, 3, 1, 4, 2, 4, 3, 4, 0, 5, 4, 1, 4, 5, 4, 4, 5, 3, 2, 4, 3, 4, 3, 2, 4, 1, 3, 3, 3, 2, 3, 2, 0, 4, 3, 3, 4, 3, 3, 3, 4, 0, 4, 0, 3, 0, 4, 5, 4, 4, 4, 3, 0, 4, 1, 0, 1, 3),
45
+ (0, 3, 1, 4, 0, 3, 0, 2, 0, 3, 4, 4, 3, 1, 4, 2, 3, 3, 4, 3, 4, 3, 4, 3, 4, 4, 3, 2, 3, 1, 5, 4, 4, 1, 4, 4, 3, 5, 4, 4, 3, 5, 5, 4, 3, 4, 4, 3, 1, 2, 3, 1, 2, 2, 0, 3, 2, 0, 3, 1, 0, 5, 3, 3, 3, 4, 3, 3, 3, 3, 4, 4, 4, 4, 5, 4, 2, 0, 3, 3, 2, 4, 3),
46
+ (0, 2, 0, 3, 0, 1, 0, 1, 0, 0, 3, 2, 0, 0, 2, 0, 1, 0, 2, 1, 3, 3, 3, 1, 2, 3, 1, 0, 1, 0, 4, 2, 1, 1, 3, 3, 0, 4, 3, 3, 1, 4, 3, 3, 0, 3, 3, 2, 0, 0, 0, 0, 1, 0, 0, 2, 0, 0, 0, 0, 0, 4, 1, 0, 2, 3, 2, 2, 2, 1, 3, 3, 3, 4, 4, 3, 2, 0, 3, 1, 0, 3, 3),
47
+ (0, 4, 0, 4, 0, 3, 0, 3, 0, 4, 4, 4, 3, 3, 3, 3, 3, 3, 4, 3, 4, 2, 4, 3, 4, 3, 3, 2, 4, 3, 4, 5, 4, 1, 4, 5, 3, 5, 4, 5, 3, 5, 4, 0, 3, 5, 5, 3, 1, 3, 3, 2, 2, 3, 0, 3, 4, 1, 3, 3, 2, 4, 3, 3, 3, 4, 0, 4, 0, 3, 0, 4, 5, 4, 4, 5, 3, 0, 4, 1, 0, 3, 4),
48
+ (0, 2, 0, 3, 0, 3, 0, 0, 0, 2, 2, 2, 1, 0, 1, 0, 0, 0, 3, 0, 3, 0, 3, 0, 1, 3, 1, 0, 3, 1, 3, 3, 3, 1, 3, 3, 3, 0, 1, 3, 1, 3, 4, 0, 0, 3, 1, 1, 0, 3, 2, 0, 0, 0, 0, 1, 3, 0, 1, 0, 0, 3, 3, 2, 0, 3, 0, 0, 0, 0, 0, 3, 4, 3, 4, 3, 3, 0, 3, 0, 0, 2, 3),
49
+ (2, 3, 0, 3, 0, 2, 0, 1, 0, 3, 3, 4, 3, 1, 3, 1, 1, 1, 3, 1, 4, 3, 4, 3, 3, 3, 0, 0, 3, 1, 5, 4, 3, 1, 4, 3, 2, 5, 5, 4, 4, 4, 4, 3, 3, 4, 4, 4, 0, 2, 1, 1, 3, 2, 0, 1, 2, 0, 0, 1, 0, 4, 1, 3, 3, 3, 0, 3, 0, 1, 0, 4, 4, 4, 5, 5, 3, 0, 2, 0, 0, 4, 4),
50
+ (0, 2, 0, 1, 0, 3, 1, 3, 0, 2, 3, 3, 3, 0, 3, 1, 0, 0, 3, 0, 3, 2, 3, 1, 3, 2, 1, 1, 0, 0, 4, 2, 1, 0, 2, 3, 1, 4, 3, 2, 0, 4, 4, 3, 1, 3, 1, 3, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 4, 1, 1, 1, 2, 0, 3, 0, 0, 0, 3, 4, 2, 4, 3, 2, 0, 1, 0, 0, 3, 3),
51
+ (0, 1, 0, 4, 0, 5, 0, 4, 0, 2, 4, 4, 2, 3, 3, 2, 3, 3, 5, 3, 3, 3, 4, 3, 4, 2, 3, 0, 4, 3, 3, 3, 4, 1, 4, 3, 2, 1, 5, 5, 3, 4, 5, 1, 3, 5, 4, 2, 0, 3, 3, 0, 1, 3, 0, 4, 2, 0, 1, 3, 1, 4, 3, 3, 3, 3, 0, 3, 0, 1, 0, 3, 4, 4, 4, 5, 5, 0, 3, 0, 1, 4, 5),
52
+ (0, 2, 0, 3, 0, 3, 0, 0, 0, 2, 3, 1, 3, 0, 4, 0, 1, 1, 3, 0, 3, 4, 3, 2, 3, 1, 0, 3, 3, 2, 3, 1, 3, 0, 2, 3, 0, 2, 1, 4, 1, 2, 2, 0, 0, 3, 3, 0, 0, 2, 0, 0, 0, 1, 0, 0, 0, 0, 2, 2, 0, 3, 2, 1, 3, 3, 0, 2, 0, 2, 0, 0, 3, 3, 1, 2, 4, 0, 3, 0, 2, 2, 3),
53
+ (2, 4, 0, 5, 0, 4, 0, 4, 0, 2, 4, 4, 4, 3, 4, 3, 3, 3, 1, 2, 4, 3, 4, 3, 4, 4, 5, 0, 3, 3, 3, 3, 2, 0, 4, 3, 1, 4, 3, 4, 1, 4, 4, 3, 3, 4, 4, 3, 1, 2, 3, 0, 4, 2, 0, 4, 1, 0, 3, 3, 0, 4, 3, 3, 3, 4, 0, 4, 0, 2, 0, 3, 5, 3, 4, 5, 2, 0, 3, 0, 0, 4, 5),
54
+ (0, 3, 0, 4, 0, 1, 0, 1, 0, 1, 3, 2, 2, 1, 3, 0, 3, 0, 2, 0, 2, 0, 3, 0, 2, 0, 0, 0, 1, 0, 1, 1, 0, 0, 3, 1, 0, 0, 0, 4, 0, 3, 1, 0, 2, 1, 3, 0, 0, 0, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0, 0, 4, 2, 2, 3, 1, 0, 3, 0, 0, 0, 1, 4, 4, 4, 3, 0, 0, 4, 0, 0, 1, 4),
55
+ (1, 4, 1, 5, 0, 3, 0, 3, 0, 4, 5, 4, 4, 3, 5, 3, 3, 4, 4, 3, 4, 1, 3, 3, 3, 3, 2, 1, 4, 1, 5, 4, 3, 1, 4, 4, 3, 5, 4, 4, 3, 5, 4, 3, 3, 4, 4, 4, 0, 3, 3, 1, 2, 3, 0, 3, 1, 0, 3, 3, 0, 5, 4, 4, 4, 4, 4, 4, 3, 3, 5, 4, 4, 3, 3, 5, 4, 0, 3, 2, 0, 4, 4),
56
+ (0, 2, 0, 3, 0, 1, 0, 0, 0, 1, 3, 3, 3, 2, 4, 1, 3, 0, 3, 1, 3, 0, 2, 2, 1, 1, 0, 0, 2, 0, 4, 3, 1, 0, 4, 3, 0, 4, 4, 4, 1, 4, 3, 1, 1, 3, 3, 1, 0, 2, 0, 0, 1, 3, 0, 0, 0, 0, 2, 0, 0, 4, 3, 2, 4, 3, 5, 4, 3, 3, 3, 4, 3, 3, 4, 3, 3, 0, 2, 1, 0, 3, 3),
57
+ (0, 2, 0, 4, 0, 3, 0, 2, 0, 2, 5, 5, 3, 4, 4, 4, 4, 1, 4, 3, 3, 0, 4, 3, 4, 3, 1, 3, 3, 2, 4, 3, 0, 3, 4, 3, 0, 3, 4, 4, 2, 4, 4, 0, 4, 5, 3, 3, 2, 2, 1, 1, 1, 2, 0, 1, 5, 0, 3, 3, 2, 4, 3, 3, 3, 4, 0, 3, 0, 2, 0, 4, 4, 3, 5, 5, 0, 0, 3, 0, 2, 3, 3),
58
+ (0, 3, 0, 4, 0, 3, 0, 1, 0, 3, 4, 3, 3, 1, 3, 3, 3, 0, 3, 1, 3, 0, 4, 3, 3, 1, 1, 0, 3, 0, 3, 3, 0, 0, 4, 4, 0, 1, 5, 4, 3, 3, 5, 0, 3, 3, 4, 3, 0, 2, 0, 1, 1, 1, 0, 1, 3, 0, 1, 2, 1, 3, 3, 2, 3, 3, 0, 3, 0, 1, 0, 1, 3, 3, 4, 4, 1, 0, 1, 2, 2, 1, 3),
59
+ (0, 1, 0, 4, 0, 4, 0, 3, 0, 1, 3, 3, 3, 2, 3, 1, 1, 0, 3, 0, 3, 3, 4, 3, 2, 4, 2, 0, 1, 0, 4, 3, 2, 0, 4, 3, 0, 5, 3, 3, 2, 4, 4, 4, 3, 3, 3, 4, 0, 1, 3, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 4, 2, 3, 3, 3, 0, 3, 0, 0, 0, 4, 4, 4, 5, 3, 2, 0, 3, 3, 0, 3, 5),
60
+ (0, 2, 0, 3, 0, 0, 0, 3, 0, 1, 3, 0, 2, 0, 0, 0, 1, 0, 3, 1, 1, 3, 3, 0, 0, 3, 0, 0, 3, 0, 2, 3, 1, 0, 3, 1, 0, 3, 3, 2, 0, 4, 2, 2, 0, 2, 0, 0, 0, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 2, 0, 1, 0, 1, 0, 0, 0, 1, 3, 1, 2, 0, 0, 0, 1, 0, 0, 1, 4),
61
+ (0, 3, 0, 3, 0, 5, 0, 1, 0, 2, 4, 3, 1, 3, 3, 2, 1, 1, 5, 2, 1, 0, 5, 1, 2, 0, 0, 0, 3, 3, 2, 2, 3, 2, 4, 3, 0, 0, 3, 3, 1, 3, 3, 0, 2, 5, 3, 4, 0, 3, 3, 0, 1, 2, 0, 2, 2, 0, 3, 2, 0, 2, 2, 3, 3, 3, 0, 2, 0, 1, 0, 3, 4, 4, 2, 5, 4, 0, 3, 0, 0, 3, 5),
62
+ (0, 3, 0, 3, 0, 3, 0, 1, 0, 3, 3, 3, 3, 0, 3, 0, 2, 0, 2, 1, 1, 0, 2, 0, 1, 0, 0, 0, 2, 1, 0, 0, 1, 0, 3, 2, 0, 0, 3, 3, 1, 2, 3, 1, 0, 3, 3, 0, 0, 1, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 2, 3, 1, 2, 3, 0, 3, 0, 1, 0, 3, 2, 1, 0, 4, 3, 0, 1, 1, 0, 3, 3),
63
+ (0, 4, 0, 5, 0, 3, 0, 3, 0, 4, 5, 5, 4, 3, 5, 3, 4, 3, 5, 3, 3, 2, 5, 3, 4, 4, 4, 3, 4, 3, 4, 5, 5, 3, 4, 4, 3, 4, 4, 5, 4, 4, 4, 3, 4, 5, 5, 4, 2, 3, 4, 2, 3, 4, 0, 3, 3, 1, 4, 3, 2, 4, 3, 3, 5, 5, 0, 3, 0, 3, 0, 5, 5, 5, 5, 4, 4, 0, 4, 0, 1, 4, 4),
64
+ (0, 4, 0, 4, 0, 3, 0, 3, 0, 3, 5, 4, 4, 2, 3, 2, 5, 1, 3, 2, 5, 1, 4, 2, 3, 2, 3, 3, 4, 3, 3, 3, 3, 2, 5, 4, 1, 3, 3, 5, 3, 4, 4, 0, 4, 4, 3, 1, 1, 3, 1, 0, 2, 3, 0, 2, 3, 0, 3, 0, 0, 4, 3, 1, 3, 4, 0, 3, 0, 2, 0, 4, 4, 4, 3, 4, 5, 0, 4, 0, 0, 3, 4),
65
+ (0, 3, 0, 3, 0, 3, 1, 2, 0, 3, 4, 4, 3, 3, 3, 0, 2, 2, 4, 3, 3, 1, 3, 3, 3, 1, 1, 0, 3, 1, 4, 3, 2, 3, 4, 4, 2, 4, 4, 4, 3, 4, 4, 3, 2, 4, 4, 3, 1, 3, 3, 1, 3, 3, 0, 4, 1, 0, 2, 2, 1, 4, 3, 2, 3, 3, 5, 4, 3, 3, 5, 4, 4, 3, 3, 0, 4, 0, 3, 2, 2, 4, 4),
66
+ (0, 2, 0, 1, 0, 0, 0, 0, 0, 1, 2, 1, 3, 0, 0, 0, 0, 0, 2, 0, 1, 2, 1, 0, 0, 1, 0, 0, 0, 0, 3, 0, 0, 1, 0, 1, 1, 3, 1, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 2, 2, 0, 3, 4, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1),
67
+ (0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 4, 0, 4, 1, 4, 0, 3, 0, 4, 0, 3, 0, 4, 0, 3, 0, 3, 0, 4, 1, 5, 1, 4, 0, 0, 3, 0, 5, 0, 5, 2, 0, 1, 0, 0, 0, 2, 1, 4, 0, 1, 3, 0, 0, 3, 0, 0, 3, 1, 1, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0),
68
+ (1, 4, 0, 5, 0, 3, 0, 2, 0, 3, 5, 4, 4, 3, 4, 3, 5, 3, 4, 3, 3, 0, 4, 3, 3, 3, 3, 3, 3, 2, 4, 4, 3, 1, 3, 4, 4, 5, 4, 4, 3, 4, 4, 1, 3, 5, 4, 3, 3, 3, 1, 2, 2, 3, 3, 1, 3, 1, 3, 3, 3, 5, 3, 3, 4, 5, 0, 3, 0, 3, 0, 3, 4, 3, 4, 4, 3, 0, 3, 0, 2, 4, 3),
69
+ (0, 1, 0, 4, 0, 0, 0, 0, 0, 1, 4, 0, 4, 1, 4, 2, 4, 0, 3, 0, 1, 0, 1, 0, 0, 0, 0, 0, 2, 0, 3, 1, 1, 1, 0, 3, 0, 0, 0, 1, 2, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 3, 0, 0, 0, 0, 3, 2, 0, 2, 2, 0, 1, 0, 0, 0, 2, 3, 2, 3, 3, 0, 0, 0, 0, 2, 1, 0),
70
+ (0, 5, 1, 5, 0, 3, 0, 3, 0, 5, 4, 4, 5, 1, 5, 3, 3, 0, 4, 3, 4, 3, 5, 3, 4, 3, 3, 2, 4, 3, 4, 3, 3, 0, 3, 3, 1, 4, 4, 3, 4, 4, 4, 3, 4, 5, 5, 3, 2, 3, 1, 1, 3, 3, 1, 3, 1, 1, 3, 3, 2, 4, 5, 3, 3, 5, 0, 4, 0, 3, 0, 4, 4, 3, 5, 3, 3, 0, 3, 4, 0, 4, 3),
71
+ (0, 5, 0, 5, 0, 3, 0, 2, 0, 4, 4, 3, 5, 2, 4, 3, 3, 3, 4, 4, 4, 3, 5, 3, 5, 3, 3, 1, 4, 0, 4, 3, 3, 0, 3, 3, 0, 4, 4, 4, 4, 5, 4, 3, 3, 5, 5, 3, 2, 3, 1, 2, 3, 2, 0, 1, 0, 0, 3, 2, 2, 4, 4, 3, 1, 5, 0, 4, 0, 3, 0, 4, 3, 1, 3, 2, 1, 0, 3, 3, 0, 3, 3),
72
+ (0, 4, 0, 5, 0, 5, 0, 4, 0, 4, 5, 5, 5, 3, 4, 3, 3, 2, 5, 4, 4, 3, 5, 3, 5, 3, 4, 0, 4, 3, 4, 4, 3, 2, 4, 4, 3, 4, 5, 4, 4, 5, 5, 0, 3, 5, 5, 4, 1, 3, 3, 2, 3, 3, 1, 3, 1, 0, 4, 3, 1, 4, 4, 3, 4, 5, 0, 4, 0, 2, 0, 4, 3, 4, 4, 3, 3, 0, 4, 0, 0, 5, 5),
73
+ (0, 4, 0, 4, 0, 5, 0, 1, 1, 3, 3, 4, 4, 3, 4, 1, 3, 0, 5, 1, 3, 0, 3, 1, 3, 1, 1, 0, 3, 0, 3, 3, 4, 0, 4, 3, 0, 4, 4, 4, 3, 4, 4, 0, 3, 5, 4, 1, 0, 3, 0, 0, 2, 3, 0, 3, 1, 0, 3, 1, 0, 3, 2, 1, 3, 5, 0, 3, 0, 1, 0, 3, 2, 3, 3, 4, 4, 0, 2, 2, 0, 4, 4),
74
+ (2, 4, 0, 5, 0, 4, 0, 3, 0, 4, 5, 5, 4, 3, 5, 3, 5, 3, 5, 3, 5, 2, 5, 3, 4, 3, 3, 4, 3, 4, 5, 3, 2, 1, 5, 4, 3, 2, 3, 4, 5, 3, 4, 1, 2, 5, 4, 3, 0, 3, 3, 0, 3, 2, 0, 2, 3, 0, 4, 1, 0, 3, 4, 3, 3, 5, 0, 3, 0, 1, 0, 4, 5, 5, 5, 4, 3, 0, 4, 2, 0, 3, 5),
75
+ (0, 5, 0, 4, 0, 4, 0, 2, 0, 5, 4, 3, 4, 3, 4, 3, 3, 3, 4, 3, 4, 2, 5, 3, 5, 3, 4, 1, 4, 3, 4, 4, 4, 0, 3, 5, 0, 4, 4, 4, 4, 5, 3, 1, 3, 4, 5, 3, 3, 3, 3, 3, 3, 3, 0, 2, 2, 0, 3, 3, 2, 4, 3, 3, 3, 5, 3, 4, 1, 3, 3, 5, 3, 2, 0, 0, 0, 0, 4, 3, 1, 3, 3),
76
+ (0, 1, 0, 3, 0, 3, 0, 1, 0, 1, 3, 3, 3, 2, 3, 3, 3, 0, 3, 0, 0, 0, 3, 1, 3, 0, 0, 0, 2, 2, 2, 3, 0, 0, 3, 2, 0, 1, 2, 4, 1, 3, 3, 0, 0, 3, 3, 3, 0, 1, 0, 0, 2, 1, 0, 0, 3, 0, 3, 1, 0, 3, 0, 0, 1, 3, 0, 2, 0, 1, 0, 3, 3, 1, 3, 3, 0, 0, 1, 1, 0, 3, 3),
77
+ (0, 2, 0, 3, 0, 2, 1, 4, 0, 2, 2, 3, 1, 1, 3, 1, 1, 0, 2, 0, 3, 1, 2, 3, 1, 3, 0, 0, 1, 0, 4, 3, 2, 3, 3, 3, 1, 4, 2, 3, 3, 3, 3, 1, 0, 3, 1, 4, 0, 1, 1, 0, 1, 2, 0, 1, 1, 0, 1, 1, 0, 3, 1, 3, 2, 2, 0, 1, 0, 0, 0, 2, 3, 3, 3, 1, 0, 0, 0, 0, 0, 2, 3),
78
+ (0, 5, 0, 4, 0, 5, 0, 2, 0, 4, 5, 5, 3, 3, 4, 3, 3, 1, 5, 4, 4, 2, 4, 4, 4, 3, 4, 2, 4, 3, 5, 5, 4, 3, 3, 4, 3, 3, 5, 5, 4, 5, 5, 1, 3, 4, 5, 3, 1, 4, 3, 1, 3, 3, 0, 3, 3, 1, 4, 3, 1, 4, 5, 3, 3, 5, 0, 4, 0, 3, 0, 5, 3, 3, 1, 4, 3, 0, 4, 0, 1, 5, 3),
79
+ (0, 5, 0, 5, 0, 4, 0, 2, 0, 4, 4, 3, 4, 3, 3, 3, 3, 3, 5, 4, 4, 4, 4, 4, 4, 5, 3, 3, 5, 2, 4, 4, 4, 3, 4, 4, 3, 3, 4, 4, 5, 5, 3, 3, 4, 3, 4, 3, 3, 4, 3, 3, 3, 3, 1, 2, 2, 1, 4, 3, 3, 5, 4, 4, 3, 4, 0, 4, 0, 3, 0, 4, 4, 4, 4, 4, 1, 0, 4, 2, 0, 2, 4),
80
+ (0, 4, 0, 4, 0, 3, 0, 1, 0, 3, 5, 2, 3, 0, 3, 0, 2, 1, 4, 2, 3, 3, 4, 1, 4, 3, 3, 2, 4, 1, 3, 3, 3, 0, 3, 3, 0, 0, 3, 3, 3, 5, 3, 3, 3, 3, 3, 2, 0, 2, 0, 0, 2, 0, 0, 2, 0, 0, 1, 0, 0, 3, 1, 2, 2, 3, 0, 3, 0, 2, 0, 4, 4, 3, 3, 4, 1, 0, 3, 0, 0, 2, 4),
81
+ (0, 0, 0, 4, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 2, 0, 0, 0, 0, 0, 1, 0, 2, 0, 1, 0, 0, 0, 0, 0, 3, 1, 3, 0, 3, 2, 0, 0, 0, 1, 0, 3, 2, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 4, 0, 2, 0, 0, 0, 0, 0, 0, 2),
82
+ (0, 2, 1, 3, 0, 2, 0, 2, 0, 3, 3, 3, 3, 1, 3, 1, 3, 3, 3, 3, 3, 3, 4, 2, 2, 1, 2, 1, 4, 0, 4, 3, 1, 3, 3, 3, 2, 4, 3, 5, 4, 3, 3, 3, 3, 3, 3, 3, 0, 1, 3, 0, 2, 0, 0, 1, 0, 0, 1, 0, 0, 4, 2, 0, 2, 3, 0, 3, 3, 0, 3, 3, 4, 2, 3, 1, 4, 0, 1, 2, 0, 2, 3),
83
+ (0, 3, 0, 3, 0, 1, 0, 3, 0, 2, 3, 3, 3, 0, 3, 1, 2, 0, 3, 3, 2, 3, 3, 2, 3, 2, 3, 1, 3, 0, 4, 3, 2, 0, 3, 3, 1, 4, 3, 3, 2, 3, 4, 3, 1, 3, 3, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 4, 1, 1, 0, 3, 0, 3, 1, 0, 2, 3, 3, 3, 3, 3, 1, 0, 0, 2, 0, 3, 3),
84
+ (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 0, 2, 0, 3, 0, 0, 0, 0, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0, 0, 3, 0, 3, 0, 3, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 0, 2, 0, 2, 3, 0, 0, 0, 0, 0, 0, 0, 0, 3),
85
+ (0, 2, 0, 3, 1, 3, 0, 3, 0, 2, 3, 3, 3, 1, 3, 1, 3, 1, 3, 1, 3, 3, 3, 1, 3, 0, 2, 3, 1, 1, 4, 3, 3, 2, 3, 3, 1, 2, 2, 4, 1, 3, 3, 0, 1, 4, 2, 3, 0, 1, 3, 0, 3, 0, 0, 1, 3, 0, 2, 0, 0, 3, 3, 2, 1, 3, 0, 3, 0, 2, 0, 3, 4, 4, 4, 3, 1, 0, 3, 0, 0, 3, 3),
86
+ (0, 2, 0, 1, 0, 2, 0, 0, 0, 1, 3, 2, 2, 1, 3, 0, 1, 1, 3, 0, 3, 2, 3, 1, 2, 0, 2, 0, 1, 1, 3, 3, 3, 0, 3, 3, 1, 1, 2, 3, 2, 3, 3, 1, 2, 3, 2, 0, 0, 1, 0, 0, 0, 0, 0, 0, 3, 0, 1, 0, 0, 2, 1, 2, 1, 3, 0, 3, 0, 0, 0, 3, 4, 4, 4, 3, 2, 0, 2, 0, 0, 2, 4),
87
+ (0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 2, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 3, 1, 0, 0, 0, 0, 0, 0, 0, 3),
88
+ (0, 3, 0, 3, 0, 2, 0, 3, 0, 3, 3, 3, 2, 3, 2, 2, 2, 0, 3, 1, 3, 3, 3, 2, 3, 3, 0, 0, 3, 0, 3, 2, 2, 0, 2, 3, 1, 4, 3, 4, 3, 3, 2, 3, 1, 5, 4, 4, 0, 3, 1, 2, 1, 3, 0, 3, 1, 1, 2, 0, 2, 3, 1, 3, 1, 3, 0, 3, 0, 1, 0, 3, 3, 4, 4, 2, 1, 0, 2, 1, 0, 2, 4),
89
+ (0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 4, 2, 5, 1, 4, 0, 2, 0, 2, 1, 3, 1, 4, 0, 2, 1, 0, 0, 2, 1, 4, 1, 1, 0, 3, 3, 0, 5, 1, 3, 2, 3, 3, 1, 0, 3, 2, 3, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 4, 0, 1, 0, 3, 0, 2, 0, 1, 0, 3, 3, 3, 4, 3, 3, 0, 0, 0, 0, 2, 3),
90
+ (0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 2, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 0, 0, 1, 0, 0, 0, 0, 0, 3),
91
+ (0, 1, 0, 3, 0, 4, 0, 3, 0, 2, 4, 3, 1, 0, 3, 2, 2, 1, 3, 1, 2, 2, 3, 1, 1, 1, 2, 1, 3, 0, 1, 2, 0, 1, 3, 2, 1, 3, 0, 5, 5, 1, 0, 0, 1, 3, 2, 1, 0, 3, 0, 0, 1, 0, 0, 0, 0, 0, 3, 4, 0, 1, 1, 1, 3, 2, 0, 2, 0, 1, 0, 2, 3, 3, 1, 2, 3, 0, 1, 0, 1, 0, 4),
92
+ (0, 0, 0, 1, 0, 3, 0, 3, 0, 2, 2, 1, 0, 0, 4, 0, 3, 0, 3, 1, 3, 0, 3, 0, 3, 0, 1, 0, 3, 0, 3, 1, 3, 0, 3, 3, 0, 0, 1, 2, 1, 1, 1, 0, 1, 2, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 2, 2, 1, 2, 0, 0, 2, 0, 0, 0, 0, 2, 3, 3, 3, 3, 0, 0, 0, 0, 1, 4),
93
+ (0, 0, 0, 3, 0, 3, 0, 0, 0, 0, 3, 1, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 3, 0, 2, 0, 2, 3, 0, 0, 2, 2, 3, 1, 2, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 0, 0, 2, 0, 0, 0, 0, 2, 3),
94
+ (2, 4, 0, 5, 0, 5, 0, 4, 0, 3, 4, 3, 3, 3, 4, 3, 3, 3, 4, 3, 4, 4, 5, 4, 5, 5, 5, 2, 3, 0, 5, 5, 4, 1, 5, 4, 3, 1, 5, 4, 3, 4, 4, 3, 3, 4, 3, 3, 0, 3, 2, 0, 2, 3, 0, 3, 0, 0, 3, 3, 0, 5, 3, 2, 3, 3, 0, 3, 0, 3, 0, 3, 4, 5, 4, 5, 3, 0, 4, 3, 0, 3, 4),
95
+ (0, 3, 0, 3, 0, 3, 0, 3, 0, 3, 3, 4, 3, 2, 3, 2, 3, 0, 4, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 2, 4, 3, 3, 1, 3, 4, 3, 4, 4, 4, 3, 4, 4, 3, 2, 4, 4, 1, 0, 2, 0, 0, 1, 1, 0, 2, 0, 0, 3, 1, 0, 5, 3, 2, 1, 3, 0, 3, 0, 1, 2, 4, 3, 2, 4, 3, 3, 0, 3, 2, 0, 4, 4),
96
+ (0, 3, 0, 3, 0, 1, 0, 0, 0, 1, 4, 3, 3, 2, 3, 1, 3, 1, 4, 2, 3, 2, 4, 2, 3, 4, 3, 0, 2, 2, 3, 3, 3, 0, 3, 3, 3, 0, 3, 4, 1, 3, 3, 0, 3, 4, 3, 3, 0, 1, 1, 0, 1, 0, 0, 0, 4, 0, 3, 0, 0, 3, 1, 2, 1, 3, 0, 4, 0, 1, 0, 4, 3, 3, 4, 3, 3, 0, 2, 0, 0, 3, 3),
97
+ (0, 3, 0, 4, 0, 1, 0, 3, 0, 3, 4, 3, 3, 0, 3, 3, 3, 1, 3, 1, 3, 3, 4, 3, 3, 3, 0, 0, 3, 1, 5, 3, 3, 1, 3, 3, 2, 5, 4, 3, 3, 4, 5, 3, 2, 5, 3, 4, 0, 1, 0, 0, 0, 0, 0, 2, 0, 0, 1, 1, 0, 4, 2, 2, 1, 3, 0, 3, 0, 2, 0, 4, 4, 3, 5, 3, 2, 0, 1, 1, 0, 3, 4),
98
+ (0, 5, 0, 4, 0, 5, 0, 2, 0, 4, 4, 3, 3, 2, 3, 3, 3, 1, 4, 3, 4, 1, 5, 3, 4, 3, 4, 0, 4, 2, 4, 3, 4, 1, 5, 4, 0, 4, 4, 4, 4, 5, 4, 1, 3, 5, 4, 2, 1, 4, 1, 1, 3, 2, 0, 3, 1, 0, 3, 2, 1, 4, 3, 3, 3, 4, 0, 4, 0, 3, 0, 4, 4, 4, 3, 3, 3, 0, 4, 2, 0, 3, 4),
99
+ (1, 4, 0, 4, 0, 3, 0, 1, 0, 3, 3, 3, 1, 1, 3, 3, 2, 2, 3, 3, 1, 0, 3, 2, 2, 1, 2, 0, 3, 1, 2, 1, 2, 0, 3, 2, 0, 2, 2, 3, 3, 4, 3, 0, 3, 3, 1, 2, 0, 1, 1, 3, 1, 2, 0, 0, 3, 0, 1, 1, 0, 3, 2, 2, 3, 3, 0, 3, 0, 0, 0, 2, 3, 3, 4, 3, 3, 0, 1, 0, 0, 1, 4),
100
+ (0, 4, 0, 4, 0, 4, 0, 0, 0, 3, 4, 4, 3, 1, 4, 2, 3, 2, 3, 3, 3, 1, 4, 3, 4, 0, 3, 0, 4, 2, 3, 3, 2, 2, 5, 4, 2, 1, 3, 4, 3, 4, 3, 1, 3, 3, 4, 2, 0, 2, 1, 0, 3, 3, 0, 0, 2, 0, 3, 1, 0, 4, 4, 3, 4, 3, 0, 4, 0, 1, 0, 2, 4, 4, 4, 4, 4, 0, 3, 2, 0, 3, 3),
101
+ (0, 0, 0, 1, 0, 4, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 3, 2, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 2),
102
+ (0, 2, 0, 3, 0, 4, 0, 4, 0, 1, 3, 3, 3, 0, 4, 0, 2, 1, 2, 1, 1, 1, 2, 0, 3, 1, 1, 0, 1, 0, 3, 1, 0, 0, 3, 3, 2, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 2, 0, 2, 2, 0, 3, 1, 0, 0, 1, 0, 1, 1, 0, 1, 2, 0, 3, 0, 0, 0, 0, 1, 0, 0, 3, 3, 4, 3, 1, 0, 1, 0, 3, 0, 2),
103
+ (0, 0, 0, 3, 0, 5, 0, 0, 0, 0, 1, 0, 2, 0, 3, 1, 0, 1, 3, 0, 0, 0, 2, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 4, 0, 0, 0, 2, 3, 0, 1, 4, 1, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 3, 0, 0, 0, 0, 0, 3),
104
+ (0, 2, 0, 5, 0, 5, 0, 1, 0, 2, 4, 3, 3, 2, 5, 1, 3, 2, 3, 3, 3, 0, 4, 1, 2, 0, 3, 0, 4, 0, 2, 2, 1, 1, 5, 3, 0, 0, 1, 4, 2, 3, 2, 0, 3, 3, 3, 2, 0, 2, 4, 1, 1, 2, 0, 1, 1, 0, 3, 1, 0, 1, 3, 1, 2, 3, 0, 2, 0, 0, 0, 1, 3, 5, 4, 4, 4, 0, 3, 0, 0, 1, 3),
105
+ (0, 4, 0, 5, 0, 4, 0, 4, 0, 4, 5, 4, 3, 3, 4, 3, 3, 3, 4, 3, 4, 4, 5, 3, 4, 5, 4, 2, 4, 2, 3, 4, 3, 1, 4, 4, 1, 3, 5, 4, 4, 5, 5, 4, 4, 5, 5, 5, 2, 3, 3, 1, 4, 3, 1, 3, 3, 0, 3, 3, 1, 4, 3, 4, 4, 4, 0, 3, 0, 4, 0, 3, 3, 4, 4, 5, 0, 0, 4, 3, 0, 4, 5),
106
+ (0, 4, 0, 4, 0, 3, 0, 3, 0, 3, 4, 4, 4, 3, 3, 2, 4, 3, 4, 3, 4, 3, 5, 3, 4, 3, 2, 1, 4, 2, 4, 4, 3, 1, 3, 4, 2, 4, 5, 5, 3, 4, 5, 4, 1, 5, 4, 3, 0, 3, 2, 2, 3, 2, 1, 3, 1, 0, 3, 3, 3, 5, 3, 3, 3, 5, 4, 4, 2, 3, 3, 4, 3, 3, 3, 2, 1, 0, 3, 2, 1, 4, 3),
107
+ (0, 4, 0, 5, 0, 4, 0, 3, 0, 3, 5, 5, 3, 2, 4, 3, 4, 0, 5, 4, 4, 1, 4, 4, 4, 3, 3, 3, 4, 3, 5, 5, 2, 3, 3, 4, 1, 2, 5, 5, 3, 5, 5, 2, 3, 5, 5, 4, 0, 3, 2, 0, 3, 3, 1, 1, 5, 1, 4, 1, 0, 4, 3, 2, 3, 5, 0, 4, 0, 3, 0, 5, 4, 3, 4, 3, 0, 0, 4, 1, 0, 4, 4),
108
+ (1, 3, 0, 4, 0, 2, 0, 2, 0, 2, 5, 5, 3, 3, 3, 3, 3, 0, 4, 2, 3, 4, 4, 4, 3, 4, 0, 0, 3, 4, 5, 4, 3, 3, 3, 3, 2, 5, 5, 4, 5, 5, 5, 4, 3, 5, 5, 5, 1, 3, 1, 0, 1, 0, 0, 3, 2, 0, 4, 2, 0, 5, 2, 3, 2, 4, 1, 3, 0, 3, 0, 4, 5, 4, 5, 4, 3, 0, 4, 2, 0, 5, 4),
109
+ (0, 3, 0, 4, 0, 5, 0, 3, 0, 3, 4, 4, 3, 2, 3, 2, 3, 3, 3, 3, 3, 2, 4, 3, 3, 2, 2, 0, 3, 3, 3, 3, 3, 1, 3, 3, 3, 0, 4, 4, 3, 4, 4, 1, 1, 4, 4, 2, 0, 3, 1, 0, 1, 1, 0, 4, 1, 0, 2, 3, 1, 3, 3, 1, 3, 4, 0, 3, 0, 1, 0, 3, 1, 3, 0, 0, 1, 0, 2, 0, 0, 4, 4),
110
+ (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0),
111
+ (0, 3, 0, 3, 0, 2, 0, 3, 0, 1, 5, 4, 3, 3, 3, 1, 4, 2, 1, 2, 3, 4, 4, 2, 4, 4, 5, 0, 3, 1, 4, 3, 4, 0, 4, 3, 3, 3, 2, 3, 2, 5, 3, 4, 3, 2, 2, 3, 0, 0, 3, 0, 2, 1, 0, 1, 2, 0, 0, 0, 0, 2, 1, 1, 3, 1, 0, 2, 0, 4, 0, 3, 4, 4, 4, 5, 2, 0, 2, 0, 0, 1, 3),
112
+ (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 4, 2, 1, 1, 0, 1, 0, 3, 2, 0, 0, 3, 1, 1, 1, 2, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 0, 1, 0, 0, 0, 2, 0, 0, 0, 1, 4, 0, 4, 2, 1, 0, 0, 0, 0, 0, 1),
113
+ (0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 3, 1, 0, 0, 0, 2, 0, 2, 1, 0, 0, 1, 2, 1, 0, 1, 1, 0, 0, 3, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 3, 1, 0, 0, 0, 0, 0, 1, 0, 0, 2, 1, 0, 0, 0, 0, 0, 0, 0, 0, 2),
114
+ (0, 4, 0, 4, 0, 4, 0, 3, 0, 4, 4, 3, 4, 2, 4, 3, 2, 0, 4, 4, 4, 3, 5, 3, 5, 3, 3, 2, 4, 2, 4, 3, 4, 3, 1, 4, 0, 2, 3, 4, 4, 4, 3, 3, 3, 4, 4, 4, 3, 4, 1, 3, 4, 3, 2, 1, 2, 1, 3, 3, 3, 4, 4, 3, 3, 5, 0, 4, 0, 3, 0, 4, 3, 3, 3, 2, 1, 0, 3, 0, 0, 3, 3),
115
+ (0, 4, 0, 3, 0, 3, 0, 3, 0, 3, 5, 5, 3, 3, 3, 3, 4, 3, 4, 3, 3, 3, 4, 4, 4, 3, 3, 3, 3, 4, 3, 5, 3, 3, 1, 3, 2, 4, 5, 5, 5, 5, 4, 3, 4, 5, 5, 3, 2, 2, 3, 3, 3, 3, 2, 3, 3, 1, 2, 3, 2, 4, 3, 3, 3, 4, 0, 4, 0, 2, 0, 4, 3, 2, 2, 1, 2, 0, 3, 0, 0, 4, 1),
116
+ )
117
+ # fmt: on
118
+
119
+
120
+ class JapaneseContextAnalysis:
121
+ NUM_OF_CATEGORY = 6
122
+ DONT_KNOW = -1
123
+ ENOUGH_REL_THRESHOLD = 100
124
+ MAX_REL_THRESHOLD = 1000
125
+ MINIMUM_DATA_THRESHOLD = 4
126
+
127
+ def __init__(self) -> None:
128
+ self._total_rel = 0
129
+ self._rel_sample: List[int] = []
130
+ self._need_to_skip_char_num = 0
131
+ self._last_char_order = -1
132
+ self._done = False
133
+ self.reset()
134
+
135
+ def reset(self) -> None:
136
+ self._total_rel = 0 # total sequence received
137
+ # category counters, each integer counts sequence in its category
138
+ self._rel_sample = [0] * self.NUM_OF_CATEGORY
139
+ # if last byte in current buffer is not the last byte of a character,
140
+ # we need to know how many bytes to skip in next buffer
141
+ self._need_to_skip_char_num = 0
142
+ self._last_char_order = -1 # The order of previous char
143
+ # If this flag is set to True, detection is done and conclusion has
144
+ # been made
145
+ self._done = False
146
+
147
+ def feed(self, byte_str: Union[bytes, bytearray], num_bytes: int) -> None:
148
+ if self._done:
149
+ return
150
+
151
+ # The buffer we got is byte oriented, and a character may span in more than one
152
+ # buffers. In case the last one or two byte in last buffer is not
153
+ # complete, we record how many byte needed to complete that character
154
+ # and skip these bytes here. We can choose to record those bytes as
155
+ # well and analyse the character once it is complete, but since a
156
+ # character will not make much difference, by simply skipping
157
+ # this character will simply our logic and improve performance.
158
+ i = self._need_to_skip_char_num
159
+ while i < num_bytes:
160
+ order, char_len = self.get_order(byte_str[i : i + 2])
161
+ i += char_len
162
+ if i > num_bytes:
163
+ self._need_to_skip_char_num = i - num_bytes
164
+ self._last_char_order = -1
165
+ else:
166
+ if (order != -1) and (self._last_char_order != -1):
167
+ self._total_rel += 1
168
+ if self._total_rel > self.MAX_REL_THRESHOLD:
169
+ self._done = True
170
+ break
171
+ self._rel_sample[
172
+ jp2_char_context[self._last_char_order][order]
173
+ ] += 1
174
+ self._last_char_order = order
175
+
176
+ def got_enough_data(self) -> bool:
177
+ return self._total_rel > self.ENOUGH_REL_THRESHOLD
178
+
179
+ def get_confidence(self) -> float:
180
+ # This is just one way to calculate confidence. It works well for me.
181
+ if self._total_rel > self.MINIMUM_DATA_THRESHOLD:
182
+ return (self._total_rel - self._rel_sample[0]) / self._total_rel
183
+ return self.DONT_KNOW
184
+
185
+ def get_order(self, _: Union[bytes, bytearray]) -> Tuple[int, int]:
186
+ return -1, 1
187
+
188
+
189
+ class SJISContextAnalysis(JapaneseContextAnalysis):
190
+ def __init__(self) -> None:
191
+ super().__init__()
192
+ self._charset_name = "SHIFT_JIS"
193
+
194
+ @property
195
+ def charset_name(self) -> str:
196
+ return self._charset_name
197
+
198
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> Tuple[int, int]:
199
+ if not byte_str:
200
+ return -1, 1
201
+ # find out current char's byte length
202
+ first_char = byte_str[0]
203
+ if (0x81 <= first_char <= 0x9F) or (0xE0 <= first_char <= 0xFC):
204
+ char_len = 2
205
+ if (first_char == 0x87) or (0xFA <= first_char <= 0xFC):
206
+ self._charset_name = "CP932"
207
+ else:
208
+ char_len = 1
209
+
210
+ # return its order if it is hiragana
211
+ if len(byte_str) > 1:
212
+ second_char = byte_str[1]
213
+ if (first_char == 202) and (0x9F <= second_char <= 0xF1):
214
+ return second_char - 0x9F, char_len
215
+
216
+ return -1, char_len
217
+
218
+
219
+ class EUCJPContextAnalysis(JapaneseContextAnalysis):
220
+ def get_order(self, byte_str: Union[bytes, bytearray]) -> Tuple[int, int]:
221
+ if not byte_str:
222
+ return -1, 1
223
+ # find out current char's byte length
224
+ first_char = byte_str[0]
225
+ if (first_char == 0x8E) or (0xA1 <= first_char <= 0xFE):
226
+ char_len = 2
227
+ elif first_char == 0x8F:
228
+ char_len = 3
229
+ else:
230
+ char_len = 1
231
+
232
+ # return its order if it is hiragana
233
+ if len(byte_str) > 1:
234
+ second_char = byte_str[1]
235
+ if (first_char == 0xA4) and (0xA1 <= second_char <= 0xF3):
236
+ return second_char - 0xA1, char_len
237
+
238
+ return -1, char_len
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langgreekmodel.py ADDED
The diff for this file is too large to render. See raw diff
 
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langhebrewmodel.py ADDED
The diff for this file is too large to render. See raw diff
 
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langhungarianmodel.py ADDED
The diff for this file is too large to render. See raw diff
 
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langrussianmodel.py ADDED
The diff for this file is too large to render. See raw diff
 
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langthaimodel.py ADDED
The diff for this file is too large to render. See raw diff
 
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/langturkishmodel.py ADDED
@@ -0,0 +1,4380 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from pip._vendor.chardet.sbcharsetprober import SingleByteCharSetModel
2
+
3
+ # 3: Positive
4
+ # 2: Likely
5
+ # 1: Unlikely
6
+ # 0: Negative
7
+
8
+ TURKISH_LANG_MODEL = {
9
+ 23: { # 'A'
10
+ 23: 0, # 'A'
11
+ 37: 0, # 'B'
12
+ 47: 0, # 'C'
13
+ 39: 0, # 'D'
14
+ 29: 0, # 'E'
15
+ 52: 0, # 'F'
16
+ 36: 0, # 'G'
17
+ 45: 0, # 'H'
18
+ 53: 0, # 'I'
19
+ 60: 0, # 'J'
20
+ 16: 0, # 'K'
21
+ 49: 0, # 'L'
22
+ 20: 0, # 'M'
23
+ 46: 0, # 'N'
24
+ 42: 0, # 'O'
25
+ 48: 0, # 'P'
26
+ 44: 0, # 'R'
27
+ 35: 0, # 'S'
28
+ 31: 0, # 'T'
29
+ 51: 0, # 'U'
30
+ 38: 0, # 'V'
31
+ 62: 0, # 'W'
32
+ 43: 0, # 'Y'
33
+ 56: 0, # 'Z'
34
+ 1: 3, # 'a'
35
+ 21: 0, # 'b'
36
+ 28: 0, # 'c'
37
+ 12: 2, # 'd'
38
+ 2: 3, # 'e'
39
+ 18: 0, # 'f'
40
+ 27: 1, # 'g'
41
+ 25: 1, # 'h'
42
+ 3: 1, # 'i'
43
+ 24: 0, # 'j'
44
+ 10: 2, # 'k'
45
+ 5: 1, # 'l'
46
+ 13: 1, # 'm'
47
+ 4: 1, # 'n'
48
+ 15: 0, # 'o'
49
+ 26: 0, # 'p'
50
+ 7: 1, # 'r'
51
+ 8: 1, # 's'
52
+ 9: 1, # 't'
53
+ 14: 1, # 'u'
54
+ 32: 0, # 'v'
55
+ 57: 0, # 'w'
56
+ 58: 0, # 'x'
57
+ 11: 3, # 'y'
58
+ 22: 0, # 'z'
59
+ 63: 0, # '·'
60
+ 54: 0, # 'Ç'
61
+ 50: 0, # 'Ö'
62
+ 55: 0, # 'Ü'
63
+ 59: 0, # 'â'
64
+ 33: 1, # 'ç'
65
+ 61: 0, # 'î'
66
+ 34: 0, # 'ö'
67
+ 17: 0, # 'ü'
68
+ 30: 0, # 'ğ'
69
+ 41: 0, # 'İ'
70
+ 6: 0, # 'ı'
71
+ 40: 0, # 'Ş'
72
+ 19: 0, # 'ş'
73
+ },
74
+ 37: { # 'B'
75
+ 23: 0, # 'A'
76
+ 37: 0, # 'B'
77
+ 47: 2, # 'C'
78
+ 39: 0, # 'D'
79
+ 29: 0, # 'E'
80
+ 52: 2, # 'F'
81
+ 36: 0, # 'G'
82
+ 45: 0, # 'H'
83
+ 53: 0, # 'I'
84
+ 60: 0, # 'J'
85
+ 16: 1, # 'K'
86
+ 49: 0, # 'L'
87
+ 20: 0, # 'M'
88
+ 46: 0, # 'N'
89
+ 42: 0, # 'O'
90
+ 48: 1, # 'P'
91
+ 44: 0, # 'R'
92
+ 35: 1, # 'S'
93
+ 31: 0, # 'T'
94
+ 51: 0, # 'U'
95
+ 38: 1, # 'V'
96
+ 62: 0, # 'W'
97
+ 43: 1, # 'Y'
98
+ 56: 0, # 'Z'
99
+ 1: 2, # 'a'
100
+ 21: 0, # 'b'
101
+ 28: 2, # 'c'
102
+ 12: 0, # 'd'
103
+ 2: 3, # 'e'
104
+ 18: 0, # 'f'
105
+ 27: 0, # 'g'
106
+ 25: 0, # 'h'
107
+ 3: 0, # 'i'
108
+ 24: 0, # 'j'
109
+ 10: 0, # 'k'
110
+ 5: 0, # 'l'
111
+ 13: 1, # 'm'
112
+ 4: 1, # 'n'
113
+ 15: 0, # 'o'
114
+ 26: 0, # 'p'
115
+ 7: 0, # 'r'
116
+ 8: 0, # 's'
117
+ 9: 0, # 't'
118
+ 14: 2, # 'u'
119
+ 32: 0, # 'v'
120
+ 57: 0, # 'w'
121
+ 58: 0, # 'x'
122
+ 11: 0, # 'y'
123
+ 22: 1, # 'z'
124
+ 63: 0, # '·'
125
+ 54: 0, # 'Ç'
126
+ 50: 1, # 'Ö'
127
+ 55: 0, # 'Ü'
128
+ 59: 0, # 'â'
129
+ 33: 0, # 'ç'
130
+ 61: 0, # 'î'
131
+ 34: 1, # 'ö'
132
+ 17: 0, # 'ü'
133
+ 30: 0, # 'ğ'
134
+ 41: 0, # 'İ'
135
+ 6: 0, # 'ı'
136
+ 40: 1, # 'Ş'
137
+ 19: 1, # 'ş'
138
+ },
139
+ 47: { # 'C'
140
+ 23: 0, # 'A'
141
+ 37: 0, # 'B'
142
+ 47: 0, # 'C'
143
+ 39: 0, # 'D'
144
+ 29: 0, # 'E'
145
+ 52: 1, # 'F'
146
+ 36: 0, # 'G'
147
+ 45: 0, # 'H'
148
+ 53: 0, # 'I'
149
+ 60: 0, # 'J'
150
+ 16: 0, # 'K'
151
+ 49: 1, # 'L'
152
+ 20: 0, # 'M'
153
+ 46: 1, # 'N'
154
+ 42: 0, # 'O'
155
+ 48: 1, # 'P'
156
+ 44: 1, # 'R'
157
+ 35: 0, # 'S'
158
+ 31: 0, # 'T'
159
+ 51: 0, # 'U'
160
+ 38: 1, # 'V'
161
+ 62: 0, # 'W'
162
+ 43: 1, # 'Y'
163
+ 56: 0, # 'Z'
164
+ 1: 3, # 'a'
165
+ 21: 0, # 'b'
166
+ 28: 2, # 'c'
167
+ 12: 0, # 'd'
168
+ 2: 3, # 'e'
169
+ 18: 0, # 'f'
170
+ 27: 0, # 'g'
171
+ 25: 0, # 'h'
172
+ 3: 0, # 'i'
173
+ 24: 2, # 'j'
174
+ 10: 1, # 'k'
175
+ 5: 2, # 'l'
176
+ 13: 2, # 'm'
177
+ 4: 2, # 'n'
178
+ 15: 1, # 'o'
179
+ 26: 0, # 'p'
180
+ 7: 2, # 'r'
181
+ 8: 0, # 's'
182
+ 9: 0, # 't'
183
+ 14: 3, # 'u'
184
+ 32: 0, # 'v'
185
+ 57: 0, # 'w'
186
+ 58: 0, # 'x'
187
+ 11: 0, # 'y'
188
+ 22: 2, # 'z'
189
+ 63: 0, # '·'
190
+ 54: 0, # 'Ç'
191
+ 50: 1, # 'Ö'
192
+ 55: 0, # 'Ü'
193
+ 59: 0, # 'â'
194
+ 33: 1, # 'ç'
195
+ 61: 0, # 'î'
196
+ 34: 1, # 'ö'
197
+ 17: 0, # 'ü'
198
+ 30: 0, # 'ğ'
199
+ 41: 1, # 'İ'
200
+ 6: 3, # 'ı'
201
+ 40: 0, # 'Ş'
202
+ 19: 0, # 'ş'
203
+ },
204
+ 39: { # 'D'
205
+ 23: 0, # 'A'
206
+ 37: 0, # 'B'
207
+ 47: 0, # 'C'
208
+ 39: 0, # 'D'
209
+ 29: 0, # 'E'
210
+ 52: 1, # 'F'
211
+ 36: 0, # 'G'
212
+ 45: 0, # 'H'
213
+ 53: 0, # 'I'
214
+ 60: 0, # 'J'
215
+ 16: 1, # 'K'
216
+ 49: 0, # 'L'
217
+ 20: 0, # 'M'
218
+ 46: 0, # 'N'
219
+ 42: 0, # 'O'
220
+ 48: 1, # 'P'
221
+ 44: 0, # 'R'
222
+ 35: 0, # 'S'
223
+ 31: 0, # 'T'
224
+ 51: 0, # 'U'
225
+ 38: 0, # 'V'
226
+ 62: 0, # 'W'
227
+ 43: 0, # 'Y'
228
+ 56: 0, # 'Z'
229
+ 1: 2, # 'a'
230
+ 21: 0, # 'b'
231
+ 28: 2, # 'c'
232
+ 12: 0, # 'd'
233
+ 2: 2, # 'e'
234
+ 18: 0, # 'f'
235
+ 27: 0, # 'g'
236
+ 25: 0, # 'h'
237
+ 3: 0, # 'i'
238
+ 24: 0, # 'j'
239
+ 10: 0, # 'k'
240
+ 5: 1, # 'l'
241
+ 13: 3, # 'm'
242
+ 4: 0, # 'n'
243
+ 15: 1, # 'o'
244
+ 26: 0, # 'p'
245
+ 7: 0, # 'r'
246
+ 8: 0, # 's'
247
+ 9: 0, # 't'
248
+ 14: 1, # 'u'
249
+ 32: 0, # 'v'
250
+ 57: 0, # 'w'
251
+ 58: 0, # 'x'
252
+ 11: 0, # 'y'
253
+ 22: 1, # 'z'
254
+ 63: 0, # '·'
255
+ 54: 1, # 'Ç'
256
+ 50: 0, # 'Ö'
257
+ 55: 0, # 'Ü'
258
+ 59: 0, # 'â'
259
+ 33: 1, # 'ç'
260
+ 61: 0, # 'î'
261
+ 34: 0, # 'ö'
262
+ 17: 0, # 'ü'
263
+ 30: 1, # 'ğ'
264
+ 41: 0, # 'İ'
265
+ 6: 1, # 'ı'
266
+ 40: 1, # 'Ş'
267
+ 19: 0, # 'ş'
268
+ },
269
+ 29: { # 'E'
270
+ 23: 0, # 'A'
271
+ 37: 0, # 'B'
272
+ 47: 0, # 'C'
273
+ 39: 0, # 'D'
274
+ 29: 1, # 'E'
275
+ 52: 0, # 'F'
276
+ 36: 0, # 'G'
277
+ 45: 0, # 'H'
278
+ 53: 0, # 'I'
279
+ 60: 0, # 'J'
280
+ 16: 3, # 'K'
281
+ 49: 0, # 'L'
282
+ 20: 1, # 'M'
283
+ 46: 0, # 'N'
284
+ 42: 0, # 'O'
285
+ 48: 0, # 'P'
286
+ 44: 0, # 'R'
287
+ 35: 0, # 'S'
288
+ 31: 0, # 'T'
289
+ 51: 0, # 'U'
290
+ 38: 0, # 'V'
291
+ 62: 0, # 'W'
292
+ 43: 0, # 'Y'
293
+ 56: 0, # 'Z'
294
+ 1: 3, # 'a'
295
+ 21: 0, # 'b'
296
+ 28: 0, # 'c'
297
+ 12: 2, # 'd'
298
+ 2: 3, # 'e'
299
+ 18: 0, # 'f'
300
+ 27: 1, # 'g'
301
+ 25: 0, # 'h'
302
+ 3: 1, # 'i'
303
+ 24: 1, # 'j'
304
+ 10: 0, # 'k'
305
+ 5: 3, # 'l'
306
+ 13: 3, # 'm'
307
+ 4: 3, # 'n'
308
+ 15: 0, # 'o'
309
+ 26: 0, # 'p'
310
+ 7: 0, # 'r'
311
+ 8: 1, # 's'
312
+ 9: 1, # 't'
313
+ 14: 1, # 'u'
314
+ 32: 1, # 'v'
315
+ 57: 0, # 'w'
316
+ 58: 0, # 'x'
317
+ 11: 2, # 'y'
318
+ 22: 0, # 'z'
319
+ 63: 0, # '·'
320
+ 54: 0, # 'Ç'
321
+ 50: 0, # 'Ö'
322
+ 55: 0, # 'Ü'
323
+ 59: 0, # 'â'
324
+ 33: 0, # 'ç'
325
+ 61: 0, # 'î'
326
+ 34: 0, # 'ö'
327
+ 17: 0, # 'ü'
328
+ 30: 0, # 'ğ'
329
+ 41: 0, # 'İ'
330
+ 6: 3, # 'ı'
331
+ 40: 0, # 'Ş'
332
+ 19: 0, # 'ş'
333
+ },
334
+ 52: { # 'F'
335
+ 23: 0, # 'A'
336
+ 37: 1, # 'B'
337
+ 47: 1, # 'C'
338
+ 39: 1, # 'D'
339
+ 29: 1, # 'E'
340
+ 52: 2, # 'F'
341
+ 36: 0, # 'G'
342
+ 45: 2, # 'H'
343
+ 53: 1, # 'I'
344
+ 60: 0, # 'J'
345
+ 16: 0, # 'K'
346
+ 49: 0, # 'L'
347
+ 20: 1, # 'M'
348
+ 46: 1, # 'N'
349
+ 42: 1, # 'O'
350
+ 48: 2, # 'P'
351
+ 44: 1, # 'R'
352
+ 35: 1, # 'S'
353
+ 31: 1, # 'T'
354
+ 51: 1, # 'U'
355
+ 38: 1, # 'V'
356
+ 62: 0, # 'W'
357
+ 43: 2, # 'Y'
358
+ 56: 0, # 'Z'
359
+ 1: 0, # 'a'
360
+ 21: 1, # 'b'
361
+ 28: 1, # 'c'
362
+ 12: 1, # 'd'
363
+ 2: 0, # 'e'
364
+ 18: 1, # 'f'
365
+ 27: 0, # 'g'
366
+ 25: 0, # 'h'
367
+ 3: 2, # 'i'
368
+ 24: 1, # 'j'
369
+ 10: 0, # 'k'
370
+ 5: 0, # 'l'
371
+ 13: 1, # 'm'
372
+ 4: 2, # 'n'
373
+ 15: 1, # 'o'
374
+ 26: 0, # 'p'
375
+ 7: 2, # 'r'
376
+ 8: 1, # 's'
377
+ 9: 1, # 't'
378
+ 14: 1, # 'u'
379
+ 32: 0, # 'v'
380
+ 57: 0, # 'w'
381
+ 58: 0, # 'x'
382
+ 11: 1, # 'y'
383
+ 22: 1, # 'z'
384
+ 63: 0, # '·'
385
+ 54: 0, # 'Ç'
386
+ 50: 1, # 'Ö'
387
+ 55: 2, # 'Ü'
388
+ 59: 0, # 'â'
389
+ 33: 0, # 'ç'
390
+ 61: 0, # 'î'
391
+ 34: 2, # 'ö'
392
+ 17: 0, # 'ü'
393
+ 30: 1, # 'ğ'
394
+ 41: 1, # 'İ'
395
+ 6: 2, # 'ı'
396
+ 40: 0, # 'Ş'
397
+ 19: 2, # 'ş'
398
+ },
399
+ 36: { # 'G'
400
+ 23: 1, # 'A'
401
+ 37: 0, # 'B'
402
+ 47: 1, # 'C'
403
+ 39: 0, # 'D'
404
+ 29: 0, # 'E'
405
+ 52: 1, # 'F'
406
+ 36: 2, # 'G'
407
+ 45: 0, # 'H'
408
+ 53: 0, # 'I'
409
+ 60: 0, # 'J'
410
+ 16: 2, # 'K'
411
+ 49: 0, # 'L'
412
+ 20: 0, # 'M'
413
+ 46: 2, # 'N'
414
+ 42: 1, # 'O'
415
+ 48: 1, # 'P'
416
+ 44: 1, # 'R'
417
+ 35: 1, # 'S'
418
+ 31: 0, # 'T'
419
+ 51: 1, # 'U'
420
+ 38: 2, # 'V'
421
+ 62: 0, # 'W'
422
+ 43: 0, # 'Y'
423
+ 56: 0, # 'Z'
424
+ 1: 3, # 'a'
425
+ 21: 0, # 'b'
426
+ 28: 1, # 'c'
427
+ 12: 0, # 'd'
428
+ 2: 3, # 'e'
429
+ 18: 0, # 'f'
430
+ 27: 0, # 'g'
431
+ 25: 0, # 'h'
432
+ 3: 0, # 'i'
433
+ 24: 1, # 'j'
434
+ 10: 1, # 'k'
435
+ 5: 0, # 'l'
436
+ 13: 3, # 'm'
437
+ 4: 2, # 'n'
438
+ 15: 0, # 'o'
439
+ 26: 1, # 'p'
440
+ 7: 0, # 'r'
441
+ 8: 1, # 's'
442
+ 9: 1, # 't'
443
+ 14: 3, # 'u'
444
+ 32: 0, # 'v'
445
+ 57: 0, # 'w'
446
+ 58: 1, # 'x'
447
+ 11: 0, # 'y'
448
+ 22: 2, # 'z'
449
+ 63: 0, # '·'
450
+ 54: 1, # 'Ç'
451
+ 50: 2, # 'Ö'
452
+ 55: 0, # 'Ü'
453
+ 59: 1, # 'â'
454
+ 33: 2, # 'ç'
455
+ 61: 0, # 'î'
456
+ 34: 0, # 'ö'
457
+ 17: 0, # 'ü'
458
+ 30: 1, # 'ğ'
459
+ 41: 1, # 'İ'
460
+ 6: 2, # 'ı'
461
+ 40: 2, # 'Ş'
462
+ 19: 1, # 'ş'
463
+ },
464
+ 45: { # 'H'
465
+ 23: 0, # 'A'
466
+ 37: 1, # 'B'
467
+ 47: 0, # 'C'
468
+ 39: 0, # 'D'
469
+ 29: 0, # 'E'
470
+ 52: 2, # 'F'
471
+ 36: 2, # 'G'
472
+ 45: 1, # 'H'
473
+ 53: 1, # 'I'
474
+ 60: 0, # 'J'
475
+ 16: 2, # 'K'
476
+ 49: 1, # 'L'
477
+ 20: 0, # 'M'
478
+ 46: 1, # 'N'
479
+ 42: 1, # 'O'
480
+ 48: 1, # 'P'
481
+ 44: 0, # 'R'
482
+ 35: 2, # 'S'
483
+ 31: 0, # 'T'
484
+ 51: 1, # 'U'
485
+ 38: 2, # 'V'
486
+ 62: 0, # 'W'
487
+ 43: 0, # 'Y'
488
+ 56: 0, # 'Z'
489
+ 1: 3, # 'a'
490
+ 21: 0, # 'b'
491
+ 28: 2, # 'c'
492
+ 12: 0, # 'd'
493
+ 2: 3, # 'e'
494
+ 18: 0, # 'f'
495
+ 27: 0, # 'g'
496
+ 25: 0, # 'h'
497
+ 3: 2, # 'i'
498
+ 24: 0, # 'j'
499
+ 10: 1, # 'k'
500
+ 5: 0, # 'l'
501
+ 13: 2, # 'm'
502
+ 4: 0, # 'n'
503
+ 15: 1, # 'o'
504
+ 26: 1, # 'p'
505
+ 7: 1, # 'r'
506
+ 8: 0, # 's'
507
+ 9: 0, # 't'
508
+ 14: 3, # 'u'
509
+ 32: 0, # 'v'
510
+ 57: 0, # 'w'
511
+ 58: 0, # 'x'
512
+ 11: 0, # 'y'
513
+ 22: 2, # 'z'
514
+ 63: 0, # '·'
515
+ 54: 1, # 'Ç'
516
+ 50: 1, # 'Ö'
517
+ 55: 0, # 'Ü'
518
+ 59: 0, # 'â'
519
+ 33: 1, # 'ç'
520
+ 61: 0, # 'î'
521
+ 34: 1, # 'ö'
522
+ 17: 0, # 'ü'
523
+ 30: 2, # 'ğ'
524
+ 41: 1, # 'İ'
525
+ 6: 0, # 'ı'
526
+ 40: 2, # 'Ş'
527
+ 19: 1, # 'ş'
528
+ },
529
+ 53: { # 'I'
530
+ 23: 0, # 'A'
531
+ 37: 0, # 'B'
532
+ 47: 0, # 'C'
533
+ 39: 0, # 'D'
534
+ 29: 0, # 'E'
535
+ 52: 1, # 'F'
536
+ 36: 0, # 'G'
537
+ 45: 0, # 'H'
538
+ 53: 0, # 'I'
539
+ 60: 0, # 'J'
540
+ 16: 2, # 'K'
541
+ 49: 0, # 'L'
542
+ 20: 0, # 'M'
543
+ 46: 0, # 'N'
544
+ 42: 0, # 'O'
545
+ 48: 1, # 'P'
546
+ 44: 0, # 'R'
547
+ 35: 0, # 'S'
548
+ 31: 0, # 'T'
549
+ 51: 0, # 'U'
550
+ 38: 0, # 'V'
551
+ 62: 0, # 'W'
552
+ 43: 0, # 'Y'
553
+ 56: 0, # 'Z'
554
+ 1: 2, # 'a'
555
+ 21: 0, # 'b'
556
+ 28: 2, # 'c'
557
+ 12: 0, # 'd'
558
+ 2: 2, # 'e'
559
+ 18: 0, # 'f'
560
+ 27: 0, # 'g'
561
+ 25: 0, # 'h'
562
+ 3: 0, # 'i'
563
+ 24: 0, # 'j'
564
+ 10: 0, # 'k'
565
+ 5: 2, # 'l'
566
+ 13: 2, # 'm'
567
+ 4: 0, # 'n'
568
+ 15: 0, # 'o'
569
+ 26: 0, # 'p'
570
+ 7: 0, # 'r'
571
+ 8: 0, # 's'
572
+ 9: 0, # 't'
573
+ 14: 2, # 'u'
574
+ 32: 0, # 'v'
575
+ 57: 0, # 'w'
576
+ 58: 0, # 'x'
577
+ 11: 0, # 'y'
578
+ 22: 2, # 'z'
579
+ 63: 0, # '·'
580
+ 54: 1, # 'Ç'
581
+ 50: 0, # 'Ö'
582
+ 55: 0, # 'Ü'
583
+ 59: 0, # 'â'
584
+ 33: 2, # 'ç'
585
+ 61: 0, # 'î'
586
+ 34: 1, # 'ö'
587
+ 17: 0, # 'ü'
588
+ 30: 0, # 'ğ'
589
+ 41: 0, # 'İ'
590
+ 6: 0, # 'ı'
591
+ 40: 1, # 'Ş'
592
+ 19: 1, # 'ş'
593
+ },
594
+ 60: { # 'J'
595
+ 23: 0, # 'A'
596
+ 37: 0, # 'B'
597
+ 47: 0, # 'C'
598
+ 39: 0, # 'D'
599
+ 29: 0, # 'E'
600
+ 52: 0, # 'F'
601
+ 36: 0, # 'G'
602
+ 45: 0, # 'H'
603
+ 53: 0, # 'I'
604
+ 60: 0, # 'J'
605
+ 16: 0, # 'K'
606
+ 49: 0, # 'L'
607
+ 20: 1, # 'M'
608
+ 46: 0, # 'N'
609
+ 42: 0, # 'O'
610
+ 48: 0, # 'P'
611
+ 44: 0, # 'R'
612
+ 35: 0, # 'S'
613
+ 31: 0, # 'T'
614
+ 51: 0, # 'U'
615
+ 38: 0, # 'V'
616
+ 62: 0, # 'W'
617
+ 43: 0, # 'Y'
618
+ 56: 0, # 'Z'
619
+ 1: 0, # 'a'
620
+ 21: 1, # 'b'
621
+ 28: 0, # 'c'
622
+ 12: 1, # 'd'
623
+ 2: 0, # 'e'
624
+ 18: 0, # 'f'
625
+ 27: 0, # 'g'
626
+ 25: 0, # 'h'
627
+ 3: 1, # 'i'
628
+ 24: 0, # 'j'
629
+ 10: 0, # 'k'
630
+ 5: 0, # 'l'
631
+ 13: 0, # 'm'
632
+ 4: 1, # 'n'
633
+ 15: 0, # 'o'
634
+ 26: 0, # 'p'
635
+ 7: 0, # 'r'
636
+ 8: 1, # 's'
637
+ 9: 0, # 't'
638
+ 14: 0, # 'u'
639
+ 32: 0, # 'v'
640
+ 57: 0, # 'w'
641
+ 58: 0, # 'x'
642
+ 11: 0, # 'y'
643
+ 22: 0, # 'z'
644
+ 63: 0, # '·'
645
+ 54: 0, # 'Ç'
646
+ 50: 0, # 'Ö'
647
+ 55: 0, # 'Ü'
648
+ 59: 0, # 'â'
649
+ 33: 0, # 'ç'
650
+ 61: 0, # 'î'
651
+ 34: 0, # 'ö'
652
+ 17: 0, # 'ü'
653
+ 30: 0, # 'ğ'
654
+ 41: 0, # 'İ'
655
+ 6: 0, # 'ı'
656
+ 40: 0, # 'Ş'
657
+ 19: 0, # 'ş'
658
+ },
659
+ 16: { # 'K'
660
+ 23: 0, # 'A'
661
+ 37: 0, # 'B'
662
+ 47: 0, # 'C'
663
+ 39: 0, # 'D'
664
+ 29: 3, # 'E'
665
+ 52: 0, # 'F'
666
+ 36: 0, # 'G'
667
+ 45: 0, # 'H'
668
+ 53: 0, # 'I'
669
+ 60: 0, # 'J'
670
+ 16: 0, # 'K'
671
+ 49: 0, # 'L'
672
+ 20: 2, # 'M'
673
+ 46: 0, # 'N'
674
+ 42: 0, # 'O'
675
+ 48: 0, # 'P'
676
+ 44: 0, # 'R'
677
+ 35: 0, # 'S'
678
+ 31: 2, # 'T'
679
+ 51: 0, # 'U'
680
+ 38: 0, # 'V'
681
+ 62: 0, # 'W'
682
+ 43: 0, # 'Y'
683
+ 56: 0, # 'Z'
684
+ 1: 2, # 'a'
685
+ 21: 3, # 'b'
686
+ 28: 0, # 'c'
687
+ 12: 3, # 'd'
688
+ 2: 1, # 'e'
689
+ 18: 3, # 'f'
690
+ 27: 3, # 'g'
691
+ 25: 3, # 'h'
692
+ 3: 3, # 'i'
693
+ 24: 2, # 'j'
694
+ 10: 3, # 'k'
695
+ 5: 0, # 'l'
696
+ 13: 0, # 'm'
697
+ 4: 3, # 'n'
698
+ 15: 0, # 'o'
699
+ 26: 1, # 'p'
700
+ 7: 3, # 'r'
701
+ 8: 3, # 's'
702
+ 9: 3, # 't'
703
+ 14: 0, # 'u'
704
+ 32: 3, # 'v'
705
+ 57: 0, # 'w'
706
+ 58: 0, # 'x'
707
+ 11: 2, # 'y'
708
+ 22: 1, # 'z'
709
+ 63: 0, # '·'
710
+ 54: 0, # 'Ç'
711
+ 50: 0, # 'Ö'
712
+ 55: 0, # 'Ü'
713
+ 59: 0, # 'â'
714
+ 33: 0, # 'ç'
715
+ 61: 0, # 'î'
716
+ 34: 0, # 'ö'
717
+ 17: 2, # 'ü'
718
+ 30: 0, # 'ğ'
719
+ 41: 1, # 'İ'
720
+ 6: 3, # 'ı'
721
+ 40: 0, # 'Ş'
722
+ 19: 0, # 'ş'
723
+ },
724
+ 49: { # 'L'
725
+ 23: 0, # 'A'
726
+ 37: 0, # 'B'
727
+ 47: 0, # 'C'
728
+ 39: 0, # 'D'
729
+ 29: 2, # 'E'
730
+ 52: 0, # 'F'
731
+ 36: 1, # 'G'
732
+ 45: 1, # 'H'
733
+ 53: 0, # 'I'
734
+ 60: 0, # 'J'
735
+ 16: 0, # 'K'
736
+ 49: 0, # 'L'
737
+ 20: 1, # 'M'
738
+ 46: 0, # 'N'
739
+ 42: 2, # 'O'
740
+ 48: 0, # 'P'
741
+ 44: 0, # 'R'
742
+ 35: 0, # 'S'
743
+ 31: 0, # 'T'
744
+ 51: 0, # 'U'
745
+ 38: 0, # 'V'
746
+ 62: 0, # 'W'
747
+ 43: 1, # 'Y'
748
+ 56: 0, # 'Z'
749
+ 1: 0, # 'a'
750
+ 21: 3, # 'b'
751
+ 28: 0, # 'c'
752
+ 12: 2, # 'd'
753
+ 2: 0, # 'e'
754
+ 18: 0, # 'f'
755
+ 27: 0, # 'g'
756
+ 25: 0, # 'h'
757
+ 3: 2, # 'i'
758
+ 24: 0, # 'j'
759
+ 10: 1, # 'k'
760
+ 5: 0, # 'l'
761
+ 13: 0, # 'm'
762
+ 4: 2, # 'n'
763
+ 15: 1, # 'o'
764
+ 26: 1, # 'p'
765
+ 7: 1, # 'r'
766
+ 8: 1, # 's'
767
+ 9: 1, # 't'
768
+ 14: 0, # 'u'
769
+ 32: 0, # 'v'
770
+ 57: 0, # 'w'
771
+ 58: 0, # 'x'
772
+ 11: 2, # 'y'
773
+ 22: 0, # 'z'
774
+ 63: 0, # '·'
775
+ 54: 0, # 'Ç'
776
+ 50: 0, # 'Ö'
777
+ 55: 2, # 'Ü'
778
+ 59: 0, # 'â'
779
+ 33: 0, # 'ç'
780
+ 61: 0, # 'î'
781
+ 34: 1, # 'ö'
782
+ 17: 1, # 'ü'
783
+ 30: 1, # 'ğ'
784
+ 41: 0, # 'İ'
785
+ 6: 2, # 'ı'
786
+ 40: 0, # 'Ş'
787
+ 19: 0, # 'ş'
788
+ },
789
+ 20: { # 'M'
790
+ 23: 1, # 'A'
791
+ 37: 0, # 'B'
792
+ 47: 0, # 'C'
793
+ 39: 0, # 'D'
794
+ 29: 0, # 'E'
795
+ 52: 0, # 'F'
796
+ 36: 0, # 'G'
797
+ 45: 0, # 'H'
798
+ 53: 0, # 'I'
799
+ 60: 1, # 'J'
800
+ 16: 3, # 'K'
801
+ 49: 0, # 'L'
802
+ 20: 2, # 'M'
803
+ 46: 0, # 'N'
804
+ 42: 0, # 'O'
805
+ 48: 0, # 'P'
806
+ 44: 0, # 'R'
807
+ 35: 0, # 'S'
808
+ 31: 1, # 'T'
809
+ 51: 0, # 'U'
810
+ 38: 0, # 'V'
811
+ 62: 0, # 'W'
812
+ 43: 0, # 'Y'
813
+ 56: 0, # 'Z'
814
+ 1: 3, # 'a'
815
+ 21: 2, # 'b'
816
+ 28: 0, # 'c'
817
+ 12: 3, # 'd'
818
+ 2: 3, # 'e'
819
+ 18: 0, # 'f'
820
+ 27: 1, # 'g'
821
+ 25: 1, # 'h'
822
+ 3: 2, # 'i'
823
+ 24: 2, # 'j'
824
+ 10: 2, # 'k'
825
+ 5: 2, # 'l'
826
+ 13: 3, # 'm'
827
+ 4: 3, # 'n'
828
+ 15: 0, # 'o'
829
+ 26: 1, # 'p'
830
+ 7: 3, # 'r'
831
+ 8: 0, # 's'
832
+ 9: 2, # 't'
833
+ 14: 3, # 'u'
834
+ 32: 0, # 'v'
835
+ 57: 0, # 'w'
836
+ 58: 0, # 'x'
837
+ 11: 2, # 'y'
838
+ 22: 0, # 'z'
839
+ 63: 0, # '·'
840
+ 54: 0, # 'Ç'
841
+ 50: 0, # 'Ö'
842
+ 55: 0, # 'Ü'
843
+ 59: 0, # 'â'
844
+ 33: 3, # 'ç'
845
+ 61: 0, # 'î'
846
+ 34: 0, # 'ö'
847
+ 17: 0, # 'ü'
848
+ 30: 0, # 'ğ'
849
+ 41: 0, # 'İ'
850
+ 6: 3, # 'ı'
851
+ 40: 0, # 'Ş'
852
+ 19: 0, # 'ş'
853
+ },
854
+ 46: { # 'N'
855
+ 23: 0, # 'A'
856
+ 37: 1, # 'B'
857
+ 47: 0, # 'C'
858
+ 39: 0, # 'D'
859
+ 29: 0, # 'E'
860
+ 52: 1, # 'F'
861
+ 36: 1, # 'G'
862
+ 45: 1, # 'H'
863
+ 53: 0, # 'I'
864
+ 60: 0, # 'J'
865
+ 16: 2, # 'K'
866
+ 49: 0, # 'L'
867
+ 20: 0, # 'M'
868
+ 46: 1, # 'N'
869
+ 42: 0, # 'O'
870
+ 48: 0, # 'P'
871
+ 44: 1, # 'R'
872
+ 35: 1, # 'S'
873
+ 31: 0, # 'T'
874
+ 51: 1, # 'U'
875
+ 38: 2, # 'V'
876
+ 62: 0, # 'W'
877
+ 43: 1, # 'Y'
878
+ 56: 0, # 'Z'
879
+ 1: 3, # 'a'
880
+ 21: 0, # 'b'
881
+ 28: 2, # 'c'
882
+ 12: 0, # 'd'
883
+ 2: 3, # 'e'
884
+ 18: 0, # 'f'
885
+ 27: 1, # 'g'
886
+ 25: 0, # 'h'
887
+ 3: 0, # 'i'
888
+ 24: 2, # 'j'
889
+ 10: 1, # 'k'
890
+ 5: 1, # 'l'
891
+ 13: 3, # 'm'
892
+ 4: 2, # 'n'
893
+ 15: 1, # 'o'
894
+ 26: 1, # 'p'
895
+ 7: 1, # 'r'
896
+ 8: 0, # 's'
897
+ 9: 0, # 't'
898
+ 14: 3, # 'u'
899
+ 32: 0, # 'v'
900
+ 57: 0, # 'w'
901
+ 58: 1, # 'x'
902
+ 11: 1, # 'y'
903
+ 22: 2, # 'z'
904
+ 63: 0, # '·'
905
+ 54: 1, # 'Ç'
906
+ 50: 1, # 'Ö'
907
+ 55: 0, # 'Ü'
908
+ 59: 0, # 'â'
909
+ 33: 0, # 'ç'
910
+ 61: 0, # 'î'
911
+ 34: 1, # 'ö'
912
+ 17: 0, # 'ü'
913
+ 30: 0, # 'ğ'
914
+ 41: 1, # 'İ'
915
+ 6: 2, # 'ı'
916
+ 40: 1, # 'Ş'
917
+ 19: 1, # 'ş'
918
+ },
919
+ 42: { # 'O'
920
+ 23: 0, # 'A'
921
+ 37: 0, # 'B'
922
+ 47: 0, # 'C'
923
+ 39: 0, # 'D'
924
+ 29: 0, # 'E'
925
+ 52: 1, # 'F'
926
+ 36: 0, # 'G'
927
+ 45: 1, # 'H'
928
+ 53: 0, # 'I'
929
+ 60: 0, # 'J'
930
+ 16: 2, # 'K'
931
+ 49: 1, # 'L'
932
+ 20: 0, # 'M'
933
+ 46: 0, # 'N'
934
+ 42: 0, # 'O'
935
+ 48: 2, # 'P'
936
+ 44: 1, # 'R'
937
+ 35: 1, # 'S'
938
+ 31: 0, # 'T'
939
+ 51: 1, # 'U'
940
+ 38: 1, # 'V'
941
+ 62: 0, # 'W'
942
+ 43: 0, # 'Y'
943
+ 56: 0, # 'Z'
944
+ 1: 3, # 'a'
945
+ 21: 0, # 'b'
946
+ 28: 2, # 'c'
947
+ 12: 0, # 'd'
948
+ 2: 2, # 'e'
949
+ 18: 0, # 'f'
950
+ 27: 0, # 'g'
951
+ 25: 0, # 'h'
952
+ 3: 0, # 'i'
953
+ 24: 0, # 'j'
954
+ 10: 0, # 'k'
955
+ 5: 3, # 'l'
956
+ 13: 3, # 'm'
957
+ 4: 0, # 'n'
958
+ 15: 1, # 'o'
959
+ 26: 0, # 'p'
960
+ 7: 0, # 'r'
961
+ 8: 0, # 's'
962
+ 9: 0, # 't'
963
+ 14: 2, # 'u'
964
+ 32: 0, # 'v'
965
+ 57: 0, # 'w'
966
+ 58: 0, # 'x'
967
+ 11: 0, # 'y'
968
+ 22: 2, # 'z'
969
+ 63: 0, # '·'
970
+ 54: 2, # 'Ç'
971
+ 50: 1, # 'Ö'
972
+ 55: 0, # 'Ü'
973
+ 59: 0, # 'â'
974
+ 33: 2, # 'ç'
975
+ 61: 0, # 'î'
976
+ 34: 1, # 'ö'
977
+ 17: 0, # 'ü'
978
+ 30: 1, # 'ğ'
979
+ 41: 2, # 'İ'
980
+ 6: 1, # 'ı'
981
+ 40: 1, # 'Ş'
982
+ 19: 1, # 'ş'
983
+ },
984
+ 48: { # 'P'
985
+ 23: 0, # 'A'
986
+ 37: 0, # 'B'
987
+ 47: 2, # 'C'
988
+ 39: 0, # 'D'
989
+ 29: 0, # 'E'
990
+ 52: 2, # 'F'
991
+ 36: 1, # 'G'
992
+ 45: 1, # 'H'
993
+ 53: 0, # 'I'
994
+ 60: 0, # 'J'
995
+ 16: 2, # 'K'
996
+ 49: 0, # 'L'
997
+ 20: 0, # 'M'
998
+ 46: 1, # 'N'
999
+ 42: 1, # 'O'
1000
+ 48: 1, # 'P'
1001
+ 44: 0, # 'R'
1002
+ 35: 1, # 'S'
1003
+ 31: 0, # 'T'
1004
+ 51: 0, # 'U'
1005
+ 38: 1, # 'V'
1006
+ 62: 0, # 'W'
1007
+ 43: 0, # 'Y'
1008
+ 56: 0, # 'Z'
1009
+ 1: 2, # 'a'
1010
+ 21: 0, # 'b'
1011
+ 28: 2, # 'c'
1012
+ 12: 0, # 'd'
1013
+ 2: 3, # 'e'
1014
+ 18: 0, # 'f'
1015
+ 27: 0, # 'g'
1016
+ 25: 0, # 'h'
1017
+ 3: 0, # 'i'
1018
+ 24: 0, # 'j'
1019
+ 10: 1, # 'k'
1020
+ 5: 0, # 'l'
1021
+ 13: 2, # 'm'
1022
+ 4: 0, # 'n'
1023
+ 15: 2, # 'o'
1024
+ 26: 0, # 'p'
1025
+ 7: 0, # 'r'
1026
+ 8: 0, # 's'
1027
+ 9: 0, # 't'
1028
+ 14: 2, # 'u'
1029
+ 32: 0, # 'v'
1030
+ 57: 0, # 'w'
1031
+ 58: 2, # 'x'
1032
+ 11: 0, # 'y'
1033
+ 22: 2, # 'z'
1034
+ 63: 0, # '·'
1035
+ 54: 1, # 'Ç'
1036
+ 50: 2, # 'Ö'
1037
+ 55: 0, # 'Ü'
1038
+ 59: 0, # 'â'
1039
+ 33: 0, # 'ç'
1040
+ 61: 0, # 'î'
1041
+ 34: 2, # 'ö'
1042
+ 17: 0, # 'ü'
1043
+ 30: 1, # 'ğ'
1044
+ 41: 1, # 'İ'
1045
+ 6: 0, # 'ı'
1046
+ 40: 2, # 'Ş'
1047
+ 19: 1, # 'ş'
1048
+ },
1049
+ 44: { # 'R'
1050
+ 23: 0, # 'A'
1051
+ 37: 0, # 'B'
1052
+ 47: 1, # 'C'
1053
+ 39: 0, # 'D'
1054
+ 29: 0, # 'E'
1055
+ 52: 1, # 'F'
1056
+ 36: 0, # 'G'
1057
+ 45: 0, # 'H'
1058
+ 53: 0, # 'I'
1059
+ 60: 0, # 'J'
1060
+ 16: 3, # 'K'
1061
+ 49: 0, # 'L'
1062
+ 20: 0, # 'M'
1063
+ 46: 0, # 'N'
1064
+ 42: 0, # 'O'
1065
+ 48: 1, # 'P'
1066
+ 44: 0, # 'R'
1067
+ 35: 0, # 'S'
1068
+ 31: 0, # 'T'
1069
+ 51: 0, # 'U'
1070
+ 38: 0, # 'V'
1071
+ 62: 0, # 'W'
1072
+ 43: 1, # 'Y'
1073
+ 56: 0, # 'Z'
1074
+ 1: 3, # 'a'
1075
+ 21: 1, # 'b'
1076
+ 28: 1, # 'c'
1077
+ 12: 0, # 'd'
1078
+ 2: 2, # 'e'
1079
+ 18: 0, # 'f'
1080
+ 27: 0, # 'g'
1081
+ 25: 0, # 'h'
1082
+ 3: 0, # 'i'
1083
+ 24: 0, # 'j'
1084
+ 10: 1, # 'k'
1085
+ 5: 2, # 'l'
1086
+ 13: 2, # 'm'
1087
+ 4: 0, # 'n'
1088
+ 15: 1, # 'o'
1089
+ 26: 0, # 'p'
1090
+ 7: 0, # 'r'
1091
+ 8: 0, # 's'
1092
+ 9: 0, # 't'
1093
+ 14: 2, # 'u'
1094
+ 32: 0, # 'v'
1095
+ 57: 0, # 'w'
1096
+ 58: 0, # 'x'
1097
+ 11: 1, # 'y'
1098
+ 22: 2, # 'z'
1099
+ 63: 0, # '·'
1100
+ 54: 0, # 'Ç'
1101
+ 50: 1, # 'Ö'
1102
+ 55: 0, # 'Ü'
1103
+ 59: 0, # 'â'
1104
+ 33: 1, # 'ç'
1105
+ 61: 0, # 'î'
1106
+ 34: 1, # 'ö'
1107
+ 17: 1, # 'ü'
1108
+ 30: 1, # 'ğ'
1109
+ 41: 0, # 'İ'
1110
+ 6: 2, # 'ı'
1111
+ 40: 1, # 'Ş'
1112
+ 19: 1, # 'ş'
1113
+ },
1114
+ 35: { # 'S'
1115
+ 23: 0, # 'A'
1116
+ 37: 0, # 'B'
1117
+ 47: 1, # 'C'
1118
+ 39: 0, # 'D'
1119
+ 29: 0, # 'E'
1120
+ 52: 1, # 'F'
1121
+ 36: 1, # 'G'
1122
+ 45: 1, # 'H'
1123
+ 53: 0, # 'I'
1124
+ 60: 0, # 'J'
1125
+ 16: 3, # 'K'
1126
+ 49: 1, # 'L'
1127
+ 20: 1, # 'M'
1128
+ 46: 0, # 'N'
1129
+ 42: 0, # 'O'
1130
+ 48: 1, # 'P'
1131
+ 44: 0, # 'R'
1132
+ 35: 0, # 'S'
1133
+ 31: 0, # 'T'
1134
+ 51: 1, # 'U'
1135
+ 38: 1, # 'V'
1136
+ 62: 0, # 'W'
1137
+ 43: 1, # 'Y'
1138
+ 56: 0, # 'Z'
1139
+ 1: 3, # 'a'
1140
+ 21: 0, # 'b'
1141
+ 28: 2, # 'c'
1142
+ 12: 0, # 'd'
1143
+ 2: 3, # 'e'
1144
+ 18: 0, # 'f'
1145
+ 27: 0, # 'g'
1146
+ 25: 0, # 'h'
1147
+ 3: 0, # 'i'
1148
+ 24: 0, # 'j'
1149
+ 10: 1, # 'k'
1150
+ 5: 1, # 'l'
1151
+ 13: 2, # 'm'
1152
+ 4: 1, # 'n'
1153
+ 15: 0, # 'o'
1154
+ 26: 0, # 'p'
1155
+ 7: 0, # 'r'
1156
+ 8: 0, # 's'
1157
+ 9: 1, # 't'
1158
+ 14: 2, # 'u'
1159
+ 32: 0, # 'v'
1160
+ 57: 0, # 'w'
1161
+ 58: 0, # 'x'
1162
+ 11: 0, # 'y'
1163
+ 22: 1, # 'z'
1164
+ 63: 0, # '·'
1165
+ 54: 2, # 'Ç'
1166
+ 50: 2, # 'Ö'
1167
+ 55: 0, # 'Ü'
1168
+ 59: 0, # 'â'
1169
+ 33: 3, # 'ç'
1170
+ 61: 0, # 'î'
1171
+ 34: 1, # 'ö'
1172
+ 17: 0, # 'ü'
1173
+ 30: 0, # 'ğ'
1174
+ 41: 0, # 'İ'
1175
+ 6: 3, # 'ı'
1176
+ 40: 2, # 'Ş'
1177
+ 19: 1, # 'ş'
1178
+ },
1179
+ 31: { # 'T'
1180
+ 23: 0, # 'A'
1181
+ 37: 0, # 'B'
1182
+ 47: 0, # 'C'
1183
+ 39: 0, # 'D'
1184
+ 29: 0, # 'E'
1185
+ 52: 0, # 'F'
1186
+ 36: 0, # 'G'
1187
+ 45: 0, # 'H'
1188
+ 53: 0, # 'I'
1189
+ 60: 1, # 'J'
1190
+ 16: 2, # 'K'
1191
+ 49: 0, # 'L'
1192
+ 20: 1, # 'M'
1193
+ 46: 0, # 'N'
1194
+ 42: 0, # 'O'
1195
+ 48: 0, # 'P'
1196
+ 44: 0, # 'R'
1197
+ 35: 0, # 'S'
1198
+ 31: 2, # 'T'
1199
+ 51: 0, # 'U'
1200
+ 38: 0, # 'V'
1201
+ 62: 0, # 'W'
1202
+ 43: 0, # 'Y'
1203
+ 56: 0, # 'Z'
1204
+ 1: 3, # 'a'
1205
+ 21: 2, # 'b'
1206
+ 28: 0, # 'c'
1207
+ 12: 1, # 'd'
1208
+ 2: 3, # 'e'
1209
+ 18: 2, # 'f'
1210
+ 27: 2, # 'g'
1211
+ 25: 0, # 'h'
1212
+ 3: 1, # 'i'
1213
+ 24: 1, # 'j'
1214
+ 10: 2, # 'k'
1215
+ 5: 2, # 'l'
1216
+ 13: 3, # 'm'
1217
+ 4: 3, # 'n'
1218
+ 15: 0, # 'o'
1219
+ 26: 2, # 'p'
1220
+ 7: 2, # 'r'
1221
+ 8: 0, # 's'
1222
+ 9: 2, # 't'
1223
+ 14: 2, # 'u'
1224
+ 32: 1, # 'v'
1225
+ 57: 1, # 'w'
1226
+ 58: 1, # 'x'
1227
+ 11: 2, # 'y'
1228
+ 22: 0, # 'z'
1229
+ 63: 0, # '·'
1230
+ 54: 0, # 'Ç'
1231
+ 50: 0, # 'Ö'
1232
+ 55: 0, # 'Ü'
1233
+ 59: 0, # 'â'
1234
+ 33: 0, # 'ç'
1235
+ 61: 0, # 'î'
1236
+ 34: 0, # 'ö'
1237
+ 17: 1, # 'ü'
1238
+ 30: 0, # 'ğ'
1239
+ 41: 0, # 'İ'
1240
+ 6: 3, # 'ı'
1241
+ 40: 0, # 'Ş'
1242
+ 19: 0, # 'ş'
1243
+ },
1244
+ 51: { # 'U'
1245
+ 23: 0, # 'A'
1246
+ 37: 0, # 'B'
1247
+ 47: 0, # 'C'
1248
+ 39: 0, # 'D'
1249
+ 29: 0, # 'E'
1250
+ 52: 1, # 'F'
1251
+ 36: 1, # 'G'
1252
+ 45: 0, # 'H'
1253
+ 53: 0, # 'I'
1254
+ 60: 0, # 'J'
1255
+ 16: 1, # 'K'
1256
+ 49: 0, # 'L'
1257
+ 20: 0, # 'M'
1258
+ 46: 1, # 'N'
1259
+ 42: 0, # 'O'
1260
+ 48: 1, # 'P'
1261
+ 44: 0, # 'R'
1262
+ 35: 0, # 'S'
1263
+ 31: 0, # 'T'
1264
+ 51: 1, # 'U'
1265
+ 38: 1, # 'V'
1266
+ 62: 0, # 'W'
1267
+ 43: 0, # 'Y'
1268
+ 56: 0, # 'Z'
1269
+ 1: 3, # 'a'
1270
+ 21: 0, # 'b'
1271
+ 28: 1, # 'c'
1272
+ 12: 0, # 'd'
1273
+ 2: 3, # 'e'
1274
+ 18: 0, # 'f'
1275
+ 27: 2, # 'g'
1276
+ 25: 0, # 'h'
1277
+ 3: 0, # 'i'
1278
+ 24: 0, # 'j'
1279
+ 10: 1, # 'k'
1280
+ 5: 1, # 'l'
1281
+ 13: 3, # 'm'
1282
+ 4: 2, # 'n'
1283
+ 15: 0, # 'o'
1284
+ 26: 1, # 'p'
1285
+ 7: 0, # 'r'
1286
+ 8: 0, # 's'
1287
+ 9: 0, # 't'
1288
+ 14: 2, # 'u'
1289
+ 32: 0, # 'v'
1290
+ 57: 0, # 'w'
1291
+ 58: 0, # 'x'
1292
+ 11: 0, # 'y'
1293
+ 22: 2, # 'z'
1294
+ 63: 0, # '·'
1295
+ 54: 1, # 'Ç'
1296
+ 50: 1, # 'Ö'
1297
+ 55: 0, # 'Ü'
1298
+ 59: 0, # 'â'
1299
+ 33: 0, # 'ç'
1300
+ 61: 0, # 'î'
1301
+ 34: 0, # 'ö'
1302
+ 17: 0, # 'ü'
1303
+ 30: 1, # 'ğ'
1304
+ 41: 1, # 'İ'
1305
+ 6: 2, # 'ı'
1306
+ 40: 0, # 'Ş'
1307
+ 19: 1, # 'ş'
1308
+ },
1309
+ 38: { # 'V'
1310
+ 23: 1, # 'A'
1311
+ 37: 1, # 'B'
1312
+ 47: 1, # 'C'
1313
+ 39: 0, # 'D'
1314
+ 29: 0, # 'E'
1315
+ 52: 2, # 'F'
1316
+ 36: 0, # 'G'
1317
+ 45: 0, # 'H'
1318
+ 53: 0, # 'I'
1319
+ 60: 0, # 'J'
1320
+ 16: 3, # 'K'
1321
+ 49: 0, # 'L'
1322
+ 20: 3, # 'M'
1323
+ 46: 0, # 'N'
1324
+ 42: 0, # 'O'
1325
+ 48: 1, # 'P'
1326
+ 44: 1, # 'R'
1327
+ 35: 0, # 'S'
1328
+ 31: 0, # 'T'
1329
+ 51: 1, # 'U'
1330
+ 38: 1, # 'V'
1331
+ 62: 0, # 'W'
1332
+ 43: 0, # 'Y'
1333
+ 56: 0, # 'Z'
1334
+ 1: 3, # 'a'
1335
+ 21: 0, # 'b'
1336
+ 28: 2, # 'c'
1337
+ 12: 0, # 'd'
1338
+ 2: 3, # 'e'
1339
+ 18: 0, # 'f'
1340
+ 27: 0, # 'g'
1341
+ 25: 0, # 'h'
1342
+ 3: 0, # 'i'
1343
+ 24: 0, # 'j'
1344
+ 10: 0, # 'k'
1345
+ 5: 2, # 'l'
1346
+ 13: 2, # 'm'
1347
+ 4: 0, # 'n'
1348
+ 15: 2, # 'o'
1349
+ 26: 0, # 'p'
1350
+ 7: 0, # 'r'
1351
+ 8: 0, # 's'
1352
+ 9: 1, # 't'
1353
+ 14: 3, # 'u'
1354
+ 32: 0, # 'v'
1355
+ 57: 0, # 'w'
1356
+ 58: 0, # 'x'
1357
+ 11: 1, # 'y'
1358
+ 22: 2, # 'z'
1359
+ 63: 0, # '·'
1360
+ 54: 1, # 'Ç'
1361
+ 50: 1, # 'Ö'
1362
+ 55: 0, # 'Ü'
1363
+ 59: 1, # 'â'
1364
+ 33: 2, # 'ç'
1365
+ 61: 0, # 'î'
1366
+ 34: 1, # 'ö'
1367
+ 17: 0, # 'ü'
1368
+ 30: 1, # 'ğ'
1369
+ 41: 1, # 'İ'
1370
+ 6: 3, # 'ı'
1371
+ 40: 2, # 'Ş'
1372
+ 19: 1, # 'ş'
1373
+ },
1374
+ 62: { # 'W'
1375
+ 23: 0, # 'A'
1376
+ 37: 0, # 'B'
1377
+ 47: 0, # 'C'
1378
+ 39: 0, # 'D'
1379
+ 29: 0, # 'E'
1380
+ 52: 0, # 'F'
1381
+ 36: 0, # 'G'
1382
+ 45: 0, # 'H'
1383
+ 53: 0, # 'I'
1384
+ 60: 0, # 'J'
1385
+ 16: 0, # 'K'
1386
+ 49: 0, # 'L'
1387
+ 20: 0, # 'M'
1388
+ 46: 0, # 'N'
1389
+ 42: 0, # 'O'
1390
+ 48: 0, # 'P'
1391
+ 44: 0, # 'R'
1392
+ 35: 0, # 'S'
1393
+ 31: 0, # 'T'
1394
+ 51: 0, # 'U'
1395
+ 38: 0, # 'V'
1396
+ 62: 0, # 'W'
1397
+ 43: 0, # 'Y'
1398
+ 56: 0, # 'Z'
1399
+ 1: 0, # 'a'
1400
+ 21: 0, # 'b'
1401
+ 28: 0, # 'c'
1402
+ 12: 0, # 'd'
1403
+ 2: 0, # 'e'
1404
+ 18: 0, # 'f'
1405
+ 27: 0, # 'g'
1406
+ 25: 0, # 'h'
1407
+ 3: 0, # 'i'
1408
+ 24: 0, # 'j'
1409
+ 10: 0, # 'k'
1410
+ 5: 0, # 'l'
1411
+ 13: 0, # 'm'
1412
+ 4: 0, # 'n'
1413
+ 15: 0, # 'o'
1414
+ 26: 0, # 'p'
1415
+ 7: 0, # 'r'
1416
+ 8: 0, # 's'
1417
+ 9: 0, # 't'
1418
+ 14: 0, # 'u'
1419
+ 32: 0, # 'v'
1420
+ 57: 0, # 'w'
1421
+ 58: 0, # 'x'
1422
+ 11: 0, # 'y'
1423
+ 22: 0, # 'z'
1424
+ 63: 0, # '·'
1425
+ 54: 0, # 'Ç'
1426
+ 50: 0, # 'Ö'
1427
+ 55: 0, # 'Ü'
1428
+ 59: 0, # 'â'
1429
+ 33: 0, # 'ç'
1430
+ 61: 0, # 'î'
1431
+ 34: 0, # 'ö'
1432
+ 17: 0, # 'ü'
1433
+ 30: 0, # 'ğ'
1434
+ 41: 0, # 'İ'
1435
+ 6: 0, # 'ı'
1436
+ 40: 0, # 'Ş'
1437
+ 19: 0, # 'ş'
1438
+ },
1439
+ 43: { # 'Y'
1440
+ 23: 0, # 'A'
1441
+ 37: 0, # 'B'
1442
+ 47: 1, # 'C'
1443
+ 39: 0, # 'D'
1444
+ 29: 0, # 'E'
1445
+ 52: 2, # 'F'
1446
+ 36: 0, # 'G'
1447
+ 45: 1, # 'H'
1448
+ 53: 1, # 'I'
1449
+ 60: 0, # 'J'
1450
+ 16: 2, # 'K'
1451
+ 49: 0, # 'L'
1452
+ 20: 0, # 'M'
1453
+ 46: 2, # 'N'
1454
+ 42: 0, # 'O'
1455
+ 48: 2, # 'P'
1456
+ 44: 1, # 'R'
1457
+ 35: 1, # 'S'
1458
+ 31: 0, # 'T'
1459
+ 51: 1, # 'U'
1460
+ 38: 2, # 'V'
1461
+ 62: 0, # 'W'
1462
+ 43: 0, # 'Y'
1463
+ 56: 0, # 'Z'
1464
+ 1: 3, # 'a'
1465
+ 21: 0, # 'b'
1466
+ 28: 2, # 'c'
1467
+ 12: 0, # 'd'
1468
+ 2: 2, # 'e'
1469
+ 18: 0, # 'f'
1470
+ 27: 0, # 'g'
1471
+ 25: 0, # 'h'
1472
+ 3: 0, # 'i'
1473
+ 24: 1, # 'j'
1474
+ 10: 1, # 'k'
1475
+ 5: 1, # 'l'
1476
+ 13: 3, # 'm'
1477
+ 4: 0, # 'n'
1478
+ 15: 2, # 'o'
1479
+ 26: 0, # 'p'
1480
+ 7: 0, # 'r'
1481
+ 8: 0, # 's'
1482
+ 9: 0, # 't'
1483
+ 14: 3, # 'u'
1484
+ 32: 0, # 'v'
1485
+ 57: 0, # 'w'
1486
+ 58: 1, # 'x'
1487
+ 11: 0, # 'y'
1488
+ 22: 2, # 'z'
1489
+ 63: 0, # '·'
1490
+ 54: 1, # 'Ç'
1491
+ 50: 2, # 'Ö'
1492
+ 55: 1, # 'Ü'
1493
+ 59: 1, # 'â'
1494
+ 33: 0, # 'ç'
1495
+ 61: 0, # 'î'
1496
+ 34: 1, # 'ö'
1497
+ 17: 0, # 'ü'
1498
+ 30: 1, # 'ğ'
1499
+ 41: 1, # 'İ'
1500
+ 6: 0, # 'ı'
1501
+ 40: 2, # 'Ş'
1502
+ 19: 1, # 'ş'
1503
+ },
1504
+ 56: { # 'Z'
1505
+ 23: 0, # 'A'
1506
+ 37: 0, # 'B'
1507
+ 47: 0, # 'C'
1508
+ 39: 0, # 'D'
1509
+ 29: 0, # 'E'
1510
+ 52: 0, # 'F'
1511
+ 36: 0, # 'G'
1512
+ 45: 0, # 'H'
1513
+ 53: 0, # 'I'
1514
+ 60: 0, # 'J'
1515
+ 16: 0, # 'K'
1516
+ 49: 0, # 'L'
1517
+ 20: 0, # 'M'
1518
+ 46: 0, # 'N'
1519
+ 42: 0, # 'O'
1520
+ 48: 0, # 'P'
1521
+ 44: 0, # 'R'
1522
+ 35: 0, # 'S'
1523
+ 31: 0, # 'T'
1524
+ 51: 0, # 'U'
1525
+ 38: 0, # 'V'
1526
+ 62: 0, # 'W'
1527
+ 43: 0, # 'Y'
1528
+ 56: 2, # 'Z'
1529
+ 1: 2, # 'a'
1530
+ 21: 1, # 'b'
1531
+ 28: 0, # 'c'
1532
+ 12: 0, # 'd'
1533
+ 2: 2, # 'e'
1534
+ 18: 0, # 'f'
1535
+ 27: 0, # 'g'
1536
+ 25: 0, # 'h'
1537
+ 3: 2, # 'i'
1538
+ 24: 1, # 'j'
1539
+ 10: 0, # 'k'
1540
+ 5: 0, # 'l'
1541
+ 13: 1, # 'm'
1542
+ 4: 1, # 'n'
1543
+ 15: 0, # 'o'
1544
+ 26: 0, # 'p'
1545
+ 7: 1, # 'r'
1546
+ 8: 1, # 's'
1547
+ 9: 0, # 't'
1548
+ 14: 2, # 'u'
1549
+ 32: 0, # 'v'
1550
+ 57: 0, # 'w'
1551
+ 58: 0, # 'x'
1552
+ 11: 0, # 'y'
1553
+ 22: 0, # 'z'
1554
+ 63: 0, # '·'
1555
+ 54: 0, # 'Ç'
1556
+ 50: 0, # 'Ö'
1557
+ 55: 0, # 'Ü'
1558
+ 59: 0, # 'â'
1559
+ 33: 0, # 'ç'
1560
+ 61: 0, # 'î'
1561
+ 34: 0, # 'ö'
1562
+ 17: 1, # 'ü'
1563
+ 30: 0, # 'ğ'
1564
+ 41: 0, # 'İ'
1565
+ 6: 1, # 'ı'
1566
+ 40: 0, # 'Ş'
1567
+ 19: 0, # 'ş'
1568
+ },
1569
+ 1: { # 'a'
1570
+ 23: 3, # 'A'
1571
+ 37: 0, # 'B'
1572
+ 47: 1, # 'C'
1573
+ 39: 0, # 'D'
1574
+ 29: 3, # 'E'
1575
+ 52: 0, # 'F'
1576
+ 36: 1, # 'G'
1577
+ 45: 1, # 'H'
1578
+ 53: 0, # 'I'
1579
+ 60: 0, # 'J'
1580
+ 16: 0, # 'K'
1581
+ 49: 0, # 'L'
1582
+ 20: 3, # 'M'
1583
+ 46: 1, # 'N'
1584
+ 42: 0, # 'O'
1585
+ 48: 1, # 'P'
1586
+ 44: 0, # 'R'
1587
+ 35: 0, # 'S'
1588
+ 31: 3, # 'T'
1589
+ 51: 0, # 'U'
1590
+ 38: 1, # 'V'
1591
+ 62: 0, # 'W'
1592
+ 43: 0, # 'Y'
1593
+ 56: 2, # 'Z'
1594
+ 1: 2, # 'a'
1595
+ 21: 3, # 'b'
1596
+ 28: 0, # 'c'
1597
+ 12: 3, # 'd'
1598
+ 2: 2, # 'e'
1599
+ 18: 3, # 'f'
1600
+ 27: 3, # 'g'
1601
+ 25: 3, # 'h'
1602
+ 3: 3, # 'i'
1603
+ 24: 3, # 'j'
1604
+ 10: 3, # 'k'
1605
+ 5: 0, # 'l'
1606
+ 13: 2, # 'm'
1607
+ 4: 3, # 'n'
1608
+ 15: 1, # 'o'
1609
+ 26: 3, # 'p'
1610
+ 7: 3, # 'r'
1611
+ 8: 3, # 's'
1612
+ 9: 3, # 't'
1613
+ 14: 3, # 'u'
1614
+ 32: 3, # 'v'
1615
+ 57: 2, # 'w'
1616
+ 58: 0, # 'x'
1617
+ 11: 3, # 'y'
1618
+ 22: 0, # 'z'
1619
+ 63: 1, # '·'
1620
+ 54: 0, # 'Ç'
1621
+ 50: 0, # 'Ö'
1622
+ 55: 0, # 'Ü'
1623
+ 59: 0, # 'â'
1624
+ 33: 1, # 'ç'
1625
+ 61: 1, # 'î'
1626
+ 34: 1, # 'ö'
1627
+ 17: 3, # 'ü'
1628
+ 30: 0, # 'ğ'
1629
+ 41: 0, # 'İ'
1630
+ 6: 3, # 'ı'
1631
+ 40: 0, # 'Ş'
1632
+ 19: 1, # 'ş'
1633
+ },
1634
+ 21: { # 'b'
1635
+ 23: 0, # 'A'
1636
+ 37: 0, # 'B'
1637
+ 47: 0, # 'C'
1638
+ 39: 0, # 'D'
1639
+ 29: 0, # 'E'
1640
+ 52: 0, # 'F'
1641
+ 36: 1, # 'G'
1642
+ 45: 0, # 'H'
1643
+ 53: 0, # 'I'
1644
+ 60: 1, # 'J'
1645
+ 16: 2, # 'K'
1646
+ 49: 0, # 'L'
1647
+ 20: 2, # 'M'
1648
+ 46: 0, # 'N'
1649
+ 42: 0, # 'O'
1650
+ 48: 0, # 'P'
1651
+ 44: 0, # 'R'
1652
+ 35: 0, # 'S'
1653
+ 31: 1, # 'T'
1654
+ 51: 0, # 'U'
1655
+ 38: 0, # 'V'
1656
+ 62: 0, # 'W'
1657
+ 43: 1, # 'Y'
1658
+ 56: 0, # 'Z'
1659
+ 1: 3, # 'a'
1660
+ 21: 2, # 'b'
1661
+ 28: 0, # 'c'
1662
+ 12: 3, # 'd'
1663
+ 2: 3, # 'e'
1664
+ 18: 0, # 'f'
1665
+ 27: 3, # 'g'
1666
+ 25: 1, # 'h'
1667
+ 3: 3, # 'i'
1668
+ 24: 2, # 'j'
1669
+ 10: 3, # 'k'
1670
+ 5: 3, # 'l'
1671
+ 13: 3, # 'm'
1672
+ 4: 3, # 'n'
1673
+ 15: 0, # 'o'
1674
+ 26: 3, # 'p'
1675
+ 7: 1, # 'r'
1676
+ 8: 2, # 's'
1677
+ 9: 2, # 't'
1678
+ 14: 2, # 'u'
1679
+ 32: 1, # 'v'
1680
+ 57: 0, # 'w'
1681
+ 58: 1, # 'x'
1682
+ 11: 3, # 'y'
1683
+ 22: 0, # 'z'
1684
+ 63: 0, # '·'
1685
+ 54: 0, # 'Ç'
1686
+ 50: 0, # 'Ö'
1687
+ 55: 0, # 'Ü'
1688
+ 59: 0, # 'â'
1689
+ 33: 1, # 'ç'
1690
+ 61: 0, # 'î'
1691
+ 34: 0, # 'ö'
1692
+ 17: 0, # 'ü'
1693
+ 30: 1, # 'ğ'
1694
+ 41: 0, # 'İ'
1695
+ 6: 2, # 'ı'
1696
+ 40: 0, # 'Ş'
1697
+ 19: 0, # 'ş'
1698
+ },
1699
+ 28: { # 'c'
1700
+ 23: 0, # 'A'
1701
+ 37: 1, # 'B'
1702
+ 47: 1, # 'C'
1703
+ 39: 1, # 'D'
1704
+ 29: 2, # 'E'
1705
+ 52: 0, # 'F'
1706
+ 36: 2, # 'G'
1707
+ 45: 2, # 'H'
1708
+ 53: 1, # 'I'
1709
+ 60: 0, # 'J'
1710
+ 16: 0, # 'K'
1711
+ 49: 0, # 'L'
1712
+ 20: 2, # 'M'
1713
+ 46: 1, # 'N'
1714
+ 42: 1, # 'O'
1715
+ 48: 2, # 'P'
1716
+ 44: 1, # 'R'
1717
+ 35: 1, # 'S'
1718
+ 31: 2, # 'T'
1719
+ 51: 2, # 'U'
1720
+ 38: 2, # 'V'
1721
+ 62: 0, # 'W'
1722
+ 43: 3, # 'Y'
1723
+ 56: 0, # 'Z'
1724
+ 1: 1, # 'a'
1725
+ 21: 1, # 'b'
1726
+ 28: 2, # 'c'
1727
+ 12: 2, # 'd'
1728
+ 2: 1, # 'e'
1729
+ 18: 1, # 'f'
1730
+ 27: 2, # 'g'
1731
+ 25: 2, # 'h'
1732
+ 3: 3, # 'i'
1733
+ 24: 1, # 'j'
1734
+ 10: 3, # 'k'
1735
+ 5: 0, # 'l'
1736
+ 13: 2, # 'm'
1737
+ 4: 3, # 'n'
1738
+ 15: 2, # 'o'
1739
+ 26: 2, # 'p'
1740
+ 7: 3, # 'r'
1741
+ 8: 3, # 's'
1742
+ 9: 3, # 't'
1743
+ 14: 1, # 'u'
1744
+ 32: 0, # 'v'
1745
+ 57: 1, # 'w'
1746
+ 58: 0, # 'x'
1747
+ 11: 2, # 'y'
1748
+ 22: 1, # 'z'
1749
+ 63: 1, # '·'
1750
+ 54: 0, # 'Ç'
1751
+ 50: 0, # 'Ö'
1752
+ 55: 1, # 'Ü'
1753
+ 59: 0, # 'â'
1754
+ 33: 0, # 'ç'
1755
+ 61: 1, # 'î'
1756
+ 34: 2, # 'ö'
1757
+ 17: 2, # 'ü'
1758
+ 30: 2, # 'ğ'
1759
+ 41: 1, # 'İ'
1760
+ 6: 3, # 'ı'
1761
+ 40: 0, # 'Ş'
1762
+ 19: 2, # 'ş'
1763
+ },
1764
+ 12: { # 'd'
1765
+ 23: 1, # 'A'
1766
+ 37: 0, # 'B'
1767
+ 47: 0, # 'C'
1768
+ 39: 0, # 'D'
1769
+ 29: 0, # 'E'
1770
+ 52: 0, # 'F'
1771
+ 36: 0, # 'G'
1772
+ 45: 0, # 'H'
1773
+ 53: 0, # 'I'
1774
+ 60: 2, # 'J'
1775
+ 16: 3, # 'K'
1776
+ 49: 0, # 'L'
1777
+ 20: 3, # 'M'
1778
+ 46: 0, # 'N'
1779
+ 42: 0, # 'O'
1780
+ 48: 0, # 'P'
1781
+ 44: 0, # 'R'
1782
+ 35: 1, # 'S'
1783
+ 31: 1, # 'T'
1784
+ 51: 0, # 'U'
1785
+ 38: 0, # 'V'
1786
+ 62: 0, # 'W'
1787
+ 43: 0, # 'Y'
1788
+ 56: 0, # 'Z'
1789
+ 1: 3, # 'a'
1790
+ 21: 2, # 'b'
1791
+ 28: 1, # 'c'
1792
+ 12: 3, # 'd'
1793
+ 2: 3, # 'e'
1794
+ 18: 1, # 'f'
1795
+ 27: 3, # 'g'
1796
+ 25: 3, # 'h'
1797
+ 3: 2, # 'i'
1798
+ 24: 3, # 'j'
1799
+ 10: 2, # 'k'
1800
+ 5: 3, # 'l'
1801
+ 13: 3, # 'm'
1802
+ 4: 3, # 'n'
1803
+ 15: 1, # 'o'
1804
+ 26: 2, # 'p'
1805
+ 7: 3, # 'r'
1806
+ 8: 2, # 's'
1807
+ 9: 2, # 't'
1808
+ 14: 3, # 'u'
1809
+ 32: 1, # 'v'
1810
+ 57: 0, # 'w'
1811
+ 58: 1, # 'x'
1812
+ 11: 3, # 'y'
1813
+ 22: 1, # 'z'
1814
+ 63: 1, # '·'
1815
+ 54: 0, # 'Ç'
1816
+ 50: 0, # 'Ö'
1817
+ 55: 0, # 'Ü'
1818
+ 59: 0, # 'â'
1819
+ 33: 0, # 'ç'
1820
+ 61: 0, # 'î'
1821
+ 34: 0, # 'ö'
1822
+ 17: 1, # 'ü'
1823
+ 30: 0, # 'ğ'
1824
+ 41: 0, # 'İ'
1825
+ 6: 2, # 'ı'
1826
+ 40: 0, # 'Ş'
1827
+ 19: 0, # 'ş'
1828
+ },
1829
+ 2: { # 'e'
1830
+ 23: 2, # 'A'
1831
+ 37: 0, # 'B'
1832
+ 47: 2, # 'C'
1833
+ 39: 0, # 'D'
1834
+ 29: 3, # 'E'
1835
+ 52: 1, # 'F'
1836
+ 36: 0, # 'G'
1837
+ 45: 0, # 'H'
1838
+ 53: 0, # 'I'
1839
+ 60: 0, # 'J'
1840
+ 16: 1, # 'K'
1841
+ 49: 0, # 'L'
1842
+ 20: 3, # 'M'
1843
+ 46: 1, # 'N'
1844
+ 42: 0, # 'O'
1845
+ 48: 1, # 'P'
1846
+ 44: 1, # 'R'
1847
+ 35: 0, # 'S'
1848
+ 31: 3, # 'T'
1849
+ 51: 0, # 'U'
1850
+ 38: 1, # 'V'
1851
+ 62: 0, # 'W'
1852
+ 43: 1, # 'Y'
1853
+ 56: 0, # 'Z'
1854
+ 1: 3, # 'a'
1855
+ 21: 3, # 'b'
1856
+ 28: 0, # 'c'
1857
+ 12: 3, # 'd'
1858
+ 2: 2, # 'e'
1859
+ 18: 3, # 'f'
1860
+ 27: 3, # 'g'
1861
+ 25: 3, # 'h'
1862
+ 3: 3, # 'i'
1863
+ 24: 3, # 'j'
1864
+ 10: 3, # 'k'
1865
+ 5: 0, # 'l'
1866
+ 13: 2, # 'm'
1867
+ 4: 3, # 'n'
1868
+ 15: 1, # 'o'
1869
+ 26: 3, # 'p'
1870
+ 7: 3, # 'r'
1871
+ 8: 3, # 's'
1872
+ 9: 3, # 't'
1873
+ 14: 3, # 'u'
1874
+ 32: 3, # 'v'
1875
+ 57: 2, # 'w'
1876
+ 58: 0, # 'x'
1877
+ 11: 3, # 'y'
1878
+ 22: 1, # 'z'
1879
+ 63: 1, # '·'
1880
+ 54: 0, # 'Ç'
1881
+ 50: 0, # 'Ö'
1882
+ 55: 0, # 'Ü'
1883
+ 59: 0, # 'â'
1884
+ 33: 1, # 'ç'
1885
+ 61: 0, # 'î'
1886
+ 34: 1, # 'ö'
1887
+ 17: 3, # 'ü'
1888
+ 30: 0, # 'ğ'
1889
+ 41: 0, # 'İ'
1890
+ 6: 3, # 'ı'
1891
+ 40: 0, # 'Ş'
1892
+ 19: 0, # 'ş'
1893
+ },
1894
+ 18: { # 'f'
1895
+ 23: 0, # 'A'
1896
+ 37: 0, # 'B'
1897
+ 47: 0, # 'C'
1898
+ 39: 0, # 'D'
1899
+ 29: 0, # 'E'
1900
+ 52: 0, # 'F'
1901
+ 36: 0, # 'G'
1902
+ 45: 0, # 'H'
1903
+ 53: 0, # 'I'
1904
+ 60: 0, # 'J'
1905
+ 16: 2, # 'K'
1906
+ 49: 0, # 'L'
1907
+ 20: 2, # 'M'
1908
+ 46: 0, # 'N'
1909
+ 42: 0, # 'O'
1910
+ 48: 0, # 'P'
1911
+ 44: 0, # 'R'
1912
+ 35: 0, # 'S'
1913
+ 31: 2, # 'T'
1914
+ 51: 0, # 'U'
1915
+ 38: 0, # 'V'
1916
+ 62: 0, # 'W'
1917
+ 43: 0, # 'Y'
1918
+ 56: 0, # 'Z'
1919
+ 1: 3, # 'a'
1920
+ 21: 1, # 'b'
1921
+ 28: 0, # 'c'
1922
+ 12: 3, # 'd'
1923
+ 2: 3, # 'e'
1924
+ 18: 2, # 'f'
1925
+ 27: 1, # 'g'
1926
+ 25: 1, # 'h'
1927
+ 3: 1, # 'i'
1928
+ 24: 1, # 'j'
1929
+ 10: 1, # 'k'
1930
+ 5: 3, # 'l'
1931
+ 13: 3, # 'm'
1932
+ 4: 3, # 'n'
1933
+ 15: 0, # 'o'
1934
+ 26: 2, # 'p'
1935
+ 7: 1, # 'r'
1936
+ 8: 3, # 's'
1937
+ 9: 3, # 't'
1938
+ 14: 1, # 'u'
1939
+ 32: 2, # 'v'
1940
+ 57: 0, # 'w'
1941
+ 58: 0, # 'x'
1942
+ 11: 1, # 'y'
1943
+ 22: 0, # 'z'
1944
+ 63: 0, # '·'
1945
+ 54: 0, # 'Ç'
1946
+ 50: 0, # 'Ö'
1947
+ 55: 0, # 'Ü'
1948
+ 59: 0, # 'â'
1949
+ 33: 1, # 'ç'
1950
+ 61: 0, # 'î'
1951
+ 34: 0, # 'ö'
1952
+ 17: 1, # 'ü'
1953
+ 30: 0, # 'ğ'
1954
+ 41: 0, # 'İ'
1955
+ 6: 1, # 'ı'
1956
+ 40: 0, # 'Ş'
1957
+ 19: 0, # 'ş'
1958
+ },
1959
+ 27: { # 'g'
1960
+ 23: 0, # 'A'
1961
+ 37: 0, # 'B'
1962
+ 47: 0, # 'C'
1963
+ 39: 0, # 'D'
1964
+ 29: 0, # 'E'
1965
+ 52: 0, # 'F'
1966
+ 36: 0, # 'G'
1967
+ 45: 0, # 'H'
1968
+ 53: 0, # 'I'
1969
+ 60: 0, # 'J'
1970
+ 16: 3, # 'K'
1971
+ 49: 0, # 'L'
1972
+ 20: 0, # 'M'
1973
+ 46: 0, # 'N'
1974
+ 42: 0, # 'O'
1975
+ 48: 0, # 'P'
1976
+ 44: 0, # 'R'
1977
+ 35: 1, # 'S'
1978
+ 31: 1, # 'T'
1979
+ 51: 0, # 'U'
1980
+ 38: 2, # 'V'
1981
+ 62: 0, # 'W'
1982
+ 43: 0, # 'Y'
1983
+ 56: 0, # 'Z'
1984
+ 1: 3, # 'a'
1985
+ 21: 1, # 'b'
1986
+ 28: 0, # 'c'
1987
+ 12: 1, # 'd'
1988
+ 2: 3, # 'e'
1989
+ 18: 0, # 'f'
1990
+ 27: 2, # 'g'
1991
+ 25: 1, # 'h'
1992
+ 3: 2, # 'i'
1993
+ 24: 3, # 'j'
1994
+ 10: 2, # 'k'
1995
+ 5: 3, # 'l'
1996
+ 13: 3, # 'm'
1997
+ 4: 2, # 'n'
1998
+ 15: 0, # 'o'
1999
+ 26: 1, # 'p'
2000
+ 7: 2, # 'r'
2001
+ 8: 2, # 's'
2002
+ 9: 3, # 't'
2003
+ 14: 3, # 'u'
2004
+ 32: 1, # 'v'
2005
+ 57: 0, # 'w'
2006
+ 58: 0, # 'x'
2007
+ 11: 1, # 'y'
2008
+ 22: 0, # 'z'
2009
+ 63: 1, # '·'
2010
+ 54: 0, # 'Ç'
2011
+ 50: 0, # 'Ö'
2012
+ 55: 0, # 'Ü'
2013
+ 59: 0, # 'â'
2014
+ 33: 0, # 'ç'
2015
+ 61: 0, # 'î'
2016
+ 34: 0, # 'ö'
2017
+ 17: 0, # 'ü'
2018
+ 30: 0, # 'ğ'
2019
+ 41: 0, # 'İ'
2020
+ 6: 2, # 'ı'
2021
+ 40: 0, # 'Ş'
2022
+ 19: 0, # 'ş'
2023
+ },
2024
+ 25: { # 'h'
2025
+ 23: 0, # 'A'
2026
+ 37: 0, # 'B'
2027
+ 47: 0, # 'C'
2028
+ 39: 0, # 'D'
2029
+ 29: 0, # 'E'
2030
+ 52: 0, # 'F'
2031
+ 36: 0, # 'G'
2032
+ 45: 0, # 'H'
2033
+ 53: 0, # 'I'
2034
+ 60: 0, # 'J'
2035
+ 16: 2, # 'K'
2036
+ 49: 0, # 'L'
2037
+ 20: 0, # 'M'
2038
+ 46: 0, # 'N'
2039
+ 42: 0, # 'O'
2040
+ 48: 0, # 'P'
2041
+ 44: 0, # 'R'
2042
+ 35: 0, # 'S'
2043
+ 31: 0, # 'T'
2044
+ 51: 0, # 'U'
2045
+ 38: 0, # 'V'
2046
+ 62: 0, # 'W'
2047
+ 43: 0, # 'Y'
2048
+ 56: 0, # 'Z'
2049
+ 1: 3, # 'a'
2050
+ 21: 0, # 'b'
2051
+ 28: 0, # 'c'
2052
+ 12: 2, # 'd'
2053
+ 2: 3, # 'e'
2054
+ 18: 0, # 'f'
2055
+ 27: 1, # 'g'
2056
+ 25: 2, # 'h'
2057
+ 3: 2, # 'i'
2058
+ 24: 3, # 'j'
2059
+ 10: 3, # 'k'
2060
+ 5: 3, # 'l'
2061
+ 13: 3, # 'm'
2062
+ 4: 3, # 'n'
2063
+ 15: 1, # 'o'
2064
+ 26: 1, # 'p'
2065
+ 7: 3, # 'r'
2066
+ 8: 3, # 's'
2067
+ 9: 2, # 't'
2068
+ 14: 3, # 'u'
2069
+ 32: 2, # 'v'
2070
+ 57: 1, # 'w'
2071
+ 58: 0, # 'x'
2072
+ 11: 1, # 'y'
2073
+ 22: 0, # 'z'
2074
+ 63: 0, # '·'
2075
+ 54: 0, # 'Ç'
2076
+ 50: 0, # 'Ö'
2077
+ 55: 0, # 'Ü'
2078
+ 59: 0, # 'â'
2079
+ 33: 0, # 'ç'
2080
+ 61: 0, # 'î'
2081
+ 34: 0, # 'ö'
2082
+ 17: 0, # 'ü'
2083
+ 30: 0, # 'ğ'
2084
+ 41: 0, # 'İ'
2085
+ 6: 3, # 'ı'
2086
+ 40: 0, # 'Ş'
2087
+ 19: 0, # 'ş'
2088
+ },
2089
+ 3: { # 'i'
2090
+ 23: 2, # 'A'
2091
+ 37: 0, # 'B'
2092
+ 47: 0, # 'C'
2093
+ 39: 0, # 'D'
2094
+ 29: 0, # 'E'
2095
+ 52: 0, # 'F'
2096
+ 36: 0, # 'G'
2097
+ 45: 0, # 'H'
2098
+ 53: 0, # 'I'
2099
+ 60: 1, # 'J'
2100
+ 16: 3, # 'K'
2101
+ 49: 0, # 'L'
2102
+ 20: 3, # 'M'
2103
+ 46: 0, # 'N'
2104
+ 42: 1, # 'O'
2105
+ 48: 0, # 'P'
2106
+ 44: 0, # 'R'
2107
+ 35: 1, # 'S'
2108
+ 31: 2, # 'T'
2109
+ 51: 0, # 'U'
2110
+ 38: 1, # 'V'
2111
+ 62: 0, # 'W'
2112
+ 43: 0, # 'Y'
2113
+ 56: 0, # 'Z'
2114
+ 1: 3, # 'a'
2115
+ 21: 2, # 'b'
2116
+ 28: 0, # 'c'
2117
+ 12: 3, # 'd'
2118
+ 2: 3, # 'e'
2119
+ 18: 2, # 'f'
2120
+ 27: 3, # 'g'
2121
+ 25: 1, # 'h'
2122
+ 3: 3, # 'i'
2123
+ 24: 2, # 'j'
2124
+ 10: 3, # 'k'
2125
+ 5: 3, # 'l'
2126
+ 13: 3, # 'm'
2127
+ 4: 3, # 'n'
2128
+ 15: 1, # 'o'
2129
+ 26: 3, # 'p'
2130
+ 7: 3, # 'r'
2131
+ 8: 3, # 's'
2132
+ 9: 3, # 't'
2133
+ 14: 3, # 'u'
2134
+ 32: 2, # 'v'
2135
+ 57: 1, # 'w'
2136
+ 58: 1, # 'x'
2137
+ 11: 3, # 'y'
2138
+ 22: 1, # 'z'
2139
+ 63: 1, # '·'
2140
+ 54: 0, # 'Ç'
2141
+ 50: 0, # 'Ö'
2142
+ 55: 1, # 'Ü'
2143
+ 59: 0, # 'â'
2144
+ 33: 2, # 'ç'
2145
+ 61: 0, # 'î'
2146
+ 34: 0, # 'ö'
2147
+ 17: 3, # 'ü'
2148
+ 30: 0, # 'ğ'
2149
+ 41: 1, # 'İ'
2150
+ 6: 2, # 'ı'
2151
+ 40: 0, # 'Ş'
2152
+ 19: 0, # 'ş'
2153
+ },
2154
+ 24: { # 'j'
2155
+ 23: 0, # 'A'
2156
+ 37: 0, # 'B'
2157
+ 47: 0, # 'C'
2158
+ 39: 0, # 'D'
2159
+ 29: 0, # 'E'
2160
+ 52: 0, # 'F'
2161
+ 36: 0, # 'G'
2162
+ 45: 0, # 'H'
2163
+ 53: 0, # 'I'
2164
+ 60: 1, # 'J'
2165
+ 16: 2, # 'K'
2166
+ 49: 0, # 'L'
2167
+ 20: 2, # 'M'
2168
+ 46: 0, # 'N'
2169
+ 42: 0, # 'O'
2170
+ 48: 1, # 'P'
2171
+ 44: 0, # 'R'
2172
+ 35: 0, # 'S'
2173
+ 31: 1, # 'T'
2174
+ 51: 0, # 'U'
2175
+ 38: 0, # 'V'
2176
+ 62: 0, # 'W'
2177
+ 43: 0, # 'Y'
2178
+ 56: 1, # 'Z'
2179
+ 1: 3, # 'a'
2180
+ 21: 1, # 'b'
2181
+ 28: 1, # 'c'
2182
+ 12: 3, # 'd'
2183
+ 2: 3, # 'e'
2184
+ 18: 2, # 'f'
2185
+ 27: 1, # 'g'
2186
+ 25: 1, # 'h'
2187
+ 3: 2, # 'i'
2188
+ 24: 1, # 'j'
2189
+ 10: 2, # 'k'
2190
+ 5: 2, # 'l'
2191
+ 13: 3, # 'm'
2192
+ 4: 2, # 'n'
2193
+ 15: 0, # 'o'
2194
+ 26: 1, # 'p'
2195
+ 7: 2, # 'r'
2196
+ 8: 3, # 's'
2197
+ 9: 2, # 't'
2198
+ 14: 3, # 'u'
2199
+ 32: 2, # 'v'
2200
+ 57: 0, # 'w'
2201
+ 58: 2, # 'x'
2202
+ 11: 1, # 'y'
2203
+ 22: 0, # 'z'
2204
+ 63: 0, # '·'
2205
+ 54: 0, # 'Ç'
2206
+ 50: 0, # 'Ö'
2207
+ 55: 0, # 'Ü'
2208
+ 59: 0, # 'â'
2209
+ 33: 1, # 'ç'
2210
+ 61: 0, # 'î'
2211
+ 34: 0, # 'ö'
2212
+ 17: 1, # 'ü'
2213
+ 30: 0, # 'ğ'
2214
+ 41: 0, # 'İ'
2215
+ 6: 3, # 'ı'
2216
+ 40: 0, # 'Ş'
2217
+ 19: 0, # 'ş'
2218
+ },
2219
+ 10: { # 'k'
2220
+ 23: 0, # 'A'
2221
+ 37: 0, # 'B'
2222
+ 47: 0, # 'C'
2223
+ 39: 0, # 'D'
2224
+ 29: 0, # 'E'
2225
+ 52: 0, # 'F'
2226
+ 36: 0, # 'G'
2227
+ 45: 0, # 'H'
2228
+ 53: 0, # 'I'
2229
+ 60: 0, # 'J'
2230
+ 16: 3, # 'K'
2231
+ 49: 0, # 'L'
2232
+ 20: 2, # 'M'
2233
+ 46: 0, # 'N'
2234
+ 42: 0, # 'O'
2235
+ 48: 0, # 'P'
2236
+ 44: 0, # 'R'
2237
+ 35: 0, # 'S'
2238
+ 31: 3, # 'T'
2239
+ 51: 0, # 'U'
2240
+ 38: 1, # 'V'
2241
+ 62: 0, # 'W'
2242
+ 43: 0, # 'Y'
2243
+ 56: 1, # 'Z'
2244
+ 1: 3, # 'a'
2245
+ 21: 2, # 'b'
2246
+ 28: 0, # 'c'
2247
+ 12: 2, # 'd'
2248
+ 2: 3, # 'e'
2249
+ 18: 1, # 'f'
2250
+ 27: 2, # 'g'
2251
+ 25: 2, # 'h'
2252
+ 3: 3, # 'i'
2253
+ 24: 2, # 'j'
2254
+ 10: 2, # 'k'
2255
+ 5: 3, # 'l'
2256
+ 13: 3, # 'm'
2257
+ 4: 3, # 'n'
2258
+ 15: 0, # 'o'
2259
+ 26: 3, # 'p'
2260
+ 7: 2, # 'r'
2261
+ 8: 2, # 's'
2262
+ 9: 2, # 't'
2263
+ 14: 3, # 'u'
2264
+ 32: 0, # 'v'
2265
+ 57: 0, # 'w'
2266
+ 58: 1, # 'x'
2267
+ 11: 3, # 'y'
2268
+ 22: 0, # 'z'
2269
+ 63: 1, # '·'
2270
+ 54: 0, # 'Ç'
2271
+ 50: 0, # 'Ö'
2272
+ 55: 0, # 'Ü'
2273
+ 59: 0, # 'â'
2274
+ 33: 3, # 'ç'
2275
+ 61: 0, # 'î'
2276
+ 34: 1, # 'ö'
2277
+ 17: 3, # 'ü'
2278
+ 30: 1, # 'ğ'
2279
+ 41: 0, # 'İ'
2280
+ 6: 3, # 'ı'
2281
+ 40: 0, # 'Ş'
2282
+ 19: 1, # 'ş'
2283
+ },
2284
+ 5: { # 'l'
2285
+ 23: 0, # 'A'
2286
+ 37: 0, # 'B'
2287
+ 47: 0, # 'C'
2288
+ 39: 0, # 'D'
2289
+ 29: 3, # 'E'
2290
+ 52: 0, # 'F'
2291
+ 36: 0, # 'G'
2292
+ 45: 0, # 'H'
2293
+ 53: 0, # 'I'
2294
+ 60: 0, # 'J'
2295
+ 16: 0, # 'K'
2296
+ 49: 0, # 'L'
2297
+ 20: 2, # 'M'
2298
+ 46: 0, # 'N'
2299
+ 42: 0, # 'O'
2300
+ 48: 0, # 'P'
2301
+ 44: 0, # 'R'
2302
+ 35: 0, # 'S'
2303
+ 31: 1, # 'T'
2304
+ 51: 0, # 'U'
2305
+ 38: 0, # 'V'
2306
+ 62: 0, # 'W'
2307
+ 43: 0, # 'Y'
2308
+ 56: 0, # 'Z'
2309
+ 1: 0, # 'a'
2310
+ 21: 3, # 'b'
2311
+ 28: 0, # 'c'
2312
+ 12: 3, # 'd'
2313
+ 2: 1, # 'e'
2314
+ 18: 3, # 'f'
2315
+ 27: 3, # 'g'
2316
+ 25: 2, # 'h'
2317
+ 3: 3, # 'i'
2318
+ 24: 2, # 'j'
2319
+ 10: 3, # 'k'
2320
+ 5: 1, # 'l'
2321
+ 13: 1, # 'm'
2322
+ 4: 3, # 'n'
2323
+ 15: 0, # 'o'
2324
+ 26: 2, # 'p'
2325
+ 7: 3, # 'r'
2326
+ 8: 3, # 's'
2327
+ 9: 3, # 't'
2328
+ 14: 2, # 'u'
2329
+ 32: 2, # 'v'
2330
+ 57: 0, # 'w'
2331
+ 58: 0, # 'x'
2332
+ 11: 3, # 'y'
2333
+ 22: 0, # 'z'
2334
+ 63: 0, # '·'
2335
+ 54: 0, # 'Ç'
2336
+ 50: 0, # 'Ö'
2337
+ 55: 0, # 'Ü'
2338
+ 59: 0, # 'â'
2339
+ 33: 1, # 'ç'
2340
+ 61: 0, # 'î'
2341
+ 34: 0, # 'ö'
2342
+ 17: 2, # 'ü'
2343
+ 30: 0, # 'ğ'
2344
+ 41: 0, # 'İ'
2345
+ 6: 3, # 'ı'
2346
+ 40: 0, # 'Ş'
2347
+ 19: 0, # 'ş'
2348
+ },
2349
+ 13: { # 'm'
2350
+ 23: 1, # 'A'
2351
+ 37: 0, # 'B'
2352
+ 47: 0, # 'C'
2353
+ 39: 0, # 'D'
2354
+ 29: 3, # 'E'
2355
+ 52: 0, # 'F'
2356
+ 36: 0, # 'G'
2357
+ 45: 0, # 'H'
2358
+ 53: 0, # 'I'
2359
+ 60: 0, # 'J'
2360
+ 16: 0, # 'K'
2361
+ 49: 0, # 'L'
2362
+ 20: 3, # 'M'
2363
+ 46: 0, # 'N'
2364
+ 42: 0, # 'O'
2365
+ 48: 0, # 'P'
2366
+ 44: 0, # 'R'
2367
+ 35: 0, # 'S'
2368
+ 31: 3, # 'T'
2369
+ 51: 0, # 'U'
2370
+ 38: 0, # 'V'
2371
+ 62: 0, # 'W'
2372
+ 43: 1, # 'Y'
2373
+ 56: 0, # 'Z'
2374
+ 1: 2, # 'a'
2375
+ 21: 3, # 'b'
2376
+ 28: 0, # 'c'
2377
+ 12: 3, # 'd'
2378
+ 2: 2, # 'e'
2379
+ 18: 3, # 'f'
2380
+ 27: 3, # 'g'
2381
+ 25: 3, # 'h'
2382
+ 3: 3, # 'i'
2383
+ 24: 3, # 'j'
2384
+ 10: 3, # 'k'
2385
+ 5: 0, # 'l'
2386
+ 13: 2, # 'm'
2387
+ 4: 3, # 'n'
2388
+ 15: 1, # 'o'
2389
+ 26: 2, # 'p'
2390
+ 7: 3, # 'r'
2391
+ 8: 3, # 's'
2392
+ 9: 3, # 't'
2393
+ 14: 2, # 'u'
2394
+ 32: 2, # 'v'
2395
+ 57: 1, # 'w'
2396
+ 58: 0, # 'x'
2397
+ 11: 3, # 'y'
2398
+ 22: 0, # 'z'
2399
+ 63: 0, # '·'
2400
+ 54: 0, # 'Ç'
2401
+ 50: 0, # 'Ö'
2402
+ 55: 0, # 'Ü'
2403
+ 59: 0, # 'â'
2404
+ 33: 0, # 'ç'
2405
+ 61: 0, # 'î'
2406
+ 34: 0, # 'ö'
2407
+ 17: 3, # 'ü'
2408
+ 30: 0, # 'ğ'
2409
+ 41: 0, # 'İ'
2410
+ 6: 3, # 'ı'
2411
+ 40: 0, # 'Ş'
2412
+ 19: 1, # 'ş'
2413
+ },
2414
+ 4: { # 'n'
2415
+ 23: 1, # 'A'
2416
+ 37: 0, # 'B'
2417
+ 47: 0, # 'C'
2418
+ 39: 0, # 'D'
2419
+ 29: 0, # 'E'
2420
+ 52: 0, # 'F'
2421
+ 36: 0, # 'G'
2422
+ 45: 1, # 'H'
2423
+ 53: 0, # 'I'
2424
+ 60: 2, # 'J'
2425
+ 16: 3, # 'K'
2426
+ 49: 0, # 'L'
2427
+ 20: 3, # 'M'
2428
+ 46: 0, # 'N'
2429
+ 42: 0, # 'O'
2430
+ 48: 0, # 'P'
2431
+ 44: 0, # 'R'
2432
+ 35: 0, # 'S'
2433
+ 31: 2, # 'T'
2434
+ 51: 0, # 'U'
2435
+ 38: 0, # 'V'
2436
+ 62: 0, # 'W'
2437
+ 43: 0, # 'Y'
2438
+ 56: 0, # 'Z'
2439
+ 1: 3, # 'a'
2440
+ 21: 2, # 'b'
2441
+ 28: 1, # 'c'
2442
+ 12: 3, # 'd'
2443
+ 2: 3, # 'e'
2444
+ 18: 1, # 'f'
2445
+ 27: 2, # 'g'
2446
+ 25: 3, # 'h'
2447
+ 3: 2, # 'i'
2448
+ 24: 2, # 'j'
2449
+ 10: 3, # 'k'
2450
+ 5: 3, # 'l'
2451
+ 13: 3, # 'm'
2452
+ 4: 3, # 'n'
2453
+ 15: 1, # 'o'
2454
+ 26: 3, # 'p'
2455
+ 7: 2, # 'r'
2456
+ 8: 3, # 's'
2457
+ 9: 3, # 't'
2458
+ 14: 3, # 'u'
2459
+ 32: 2, # 'v'
2460
+ 57: 0, # 'w'
2461
+ 58: 2, # 'x'
2462
+ 11: 3, # 'y'
2463
+ 22: 0, # 'z'
2464
+ 63: 0, # '·'
2465
+ 54: 0, # 'Ç'
2466
+ 50: 0, # 'Ö'
2467
+ 55: 0, # 'Ü'
2468
+ 59: 0, # 'â'
2469
+ 33: 1, # 'ç'
2470
+ 61: 0, # 'î'
2471
+ 34: 0, # 'ö'
2472
+ 17: 2, # 'ü'
2473
+ 30: 0, # 'ğ'
2474
+ 41: 0, # 'İ'
2475
+ 6: 1, # 'ı'
2476
+ 40: 0, # 'Ş'
2477
+ 19: 0, # 'ş'
2478
+ },
2479
+ 15: { # 'o'
2480
+ 23: 0, # 'A'
2481
+ 37: 0, # 'B'
2482
+ 47: 1, # 'C'
2483
+ 39: 0, # 'D'
2484
+ 29: 0, # 'E'
2485
+ 52: 2, # 'F'
2486
+ 36: 1, # 'G'
2487
+ 45: 1, # 'H'
2488
+ 53: 1, # 'I'
2489
+ 60: 0, # 'J'
2490
+ 16: 3, # 'K'
2491
+ 49: 2, # 'L'
2492
+ 20: 0, # 'M'
2493
+ 46: 2, # 'N'
2494
+ 42: 1, # 'O'
2495
+ 48: 2, # 'P'
2496
+ 44: 1, # 'R'
2497
+ 35: 0, # 'S'
2498
+ 31: 0, # 'T'
2499
+ 51: 0, # 'U'
2500
+ 38: 0, # 'V'
2501
+ 62: 0, # 'W'
2502
+ 43: 0, # 'Y'
2503
+ 56: 0, # 'Z'
2504
+ 1: 3, # 'a'
2505
+ 21: 0, # 'b'
2506
+ 28: 2, # 'c'
2507
+ 12: 0, # 'd'
2508
+ 2: 3, # 'e'
2509
+ 18: 0, # 'f'
2510
+ 27: 0, # 'g'
2511
+ 25: 0, # 'h'
2512
+ 3: 1, # 'i'
2513
+ 24: 2, # 'j'
2514
+ 10: 1, # 'k'
2515
+ 5: 3, # 'l'
2516
+ 13: 3, # 'm'
2517
+ 4: 2, # 'n'
2518
+ 15: 2, # 'o'
2519
+ 26: 0, # 'p'
2520
+ 7: 1, # 'r'
2521
+ 8: 0, # 's'
2522
+ 9: 0, # 't'
2523
+ 14: 3, # 'u'
2524
+ 32: 0, # 'v'
2525
+ 57: 0, # 'w'
2526
+ 58: 2, # 'x'
2527
+ 11: 0, # 'y'
2528
+ 22: 2, # 'z'
2529
+ 63: 0, # '·'
2530
+ 54: 1, # 'Ç'
2531
+ 50: 2, # 'Ö'
2532
+ 55: 0, # 'Ü'
2533
+ 59: 0, # 'â'
2534
+ 33: 3, # 'ç'
2535
+ 61: 0, # 'î'
2536
+ 34: 1, # 'ö'
2537
+ 17: 0, # 'ü'
2538
+ 30: 2, # 'ğ'
2539
+ 41: 2, # 'İ'
2540
+ 6: 3, # 'ı'
2541
+ 40: 2, # 'Ş'
2542
+ 19: 2, # 'ş'
2543
+ },
2544
+ 26: { # 'p'
2545
+ 23: 0, # 'A'
2546
+ 37: 0, # 'B'
2547
+ 47: 0, # 'C'
2548
+ 39: 0, # 'D'
2549
+ 29: 0, # 'E'
2550
+ 52: 0, # 'F'
2551
+ 36: 0, # 'G'
2552
+ 45: 0, # 'H'
2553
+ 53: 0, # 'I'
2554
+ 60: 0, # 'J'
2555
+ 16: 3, # 'K'
2556
+ 49: 0, # 'L'
2557
+ 20: 1, # 'M'
2558
+ 46: 0, # 'N'
2559
+ 42: 0, # 'O'
2560
+ 48: 0, # 'P'
2561
+ 44: 0, # 'R'
2562
+ 35: 0, # 'S'
2563
+ 31: 0, # 'T'
2564
+ 51: 0, # 'U'
2565
+ 38: 0, # 'V'
2566
+ 62: 0, # 'W'
2567
+ 43: 0, # 'Y'
2568
+ 56: 0, # 'Z'
2569
+ 1: 3, # 'a'
2570
+ 21: 1, # 'b'
2571
+ 28: 0, # 'c'
2572
+ 12: 1, # 'd'
2573
+ 2: 3, # 'e'
2574
+ 18: 0, # 'f'
2575
+ 27: 1, # 'g'
2576
+ 25: 1, # 'h'
2577
+ 3: 2, # 'i'
2578
+ 24: 3, # 'j'
2579
+ 10: 1, # 'k'
2580
+ 5: 3, # 'l'
2581
+ 13: 3, # 'm'
2582
+ 4: 2, # 'n'
2583
+ 15: 0, # 'o'
2584
+ 26: 2, # 'p'
2585
+ 7: 2, # 'r'
2586
+ 8: 1, # 's'
2587
+ 9: 1, # 't'
2588
+ 14: 3, # 'u'
2589
+ 32: 0, # 'v'
2590
+ 57: 0, # 'w'
2591
+ 58: 1, # 'x'
2592
+ 11: 1, # 'y'
2593
+ 22: 0, # 'z'
2594
+ 63: 0, # '·'
2595
+ 54: 0, # 'Ç'
2596
+ 50: 0, # 'Ö'
2597
+ 55: 0, # 'Ü'
2598
+ 59: 0, # 'â'
2599
+ 33: 3, # 'ç'
2600
+ 61: 0, # 'î'
2601
+ 34: 0, # 'ö'
2602
+ 17: 1, # 'ü'
2603
+ 30: 0, # 'ğ'
2604
+ 41: 0, # 'İ'
2605
+ 6: 3, # 'ı'
2606
+ 40: 0, # 'Ş'
2607
+ 19: 0, # 'ş'
2608
+ },
2609
+ 7: { # 'r'
2610
+ 23: 0, # 'A'
2611
+ 37: 0, # 'B'
2612
+ 47: 0, # 'C'
2613
+ 39: 0, # 'D'
2614
+ 29: 0, # 'E'
2615
+ 52: 1, # 'F'
2616
+ 36: 0, # 'G'
2617
+ 45: 0, # 'H'
2618
+ 53: 0, # 'I'
2619
+ 60: 2, # 'J'
2620
+ 16: 3, # 'K'
2621
+ 49: 0, # 'L'
2622
+ 20: 2, # 'M'
2623
+ 46: 0, # 'N'
2624
+ 42: 0, # 'O'
2625
+ 48: 0, # 'P'
2626
+ 44: 0, # 'R'
2627
+ 35: 0, # 'S'
2628
+ 31: 2, # 'T'
2629
+ 51: 1, # 'U'
2630
+ 38: 0, # 'V'
2631
+ 62: 0, # 'W'
2632
+ 43: 0, # 'Y'
2633
+ 56: 1, # 'Z'
2634
+ 1: 3, # 'a'
2635
+ 21: 1, # 'b'
2636
+ 28: 0, # 'c'
2637
+ 12: 3, # 'd'
2638
+ 2: 3, # 'e'
2639
+ 18: 0, # 'f'
2640
+ 27: 2, # 'g'
2641
+ 25: 3, # 'h'
2642
+ 3: 2, # 'i'
2643
+ 24: 2, # 'j'
2644
+ 10: 3, # 'k'
2645
+ 5: 3, # 'l'
2646
+ 13: 3, # 'm'
2647
+ 4: 3, # 'n'
2648
+ 15: 0, # 'o'
2649
+ 26: 2, # 'p'
2650
+ 7: 3, # 'r'
2651
+ 8: 3, # 's'
2652
+ 9: 3, # 't'
2653
+ 14: 3, # 'u'
2654
+ 32: 2, # 'v'
2655
+ 57: 0, # 'w'
2656
+ 58: 1, # 'x'
2657
+ 11: 2, # 'y'
2658
+ 22: 0, # 'z'
2659
+ 63: 1, # '·'
2660
+ 54: 0, # 'Ç'
2661
+ 50: 0, # 'Ö'
2662
+ 55: 0, # 'Ü'
2663
+ 59: 0, # 'â'
2664
+ 33: 2, # 'ç'
2665
+ 61: 0, # 'î'
2666
+ 34: 0, # 'ö'
2667
+ 17: 3, # 'ü'
2668
+ 30: 0, # 'ğ'
2669
+ 41: 0, # 'İ'
2670
+ 6: 2, # 'ı'
2671
+ 40: 0, # 'Ş'
2672
+ 19: 0, # 'ş'
2673
+ },
2674
+ 8: { # 's'
2675
+ 23: 1, # 'A'
2676
+ 37: 0, # 'B'
2677
+ 47: 0, # 'C'
2678
+ 39: 0, # 'D'
2679
+ 29: 0, # 'E'
2680
+ 52: 0, # 'F'
2681
+ 36: 1, # 'G'
2682
+ 45: 0, # 'H'
2683
+ 53: 0, # 'I'
2684
+ 60: 0, # 'J'
2685
+ 16: 3, # 'K'
2686
+ 49: 0, # 'L'
2687
+ 20: 3, # 'M'
2688
+ 46: 0, # 'N'
2689
+ 42: 0, # 'O'
2690
+ 48: 0, # 'P'
2691
+ 44: 0, # 'R'
2692
+ 35: 0, # 'S'
2693
+ 31: 2, # 'T'
2694
+ 51: 0, # 'U'
2695
+ 38: 0, # 'V'
2696
+ 62: 0, # 'W'
2697
+ 43: 0, # 'Y'
2698
+ 56: 1, # 'Z'
2699
+ 1: 3, # 'a'
2700
+ 21: 2, # 'b'
2701
+ 28: 1, # 'c'
2702
+ 12: 3, # 'd'
2703
+ 2: 3, # 'e'
2704
+ 18: 0, # 'f'
2705
+ 27: 2, # 'g'
2706
+ 25: 2, # 'h'
2707
+ 3: 2, # 'i'
2708
+ 24: 3, # 'j'
2709
+ 10: 3, # 'k'
2710
+ 5: 3, # 'l'
2711
+ 13: 3, # 'm'
2712
+ 4: 3, # 'n'
2713
+ 15: 0, # 'o'
2714
+ 26: 3, # 'p'
2715
+ 7: 3, # 'r'
2716
+ 8: 3, # 's'
2717
+ 9: 3, # 't'
2718
+ 14: 3, # 'u'
2719
+ 32: 2, # 'v'
2720
+ 57: 0, # 'w'
2721
+ 58: 1, # 'x'
2722
+ 11: 2, # 'y'
2723
+ 22: 1, # 'z'
2724
+ 63: 0, # '·'
2725
+ 54: 0, # 'Ç'
2726
+ 50: 0, # 'Ö'
2727
+ 55: 0, # 'Ü'
2728
+ 59: 0, # 'â'
2729
+ 33: 2, # 'ç'
2730
+ 61: 0, # 'î'
2731
+ 34: 0, # 'ö'
2732
+ 17: 2, # 'ü'
2733
+ 30: 0, # 'ğ'
2734
+ 41: 0, # 'İ'
2735
+ 6: 3, # 'ı'
2736
+ 40: 0, # 'Ş'
2737
+ 19: 1, # 'ş'
2738
+ },
2739
+ 9: { # 't'
2740
+ 23: 0, # 'A'
2741
+ 37: 0, # 'B'
2742
+ 47: 0, # 'C'
2743
+ 39: 0, # 'D'
2744
+ 29: 0, # 'E'
2745
+ 52: 0, # 'F'
2746
+ 36: 0, # 'G'
2747
+ 45: 0, # 'H'
2748
+ 53: 0, # 'I'
2749
+ 60: 1, # 'J'
2750
+ 16: 3, # 'K'
2751
+ 49: 0, # 'L'
2752
+ 20: 2, # 'M'
2753
+ 46: 0, # 'N'
2754
+ 42: 0, # 'O'
2755
+ 48: 0, # 'P'
2756
+ 44: 0, # 'R'
2757
+ 35: 0, # 'S'
2758
+ 31: 2, # 'T'
2759
+ 51: 0, # 'U'
2760
+ 38: 0, # 'V'
2761
+ 62: 0, # 'W'
2762
+ 43: 0, # 'Y'
2763
+ 56: 1, # 'Z'
2764
+ 1: 3, # 'a'
2765
+ 21: 3, # 'b'
2766
+ 28: 0, # 'c'
2767
+ 12: 3, # 'd'
2768
+ 2: 3, # 'e'
2769
+ 18: 2, # 'f'
2770
+ 27: 2, # 'g'
2771
+ 25: 2, # 'h'
2772
+ 3: 2, # 'i'
2773
+ 24: 2, # 'j'
2774
+ 10: 3, # 'k'
2775
+ 5: 3, # 'l'
2776
+ 13: 3, # 'm'
2777
+ 4: 3, # 'n'
2778
+ 15: 0, # 'o'
2779
+ 26: 2, # 'p'
2780
+ 7: 3, # 'r'
2781
+ 8: 3, # 's'
2782
+ 9: 3, # 't'
2783
+ 14: 3, # 'u'
2784
+ 32: 3, # 'v'
2785
+ 57: 0, # 'w'
2786
+ 58: 2, # 'x'
2787
+ 11: 2, # 'y'
2788
+ 22: 0, # 'z'
2789
+ 63: 0, # '·'
2790
+ 54: 0, # 'Ç'
2791
+ 50: 0, # 'Ö'
2792
+ 55: 0, # 'Ü'
2793
+ 59: 0, # 'â'
2794
+ 33: 3, # 'ç'
2795
+ 61: 0, # 'î'
2796
+ 34: 0, # 'ö'
2797
+ 17: 2, # 'ü'
2798
+ 30: 0, # 'ğ'
2799
+ 41: 0, # 'İ'
2800
+ 6: 3, # 'ı'
2801
+ 40: 0, # 'Ş'
2802
+ 19: 0, # 'ş'
2803
+ },
2804
+ 14: { # 'u'
2805
+ 23: 3, # 'A'
2806
+ 37: 0, # 'B'
2807
+ 47: 0, # 'C'
2808
+ 39: 0, # 'D'
2809
+ 29: 3, # 'E'
2810
+ 52: 0, # 'F'
2811
+ 36: 0, # 'G'
2812
+ 45: 1, # 'H'
2813
+ 53: 0, # 'I'
2814
+ 60: 1, # 'J'
2815
+ 16: 0, # 'K'
2816
+ 49: 0, # 'L'
2817
+ 20: 3, # 'M'
2818
+ 46: 2, # 'N'
2819
+ 42: 0, # 'O'
2820
+ 48: 1, # 'P'
2821
+ 44: 0, # 'R'
2822
+ 35: 0, # 'S'
2823
+ 31: 3, # 'T'
2824
+ 51: 0, # 'U'
2825
+ 38: 0, # 'V'
2826
+ 62: 0, # 'W'
2827
+ 43: 1, # 'Y'
2828
+ 56: 2, # 'Z'
2829
+ 1: 2, # 'a'
2830
+ 21: 3, # 'b'
2831
+ 28: 0, # 'c'
2832
+ 12: 3, # 'd'
2833
+ 2: 2, # 'e'
2834
+ 18: 2, # 'f'
2835
+ 27: 3, # 'g'
2836
+ 25: 3, # 'h'
2837
+ 3: 3, # 'i'
2838
+ 24: 2, # 'j'
2839
+ 10: 3, # 'k'
2840
+ 5: 0, # 'l'
2841
+ 13: 3, # 'm'
2842
+ 4: 3, # 'n'
2843
+ 15: 0, # 'o'
2844
+ 26: 3, # 'p'
2845
+ 7: 3, # 'r'
2846
+ 8: 3, # 's'
2847
+ 9: 3, # 't'
2848
+ 14: 3, # 'u'
2849
+ 32: 2, # 'v'
2850
+ 57: 2, # 'w'
2851
+ 58: 0, # 'x'
2852
+ 11: 3, # 'y'
2853
+ 22: 0, # 'z'
2854
+ 63: 1, # '·'
2855
+ 54: 0, # 'Ç'
2856
+ 50: 0, # 'Ö'
2857
+ 55: 0, # 'Ü'
2858
+ 59: 0, # 'â'
2859
+ 33: 0, # 'ç'
2860
+ 61: 0, # 'î'
2861
+ 34: 0, # 'ö'
2862
+ 17: 3, # 'ü'
2863
+ 30: 1, # 'ğ'
2864
+ 41: 0, # 'İ'
2865
+ 6: 3, # 'ı'
2866
+ 40: 0, # 'Ş'
2867
+ 19: 0, # 'ş'
2868
+ },
2869
+ 32: { # 'v'
2870
+ 23: 0, # 'A'
2871
+ 37: 0, # 'B'
2872
+ 47: 0, # 'C'
2873
+ 39: 0, # 'D'
2874
+ 29: 0, # 'E'
2875
+ 52: 0, # 'F'
2876
+ 36: 0, # 'G'
2877
+ 45: 0, # 'H'
2878
+ 53: 0, # 'I'
2879
+ 60: 0, # 'J'
2880
+ 16: 3, # 'K'
2881
+ 49: 0, # 'L'
2882
+ 20: 1, # 'M'
2883
+ 46: 0, # 'N'
2884
+ 42: 0, # 'O'
2885
+ 48: 0, # 'P'
2886
+ 44: 0, # 'R'
2887
+ 35: 0, # 'S'
2888
+ 31: 0, # 'T'
2889
+ 51: 0, # 'U'
2890
+ 38: 0, # 'V'
2891
+ 62: 0, # 'W'
2892
+ 43: 0, # 'Y'
2893
+ 56: 0, # 'Z'
2894
+ 1: 3, # 'a'
2895
+ 21: 0, # 'b'
2896
+ 28: 0, # 'c'
2897
+ 12: 3, # 'd'
2898
+ 2: 3, # 'e'
2899
+ 18: 0, # 'f'
2900
+ 27: 0, # 'g'
2901
+ 25: 0, # 'h'
2902
+ 3: 0, # 'i'
2903
+ 24: 1, # 'j'
2904
+ 10: 1, # 'k'
2905
+ 5: 3, # 'l'
2906
+ 13: 2, # 'm'
2907
+ 4: 3, # 'n'
2908
+ 15: 0, # 'o'
2909
+ 26: 1, # 'p'
2910
+ 7: 1, # 'r'
2911
+ 8: 2, # 's'
2912
+ 9: 3, # 't'
2913
+ 14: 3, # 'u'
2914
+ 32: 1, # 'v'
2915
+ 57: 0, # 'w'
2916
+ 58: 0, # 'x'
2917
+ 11: 0, # 'y'
2918
+ 22: 0, # 'z'
2919
+ 63: 0, # '·'
2920
+ 54: 0, # 'Ç'
2921
+ 50: 0, # 'Ö'
2922
+ 55: 0, # 'Ü'
2923
+ 59: 0, # 'â'
2924
+ 33: 2, # 'ç'
2925
+ 61: 0, # 'î'
2926
+ 34: 0, # 'ö'
2927
+ 17: 0, # 'ü'
2928
+ 30: 0, # 'ğ'
2929
+ 41: 0, # 'İ'
2930
+ 6: 1, # 'ı'
2931
+ 40: 0, # 'Ş'
2932
+ 19: 0, # 'ş'
2933
+ },
2934
+ 57: { # 'w'
2935
+ 23: 0, # 'A'
2936
+ 37: 0, # 'B'
2937
+ 47: 0, # 'C'
2938
+ 39: 0, # 'D'
2939
+ 29: 0, # 'E'
2940
+ 52: 0, # 'F'
2941
+ 36: 0, # 'G'
2942
+ 45: 0, # 'H'
2943
+ 53: 0, # 'I'
2944
+ 60: 0, # 'J'
2945
+ 16: 0, # 'K'
2946
+ 49: 0, # 'L'
2947
+ 20: 0, # 'M'
2948
+ 46: 0, # 'N'
2949
+ 42: 0, # 'O'
2950
+ 48: 0, # 'P'
2951
+ 44: 0, # 'R'
2952
+ 35: 0, # 'S'
2953
+ 31: 0, # 'T'
2954
+ 51: 1, # 'U'
2955
+ 38: 0, # 'V'
2956
+ 62: 0, # 'W'
2957
+ 43: 0, # 'Y'
2958
+ 56: 0, # 'Z'
2959
+ 1: 1, # 'a'
2960
+ 21: 0, # 'b'
2961
+ 28: 0, # 'c'
2962
+ 12: 0, # 'd'
2963
+ 2: 2, # 'e'
2964
+ 18: 0, # 'f'
2965
+ 27: 0, # 'g'
2966
+ 25: 1, # 'h'
2967
+ 3: 0, # 'i'
2968
+ 24: 0, # 'j'
2969
+ 10: 1, # 'k'
2970
+ 5: 0, # 'l'
2971
+ 13: 0, # 'm'
2972
+ 4: 1, # 'n'
2973
+ 15: 0, # 'o'
2974
+ 26: 0, # 'p'
2975
+ 7: 0, # 'r'
2976
+ 8: 1, # 's'
2977
+ 9: 0, # 't'
2978
+ 14: 1, # 'u'
2979
+ 32: 0, # 'v'
2980
+ 57: 2, # 'w'
2981
+ 58: 0, # 'x'
2982
+ 11: 0, # 'y'
2983
+ 22: 0, # 'z'
2984
+ 63: 1, # '·'
2985
+ 54: 0, # 'Ç'
2986
+ 50: 0, # 'Ö'
2987
+ 55: 0, # 'Ü'
2988
+ 59: 0, # 'â'
2989
+ 33: 0, # 'ç'
2990
+ 61: 0, # 'î'
2991
+ 34: 0, # 'ö'
2992
+ 17: 1, # 'ü'
2993
+ 30: 0, # 'ğ'
2994
+ 41: 0, # 'İ'
2995
+ 6: 0, # 'ı'
2996
+ 40: 0, # 'Ş'
2997
+ 19: 0, # 'ş'
2998
+ },
2999
+ 58: { # 'x'
3000
+ 23: 0, # 'A'
3001
+ 37: 0, # 'B'
3002
+ 47: 0, # 'C'
3003
+ 39: 0, # 'D'
3004
+ 29: 1, # 'E'
3005
+ 52: 0, # 'F'
3006
+ 36: 0, # 'G'
3007
+ 45: 0, # 'H'
3008
+ 53: 0, # 'I'
3009
+ 60: 1, # 'J'
3010
+ 16: 0, # 'K'
3011
+ 49: 0, # 'L'
3012
+ 20: 1, # 'M'
3013
+ 46: 0, # 'N'
3014
+ 42: 0, # 'O'
3015
+ 48: 0, # 'P'
3016
+ 44: 0, # 'R'
3017
+ 35: 0, # 'S'
3018
+ 31: 0, # 'T'
3019
+ 51: 0, # 'U'
3020
+ 38: 0, # 'V'
3021
+ 62: 0, # 'W'
3022
+ 43: 0, # 'Y'
3023
+ 56: 0, # 'Z'
3024
+ 1: 0, # 'a'
3025
+ 21: 1, # 'b'
3026
+ 28: 0, # 'c'
3027
+ 12: 2, # 'd'
3028
+ 2: 1, # 'e'
3029
+ 18: 0, # 'f'
3030
+ 27: 0, # 'g'
3031
+ 25: 0, # 'h'
3032
+ 3: 2, # 'i'
3033
+ 24: 2, # 'j'
3034
+ 10: 1, # 'k'
3035
+ 5: 0, # 'l'
3036
+ 13: 0, # 'm'
3037
+ 4: 2, # 'n'
3038
+ 15: 0, # 'o'
3039
+ 26: 0, # 'p'
3040
+ 7: 1, # 'r'
3041
+ 8: 2, # 's'
3042
+ 9: 1, # 't'
3043
+ 14: 0, # 'u'
3044
+ 32: 0, # 'v'
3045
+ 57: 0, # 'w'
3046
+ 58: 0, # 'x'
3047
+ 11: 2, # 'y'
3048
+ 22: 0, # 'z'
3049
+ 63: 0, # '·'
3050
+ 54: 0, # 'Ç'
3051
+ 50: 0, # 'Ö'
3052
+ 55: 0, # 'Ü'
3053
+ 59: 0, # 'â'
3054
+ 33: 0, # 'ç'
3055
+ 61: 0, # 'î'
3056
+ 34: 0, # 'ö'
3057
+ 17: 1, # 'ü'
3058
+ 30: 0, # 'ğ'
3059
+ 41: 0, # 'İ'
3060
+ 6: 2, # 'ı'
3061
+ 40: 0, # 'Ş'
3062
+ 19: 0, # 'ş'
3063
+ },
3064
+ 11: { # 'y'
3065
+ 23: 1, # 'A'
3066
+ 37: 0, # 'B'
3067
+ 47: 0, # 'C'
3068
+ 39: 0, # 'D'
3069
+ 29: 0, # 'E'
3070
+ 52: 0, # 'F'
3071
+ 36: 0, # 'G'
3072
+ 45: 0, # 'H'
3073
+ 53: 0, # 'I'
3074
+ 60: 1, # 'J'
3075
+ 16: 3, # 'K'
3076
+ 49: 0, # 'L'
3077
+ 20: 1, # 'M'
3078
+ 46: 0, # 'N'
3079
+ 42: 0, # 'O'
3080
+ 48: 0, # 'P'
3081
+ 44: 0, # 'R'
3082
+ 35: 0, # 'S'
3083
+ 31: 1, # 'T'
3084
+ 51: 0, # 'U'
3085
+ 38: 0, # 'V'
3086
+ 62: 0, # 'W'
3087
+ 43: 1, # 'Y'
3088
+ 56: 1, # 'Z'
3089
+ 1: 3, # 'a'
3090
+ 21: 1, # 'b'
3091
+ 28: 0, # 'c'
3092
+ 12: 2, # 'd'
3093
+ 2: 3, # 'e'
3094
+ 18: 0, # 'f'
3095
+ 27: 2, # 'g'
3096
+ 25: 2, # 'h'
3097
+ 3: 2, # 'i'
3098
+ 24: 1, # 'j'
3099
+ 10: 2, # 'k'
3100
+ 5: 3, # 'l'
3101
+ 13: 3, # 'm'
3102
+ 4: 3, # 'n'
3103
+ 15: 0, # 'o'
3104
+ 26: 1, # 'p'
3105
+ 7: 2, # 'r'
3106
+ 8: 1, # 's'
3107
+ 9: 2, # 't'
3108
+ 14: 3, # 'u'
3109
+ 32: 0, # 'v'
3110
+ 57: 0, # 'w'
3111
+ 58: 1, # 'x'
3112
+ 11: 3, # 'y'
3113
+ 22: 0, # 'z'
3114
+ 63: 0, # '·'
3115
+ 54: 0, # 'Ç'
3116
+ 50: 0, # 'Ö'
3117
+ 55: 0, # 'Ü'
3118
+ 59: 0, # 'â'
3119
+ 33: 3, # 'ç'
3120
+ 61: 0, # 'î'
3121
+ 34: 0, # 'ö'
3122
+ 17: 2, # 'ü'
3123
+ 30: 0, # 'ğ'
3124
+ 41: 0, # 'İ'
3125
+ 6: 3, # 'ı'
3126
+ 40: 0, # 'Ş'
3127
+ 19: 0, # 'ş'
3128
+ },
3129
+ 22: { # 'z'
3130
+ 23: 2, # 'A'
3131
+ 37: 2, # 'B'
3132
+ 47: 1, # 'C'
3133
+ 39: 2, # 'D'
3134
+ 29: 3, # 'E'
3135
+ 52: 1, # 'F'
3136
+ 36: 2, # 'G'
3137
+ 45: 2, # 'H'
3138
+ 53: 1, # 'I'
3139
+ 60: 0, # 'J'
3140
+ 16: 0, # 'K'
3141
+ 49: 0, # 'L'
3142
+ 20: 3, # 'M'
3143
+ 46: 2, # 'N'
3144
+ 42: 2, # 'O'
3145
+ 48: 2, # 'P'
3146
+ 44: 1, # 'R'
3147
+ 35: 1, # 'S'
3148
+ 31: 3, # 'T'
3149
+ 51: 2, # 'U'
3150
+ 38: 2, # 'V'
3151
+ 62: 0, # 'W'
3152
+ 43: 2, # 'Y'
3153
+ 56: 1, # 'Z'
3154
+ 1: 1, # 'a'
3155
+ 21: 2, # 'b'
3156
+ 28: 1, # 'c'
3157
+ 12: 2, # 'd'
3158
+ 2: 2, # 'e'
3159
+ 18: 3, # 'f'
3160
+ 27: 2, # 'g'
3161
+ 25: 2, # 'h'
3162
+ 3: 3, # 'i'
3163
+ 24: 2, # 'j'
3164
+ 10: 3, # 'k'
3165
+ 5: 0, # 'l'
3166
+ 13: 2, # 'm'
3167
+ 4: 3, # 'n'
3168
+ 15: 2, # 'o'
3169
+ 26: 2, # 'p'
3170
+ 7: 3, # 'r'
3171
+ 8: 3, # 's'
3172
+ 9: 3, # 't'
3173
+ 14: 0, # 'u'
3174
+ 32: 2, # 'v'
3175
+ 57: 0, # 'w'
3176
+ 58: 0, # 'x'
3177
+ 11: 3, # 'y'
3178
+ 22: 2, # 'z'
3179
+ 63: 1, # '·'
3180
+ 54: 0, # 'Ç'
3181
+ 50: 0, # 'Ö'
3182
+ 55: 2, # 'Ü'
3183
+ 59: 1, # 'â'
3184
+ 33: 0, # 'ç'
3185
+ 61: 0, # 'î'
3186
+ 34: 2, # 'ö'
3187
+ 17: 2, # 'ü'
3188
+ 30: 2, # 'ğ'
3189
+ 41: 1, # 'İ'
3190
+ 6: 3, # 'ı'
3191
+ 40: 1, # 'Ş'
3192
+ 19: 2, # 'ş'
3193
+ },
3194
+ 63: { # '·'
3195
+ 23: 0, # 'A'
3196
+ 37: 0, # 'B'
3197
+ 47: 0, # 'C'
3198
+ 39: 0, # 'D'
3199
+ 29: 0, # 'E'
3200
+ 52: 0, # 'F'
3201
+ 36: 0, # 'G'
3202
+ 45: 0, # 'H'
3203
+ 53: 0, # 'I'
3204
+ 60: 0, # 'J'
3205
+ 16: 0, # 'K'
3206
+ 49: 0, # 'L'
3207
+ 20: 0, # 'M'
3208
+ 46: 0, # 'N'
3209
+ 42: 0, # 'O'
3210
+ 48: 0, # 'P'
3211
+ 44: 0, # 'R'
3212
+ 35: 0, # 'S'
3213
+ 31: 0, # 'T'
3214
+ 51: 0, # 'U'
3215
+ 38: 0, # 'V'
3216
+ 62: 0, # 'W'
3217
+ 43: 0, # 'Y'
3218
+ 56: 0, # 'Z'
3219
+ 1: 0, # 'a'
3220
+ 21: 0, # 'b'
3221
+ 28: 0, # 'c'
3222
+ 12: 0, # 'd'
3223
+ 2: 1, # 'e'
3224
+ 18: 0, # 'f'
3225
+ 27: 0, # 'g'
3226
+ 25: 0, # 'h'
3227
+ 3: 0, # 'i'
3228
+ 24: 0, # 'j'
3229
+ 10: 0, # 'k'
3230
+ 5: 0, # 'l'
3231
+ 13: 2, # 'm'
3232
+ 4: 0, # 'n'
3233
+ 15: 0, # 'o'
3234
+ 26: 0, # 'p'
3235
+ 7: 0, # 'r'
3236
+ 8: 0, # 's'
3237
+ 9: 0, # 't'
3238
+ 14: 2, # 'u'
3239
+ 32: 0, # 'v'
3240
+ 57: 0, # 'w'
3241
+ 58: 0, # 'x'
3242
+ 11: 0, # 'y'
3243
+ 22: 0, # 'z'
3244
+ 63: 0, # '·'
3245
+ 54: 0, # 'Ç'
3246
+ 50: 0, # 'Ö'
3247
+ 55: 0, # 'Ü'
3248
+ 59: 0, # 'â'
3249
+ 33: 0, # 'ç'
3250
+ 61: 0, # 'î'
3251
+ 34: 0, # 'ö'
3252
+ 17: 0, # 'ü'
3253
+ 30: 0, # 'ğ'
3254
+ 41: 0, # 'İ'
3255
+ 6: 0, # 'ı'
3256
+ 40: 0, # 'Ş'
3257
+ 19: 0, # 'ş'
3258
+ },
3259
+ 54: { # 'Ç'
3260
+ 23: 0, # 'A'
3261
+ 37: 0, # 'B'
3262
+ 47: 1, # 'C'
3263
+ 39: 1, # 'D'
3264
+ 29: 0, # 'E'
3265
+ 52: 0, # 'F'
3266
+ 36: 1, # 'G'
3267
+ 45: 1, # 'H'
3268
+ 53: 1, # 'I'
3269
+ 60: 0, # 'J'
3270
+ 16: 0, # 'K'
3271
+ 49: 0, # 'L'
3272
+ 20: 0, # 'M'
3273
+ 46: 0, # 'N'
3274
+ 42: 1, # 'O'
3275
+ 48: 1, # 'P'
3276
+ 44: 0, # 'R'
3277
+ 35: 0, # 'S'
3278
+ 31: 0, # 'T'
3279
+ 51: 1, # 'U'
3280
+ 38: 1, # 'V'
3281
+ 62: 0, # 'W'
3282
+ 43: 2, # 'Y'
3283
+ 56: 0, # 'Z'
3284
+ 1: 0, # 'a'
3285
+ 21: 1, # 'b'
3286
+ 28: 0, # 'c'
3287
+ 12: 1, # 'd'
3288
+ 2: 0, # 'e'
3289
+ 18: 0, # 'f'
3290
+ 27: 1, # 'g'
3291
+ 25: 0, # 'h'
3292
+ 3: 3, # 'i'
3293
+ 24: 0, # 'j'
3294
+ 10: 1, # 'k'
3295
+ 5: 0, # 'l'
3296
+ 13: 0, # 'm'
3297
+ 4: 2, # 'n'
3298
+ 15: 1, # 'o'
3299
+ 26: 0, # 'p'
3300
+ 7: 2, # 'r'
3301
+ 8: 0, # 's'
3302
+ 9: 1, # 't'
3303
+ 14: 0, # 'u'
3304
+ 32: 2, # 'v'
3305
+ 57: 0, # 'w'
3306
+ 58: 0, # 'x'
3307
+ 11: 0, # 'y'
3308
+ 22: 0, # 'z'
3309
+ 63: 0, # '·'
3310
+ 54: 0, # 'Ç'
3311
+ 50: 0, # 'Ö'
3312
+ 55: 2, # 'Ü'
3313
+ 59: 0, # 'â'
3314
+ 33: 0, # 'ç'
3315
+ 61: 0, # 'î'
3316
+ 34: 1, # 'ö'
3317
+ 17: 0, # 'ü'
3318
+ 30: 0, # 'ğ'
3319
+ 41: 0, # 'İ'
3320
+ 6: 2, # 'ı'
3321
+ 40: 0, # 'Ş'
3322
+ 19: 1, # 'ş'
3323
+ },
3324
+ 50: { # 'Ö'
3325
+ 23: 0, # 'A'
3326
+ 37: 0, # 'B'
3327
+ 47: 1, # 'C'
3328
+ 39: 1, # 'D'
3329
+ 29: 2, # 'E'
3330
+ 52: 0, # 'F'
3331
+ 36: 1, # 'G'
3332
+ 45: 2, # 'H'
3333
+ 53: 0, # 'I'
3334
+ 60: 0, # 'J'
3335
+ 16: 0, # 'K'
3336
+ 49: 0, # 'L'
3337
+ 20: 1, # 'M'
3338
+ 46: 1, # 'N'
3339
+ 42: 2, # 'O'
3340
+ 48: 2, # 'P'
3341
+ 44: 1, # 'R'
3342
+ 35: 0, # 'S'
3343
+ 31: 0, # 'T'
3344
+ 51: 1, # 'U'
3345
+ 38: 1, # 'V'
3346
+ 62: 0, # 'W'
3347
+ 43: 2, # 'Y'
3348
+ 56: 0, # 'Z'
3349
+ 1: 0, # 'a'
3350
+ 21: 2, # 'b'
3351
+ 28: 1, # 'c'
3352
+ 12: 2, # 'd'
3353
+ 2: 0, # 'e'
3354
+ 18: 1, # 'f'
3355
+ 27: 1, # 'g'
3356
+ 25: 1, # 'h'
3357
+ 3: 2, # 'i'
3358
+ 24: 0, # 'j'
3359
+ 10: 2, # 'k'
3360
+ 5: 0, # 'l'
3361
+ 13: 0, # 'm'
3362
+ 4: 3, # 'n'
3363
+ 15: 2, # 'o'
3364
+ 26: 2, # 'p'
3365
+ 7: 3, # 'r'
3366
+ 8: 1, # 's'
3367
+ 9: 2, # 't'
3368
+ 14: 0, # 'u'
3369
+ 32: 1, # 'v'
3370
+ 57: 0, # 'w'
3371
+ 58: 0, # 'x'
3372
+ 11: 0, # 'y'
3373
+ 22: 1, # 'z'
3374
+ 63: 0, # '·'
3375
+ 54: 0, # 'Ç'
3376
+ 50: 0, # 'Ö'
3377
+ 55: 0, # 'Ü'
3378
+ 59: 0, # 'â'
3379
+ 33: 0, # 'ç'
3380
+ 61: 0, # 'î'
3381
+ 34: 2, # 'ö'
3382
+ 17: 2, # 'ü'
3383
+ 30: 1, # 'ğ'
3384
+ 41: 0, # 'İ'
3385
+ 6: 2, # 'ı'
3386
+ 40: 0, # 'Ş'
3387
+ 19: 1, # 'ş'
3388
+ },
3389
+ 55: { # 'Ü'
3390
+ 23: 0, # 'A'
3391
+ 37: 0, # 'B'
3392
+ 47: 0, # 'C'
3393
+ 39: 0, # 'D'
3394
+ 29: 0, # 'E'
3395
+ 52: 2, # 'F'
3396
+ 36: 0, # 'G'
3397
+ 45: 0, # 'H'
3398
+ 53: 0, # 'I'
3399
+ 60: 0, # 'J'
3400
+ 16: 1, # 'K'
3401
+ 49: 0, # 'L'
3402
+ 20: 0, # 'M'
3403
+ 46: 0, # 'N'
3404
+ 42: 0, # 'O'
3405
+ 48: 1, # 'P'
3406
+ 44: 0, # 'R'
3407
+ 35: 0, # 'S'
3408
+ 31: 0, # 'T'
3409
+ 51: 0, # 'U'
3410
+ 38: 1, # 'V'
3411
+ 62: 0, # 'W'
3412
+ 43: 0, # 'Y'
3413
+ 56: 0, # 'Z'
3414
+ 1: 2, # 'a'
3415
+ 21: 0, # 'b'
3416
+ 28: 2, # 'c'
3417
+ 12: 0, # 'd'
3418
+ 2: 2, # 'e'
3419
+ 18: 0, # 'f'
3420
+ 27: 1, # 'g'
3421
+ 25: 0, # 'h'
3422
+ 3: 0, # 'i'
3423
+ 24: 0, # 'j'
3424
+ 10: 0, # 'k'
3425
+ 5: 1, # 'l'
3426
+ 13: 1, # 'm'
3427
+ 4: 1, # 'n'
3428
+ 15: 0, # 'o'
3429
+ 26: 0, # 'p'
3430
+ 7: 0, # 'r'
3431
+ 8: 0, # 's'
3432
+ 9: 1, # 't'
3433
+ 14: 2, # 'u'
3434
+ 32: 0, # 'v'
3435
+ 57: 0, # 'w'
3436
+ 58: 0, # 'x'
3437
+ 11: 0, # 'y'
3438
+ 22: 1, # 'z'
3439
+ 63: 0, # '·'
3440
+ 54: 0, # 'Ç'
3441
+ 50: 1, # 'Ö'
3442
+ 55: 0, # 'Ü'
3443
+ 59: 0, # 'â'
3444
+ 33: 0, # 'ç'
3445
+ 61: 0, # 'î'
3446
+ 34: 1, # 'ö'
3447
+ 17: 0, # 'ü'
3448
+ 30: 1, # 'ğ'
3449
+ 41: 1, # 'İ'
3450
+ 6: 0, # 'ı'
3451
+ 40: 0, # 'Ş'
3452
+ 19: 1, # 'ş'
3453
+ },
3454
+ 59: { # 'â'
3455
+ 23: 0, # 'A'
3456
+ 37: 0, # 'B'
3457
+ 47: 0, # 'C'
3458
+ 39: 0, # 'D'
3459
+ 29: 0, # 'E'
3460
+ 52: 0, # 'F'
3461
+ 36: 1, # 'G'
3462
+ 45: 0, # 'H'
3463
+ 53: 0, # 'I'
3464
+ 60: 0, # 'J'
3465
+ 16: 1, # 'K'
3466
+ 49: 0, # 'L'
3467
+ 20: 0, # 'M'
3468
+ 46: 0, # 'N'
3469
+ 42: 0, # 'O'
3470
+ 48: 0, # 'P'
3471
+ 44: 0, # 'R'
3472
+ 35: 0, # 'S'
3473
+ 31: 0, # 'T'
3474
+ 51: 0, # 'U'
3475
+ 38: 0, # 'V'
3476
+ 62: 0, # 'W'
3477
+ 43: 0, # 'Y'
3478
+ 56: 0, # 'Z'
3479
+ 1: 2, # 'a'
3480
+ 21: 0, # 'b'
3481
+ 28: 0, # 'c'
3482
+ 12: 0, # 'd'
3483
+ 2: 2, # 'e'
3484
+ 18: 0, # 'f'
3485
+ 27: 0, # 'g'
3486
+ 25: 0, # 'h'
3487
+ 3: 0, # 'i'
3488
+ 24: 0, # 'j'
3489
+ 10: 0, # 'k'
3490
+ 5: 0, # 'l'
3491
+ 13: 2, # 'm'
3492
+ 4: 0, # 'n'
3493
+ 15: 1, # 'o'
3494
+ 26: 0, # 'p'
3495
+ 7: 0, # 'r'
3496
+ 8: 0, # 's'
3497
+ 9: 0, # 't'
3498
+ 14: 2, # 'u'
3499
+ 32: 0, # 'v'
3500
+ 57: 0, # 'w'
3501
+ 58: 0, # 'x'
3502
+ 11: 0, # 'y'
3503
+ 22: 1, # 'z'
3504
+ 63: 0, # '·'
3505
+ 54: 0, # 'Ç'
3506
+ 50: 0, # 'Ö'
3507
+ 55: 0, # 'Ü'
3508
+ 59: 0, # 'â'
3509
+ 33: 0, # 'ç'
3510
+ 61: 0, # 'î'
3511
+ 34: 0, # 'ö'
3512
+ 17: 0, # 'ü'
3513
+ 30: 0, # 'ğ'
3514
+ 41: 0, # 'İ'
3515
+ 6: 1, # 'ı'
3516
+ 40: 1, # 'Ş'
3517
+ 19: 0, # 'ş'
3518
+ },
3519
+ 33: { # 'ç'
3520
+ 23: 0, # 'A'
3521
+ 37: 0, # 'B'
3522
+ 47: 0, # 'C'
3523
+ 39: 0, # 'D'
3524
+ 29: 3, # 'E'
3525
+ 52: 0, # 'F'
3526
+ 36: 0, # 'G'
3527
+ 45: 0, # 'H'
3528
+ 53: 0, # 'I'
3529
+ 60: 0, # 'J'
3530
+ 16: 0, # 'K'
3531
+ 49: 0, # 'L'
3532
+ 20: 1, # 'M'
3533
+ 46: 0, # 'N'
3534
+ 42: 0, # 'O'
3535
+ 48: 0, # 'P'
3536
+ 44: 0, # 'R'
3537
+ 35: 0, # 'S'
3538
+ 31: 2, # 'T'
3539
+ 51: 0, # 'U'
3540
+ 38: 1, # 'V'
3541
+ 62: 0, # 'W'
3542
+ 43: 0, # 'Y'
3543
+ 56: 0, # 'Z'
3544
+ 1: 0, # 'a'
3545
+ 21: 3, # 'b'
3546
+ 28: 0, # 'c'
3547
+ 12: 2, # 'd'
3548
+ 2: 0, # 'e'
3549
+ 18: 2, # 'f'
3550
+ 27: 1, # 'g'
3551
+ 25: 3, # 'h'
3552
+ 3: 3, # 'i'
3553
+ 24: 0, # 'j'
3554
+ 10: 3, # 'k'
3555
+ 5: 0, # 'l'
3556
+ 13: 0, # 'm'
3557
+ 4: 3, # 'n'
3558
+ 15: 0, # 'o'
3559
+ 26: 1, # 'p'
3560
+ 7: 3, # 'r'
3561
+ 8: 2, # 's'
3562
+ 9: 3, # 't'
3563
+ 14: 0, # 'u'
3564
+ 32: 2, # 'v'
3565
+ 57: 0, # 'w'
3566
+ 58: 0, # 'x'
3567
+ 11: 2, # 'y'
3568
+ 22: 0, # 'z'
3569
+ 63: 0, # '·'
3570
+ 54: 0, # 'Ç'
3571
+ 50: 0, # 'Ö'
3572
+ 55: 0, # 'Ü'
3573
+ 59: 0, # 'â'
3574
+ 33: 0, # 'ç'
3575
+ 61: 0, # 'î'
3576
+ 34: 0, # 'ö'
3577
+ 17: 1, # 'ü'
3578
+ 30: 0, # 'ğ'
3579
+ 41: 0, # 'İ'
3580
+ 6: 3, # 'ı'
3581
+ 40: 0, # 'Ş'
3582
+ 19: 0, # 'ş'
3583
+ },
3584
+ 61: { # 'î'
3585
+ 23: 0, # 'A'
3586
+ 37: 0, # 'B'
3587
+ 47: 0, # 'C'
3588
+ 39: 0, # 'D'
3589
+ 29: 0, # 'E'
3590
+ 52: 0, # 'F'
3591
+ 36: 0, # 'G'
3592
+ 45: 0, # 'H'
3593
+ 53: 0, # 'I'
3594
+ 60: 0, # 'J'
3595
+ 16: 0, # 'K'
3596
+ 49: 0, # 'L'
3597
+ 20: 0, # 'M'
3598
+ 46: 0, # 'N'
3599
+ 42: 0, # 'O'
3600
+ 48: 0, # 'P'
3601
+ 44: 0, # 'R'
3602
+ 35: 0, # 'S'
3603
+ 31: 0, # 'T'
3604
+ 51: 0, # 'U'
3605
+ 38: 0, # 'V'
3606
+ 62: 0, # 'W'
3607
+ 43: 0, # 'Y'
3608
+ 56: 1, # 'Z'
3609
+ 1: 2, # 'a'
3610
+ 21: 0, # 'b'
3611
+ 28: 0, # 'c'
3612
+ 12: 0, # 'd'
3613
+ 2: 2, # 'e'
3614
+ 18: 0, # 'f'
3615
+ 27: 0, # 'g'
3616
+ 25: 0, # 'h'
3617
+ 3: 0, # 'i'
3618
+ 24: 1, # 'j'
3619
+ 10: 0, # 'k'
3620
+ 5: 0, # 'l'
3621
+ 13: 1, # 'm'
3622
+ 4: 1, # 'n'
3623
+ 15: 0, # 'o'
3624
+ 26: 0, # 'p'
3625
+ 7: 0, # 'r'
3626
+ 8: 0, # 's'
3627
+ 9: 0, # 't'
3628
+ 14: 1, # 'u'
3629
+ 32: 0, # 'v'
3630
+ 57: 0, # 'w'
3631
+ 58: 0, # 'x'
3632
+ 11: 0, # 'y'
3633
+ 22: 1, # 'z'
3634
+ 63: 0, # '·'
3635
+ 54: 0, # 'Ç'
3636
+ 50: 0, # 'Ö'
3637
+ 55: 0, # 'Ü'
3638
+ 59: 0, # 'â'
3639
+ 33: 0, # 'ç'
3640
+ 61: 1, # 'î'
3641
+ 34: 0, # 'ö'
3642
+ 17: 0, # 'ü'
3643
+ 30: 0, # 'ğ'
3644
+ 41: 0, # 'İ'
3645
+ 6: 1, # 'ı'
3646
+ 40: 0, # 'Ş'
3647
+ 19: 0, # 'ş'
3648
+ },
3649
+ 34: { # 'ö'
3650
+ 23: 0, # 'A'
3651
+ 37: 1, # 'B'
3652
+ 47: 1, # 'C'
3653
+ 39: 0, # 'D'
3654
+ 29: 0, # 'E'
3655
+ 52: 2, # 'F'
3656
+ 36: 1, # 'G'
3657
+ 45: 1, # 'H'
3658
+ 53: 0, # 'I'
3659
+ 60: 0, # 'J'
3660
+ 16: 3, # 'K'
3661
+ 49: 1, # 'L'
3662
+ 20: 0, # 'M'
3663
+ 46: 1, # 'N'
3664
+ 42: 1, # 'O'
3665
+ 48: 2, # 'P'
3666
+ 44: 1, # 'R'
3667
+ 35: 1, # 'S'
3668
+ 31: 1, # 'T'
3669
+ 51: 1, # 'U'
3670
+ 38: 1, # 'V'
3671
+ 62: 0, # 'W'
3672
+ 43: 0, # 'Y'
3673
+ 56: 1, # 'Z'
3674
+ 1: 3, # 'a'
3675
+ 21: 1, # 'b'
3676
+ 28: 2, # 'c'
3677
+ 12: 1, # 'd'
3678
+ 2: 3, # 'e'
3679
+ 18: 0, # 'f'
3680
+ 27: 2, # 'g'
3681
+ 25: 2, # 'h'
3682
+ 3: 1, # 'i'
3683
+ 24: 2, # 'j'
3684
+ 10: 1, # 'k'
3685
+ 5: 2, # 'l'
3686
+ 13: 3, # 'm'
3687
+ 4: 2, # 'n'
3688
+ 15: 2, # 'o'
3689
+ 26: 0, # 'p'
3690
+ 7: 0, # 'r'
3691
+ 8: 3, # 's'
3692
+ 9: 1, # 't'
3693
+ 14: 3, # 'u'
3694
+ 32: 0, # 'v'
3695
+ 57: 0, # 'w'
3696
+ 58: 0, # 'x'
3697
+ 11: 1, # 'y'
3698
+ 22: 2, # 'z'
3699
+ 63: 0, # '·'
3700
+ 54: 1, # 'Ç'
3701
+ 50: 2, # 'Ö'
3702
+ 55: 0, # 'Ü'
3703
+ 59: 0, # 'â'
3704
+ 33: 2, # 'ç'
3705
+ 61: 0, # 'î'
3706
+ 34: 2, # 'ö'
3707
+ 17: 0, # 'ü'
3708
+ 30: 2, # 'ğ'
3709
+ 41: 1, # 'İ'
3710
+ 6: 1, # 'ı'
3711
+ 40: 2, # 'Ş'
3712
+ 19: 1, # 'ş'
3713
+ },
3714
+ 17: { # 'ü'
3715
+ 23: 0, # 'A'
3716
+ 37: 0, # 'B'
3717
+ 47: 1, # 'C'
3718
+ 39: 0, # 'D'
3719
+ 29: 0, # 'E'
3720
+ 52: 0, # 'F'
3721
+ 36: 0, # 'G'
3722
+ 45: 0, # 'H'
3723
+ 53: 0, # 'I'
3724
+ 60: 1, # 'J'
3725
+ 16: 1, # 'K'
3726
+ 49: 0, # 'L'
3727
+ 20: 1, # 'M'
3728
+ 46: 0, # 'N'
3729
+ 42: 0, # 'O'
3730
+ 48: 0, # 'P'
3731
+ 44: 0, # 'R'
3732
+ 35: 0, # 'S'
3733
+ 31: 1, # 'T'
3734
+ 51: 0, # 'U'
3735
+ 38: 0, # 'V'
3736
+ 62: 0, # 'W'
3737
+ 43: 0, # 'Y'
3738
+ 56: 1, # 'Z'
3739
+ 1: 3, # 'a'
3740
+ 21: 0, # 'b'
3741
+ 28: 0, # 'c'
3742
+ 12: 1, # 'd'
3743
+ 2: 3, # 'e'
3744
+ 18: 1, # 'f'
3745
+ 27: 2, # 'g'
3746
+ 25: 0, # 'h'
3747
+ 3: 1, # 'i'
3748
+ 24: 1, # 'j'
3749
+ 10: 2, # 'k'
3750
+ 5: 3, # 'l'
3751
+ 13: 2, # 'm'
3752
+ 4: 3, # 'n'
3753
+ 15: 0, # 'o'
3754
+ 26: 2, # 'p'
3755
+ 7: 2, # 'r'
3756
+ 8: 3, # 's'
3757
+ 9: 2, # 't'
3758
+ 14: 3, # 'u'
3759
+ 32: 1, # 'v'
3760
+ 57: 1, # 'w'
3761
+ 58: 0, # 'x'
3762
+ 11: 0, # 'y'
3763
+ 22: 0, # 'z'
3764
+ 63: 0, # '·'
3765
+ 54: 0, # 'Ç'
3766
+ 50: 0, # 'Ö'
3767
+ 55: 0, # 'Ü'
3768
+ 59: 0, # 'â'
3769
+ 33: 1, # 'ç'
3770
+ 61: 0, # 'î'
3771
+ 34: 0, # 'ö'
3772
+ 17: 2, # 'ü'
3773
+ 30: 0, # 'ğ'
3774
+ 41: 0, # 'İ'
3775
+ 6: 2, # 'ı'
3776
+ 40: 0, # 'Ş'
3777
+ 19: 0, # 'ş'
3778
+ },
3779
+ 30: { # 'ğ'
3780
+ 23: 0, # 'A'
3781
+ 37: 2, # 'B'
3782
+ 47: 1, # 'C'
3783
+ 39: 0, # 'D'
3784
+ 29: 0, # 'E'
3785
+ 52: 2, # 'F'
3786
+ 36: 1, # 'G'
3787
+ 45: 0, # 'H'
3788
+ 53: 1, # 'I'
3789
+ 60: 0, # 'J'
3790
+ 16: 3, # 'K'
3791
+ 49: 0, # 'L'
3792
+ 20: 1, # 'M'
3793
+ 46: 2, # 'N'
3794
+ 42: 2, # 'O'
3795
+ 48: 1, # 'P'
3796
+ 44: 1, # 'R'
3797
+ 35: 0, # 'S'
3798
+ 31: 1, # 'T'
3799
+ 51: 0, # 'U'
3800
+ 38: 2, # 'V'
3801
+ 62: 0, # 'W'
3802
+ 43: 2, # 'Y'
3803
+ 56: 0, # 'Z'
3804
+ 1: 3, # 'a'
3805
+ 21: 0, # 'b'
3806
+ 28: 2, # 'c'
3807
+ 12: 0, # 'd'
3808
+ 2: 2, # 'e'
3809
+ 18: 0, # 'f'
3810
+ 27: 0, # 'g'
3811
+ 25: 0, # 'h'
3812
+ 3: 0, # 'i'
3813
+ 24: 3, # 'j'
3814
+ 10: 1, # 'k'
3815
+ 5: 2, # 'l'
3816
+ 13: 3, # 'm'
3817
+ 4: 0, # 'n'
3818
+ 15: 1, # 'o'
3819
+ 26: 0, # 'p'
3820
+ 7: 1, # 'r'
3821
+ 8: 0, # 's'
3822
+ 9: 0, # 't'
3823
+ 14: 3, # 'u'
3824
+ 32: 0, # 'v'
3825
+ 57: 0, # 'w'
3826
+ 58: 0, # 'x'
3827
+ 11: 0, # 'y'
3828
+ 22: 2, # 'z'
3829
+ 63: 0, # '·'
3830
+ 54: 2, # 'Ç'
3831
+ 50: 2, # 'Ö'
3832
+ 55: 0, # 'Ü'
3833
+ 59: 0, # 'â'
3834
+ 33: 1, # 'ç'
3835
+ 61: 0, # 'î'
3836
+ 34: 2, # 'ö'
3837
+ 17: 0, # 'ü'
3838
+ 30: 1, # 'ğ'
3839
+ 41: 2, # 'İ'
3840
+ 6: 2, # 'ı'
3841
+ 40: 2, # 'Ş'
3842
+ 19: 1, # 'ş'
3843
+ },
3844
+ 41: { # 'İ'
3845
+ 23: 0, # 'A'
3846
+ 37: 0, # 'B'
3847
+ 47: 1, # 'C'
3848
+ 39: 1, # 'D'
3849
+ 29: 1, # 'E'
3850
+ 52: 0, # 'F'
3851
+ 36: 2, # 'G'
3852
+ 45: 2, # 'H'
3853
+ 53: 0, # 'I'
3854
+ 60: 0, # 'J'
3855
+ 16: 0, # 'K'
3856
+ 49: 0, # 'L'
3857
+ 20: 2, # 'M'
3858
+ 46: 1, # 'N'
3859
+ 42: 1, # 'O'
3860
+ 48: 2, # 'P'
3861
+ 44: 0, # 'R'
3862
+ 35: 1, # 'S'
3863
+ 31: 1, # 'T'
3864
+ 51: 1, # 'U'
3865
+ 38: 1, # 'V'
3866
+ 62: 0, # 'W'
3867
+ 43: 2, # 'Y'
3868
+ 56: 0, # 'Z'
3869
+ 1: 1, # 'a'
3870
+ 21: 2, # 'b'
3871
+ 28: 1, # 'c'
3872
+ 12: 2, # 'd'
3873
+ 2: 1, # 'e'
3874
+ 18: 0, # 'f'
3875
+ 27: 3, # 'g'
3876
+ 25: 2, # 'h'
3877
+ 3: 2, # 'i'
3878
+ 24: 2, # 'j'
3879
+ 10: 2, # 'k'
3880
+ 5: 0, # 'l'
3881
+ 13: 1, # 'm'
3882
+ 4: 3, # 'n'
3883
+ 15: 1, # 'o'
3884
+ 26: 1, # 'p'
3885
+ 7: 3, # 'r'
3886
+ 8: 3, # 's'
3887
+ 9: 2, # 't'
3888
+ 14: 0, # 'u'
3889
+ 32: 0, # 'v'
3890
+ 57: 1, # 'w'
3891
+ 58: 0, # 'x'
3892
+ 11: 2, # 'y'
3893
+ 22: 0, # 'z'
3894
+ 63: 0, # '·'
3895
+ 54: 0, # 'Ç'
3896
+ 50: 0, # 'Ö'
3897
+ 55: 1, # 'Ü'
3898
+ 59: 1, # 'â'
3899
+ 33: 0, # 'ç'
3900
+ 61: 0, # 'î'
3901
+ 34: 1, # 'ö'
3902
+ 17: 1, # 'ü'
3903
+ 30: 2, # 'ğ'
3904
+ 41: 0, # 'İ'
3905
+ 6: 3, # 'ı'
3906
+ 40: 0, # 'Ş'
3907
+ 19: 1, # 'ş'
3908
+ },
3909
+ 6: { # 'ı'
3910
+ 23: 2, # 'A'
3911
+ 37: 0, # 'B'
3912
+ 47: 0, # 'C'
3913
+ 39: 0, # 'D'
3914
+ 29: 0, # 'E'
3915
+ 52: 0, # 'F'
3916
+ 36: 1, # 'G'
3917
+ 45: 0, # 'H'
3918
+ 53: 0, # 'I'
3919
+ 60: 2, # 'J'
3920
+ 16: 3, # 'K'
3921
+ 49: 0, # 'L'
3922
+ 20: 3, # 'M'
3923
+ 46: 1, # 'N'
3924
+ 42: 0, # 'O'
3925
+ 48: 0, # 'P'
3926
+ 44: 0, # 'R'
3927
+ 35: 0, # 'S'
3928
+ 31: 2, # 'T'
3929
+ 51: 0, # 'U'
3930
+ 38: 0, # 'V'
3931
+ 62: 0, # 'W'
3932
+ 43: 2, # 'Y'
3933
+ 56: 1, # 'Z'
3934
+ 1: 3, # 'a'
3935
+ 21: 2, # 'b'
3936
+ 28: 1, # 'c'
3937
+ 12: 3, # 'd'
3938
+ 2: 3, # 'e'
3939
+ 18: 3, # 'f'
3940
+ 27: 3, # 'g'
3941
+ 25: 2, # 'h'
3942
+ 3: 3, # 'i'
3943
+ 24: 3, # 'j'
3944
+ 10: 3, # 'k'
3945
+ 5: 3, # 'l'
3946
+ 13: 3, # 'm'
3947
+ 4: 3, # 'n'
3948
+ 15: 0, # 'o'
3949
+ 26: 3, # 'p'
3950
+ 7: 3, # 'r'
3951
+ 8: 3, # 's'
3952
+ 9: 3, # 't'
3953
+ 14: 3, # 'u'
3954
+ 32: 3, # 'v'
3955
+ 57: 1, # 'w'
3956
+ 58: 1, # 'x'
3957
+ 11: 3, # 'y'
3958
+ 22: 0, # 'z'
3959
+ 63: 1, # '·'
3960
+ 54: 0, # 'Ç'
3961
+ 50: 0, # 'Ö'
3962
+ 55: 0, # 'Ü'
3963
+ 59: 0, # 'â'
3964
+ 33: 2, # 'ç'
3965
+ 61: 0, # 'î'
3966
+ 34: 0, # 'ö'
3967
+ 17: 3, # 'ü'
3968
+ 30: 0, # 'ğ'
3969
+ 41: 0, # 'İ'
3970
+ 6: 3, # 'ı'
3971
+ 40: 0, # 'Ş'
3972
+ 19: 0, # 'ş'
3973
+ },
3974
+ 40: { # 'Ş'
3975
+ 23: 0, # 'A'
3976
+ 37: 0, # 'B'
3977
+ 47: 1, # 'C'
3978
+ 39: 1, # 'D'
3979
+ 29: 1, # 'E'
3980
+ 52: 0, # 'F'
3981
+ 36: 1, # 'G'
3982
+ 45: 2, # 'H'
3983
+ 53: 1, # 'I'
3984
+ 60: 0, # 'J'
3985
+ 16: 0, # 'K'
3986
+ 49: 0, # 'L'
3987
+ 20: 2, # 'M'
3988
+ 46: 1, # 'N'
3989
+ 42: 1, # 'O'
3990
+ 48: 2, # 'P'
3991
+ 44: 2, # 'R'
3992
+ 35: 1, # 'S'
3993
+ 31: 1, # 'T'
3994
+ 51: 0, # 'U'
3995
+ 38: 1, # 'V'
3996
+ 62: 0, # 'W'
3997
+ 43: 2, # 'Y'
3998
+ 56: 1, # 'Z'
3999
+ 1: 0, # 'a'
4000
+ 21: 2, # 'b'
4001
+ 28: 0, # 'c'
4002
+ 12: 2, # 'd'
4003
+ 2: 0, # 'e'
4004
+ 18: 3, # 'f'
4005
+ 27: 0, # 'g'
4006
+ 25: 2, # 'h'
4007
+ 3: 3, # 'i'
4008
+ 24: 2, # 'j'
4009
+ 10: 1, # 'k'
4010
+ 5: 0, # 'l'
4011
+ 13: 1, # 'm'
4012
+ 4: 3, # 'n'
4013
+ 15: 2, # 'o'
4014
+ 26: 0, # 'p'
4015
+ 7: 3, # 'r'
4016
+ 8: 2, # 's'
4017
+ 9: 2, # 't'
4018
+ 14: 1, # 'u'
4019
+ 32: 3, # 'v'
4020
+ 57: 0, # 'w'
4021
+ 58: 0, # 'x'
4022
+ 11: 2, # 'y'
4023
+ 22: 0, # 'z'
4024
+ 63: 0, # '·'
4025
+ 54: 0, # 'Ç'
4026
+ 50: 0, # 'Ö'
4027
+ 55: 1, # 'Ü'
4028
+ 59: 0, # 'â'
4029
+ 33: 0, # 'ç'
4030
+ 61: 0, # 'î'
4031
+ 34: 2, # 'ö'
4032
+ 17: 1, # 'ü'
4033
+ 30: 2, # 'ğ'
4034
+ 41: 0, # 'İ'
4035
+ 6: 2, # 'ı'
4036
+ 40: 1, # 'Ş'
4037
+ 19: 2, # 'ş'
4038
+ },
4039
+ 19: { # 'ş'
4040
+ 23: 0, # 'A'
4041
+ 37: 0, # 'B'
4042
+ 47: 1, # 'C'
4043
+ 39: 0, # 'D'
4044
+ 29: 0, # 'E'
4045
+ 52: 2, # 'F'
4046
+ 36: 1, # 'G'
4047
+ 45: 0, # 'H'
4048
+ 53: 0, # 'I'
4049
+ 60: 0, # 'J'
4050
+ 16: 3, # 'K'
4051
+ 49: 2, # 'L'
4052
+ 20: 0, # 'M'
4053
+ 46: 1, # 'N'
4054
+ 42: 1, # 'O'
4055
+ 48: 1, # 'P'
4056
+ 44: 1, # 'R'
4057
+ 35: 1, # 'S'
4058
+ 31: 0, # 'T'
4059
+ 51: 1, # 'U'
4060
+ 38: 1, # 'V'
4061
+ 62: 0, # 'W'
4062
+ 43: 1, # 'Y'
4063
+ 56: 0, # 'Z'
4064
+ 1: 3, # 'a'
4065
+ 21: 1, # 'b'
4066
+ 28: 2, # 'c'
4067
+ 12: 0, # 'd'
4068
+ 2: 3, # 'e'
4069
+ 18: 0, # 'f'
4070
+ 27: 2, # 'g'
4071
+ 25: 1, # 'h'
4072
+ 3: 1, # 'i'
4073
+ 24: 0, # 'j'
4074
+ 10: 2, # 'k'
4075
+ 5: 2, # 'l'
4076
+ 13: 3, # 'm'
4077
+ 4: 0, # 'n'
4078
+ 15: 0, # 'o'
4079
+ 26: 1, # 'p'
4080
+ 7: 3, # 'r'
4081
+ 8: 0, # 's'
4082
+ 9: 0, # 't'
4083
+ 14: 3, # 'u'
4084
+ 32: 0, # 'v'
4085
+ 57: 0, # 'w'
4086
+ 58: 0, # 'x'
4087
+ 11: 0, # 'y'
4088
+ 22: 2, # 'z'
4089
+ 63: 0, # '·'
4090
+ 54: 1, # 'Ç'
4091
+ 50: 2, # 'Ö'
4092
+ 55: 0, # 'Ü'
4093
+ 59: 0, # 'â'
4094
+ 33: 1, # 'ç'
4095
+ 61: 1, # 'î'
4096
+ 34: 2, # 'ö'
4097
+ 17: 0, # 'ü'
4098
+ 30: 1, # 'ğ'
4099
+ 41: 1, # 'İ'
4100
+ 6: 1, # 'ı'
4101
+ 40: 1, # 'Ş'
4102
+ 19: 1, # 'ş'
4103
+ },
4104
+ }
4105
+
4106
+ # 255: Undefined characters that did not exist in training text
4107
+ # 254: Carriage/Return
4108
+ # 253: symbol (punctuation) that does not belong to word
4109
+ # 252: 0 - 9
4110
+ # 251: Control characters
4111
+
4112
+ # Character Mapping Table(s):
4113
+ ISO_8859_9_TURKISH_CHAR_TO_ORDER = {
4114
+ 0: 255, # '\x00'
4115
+ 1: 255, # '\x01'
4116
+ 2: 255, # '\x02'
4117
+ 3: 255, # '\x03'
4118
+ 4: 255, # '\x04'
4119
+ 5: 255, # '\x05'
4120
+ 6: 255, # '\x06'
4121
+ 7: 255, # '\x07'
4122
+ 8: 255, # '\x08'
4123
+ 9: 255, # '\t'
4124
+ 10: 255, # '\n'
4125
+ 11: 255, # '\x0b'
4126
+ 12: 255, # '\x0c'
4127
+ 13: 255, # '\r'
4128
+ 14: 255, # '\x0e'
4129
+ 15: 255, # '\x0f'
4130
+ 16: 255, # '\x10'
4131
+ 17: 255, # '\x11'
4132
+ 18: 255, # '\x12'
4133
+ 19: 255, # '\x13'
4134
+ 20: 255, # '\x14'
4135
+ 21: 255, # '\x15'
4136
+ 22: 255, # '\x16'
4137
+ 23: 255, # '\x17'
4138
+ 24: 255, # '\x18'
4139
+ 25: 255, # '\x19'
4140
+ 26: 255, # '\x1a'
4141
+ 27: 255, # '\x1b'
4142
+ 28: 255, # '\x1c'
4143
+ 29: 255, # '\x1d'
4144
+ 30: 255, # '\x1e'
4145
+ 31: 255, # '\x1f'
4146
+ 32: 255, # ' '
4147
+ 33: 255, # '!'
4148
+ 34: 255, # '"'
4149
+ 35: 255, # '#'
4150
+ 36: 255, # '$'
4151
+ 37: 255, # '%'
4152
+ 38: 255, # '&'
4153
+ 39: 255, # "'"
4154
+ 40: 255, # '('
4155
+ 41: 255, # ')'
4156
+ 42: 255, # '*'
4157
+ 43: 255, # '+'
4158
+ 44: 255, # ','
4159
+ 45: 255, # '-'
4160
+ 46: 255, # '.'
4161
+ 47: 255, # '/'
4162
+ 48: 255, # '0'
4163
+ 49: 255, # '1'
4164
+ 50: 255, # '2'
4165
+ 51: 255, # '3'
4166
+ 52: 255, # '4'
4167
+ 53: 255, # '5'
4168
+ 54: 255, # '6'
4169
+ 55: 255, # '7'
4170
+ 56: 255, # '8'
4171
+ 57: 255, # '9'
4172
+ 58: 255, # ':'
4173
+ 59: 255, # ';'
4174
+ 60: 255, # '<'
4175
+ 61: 255, # '='
4176
+ 62: 255, # '>'
4177
+ 63: 255, # '?'
4178
+ 64: 255, # '@'
4179
+ 65: 23, # 'A'
4180
+ 66: 37, # 'B'
4181
+ 67: 47, # 'C'
4182
+ 68: 39, # 'D'
4183
+ 69: 29, # 'E'
4184
+ 70: 52, # 'F'
4185
+ 71: 36, # 'G'
4186
+ 72: 45, # 'H'
4187
+ 73: 53, # 'I'
4188
+ 74: 60, # 'J'
4189
+ 75: 16, # 'K'
4190
+ 76: 49, # 'L'
4191
+ 77: 20, # 'M'
4192
+ 78: 46, # 'N'
4193
+ 79: 42, # 'O'
4194
+ 80: 48, # 'P'
4195
+ 81: 69, # 'Q'
4196
+ 82: 44, # 'R'
4197
+ 83: 35, # 'S'
4198
+ 84: 31, # 'T'
4199
+ 85: 51, # 'U'
4200
+ 86: 38, # 'V'
4201
+ 87: 62, # 'W'
4202
+ 88: 65, # 'X'
4203
+ 89: 43, # 'Y'
4204
+ 90: 56, # 'Z'
4205
+ 91: 255, # '['
4206
+ 92: 255, # '\\'
4207
+ 93: 255, # ']'
4208
+ 94: 255, # '^'
4209
+ 95: 255, # '_'
4210
+ 96: 255, # '`'
4211
+ 97: 1, # 'a'
4212
+ 98: 21, # 'b'
4213
+ 99: 28, # 'c'
4214
+ 100: 12, # 'd'
4215
+ 101: 2, # 'e'
4216
+ 102: 18, # 'f'
4217
+ 103: 27, # 'g'
4218
+ 104: 25, # 'h'
4219
+ 105: 3, # 'i'
4220
+ 106: 24, # 'j'
4221
+ 107: 10, # 'k'
4222
+ 108: 5, # 'l'
4223
+ 109: 13, # 'm'
4224
+ 110: 4, # 'n'
4225
+ 111: 15, # 'o'
4226
+ 112: 26, # 'p'
4227
+ 113: 64, # 'q'
4228
+ 114: 7, # 'r'
4229
+ 115: 8, # 's'
4230
+ 116: 9, # 't'
4231
+ 117: 14, # 'u'
4232
+ 118: 32, # 'v'
4233
+ 119: 57, # 'w'
4234
+ 120: 58, # 'x'
4235
+ 121: 11, # 'y'
4236
+ 122: 22, # 'z'
4237
+ 123: 255, # '{'
4238
+ 124: 255, # '|'
4239
+ 125: 255, # '}'
4240
+ 126: 255, # '~'
4241
+ 127: 255, # '\x7f'
4242
+ 128: 180, # '\x80'
4243
+ 129: 179, # '\x81'
4244
+ 130: 178, # '\x82'
4245
+ 131: 177, # '\x83'
4246
+ 132: 176, # '\x84'
4247
+ 133: 175, # '\x85'
4248
+ 134: 174, # '\x86'
4249
+ 135: 173, # '\x87'
4250
+ 136: 172, # '\x88'
4251
+ 137: 171, # '\x89'
4252
+ 138: 170, # '\x8a'
4253
+ 139: 169, # '\x8b'
4254
+ 140: 168, # '\x8c'
4255
+ 141: 167, # '\x8d'
4256
+ 142: 166, # '\x8e'
4257
+ 143: 165, # '\x8f'
4258
+ 144: 164, # '\x90'
4259
+ 145: 163, # '\x91'
4260
+ 146: 162, # '\x92'
4261
+ 147: 161, # '\x93'
4262
+ 148: 160, # '\x94'
4263
+ 149: 159, # '\x95'
4264
+ 150: 101, # '\x96'
4265
+ 151: 158, # '\x97'
4266
+ 152: 157, # '\x98'
4267
+ 153: 156, # '\x99'
4268
+ 154: 155, # '\x9a'
4269
+ 155: 154, # '\x9b'
4270
+ 156: 153, # '\x9c'
4271
+ 157: 152, # '\x9d'
4272
+ 158: 151, # '\x9e'
4273
+ 159: 106, # '\x9f'
4274
+ 160: 150, # '\xa0'
4275
+ 161: 149, # '¡'
4276
+ 162: 148, # '¢'
4277
+ 163: 147, # '£'
4278
+ 164: 146, # '¤'
4279
+ 165: 145, # '¥'
4280
+ 166: 144, # '¦'
4281
+ 167: 100, # '§'
4282
+ 168: 143, # '¨'
4283
+ 169: 142, # '©'
4284
+ 170: 141, # 'ª'
4285
+ 171: 140, # '«'
4286
+ 172: 139, # '¬'
4287
+ 173: 138, # '\xad'
4288
+ 174: 137, # '®'
4289
+ 175: 136, # '¯'
4290
+ 176: 94, # '°'
4291
+ 177: 80, # '±'
4292
+ 178: 93, # '²'
4293
+ 179: 135, # '³'
4294
+ 180: 105, # '´'
4295
+ 181: 134, # 'µ'
4296
+ 182: 133, # '¶'
4297
+ 183: 63, # '·'
4298
+ 184: 132, # '¸'
4299
+ 185: 131, # '¹'
4300
+ 186: 130, # 'º'
4301
+ 187: 129, # '»'
4302
+ 188: 128, # '¼'
4303
+ 189: 127, # '½'
4304
+ 190: 126, # '¾'
4305
+ 191: 125, # '¿'
4306
+ 192: 124, # 'À'
4307
+ 193: 104, # 'Á'
4308
+ 194: 73, # 'Â'
4309
+ 195: 99, # 'Ã'
4310
+ 196: 79, # 'Ä'
4311
+ 197: 85, # 'Å'
4312
+ 198: 123, # 'Æ'
4313
+ 199: 54, # 'Ç'
4314
+ 200: 122, # 'È'
4315
+ 201: 98, # 'É'
4316
+ 202: 92, # 'Ê'
4317
+ 203: 121, # 'Ë'
4318
+ 204: 120, # 'Ì'
4319
+ 205: 91, # 'Í'
4320
+ 206: 103, # 'Î'
4321
+ 207: 119, # 'Ï'
4322
+ 208: 68, # 'Ğ'
4323
+ 209: 118, # 'Ñ'
4324
+ 210: 117, # 'Ò'
4325
+ 211: 97, # 'Ó'
4326
+ 212: 116, # 'Ô'
4327
+ 213: 115, # 'Õ'
4328
+ 214: 50, # 'Ö'
4329
+ 215: 90, # '×'
4330
+ 216: 114, # 'Ø'
4331
+ 217: 113, # 'Ù'
4332
+ 218: 112, # 'Ú'
4333
+ 219: 111, # 'Û'
4334
+ 220: 55, # 'Ü'
4335
+ 221: 41, # 'İ'
4336
+ 222: 40, # 'Ş'
4337
+ 223: 86, # 'ß'
4338
+ 224: 89, # 'à'
4339
+ 225: 70, # 'á'
4340
+ 226: 59, # 'â'
4341
+ 227: 78, # 'ã'
4342
+ 228: 71, # 'ä'
4343
+ 229: 82, # 'å'
4344
+ 230: 88, # 'æ'
4345
+ 231: 33, # 'ç'
4346
+ 232: 77, # 'è'
4347
+ 233: 66, # 'é'
4348
+ 234: 84, # 'ê'
4349
+ 235: 83, # 'ë'
4350
+ 236: 110, # 'ì'
4351
+ 237: 75, # 'í'
4352
+ 238: 61, # 'î'
4353
+ 239: 96, # 'ï'
4354
+ 240: 30, # 'ğ'
4355
+ 241: 67, # 'ñ'
4356
+ 242: 109, # 'ò'
4357
+ 243: 74, # 'ó'
4358
+ 244: 87, # 'ô'
4359
+ 245: 102, # 'õ'
4360
+ 246: 34, # 'ö'
4361
+ 247: 95, # '÷'
4362
+ 248: 81, # 'ø'
4363
+ 249: 108, # 'ù'
4364
+ 250: 76, # 'ú'
4365
+ 251: 72, # 'û'
4366
+ 252: 17, # 'ü'
4367
+ 253: 6, # 'ı'
4368
+ 254: 19, # 'ş'
4369
+ 255: 107, # 'ÿ'
4370
+ }
4371
+
4372
+ ISO_8859_9_TURKISH_MODEL = SingleByteCharSetModel(
4373
+ charset_name="ISO-8859-9",
4374
+ language="Turkish",
4375
+ char_to_order_map=ISO_8859_9_TURKISH_CHAR_TO_ORDER,
4376
+ language_model=TURKISH_LANG_MODEL,
4377
+ typical_positive_ratio=0.97029,
4378
+ keep_ascii_letters=True,
4379
+ alphabet="ABCDEFGHIJKLMNOPRSTUVYZabcdefghijklmnoprstuvyzÂÇÎÖÛÜâçîöûüĞğİıŞş",
4380
+ )
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/latin1prober.py ADDED
@@ -0,0 +1,147 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Universal charset detector code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 2001
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ # Shy Shalom - original C code
12
+ #
13
+ # This library is free software; you can redistribute it and/or
14
+ # modify it under the terms of the GNU Lesser General Public
15
+ # License as published by the Free Software Foundation; either
16
+ # version 2.1 of the License, or (at your option) any later version.
17
+ #
18
+ # This library is distributed in the hope that it will be useful,
19
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
20
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21
+ # Lesser General Public License for more details.
22
+ #
23
+ # You should have received a copy of the GNU Lesser General Public
24
+ # License along with this library; if not, write to the Free Software
25
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
26
+ # 02110-1301 USA
27
+ ######################### END LICENSE BLOCK #########################
28
+
29
+ from typing import List, Union
30
+
31
+ from .charsetprober import CharSetProber
32
+ from .enums import ProbingState
33
+
34
+ FREQ_CAT_NUM = 4
35
+
36
+ UDF = 0 # undefined
37
+ OTH = 1 # other
38
+ ASC = 2 # ascii capital letter
39
+ ASS = 3 # ascii small letter
40
+ ACV = 4 # accent capital vowel
41
+ ACO = 5 # accent capital other
42
+ ASV = 6 # accent small vowel
43
+ ASO = 7 # accent small other
44
+ CLASS_NUM = 8 # total classes
45
+
46
+ # fmt: off
47
+ Latin1_CharToClass = (
48
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 00 - 07
49
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 08 - 0F
50
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 10 - 17
51
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 18 - 1F
52
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 20 - 27
53
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 28 - 2F
54
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 30 - 37
55
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 38 - 3F
56
+ OTH, ASC, ASC, ASC, ASC, ASC, ASC, ASC, # 40 - 47
57
+ ASC, ASC, ASC, ASC, ASC, ASC, ASC, ASC, # 48 - 4F
58
+ ASC, ASC, ASC, ASC, ASC, ASC, ASC, ASC, # 50 - 57
59
+ ASC, ASC, ASC, OTH, OTH, OTH, OTH, OTH, # 58 - 5F
60
+ OTH, ASS, ASS, ASS, ASS, ASS, ASS, ASS, # 60 - 67
61
+ ASS, ASS, ASS, ASS, ASS, ASS, ASS, ASS, # 68 - 6F
62
+ ASS, ASS, ASS, ASS, ASS, ASS, ASS, ASS, # 70 - 77
63
+ ASS, ASS, ASS, OTH, OTH, OTH, OTH, OTH, # 78 - 7F
64
+ OTH, UDF, OTH, ASO, OTH, OTH, OTH, OTH, # 80 - 87
65
+ OTH, OTH, ACO, OTH, ACO, UDF, ACO, UDF, # 88 - 8F
66
+ UDF, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 90 - 97
67
+ OTH, OTH, ASO, OTH, ASO, UDF, ASO, ACO, # 98 - 9F
68
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # A0 - A7
69
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # A8 - AF
70
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # B0 - B7
71
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # B8 - BF
72
+ ACV, ACV, ACV, ACV, ACV, ACV, ACO, ACO, # C0 - C7
73
+ ACV, ACV, ACV, ACV, ACV, ACV, ACV, ACV, # C8 - CF
74
+ ACO, ACO, ACV, ACV, ACV, ACV, ACV, OTH, # D0 - D7
75
+ ACV, ACV, ACV, ACV, ACV, ACO, ACO, ACO, # D8 - DF
76
+ ASV, ASV, ASV, ASV, ASV, ASV, ASO, ASO, # E0 - E7
77
+ ASV, ASV, ASV, ASV, ASV, ASV, ASV, ASV, # E8 - EF
78
+ ASO, ASO, ASV, ASV, ASV, ASV, ASV, OTH, # F0 - F7
79
+ ASV, ASV, ASV, ASV, ASV, ASO, ASO, ASO, # F8 - FF
80
+ )
81
+
82
+ # 0 : illegal
83
+ # 1 : very unlikely
84
+ # 2 : normal
85
+ # 3 : very likely
86
+ Latin1ClassModel = (
87
+ # UDF OTH ASC ASS ACV ACO ASV ASO
88
+ 0, 0, 0, 0, 0, 0, 0, 0, # UDF
89
+ 0, 3, 3, 3, 3, 3, 3, 3, # OTH
90
+ 0, 3, 3, 3, 3, 3, 3, 3, # ASC
91
+ 0, 3, 3, 3, 1, 1, 3, 3, # ASS
92
+ 0, 3, 3, 3, 1, 2, 1, 2, # ACV
93
+ 0, 3, 3, 3, 3, 3, 3, 3, # ACO
94
+ 0, 3, 1, 3, 1, 1, 1, 3, # ASV
95
+ 0, 3, 1, 3, 1, 1, 3, 3, # ASO
96
+ )
97
+ # fmt: on
98
+
99
+
100
+ class Latin1Prober(CharSetProber):
101
+ def __init__(self) -> None:
102
+ super().__init__()
103
+ self._last_char_class = OTH
104
+ self._freq_counter: List[int] = []
105
+ self.reset()
106
+
107
+ def reset(self) -> None:
108
+ self._last_char_class = OTH
109
+ self._freq_counter = [0] * FREQ_CAT_NUM
110
+ super().reset()
111
+
112
+ @property
113
+ def charset_name(self) -> str:
114
+ return "ISO-8859-1"
115
+
116
+ @property
117
+ def language(self) -> str:
118
+ return ""
119
+
120
+ def feed(self, byte_str: Union[bytes, bytearray]) -> ProbingState:
121
+ byte_str = self.remove_xml_tags(byte_str)
122
+ for c in byte_str:
123
+ char_class = Latin1_CharToClass[c]
124
+ freq = Latin1ClassModel[(self._last_char_class * CLASS_NUM) + char_class]
125
+ if freq == 0:
126
+ self._state = ProbingState.NOT_ME
127
+ break
128
+ self._freq_counter[freq] += 1
129
+ self._last_char_class = char_class
130
+
131
+ return self.state
132
+
133
+ def get_confidence(self) -> float:
134
+ if self.state == ProbingState.NOT_ME:
135
+ return 0.01
136
+
137
+ total = sum(self._freq_counter)
138
+ confidence = (
139
+ 0.0
140
+ if total < 0.01
141
+ else (self._freq_counter[3] - self._freq_counter[1] * 20.0) / total
142
+ )
143
+ confidence = max(confidence, 0.0)
144
+ # lower the confidence of latin1 so that other more accurate
145
+ # detector can take priority.
146
+ confidence *= 0.73
147
+ return confidence
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/macromanprober.py ADDED
@@ -0,0 +1,162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # This code was modified from latin1prober.py by Rob Speer <rob@lumino.so>.
3
+ # The Original Code is Mozilla Universal charset detector code.
4
+ #
5
+ # The Initial Developer of the Original Code is
6
+ # Netscape Communications Corporation.
7
+ # Portions created by the Initial Developer are Copyright (C) 2001
8
+ # the Initial Developer. All Rights Reserved.
9
+ #
10
+ # Contributor(s):
11
+ # Rob Speer - adapt to MacRoman encoding
12
+ # Mark Pilgrim - port to Python
13
+ # Shy Shalom - original C code
14
+ #
15
+ # This library is free software; you can redistribute it and/or
16
+ # modify it under the terms of the GNU Lesser General Public
17
+ # License as published by the Free Software Foundation; either
18
+ # version 2.1 of the License, or (at your option) any later version.
19
+ #
20
+ # This library is distributed in the hope that it will be useful,
21
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
22
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
23
+ # Lesser General Public License for more details.
24
+ #
25
+ # You should have received a copy of the GNU Lesser General Public
26
+ # License along with this library; if not, write to the Free Software
27
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
28
+ # 02110-1301 USA
29
+ ######################### END LICENSE BLOCK #########################
30
+
31
+ from typing import List, Union
32
+
33
+ from .charsetprober import CharSetProber
34
+ from .enums import ProbingState
35
+
36
+ FREQ_CAT_NUM = 4
37
+
38
+ UDF = 0 # undefined
39
+ OTH = 1 # other
40
+ ASC = 2 # ascii capital letter
41
+ ASS = 3 # ascii small letter
42
+ ACV = 4 # accent capital vowel
43
+ ACO = 5 # accent capital other
44
+ ASV = 6 # accent small vowel
45
+ ASO = 7 # accent small other
46
+ ODD = 8 # character that is unlikely to appear
47
+ CLASS_NUM = 9 # total classes
48
+
49
+ # The change from Latin1 is that we explicitly look for extended characters
50
+ # that are infrequently-occurring symbols, and consider them to always be
51
+ # improbable. This should let MacRoman get out of the way of more likely
52
+ # encodings in most situations.
53
+
54
+ # fmt: off
55
+ MacRoman_CharToClass = (
56
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 00 - 07
57
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 08 - 0F
58
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 10 - 17
59
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 18 - 1F
60
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 20 - 27
61
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 28 - 2F
62
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 30 - 37
63
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # 38 - 3F
64
+ OTH, ASC, ASC, ASC, ASC, ASC, ASC, ASC, # 40 - 47
65
+ ASC, ASC, ASC, ASC, ASC, ASC, ASC, ASC, # 48 - 4F
66
+ ASC, ASC, ASC, ASC, ASC, ASC, ASC, ASC, # 50 - 57
67
+ ASC, ASC, ASC, OTH, OTH, OTH, OTH, OTH, # 58 - 5F
68
+ OTH, ASS, ASS, ASS, ASS, ASS, ASS, ASS, # 60 - 67
69
+ ASS, ASS, ASS, ASS, ASS, ASS, ASS, ASS, # 68 - 6F
70
+ ASS, ASS, ASS, ASS, ASS, ASS, ASS, ASS, # 70 - 77
71
+ ASS, ASS, ASS, OTH, OTH, OTH, OTH, OTH, # 78 - 7F
72
+ ACV, ACV, ACO, ACV, ACO, ACV, ACV, ASV, # 80 - 87
73
+ ASV, ASV, ASV, ASV, ASV, ASO, ASV, ASV, # 88 - 8F
74
+ ASV, ASV, ASV, ASV, ASV, ASV, ASO, ASV, # 90 - 97
75
+ ASV, ASV, ASV, ASV, ASV, ASV, ASV, ASV, # 98 - 9F
76
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, ASO, # A0 - A7
77
+ OTH, OTH, ODD, ODD, OTH, OTH, ACV, ACV, # A8 - AF
78
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, OTH, # B0 - B7
79
+ OTH, OTH, OTH, OTH, OTH, OTH, ASV, ASV, # B8 - BF
80
+ OTH, OTH, ODD, OTH, ODD, OTH, OTH, OTH, # C0 - C7
81
+ OTH, OTH, OTH, ACV, ACV, ACV, ACV, ASV, # C8 - CF
82
+ OTH, OTH, OTH, OTH, OTH, OTH, OTH, ODD, # D0 - D7
83
+ ASV, ACV, ODD, OTH, OTH, OTH, OTH, OTH, # D8 - DF
84
+ OTH, OTH, OTH, OTH, OTH, ACV, ACV, ACV, # E0 - E7
85
+ ACV, ACV, ACV, ACV, ACV, ACV, ACV, ACV, # E8 - EF
86
+ ODD, ACV, ACV, ACV, ACV, ASV, ODD, ODD, # F0 - F7
87
+ ODD, ODD, ODD, ODD, ODD, ODD, ODD, ODD, # F8 - FF
88
+ )
89
+
90
+ # 0 : illegal
91
+ # 1 : very unlikely
92
+ # 2 : normal
93
+ # 3 : very likely
94
+ MacRomanClassModel = (
95
+ # UDF OTH ASC ASS ACV ACO ASV ASO ODD
96
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, # UDF
97
+ 0, 3, 3, 3, 3, 3, 3, 3, 1, # OTH
98
+ 0, 3, 3, 3, 3, 3, 3, 3, 1, # ASC
99
+ 0, 3, 3, 3, 1, 1, 3, 3, 1, # ASS
100
+ 0, 3, 3, 3, 1, 2, 1, 2, 1, # ACV
101
+ 0, 3, 3, 3, 3, 3, 3, 3, 1, # ACO
102
+ 0, 3, 1, 3, 1, 1, 1, 3, 1, # ASV
103
+ 0, 3, 1, 3, 1, 1, 3, 3, 1, # ASO
104
+ 0, 1, 1, 1, 1, 1, 1, 1, 1, # ODD
105
+ )
106
+ # fmt: on
107
+
108
+
109
+ class MacRomanProber(CharSetProber):
110
+ def __init__(self) -> None:
111
+ super().__init__()
112
+ self._last_char_class = OTH
113
+ self._freq_counter: List[int] = []
114
+ self.reset()
115
+
116
+ def reset(self) -> None:
117
+ self._last_char_class = OTH
118
+ self._freq_counter = [0] * FREQ_CAT_NUM
119
+
120
+ # express the prior that MacRoman is a somewhat rare encoding;
121
+ # this can be done by starting out in a slightly improbable state
122
+ # that must be overcome
123
+ self._freq_counter[2] = 10
124
+
125
+ super().reset()
126
+
127
+ @property
128
+ def charset_name(self) -> str:
129
+ return "MacRoman"
130
+
131
+ @property
132
+ def language(self) -> str:
133
+ return ""
134
+
135
+ def feed(self, byte_str: Union[bytes, bytearray]) -> ProbingState:
136
+ byte_str = self.remove_xml_tags(byte_str)
137
+ for c in byte_str:
138
+ char_class = MacRoman_CharToClass[c]
139
+ freq = MacRomanClassModel[(self._last_char_class * CLASS_NUM) + char_class]
140
+ if freq == 0:
141
+ self._state = ProbingState.NOT_ME
142
+ break
143
+ self._freq_counter[freq] += 1
144
+ self._last_char_class = char_class
145
+
146
+ return self.state
147
+
148
+ def get_confidence(self) -> float:
149
+ if self.state == ProbingState.NOT_ME:
150
+ return 0.01
151
+
152
+ total = sum(self._freq_counter)
153
+ confidence = (
154
+ 0.0
155
+ if total < 0.01
156
+ else (self._freq_counter[3] - self._freq_counter[1] * 20.0) / total
157
+ )
158
+ confidence = max(confidence, 0.0)
159
+ # lower the confidence of MacRoman so that other more accurate
160
+ # detector can take priority.
161
+ confidence *= 0.73
162
+ return confidence
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/mbcharsetprober.py ADDED
@@ -0,0 +1,95 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Universal charset detector code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 2001
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ # Shy Shalom - original C code
12
+ # Proofpoint, Inc.
13
+ #
14
+ # This library is free software; you can redistribute it and/or
15
+ # modify it under the terms of the GNU Lesser General Public
16
+ # License as published by the Free Software Foundation; either
17
+ # version 2.1 of the License, or (at your option) any later version.
18
+ #
19
+ # This library is distributed in the hope that it will be useful,
20
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
21
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
22
+ # Lesser General Public License for more details.
23
+ #
24
+ # You should have received a copy of the GNU Lesser General Public
25
+ # License along with this library; if not, write to the Free Software
26
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
27
+ # 02110-1301 USA
28
+ ######################### END LICENSE BLOCK #########################
29
+
30
+ from typing import Optional, Union
31
+
32
+ from .chardistribution import CharDistributionAnalysis
33
+ from .charsetprober import CharSetProber
34
+ from .codingstatemachine import CodingStateMachine
35
+ from .enums import LanguageFilter, MachineState, ProbingState
36
+
37
+
38
+ class MultiByteCharSetProber(CharSetProber):
39
+ """
40
+ MultiByteCharSetProber
41
+ """
42
+
43
+ def __init__(self, lang_filter: LanguageFilter = LanguageFilter.NONE) -> None:
44
+ super().__init__(lang_filter=lang_filter)
45
+ self.distribution_analyzer: Optional[CharDistributionAnalysis] = None
46
+ self.coding_sm: Optional[CodingStateMachine] = None
47
+ self._last_char = bytearray(b"\0\0")
48
+
49
+ def reset(self) -> None:
50
+ super().reset()
51
+ if self.coding_sm:
52
+ self.coding_sm.reset()
53
+ if self.distribution_analyzer:
54
+ self.distribution_analyzer.reset()
55
+ self._last_char = bytearray(b"\0\0")
56
+
57
+ def feed(self, byte_str: Union[bytes, bytearray]) -> ProbingState:
58
+ assert self.coding_sm is not None
59
+ assert self.distribution_analyzer is not None
60
+
61
+ for i, byte in enumerate(byte_str):
62
+ coding_state = self.coding_sm.next_state(byte)
63
+ if coding_state == MachineState.ERROR:
64
+ self.logger.debug(
65
+ "%s %s prober hit error at byte %s",
66
+ self.charset_name,
67
+ self.language,
68
+ i,
69
+ )
70
+ self._state = ProbingState.NOT_ME
71
+ break
72
+ if coding_state == MachineState.ITS_ME:
73
+ self._state = ProbingState.FOUND_IT
74
+ break
75
+ if coding_state == MachineState.START:
76
+ char_len = self.coding_sm.get_current_charlen()
77
+ if i == 0:
78
+ self._last_char[1] = byte
79
+ self.distribution_analyzer.feed(self._last_char, char_len)
80
+ else:
81
+ self.distribution_analyzer.feed(byte_str[i - 1 : i + 1], char_len)
82
+
83
+ self._last_char[0] = byte_str[-1]
84
+
85
+ if self.state == ProbingState.DETECTING:
86
+ if self.distribution_analyzer.got_enough_data() and (
87
+ self.get_confidence() > self.SHORTCUT_THRESHOLD
88
+ ):
89
+ self._state = ProbingState.FOUND_IT
90
+
91
+ return self.state
92
+
93
+ def get_confidence(self) -> float:
94
+ assert self.distribution_analyzer is not None
95
+ return self.distribution_analyzer.get_confidence()
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/mbcsgroupprober.py ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Universal charset detector code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 2001
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ # Shy Shalom - original C code
12
+ # Proofpoint, Inc.
13
+ #
14
+ # This library is free software; you can redistribute it and/or
15
+ # modify it under the terms of the GNU Lesser General Public
16
+ # License as published by the Free Software Foundation; either
17
+ # version 2.1 of the License, or (at your option) any later version.
18
+ #
19
+ # This library is distributed in the hope that it will be useful,
20
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
21
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
22
+ # Lesser General Public License for more details.
23
+ #
24
+ # You should have received a copy of the GNU Lesser General Public
25
+ # License along with this library; if not, write to the Free Software
26
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
27
+ # 02110-1301 USA
28
+ ######################### END LICENSE BLOCK #########################
29
+
30
+ from .big5prober import Big5Prober
31
+ from .charsetgroupprober import CharSetGroupProber
32
+ from .cp949prober import CP949Prober
33
+ from .enums import LanguageFilter
34
+ from .eucjpprober import EUCJPProber
35
+ from .euckrprober import EUCKRProber
36
+ from .euctwprober import EUCTWProber
37
+ from .gb2312prober import GB2312Prober
38
+ from .johabprober import JOHABProber
39
+ from .sjisprober import SJISProber
40
+ from .utf8prober import UTF8Prober
41
+
42
+
43
+ class MBCSGroupProber(CharSetGroupProber):
44
+ def __init__(self, lang_filter: LanguageFilter = LanguageFilter.NONE) -> None:
45
+ super().__init__(lang_filter=lang_filter)
46
+ self.probers = [
47
+ UTF8Prober(),
48
+ SJISProber(),
49
+ EUCJPProber(),
50
+ GB2312Prober(),
51
+ EUCKRProber(),
52
+ CP949Prober(),
53
+ Big5Prober(),
54
+ EUCTWProber(),
55
+ JOHABProber(),
56
+ ]
57
+ self.reset()
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/mbcssm.py ADDED
@@ -0,0 +1,661 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is mozilla.org code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 1998
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ #
12
+ # This library is free software; you can redistribute it and/or
13
+ # modify it under the terms of the GNU Lesser General Public
14
+ # License as published by the Free Software Foundation; either
15
+ # version 2.1 of the License, or (at your option) any later version.
16
+ #
17
+ # This library is distributed in the hope that it will be useful,
18
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20
+ # Lesser General Public License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Lesser General Public
23
+ # License along with this library; if not, write to the Free Software
24
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
25
+ # 02110-1301 USA
26
+ ######################### END LICENSE BLOCK #########################
27
+
28
+ from .codingstatemachinedict import CodingStateMachineDict
29
+ from .enums import MachineState
30
+
31
+ # BIG5
32
+
33
+ # fmt: off
34
+ BIG5_CLS = (
35
+ 1, 1, 1, 1, 1, 1, 1, 1, # 00 - 07 #allow 0x00 as legal value
36
+ 1, 1, 1, 1, 1, 1, 0, 0, # 08 - 0f
37
+ 1, 1, 1, 1, 1, 1, 1, 1, # 10 - 17
38
+ 1, 1, 1, 0, 1, 1, 1, 1, # 18 - 1f
39
+ 1, 1, 1, 1, 1, 1, 1, 1, # 20 - 27
40
+ 1, 1, 1, 1, 1, 1, 1, 1, # 28 - 2f
41
+ 1, 1, 1, 1, 1, 1, 1, 1, # 30 - 37
42
+ 1, 1, 1, 1, 1, 1, 1, 1, # 38 - 3f
43
+ 2, 2, 2, 2, 2, 2, 2, 2, # 40 - 47
44
+ 2, 2, 2, 2, 2, 2, 2, 2, # 48 - 4f
45
+ 2, 2, 2, 2, 2, 2, 2, 2, # 50 - 57
46
+ 2, 2, 2, 2, 2, 2, 2, 2, # 58 - 5f
47
+ 2, 2, 2, 2, 2, 2, 2, 2, # 60 - 67
48
+ 2, 2, 2, 2, 2, 2, 2, 2, # 68 - 6f
49
+ 2, 2, 2, 2, 2, 2, 2, 2, # 70 - 77
50
+ 2, 2, 2, 2, 2, 2, 2, 1, # 78 - 7f
51
+ 4, 4, 4, 4, 4, 4, 4, 4, # 80 - 87
52
+ 4, 4, 4, 4, 4, 4, 4, 4, # 88 - 8f
53
+ 4, 4, 4, 4, 4, 4, 4, 4, # 90 - 97
54
+ 4, 4, 4, 4, 4, 4, 4, 4, # 98 - 9f
55
+ 4, 3, 3, 3, 3, 3, 3, 3, # a0 - a7
56
+ 3, 3, 3, 3, 3, 3, 3, 3, # a8 - af
57
+ 3, 3, 3, 3, 3, 3, 3, 3, # b0 - b7
58
+ 3, 3, 3, 3, 3, 3, 3, 3, # b8 - bf
59
+ 3, 3, 3, 3, 3, 3, 3, 3, # c0 - c7
60
+ 3, 3, 3, 3, 3, 3, 3, 3, # c8 - cf
61
+ 3, 3, 3, 3, 3, 3, 3, 3, # d0 - d7
62
+ 3, 3, 3, 3, 3, 3, 3, 3, # d8 - df
63
+ 3, 3, 3, 3, 3, 3, 3, 3, # e0 - e7
64
+ 3, 3, 3, 3, 3, 3, 3, 3, # e8 - ef
65
+ 3, 3, 3, 3, 3, 3, 3, 3, # f0 - f7
66
+ 3, 3, 3, 3, 3, 3, 3, 0 # f8 - ff
67
+ )
68
+
69
+ BIG5_ST = (
70
+ MachineState.ERROR,MachineState.START,MachineState.START, 3,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#00-07
71
+ MachineState.ERROR,MachineState.ERROR,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ERROR,#08-0f
72
+ MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START#10-17
73
+ )
74
+ # fmt: on
75
+
76
+ BIG5_CHAR_LEN_TABLE = (0, 1, 1, 2, 0)
77
+
78
+ BIG5_SM_MODEL: CodingStateMachineDict = {
79
+ "class_table": BIG5_CLS,
80
+ "class_factor": 5,
81
+ "state_table": BIG5_ST,
82
+ "char_len_table": BIG5_CHAR_LEN_TABLE,
83
+ "name": "Big5",
84
+ }
85
+
86
+ # CP949
87
+ # fmt: off
88
+ CP949_CLS = (
89
+ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, # 00 - 0f
90
+ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, # 10 - 1f
91
+ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, # 20 - 2f
92
+ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, # 30 - 3f
93
+ 1, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, # 40 - 4f
94
+ 4, 4, 5, 5, 5, 5, 5, 5, 5, 5, 5, 1, 1, 1, 1, 1, # 50 - 5f
95
+ 1, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, # 60 - 6f
96
+ 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 1, 1, 1, 1, 1, # 70 - 7f
97
+ 0, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, # 80 - 8f
98
+ 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, # 90 - 9f
99
+ 6, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 8, 8, 8, # a0 - af
100
+ 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, # b0 - bf
101
+ 7, 7, 7, 7, 7, 7, 9, 2, 2, 3, 2, 2, 2, 2, 2, 2, # c0 - cf
102
+ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, # d0 - df
103
+ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, # e0 - ef
104
+ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 0, # f0 - ff
105
+ )
106
+
107
+ CP949_ST = (
108
+ #cls= 0 1 2 3 4 5 6 7 8 9 # previous state =
109
+ MachineState.ERROR,MachineState.START, 3,MachineState.ERROR,MachineState.START,MachineState.START, 4, 5,MachineState.ERROR, 6, # MachineState.START
110
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR, # MachineState.ERROR
111
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME, # MachineState.ITS_ME
112
+ MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START, # 3
113
+ MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START, # 4
114
+ MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START, # 5
115
+ MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START, # 6
116
+ )
117
+ # fmt: on
118
+
119
+ CP949_CHAR_LEN_TABLE = (0, 1, 2, 0, 1, 1, 2, 2, 0, 2)
120
+
121
+ CP949_SM_MODEL: CodingStateMachineDict = {
122
+ "class_table": CP949_CLS,
123
+ "class_factor": 10,
124
+ "state_table": CP949_ST,
125
+ "char_len_table": CP949_CHAR_LEN_TABLE,
126
+ "name": "CP949",
127
+ }
128
+
129
+ # EUC-JP
130
+ # fmt: off
131
+ EUCJP_CLS = (
132
+ 4, 4, 4, 4, 4, 4, 4, 4, # 00 - 07
133
+ 4, 4, 4, 4, 4, 4, 5, 5, # 08 - 0f
134
+ 4, 4, 4, 4, 4, 4, 4, 4, # 10 - 17
135
+ 4, 4, 4, 5, 4, 4, 4, 4, # 18 - 1f
136
+ 4, 4, 4, 4, 4, 4, 4, 4, # 20 - 27
137
+ 4, 4, 4, 4, 4, 4, 4, 4, # 28 - 2f
138
+ 4, 4, 4, 4, 4, 4, 4, 4, # 30 - 37
139
+ 4, 4, 4, 4, 4, 4, 4, 4, # 38 - 3f
140
+ 4, 4, 4, 4, 4, 4, 4, 4, # 40 - 47
141
+ 4, 4, 4, 4, 4, 4, 4, 4, # 48 - 4f
142
+ 4, 4, 4, 4, 4, 4, 4, 4, # 50 - 57
143
+ 4, 4, 4, 4, 4, 4, 4, 4, # 58 - 5f
144
+ 4, 4, 4, 4, 4, 4, 4, 4, # 60 - 67
145
+ 4, 4, 4, 4, 4, 4, 4, 4, # 68 - 6f
146
+ 4, 4, 4, 4, 4, 4, 4, 4, # 70 - 77
147
+ 4, 4, 4, 4, 4, 4, 4, 4, # 78 - 7f
148
+ 5, 5, 5, 5, 5, 5, 5, 5, # 80 - 87
149
+ 5, 5, 5, 5, 5, 5, 1, 3, # 88 - 8f
150
+ 5, 5, 5, 5, 5, 5, 5, 5, # 90 - 97
151
+ 5, 5, 5, 5, 5, 5, 5, 5, # 98 - 9f
152
+ 5, 2, 2, 2, 2, 2, 2, 2, # a0 - a7
153
+ 2, 2, 2, 2, 2, 2, 2, 2, # a8 - af
154
+ 2, 2, 2, 2, 2, 2, 2, 2, # b0 - b7
155
+ 2, 2, 2, 2, 2, 2, 2, 2, # b8 - bf
156
+ 2, 2, 2, 2, 2, 2, 2, 2, # c0 - c7
157
+ 2, 2, 2, 2, 2, 2, 2, 2, # c8 - cf
158
+ 2, 2, 2, 2, 2, 2, 2, 2, # d0 - d7
159
+ 2, 2, 2, 2, 2, 2, 2, 2, # d8 - df
160
+ 0, 0, 0, 0, 0, 0, 0, 0, # e0 - e7
161
+ 0, 0, 0, 0, 0, 0, 0, 0, # e8 - ef
162
+ 0, 0, 0, 0, 0, 0, 0, 0, # f0 - f7
163
+ 0, 0, 0, 0, 0, 0, 0, 5 # f8 - ff
164
+ )
165
+
166
+ EUCJP_ST = (
167
+ 3, 4, 3, 5,MachineState.START,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#00-07
168
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,#08-0f
169
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.START,MachineState.ERROR,MachineState.START,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#10-17
170
+ MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR, 3,MachineState.ERROR,#18-1f
171
+ 3,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START#20-27
172
+ )
173
+ # fmt: on
174
+
175
+ EUCJP_CHAR_LEN_TABLE = (2, 2, 2, 3, 1, 0)
176
+
177
+ EUCJP_SM_MODEL: CodingStateMachineDict = {
178
+ "class_table": EUCJP_CLS,
179
+ "class_factor": 6,
180
+ "state_table": EUCJP_ST,
181
+ "char_len_table": EUCJP_CHAR_LEN_TABLE,
182
+ "name": "EUC-JP",
183
+ }
184
+
185
+ # EUC-KR
186
+ # fmt: off
187
+ EUCKR_CLS = (
188
+ 1, 1, 1, 1, 1, 1, 1, 1, # 00 - 07
189
+ 1, 1, 1, 1, 1, 1, 0, 0, # 08 - 0f
190
+ 1, 1, 1, 1, 1, 1, 1, 1, # 10 - 17
191
+ 1, 1, 1, 0, 1, 1, 1, 1, # 18 - 1f
192
+ 1, 1, 1, 1, 1, 1, 1, 1, # 20 - 27
193
+ 1, 1, 1, 1, 1, 1, 1, 1, # 28 - 2f
194
+ 1, 1, 1, 1, 1, 1, 1, 1, # 30 - 37
195
+ 1, 1, 1, 1, 1, 1, 1, 1, # 38 - 3f
196
+ 1, 1, 1, 1, 1, 1, 1, 1, # 40 - 47
197
+ 1, 1, 1, 1, 1, 1, 1, 1, # 48 - 4f
198
+ 1, 1, 1, 1, 1, 1, 1, 1, # 50 - 57
199
+ 1, 1, 1, 1, 1, 1, 1, 1, # 58 - 5f
200
+ 1, 1, 1, 1, 1, 1, 1, 1, # 60 - 67
201
+ 1, 1, 1, 1, 1, 1, 1, 1, # 68 - 6f
202
+ 1, 1, 1, 1, 1, 1, 1, 1, # 70 - 77
203
+ 1, 1, 1, 1, 1, 1, 1, 1, # 78 - 7f
204
+ 0, 0, 0, 0, 0, 0, 0, 0, # 80 - 87
205
+ 0, 0, 0, 0, 0, 0, 0, 0, # 88 - 8f
206
+ 0, 0, 0, 0, 0, 0, 0, 0, # 90 - 97
207
+ 0, 0, 0, 0, 0, 0, 0, 0, # 98 - 9f
208
+ 0, 2, 2, 2, 2, 2, 2, 2, # a0 - a7
209
+ 2, 2, 2, 2, 2, 3, 3, 3, # a8 - af
210
+ 2, 2, 2, 2, 2, 2, 2, 2, # b0 - b7
211
+ 2, 2, 2, 2, 2, 2, 2, 2, # b8 - bf
212
+ 2, 2, 2, 2, 2, 2, 2, 2, # c0 - c7
213
+ 2, 3, 2, 2, 2, 2, 2, 2, # c8 - cf
214
+ 2, 2, 2, 2, 2, 2, 2, 2, # d0 - d7
215
+ 2, 2, 2, 2, 2, 2, 2, 2, # d8 - df
216
+ 2, 2, 2, 2, 2, 2, 2, 2, # e0 - e7
217
+ 2, 2, 2, 2, 2, 2, 2, 2, # e8 - ef
218
+ 2, 2, 2, 2, 2, 2, 2, 2, # f0 - f7
219
+ 2, 2, 2, 2, 2, 2, 2, 0 # f8 - ff
220
+ )
221
+
222
+ EUCKR_ST = (
223
+ MachineState.ERROR,MachineState.START, 3,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#00-07
224
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START #08-0f
225
+ )
226
+ # fmt: on
227
+
228
+ EUCKR_CHAR_LEN_TABLE = (0, 1, 2, 0)
229
+
230
+ EUCKR_SM_MODEL: CodingStateMachineDict = {
231
+ "class_table": EUCKR_CLS,
232
+ "class_factor": 4,
233
+ "state_table": EUCKR_ST,
234
+ "char_len_table": EUCKR_CHAR_LEN_TABLE,
235
+ "name": "EUC-KR",
236
+ }
237
+
238
+ # JOHAB
239
+ # fmt: off
240
+ JOHAB_CLS = (
241
+ 4,4,4,4,4,4,4,4, # 00 - 07
242
+ 4,4,4,4,4,4,0,0, # 08 - 0f
243
+ 4,4,4,4,4,4,4,4, # 10 - 17
244
+ 4,4,4,0,4,4,4,4, # 18 - 1f
245
+ 4,4,4,4,4,4,4,4, # 20 - 27
246
+ 4,4,4,4,4,4,4,4, # 28 - 2f
247
+ 4,3,3,3,3,3,3,3, # 30 - 37
248
+ 3,3,3,3,3,3,3,3, # 38 - 3f
249
+ 3,1,1,1,1,1,1,1, # 40 - 47
250
+ 1,1,1,1,1,1,1,1, # 48 - 4f
251
+ 1,1,1,1,1,1,1,1, # 50 - 57
252
+ 1,1,1,1,1,1,1,1, # 58 - 5f
253
+ 1,1,1,1,1,1,1,1, # 60 - 67
254
+ 1,1,1,1,1,1,1,1, # 68 - 6f
255
+ 1,1,1,1,1,1,1,1, # 70 - 77
256
+ 1,1,1,1,1,1,1,2, # 78 - 7f
257
+ 6,6,6,6,8,8,8,8, # 80 - 87
258
+ 8,8,8,8,8,8,8,8, # 88 - 8f
259
+ 8,7,7,7,7,7,7,7, # 90 - 97
260
+ 7,7,7,7,7,7,7,7, # 98 - 9f
261
+ 7,7,7,7,7,7,7,7, # a0 - a7
262
+ 7,7,7,7,7,7,7,7, # a8 - af
263
+ 7,7,7,7,7,7,7,7, # b0 - b7
264
+ 7,7,7,7,7,7,7,7, # b8 - bf
265
+ 7,7,7,7,7,7,7,7, # c0 - c7
266
+ 7,7,7,7,7,7,7,7, # c8 - cf
267
+ 7,7,7,7,5,5,5,5, # d0 - d7
268
+ 5,9,9,9,9,9,9,5, # d8 - df
269
+ 9,9,9,9,9,9,9,9, # e0 - e7
270
+ 9,9,9,9,9,9,9,9, # e8 - ef
271
+ 9,9,9,9,9,9,9,9, # f0 - f7
272
+ 9,9,5,5,5,5,5,0 # f8 - ff
273
+ )
274
+
275
+ JOHAB_ST = (
276
+ # cls = 0 1 2 3 4 5 6 7 8 9
277
+ MachineState.ERROR ,MachineState.START ,MachineState.START ,MachineState.START ,MachineState.START ,MachineState.ERROR ,MachineState.ERROR ,3 ,3 ,4 , # MachineState.START
278
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME, # MachineState.ITS_ME
279
+ MachineState.ERROR ,MachineState.ERROR ,MachineState.ERROR ,MachineState.ERROR ,MachineState.ERROR ,MachineState.ERROR ,MachineState.ERROR ,MachineState.ERROR ,MachineState.ERROR ,MachineState.ERROR , # MachineState.ERROR
280
+ MachineState.ERROR ,MachineState.START ,MachineState.START ,MachineState.ERROR ,MachineState.ERROR ,MachineState.START ,MachineState.START ,MachineState.START ,MachineState.START ,MachineState.START , # 3
281
+ MachineState.ERROR ,MachineState.START ,MachineState.ERROR ,MachineState.START ,MachineState.ERROR ,MachineState.START ,MachineState.ERROR ,MachineState.START ,MachineState.ERROR ,MachineState.START , # 4
282
+ )
283
+ # fmt: on
284
+
285
+ JOHAB_CHAR_LEN_TABLE = (0, 1, 1, 1, 1, 0, 0, 2, 2, 2)
286
+
287
+ JOHAB_SM_MODEL: CodingStateMachineDict = {
288
+ "class_table": JOHAB_CLS,
289
+ "class_factor": 10,
290
+ "state_table": JOHAB_ST,
291
+ "char_len_table": JOHAB_CHAR_LEN_TABLE,
292
+ "name": "Johab",
293
+ }
294
+
295
+ # EUC-TW
296
+ # fmt: off
297
+ EUCTW_CLS = (
298
+ 2, 2, 2, 2, 2, 2, 2, 2, # 00 - 07
299
+ 2, 2, 2, 2, 2, 2, 0, 0, # 08 - 0f
300
+ 2, 2, 2, 2, 2, 2, 2, 2, # 10 - 17
301
+ 2, 2, 2, 0, 2, 2, 2, 2, # 18 - 1f
302
+ 2, 2, 2, 2, 2, 2, 2, 2, # 20 - 27
303
+ 2, 2, 2, 2, 2, 2, 2, 2, # 28 - 2f
304
+ 2, 2, 2, 2, 2, 2, 2, 2, # 30 - 37
305
+ 2, 2, 2, 2, 2, 2, 2, 2, # 38 - 3f
306
+ 2, 2, 2, 2, 2, 2, 2, 2, # 40 - 47
307
+ 2, 2, 2, 2, 2, 2, 2, 2, # 48 - 4f
308
+ 2, 2, 2, 2, 2, 2, 2, 2, # 50 - 57
309
+ 2, 2, 2, 2, 2, 2, 2, 2, # 58 - 5f
310
+ 2, 2, 2, 2, 2, 2, 2, 2, # 60 - 67
311
+ 2, 2, 2, 2, 2, 2, 2, 2, # 68 - 6f
312
+ 2, 2, 2, 2, 2, 2, 2, 2, # 70 - 77
313
+ 2, 2, 2, 2, 2, 2, 2, 2, # 78 - 7f
314
+ 0, 0, 0, 0, 0, 0, 0, 0, # 80 - 87
315
+ 0, 0, 0, 0, 0, 0, 6, 0, # 88 - 8f
316
+ 0, 0, 0, 0, 0, 0, 0, 0, # 90 - 97
317
+ 0, 0, 0, 0, 0, 0, 0, 0, # 98 - 9f
318
+ 0, 3, 4, 4, 4, 4, 4, 4, # a0 - a7
319
+ 5, 5, 1, 1, 1, 1, 1, 1, # a8 - af
320
+ 1, 1, 1, 1, 1, 1, 1, 1, # b0 - b7
321
+ 1, 1, 1, 1, 1, 1, 1, 1, # b8 - bf
322
+ 1, 1, 3, 1, 3, 3, 3, 3, # c0 - c7
323
+ 3, 3, 3, 3, 3, 3, 3, 3, # c8 - cf
324
+ 3, 3, 3, 3, 3, 3, 3, 3, # d0 - d7
325
+ 3, 3, 3, 3, 3, 3, 3, 3, # d8 - df
326
+ 3, 3, 3, 3, 3, 3, 3, 3, # e0 - e7
327
+ 3, 3, 3, 3, 3, 3, 3, 3, # e8 - ef
328
+ 3, 3, 3, 3, 3, 3, 3, 3, # f0 - f7
329
+ 3, 3, 3, 3, 3, 3, 3, 0 # f8 - ff
330
+ )
331
+
332
+ EUCTW_ST = (
333
+ MachineState.ERROR,MachineState.ERROR,MachineState.START, 3, 3, 3, 4,MachineState.ERROR,#00-07
334
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ITS_ME,MachineState.ITS_ME,#08-0f
335
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ERROR,MachineState.START,MachineState.ERROR,#10-17
336
+ MachineState.START,MachineState.START,MachineState.START,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#18-1f
337
+ 5,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.ERROR,MachineState.START,MachineState.START,#20-27
338
+ MachineState.START,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START #28-2f
339
+ )
340
+ # fmt: on
341
+
342
+ EUCTW_CHAR_LEN_TABLE = (0, 0, 1, 2, 2, 2, 3)
343
+
344
+ EUCTW_SM_MODEL: CodingStateMachineDict = {
345
+ "class_table": EUCTW_CLS,
346
+ "class_factor": 7,
347
+ "state_table": EUCTW_ST,
348
+ "char_len_table": EUCTW_CHAR_LEN_TABLE,
349
+ "name": "x-euc-tw",
350
+ }
351
+
352
+ # GB2312
353
+ # fmt: off
354
+ GB2312_CLS = (
355
+ 1, 1, 1, 1, 1, 1, 1, 1, # 00 - 07
356
+ 1, 1, 1, 1, 1, 1, 0, 0, # 08 - 0f
357
+ 1, 1, 1, 1, 1, 1, 1, 1, # 10 - 17
358
+ 1, 1, 1, 0, 1, 1, 1, 1, # 18 - 1f
359
+ 1, 1, 1, 1, 1, 1, 1, 1, # 20 - 27
360
+ 1, 1, 1, 1, 1, 1, 1, 1, # 28 - 2f
361
+ 3, 3, 3, 3, 3, 3, 3, 3, # 30 - 37
362
+ 3, 3, 1, 1, 1, 1, 1, 1, # 38 - 3f
363
+ 2, 2, 2, 2, 2, 2, 2, 2, # 40 - 47
364
+ 2, 2, 2, 2, 2, 2, 2, 2, # 48 - 4f
365
+ 2, 2, 2, 2, 2, 2, 2, 2, # 50 - 57
366
+ 2, 2, 2, 2, 2, 2, 2, 2, # 58 - 5f
367
+ 2, 2, 2, 2, 2, 2, 2, 2, # 60 - 67
368
+ 2, 2, 2, 2, 2, 2, 2, 2, # 68 - 6f
369
+ 2, 2, 2, 2, 2, 2, 2, 2, # 70 - 77
370
+ 2, 2, 2, 2, 2, 2, 2, 4, # 78 - 7f
371
+ 5, 6, 6, 6, 6, 6, 6, 6, # 80 - 87
372
+ 6, 6, 6, 6, 6, 6, 6, 6, # 88 - 8f
373
+ 6, 6, 6, 6, 6, 6, 6, 6, # 90 - 97
374
+ 6, 6, 6, 6, 6, 6, 6, 6, # 98 - 9f
375
+ 6, 6, 6, 6, 6, 6, 6, 6, # a0 - a7
376
+ 6, 6, 6, 6, 6, 6, 6, 6, # a8 - af
377
+ 6, 6, 6, 6, 6, 6, 6, 6, # b0 - b7
378
+ 6, 6, 6, 6, 6, 6, 6, 6, # b8 - bf
379
+ 6, 6, 6, 6, 6, 6, 6, 6, # c0 - c7
380
+ 6, 6, 6, 6, 6, 6, 6, 6, # c8 - cf
381
+ 6, 6, 6, 6, 6, 6, 6, 6, # d0 - d7
382
+ 6, 6, 6, 6, 6, 6, 6, 6, # d8 - df
383
+ 6, 6, 6, 6, 6, 6, 6, 6, # e0 - e7
384
+ 6, 6, 6, 6, 6, 6, 6, 6, # e8 - ef
385
+ 6, 6, 6, 6, 6, 6, 6, 6, # f0 - f7
386
+ 6, 6, 6, 6, 6, 6, 6, 0 # f8 - ff
387
+ )
388
+
389
+ GB2312_ST = (
390
+ MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START, 3,MachineState.ERROR,#00-07
391
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ITS_ME,MachineState.ITS_ME,#08-0f
392
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ERROR,MachineState.ERROR,MachineState.START,#10-17
393
+ 4,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#18-1f
394
+ MachineState.ERROR,MachineState.ERROR, 5,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ITS_ME,MachineState.ERROR,#20-27
395
+ MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.START #28-2f
396
+ )
397
+ # fmt: on
398
+
399
+ # To be accurate, the length of class 6 can be either 2 or 4.
400
+ # But it is not necessary to discriminate between the two since
401
+ # it is used for frequency analysis only, and we are validating
402
+ # each code range there as well. So it is safe to set it to be
403
+ # 2 here.
404
+ GB2312_CHAR_LEN_TABLE = (0, 1, 1, 1, 1, 1, 2)
405
+
406
+ GB2312_SM_MODEL: CodingStateMachineDict = {
407
+ "class_table": GB2312_CLS,
408
+ "class_factor": 7,
409
+ "state_table": GB2312_ST,
410
+ "char_len_table": GB2312_CHAR_LEN_TABLE,
411
+ "name": "GB2312",
412
+ }
413
+
414
+ # Shift_JIS
415
+ # fmt: off
416
+ SJIS_CLS = (
417
+ 1, 1, 1, 1, 1, 1, 1, 1, # 00 - 07
418
+ 1, 1, 1, 1, 1, 1, 0, 0, # 08 - 0f
419
+ 1, 1, 1, 1, 1, 1, 1, 1, # 10 - 17
420
+ 1, 1, 1, 0, 1, 1, 1, 1, # 18 - 1f
421
+ 1, 1, 1, 1, 1, 1, 1, 1, # 20 - 27
422
+ 1, 1, 1, 1, 1, 1, 1, 1, # 28 - 2f
423
+ 1, 1, 1, 1, 1, 1, 1, 1, # 30 - 37
424
+ 1, 1, 1, 1, 1, 1, 1, 1, # 38 - 3f
425
+ 2, 2, 2, 2, 2, 2, 2, 2, # 40 - 47
426
+ 2, 2, 2, 2, 2, 2, 2, 2, # 48 - 4f
427
+ 2, 2, 2, 2, 2, 2, 2, 2, # 50 - 57
428
+ 2, 2, 2, 2, 2, 2, 2, 2, # 58 - 5f
429
+ 2, 2, 2, 2, 2, 2, 2, 2, # 60 - 67
430
+ 2, 2, 2, 2, 2, 2, 2, 2, # 68 - 6f
431
+ 2, 2, 2, 2, 2, 2, 2, 2, # 70 - 77
432
+ 2, 2, 2, 2, 2, 2, 2, 1, # 78 - 7f
433
+ 3, 3, 3, 3, 3, 2, 2, 3, # 80 - 87
434
+ 3, 3, 3, 3, 3, 3, 3, 3, # 88 - 8f
435
+ 3, 3, 3, 3, 3, 3, 3, 3, # 90 - 97
436
+ 3, 3, 3, 3, 3, 3, 3, 3, # 98 - 9f
437
+ #0xa0 is illegal in sjis encoding, but some pages does
438
+ #contain such byte. We need to be more error forgiven.
439
+ 2, 2, 2, 2, 2, 2, 2, 2, # a0 - a7
440
+ 2, 2, 2, 2, 2, 2, 2, 2, # a8 - af
441
+ 2, 2, 2, 2, 2, 2, 2, 2, # b0 - b7
442
+ 2, 2, 2, 2, 2, 2, 2, 2, # b8 - bf
443
+ 2, 2, 2, 2, 2, 2, 2, 2, # c0 - c7
444
+ 2, 2, 2, 2, 2, 2, 2, 2, # c8 - cf
445
+ 2, 2, 2, 2, 2, 2, 2, 2, # d0 - d7
446
+ 2, 2, 2, 2, 2, 2, 2, 2, # d8 - df
447
+ 3, 3, 3, 3, 3, 3, 3, 3, # e0 - e7
448
+ 3, 3, 3, 3, 3, 4, 4, 4, # e8 - ef
449
+ 3, 3, 3, 3, 3, 3, 3, 3, # f0 - f7
450
+ 3, 3, 3, 3, 3, 0, 0, 0, # f8 - ff
451
+ )
452
+
453
+ SJIS_ST = (
454
+ MachineState.ERROR,MachineState.START,MachineState.START, 3,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#00-07
455
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,#08-0f
456
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START #10-17
457
+ )
458
+ # fmt: on
459
+
460
+ SJIS_CHAR_LEN_TABLE = (0, 1, 1, 2, 0, 0)
461
+
462
+ SJIS_SM_MODEL: CodingStateMachineDict = {
463
+ "class_table": SJIS_CLS,
464
+ "class_factor": 6,
465
+ "state_table": SJIS_ST,
466
+ "char_len_table": SJIS_CHAR_LEN_TABLE,
467
+ "name": "Shift_JIS",
468
+ }
469
+
470
+ # UCS2-BE
471
+ # fmt: off
472
+ UCS2BE_CLS = (
473
+ 0, 0, 0, 0, 0, 0, 0, 0, # 00 - 07
474
+ 0, 0, 1, 0, 0, 2, 0, 0, # 08 - 0f
475
+ 0, 0, 0, 0, 0, 0, 0, 0, # 10 - 17
476
+ 0, 0, 0, 3, 0, 0, 0, 0, # 18 - 1f
477
+ 0, 0, 0, 0, 0, 0, 0, 0, # 20 - 27
478
+ 0, 3, 3, 3, 3, 3, 0, 0, # 28 - 2f
479
+ 0, 0, 0, 0, 0, 0, 0, 0, # 30 - 37
480
+ 0, 0, 0, 0, 0, 0, 0, 0, # 38 - 3f
481
+ 0, 0, 0, 0, 0, 0, 0, 0, # 40 - 47
482
+ 0, 0, 0, 0, 0, 0, 0, 0, # 48 - 4f
483
+ 0, 0, 0, 0, 0, 0, 0, 0, # 50 - 57
484
+ 0, 0, 0, 0, 0, 0, 0, 0, # 58 - 5f
485
+ 0, 0, 0, 0, 0, 0, 0, 0, # 60 - 67
486
+ 0, 0, 0, 0, 0, 0, 0, 0, # 68 - 6f
487
+ 0, 0, 0, 0, 0, 0, 0, 0, # 70 - 77
488
+ 0, 0, 0, 0, 0, 0, 0, 0, # 78 - 7f
489
+ 0, 0, 0, 0, 0, 0, 0, 0, # 80 - 87
490
+ 0, 0, 0, 0, 0, 0, 0, 0, # 88 - 8f
491
+ 0, 0, 0, 0, 0, 0, 0, 0, # 90 - 97
492
+ 0, 0, 0, 0, 0, 0, 0, 0, # 98 - 9f
493
+ 0, 0, 0, 0, 0, 0, 0, 0, # a0 - a7
494
+ 0, 0, 0, 0, 0, 0, 0, 0, # a8 - af
495
+ 0, 0, 0, 0, 0, 0, 0, 0, # b0 - b7
496
+ 0, 0, 0, 0, 0, 0, 0, 0, # b8 - bf
497
+ 0, 0, 0, 0, 0, 0, 0, 0, # c0 - c7
498
+ 0, 0, 0, 0, 0, 0, 0, 0, # c8 - cf
499
+ 0, 0, 0, 0, 0, 0, 0, 0, # d0 - d7
500
+ 0, 0, 0, 0, 0, 0, 0, 0, # d8 - df
501
+ 0, 0, 0, 0, 0, 0, 0, 0, # e0 - e7
502
+ 0, 0, 0, 0, 0, 0, 0, 0, # e8 - ef
503
+ 0, 0, 0, 0, 0, 0, 0, 0, # f0 - f7
504
+ 0, 0, 0, 0, 0, 0, 4, 5 # f8 - ff
505
+ )
506
+
507
+ UCS2BE_ST = (
508
+ 5, 7, 7,MachineState.ERROR, 4, 3,MachineState.ERROR,MachineState.ERROR,#00-07
509
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,#08-0f
510
+ MachineState.ITS_ME,MachineState.ITS_ME, 6, 6, 6, 6,MachineState.ERROR,MachineState.ERROR,#10-17
511
+ 6, 6, 6, 6, 6,MachineState.ITS_ME, 6, 6,#18-1f
512
+ 6, 6, 6, 6, 5, 7, 7,MachineState.ERROR,#20-27
513
+ 5, 8, 6, 6,MachineState.ERROR, 6, 6, 6,#28-2f
514
+ 6, 6, 6, 6,MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START #30-37
515
+ )
516
+ # fmt: on
517
+
518
+ UCS2BE_CHAR_LEN_TABLE = (2, 2, 2, 0, 2, 2)
519
+
520
+ UCS2BE_SM_MODEL: CodingStateMachineDict = {
521
+ "class_table": UCS2BE_CLS,
522
+ "class_factor": 6,
523
+ "state_table": UCS2BE_ST,
524
+ "char_len_table": UCS2BE_CHAR_LEN_TABLE,
525
+ "name": "UTF-16BE",
526
+ }
527
+
528
+ # UCS2-LE
529
+ # fmt: off
530
+ UCS2LE_CLS = (
531
+ 0, 0, 0, 0, 0, 0, 0, 0, # 00 - 07
532
+ 0, 0, 1, 0, 0, 2, 0, 0, # 08 - 0f
533
+ 0, 0, 0, 0, 0, 0, 0, 0, # 10 - 17
534
+ 0, 0, 0, 3, 0, 0, 0, 0, # 18 - 1f
535
+ 0, 0, 0, 0, 0, 0, 0, 0, # 20 - 27
536
+ 0, 3, 3, 3, 3, 3, 0, 0, # 28 - 2f
537
+ 0, 0, 0, 0, 0, 0, 0, 0, # 30 - 37
538
+ 0, 0, 0, 0, 0, 0, 0, 0, # 38 - 3f
539
+ 0, 0, 0, 0, 0, 0, 0, 0, # 40 - 47
540
+ 0, 0, 0, 0, 0, 0, 0, 0, # 48 - 4f
541
+ 0, 0, 0, 0, 0, 0, 0, 0, # 50 - 57
542
+ 0, 0, 0, 0, 0, 0, 0, 0, # 58 - 5f
543
+ 0, 0, 0, 0, 0, 0, 0, 0, # 60 - 67
544
+ 0, 0, 0, 0, 0, 0, 0, 0, # 68 - 6f
545
+ 0, 0, 0, 0, 0, 0, 0, 0, # 70 - 77
546
+ 0, 0, 0, 0, 0, 0, 0, 0, # 78 - 7f
547
+ 0, 0, 0, 0, 0, 0, 0, 0, # 80 - 87
548
+ 0, 0, 0, 0, 0, 0, 0, 0, # 88 - 8f
549
+ 0, 0, 0, 0, 0, 0, 0, 0, # 90 - 97
550
+ 0, 0, 0, 0, 0, 0, 0, 0, # 98 - 9f
551
+ 0, 0, 0, 0, 0, 0, 0, 0, # a0 - a7
552
+ 0, 0, 0, 0, 0, 0, 0, 0, # a8 - af
553
+ 0, 0, 0, 0, 0, 0, 0, 0, # b0 - b7
554
+ 0, 0, 0, 0, 0, 0, 0, 0, # b8 - bf
555
+ 0, 0, 0, 0, 0, 0, 0, 0, # c0 - c7
556
+ 0, 0, 0, 0, 0, 0, 0, 0, # c8 - cf
557
+ 0, 0, 0, 0, 0, 0, 0, 0, # d0 - d7
558
+ 0, 0, 0, 0, 0, 0, 0, 0, # d8 - df
559
+ 0, 0, 0, 0, 0, 0, 0, 0, # e0 - e7
560
+ 0, 0, 0, 0, 0, 0, 0, 0, # e8 - ef
561
+ 0, 0, 0, 0, 0, 0, 0, 0, # f0 - f7
562
+ 0, 0, 0, 0, 0, 0, 4, 5 # f8 - ff
563
+ )
564
+
565
+ UCS2LE_ST = (
566
+ 6, 6, 7, 6, 4, 3,MachineState.ERROR,MachineState.ERROR,#00-07
567
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,#08-0f
568
+ MachineState.ITS_ME,MachineState.ITS_ME, 5, 5, 5,MachineState.ERROR,MachineState.ITS_ME,MachineState.ERROR,#10-17
569
+ 5, 5, 5,MachineState.ERROR, 5,MachineState.ERROR, 6, 6,#18-1f
570
+ 7, 6, 8, 8, 5, 5, 5,MachineState.ERROR,#20-27
571
+ 5, 5, 5,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR, 5, 5,#28-2f
572
+ 5, 5, 5,MachineState.ERROR, 5,MachineState.ERROR,MachineState.START,MachineState.START #30-37
573
+ )
574
+ # fmt: on
575
+
576
+ UCS2LE_CHAR_LEN_TABLE = (2, 2, 2, 2, 2, 2)
577
+
578
+ UCS2LE_SM_MODEL: CodingStateMachineDict = {
579
+ "class_table": UCS2LE_CLS,
580
+ "class_factor": 6,
581
+ "state_table": UCS2LE_ST,
582
+ "char_len_table": UCS2LE_CHAR_LEN_TABLE,
583
+ "name": "UTF-16LE",
584
+ }
585
+
586
+ # UTF-8
587
+ # fmt: off
588
+ UTF8_CLS = (
589
+ 1, 1, 1, 1, 1, 1, 1, 1, # 00 - 07 #allow 0x00 as a legal value
590
+ 1, 1, 1, 1, 1, 1, 0, 0, # 08 - 0f
591
+ 1, 1, 1, 1, 1, 1, 1, 1, # 10 - 17
592
+ 1, 1, 1, 0, 1, 1, 1, 1, # 18 - 1f
593
+ 1, 1, 1, 1, 1, 1, 1, 1, # 20 - 27
594
+ 1, 1, 1, 1, 1, 1, 1, 1, # 28 - 2f
595
+ 1, 1, 1, 1, 1, 1, 1, 1, # 30 - 37
596
+ 1, 1, 1, 1, 1, 1, 1, 1, # 38 - 3f
597
+ 1, 1, 1, 1, 1, 1, 1, 1, # 40 - 47
598
+ 1, 1, 1, 1, 1, 1, 1, 1, # 48 - 4f
599
+ 1, 1, 1, 1, 1, 1, 1, 1, # 50 - 57
600
+ 1, 1, 1, 1, 1, 1, 1, 1, # 58 - 5f
601
+ 1, 1, 1, 1, 1, 1, 1, 1, # 60 - 67
602
+ 1, 1, 1, 1, 1, 1, 1, 1, # 68 - 6f
603
+ 1, 1, 1, 1, 1, 1, 1, 1, # 70 - 77
604
+ 1, 1, 1, 1, 1, 1, 1, 1, # 78 - 7f
605
+ 2, 2, 2, 2, 3, 3, 3, 3, # 80 - 87
606
+ 4, 4, 4, 4, 4, 4, 4, 4, # 88 - 8f
607
+ 4, 4, 4, 4, 4, 4, 4, 4, # 90 - 97
608
+ 4, 4, 4, 4, 4, 4, 4, 4, # 98 - 9f
609
+ 5, 5, 5, 5, 5, 5, 5, 5, # a0 - a7
610
+ 5, 5, 5, 5, 5, 5, 5, 5, # a8 - af
611
+ 5, 5, 5, 5, 5, 5, 5, 5, # b0 - b7
612
+ 5, 5, 5, 5, 5, 5, 5, 5, # b8 - bf
613
+ 0, 0, 6, 6, 6, 6, 6, 6, # c0 - c7
614
+ 6, 6, 6, 6, 6, 6, 6, 6, # c8 - cf
615
+ 6, 6, 6, 6, 6, 6, 6, 6, # d0 - d7
616
+ 6, 6, 6, 6, 6, 6, 6, 6, # d8 - df
617
+ 7, 8, 8, 8, 8, 8, 8, 8, # e0 - e7
618
+ 8, 8, 8, 8, 8, 9, 8, 8, # e8 - ef
619
+ 10, 11, 11, 11, 11, 11, 11, 11, # f0 - f7
620
+ 12, 13, 13, 13, 14, 15, 0, 0 # f8 - ff
621
+ )
622
+
623
+ UTF8_ST = (
624
+ MachineState.ERROR,MachineState.START,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR, 12, 10,#00-07
625
+ 9, 11, 8, 7, 6, 5, 4, 3,#08-0f
626
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#10-17
627
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#18-1f
628
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,#20-27
629
+ MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,MachineState.ITS_ME,#28-2f
630
+ MachineState.ERROR,MachineState.ERROR, 5, 5, 5, 5,MachineState.ERROR,MachineState.ERROR,#30-37
631
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#38-3f
632
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR, 5, 5, 5,MachineState.ERROR,MachineState.ERROR,#40-47
633
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#48-4f
634
+ MachineState.ERROR,MachineState.ERROR, 7, 7, 7, 7,MachineState.ERROR,MachineState.ERROR,#50-57
635
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#58-5f
636
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR, 7, 7,MachineState.ERROR,MachineState.ERROR,#60-67
637
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#68-6f
638
+ MachineState.ERROR,MachineState.ERROR, 9, 9, 9, 9,MachineState.ERROR,MachineState.ERROR,#70-77
639
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#78-7f
640
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR, 9,MachineState.ERROR,MachineState.ERROR,#80-87
641
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#88-8f
642
+ MachineState.ERROR,MachineState.ERROR, 12, 12, 12, 12,MachineState.ERROR,MachineState.ERROR,#90-97
643
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#98-9f
644
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR, 12,MachineState.ERROR,MachineState.ERROR,#a0-a7
645
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#a8-af
646
+ MachineState.ERROR,MachineState.ERROR, 12, 12, 12,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#b0-b7
647
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,#b8-bf
648
+ MachineState.ERROR,MachineState.ERROR,MachineState.START,MachineState.START,MachineState.START,MachineState.START,MachineState.ERROR,MachineState.ERROR,#c0-c7
649
+ MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR,MachineState.ERROR #c8-cf
650
+ )
651
+ # fmt: on
652
+
653
+ UTF8_CHAR_LEN_TABLE = (0, 1, 0, 0, 0, 0, 2, 3, 3, 3, 4, 4, 5, 5, 6, 6)
654
+
655
+ UTF8_SM_MODEL: CodingStateMachineDict = {
656
+ "class_table": UTF8_CLS,
657
+ "class_factor": 16,
658
+ "state_table": UTF8_ST,
659
+ "char_len_table": UTF8_CHAR_LEN_TABLE,
660
+ "name": "UTF-8",
661
+ }
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/metadata/__init__.py ADDED
File without changes
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/metadata/languages.py ADDED
@@ -0,0 +1,352 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Metadata about languages used by our model training code for our
3
+ SingleByteCharSetProbers. Could be used for other things in the future.
4
+
5
+ This code is based on the language metadata from the uchardet project.
6
+ """
7
+
8
+ from string import ascii_letters
9
+ from typing import List, Optional
10
+
11
+ # TODO: Add Ukrainian (KOI8-U)
12
+
13
+
14
+ class Language:
15
+ """Metadata about a language useful for training models
16
+
17
+ :ivar name: The human name for the language, in English.
18
+ :type name: str
19
+ :ivar iso_code: 2-letter ISO 639-1 if possible, 3-letter ISO code otherwise,
20
+ or use another catalog as a last resort.
21
+ :type iso_code: str
22
+ :ivar use_ascii: Whether or not ASCII letters should be included in trained
23
+ models.
24
+ :type use_ascii: bool
25
+ :ivar charsets: The charsets we want to support and create data for.
26
+ :type charsets: list of str
27
+ :ivar alphabet: The characters in the language's alphabet. If `use_ascii` is
28
+ `True`, you only need to add those not in the ASCII set.
29
+ :type alphabet: str
30
+ :ivar wiki_start_pages: The Wikipedia pages to start from if we're crawling
31
+ Wikipedia for training data.
32
+ :type wiki_start_pages: list of str
33
+ """
34
+
35
+ def __init__(
36
+ self,
37
+ name: Optional[str] = None,
38
+ iso_code: Optional[str] = None,
39
+ use_ascii: bool = True,
40
+ charsets: Optional[List[str]] = None,
41
+ alphabet: Optional[str] = None,
42
+ wiki_start_pages: Optional[List[str]] = None,
43
+ ) -> None:
44
+ super().__init__()
45
+ self.name = name
46
+ self.iso_code = iso_code
47
+ self.use_ascii = use_ascii
48
+ self.charsets = charsets
49
+ if self.use_ascii:
50
+ if alphabet:
51
+ alphabet += ascii_letters
52
+ else:
53
+ alphabet = ascii_letters
54
+ elif not alphabet:
55
+ raise ValueError("Must supply alphabet if use_ascii is False")
56
+ self.alphabet = "".join(sorted(set(alphabet))) if alphabet else None
57
+ self.wiki_start_pages = wiki_start_pages
58
+
59
+ def __repr__(self) -> str:
60
+ param_str = ", ".join(
61
+ f"{k}={v!r}" for k, v in self.__dict__.items() if not k.startswith("_")
62
+ )
63
+ return f"{self.__class__.__name__}({param_str})"
64
+
65
+
66
+ LANGUAGES = {
67
+ "Arabic": Language(
68
+ name="Arabic",
69
+ iso_code="ar",
70
+ use_ascii=False,
71
+ # We only support encodings that use isolated
72
+ # forms, because the current recommendation is
73
+ # that the rendering system handles presentation
74
+ # forms. This means we purposefully skip IBM864.
75
+ charsets=["ISO-8859-6", "WINDOWS-1256", "CP720", "CP864"],
76
+ alphabet="ءآأؤإئابةتثجحخدذرزسشصضطظعغػؼؽؾؿـفقكلمنهوىيًٌٍَُِّ",
77
+ wiki_start_pages=["الصفحة_الرئيسية"],
78
+ ),
79
+ "Belarusian": Language(
80
+ name="Belarusian",
81
+ iso_code="be",
82
+ use_ascii=False,
83
+ charsets=["ISO-8859-5", "WINDOWS-1251", "IBM866", "MacCyrillic"],
84
+ alphabet="АБВГДЕЁЖЗІЙКЛМНОПРСТУЎФХЦЧШЫЬЭЮЯабвгдеёжзійклмнопрстуўфхцчшыьэюяʼ",
85
+ wiki_start_pages=["Галоўная_старонка"],
86
+ ),
87
+ "Bulgarian": Language(
88
+ name="Bulgarian",
89
+ iso_code="bg",
90
+ use_ascii=False,
91
+ charsets=["ISO-8859-5", "WINDOWS-1251", "IBM855"],
92
+ alphabet="АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯабвгдежзийклмнопрстуфхцчшщъьюя",
93
+ wiki_start_pages=["Начална_страница"],
94
+ ),
95
+ "Czech": Language(
96
+ name="Czech",
97
+ iso_code="cz",
98
+ use_ascii=True,
99
+ charsets=["ISO-8859-2", "WINDOWS-1250"],
100
+ alphabet="áčďéěíňóřšťúůýžÁČĎÉĚÍŇÓŘŠŤÚŮÝŽ",
101
+ wiki_start_pages=["Hlavní_strana"],
102
+ ),
103
+ "Danish": Language(
104
+ name="Danish",
105
+ iso_code="da",
106
+ use_ascii=True,
107
+ charsets=["ISO-8859-1", "ISO-8859-15", "WINDOWS-1252", "MacRoman"],
108
+ alphabet="æøåÆØÅ",
109
+ wiki_start_pages=["Forside"],
110
+ ),
111
+ "German": Language(
112
+ name="German",
113
+ iso_code="de",
114
+ use_ascii=True,
115
+ charsets=["ISO-8859-1", "ISO-8859-15", "WINDOWS-1252", "MacRoman"],
116
+ alphabet="äöüßẞÄÖÜ",
117
+ wiki_start_pages=["Wikipedia:Hauptseite"],
118
+ ),
119
+ "Greek": Language(
120
+ name="Greek",
121
+ iso_code="el",
122
+ use_ascii=False,
123
+ charsets=["ISO-8859-7", "WINDOWS-1253"],
124
+ alphabet="αβγδεζηθικλμνξοπρσςτυφχψωάέήίόύώΑΒΓΔΕΖΗΘΙΚΛΜΝΞΟΠΡΣΣΤΥΦΧΨΩΆΈΉΊΌΎΏ",
125
+ wiki_start_pages=["Πύλη:Κύρια"],
126
+ ),
127
+ "English": Language(
128
+ name="English",
129
+ iso_code="en",
130
+ use_ascii=True,
131
+ charsets=["ISO-8859-1", "WINDOWS-1252", "MacRoman"],
132
+ wiki_start_pages=["Main_Page"],
133
+ ),
134
+ "Esperanto": Language(
135
+ name="Esperanto",
136
+ iso_code="eo",
137
+ # Q, W, X, and Y not used at all
138
+ use_ascii=False,
139
+ charsets=["ISO-8859-3"],
140
+ alphabet="abcĉdefgĝhĥijĵklmnoprsŝtuŭvzABCĈDEFGĜHĤIJĴKLMNOPRSŜTUŬVZ",
141
+ wiki_start_pages=["Vikipedio:Ĉefpaĝo"],
142
+ ),
143
+ "Spanish": Language(
144
+ name="Spanish",
145
+ iso_code="es",
146
+ use_ascii=True,
147
+ charsets=["ISO-8859-1", "ISO-8859-15", "WINDOWS-1252", "MacRoman"],
148
+ alphabet="ñáéíóúüÑÁÉÍÓÚÜ",
149
+ wiki_start_pages=["Wikipedia:Portada"],
150
+ ),
151
+ "Estonian": Language(
152
+ name="Estonian",
153
+ iso_code="et",
154
+ use_ascii=False,
155
+ charsets=["ISO-8859-4", "ISO-8859-13", "WINDOWS-1257"],
156
+ # C, F, Š, Q, W, X, Y, Z, Ž are only for
157
+ # loanwords
158
+ alphabet="ABDEGHIJKLMNOPRSTUVÕÄÖÜabdeghijklmnoprstuvõäöü",
159
+ wiki_start_pages=["Esileht"],
160
+ ),
161
+ "Finnish": Language(
162
+ name="Finnish",
163
+ iso_code="fi",
164
+ use_ascii=True,
165
+ charsets=["ISO-8859-1", "ISO-8859-15", "WINDOWS-1252", "MacRoman"],
166
+ alphabet="ÅÄÖŠŽåäöšž",
167
+ wiki_start_pages=["Wikipedia:Etusivu"],
168
+ ),
169
+ "French": Language(
170
+ name="French",
171
+ iso_code="fr",
172
+ use_ascii=True,
173
+ charsets=["ISO-8859-1", "ISO-8859-15", "WINDOWS-1252", "MacRoman"],
174
+ alphabet="œàâçèéîïùûêŒÀÂÇÈÉÎÏÙÛÊ",
175
+ wiki_start_pages=["Wikipédia:Accueil_principal", "Bœuf (animal)"],
176
+ ),
177
+ "Hebrew": Language(
178
+ name="Hebrew",
179
+ iso_code="he",
180
+ use_ascii=False,
181
+ charsets=["ISO-8859-8", "WINDOWS-1255"],
182
+ alphabet="אבגדהוזחטיךכלםמןנסעףפץצקרשתװױײ",
183
+ wiki_start_pages=["עמוד_ראשי"],
184
+ ),
185
+ "Croatian": Language(
186
+ name="Croatian",
187
+ iso_code="hr",
188
+ # Q, W, X, Y are only used for foreign words.
189
+ use_ascii=False,
190
+ charsets=["ISO-8859-2", "WINDOWS-1250"],
191
+ alphabet="abcčćdđefghijklmnoprsštuvzžABCČĆDĐEFGHIJKLMNOPRSŠTUVZŽ",
192
+ wiki_start_pages=["Glavna_stranica"],
193
+ ),
194
+ "Hungarian": Language(
195
+ name="Hungarian",
196
+ iso_code="hu",
197
+ # Q, W, X, Y are only used for foreign words.
198
+ use_ascii=False,
199
+ charsets=["ISO-8859-2", "WINDOWS-1250"],
200
+ alphabet="abcdefghijklmnoprstuvzáéíóöőúüűABCDEFGHIJKLMNOPRSTUVZÁÉÍÓÖŐÚÜŰ",
201
+ wiki_start_pages=["Kezdőlap"],
202
+ ),
203
+ "Italian": Language(
204
+ name="Italian",
205
+ iso_code="it",
206
+ use_ascii=True,
207
+ charsets=["ISO-8859-1", "ISO-8859-15", "WINDOWS-1252", "MacRoman"],
208
+ alphabet="ÀÈÉÌÒÓÙàèéìòóù",
209
+ wiki_start_pages=["Pagina_principale"],
210
+ ),
211
+ "Lithuanian": Language(
212
+ name="Lithuanian",
213
+ iso_code="lt",
214
+ use_ascii=False,
215
+ charsets=["ISO-8859-13", "WINDOWS-1257", "ISO-8859-4"],
216
+ # Q, W, and X not used at all
217
+ alphabet="AĄBCČDEĘĖFGHIĮYJKLMNOPRSŠTUŲŪVZŽaąbcčdeęėfghiįyjklmnoprsštuųūvzž",
218
+ wiki_start_pages=["Pagrindinis_puslapis"],
219
+ ),
220
+ "Latvian": Language(
221
+ name="Latvian",
222
+ iso_code="lv",
223
+ use_ascii=False,
224
+ charsets=["ISO-8859-13", "WINDOWS-1257", "ISO-8859-4"],
225
+ # Q, W, X, Y are only for loanwords
226
+ alphabet="AĀBCČDEĒFGĢHIĪJKĶLĻMNŅOPRSŠTUŪVZŽaābcčdeēfgģhiījkķlļmnņoprsštuūvzž",
227
+ wiki_start_pages=["Sākumlapa"],
228
+ ),
229
+ "Macedonian": Language(
230
+ name="Macedonian",
231
+ iso_code="mk",
232
+ use_ascii=False,
233
+ charsets=["ISO-8859-5", "WINDOWS-1251", "MacCyrillic", "IBM855"],
234
+ alphabet="АБВГДЃЕЖЗЅИЈКЛЉМНЊОПРСТЌУФХЦЧЏШабвгдѓежзѕијклљмнњопрстќуфхцчџш",
235
+ wiki_start_pages=["Главна_страница"],
236
+ ),
237
+ "Dutch": Language(
238
+ name="Dutch",
239
+ iso_code="nl",
240
+ use_ascii=True,
241
+ charsets=["ISO-8859-1", "WINDOWS-1252", "MacRoman"],
242
+ wiki_start_pages=["Hoofdpagina"],
243
+ ),
244
+ "Polish": Language(
245
+ name="Polish",
246
+ iso_code="pl",
247
+ # Q and X are only used for foreign words.
248
+ use_ascii=False,
249
+ charsets=["ISO-8859-2", "WINDOWS-1250"],
250
+ alphabet="AĄBCĆDEĘFGHIJKLŁMNŃOÓPRSŚTUWYZŹŻaąbcćdeęfghijklłmnńoóprsśtuwyzźż",
251
+ wiki_start_pages=["Wikipedia:Strona_główna"],
252
+ ),
253
+ "Portuguese": Language(
254
+ name="Portuguese",
255
+ iso_code="pt",
256
+ use_ascii=True,
257
+ charsets=["ISO-8859-1", "ISO-8859-15", "WINDOWS-1252", "MacRoman"],
258
+ alphabet="ÁÂÃÀÇÉÊÍÓÔÕÚáâãàçéêíóôõú",
259
+ wiki_start_pages=["Wikipédia:Página_principal"],
260
+ ),
261
+ "Romanian": Language(
262
+ name="Romanian",
263
+ iso_code="ro",
264
+ use_ascii=True,
265
+ charsets=["ISO-8859-2", "WINDOWS-1250"],
266
+ alphabet="ăâîșțĂÂÎȘȚ",
267
+ wiki_start_pages=["Pagina_principală"],
268
+ ),
269
+ "Russian": Language(
270
+ name="Russian",
271
+ iso_code="ru",
272
+ use_ascii=False,
273
+ charsets=[
274
+ "ISO-8859-5",
275
+ "WINDOWS-1251",
276
+ "KOI8-R",
277
+ "MacCyrillic",
278
+ "IBM866",
279
+ "IBM855",
280
+ ],
281
+ alphabet="абвгдеёжзийклмнопрстуфхцчшщъыьэюяАБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯ",
282
+ wiki_start_pages=["Заглавная_страница"],
283
+ ),
284
+ "Slovak": Language(
285
+ name="Slovak",
286
+ iso_code="sk",
287
+ use_ascii=True,
288
+ charsets=["ISO-8859-2", "WINDOWS-1250"],
289
+ alphabet="áäčďéíĺľňóôŕšťúýžÁÄČĎÉÍĹĽŇÓÔŔŠŤÚÝŽ",
290
+ wiki_start_pages=["Hlavná_stránka"],
291
+ ),
292
+ "Slovene": Language(
293
+ name="Slovene",
294
+ iso_code="sl",
295
+ # Q, W, X, Y are only used for foreign words.
296
+ use_ascii=False,
297
+ charsets=["ISO-8859-2", "WINDOWS-1250"],
298
+ alphabet="abcčdefghijklmnoprsštuvzžABCČDEFGHIJKLMNOPRSŠTUVZŽ",
299
+ wiki_start_pages=["Glavna_stran"],
300
+ ),
301
+ # Serbian can be written in both Latin and Cyrillic, but there's no
302
+ # simple way to get the Latin alphabet pages from Wikipedia through
303
+ # the API, so for now we just support Cyrillic.
304
+ "Serbian": Language(
305
+ name="Serbian",
306
+ iso_code="sr",
307
+ alphabet="АБВГДЂЕЖЗИЈКЛЉМНЊОПРСТЋУФХЦЧЏШабвгдђежзијклљмнњопрстћуфхцчџш",
308
+ charsets=["ISO-8859-5", "WINDOWS-1251", "MacCyrillic", "IBM855"],
309
+ wiki_start_pages=["Главна_страна"],
310
+ ),
311
+ "Thai": Language(
312
+ name="Thai",
313
+ iso_code="th",
314
+ use_ascii=False,
315
+ charsets=["ISO-8859-11", "TIS-620", "CP874"],
316
+ alphabet="กขฃคฅฆงจฉชซฌญฎฏฐฑฒณดตถทธนบปผฝพฟภมยรฤลฦวศษสหฬอฮฯะัาำิีึืฺุู฿เแโใไๅๆ็่้๊๋์ํ๎๏๐๑๒๓๔๕๖๗๘๙๚๛",
317
+ wiki_start_pages=["หน้าหลัก"],
318
+ ),
319
+ "Turkish": Language(
320
+ name="Turkish",
321
+ iso_code="tr",
322
+ # Q, W, and X are not used by Turkish
323
+ use_ascii=False,
324
+ charsets=["ISO-8859-3", "ISO-8859-9", "WINDOWS-1254"],
325
+ alphabet="abcçdefgğhıijklmnoöprsştuüvyzâîûABCÇDEFGĞHIİJKLMNOÖPRSŞTUÜVYZÂÎÛ",
326
+ wiki_start_pages=["Ana_Sayfa"],
327
+ ),
328
+ "Vietnamese": Language(
329
+ name="Vietnamese",
330
+ iso_code="vi",
331
+ use_ascii=False,
332
+ # Windows-1258 is the only common 8-bit
333
+ # Vietnamese encoding supported by Python.
334
+ # From Wikipedia:
335
+ # For systems that lack support for Unicode,
336
+ # dozens of 8-bit Vietnamese code pages are
337
+ # available.[1] The most common are VISCII
338
+ # (TCVN 5712:1993), VPS, and Windows-1258.[3]
339
+ # Where ASCII is required, such as when
340
+ # ensuring readability in plain text e-mail,
341
+ # Vietnamese letters are often encoded
342
+ # according to Vietnamese Quoted-Readable
343
+ # (VIQR) or VSCII Mnemonic (VSCII-MNEM),[4]
344
+ # though usage of either variable-width
345
+ # scheme has declined dramatically following
346
+ # the adoption of Unicode on the World Wide
347
+ # Web.
348
+ charsets=["WINDOWS-1258"],
349
+ alphabet="aăâbcdđeêghiklmnoôơpqrstuưvxyAĂÂBCDĐEÊGHIKLMNOÔƠPQRSTUƯVXY",
350
+ wiki_start_pages=["Chữ_Quốc_ngữ"],
351
+ ),
352
+ }
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/sbcsgroupprober.py ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Universal charset detector code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 2001
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ # Shy Shalom - original C code
12
+ #
13
+ # This library is free software; you can redistribute it and/or
14
+ # modify it under the terms of the GNU Lesser General Public
15
+ # License as published by the Free Software Foundation; either
16
+ # version 2.1 of the License, or (at your option) any later version.
17
+ #
18
+ # This library is distributed in the hope that it will be useful,
19
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
20
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21
+ # Lesser General Public License for more details.
22
+ #
23
+ # You should have received a copy of the GNU Lesser General Public
24
+ # License along with this library; if not, write to the Free Software
25
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
26
+ # 02110-1301 USA
27
+ ######################### END LICENSE BLOCK #########################
28
+
29
+ from .charsetgroupprober import CharSetGroupProber
30
+ from .hebrewprober import HebrewProber
31
+ from .langbulgarianmodel import ISO_8859_5_BULGARIAN_MODEL, WINDOWS_1251_BULGARIAN_MODEL
32
+ from .langgreekmodel import ISO_8859_7_GREEK_MODEL, WINDOWS_1253_GREEK_MODEL
33
+ from .langhebrewmodel import WINDOWS_1255_HEBREW_MODEL
34
+
35
+ # from .langhungarianmodel import (ISO_8859_2_HUNGARIAN_MODEL,
36
+ # WINDOWS_1250_HUNGARIAN_MODEL)
37
+ from .langrussianmodel import (
38
+ IBM855_RUSSIAN_MODEL,
39
+ IBM866_RUSSIAN_MODEL,
40
+ ISO_8859_5_RUSSIAN_MODEL,
41
+ KOI8_R_RUSSIAN_MODEL,
42
+ MACCYRILLIC_RUSSIAN_MODEL,
43
+ WINDOWS_1251_RUSSIAN_MODEL,
44
+ )
45
+ from .langthaimodel import TIS_620_THAI_MODEL
46
+ from .langturkishmodel import ISO_8859_9_TURKISH_MODEL
47
+ from .sbcharsetprober import SingleByteCharSetProber
48
+
49
+
50
+ class SBCSGroupProber(CharSetGroupProber):
51
+ def __init__(self) -> None:
52
+ super().__init__()
53
+ hebrew_prober = HebrewProber()
54
+ logical_hebrew_prober = SingleByteCharSetProber(
55
+ WINDOWS_1255_HEBREW_MODEL, is_reversed=False, name_prober=hebrew_prober
56
+ )
57
+ # TODO: See if using ISO-8859-8 Hebrew model works better here, since
58
+ # it's actually the visual one
59
+ visual_hebrew_prober = SingleByteCharSetProber(
60
+ WINDOWS_1255_HEBREW_MODEL, is_reversed=True, name_prober=hebrew_prober
61
+ )
62
+ hebrew_prober.set_model_probers(logical_hebrew_prober, visual_hebrew_prober)
63
+ # TODO: ORDER MATTERS HERE. I changed the order vs what was in master
64
+ # and several tests failed that did not before. Some thought
65
+ # should be put into the ordering, and we should consider making
66
+ # order not matter here, because that is very counter-intuitive.
67
+ self.probers = [
68
+ SingleByteCharSetProber(WINDOWS_1251_RUSSIAN_MODEL),
69
+ SingleByteCharSetProber(KOI8_R_RUSSIAN_MODEL),
70
+ SingleByteCharSetProber(ISO_8859_5_RUSSIAN_MODEL),
71
+ SingleByteCharSetProber(MACCYRILLIC_RUSSIAN_MODEL),
72
+ SingleByteCharSetProber(IBM866_RUSSIAN_MODEL),
73
+ SingleByteCharSetProber(IBM855_RUSSIAN_MODEL),
74
+ SingleByteCharSetProber(ISO_8859_7_GREEK_MODEL),
75
+ SingleByteCharSetProber(WINDOWS_1253_GREEK_MODEL),
76
+ SingleByteCharSetProber(ISO_8859_5_BULGARIAN_MODEL),
77
+ SingleByteCharSetProber(WINDOWS_1251_BULGARIAN_MODEL),
78
+ # TODO: Restore Hungarian encodings (iso-8859-2 and windows-1250)
79
+ # after we retrain model.
80
+ # SingleByteCharSetProber(ISO_8859_2_HUNGARIAN_MODEL),
81
+ # SingleByteCharSetProber(WINDOWS_1250_HUNGARIAN_MODEL),
82
+ SingleByteCharSetProber(TIS_620_THAI_MODEL),
83
+ SingleByteCharSetProber(ISO_8859_9_TURKISH_MODEL),
84
+ hebrew_prober,
85
+ logical_hebrew_prober,
86
+ visual_hebrew_prober,
87
+ ]
88
+ self.reset()
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/universaldetector.py ADDED
@@ -0,0 +1,362 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ # The Original Code is Mozilla Universal charset detector code.
3
+ #
4
+ # The Initial Developer of the Original Code is
5
+ # Netscape Communications Corporation.
6
+ # Portions created by the Initial Developer are Copyright (C) 2001
7
+ # the Initial Developer. All Rights Reserved.
8
+ #
9
+ # Contributor(s):
10
+ # Mark Pilgrim - port to Python
11
+ # Shy Shalom - original C code
12
+ #
13
+ # This library is free software; you can redistribute it and/or
14
+ # modify it under the terms of the GNU Lesser General Public
15
+ # License as published by the Free Software Foundation; either
16
+ # version 2.1 of the License, or (at your option) any later version.
17
+ #
18
+ # This library is distributed in the hope that it will be useful,
19
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
20
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21
+ # Lesser General Public License for more details.
22
+ #
23
+ # You should have received a copy of the GNU Lesser General Public
24
+ # License along with this library; if not, write to the Free Software
25
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
26
+ # 02110-1301 USA
27
+ ######################### END LICENSE BLOCK #########################
28
+ """
29
+ Module containing the UniversalDetector detector class, which is the primary
30
+ class a user of ``chardet`` should use.
31
+
32
+ :author: Mark Pilgrim (initial port to Python)
33
+ :author: Shy Shalom (original C code)
34
+ :author: Dan Blanchard (major refactoring for 3.0)
35
+ :author: Ian Cordasco
36
+ """
37
+
38
+
39
+ import codecs
40
+ import logging
41
+ import re
42
+ from typing import List, Optional, Union
43
+
44
+ from .charsetgroupprober import CharSetGroupProber
45
+ from .charsetprober import CharSetProber
46
+ from .enums import InputState, LanguageFilter, ProbingState
47
+ from .escprober import EscCharSetProber
48
+ from .latin1prober import Latin1Prober
49
+ from .macromanprober import MacRomanProber
50
+ from .mbcsgroupprober import MBCSGroupProber
51
+ from .resultdict import ResultDict
52
+ from .sbcsgroupprober import SBCSGroupProber
53
+ from .utf1632prober import UTF1632Prober
54
+
55
+
56
+ class UniversalDetector:
57
+ """
58
+ The ``UniversalDetector`` class underlies the ``chardet.detect`` function
59
+ and coordinates all of the different charset probers.
60
+
61
+ To get a ``dict`` containing an encoding and its confidence, you can simply
62
+ run:
63
+
64
+ .. code::
65
+
66
+ u = UniversalDetector()
67
+ u.feed(some_bytes)
68
+ u.close()
69
+ detected = u.result
70
+
71
+ """
72
+
73
+ MINIMUM_THRESHOLD = 0.20
74
+ HIGH_BYTE_DETECTOR = re.compile(b"[\x80-\xFF]")
75
+ ESC_DETECTOR = re.compile(b"(\033|~{)")
76
+ WIN_BYTE_DETECTOR = re.compile(b"[\x80-\x9F]")
77
+ ISO_WIN_MAP = {
78
+ "iso-8859-1": "Windows-1252",
79
+ "iso-8859-2": "Windows-1250",
80
+ "iso-8859-5": "Windows-1251",
81
+ "iso-8859-6": "Windows-1256",
82
+ "iso-8859-7": "Windows-1253",
83
+ "iso-8859-8": "Windows-1255",
84
+ "iso-8859-9": "Windows-1254",
85
+ "iso-8859-13": "Windows-1257",
86
+ }
87
+ # Based on https://encoding.spec.whatwg.org/#names-and-labels
88
+ # but altered to match Python names for encodings and remove mappings
89
+ # that break tests.
90
+ LEGACY_MAP = {
91
+ "ascii": "Windows-1252",
92
+ "iso-8859-1": "Windows-1252",
93
+ "tis-620": "ISO-8859-11",
94
+ "iso-8859-9": "Windows-1254",
95
+ "gb2312": "GB18030",
96
+ "euc-kr": "CP949",
97
+ "utf-16le": "UTF-16",
98
+ }
99
+
100
+ def __init__(
101
+ self,
102
+ lang_filter: LanguageFilter = LanguageFilter.ALL,
103
+ should_rename_legacy: bool = False,
104
+ ) -> None:
105
+ self._esc_charset_prober: Optional[EscCharSetProber] = None
106
+ self._utf1632_prober: Optional[UTF1632Prober] = None
107
+ self._charset_probers: List[CharSetProber] = []
108
+ self.result: ResultDict = {
109
+ "encoding": None,
110
+ "confidence": 0.0,
111
+ "language": None,
112
+ }
113
+ self.done = False
114
+ self._got_data = False
115
+ self._input_state = InputState.PURE_ASCII
116
+ self._last_char = b""
117
+ self.lang_filter = lang_filter
118
+ self.logger = logging.getLogger(__name__)
119
+ self._has_win_bytes = False
120
+ self.should_rename_legacy = should_rename_legacy
121
+ self.reset()
122
+
123
+ @property
124
+ def input_state(self) -> int:
125
+ return self._input_state
126
+
127
+ @property
128
+ def has_win_bytes(self) -> bool:
129
+ return self._has_win_bytes
130
+
131
+ @property
132
+ def charset_probers(self) -> List[CharSetProber]:
133
+ return self._charset_probers
134
+
135
+ def reset(self) -> None:
136
+ """
137
+ Reset the UniversalDetector and all of its probers back to their
138
+ initial states. This is called by ``__init__``, so you only need to
139
+ call this directly in between analyses of different documents.
140
+ """
141
+ self.result = {"encoding": None, "confidence": 0.0, "language": None}
142
+ self.done = False
143
+ self._got_data = False
144
+ self._has_win_bytes = False
145
+ self._input_state = InputState.PURE_ASCII
146
+ self._last_char = b""
147
+ if self._esc_charset_prober:
148
+ self._esc_charset_prober.reset()
149
+ if self._utf1632_prober:
150
+ self._utf1632_prober.reset()
151
+ for prober in self._charset_probers:
152
+ prober.reset()
153
+
154
+ def feed(self, byte_str: Union[bytes, bytearray]) -> None:
155
+ """
156
+ Takes a chunk of a document and feeds it through all of the relevant
157
+ charset probers.
158
+
159
+ After calling ``feed``, you can check the value of the ``done``
160
+ attribute to see if you need to continue feeding the
161
+ ``UniversalDetector`` more data, or if it has made a prediction
162
+ (in the ``result`` attribute).
163
+
164
+ .. note::
165
+ You should always call ``close`` when you're done feeding in your
166
+ document if ``done`` is not already ``True``.
167
+ """
168
+ if self.done:
169
+ return
170
+
171
+ if not byte_str:
172
+ return
173
+
174
+ if not isinstance(byte_str, bytearray):
175
+ byte_str = bytearray(byte_str)
176
+
177
+ # First check for known BOMs, since these are guaranteed to be correct
178
+ if not self._got_data:
179
+ # If the data starts with BOM, we know it is UTF
180
+ if byte_str.startswith(codecs.BOM_UTF8):
181
+ # EF BB BF UTF-8 with BOM
182
+ self.result = {
183
+ "encoding": "UTF-8-SIG",
184
+ "confidence": 1.0,
185
+ "language": "",
186
+ }
187
+ elif byte_str.startswith((codecs.BOM_UTF32_LE, codecs.BOM_UTF32_BE)):
188
+ # FF FE 00 00 UTF-32, little-endian BOM
189
+ # 00 00 FE FF UTF-32, big-endian BOM
190
+ self.result = {"encoding": "UTF-32", "confidence": 1.0, "language": ""}
191
+ elif byte_str.startswith(b"\xFE\xFF\x00\x00"):
192
+ # FE FF 00 00 UCS-4, unusual octet order BOM (3412)
193
+ self.result = {
194
+ # TODO: This encoding is not supported by Python. Should remove?
195
+ "encoding": "X-ISO-10646-UCS-4-3412",
196
+ "confidence": 1.0,
197
+ "language": "",
198
+ }
199
+ elif byte_str.startswith(b"\x00\x00\xFF\xFE"):
200
+ # 00 00 FF FE UCS-4, unusual octet order BOM (2143)
201
+ self.result = {
202
+ # TODO: This encoding is not supported by Python. Should remove?
203
+ "encoding": "X-ISO-10646-UCS-4-2143",
204
+ "confidence": 1.0,
205
+ "language": "",
206
+ }
207
+ elif byte_str.startswith((codecs.BOM_LE, codecs.BOM_BE)):
208
+ # FF FE UTF-16, little endian BOM
209
+ # FE FF UTF-16, big endian BOM
210
+ self.result = {"encoding": "UTF-16", "confidence": 1.0, "language": ""}
211
+
212
+ self._got_data = True
213
+ if self.result["encoding"] is not None:
214
+ self.done = True
215
+ return
216
+
217
+ # If none of those matched and we've only see ASCII so far, check
218
+ # for high bytes and escape sequences
219
+ if self._input_state == InputState.PURE_ASCII:
220
+ if self.HIGH_BYTE_DETECTOR.search(byte_str):
221
+ self._input_state = InputState.HIGH_BYTE
222
+ elif (
223
+ self._input_state == InputState.PURE_ASCII
224
+ and self.ESC_DETECTOR.search(self._last_char + byte_str)
225
+ ):
226
+ self._input_state = InputState.ESC_ASCII
227
+
228
+ self._last_char = byte_str[-1:]
229
+
230
+ # next we will look to see if it is appears to be either a UTF-16 or
231
+ # UTF-32 encoding
232
+ if not self._utf1632_prober:
233
+ self._utf1632_prober = UTF1632Prober()
234
+
235
+ if self._utf1632_prober.state == ProbingState.DETECTING:
236
+ if self._utf1632_prober.feed(byte_str) == ProbingState.FOUND_IT:
237
+ self.result = {
238
+ "encoding": self._utf1632_prober.charset_name,
239
+ "confidence": self._utf1632_prober.get_confidence(),
240
+ "language": "",
241
+ }
242
+ self.done = True
243
+ return
244
+
245
+ # If we've seen escape sequences, use the EscCharSetProber, which
246
+ # uses a simple state machine to check for known escape sequences in
247
+ # HZ and ISO-2022 encodings, since those are the only encodings that
248
+ # use such sequences.
249
+ if self._input_state == InputState.ESC_ASCII:
250
+ if not self._esc_charset_prober:
251
+ self._esc_charset_prober = EscCharSetProber(self.lang_filter)
252
+ if self._esc_charset_prober.feed(byte_str) == ProbingState.FOUND_IT:
253
+ self.result = {
254
+ "encoding": self._esc_charset_prober.charset_name,
255
+ "confidence": self._esc_charset_prober.get_confidence(),
256
+ "language": self._esc_charset_prober.language,
257
+ }
258
+ self.done = True
259
+ # If we've seen high bytes (i.e., those with values greater than 127),
260
+ # we need to do more complicated checks using all our multi-byte and
261
+ # single-byte probers that are left. The single-byte probers
262
+ # use character bigram distributions to determine the encoding, whereas
263
+ # the multi-byte probers use a combination of character unigram and
264
+ # bigram distributions.
265
+ elif self._input_state == InputState.HIGH_BYTE:
266
+ if not self._charset_probers:
267
+ self._charset_probers = [MBCSGroupProber(self.lang_filter)]
268
+ # If we're checking non-CJK encodings, use single-byte prober
269
+ if self.lang_filter & LanguageFilter.NON_CJK:
270
+ self._charset_probers.append(SBCSGroupProber())
271
+ self._charset_probers.append(Latin1Prober())
272
+ self._charset_probers.append(MacRomanProber())
273
+ for prober in self._charset_probers:
274
+ if prober.feed(byte_str) == ProbingState.FOUND_IT:
275
+ self.result = {
276
+ "encoding": prober.charset_name,
277
+ "confidence": prober.get_confidence(),
278
+ "language": prober.language,
279
+ }
280
+ self.done = True
281
+ break
282
+ if self.WIN_BYTE_DETECTOR.search(byte_str):
283
+ self._has_win_bytes = True
284
+
285
+ def close(self) -> ResultDict:
286
+ """
287
+ Stop analyzing the current document and come up with a final
288
+ prediction.
289
+
290
+ :returns: The ``result`` attribute, a ``dict`` with the keys
291
+ `encoding`, `confidence`, and `language`.
292
+ """
293
+ # Don't bother with checks if we're already done
294
+ if self.done:
295
+ return self.result
296
+ self.done = True
297
+
298
+ if not self._got_data:
299
+ self.logger.debug("no data received!")
300
+
301
+ # Default to ASCII if it is all we've seen so far
302
+ elif self._input_state == InputState.PURE_ASCII:
303
+ self.result = {"encoding": "ascii", "confidence": 1.0, "language": ""}
304
+
305
+ # If we have seen non-ASCII, return the best that met MINIMUM_THRESHOLD
306
+ elif self._input_state == InputState.HIGH_BYTE:
307
+ prober_confidence = None
308
+ max_prober_confidence = 0.0
309
+ max_prober = None
310
+ for prober in self._charset_probers:
311
+ if not prober:
312
+ continue
313
+ prober_confidence = prober.get_confidence()
314
+ if prober_confidence > max_prober_confidence:
315
+ max_prober_confidence = prober_confidence
316
+ max_prober = prober
317
+ if max_prober and (max_prober_confidence > self.MINIMUM_THRESHOLD):
318
+ charset_name = max_prober.charset_name
319
+ assert charset_name is not None
320
+ lower_charset_name = charset_name.lower()
321
+ confidence = max_prober.get_confidence()
322
+ # Use Windows encoding name instead of ISO-8859 if we saw any
323
+ # extra Windows-specific bytes
324
+ if lower_charset_name.startswith("iso-8859"):
325
+ if self._has_win_bytes:
326
+ charset_name = self.ISO_WIN_MAP.get(
327
+ lower_charset_name, charset_name
328
+ )
329
+ # Rename legacy encodings with superset encodings if asked
330
+ if self.should_rename_legacy:
331
+ charset_name = self.LEGACY_MAP.get(
332
+ (charset_name or "").lower(), charset_name
333
+ )
334
+ self.result = {
335
+ "encoding": charset_name,
336
+ "confidence": confidence,
337
+ "language": max_prober.language,
338
+ }
339
+
340
+ # Log all prober confidences if none met MINIMUM_THRESHOLD
341
+ if self.logger.getEffectiveLevel() <= logging.DEBUG:
342
+ if self.result["encoding"] is None:
343
+ self.logger.debug("no probers hit minimum threshold")
344
+ for group_prober in self._charset_probers:
345
+ if not group_prober:
346
+ continue
347
+ if isinstance(group_prober, CharSetGroupProber):
348
+ for prober in group_prober.probers:
349
+ self.logger.debug(
350
+ "%s %s confidence = %s",
351
+ prober.charset_name,
352
+ prober.language,
353
+ prober.get_confidence(),
354
+ )
355
+ else:
356
+ self.logger.debug(
357
+ "%s %s confidence = %s",
358
+ group_prober.charset_name,
359
+ group_prober.language,
360
+ group_prober.get_confidence(),
361
+ )
362
+ return self.result
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/utf1632prober.py ADDED
@@ -0,0 +1,225 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ######################## BEGIN LICENSE BLOCK ########################
2
+ #
3
+ # Contributor(s):
4
+ # Jason Zavaglia
5
+ #
6
+ # This library is free software; you can redistribute it and/or
7
+ # modify it under the terms of the GNU Lesser General Public
8
+ # License as published by the Free Software Foundation; either
9
+ # version 2.1 of the License, or (at your option) any later version.
10
+ #
11
+ # This library is distributed in the hope that it will be useful,
12
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
13
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14
+ # Lesser General Public License for more details.
15
+ #
16
+ # You should have received a copy of the GNU Lesser General Public
17
+ # License along with this library; if not, write to the Free Software
18
+ # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
19
+ # 02110-1301 USA
20
+ ######################### END LICENSE BLOCK #########################
21
+ from typing import List, Union
22
+
23
+ from .charsetprober import CharSetProber
24
+ from .enums import ProbingState
25
+
26
+
27
+ class UTF1632Prober(CharSetProber):
28
+ """
29
+ This class simply looks for occurrences of zero bytes, and infers
30
+ whether the file is UTF16 or UTF32 (low-endian or big-endian)
31
+ For instance, files looking like ( \0 \0 \0 [nonzero] )+
32
+ have a good probability to be UTF32BE. Files looking like ( \0 [nonzero] )+
33
+ may be guessed to be UTF16BE, and inversely for little-endian varieties.
34
+ """
35
+
36
+ # how many logical characters to scan before feeling confident of prediction
37
+ MIN_CHARS_FOR_DETECTION = 20
38
+ # a fixed constant ratio of expected zeros or non-zeros in modulo-position.
39
+ EXPECTED_RATIO = 0.94
40
+
41
+ def __init__(self) -> None:
42
+ super().__init__()
43
+ self.position = 0
44
+ self.zeros_at_mod = [0] * 4
45
+ self.nonzeros_at_mod = [0] * 4
46
+ self._state = ProbingState.DETECTING
47
+ self.quad = [0, 0, 0, 0]
48
+ self.invalid_utf16be = False
49
+ self.invalid_utf16le = False
50
+ self.invalid_utf32be = False
51
+ self.invalid_utf32le = False
52
+ self.first_half_surrogate_pair_detected_16be = False
53
+ self.first_half_surrogate_pair_detected_16le = False
54
+ self.reset()
55
+
56
+ def reset(self) -> None:
57
+ super().reset()
58
+ self.position = 0
59
+ self.zeros_at_mod = [0] * 4
60
+ self.nonzeros_at_mod = [0] * 4
61
+ self._state = ProbingState.DETECTING
62
+ self.invalid_utf16be = False
63
+ self.invalid_utf16le = False
64
+ self.invalid_utf32be = False
65
+ self.invalid_utf32le = False
66
+ self.first_half_surrogate_pair_detected_16be = False
67
+ self.first_half_surrogate_pair_detected_16le = False
68
+ self.quad = [0, 0, 0, 0]
69
+
70
+ @property
71
+ def charset_name(self) -> str:
72
+ if self.is_likely_utf32be():
73
+ return "utf-32be"
74
+ if self.is_likely_utf32le():
75
+ return "utf-32le"
76
+ if self.is_likely_utf16be():
77
+ return "utf-16be"
78
+ if self.is_likely_utf16le():
79
+ return "utf-16le"
80
+ # default to something valid
81
+ return "utf-16"
82
+
83
+ @property
84
+ def language(self) -> str:
85
+ return ""
86
+
87
+ def approx_32bit_chars(self) -> float:
88
+ return max(1.0, self.position / 4.0)
89
+
90
+ def approx_16bit_chars(self) -> float:
91
+ return max(1.0, self.position / 2.0)
92
+
93
+ def is_likely_utf32be(self) -> bool:
94
+ approx_chars = self.approx_32bit_chars()
95
+ return approx_chars >= self.MIN_CHARS_FOR_DETECTION and (
96
+ self.zeros_at_mod[0] / approx_chars > self.EXPECTED_RATIO
97
+ and self.zeros_at_mod[1] / approx_chars > self.EXPECTED_RATIO
98
+ and self.zeros_at_mod[2] / approx_chars > self.EXPECTED_RATIO
99
+ and self.nonzeros_at_mod[3] / approx_chars > self.EXPECTED_RATIO
100
+ and not self.invalid_utf32be
101
+ )
102
+
103
+ def is_likely_utf32le(self) -> bool:
104
+ approx_chars = self.approx_32bit_chars()
105
+ return approx_chars >= self.MIN_CHARS_FOR_DETECTION and (
106
+ self.nonzeros_at_mod[0] / approx_chars > self.EXPECTED_RATIO
107
+ and self.zeros_at_mod[1] / approx_chars > self.EXPECTED_RATIO
108
+ and self.zeros_at_mod[2] / approx_chars > self.EXPECTED_RATIO
109
+ and self.zeros_at_mod[3] / approx_chars > self.EXPECTED_RATIO
110
+ and not self.invalid_utf32le
111
+ )
112
+
113
+ def is_likely_utf16be(self) -> bool:
114
+ approx_chars = self.approx_16bit_chars()
115
+ return approx_chars >= self.MIN_CHARS_FOR_DETECTION and (
116
+ (self.nonzeros_at_mod[1] + self.nonzeros_at_mod[3]) / approx_chars
117
+ > self.EXPECTED_RATIO
118
+ and (self.zeros_at_mod[0] + self.zeros_at_mod[2]) / approx_chars
119
+ > self.EXPECTED_RATIO
120
+ and not self.invalid_utf16be
121
+ )
122
+
123
+ def is_likely_utf16le(self) -> bool:
124
+ approx_chars = self.approx_16bit_chars()
125
+ return approx_chars >= self.MIN_CHARS_FOR_DETECTION and (
126
+ (self.nonzeros_at_mod[0] + self.nonzeros_at_mod[2]) / approx_chars
127
+ > self.EXPECTED_RATIO
128
+ and (self.zeros_at_mod[1] + self.zeros_at_mod[3]) / approx_chars
129
+ > self.EXPECTED_RATIO
130
+ and not self.invalid_utf16le
131
+ )
132
+
133
+ def validate_utf32_characters(self, quad: List[int]) -> None:
134
+ """
135
+ Validate if the quad of bytes is valid UTF-32.
136
+
137
+ UTF-32 is valid in the range 0x00000000 - 0x0010FFFF
138
+ excluding 0x0000D800 - 0x0000DFFF
139
+
140
+ https://en.wikipedia.org/wiki/UTF-32
141
+ """
142
+ if (
143
+ quad[0] != 0
144
+ or quad[1] > 0x10
145
+ or (quad[0] == 0 and quad[1] == 0 and 0xD8 <= quad[2] <= 0xDF)
146
+ ):
147
+ self.invalid_utf32be = True
148
+ if (
149
+ quad[3] != 0
150
+ or quad[2] > 0x10
151
+ or (quad[3] == 0 and quad[2] == 0 and 0xD8 <= quad[1] <= 0xDF)
152
+ ):
153
+ self.invalid_utf32le = True
154
+
155
+ def validate_utf16_characters(self, pair: List[int]) -> None:
156
+ """
157
+ Validate if the pair of bytes is valid UTF-16.
158
+
159
+ UTF-16 is valid in the range 0x0000 - 0xFFFF excluding 0xD800 - 0xFFFF
160
+ with an exception for surrogate pairs, which must be in the range
161
+ 0xD800-0xDBFF followed by 0xDC00-0xDFFF
162
+
163
+ https://en.wikipedia.org/wiki/UTF-16
164
+ """
165
+ if not self.first_half_surrogate_pair_detected_16be:
166
+ if 0xD8 <= pair[0] <= 0xDB:
167
+ self.first_half_surrogate_pair_detected_16be = True
168
+ elif 0xDC <= pair[0] <= 0xDF:
169
+ self.invalid_utf16be = True
170
+ else:
171
+ if 0xDC <= pair[0] <= 0xDF:
172
+ self.first_half_surrogate_pair_detected_16be = False
173
+ else:
174
+ self.invalid_utf16be = True
175
+
176
+ if not self.first_half_surrogate_pair_detected_16le:
177
+ if 0xD8 <= pair[1] <= 0xDB:
178
+ self.first_half_surrogate_pair_detected_16le = True
179
+ elif 0xDC <= pair[1] <= 0xDF:
180
+ self.invalid_utf16le = True
181
+ else:
182
+ if 0xDC <= pair[1] <= 0xDF:
183
+ self.first_half_surrogate_pair_detected_16le = False
184
+ else:
185
+ self.invalid_utf16le = True
186
+
187
+ def feed(self, byte_str: Union[bytes, bytearray]) -> ProbingState:
188
+ for c in byte_str:
189
+ mod4 = self.position % 4
190
+ self.quad[mod4] = c
191
+ if mod4 == 3:
192
+ self.validate_utf32_characters(self.quad)
193
+ self.validate_utf16_characters(self.quad[0:2])
194
+ self.validate_utf16_characters(self.quad[2:4])
195
+ if c == 0:
196
+ self.zeros_at_mod[mod4] += 1
197
+ else:
198
+ self.nonzeros_at_mod[mod4] += 1
199
+ self.position += 1
200
+ return self.state
201
+
202
+ @property
203
+ def state(self) -> ProbingState:
204
+ if self._state in {ProbingState.NOT_ME, ProbingState.FOUND_IT}:
205
+ # terminal, decided states
206
+ return self._state
207
+ if self.get_confidence() > 0.80:
208
+ self._state = ProbingState.FOUND_IT
209
+ elif self.position > 4 * 1024:
210
+ # if we get to 4kb into the file, and we can't conclude it's UTF,
211
+ # let's give up
212
+ self._state = ProbingState.NOT_ME
213
+ return self._state
214
+
215
+ def get_confidence(self) -> float:
216
+ return (
217
+ 0.85
218
+ if (
219
+ self.is_likely_utf16le()
220
+ or self.is_likely_utf16be()
221
+ or self.is_likely_utf32le()
222
+ or self.is_likely_utf32be()
223
+ )
224
+ else 0.00
225
+ )
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/chardet/version.py ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ This module exists only to simplify retrieving the version number of chardet
3
+ from within setuptools and from chardet subpackages.
4
+
5
+ :author: Dan Blanchard (dan.blanchard@gmail.com)
6
+ """
7
+
8
+ __version__ = "5.1.0"
9
+ VERSION = __version__.split(".")
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/__init__.py ADDED
@@ -0,0 +1,566 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Utilities for determining application-specific dirs. See <https://github.com/platformdirs/platformdirs> for details and
3
+ usage.
4
+ """
5
+ from __future__ import annotations
6
+
7
+ import os
8
+ import sys
9
+ from typing import TYPE_CHECKING
10
+
11
+ from .api import PlatformDirsABC
12
+ from .version import __version__
13
+ from .version import __version_tuple__ as __version_info__
14
+
15
+ if TYPE_CHECKING:
16
+ from pathlib import Path
17
+
18
+ if sys.version_info >= (3, 8): # pragma: no cover (py38+)
19
+ from typing import Literal
20
+ else: # pragma: no cover (py38+)
21
+ from pip._vendor.typing_extensions import Literal
22
+
23
+
24
+ def _set_platform_dir_class() -> type[PlatformDirsABC]:
25
+ if sys.platform == "win32":
26
+ from pip._vendor.platformdirs.windows import Windows as Result
27
+ elif sys.platform == "darwin":
28
+ from pip._vendor.platformdirs.macos import MacOS as Result
29
+ else:
30
+ from pip._vendor.platformdirs.unix import Unix as Result
31
+
32
+ if os.getenv("ANDROID_DATA") == "/data" and os.getenv("ANDROID_ROOT") == "/system":
33
+ if os.getenv("SHELL") or os.getenv("PREFIX"):
34
+ return Result
35
+
36
+ from pip._vendor.platformdirs.android import _android_folder
37
+
38
+ if _android_folder() is not None:
39
+ from pip._vendor.platformdirs.android import Android
40
+
41
+ return Android # return to avoid redefinition of result
42
+
43
+ return Result
44
+
45
+
46
+ PlatformDirs = _set_platform_dir_class() #: Currently active platform
47
+ AppDirs = PlatformDirs #: Backwards compatibility with appdirs
48
+
49
+
50
+ def user_data_dir(
51
+ appname: str | None = None,
52
+ appauthor: str | None | Literal[False] = None,
53
+ version: str | None = None,
54
+ roaming: bool = False, # noqa: FBT001, FBT002
55
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
56
+ ) -> str:
57
+ """
58
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
59
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
60
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
61
+ :param roaming: See `roaming <platformdirs.api.PlatformDirsABC.roaming>`.
62
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
63
+ :returns: data directory tied to the user
64
+ """
65
+ return PlatformDirs(
66
+ appname=appname,
67
+ appauthor=appauthor,
68
+ version=version,
69
+ roaming=roaming,
70
+ ensure_exists=ensure_exists,
71
+ ).user_data_dir
72
+
73
+
74
+ def site_data_dir(
75
+ appname: str | None = None,
76
+ appauthor: str | None | Literal[False] = None,
77
+ version: str | None = None,
78
+ multipath: bool = False, # noqa: FBT001, FBT002
79
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
80
+ ) -> str:
81
+ """
82
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
83
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
84
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
85
+ :param multipath: See `roaming <platformdirs.api.PlatformDirsABC.multipath>`.
86
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
87
+ :returns: data directory shared by users
88
+ """
89
+ return PlatformDirs(
90
+ appname=appname,
91
+ appauthor=appauthor,
92
+ version=version,
93
+ multipath=multipath,
94
+ ensure_exists=ensure_exists,
95
+ ).site_data_dir
96
+
97
+
98
+ def user_config_dir(
99
+ appname: str | None = None,
100
+ appauthor: str | None | Literal[False] = None,
101
+ version: str | None = None,
102
+ roaming: bool = False, # noqa: FBT001, FBT002
103
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
104
+ ) -> str:
105
+ """
106
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
107
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
108
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
109
+ :param roaming: See `roaming <platformdirs.api.PlatformDirsABC.roaming>`.
110
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
111
+ :returns: config directory tied to the user
112
+ """
113
+ return PlatformDirs(
114
+ appname=appname,
115
+ appauthor=appauthor,
116
+ version=version,
117
+ roaming=roaming,
118
+ ensure_exists=ensure_exists,
119
+ ).user_config_dir
120
+
121
+
122
+ def site_config_dir(
123
+ appname: str | None = None,
124
+ appauthor: str | None | Literal[False] = None,
125
+ version: str | None = None,
126
+ multipath: bool = False, # noqa: FBT001, FBT002
127
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
128
+ ) -> str:
129
+ """
130
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
131
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
132
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
133
+ :param multipath: See `roaming <platformdirs.api.PlatformDirsABC.multipath>`.
134
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
135
+ :returns: config directory shared by the users
136
+ """
137
+ return PlatformDirs(
138
+ appname=appname,
139
+ appauthor=appauthor,
140
+ version=version,
141
+ multipath=multipath,
142
+ ensure_exists=ensure_exists,
143
+ ).site_config_dir
144
+
145
+
146
+ def user_cache_dir(
147
+ appname: str | None = None,
148
+ appauthor: str | None | Literal[False] = None,
149
+ version: str | None = None,
150
+ opinion: bool = True, # noqa: FBT001, FBT002
151
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
152
+ ) -> str:
153
+ """
154
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
155
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
156
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
157
+ :param opinion: See `roaming <platformdirs.api.PlatformDirsABC.opinion>`.
158
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
159
+ :returns: cache directory tied to the user
160
+ """
161
+ return PlatformDirs(
162
+ appname=appname,
163
+ appauthor=appauthor,
164
+ version=version,
165
+ opinion=opinion,
166
+ ensure_exists=ensure_exists,
167
+ ).user_cache_dir
168
+
169
+
170
+ def site_cache_dir(
171
+ appname: str | None = None,
172
+ appauthor: str | None | Literal[False] = None,
173
+ version: str | None = None,
174
+ opinion: bool = True, # noqa: FBT001, FBT002
175
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
176
+ ) -> str:
177
+ """
178
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
179
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
180
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
181
+ :param opinion: See `opinion <platformdirs.api.PlatformDirsABC.opinion>`.
182
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
183
+ :returns: cache directory tied to the user
184
+ """
185
+ return PlatformDirs(
186
+ appname=appname,
187
+ appauthor=appauthor,
188
+ version=version,
189
+ opinion=opinion,
190
+ ensure_exists=ensure_exists,
191
+ ).site_cache_dir
192
+
193
+
194
+ def user_state_dir(
195
+ appname: str | None = None,
196
+ appauthor: str | None | Literal[False] = None,
197
+ version: str | None = None,
198
+ roaming: bool = False, # noqa: FBT001, FBT002
199
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
200
+ ) -> str:
201
+ """
202
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
203
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
204
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
205
+ :param roaming: See `roaming <platformdirs.api.PlatformDirsABC.roaming>`.
206
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
207
+ :returns: state directory tied to the user
208
+ """
209
+ return PlatformDirs(
210
+ appname=appname,
211
+ appauthor=appauthor,
212
+ version=version,
213
+ roaming=roaming,
214
+ ensure_exists=ensure_exists,
215
+ ).user_state_dir
216
+
217
+
218
+ def user_log_dir(
219
+ appname: str | None = None,
220
+ appauthor: str | None | Literal[False] = None,
221
+ version: str | None = None,
222
+ opinion: bool = True, # noqa: FBT001, FBT002
223
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
224
+ ) -> str:
225
+ """
226
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
227
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
228
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
229
+ :param opinion: See `roaming <platformdirs.api.PlatformDirsABC.opinion>`.
230
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
231
+ :returns: log directory tied to the user
232
+ """
233
+ return PlatformDirs(
234
+ appname=appname,
235
+ appauthor=appauthor,
236
+ version=version,
237
+ opinion=opinion,
238
+ ensure_exists=ensure_exists,
239
+ ).user_log_dir
240
+
241
+
242
+ def user_documents_dir() -> str:
243
+ """:returns: documents directory tied to the user"""
244
+ return PlatformDirs().user_documents_dir
245
+
246
+
247
+ def user_downloads_dir() -> str:
248
+ """:returns: downloads directory tied to the user"""
249
+ return PlatformDirs().user_downloads_dir
250
+
251
+
252
+ def user_pictures_dir() -> str:
253
+ """:returns: pictures directory tied to the user"""
254
+ return PlatformDirs().user_pictures_dir
255
+
256
+
257
+ def user_videos_dir() -> str:
258
+ """:returns: videos directory tied to the user"""
259
+ return PlatformDirs().user_videos_dir
260
+
261
+
262
+ def user_music_dir() -> str:
263
+ """:returns: music directory tied to the user"""
264
+ return PlatformDirs().user_music_dir
265
+
266
+
267
+ def user_runtime_dir(
268
+ appname: str | None = None,
269
+ appauthor: str | None | Literal[False] = None,
270
+ version: str | None = None,
271
+ opinion: bool = True, # noqa: FBT001, FBT002
272
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
273
+ ) -> str:
274
+ """
275
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
276
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
277
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
278
+ :param opinion: See `opinion <platformdirs.api.PlatformDirsABC.opinion>`.
279
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
280
+ :returns: runtime directory tied to the user
281
+ """
282
+ return PlatformDirs(
283
+ appname=appname,
284
+ appauthor=appauthor,
285
+ version=version,
286
+ opinion=opinion,
287
+ ensure_exists=ensure_exists,
288
+ ).user_runtime_dir
289
+
290
+
291
+ def user_data_path(
292
+ appname: str | None = None,
293
+ appauthor: str | None | Literal[False] = None,
294
+ version: str | None = None,
295
+ roaming: bool = False, # noqa: FBT001, FBT002
296
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
297
+ ) -> Path:
298
+ """
299
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
300
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
301
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
302
+ :param roaming: See `roaming <platformdirs.api.PlatformDirsABC.roaming>`.
303
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
304
+ :returns: data path tied to the user
305
+ """
306
+ return PlatformDirs(
307
+ appname=appname,
308
+ appauthor=appauthor,
309
+ version=version,
310
+ roaming=roaming,
311
+ ensure_exists=ensure_exists,
312
+ ).user_data_path
313
+
314
+
315
+ def site_data_path(
316
+ appname: str | None = None,
317
+ appauthor: str | None | Literal[False] = None,
318
+ version: str | None = None,
319
+ multipath: bool = False, # noqa: FBT001, FBT002
320
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
321
+ ) -> Path:
322
+ """
323
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
324
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
325
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
326
+ :param multipath: See `multipath <platformdirs.api.PlatformDirsABC.multipath>`.
327
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
328
+ :returns: data path shared by users
329
+ """
330
+ return PlatformDirs(
331
+ appname=appname,
332
+ appauthor=appauthor,
333
+ version=version,
334
+ multipath=multipath,
335
+ ensure_exists=ensure_exists,
336
+ ).site_data_path
337
+
338
+
339
+ def user_config_path(
340
+ appname: str | None = None,
341
+ appauthor: str | None | Literal[False] = None,
342
+ version: str | None = None,
343
+ roaming: bool = False, # noqa: FBT001, FBT002
344
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
345
+ ) -> Path:
346
+ """
347
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
348
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
349
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
350
+ :param roaming: See `roaming <platformdirs.api.PlatformDirsABC.roaming>`.
351
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
352
+ :returns: config path tied to the user
353
+ """
354
+ return PlatformDirs(
355
+ appname=appname,
356
+ appauthor=appauthor,
357
+ version=version,
358
+ roaming=roaming,
359
+ ensure_exists=ensure_exists,
360
+ ).user_config_path
361
+
362
+
363
+ def site_config_path(
364
+ appname: str | None = None,
365
+ appauthor: str | None | Literal[False] = None,
366
+ version: str | None = None,
367
+ multipath: bool = False, # noqa: FBT001, FBT002
368
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
369
+ ) -> Path:
370
+ """
371
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
372
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
373
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
374
+ :param multipath: See `roaming <platformdirs.api.PlatformDirsABC.multipath>`.
375
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
376
+ :returns: config path shared by the users
377
+ """
378
+ return PlatformDirs(
379
+ appname=appname,
380
+ appauthor=appauthor,
381
+ version=version,
382
+ multipath=multipath,
383
+ ensure_exists=ensure_exists,
384
+ ).site_config_path
385
+
386
+
387
+ def site_cache_path(
388
+ appname: str | None = None,
389
+ appauthor: str | None | Literal[False] = None,
390
+ version: str | None = None,
391
+ opinion: bool = True, # noqa: FBT001, FBT002
392
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
393
+ ) -> Path:
394
+ """
395
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
396
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
397
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
398
+ :param opinion: See `opinion <platformdirs.api.PlatformDirsABC.opinion>`.
399
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
400
+ :returns: cache directory tied to the user
401
+ """
402
+ return PlatformDirs(
403
+ appname=appname,
404
+ appauthor=appauthor,
405
+ version=version,
406
+ opinion=opinion,
407
+ ensure_exists=ensure_exists,
408
+ ).site_cache_path
409
+
410
+
411
+ def user_cache_path(
412
+ appname: str | None = None,
413
+ appauthor: str | None | Literal[False] = None,
414
+ version: str | None = None,
415
+ opinion: bool = True, # noqa: FBT001, FBT002
416
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
417
+ ) -> Path:
418
+ """
419
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
420
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
421
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
422
+ :param opinion: See `roaming <platformdirs.api.PlatformDirsABC.opinion>`.
423
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
424
+ :returns: cache path tied to the user
425
+ """
426
+ return PlatformDirs(
427
+ appname=appname,
428
+ appauthor=appauthor,
429
+ version=version,
430
+ opinion=opinion,
431
+ ensure_exists=ensure_exists,
432
+ ).user_cache_path
433
+
434
+
435
+ def user_state_path(
436
+ appname: str | None = None,
437
+ appauthor: str | None | Literal[False] = None,
438
+ version: str | None = None,
439
+ roaming: bool = False, # noqa: FBT001, FBT002
440
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
441
+ ) -> Path:
442
+ """
443
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
444
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
445
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
446
+ :param roaming: See `roaming <platformdirs.api.PlatformDirsABC.roaming>`.
447
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
448
+ :returns: state path tied to the user
449
+ """
450
+ return PlatformDirs(
451
+ appname=appname,
452
+ appauthor=appauthor,
453
+ version=version,
454
+ roaming=roaming,
455
+ ensure_exists=ensure_exists,
456
+ ).user_state_path
457
+
458
+
459
+ def user_log_path(
460
+ appname: str | None = None,
461
+ appauthor: str | None | Literal[False] = None,
462
+ version: str | None = None,
463
+ opinion: bool = True, # noqa: FBT001, FBT002
464
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
465
+ ) -> Path:
466
+ """
467
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
468
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
469
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
470
+ :param opinion: See `roaming <platformdirs.api.PlatformDirsABC.opinion>`.
471
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
472
+ :returns: log path tied to the user
473
+ """
474
+ return PlatformDirs(
475
+ appname=appname,
476
+ appauthor=appauthor,
477
+ version=version,
478
+ opinion=opinion,
479
+ ensure_exists=ensure_exists,
480
+ ).user_log_path
481
+
482
+
483
+ def user_documents_path() -> Path:
484
+ """:returns: documents path tied to the user"""
485
+ return PlatformDirs().user_documents_path
486
+
487
+
488
+ def user_downloads_path() -> Path:
489
+ """:returns: downloads path tied to the user"""
490
+ return PlatformDirs().user_downloads_path
491
+
492
+
493
+ def user_pictures_path() -> Path:
494
+ """:returns: pictures path tied to the user"""
495
+ return PlatformDirs().user_pictures_path
496
+
497
+
498
+ def user_videos_path() -> Path:
499
+ """:returns: videos path tied to the user"""
500
+ return PlatformDirs().user_videos_path
501
+
502
+
503
+ def user_music_path() -> Path:
504
+ """:returns: music path tied to the user"""
505
+ return PlatformDirs().user_music_path
506
+
507
+
508
+ def user_runtime_path(
509
+ appname: str | None = None,
510
+ appauthor: str | None | Literal[False] = None,
511
+ version: str | None = None,
512
+ opinion: bool = True, # noqa: FBT001, FBT002
513
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
514
+ ) -> Path:
515
+ """
516
+ :param appname: See `appname <platformdirs.api.PlatformDirsABC.appname>`.
517
+ :param appauthor: See `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`.
518
+ :param version: See `version <platformdirs.api.PlatformDirsABC.version>`.
519
+ :param opinion: See `opinion <platformdirs.api.PlatformDirsABC.opinion>`.
520
+ :param ensure_exists: See `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
521
+ :returns: runtime path tied to the user
522
+ """
523
+ return PlatformDirs(
524
+ appname=appname,
525
+ appauthor=appauthor,
526
+ version=version,
527
+ opinion=opinion,
528
+ ensure_exists=ensure_exists,
529
+ ).user_runtime_path
530
+
531
+
532
+ __all__ = [
533
+ "__version__",
534
+ "__version_info__",
535
+ "PlatformDirs",
536
+ "AppDirs",
537
+ "PlatformDirsABC",
538
+ "user_data_dir",
539
+ "user_config_dir",
540
+ "user_cache_dir",
541
+ "user_state_dir",
542
+ "user_log_dir",
543
+ "user_documents_dir",
544
+ "user_downloads_dir",
545
+ "user_pictures_dir",
546
+ "user_videos_dir",
547
+ "user_music_dir",
548
+ "user_runtime_dir",
549
+ "site_data_dir",
550
+ "site_config_dir",
551
+ "site_cache_dir",
552
+ "user_data_path",
553
+ "user_config_path",
554
+ "user_cache_path",
555
+ "user_state_path",
556
+ "user_log_path",
557
+ "user_documents_path",
558
+ "user_downloads_path",
559
+ "user_pictures_path",
560
+ "user_videos_path",
561
+ "user_music_path",
562
+ "user_runtime_path",
563
+ "site_data_path",
564
+ "site_config_path",
565
+ "site_cache_path",
566
+ ]
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/__main__.py ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Main entry point."""
2
+ from __future__ import annotations
3
+
4
+ from pip._vendor.platformdirs import PlatformDirs, __version__
5
+
6
+ PROPS = (
7
+ "user_data_dir",
8
+ "user_config_dir",
9
+ "user_cache_dir",
10
+ "user_state_dir",
11
+ "user_log_dir",
12
+ "user_documents_dir",
13
+ "user_downloads_dir",
14
+ "user_pictures_dir",
15
+ "user_videos_dir",
16
+ "user_music_dir",
17
+ "user_runtime_dir",
18
+ "site_data_dir",
19
+ "site_config_dir",
20
+ "site_cache_dir",
21
+ )
22
+
23
+
24
+ def main() -> None:
25
+ """Run main entry point."""
26
+ app_name = "MyApp"
27
+ app_author = "MyCompany"
28
+
29
+ print(f"-- platformdirs {__version__} --") # noqa: T201
30
+
31
+ print("-- app dirs (with optional 'version')") # noqa: T201
32
+ dirs = PlatformDirs(app_name, app_author, version="1.0")
33
+ for prop in PROPS:
34
+ print(f"{prop}: {getattr(dirs, prop)}") # noqa: T201
35
+
36
+ print("\n-- app dirs (without optional 'version')") # noqa: T201
37
+ dirs = PlatformDirs(app_name, app_author)
38
+ for prop in PROPS:
39
+ print(f"{prop}: {getattr(dirs, prop)}") # noqa: T201
40
+
41
+ print("\n-- app dirs (without optional 'appauthor')") # noqa: T201
42
+ dirs = PlatformDirs(app_name)
43
+ for prop in PROPS:
44
+ print(f"{prop}: {getattr(dirs, prop)}") # noqa: T201
45
+
46
+ print("\n-- app dirs (with disabled 'appauthor')") # noqa: T201
47
+ dirs = PlatformDirs(app_name, appauthor=False)
48
+ for prop in PROPS:
49
+ print(f"{prop}: {getattr(dirs, prop)}") # noqa: T201
50
+
51
+
52
+ if __name__ == "__main__":
53
+ main()
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/android.py ADDED
@@ -0,0 +1,210 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Android."""
2
+ from __future__ import annotations
3
+
4
+ import os
5
+ import re
6
+ import sys
7
+ from functools import lru_cache
8
+ from typing import cast
9
+
10
+ from .api import PlatformDirsABC
11
+
12
+
13
+ class Android(PlatformDirsABC):
14
+ """
15
+ Follows the guidance `from here <https://android.stackexchange.com/a/216132>`_. Makes use of the
16
+ `appname <platformdirs.api.PlatformDirsABC.appname>`,
17
+ `version <platformdirs.api.PlatformDirsABC.version>`,
18
+ `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
19
+ """
20
+
21
+ @property
22
+ def user_data_dir(self) -> str:
23
+ """:return: data directory tied to the user, e.g. ``/data/user/<userid>/<packagename>/files/<AppName>``"""
24
+ return self._append_app_name_and_version(cast(str, _android_folder()), "files")
25
+
26
+ @property
27
+ def site_data_dir(self) -> str:
28
+ """:return: data directory shared by users, same as `user_data_dir`"""
29
+ return self.user_data_dir
30
+
31
+ @property
32
+ def user_config_dir(self) -> str:
33
+ """
34
+ :return: config directory tied to the user, e.g. \
35
+ ``/data/user/<userid>/<packagename>/shared_prefs/<AppName>``
36
+ """
37
+ return self._append_app_name_and_version(cast(str, _android_folder()), "shared_prefs")
38
+
39
+ @property
40
+ def site_config_dir(self) -> str:
41
+ """:return: config directory shared by the users, same as `user_config_dir`"""
42
+ return self.user_config_dir
43
+
44
+ @property
45
+ def user_cache_dir(self) -> str:
46
+ """:return: cache directory tied to the user, e.g. e.g. ``/data/user/<userid>/<packagename>/cache/<AppName>``"""
47
+ return self._append_app_name_and_version(cast(str, _android_folder()), "cache")
48
+
49
+ @property
50
+ def site_cache_dir(self) -> str:
51
+ """:return: cache directory shared by users, same as `user_cache_dir`"""
52
+ return self.user_cache_dir
53
+
54
+ @property
55
+ def user_state_dir(self) -> str:
56
+ """:return: state directory tied to the user, same as `user_data_dir`"""
57
+ return self.user_data_dir
58
+
59
+ @property
60
+ def user_log_dir(self) -> str:
61
+ """
62
+ :return: log directory tied to the user, same as `user_cache_dir` if not opinionated else ``log`` in it,
63
+ e.g. ``/data/user/<userid>/<packagename>/cache/<AppName>/log``
64
+ """
65
+ path = self.user_cache_dir
66
+ if self.opinion:
67
+ path = os.path.join(path, "log") # noqa: PTH118
68
+ return path
69
+
70
+ @property
71
+ def user_documents_dir(self) -> str:
72
+ """:return: documents directory tied to the user e.g. ``/storage/emulated/0/Documents``"""
73
+ return _android_documents_folder()
74
+
75
+ @property
76
+ def user_downloads_dir(self) -> str:
77
+ """:return: downloads directory tied to the user e.g. ``/storage/emulated/0/Downloads``"""
78
+ return _android_downloads_folder()
79
+
80
+ @property
81
+ def user_pictures_dir(self) -> str:
82
+ """:return: pictures directory tied to the user e.g. ``/storage/emulated/0/Pictures``"""
83
+ return _android_pictures_folder()
84
+
85
+ @property
86
+ def user_videos_dir(self) -> str:
87
+ """:return: videos directory tied to the user e.g. ``/storage/emulated/0/DCIM/Camera``"""
88
+ return _android_videos_folder()
89
+
90
+ @property
91
+ def user_music_dir(self) -> str:
92
+ """:return: music directory tied to the user e.g. ``/storage/emulated/0/Music``"""
93
+ return _android_music_folder()
94
+
95
+ @property
96
+ def user_runtime_dir(self) -> str:
97
+ """
98
+ :return: runtime directory tied to the user, same as `user_cache_dir` if not opinionated else ``tmp`` in it,
99
+ e.g. ``/data/user/<userid>/<packagename>/cache/<AppName>/tmp``
100
+ """
101
+ path = self.user_cache_dir
102
+ if self.opinion:
103
+ path = os.path.join(path, "tmp") # noqa: PTH118
104
+ return path
105
+
106
+
107
+ @lru_cache(maxsize=1)
108
+ def _android_folder() -> str | None:
109
+ """:return: base folder for the Android OS or None if it cannot be found"""
110
+ try:
111
+ # First try to get path to android app via pyjnius
112
+ from jnius import autoclass
113
+
114
+ context = autoclass("android.content.Context")
115
+ result: str | None = context.getFilesDir().getParentFile().getAbsolutePath()
116
+ except Exception: # noqa: BLE001
117
+ # if fails find an android folder looking path on the sys.path
118
+ pattern = re.compile(r"/data/(data|user/\d+)/(.+)/files")
119
+ for path in sys.path:
120
+ if pattern.match(path):
121
+ result = path.split("/files")[0]
122
+ break
123
+ else:
124
+ result = None
125
+ return result
126
+
127
+
128
+ @lru_cache(maxsize=1)
129
+ def _android_documents_folder() -> str:
130
+ """:return: documents folder for the Android OS"""
131
+ # Get directories with pyjnius
132
+ try:
133
+ from jnius import autoclass
134
+
135
+ context = autoclass("android.content.Context")
136
+ environment = autoclass("android.os.Environment")
137
+ documents_dir: str = context.getExternalFilesDir(environment.DIRECTORY_DOCUMENTS).getAbsolutePath()
138
+ except Exception: # noqa: BLE001
139
+ documents_dir = "/storage/emulated/0/Documents"
140
+
141
+ return documents_dir
142
+
143
+
144
+ @lru_cache(maxsize=1)
145
+ def _android_downloads_folder() -> str:
146
+ """:return: downloads folder for the Android OS"""
147
+ # Get directories with pyjnius
148
+ try:
149
+ from jnius import autoclass
150
+
151
+ context = autoclass("android.content.Context")
152
+ environment = autoclass("android.os.Environment")
153
+ downloads_dir: str = context.getExternalFilesDir(environment.DIRECTORY_DOWNLOADS).getAbsolutePath()
154
+ except Exception: # noqa: BLE001
155
+ downloads_dir = "/storage/emulated/0/Downloads"
156
+
157
+ return downloads_dir
158
+
159
+
160
+ @lru_cache(maxsize=1)
161
+ def _android_pictures_folder() -> str:
162
+ """:return: pictures folder for the Android OS"""
163
+ # Get directories with pyjnius
164
+ try:
165
+ from jnius import autoclass
166
+
167
+ context = autoclass("android.content.Context")
168
+ environment = autoclass("android.os.Environment")
169
+ pictures_dir: str = context.getExternalFilesDir(environment.DIRECTORY_PICTURES).getAbsolutePath()
170
+ except Exception: # noqa: BLE001
171
+ pictures_dir = "/storage/emulated/0/Pictures"
172
+
173
+ return pictures_dir
174
+
175
+
176
+ @lru_cache(maxsize=1)
177
+ def _android_videos_folder() -> str:
178
+ """:return: videos folder for the Android OS"""
179
+ # Get directories with pyjnius
180
+ try:
181
+ from jnius import autoclass
182
+
183
+ context = autoclass("android.content.Context")
184
+ environment = autoclass("android.os.Environment")
185
+ videos_dir: str = context.getExternalFilesDir(environment.DIRECTORY_DCIM).getAbsolutePath()
186
+ except Exception: # noqa: BLE001
187
+ videos_dir = "/storage/emulated/0/DCIM/Camera"
188
+
189
+ return videos_dir
190
+
191
+
192
+ @lru_cache(maxsize=1)
193
+ def _android_music_folder() -> str:
194
+ """:return: music folder for the Android OS"""
195
+ # Get directories with pyjnius
196
+ try:
197
+ from jnius import autoclass
198
+
199
+ context = autoclass("android.content.Context")
200
+ environment = autoclass("android.os.Environment")
201
+ music_dir: str = context.getExternalFilesDir(environment.DIRECTORY_MUSIC).getAbsolutePath()
202
+ except Exception: # noqa: BLE001
203
+ music_dir = "/storage/emulated/0/Music"
204
+
205
+ return music_dir
206
+
207
+
208
+ __all__ = [
209
+ "Android",
210
+ ]
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/api.py ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Base API."""
2
+ from __future__ import annotations
3
+
4
+ import os
5
+ from abc import ABC, abstractmethod
6
+ from pathlib import Path
7
+ from typing import TYPE_CHECKING
8
+
9
+ if TYPE_CHECKING:
10
+ import sys
11
+
12
+ if sys.version_info >= (3, 8): # pragma: no cover (py38+)
13
+ from typing import Literal
14
+ else: # pragma: no cover (py38+)
15
+ from pip._vendor.typing_extensions import Literal
16
+
17
+
18
+ class PlatformDirsABC(ABC):
19
+ """Abstract base class for platform directories."""
20
+
21
+ def __init__( # noqa: PLR0913
22
+ self,
23
+ appname: str | None = None,
24
+ appauthor: str | None | Literal[False] = None,
25
+ version: str | None = None,
26
+ roaming: bool = False, # noqa: FBT001, FBT002
27
+ multipath: bool = False, # noqa: FBT001, FBT002
28
+ opinion: bool = True, # noqa: FBT001, FBT002
29
+ ensure_exists: bool = False, # noqa: FBT001, FBT002
30
+ ) -> None:
31
+ """
32
+ Create a new platform directory.
33
+
34
+ :param appname: See `appname`.
35
+ :param appauthor: See `appauthor`.
36
+ :param version: See `version`.
37
+ :param roaming: See `roaming`.
38
+ :param multipath: See `multipath`.
39
+ :param opinion: See `opinion`.
40
+ :param ensure_exists: See `ensure_exists`.
41
+ """
42
+ self.appname = appname #: The name of application.
43
+ self.appauthor = appauthor
44
+ """
45
+ The name of the app author or distributing body for this application. Typically, it is the owning company name.
46
+ Defaults to `appname`. You may pass ``False`` to disable it.
47
+ """
48
+ self.version = version
49
+ """
50
+ An optional version path element to append to the path. You might want to use this if you want multiple versions
51
+ of your app to be able to run independently. If used, this would typically be ``<major>.<minor>``.
52
+ """
53
+ self.roaming = roaming
54
+ """
55
+ Whether to use the roaming appdata directory on Windows. That means that for users on a Windows network setup
56
+ for roaming profiles, this user data will be synced on login (see
57
+ `here <http://technet.microsoft.com/en-us/library/cc766489(WS.10).aspx>`_).
58
+ """
59
+ self.multipath = multipath
60
+ """
61
+ An optional parameter only applicable to Unix/Linux which indicates that the entire list of data dirs should be
62
+ returned. By default, the first item would only be returned.
63
+ """
64
+ self.opinion = opinion #: A flag to indicating to use opinionated values.
65
+ self.ensure_exists = ensure_exists
66
+ """
67
+ Optionally create the directory (and any missing parents) upon access if it does not exist.
68
+ By default, no directories are created.
69
+ """
70
+
71
+ def _append_app_name_and_version(self, *base: str) -> str:
72
+ params = list(base[1:])
73
+ if self.appname:
74
+ params.append(self.appname)
75
+ if self.version:
76
+ params.append(self.version)
77
+ path = os.path.join(base[0], *params) # noqa: PTH118
78
+ self._optionally_create_directory(path)
79
+ return path
80
+
81
+ def _optionally_create_directory(self, path: str) -> None:
82
+ if self.ensure_exists:
83
+ Path(path).mkdir(parents=True, exist_ok=True)
84
+
85
+ @property
86
+ @abstractmethod
87
+ def user_data_dir(self) -> str:
88
+ """:return: data directory tied to the user"""
89
+
90
+ @property
91
+ @abstractmethod
92
+ def site_data_dir(self) -> str:
93
+ """:return: data directory shared by users"""
94
+
95
+ @property
96
+ @abstractmethod
97
+ def user_config_dir(self) -> str:
98
+ """:return: config directory tied to the user"""
99
+
100
+ @property
101
+ @abstractmethod
102
+ def site_config_dir(self) -> str:
103
+ """:return: config directory shared by the users"""
104
+
105
+ @property
106
+ @abstractmethod
107
+ def user_cache_dir(self) -> str:
108
+ """:return: cache directory tied to the user"""
109
+
110
+ @property
111
+ @abstractmethod
112
+ def site_cache_dir(self) -> str:
113
+ """:return: cache directory shared by users"""
114
+
115
+ @property
116
+ @abstractmethod
117
+ def user_state_dir(self) -> str:
118
+ """:return: state directory tied to the user"""
119
+
120
+ @property
121
+ @abstractmethod
122
+ def user_log_dir(self) -> str:
123
+ """:return: log directory tied to the user"""
124
+
125
+ @property
126
+ @abstractmethod
127
+ def user_documents_dir(self) -> str:
128
+ """:return: documents directory tied to the user"""
129
+
130
+ @property
131
+ @abstractmethod
132
+ def user_downloads_dir(self) -> str:
133
+ """:return: downloads directory tied to the user"""
134
+
135
+ @property
136
+ @abstractmethod
137
+ def user_pictures_dir(self) -> str:
138
+ """:return: pictures directory tied to the user"""
139
+
140
+ @property
141
+ @abstractmethod
142
+ def user_videos_dir(self) -> str:
143
+ """:return: videos directory tied to the user"""
144
+
145
+ @property
146
+ @abstractmethod
147
+ def user_music_dir(self) -> str:
148
+ """:return: music directory tied to the user"""
149
+
150
+ @property
151
+ @abstractmethod
152
+ def user_runtime_dir(self) -> str:
153
+ """:return: runtime directory tied to the user"""
154
+
155
+ @property
156
+ def user_data_path(self) -> Path:
157
+ """:return: data path tied to the user"""
158
+ return Path(self.user_data_dir)
159
+
160
+ @property
161
+ def site_data_path(self) -> Path:
162
+ """:return: data path shared by users"""
163
+ return Path(self.site_data_dir)
164
+
165
+ @property
166
+ def user_config_path(self) -> Path:
167
+ """:return: config path tied to the user"""
168
+ return Path(self.user_config_dir)
169
+
170
+ @property
171
+ def site_config_path(self) -> Path:
172
+ """:return: config path shared by the users"""
173
+ return Path(self.site_config_dir)
174
+
175
+ @property
176
+ def user_cache_path(self) -> Path:
177
+ """:return: cache path tied to the user"""
178
+ return Path(self.user_cache_dir)
179
+
180
+ @property
181
+ def site_cache_path(self) -> Path:
182
+ """:return: cache path shared by users"""
183
+ return Path(self.site_cache_dir)
184
+
185
+ @property
186
+ def user_state_path(self) -> Path:
187
+ """:return: state path tied to the user"""
188
+ return Path(self.user_state_dir)
189
+
190
+ @property
191
+ def user_log_path(self) -> Path:
192
+ """:return: log path tied to the user"""
193
+ return Path(self.user_log_dir)
194
+
195
+ @property
196
+ def user_documents_path(self) -> Path:
197
+ """:return: documents path tied to the user"""
198
+ return Path(self.user_documents_dir)
199
+
200
+ @property
201
+ def user_downloads_path(self) -> Path:
202
+ """:return: downloads path tied to the user"""
203
+ return Path(self.user_downloads_dir)
204
+
205
+ @property
206
+ def user_pictures_path(self) -> Path:
207
+ """:return: pictures path tied to the user"""
208
+ return Path(self.user_pictures_dir)
209
+
210
+ @property
211
+ def user_videos_path(self) -> Path:
212
+ """:return: videos path tied to the user"""
213
+ return Path(self.user_videos_dir)
214
+
215
+ @property
216
+ def user_music_path(self) -> Path:
217
+ """:return: music path tied to the user"""
218
+ return Path(self.user_music_dir)
219
+
220
+ @property
221
+ def user_runtime_path(self) -> Path:
222
+ """:return: runtime path tied to the user"""
223
+ return Path(self.user_runtime_dir)
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/macos.py ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """macOS."""
2
+ from __future__ import annotations
3
+
4
+ import os.path
5
+
6
+ from .api import PlatformDirsABC
7
+
8
+
9
+ class MacOS(PlatformDirsABC):
10
+ """
11
+ Platform directories for the macOS operating system. Follows the guidance from `Apple documentation
12
+ <https://developer.apple.com/library/archive/documentation/FileManagement/Conceptual/FileSystemProgrammingGuide/MacOSXDirectories/MacOSXDirectories.html>`_.
13
+ Makes use of the `appname <platformdirs.api.PlatformDirsABC.appname>`,
14
+ `version <platformdirs.api.PlatformDirsABC.version>`,
15
+ `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
16
+ """
17
+
18
+ @property
19
+ def user_data_dir(self) -> str:
20
+ """:return: data directory tied to the user, e.g. ``~/Library/Application Support/$appname/$version``"""
21
+ return self._append_app_name_and_version(os.path.expanduser("~/Library/Application Support")) # noqa: PTH111
22
+
23
+ @property
24
+ def site_data_dir(self) -> str:
25
+ """:return: data directory shared by users, e.g. ``/Library/Application Support/$appname/$version``"""
26
+ return self._append_app_name_and_version("/Library/Application Support")
27
+
28
+ @property
29
+ def user_config_dir(self) -> str:
30
+ """:return: config directory tied to the user, same as `user_data_dir`"""
31
+ return self.user_data_dir
32
+
33
+ @property
34
+ def site_config_dir(self) -> str:
35
+ """:return: config directory shared by the users, same as `site_data_dir`"""
36
+ return self.site_data_dir
37
+
38
+ @property
39
+ def user_cache_dir(self) -> str:
40
+ """:return: cache directory tied to the user, e.g. ``~/Library/Caches/$appname/$version``"""
41
+ return self._append_app_name_and_version(os.path.expanduser("~/Library/Caches")) # noqa: PTH111
42
+
43
+ @property
44
+ def site_cache_dir(self) -> str:
45
+ """:return: cache directory shared by users, e.g. ``/Library/Caches/$appname/$version``"""
46
+ return self._append_app_name_and_version("/Library/Caches")
47
+
48
+ @property
49
+ def user_state_dir(self) -> str:
50
+ """:return: state directory tied to the user, same as `user_data_dir`"""
51
+ return self.user_data_dir
52
+
53
+ @property
54
+ def user_log_dir(self) -> str:
55
+ """:return: log directory tied to the user, e.g. ``~/Library/Logs/$appname/$version``"""
56
+ return self._append_app_name_and_version(os.path.expanduser("~/Library/Logs")) # noqa: PTH111
57
+
58
+ @property
59
+ def user_documents_dir(self) -> str:
60
+ """:return: documents directory tied to the user, e.g. ``~/Documents``"""
61
+ return os.path.expanduser("~/Documents") # noqa: PTH111
62
+
63
+ @property
64
+ def user_downloads_dir(self) -> str:
65
+ """:return: downloads directory tied to the user, e.g. ``~/Downloads``"""
66
+ return os.path.expanduser("~/Downloads") # noqa: PTH111
67
+
68
+ @property
69
+ def user_pictures_dir(self) -> str:
70
+ """:return: pictures directory tied to the user, e.g. ``~/Pictures``"""
71
+ return os.path.expanduser("~/Pictures") # noqa: PTH111
72
+
73
+ @property
74
+ def user_videos_dir(self) -> str:
75
+ """:return: videos directory tied to the user, e.g. ``~/Movies``"""
76
+ return os.path.expanduser("~/Movies") # noqa: PTH111
77
+
78
+ @property
79
+ def user_music_dir(self) -> str:
80
+ """:return: music directory tied to the user, e.g. ``~/Music``"""
81
+ return os.path.expanduser("~/Music") # noqa: PTH111
82
+
83
+ @property
84
+ def user_runtime_dir(self) -> str:
85
+ """:return: runtime directory tied to the user, e.g. ``~/Library/Caches/TemporaryItems/$appname/$version``"""
86
+ return self._append_app_name_and_version(os.path.expanduser("~/Library/Caches/TemporaryItems")) # noqa: PTH111
87
+
88
+
89
+ __all__ = [
90
+ "MacOS",
91
+ ]
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/unix.py ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Unix."""
2
+ from __future__ import annotations
3
+
4
+ import os
5
+ import sys
6
+ from configparser import ConfigParser
7
+ from pathlib import Path
8
+
9
+ from .api import PlatformDirsABC
10
+
11
+ if sys.platform == "win32":
12
+
13
+ def getuid() -> int:
14
+ msg = "should only be used on Unix"
15
+ raise RuntimeError(msg)
16
+
17
+ else:
18
+ from os import getuid
19
+
20
+
21
+ class Unix(PlatformDirsABC):
22
+ """
23
+ On Unix/Linux, we follow the
24
+ `XDG Basedir Spec <https://specifications.freedesktop.org/basedir-spec/basedir-spec-latest.html>`_. The spec allows
25
+ overriding directories with environment variables. The examples show are the default values, alongside the name of
26
+ the environment variable that overrides them. Makes use of the
27
+ `appname <platformdirs.api.PlatformDirsABC.appname>`,
28
+ `version <platformdirs.api.PlatformDirsABC.version>`,
29
+ `multipath <platformdirs.api.PlatformDirsABC.multipath>`,
30
+ `opinion <platformdirs.api.PlatformDirsABC.opinion>`,
31
+ `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
32
+ """
33
+
34
+ @property
35
+ def user_data_dir(self) -> str:
36
+ """
37
+ :return: data directory tied to the user, e.g. ``~/.local/share/$appname/$version`` or
38
+ ``$XDG_DATA_HOME/$appname/$version``
39
+ """
40
+ path = os.environ.get("XDG_DATA_HOME", "")
41
+ if not path.strip():
42
+ path = os.path.expanduser("~/.local/share") # noqa: PTH111
43
+ return self._append_app_name_and_version(path)
44
+
45
+ @property
46
+ def site_data_dir(self) -> str:
47
+ """
48
+ :return: data directories shared by users (if `multipath <platformdirs.api.PlatformDirsABC.multipath>` is
49
+ enabled and ``XDG_DATA_DIR`` is set and a multi path the response is also a multi path separated by the OS
50
+ path separator), e.g. ``/usr/local/share/$appname/$version`` or ``/usr/share/$appname/$version``
51
+ """
52
+ # XDG default for $XDG_DATA_DIRS; only first, if multipath is False
53
+ path = os.environ.get("XDG_DATA_DIRS", "")
54
+ if not path.strip():
55
+ path = f"/usr/local/share{os.pathsep}/usr/share"
56
+ return self._with_multi_path(path)
57
+
58
+ def _with_multi_path(self, path: str) -> str:
59
+ path_list = path.split(os.pathsep)
60
+ if not self.multipath:
61
+ path_list = path_list[0:1]
62
+ path_list = [self._append_app_name_and_version(os.path.expanduser(p)) for p in path_list] # noqa: PTH111
63
+ return os.pathsep.join(path_list)
64
+
65
+ @property
66
+ def user_config_dir(self) -> str:
67
+ """
68
+ :return: config directory tied to the user, e.g. ``~/.config/$appname/$version`` or
69
+ ``$XDG_CONFIG_HOME/$appname/$version``
70
+ """
71
+ path = os.environ.get("XDG_CONFIG_HOME", "")
72
+ if not path.strip():
73
+ path = os.path.expanduser("~/.config") # noqa: PTH111
74
+ return self._append_app_name_and_version(path)
75
+
76
+ @property
77
+ def site_config_dir(self) -> str:
78
+ """
79
+ :return: config directories shared by users (if `multipath <platformdirs.api.PlatformDirsABC.multipath>`
80
+ is enabled and ``XDG_DATA_DIR`` is set and a multi path the response is also a multi path separated by the OS
81
+ path separator), e.g. ``/etc/xdg/$appname/$version``
82
+ """
83
+ # XDG default for $XDG_CONFIG_DIRS only first, if multipath is False
84
+ path = os.environ.get("XDG_CONFIG_DIRS", "")
85
+ if not path.strip():
86
+ path = "/etc/xdg"
87
+ return self._with_multi_path(path)
88
+
89
+ @property
90
+ def user_cache_dir(self) -> str:
91
+ """
92
+ :return: cache directory tied to the user, e.g. ``~/.cache/$appname/$version`` or
93
+ ``~/$XDG_CACHE_HOME/$appname/$version``
94
+ """
95
+ path = os.environ.get("XDG_CACHE_HOME", "")
96
+ if not path.strip():
97
+ path = os.path.expanduser("~/.cache") # noqa: PTH111
98
+ return self._append_app_name_and_version(path)
99
+
100
+ @property
101
+ def site_cache_dir(self) -> str:
102
+ """:return: cache directory shared by users, e.g. ``/var/tmp/$appname/$version``"""
103
+ return self._append_app_name_and_version("/var/tmp") # noqa: S108
104
+
105
+ @property
106
+ def user_state_dir(self) -> str:
107
+ """
108
+ :return: state directory tied to the user, e.g. ``~/.local/state/$appname/$version`` or
109
+ ``$XDG_STATE_HOME/$appname/$version``
110
+ """
111
+ path = os.environ.get("XDG_STATE_HOME", "")
112
+ if not path.strip():
113
+ path = os.path.expanduser("~/.local/state") # noqa: PTH111
114
+ return self._append_app_name_and_version(path)
115
+
116
+ @property
117
+ def user_log_dir(self) -> str:
118
+ """:return: log directory tied to the user, same as `user_state_dir` if not opinionated else ``log`` in it"""
119
+ path = self.user_state_dir
120
+ if self.opinion:
121
+ path = os.path.join(path, "log") # noqa: PTH118
122
+ return path
123
+
124
+ @property
125
+ def user_documents_dir(self) -> str:
126
+ """:return: documents directory tied to the user, e.g. ``~/Documents``"""
127
+ return _get_user_media_dir("XDG_DOCUMENTS_DIR", "~/Documents")
128
+
129
+ @property
130
+ def user_downloads_dir(self) -> str:
131
+ """:return: downloads directory tied to the user, e.g. ``~/Downloads``"""
132
+ return _get_user_media_dir("XDG_DOWNLOAD_DIR", "~/Downloads")
133
+
134
+ @property
135
+ def user_pictures_dir(self) -> str:
136
+ """:return: pictures directory tied to the user, e.g. ``~/Pictures``"""
137
+ return _get_user_media_dir("XDG_PICTURES_DIR", "~/Pictures")
138
+
139
+ @property
140
+ def user_videos_dir(self) -> str:
141
+ """:return: videos directory tied to the user, e.g. ``~/Videos``"""
142
+ return _get_user_media_dir("XDG_VIDEOS_DIR", "~/Videos")
143
+
144
+ @property
145
+ def user_music_dir(self) -> str:
146
+ """:return: music directory tied to the user, e.g. ``~/Music``"""
147
+ return _get_user_media_dir("XDG_MUSIC_DIR", "~/Music")
148
+
149
+ @property
150
+ def user_runtime_dir(self) -> str:
151
+ """
152
+ :return: runtime directory tied to the user, e.g. ``/run/user/$(id -u)/$appname/$version`` or
153
+ ``$XDG_RUNTIME_DIR/$appname/$version``.
154
+
155
+ For FreeBSD/OpenBSD/NetBSD, it would return ``/var/run/user/$(id -u)/$appname/$version`` if
156
+ exists, otherwise ``/tmp/runtime-$(id -u)/$appname/$version``, if``$XDG_RUNTIME_DIR``
157
+ is not set.
158
+ """
159
+ path = os.environ.get("XDG_RUNTIME_DIR", "")
160
+ if not path.strip():
161
+ if sys.platform.startswith(("freebsd", "openbsd", "netbsd")):
162
+ path = f"/var/run/user/{getuid()}"
163
+ if not Path(path).exists():
164
+ path = f"/tmp/runtime-{getuid()}" # noqa: S108
165
+ else:
166
+ path = f"/run/user/{getuid()}"
167
+ return self._append_app_name_and_version(path)
168
+
169
+ @property
170
+ def site_data_path(self) -> Path:
171
+ """:return: data path shared by users. Only return first item, even if ``multipath`` is set to ``True``"""
172
+ return self._first_item_as_path_if_multipath(self.site_data_dir)
173
+
174
+ @property
175
+ def site_config_path(self) -> Path:
176
+ """:return: config path shared by the users. Only return first item, even if ``multipath`` is set to ``True``"""
177
+ return self._first_item_as_path_if_multipath(self.site_config_dir)
178
+
179
+ @property
180
+ def site_cache_path(self) -> Path:
181
+ """:return: cache path shared by users. Only return first item, even if ``multipath`` is set to ``True``"""
182
+ return self._first_item_as_path_if_multipath(self.site_cache_dir)
183
+
184
+ def _first_item_as_path_if_multipath(self, directory: str) -> Path:
185
+ if self.multipath:
186
+ # If multipath is True, the first path is returned.
187
+ directory = directory.split(os.pathsep)[0]
188
+ return Path(directory)
189
+
190
+
191
+ def _get_user_media_dir(env_var: str, fallback_tilde_path: str) -> str:
192
+ media_dir = _get_user_dirs_folder(env_var)
193
+ if media_dir is None:
194
+ media_dir = os.environ.get(env_var, "").strip()
195
+ if not media_dir:
196
+ media_dir = os.path.expanduser(fallback_tilde_path) # noqa: PTH111
197
+
198
+ return media_dir
199
+
200
+
201
+ def _get_user_dirs_folder(key: str) -> str | None:
202
+ """Return directory from user-dirs.dirs config file. See https://freedesktop.org/wiki/Software/xdg-user-dirs/."""
203
+ user_dirs_config_path = Path(Unix().user_config_dir) / "user-dirs.dirs"
204
+ if user_dirs_config_path.exists():
205
+ parser = ConfigParser()
206
+
207
+ with user_dirs_config_path.open() as stream:
208
+ # Add fake section header, so ConfigParser doesn't complain
209
+ parser.read_string(f"[top]\n{stream.read()}")
210
+
211
+ if key not in parser["top"]:
212
+ return None
213
+
214
+ path = parser["top"][key].strip('"')
215
+ # Handle relative home paths
216
+ return path.replace("$HOME", os.path.expanduser("~")) # noqa: PTH111
217
+
218
+ return None
219
+
220
+
221
+ __all__ = [
222
+ "Unix",
223
+ ]
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/version.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ # file generated by setuptools_scm
2
+ # don't change, don't track in version control
3
+ __version__ = version = '3.8.1'
4
+ __version_tuple__ = version_tuple = (3, 8, 1)
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/platformdirs/windows.py ADDED
@@ -0,0 +1,255 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Windows."""
2
+ from __future__ import annotations
3
+
4
+ import ctypes
5
+ import os
6
+ import sys
7
+ from functools import lru_cache
8
+ from typing import TYPE_CHECKING
9
+
10
+ from .api import PlatformDirsABC
11
+
12
+ if TYPE_CHECKING:
13
+ from collections.abc import Callable
14
+
15
+
16
+ class Windows(PlatformDirsABC):
17
+ """
18
+ `MSDN on where to store app data files
19
+ <http://support.microsoft.com/default.aspx?scid=kb;en-us;310294#XSLTH3194121123120121120120>`_.
20
+ Makes use of the
21
+ `appname <platformdirs.api.PlatformDirsABC.appname>`,
22
+ `appauthor <platformdirs.api.PlatformDirsABC.appauthor>`,
23
+ `version <platformdirs.api.PlatformDirsABC.version>`,
24
+ `roaming <platformdirs.api.PlatformDirsABC.roaming>`,
25
+ `opinion <platformdirs.api.PlatformDirsABC.opinion>`,
26
+ `ensure_exists <platformdirs.api.PlatformDirsABC.ensure_exists>`.
27
+ """
28
+
29
+ @property
30
+ def user_data_dir(self) -> str:
31
+ """
32
+ :return: data directory tied to the user, e.g.
33
+ ``%USERPROFILE%\\AppData\\Local\\$appauthor\\$appname`` (not roaming) or
34
+ ``%USERPROFILE%\\AppData\\Roaming\\$appauthor\\$appname`` (roaming)
35
+ """
36
+ const = "CSIDL_APPDATA" if self.roaming else "CSIDL_LOCAL_APPDATA"
37
+ path = os.path.normpath(get_win_folder(const))
38
+ return self._append_parts(path)
39
+
40
+ def _append_parts(self, path: str, *, opinion_value: str | None = None) -> str:
41
+ params = []
42
+ if self.appname:
43
+ if self.appauthor is not False:
44
+ author = self.appauthor or self.appname
45
+ params.append(author)
46
+ params.append(self.appname)
47
+ if opinion_value is not None and self.opinion:
48
+ params.append(opinion_value)
49
+ if self.version:
50
+ params.append(self.version)
51
+ path = os.path.join(path, *params) # noqa: PTH118
52
+ self._optionally_create_directory(path)
53
+ return path
54
+
55
+ @property
56
+ def site_data_dir(self) -> str:
57
+ """:return: data directory shared by users, e.g. ``C:\\ProgramData\\$appauthor\\$appname``"""
58
+ path = os.path.normpath(get_win_folder("CSIDL_COMMON_APPDATA"))
59
+ return self._append_parts(path)
60
+
61
+ @property
62
+ def user_config_dir(self) -> str:
63
+ """:return: config directory tied to the user, same as `user_data_dir`"""
64
+ return self.user_data_dir
65
+
66
+ @property
67
+ def site_config_dir(self) -> str:
68
+ """:return: config directory shared by the users, same as `site_data_dir`"""
69
+ return self.site_data_dir
70
+
71
+ @property
72
+ def user_cache_dir(self) -> str:
73
+ """
74
+ :return: cache directory tied to the user (if opinionated with ``Cache`` folder within ``$appname``) e.g.
75
+ ``%USERPROFILE%\\AppData\\Local\\$appauthor\\$appname\\Cache\\$version``
76
+ """
77
+ path = os.path.normpath(get_win_folder("CSIDL_LOCAL_APPDATA"))
78
+ return self._append_parts(path, opinion_value="Cache")
79
+
80
+ @property
81
+ def site_cache_dir(self) -> str:
82
+ """:return: cache directory shared by users, e.g. ``C:\\ProgramData\\$appauthor\\$appname\\Cache\\$version``"""
83
+ path = os.path.normpath(get_win_folder("CSIDL_COMMON_APPDATA"))
84
+ return self._append_parts(path, opinion_value="Cache")
85
+
86
+ @property
87
+ def user_state_dir(self) -> str:
88
+ """:return: state directory tied to the user, same as `user_data_dir`"""
89
+ return self.user_data_dir
90
+
91
+ @property
92
+ def user_log_dir(self) -> str:
93
+ """:return: log directory tied to the user, same as `user_data_dir` if not opinionated else ``Logs`` in it"""
94
+ path = self.user_data_dir
95
+ if self.opinion:
96
+ path = os.path.join(path, "Logs") # noqa: PTH118
97
+ self._optionally_create_directory(path)
98
+ return path
99
+
100
+ @property
101
+ def user_documents_dir(self) -> str:
102
+ """:return: documents directory tied to the user e.g. ``%USERPROFILE%\\Documents``"""
103
+ return os.path.normpath(get_win_folder("CSIDL_PERSONAL"))
104
+
105
+ @property
106
+ def user_downloads_dir(self) -> str:
107
+ """:return: downloads directory tied to the user e.g. ``%USERPROFILE%\\Downloads``"""
108
+ return os.path.normpath(get_win_folder("CSIDL_DOWNLOADS"))
109
+
110
+ @property
111
+ def user_pictures_dir(self) -> str:
112
+ """:return: pictures directory tied to the user e.g. ``%USERPROFILE%\\Pictures``"""
113
+ return os.path.normpath(get_win_folder("CSIDL_MYPICTURES"))
114
+
115
+ @property
116
+ def user_videos_dir(self) -> str:
117
+ """:return: videos directory tied to the user e.g. ``%USERPROFILE%\\Videos``"""
118
+ return os.path.normpath(get_win_folder("CSIDL_MYVIDEO"))
119
+
120
+ @property
121
+ def user_music_dir(self) -> str:
122
+ """:return: music directory tied to the user e.g. ``%USERPROFILE%\\Music``"""
123
+ return os.path.normpath(get_win_folder("CSIDL_MYMUSIC"))
124
+
125
+ @property
126
+ def user_runtime_dir(self) -> str:
127
+ """
128
+ :return: runtime directory tied to the user, e.g.
129
+ ``%USERPROFILE%\\AppData\\Local\\Temp\\$appauthor\\$appname``
130
+ """
131
+ path = os.path.normpath(os.path.join(get_win_folder("CSIDL_LOCAL_APPDATA"), "Temp")) # noqa: PTH118
132
+ return self._append_parts(path)
133
+
134
+
135
+ def get_win_folder_from_env_vars(csidl_name: str) -> str:
136
+ """Get folder from environment variables."""
137
+ result = get_win_folder_if_csidl_name_not_env_var(csidl_name)
138
+ if result is not None:
139
+ return result
140
+
141
+ env_var_name = {
142
+ "CSIDL_APPDATA": "APPDATA",
143
+ "CSIDL_COMMON_APPDATA": "ALLUSERSPROFILE",
144
+ "CSIDL_LOCAL_APPDATA": "LOCALAPPDATA",
145
+ }.get(csidl_name)
146
+ if env_var_name is None:
147
+ msg = f"Unknown CSIDL name: {csidl_name}"
148
+ raise ValueError(msg)
149
+ result = os.environ.get(env_var_name)
150
+ if result is None:
151
+ msg = f"Unset environment variable: {env_var_name}"
152
+ raise ValueError(msg)
153
+ return result
154
+
155
+
156
+ def get_win_folder_if_csidl_name_not_env_var(csidl_name: str) -> str | None:
157
+ """Get folder for a CSIDL name that does not exist as an environment variable."""
158
+ if csidl_name == "CSIDL_PERSONAL":
159
+ return os.path.join(os.path.normpath(os.environ["USERPROFILE"]), "Documents") # noqa: PTH118
160
+
161
+ if csidl_name == "CSIDL_DOWNLOADS":
162
+ return os.path.join(os.path.normpath(os.environ["USERPROFILE"]), "Downloads") # noqa: PTH118
163
+
164
+ if csidl_name == "CSIDL_MYPICTURES":
165
+ return os.path.join(os.path.normpath(os.environ["USERPROFILE"]), "Pictures") # noqa: PTH118
166
+
167
+ if csidl_name == "CSIDL_MYVIDEO":
168
+ return os.path.join(os.path.normpath(os.environ["USERPROFILE"]), "Videos") # noqa: PTH118
169
+
170
+ if csidl_name == "CSIDL_MYMUSIC":
171
+ return os.path.join(os.path.normpath(os.environ["USERPROFILE"]), "Music") # noqa: PTH118
172
+ return None
173
+
174
+
175
+ def get_win_folder_from_registry(csidl_name: str) -> str:
176
+ """
177
+ Get folder from the registry.
178
+
179
+ This is a fallback technique at best. I'm not sure if using the registry for these guarantees us the correct answer
180
+ for all CSIDL_* names.
181
+ """
182
+ shell_folder_name = {
183
+ "CSIDL_APPDATA": "AppData",
184
+ "CSIDL_COMMON_APPDATA": "Common AppData",
185
+ "CSIDL_LOCAL_APPDATA": "Local AppData",
186
+ "CSIDL_PERSONAL": "Personal",
187
+ "CSIDL_DOWNLOADS": "{374DE290-123F-4565-9164-39C4925E467B}",
188
+ "CSIDL_MYPICTURES": "My Pictures",
189
+ "CSIDL_MYVIDEO": "My Video",
190
+ "CSIDL_MYMUSIC": "My Music",
191
+ }.get(csidl_name)
192
+ if shell_folder_name is None:
193
+ msg = f"Unknown CSIDL name: {csidl_name}"
194
+ raise ValueError(msg)
195
+ if sys.platform != "win32": # only needed for mypy type checker to know that this code runs only on Windows
196
+ raise NotImplementedError
197
+ import winreg
198
+
199
+ key = winreg.OpenKey(winreg.HKEY_CURRENT_USER, r"Software\Microsoft\Windows\CurrentVersion\Explorer\Shell Folders")
200
+ directory, _ = winreg.QueryValueEx(key, shell_folder_name)
201
+ return str(directory)
202
+
203
+
204
+ def get_win_folder_via_ctypes(csidl_name: str) -> str:
205
+ """Get folder with ctypes."""
206
+ # There is no 'CSIDL_DOWNLOADS'.
207
+ # Use 'CSIDL_PROFILE' (40) and append the default folder 'Downloads' instead.
208
+ # https://learn.microsoft.com/en-us/windows/win32/shell/knownfolderid
209
+
210
+ csidl_const = {
211
+ "CSIDL_APPDATA": 26,
212
+ "CSIDL_COMMON_APPDATA": 35,
213
+ "CSIDL_LOCAL_APPDATA": 28,
214
+ "CSIDL_PERSONAL": 5,
215
+ "CSIDL_MYPICTURES": 39,
216
+ "CSIDL_MYVIDEO": 14,
217
+ "CSIDL_MYMUSIC": 13,
218
+ "CSIDL_DOWNLOADS": 40,
219
+ }.get(csidl_name)
220
+ if csidl_const is None:
221
+ msg = f"Unknown CSIDL name: {csidl_name}"
222
+ raise ValueError(msg)
223
+
224
+ buf = ctypes.create_unicode_buffer(1024)
225
+ windll = getattr(ctypes, "windll") # noqa: B009 # using getattr to avoid false positive with mypy type checker
226
+ windll.shell32.SHGetFolderPathW(None, csidl_const, None, 0, buf)
227
+
228
+ # Downgrade to short path name if it has highbit chars.
229
+ if any(ord(c) > 255 for c in buf): # noqa: PLR2004
230
+ buf2 = ctypes.create_unicode_buffer(1024)
231
+ if windll.kernel32.GetShortPathNameW(buf.value, buf2, 1024):
232
+ buf = buf2
233
+
234
+ if csidl_name == "CSIDL_DOWNLOADS":
235
+ return os.path.join(buf.value, "Downloads") # noqa: PTH118
236
+
237
+ return buf.value
238
+
239
+
240
+ def _pick_get_win_folder() -> Callable[[str], str]:
241
+ if hasattr(ctypes, "windll"):
242
+ return get_win_folder_via_ctypes
243
+ try:
244
+ import winreg # noqa: F401
245
+ except ImportError:
246
+ return get_win_folder_from_env_vars
247
+ else:
248
+ return get_win_folder_from_registry
249
+
250
+
251
+ get_win_folder = lru_cache(maxsize=None)(_pick_get_win_folder())
252
+
253
+ __all__ = [
254
+ "Windows",
255
+ ]
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/pyproject_hooks/_in_process/__init__.py ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """This is a subpackage because the directory is on sys.path for _in_process.py
2
+
3
+ The subpackage should stay as empty as possible to avoid shadowing modules that
4
+ the backend might import.
5
+ """
6
+
7
+ import importlib.resources as resources
8
+
9
+ try:
10
+ resources.files
11
+ except AttributeError:
12
+ # Python 3.8 compatibility
13
+ def _in_proc_script_path():
14
+ return resources.path(__package__, '_in_process.py')
15
+ else:
16
+ def _in_proc_script_path():
17
+ return resources.as_file(
18
+ resources.files(__package__).joinpath('_in_process.py'))
LTA_openwebtext_dualt/mini_owt_logdirichlet/.venv_qwen35/lib/python3.12/site-packages/pip/_vendor/pyproject_hooks/_in_process/_in_process.py ADDED
@@ -0,0 +1,353 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """This is invoked in a subprocess to call the build backend hooks.
2
+
3
+ It expects:
4
+ - Command line args: hook_name, control_dir
5
+ - Environment variables:
6
+ PEP517_BUILD_BACKEND=entry.point:spec
7
+ PEP517_BACKEND_PATH=paths (separated with os.pathsep)
8
+ - control_dir/input.json:
9
+ - {"kwargs": {...}}
10
+
11
+ Results:
12
+ - control_dir/output.json
13
+ - {"return_val": ...}
14
+ """
15
+ import json
16
+ import os
17
+ import os.path
18
+ import re
19
+ import shutil
20
+ import sys
21
+ import traceback
22
+ from glob import glob
23
+ from importlib import import_module
24
+ from os.path import join as pjoin
25
+
26
+ # This file is run as a script, and `import wrappers` is not zip-safe, so we
27
+ # include write_json() and read_json() from wrappers.py.
28
+
29
+
30
+ def write_json(obj, path, **kwargs):
31
+ with open(path, 'w', encoding='utf-8') as f:
32
+ json.dump(obj, f, **kwargs)
33
+
34
+
35
+ def read_json(path):
36
+ with open(path, encoding='utf-8') as f:
37
+ return json.load(f)
38
+
39
+
40
+ class BackendUnavailable(Exception):
41
+ """Raised if we cannot import the backend"""
42
+ def __init__(self, traceback):
43
+ self.traceback = traceback
44
+
45
+
46
+ class BackendInvalid(Exception):
47
+ """Raised if the backend is invalid"""
48
+ def __init__(self, message):
49
+ self.message = message
50
+
51
+
52
+ class HookMissing(Exception):
53
+ """Raised if a hook is missing and we are not executing the fallback"""
54
+ def __init__(self, hook_name=None):
55
+ super().__init__(hook_name)
56
+ self.hook_name = hook_name
57
+
58
+
59
+ def contained_in(filename, directory):
60
+ """Test if a file is located within the given directory."""
61
+ filename = os.path.normcase(os.path.abspath(filename))
62
+ directory = os.path.normcase(os.path.abspath(directory))
63
+ return os.path.commonprefix([filename, directory]) == directory
64
+
65
+
66
+ def _build_backend():
67
+ """Find and load the build backend"""
68
+ # Add in-tree backend directories to the front of sys.path.
69
+ backend_path = os.environ.get('PEP517_BACKEND_PATH')
70
+ if backend_path:
71
+ extra_pathitems = backend_path.split(os.pathsep)
72
+ sys.path[:0] = extra_pathitems
73
+
74
+ ep = os.environ['PEP517_BUILD_BACKEND']
75
+ mod_path, _, obj_path = ep.partition(':')
76
+ try:
77
+ obj = import_module(mod_path)
78
+ except ImportError:
79
+ raise BackendUnavailable(traceback.format_exc())
80
+
81
+ if backend_path:
82
+ if not any(
83
+ contained_in(obj.__file__, path)
84
+ for path in extra_pathitems
85
+ ):
86
+ raise BackendInvalid("Backend was not loaded from backend-path")
87
+
88
+ if obj_path:
89
+ for path_part in obj_path.split('.'):
90
+ obj = getattr(obj, path_part)
91
+ return obj
92
+
93
+
94
+ def _supported_features():
95
+ """Return the list of options features supported by the backend.
96
+
97
+ Returns a list of strings.
98
+ The only possible value is 'build_editable'.
99
+ """
100
+ backend = _build_backend()
101
+ features = []
102
+ if hasattr(backend, "build_editable"):
103
+ features.append("build_editable")
104
+ return features
105
+
106
+
107
+ def get_requires_for_build_wheel(config_settings):
108
+ """Invoke the optional get_requires_for_build_wheel hook
109
+
110
+ Returns [] if the hook is not defined.
111
+ """
112
+ backend = _build_backend()
113
+ try:
114
+ hook = backend.get_requires_for_build_wheel
115
+ except AttributeError:
116
+ return []
117
+ else:
118
+ return hook(config_settings)
119
+
120
+
121
+ def get_requires_for_build_editable(config_settings):
122
+ """Invoke the optional get_requires_for_build_editable hook
123
+
124
+ Returns [] if the hook is not defined.
125
+ """
126
+ backend = _build_backend()
127
+ try:
128
+ hook = backend.get_requires_for_build_editable
129
+ except AttributeError:
130
+ return []
131
+ else:
132
+ return hook(config_settings)
133
+
134
+
135
+ def prepare_metadata_for_build_wheel(
136
+ metadata_directory, config_settings, _allow_fallback):
137
+ """Invoke optional prepare_metadata_for_build_wheel
138
+
139
+ Implements a fallback by building a wheel if the hook isn't defined,
140
+ unless _allow_fallback is False in which case HookMissing is raised.
141
+ """
142
+ backend = _build_backend()
143
+ try:
144
+ hook = backend.prepare_metadata_for_build_wheel
145
+ except AttributeError:
146
+ if not _allow_fallback:
147
+ raise HookMissing()
148
+ else:
149
+ return hook(metadata_directory, config_settings)
150
+ # fallback to build_wheel outside the try block to avoid exception chaining
151
+ # which can be confusing to users and is not relevant
152
+ whl_basename = backend.build_wheel(metadata_directory, config_settings)
153
+ return _get_wheel_metadata_from_wheel(whl_basename, metadata_directory,
154
+ config_settings)
155
+
156
+
157
+ def prepare_metadata_for_build_editable(
158
+ metadata_directory, config_settings, _allow_fallback):
159
+ """Invoke optional prepare_metadata_for_build_editable
160
+
161
+ Implements a fallback by building an editable wheel if the hook isn't
162
+ defined, unless _allow_fallback is False in which case HookMissing is
163
+ raised.
164
+ """
165
+ backend = _build_backend()
166
+ try:
167
+ hook = backend.prepare_metadata_for_build_editable
168
+ except AttributeError:
169
+ if not _allow_fallback:
170
+ raise HookMissing()
171
+ try:
172
+ build_hook = backend.build_editable
173
+ except AttributeError:
174
+ raise HookMissing(hook_name='build_editable')
175
+ else:
176
+ whl_basename = build_hook(metadata_directory, config_settings)
177
+ return _get_wheel_metadata_from_wheel(whl_basename,
178
+ metadata_directory,
179
+ config_settings)
180
+ else:
181
+ return hook(metadata_directory, config_settings)
182
+
183
+
184
+ WHEEL_BUILT_MARKER = 'PEP517_ALREADY_BUILT_WHEEL'
185
+
186
+
187
+ def _dist_info_files(whl_zip):
188
+ """Identify the .dist-info folder inside a wheel ZipFile."""
189
+ res = []
190
+ for path in whl_zip.namelist():
191
+ m = re.match(r'[^/\\]+-[^/\\]+\.dist-info/', path)
192
+ if m:
193
+ res.append(path)
194
+ if res:
195
+ return res
196
+ raise Exception("No .dist-info folder found in wheel")
197
+
198
+
199
+ def _get_wheel_metadata_from_wheel(
200
+ whl_basename, metadata_directory, config_settings):
201
+ """Extract the metadata from a wheel.
202
+
203
+ Fallback for when the build backend does not
204
+ define the 'get_wheel_metadata' hook.
205
+ """
206
+ from zipfile import ZipFile
207
+ with open(os.path.join(metadata_directory, WHEEL_BUILT_MARKER), 'wb'):
208
+ pass # Touch marker file
209
+
210
+ whl_file = os.path.join(metadata_directory, whl_basename)
211
+ with ZipFile(whl_file) as zipf:
212
+ dist_info = _dist_info_files(zipf)
213
+ zipf.extractall(path=metadata_directory, members=dist_info)
214
+ return dist_info[0].split('/')[0]
215
+
216
+
217
+ def _find_already_built_wheel(metadata_directory):
218
+ """Check for a wheel already built during the get_wheel_metadata hook.
219
+ """
220
+ if not metadata_directory:
221
+ return None
222
+ metadata_parent = os.path.dirname(metadata_directory)
223
+ if not os.path.isfile(pjoin(metadata_parent, WHEEL_BUILT_MARKER)):
224
+ return None
225
+
226
+ whl_files = glob(os.path.join(metadata_parent, '*.whl'))
227
+ if not whl_files:
228
+ print('Found wheel built marker, but no .whl files')
229
+ return None
230
+ if len(whl_files) > 1:
231
+ print('Found multiple .whl files; unspecified behaviour. '
232
+ 'Will call build_wheel.')
233
+ return None
234
+
235
+ # Exactly one .whl file
236
+ return whl_files[0]
237
+
238
+
239
+ def build_wheel(wheel_directory, config_settings, metadata_directory=None):
240
+ """Invoke the mandatory build_wheel hook.
241
+
242
+ If a wheel was already built in the
243
+ prepare_metadata_for_build_wheel fallback, this
244
+ will copy it rather than rebuilding the wheel.
245
+ """
246
+ prebuilt_whl = _find_already_built_wheel(metadata_directory)
247
+ if prebuilt_whl:
248
+ shutil.copy2(prebuilt_whl, wheel_directory)
249
+ return os.path.basename(prebuilt_whl)
250
+
251
+ return _build_backend().build_wheel(wheel_directory, config_settings,
252
+ metadata_directory)
253
+
254
+
255
+ def build_editable(wheel_directory, config_settings, metadata_directory=None):
256
+ """Invoke the optional build_editable hook.
257
+
258
+ If a wheel was already built in the
259
+ prepare_metadata_for_build_editable fallback, this
260
+ will copy it rather than rebuilding the wheel.
261
+ """
262
+ backend = _build_backend()
263
+ try:
264
+ hook = backend.build_editable
265
+ except AttributeError:
266
+ raise HookMissing()
267
+ else:
268
+ prebuilt_whl = _find_already_built_wheel(metadata_directory)
269
+ if prebuilt_whl:
270
+ shutil.copy2(prebuilt_whl, wheel_directory)
271
+ return os.path.basename(prebuilt_whl)
272
+
273
+ return hook(wheel_directory, config_settings, metadata_directory)
274
+
275
+
276
+ def get_requires_for_build_sdist(config_settings):
277
+ """Invoke the optional get_requires_for_build_wheel hook
278
+
279
+ Returns [] if the hook is not defined.
280
+ """
281
+ backend = _build_backend()
282
+ try:
283
+ hook = backend.get_requires_for_build_sdist
284
+ except AttributeError:
285
+ return []
286
+ else:
287
+ return hook(config_settings)
288
+
289
+
290
+ class _DummyException(Exception):
291
+ """Nothing should ever raise this exception"""
292
+
293
+
294
+ class GotUnsupportedOperation(Exception):
295
+ """For internal use when backend raises UnsupportedOperation"""
296
+ def __init__(self, traceback):
297
+ self.traceback = traceback
298
+
299
+
300
+ def build_sdist(sdist_directory, config_settings):
301
+ """Invoke the mandatory build_sdist hook."""
302
+ backend = _build_backend()
303
+ try:
304
+ return backend.build_sdist(sdist_directory, config_settings)
305
+ except getattr(backend, 'UnsupportedOperation', _DummyException):
306
+ raise GotUnsupportedOperation(traceback.format_exc())
307
+
308
+
309
+ HOOK_NAMES = {
310
+ 'get_requires_for_build_wheel',
311
+ 'prepare_metadata_for_build_wheel',
312
+ 'build_wheel',
313
+ 'get_requires_for_build_editable',
314
+ 'prepare_metadata_for_build_editable',
315
+ 'build_editable',
316
+ 'get_requires_for_build_sdist',
317
+ 'build_sdist',
318
+ '_supported_features',
319
+ }
320
+
321
+
322
+ def main():
323
+ if len(sys.argv) < 3:
324
+ sys.exit("Needs args: hook_name, control_dir")
325
+ hook_name = sys.argv[1]
326
+ control_dir = sys.argv[2]
327
+ if hook_name not in HOOK_NAMES:
328
+ sys.exit("Unknown hook: %s" % hook_name)
329
+ hook = globals()[hook_name]
330
+
331
+ hook_input = read_json(pjoin(control_dir, 'input.json'))
332
+
333
+ json_out = {'unsupported': False, 'return_val': None}
334
+ try:
335
+ json_out['return_val'] = hook(**hook_input['kwargs'])
336
+ except BackendUnavailable as e:
337
+ json_out['no_backend'] = True
338
+ json_out['traceback'] = e.traceback
339
+ except BackendInvalid as e:
340
+ json_out['backend_invalid'] = True
341
+ json_out['backend_error'] = e.message
342
+ except GotUnsupportedOperation as e:
343
+ json_out['unsupported'] = True
344
+ json_out['traceback'] = e.traceback
345
+ except HookMissing as e:
346
+ json_out['hook_missing'] = True
347
+ json_out['missing_hook_name'] = e.hook_name or hook_name
348
+
349
+ write_json(json_out, pjoin(control_dir, 'output.json'), indent=2)
350
+
351
+
352
+ if __name__ == '__main__':
353
+ main()