ayymen commited on
Commit
4858319
·
verified ·
1 Parent(s): 07641cc

Upload tokenizer

Browse files
Files changed (3) hide show
  1. added_tokens.json +203 -203
  2. sentencepiece.bpe.model +2 -2
  3. tokenizer_config.json +203 -203
added_tokens.json CHANGED
@@ -1,205 +1,205 @@
1
  {
2
- "<mask>": 14045,
3
- "ace_Arab": 14046,
4
- "ace_Latn": 14047,
5
- "acm_Arab": 14048,
6
- "acq_Arab": 14049,
7
- "aeb_Arab": 14050,
8
- "afr_Latn": 14051,
9
- "ajp_Arab": 14052,
10
- "aka_Latn": 14053,
11
- "als_Latn": 14207,
12
- "amh_Ethi": 14054,
13
- "apc_Arab": 14055,
14
- "arb_Arab": 14056,
15
- "ars_Arab": 14057,
16
- "ary_Arab": 14058,
17
- "arz_Arab": 14059,
18
- "asm_Beng": 14060,
19
- "ast_Latn": 14061,
20
- "awa_Deva": 14062,
21
- "ayr_Latn": 14063,
22
- "azb_Arab": 14064,
23
- "azj_Latn": 14065,
24
- "bak_Cyrl": 14066,
25
- "bam_Latn": 14067,
26
- "ban_Latn": 14068,
27
- "bel_Cyrl": 14069,
28
- "bem_Latn": 14070,
29
- "ben_Beng": 14071,
30
- "bho_Deva": 14072,
31
- "bjn_Arab": 14073,
32
- "bjn_Latn": 14074,
33
- "bod_Tibt": 14075,
34
- "bos_Latn": 14076,
35
- "bug_Latn": 14077,
36
- "bul_Cyrl": 14078,
37
- "cat_Latn": 14079,
38
- "ceb_Latn": 14080,
39
- "ces_Latn": 14081,
40
- "cjk_Latn": 14082,
41
- "ckb_Arab": 14083,
42
- "crh_Latn": 14084,
43
- "cym_Latn": 14085,
44
- "dan_Latn": 14086,
45
- "deu_Latn": 14087,
46
- "dik_Latn": 14088,
47
- "dyu_Latn": 14089,
48
- "dzo_Tibt": 14090,
49
- "ell_Grek": 14091,
50
- "eng_Latn": 14092,
51
- "epo_Latn": 14093,
52
- "est_Latn": 14094,
53
- "eus_Latn": 14095,
54
- "ewe_Latn": 14096,
55
- "fao_Latn": 14097,
56
- "fij_Latn": 14099,
57
- "fin_Latn": 14100,
58
- "fon_Latn": 14101,
59
- "fra_Latn": 14102,
60
- "fur_Latn": 14103,
61
- "fuv_Latn": 14104,
62
- "gaz_Latn": 14180,
63
- "gla_Latn": 14105,
64
- "gle_Latn": 14106,
65
- "glg_Latn": 14107,
66
- "grn_Latn": 14108,
67
- "guj_Gujr": 14109,
68
- "hat_Latn": 14110,
69
- "hau_Latn": 14111,
70
- "heb_Hebr": 14112,
71
- "hin_Deva": 14113,
72
- "hne_Deva": 14114,
73
- "hrv_Latn": 14115,
74
- "hun_Latn": 14116,
75
- "hye_Armn": 14117,
76
- "ibo_Latn": 14118,
77
- "ilo_Latn": 14119,
78
- "ind_Latn": 14120,
79
- "isl_Latn": 14121,
80
- "ita_Latn": 14122,
81
- "jav_Latn": 14123,
82
- "jpn_Jpan": 14124,
83
- "kab_Latn": 14125,
84
- "kac_Latn": 14126,
85
- "kam_Latn": 14127,
86
- "kan_Knda": 14128,
87
- "kas_Arab": 14129,
88
- "kas_Deva": 14130,
89
- "kat_Geor": 14131,
90
- "kaz_Cyrl": 14134,
91
- "kbp_Latn": 14135,
92
- "kea_Latn": 14136,
93
- "khk_Cyrl": 14167,
94
- "khm_Khmr": 14137,
95
- "kik_Latn": 14138,
96
- "kin_Latn": 14139,
97
- "kir_Cyrl": 14140,
98
- "kmb_Latn": 14141,
99
- "kmr_Latn": 14144,
100
- "knc_Arab": 14132,
101
- "knc_Latn": 14133,
102
- "kon_Latn": 14142,
103
- "kor_Hang": 14143,
104
- "lao_Laoo": 14145,
105
- "lij_Latn": 14147,
106
- "lim_Latn": 14148,
107
- "lin_Latn": 14149,
108
- "lit_Latn": 14150,
109
- "lmo_Latn": 14151,
110
- "ltg_Latn": 14152,
111
- "ltz_Latn": 14153,
112
- "lua_Latn": 14154,
113
- "lug_Latn": 14155,
114
- "luo_Latn": 14156,
115
- "lus_Latn": 14157,
116
- "lvs_Latn": 14146,
117
- "mag_Deva": 14158,
118
- "mai_Deva": 14159,
119
- "mal_Mlym": 14160,
120
- "mar_Deva": 14161,
121
- "min_Latn": 14162,
122
- "mkd_Cyrl": 14163,
123
- "mlt_Latn": 14165,
124
- "mni_Beng": 14166,
125
- "mos_Latn": 14168,
126
- "mri_Latn": 14169,
127
- "mya_Mymr": 14171,
128
- "nld_Latn": 14172,
129
- "nno_Latn": 14173,
130
- "nob_Latn": 14174,
131
- "npi_Deva": 14175,
132
- "nso_Latn": 14176,
133
- "nus_Latn": 14177,
134
- "nya_Latn": 14178,
135
- "oci_Latn": 14179,
136
- "ory_Orya": 14181,
137
- "pag_Latn": 14182,
138
- "pan_Guru": 14183,
139
- "pap_Latn": 14184,
140
- "pbt_Arab": 14188,
141
- "pes_Arab": 14098,
142
- "plt_Latn": 14164,
143
- "pol_Latn": 14185,
144
- "por_Latn": 14186,
145
- "prs_Arab": 14187,
146
- "quy_Latn": 14189,
147
- "ron_Latn": 14190,
148
- "run_Latn": 14191,
149
- "rus_Cyrl": 14192,
150
- "sag_Latn": 14193,
151
- "san_Deva": 14194,
152
- "sat_Beng": 14195,
153
- "scn_Latn": 14196,
154
- "shn_Mymr": 14197,
155
- "sin_Sinh": 14198,
156
- "slk_Latn": 14199,
157
- "slv_Latn": 14200,
158
- "smo_Latn": 14201,
159
- "sna_Latn": 14202,
160
- "snd_Arab": 14203,
161
- "som_Latn": 14204,
162
- "sot_Latn": 14205,
163
- "spa_Latn": 14206,
164
- "srd_Latn": 14208,
165
- "srp_Cyrl": 14209,
166
- "ssw_Latn": 14210,
167
- "sun_Latn": 14211,
168
- "swe_Latn": 14212,
169
- "swh_Latn": 14213,
170
- "szl_Latn": 14214,
171
- "tam_Taml": 14215,
172
- "taq_Latn": 14222,
173
- "taq_Tfng": 14223,
174
- "tat_Cyrl": 14216,
175
- "tel_Telu": 14217,
176
- "tgk_Cyrl": 14218,
177
- "tgl_Latn": 14219,
178
- "tha_Thai": 14220,
179
- "tir_Ethi": 14221,
180
- "tpi_Latn": 14224,
181
- "tsn_Latn": 14225,
182
- "tso_Latn": 14226,
183
- "tuk_Latn": 14227,
184
- "tum_Latn": 14228,
185
- "tur_Latn": 14229,
186
- "twi_Latn": 14230,
187
- "tzm_Tfng": 14231,
188
- "uig_Arab": 14232,
189
- "ukr_Cyrl": 14233,
190
- "umb_Latn": 14234,
191
- "urd_Arab": 14235,
192
- "uzn_Latn": 14236,
193
- "vec_Latn": 14237,
194
- "vie_Latn": 14238,
195
- "war_Latn": 14239,
196
- "wol_Latn": 14240,
197
- "xho_Latn": 14241,
198
- "ydd_Hebr": 14242,
199
- "yor_Latn": 14243,
200
- "yue_Hant": 14244,
201
- "zho_Hans": 14245,
202
- "zho_Hant": 14246,
203
- "zsm_Latn": 14170,
204
- "zul_Latn": 14247
205
  }
 
1
  {
2
+ "<mask>": 15070,
3
+ "ace_Arab": 15071,
4
+ "ace_Latn": 15072,
5
+ "acm_Arab": 15073,
6
+ "acq_Arab": 15074,
7
+ "aeb_Arab": 15075,
8
+ "afr_Latn": 15076,
9
+ "ajp_Arab": 15077,
10
+ "aka_Latn": 15078,
11
+ "als_Latn": 15232,
12
+ "amh_Ethi": 15079,
13
+ "apc_Arab": 15080,
14
+ "arb_Arab": 15081,
15
+ "ars_Arab": 15082,
16
+ "ary_Arab": 15083,
17
+ "arz_Arab": 15084,
18
+ "asm_Beng": 15085,
19
+ "ast_Latn": 15086,
20
+ "awa_Deva": 15087,
21
+ "ayr_Latn": 15088,
22
+ "azb_Arab": 15089,
23
+ "azj_Latn": 15090,
24
+ "bak_Cyrl": 15091,
25
+ "bam_Latn": 15092,
26
+ "ban_Latn": 15093,
27
+ "bel_Cyrl": 15094,
28
+ "bem_Latn": 15095,
29
+ "ben_Beng": 15096,
30
+ "bho_Deva": 15097,
31
+ "bjn_Arab": 15098,
32
+ "bjn_Latn": 15099,
33
+ "bod_Tibt": 15100,
34
+ "bos_Latn": 15101,
35
+ "bug_Latn": 15102,
36
+ "bul_Cyrl": 15103,
37
+ "cat_Latn": 15104,
38
+ "ceb_Latn": 15105,
39
+ "ces_Latn": 15106,
40
+ "cjk_Latn": 15107,
41
+ "ckb_Arab": 15108,
42
+ "crh_Latn": 15109,
43
+ "cym_Latn": 15110,
44
+ "dan_Latn": 15111,
45
+ "deu_Latn": 15112,
46
+ "dik_Latn": 15113,
47
+ "dyu_Latn": 15114,
48
+ "dzo_Tibt": 15115,
49
+ "ell_Grek": 15116,
50
+ "eng_Latn": 15117,
51
+ "epo_Latn": 15118,
52
+ "est_Latn": 15119,
53
+ "eus_Latn": 15120,
54
+ "ewe_Latn": 15121,
55
+ "fao_Latn": 15122,
56
+ "fij_Latn": 15124,
57
+ "fin_Latn": 15125,
58
+ "fon_Latn": 15126,
59
+ "fra_Latn": 15127,
60
+ "fur_Latn": 15128,
61
+ "fuv_Latn": 15129,
62
+ "gaz_Latn": 15205,
63
+ "gla_Latn": 15130,
64
+ "gle_Latn": 15131,
65
+ "glg_Latn": 15132,
66
+ "grn_Latn": 15133,
67
+ "guj_Gujr": 15134,
68
+ "hat_Latn": 15135,
69
+ "hau_Latn": 15136,
70
+ "heb_Hebr": 15137,
71
+ "hin_Deva": 15138,
72
+ "hne_Deva": 15139,
73
+ "hrv_Latn": 15140,
74
+ "hun_Latn": 15141,
75
+ "hye_Armn": 15142,
76
+ "ibo_Latn": 15143,
77
+ "ilo_Latn": 15144,
78
+ "ind_Latn": 15145,
79
+ "isl_Latn": 15146,
80
+ "ita_Latn": 15147,
81
+ "jav_Latn": 15148,
82
+ "jpn_Jpan": 15149,
83
+ "kab_Latn": 15150,
84
+ "kac_Latn": 15151,
85
+ "kam_Latn": 15152,
86
+ "kan_Knda": 15153,
87
+ "kas_Arab": 15154,
88
+ "kas_Deva": 15155,
89
+ "kat_Geor": 15156,
90
+ "kaz_Cyrl": 15159,
91
+ "kbp_Latn": 15160,
92
+ "kea_Latn": 15161,
93
+ "khk_Cyrl": 15192,
94
+ "khm_Khmr": 15162,
95
+ "kik_Latn": 15163,
96
+ "kin_Latn": 15164,
97
+ "kir_Cyrl": 15165,
98
+ "kmb_Latn": 15166,
99
+ "kmr_Latn": 15169,
100
+ "knc_Arab": 15157,
101
+ "knc_Latn": 15158,
102
+ "kon_Latn": 15167,
103
+ "kor_Hang": 15168,
104
+ "lao_Laoo": 15170,
105
+ "lij_Latn": 15172,
106
+ "lim_Latn": 15173,
107
+ "lin_Latn": 15174,
108
+ "lit_Latn": 15175,
109
+ "lmo_Latn": 15176,
110
+ "ltg_Latn": 15177,
111
+ "ltz_Latn": 15178,
112
+ "lua_Latn": 15179,
113
+ "lug_Latn": 15180,
114
+ "luo_Latn": 15181,
115
+ "lus_Latn": 15182,
116
+ "lvs_Latn": 15171,
117
+ "mag_Deva": 15183,
118
+ "mai_Deva": 15184,
119
+ "mal_Mlym": 15185,
120
+ "mar_Deva": 15186,
121
+ "min_Latn": 15187,
122
+ "mkd_Cyrl": 15188,
123
+ "mlt_Latn": 15190,
124
+ "mni_Beng": 15191,
125
+ "mos_Latn": 15193,
126
+ "mri_Latn": 15194,
127
+ "mya_Mymr": 15196,
128
+ "nld_Latn": 15197,
129
+ "nno_Latn": 15198,
130
+ "nob_Latn": 15199,
131
+ "npi_Deva": 15200,
132
+ "nso_Latn": 15201,
133
+ "nus_Latn": 15202,
134
+ "nya_Latn": 15203,
135
+ "oci_Latn": 15204,
136
+ "ory_Orya": 15206,
137
+ "pag_Latn": 15207,
138
+ "pan_Guru": 15208,
139
+ "pap_Latn": 15209,
140
+ "pbt_Arab": 15213,
141
+ "pes_Arab": 15123,
142
+ "plt_Latn": 15189,
143
+ "pol_Latn": 15210,
144
+ "por_Latn": 15211,
145
+ "prs_Arab": 15212,
146
+ "quy_Latn": 15214,
147
+ "ron_Latn": 15215,
148
+ "run_Latn": 15216,
149
+ "rus_Cyrl": 15217,
150
+ "sag_Latn": 15218,
151
+ "san_Deva": 15219,
152
+ "sat_Beng": 15220,
153
+ "scn_Latn": 15221,
154
+ "shn_Mymr": 15222,
155
+ "sin_Sinh": 15223,
156
+ "slk_Latn": 15224,
157
+ "slv_Latn": 15225,
158
+ "smo_Latn": 15226,
159
+ "sna_Latn": 15227,
160
+ "snd_Arab": 15228,
161
+ "som_Latn": 15229,
162
+ "sot_Latn": 15230,
163
+ "spa_Latn": 15231,
164
+ "srd_Latn": 15233,
165
+ "srp_Cyrl": 15234,
166
+ "ssw_Latn": 15235,
167
+ "sun_Latn": 15236,
168
+ "swe_Latn": 15237,
169
+ "swh_Latn": 15238,
170
+ "szl_Latn": 15239,
171
+ "tam_Taml": 15240,
172
+ "taq_Latn": 15247,
173
+ "taq_Tfng": 15248,
174
+ "tat_Cyrl": 15241,
175
+ "tel_Telu": 15242,
176
+ "tgk_Cyrl": 15243,
177
+ "tgl_Latn": 15244,
178
+ "tha_Thai": 15245,
179
+ "tir_Ethi": 15246,
180
+ "tpi_Latn": 15249,
181
+ "tsn_Latn": 15250,
182
+ "tso_Latn": 15251,
183
+ "tuk_Latn": 15252,
184
+ "tum_Latn": 15253,
185
+ "tur_Latn": 15254,
186
+ "twi_Latn": 15255,
187
+ "tzm_Tfng": 15256,
188
+ "uig_Arab": 15257,
189
+ "ukr_Cyrl": 15258,
190
+ "umb_Latn": 15259,
191
+ "urd_Arab": 15260,
192
+ "uzn_Latn": 15261,
193
+ "vec_Latn": 15262,
194
+ "vie_Latn": 15263,
195
+ "war_Latn": 15264,
196
+ "wol_Latn": 15265,
197
+ "xho_Latn": 15266,
198
+ "ydd_Hebr": 15267,
199
+ "yor_Latn": 15268,
200
+ "yue_Hant": 15269,
201
+ "zho_Hans": 15270,
202
+ "zho_Hant": 15271,
203
+ "zsm_Latn": 15195,
204
+ "zul_Latn": 15272
205
  }
sentencepiece.bpe.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4cd4478a6e2887e0312413a4d8eb780ff03e38913cd231bd83e00e4f5305cfc
3
- size 502660
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0755cc25485187df053783aa1da1d121882d7ffecf4d1cbec1c8b48bc228edd
3
+ size 471840
tokenizer_config.json CHANGED
@@ -32,7 +32,7 @@
32
  "single_word": false,
33
  "special": true
34
  },
35
- "14045": {
36
  "content": "<mask>",
37
  "lstrip": true,
38
  "normalized": true,
@@ -40,7 +40,7 @@
40
  "single_word": false,
41
  "special": true
42
  },
43
- "14046": {
44
  "content": "ace_Arab",
45
  "lstrip": false,
46
  "normalized": false,
@@ -48,7 +48,7 @@
48
  "single_word": false,
49
  "special": true
50
  },
51
- "14047": {
52
  "content": "ace_Latn",
53
  "lstrip": false,
54
  "normalized": false,
@@ -56,7 +56,7 @@
56
  "single_word": false,
57
  "special": true
58
  },
59
- "14048": {
60
  "content": "acm_Arab",
61
  "lstrip": false,
62
  "normalized": false,
@@ -64,7 +64,7 @@
64
  "single_word": false,
65
  "special": true
66
  },
67
- "14049": {
68
  "content": "acq_Arab",
69
  "lstrip": false,
70
  "normalized": false,
@@ -72,7 +72,7 @@
72
  "single_word": false,
73
  "special": true
74
  },
75
- "14050": {
76
  "content": "aeb_Arab",
77
  "lstrip": false,
78
  "normalized": false,
@@ -80,7 +80,7 @@
80
  "single_word": false,
81
  "special": true
82
  },
83
- "14051": {
84
  "content": "afr_Latn",
85
  "lstrip": false,
86
  "normalized": false,
@@ -88,7 +88,7 @@
88
  "single_word": false,
89
  "special": true
90
  },
91
- "14052": {
92
  "content": "ajp_Arab",
93
  "lstrip": false,
94
  "normalized": false,
@@ -96,7 +96,7 @@
96
  "single_word": false,
97
  "special": true
98
  },
99
- "14053": {
100
  "content": "aka_Latn",
101
  "lstrip": false,
102
  "normalized": false,
@@ -104,7 +104,7 @@
104
  "single_word": false,
105
  "special": true
106
  },
107
- "14054": {
108
  "content": "amh_Ethi",
109
  "lstrip": false,
110
  "normalized": false,
@@ -112,7 +112,7 @@
112
  "single_word": false,
113
  "special": true
114
  },
115
- "14055": {
116
  "content": "apc_Arab",
117
  "lstrip": false,
118
  "normalized": false,
@@ -120,7 +120,7 @@
120
  "single_word": false,
121
  "special": true
122
  },
123
- "14056": {
124
  "content": "arb_Arab",
125
  "lstrip": false,
126
  "normalized": false,
@@ -128,7 +128,7 @@
128
  "single_word": false,
129
  "special": true
130
  },
131
- "14057": {
132
  "content": "ars_Arab",
133
  "lstrip": false,
134
  "normalized": false,
@@ -136,7 +136,7 @@
136
  "single_word": false,
137
  "special": true
138
  },
139
- "14058": {
140
  "content": "ary_Arab",
141
  "lstrip": false,
142
  "normalized": false,
@@ -144,7 +144,7 @@
144
  "single_word": false,
145
  "special": true
146
  },
147
- "14059": {
148
  "content": "arz_Arab",
149
  "lstrip": false,
150
  "normalized": false,
@@ -152,7 +152,7 @@
152
  "single_word": false,
153
  "special": true
154
  },
155
- "14060": {
156
  "content": "asm_Beng",
157
  "lstrip": false,
158
  "normalized": false,
@@ -160,7 +160,7 @@
160
  "single_word": false,
161
  "special": true
162
  },
163
- "14061": {
164
  "content": "ast_Latn",
165
  "lstrip": false,
166
  "normalized": false,
@@ -168,7 +168,7 @@
168
  "single_word": false,
169
  "special": true
170
  },
171
- "14062": {
172
  "content": "awa_Deva",
173
  "lstrip": false,
174
  "normalized": false,
@@ -176,7 +176,7 @@
176
  "single_word": false,
177
  "special": true
178
  },
179
- "14063": {
180
  "content": "ayr_Latn",
181
  "lstrip": false,
182
  "normalized": false,
@@ -184,7 +184,7 @@
184
  "single_word": false,
185
  "special": true
186
  },
187
- "14064": {
188
  "content": "azb_Arab",
189
  "lstrip": false,
190
  "normalized": false,
@@ -192,7 +192,7 @@
192
  "single_word": false,
193
  "special": true
194
  },
195
- "14065": {
196
  "content": "azj_Latn",
197
  "lstrip": false,
198
  "normalized": false,
@@ -200,7 +200,7 @@
200
  "single_word": false,
201
  "special": true
202
  },
203
- "14066": {
204
  "content": "bak_Cyrl",
205
  "lstrip": false,
206
  "normalized": false,
@@ -208,7 +208,7 @@
208
  "single_word": false,
209
  "special": true
210
  },
211
- "14067": {
212
  "content": "bam_Latn",
213
  "lstrip": false,
214
  "normalized": false,
@@ -216,7 +216,7 @@
216
  "single_word": false,
217
  "special": true
218
  },
219
- "14068": {
220
  "content": "ban_Latn",
221
  "lstrip": false,
222
  "normalized": false,
@@ -224,7 +224,7 @@
224
  "single_word": false,
225
  "special": true
226
  },
227
- "14069": {
228
  "content": "bel_Cyrl",
229
  "lstrip": false,
230
  "normalized": false,
@@ -232,7 +232,7 @@
232
  "single_word": false,
233
  "special": true
234
  },
235
- "14070": {
236
  "content": "bem_Latn",
237
  "lstrip": false,
238
  "normalized": false,
@@ -240,7 +240,7 @@
240
  "single_word": false,
241
  "special": true
242
  },
243
- "14071": {
244
  "content": "ben_Beng",
245
  "lstrip": false,
246
  "normalized": false,
@@ -248,7 +248,7 @@
248
  "single_word": false,
249
  "special": true
250
  },
251
- "14072": {
252
  "content": "bho_Deva",
253
  "lstrip": false,
254
  "normalized": false,
@@ -256,7 +256,7 @@
256
  "single_word": false,
257
  "special": true
258
  },
259
- "14073": {
260
  "content": "bjn_Arab",
261
  "lstrip": false,
262
  "normalized": false,
@@ -264,7 +264,7 @@
264
  "single_word": false,
265
  "special": true
266
  },
267
- "14074": {
268
  "content": "bjn_Latn",
269
  "lstrip": false,
270
  "normalized": false,
@@ -272,7 +272,7 @@
272
  "single_word": false,
273
  "special": true
274
  },
275
- "14075": {
276
  "content": "bod_Tibt",
277
  "lstrip": false,
278
  "normalized": false,
@@ -280,7 +280,7 @@
280
  "single_word": false,
281
  "special": true
282
  },
283
- "14076": {
284
  "content": "bos_Latn",
285
  "lstrip": false,
286
  "normalized": false,
@@ -288,7 +288,7 @@
288
  "single_word": false,
289
  "special": true
290
  },
291
- "14077": {
292
  "content": "bug_Latn",
293
  "lstrip": false,
294
  "normalized": false,
@@ -296,7 +296,7 @@
296
  "single_word": false,
297
  "special": true
298
  },
299
- "14078": {
300
  "content": "bul_Cyrl",
301
  "lstrip": false,
302
  "normalized": false,
@@ -304,7 +304,7 @@
304
  "single_word": false,
305
  "special": true
306
  },
307
- "14079": {
308
  "content": "cat_Latn",
309
  "lstrip": false,
310
  "normalized": false,
@@ -312,7 +312,7 @@
312
  "single_word": false,
313
  "special": true
314
  },
315
- "14080": {
316
  "content": "ceb_Latn",
317
  "lstrip": false,
318
  "normalized": false,
@@ -320,7 +320,7 @@
320
  "single_word": false,
321
  "special": true
322
  },
323
- "14081": {
324
  "content": "ces_Latn",
325
  "lstrip": false,
326
  "normalized": false,
@@ -328,7 +328,7 @@
328
  "single_word": false,
329
  "special": true
330
  },
331
- "14082": {
332
  "content": "cjk_Latn",
333
  "lstrip": false,
334
  "normalized": false,
@@ -336,7 +336,7 @@
336
  "single_word": false,
337
  "special": true
338
  },
339
- "14083": {
340
  "content": "ckb_Arab",
341
  "lstrip": false,
342
  "normalized": false,
@@ -344,7 +344,7 @@
344
  "single_word": false,
345
  "special": true
346
  },
347
- "14084": {
348
  "content": "crh_Latn",
349
  "lstrip": false,
350
  "normalized": false,
@@ -352,7 +352,7 @@
352
  "single_word": false,
353
  "special": true
354
  },
355
- "14085": {
356
  "content": "cym_Latn",
357
  "lstrip": false,
358
  "normalized": false,
@@ -360,7 +360,7 @@
360
  "single_word": false,
361
  "special": true
362
  },
363
- "14086": {
364
  "content": "dan_Latn",
365
  "lstrip": false,
366
  "normalized": false,
@@ -368,7 +368,7 @@
368
  "single_word": false,
369
  "special": true
370
  },
371
- "14087": {
372
  "content": "deu_Latn",
373
  "lstrip": false,
374
  "normalized": false,
@@ -376,7 +376,7 @@
376
  "single_word": false,
377
  "special": true
378
  },
379
- "14088": {
380
  "content": "dik_Latn",
381
  "lstrip": false,
382
  "normalized": false,
@@ -384,7 +384,7 @@
384
  "single_word": false,
385
  "special": true
386
  },
387
- "14089": {
388
  "content": "dyu_Latn",
389
  "lstrip": false,
390
  "normalized": false,
@@ -392,7 +392,7 @@
392
  "single_word": false,
393
  "special": true
394
  },
395
- "14090": {
396
  "content": "dzo_Tibt",
397
  "lstrip": false,
398
  "normalized": false,
@@ -400,7 +400,7 @@
400
  "single_word": false,
401
  "special": true
402
  },
403
- "14091": {
404
  "content": "ell_Grek",
405
  "lstrip": false,
406
  "normalized": false,
@@ -408,7 +408,7 @@
408
  "single_word": false,
409
  "special": true
410
  },
411
- "14092": {
412
  "content": "eng_Latn",
413
  "lstrip": false,
414
  "normalized": false,
@@ -416,7 +416,7 @@
416
  "single_word": false,
417
  "special": true
418
  },
419
- "14093": {
420
  "content": "epo_Latn",
421
  "lstrip": false,
422
  "normalized": false,
@@ -424,7 +424,7 @@
424
  "single_word": false,
425
  "special": true
426
  },
427
- "14094": {
428
  "content": "est_Latn",
429
  "lstrip": false,
430
  "normalized": false,
@@ -432,7 +432,7 @@
432
  "single_word": false,
433
  "special": true
434
  },
435
- "14095": {
436
  "content": "eus_Latn",
437
  "lstrip": false,
438
  "normalized": false,
@@ -440,7 +440,7 @@
440
  "single_word": false,
441
  "special": true
442
  },
443
- "14096": {
444
  "content": "ewe_Latn",
445
  "lstrip": false,
446
  "normalized": false,
@@ -448,7 +448,7 @@
448
  "single_word": false,
449
  "special": true
450
  },
451
- "14097": {
452
  "content": "fao_Latn",
453
  "lstrip": false,
454
  "normalized": false,
@@ -456,7 +456,7 @@
456
  "single_word": false,
457
  "special": true
458
  },
459
- "14098": {
460
  "content": "pes_Arab",
461
  "lstrip": false,
462
  "normalized": false,
@@ -464,7 +464,7 @@
464
  "single_word": false,
465
  "special": true
466
  },
467
- "14099": {
468
  "content": "fij_Latn",
469
  "lstrip": false,
470
  "normalized": false,
@@ -472,7 +472,7 @@
472
  "single_word": false,
473
  "special": true
474
  },
475
- "14100": {
476
  "content": "fin_Latn",
477
  "lstrip": false,
478
  "normalized": false,
@@ -480,7 +480,7 @@
480
  "single_word": false,
481
  "special": true
482
  },
483
- "14101": {
484
  "content": "fon_Latn",
485
  "lstrip": false,
486
  "normalized": false,
@@ -488,7 +488,7 @@
488
  "single_word": false,
489
  "special": true
490
  },
491
- "14102": {
492
  "content": "fra_Latn",
493
  "lstrip": false,
494
  "normalized": false,
@@ -496,7 +496,7 @@
496
  "single_word": false,
497
  "special": true
498
  },
499
- "14103": {
500
  "content": "fur_Latn",
501
  "lstrip": false,
502
  "normalized": false,
@@ -504,7 +504,7 @@
504
  "single_word": false,
505
  "special": true
506
  },
507
- "14104": {
508
  "content": "fuv_Latn",
509
  "lstrip": false,
510
  "normalized": false,
@@ -512,7 +512,7 @@
512
  "single_word": false,
513
  "special": true
514
  },
515
- "14105": {
516
  "content": "gla_Latn",
517
  "lstrip": false,
518
  "normalized": false,
@@ -520,7 +520,7 @@
520
  "single_word": false,
521
  "special": true
522
  },
523
- "14106": {
524
  "content": "gle_Latn",
525
  "lstrip": false,
526
  "normalized": false,
@@ -528,7 +528,7 @@
528
  "single_word": false,
529
  "special": true
530
  },
531
- "14107": {
532
  "content": "glg_Latn",
533
  "lstrip": false,
534
  "normalized": false,
@@ -536,7 +536,7 @@
536
  "single_word": false,
537
  "special": true
538
  },
539
- "14108": {
540
  "content": "grn_Latn",
541
  "lstrip": false,
542
  "normalized": false,
@@ -544,7 +544,7 @@
544
  "single_word": false,
545
  "special": true
546
  },
547
- "14109": {
548
  "content": "guj_Gujr",
549
  "lstrip": false,
550
  "normalized": false,
@@ -552,7 +552,7 @@
552
  "single_word": false,
553
  "special": true
554
  },
555
- "14110": {
556
  "content": "hat_Latn",
557
  "lstrip": false,
558
  "normalized": false,
@@ -560,7 +560,7 @@
560
  "single_word": false,
561
  "special": true
562
  },
563
- "14111": {
564
  "content": "hau_Latn",
565
  "lstrip": false,
566
  "normalized": false,
@@ -568,7 +568,7 @@
568
  "single_word": false,
569
  "special": true
570
  },
571
- "14112": {
572
  "content": "heb_Hebr",
573
  "lstrip": false,
574
  "normalized": false,
@@ -576,7 +576,7 @@
576
  "single_word": false,
577
  "special": true
578
  },
579
- "14113": {
580
  "content": "hin_Deva",
581
  "lstrip": false,
582
  "normalized": false,
@@ -584,7 +584,7 @@
584
  "single_word": false,
585
  "special": true
586
  },
587
- "14114": {
588
  "content": "hne_Deva",
589
  "lstrip": false,
590
  "normalized": false,
@@ -592,7 +592,7 @@
592
  "single_word": false,
593
  "special": true
594
  },
595
- "14115": {
596
  "content": "hrv_Latn",
597
  "lstrip": false,
598
  "normalized": false,
@@ -600,7 +600,7 @@
600
  "single_word": false,
601
  "special": true
602
  },
603
- "14116": {
604
  "content": "hun_Latn",
605
  "lstrip": false,
606
  "normalized": false,
@@ -608,7 +608,7 @@
608
  "single_word": false,
609
  "special": true
610
  },
611
- "14117": {
612
  "content": "hye_Armn",
613
  "lstrip": false,
614
  "normalized": false,
@@ -616,7 +616,7 @@
616
  "single_word": false,
617
  "special": true
618
  },
619
- "14118": {
620
  "content": "ibo_Latn",
621
  "lstrip": false,
622
  "normalized": false,
@@ -624,7 +624,7 @@
624
  "single_word": false,
625
  "special": true
626
  },
627
- "14119": {
628
  "content": "ilo_Latn",
629
  "lstrip": false,
630
  "normalized": false,
@@ -632,7 +632,7 @@
632
  "single_word": false,
633
  "special": true
634
  },
635
- "14120": {
636
  "content": "ind_Latn",
637
  "lstrip": false,
638
  "normalized": false,
@@ -640,7 +640,7 @@
640
  "single_word": false,
641
  "special": true
642
  },
643
- "14121": {
644
  "content": "isl_Latn",
645
  "lstrip": false,
646
  "normalized": false,
@@ -648,7 +648,7 @@
648
  "single_word": false,
649
  "special": true
650
  },
651
- "14122": {
652
  "content": "ita_Latn",
653
  "lstrip": false,
654
  "normalized": false,
@@ -656,7 +656,7 @@
656
  "single_word": false,
657
  "special": true
658
  },
659
- "14123": {
660
  "content": "jav_Latn",
661
  "lstrip": false,
662
  "normalized": false,
@@ -664,7 +664,7 @@
664
  "single_word": false,
665
  "special": true
666
  },
667
- "14124": {
668
  "content": "jpn_Jpan",
669
  "lstrip": false,
670
  "normalized": false,
@@ -672,7 +672,7 @@
672
  "single_word": false,
673
  "special": true
674
  },
675
- "14125": {
676
  "content": "kab_Latn",
677
  "lstrip": false,
678
  "normalized": false,
@@ -680,7 +680,7 @@
680
  "single_word": false,
681
  "special": true
682
  },
683
- "14126": {
684
  "content": "kac_Latn",
685
  "lstrip": false,
686
  "normalized": false,
@@ -688,7 +688,7 @@
688
  "single_word": false,
689
  "special": true
690
  },
691
- "14127": {
692
  "content": "kam_Latn",
693
  "lstrip": false,
694
  "normalized": false,
@@ -696,7 +696,7 @@
696
  "single_word": false,
697
  "special": true
698
  },
699
- "14128": {
700
  "content": "kan_Knda",
701
  "lstrip": false,
702
  "normalized": false,
@@ -704,7 +704,7 @@
704
  "single_word": false,
705
  "special": true
706
  },
707
- "14129": {
708
  "content": "kas_Arab",
709
  "lstrip": false,
710
  "normalized": false,
@@ -712,7 +712,7 @@
712
  "single_word": false,
713
  "special": true
714
  },
715
- "14130": {
716
  "content": "kas_Deva",
717
  "lstrip": false,
718
  "normalized": false,
@@ -720,7 +720,7 @@
720
  "single_word": false,
721
  "special": true
722
  },
723
- "14131": {
724
  "content": "kat_Geor",
725
  "lstrip": false,
726
  "normalized": false,
@@ -728,7 +728,7 @@
728
  "single_word": false,
729
  "special": true
730
  },
731
- "14132": {
732
  "content": "knc_Arab",
733
  "lstrip": false,
734
  "normalized": false,
@@ -736,7 +736,7 @@
736
  "single_word": false,
737
  "special": true
738
  },
739
- "14133": {
740
  "content": "knc_Latn",
741
  "lstrip": false,
742
  "normalized": false,
@@ -744,7 +744,7 @@
744
  "single_word": false,
745
  "special": true
746
  },
747
- "14134": {
748
  "content": "kaz_Cyrl",
749
  "lstrip": false,
750
  "normalized": false,
@@ -752,7 +752,7 @@
752
  "single_word": false,
753
  "special": true
754
  },
755
- "14135": {
756
  "content": "kbp_Latn",
757
  "lstrip": false,
758
  "normalized": false,
@@ -760,7 +760,7 @@
760
  "single_word": false,
761
  "special": true
762
  },
763
- "14136": {
764
  "content": "kea_Latn",
765
  "lstrip": false,
766
  "normalized": false,
@@ -768,7 +768,7 @@
768
  "single_word": false,
769
  "special": true
770
  },
771
- "14137": {
772
  "content": "khm_Khmr",
773
  "lstrip": false,
774
  "normalized": false,
@@ -776,7 +776,7 @@
776
  "single_word": false,
777
  "special": true
778
  },
779
- "14138": {
780
  "content": "kik_Latn",
781
  "lstrip": false,
782
  "normalized": false,
@@ -784,7 +784,7 @@
784
  "single_word": false,
785
  "special": true
786
  },
787
- "14139": {
788
  "content": "kin_Latn",
789
  "lstrip": false,
790
  "normalized": false,
@@ -792,7 +792,7 @@
792
  "single_word": false,
793
  "special": true
794
  },
795
- "14140": {
796
  "content": "kir_Cyrl",
797
  "lstrip": false,
798
  "normalized": false,
@@ -800,7 +800,7 @@
800
  "single_word": false,
801
  "special": true
802
  },
803
- "14141": {
804
  "content": "kmb_Latn",
805
  "lstrip": false,
806
  "normalized": false,
@@ -808,7 +808,7 @@
808
  "single_word": false,
809
  "special": true
810
  },
811
- "14142": {
812
  "content": "kon_Latn",
813
  "lstrip": false,
814
  "normalized": false,
@@ -816,7 +816,7 @@
816
  "single_word": false,
817
  "special": true
818
  },
819
- "14143": {
820
  "content": "kor_Hang",
821
  "lstrip": false,
822
  "normalized": false,
@@ -824,7 +824,7 @@
824
  "single_word": false,
825
  "special": true
826
  },
827
- "14144": {
828
  "content": "kmr_Latn",
829
  "lstrip": false,
830
  "normalized": false,
@@ -832,7 +832,7 @@
832
  "single_word": false,
833
  "special": true
834
  },
835
- "14145": {
836
  "content": "lao_Laoo",
837
  "lstrip": false,
838
  "normalized": false,
@@ -840,7 +840,7 @@
840
  "single_word": false,
841
  "special": true
842
  },
843
- "14146": {
844
  "content": "lvs_Latn",
845
  "lstrip": false,
846
  "normalized": false,
@@ -848,7 +848,7 @@
848
  "single_word": false,
849
  "special": true
850
  },
851
- "14147": {
852
  "content": "lij_Latn",
853
  "lstrip": false,
854
  "normalized": false,
@@ -856,7 +856,7 @@
856
  "single_word": false,
857
  "special": true
858
  },
859
- "14148": {
860
  "content": "lim_Latn",
861
  "lstrip": false,
862
  "normalized": false,
@@ -864,7 +864,7 @@
864
  "single_word": false,
865
  "special": true
866
  },
867
- "14149": {
868
  "content": "lin_Latn",
869
  "lstrip": false,
870
  "normalized": false,
@@ -872,7 +872,7 @@
872
  "single_word": false,
873
  "special": true
874
  },
875
- "14150": {
876
  "content": "lit_Latn",
877
  "lstrip": false,
878
  "normalized": false,
@@ -880,7 +880,7 @@
880
  "single_word": false,
881
  "special": true
882
  },
883
- "14151": {
884
  "content": "lmo_Latn",
885
  "lstrip": false,
886
  "normalized": false,
@@ -888,7 +888,7 @@
888
  "single_word": false,
889
  "special": true
890
  },
891
- "14152": {
892
  "content": "ltg_Latn",
893
  "lstrip": false,
894
  "normalized": false,
@@ -896,7 +896,7 @@
896
  "single_word": false,
897
  "special": true
898
  },
899
- "14153": {
900
  "content": "ltz_Latn",
901
  "lstrip": false,
902
  "normalized": false,
@@ -904,7 +904,7 @@
904
  "single_word": false,
905
  "special": true
906
  },
907
- "14154": {
908
  "content": "lua_Latn",
909
  "lstrip": false,
910
  "normalized": false,
@@ -912,7 +912,7 @@
912
  "single_word": false,
913
  "special": true
914
  },
915
- "14155": {
916
  "content": "lug_Latn",
917
  "lstrip": false,
918
  "normalized": false,
@@ -920,7 +920,7 @@
920
  "single_word": false,
921
  "special": true
922
  },
923
- "14156": {
924
  "content": "luo_Latn",
925
  "lstrip": false,
926
  "normalized": false,
@@ -928,7 +928,7 @@
928
  "single_word": false,
929
  "special": true
930
  },
931
- "14157": {
932
  "content": "lus_Latn",
933
  "lstrip": false,
934
  "normalized": false,
@@ -936,7 +936,7 @@
936
  "single_word": false,
937
  "special": true
938
  },
939
- "14158": {
940
  "content": "mag_Deva",
941
  "lstrip": false,
942
  "normalized": false,
@@ -944,7 +944,7 @@
944
  "single_word": false,
945
  "special": true
946
  },
947
- "14159": {
948
  "content": "mai_Deva",
949
  "lstrip": false,
950
  "normalized": false,
@@ -952,7 +952,7 @@
952
  "single_word": false,
953
  "special": true
954
  },
955
- "14160": {
956
  "content": "mal_Mlym",
957
  "lstrip": false,
958
  "normalized": false,
@@ -960,7 +960,7 @@
960
  "single_word": false,
961
  "special": true
962
  },
963
- "14161": {
964
  "content": "mar_Deva",
965
  "lstrip": false,
966
  "normalized": false,
@@ -968,7 +968,7 @@
968
  "single_word": false,
969
  "special": true
970
  },
971
- "14162": {
972
  "content": "min_Latn",
973
  "lstrip": false,
974
  "normalized": false,
@@ -976,7 +976,7 @@
976
  "single_word": false,
977
  "special": true
978
  },
979
- "14163": {
980
  "content": "mkd_Cyrl",
981
  "lstrip": false,
982
  "normalized": false,
@@ -984,7 +984,7 @@
984
  "single_word": false,
985
  "special": true
986
  },
987
- "14164": {
988
  "content": "plt_Latn",
989
  "lstrip": false,
990
  "normalized": false,
@@ -992,7 +992,7 @@
992
  "single_word": false,
993
  "special": true
994
  },
995
- "14165": {
996
  "content": "mlt_Latn",
997
  "lstrip": false,
998
  "normalized": false,
@@ -1000,7 +1000,7 @@
1000
  "single_word": false,
1001
  "special": true
1002
  },
1003
- "14166": {
1004
  "content": "mni_Beng",
1005
  "lstrip": false,
1006
  "normalized": false,
@@ -1008,7 +1008,7 @@
1008
  "single_word": false,
1009
  "special": true
1010
  },
1011
- "14167": {
1012
  "content": "khk_Cyrl",
1013
  "lstrip": false,
1014
  "normalized": false,
@@ -1016,7 +1016,7 @@
1016
  "single_word": false,
1017
  "special": true
1018
  },
1019
- "14168": {
1020
  "content": "mos_Latn",
1021
  "lstrip": false,
1022
  "normalized": false,
@@ -1024,7 +1024,7 @@
1024
  "single_word": false,
1025
  "special": true
1026
  },
1027
- "14169": {
1028
  "content": "mri_Latn",
1029
  "lstrip": false,
1030
  "normalized": false,
@@ -1032,7 +1032,7 @@
1032
  "single_word": false,
1033
  "special": true
1034
  },
1035
- "14170": {
1036
  "content": "zsm_Latn",
1037
  "lstrip": false,
1038
  "normalized": false,
@@ -1040,7 +1040,7 @@
1040
  "single_word": false,
1041
  "special": true
1042
  },
1043
- "14171": {
1044
  "content": "mya_Mymr",
1045
  "lstrip": false,
1046
  "normalized": false,
@@ -1048,7 +1048,7 @@
1048
  "single_word": false,
1049
  "special": true
1050
  },
1051
- "14172": {
1052
  "content": "nld_Latn",
1053
  "lstrip": false,
1054
  "normalized": false,
@@ -1056,7 +1056,7 @@
1056
  "single_word": false,
1057
  "special": true
1058
  },
1059
- "14173": {
1060
  "content": "nno_Latn",
1061
  "lstrip": false,
1062
  "normalized": false,
@@ -1064,7 +1064,7 @@
1064
  "single_word": false,
1065
  "special": true
1066
  },
1067
- "14174": {
1068
  "content": "nob_Latn",
1069
  "lstrip": false,
1070
  "normalized": false,
@@ -1072,7 +1072,7 @@
1072
  "single_word": false,
1073
  "special": true
1074
  },
1075
- "14175": {
1076
  "content": "npi_Deva",
1077
  "lstrip": false,
1078
  "normalized": false,
@@ -1080,7 +1080,7 @@
1080
  "single_word": false,
1081
  "special": true
1082
  },
1083
- "14176": {
1084
  "content": "nso_Latn",
1085
  "lstrip": false,
1086
  "normalized": false,
@@ -1088,7 +1088,7 @@
1088
  "single_word": false,
1089
  "special": true
1090
  },
1091
- "14177": {
1092
  "content": "nus_Latn",
1093
  "lstrip": false,
1094
  "normalized": false,
@@ -1096,7 +1096,7 @@
1096
  "single_word": false,
1097
  "special": true
1098
  },
1099
- "14178": {
1100
  "content": "nya_Latn",
1101
  "lstrip": false,
1102
  "normalized": false,
@@ -1104,7 +1104,7 @@
1104
  "single_word": false,
1105
  "special": true
1106
  },
1107
- "14179": {
1108
  "content": "oci_Latn",
1109
  "lstrip": false,
1110
  "normalized": false,
@@ -1112,7 +1112,7 @@
1112
  "single_word": false,
1113
  "special": true
1114
  },
1115
- "14180": {
1116
  "content": "gaz_Latn",
1117
  "lstrip": false,
1118
  "normalized": false,
@@ -1120,7 +1120,7 @@
1120
  "single_word": false,
1121
  "special": true
1122
  },
1123
- "14181": {
1124
  "content": "ory_Orya",
1125
  "lstrip": false,
1126
  "normalized": false,
@@ -1128,7 +1128,7 @@
1128
  "single_word": false,
1129
  "special": true
1130
  },
1131
- "14182": {
1132
  "content": "pag_Latn",
1133
  "lstrip": false,
1134
  "normalized": false,
@@ -1136,7 +1136,7 @@
1136
  "single_word": false,
1137
  "special": true
1138
  },
1139
- "14183": {
1140
  "content": "pan_Guru",
1141
  "lstrip": false,
1142
  "normalized": false,
@@ -1144,7 +1144,7 @@
1144
  "single_word": false,
1145
  "special": true
1146
  },
1147
- "14184": {
1148
  "content": "pap_Latn",
1149
  "lstrip": false,
1150
  "normalized": false,
@@ -1152,7 +1152,7 @@
1152
  "single_word": false,
1153
  "special": true
1154
  },
1155
- "14185": {
1156
  "content": "pol_Latn",
1157
  "lstrip": false,
1158
  "normalized": false,
@@ -1160,7 +1160,7 @@
1160
  "single_word": false,
1161
  "special": true
1162
  },
1163
- "14186": {
1164
  "content": "por_Latn",
1165
  "lstrip": false,
1166
  "normalized": false,
@@ -1168,7 +1168,7 @@
1168
  "single_word": false,
1169
  "special": true
1170
  },
1171
- "14187": {
1172
  "content": "prs_Arab",
1173
  "lstrip": false,
1174
  "normalized": false,
@@ -1176,7 +1176,7 @@
1176
  "single_word": false,
1177
  "special": true
1178
  },
1179
- "14188": {
1180
  "content": "pbt_Arab",
1181
  "lstrip": false,
1182
  "normalized": false,
@@ -1184,7 +1184,7 @@
1184
  "single_word": false,
1185
  "special": true
1186
  },
1187
- "14189": {
1188
  "content": "quy_Latn",
1189
  "lstrip": false,
1190
  "normalized": false,
@@ -1192,7 +1192,7 @@
1192
  "single_word": false,
1193
  "special": true
1194
  },
1195
- "14190": {
1196
  "content": "ron_Latn",
1197
  "lstrip": false,
1198
  "normalized": false,
@@ -1200,7 +1200,7 @@
1200
  "single_word": false,
1201
  "special": true
1202
  },
1203
- "14191": {
1204
  "content": "run_Latn",
1205
  "lstrip": false,
1206
  "normalized": false,
@@ -1208,7 +1208,7 @@
1208
  "single_word": false,
1209
  "special": true
1210
  },
1211
- "14192": {
1212
  "content": "rus_Cyrl",
1213
  "lstrip": false,
1214
  "normalized": false,
@@ -1216,7 +1216,7 @@
1216
  "single_word": false,
1217
  "special": true
1218
  },
1219
- "14193": {
1220
  "content": "sag_Latn",
1221
  "lstrip": false,
1222
  "normalized": false,
@@ -1224,7 +1224,7 @@
1224
  "single_word": false,
1225
  "special": true
1226
  },
1227
- "14194": {
1228
  "content": "san_Deva",
1229
  "lstrip": false,
1230
  "normalized": false,
@@ -1232,7 +1232,7 @@
1232
  "single_word": false,
1233
  "special": true
1234
  },
1235
- "14195": {
1236
  "content": "sat_Beng",
1237
  "lstrip": false,
1238
  "normalized": false,
@@ -1240,7 +1240,7 @@
1240
  "single_word": false,
1241
  "special": true
1242
  },
1243
- "14196": {
1244
  "content": "scn_Latn",
1245
  "lstrip": false,
1246
  "normalized": false,
@@ -1248,7 +1248,7 @@
1248
  "single_word": false,
1249
  "special": true
1250
  },
1251
- "14197": {
1252
  "content": "shn_Mymr",
1253
  "lstrip": false,
1254
  "normalized": false,
@@ -1256,7 +1256,7 @@
1256
  "single_word": false,
1257
  "special": true
1258
  },
1259
- "14198": {
1260
  "content": "sin_Sinh",
1261
  "lstrip": false,
1262
  "normalized": false,
@@ -1264,7 +1264,7 @@
1264
  "single_word": false,
1265
  "special": true
1266
  },
1267
- "14199": {
1268
  "content": "slk_Latn",
1269
  "lstrip": false,
1270
  "normalized": false,
@@ -1272,7 +1272,7 @@
1272
  "single_word": false,
1273
  "special": true
1274
  },
1275
- "14200": {
1276
  "content": "slv_Latn",
1277
  "lstrip": false,
1278
  "normalized": false,
@@ -1280,7 +1280,7 @@
1280
  "single_word": false,
1281
  "special": true
1282
  },
1283
- "14201": {
1284
  "content": "smo_Latn",
1285
  "lstrip": false,
1286
  "normalized": false,
@@ -1288,7 +1288,7 @@
1288
  "single_word": false,
1289
  "special": true
1290
  },
1291
- "14202": {
1292
  "content": "sna_Latn",
1293
  "lstrip": false,
1294
  "normalized": false,
@@ -1296,7 +1296,7 @@
1296
  "single_word": false,
1297
  "special": true
1298
  },
1299
- "14203": {
1300
  "content": "snd_Arab",
1301
  "lstrip": false,
1302
  "normalized": false,
@@ -1304,7 +1304,7 @@
1304
  "single_word": false,
1305
  "special": true
1306
  },
1307
- "14204": {
1308
  "content": "som_Latn",
1309
  "lstrip": false,
1310
  "normalized": false,
@@ -1312,7 +1312,7 @@
1312
  "single_word": false,
1313
  "special": true
1314
  },
1315
- "14205": {
1316
  "content": "sot_Latn",
1317
  "lstrip": false,
1318
  "normalized": false,
@@ -1320,7 +1320,7 @@
1320
  "single_word": false,
1321
  "special": true
1322
  },
1323
- "14206": {
1324
  "content": "spa_Latn",
1325
  "lstrip": false,
1326
  "normalized": false,
@@ -1328,7 +1328,7 @@
1328
  "single_word": false,
1329
  "special": true
1330
  },
1331
- "14207": {
1332
  "content": "als_Latn",
1333
  "lstrip": false,
1334
  "normalized": false,
@@ -1336,7 +1336,7 @@
1336
  "single_word": false,
1337
  "special": true
1338
  },
1339
- "14208": {
1340
  "content": "srd_Latn",
1341
  "lstrip": false,
1342
  "normalized": false,
@@ -1344,7 +1344,7 @@
1344
  "single_word": false,
1345
  "special": true
1346
  },
1347
- "14209": {
1348
  "content": "srp_Cyrl",
1349
  "lstrip": false,
1350
  "normalized": false,
@@ -1352,7 +1352,7 @@
1352
  "single_word": false,
1353
  "special": true
1354
  },
1355
- "14210": {
1356
  "content": "ssw_Latn",
1357
  "lstrip": false,
1358
  "normalized": false,
@@ -1360,7 +1360,7 @@
1360
  "single_word": false,
1361
  "special": true
1362
  },
1363
- "14211": {
1364
  "content": "sun_Latn",
1365
  "lstrip": false,
1366
  "normalized": false,
@@ -1368,7 +1368,7 @@
1368
  "single_word": false,
1369
  "special": true
1370
  },
1371
- "14212": {
1372
  "content": "swe_Latn",
1373
  "lstrip": false,
1374
  "normalized": false,
@@ -1376,7 +1376,7 @@
1376
  "single_word": false,
1377
  "special": true
1378
  },
1379
- "14213": {
1380
  "content": "swh_Latn",
1381
  "lstrip": false,
1382
  "normalized": false,
@@ -1384,7 +1384,7 @@
1384
  "single_word": false,
1385
  "special": true
1386
  },
1387
- "14214": {
1388
  "content": "szl_Latn",
1389
  "lstrip": false,
1390
  "normalized": false,
@@ -1392,7 +1392,7 @@
1392
  "single_word": false,
1393
  "special": true
1394
  },
1395
- "14215": {
1396
  "content": "tam_Taml",
1397
  "lstrip": false,
1398
  "normalized": false,
@@ -1400,7 +1400,7 @@
1400
  "single_word": false,
1401
  "special": true
1402
  },
1403
- "14216": {
1404
  "content": "tat_Cyrl",
1405
  "lstrip": false,
1406
  "normalized": false,
@@ -1408,7 +1408,7 @@
1408
  "single_word": false,
1409
  "special": true
1410
  },
1411
- "14217": {
1412
  "content": "tel_Telu",
1413
  "lstrip": false,
1414
  "normalized": false,
@@ -1416,7 +1416,7 @@
1416
  "single_word": false,
1417
  "special": true
1418
  },
1419
- "14218": {
1420
  "content": "tgk_Cyrl",
1421
  "lstrip": false,
1422
  "normalized": false,
@@ -1424,7 +1424,7 @@
1424
  "single_word": false,
1425
  "special": true
1426
  },
1427
- "14219": {
1428
  "content": "tgl_Latn",
1429
  "lstrip": false,
1430
  "normalized": false,
@@ -1432,7 +1432,7 @@
1432
  "single_word": false,
1433
  "special": true
1434
  },
1435
- "14220": {
1436
  "content": "tha_Thai",
1437
  "lstrip": false,
1438
  "normalized": false,
@@ -1440,7 +1440,7 @@
1440
  "single_word": false,
1441
  "special": true
1442
  },
1443
- "14221": {
1444
  "content": "tir_Ethi",
1445
  "lstrip": false,
1446
  "normalized": false,
@@ -1448,7 +1448,7 @@
1448
  "single_word": false,
1449
  "special": true
1450
  },
1451
- "14222": {
1452
  "content": "taq_Latn",
1453
  "lstrip": false,
1454
  "normalized": false,
@@ -1456,7 +1456,7 @@
1456
  "single_word": false,
1457
  "special": true
1458
  },
1459
- "14223": {
1460
  "content": "taq_Tfng",
1461
  "lstrip": false,
1462
  "normalized": false,
@@ -1464,7 +1464,7 @@
1464
  "single_word": false,
1465
  "special": true
1466
  },
1467
- "14224": {
1468
  "content": "tpi_Latn",
1469
  "lstrip": false,
1470
  "normalized": false,
@@ -1472,7 +1472,7 @@
1472
  "single_word": false,
1473
  "special": true
1474
  },
1475
- "14225": {
1476
  "content": "tsn_Latn",
1477
  "lstrip": false,
1478
  "normalized": false,
@@ -1480,7 +1480,7 @@
1480
  "single_word": false,
1481
  "special": true
1482
  },
1483
- "14226": {
1484
  "content": "tso_Latn",
1485
  "lstrip": false,
1486
  "normalized": false,
@@ -1488,7 +1488,7 @@
1488
  "single_word": false,
1489
  "special": true
1490
  },
1491
- "14227": {
1492
  "content": "tuk_Latn",
1493
  "lstrip": false,
1494
  "normalized": false,
@@ -1496,7 +1496,7 @@
1496
  "single_word": false,
1497
  "special": true
1498
  },
1499
- "14228": {
1500
  "content": "tum_Latn",
1501
  "lstrip": false,
1502
  "normalized": false,
@@ -1504,7 +1504,7 @@
1504
  "single_word": false,
1505
  "special": true
1506
  },
1507
- "14229": {
1508
  "content": "tur_Latn",
1509
  "lstrip": false,
1510
  "normalized": false,
@@ -1512,7 +1512,7 @@
1512
  "single_word": false,
1513
  "special": true
1514
  },
1515
- "14230": {
1516
  "content": "twi_Latn",
1517
  "lstrip": false,
1518
  "normalized": false,
@@ -1520,7 +1520,7 @@
1520
  "single_word": false,
1521
  "special": true
1522
  },
1523
- "14231": {
1524
  "content": "tzm_Tfng",
1525
  "lstrip": false,
1526
  "normalized": false,
@@ -1528,7 +1528,7 @@
1528
  "single_word": false,
1529
  "special": true
1530
  },
1531
- "14232": {
1532
  "content": "uig_Arab",
1533
  "lstrip": false,
1534
  "normalized": false,
@@ -1536,7 +1536,7 @@
1536
  "single_word": false,
1537
  "special": true
1538
  },
1539
- "14233": {
1540
  "content": "ukr_Cyrl",
1541
  "lstrip": false,
1542
  "normalized": false,
@@ -1544,7 +1544,7 @@
1544
  "single_word": false,
1545
  "special": true
1546
  },
1547
- "14234": {
1548
  "content": "umb_Latn",
1549
  "lstrip": false,
1550
  "normalized": false,
@@ -1552,7 +1552,7 @@
1552
  "single_word": false,
1553
  "special": true
1554
  },
1555
- "14235": {
1556
  "content": "urd_Arab",
1557
  "lstrip": false,
1558
  "normalized": false,
@@ -1560,7 +1560,7 @@
1560
  "single_word": false,
1561
  "special": true
1562
  },
1563
- "14236": {
1564
  "content": "uzn_Latn",
1565
  "lstrip": false,
1566
  "normalized": false,
@@ -1568,7 +1568,7 @@
1568
  "single_word": false,
1569
  "special": true
1570
  },
1571
- "14237": {
1572
  "content": "vec_Latn",
1573
  "lstrip": false,
1574
  "normalized": false,
@@ -1576,7 +1576,7 @@
1576
  "single_word": false,
1577
  "special": true
1578
  },
1579
- "14238": {
1580
  "content": "vie_Latn",
1581
  "lstrip": false,
1582
  "normalized": false,
@@ -1584,7 +1584,7 @@
1584
  "single_word": false,
1585
  "special": true
1586
  },
1587
- "14239": {
1588
  "content": "war_Latn",
1589
  "lstrip": false,
1590
  "normalized": false,
@@ -1592,7 +1592,7 @@
1592
  "single_word": false,
1593
  "special": true
1594
  },
1595
- "14240": {
1596
  "content": "wol_Latn",
1597
  "lstrip": false,
1598
  "normalized": false,
@@ -1600,7 +1600,7 @@
1600
  "single_word": false,
1601
  "special": true
1602
  },
1603
- "14241": {
1604
  "content": "xho_Latn",
1605
  "lstrip": false,
1606
  "normalized": false,
@@ -1608,7 +1608,7 @@
1608
  "single_word": false,
1609
  "special": true
1610
  },
1611
- "14242": {
1612
  "content": "ydd_Hebr",
1613
  "lstrip": false,
1614
  "normalized": false,
@@ -1616,7 +1616,7 @@
1616
  "single_word": false,
1617
  "special": true
1618
  },
1619
- "14243": {
1620
  "content": "yor_Latn",
1621
  "lstrip": false,
1622
  "normalized": false,
@@ -1624,7 +1624,7 @@
1624
  "single_word": false,
1625
  "special": true
1626
  },
1627
- "14244": {
1628
  "content": "yue_Hant",
1629
  "lstrip": false,
1630
  "normalized": false,
@@ -1632,7 +1632,7 @@
1632
  "single_word": false,
1633
  "special": true
1634
  },
1635
- "14245": {
1636
  "content": "zho_Hans",
1637
  "lstrip": false,
1638
  "normalized": false,
@@ -1640,7 +1640,7 @@
1640
  "single_word": false,
1641
  "special": true
1642
  },
1643
- "14246": {
1644
  "content": "zho_Hant",
1645
  "lstrip": false,
1646
  "normalized": false,
@@ -1648,7 +1648,7 @@
1648
  "single_word": false,
1649
  "special": true
1650
  },
1651
- "14247": {
1652
  "content": "zul_Latn",
1653
  "lstrip": false,
1654
  "normalized": false,
 
32
  "single_word": false,
33
  "special": true
34
  },
35
+ "15070": {
36
  "content": "<mask>",
37
  "lstrip": true,
38
  "normalized": true,
 
40
  "single_word": false,
41
  "special": true
42
  },
43
+ "15071": {
44
  "content": "ace_Arab",
45
  "lstrip": false,
46
  "normalized": false,
 
48
  "single_word": false,
49
  "special": true
50
  },
51
+ "15072": {
52
  "content": "ace_Latn",
53
  "lstrip": false,
54
  "normalized": false,
 
56
  "single_word": false,
57
  "special": true
58
  },
59
+ "15073": {
60
  "content": "acm_Arab",
61
  "lstrip": false,
62
  "normalized": false,
 
64
  "single_word": false,
65
  "special": true
66
  },
67
+ "15074": {
68
  "content": "acq_Arab",
69
  "lstrip": false,
70
  "normalized": false,
 
72
  "single_word": false,
73
  "special": true
74
  },
75
+ "15075": {
76
  "content": "aeb_Arab",
77
  "lstrip": false,
78
  "normalized": false,
 
80
  "single_word": false,
81
  "special": true
82
  },
83
+ "15076": {
84
  "content": "afr_Latn",
85
  "lstrip": false,
86
  "normalized": false,
 
88
  "single_word": false,
89
  "special": true
90
  },
91
+ "15077": {
92
  "content": "ajp_Arab",
93
  "lstrip": false,
94
  "normalized": false,
 
96
  "single_word": false,
97
  "special": true
98
  },
99
+ "15078": {
100
  "content": "aka_Latn",
101
  "lstrip": false,
102
  "normalized": false,
 
104
  "single_word": false,
105
  "special": true
106
  },
107
+ "15079": {
108
  "content": "amh_Ethi",
109
  "lstrip": false,
110
  "normalized": false,
 
112
  "single_word": false,
113
  "special": true
114
  },
115
+ "15080": {
116
  "content": "apc_Arab",
117
  "lstrip": false,
118
  "normalized": false,
 
120
  "single_word": false,
121
  "special": true
122
  },
123
+ "15081": {
124
  "content": "arb_Arab",
125
  "lstrip": false,
126
  "normalized": false,
 
128
  "single_word": false,
129
  "special": true
130
  },
131
+ "15082": {
132
  "content": "ars_Arab",
133
  "lstrip": false,
134
  "normalized": false,
 
136
  "single_word": false,
137
  "special": true
138
  },
139
+ "15083": {
140
  "content": "ary_Arab",
141
  "lstrip": false,
142
  "normalized": false,
 
144
  "single_word": false,
145
  "special": true
146
  },
147
+ "15084": {
148
  "content": "arz_Arab",
149
  "lstrip": false,
150
  "normalized": false,
 
152
  "single_word": false,
153
  "special": true
154
  },
155
+ "15085": {
156
  "content": "asm_Beng",
157
  "lstrip": false,
158
  "normalized": false,
 
160
  "single_word": false,
161
  "special": true
162
  },
163
+ "15086": {
164
  "content": "ast_Latn",
165
  "lstrip": false,
166
  "normalized": false,
 
168
  "single_word": false,
169
  "special": true
170
  },
171
+ "15087": {
172
  "content": "awa_Deva",
173
  "lstrip": false,
174
  "normalized": false,
 
176
  "single_word": false,
177
  "special": true
178
  },
179
+ "15088": {
180
  "content": "ayr_Latn",
181
  "lstrip": false,
182
  "normalized": false,
 
184
  "single_word": false,
185
  "special": true
186
  },
187
+ "15089": {
188
  "content": "azb_Arab",
189
  "lstrip": false,
190
  "normalized": false,
 
192
  "single_word": false,
193
  "special": true
194
  },
195
+ "15090": {
196
  "content": "azj_Latn",
197
  "lstrip": false,
198
  "normalized": false,
 
200
  "single_word": false,
201
  "special": true
202
  },
203
+ "15091": {
204
  "content": "bak_Cyrl",
205
  "lstrip": false,
206
  "normalized": false,
 
208
  "single_word": false,
209
  "special": true
210
  },
211
+ "15092": {
212
  "content": "bam_Latn",
213
  "lstrip": false,
214
  "normalized": false,
 
216
  "single_word": false,
217
  "special": true
218
  },
219
+ "15093": {
220
  "content": "ban_Latn",
221
  "lstrip": false,
222
  "normalized": false,
 
224
  "single_word": false,
225
  "special": true
226
  },
227
+ "15094": {
228
  "content": "bel_Cyrl",
229
  "lstrip": false,
230
  "normalized": false,
 
232
  "single_word": false,
233
  "special": true
234
  },
235
+ "15095": {
236
  "content": "bem_Latn",
237
  "lstrip": false,
238
  "normalized": false,
 
240
  "single_word": false,
241
  "special": true
242
  },
243
+ "15096": {
244
  "content": "ben_Beng",
245
  "lstrip": false,
246
  "normalized": false,
 
248
  "single_word": false,
249
  "special": true
250
  },
251
+ "15097": {
252
  "content": "bho_Deva",
253
  "lstrip": false,
254
  "normalized": false,
 
256
  "single_word": false,
257
  "special": true
258
  },
259
+ "15098": {
260
  "content": "bjn_Arab",
261
  "lstrip": false,
262
  "normalized": false,
 
264
  "single_word": false,
265
  "special": true
266
  },
267
+ "15099": {
268
  "content": "bjn_Latn",
269
  "lstrip": false,
270
  "normalized": false,
 
272
  "single_word": false,
273
  "special": true
274
  },
275
+ "15100": {
276
  "content": "bod_Tibt",
277
  "lstrip": false,
278
  "normalized": false,
 
280
  "single_word": false,
281
  "special": true
282
  },
283
+ "15101": {
284
  "content": "bos_Latn",
285
  "lstrip": false,
286
  "normalized": false,
 
288
  "single_word": false,
289
  "special": true
290
  },
291
+ "15102": {
292
  "content": "bug_Latn",
293
  "lstrip": false,
294
  "normalized": false,
 
296
  "single_word": false,
297
  "special": true
298
  },
299
+ "15103": {
300
  "content": "bul_Cyrl",
301
  "lstrip": false,
302
  "normalized": false,
 
304
  "single_word": false,
305
  "special": true
306
  },
307
+ "15104": {
308
  "content": "cat_Latn",
309
  "lstrip": false,
310
  "normalized": false,
 
312
  "single_word": false,
313
  "special": true
314
  },
315
+ "15105": {
316
  "content": "ceb_Latn",
317
  "lstrip": false,
318
  "normalized": false,
 
320
  "single_word": false,
321
  "special": true
322
  },
323
+ "15106": {
324
  "content": "ces_Latn",
325
  "lstrip": false,
326
  "normalized": false,
 
328
  "single_word": false,
329
  "special": true
330
  },
331
+ "15107": {
332
  "content": "cjk_Latn",
333
  "lstrip": false,
334
  "normalized": false,
 
336
  "single_word": false,
337
  "special": true
338
  },
339
+ "15108": {
340
  "content": "ckb_Arab",
341
  "lstrip": false,
342
  "normalized": false,
 
344
  "single_word": false,
345
  "special": true
346
  },
347
+ "15109": {
348
  "content": "crh_Latn",
349
  "lstrip": false,
350
  "normalized": false,
 
352
  "single_word": false,
353
  "special": true
354
  },
355
+ "15110": {
356
  "content": "cym_Latn",
357
  "lstrip": false,
358
  "normalized": false,
 
360
  "single_word": false,
361
  "special": true
362
  },
363
+ "15111": {
364
  "content": "dan_Latn",
365
  "lstrip": false,
366
  "normalized": false,
 
368
  "single_word": false,
369
  "special": true
370
  },
371
+ "15112": {
372
  "content": "deu_Latn",
373
  "lstrip": false,
374
  "normalized": false,
 
376
  "single_word": false,
377
  "special": true
378
  },
379
+ "15113": {
380
  "content": "dik_Latn",
381
  "lstrip": false,
382
  "normalized": false,
 
384
  "single_word": false,
385
  "special": true
386
  },
387
+ "15114": {
388
  "content": "dyu_Latn",
389
  "lstrip": false,
390
  "normalized": false,
 
392
  "single_word": false,
393
  "special": true
394
  },
395
+ "15115": {
396
  "content": "dzo_Tibt",
397
  "lstrip": false,
398
  "normalized": false,
 
400
  "single_word": false,
401
  "special": true
402
  },
403
+ "15116": {
404
  "content": "ell_Grek",
405
  "lstrip": false,
406
  "normalized": false,
 
408
  "single_word": false,
409
  "special": true
410
  },
411
+ "15117": {
412
  "content": "eng_Latn",
413
  "lstrip": false,
414
  "normalized": false,
 
416
  "single_word": false,
417
  "special": true
418
  },
419
+ "15118": {
420
  "content": "epo_Latn",
421
  "lstrip": false,
422
  "normalized": false,
 
424
  "single_word": false,
425
  "special": true
426
  },
427
+ "15119": {
428
  "content": "est_Latn",
429
  "lstrip": false,
430
  "normalized": false,
 
432
  "single_word": false,
433
  "special": true
434
  },
435
+ "15120": {
436
  "content": "eus_Latn",
437
  "lstrip": false,
438
  "normalized": false,
 
440
  "single_word": false,
441
  "special": true
442
  },
443
+ "15121": {
444
  "content": "ewe_Latn",
445
  "lstrip": false,
446
  "normalized": false,
 
448
  "single_word": false,
449
  "special": true
450
  },
451
+ "15122": {
452
  "content": "fao_Latn",
453
  "lstrip": false,
454
  "normalized": false,
 
456
  "single_word": false,
457
  "special": true
458
  },
459
+ "15123": {
460
  "content": "pes_Arab",
461
  "lstrip": false,
462
  "normalized": false,
 
464
  "single_word": false,
465
  "special": true
466
  },
467
+ "15124": {
468
  "content": "fij_Latn",
469
  "lstrip": false,
470
  "normalized": false,
 
472
  "single_word": false,
473
  "special": true
474
  },
475
+ "15125": {
476
  "content": "fin_Latn",
477
  "lstrip": false,
478
  "normalized": false,
 
480
  "single_word": false,
481
  "special": true
482
  },
483
+ "15126": {
484
  "content": "fon_Latn",
485
  "lstrip": false,
486
  "normalized": false,
 
488
  "single_word": false,
489
  "special": true
490
  },
491
+ "15127": {
492
  "content": "fra_Latn",
493
  "lstrip": false,
494
  "normalized": false,
 
496
  "single_word": false,
497
  "special": true
498
  },
499
+ "15128": {
500
  "content": "fur_Latn",
501
  "lstrip": false,
502
  "normalized": false,
 
504
  "single_word": false,
505
  "special": true
506
  },
507
+ "15129": {
508
  "content": "fuv_Latn",
509
  "lstrip": false,
510
  "normalized": false,
 
512
  "single_word": false,
513
  "special": true
514
  },
515
+ "15130": {
516
  "content": "gla_Latn",
517
  "lstrip": false,
518
  "normalized": false,
 
520
  "single_word": false,
521
  "special": true
522
  },
523
+ "15131": {
524
  "content": "gle_Latn",
525
  "lstrip": false,
526
  "normalized": false,
 
528
  "single_word": false,
529
  "special": true
530
  },
531
+ "15132": {
532
  "content": "glg_Latn",
533
  "lstrip": false,
534
  "normalized": false,
 
536
  "single_word": false,
537
  "special": true
538
  },
539
+ "15133": {
540
  "content": "grn_Latn",
541
  "lstrip": false,
542
  "normalized": false,
 
544
  "single_word": false,
545
  "special": true
546
  },
547
+ "15134": {
548
  "content": "guj_Gujr",
549
  "lstrip": false,
550
  "normalized": false,
 
552
  "single_word": false,
553
  "special": true
554
  },
555
+ "15135": {
556
  "content": "hat_Latn",
557
  "lstrip": false,
558
  "normalized": false,
 
560
  "single_word": false,
561
  "special": true
562
  },
563
+ "15136": {
564
  "content": "hau_Latn",
565
  "lstrip": false,
566
  "normalized": false,
 
568
  "single_word": false,
569
  "special": true
570
  },
571
+ "15137": {
572
  "content": "heb_Hebr",
573
  "lstrip": false,
574
  "normalized": false,
 
576
  "single_word": false,
577
  "special": true
578
  },
579
+ "15138": {
580
  "content": "hin_Deva",
581
  "lstrip": false,
582
  "normalized": false,
 
584
  "single_word": false,
585
  "special": true
586
  },
587
+ "15139": {
588
  "content": "hne_Deva",
589
  "lstrip": false,
590
  "normalized": false,
 
592
  "single_word": false,
593
  "special": true
594
  },
595
+ "15140": {
596
  "content": "hrv_Latn",
597
  "lstrip": false,
598
  "normalized": false,
 
600
  "single_word": false,
601
  "special": true
602
  },
603
+ "15141": {
604
  "content": "hun_Latn",
605
  "lstrip": false,
606
  "normalized": false,
 
608
  "single_word": false,
609
  "special": true
610
  },
611
+ "15142": {
612
  "content": "hye_Armn",
613
  "lstrip": false,
614
  "normalized": false,
 
616
  "single_word": false,
617
  "special": true
618
  },
619
+ "15143": {
620
  "content": "ibo_Latn",
621
  "lstrip": false,
622
  "normalized": false,
 
624
  "single_word": false,
625
  "special": true
626
  },
627
+ "15144": {
628
  "content": "ilo_Latn",
629
  "lstrip": false,
630
  "normalized": false,
 
632
  "single_word": false,
633
  "special": true
634
  },
635
+ "15145": {
636
  "content": "ind_Latn",
637
  "lstrip": false,
638
  "normalized": false,
 
640
  "single_word": false,
641
  "special": true
642
  },
643
+ "15146": {
644
  "content": "isl_Latn",
645
  "lstrip": false,
646
  "normalized": false,
 
648
  "single_word": false,
649
  "special": true
650
  },
651
+ "15147": {
652
  "content": "ita_Latn",
653
  "lstrip": false,
654
  "normalized": false,
 
656
  "single_word": false,
657
  "special": true
658
  },
659
+ "15148": {
660
  "content": "jav_Latn",
661
  "lstrip": false,
662
  "normalized": false,
 
664
  "single_word": false,
665
  "special": true
666
  },
667
+ "15149": {
668
  "content": "jpn_Jpan",
669
  "lstrip": false,
670
  "normalized": false,
 
672
  "single_word": false,
673
  "special": true
674
  },
675
+ "15150": {
676
  "content": "kab_Latn",
677
  "lstrip": false,
678
  "normalized": false,
 
680
  "single_word": false,
681
  "special": true
682
  },
683
+ "15151": {
684
  "content": "kac_Latn",
685
  "lstrip": false,
686
  "normalized": false,
 
688
  "single_word": false,
689
  "special": true
690
  },
691
+ "15152": {
692
  "content": "kam_Latn",
693
  "lstrip": false,
694
  "normalized": false,
 
696
  "single_word": false,
697
  "special": true
698
  },
699
+ "15153": {
700
  "content": "kan_Knda",
701
  "lstrip": false,
702
  "normalized": false,
 
704
  "single_word": false,
705
  "special": true
706
  },
707
+ "15154": {
708
  "content": "kas_Arab",
709
  "lstrip": false,
710
  "normalized": false,
 
712
  "single_word": false,
713
  "special": true
714
  },
715
+ "15155": {
716
  "content": "kas_Deva",
717
  "lstrip": false,
718
  "normalized": false,
 
720
  "single_word": false,
721
  "special": true
722
  },
723
+ "15156": {
724
  "content": "kat_Geor",
725
  "lstrip": false,
726
  "normalized": false,
 
728
  "single_word": false,
729
  "special": true
730
  },
731
+ "15157": {
732
  "content": "knc_Arab",
733
  "lstrip": false,
734
  "normalized": false,
 
736
  "single_word": false,
737
  "special": true
738
  },
739
+ "15158": {
740
  "content": "knc_Latn",
741
  "lstrip": false,
742
  "normalized": false,
 
744
  "single_word": false,
745
  "special": true
746
  },
747
+ "15159": {
748
  "content": "kaz_Cyrl",
749
  "lstrip": false,
750
  "normalized": false,
 
752
  "single_word": false,
753
  "special": true
754
  },
755
+ "15160": {
756
  "content": "kbp_Latn",
757
  "lstrip": false,
758
  "normalized": false,
 
760
  "single_word": false,
761
  "special": true
762
  },
763
+ "15161": {
764
  "content": "kea_Latn",
765
  "lstrip": false,
766
  "normalized": false,
 
768
  "single_word": false,
769
  "special": true
770
  },
771
+ "15162": {
772
  "content": "khm_Khmr",
773
  "lstrip": false,
774
  "normalized": false,
 
776
  "single_word": false,
777
  "special": true
778
  },
779
+ "15163": {
780
  "content": "kik_Latn",
781
  "lstrip": false,
782
  "normalized": false,
 
784
  "single_word": false,
785
  "special": true
786
  },
787
+ "15164": {
788
  "content": "kin_Latn",
789
  "lstrip": false,
790
  "normalized": false,
 
792
  "single_word": false,
793
  "special": true
794
  },
795
+ "15165": {
796
  "content": "kir_Cyrl",
797
  "lstrip": false,
798
  "normalized": false,
 
800
  "single_word": false,
801
  "special": true
802
  },
803
+ "15166": {
804
  "content": "kmb_Latn",
805
  "lstrip": false,
806
  "normalized": false,
 
808
  "single_word": false,
809
  "special": true
810
  },
811
+ "15167": {
812
  "content": "kon_Latn",
813
  "lstrip": false,
814
  "normalized": false,
 
816
  "single_word": false,
817
  "special": true
818
  },
819
+ "15168": {
820
  "content": "kor_Hang",
821
  "lstrip": false,
822
  "normalized": false,
 
824
  "single_word": false,
825
  "special": true
826
  },
827
+ "15169": {
828
  "content": "kmr_Latn",
829
  "lstrip": false,
830
  "normalized": false,
 
832
  "single_word": false,
833
  "special": true
834
  },
835
+ "15170": {
836
  "content": "lao_Laoo",
837
  "lstrip": false,
838
  "normalized": false,
 
840
  "single_word": false,
841
  "special": true
842
  },
843
+ "15171": {
844
  "content": "lvs_Latn",
845
  "lstrip": false,
846
  "normalized": false,
 
848
  "single_word": false,
849
  "special": true
850
  },
851
+ "15172": {
852
  "content": "lij_Latn",
853
  "lstrip": false,
854
  "normalized": false,
 
856
  "single_word": false,
857
  "special": true
858
  },
859
+ "15173": {
860
  "content": "lim_Latn",
861
  "lstrip": false,
862
  "normalized": false,
 
864
  "single_word": false,
865
  "special": true
866
  },
867
+ "15174": {
868
  "content": "lin_Latn",
869
  "lstrip": false,
870
  "normalized": false,
 
872
  "single_word": false,
873
  "special": true
874
  },
875
+ "15175": {
876
  "content": "lit_Latn",
877
  "lstrip": false,
878
  "normalized": false,
 
880
  "single_word": false,
881
  "special": true
882
  },
883
+ "15176": {
884
  "content": "lmo_Latn",
885
  "lstrip": false,
886
  "normalized": false,
 
888
  "single_word": false,
889
  "special": true
890
  },
891
+ "15177": {
892
  "content": "ltg_Latn",
893
  "lstrip": false,
894
  "normalized": false,
 
896
  "single_word": false,
897
  "special": true
898
  },
899
+ "15178": {
900
  "content": "ltz_Latn",
901
  "lstrip": false,
902
  "normalized": false,
 
904
  "single_word": false,
905
  "special": true
906
  },
907
+ "15179": {
908
  "content": "lua_Latn",
909
  "lstrip": false,
910
  "normalized": false,
 
912
  "single_word": false,
913
  "special": true
914
  },
915
+ "15180": {
916
  "content": "lug_Latn",
917
  "lstrip": false,
918
  "normalized": false,
 
920
  "single_word": false,
921
  "special": true
922
  },
923
+ "15181": {
924
  "content": "luo_Latn",
925
  "lstrip": false,
926
  "normalized": false,
 
928
  "single_word": false,
929
  "special": true
930
  },
931
+ "15182": {
932
  "content": "lus_Latn",
933
  "lstrip": false,
934
  "normalized": false,
 
936
  "single_word": false,
937
  "special": true
938
  },
939
+ "15183": {
940
  "content": "mag_Deva",
941
  "lstrip": false,
942
  "normalized": false,
 
944
  "single_word": false,
945
  "special": true
946
  },
947
+ "15184": {
948
  "content": "mai_Deva",
949
  "lstrip": false,
950
  "normalized": false,
 
952
  "single_word": false,
953
  "special": true
954
  },
955
+ "15185": {
956
  "content": "mal_Mlym",
957
  "lstrip": false,
958
  "normalized": false,
 
960
  "single_word": false,
961
  "special": true
962
  },
963
+ "15186": {
964
  "content": "mar_Deva",
965
  "lstrip": false,
966
  "normalized": false,
 
968
  "single_word": false,
969
  "special": true
970
  },
971
+ "15187": {
972
  "content": "min_Latn",
973
  "lstrip": false,
974
  "normalized": false,
 
976
  "single_word": false,
977
  "special": true
978
  },
979
+ "15188": {
980
  "content": "mkd_Cyrl",
981
  "lstrip": false,
982
  "normalized": false,
 
984
  "single_word": false,
985
  "special": true
986
  },
987
+ "15189": {
988
  "content": "plt_Latn",
989
  "lstrip": false,
990
  "normalized": false,
 
992
  "single_word": false,
993
  "special": true
994
  },
995
+ "15190": {
996
  "content": "mlt_Latn",
997
  "lstrip": false,
998
  "normalized": false,
 
1000
  "single_word": false,
1001
  "special": true
1002
  },
1003
+ "15191": {
1004
  "content": "mni_Beng",
1005
  "lstrip": false,
1006
  "normalized": false,
 
1008
  "single_word": false,
1009
  "special": true
1010
  },
1011
+ "15192": {
1012
  "content": "khk_Cyrl",
1013
  "lstrip": false,
1014
  "normalized": false,
 
1016
  "single_word": false,
1017
  "special": true
1018
  },
1019
+ "15193": {
1020
  "content": "mos_Latn",
1021
  "lstrip": false,
1022
  "normalized": false,
 
1024
  "single_word": false,
1025
  "special": true
1026
  },
1027
+ "15194": {
1028
  "content": "mri_Latn",
1029
  "lstrip": false,
1030
  "normalized": false,
 
1032
  "single_word": false,
1033
  "special": true
1034
  },
1035
+ "15195": {
1036
  "content": "zsm_Latn",
1037
  "lstrip": false,
1038
  "normalized": false,
 
1040
  "single_word": false,
1041
  "special": true
1042
  },
1043
+ "15196": {
1044
  "content": "mya_Mymr",
1045
  "lstrip": false,
1046
  "normalized": false,
 
1048
  "single_word": false,
1049
  "special": true
1050
  },
1051
+ "15197": {
1052
  "content": "nld_Latn",
1053
  "lstrip": false,
1054
  "normalized": false,
 
1056
  "single_word": false,
1057
  "special": true
1058
  },
1059
+ "15198": {
1060
  "content": "nno_Latn",
1061
  "lstrip": false,
1062
  "normalized": false,
 
1064
  "single_word": false,
1065
  "special": true
1066
  },
1067
+ "15199": {
1068
  "content": "nob_Latn",
1069
  "lstrip": false,
1070
  "normalized": false,
 
1072
  "single_word": false,
1073
  "special": true
1074
  },
1075
+ "15200": {
1076
  "content": "npi_Deva",
1077
  "lstrip": false,
1078
  "normalized": false,
 
1080
  "single_word": false,
1081
  "special": true
1082
  },
1083
+ "15201": {
1084
  "content": "nso_Latn",
1085
  "lstrip": false,
1086
  "normalized": false,
 
1088
  "single_word": false,
1089
  "special": true
1090
  },
1091
+ "15202": {
1092
  "content": "nus_Latn",
1093
  "lstrip": false,
1094
  "normalized": false,
 
1096
  "single_word": false,
1097
  "special": true
1098
  },
1099
+ "15203": {
1100
  "content": "nya_Latn",
1101
  "lstrip": false,
1102
  "normalized": false,
 
1104
  "single_word": false,
1105
  "special": true
1106
  },
1107
+ "15204": {
1108
  "content": "oci_Latn",
1109
  "lstrip": false,
1110
  "normalized": false,
 
1112
  "single_word": false,
1113
  "special": true
1114
  },
1115
+ "15205": {
1116
  "content": "gaz_Latn",
1117
  "lstrip": false,
1118
  "normalized": false,
 
1120
  "single_word": false,
1121
  "special": true
1122
  },
1123
+ "15206": {
1124
  "content": "ory_Orya",
1125
  "lstrip": false,
1126
  "normalized": false,
 
1128
  "single_word": false,
1129
  "special": true
1130
  },
1131
+ "15207": {
1132
  "content": "pag_Latn",
1133
  "lstrip": false,
1134
  "normalized": false,
 
1136
  "single_word": false,
1137
  "special": true
1138
  },
1139
+ "15208": {
1140
  "content": "pan_Guru",
1141
  "lstrip": false,
1142
  "normalized": false,
 
1144
  "single_word": false,
1145
  "special": true
1146
  },
1147
+ "15209": {
1148
  "content": "pap_Latn",
1149
  "lstrip": false,
1150
  "normalized": false,
 
1152
  "single_word": false,
1153
  "special": true
1154
  },
1155
+ "15210": {
1156
  "content": "pol_Latn",
1157
  "lstrip": false,
1158
  "normalized": false,
 
1160
  "single_word": false,
1161
  "special": true
1162
  },
1163
+ "15211": {
1164
  "content": "por_Latn",
1165
  "lstrip": false,
1166
  "normalized": false,
 
1168
  "single_word": false,
1169
  "special": true
1170
  },
1171
+ "15212": {
1172
  "content": "prs_Arab",
1173
  "lstrip": false,
1174
  "normalized": false,
 
1176
  "single_word": false,
1177
  "special": true
1178
  },
1179
+ "15213": {
1180
  "content": "pbt_Arab",
1181
  "lstrip": false,
1182
  "normalized": false,
 
1184
  "single_word": false,
1185
  "special": true
1186
  },
1187
+ "15214": {
1188
  "content": "quy_Latn",
1189
  "lstrip": false,
1190
  "normalized": false,
 
1192
  "single_word": false,
1193
  "special": true
1194
  },
1195
+ "15215": {
1196
  "content": "ron_Latn",
1197
  "lstrip": false,
1198
  "normalized": false,
 
1200
  "single_word": false,
1201
  "special": true
1202
  },
1203
+ "15216": {
1204
  "content": "run_Latn",
1205
  "lstrip": false,
1206
  "normalized": false,
 
1208
  "single_word": false,
1209
  "special": true
1210
  },
1211
+ "15217": {
1212
  "content": "rus_Cyrl",
1213
  "lstrip": false,
1214
  "normalized": false,
 
1216
  "single_word": false,
1217
  "special": true
1218
  },
1219
+ "15218": {
1220
  "content": "sag_Latn",
1221
  "lstrip": false,
1222
  "normalized": false,
 
1224
  "single_word": false,
1225
  "special": true
1226
  },
1227
+ "15219": {
1228
  "content": "san_Deva",
1229
  "lstrip": false,
1230
  "normalized": false,
 
1232
  "single_word": false,
1233
  "special": true
1234
  },
1235
+ "15220": {
1236
  "content": "sat_Beng",
1237
  "lstrip": false,
1238
  "normalized": false,
 
1240
  "single_word": false,
1241
  "special": true
1242
  },
1243
+ "15221": {
1244
  "content": "scn_Latn",
1245
  "lstrip": false,
1246
  "normalized": false,
 
1248
  "single_word": false,
1249
  "special": true
1250
  },
1251
+ "15222": {
1252
  "content": "shn_Mymr",
1253
  "lstrip": false,
1254
  "normalized": false,
 
1256
  "single_word": false,
1257
  "special": true
1258
  },
1259
+ "15223": {
1260
  "content": "sin_Sinh",
1261
  "lstrip": false,
1262
  "normalized": false,
 
1264
  "single_word": false,
1265
  "special": true
1266
  },
1267
+ "15224": {
1268
  "content": "slk_Latn",
1269
  "lstrip": false,
1270
  "normalized": false,
 
1272
  "single_word": false,
1273
  "special": true
1274
  },
1275
+ "15225": {
1276
  "content": "slv_Latn",
1277
  "lstrip": false,
1278
  "normalized": false,
 
1280
  "single_word": false,
1281
  "special": true
1282
  },
1283
+ "15226": {
1284
  "content": "smo_Latn",
1285
  "lstrip": false,
1286
  "normalized": false,
 
1288
  "single_word": false,
1289
  "special": true
1290
  },
1291
+ "15227": {
1292
  "content": "sna_Latn",
1293
  "lstrip": false,
1294
  "normalized": false,
 
1296
  "single_word": false,
1297
  "special": true
1298
  },
1299
+ "15228": {
1300
  "content": "snd_Arab",
1301
  "lstrip": false,
1302
  "normalized": false,
 
1304
  "single_word": false,
1305
  "special": true
1306
  },
1307
+ "15229": {
1308
  "content": "som_Latn",
1309
  "lstrip": false,
1310
  "normalized": false,
 
1312
  "single_word": false,
1313
  "special": true
1314
  },
1315
+ "15230": {
1316
  "content": "sot_Latn",
1317
  "lstrip": false,
1318
  "normalized": false,
 
1320
  "single_word": false,
1321
  "special": true
1322
  },
1323
+ "15231": {
1324
  "content": "spa_Latn",
1325
  "lstrip": false,
1326
  "normalized": false,
 
1328
  "single_word": false,
1329
  "special": true
1330
  },
1331
+ "15232": {
1332
  "content": "als_Latn",
1333
  "lstrip": false,
1334
  "normalized": false,
 
1336
  "single_word": false,
1337
  "special": true
1338
  },
1339
+ "15233": {
1340
  "content": "srd_Latn",
1341
  "lstrip": false,
1342
  "normalized": false,
 
1344
  "single_word": false,
1345
  "special": true
1346
  },
1347
+ "15234": {
1348
  "content": "srp_Cyrl",
1349
  "lstrip": false,
1350
  "normalized": false,
 
1352
  "single_word": false,
1353
  "special": true
1354
  },
1355
+ "15235": {
1356
  "content": "ssw_Latn",
1357
  "lstrip": false,
1358
  "normalized": false,
 
1360
  "single_word": false,
1361
  "special": true
1362
  },
1363
+ "15236": {
1364
  "content": "sun_Latn",
1365
  "lstrip": false,
1366
  "normalized": false,
 
1368
  "single_word": false,
1369
  "special": true
1370
  },
1371
+ "15237": {
1372
  "content": "swe_Latn",
1373
  "lstrip": false,
1374
  "normalized": false,
 
1376
  "single_word": false,
1377
  "special": true
1378
  },
1379
+ "15238": {
1380
  "content": "swh_Latn",
1381
  "lstrip": false,
1382
  "normalized": false,
 
1384
  "single_word": false,
1385
  "special": true
1386
  },
1387
+ "15239": {
1388
  "content": "szl_Latn",
1389
  "lstrip": false,
1390
  "normalized": false,
 
1392
  "single_word": false,
1393
  "special": true
1394
  },
1395
+ "15240": {
1396
  "content": "tam_Taml",
1397
  "lstrip": false,
1398
  "normalized": false,
 
1400
  "single_word": false,
1401
  "special": true
1402
  },
1403
+ "15241": {
1404
  "content": "tat_Cyrl",
1405
  "lstrip": false,
1406
  "normalized": false,
 
1408
  "single_word": false,
1409
  "special": true
1410
  },
1411
+ "15242": {
1412
  "content": "tel_Telu",
1413
  "lstrip": false,
1414
  "normalized": false,
 
1416
  "single_word": false,
1417
  "special": true
1418
  },
1419
+ "15243": {
1420
  "content": "tgk_Cyrl",
1421
  "lstrip": false,
1422
  "normalized": false,
 
1424
  "single_word": false,
1425
  "special": true
1426
  },
1427
+ "15244": {
1428
  "content": "tgl_Latn",
1429
  "lstrip": false,
1430
  "normalized": false,
 
1432
  "single_word": false,
1433
  "special": true
1434
  },
1435
+ "15245": {
1436
  "content": "tha_Thai",
1437
  "lstrip": false,
1438
  "normalized": false,
 
1440
  "single_word": false,
1441
  "special": true
1442
  },
1443
+ "15246": {
1444
  "content": "tir_Ethi",
1445
  "lstrip": false,
1446
  "normalized": false,
 
1448
  "single_word": false,
1449
  "special": true
1450
  },
1451
+ "15247": {
1452
  "content": "taq_Latn",
1453
  "lstrip": false,
1454
  "normalized": false,
 
1456
  "single_word": false,
1457
  "special": true
1458
  },
1459
+ "15248": {
1460
  "content": "taq_Tfng",
1461
  "lstrip": false,
1462
  "normalized": false,
 
1464
  "single_word": false,
1465
  "special": true
1466
  },
1467
+ "15249": {
1468
  "content": "tpi_Latn",
1469
  "lstrip": false,
1470
  "normalized": false,
 
1472
  "single_word": false,
1473
  "special": true
1474
  },
1475
+ "15250": {
1476
  "content": "tsn_Latn",
1477
  "lstrip": false,
1478
  "normalized": false,
 
1480
  "single_word": false,
1481
  "special": true
1482
  },
1483
+ "15251": {
1484
  "content": "tso_Latn",
1485
  "lstrip": false,
1486
  "normalized": false,
 
1488
  "single_word": false,
1489
  "special": true
1490
  },
1491
+ "15252": {
1492
  "content": "tuk_Latn",
1493
  "lstrip": false,
1494
  "normalized": false,
 
1496
  "single_word": false,
1497
  "special": true
1498
  },
1499
+ "15253": {
1500
  "content": "tum_Latn",
1501
  "lstrip": false,
1502
  "normalized": false,
 
1504
  "single_word": false,
1505
  "special": true
1506
  },
1507
+ "15254": {
1508
  "content": "tur_Latn",
1509
  "lstrip": false,
1510
  "normalized": false,
 
1512
  "single_word": false,
1513
  "special": true
1514
  },
1515
+ "15255": {
1516
  "content": "twi_Latn",
1517
  "lstrip": false,
1518
  "normalized": false,
 
1520
  "single_word": false,
1521
  "special": true
1522
  },
1523
+ "15256": {
1524
  "content": "tzm_Tfng",
1525
  "lstrip": false,
1526
  "normalized": false,
 
1528
  "single_word": false,
1529
  "special": true
1530
  },
1531
+ "15257": {
1532
  "content": "uig_Arab",
1533
  "lstrip": false,
1534
  "normalized": false,
 
1536
  "single_word": false,
1537
  "special": true
1538
  },
1539
+ "15258": {
1540
  "content": "ukr_Cyrl",
1541
  "lstrip": false,
1542
  "normalized": false,
 
1544
  "single_word": false,
1545
  "special": true
1546
  },
1547
+ "15259": {
1548
  "content": "umb_Latn",
1549
  "lstrip": false,
1550
  "normalized": false,
 
1552
  "single_word": false,
1553
  "special": true
1554
  },
1555
+ "15260": {
1556
  "content": "urd_Arab",
1557
  "lstrip": false,
1558
  "normalized": false,
 
1560
  "single_word": false,
1561
  "special": true
1562
  },
1563
+ "15261": {
1564
  "content": "uzn_Latn",
1565
  "lstrip": false,
1566
  "normalized": false,
 
1568
  "single_word": false,
1569
  "special": true
1570
  },
1571
+ "15262": {
1572
  "content": "vec_Latn",
1573
  "lstrip": false,
1574
  "normalized": false,
 
1576
  "single_word": false,
1577
  "special": true
1578
  },
1579
+ "15263": {
1580
  "content": "vie_Latn",
1581
  "lstrip": false,
1582
  "normalized": false,
 
1584
  "single_word": false,
1585
  "special": true
1586
  },
1587
+ "15264": {
1588
  "content": "war_Latn",
1589
  "lstrip": false,
1590
  "normalized": false,
 
1592
  "single_word": false,
1593
  "special": true
1594
  },
1595
+ "15265": {
1596
  "content": "wol_Latn",
1597
  "lstrip": false,
1598
  "normalized": false,
 
1600
  "single_word": false,
1601
  "special": true
1602
  },
1603
+ "15266": {
1604
  "content": "xho_Latn",
1605
  "lstrip": false,
1606
  "normalized": false,
 
1608
  "single_word": false,
1609
  "special": true
1610
  },
1611
+ "15267": {
1612
  "content": "ydd_Hebr",
1613
  "lstrip": false,
1614
  "normalized": false,
 
1616
  "single_word": false,
1617
  "special": true
1618
  },
1619
+ "15268": {
1620
  "content": "yor_Latn",
1621
  "lstrip": false,
1622
  "normalized": false,
 
1624
  "single_word": false,
1625
  "special": true
1626
  },
1627
+ "15269": {
1628
  "content": "yue_Hant",
1629
  "lstrip": false,
1630
  "normalized": false,
 
1632
  "single_word": false,
1633
  "special": true
1634
  },
1635
+ "15270": {
1636
  "content": "zho_Hans",
1637
  "lstrip": false,
1638
  "normalized": false,
 
1640
  "single_word": false,
1641
  "special": true
1642
  },
1643
+ "15271": {
1644
  "content": "zho_Hant",
1645
  "lstrip": false,
1646
  "normalized": false,
 
1648
  "single_word": false,
1649
  "special": true
1650
  },
1651
+ "15272": {
1652
  "content": "zul_Latn",
1653
  "lstrip": false,
1654
  "normalized": false,