comparison CSP2/CSP2_env/env-d9b9114564458d9d-741b3de822f2aaca6c6caa4325c4afce/lib/python3.8/encodings/aliases.py @ 69:33d812a61356

planemo upload commit 2e9511a184a1ca667c7be0c6321a36dc4e3d116d
author jpayne
date Tue, 18 Mar 2025 17:55:14 -0400
parents
children
comparison
equal deleted inserted replaced
67:0e9998148a16 69:33d812a61356
1 """ Encoding Aliases Support
2
3 This module is used by the encodings package search function to
4 map encodings names to module names.
5
6 Note that the search function normalizes the encoding names before
7 doing the lookup, so the mapping will have to map normalized
8 encoding names to module names.
9
10 Contents:
11
12 The following aliases dictionary contains mappings of all IANA
13 character set names for which the Python core library provides
14 codecs. In addition to these, a few Python specific codec
15 aliases have also been added.
16
17 """
18 aliases = {
19
20 # Please keep this list sorted alphabetically by value !
21
22 # ascii codec
23 '646' : 'ascii',
24 'ansi_x3.4_1968' : 'ascii',
25 'ansi_x3_4_1968' : 'ascii', # some email headers use this non-standard name
26 'ansi_x3.4_1986' : 'ascii',
27 'cp367' : 'ascii',
28 'csascii' : 'ascii',
29 'ibm367' : 'ascii',
30 'iso646_us' : 'ascii',
31 'iso_646.irv_1991' : 'ascii',
32 'iso_ir_6' : 'ascii',
33 'us' : 'ascii',
34 'us_ascii' : 'ascii',
35
36 # base64_codec codec
37 'base64' : 'base64_codec',
38 'base_64' : 'base64_codec',
39
40 # big5 codec
41 'big5_tw' : 'big5',
42 'csbig5' : 'big5',
43
44 # big5hkscs codec
45 'big5_hkscs' : 'big5hkscs',
46 'hkscs' : 'big5hkscs',
47
48 # bz2_codec codec
49 'bz2' : 'bz2_codec',
50
51 # cp037 codec
52 '037' : 'cp037',
53 'csibm037' : 'cp037',
54 'ebcdic_cp_ca' : 'cp037',
55 'ebcdic_cp_nl' : 'cp037',
56 'ebcdic_cp_us' : 'cp037',
57 'ebcdic_cp_wt' : 'cp037',
58 'ibm037' : 'cp037',
59 'ibm039' : 'cp037',
60
61 # cp1026 codec
62 '1026' : 'cp1026',
63 'csibm1026' : 'cp1026',
64 'ibm1026' : 'cp1026',
65
66 # cp1125 codec
67 '1125' : 'cp1125',
68 'ibm1125' : 'cp1125',
69 'cp866u' : 'cp1125',
70 'ruscii' : 'cp1125',
71
72 # cp1140 codec
73 '1140' : 'cp1140',
74 'ibm1140' : 'cp1140',
75
76 # cp1250 codec
77 '1250' : 'cp1250',
78 'windows_1250' : 'cp1250',
79
80 # cp1251 codec
81 '1251' : 'cp1251',
82 'windows_1251' : 'cp1251',
83
84 # cp1252 codec
85 '1252' : 'cp1252',
86 'windows_1252' : 'cp1252',
87
88 # cp1253 codec
89 '1253' : 'cp1253',
90 'windows_1253' : 'cp1253',
91
92 # cp1254 codec
93 '1254' : 'cp1254',
94 'windows_1254' : 'cp1254',
95
96 # cp1255 codec
97 '1255' : 'cp1255',
98 'windows_1255' : 'cp1255',
99
100 # cp1256 codec
101 '1256' : 'cp1256',
102 'windows_1256' : 'cp1256',
103
104 # cp1257 codec
105 '1257' : 'cp1257',
106 'windows_1257' : 'cp1257',
107
108 # cp1258 codec
109 '1258' : 'cp1258',
110 'windows_1258' : 'cp1258',
111
112 # cp273 codec
113 '273' : 'cp273',
114 'ibm273' : 'cp273',
115 'csibm273' : 'cp273',
116
117 # cp424 codec
118 '424' : 'cp424',
119 'csibm424' : 'cp424',
120 'ebcdic_cp_he' : 'cp424',
121 'ibm424' : 'cp424',
122
123 # cp437 codec
124 '437' : 'cp437',
125 'cspc8codepage437' : 'cp437',
126 'ibm437' : 'cp437',
127
128 # cp500 codec
129 '500' : 'cp500',
130 'csibm500' : 'cp500',
131 'ebcdic_cp_be' : 'cp500',
132 'ebcdic_cp_ch' : 'cp500',
133 'ibm500' : 'cp500',
134
135 # cp775 codec
136 '775' : 'cp775',
137 'cspc775baltic' : 'cp775',
138 'ibm775' : 'cp775',
139
140 # cp850 codec
141 '850' : 'cp850',
142 'cspc850multilingual' : 'cp850',
143 'ibm850' : 'cp850',
144
145 # cp852 codec
146 '852' : 'cp852',
147 'cspcp852' : 'cp852',
148 'ibm852' : 'cp852',
149
150 # cp855 codec
151 '855' : 'cp855',
152 'csibm855' : 'cp855',
153 'ibm855' : 'cp855',
154
155 # cp857 codec
156 '857' : 'cp857',
157 'csibm857' : 'cp857',
158 'ibm857' : 'cp857',
159
160 # cp858 codec
161 '858' : 'cp858',
162 'csibm858' : 'cp858',
163 'ibm858' : 'cp858',
164
165 # cp860 codec
166 '860' : 'cp860',
167 'csibm860' : 'cp860',
168 'ibm860' : 'cp860',
169
170 # cp861 codec
171 '861' : 'cp861',
172 'cp_is' : 'cp861',
173 'csibm861' : 'cp861',
174 'ibm861' : 'cp861',
175
176 # cp862 codec
177 '862' : 'cp862',
178 'cspc862latinhebrew' : 'cp862',
179 'ibm862' : 'cp862',
180
181 # cp863 codec
182 '863' : 'cp863',
183 'csibm863' : 'cp863',
184 'ibm863' : 'cp863',
185
186 # cp864 codec
187 '864' : 'cp864',
188 'csibm864' : 'cp864',
189 'ibm864' : 'cp864',
190
191 # cp865 codec
192 '865' : 'cp865',
193 'csibm865' : 'cp865',
194 'ibm865' : 'cp865',
195
196 # cp866 codec
197 '866' : 'cp866',
198 'csibm866' : 'cp866',
199 'ibm866' : 'cp866',
200
201 # cp869 codec
202 '869' : 'cp869',
203 'cp_gr' : 'cp869',
204 'csibm869' : 'cp869',
205 'ibm869' : 'cp869',
206
207 # cp932 codec
208 '932' : 'cp932',
209 'ms932' : 'cp932',
210 'mskanji' : 'cp932',
211 'ms_kanji' : 'cp932',
212
213 # cp949 codec
214 '949' : 'cp949',
215 'ms949' : 'cp949',
216 'uhc' : 'cp949',
217
218 # cp950 codec
219 '950' : 'cp950',
220 'ms950' : 'cp950',
221
222 # euc_jis_2004 codec
223 'jisx0213' : 'euc_jis_2004',
224 'eucjis2004' : 'euc_jis_2004',
225 'euc_jis2004' : 'euc_jis_2004',
226
227 # euc_jisx0213 codec
228 'eucjisx0213' : 'euc_jisx0213',
229
230 # euc_jp codec
231 'eucjp' : 'euc_jp',
232 'ujis' : 'euc_jp',
233 'u_jis' : 'euc_jp',
234
235 # euc_kr codec
236 'euckr' : 'euc_kr',
237 'korean' : 'euc_kr',
238 'ksc5601' : 'euc_kr',
239 'ks_c_5601' : 'euc_kr',
240 'ks_c_5601_1987' : 'euc_kr',
241 'ksx1001' : 'euc_kr',
242 'ks_x_1001' : 'euc_kr',
243
244 # gb18030 codec
245 'gb18030_2000' : 'gb18030',
246
247 # gb2312 codec
248 'chinese' : 'gb2312',
249 'csiso58gb231280' : 'gb2312',
250 'euc_cn' : 'gb2312',
251 'euccn' : 'gb2312',
252 'eucgb2312_cn' : 'gb2312',
253 'gb2312_1980' : 'gb2312',
254 'gb2312_80' : 'gb2312',
255 'iso_ir_58' : 'gb2312',
256
257 # gbk codec
258 '936' : 'gbk',
259 'cp936' : 'gbk',
260 'ms936' : 'gbk',
261
262 # hex_codec codec
263 'hex' : 'hex_codec',
264
265 # hp_roman8 codec
266 'roman8' : 'hp_roman8',
267 'r8' : 'hp_roman8',
268 'csHPRoman8' : 'hp_roman8',
269 'cp1051' : 'hp_roman8',
270 'ibm1051' : 'hp_roman8',
271
272 # hz codec
273 'hzgb' : 'hz',
274 'hz_gb' : 'hz',
275 'hz_gb_2312' : 'hz',
276
277 # iso2022_jp codec
278 'csiso2022jp' : 'iso2022_jp',
279 'iso2022jp' : 'iso2022_jp',
280 'iso_2022_jp' : 'iso2022_jp',
281
282 # iso2022_jp_1 codec
283 'iso2022jp_1' : 'iso2022_jp_1',
284 'iso_2022_jp_1' : 'iso2022_jp_1',
285
286 # iso2022_jp_2 codec
287 'iso2022jp_2' : 'iso2022_jp_2',
288 'iso_2022_jp_2' : 'iso2022_jp_2',
289
290 # iso2022_jp_2004 codec
291 'iso_2022_jp_2004' : 'iso2022_jp_2004',
292 'iso2022jp_2004' : 'iso2022_jp_2004',
293
294 # iso2022_jp_3 codec
295 'iso2022jp_3' : 'iso2022_jp_3',
296 'iso_2022_jp_3' : 'iso2022_jp_3',
297
298 # iso2022_jp_ext codec
299 'iso2022jp_ext' : 'iso2022_jp_ext',
300 'iso_2022_jp_ext' : 'iso2022_jp_ext',
301
302 # iso2022_kr codec
303 'csiso2022kr' : 'iso2022_kr',
304 'iso2022kr' : 'iso2022_kr',
305 'iso_2022_kr' : 'iso2022_kr',
306
307 # iso8859_10 codec
308 'csisolatin6' : 'iso8859_10',
309 'iso_8859_10' : 'iso8859_10',
310 'iso_8859_10_1992' : 'iso8859_10',
311 'iso_ir_157' : 'iso8859_10',
312 'l6' : 'iso8859_10',
313 'latin6' : 'iso8859_10',
314
315 # iso8859_11 codec
316 'thai' : 'iso8859_11',
317 'iso_8859_11' : 'iso8859_11',
318 'iso_8859_11_2001' : 'iso8859_11',
319
320 # iso8859_13 codec
321 'iso_8859_13' : 'iso8859_13',
322 'l7' : 'iso8859_13',
323 'latin7' : 'iso8859_13',
324
325 # iso8859_14 codec
326 'iso_8859_14' : 'iso8859_14',
327 'iso_8859_14_1998' : 'iso8859_14',
328 'iso_celtic' : 'iso8859_14',
329 'iso_ir_199' : 'iso8859_14',
330 'l8' : 'iso8859_14',
331 'latin8' : 'iso8859_14',
332
333 # iso8859_15 codec
334 'iso_8859_15' : 'iso8859_15',
335 'l9' : 'iso8859_15',
336 'latin9' : 'iso8859_15',
337
338 # iso8859_16 codec
339 'iso_8859_16' : 'iso8859_16',
340 'iso_8859_16_2001' : 'iso8859_16',
341 'iso_ir_226' : 'iso8859_16',
342 'l10' : 'iso8859_16',
343 'latin10' : 'iso8859_16',
344
345 # iso8859_2 codec
346 'csisolatin2' : 'iso8859_2',
347 'iso_8859_2' : 'iso8859_2',
348 'iso_8859_2_1987' : 'iso8859_2',
349 'iso_ir_101' : 'iso8859_2',
350 'l2' : 'iso8859_2',
351 'latin2' : 'iso8859_2',
352
353 # iso8859_3 codec
354 'csisolatin3' : 'iso8859_3',
355 'iso_8859_3' : 'iso8859_3',
356 'iso_8859_3_1988' : 'iso8859_3',
357 'iso_ir_109' : 'iso8859_3',
358 'l3' : 'iso8859_3',
359 'latin3' : 'iso8859_3',
360
361 # iso8859_4 codec
362 'csisolatin4' : 'iso8859_4',
363 'iso_8859_4' : 'iso8859_4',
364 'iso_8859_4_1988' : 'iso8859_4',
365 'iso_ir_110' : 'iso8859_4',
366 'l4' : 'iso8859_4',
367 'latin4' : 'iso8859_4',
368
369 # iso8859_5 codec
370 'csisolatincyrillic' : 'iso8859_5',
371 'cyrillic' : 'iso8859_5',
372 'iso_8859_5' : 'iso8859_5',
373 'iso_8859_5_1988' : 'iso8859_5',
374 'iso_ir_144' : 'iso8859_5',
375
376 # iso8859_6 codec
377 'arabic' : 'iso8859_6',
378 'asmo_708' : 'iso8859_6',
379 'csisolatinarabic' : 'iso8859_6',
380 'ecma_114' : 'iso8859_6',
381 'iso_8859_6' : 'iso8859_6',
382 'iso_8859_6_1987' : 'iso8859_6',
383 'iso_ir_127' : 'iso8859_6',
384
385 # iso8859_7 codec
386 'csisolatingreek' : 'iso8859_7',
387 'ecma_118' : 'iso8859_7',
388 'elot_928' : 'iso8859_7',
389 'greek' : 'iso8859_7',
390 'greek8' : 'iso8859_7',
391 'iso_8859_7' : 'iso8859_7',
392 'iso_8859_7_1987' : 'iso8859_7',
393 'iso_ir_126' : 'iso8859_7',
394
395 # iso8859_8 codec
396 'csisolatinhebrew' : 'iso8859_8',
397 'hebrew' : 'iso8859_8',
398 'iso_8859_8' : 'iso8859_8',
399 'iso_8859_8_1988' : 'iso8859_8',
400 'iso_ir_138' : 'iso8859_8',
401
402 # iso8859_9 codec
403 'csisolatin5' : 'iso8859_9',
404 'iso_8859_9' : 'iso8859_9',
405 'iso_8859_9_1989' : 'iso8859_9',
406 'iso_ir_148' : 'iso8859_9',
407 'l5' : 'iso8859_9',
408 'latin5' : 'iso8859_9',
409
410 # johab codec
411 'cp1361' : 'johab',
412 'ms1361' : 'johab',
413
414 # koi8_r codec
415 'cskoi8r' : 'koi8_r',
416
417 # kz1048 codec
418 'kz_1048' : 'kz1048',
419 'rk1048' : 'kz1048',
420 'strk1048_2002' : 'kz1048',
421
422 # latin_1 codec
423 #
424 # Note that the latin_1 codec is implemented internally in C and a
425 # lot faster than the charmap codec iso8859_1 which uses the same
426 # encoding. This is why we discourage the use of the iso8859_1
427 # codec and alias it to latin_1 instead.
428 #
429 '8859' : 'latin_1',
430 'cp819' : 'latin_1',
431 'csisolatin1' : 'latin_1',
432 'ibm819' : 'latin_1',
433 'iso8859' : 'latin_1',
434 'iso8859_1' : 'latin_1',
435 'iso_8859_1' : 'latin_1',
436 'iso_8859_1_1987' : 'latin_1',
437 'iso_ir_100' : 'latin_1',
438 'l1' : 'latin_1',
439 'latin' : 'latin_1',
440 'latin1' : 'latin_1',
441
442 # mac_cyrillic codec
443 'maccyrillic' : 'mac_cyrillic',
444
445 # mac_greek codec
446 'macgreek' : 'mac_greek',
447
448 # mac_iceland codec
449 'maciceland' : 'mac_iceland',
450
451 # mac_latin2 codec
452 'maccentraleurope' : 'mac_latin2',
453 'maclatin2' : 'mac_latin2',
454
455 # mac_roman codec
456 'macintosh' : 'mac_roman',
457 'macroman' : 'mac_roman',
458
459 # mac_turkish codec
460 'macturkish' : 'mac_turkish',
461
462 # mbcs codec
463 'ansi' : 'mbcs',
464 'dbcs' : 'mbcs',
465
466 # ptcp154 codec
467 'csptcp154' : 'ptcp154',
468 'pt154' : 'ptcp154',
469 'cp154' : 'ptcp154',
470 'cyrillic_asian' : 'ptcp154',
471
472 # quopri_codec codec
473 'quopri' : 'quopri_codec',
474 'quoted_printable' : 'quopri_codec',
475 'quotedprintable' : 'quopri_codec',
476
477 # rot_13 codec
478 'rot13' : 'rot_13',
479
480 # shift_jis codec
481 'csshiftjis' : 'shift_jis',
482 'shiftjis' : 'shift_jis',
483 'sjis' : 'shift_jis',
484 's_jis' : 'shift_jis',
485
486 # shift_jis_2004 codec
487 'shiftjis2004' : 'shift_jis_2004',
488 'sjis_2004' : 'shift_jis_2004',
489 's_jis_2004' : 'shift_jis_2004',
490
491 # shift_jisx0213 codec
492 'shiftjisx0213' : 'shift_jisx0213',
493 'sjisx0213' : 'shift_jisx0213',
494 's_jisx0213' : 'shift_jisx0213',
495
496 # tactis codec
497 'tis260' : 'tactis',
498
499 # tis_620 codec
500 'tis620' : 'tis_620',
501 'tis_620_0' : 'tis_620',
502 'tis_620_2529_0' : 'tis_620',
503 'tis_620_2529_1' : 'tis_620',
504 'iso_ir_166' : 'tis_620',
505
506 # utf_16 codec
507 'u16' : 'utf_16',
508 'utf16' : 'utf_16',
509
510 # utf_16_be codec
511 'unicodebigunmarked' : 'utf_16_be',
512 'utf_16be' : 'utf_16_be',
513
514 # utf_16_le codec
515 'unicodelittleunmarked' : 'utf_16_le',
516 'utf_16le' : 'utf_16_le',
517
518 # utf_32 codec
519 'u32' : 'utf_32',
520 'utf32' : 'utf_32',
521
522 # utf_32_be codec
523 'utf_32be' : 'utf_32_be',
524
525 # utf_32_le codec
526 'utf_32le' : 'utf_32_le',
527
528 # utf_7 codec
529 'u7' : 'utf_7',
530 'utf7' : 'utf_7',
531 'unicode_1_1_utf_7' : 'utf_7',
532
533 # utf_8 codec
534 'u8' : 'utf_8',
535 'utf' : 'utf_8',
536 'utf8' : 'utf_8',
537 'utf8_ucs2' : 'utf_8',
538 'utf8_ucs4' : 'utf_8',
539 'cp65001' : 'utf_8',
540
541 # uu_codec codec
542 'uu' : 'uu_codec',
543
544 # zlib_codec codec
545 'zip' : 'zlib_codec',
546 'zlib' : 'zlib_codec',
547
548 # temporary mac CJK aliases, will be replaced by proper codecs in 3.1
549 'x_mac_japanese' : 'shift_jis',
550 'x_mac_korean' : 'euc_kr',
551 'x_mac_simp_chinese' : 'gb2312',
552 'x_mac_trad_chinese' : 'big5',
553 }