Mercurial > repos > rliterman > csp2
comparison CSP2/CSP2_env/env-d9b9114564458d9d-741b3de822f2aaca6c6caa4325c4afce/lib/python3.8/encodings/aliases.py @ 69:33d812a61356
planemo upload commit 2e9511a184a1ca667c7be0c6321a36dc4e3d116d
author | jpayne |
---|---|
date | Tue, 18 Mar 2025 17:55:14 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
67:0e9998148a16 | 69:33d812a61356 |
---|---|
""" Encoding Aliases Support

    This module is used by the encodings package search function to
    map encoding names to module names.

    Note that the search function normalizes the encoding names before
    doing the lookup, so the mapping will have to map normalized
    encoding names to module names.

    Contents:

        The following aliases dictionary contains mappings of all IANA
        character set names for which the Python core library provides
        codecs. In addition to these, a few Python specific codec
        aliases have also been added.

"""
aliases = {

    # Please keep this list sorted alphabetically by value !

    # ascii codec
    '646': 'ascii',
    'ansi_x3.4_1968': 'ascii',
    'ansi_x3_4_1968': 'ascii',  # some email headers use this non-standard name
    'ansi_x3.4_1986': 'ascii',
    'cp367': 'ascii',
    'csascii': 'ascii',
    'ibm367': 'ascii',
    'iso646_us': 'ascii',
    'iso_646.irv_1991': 'ascii',
    'iso_ir_6': 'ascii',
    'us': 'ascii',
    'us_ascii': 'ascii',

    # base64_codec codec
    'base64': 'base64_codec',
    'base_64': 'base64_codec',

    # big5 codec
    'big5_tw': 'big5',
    'csbig5': 'big5',

    # big5hkscs codec
    'big5_hkscs': 'big5hkscs',
    'hkscs': 'big5hkscs',

    # bz2_codec codec
    'bz2': 'bz2_codec',

    # cp037 codec
    '037': 'cp037',
    'csibm037': 'cp037',
    'ebcdic_cp_ca': 'cp037',
    'ebcdic_cp_nl': 'cp037',
    'ebcdic_cp_us': 'cp037',
    'ebcdic_cp_wt': 'cp037',
    'ibm037': 'cp037',
    'ibm039': 'cp037',

    # cp1026 codec
    '1026': 'cp1026',
    'csibm1026': 'cp1026',
    'ibm1026': 'cp1026',

    # cp1125 codec
    '1125': 'cp1125',
    'ibm1125': 'cp1125',
    'cp866u': 'cp1125',
    'ruscii': 'cp1125',

    # cp1140 codec
    '1140': 'cp1140',
    'ibm1140': 'cp1140',

    # cp1250 codec
    '1250': 'cp1250',
    'windows_1250': 'cp1250',

    # cp1251 codec
    '1251': 'cp1251',
    'windows_1251': 'cp1251',

    # cp1252 codec
    '1252': 'cp1252',
    'windows_1252': 'cp1252',

    # cp1253 codec
    '1253': 'cp1253',
    'windows_1253': 'cp1253',

    # cp1254 codec
    '1254': 'cp1254',
    'windows_1254': 'cp1254',

    # cp1255 codec
    '1255': 'cp1255',
    'windows_1255': 'cp1255',

    # cp1256 codec
    '1256': 'cp1256',
    'windows_1256': 'cp1256',

    # cp1257 codec
    '1257': 'cp1257',
    'windows_1257': 'cp1257',

    # cp1258 codec
    '1258': 'cp1258',
    'windows_1258': 'cp1258',

    # cp273 codec
    '273': 'cp273',
    'ibm273': 'cp273',
    'csibm273': 'cp273',

    # cp424 codec
    '424': 'cp424',
    'csibm424': 'cp424',
    'ebcdic_cp_he': 'cp424',
    'ibm424': 'cp424',

    # cp437 codec
    '437': 'cp437',
    'cspc8codepage437': 'cp437',
    'ibm437': 'cp437',

    # cp500 codec
    '500': 'cp500',
    'csibm500': 'cp500',
    'ebcdic_cp_be': 'cp500',
    'ebcdic_cp_ch': 'cp500',
    'ibm500': 'cp500',

    # cp775 codec
    '775': 'cp775',
    'cspc775baltic': 'cp775',
    'ibm775': 'cp775',

    # cp850 codec
    '850': 'cp850',
    'cspc850multilingual': 'cp850',
    'ibm850': 'cp850',

    # cp852 codec
    '852': 'cp852',
    'cspcp852': 'cp852',
    'ibm852': 'cp852',

    # cp855 codec
    '855': 'cp855',
    'csibm855': 'cp855',
    'ibm855': 'cp855',

    # cp857 codec
    '857': 'cp857',
    'csibm857': 'cp857',
    'ibm857': 'cp857',

    # cp858 codec
    '858': 'cp858',
    'csibm858': 'cp858',
    'ibm858': 'cp858',

    # cp860 codec
    '860': 'cp860',
    'csibm860': 'cp860',
    'ibm860': 'cp860',

    # cp861 codec
    '861': 'cp861',
    'cp_is': 'cp861',
    'csibm861': 'cp861',
    'ibm861': 'cp861',

    # cp862 codec
    '862': 'cp862',
    'cspc862latinhebrew': 'cp862',
    'ibm862': 'cp862',

    # cp863 codec
    '863': 'cp863',
    'csibm863': 'cp863',
    'ibm863': 'cp863',

    # cp864 codec
    '864': 'cp864',
    'csibm864': 'cp864',
    'ibm864': 'cp864',

    # cp865 codec
    '865': 'cp865',
    'csibm865': 'cp865',
    'ibm865': 'cp865',

    # cp866 codec
    '866': 'cp866',
    'csibm866': 'cp866',
    'ibm866': 'cp866',

    # cp869 codec
    '869': 'cp869',
    'cp_gr': 'cp869',
    'csibm869': 'cp869',
    'ibm869': 'cp869',

    # cp932 codec
    '932': 'cp932',
    'ms932': 'cp932',
    'mskanji': 'cp932',
    'ms_kanji': 'cp932',

    # cp949 codec
    '949': 'cp949',
    'ms949': 'cp949',
    'uhc': 'cp949',

    # cp950 codec
    '950': 'cp950',
    'ms950': 'cp950',

    # euc_jis_2004 codec
    'jisx0213': 'euc_jis_2004',
    'eucjis2004': 'euc_jis_2004',
    'euc_jis2004': 'euc_jis_2004',

    # euc_jisx0213 codec
    'eucjisx0213': 'euc_jisx0213',

    # euc_jp codec
    'eucjp': 'euc_jp',
    'ujis': 'euc_jp',
    'u_jis': 'euc_jp',

    # euc_kr codec
    'euckr': 'euc_kr',
    'korean': 'euc_kr',
    'ksc5601': 'euc_kr',
    'ks_c_5601': 'euc_kr',
    'ks_c_5601_1987': 'euc_kr',
    'ksx1001': 'euc_kr',
    'ks_x_1001': 'euc_kr',

    # gb18030 codec
    'gb18030_2000': 'gb18030',

    # gb2312 codec
    'chinese': 'gb2312',
    'csiso58gb231280': 'gb2312',
    'euc_cn': 'gb2312',
    'euccn': 'gb2312',
    'eucgb2312_cn': 'gb2312',
    'gb2312_1980': 'gb2312',
    'gb2312_80': 'gb2312',
    'iso_ir_58': 'gb2312',

    # gbk codec
    '936': 'gbk',
    'cp936': 'gbk',
    'ms936': 'gbk',

    # hex_codec codec
    'hex': 'hex_codec',

    # hp_roman8 codec
    'roman8': 'hp_roman8',
    'r8': 'hp_roman8',
    # The mixed-case spelling below cannot match a normalized (lower-case)
    # lookup name; it is kept only for code that reads this dict directly,
    # and the lower-case form is provided so the alias actually resolves.
    'csHPRoman8': 'hp_roman8',
    'cshproman8': 'hp_roman8',
    'cp1051': 'hp_roman8',
    'ibm1051': 'hp_roman8',

    # hz codec
    'hzgb': 'hz',
    'hz_gb': 'hz',
    'hz_gb_2312': 'hz',

    # iso2022_jp codec
    'csiso2022jp': 'iso2022_jp',
    'iso2022jp': 'iso2022_jp',
    'iso_2022_jp': 'iso2022_jp',

    # iso2022_jp_1 codec
    'iso2022jp_1': 'iso2022_jp_1',
    'iso_2022_jp_1': 'iso2022_jp_1',

    # iso2022_jp_2 codec
    'iso2022jp_2': 'iso2022_jp_2',
    'iso_2022_jp_2': 'iso2022_jp_2',

    # iso2022_jp_2004 codec
    'iso_2022_jp_2004': 'iso2022_jp_2004',
    'iso2022jp_2004': 'iso2022_jp_2004',

    # iso2022_jp_3 codec
    'iso2022jp_3': 'iso2022_jp_3',
    'iso_2022_jp_3': 'iso2022_jp_3',

    # iso2022_jp_ext codec
    'iso2022jp_ext': 'iso2022_jp_ext',
    'iso_2022_jp_ext': 'iso2022_jp_ext',

    # iso2022_kr codec
    'csiso2022kr': 'iso2022_kr',
    'iso2022kr': 'iso2022_kr',
    'iso_2022_kr': 'iso2022_kr',

    # iso8859_10 codec
    'csisolatin6': 'iso8859_10',
    'iso_8859_10': 'iso8859_10',
    'iso_8859_10_1992': 'iso8859_10',
    'iso_ir_157': 'iso8859_10',
    'l6': 'iso8859_10',
    'latin6': 'iso8859_10',

    # iso8859_11 codec
    'thai': 'iso8859_11',
    'iso_8859_11': 'iso8859_11',
    'iso_8859_11_2001': 'iso8859_11',

    # iso8859_13 codec
    'iso_8859_13': 'iso8859_13',
    'l7': 'iso8859_13',
    'latin7': 'iso8859_13',

    # iso8859_14 codec
    'iso_8859_14': 'iso8859_14',
    'iso_8859_14_1998': 'iso8859_14',
    'iso_celtic': 'iso8859_14',
    'iso_ir_199': 'iso8859_14',
    'l8': 'iso8859_14',
    'latin8': 'iso8859_14',

    # iso8859_15 codec
    'iso_8859_15': 'iso8859_15',
    'l9': 'iso8859_15',
    'latin9': 'iso8859_15',

    # iso8859_16 codec
    'iso_8859_16': 'iso8859_16',
    'iso_8859_16_2001': 'iso8859_16',
    'iso_ir_226': 'iso8859_16',
    'l10': 'iso8859_16',
    'latin10': 'iso8859_16',

    # iso8859_2 codec
    'csisolatin2': 'iso8859_2',
    'iso_8859_2': 'iso8859_2',
    'iso_8859_2_1987': 'iso8859_2',
    'iso_ir_101': 'iso8859_2',
    'l2': 'iso8859_2',
    'latin2': 'iso8859_2',

    # iso8859_3 codec
    'csisolatin3': 'iso8859_3',
    'iso_8859_3': 'iso8859_3',
    'iso_8859_3_1988': 'iso8859_3',
    'iso_ir_109': 'iso8859_3',
    'l3': 'iso8859_3',
    'latin3': 'iso8859_3',

    # iso8859_4 codec
    'csisolatin4': 'iso8859_4',
    'iso_8859_4': 'iso8859_4',
    'iso_8859_4_1988': 'iso8859_4',
    'iso_ir_110': 'iso8859_4',
    'l4': 'iso8859_4',
    'latin4': 'iso8859_4',

    # iso8859_5 codec
    'csisolatincyrillic': 'iso8859_5',
    'cyrillic': 'iso8859_5',
    'iso_8859_5': 'iso8859_5',
    'iso_8859_5_1988': 'iso8859_5',
    'iso_ir_144': 'iso8859_5',

    # iso8859_6 codec
    'arabic': 'iso8859_6',
    'asmo_708': 'iso8859_6',
    'csisolatinarabic': 'iso8859_6',
    'ecma_114': 'iso8859_6',
    'iso_8859_6': 'iso8859_6',
    'iso_8859_6_1987': 'iso8859_6',
    'iso_ir_127': 'iso8859_6',

    # iso8859_7 codec
    'csisolatingreek': 'iso8859_7',
    'ecma_118': 'iso8859_7',
    'elot_928': 'iso8859_7',
    'greek': 'iso8859_7',
    'greek8': 'iso8859_7',
    'iso_8859_7': 'iso8859_7',
    'iso_8859_7_1987': 'iso8859_7',
    'iso_ir_126': 'iso8859_7',

    # iso8859_8 codec
    'csisolatinhebrew': 'iso8859_8',
    'hebrew': 'iso8859_8',
    'iso_8859_8': 'iso8859_8',
    'iso_8859_8_1988': 'iso8859_8',
    'iso_ir_138': 'iso8859_8',

    # iso8859_9 codec
    'csisolatin5': 'iso8859_9',
    'iso_8859_9': 'iso8859_9',
    'iso_8859_9_1989': 'iso8859_9',
    'iso_ir_148': 'iso8859_9',
    'l5': 'iso8859_9',
    'latin5': 'iso8859_9',

    # johab codec
    'cp1361': 'johab',
    'ms1361': 'johab',

    # koi8_r codec
    'cskoi8r': 'koi8_r',

    # kz1048 codec
    'kz_1048': 'kz1048',
    'rk1048': 'kz1048',
    'strk1048_2002': 'kz1048',

    # latin_1 codec
    #
    # Note that the latin_1 codec is implemented internally in C and a
    # lot faster than the charmap codec iso8859_1 which uses the same
    # encoding. This is why we discourage the use of the iso8859_1
    # codec and alias it to latin_1 instead.
    #
    '8859': 'latin_1',
    'cp819': 'latin_1',
    'csisolatin1': 'latin_1',
    'ibm819': 'latin_1',
    'iso8859': 'latin_1',
    'iso8859_1': 'latin_1',
    'iso_8859_1': 'latin_1',
    'iso_8859_1_1987': 'latin_1',
    'iso_ir_100': 'latin_1',
    'l1': 'latin_1',
    'latin': 'latin_1',
    'latin1': 'latin_1',

    # mac_cyrillic codec
    'maccyrillic': 'mac_cyrillic',

    # mac_greek codec
    'macgreek': 'mac_greek',

    # mac_iceland codec
    'maciceland': 'mac_iceland',

    # mac_latin2 codec
    'maccentraleurope': 'mac_latin2',
    'maclatin2': 'mac_latin2',

    # mac_roman codec
    'macintosh': 'mac_roman',
    'macroman': 'mac_roman',

    # mac_turkish codec
    'macturkish': 'mac_turkish',

    # mbcs codec
    'ansi': 'mbcs',
    'dbcs': 'mbcs',

    # ptcp154 codec
    'csptcp154': 'ptcp154',
    'pt154': 'ptcp154',
    'cp154': 'ptcp154',
    'cyrillic_asian': 'ptcp154',

    # quopri_codec codec
    'quopri': 'quopri_codec',
    'quoted_printable': 'quopri_codec',
    'quotedprintable': 'quopri_codec',

    # rot_13 codec
    'rot13': 'rot_13',

    # shift_jis codec
    'csshiftjis': 'shift_jis',
    'shiftjis': 'shift_jis',
    'sjis': 'shift_jis',
    's_jis': 'shift_jis',

    # shift_jis_2004 codec
    'shiftjis2004': 'shift_jis_2004',
    'sjis_2004': 'shift_jis_2004',
    's_jis_2004': 'shift_jis_2004',

    # shift_jisx0213 codec
    'shiftjisx0213': 'shift_jisx0213',
    'sjisx0213': 'shift_jisx0213',
    's_jisx0213': 'shift_jisx0213',

    # tactis codec
    'tis260': 'tactis',

    # tis_620 codec
    'tis620': 'tis_620',
    'tis_620_0': 'tis_620',
    'tis_620_2529_0': 'tis_620',
    'tis_620_2529_1': 'tis_620',
    'iso_ir_166': 'tis_620',

    # utf_16 codec
    'u16': 'utf_16',
    'utf16': 'utf_16',

    # utf_16_be codec
    'unicodebigunmarked': 'utf_16_be',
    'utf_16be': 'utf_16_be',

    # utf_16_le codec
    'unicodelittleunmarked': 'utf_16_le',
    'utf_16le': 'utf_16_le',

    # utf_32 codec
    'u32': 'utf_32',
    'utf32': 'utf_32',

    # utf_32_be codec
    'utf_32be': 'utf_32_be',

    # utf_32_le codec
    'utf_32le': 'utf_32_le',

    # utf_7 codec
    'u7': 'utf_7',
    'utf7': 'utf_7',
    'unicode_1_1_utf_7': 'utf_7',

    # utf_8 codec
    'u8': 'utf_8',
    'utf': 'utf_8',
    'utf8': 'utf_8',
    'utf8_ucs2': 'utf_8',
    'utf8_ucs4': 'utf_8',
    'cp65001': 'utf_8',

    # uu_codec codec
    'uu': 'uu_codec',

    # zlib_codec codec
    'zip': 'zlib_codec',
    'zlib': 'zlib_codec',

    # temporary mac CJK aliases, will be replaced by proper codecs in 3.1
    'x_mac_japanese': 'shift_jis',
    'x_mac_korean': 'euc_kr',
    'x_mac_simp_chinese': 'gb2312',
    'x_mac_trad_chinese': 'big5',
}