2000-03-10 23:17:24 +00:00
|
|
|
""" Encoding Aliases Support
|
|
|
|
|
|
|
|
This module is used by the encodings package search function to
|
|
|
|
map encodings names to module names.
|
|
|
|
|
|
|
|
Note that the search function converts the encoding names to lower
|
|
|
|
case and replaces hyphens with underscores *before* performing the
|
|
|
|
lookup.
|
|
|
|
|
|
|
|
"""
|
|
|
|
aliases = {
|
|
|
|
|
|
|
|
# Latin-1
|
|
|
|
'latin': 'latin_1',
|
|
|
|
'latin1': 'latin_1',
|
|
|
|
|
2001-09-20 10:35:46 +00:00
|
|
|
# UTF-7
|
|
|
|
'utf7': 'utf_7',
|
|
|
|
'u7': 'utf_7',
|
|
|
|
|
2000-03-10 23:17:24 +00:00
|
|
|
# UTF-8
|
|
|
|
'utf': 'utf_8',
|
|
|
|
'utf8': 'utf_8',
|
|
|
|
'u8': 'utf_8',
|
2000-06-07 09:12:30 +00:00
|
|
|
'utf8@ucs2': 'utf_8',
|
|
|
|
'utf8@ucs4': 'utf_8',
|
2000-03-10 23:17:24 +00:00
|
|
|
|
|
|
|
# UTF-16
|
|
|
|
'utf16': 'utf_16',
|
|
|
|
'u16': 'utf_16',
|
|
|
|
'utf_16be': 'utf_16_be',
|
|
|
|
'utf_16le': 'utf_16_le',
|
2000-03-31 17:23:18 +00:00
|
|
|
'unicodebigunmarked': 'utf_16_be',
|
|
|
|
'unicodelittleunmarked': 'utf_16_le',
|
2000-03-10 23:17:24 +00:00
|
|
|
|
|
|
|
# ASCII
|
|
|
|
'us_ascii': 'ascii',
|
2001-08-10 13:58:50 +00:00
|
|
|
'ansi_x3.4_1968': 'ascii', # used on Linux
|
|
|
|
'646': 'ascii', # used on Solaris
|
2000-03-10 23:17:24 +00:00
|
|
|
|
2001-06-07 19:39:25 +00:00
|
|
|
# EBCDIC
|
|
|
|
'ebcdic_cp_us': 'cp037',
|
|
|
|
'ibm039': 'cp037',
|
|
|
|
'ibm1140': 'cp1140',
|
|
|
|
|
2000-03-10 23:17:24 +00:00
|
|
|
# ISO
|
2000-06-07 09:12:30 +00:00
|
|
|
'8859': 'latin_1',
|
|
|
|
'iso8859': 'latin_1',
|
2000-03-10 23:17:24 +00:00
|
|
|
'iso8859_1': 'latin_1',
|
|
|
|
'iso_8859_1': 'latin_1',
|
|
|
|
'iso_8859_10': 'iso8859_10',
|
|
|
|
'iso_8859_13': 'iso8859_13',
|
|
|
|
'iso_8859_14': 'iso8859_14',
|
|
|
|
'iso_8859_15': 'iso8859_15',
|
|
|
|
'iso_8859_2': 'iso8859_2',
|
|
|
|
'iso_8859_3': 'iso8859_3',
|
|
|
|
'iso_8859_4': 'iso8859_4',
|
|
|
|
'iso_8859_5': 'iso8859_5',
|
|
|
|
'iso_8859_6': 'iso8859_6',
|
|
|
|
'iso_8859_7': 'iso8859_7',
|
|
|
|
'iso_8859_8': 'iso8859_8',
|
|
|
|
'iso_8859_9': 'iso8859_9',
|
|
|
|
|
|
|
|
# Mac
|
2000-06-07 09:12:30 +00:00
|
|
|
'maclatin2': 'mac_latin2',
|
2000-03-31 17:23:18 +00:00
|
|
|
'maccentraleurope': 'mac_latin2',
|
|
|
|
'maccyrillic': 'mac_cyrillic',
|
|
|
|
'macgreek': 'mac_greek',
|
|
|
|
'maciceland': 'mac_iceland',
|
|
|
|
'macroman': 'mac_roman',
|
|
|
|
'macturkish': 'mac_turkish',
|
2000-03-10 23:17:24 +00:00
|
|
|
|
2001-06-04 02:31:23 +00:00
|
|
|
# Windows
|
|
|
|
'windows_1252': 'cp1252',
|
|
|
|
'windows_1254': 'cp1254',
|
|
|
|
'windows_1255': 'cp1255',
|
|
|
|
|
2000-04-05 20:11:21 +00:00
|
|
|
# MBCS
|
|
|
|
'dbcs': 'mbcs',
|
|
|
|
|
2000-06-07 09:12:30 +00:00
|
|
|
# Code pages
|
|
|
|
'437': 'cp437',
|
|
|
|
|
|
|
|
# CJK
|
|
|
|
#
|
|
|
|
# The codecs for these encodings are not distributed with the
|
|
|
|
# Python core, but are included here for reference, since the
|
|
|
|
# locale module relies on having these aliases available.
|
|
|
|
#
|
|
|
|
'jis_7': 'jis_7',
|
|
|
|
'iso_2022_jp': 'jis_7',
|
|
|
|
'ujis': 'euc_jp',
|
|
|
|
'ajec': 'euc_jp',
|
|
|
|
'eucjp': 'euc_jp',
|
|
|
|
'tis260': 'tactis',
|
|
|
|
'sjis': 'shift_jis',
|
|
|
|
|
2001-05-15 12:00:02 +00:00
|
|
|
# Content transfer/compression encodings
|
|
|
|
'rot13': 'rot_13',
|
|
|
|
'base64': 'base64_codec',
|
|
|
|
'base_64': 'base64_codec',
|
|
|
|
'zlib': 'zlib_codec',
|
|
|
|
'zip': 'zlib_codec',
|
|
|
|
'hex': 'hex_codec',
|
|
|
|
'uu': 'uu_codec',
|
2001-05-15 15:34:07 +00:00
|
|
|
'quopri': 'quopri_codec',
|
|
|
|
'quotedprintable': 'quopri_codec',
|
|
|
|
'quoted_printable': 'quopri_codec',
|
2001-05-15 12:00:02 +00:00
|
|
|
|
2000-03-10 23:17:24 +00:00
|
|
|
}
|