mirror of
				https://github.com/python/cpython.git
				synced 2025-10-26 19:24:34 +00:00 
			
		
		
		
	 988ad2bdff
			
		
	
	
		988ad2bdff
		
	
	
	
	
		
			
			encodings package aliases mapping dictionary rather than in the internal cache used by the search function. This enables aliases to take advantage of the full normalization process applied to encoding names which was previously not available. The patch restricts alias registration to new aliases. Existing aliases cannot be overridden anymore.
		
			
				
	
	
		
			86 lines
		
	
	
	
		
			2.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			86 lines
		
	
	
	
		
			2.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| """ Standard "encodings" Package
 | |
| 
 | |
|     Standard Python encoding modules are stored in this package
 | |
|     directory.
 | |
| 
 | |
|     Codec modules must have names corresponding to standard lower-case
 | |
|     encoding names with hyphens mapped to underscores, e.g. 'utf-8' is
 | |
|     implemented by the module 'utf_8.py'.
 | |
| 
 | |
|     Each codec module must export the following interface:
 | |
| 
 | |
|     * getregentry() -> (encoder, decoder, stream_reader, stream_writer)
 | |
|     The getregentry() API must return callable objects which adhere to
 | |
|     the Python Codec Interface Standard.
 | |
| 
 | |
|     In addition, a module may optionally also define the following
 | |
|     APIs which are then used by the package's codec search function:
 | |
| 
 | |
|     * getaliases() -> sequence of encoding name strings to use as aliases
 | |
| 
 | |
|     Alias names returned by getaliases() must be standard encoding
 | |
|     names as defined above (lower-case, hyphens converted to
 | |
|     underscores).
 | |
| 
 | |
| Written by Marc-Andre Lemburg (mal@lemburg.com).
 | |
| 
 | |
| (c) Copyright CNRI, All Rights Reserved. NO WARRANTY.
 | |
| 
 | |
| """#"
 | |
| 
 | |
| import codecs,aliases
 | |
| 
 | |
| _cache = {}
 | |
| _unknown = '--unknown--'
 | |
| 
 | |
| def search_function(encoding):
 | |
|     
 | |
|     # Cache lookup
 | |
|     entry = _cache.get(encoding,_unknown)
 | |
|     if entry is not _unknown:
 | |
|         return entry
 | |
| 
 | |
|     # Import the module
 | |
|     modname = encoding.replace('-', '_')
 | |
|     modname = aliases.aliases.get(modname,modname)
 | |
|     try:
 | |
|         mod = __import__(modname,globals(),locals(),'*')
 | |
|     except ImportError,why:
 | |
|         # cache misses
 | |
|         _cache[encoding] = None
 | |
|         return None
 | |
|     
 | |
|     # Now ask the module for the registry entry
 | |
|     try:
 | |
|         entry = tuple(mod.getregentry())
 | |
|     except AttributeError:
 | |
|         entry = ()
 | |
|     if len(entry) != 4:
 | |
|         raise SystemError,\
 | |
|               'module "%s.%s" failed to register' % \
 | |
|               (__name__,modname)
 | |
|     for obj in entry:
 | |
|         if not callable(obj):
 | |
|             raise SystemError,\
 | |
|                   'incompatible codecs in module "%s.%s"' % \
 | |
|                   (__name__,modname)
 | |
| 
 | |
|     # Cache the codec registry entry
 | |
|     _cache[encoding] = entry
 | |
| 
 | |
|     # Register its aliases (without overwriting previously registered
 | |
|     # aliases)
 | |
|     try:
 | |
|         codecaliases = mod.getaliases()
 | |
|     except AttributeError:
 | |
|         pass
 | |
|     else:
 | |
|         for alias in codecaliases:
 | |
|             if not aliases.aliases.has_key(alias):
 | |
|                 aliases.aliases[alias] = modname
 | |
| 
 | |
|     # Return the registry entry
 | |
|     return entry
 | |
| 
 | |
| # Register the search_function in the Python codec registry
 | |
| codecs.register(search_function)
 |