mirror of
				https://github.com/python/cpython.git
				synced 2025-10-25 02:43:41 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			499 lines
		
	
	
	
		
			16 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			499 lines
		
	
	
	
		
			16 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #
 | |
| # imputil.py
 | |
| #
 | |
| # Written by Greg Stein. Public Domain.
 | |
| # No Copyright, no Rights Reserved, and no Warranties.
 | |
| #
 | |
| # Utilities to help out with custom import mechanisms.
 | |
| #
 | |
| # Additional modifications were contributed by Marc-Andre Lemburg and
 | |
| # Gordon McMillan.
 | |
| #
 | |
| # This module is maintained by Greg and is available at:
 | |
| #    http://www.lyra.org/greg/python/imputil.py
 | |
| #
 | |
| # Since this isn't in the Python distribution yet, we'll use the CVS ID
 | |
| # for tracking:
 | |
| #   $Id$
 | |
| #
 | |
| 
 | |
| __version__ = '0.3'
 | |
| 
 | |
| # note: avoid importing non-builtin modules
 | |
| import imp
 | |
| import sys
 | |
| import strop
 | |
| import __builtin__	### why this instead of just using __builtins__ ??
 | |
| 
 | |
| # for the DirectoryImporter
 | |
| import struct
 | |
| import marshal
 | |
| 
 | |
class Importer:
  """Base class for replacing standard import functions.

  An instance hooks itself in front of the builtin __import__ and reload
  functions via install(). Subclasses say where module code comes from by
  overriding get_code(); everything else (dotted names, package-relative
  lookups, fromlist handling) is done here.

  Every module loaded by an instance is tagged with two attributes:
  __importer__ (the instance that loaded it) and __ispkg__ (the package
  flag returned by get_code()).
  """

  def install(self):
    """Make this instance the active import/reload hook.

    The hooks that were in place beforehand are remembered; they are called
    for anything this importer cannot handle itself.
    """
    self.__chain_import = __builtin__.__import__
    self.__chain_reload = __builtin__.reload
    __builtin__.__import__ = self._import_hook
    __builtin__.reload = self._reload_hook

  ######################################################################
  #
  # PRIVATE METHODS
  #
  def _import_hook(self, name, globals=None, locals=None, fromlist=None):
    """Python calls this hook to locate and import a module.

    This method attempts to load the (dotted) module name. If it cannot
    find it, then it delegates the import to the next import hook in the
    chain (where "next" is defined as the import hook that was in place
    at the time this Importer instance was installed).

    Returns the top-level module when fromlist is empty, otherwise the
    module named by the last component of the dotted name.
    """

    ### insert a fast-path check for whether the module is already
    ### loaded? use a variant of _determine_import_context() which
    ### returns a context regardless of Importer used. generate an
    ### fqname and look in sys.modules for it.

    # determine the context of this import
    parent = self._determine_import_context(globals)

    # import the module within the context, or from the default context
    top, tail = self._import_top_module(parent, name)
    if top is None:
      # the module was not found; delegate to the next import hook
      return self.__chain_import(name, globals, locals, fromlist)

    # the top module may be under the control of a different importer.
    # if so, then defer to that importer for completion of the import.
    # note it may be self, or is undefined so we (self) may as well
    # finish the import.
    importer = top.__dict__.get('__importer__', self)
    return importer._finish_import(top, tail, fromlist)

  def _finish_import(self, top, tail, fromlist):
    """Complete an import once the top-level module is in hand.

    top is the loaded top-level module, tail the remaining dotted portion
    of the requested name (possibly empty) and fromlist the names listed
    in a "from ... import ..." statement (empty for a plain import).
    """
    # if "a.b.c" was provided, then load the ".b.c" portion down from
    # below the top-level module.
    bottom = self._load_tail(top, tail)

    # if the form is "import a.b.c", then return "a"
    if not fromlist:
      # no fromlist: return the top of the import tree
      return top

    # the top module was imported by self, or it was not imported through
    # the Importer mechanism and self is simply handling the import of
    # the sub-modules and fromlist.
    #
    # this means that the bottom module was also imported by self, or we
    # are handling things in the absence of a prior Importer
    #
    # ### why the heck are we handling it? what is the example scenario
    # ### where this happens? note that we can't determine is_package()
    # ### for non-Importer modules.
    #
    # since we imported/handled the bottom module, this means that we can
    # also handle its fromlist (and reliably determine is_package()).

    # if the bottom node is a package, then (potentially) import some modules.
    #
    # note: if it is not a package, then "fromlist" refers to names in
    #       the bottom module rather than modules.
    # note: for a mix of names and modules in the fromlist, we will
    #       import all modules and insert those into the namespace of
    #       the package module. Python will pick up all fromlist names
    #       from the bottom (package) module; some will be modules that
    #       we imported and stored in the namespace, others are expected
    #       to be present already.
    if self._is_package(bottom.__dict__):
      self._import_fromlist(bottom, fromlist)

    # if the form is "from a.b import c, d" then return "b"
    return bottom

  def _reload_hook(self, module):
    """Python calls this hook to reload a module.

    Modules that were not loaded by this instance are passed on to the
    reload hook that was in place before install(). Reloading one of our
    own modules is not implemented and raises SystemError.
    """

    # reloading of a module may or may not be possible (depending on the
    # importer), but at least we can validate that it's ours to reload
    importer = module.__dict__.get('__importer__', None)
    if importer is not self:
      return self.__chain_reload(module)

    # okay. it is ours, but we don't know what to do (yet)
    ### we should blast the module dict and do another get_code(). need to
    ### flesh this out and add proper docco...
    raise SystemError("reload not yet implemented")

  def _determine_import_context(self, globals):
    """Returns the context in which a module should be imported.

    The context could be a loaded (package) module and the imported module
    will be looked for within that package. The context could also be None,
    meaning there is no context -- the module should be looked for as a
    "top-level" module.
    """

    if not globals or \
       globals.get('__importer__', None) is not self:
      # globals does not refer to one of our modules or packages.
      # That implies there is no relative import context, and it
      # should just pick it off the standard path.
      return None

    # The globals refer to a module or package of ours. It will define
    # the context of the new import. Get the module/package fqname.
    parent_fqname = globals['__name__']

    # for a package, return itself (imports refer to pkg contents)
    if self._is_package(globals):
      parent = sys.modules[parent_fqname]
      assert globals is parent.__dict__
      return parent

    i = strop.rfind(parent_fqname, '.')

    # a module outside of a package has no particular import context
    if i == -1:
      return None

    # for a module in a package, return the package (imports refer to siblings)
    parent_fqname = parent_fqname[:i]
    parent = sys.modules[parent_fqname]
    assert parent.__name__ == parent_fqname
    return parent

  def _import_top_module(self, parent, name):
    """Locate the top of the import tree (relative or absolute).

    parent defines the context in which the import should occur. See
    _determine_import_context() for details.

    Returns a tuple (module, tail). module is the loaded (top-level) module,
    or None if the module is not found. tail is the remaining portion of
    the dotted name.
    """
    i = strop.find(name, '.')
    if i == -1:
      head = name
      tail = ""
    else:
      head = name[:i]
      tail = name[i+1:]
    if parent:
      fqname = "%s.%s" % (parent.__name__, head)
    else:
      fqname = head
    module = self._import_one(parent, head, fqname)
    if module:
      # the module was relative, or no context existed (the module was
      # simply found on the path).
      return module, tail
    if parent:
      # we tried relative, now try an absolute import (from the path)
      module = self._import_one(None, head, head)
      if module:
        return module, tail

    # the module wasn't found
    return None, None

  def _import_one(self, parent, modname, fqname):
    """Import a single module.

    parent is the containing package module (or None), modname the
    undotted name within that parent and fqname the fully-qualified name
    used as the sys.modules key.

    Returns the module, or None if get_code() could not find it. If the
    module's code raises while executing, the partially initialized module
    is removed from sys.modules again and the exception is propagated.
    """

    # has the module already been imported?
    try:
      return sys.modules[fqname]
    except KeyError:
      pass

    # load the module's code, or fetch the module itself
    result = self.get_code(parent, modname, fqname)
    if result is None:
      return None

    # did get_code() return an actual module? (rather than a code object)
    is_module = type(result[1]) is type(sys)

    # use the returned module, or create a new one to exec code into
    if is_module:
      module = result[1]
    else:
      module = imp.new_module(fqname)

    ### record packages a bit differently??
    module.__importer__ = self
    module.__ispkg__ = result[0]

    # if present, the third item is a set of values to insert into the module
    if len(result) > 2:
      module.__dict__.update(result[2])

    # the module is almost ready... make it visible
    sys.modules[fqname] = module

    # execute the code within the module's namespace
    if not is_module:
      try:
        # tuple form of exec: same meaning as "exec code in namespace"
        exec(result[1], module.__dict__)
      except:
        # do not leave a half-initialized module behind: a later import of
        # the same name would silently pick it up from sys.modules.
        if sys.modules.get(fqname) is module:
          del sys.modules[fqname]
        raise

    # insert the module into its parent
    if parent:
      setattr(parent, modname, module)
    return module

  def _load_tail(self, m, tail):
    """Import the rest of the modules, down from the top-level module.

    m is the module to start from and tail the remaining dotted name.

    Returns the last module in the dotted list of modules. Raises
    ImportError if one of the components cannot be found.
    """
    if tail:
      for part in strop.splitfields(tail, '.'):
        fqname = "%s.%s" % (m.__name__, part)
        m = self._import_one(m, part, fqname)
        if not m:
          raise ImportError("No module named " + fqname)
    return m

  def _import_fromlist(self, package, fromlist):
    """Import any sub-modules in the "from" list.

    Names already present as attributes of the package are left alone.
    Raises ImportError for a name that is neither present nor importable.
    """

    # if '*' is present in the fromlist, then look for the '__all__' variable
    # to find additional items (modules) to import.
    if '*' in fromlist:
      fromlist = list(fromlist) + list(package.__dict__.get('__all__', []))

    for sub in fromlist:
      # if the name is already present, then don't try to import it (it
      # might not be a module!).
      if sub != '*' and not hasattr(package, sub):
        subname = "%s.%s" % (package.__name__, sub)
        submod = self._import_one(package, sub, subname)
        if not submod:
          raise ImportError("cannot import name " + subname)

  def _is_package(self, module_dict):
    """Determine if a given module (dictionary) specifies a package.

    The package status is in the module-level name __ispkg__. The module
    must also have been imported by self, so that we can reliably apply
    semantic meaning to __ispkg__.

    ### weaken the test to issubclass(Importer)?
    """
    return module_dict.get('__importer__', None) is self and \
           module_dict['__ispkg__']

  ######################################################################
  #
  # METHODS TO OVERRIDE
  #
  def get_code(self, parent, modname, fqname):
    """Find and retrieve the code for the given module.

    parent specifies a parent module to define a context for importing. It
    may be None, indicating no particular context for the search.

    modname specifies a single module (not dotted) within the parent.

    fqname specifies the fully-qualified module name. This is a (potentially)
    dotted name from the "root" of the module namespace down to the modname.
    If there is no parent, then modname==fqname.

    This method should return None, a 2-tuple, or a 3-tuple.

    * If the module was not found, then None should be returned.

    * The first item of the 2- or 3-tuple should be the integer 0 or 1,
      specifying whether the module that was found is a package or not.

    * The second item is the code object for the module (it will be
      executed within the new module's namespace). This item can also
      be a fully-loaded module object (e.g. loaded from a shared lib).

    * If present, the third item is a dictionary of name/value pairs that
      will be inserted into new module before the code object is executed.
      This is provided in case the module's code expects certain values
      (such as where the module was found). When the second item is a
      module object, then these names/values will be inserted *after* the
      module has been loaded/initialized.
    """
    raise RuntimeError("get_code not implemented")
 | |
| 
 | |
| 
 | |
| ######################################################################
 | |
| #
 | |
| # Simple function-based importer
 | |
| #
 | |
class FuncImporter(Importer):
  """Importer that delegates get_code() to a caller-supplied function.

  The function is called with the same three arguments as get_code()
  (parent, modname, fqname) and its result is returned unchanged.
  """

  def __init__(self, func):
    # the callable that stands in for a get_code() override
    self.func = func

  def get_code(self, parent, modname, fqname):
    "Ask the wrapped function for the module and pass its answer back."
    lookup = self.func
    return lookup(parent, modname, fqname)
 | |
| 
 | |
def install_with(func):
  "Wrap func in a FuncImporter and install that importer."
  importer = FuncImporter(func)
  importer.install()
 | |
| 
 | |
| 
 | |
| ######################################################################
 | |
| #
 | |
| # Base class for archive-based importing
 | |
| #
 | |
class PackageArchiveImporter(Importer):
  """Importer subclass to import from (file) archives.

  A top-level name is resolved to an archive via get_archive() and becomes
  a package carrying that archive in its __archive__ attribute. Names
  inside such a package are resolved via get_subfile(). Subclasses supply
  both of those methods.
  """

  def get_code(self, parent, modname, fqname):
    """Resolve modname to an archive (top level) or to a member of one.

    Returns None when nothing is found, otherwise a tuple in the form
    expected from Importer.get_code().
    """
    if not parent:
      # no parent was provided, so the archive should exist somewhere on
      # the default "path". it is exposed as a package with no code of its
      # own, remembering which archive backs it.
      archive = self.get_archive(modname)
      if archive is None:
        return None
      return 1, "", {'__archive__':archive}

    # a parent "package" is provided, so we are importing a sub-file from
    # the archive recorded on that package.
    found = self.get_subfile(parent.__archive__, modname)
    if found is None:
      return None
    if type(found) is type(()):
      # (code, values): prepend the "not a package" flag
      return (0,) + found
    return 0, found

  def get_archive(self, modname):
    """Locate the archive that provides the top-level name modname.

    The return value is handed to get_subfile() as-is, so it can be
    whatever that method needs: a simple pathname, an open file, or a
    complex object that caches information for future imports.

    Return None if the archive was not found.
    """
    raise RuntimeError("get_archive not implemented")

  def get_subfile(self, archive, modname):
    """Fetch the code for modname from the given archive.

    archive is a value previously returned by get_archive(). The result
    is either a code object, or a 2-tuple of a code object and a dict of
    name/values to place into the target module.

    Return None if the subfile was not found.
    """
    raise RuntimeError("get_subfile not implemented")
 | |
| 
 | |
| 
 | |
class PackageArchive(PackageArchiveImporter):
  """PackageArchiveImporter bound to one module name and one archive.

  Only the configured module name is recognized; it maps to the archive
  pathname given at construction time.
  """

  def __init__(self, modname, archive_pathname):
    self.__modname = modname
    self.__path = archive_pathname

  def get_archive(self, modname):
    "Return the archive pathname for our module name, None for any other."
    if modname != self.__modname:
      return None
    return self.__path

  # get_subfile is passed the full pathname of the archive
 | |
| 
 | |
| 
 | |
| ######################################################################
 | |
| #
 | |
| # Emulate the standard directory-based import mechanism
 | |
| #
 | |
| 
 | |
class DirectoryImporter(Importer):
  """Importer subclass to emulate the standard importer.

  Top-level modules are looked for in a single directory. A sub-directory
  is treated as a package whose code lives in its __init__ file; the
  package records its directory in __pkgdir__ so that sub-modules can be
  found later.

  Compiled files use the layout written by _compile(): the 4-byte magic
  number, the source timestamp as a 4-byte little-endian unsigned integer,
  then the marshalled code object.
  """

  def __init__(self, dir):
    self.dir = dir
    # '.pyc' normally, '.pyo' when running with optimization (-O)
    self.ext_char = __debug__ and 'c' or 'o'
    self.ext = '.py' + self.ext_char

  def get_code(self, parent, modname, fqname):
    """Locate modname in the directory (or in the parent package's directory).

    Returns None if neither a source file nor a usable compiled file
    exists, otherwise the 3-tuple (ispkg, code, values) described in
    Importer.get_code().
    """
    if parent:
      try:
        basedir = parent.__pkgdir__
      except AttributeError:
        # the parent is not a package that we loaded from a directory, so
        # there is nowhere for us to look: report "not found".
        return None
    else:
      basedir = self.dir

    # pull the os module from our instance data. we don't do this at the
    # top-level, because it isn't a builtin module (and we want to defer
    # loading non-builtins until as late as possible).
    try:
      os = self.os
    except AttributeError:
      import os
      self.os = os

    pathname = os.path.join(basedir, modname)
    if os.path.isdir(pathname):
      values = { '__pkgdir__' : pathname }
      ispkg = 1
      pathname = os.path.join(pathname, '__init__')
    else:
      values = { }
      ispkg = 0

    t_py = self._timestamp(pathname + '.py')
    t_pyc = self._timestamp(pathname + self.ext)
    if t_py is None and t_pyc is None:
      return None

    code = None
    if t_py is None or (t_pyc is not None and t_pyc >= t_py):
      f = open(pathname + self.ext, 'rb')
      try:
        if f.read(4) == imp.get_magic():
          t = struct.unpack('<I', f.read(4))[0]
          # with no source file there is nothing for the compiled file to
          # be stale against, so accept it as it is.
          if t_py is None or t == t_py:
            code = marshal.load(f)
      finally:
        f.close()

    if code is None:
      if t_py is None:
        # only a compiled file exists and it is not usable (wrong magic)
        return None
      code = self._compile(pathname + '.py', t_py)
    return ispkg, code, values

  def _timestamp(self, pathname):
    """Return the modification time of pathname, or None if it cannot be stat'ed.

    Relies on self.os, which get_code() sets up before calling this.
    """
    try:
      s = self.os.stat(pathname)
    except OSError:
      return None
    # item 8 of the stat tuple is the modification time
    return long(s[8])

  def _compile(self, pathname, timestamp):
    """Compile the source file at pathname and try to cache the result.

    timestamp is the source's modification time; it is stored in the
    compiled file so that staleness can be detected later. Failure to
    write the compiled file is ignored. Returns the code object.
    """
    src = open(pathname, 'r')
    try:
      codestring = src.read()
    finally:
      src.close()
    if codestring and codestring[-1] != '\n':
      codestring = codestring + '\n'
    code = __builtin__.compile(codestring, pathname, 'exec')

    # try to cache the compiled code. this is best effort only: the
    # directory may be read-only, and open()/write() signal that with
    # IOError rather than OSError.
    try:
      f = open(pathname + self.ext_char, 'wb')
      try:
        # write a placeholder first and the real magic number last, so that
        # an interrupted write never leaves a file that looks valid.
        f.write('\0\0\0\0')
        f.write(struct.pack('<I', timestamp))
        marshal.dump(code, f)
        f.flush()
        f.seek(0, 0)
        f.write(imp.get_magic())
      finally:
        f.close()
    except (IOError, OSError):
      pass

    return code

  def __repr__(self):
    return '<%s.%s for "%s" at 0x%x>' % (self.__class__.__module__,
                                         self.__class__.__name__,
                                         self.dir,
                                         id(self))
 | |
| 
 | |
def _test_dir():
  "Debug/test helper: install one DirectoryImporter per sys.path entry."
  # build a reversed copy of sys.path so that its first entry is installed
  # last. the most recently installed hook is the one Python calls first.
  dirs = []
  for entry in sys.path:
    dirs.insert(0, entry)
  for entry in dirs:
    importer = DirectoryImporter(entry)
    importer.install()
 | |
| 
 | |
| ######################################################################
 | 
