diff options
author | Greg Stein <gstein@lyra.org> | 2000-01-03 02:38:29 (GMT) |
---|---|---|
committer | Greg Stein <gstein@lyra.org> | 2000-01-03 02:38:29 (GMT) |
commit | f23aa1ee9facd990c8cf102ed69d56e2a688730d (patch) | |
tree | cd7addcc9f2de4ec95b94bea0f2d2c395261cd8e | |
parent | bb05b2520dc65f9c637d012f015f7b965a44d0f7 (diff) | |
download | cpython-f23aa1ee9facd990c8cf102ed69d56e2a688730d.zip cpython-f23aa1ee9facd990c8cf102ed69d56e2a688730d.tar.gz cpython-f23aa1ee9facd990c8cf102ed69d56e2a688730d.tar.bz2 |
redesign/rebuild around the ImportManager concept.
-rw-r--r-- | Lib/imputil.py | 440 |
1 files changed, 291 insertions, 149 deletions
diff --git a/Lib/imputil.py b/Lib/imputil.py index 6d70938..3417ea6 100644 --- a/Lib/imputil.py +++ b/Lib/imputil.py @@ -27,105 +27,105 @@ import __builtin__ import struct import marshal -class Importer: - "Base class for replacing standard import functions." +_StringType = type('') +_ModuleType = type(sys) + +class ImportManager: + "Manage the import process." def install(self): + ### warning: Python 1.6 will have a different hook mechanism; this + ### code will need to change. self.__chain_import = __builtin__.__import__ self.__chain_reload = __builtin__.reload __builtin__.__import__ = self._import_hook - __builtin__.reload = self._reload_hook + ### fix this + #__builtin__.reload = None + #__builtin__.reload = self._reload_hook + + def add_suffix(self, suffix, importer): + assert isinstance(importer, SuffixImporter) + self.suffixes.append((suffix, importer)) ###################################################################### # # PRIVATE METHODS # - def _import_hook(self, name, globals=None, locals=None, fromlist=None): - """Python calls this hook to locate and import a module. + def __init__(self): + # we're definitely going to be importing something in the future, + # so let's just load the OS-related facilities. + if not _os_stat: + _os_bootstrap() - This method attempts to load the (dotted) module name. If it cannot - find it, then it delegates the import to the next import hook in the - chain (where "next" is defined as the import hook that was in place - at the time this Importer instance was installed). - """ + # Initialize the set of suffixes that we recognize and import. + # The default will import dynamic-load modules first, followed by + # .py files (or a .py file's cached bytecode) + self.suffixes = [ ] + for desc in imp.get_suffixes(): + if desc[2] == imp.C_EXTENSION: + self.suffixes.append((desc[0], DynLoadSuffixImporter(desc))) + self.suffixes.append(('.py', PySuffixImporter())) + + # This is the importer that we use for grabbing stuff from the + # filesystem. It defines one more method (import_from_dir) for our use. + self.fs_imp = _FilesystemImporter(self.suffixes) - ### insert a fast-path check for whether the module is already - ### loaded? use a variant of _determine_import_context() which - ### returns a context regardless of Importer used. generate an - ### fqname and look in sys.modules for it. + def _import_hook(self, fqname, globals=None, locals=None, fromlist=None): + """Python calls this hook to locate and import a module.""" - ### note that given module a.b which imports c, if c is already - ### loaded, python still wants to look for a.c + parts = strop.split(fqname, '.') # determine the context of this import parent = self._determine_import_context(globals) - # import the module within the context, or from the default context - top, tail = self._import_top_module(parent, name) - if top is None: - # the module was not found; delegate to the next import hook - return self.__chain_import(name, globals, locals, fromlist) - - # the top module may be under the control of a different importer. - # if so, then defer to that importer for completion of the import. - # note it may be self, or is undefined so we (self) may as well - # finish the import. - importer = top.__dict__.get('__importer__', self) - return importer._finish_import(top, tail, fromlist) - - def _finish_import(self, top, tail, fromlist): - # if "a.b.c" was provided, then load the ".b.c" portion down from - # below the top-level module. - bottom = self._load_tail(top, tail) - - # if the form is "import a.b.c", then return "a" - if not fromlist: - # no fromlist: return the top of the import tree - return top - - # the top module was imported by self, or it was not imported through - # the Importer mechanism and self is simply handling the import of - # the sub-modules and fromlist. - # - # this means that the bottom module was also imported by self, or we - # are handling things in the absence of a prior Importer - # - # ### why the heck are we handling it? what is the example scenario - # ### where this happens? note that we can't determine is_package() - # ### for non-Importer modules. - # - # since we imported/handled the bottom module, this means that we can - # also handle its fromlist (and reliably determine is_package()). - - # if the bottom node is a package, then (potentially) import some modules. - # - # note: if it is not a package, then "fromlist" refers to names in - # the bottom module rather than modules. - # note: for a mix of names and modules in the fromlist, we will - # import all modules and insert those into the namespace of - # the package module. Python will pick up all fromlist names - # from the bottom (package) module; some will be modules that - # we imported and stored in the namespace, others are expected - # to be present already. - if self._is_package(bottom.__dict__): - self._import_fromlist(bottom, fromlist) - - # if the form is "from a.b import c, d" then return "b" - return bottom - - def _reload_hook(self, module): - "Python calls this hook to reload a module." + # if there is a parent, then its importer should manage this import + if parent: + module = parent.__importer__._do_import(parent, parts, fromlist) + if module: + return module - # reloading of a module may or may not be possible (depending on the - # importer), but at least we can validate that it's ours to reload - importer = module.__dict__.get('__importer__', None) - if importer is not self: - return self.__chain_reload(module) + # has the top module already been imported? + try: + top_module = sys.modules[parts[0]] + except KeyError: - # okay. it is ours, but we don't know what to do (yet) - ### we should blast the module dict and do another get_code(). need to - ### flesh this out and add proper docco... - raise SystemError, "reload not yet implemented" + # look for the topmost module + top_module = self._import_top_module(parts[0]) + if not top_module: + # the topmost module wasn't found at all. + raise ImportError, 'No module named ' + fqname + return self.__chain_import(name, globals, locals, fromlist) + + # fast-path simple imports + if len(parts) == 1: + if not fromlist: + return top_module + + if not top_module.__dict__.get('__ispkg__'): + # __ispkg__ isn't defined (the module was not imported by us), or + # it is zero. + # + # In the former case, there is no way that we could import + # sub-modules that occur in the fromlist (but we can't raise an + # error because it may just be names) because we don't know how + # to deal with packages that were imported by other systems. + # + # In the latter case (__ispkg__ == 0), there can't be any sub- + # modules present, so we can just return. + # + # In both cases, since len(parts) == 1, the top_module is also + # the "bottom" which is the defined return when a fromlist exists. + return top_module + + importer = top_module.__dict__.get('__importer__') + if importer: + return importer._finish_import(top_module, parts[1:], fromlist) + + # If the importer does not exist, then we have to bail. A missing importer + # means that something else imported the module, and we have no knowledge + # of how to get sub-modules out of the thing. + raise ImportError, 'No module named ' + fqname + return self.__chain_import(name, globals, locals, fromlist) def _determine_import_context(self, globals): """Returns the context in which a module should be imported. @@ -136,19 +136,19 @@ class Importer: "top-level" module. """ - if not globals or \ - globals.get('__importer__', None) is not self: - # globals does not refer to one of our modules or packages. - # That implies there is no relative import context, and it - # should just pick it off the standard path. + if not globals or not globals.get('__importer__'): + # globals does not refer to one of our modules or packages. That + # implies there is no relative import context (as far as we are + # concerned), and it should just pick it off the standard path. return None # The globals refer to a module or package of ours. It will define # the context of the new import. Get the module/package fqname. parent_fqname = globals['__name__'] - # for a package, return itself (imports refer to pkg contents) - if self._is_package(globals): + # if a package is performing the import, then return itself (imports + # refer to pkg contents) + if globals['__ispkg__']: parent = sys.modules[parent_fqname] assert globals is parent.__dict__ return parent @@ -159,46 +159,88 @@ class Importer: if i == -1: return None - # for a module in a package, return the package (imports refer to siblings) + # if a module in a package is performing the import, then return the + # package (imports refer to siblings) parent_fqname = parent_fqname[:i] parent = sys.modules[parent_fqname] assert parent.__name__ == parent_fqname return parent - def _import_top_module(self, parent, name): - """Locate the top of the import tree (relative or absolute). + def _import_top_module(self, name): + # scan sys.path looking for a location in the filesystem that contains + # the module, or an Importer object that can import the module. + for item in sys.path: + if type(item) == _StringType: + module = self.fs_imp.import_from_dir(item, name) + else: + module = item.import_top(name) + if module: + return module + return None + + def _reload_hook(self, module): + "Python calls this hook to reload a module." - parent defines the context in which the import should occur. See - _determine_import_context() for details. + # reloading of a module may or may not be possible (depending on the + # importer), but at least we can validate that it's ours to reload + importer = module.__dict__.get('__importer__') + if not importer: + return self.__chain_reload(module) - Returns a tuple (module, tail). module is the loaded (top-level) module, - or None if the module is not found. tail is the remaining portion of - the dotted name. - """ - i = strop.find(name, '.') - if i == -1: - head = name - tail = "" - else: - head = name[:i] - tail = name[i+1:] - if parent: - fqname = "%s.%s" % (parent.__name__, head) - else: - fqname = head - module = self._import_one(parent, head, fqname) - if module: - # the module was relative, or no context existed (the module was - # simply found on the path). - return module, tail - if parent: - # we tried relative, now try an absolute import (from the path) - module = self._import_one(None, head, head) - if module: - return module, tail + # okay. it is using the imputil system, and we must delegate it, but + # we don't know what to do (yet) + ### we should blast the module dict and do another get_code(). need to + ### flesh this out and add proper docco... + raise SystemError, "reload not yet implemented" - # the module wasn't found - return None, None + +class Importer: + "Base class for replacing standard import functions." + + def install(self): + sys.path.insert(0, self) + + def import_top(self, name): + "Import a top-level module." + return self._import_one(None, name, name) + + ###################################################################### + # + # PRIVATE METHODS + # + def _finish_import(self, top, parts, fromlist): + # if "a.b.c" was provided, then load the ".b.c" portion down from + # below the top-level module. + bottom = self._load_tail(top, parts) + + # if the form is "import a.b.c", then return "a" + if not fromlist: + # no fromlist: return the top of the import tree + return top + + # the top module was imported by self. + # + # this means that the bottom module was also imported by self (just + # now, or in the past and we fetched it from sys.modules). + # + # since we imported/handled the bottom module, this means that we can + # also handle its fromlist (and reliably use __ispkg__). + + # if the bottom node is a package, then (potentially) import some modules. + # + # note: if it is not a package, then "fromlist" refers to names in + # the bottom module rather than modules. + # note: for a mix of names and modules in the fromlist, we will + # import all modules and insert those into the namespace of + # the package module. Python will pick up all fromlist names + # from the bottom (package) module; some will be modules that + # we imported and stored in the namespace, others are expected + # to be present already. + if bottom.__ispkg__: + self._import_fromlist(bottom, fromlist) + + # if the form is "from a.b import c, d" then return "b" + return bottom def _import_one(self, parent, modname, fqname): "Import a single module." @@ -214,46 +256,53 @@ class Importer: if result is None: return None + ### backwards-compat + if len(result) == 2: + result = result + ({},) + + module = self._process_result(result, fqname) + + # insert the module into its parent + if parent: + setattr(parent, modname, module) + return module + + def _process_result(self, (ispkg, code, values), fqname): # did get_code() return an actual module? (rather than a code object) - is_module = type(result[1]) is type(sys) + is_module = type(code) is _ModuleType # use the returned module, or create a new one to exec code into if is_module: - module = result[1] + module = code else: module = imp.new_module(fqname) ### record packages a bit differently?? module.__importer__ = self - module.__ispkg__ = result[0] + module.__ispkg__ = ispkg - # if present, the third item is a set of values to insert into the module - if len(result) > 2: - module.__dict__.update(result[2]) + # insert additional values into the module (before executing the code) + module.__dict__.update(values) # the module is almost ready... make it visible sys.modules[fqname] = module # execute the code within the module's namespace if not is_module: - exec result[1] in module.__dict__ + exec code in module.__dict__ - # insert the module into its parent - if parent: - setattr(parent, modname, module) return module - def _load_tail(self, m, tail): + def _load_tail(self, m, parts): """Import the rest of the modules, down from the top-level module. Returns the last module in the dotted list of modules. """ - if tail: - for part in strop.splitfields(tail, '.'): - fqname = "%s.%s" % (m.__name__, part) - m = self._import_one(m, part, fqname) - if not m: - raise ImportError, "No module named " + fqname + for part in parts: + fqname = "%s.%s" % (m.__name__, part) + m = self._import_one(m, part, fqname) + if not m: + raise ImportError, "No module named " + fqname return m def _import_fromlist(self, package, fromlist): @@ -273,17 +322,20 @@ class Importer: if not submod: raise ImportError, "cannot import name " + subname - def _is_package(self, module_dict): - """Determine if a given module (dictionary) specifies a package. - - The package status is in the module-level name __ispkg__. The module - must also have been imported by self, so that we can reliably apply - semantic meaning to __ispkg__. + def _do_import(self, parent, parts, fromlist): + """Attempt to import the module relative to parent. - ### weaken the test to issubclass(Importer)? + This method is used when the import context specifies that <self> + imported the parent module. """ - return module_dict.get('__importer__', None) is self and \ - module_dict['__ispkg__'] + top_name = parts[0] + top_fqname = parent.__name__ + '.' + top_name + top_module = self._import_one(parent, top_name, top_fqname) + if not top_module: + # this importer and parent could not find the module (relatively) + return None + + return self._finish_import(top_module, parts[1:], fromlist) ###################################################################### # @@ -301,7 +353,7 @@ class Importer: dotted name from the "root" of the module namespace down to the modname. If there is no parent, then modname==fqname. - This method should return None, a 2-tuple, or a 3-tuple. + This method should return None, or a 3-tuple. * If the module was not found, then None should be returned. @@ -312,9 +364,9 @@ class Importer: executed within the new module's namespace). This item can also be a fully-loaded module object (e.g. loaded from a shared lib). - * If present, the third item is a dictionary of name/value pairs that - will be inserted into new module before the code object is executed. - This provided in case the module's code expects certain values (such + * The third item is a dictionary of name/value pairs that will be + inserted into new module before the code object is executed. This + is provided in case the module's code expects certain values (such as where the module was found). When the second item is a module object, then these names/values will be inserted *after* the module has been loaded/initialized. @@ -653,6 +705,92 @@ class BuiltinImporter(Importer): ###################################################################### +# +# Internal importer used for importing from the filesystem +# +class _FilesystemImporter(Importer): + def __init__(self, suffixes): + # this list is shared with the ImportManager. + self.suffixes = suffixes + + def import_from_dir(self, dir, fqname): + result = self._import_pathname(_os_path_join(dir, fqname), fqname) + if result: + return self._process_result(result, fqname) + return None + + def get_code(self, parent, modname, fqname): + # This importer is never used with an empty parent. Its existence is + # private to the ImportManager. The ImportManager uses the + # import_from_dir() method to import top-level modules/packages. + # This method is only used when we look for a module within a package. + assert parent + + return self._import_pathname(_os_path_join(parent.__pkgdir__, modname), + fqname) + + def _import_pathname(self, pathname, fqname): + if _os_path_isdir(pathname): + result = self._import_pathname(_os_path_join(pathname, '__init__'), + fqname) + if result: + values = result[2] + values['__pkgdir__'] = pathname + values['__path__'] = [ pathname ] + return 1, result[1], values + return None + + for suffix, importer in self.suffixes: + filename = pathname + suffix + try: + finfo = _os_stat(filename) + except OSError: + pass + else: + return importer.import_file(filename, finfo, fqname) + return None + +###################################################################### +# +# SUFFIX-BASED IMPORTERS +# + +class SuffixImporter: + def import_file(self, filename, finfo, fqname): + raise RuntimeError + +class PySuffixImporter(SuffixImporter): + def import_file(self, filename, finfo, fqname): + file = filename[:-3] + _suffix + t_py = long(finfo[8]) + t_pyc = _timestamp(file) + + code = None + if t_pyc is not None and t_pyc >= t_py: + f = open(file, 'rb') + if f.read(4) == imp.get_magic(): + t = struct.unpack('<I', f.read(4))[0] + if t == t_py: + code = marshal.load(f) + f.close() + if code is None: + file = filename + code = _compile(file, t_py) + + return 0, code, { '__file__' : file } + +class DynLoadSuffixImporter(SuffixImporter): + def __init__(self, desc): + self.desc = desc + + def import_file(self, filename, finfo, fqname): + fp = open(filename, self.desc[1]) + module = imp.load_module(fqname, fp, filename, self.desc) + module.__file__ = filename + return 0, module, { } + + +###################################################################### def _test_dir(): "Debug/test function to create DirectoryImporters from sys.path." @@ -675,4 +813,8 @@ def _print_importers(): else: print name, '-- non-existent module' +def _test_revamp(): + ImportManager().install() + sys.path.insert(0, BuiltinImporter()) + ###################################################################### |