1998-03-05 11:42:00 +08:00
|
|
|
"""Find modules used by a script, using introspection."""
|
2002-11-26 04:21:59 +08:00
|
|
|
|
1998-03-05 11:42:00 +08:00
|
|
|
import dis
|
2015-05-03 09:15:18 +08:00
|
|
|
import importlib._bootstrap_external
|
2012-12-23 08:34:21 +08:00
|
|
|
import importlib.machinery
|
1998-03-05 11:42:00 +08:00
|
|
|
import marshal
|
|
|
|
import os
|
2020-04-15 03:16:06 +08:00
|
|
|
import io
|
1998-03-05 11:42:00 +08:00
|
|
|
import sys
|
2019-04-07 16:00:41 +08:00
|
|
|
|
|
|
|
# Module-kind codes carried over from the old ``imp`` module.  They appear
# as the third element of the ``(suffix, mode, kind)`` description tuples
# used throughout this file.  Note that the value 4 is not used here.
_SEARCH_ERROR, _PY_SOURCE, _PY_COMPILED, _C_EXTENSION = range(4)
_PKG_DIRECTORY, _C_BUILTIN, _PY_FROZEN = 5, 6, 7
|
|
|
|
|
1998-05-19 04:21:56 +08:00
|
|
|
# Modulefinder does a good job at simulating Python's import machinery, but
# it cannot handle __path__ modifications packages make at runtime.
# Therefore there is a mechanism whereby you can register extra paths in
# this map for a package, and it will be honored.

# Note: this is a mapping from package names to lists of paths.
|
|
|
|
packagePathMap = {}


# A Public interface
def AddPackagePath(packagename, path):
    """Register *path* as an additional search directory for *packagename*.

    Paths accumulate per package name in ``packagePathMap``, in the order
    in which they were registered.
    """
    registered = packagePathMap.get(packagename)
    if registered is None:
        registered = packagePathMap[packagename] = []
    registered.append(path)
|
1998-03-05 11:42:00 +08:00
|
|
|
|
2002-11-15 02:45:11 +08:00
|
|
|
replacePackageMap = {}


# Some packages inject themselves into sys.modules at runtime under the
# name of another package.  To let modulefinder cope with that, call
#     ReplacePackage("real_package_name", "faked_package_name")
# before running ModuleFinder.
def ReplacePackage(oldname, newname):
    """Record that package *oldname* should be treated as *newname*.

    A later call with the same *oldname* overwrites the earlier entry in
    ``replacePackageMap``.
    """
    replacePackageMap.update({oldname: newname})
|
|
|
|
|
|
|
|
|
2019-04-07 16:00:41 +08:00
|
|
|
def _find_module(name, path=None):
    """An importlib reimplementation of imp.find_module (for our purposes).

    Returns a ``(file, pathname, (suffix, mode, kind))`` triple, where
    *kind* is one of the module-level ``_PY_SOURCE``-style constants:

    * built-in and frozen modules: ``(None, None, ("", "", kind))``;
    * packages: ``(None, <package directory>, ("", "", _PKG_DIRECTORY))``;
    * source, bytecode and extension files: an open binary file object
      (the caller is responsible for closing it), the file path, and
      ``(<file extension>, "rb", kind)``.

    Raises ImportError when no spec is found for *name*, and also when the
    spec has no loader.  PathFinder yields such a loader-less spec for a
    namespace package (a directory without ``__init__``), which
    imp.find_module never reported as found either.
    """
    # It's necessary to clear the caches for our Finder first, in case any
    # modules are being added/deleted/modified at runtime. In particular,
    # test_modulefinder.py changes file tree contents in a cache-breaking way:
    importlib.machinery.PathFinder.invalidate_caches()

    spec = importlib.machinery.PathFinder.find_spec(name, path)

    if spec is None:
        raise ImportError("No module named {name!r}".format(name=name), name=name)

    loader = spec.loader

    # Some special cases:

    if loader is importlib.machinery.BuiltinImporter:
        return None, None, ("", "", _C_BUILTIN)

    if loader is importlib.machinery.FrozenImporter:
        return None, None, ("", "", _PY_FROZEN)

    if loader is None:
        # Without a loader there is nothing to classify or open; calling
        # loader.is_package() below would fail with AttributeError.
        raise ImportError("No module named {name!r}".format(name=name), name=name)

    file_path = spec.origin

    if loader.is_package(name):
        return None, os.path.dirname(file_path), ("", "", _PKG_DIRECTORY)

    if isinstance(loader, importlib.machinery.SourceFileLoader):
        kind = _PY_SOURCE

    elif isinstance(loader, importlib.machinery.ExtensionFileLoader):
        kind = _C_EXTENSION

    elif isinstance(loader, importlib.machinery.SourcelessFileLoader):
        kind = _PY_COMPILED

    else:  # Should never happen.
        return None, None, ("", "", _SEARCH_ERROR)

    file = io.open_code(file_path)
    suffix = os.path.splitext(file_path)[-1]

    return file, file_path, (suffix, "rb", kind)
|
2019-04-07 16:00:41 +08:00
|
|
|
|
|
|
|
|
1998-03-05 11:42:00 +08:00
|
|
|
class Module:
    """Lightweight record describing one module found by the finder."""

    def __init__(self, name, file=None, path=None):
        self.__name__ = name
        self.__file__ = file
        self.__path__ = path
        self.__code__ = None
        # Global names assigned to in the module, including the names
        # pulled in through star-imports of Python modules.
        self.globalnames = {}
        # Star-imports done by this module that could not be resolved,
        # i.e. star-imports from non-Python modules.
        self.starimports = {}

    def __repr__(self):
        # The name is always shown; file and path only when they are set.
        shown = [self.__name__]
        shown.extend(
            value for value in (self.__file__, self.__path__)
            if value is not None
        )
        return "Module(%s)" % ", ".join(map(repr, shown))
|
1998-03-05 11:42:00 +08:00
|
|
|
|
|
|
|
class ModuleFinder:
    """Find the modules a script imports by scanning compiled code.

    Modules that were located are collected in ``self.modules`` (fully
    qualified name -> Module).  Imports that could not be resolved are
    collected in ``self.badmodules`` (name -> {importer name: 1}).
    """

    def __init__(self, path=None, debug=0, excludes=None, replace_paths=None):
        """Set up an empty finder.

        path          -- directories to search; defaults to sys.path
        debug         -- verbosity; msg() prints messages whose level is
                         less than or equal to this value
        excludes      -- fully qualified module names that find_module()
                         refuses to locate
        replace_paths -- (old_prefix, new_prefix) pairs applied to
                         co_filename by replace_paths_in_code()
        """
        if path is None:
            path = sys.path
        self.path = path
        self.modules = {}
        self.badmodules = {}
        self.debug = debug
        self.indent = 0
        self.excludes = excludes if excludes is not None else []
        self.replace_paths = replace_paths if replace_paths is not None else []
        self.processed_paths = []   # Used in debugging only

    def msg(self, level, str, *args):
        """Print *str* and the repr of each arg if level <= self.debug.

        The line is prefixed once per current indentation level.
        """
        if level <= self.debug:
            for i in range(self.indent):
                print(" ", end=' ')
            print(str, end=' ')
            for arg in args:
                print(repr(arg), end=' ')
            print()

    def msgin(self, *args):
        """Like msg(), but first increase the indentation (if enabled)."""
        level = args[0]
        if level <= self.debug:
            self.indent = self.indent + 1
        self.msg(*args)

    def msgout(self, *args):
        """Like msg(), but first decrease the indentation (if enabled).

        Must only be used to close a preceding msgin() of the same level;
        use msg() for stand-alone messages.
        """
        level = args[0]
        if level <= self.debug:
            self.indent = self.indent - 1
        self.msg(*args)

    def run_script(self, pathname):
        """Load the file *pathname* as the ``__main__`` module."""
        self.msg(2, "run_script", pathname)
        with io.open_code(pathname) as fp:
            stuff = ("", "rb", _PY_SOURCE)
            self.load_module('__main__', fp, pathname, stuff)

    def load_file(self, pathname):
        """Load *pathname* as Python source, named after its base name."""
        dir, name = os.path.split(pathname)
        name, ext = os.path.splitext(name)
        with io.open_code(pathname) as fp:
            stuff = (ext, "rb", _PY_SOURCE)
            self.load_module(name, fp, pathname, stuff)

    def import_hook(self, name, caller=None, fromlist=None, level=-1):
        """Simulate ``import name`` / ``from name import fromlist``.

        Returns the head package module when *fromlist* is empty and None
        otherwise.  Raises ImportError if a component cannot be found.
        """
        self.msg(3, "import_hook", name, caller, fromlist, level)
        parent = self.determine_parent(caller, level=level)
        q, tail = self.find_head_package(parent, name)
        m = self.load_tail(q, tail)
        if not fromlist:
            return q
        if m.__path__:
            self.ensure_fromlist(m, fromlist)
        return None

    def determine_parent(self, caller, level=-1):
        """Return the package an import done by *caller* is relative to.

        Returns None when there is no caller, when level is 0 (absolute
        import), or when the caller is a top-level non-package module and
        level is negative.  Raises ImportError when a relative import
        climbs above the top-level package.
        """
        self.msgin(4, "determine_parent", caller, level)
        if not caller or level == 0:
            self.msgout(4, "determine_parent -> None")
            return None
        pname = caller.__name__
        if level >= 1:  # relative import
            if caller.__path__:
                # A package counts as its own first level.
                level -= 1
            if level == 0:
                parent = self.modules[pname]
                assert parent is caller
                self.msgout(4, "determine_parent ->", parent)
                return parent
            if pname.count(".") < level:
                # Close the msgin() above, as the other raising methods do.
                self.msgout(4, "raise ImportError: relative importpath too deep")
                raise ImportError("relative importpath too deep")
            pname = ".".join(pname.split(".")[:-level])
            parent = self.modules[pname]
            self.msgout(4, "determine_parent ->", parent)
            return parent
        if caller.__path__:
            parent = self.modules[pname]
            assert caller is parent
            self.msgout(4, "determine_parent ->", parent)
            return parent
        if '.' in pname:
            i = pname.rfind('.')
            pname = pname[:i]
            parent = self.modules[pname]
            assert parent.__name__ == pname
            self.msgout(4, "determine_parent ->", parent)
            return parent
        self.msgout(4, "determine_parent -> None")
        return None

    def find_head_package(self, parent, name):
        """Import the first dotted component of *name*.

        The component is first looked up inside *parent* (if any) and then
        as a top-level module.  Returns ``(module, remaining_dotted_name)``
        or raises ImportError.
        """
        self.msgin(4, "find_head_package", parent, name)
        head, _, tail = name.partition('.')
        if parent:
            qname = "%s.%s" % (parent.__name__, head)
        else:
            qname = head
        q = self.import_module(head, qname, parent)
        if q:
            self.msgout(4, "find_head_package ->", (q, tail))
            return q, tail
        if parent:
            # Not a submodule of the parent: retry as a top-level module.
            qname = head
            parent = None
            q = self.import_module(head, qname, parent)
            if q:
                self.msgout(4, "find_head_package ->", (q, tail))
                return q, tail
        self.msgout(4, "raise ImportError: No module named", qname)
        raise ImportError("No module named " + qname)

    def load_tail(self, q, tail):
        """Import each remaining component of *tail* below module *q*.

        Returns the innermost module; raises ImportError if a component
        cannot be imported.
        """
        self.msgin(4, "load_tail", q, tail)
        m = q
        while tail:
            head, _, tail = tail.partition('.')
            mname = "%s.%s" % (m.__name__, head)
            m = self.import_module(head, mname, m)
            if not m:
                self.msgout(4, "raise ImportError: No module named", mname)
                raise ImportError("No module named " + mname)
        self.msgout(4, "load_tail ->", m)
        return m

    def ensure_fromlist(self, m, fromlist, recursive=0):
        """Import every name in *fromlist* that is not an attribute of *m*.

        A ``"*"`` entry is expanded (once) to the submodules found on disk
        by find_all_submodules().  Raises ImportError for a name that
        cannot be imported as a submodule.
        """
        self.msg(4, "ensure_fromlist", m, fromlist, recursive)
        for sub in fromlist:
            if sub == "*":
                if not recursive:
                    submodules = self.find_all_submodules(m)
                    if submodules:
                        self.ensure_fromlist(m, submodules, 1)
            elif not hasattr(m, sub):
                subname = "%s.%s" % (m.__name__, sub)
                submod = self.import_module(sub, subname, m)
                if not submod:
                    raise ImportError("No module named " + subname)

    def find_all_submodules(self, m):
        """Return the names of candidate submodules in m.__path__.

        Returns None when *m* has no __path__.  Otherwise returns a keys
        view of the names of all directory entries that end in an
        extension, source or bytecode suffix, except ``__init__``.
        """
        if not m.__path__:
            return
        modules = {}
        # 'suffixes' used to be a list hardcoded to [".py", ".pyc"].
        # But we must also collect Python extension modules - although
        # we cannot separate normal dlls from Python extensions.
        suffixes = []
        suffixes += importlib.machinery.EXTENSION_SUFFIXES[:]
        suffixes += importlib.machinery.SOURCE_SUFFIXES[:]
        suffixes += importlib.machinery.BYTECODE_SUFFIXES[:]
        for dir in m.__path__:
            try:
                names = os.listdir(dir)
            except OSError:
                self.msg(2, "can't list directory", dir)
                continue
            for name in names:
                mod = None
                for suff in suffixes:
                    if name.endswith(suff):
                        mod = name[:-len(suff)]
                        break
                if mod and mod != "__init__":
                    modules[mod] = mod
        return modules.keys()

    def import_module(self, partname, fqname, parent):
        """Locate and load module *fqname*; return it, or None on failure.

        Already loaded modules are returned from self.modules.  None is
        returned for names in self.badmodules, for a *parent* without a
        __path__, and when find_module() raises ImportError.
        """
        self.msgin(3, "import_module", partname, fqname, parent)
        try:
            m = self.modules[fqname]
        except KeyError:
            pass
        else:
            self.msgout(3, "import_module ->", m)
            return m
        if fqname in self.badmodules:
            self.msgout(3, "import_module -> None")
            return None
        if parent and parent.__path__ is None:
            self.msgout(3, "import_module -> None")
            return None
        try:
            fp, pathname, stuff = self.find_module(partname,
                                                   parent and parent.__path__, parent)
        except ImportError:
            self.msgout(3, "import_module ->", None)
            return None

        try:
            m = self.load_module(fqname, fp, pathname, stuff)
        finally:
            if fp:
                fp.close()
        if parent:
            setattr(parent, partname, m)
        self.msgout(3, "import_module ->", m)
        return m

    def load_module(self, fqname, fp, pathname, file_info):
        """Create the Module for *fqname* and scan its code, if any.

        *file_info* is the ``(suffix, mode, kind)`` tuple produced by
        find_module().  Packages are delegated to load_package(); source
        is compiled; bytecode is validated and unmarshalled; any other
        kind gets a Module without code.
        """
        suffix, mode, kind = file_info
        self.msgin(2, "load_module", fqname, fp and "fp", pathname)
        if kind == _PKG_DIRECTORY:
            m = self.load_package(fqname, pathname)
            self.msgout(2, "load_module ->", m)
            return m
        if kind == _PY_SOURCE:
            co = compile(fp.read(), pathname, 'exec')
        elif kind == _PY_COMPILED:
            try:
                data = fp.read()
                importlib._bootstrap_external._classify_pyc(data, fqname, {})
            except ImportError as exc:
                self.msgout(2, "raise ImportError: " + str(exc), pathname)
                raise
            # The marshalled code object follows the 16 header bytes.
            co = marshal.loads(memoryview(data)[16:])
        else:
            co = None
        m = self.add_module(fqname)
        m.__file__ = pathname
        if co:
            if self.replace_paths:
                co = self.replace_paths_in_code(co)
            m.__code__ = co
            self.scan_code(co, m)
        self.msgout(2, "load_module ->", m)
        return m

    def _add_badmodule(self, name, caller):
        """Record that *caller* (or "-" if there is none) failed to import *name*."""
        importers = self.badmodules.setdefault(name, {})
        if caller:
            importers[caller.__name__] = 1
        else:
            importers["-"] = 1

    def _safe_import_hook(self, name, caller, fromlist, level=-1):
        """Wrapper for import_hook() that records failures instead of raising.

        ImportError and SyntaxError are logged and registered with
        _add_badmodule(), both for *name* itself and for each entry of
        *fromlist*.
        """
        if name in self.badmodules:
            self._add_badmodule(name, caller)
            return
        try:
            self.import_hook(name, caller, level=level)
        except ImportError as msg:
            self.msg(2, "ImportError:", str(msg))
            self._add_badmodule(name, caller)
        except SyntaxError as msg:
            self.msg(2, "SyntaxError:", str(msg))
            self._add_badmodule(name, caller)
        else:
            if fromlist:
                for sub in fromlist:
                    fullname = name + "." + sub
                    if fullname in self.badmodules:
                        self._add_badmodule(fullname, caller)
                        continue
                    try:
                        self.import_hook(name, caller, [sub], level=level)
                    except ImportError as msg:
                        self.msg(2, "ImportError:", str(msg))
                        self._add_badmodule(fullname, caller)
                    except SyntaxError as msg:
                        # A submodule that fails to compile is handled the
                        # same way as a failing plain import above.
                        self.msg(2, "SyntaxError:", str(msg))
                        self._add_badmodule(fullname, caller)

    def scan_opcodes(self, co):
        """Yield ``(what, args)`` for the stores and imports found in *co*.

        *what* is "store", "absolute_import" or "relative_import".
        Relies on the private helpers dis._find_store_names() and
        dis._find_imports().
        """
        # Scan the code, and yield 'interesting' opcode combinations
        for name in dis._find_store_names(co):
            yield "store", (name,)
        for name, level, fromlist in dis._find_imports(co):
            if level == 0:  # absolute import
                yield "absolute_import", (fromlist, name)
            else:  # relative import
                yield "relative_import", (level, fromlist, name)

    def scan_code(self, co, m):
        """Process the imports and global stores of *co* on behalf of *m*.

        Nested code objects found in co.co_consts are scanned recursively.
        """
        scanner = self.scan_opcodes
        for what, args in scanner(co):
            if what == "store":
                name, = args
                m.globalnames[name] = 1
            elif what == "absolute_import":
                fromlist, name = args
                have_star = 0
                if fromlist is not None:
                    if "*" in fromlist:
                        have_star = 1
                    fromlist = [f for f in fromlist if f != "*"]
                self._safe_import_hook(name, m, fromlist, level=0)
                if have_star:
                    # We've encountered an "import *". If it is a Python module,
                    # the code has already been parsed and we can suck out the
                    # global names.
                    mm = None
                    if m.__path__:
                        # At this point we don't know whether 'name' is a
                        # submodule of 'm' or a global module. Let's just try
                        # the full name first.
                        mm = self.modules.get(m.__name__ + "." + name)
                    if mm is None:
                        mm = self.modules.get(name)
                    if mm is not None:
                        m.globalnames.update(mm.globalnames)
                        m.starimports.update(mm.starimports)
                        if mm.__code__ is None:
                            m.starimports[name] = 1
                    else:
                        m.starimports[name] = 1
            elif what == "relative_import":
                level, fromlist, name = args
                if name:
                    self._safe_import_hook(name, m, fromlist, level=level)
                else:
                    parent = self.determine_parent(m, level=level)
                    self._safe_import_hook(parent.__name__, None, fromlist, level=0)
            else:
                # We don't expect anything else from the generator.
                raise RuntimeError(what)

        for c in co.co_consts:
            if isinstance(c, type(co)):
                self.scan_code(c, m)

    def load_package(self, fqname, pathname):
        """Create the package Module for *fqname* and load its __init__.

        The name is first translated through replacePackageMap, and any
        directories registered in packagePathMap are appended to __path__.
        """
        self.msgin(2, "load_package", fqname, pathname)
        newname = replacePackageMap.get(fqname)
        if newname:
            fqname = newname
        m = self.add_module(fqname)
        m.__file__ = pathname
        m.__path__ = [pathname]

        # As per comment at top of file, simulate runtime __path__ additions.
        m.__path__ = m.__path__ + packagePathMap.get(fqname, [])

        fp, buf, stuff = self.find_module("__init__", m.__path__)
        try:
            self.load_module(fqname, fp, buf, stuff)
            self.msgout(2, "load_package ->", m)
            return m
        finally:
            if fp:
                fp.close()

    def add_module(self, fqname):
        """Return the Module registered as *fqname*, creating it if needed."""
        if fqname in self.modules:
            return self.modules[fqname]
        self.modules[fqname] = m = Module(fqname)
        return m

    def find_module(self, name, path, parent=None):
        """Locate *name* and return ``(file, pathname, (suffix, mode, kind))``.

        Raises ImportError for names listed in self.excludes.  When *path*
        is None, built-in module names are answered directly and all other
        names are searched for on self.path.
        """
        if parent is not None:
            # assert path is not None
            fullname = parent.__name__+'.'+name
        else:
            fullname = name
        if fullname in self.excludes:
            # Stand-alone message: msgout() would decrease the indentation
            # a second time, since the caller closes its own msgin().
            self.msg(3, "find_module -> Excluded", fullname)
            raise ImportError(name)

        if path is None:
            if name in sys.builtin_module_names:
                return (None, None, ("", "", _C_BUILTIN))

            path = self.path

        return _find_module(name, path)

    def report(self):
        """Print a report to stdout, listing the found modules with their
        paths, as well as modules that are missing, or seem to be missing.
        """
        print()
        print(" %-25s %s" % ("Name", "File"))
        print(" %-25s %s" % ("----", "----"))
        # Print modules found
        keys = sorted(self.modules.keys())
        for key in keys:
            m = self.modules[key]
            if m.__path__:
                print("P", end=' ')
            else:
                print("m", end=' ')
            print("%-25s" % key, m.__file__ or "")

        # Print missing modules
        missing, maybe = self.any_missing_maybe()
        if missing:
            print()
            print("Missing modules:")
            for name in missing:
                mods = sorted(self.badmodules[name].keys())
                print("?", name, "imported from", ', '.join(mods))
        # Print modules that may be missing, but then again, maybe not...
        if maybe:
            print()
            print("Submodules that appear to be missing, but could also be", end=' ')
            print("global names in the parent package:")
            for name in maybe:
                mods = sorted(self.badmodules[name].keys())
                print("?", name, "imported from", ', '.join(mods))

    def any_missing(self):
        """Return a list of modules that appear to be missing. Use
        any_missing_maybe() if you want to know which modules are
        certain to be missing, and which *may* be missing.
        """
        missing, maybe = self.any_missing_maybe()
        return missing + maybe

    def any_missing_maybe(self):
        """Return two lists, one with modules that are certainly missing
        and one with modules that *may* be missing. The latter names could
        either be submodules *or* just global names in the package.

        The reason it can't always be determined is that it's impossible to
        tell which names are imported when "from module import *" is done
        with an extension module, short of actually importing it.
        """
        missing = []
        maybe = []
        for name in self.badmodules:
            if name in self.excludes:
                continue
            i = name.rfind(".")
            if i < 0:
                missing.append(name)
                continue
            subname = name[i+1:]
            pkgname = name[:i]
            pkg = self.modules.get(pkgname)
            if pkg is not None:
                if pkgname in self.badmodules[name]:
                    # The package tried to import this module itself and
                    # failed. It's definitely missing.
                    missing.append(name)
                elif subname in pkg.globalnames:
                    # It's a global in the package: definitely not missing.
                    pass
                elif pkg.starimports:
                    # It could be missing, but the package did an "import *"
                    # from a non-Python module, so we simply can't be sure.
                    maybe.append(name)
                else:
                    # It's not a global in the package, the package didn't
                    # do funny star imports, it's very likely to be missing.
                    # The symbol could be inserted into the package from the
                    # outside, but since that's not good style we simply list
                    # it missing.
                    missing.append(name)
            else:
                missing.append(name)
        missing.sort()
        maybe.sort()
        return missing, maybe

    def replace_paths_in_code(self, co):
        """Return a copy of *co* with co_filename prefixes replaced.

        The first matching ``(old, new)`` pair of self.replace_paths is
        applied to the normalized file name; nested code objects in
        co_consts are rewritten recursively.
        """
        new_filename = original_filename = os.path.normpath(co.co_filename)
        for f, r in self.replace_paths:
            if original_filename.startswith(f):
                new_filename = r + original_filename[len(f):]
                break

        if self.debug and original_filename not in self.processed_paths:
            # Stand-alone messages: there is no msgin() to close here, so
            # msg() is used to leave the indentation untouched.
            if new_filename != original_filename:
                self.msg(2, "co_filename %r changed to %r"
                            % (original_filename, new_filename,))
            else:
                self.msg(2, "co_filename %r remains unchanged"
                            % (original_filename,))
            self.processed_paths.append(original_filename)

        consts = list(co.co_consts)
        for i, const in enumerate(consts):
            if isinstance(const, type(co)):
                consts[i] = self.replace_paths_in_code(const)

        return co.replace(co_consts=tuple(consts), co_filename=new_filename)
|
2001-03-21 04:43:34 +08:00
|
|
|
|
1998-03-05 11:42:00 +08:00
|
|
|
|
|
|
|
def test():
    """Command-line driver: scan a script and print the module report.

    Options: -d raises the debug level, -q silences debug output, -m makes
    the extra arguments module names instead of files, -p adds search
    directories (os.pathsep separated), -x excludes a module.  The first
    positional argument is the script (default "hello.py").

    Returns the ModuleFinder instance, or None on a command-line error.
    """
    # Parse command line
    import getopt
    try:
        opts, args = getopt.getopt(sys.argv[1:], "dmp:qx:")
    except getopt.error as msg:
        print(msg)
        return

    # Process options
    debug = 1
    domods = 0
    addpath = []
    exclude = []
    for flag, value in opts:
        if flag == '-d':
            debug += 1
        elif flag == '-m':
            domods = 1
        elif flag == '-p':
            addpath = addpath + value.split(os.pathsep)
        elif flag == '-q':
            debug = 0
        elif flag == '-x':
            exclude.append(value)

    # Provide default arguments
    script = args[0] if args else "hello.py"

    # Set the path based on sys.path and the script directory
    search_path = sys.path[:]
    search_path[0] = os.path.dirname(script)
    search_path = addpath + search_path
    if debug > 1:
        print("path:")
        for entry in search_path:
            print(" ", repr(entry))

    # Create the module finder and turn its crank
    mf = ModuleFinder(search_path, debug, exclude)
    for arg in args[1:]:
        if arg == '-m':
            # From here on, the remaining arguments are module names.
            domods = 1
        elif not domods:
            mf.load_file(arg)
        elif arg[-2:] == '.*':
            mf.import_hook(arg[:-2], None, ["*"])
        else:
            mf.import_hook(arg)
    mf.run_script(script)
    mf.report()
    return mf  # for -i debugging
|
1998-03-05 11:42:00 +08:00
|
|
|
|
|
|
|
|
|
|
|
if __name__ == '__main__':
    # The finder is bound to a module-level name so that it can be
    # inspected afterwards when running with "python -i".
    try:
        mf = test()
    except KeyboardInterrupt:
        print("\n[interrupted]")
|