cpython/Tools/scripts/pdeps.py

#! /usr/bin/env python

# pdeps
#
# Find dependencies between a bunch of Python modules.
#
# Usage:
#       pdeps file1.py file2.py ...
#
# Output:
# Four tables separated by lines like '--- Closure ---':
# 1) Direct dependencies, listing which module imports which other modules
# 2) The inverse of (1)
# 3) Indirect dependencies, or the closure of the above
# 4) The inverse of (3)
#
# To do:
# - command line options to select output type
# - option to automatically scan the Python library for referenced modules
# - option to limit output to particular modules


import os
import re
import regex
import sys


# Main program
#
def main():
    """Scan the files named on the command line and print four tables.

    Returns 2 (after printing a usage line) when no file names were
    given, and 0 once all four tables have been printed.
    """
    filenames = sys.argv[1:]
    if len(filenames) == 0:
        print('usage: pdeps file.py file.py ...')
        return 2

    # Direct dependencies: module name -> list of imported names.
    uses = {}
    for filename in filenames:
        process(filename, uses)

    print('--- Uses ---')
    printresults(uses)

    print('--- Used By ---')
    printresults(inverse(uses))

    print('--- Closure of Uses ---')
    reachable = closure(uses)
    printresults(reachable)

    print('--- Closure of Used By ---')
    printresults(inverse(reachable))

    return 0


# Compiled regular expressions to search for import statements
#
# Naming note (names kept so existing references still work): m_import
# matches the 'from X import ...' form and captures X; m_from matches the
# 'import X, Y' form and captures everything up to a '#' comment.
m_import = re.compile(r'^[ \t]*from[ \t]+([^ \t]+)[ \t]+')
m_from = re.compile(r'^[ \t]*import[ \t]+([^#]+)')


# Collect data from one file
#
def process(filename, table):
    """Record in table the modules imported by the file filename.

    The module name is the file's base name with a trailing '.py'
    removed.  table[module] is set to a fresh list holding each imported
    module name once, in order of first appearance.  Only statements
    that start a (possibly backslash-continued) line are recognised.

    Errors raised by open() propagate to the caller; in that case table
    is left untouched.
    """
    fp = open(filename, 'r')
    # try/finally rather than 'with': the rest of this script is written
    # for interpreters that predate the with statement.
    try:
        mod = os.path.basename(filename)
        if mod[-3:] == '.py':
            mod = mod[:-3]
        table[mod] = deps = []
        while 1:
            line = fp.readline()
            if not line:
                break
            # readline() keeps the newline, so look for the continuation
            # backslash only after stripping the line terminator.
            body = line.rstrip('\r\n')
            while body[-1:] == '\\':
                nextline = fp.readline()
                if not nextline:
                    break
                line = body[:-1] + nextline
                body = line.rstrip('\r\n')
            found = m_import.match(line) or m_from.match(line)
            if not found:
                continue
            for word in found.group(1).split(','):
                # 'import a as b' depends on module 'a'; drop the alias.
                # split() also discards surrounding whitespace.
                pieces = word.split()
                if not pieces:
                    continue
                name = pieces[0]
                if name not in deps:
                    deps.append(name)
    finally:
        fp.close()


# Compute closure (this is in fact totally general)
#
def closure(table):
    """Return the transitive closure of a key -> list-of-items mapping.

    The result has the same keys as table.  Each list starts as a copy
    of the corresponding list in table and is extended with everything
    reachable through items that are themselves keys of table.  table
    and its lists are not modified.
    """
    # Work on copies so the caller's lists stay as they were.
    reach = {}
    for name in table:
        reach[name] = table[name][:]

    # Keep sweeping until a full pass adds nothing new.
    changed = True
    while changed:
        changed = False
        for name in table:
            reached = reach[name]
            # 'reached' may grow during this loop; the newly appended
            # entries are visited in the same pass.
            for via in reached:
                if via not in reach:
                    # Not one of the scanned modules: nothing to follow.
                    continue
                for target in reach[via]:
                    if target in reached:
                        continue
                    reached.append(target)
                    changed = True
    return reach


# Invert a table (this is again totally general).
# All keys of the original table are made keys of the inverse,
# so there may be empty lists in the inverse.
#
def inverse(table):
    """Return the inverse of a key -> list-of-items mapping.

    In the result every item maps to the list of keys whose list
    contained it (once per occurrence).  Every key of table is also a
    key of the result, with an empty list if nothing refers to it.
    table itself is not modified.
    """
    inv = {}
    for key in table:
        # Make sure the key shows up even when no list mentions it.
        inv.setdefault(key, [])
        for item in table[key]:
            inv.setdefault(item, []).append(key)
    return inv


# Store "item" in "dict" under "key".
# The dictionary maps keys to lists of items.
# If there is no list for the key yet, it is created.
#
def store(dict, key, item):
    """Append item to the list held in dict under key.

    A new one-element list is created when key is not present yet.
    The mapping is updated in place; nothing is returned.
    """
    # The parameter name shadows the builtin but is kept for callers.
    dict.setdefault(key, []).append(item)


# Tabulate results neatly
#
def printresults(table):
    """Print table as one 'key : item item ...' line per key.

    Keys are printed in sorted order, left-justified to the width of
    the longest key.  Each key's items are printed sorted; a '(*)'
    marker precedes them when the key appears in its own list.  The
    lists in table are left in their original order.
    """
    modules = list(table.keys())
    modules.sort()
    maxlen = 0
    for mod in modules:
        maxlen = max(maxlen, len(mod))
    for mod in modules:
        # Sort a copy so that printing does not reorder the caller's data.
        refs = table[mod][:]
        refs.sort()
        fields = [mod.ljust(maxlen), ':']
        if mod in refs:
            fields.append('(*)')
        fields.extend(refs)
        # A single parenthesised string prints the same whether print is
        # a statement or a function.
        print(' '.join(fields))


# Call main and honor exit status
if __name__ == '__main__':
    # Exit with main()'s status; an interrupt from the keyboard ends the
    # run with status 1 instead of a traceback.
    try:
        status = main()
    except KeyboardInterrupt:
        status = 1
    sys.exit(status)
/usr/local/bin/python -> /usr/bin/env python 1996-11-28 03:52:01 +08:00			`#! /usr/bin/env python`
Initial revision 1991-06-05 05:36:54 +09:00
			`# pdeps`
			`#`
			`# Find dependencies between a bunch of Python modules.`
			`#`
			`# Usage:`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`# pdeps file1.py file2.py ...`
Initial revision 1991-06-05 05:36:54 +09:00			`#`
			`# Output:`
			`# Four tables separated by lines like '--- Closure ---':`
			`# 1) Direct dependencies, listing which module imports which other modules`
			`# 2) The inverse of (1)`
			`# 3) Indirect dependencies, or the closure of the above`
			`# 4) The inverse of (3)`
			`#`
			`# To do:`
			`# - command line options to select output type`
			`# - option to automatically scan the Python library for referenced modules`
			`# - option to limit output to particular modules`


			`import sys`
Adapt to modern times... 1992-12-10 08:00:58 +08:00			`import regex`
			`import os`
Initial revision 1991-06-05 05:36:54 +09:00

			`# Main program`
			`#`
			`def main():`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`args = sys.argv[1:]`
			`if not args:`
			`print 'usage: pdeps file.py file.py ...'`
			`return 2`
			`#`
			`table = {}`
			`for arg in args:`
			`process(arg, table)`
			`#`
			`print '--- Uses ---'`
			`printresults(table)`
			`#`
			`print '--- Used By ---'`
			`inv = inverse(table)`
			`printresults(inv)`
			`#`
			`print '--- Closure of Uses ---'`
			`reach = closure(table)`
			`printresults(reach)`
			`#`
			`print '--- Closure of Used By ---'`
			`invreach = inverse(reach)`
			`printresults(invreach)`
			`#`
			`return 0`
Initial revision 1991-06-05 05:36:54 +09:00

			`# Compiled regular expressions to search for import statements`
			`#`
Adapt to modern times... 1992-12-10 08:00:58 +08:00			`m_import = regex.compile('^[ \t]*from[ \t]+\([^ \t]+\)[ \t]+')`
			`m_from = regex.compile('^[ \t]*import[ \t]+\([^#]+\)')`
Initial revision 1991-06-05 05:36:54 +09:00

			`# Collect data from one file`
			`#`
			`def process(filename, table):`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`fp = open(filename, 'r')`
			`mod = os.path.basename(filename)`
			`if mod[-3:] == '.py':`
			`mod = mod[:-3]`
			`table[mod] = list = []`
			`while 1:`
			`line = fp.readline()`
			`if not line: break`
			`while line[-1:] == '\\':`
			`nextline = fp.readline()`
			`if not nextline: break`
			`line = line[:-1] + nextline`
			`if m_import.match(line) >= 0:`
			`(a, b), (a1, b1) = m_import.regs[:2]`
			`elif m_from.match(line) >= 0:`
			`(a, b), (a1, b1) = m_from.regs[:2]`
			`else: continue`
Apply diff2.txt from SF patch http://www.python.org/sf/572113 (with one small bugfix in bgen/bgen/scantools.py) This replaces string module functions with string methods for the stuff in the Tools directory. Several uses of string.letters etc. are still remaining. 2002-09-12 04:36:02 +08:00			`words = line[a1:b1].split(',')`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`# print '#', line, words`
			`for word in words:`
Apply diff2.txt from SF patch http://www.python.org/sf/572113 (with one small bugfix in bgen/bgen/scantools.py) This replaces string module functions with string methods for the stuff in the Tools directory. Several uses of string.letters etc. are still remaining. 2002-09-12 04:36:02 +08:00			`word = word.strip()`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`if word not in list:`
			`list.append(word)`
Initial revision 1991-06-05 05:36:54 +09:00

			`# Compute closure (this is in fact totally general)`
			`#`
			`def closure(table):`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`modules = table.keys()`
			`#`
			`# Initialize reach with a copy of table`
			`#`
			`reach = {}`
			`for mod in modules:`
			`reach[mod] = table[mod][:]`
			`#`
			`# Iterate until no more change`
			`#`
			`change = 1`
			`while change:`
			`change = 0`
			`for mod in modules:`
			`for mo in reach[mod]:`
			`if mo in modules:`
			`for m in reach[mo]:`
			`if m not in reach[mod]:`
			`reach[mod].append(m)`
			`change = 1`
			`#`
			`return reach`
Initial revision 1991-06-05 05:36:54 +09:00

			`# Invert a table (this is again totally general).`
			`# All keys of the original table are made keys of the inverse,`
			`# so there may be empty lists in the inverse.`
			`#`
			`def inverse(table):`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`inv = {}`
			`for key in table.keys():`
			`if not inv.has_key(key):`
			`inv[key] = []`
			`for item in table[key]:`
			`store(inv, item, key)`
			`return inv`
Initial revision 1991-06-05 05:36:54 +09:00

			`# Store "item" in "dict" under "key".`
			`# The dictionary maps keys to lists of items.`
			`# If there is no list for the key yet, it is created.`
			`#`
			`def store(dict, key, item):`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`if dict.has_key(key):`
			`dict[key].append(item)`
			`else:`
			`dict[key] = [item]`
Initial revision 1991-06-05 05:36:54 +09:00

			`# Tabulate results neatly`
			`#`
			`def printresults(table):`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`modules = table.keys()`
			`maxlen = 0`
			`for mod in modules: maxlen = max(maxlen, len(mod))`
			`modules.sort()`
			`for mod in modules:`
			`list = table[mod]`
			`list.sort()`
Apply diff2.txt from SF patch http://www.python.org/sf/572113 (with one small bugfix in bgen/bgen/scantools.py) This replaces string module functions with string methods for the stuff in the Tools directory. Several uses of string.letters etc. are still remaining. 2002-09-12 04:36:02 +08:00			`print mod.ljust(maxlen), ':',`
Whitespace normalization. 2001-01-17 16:48:39 +08:00			`if mod in list:`
			`print '(*)',`
			`for ref in list:`
			`print ref,`
			`print`
Initial revision 1991-06-05 05:36:54 +09:00

			`# Call main and honor exit status`
[Patch #1005491 ] use __name__ == '__main__' in scripts 2004-08-10 01:27:55 +08:00			`if __name__ == '__main__':`
			`try:`
			`sys.exit(main())`
			`except KeyboardInterrupt:`
			`sys.exit(1)`