blob: f8218ac5243d1e511e3790874dfddcd9b7b46a56 [file] [log] [blame]
Benjamin Peterson90f5ba52010-03-11 22:53:45 +00001#! /usr/bin/env python3
Guido van Rossumec758ea1991-06-04 20:36:54 +00002
3# pdeps
4#
5# Find dependencies between a bunch of Python modules.
6#
7# Usage:
Tim Peters70c43782001-01-17 08:48:39 +00008# pdeps file1.py file2.py ...
Guido van Rossumec758ea1991-06-04 20:36:54 +00009#
10# Output:
11# Four tables separated by lines like '--- Closure ---':
12# 1) Direct dependencies, listing which module imports which other modules
13# 2) The inverse of (1)
14# 3) Indirect dependencies, or the closure of the above
15# 4) The inverse of (3)
16#
17# To do:
18# - command line options to select output type
19# - option to automatically scan the Python library for referenced modules
20# - option to limit output to particular modules
21
22
23import sys
Thomas Wouters49fd7fa2006-04-21 10:40:58 +000024import re
Guido van Rossum15f27fb1992-12-10 00:00:58 +000025import os
Guido van Rossumec758ea1991-06-04 20:36:54 +000026
27
28# Main program
29#
def main():
    """Run pdeps on the files named on the command line.

    Prints four tables to standard output: direct uses, the inverse of
    that table, the transitive closure of uses, and the inverse of the
    closure.

    Returns the process exit status: 2 when no file arguments were
    given (after printing a usage line), 0 otherwise.
    """
    filenames = sys.argv[1:]
    if not filenames:
        print('usage: pdeps file.py file.py ...')
        return 2

    # Direct dependencies, keyed by module name.
    uses = {}
    for filename in filenames:
        process(filename, uses)

    print('--- Uses ---')
    printresults(uses)

    print('--- Used By ---')
    printresults(inverse(uses))

    # The closure is computed once and reused for its inverse below.
    print('--- Closure of Uses ---')
    reach = closure(uses)
    printresults(reach)

    print('--- Closure of Used By ---')
    printresults(inverse(reach))

    return 0
Guido van Rossumec758ea1991-06-04 20:36:54 +000056
57
# Compiled regular expressions to search for import statements
#
# NOTE: the two names are swapped relative to what they match.
# m_import matches "from X import ..." lines and captures X; m_from
# matches "import X, Y, ..." lines and captures everything up to a
# '#' comment.  The names are kept so existing references still work.
#
m_import = re.compile(r'^[ \t]*from[ \t]+([^ \t]+)[ \t]+')
m_from = re.compile(r'^[ \t]*import[ \t]+([^#]+)')


# Collect data from one file
#
def process(filename, table):
    """Scan one source file for import statements and record them.

    The module name is the basename of *filename* with a trailing
    '.py' removed.  table[module] is set to a new list holding, in
    order of first appearance and without duplicates, the module names
    found on "import ..." and "from ... import ..." lines.

    Physical lines ending in a backslash are joined with the following
    line before matching.  For "import a as b" only "a" is recorded,
    and empty names (e.g. from a trailing comma) are ignored.

    Any exception raised by open() propagates to the caller; in that
    case *table* is left untouched.
    """
    mod = os.path.basename(filename)
    if mod.endswith('.py'):
        mod = mod[:-3]
    # The context manager closes the file even if scanning raises.
    with open(filename, 'r') as fp:
        table[mod] = deps = []
        while True:
            line = fp.readline()
            if not line:
                break
            # readline() keeps the trailing newline, so look for the
            # continuation backslash just before it.
            while line.rstrip('\n').endswith('\\'):
                nextline = fp.readline()
                if not nextline:
                    break
                line = line.rstrip('\n')[:-1] + nextline
            m_found = m_import.match(line) or m_from.match(line)
            if not m_found:
                continue
            for word in m_found.group(1).split(','):
                # Keep only the module name: drop any "as alias" suffix.
                pieces = word.split()
                if not pieces:
                    continue
                name = pieces[0]
                if name not in deps:
                    deps.append(name)
Guido van Rossumec758ea1991-06-04 20:36:54 +000090
91
92# Compute closure (this is in fact totally general)
93#
def closure(table):
    """Return the transitive closure of a dependency table.

    *table* maps each name to a list of names it refers to.  The result
    is a new dict with the same keys; each value starts as a copy of
    the corresponding list in *table* and is extended with everything
    reachable through names that are themselves keys of *table*.  The
    input table and its lists are not modified.
    """
    names = list(table.keys())
    reach = {name: table[name][:] for name in names}

    # Keep sweeping until a full pass adds nothing new.
    changed = True
    while changed:
        changed = False
        for name in names:
            reachable = reach[name]
            # 'reachable' may grow while it is being iterated; entries
            # appended during the loop are visited in the same pass.
            for via in reachable:
                if via not in names:
                    continue
                for target in reach[via]:
                    if target in reachable:
                        continue
                    reachable.append(target)
                    changed = True
    return reach
Guido van Rossumec758ea1991-06-04 20:36:54 +0000117
118
119# Invert a table (this is again totally general).
120# All keys of the original table are made keys of the inverse,
121# so there may be empty lists in the inverse.
122#
def inverse(table):
    """Return the inverse of a table mapping keys to lists of items.

    In the result every item maps to the list of keys whose list
    contained it.  Every key of *table* is also a key of the result,
    so keys that nothing refers to map to an empty list.
    """
    inverted = {}
    for source, targets in table.items():
        # Make sure the original key is present even if never referenced.
        inverted.setdefault(source, [])
        for target in targets:
            inverted.setdefault(target, []).append(source)
    return inverted
Guido van Rossumec758ea1991-06-04 20:36:54 +0000131
132
133# Store "item" in "dict" under "key".
134# The dictionary maps keys to lists of items.
135# If there is no list for the key yet, it is created.
136#
def store(dict, key, item):
    """Append *item* to the list stored in *dict* under *key*.

    A new one-element list is created when *key* is not yet present.
    The mapping is modified in place; nothing is returned.
    """
    dict.setdefault(key, []).append(item)
Guido van Rossumec758ea1991-06-04 20:36:54 +0000142
143
144# Tabulate results neatly
145#
def printresults(table):
    """Print *table* as one aligned row per key, in sorted key order.

    Each row shows the key padded to the width of the longest key,
    a ':' separator, the marker '(*)' when the key appears in its own
    list, and then the sorted entries of its list, all separated by
    single spaces.
    """
    names = sorted(table.keys())
    width = max((len(name) for name in names), default=0)
    for name in names:
        refs = sorted(table[name])
        fields = [name.ljust(width), ':']
        if name in refs:
            # Flag modules that (directly or indirectly) refer to themselves.
            fields.append('(*)')
        fields.extend(refs)
        # Every field is followed by one space, including the last.
        print(*fields, end=' \n')
Guido van Rossumec758ea1991-06-04 20:36:54 +0000158
159
160# Call main and honor exit status
if __name__ == '__main__':
    # Use main()'s return value as the exit status; an interrupt from
    # the keyboard exits with status 1.
    try:
        status = main()
    except KeyboardInterrupt:
        status = 1
    sys.exit(status)
165 sys.exit(1)