blob: 382509039c95833ce19f74b571c2e59b68c99d69 [file] [log] [blame]
Johnny Chen14097802011-04-28 21:31:18 +00001#
Johnny Chend7e04d92011-08-05 20:17:27 +00002# modify-python-lldb.py
Johnny Chen14097802011-04-28 21:31:18 +00003#
4# This script modifies the lldb module (which was automatically generated via
Johnny Chen22e418a2011-04-29 19:22:24 +00005# running swig) to support iteration and/or equality operations for certain lldb
Johnny Chene5637d22011-05-24 21:05:16 +00006# objects, implements truth value testing for certain lldb objects, and adds a
7# global variable 'debugger_unique_id' which is initialized to 0.
Johnny Chen14097802011-04-28 21:31:18 +00008#
Johnny Chen09e0a422011-07-01 22:14:07 +00009# As a cleanup step, it also removes the 'residues' from the autodoc features of
10# swig. For an example, take a look at SBTarget.h header file, where we take
Johnny Chen2c77fa42011-07-02 20:01:09 +000011# advantage of the already existing doxygen C++-docblock and make it the Python
Johnny Chen09e0a422011-07-01 22:14:07 +000012# docstring for the same method. The 'residues' in this context include the
Johnny Chenf6ce70a2011-07-03 19:55:50 +000013# '#endif', the '#ifdef SWIG', the c comment marker, the trailing blank (SPC's)
14# line, and the doxygen comment start marker.
Johnny Chen09e0a422011-07-01 22:14:07 +000015#
Johnny Chen37811372011-07-06 21:55:45 +000016# In addition to the 'residues' removal during the cleanup step, it also
# transforms the 'char' data type (which was actually 'char *', but the 'autodoc'
# feature of swig removes the ' *' from it) into 'str' (the Python str type).
19#
Johnny Chen14097802011-04-28 21:31:18 +000020# It also calls SBDebugger.Initialize() to initialize the lldb debugger
21# subsystem.
22#
23
24import sys, re, StringIO
25
# With exactly one command-line argument, treat it as the directory holding
# lldb.py; in every other case operate on lldb.py in the current directory.
output_name = sys.argv[1] + "/lldb.py" if len(sys.argv) == 2 else "./lldb.py"
30
31# print "output_name is '" + output_name + "'"
32
Johnny Chen37811372011-07-06 21:55:45 +000033#
Johnny Chen09e0a422011-07-01 22:14:07 +000034# Residues to be removed.
Johnny Chen37811372011-07-06 21:55:45 +000035#
Johnny Chen09e0a422011-07-01 22:14:07 +000036c_endif_swig = "#endif"
37c_ifdef_swig = "#ifdef SWIG"
Johnny Chen2c77fa42011-07-02 20:01:09 +000038c_comment_marker = "//------------"
39# The pattern for recognizing the doxygen comment block line.
Johnny Chenebd63b22011-07-16 21:15:39 +000040doxygen_comment_start = re.compile("^\s*(/// ?)")
Johnny Chenf6ce70a2011-07-03 19:55:50 +000041# The demarcation point for turning on/off residue removal state.
42# When bracketed by the lines, the CLEANUP_DOCSTRING state (see below) is ON.
43toggle_docstring_cleanup_line = ' """'
Johnny Chen09e0a422011-07-01 22:14:07 +000044
def char_to_str_xform(line):
    """Rewrite the swig-generated type name 'char' as the Python name 'str'.

    Only the whole word 'char' is rewritten, and only where it is preceded or
    followed by a space (the same positions the script has always looked at).
    Longer words that merely contain 'char', such as 'character', are left
    untouched instead of being mangled into 'stracter'.

    After that substitution, the parameters named 'argv' and 'envp' are
    retyped from 'str' to 'list'.

    line -- a single line of text from the generated module.
    Returns the transformed line.
    """
    # ' char' with nothing word-like after it, e.g. '-> char' at end of line.
    line = re.sub(r'(?<= )char\b', 'str', line)
    # 'char ' with nothing word-like before it, e.g. '(char name'.
    line = re.sub(r'\bchar(?= )', 'str', line)
    # Special case handling of 'char **argv' and 'char **envp'.
    line = line.replace('str argv', 'list argv')
    line = line.replace('str envp', 'list envp')
    return line
53
54#
55# The one-liner docstring also needs char_to_str transformation, btw.
56#
Johnny Chen21c0fd12011-07-08 23:57:20 +000057TWO_SPACES = ' ' * 2
58EIGHT_SPACES = ' ' * 8
59one_liner_docstring_pattern = re.compile('^(%s|%s)""".*"""$' % (TWO_SPACES, EIGHT_SPACES))
Johnny Chen37811372011-07-06 21:55:45 +000060
Johnny Chen14097802011-04-28 21:31:18 +000061#
Johnny Chenec5e0a22011-06-01 18:40:11 +000062# lldb_iter() should appear before our first SB* class definition.
Johnny Chen14097802011-04-28 21:31:18 +000063#
64lldb_iter_def = '''
65# ===================================
66# Iterator for lldb container objects
67# ===================================
68def lldb_iter(obj, getsize, getelem):
69 """A generator adaptor to support iteration for lldb container objects."""
70 size = getattr(obj, getsize)
71 elem = getattr(obj, getelem)
72 for i in range(size()):
73 yield elem(i)
74
Johnny Chen81422202011-06-01 19:21:08 +000075# ==============================================================================
76# The modify-python-lldb.py script is responsible for post-processing this SWIG-
77# generated lldb.py module. It is responsible for adding the above lldb_iter()
78# function definition as well as the supports, in the following, for iteration
79# protocol: __iter__, rich comparison methods: __eq__ and __ne__, truth value
80# testing (and built-in operation bool()): __nonzero__, and built-in function
81# len(): __len__.
82# ==============================================================================
Johnny Chen14097802011-04-28 21:31:18 +000083'''
84
Johnny Chenfbebbc92011-07-25 19:32:35 +000085#
Johnny Chende856cc2011-07-25 23:41:08 +000086# linked_list_iter() is a special purpose iterator to treat the SBValue as the
87# head of a list data structure, where you specify the child member name which
88# points to the next item on the list and you specify the end-of-list function
89# which takes an SBValue and returns True if EOL is reached and False if not.
Johnny Chenfbebbc92011-07-25 19:32:35 +000090#
91linked_list_iter_def = '''
Johnny Chena4673e12011-07-26 20:57:10 +000092 def __eol_test__(val):
93 """Default function for end of list test takes an SBValue object.
94
95 Return True if val is invalid or it corresponds to a null pointer.
96 Otherwise, return False.
97 """
Johnny Chend96c9e82011-08-11 00:49:03 +000098 if not val or val.GetValueAsUnsigned() == 0:
Johnny Chena4673e12011-07-26 20:57:10 +000099 return True
100 else:
101 return False
102
Johnny Chenfbebbc92011-07-25 19:32:35 +0000103 # ==================================================
104 # Iterator for lldb.SBValue treated as a linked list
105 # ==================================================
Johnny Chena4673e12011-07-26 20:57:10 +0000106 def linked_list_iter(self, next_item_name, end_of_list_test=__eol_test__):
Johnny Chende856cc2011-07-25 23:41:08 +0000107 """Generator adaptor to support iteration for SBValue as a linked list.
108
109 linked_list_iter() is a special purpose iterator to treat the SBValue as
110 the head of a list data structure, where you specify the child member
111 name which points to the next item on the list and you specify the
112 end-of-list test function which takes an SBValue for an item and returns
113 True if EOL is reached and False if not.
Johnny Chenfbebbc92011-07-25 19:32:35 +0000114
Johnny Chen758db962011-08-11 01:19:46 +0000115 linked_list_iter() also detects infinite loop and bails out early.
116
Johnny Chena4673e12011-07-26 20:57:10 +0000117 The end_of_list_test arg, if omitted, defaults to the __eol_test__
118 function above.
119
Johnny Chenfbebbc92011-07-25 19:32:35 +0000120 For example,
121
Johnny Chenfbebbc92011-07-25 19:32:35 +0000122 # Get Frame #0.
123 ...
124
125 # Get variable 'task_head'.
126 task_head = frame0.FindVariable('task_head')
127 ...
128
Johnny Chena4673e12011-07-26 20:57:10 +0000129 for t in task_head.linked_list_iter('next'):
Johnny Chenfbebbc92011-07-25 19:32:35 +0000130 print t
131 """
Johnny Chend96c9e82011-08-11 00:49:03 +0000132 if end_of_list_test(self):
133 return
134 item = self
Johnny Chen758db962011-08-11 01:19:46 +0000135 visited = set()
Johnny Chenfbebbc92011-07-25 19:32:35 +0000136 try:
Johnny Chen758db962011-08-11 01:19:46 +0000137 while not end_of_list_test(item) and not item.GetValueAsUnsigned() in visited:
138 visited.add(item.GetValueAsUnsigned())
Johnny Chenfbebbc92011-07-25 19:32:35 +0000139 yield item
140 # Prepare for the next iteration.
141 item = item.GetChildMemberWithName(next_item_name)
Johnny Chenfbebbc92011-07-25 19:32:35 +0000142 except:
143 # Exception occurred. Stop the generator.
144 pass
145
146 return
147'''
148
Johnny Chen14097802011-04-28 21:31:18 +0000149# This supports the iteration protocol.
Johnny Chen14097802011-04-28 21:31:18 +0000150iter_def = " def __iter__(self): return lldb_iter(self, '%s', '%s')"
151module_iter = " def module_iter(self): return lldb_iter(self, '%s', '%s')"
152breakpoint_iter = " def breakpoint_iter(self): return lldb_iter(self, '%s', '%s')"
Johnny Chen2077f0d2011-05-17 22:14:39 +0000153
Johnny Chena79a21c2011-05-16 20:31:18 +0000154# Called to implement the built-in function len().
155# Eligible objects are those containers with unambiguous iteration support.
Johnny Chena79a21c2011-05-16 20:31:18 +0000156len_def = " def __len__(self): return self.%s()"
Johnny Chen2077f0d2011-05-17 22:14:39 +0000157
Johnny Chen3a3d6592011-04-29 19:03:02 +0000158# This supports the rich comparison methods of __eq__ and __ne__.
Johnny Chen7616cb92011-05-02 19:05:52 +0000159eq_def = " def __eq__(self, other): return isinstance(other, %s) and %s"
Johnny Chen3a3d6592011-04-29 19:03:02 +0000160ne_def = " def __ne__(self, other): return not self.__eq__(other)"
Johnny Chen14097802011-04-28 21:31:18 +0000161
Johnny Chen2077f0d2011-05-17 22:14:39 +0000162# Called to implement truth value testing and the built-in operation bool();
163# should return False or True, or their integer equivalents 0 or 1.
164# Delegate to self.IsValid() if it is defined for the current lldb object.
165nonzero_def = " def __nonzero__(self): return self.IsValid()"
166
Johnny Chen14097802011-04-28 21:31:18 +0000167#
Johnny Chena6303ef2011-05-24 22:53:03 +0000168# This dictionary defines a mapping from classname to (getsize, getelem) tuple.
Johnny Chen14097802011-04-28 21:31:18 +0000169#
170d = { 'SBBreakpoint': ('GetNumLocations', 'GetLocationAtIndex'),
171 'SBCompileUnit': ('GetNumLineEntries', 'GetLineEntryAtIndex'),
172 'SBDebugger': ('GetNumTargets', 'GetTargetAtIndex'),
173 'SBModule': ('GetNumSymbols', 'GetSymbolAtIndex'),
174 'SBProcess': ('GetNumThreads', 'GetThreadAtIndex'),
175 'SBThread': ('GetNumFrames', 'GetFrameAtIndex'),
176
177 'SBInstructionList': ('GetSize', 'GetInstructionAtIndex'),
178 'SBStringList': ('GetSize', 'GetStringAtIndex',),
179 'SBSymbolContextList': ('GetSize', 'GetContextAtIndex'),
Johnny Chen3ee85202011-08-05 01:35:49 +0000180 'SBTypeList': ('GetSize', 'GetTypeAtIndex'),
181 'SBValueList': ('GetSize', 'GetValueAtIndex'),
Johnny Chen14097802011-04-28 21:31:18 +0000182
183 'SBType': ('GetNumberChildren', 'GetChildAtIndex'),
184 'SBValue': ('GetNumChildren', 'GetChildAtIndex'),
185
Johnny Chen08477f52011-05-24 22:57:42 +0000186 # SBTarget needs special processing, see below.
Johnny Chen14097802011-04-28 21:31:18 +0000187 'SBTarget': {'module': ('GetNumModules', 'GetModuleAtIndex'),
188 'breakpoint': ('GetNumBreakpoints', 'GetBreakpointAtIndex')
189 }
190 }
191
Johnny Chen3a3d6592011-04-29 19:03:02 +0000192#
Johnny Chen7616cb92011-05-02 19:05:52 +0000193# This dictionary defines a mapping from classname to equality method name(s).
Johnny Chen3a3d6592011-04-29 19:03:02 +0000194#
Johnny Chen694cfd02011-06-09 22:04:56 +0000195e = { 'SBAddress': ['GetFileAddress', 'GetModule'],
196 'SBBreakpoint': ['GetID'],
Johnny Chen7616cb92011-05-02 19:05:52 +0000197 'SBFileSpec': ['GetFilename', 'GetDirectory'],
Johnny Chend7e04d92011-08-05 20:17:27 +0000198 'SBModule': ['GetFileSpec', 'GetUUIDString'],
199 'SBType': ['GetByteSize', 'GetName']
Johnny Chen7616cb92011-05-02 19:05:52 +0000200 }
201
def list_to_frag(list):
    """Transform a list of method names into an equality program fragment.

    For example, ['GetID'] is transformed to 'self.GetID() == other.GetID()',
    and ['GetFilename', 'GetDirectory'] to 'self.GetFilename() == other.GetFilename()
    and self.GetDirectory() == other.GetDirectory()'.

    list -- non-empty sequence of method names (the parameter name shadows the
            builtin; it is kept unchanged so existing callers are unaffected).
    Returns the fragment as a single string, clauses joined by ' and '.
    Raises Exception if the sequence is empty.
    """
    if not list:
        raise Exception("list should be non-empty")
    return " and ".join("self.{0}() == other.{0}()".format(name)
                        for name in list)
Johnny Chen3a3d6592011-04-29 19:03:02 +0000217
class NewContent(StringIO.StringIO):
    """String buffer that holds back the most recently added line.

    A line handed to add_line() is not written immediately; it is kept as the
    pending line and only committed to the buffer when the next line arrives
    or when finish() is called.  This gives the caller a chance to drop the
    pending line (del_line / del_blank_line) before it reaches the output.
    Lines are expected to be strings without a trailing newline; one is
    appended on commit.
    """

    def __init__(self):
        StringIO.StringIO.__init__(self)
        # The line waiting to be committed; None when nothing is pending.
        self.prev_line = None

    def _commit_pending(self):
        """Write the pending line, if there is one, followed by a newline."""
        if self.prev_line is not None:
            self.write(self.prev_line + "\n")

    def add_line(self, a_line):
        """Add a line to the content, if there is a previous line, commit it."""
        self._commit_pending()
        self.prev_line = a_line

    def del_line(self):
        """Forget about the previous line, do not commit it."""
        self.prev_line = None

    def del_blank_line(self):
        """Forget about the previous line if it is a blank line."""
        if self.prev_line is not None and not self.prev_line.strip():
            self.prev_line = None

    def finish(self):
        """Call this when you're finished with populating content."""
        self._commit_pending()
        self.prev_line = None
240
Johnny Chen14097802011-04-28 21:31:18 +0000241# The new content will have the iteration protocol defined for our lldb objects.
Johnny Chenebd63b22011-07-16 21:15:39 +0000242new_content = NewContent()
Johnny Chen14097802011-04-28 21:31:18 +0000243
244with open(output_name, 'r') as f_in:
245 content = f_in.read()
246
247# The pattern for recognizing the beginning of an SB class definition.
248class_pattern = re.compile("^class (SB.*)\(_object\):$")
249
250# The pattern for recognizing the beginning of the __init__ method definition.
Johnny Chen3ee85202011-08-05 01:35:49 +0000251init_pattern = re.compile("^ def __init__\(self.*\):")
Johnny Chen14097802011-04-28 21:31:18 +0000252
Johnny Chen2077f0d2011-05-17 22:14:39 +0000253# The pattern for recognizing the beginning of the IsValid method definition.
Peter Collingbournef2084532011-06-14 03:55:41 +0000254isvalid_pattern = re.compile("^ def IsValid\(")
Johnny Chen2077f0d2011-05-17 22:14:39 +0000255
Johnny Chena79a21c2011-05-16 20:31:18 +0000256# These define the states of our finite state machine.
Johnny Chen14097802011-04-28 21:31:18 +0000257NORMAL = 0
258DEFINING_ITERATOR = 1
Johnny Chen3a3d6592011-04-29 19:03:02 +0000259DEFINING_EQUALITY = 2
Johnny Chenf6ce70a2011-07-03 19:55:50 +0000260CLEANUP_DOCSTRING = 4
Johnny Chen14097802011-04-28 21:31:18 +0000261
262# The lldb_iter_def only needs to be inserted once.
263lldb_iter_defined = False;
264
Johnny Chen2077f0d2011-05-17 22:14:39 +0000265# Our FSM begins its life in the NORMAL state, and transitions to the
266# DEFINING_ITERATOR and/or DEFINING_EQUALITY state whenever it encounters the
267# beginning of certain class definitions, see dictionaries 'd' and 'e' above.
268#
269# Note that the two states DEFINING_ITERATOR and DEFINING_EQUALITY are
270# orthogonal in that our FSM can be in one, the other, or both states at the
271# same time. During such time, the FSM is eagerly searching for the __init__
272# method definition in order to insert the appropriate method(s) into the lldb
273# module.
274#
Johnny Chenf6ce70a2011-07-03 19:55:50 +0000275# The state CLEANUP_DOCSTRING can be entered from either the NORMAL or the
276# DEFINING_ITERATOR/EQUALITY states. While in this state, the FSM is fixing/
277# cleaning the Python docstrings generated by the swig docstring features.
278#
Johnny Chenb72d1772011-05-24 22:29:49 +0000279# The FSM, in all possible states, also checks the current input for IsValid()
280# definition, and inserts a __nonzero__() method definition to implement truth
281# value testing and the built-in operation bool().
# Walk the generated module line by line.  'state' is a bit mask: NORMAL is 0,
# and DEFINING_ITERATOR, DEFINING_EQUALITY and CLEANUP_DOCSTRING are
# independent flags that may be set at the same time.  Every line that is not
# dropped by a 'continue' below is handed to new_content at the bottom of the
# loop body, possibly preceded by inserted method definitions.
state = NORMAL
for line in content.splitlines():
    # Handle the state transition into CLEANUP_DOCSTRING state as it is possible
    # to enter this state from either NORMAL or DEFINING_ITERATOR/EQUALITY.
    #
    # If the docstring delimiter (toggle_docstring_cleanup_line) is the sole
    # content of the line, prepare to transition to the CLEANUP_DOCSTRING
    # state or out of it.
    if line == toggle_docstring_cleanup_line:
        if state & CLEANUP_DOCSTRING:
            # Special handling of the trailing blank line right before the '"""'
            # end docstring marker.
            new_content.del_blank_line()
            state ^= CLEANUP_DOCSTRING
        else:
            state |= CLEANUP_DOCSTRING

    # Class headers are only looked for while no state flag is set.
    if state == NORMAL:
        match = class_pattern.search(line)
        # Inserts the lldb_iter() definition before the first class definition.
        if not lldb_iter_defined and match:
            new_content.add_line(lldb_iter_def)
            lldb_iter_defined = True

        # If we are at the beginning of the class definitions, prepare to
        # transition to the DEFINING_ITERATOR/DEFINING_EQUALITY state for the
        # right class names.
        if match:
            # 'cls' is remembered across iterations; it is read again below
            # once the __init__ line of this class is reached.
            cls = match.group(1)
            if cls in d:
                # Adding support for iteration for the matched SB class.
                state |= DEFINING_ITERATOR
            if cls in e:
                # Adding support for eq and ne for the matched SB class.
                state |= DEFINING_EQUALITY

    if (state & DEFINING_ITERATOR) or (state & DEFINING_EQUALITY):
        match = init_pattern.search(line)
        if match:
            # We found the beginning of the __init__ method definition.
            # This is a good spot to insert the iter and/or eq-ne support.
            # The inserted lines are added before the __init__ line itself,
            # which is only added at the bottom of the loop body.
            #
            # But note that SBTarget has two types of iterations.
            if cls == "SBTarget":
                new_content.add_line(module_iter % (d[cls]['module']))
                new_content.add_line(breakpoint_iter % (d[cls]['breakpoint']))
            else:
                if (state & DEFINING_ITERATOR):
                    new_content.add_line(iter_def % d[cls])
                    # __len__ delegates to the class's size getter (first
                    # element of the (getsize, getelem) tuple).
                    new_content.add_line(len_def % d[cls][0])
                if (state & DEFINING_EQUALITY):
                    new_content.add_line(eq_def % (cls, list_to_frag(e[cls])))
                    new_content.add_line(ne_def)

            # This special purpose iterator is for SBValue only!!!
            if cls == "SBValue":
                new_content.add_line(linked_list_iter_def)

            # Next state will be NORMAL.  This clears every flag, including
            # CLEANUP_DOCSTRING if it happened to be set.
            state = NORMAL

    if (state & CLEANUP_DOCSTRING):
        # Cleanse the lldb.py of the autodoc'ed residues.
        if c_ifdef_swig in line or c_endif_swig in line:
            continue
        # As well as the comment marker line.
        if c_comment_marker in line:
            continue

        # Also remove the '\a ' and '\b ' substrings.
        # NOTE(review): in these non-raw literals '\a' and '\b' are the BEL
        # (0x07) and backspace (0x08) control characters, not a backslash
        # followed by a letter -- presumably that is the form in which the
        # markers appear in the swig output; confirm before changing.
        line = line.replace('\a ', '')
        line = line.replace('\b ', '')
        # And the leading '///' substring.
        doxygen_comment_match = doxygen_comment_start.match(line)
        if doxygen_comment_match:
            line = line.replace(doxygen_comment_match.group(1), '', 1)

        line = char_to_str_xform(line)

        # Note that the transition out of CLEANUP_DOCSTRING is handled at the
        # beginning of this loop body already.

    # This deals with one-liner docstring, for example, SBThread.GetName:
    # """GetName(self) -> char""".
    if one_liner_docstring_pattern.match(line):
        line = char_to_str_xform(line)

    # Look for 'def IsValid(*args):', and once located, add implementation
    # of truth value testing for this object by delegation.
    if isvalid_pattern.search(line):
        new_content.add_line(nonzero_def)

    # Pass the (possibly transformed) line of content to new_content.
    new_content.add_line(line)
375
376# We are finished with recording new content.
377new_content.finish()
378
# Overwrite the module in place: the post-processed content first, then the
# two trailer statements appended to the end of the generated lldb.py.
trailer_lines = (
    "debugger_unique_id = 0\n",
    "SBDebugger.Initialize()\n",
)
with open(output_name, 'w') as f_out:
    f_out.write(new_content.getvalue())
    for trailer in trailer_lines:
        f_out.write(trailer)