blob: f62898ff803ace8e4f2b38ff20c78ec92e75f46f [file] [log] [blame]
# a wrapper for the Objective-C runtime for use by LLDB
import lldb
import cache
class Utilities:
@staticmethod
def read_ascii(process, pointer,max_len=128,when_over_return_none=True):
error = lldb.SBError()
pystr = ''
count = 0
# there is not any length byte to tell us how much to read
# however, there are most probably ways to optimize this
# in order to avoid doing the read byte-by-byte (caching is
# still occurring, but we could just fetch a larger chunk
# of memory instead of going one byte at a time)
while True:
content = process.ReadMemory(pointer, 1, error)
new_bytes = bytearray(content)
if new_bytes == None or len(new_bytes) == 0:
break
b0 = new_bytes[0]
pointer = pointer + 1
if b0 == 0:
break
count = count + 1
if count > max_len:
if when_over_return_none:
return None
else:
return pystr
pystr = pystr + chr(b0)
return pystr
@staticmethod
def is_valid_pointer(pointer, pointer_size, allow_tagged):
if pointer == None:
return False
if pointer == 0:
return False
if allow_tagged:
if (pointer % 2) == 1:
return True
return ((pointer % pointer_size) == 0)
# Objective-C runtime has a rule that pointers in a class_t will only have bits 0 thru 46 set
# so if any pointer has bits 47 thru 63 high we know that this is not a valid isa
@staticmethod
def is_allowed_pointer(pointer):
if pointer == None:
return False
mask = 0xFFFF800000000000
if (pointer & mask) != 0:
return False
return True
@staticmethod
def read_child_of(valobj,offset,type):
child = valobj.CreateChildAtOffset("childUNK",offset,type)
if child == None or child.IsValid() == False:
return None;
return child.GetValueAsUnsigned()
@staticmethod
def is_valid_identifier(name):
if name is None:
return None
if len(name) == 0:
return None
return True
# the rules below make perfect sense for compile-time class names, but the runtime is free
# to create classes with arbitrary names to implement functionality (e.g -poseAsClass)
# hence, we cannot really outlaw anything appearing in an identifier
#ok_first = dict.fromkeys("$ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz_")
#ok_others = dict.fromkeys("$ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz_1234567890")
#if name[0] not in ok_first:
# return False
#return all(c in ok_others for c in name[1:])
class RoT_Data:
def __init__(self,rot_pointer,params):
if (Utilities.is_valid_pointer(rot_pointer.GetValueAsUnsigned(),params.pointer_size, allow_tagged=False)):
self.sys_params = params
self.valobj = rot_pointer
self.flags = Utilities.read_child_of(self.valobj,0,self.sys_params.uint32_t)
self.instanceStart = Utilities.read_child_of(self.valobj,4,self.sys_params.uint32_t)
self.instanceSize = Utilities.read_child_of(self.valobj,8,self.sys_params.uint32_t)
if self.sys_params.lp64:
self.reserved = Utilities.read_child_of(self.valobj,12,self.sys_params.uint32_t)
offset = 16
else:
self.reserved = 0
offset = 12
self.ivarLayoutPtr = Utilities.read_child_of(self.valobj,offset,self.sys_params.addr_ptr_type)
offset = offset + self.sys_params.pointer_size
self.namePointer = Utilities.read_child_of(self.valobj,offset,self.sys_params.addr_ptr_type)
self.check_valid()
else:
self.valid = False
if self.valid:
self.name = Utilities.read_ascii(self.valobj.GetTarget().GetProcess(),self.namePointer)
if not(Utilities.is_valid_identifier(self.name)):
self.valid = False
# perform sanity checks on the contents of this class_rw_t
def check_valid(self):
self.valid = True
# misaligned pointers seem to be possible for this field
#if not(Utilities.is_valid_pointer(self.namePointer,self.sys_params.pointer_size,allow_tagged=False)):
# self.valid = False
# pass
def __str__(self):
return 'flags = ' + str(self.flags) + "\n" + \
"instanceStart = " + hex(self.instanceStart) + "\n" + \
"instanceSize = " + hex(self.instanceSize) + "\n" + \
"reserved = " + hex(self.reserved) + "\n" + \
"ivarLayoutPtr = " + hex(self.ivarLayoutPtr) + "\n" + \
"namePointer = " + hex(self.namePointer) + " --> " + self.name
def is_valid(self):
return self.valid
class RwT_Data:
def __init__(self,rwt_pointer,params):
if (Utilities.is_valid_pointer(rwt_pointer.GetValueAsUnsigned(),params.pointer_size, allow_tagged=False)):
self.sys_params = params
self.valobj = rwt_pointer
self.flags = Utilities.read_child_of(self.valobj,0,self.sys_params.uint32_t)
self.version = Utilities.read_child_of(self.valobj,4,self.sys_params.uint32_t)
self.roPointer = Utilities.read_child_of(self.valobj,8,self.sys_params.addr_ptr_type)
self.check_valid()
else:
self.valid = False
if self.valid:
self.rot = self.valobj.CreateValueFromAddress("rot",self.roPointer,self.sys_params.addr_ptr_type).AddressOf()
self.data = RoT_Data(self.rot,self.sys_params)
# perform sanity checks on the contents of this class_rw_t
def check_valid(self):
self.valid = True
if not(Utilities.is_valid_pointer(self.roPointer,self.sys_params.pointer_size,allow_tagged=False)):
self.valid = False
def __str__(self):
return 'flags = ' + str(self.flags) + "\n" + \
"version = " + hex(self.version) + "\n" + \
"roPointer = " + hex(self.roPointer)
def is_valid(self):
if self.valid:
return self.data.is_valid()
return False
class Class_Data_V2:
def __init__(self,isa_pointer,params):
if (isa_pointer != None) and (Utilities.is_valid_pointer(isa_pointer.GetValueAsUnsigned(),params.pointer_size, allow_tagged=False)):
self.sys_params = params
self.valobj = isa_pointer
self.isaPointer = Utilities.read_child_of(self.valobj,0,self.sys_params.addr_ptr_type)
self.superclassIsaPointer = Utilities.read_child_of(self.valobj,1*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.cachePointer = Utilities.read_child_of(self.valobj,2*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.vtablePointer = Utilities.read_child_of(self.valobj,3*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.dataPointer = Utilities.read_child_of(self.valobj,4*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.check_valid()
else:
self.valid = False
if self.valid:
self.rwt = self.valobj.CreateValueFromAddress("rwt",self.dataPointer,self.sys_params.addr_ptr_type).AddressOf()
self.data = RwT_Data(self.rwt,self.sys_params)
# perform sanity checks on the contents of this class_t
def check_valid(self):
self.valid = True
if not(Utilities.is_valid_pointer(self.isaPointer,self.sys_params.pointer_size,allow_tagged=False)):
self.valid = False
return
if not(Utilities.is_valid_pointer(self.superclassIsaPointer,self.sys_params.pointer_size,allow_tagged=False)):
# NULL is a valid value for superclass (it means we have reached NSObject)
if self.superclassIsaPointer != 0:
self.valid = False
return
if not(Utilities.is_valid_pointer(self.cachePointer,self.sys_params.pointer_size,allow_tagged=False)):
self.valid = False
return
if not(Utilities.is_valid_pointer(self.vtablePointer,self.sys_params.pointer_size,allow_tagged=False)):
self.valid = False
return
if not(Utilities.is_valid_pointer(self.dataPointer,self.sys_params.pointer_size,allow_tagged=False)):
self.valid = False
return
if not(Utilities.is_allowed_pointer(self.isaPointer)):
self.valid = False
return
if not(Utilities.is_allowed_pointer(self.superclassIsaPointer)):
# NULL is a valid value for superclass (it means we have reached NSObject)
if self.superclassIsaPointer != 0:
self.valid = False
return
if not(Utilities.is_allowed_pointer(self.cachePointer)):
self.valid = False
return
if not(Utilities.is_allowed_pointer(self.vtablePointer)):
self.valid = False
return
if not(Utilities.is_allowed_pointer(self.dataPointer)):
self.valid = False
return
def is_kvo(self):
if self.is_valid():
if self.data.data.name.startswith("NSKVONotify"):
return True
else:
return None
def get_superclass(self):
if self.is_valid():
parent_isa_pointer = self.valobj.CreateChildAtOffset("parent_isa",
self.sys_params.pointer_size,
self.sys_params.addr_ptr_type)
return Class_Data_V2(parent_isa_pointer,self.sys_params)
else:
return None
def class_name(self):
if self.is_valid():
return self.data.data.name
else:
return None
def is_valid(self):
if self.valid:
return self.data.is_valid()
return False
def __str__(self):
return 'isaPointer = ' + hex(self.isaPointer) + "\n" + \
"superclassIsaPointer = " + hex(self.superclassIsaPointer) + "\n" + \
"cachePointer = " + hex(self.cachePointer) + "\n" + \
"vtablePointer = " + hex(self.vtablePointer) + "\n" + \
"data = " + hex(self.dataPointer)
def is_tagged(self):
return False
def instance_size(self,align=False):
if self.is_valid() == False:
return None
if align:
unalign = self.instance_size(False)
if self.sys_params.lp64:
return ((unalign + 7) & ~7) % 0x100000000
else:
return ((unalign + 3) & ~3) % 0x100000000
else:
return self.rwt.rot.instanceSize
# runtime v1 is much less intricate than v2 and stores relevant information directly in the class_t object
class Class_Data_V1:
def __init__(self,isa_pointer,params):
if (isa_pointer != None) and (Utilities.is_valid_pointer(isa_pointer.GetValueAsUnsigned(),params.pointer_size, allow_tagged=False)):
self.sys_params = params
self.valobj = isa_pointer
self.isaPointer = Utilities.read_child_of(self.valobj,0,self.sys_params.addr_ptr_type)
self.superclassIsaPointer = Utilities.read_child_of(self.valobj,1*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.namePointer = Utilities.read_child_of(self.valobj,2*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.version = Utilities.read_child_of(self.valobj,3*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.info = Utilities.read_child_of(self.valobj,4*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.instanceSize = Utilities.read_child_of(self.valobj,5*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
# since we do not introspect ivars, methods, ... these four pointers need not be named in a meaningful way
# moreover, we do not care about their values, just that they are correctly aligned
self.ptr1 = Utilities.read_child_of(self.valobj,6*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.ptr2 = Utilities.read_child_of(self.valobj,7*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.ptr3 = Utilities.read_child_of(self.valobj,8*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.ptr4 = Utilities.read_child_of(self.valobj,9*self.sys_params.pointer_size,self.sys_params.addr_ptr_type)
self.check_valid()
else:
self.valid = False
if self.valid:
self.name = Utilities.read_ascii(self.valobj.GetTarget().GetProcess(),self.namePointer)
if not(Utilities.is_valid_identifier(self.name)):
self.valid = False
# perform sanity checks on the contents of this class_t
def check_valid(self):
self.valid = True
if not(Utilities.is_valid_pointer(self.isaPointer,self.sys_params.pointer_size,allow_tagged=False)):
self.valid = False
return
if not(Utilities.is_valid_pointer(self.superclassIsaPointer,self.sys_params.pointer_size,allow_tagged=False)):
# NULL is a valid value for superclass (it means we have reached NSObject)
if self.superclassIsaPointer != 0:
self.valid = False
return
#if not(Utilities.is_valid_pointer(self.namePointer,self.sys_params.pointer_size,allow_tagged=False)):
# self.valid = False
# return
def is_kvo(self):
if self.is_valid():
if self.name.startswith("NSKVONotify"):
return True
else:
return None
def get_superclass(self):
if self.is_valid():
parent_isa_pointer = self.valobj.CreateChildAtOffset("parent_isa",
self.sys_params.pointer_size,
self.sys_params.addr_ptr_type)
return Class_Data_V1(parent_isa_pointer,self.sys_params)
else:
return None
def class_name(self):
if self.is_valid():
return self.name
else:
return None
def is_valid(self):
return self.valid
def __str__(self):
return 'isaPointer = ' + hex(self.isaPointer) + "\n" + \
"superclassIsaPointer = " + hex(self.superclassIsaPointer) + "\n" + \
"namePointer = " + hex(self.namePointer) + " --> " + self.name + \
"version = " + hex(self.version) + "\n" + \
"info = " + hex(self.info) + "\n" + \
"instanceSize = " + hex(self.instanceSize) + "\n"
def is_tagged(self):
return False
def instance_size(self,align=False):
if self.is_valid() == False:
return None
if align:
unalign = self.instance_size(False)
if self.sys_params.lp64:
return ((unalign + 7) & ~7) % 0x100000000
else:
return ((unalign + 3) & ~3) % 0x100000000
else:
return self.instanceSize
class TaggedClass_Data:
def __init__(self,pointer,params):
self.valid = True
self.name = None
self.sys_params = params
self.valobj = pointer
self.val = (pointer & ~0x0000000000000000FF) >> 8
self.class_bits = (pointer & 0xE) >> 1
self.i_bits = (pointer & 0xF0) >> 4
# ignoring the LSB, NSNumber gets marked
# as 3 on Zin and as 1 on Lion - I can either make
# a difference or accept false positives
# ToT LLDB + some knowledge of framework versioning
# would let me do the right thing - for now I just
# act dumb and accept false positives
if self.class_bits == 0 or \
self.class_bits == 5 or \
self.class_bits == 7 or \
self.class_bits == 9:
self.valid = False
return
elif self.class_bits == 3 or self.class_bits == 1:
self.name = 'NSNumber'
elif self.class_bits == 11:
self.name = 'NSManagedObject'
elif self.class_bits == 13:
self.name = 'NSDate'
elif self.class_bits == 15:
self.name = 'NSDateTS' # not sure what this is
else:
self.valid = False
def is_valid(self):
return self.valid
def class_name(self):
if self.is_valid():
return self.name
else:
return None
def value(self):
return self.val if self.is_valid() else None
def info_bits(self):
return self.i_bits if self.is_valid() else None
def is_kvo(self):
return False
# we would need to go around looking for the superclass or ask the runtime
# for now, we seem not to require support for this operation so we will merrily
# pretend to be at a root point in the hierarchy
def get_superclass(self):
return None
# anything that is handled here is tagged
def is_tagged(self):
return True
# it seems reasonable to say that a tagged pointer is the size of a pointer
def instance_size(self,align=False):
if self.is_valid() == False:
return None
return 8 if self.sys_params.lp64 else 4
class InvalidClass_Data:
def __init__(self):
pass
def is_valid(self):
return False
runtime_version = cache.Cache()
class SystemParameters:
def __init__(self,valobj):
self.adjust_for_architecture(valobj)
def adjust_for_architecture(self,valobj):
self.process = valobj.GetTarget().GetProcess()
self.lp64 = (self.process.GetAddressByteSize() == 8)
self.is_little = (self.process.GetByteOrder() == lldb.eByteOrderLittle)
self.pointer_size = self.process.GetAddressByteSize()
self.addr_type = valobj.GetType().GetBasicType(lldb.eBasicTypeUnsignedLong)
self.addr_ptr_type = self.addr_type.GetPointerType()
self.uint32_t = valobj.GetType().GetBasicType(lldb.eBasicTypeUnsignedInt)
global runtime_version
pid = self.process.GetProcessID()
if runtime_version.look_for_key(pid):
self.runtime_version = runtime_version.get_value(pid)
else:
self.runtime_version = ObjCRuntime.runtime_version(self.process)
runtime_version.add_item(pid,self.runtime_version)
isa_cache = cache.Cache()
class ObjCRuntime:
# the ObjC runtime has no explicit "version" field that we can use
# instead, we discriminate v1 from v2 by looking for the presence
# of a well-known section only present in v1
@staticmethod
def runtime_version(process):
if process.IsValid() == False:
return None
target = process.GetTarget()
num_modules = target.GetNumModules()
module_objc = None
for idx in range(num_modules):
module = target.GetModuleAtIndex(idx)
if module.GetFileSpec().GetFilename() == 'libobjc.A.dylib':
module_objc = module
break
if module_objc == None or module_objc.IsValid() == False:
return None
num_sections = module.GetNumSections()
section_objc = None
for idx in range(num_sections):
section = module.GetSectionAtIndex(idx)
if section.GetName() == '__OBJC':
section_objc = section
break
if section_objc != None and section_objc.IsValid():
return 1
return 2
def __init__(self,valobj):
self.valobj = valobj
self.adjust_for_architecture()
self.sys_params = SystemParameters(self.valobj)
def adjust_for_architecture(self):
self.lp64 = (self.valobj.GetTarget().GetProcess().GetAddressByteSize() == 8)
self.is_little = (self.valobj.GetTarget().GetProcess().GetByteOrder() == lldb.eByteOrderLittle)
self.pointer_size = self.valobj.GetTarget().GetProcess().GetAddressByteSize()
self.addr_type = self.valobj.GetType().GetBasicType(lldb.eBasicTypeUnsignedLong)
self.addr_ptr_type = self.addr_type.GetPointerType()
# an ObjC pointer can either be tagged or must be aligned
def is_tagged(self):
if self.valobj is None:
return False
return (Utilities.is_valid_pointer(self.valobj.GetValueAsUnsigned(),self.pointer_size, allow_tagged=True) and not(Utilities.is_valid_pointer(self.valobj.GetValueAsUnsigned(),self.pointer_size, allow_tagged=False)))
def is_valid(self):
if self.valobj is None:
return False
if self.valobj.IsInScope() == False:
return False
return Utilities.is_valid_pointer(self.valobj.GetValueAsUnsigned(),self.pointer_size, allow_tagged=True)
def read_isa(self):
isa_pointer = self.valobj.CreateChildAtOffset("cfisa",
0,
self.addr_ptr_type)
if isa_pointer == None or isa_pointer.IsValid() == False:
return None;
if isa_pointer.GetValueAsUnsigned(1) == 1:
return None;
return isa_pointer
def read_class_data(self):
global isa_cache
if self.is_tagged():
# tagged pointers only exist in ObjC v2
if self.sys_params.runtime_version == 2:
# not every odd-valued pointer is actually tagged. most are just plain wrong
# we could try and predetect this before even creating a TaggedClass_Data object
# but unless performance requires it, this seems a cleaner way to tackle the task
tentative_tagged = TaggedClass_Data(self.valobj.GetValueAsUnsigned(0),self.sys_params)
return tentative_tagged if tentative_tagged.is_valid() else InvalidClass_Data()
else:
return InvalidClass_Data()
if self.is_valid() == False:
return InvalidClass_Data()
isa = self.read_isa()
if isa == None:
return InvalidClass_Data()
isa_value = isa.GetValueAsUnsigned(1)
if isa_value == 1:
return InvalidClass_Data()
data = isa_cache.get_value(isa_value,default=None)
if data != None:
return data
if self.sys_params.runtime_version == 2:
data = Class_Data_V2(isa,self.sys_params)
else:
data = Class_Data_V1(isa,self.sys_params)
if data == None:
return InvalidClass_Data()
if data.is_valid():
isa_cache.add_item(isa_value,data,ok_to_replace=True)
return data