Diff 512968

lldb/examples/python/crashlog.py

Show First 20 Lines • Show All 74 Lines • ▼ Show 20 Lines

class CrashLog(symbolication.Symbolicator):		class CrashLog(symbolication.Symbolicator):
class Thread:		class Thread:
"""Class that represents a thread in a darwin crash log"""		"""Class that represents a thread in a darwin crash log"""

def __init__(self, index, app_specific_backtrace):		def __init__(self, index, app_specific_backtrace):
self.index = index		self.index = index
self.id = index		self.id = index
		self.images = list()
self.frames = list()		self.frames = list()
self.idents = list()		self.idents = list()
self.registers = dict()		self.registers = dict()
self.reason = None		self.reason = None
self.name = None		self.name = None
self.queue = None		self.queue = None
self.crashed = False		self.crashed = False
self.app_specific_backtrace = app_specific_backtrace		self.app_specific_backtrace = app_specific_backtrace
▲ Show 20 Lines • Show All 360 Lines • ▼ Show 20 Lines	def is_valid_json(path):

with open(path, 'r', encoding='utf-8') as f:		with open(path, 'r', encoding='utf-8') as f:
buffer = f.read()		buffer = f.read()
try:		try:
return parse_json(buffer)		return parse_json(buffer)
except:		except:
return None		return None

		def __init__(self, debugger, path, verbose):
		super().__init__(debugger, path, verbose)
		# List of DarwinImages sorted by their index.
		self.images = list()

		mibUnsubmitted Done Reply Inline Actions Why do we need this ? mib: Why do we need this ?
		JDevlieghereAuthorUnsubmitted Done Reply Inline Actions The parser now stores a list of images sorted by their index. We can't use the list of images in the crashlog (`self.crashlog.images`) because they have the main module at index `0`. JDevlieghere: The parser now stores a list of images sorted by their index. We can't use the list of images…
def parse(self):		def parse(self):
try:		try:
self.parse_process_info(self.data)		self.parse_process_info(self.data)
self.parse_images(self.data['usedImages'])		self.parse_images(self.data['usedImages'])
self.parse_main_image(self.data)		self.parse_main_image(self.data)
self.parse_threads(self.data['threads'])		self.parse_threads(self.data['threads'])
if 'asi' in self.data:		if 'asi' in self.data:
self.crashlog.asi = self.data['asi']		self.crashlog.asi = self.data['asi']
Show All 34 Lines	def parse_crash_reason(self, json_exception):
elif 'subtype' in json_exception:		elif 'subtype' in json_exception:
exception_extra = " ({})".format(json_exception['subtype'])		exception_extra = " ({})".format(json_exception['subtype'])
else:		else:
exception_extra = ""		exception_extra = ""
return "{}{}{}".format(exception_type, exception_signal,		return "{}{}{}".format(exception_type, exception_signal,
exception_extra)		exception_extra)

def parse_images(self, json_images):		def parse_images(self, json_images):
idx = 0		for idx, json_image in enumerate(json_images):
		mibUnsubmitted Done Reply Inline Actions What do we use `idx` for ? mib: What do we use `idx` for ?
		JDevlieghereAuthorUnsubmitted Done Reply Inline Actions You're right, this isn't necessary anymore. JDevlieghere: You're right, this isn't necessary anymore.
		mibUnsubmitted Done Reply Inline Actions I'm really not a big fan of having very similar image lists ... maybe we could use the one from the crashlog object and skip the first entry (since we know it's the main executable). What do you think? mib: I'm really not a big fan of having very similar image lists ... maybe we could use the one from…
		mibUnsubmitted Done Reply Inline Actions Otherwise, we could hoist the main executable image from the image list and handle it separately. mib: Otherwise, we could hoist the main executable image from the image list and handle it…
		JDevlieghereAuthorUnsubmitted Done Reply Inline Actions I understand the concern. To be fair, I didn't check whether the main executable coming first is something we rely on, but I'm pretty sure we are: we'll need it to create the target. I didn't want to mess with that and risk introducing a bug that way. It took me quite some time to figure out this was an issue when parsing the symbol data. If we don't want to break that assumption, there's nothing more efficient than keeping a second list of references. I also think it makes sense to keep that in the JSON parser, because the index of (parsed) image is only something that makes sense for that format because it cross references images based on their index. That's not the case in the textual or parser crashlogs. FWIW this is the code that moves the main image to the top, invalidating the image indexes of every image before it: def set_main_image(self, identifier): for i, image in enumerate(self.images): if image.identifier == identifier: self.images.insert(0, self.images.pop(i)) break JDevlieghere: I understand the concern. To be fair, I didn't check whether the main executable coming first…
		mibUnsubmitted Not Done Reply Inline Actions Fair mib: Fair
for json_image in json_images:
img_uuid = uuid.UUID(json_image['uuid'])		img_uuid = uuid.UUID(json_image['uuid'])
low = int(json_image['base'])		low = int(json_image['base'])
high = low + int(		high = low + int(
json_image['size']) if 'size' in json_image else low		json_image['size']) if 'size' in json_image else low
name = json_image['name'] if 'name' in json_image else ''		name = json_image['name'] if 'name' in json_image else ''
path = json_image['path'] if 'path' in json_image else ''		path = json_image['path'] if 'path' in json_image else ''
version = ''		version = ''
darwin_image = self.crashlog.DarwinImage(low, high, name, version,		darwin_image = self.crashlog.DarwinImage(low, high, name, version,
img_uuid, path,		img_uuid, path,
self.verbose)		self.verbose)
		self.images.append(darwin_image)
self.crashlog.images.append(darwin_image)		self.crashlog.images.append(darwin_image)
		mibUnsubmitted Done Reply Inline Actions Seems like we're doing the same things for both `self.images` and `self.crashlog.images` ... In that case, is `self.images` really necessary ? mib: Seems like we're doing the same things for both `self.images` and `self.crashlog.images` ... In…
		JDevlieghereAuthorUnsubmitted Done Reply Inline Actions Yes, see my previous comment. JDevlieghere: Yes, see my previous comment.
idx += 1

def parse_main_image(self, json_data):		def parse_main_image(self, json_data):
if 'procName' in json_data:		if 'procName' in json_data:
proc_name = json_data['procName']		proc_name = json_data['procName']
self.crashlog.set_main_image(proc_name)		self.crashlog.set_main_image(proc_name)

def parse_frames(self, thread, json_frames):		def parse_frames(self, thread, json_frames):
idx = 0		idx = 0
for json_frame in json_frames:		for json_frame in json_frames:
image_id = int(json_frame['imageIndex'])		image_id = int(json_frame['imageIndex'])
json_image = self.get_used_image(image_id)		json_image = self.get_used_image(image_id)
ident = json_image['name'] if 'name' in json_image else ''		ident = json_image['name'] if 'name' in json_image else ''
thread.add_ident(ident)		thread.add_ident(ident)
if ident not in self.crashlog.idents:		if ident not in self.crashlog.idents:
self.crashlog.idents.append(ident)		self.crashlog.idents.append(ident)

frame_offset = int(json_frame['imageOffset'])		frame_offset = int(json_frame['imageOffset'])
image_addr = self.get_used_image(image_id)['base']		image_addr = self.get_used_image(image_id)['base']
pc = image_addr + frame_offset		pc = image_addr + frame_offset

		if 'symbol' in json_frame:
		symbol = json_frame['symbol']
		location = int(json_frame['symbolLocation'])
		image = self.images[image_id]
		image.symbols[symbol] = {
		"name": symbol,
		"type": "code",
		"size": 0x0,
		mibUnsubmitted Done Reply Inline Actions Does this need to be initialized? mib: Does this need to be initialized?
		"address": frame_offset - location
		}

thread.frames.append(self.crashlog.Frame(idx, pc, frame_offset))		thread.frames.append(self.crashlog.Frame(idx, pc, frame_offset))

# on arm64 systems, if it jump through a null function pointer,		# on arm64 systems, if it jump through a null function pointer,
# we end up at address 0 and the crash reporter unwinder		# we end up at address 0 and the crash reporter unwinder
# misses the frame that actually faulted.		# misses the frame that actually faulted.
# But $lr can tell us where the last BL/BLR instruction used		# But $lr can tell us where the last BL/BLR instruction used
# was at, so insert that address as the caller stack frame.		# was at, so insert that address as the caller stack frame.
if idx == 0 and pc == 0 and "lr" in thread.registers:		if idx == 0 and pc == 0 and "lr" in thread.registers:
▲ Show 20 Lines • Show All 808 Lines • Show Last 20 Lines

lldb/examples/python/scripted_process/crashlog_scripted_process.py

Show All 16 Lines	def set_crashlog(self, crashlog):
self.loaded_images = []		self.loaded_images = []
self.exception = self.crashlog.exception		self.exception = self.crashlog.exception
self.app_specific_thread = None		self.app_specific_thread = None
if hasattr(self.crashlog, 'asi'):		if hasattr(self.crashlog, 'asi'):
self.metadata['asi'] = self.crashlog.asi		self.metadata['asi'] = self.crashlog.asi
if hasattr(self.crashlog, 'asb'):		if hasattr(self.crashlog, 'asb'):
self.extended_thread_info = self.crashlog.asb		self.extended_thread_info = self.crashlog.asb

def load_images(self, images):		if self.load_all_images:
#TODO: Add to self.loaded_images and load images in lldb		for image in self.crashlog.images:
if images:		image.resolve = True
for image in images:		else:
		for thread in self.crashlog.threads:
		if thread.did_crash():
		for ident in thread.idents:
		for image in self.crashlog.find_images_with_identifier(ident):
		image.resolve = False

		for image in self.crashlog.images:
if image not in self.loaded_images:		if image not in self.loaded_images:
if image.uuid == uuid.UUID(int=0):		if image.uuid == uuid.UUID(int=0):
continue		continue
err = image.add_module(self.target)		err = image.add_module(self.target)
if err:		if err:
# Append to SBCommandReturnObject		# Append to SBCommandReturnObject
print(err)		print(err)
else:		else:
self.loaded_images.append(image)		self.loaded_images.append(image)

		mibUnsubmitted Done Reply Inline Actions Nice! mib: Nice!
for thread in self.crashlog.threads:		for thread in self.crashlog.threads:
if self.load_all_images:
load_images(self, self.crashlog.images)
elif thread.did_crash():
for ident in thread.idents:
load_images(self, self.crashlog.find_images_with_identifier(ident))

if hasattr(thread, 'app_specific_backtrace') and thread.app_specific_backtrace:		if hasattr(thread, 'app_specific_backtrace') and thread.app_specific_backtrace:
# We don't want to include the Application Specific Backtrace		# We don't want to include the Application Specific Backtrace
# Thread into the Scripted Process' Thread list.		# Thread into the Scripted Process' Thread list.
# Instead, we will try to extract the stackframe pcs from the		# Instead, we will try to extract the stackframe pcs from the
# backtrace and inject that as the extended thread info.		# backtrace and inject that as the extended thread info.
self.app_specific_thread = thread		self.app_specific_thread = thread
continue		continue

▲ Show 20 Lines • Show All 146 Lines • Show Last 20 Lines

lldb/examples/python/symbolication.py

Show All 29 Lines

import optparse import optparse

import os import os

import plistlib import plistlib

import re import re

import shlex import shlex

import sys import sys

import time import time

import uuid import uuid

import json

import tempfile

import pathlib

class Address: class Address:

"""Class that represents an address that will be symbolicated""" """Class that represents an address that will be symbolicated"""

def __init__(self, target, load_addr): def __init__(self, target, load_addr):

self.target = target self.target = target

self.load_addr = load_addr # The load address that this object represents self.load_addr = load_addr # The load address that this object represents

▲ Show 20 Lines • Show All 179 Lines • ▼ Show 20 Lines

class Image: class Image:

"""A class that represents an executable image and any associated data""" """A class that represents an executable image and any associated data"""

def __init__(self, path, uuid=None): def __init__(self, path, uuid=None):

self.path = path self.path = path

self.resolved_path = None self.resolved_path = None

self.resolve = False

self.resolved = False self.resolved = False

self.unavailable = False self.unavailable = False

self.uuid = uuid self.uuid = uuid

self.section_infos = list() self.section_infos = list()

self.identifier = None self.identifier = None

self.version = None self.version = None

self.arch = None self.arch = None

self.module = None self.module = None

self.symfile = None self.symfile = None

self.slide = None self.slide = None

self.symbols = dict()

@classmethod @classmethod

def InitWithSBTargetAndSBModule(cls, target, module): def InitWithSBTargetAndSBModule(cls, target, module):

'''Initialize this Image object with a module from a target.''' '''Initialize this Image object with a module from a target.'''

obj = cls(module.file.fullpath, module.uuid) obj = cls(module.file.fullpath, module.uuid)

obj.resolved_path = module.platform_file.fullpath obj.resolved_path = module.platform_file.fullpath

obj.resolved = True obj.resolved = True

for section in module.sections: for section in module.sections:

▲ Show 20 Lines • Show All 116 Lines • ▼ Show 20 Lines class Image:

def add_module(self, target): def add_module(self, target):

'''Add the Image described in this object to "target" and load the sections if "load" is True.''' '''Add the Image described in this object to "target" and load the sections if "load" is True.'''

if target: if target:

# Try and find using UUID only first so that paths need not match # Try and find using UUID only first so that paths need not match

# up # up

uuid_str = self.get_normalized_uuid_string() uuid_str = self.get_normalized_uuid_string()

if uuid_str: if uuid_str:

self.module = target.AddModule(None, None, uuid_str) self.module = target.AddModule(None, None, uuid_str)

if not self.module: if not self.module and self.resolve:

self.locate_module_and_debug_symbols() self.locate_module_and_debug_symbols()

if self.unavailable: if self.unavailable:

return None return None

resolved_path = self.get_resolved_path() resolved_path = self.get_resolved_path()

self.module = target.AddModule( self.module = target.AddModule(

resolved_path, None, uuid_str, self.symfile) resolved_path, None, uuid_str, self.symfile)

if not self.module and self.section_infos:

name = pathlib.Path(self.path).name

with tempfile.NamedTemporaryFile(suffix='.' + name) as tf:

data = {

'triple': target.triple,

'uuid': uuid_str,

'type': 'sharedlibrary',

'sections': list(),

'symbols': list()

}

for section in self.section_infos:

data['sections'].append({

'name' : section.name,

'address': 0,

'size': section.end_addr - section.start_addr

})

for symbol in self.symbols.values():

data['symbols'].append(symbol)

with open(tf.name, 'w') as f:

f.write(json.dumps(data, indent=4))

self.module = target.AddModule(tf.name, None, uuid_str)

if not self.module: if not self.module:

return 'error: unable to get module for (%s) "%s"' % ( return 'error: unable to get module for (%s) "%s"' % (

self.arch, self.get_resolved_path()) self.arch, self.get_resolved_path())

if self.has_section_load_info(): if self.has_section_load_info():

return self.load_module(target) return self.load_module(target)

else: else:

mibUnsubmitted

Done

if not self.module and self.section_infos:

- name = pathlib.Path(self.path).name

+ name = os.path.basename(self.path)

with tempfile.NamedTemporaryFile(suffix='.' + name) as tf:

Fancy! Can't we just do this and remove the extra import ?

mib: Fancy! Can't we just do this and remove the extra import ?

return None # No sections, the module was added to the target, so success return None # No sections, the module was added to the target, so success

else: else:

return 'error: invalid target' return 'error: invalid target'

def locate_module_and_debug_symbols(self): def locate_module_and_debug_symbols(self):

# By default, just use the paths that were supplied in: # By default, just use the paths that were supplied in:

# self.path # self.path

# self.resolved_path # self.resolved_path

# self.module # self.module

# self.symfile # self.symfile

# Subclasses can inherit from this class and override this function # Subclasses can inherit from this class and override this function

self.resolved = True self.resolved = True

mibUnsubmitted

Done

Since this field is optional in the ObjectFileJSON, I think it should be included here. We should just initialize it to 0 in lldb if the user didn't provide it.

mib: Since this field is optional in the ObjectFileJSON, I think it should be included here. We…

return True return True

def get_uuid(self): def get_uuid(self):

mibUnsubmitted

Done

'size': section.end_addr - section.start_addr

})

- for symbol in self.symbols.values():

- data['symbols'].append(symbol)

+ data['symbols'] = list(self.symbols.values())

with open(tf.name, 'w') as f:

What about :

mib: What about :

if not self.uuid and self.module: if not self.uuid and self.module:

mibUnsubmitted

Done

'size': section.end_addr - section.start_addr

})

- for symbol in self.symbols.values():

- data['symbols'].append(symbol)

+ data['symbols'] = symbols.values()

with open(tf.name, 'w') as f:

This should work, right ?

mib: This should work, right ?

JDevlieghereAuthorUnsubmitted

Done

Apparently not: values() returns a view object rather than a list: https://docs.python.org/3/library/stdtypes.html#dict-views

JDevlieghere: Apparently not: `values()` returns a view object rather than a list: https://docs.python.

self.uuid = uuid.UUID(self.module.GetUUIDString()) self.uuid = uuid.UUID(self.module.GetUUIDString())

return self.uuid return self.uuid

def get_normalized_uuid_string(self): def get_normalized_uuid_string(self):

if self.uuid: if self.uuid:

return str(self.uuid).upper() return str(self.uuid).upper()

return None return None

▲ Show 20 Lines • Show All 325 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[lldb] Use ObjectFileJSON to create modules for interactive crashlogs
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 512968

lldb/examples/python/crashlog.py

lldb/examples/python/scripted_process/crashlog_scripted_process.py

lldb/examples/python/symbolication.py

This is an archive of the discontinued LLVM Phabricator instance.

[lldb] Use ObjectFileJSON to create modules for interactive crashlogs ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 512968

lldb/examples/python/crashlog.py

lldb/examples/python/scripted_process/crashlog_scripted_process.py

lldb/examples/python/symbolication.py

[lldb] Use ObjectFileJSON to create modules for interactive crashlogs
ClosedPublic