diff options
Diffstat (limited to 'tools/perf/scripts/python')
| -rwxr-xr-x | tools/perf/scripts/python/arm-cs-trace-disasm.py | 274 | ||||
| -rw-r--r-- | tools/perf/scripts/python/intel-pt-events.py | 40 | 
2 files changed, 308 insertions, 6 deletions
diff --git a/tools/perf/scripts/python/arm-cs-trace-disasm.py b/tools/perf/scripts/python/arm-cs-trace-disasm.py new file mode 100755 index 000000000000..4339692a8d0b --- /dev/null +++ b/tools/perf/scripts/python/arm-cs-trace-disasm.py @@ -0,0 +1,274 @@ +# SPDX-License-Identifier: GPL-2.0 +# arm-cs-trace-disasm.py: ARM CoreSight Trace Dump With Disassember +# +# Author: Tor Jeremiassen <tor@ti.com> +#         Mathieu Poirier <mathieu.poirier@linaro.org> +#         Leo Yan <leo.yan@linaro.org> +#         Al Grant <Al.Grant@arm.com> + +from __future__ import print_function +import os +from os import path +import sys +import re +from subprocess import * +from optparse import OptionParser, make_option + +from perf_trace_context import perf_set_itrace_options, \ +	perf_sample_insn, perf_sample_srccode + +# Below are some example commands for using this script. +# +# Output disassembly with objdump: +#  perf script -s scripts/python/arm-cs-trace-disasm.py \ +#		-- -d objdump -k path/to/vmlinux +# Output disassembly with llvm-objdump: +#  perf script -s scripts/python/arm-cs-trace-disasm.py \ +#		-- -d llvm-objdump-11 -k path/to/vmlinux +# Output only source line and symbols: +#  perf script -s scripts/python/arm-cs-trace-disasm.py + +# Command line parsing. +option_list = [ +	# formatting options for the bottom entry of the stack +	make_option("-k", "--vmlinux", dest="vmlinux_name", +		    help="Set path to vmlinux file"), +	make_option("-d", "--objdump", dest="objdump_name", +		    help="Set path to objdump executable file"), +	make_option("-v", "--verbose", dest="verbose", +		    action="store_true", default=False, +		    help="Enable debugging log") +] + +parser = OptionParser(option_list=option_list) +(options, args) = parser.parse_args() + +# Initialize global dicts and regular expression +disasm_cache = dict() +cpu_data = dict() +disasm_re = re.compile("^\s*([0-9a-fA-F]+):") +disasm_func_re = re.compile("^\s*([0-9a-fA-F]+)\s.*:") +cache_size = 64*1024 + +glb_source_file_name	= None +glb_line_number		= None +glb_dso			= None + +def get_optional(perf_dict, field): +       if field in perf_dict: +               return perf_dict[field] +       return "[unknown]" + +def get_offset(perf_dict, field): +	if field in perf_dict: +		return "+%#x" % perf_dict[field] +	return "" + +def get_dso_file_path(dso_name, dso_build_id): +	if (dso_name == "[kernel.kallsyms]" or dso_name == "vmlinux"): +		if (options.vmlinux_name): +			return options.vmlinux_name; +		else: +			return dso_name + +	if (dso_name == "[vdso]") : +		append = "/vdso" +	else: +		append = "/elf" + +	dso_path = os.environ['PERF_BUILDID_DIR'] + "/" + dso_name + "/" + dso_build_id + append; +	# Replace duplicate slash chars to single slash char +	dso_path = dso_path.replace('//', '/', 1) +	return dso_path + +def read_disam(dso_fname, dso_start, start_addr, stop_addr): +	addr_range = str(start_addr) + ":" + str(stop_addr) + ":" + dso_fname + +	# Don't let the cache get too big, clear it when it hits max size +	if (len(disasm_cache) > cache_size): +		disasm_cache.clear(); + +	if addr_range in disasm_cache: +		disasm_output = disasm_cache[addr_range]; +	else: +		start_addr = start_addr - dso_start; +		stop_addr = stop_addr - dso_start; +		disasm = [ options.objdump_name, "-d", "-z", +			   "--start-address="+format(start_addr,"#x"), +			   "--stop-address="+format(stop_addr,"#x") ] +		disasm += [ dso_fname ] +		disasm_output = check_output(disasm).decode('utf-8').split('\n') +		disasm_cache[addr_range] = disasm_output + +	return disasm_output + +def print_disam(dso_fname, dso_start, start_addr, stop_addr): +	for line in read_disam(dso_fname, dso_start, start_addr, stop_addr): +		m = disasm_func_re.search(line) +		if m is None: +			m = disasm_re.search(line) +			if m is None: +				continue +		print("\t" + line) + +def print_sample(sample): +	print("Sample = { cpu: %04d addr: 0x%016x phys_addr: 0x%016x ip: 0x%016x " \ +	      "pid: %d tid: %d period: %d time: %d }" % \ +	      (sample['cpu'], sample['addr'], sample['phys_addr'], \ +	       sample['ip'], sample['pid'], sample['tid'], \ +	       sample['period'], sample['time'])) + +def trace_begin(): +	print('ARM CoreSight Trace Data Assembler Dump') + +def trace_end(): +	print('End') + +def trace_unhandled(event_name, context, event_fields_dict): +	print(' '.join(['%s=%s'%(k,str(v))for k,v in sorted(event_fields_dict.items())])) + +def common_start_str(comm, sample): +	sec = int(sample["time"] / 1000000000) +	ns = sample["time"] % 1000000000 +	cpu = sample["cpu"] +	pid = sample["pid"] +	tid = sample["tid"] +	return "%16s %5u/%-5u [%04u] %9u.%09u  " % (comm, pid, tid, cpu, sec, ns) + +# This code is copied from intel-pt-events.py for printing source code +# line and symbols. +def print_srccode(comm, param_dict, sample, symbol, dso): +	ip = sample["ip"] +	if symbol == "[unknown]": +		start_str = common_start_str(comm, sample) + ("%x" % ip).rjust(16).ljust(40) +	else: +		offs = get_offset(param_dict, "symoff") +		start_str = common_start_str(comm, sample) + (symbol + offs).ljust(40) + +	global glb_source_file_name +	global glb_line_number +	global glb_dso + +	source_file_name, line_number, source_line = perf_sample_srccode(perf_script_context) +	if source_file_name: +		if glb_line_number == line_number and glb_source_file_name == source_file_name: +			src_str = "" +		else: +			if len(source_file_name) > 40: +				src_file = ("..." + source_file_name[-37:]) + " " +			else: +				src_file = source_file_name.ljust(41) + +			if source_line is None: +				src_str = src_file + str(line_number).rjust(4) + " <source not found>" +			else: +				src_str = src_file + str(line_number).rjust(4) + " " + source_line +		glb_dso = None +	elif dso == glb_dso: +		src_str = "" +	else: +		src_str = dso +		glb_dso = dso + +	glb_line_number = line_number +	glb_source_file_name = source_file_name + +	print(start_str, src_str) + +def process_event(param_dict): +	global cache_size +	global options + +	sample = param_dict["sample"] +	comm = param_dict["comm"] + +	name = param_dict["ev_name"] +	dso = get_optional(param_dict, "dso") +	dso_bid = get_optional(param_dict, "dso_bid") +	dso_start = get_optional(param_dict, "dso_map_start") +	dso_end = get_optional(param_dict, "dso_map_end") +	symbol = get_optional(param_dict, "symbol") + +	if (options.verbose == True): +		print("Event type: %s" % name) +		print_sample(sample) + +	# If cannot find dso so cannot dump assembler, bail out +	if (dso == '[unknown]'): +		return + +	# Validate dso start and end addresses +	if ((dso_start == '[unknown]') or (dso_end == '[unknown]')): +		print("Failed to find valid dso map for dso %s" % dso) +		return + +	if (name[0:12] == "instructions"): +		print_srccode(comm, param_dict, sample, symbol, dso) +		return + +	# Don't proceed if this event is not a branch sample, . +	if (name[0:8] != "branches"): +		return + +	cpu = sample["cpu"] +	ip = sample["ip"] +	addr = sample["addr"] + +	# Initialize CPU data if it's empty, and directly return back +	# if this is the first tracing event for this CPU. +	if (cpu_data.get(str(cpu) + 'addr') == None): +		cpu_data[str(cpu) + 'addr'] = addr +		return + +	# The format for packet is: +	# +	#		  +------------+------------+------------+ +	#  sample_prev:   |    addr    |    ip	    |	 cpu	 | +	#		  +------------+------------+------------+ +	#  sample_next:   |    addr    |    ip	    |	 cpu	 | +	#		  +------------+------------+------------+ +	# +	# We need to combine the two continuous packets to get the instruction +	# range for sample_prev::cpu: +	# +	#     [ sample_prev::addr .. sample_next::ip ] +	# +	# For this purose, sample_prev::addr is stored into cpu_data structure +	# and read back for 'start_addr' when the new packet comes, and we need +	# to use sample_next::ip to calculate 'stop_addr', plusing extra 4 for +	# 'stop_addr' is for the sake of objdump so the final assembler dump can +	# include last instruction for sample_next::ip. +	start_addr = cpu_data[str(cpu) + 'addr'] +	stop_addr  = ip + 4 + +	# Record for previous sample packet +	cpu_data[str(cpu) + 'addr'] = addr + +	# Handle CS_ETM_TRACE_ON packet if start_addr=0 and stop_addr=4 +	if (start_addr == 0 and stop_addr == 4): +		print("CPU%d: CS_ETM_TRACE_ON packet is inserted" % cpu) +		return + +	if (start_addr < int(dso_start) or start_addr > int(dso_end)): +		print("Start address 0x%x is out of range [ 0x%x .. 0x%x ] for dso %s" % (start_addr, int(dso_start), int(dso_end), dso)) +		return + +	if (stop_addr < int(dso_start) or stop_addr > int(dso_end)): +		print("Stop address 0x%x is out of range [ 0x%x .. 0x%x ] for dso %s" % (stop_addr, int(dso_start), int(dso_end), dso)) +		return + +	if (options.objdump_name != None): +		# It doesn't need to decrease virtual memory offset for disassembly +		# for kernel dso, so in this case we set vm_start to zero. +		if (dso == "[kernel.kallsyms]"): +			dso_vm_start = 0 +		else: +			dso_vm_start = int(dso_start) + +		dso_fname = get_dso_file_path(dso, dso_bid) +		if path.exists(dso_fname): +			print_disam(dso_fname, dso_vm_start, start_addr, stop_addr) +		else: +			print("Failed to find dso %s for address range [ 0x%x .. 0x%x ]" % (dso, start_addr, stop_addr)) + +	print_srccode(comm, param_dict, sample, symbol, dso) diff --git a/tools/perf/scripts/python/intel-pt-events.py b/tools/perf/scripts/python/intel-pt-events.py index 973bd12b7b40..6be7fd8fd615 100644 --- a/tools/perf/scripts/python/intel-pt-events.py +++ b/tools/perf/scripts/python/intel-pt-events.py @@ -104,7 +104,13 @@ def print_ptwrite(raw_buf):  	flags = data[0]  	payload = data[1]  	exact_ip = flags & 1 -	print("IP: %u payload: %#x" % (exact_ip, payload), end=' ') +	try: +		s = payload.to_bytes(8, "little").decode("ascii").rstrip("\x00") +		if not s.isprintable(): +			s = "" +	except: +		s = "" +	print("IP: %u payload: %#x" % (exact_ip, payload), s, end=' ')  def print_cbr(raw_buf):  	data = struct.unpack_from("<BBBBII", raw_buf) @@ -191,7 +197,12 @@ def common_start_str(comm, sample):  	cpu = sample["cpu"]  	pid = sample["pid"]  	tid = sample["tid"] -	return "%16s %5u/%-5u [%03u] %9u.%09u  " % (comm, pid, tid, cpu, ts / 1000000000, ts %1000000000) +	if "machine_pid" in sample: +		machine_pid = sample["machine_pid"] +		vcpu = sample["vcpu"] +		return "VM:%5d VCPU:%03d %16s %5u/%-5u [%03u] %9u.%09u  " % (machine_pid, vcpu, comm, pid, tid, cpu, ts / 1000000000, ts %1000000000) +	else: +		return "%16s %5u/%-5u [%03u] %9u.%09u  " % (comm, pid, tid, cpu, ts / 1000000000, ts %1000000000)  def print_common_start(comm, sample, name):  	flags_disp = get_optional_null(sample, "flags_disp") @@ -373,9 +384,19 @@ def process_event(param_dict):  		sys.exit(1)  def auxtrace_error(typ, code, cpu, pid, tid, ip, ts, msg, cpumode, *x): +	if len(x) >= 2 and x[0]: +		machine_pid = x[0] +		vcpu = x[1] +	else: +		machine_pid = 0 +		vcpu = -1  	try: -		print("%16s %5u/%-5u [%03u] %9u.%09u  error type %u code %u: %s ip 0x%16x" % -			("Trace error", pid, tid, cpu, ts / 1000000000, ts %1000000000, typ, code, msg, ip)) +		if machine_pid: +			print("VM:%5d VCPU:%03d %16s %5u/%-5u [%03u] %9u.%09u  error type %u code %u: %s ip 0x%16x" % +				(machine_pid, vcpu, "Trace error", pid, tid, cpu, ts / 1000000000, ts %1000000000, typ, code, msg, ip)) +		else: +			print("%16s %5u/%-5u [%03u] %9u.%09u  error type %u code %u: %s ip 0x%16x" % +				("Trace error", pid, tid, cpu, ts / 1000000000, ts %1000000000, typ, code, msg, ip))  	except broken_pipe_exception:  		# Stop python printing broken pipe errors and traceback  		sys.stdout = open(os.devnull, 'w') @@ -390,14 +411,21 @@ def context_switch(ts, cpu, pid, tid, np_pid, np_tid, machine_pid, out, out_pree  		preempt_str = "preempt"  	else:  		preempt_str = "" +	if len(x) >= 2 and x[0]: +		machine_pid = x[0] +		vcpu = x[1] +	else: +		vcpu = None;  	if machine_pid == -1:  		machine_str = "" -	else: +	elif vcpu is None:  		machine_str = "machine PID %d" % machine_pid +	else: +		machine_str = "machine PID %d VCPU %d" % (machine_pid, vcpu)  	switch_str = "%16s %5d/%-5d [%03u] %9u.%09u %5d/%-5d %s %s" % \  		(out_str, pid, tid, cpu, ts / 1000000000, ts %1000000000, np_pid, np_tid, machine_str, preempt_str)  	if glb_args.all_switch_events: -		print(switch_str); +		print(switch_str)  	else:  		global glb_switch_str  		glb_switch_str[cpu] = switch_str  | 
