blob: bbe8347d9fc4be7d21e5b2ee78b5ccc9fc1df1f5 [file] [log] [blame]
#
# Copyright © 2021 Intel Corporation
#
# Permission is hereby granted, free of charge, to any person obtaining a
# copy of this software and associated documentation files (the "Software"),
# to deal in the Software without restriction, including without limitation
# the rights to use, copy, modify, merge, publish, distribute, sublicense,
# and/or sell copies of the Software, and to permit persons to whom the
# Software is furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice (including the next
# paragraph) shall be included in all copies or substantial portions of the
# Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
#
import argparse
import sys
# List of the default tracepoints enabled. By default most tracepoints are
# enabled, set tp_default=False to disable them by default.
#
# Currently only stall is disabled by default
intel_default_tps = []
#
# Tracepoint definitions:
#
def define_tracepoints(args):
from u_trace import Header, HeaderScope
from u_trace import ForwardDecl
from u_trace import Tracepoint
from u_trace import TracepointArg as Arg
from u_trace import TracepointArgStruct as ArgStruct
Header('intel_driver_ds.h', scope=HeaderScope.SOURCE)
Header('vulkan/vulkan_core.h', scope=HeaderScope.SOURCE|HeaderScope.PERFETTO)
Header('blorp/blorp_priv.h', scope=HeaderScope.HEADER)
Header('ds/intel_driver_ds.h', scope=HeaderScope.HEADER)
def begin_end_tp(name, tp_args=[], tp_struct=None, tp_print=None,
tp_default_enabled=True, end_pipelined=True,
compute=False, maybe_compute=False,
need_cs_param=False):
global intel_default_tps
if tp_default_enabled:
intel_default_tps.append(name)
# Preprocess arguments to handle display_as_hex
processed_args = []
for arg in tp_args:
# Manually handle display_as_hex by modifying the format
if "hash" in arg.var:
arg = Arg(type=arg.type, var=arg.var, c_format='%#x') # Convert to hex format
processed_args.append(arg)
Tracepoint('intel_begin_{0}'.format(name),
toggle_name=name,
tp_perfetto='intel_ds_begin_{0}'.format(name),
need_cs_param=need_cs_param)
tp_flags = []
if end_pipelined:
if compute:
tp_flags.append('INTEL_DS_TRACEPOINT_FLAG_END_CS')
elif maybe_compute:
tp_flags.append('INTEL_DS_TRACEPOINT_FLAG_END_CS_OR_NOOP')
else:
tp_flags.append('INTEL_DS_TRACEPOINT_FLAG_END_OF_PIPE')
Tracepoint('intel_end_{0}'.format(name),
toggle_name=name,
args=processed_args,
tp_struct=tp_struct,
tp_perfetto='intel_ds_end_{0}'.format(name),
tp_print=tp_print,
tp_flags=tp_flags,
need_cs_param=need_cs_param)
# Frame tracepoints
begin_end_tp('frame',
tp_args=[Arg(type='uint32_t', var='frame', c_format='%u'),],
end_pipelined=False,
need_cs_param=True)
# Annotations for Queue(Begin|End)DebugUtilsLabelEXT
begin_end_tp('queue_annotation',
tp_args=[Arg(type='unsigned', var='len'),
Arg(type='str', var='str', c_format='%s', length_arg='len + 1', copy_func='strncpy'),],
tp_struct=[Arg(type='uint8_t', name='dummy', var='0')],
end_pipelined=False,
need_cs_param=True)
# Batch buffer tracepoints, only for Iris
begin_end_tp('batch',
tp_args=[Arg(type='uint8_t', var='name', c_format='%hhu'),],
end_pipelined=False)
# Command buffer tracepoints, only for Anv
begin_end_tp('cmd_buffer',
tp_args=[Arg(type='uint8_t', var='level', c_format='%hhu'),],
end_pipelined=False)
# Annotations for Cmd(Begin|End)DebugUtilsLabelEXT
begin_end_tp('cmd_buffer_annotation',
tp_args=[Arg(type='unsigned', var='len'),
Arg(type='str', var='str', c_format='%s', length_arg='len + 1', copy_func='strncpy'),],
tp_struct=[Arg(type='uint8_t', name='dummy', var='0'),],
end_pipelined=True)
# Transform feedback, only for Anv
begin_end_tp('xfb',
end_pipelined=False)
# Dynamic rendering tracepoints, only for Anv
begin_end_tp('render_pass',
tp_args=[Arg(type='uint16_t', var='width', c_format='%hu'),
Arg(type='uint16_t', var='height', c_format='%hu'),
Arg(type='uint8_t', var='att_count', c_format='%hhu'),
Arg(type='uint8_t', var='msaa', c_format='%hhu'),])
# Blorp operations, Anv & Iris
begin_end_tp('blorp',
tp_args=[Arg(type='enum blorp_op', var='op', c_format='%s', to_prim_type='blorp_op_to_name({})'),
Arg(type='uint32_t', var='width', c_format='%u'),
Arg(type='uint32_t', var='height', c_format='%u'),
Arg(type='uint32_t', var='samples', c_format='%u'),
Arg(type='enum blorp_shader_pipeline', var='shader_pipe', c_format='%s', to_prim_type='blorp_shader_pipeline_to_name({})'),
Arg(type='enum isl_format', var='dst_fmt', c_format='%s', to_prim_type='isl_format_get_short_name({})'),
Arg(type='enum isl_format', var='src_fmt', c_format='%s', to_prim_type='isl_format_get_short_name({})'),
Arg(type='uint8_t', var='predicated', c_format='%hhu'),
])
# vkCmdWriteBufferMarker*, only for Anv
begin_end_tp('write_buffer_marker',
end_pipelined=False)
# Indirect draw generation, only for Anv
begin_end_tp('generate_draws')
begin_end_tp('generate_commands')
# vkCmdResetQuery, only for Anv
begin_end_tp('query_clear_blorp',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u')])
begin_end_tp('query_clear_cs',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u')],
end_pipelined=False)
# vkCmdCopyQueryResults, only for Anv
begin_end_tp('query_copy_cs',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u')],
end_pipelined=False)
begin_end_tp('query_copy_shader',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u')])
# Various draws/dispatch, Anv & Iris
begin_end_tp('draw',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u'),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_multi',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u'),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_indexed',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u'),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_indexed_multi',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u'),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_indirect_byte_count',
tp_args=[Arg(type='uint32_t', var='instance_count', c_format='%u'),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_indirect',
tp_args=[Arg(type='uint32_t', var='draw_count', c_format='%u'),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_indexed_indirect',
tp_args=[Arg(type='uint32_t', var='draw_count', c_format='%u'),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_indirect_count',
tp_args=[Arg(type='uint32_t', var='draw_count', c_format='%u',
is_indirect=True),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_indexed_indirect_count',
tp_args=[Arg(type='uint32_t', var='draw_count', c_format='%u',
is_indirect=True),
Arg(type='uint32_t', var='vs_hash', c_format='%u'),
Arg(type='uint32_t', var='fs_hash', c_format='%u')])
begin_end_tp('draw_mesh',
tp_args=[Arg(type='uint32_t', var='group_x', c_format='%u'),
Arg(type='uint32_t', var='group_y', c_format='%u'),
Arg(type='uint32_t', var='group_z', c_format='%u'),])
begin_end_tp('draw_mesh_indirect',
tp_args=[Arg(type='uint32_t', var='draw_count', c_format='%u'),])
begin_end_tp('draw_mesh_indirect_count',
tp_args=[Arg(type='uint32_t', var='draw_count', c_format='%u',
is_indirect=True),])
begin_end_tp('compute',
tp_args=[Arg(type='uint32_t', var='group_x', c_format='%u'),
Arg(type='uint32_t', var='group_y', c_format='%u'),
Arg(type='uint32_t', var='group_z', c_format='%u'),
Arg(type='uint32_t', var='cs_hash', c_format='%u')],
compute=True)
begin_end_tp('compute_indirect',
tp_args=[ArgStruct(type='VkDispatchIndirectCommand', var='size',
is_indirect=True, c_format="%ux%ux%u",
fields=['x', 'y', 'z']),
Arg(type='uint32_t', var='cs_hash', c_format='%u')],
compute=True)
# Used to identify copies generated by utrace
begin_end_tp('trace_copy',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u'),])
begin_end_tp('trace_copy_cb',
tp_args=[Arg(type='uint32_t', var='count', c_format='%u'),],
need_cs_param=True)
begin_end_tp('as_build')
begin_end_tp('as_build_leaves', maybe_compute=True)
begin_end_tp('as_morton_generate', maybe_compute=True)
begin_end_tp('as_morton_sort', maybe_compute=True)
begin_end_tp('as_lbvh_build_internal', maybe_compute=True)
begin_end_tp('as_ploc_build_internal', maybe_compute=True)
begin_end_tp('as_encode', maybe_compute=True)
begin_end_tp('as_copy', maybe_compute=True)
begin_end_tp('rays',
tp_args=[Arg(type='uint32_t', var='group_x', c_format='%u'),
Arg(type='uint32_t', var='group_y', c_format='%u'),
Arg(type='uint32_t', var='group_z', c_format='%u'),],
compute=True)
def flag_bits(args):
bits = [Arg(type='enum intel_ds_stall_flag', name='flags', var='decode_cb(flags)', c_format='0x%x')]
for a in args:
bits.append(Arg(type='bool', name=a[1], var='__entry->flags & INTEL_DS_{0}_BIT'.format(a[0]), c_format='%u'))
return bits
def stall_args(args):
fmt = ''
exprs = []
for a in args:
fmt += '%s'
exprs.append('(__entry->flags & INTEL_DS_{0}_BIT) ? "+{1}" : ""'.format(a[0], a[1]))
fmt += ' : %s%s%s%s%s%s%s'
exprs.append('(__entry->reason1) ? __entry->reason1 : "unknown"')
exprs.append('(__entry->reason2) ? "; " : ""')
exprs.append('(__entry->reason2) ? __entry->reason2 : ""')
exprs.append('(__entry->reason3) ? "; " : ""')
exprs.append('(__entry->reason3) ? __entry->reason3 : ""')
exprs.append('(__entry->reason4) ? "; " : ""')
exprs.append('(__entry->reason4) ? __entry->reason4 : ""')
# To printout flags
# fmt += '(0x%08x)'
# exprs.append('__entry->flags')
fmt = [fmt]
fmt += exprs
return fmt
stall_flags = [['DEPTH_CACHE_FLUSH', 'depth_flush'],
['DATA_CACHE_FLUSH', 'dc_flush'],
['HDC_PIPELINE_FLUSH', 'hdc_flush'],
['RENDER_TARGET_CACHE_FLUSH', 'rt_flush'],
['TILE_CACHE_FLUSH', 'tile_flush'],
['STATE_CACHE_INVALIDATE', 'state_inval'],
['CONST_CACHE_INVALIDATE', 'const_inval'],
['VF_CACHE_INVALIDATE', 'vf_inval'],
['TEXTURE_CACHE_INVALIDATE', 'tex_inval'],
['INST_CACHE_INVALIDATE', 'ic_inval'],
['STALL_AT_SCOREBOARD', 'pb_stall'],
['DEPTH_STALL', 'depth_stall'],
['CS_STALL', 'cs_stall'],
['UNTYPED_DATAPORT_CACHE_FLUSH', 'udp_flush'],
['PSS_STALL_SYNC', 'pss_stall'],
['END_OF_PIPE', 'eop'],
['CCS_CACHE_FLUSH', 'ccs_flush']]
begin_end_tp('stall',
tp_args=[ArgStruct(type='uint32_t', var='flags'),
ArgStruct(type='intel_ds_stall_cb_t', var='decode_cb'),
ArgStruct(type='const char *', var='reason1'),
ArgStruct(type='const char *', var='reason2'),
ArgStruct(type='const char *', var='reason3'),
ArgStruct(type='const char *', var='reason4'),],
tp_struct=[Arg(type='uint32_t', name='flags', var='decode_cb(flags)', c_format='0x%x'),
Arg(type='const char *', name='reason1', var='reason1', c_format='%s'),
Arg(type='const char *', name='reason2', var='reason2', c_format='%s'),
Arg(type='const char *', name='reason3', var='reason3', c_format='%s'),
Arg(type='const char *', name='reason4', var='reason4', c_format='%s'),],
tp_print=stall_args(stall_flags),
tp_default_enabled=False,
end_pipelined=False)
def generate_code(args):
from u_trace import utrace_generate
from u_trace import utrace_generate_perfetto_utils
utrace_generate(cpath=args.utrace_src, hpath=args.utrace_hdr,
ctx_param='struct intel_ds_device *dev',
trace_toggle_name='intel_gpu_tracepoint',
trace_toggle_defaults=intel_default_tps)
utrace_generate_perfetto_utils(hpath=args.perfetto_hdr,
basename="intel_tracepoint")
def main():
parser = argparse.ArgumentParser()
parser.add_argument('-p', '--import-path', required=True)
parser.add_argument('--utrace-src', required=True)
parser.add_argument('--utrace-hdr', required=True)
parser.add_argument('--perfetto-hdr', required=True)
args = parser.parse_args()
sys.path.insert(0, args.import_path)
define_tracepoints(args)
generate_code(args)
if __name__ == '__main__':
main()