[libomptarget] [amdgpu] Added LDS usage to the kernel trace

Reviewed By: JonChesterfield

Differential Revision: https://reviews.llvm.org/D103059
This commit is contained in:
Dhruva Chakrabarti 2021-05-24 16:35:29 -07:00
parent d881319cc5
commit 96d70f4d28
1 changed file with 6 additions and 4 deletions

View File

@@ -1788,10 +1788,12 @@ int32_t __tgt_rtl_run_target_team_region_locked(
return OFFLOAD_FAIL;
}
uint32_t group_segment_size;
uint32_t sgpr_count, vgpr_count, sgpr_spill_count, vgpr_spill_count;
{
auto it = KernelInfoTable[device_id][kernel_name];
group_segment_size = it.group_segment_size;
sgpr_count = it.sgpr_count;
vgpr_count = it.vgpr_count;
sgpr_spill_count = it.sgpr_spill_count;
@@ -1819,12 +1821,12 @@ int32_t __tgt_rtl_run_target_team_region_locked(
bool traceToStdout = print_kernel_trace & (RTL_TO_STDOUT | RTL_TIMING);
fprintf(traceToStdout ? stdout : stderr,
"DEVID:%2d SGN:%1d ConstWGSize:%-4d args:%2d teamsXthrds:(%4dX%4d) "
"reqd:(%4dX%4d) sgpr_count:%u vgpr_count:%u sgpr_spill_count:%u "
"vgpr_spill_count:%u tripcount:%lu n:%s\n",
"reqd:(%4dX%4d) lds_usage:%uB sgpr_count:%u vgpr_count:%u "
"sgpr_spill_count:%u vgpr_spill_count:%u tripcount:%lu n:%s\n",
device_id, KernelInfo->ExecutionMode, KernelInfo->ConstWGSize,
arg_num, num_groups, threadsPerGroup, num_teams, thread_limit,
sgpr_count, vgpr_count, sgpr_spill_count, vgpr_spill_count,
loop_tripcount, KernelInfo->Name);
group_segment_size, sgpr_count, vgpr_count, sgpr_spill_count,
vgpr_spill_count, loop_tripcount, KernelInfo->Name);
}
// Run on the device.