// Forked from OSchip/llvm-project (279 lines, 9.5 KiB, ArmAsm).
// RUN: llvm-mc -triple amdgcn--amdhsa -mcpu=kaveri -show-encoding %s | FileCheck %s --check-prefix=ASM
|
|
// RUN: llvm-mc -filetype=obj -triple amdgcn--amdhsa -mcpu=kaveri -show-encoding %s | llvm-readobj -symbols -s -sd | FileCheck %s --check-prefix=ELF
|
|
|
|
// ELF: Section {
|
|
// ELF: Name: .text
|
|
// ELF: Type: SHT_PROGBITS (0x1)
|
|
// ELF: Flags [ (0x6)
|
|
// ELF: SHF_ALLOC (0x2)
|
|
// ELF: SHF_EXECINSTR (0x4)
|
|
|
|
// ELF: SHT_NOTE
|
|
// ELF: 0000: 04000000 08000000 01000000 414D4400
|
|
// ELF: 0010: 02000000 00000000 04000000 1B000000
|
|
// ELF: 0020: 03000000 414D4400 04000700 07000000
|
|
// ELF: 0030: 00000000 00000000 414D4400 414D4447
|
|
// ELF: 0040: 50550000
|
|
// We can't check binary representation of metadata note: it is different on
|
|
// Windows and Linux because of carriage return on Windows
|
|
|
|
// ELF: Symbol {
|
|
// ELF: Name: amd_kernel_code_t_minimal
|
|
// ELF: Type: AMDGPU_HSA_KERNEL (0xA)
|
|
// ELF: Section: .text
|
|
// ELF: }
|
|
// ELF: Symbol {
|
|
// ELF: Name: amd_kernel_code_t_test_all
|
|
// ELF: Type: AMDGPU_HSA_KERNEL (0xA)
|
|
// ELF: Section: .text
|
|
// ELF: }
|
|
|
|
// Section switch and code-object header directives; each one is expected to
// be printed back unchanged in the textual output.
.text
// ASM: .text

.hsa_code_object_version 2,0
// ASM: .hsa_code_object_version 2,0

.hsa_code_object_isa 7,0,0,"AMD","AMDGPU"
// ASM: .hsa_code_object_isa 7,0,0,"AMD","AMDGPU"

// Runtime metadata naming both kernels. The input lists the kernels in flow
// style ([ ... ]); the checks after the block expect the printed form to list
// them in block style ("- { ... }") and to contain an additional amd.IsaInfo
// entry that is not present in the input.
.amdgpu_runtime_metadata
{
amd.MDVersion: [ 2, 0 ]
amd.Kernels: [
{ amd.KernelName: amd_kernel_code_t_test_all },
{ amd.KernelName: amd_kernel_code_t_minimal }
]
}
.end_amdgpu_runtime_metadata

// ASM: .amdgpu_runtime_metadata
// ASM: {
// ASM: amd.MDVersion: [ 2, 0 ]
// ASM: amd.IsaInfo: { amd.IsaInfoWavefrontSize: 64, amd.IsaInfoLocalMemorySize: 65536, amd.IsaInfoEUsPerCU: 4, amd.IsaInfoMaxWavesPerEU: 10, amd.IsaInfoMaxFlatWorkGroupSize: 2048, amd.IsaInfoSGPRAllocGranule: 8, amd.IsaInfoTotalNumSGPRs: 512, amd.IsaInfoAddressableNumSGPRs: 104, amd.IsaInfoVGPRAllocGranule: 4, amd.IsaInfoTotalNumVGPRs: 256, amd.IsaInfoAddressableNumVGPRs: 256 },
// ASM: amd.Kernels:
// ASM: - { amd.KernelName: amd_kernel_code_t_test_all }
// ASM: - { amd.KernelName: amd_kernel_code_t_minimal }
// ASM: }
// ASM: .end_amdgpu_runtime_metadata

// Mark both labels defined later in this file as HSA kernels. The ELF checks
// at the top of the file expect each symbol to have type AMDGPU_HSA_KERNEL
// (presumably as a result of these directives).
.amdgpu_hsa_kernel amd_kernel_code_t_test_all
.amdgpu_hsa_kernel amd_kernel_code_t_minimal

amd_kernel_code_t_test_all:
; Test all amd_kernel_code_t members with non-default values.
// Several fields are written here under a different spelling than the one the
// checks expect in the printed output (for example kernel_code_version_major
// is expected back as amd_code_version_major, and compute_pgm_rsrc1_vgprs as
// granulated_workitem_vgpr_count), so this block also covers those alternate
// input names.
.amd_kernel_code_t
    kernel_code_version_major = 100
    kernel_code_version_minor = 100
    machine_kind = 0
    machine_version_major = 5
    machine_version_minor = 5
    machine_version_stepping = 5
    kernel_code_entry_byte_offset = 512
    kernel_code_prefetch_byte_size = 1
    max_scratch_backing_memory_byte_size = 1
    compute_pgm_rsrc1_vgprs = 1
    compute_pgm_rsrc1_sgprs = 1
    compute_pgm_rsrc1_priority = 1
    compute_pgm_rsrc1_float_mode = 1
    compute_pgm_rsrc1_priv = 1
    compute_pgm_rsrc1_dx10_clamp = 1
    compute_pgm_rsrc1_debug_mode = 1
    compute_pgm_rsrc1_ieee_mode = 1
    compute_pgm_rsrc2_scratch_en = 1
    compute_pgm_rsrc2_user_sgpr = 1
    compute_pgm_rsrc2_tgid_x_en = 1
    compute_pgm_rsrc2_tgid_y_en = 1
    compute_pgm_rsrc2_tgid_z_en = 1
    compute_pgm_rsrc2_tg_size_en = 1
    compute_pgm_rsrc2_tidig_comp_cnt = 1
    compute_pgm_rsrc2_excp_en_msb = 1
    compute_pgm_rsrc2_lds_size = 1
    compute_pgm_rsrc2_excp_en = 1
    enable_sgpr_private_segment_buffer = 1
    enable_sgpr_dispatch_ptr = 1
    enable_sgpr_queue_ptr = 1
    enable_sgpr_kernarg_segment_ptr = 1
    enable_sgpr_dispatch_id = 1
    enable_sgpr_flat_scratch_init = 1
    enable_sgpr_private_segment_size = 1
    enable_sgpr_grid_workgroup_count_x = 1
    enable_sgpr_grid_workgroup_count_y = 1
    enable_sgpr_grid_workgroup_count_z = 1
    enable_ordered_append_gds = 1
    private_element_size = 1
    is_ptr64 = 1
    is_dynamic_callstack = 1
    is_debug_enabled = 1
    is_xnack_enabled = 1
    workitem_private_segment_byte_size = 1
    workgroup_group_segment_byte_size = 1
    gds_segment_byte_size = 1
    kernarg_segment_byte_size = 1
    workgroup_fbarrier_count = 1
    wavefront_sgpr_count = 1
    workitem_vgpr_count = 1
    reserved_vgpr_first = 1
    reserved_vgpr_count = 1
    reserved_sgpr_first = 1
    reserved_sgpr_count = 1
    debug_wavefront_private_segment_offset_sgpr = 1
    debug_private_segment_buffer_sgpr = 1
    kernarg_segment_alignment = 5
    group_segment_alignment = 5
    private_segment_alignment = 5
    wavefront_size = 5
    call_convention = 1
    runtime_loader_kernel_symbol = 1
.end_amd_kernel_code_t

// ASM-LABEL: {{^}}amd_kernel_code_t_test_all:
// ASM: .amd_kernel_code_t
// ASM: amd_code_version_major = 100
// ASM: amd_code_version_minor = 100
// ASM: amd_machine_kind = 0
// ASM: amd_machine_version_major = 5
// ASM: amd_machine_version_minor = 5
// ASM: amd_machine_version_stepping = 5
// ASM: kernel_code_entry_byte_offset = 512
// ASM: kernel_code_prefetch_byte_size = 1
// ASM: max_scratch_backing_memory_byte_size = 1
// ASM: granulated_workitem_vgpr_count = 1
// ASM: granulated_wavefront_sgpr_count = 1
// ASM: priority = 1
// ASM: float_mode = 1
// ASM: priv = 1
// ASM: enable_dx10_clamp = 1
// ASM: debug_mode = 1
// ASM: enable_ieee_mode = 1
// ASM: enable_sgpr_private_segment_wave_byte_offset = 1
// ASM: user_sgpr_count = 1
// ASM: enable_sgpr_workgroup_id_x = 1
// ASM: enable_sgpr_workgroup_id_y = 1
// ASM: enable_sgpr_workgroup_id_z = 1
// ASM: enable_sgpr_workgroup_info = 1
// ASM: enable_vgpr_workitem_id = 1
// ASM: enable_exception_msb = 1
// ASM: granulated_lds_size = 1
// ASM: enable_exception = 1
// ASM: enable_sgpr_private_segment_buffer = 1
// ASM: enable_sgpr_dispatch_ptr = 1
// ASM: enable_sgpr_queue_ptr = 1
// ASM: enable_sgpr_kernarg_segment_ptr = 1
// ASM: enable_sgpr_dispatch_id = 1
// ASM: enable_sgpr_flat_scratch_init = 1
// ASM: enable_sgpr_private_segment_size = 1
// ASM: enable_sgpr_grid_workgroup_count_x = 1
// ASM: enable_sgpr_grid_workgroup_count_y = 1
// ASM: enable_sgpr_grid_workgroup_count_z = 1
// ASM: enable_ordered_append_gds = 1
// ASM: private_element_size = 1
// ASM: is_ptr64 = 1
// ASM: is_dynamic_callstack = 1
// ASM: is_debug_enabled = 1
// ASM: is_xnack_enabled = 1
// ASM: workitem_private_segment_byte_size = 1
// ASM: workgroup_group_segment_byte_size = 1
// ASM: gds_segment_byte_size = 1
// ASM: kernarg_segment_byte_size = 1
// ASM: workgroup_fbarrier_count = 1
// ASM: wavefront_sgpr_count = 1
// ASM: workitem_vgpr_count = 1
// ASM: reserved_vgpr_first = 1
// ASM: reserved_vgpr_count = 1
// ASM: reserved_sgpr_first = 1
// ASM: reserved_sgpr_count = 1
// ASM: debug_wavefront_private_segment_offset_sgpr = 1
// ASM: debug_private_segment_buffer_sgpr = 1
// ASM: kernarg_segment_alignment = 5
// ASM: group_segment_alignment = 5
// ASM: private_segment_alignment = 5
// ASM: wavefront_size = 5
// ASM: call_convention = 1
// ASM: runtime_loader_kernel_symbol = 1
// ASM: .end_amd_kernel_code_t

// Minimal kernel descriptor: only a handful of fields are assigned, and the
// checks after the block pin the values expected for every field, including
// the ones left unset here. The body also contains both comment styles, a
// blank line and a whitespace-only line.
amd_kernel_code_t_minimal:
.amd_kernel_code_t
    enable_sgpr_kernarg_segment_ptr = 1
    is_ptr64 = 1
    granulated_workitem_vgpr_count = 1
    granulated_wavefront_sgpr_count = 1
    user_sgpr_count = 2
    kernarg_segment_byte_size = 16
    wavefront_sgpr_count = 8
//  wavefront_sgpr_count = 7
;   wavefront_sgpr_count = 7
// Make sure a blank line won't break anything:

// Make sure a line with whitespace won't break anything:
    
    workitem_vgpr_count = 16
.end_amd_kernel_code_t

// ASM-LABEL: {{^}}amd_kernel_code_t_minimal:
// ASM: .amd_kernel_code_t
// ASM: amd_code_version_major = 1
// ASM: amd_code_version_minor = 1
// ASM: amd_machine_kind = 1
// ASM: amd_machine_version_major = 7
// ASM: amd_machine_version_minor = 0
// ASM: amd_machine_version_stepping = 0
// ASM: kernel_code_entry_byte_offset = 256
// ASM: kernel_code_prefetch_byte_size = 0
// ASM: max_scratch_backing_memory_byte_size = 0
// ASM: granulated_workitem_vgpr_count = 1
// ASM: granulated_wavefront_sgpr_count = 1
// ASM: priority = 0
// ASM: float_mode = 0
// ASM: priv = 0
// ASM: enable_dx10_clamp = 0
// ASM: debug_mode = 0
// ASM: enable_ieee_mode = 0
// ASM: enable_sgpr_private_segment_wave_byte_offset = 0
// ASM: user_sgpr_count = 2
// ASM: enable_sgpr_workgroup_id_x = 0
// ASM: enable_sgpr_workgroup_id_y = 0
// ASM: enable_sgpr_workgroup_id_z = 0
// ASM: enable_sgpr_workgroup_info = 0
// ASM: enable_vgpr_workitem_id = 0
// ASM: enable_exception_msb = 0
// ASM: granulated_lds_size = 0
// ASM: enable_exception = 0
// ASM: enable_sgpr_private_segment_buffer = 0
// ASM: enable_sgpr_dispatch_ptr = 0
// ASM: enable_sgpr_queue_ptr = 0
// ASM: enable_sgpr_kernarg_segment_ptr = 1
// ASM: enable_sgpr_dispatch_id = 0
// ASM: enable_sgpr_flat_scratch_init = 0
// ASM: enable_sgpr_private_segment_size = 0
// ASM: enable_sgpr_grid_workgroup_count_x = 0
// ASM: enable_sgpr_grid_workgroup_count_y = 0
// ASM: enable_sgpr_grid_workgroup_count_z = 0
// ASM: enable_ordered_append_gds = 0
// ASM: private_element_size = 0
// ASM: is_ptr64 = 1
// ASM: is_dynamic_callstack = 0
// ASM: is_debug_enabled = 0
// ASM: is_xnack_enabled = 0
// ASM: workitem_private_segment_byte_size = 0
// ASM: workgroup_group_segment_byte_size = 0
// ASM: gds_segment_byte_size = 0
// ASM: kernarg_segment_byte_size = 16
// ASM: workgroup_fbarrier_count = 0
// ASM: wavefront_sgpr_count = 8
// ASM: workitem_vgpr_count = 16
// ASM: reserved_vgpr_first = 0
// ASM: reserved_vgpr_count = 0
// ASM: reserved_sgpr_first = 0
// ASM: reserved_sgpr_count = 0
// ASM: debug_wavefront_private_segment_offset_sgpr = 0
// ASM: debug_private_segment_buffer_sgpr = 0
// ASM: kernarg_segment_alignment = 4
// ASM: group_segment_alignment = 4
// ASM: private_segment_alignment = 4
// ASM: wavefront_size = 6
// ASM: call_convention = -1
// ASM: runtime_loader_kernel_symbol = 0
// ASM: .end_amd_kernel_code_t