Home | History | Annotate | Download | only in AMDGPU
      1 // RUN: llvm-mc -triple amdgcn--amdhsa -mcpu=kaveri -show-encoding %s | FileCheck %s --check-prefix=ASM
      2 // RUN: llvm-mc -filetype=obj -triple amdgcn--amdhsa -mcpu=kaveri -show-encoding %s | llvm-readobj -symbols -s -sd | FileCheck %s --check-prefix=ELF
      3 
      4 // ELF: Section {
      5 // ELF: Name: .hsatext
      6 // ELF: Type: SHT_PROGBITS (0x1)
      7 // ELF: Flags [ (0xC00007)
      8 // ELF: SHF_ALLOC (0x2)
      9 // ELF: SHF_AMDGPU_HSA_AGENT (0x800000)
     10 // ELF: SHF_AMDGPU_HSA_CODE (0x400000)
     11 // ELF: SHF_EXECINSTR (0x4)
     12 // ELF: SHF_WRITE (0x1)
     13 
     14 // ELF: SHT_NOTE
     15 // ELF: 0000: 04000000 08000000 01000000 414D4400
     16 // ELF: 0010: 01000000 00000000 04000000 1B000000
     17 // ELF: 0020: 03000000 414D4400 04000700 07000000
     18 // ELF: 0030: 00000000 00000000 414D4400 414D4447
     19 // ELF: 0040: 50550000
     20 
     21 // ELF: Symbol {
     22 // ELF: Name: amd_kernel_code_t_minimal
     23 // ELF: Type: AMDGPU_HSA_KERNEL (0xA)
     24 // ELF: Section: .hsatext
     25 // ELF: }
     26 // ELF: Symbol {
     27 // ELF: Name: amd_kernel_code_t_test_all
     28 // ELF: Type: AMDGPU_HSA_KERNEL (0xA)
     29 // ELF: Section: .hsatext
     30 // ELF: }
     31 
     32 
     33 .hsa_code_object_version 1,0
     34 // ASM: .hsa_code_object_version 1,0
     35 
        // The code-object version directive above and the ISA directive below are
        // each expected to be echoed unchanged in the textual output (see the check
        // line directly under each directive).
     36 .hsa_code_object_isa 7,0,0,"AMD","AMDGPU"
     37 // ASM: .hsa_code_object_isa 7,0,0,"AMD","AMDGPU"
     38 
        // Declare both kernel labels before they are defined. The object-file checks
        // near the top of this file expect each of these symbols to have type
        // AMDGPU_HSA_KERNEL.
     39 .amdgpu_hsa_kernel amd_kernel_code_t_test_all
     40 .amdgpu_hsa_kernel amd_kernel_code_t_minimal
     41 
        // Both kernels are defined after this directive; the object-file checks
        // expect their symbols to live in section .hsatext.
     42 .hsatext
     43 // ASM: .hsatext
     44 
     45 amd_kernel_code_t_test_all:
     46 ; Test all amd_kernel_code_t members with non-default values.
        ; Every field is assigned explicitly below, and the checks that follow the
        ; block expect the assembler to print each field back with the same value.
        ; "Non-default" can be verified against the expected output of the minimal
        ; kernel later in this file, which shows the value printed for a field that
        ; was never assigned.
     47 .amd_kernel_code_t
     48 	kernel_code_version_major = 100
     49 	kernel_code_version_minor = 100
        	; 0 is intentional: the minimal kernel's expected output shows 1 for an
        	; unassigned machine_kind.
     50 	machine_kind = 0
        	; 5/5/5 differs from the 7/0/0 printed for the minimal kernel, which
        	; leaves these three fields unassigned.
     51 	machine_version_major = 5
     52 	machine_version_minor = 5
     53 	machine_version_stepping = 5
        	; 512 differs from the 256 printed for the minimal kernel.
     54 	kernel_code_entry_byte_offset = 512
     55 	kernel_code_prefetch_byte_size = 1
     56 	max_scratch_backing_memory_byte_size = 1
     57 	compute_pgm_rsrc1_vgprs = 1
     58 	compute_pgm_rsrc1_sgprs = 1
     59 	compute_pgm_rsrc1_priority = 1
     60 	compute_pgm_rsrc1_float_mode = 1
     61 	compute_pgm_rsrc1_priv = 1
     62 	compute_pgm_rsrc1_dx10_clamp = 1
     63 	compute_pgm_rsrc1_debug_mode = 1
     64 	compute_pgm_rsrc1_ieee_mode = 1
     65 	compute_pgm_rsrc2_scratch_en = 1
     66 	compute_pgm_rsrc2_user_sgpr = 1
     67 	compute_pgm_rsrc2_tgid_x_en = 1
     68 	compute_pgm_rsrc2_tgid_y_en = 1
     69 	compute_pgm_rsrc2_tgid_z_en = 1
     70 	compute_pgm_rsrc2_tg_size_en = 1
     71 	compute_pgm_rsrc2_tidig_comp_cnt = 1
     72 	compute_pgm_rsrc2_excp_en_msb = 1
     73 	compute_pgm_rsrc2_lds_size = 1
     74 	compute_pgm_rsrc2_excp_en = 1
     75 	enable_sgpr_private_segment_buffer = 1
     76 	enable_sgpr_dispatch_ptr = 1
     77 	enable_sgpr_queue_ptr = 1
     78 	enable_sgpr_kernarg_segment_ptr = 1
     79 	enable_sgpr_dispatch_id = 1
     80 	enable_sgpr_flat_scratch_init = 1
     81 	enable_sgpr_private_segment_size = 1
     82 	enable_sgpr_grid_workgroup_count_x = 1
     83 	enable_sgpr_grid_workgroup_count_y = 1
     84 	enable_sgpr_grid_workgroup_count_z = 1
     85 	enable_ordered_append_gds = 1
     86 	private_element_size = 1
     87 	is_ptr64 = 1
     88 	is_dynamic_callstack = 1
     89 	is_debug_enabled = 1
     90 	is_xnack_enabled = 1
     91 	workitem_private_segment_byte_size = 1
     92 	workgroup_group_segment_byte_size = 1
     93 	gds_segment_byte_size = 1
     94 	kernarg_segment_byte_size = 1
     95 	workgroup_fbarrier_count = 1
     96 	wavefront_sgpr_count = 1
     97 	workitem_vgpr_count = 1
     98 	reserved_vgpr_first = 1
     99 	reserved_vgpr_count = 1
    100 	reserved_sgpr_first = 1
    101 	reserved_sgpr_count = 1
    102 	debug_wavefront_private_segment_offset_sgpr = 1
    103 	debug_private_segment_buffer_sgpr = 1
        	; The three alignments use 5 and wavefront_size uses 5; the minimal
        	; kernel's expected output shows 4 and 6 respectively when unassigned.
    104 	kernarg_segment_alignment = 5
    105 	group_segment_alignment = 5
    106 	private_segment_alignment = 5
    107 	wavefront_size = 5
    108 	call_convention = 1
    109 	runtime_loader_kernel_symbol = 1
    110 .end_amd_kernel_code_t
    111 
    112 // ASM-LABEL: {{^}}amd_kernel_code_t_test_all:
    113 // ASM: .amd_kernel_code_t
    114 // ASM: kernel_code_version_major = 100
    115 // ASM: kernel_code_version_minor = 100
    116 // ASM: machine_kind = 0
    117 // ASM: machine_version_major = 5
    118 // ASM: machine_version_minor = 5
    119 // ASM: machine_version_stepping = 5
    120 // ASM: kernel_code_entry_byte_offset = 512
    121 // ASM: kernel_code_prefetch_byte_size = 1
    122 // ASM: max_scratch_backing_memory_byte_size = 1
    123 // ASM: compute_pgm_rsrc1_vgprs = 1
    124 // ASM: compute_pgm_rsrc1_sgprs = 1
    125 // ASM: compute_pgm_rsrc1_priority = 1
    126 // ASM: compute_pgm_rsrc1_float_mode = 1
    127 // ASM: compute_pgm_rsrc1_priv = 1
    128 // ASM: compute_pgm_rsrc1_dx10_clamp = 1
    129 // ASM: compute_pgm_rsrc1_debug_mode = 1
    130 // ASM: compute_pgm_rsrc1_ieee_mode = 1
    131 // ASM: compute_pgm_rsrc2_scratch_en = 1
    132 // ASM: compute_pgm_rsrc2_user_sgpr = 1
    133 // ASM: compute_pgm_rsrc2_tgid_x_en = 1
    134 // ASM: compute_pgm_rsrc2_tgid_y_en = 1
    135 // ASM: compute_pgm_rsrc2_tgid_z_en = 1
    136 // ASM: compute_pgm_rsrc2_tg_size_en = 1
    137 // ASM: compute_pgm_rsrc2_tidig_comp_cnt = 1
    138 // ASM: compute_pgm_rsrc2_excp_en_msb = 1
    139 // ASM: compute_pgm_rsrc2_lds_size = 1
    140 // ASM: compute_pgm_rsrc2_excp_en = 1
    141 // ASM: enable_sgpr_private_segment_buffer = 1
    142 // ASM: enable_sgpr_dispatch_ptr = 1
    143 // ASM: enable_sgpr_queue_ptr = 1
    144 // ASM: enable_sgpr_kernarg_segment_ptr = 1
    145 // ASM: enable_sgpr_dispatch_id = 1
    146 // ASM: enable_sgpr_flat_scratch_init = 1
    147 // ASM: enable_sgpr_private_segment_size = 1
    148 // ASM: enable_sgpr_grid_workgroup_count_x = 1
    149 // ASM: enable_sgpr_grid_workgroup_count_y = 1
    150 // ASM: enable_sgpr_grid_workgroup_count_z = 1
    151 // ASM: enable_ordered_append_gds = 1
    152 // ASM: private_element_size = 1
    153 // ASM: is_ptr64 = 1
    154 // ASM: is_dynamic_callstack = 1
    155 // ASM: is_debug_enabled = 1
    156 // ASM: is_xnack_enabled = 1
    157 // ASM: workitem_private_segment_byte_size = 1
    158 // ASM: workgroup_group_segment_byte_size = 1
    159 // ASM: gds_segment_byte_size = 1
    160 // ASM: kernarg_segment_byte_size = 1
    161 // ASM: workgroup_fbarrier_count = 1
    162 // ASM: wavefront_sgpr_count = 1
    163 // ASM: workitem_vgpr_count = 1
    164 // ASM: reserved_vgpr_first = 1
    165 // ASM: reserved_vgpr_count = 1
    166 // ASM: reserved_sgpr_first = 1
    167 // ASM: reserved_sgpr_count = 1
    168 // ASM: debug_wavefront_private_segment_offset_sgpr = 1
    169 // ASM: debug_private_segment_buffer_sgpr = 1
    170 // ASM: kernarg_segment_alignment = 5
    171 // ASM: group_segment_alignment = 5
    172 // ASM: private_segment_alignment = 5
    173 // ASM: wavefront_size = 5
    174 // ASM: call_convention = 1
    175 // ASM: runtime_loader_kernel_symbol = 1
    176 // ASM: .end_amd_kernel_code_t
    177 
    178 amd_kernel_code_t_minimal:
        // Assigns only eight fields. The checks that follow the block expect every
        // field of the structure to be printed anyway, so the unassigned ones are
        // expected to appear with values this source never wrote.
        //
        // The block also doubles as a parser test: it contains commented-out
        // assignments in both comment styles, a blank line, and a whitespace-only
        // line, none of which may disturb parsing.
        // NOTE(review): the whitespace-only line depends on trailing whitespace
        // surviving in the file; confirm editors/tools do not strip it.
    179 .amd_kernel_code_t
    180 	enable_sgpr_kernarg_segment_ptr = 1
    181 	is_ptr64 = 1
    182 	compute_pgm_rsrc1_vgprs = 1
    183 	compute_pgm_rsrc1_sgprs = 1
    184 	compute_pgm_rsrc2_user_sgpr = 2
    185 	kernarg_segment_byte_size = 16
    186 	wavefront_sgpr_count = 8
        // The next two lines are commented-out assignments, one per comment style.
        // The expected output still shows wavefront_sgpr_count = 8, so neither of
        // them may take effect.
    187 //      wavefront_sgpr_count = 7
    188 ;	wavefront_sgpr_count = 7
    189 // Make sure a blank line won't break anything:
    190 
    191 // Make sure a line with whitespace won't break anything:
    192 
    193 	workitem_vgpr_count = 16
    194 .end_amd_kernel_code_t
    195 
    196 // ASM-LABEL: {{^}}amd_kernel_code_t_minimal:
    197 // ASM: .amd_kernel_code_t
    198 // ASM:	kernel_code_version_major = 1
    199 // ASM:	kernel_code_version_minor = 0
    200 // ASM:	machine_kind = 1
    201 // ASM:	machine_version_major = 7
    202 // ASM:	machine_version_minor = 0
    203 // ASM:	machine_version_stepping = 0
    204 // ASM:	kernel_code_entry_byte_offset = 256
    205 // ASM:	kernel_code_prefetch_byte_size = 0
    206 // ASM:	max_scratch_backing_memory_byte_size = 0
    207 // ASM:	compute_pgm_rsrc1_vgprs = 1
    208 // ASM:	compute_pgm_rsrc1_sgprs = 1
    209 // ASM:	compute_pgm_rsrc1_priority = 0
    210 // ASM:	compute_pgm_rsrc1_float_mode = 0
    211 // ASM:	compute_pgm_rsrc1_priv = 0
    212 // ASM:	compute_pgm_rsrc1_dx10_clamp = 0
    213 // ASM:	compute_pgm_rsrc1_debug_mode = 0
    214 // ASM:	compute_pgm_rsrc1_ieee_mode = 0
    215 // ASM:	compute_pgm_rsrc2_scratch_en = 0
    216 // ASM:	compute_pgm_rsrc2_user_sgpr = 2
    217 // ASM:	compute_pgm_rsrc2_tgid_x_en = 0
    218 // ASM:	compute_pgm_rsrc2_tgid_y_en = 0
    219 // ASM:	compute_pgm_rsrc2_tgid_z_en = 0
    220 // ASM:	compute_pgm_rsrc2_tg_size_en = 0
    221 // ASM:	compute_pgm_rsrc2_tidig_comp_cnt = 0
    222 // ASM:	compute_pgm_rsrc2_excp_en_msb = 0
    223 // ASM:	compute_pgm_rsrc2_lds_size = 0
    224 // ASM:	compute_pgm_rsrc2_excp_en = 0
    225 // ASM:	enable_sgpr_private_segment_buffer = 0
    226 // ASM:	enable_sgpr_dispatch_ptr = 0
    227 // ASM:	enable_sgpr_queue_ptr = 0
    228 // ASM:	enable_sgpr_kernarg_segment_ptr = 1
    229 // ASM:	enable_sgpr_dispatch_id = 0
    230 // ASM:	enable_sgpr_flat_scratch_init = 0
    231 // ASM:	enable_sgpr_private_segment_size = 0
    232 // ASM:	enable_sgpr_grid_workgroup_count_x = 0
    233 // ASM:	enable_sgpr_grid_workgroup_count_y = 0
    234 // ASM:	enable_sgpr_grid_workgroup_count_z = 0
    235 // ASM:	enable_ordered_append_gds = 0
    236 // ASM:	private_element_size = 0
    237 // ASM:	is_ptr64 = 1
    238 // ASM:	is_dynamic_callstack = 0
    239 // ASM:	is_debug_enabled = 0
    240 // ASM:	is_xnack_enabled = 0
    241 // ASM:	workitem_private_segment_byte_size = 0
    242 // ASM:	workgroup_group_segment_byte_size = 0
    243 // ASM:	gds_segment_byte_size = 0
    244 // ASM:	kernarg_segment_byte_size = 16
    245 // ASM:	workgroup_fbarrier_count = 0
    246 // ASM:	wavefront_sgpr_count = 8
    247 // ASM:	workitem_vgpr_count = 16
    248 // ASM:	reserved_vgpr_first = 0
    249 // ASM:	reserved_vgpr_count = 0
    250 // ASM:	reserved_sgpr_first = 0
    251 // ASM:	reserved_sgpr_count = 0
    252 // ASM:	debug_wavefront_private_segment_offset_sgpr = 0
    253 // ASM:	debug_private_segment_buffer_sgpr = 0
    254 // ASM:	kernarg_segment_alignment = 4
    255 // ASM:	group_segment_alignment = 4
    256 // ASM:	private_segment_alignment = 4
    257 // ASM:	wavefront_size = 6
    258 // ASM:	call_convention = 0
    259 // ASM:	runtime_loader_kernel_symbol = 0
    260 // ASM: .end_amd_kernel_code_t
    261