Home | History | Annotate | Download | only in AMDGPU
      1 ; RUN: llc -mtriple=amdgcn--amdhsa -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
      2 
      3 ; GCN-LABEL: {{^}}test_default_ci:
      4 ; GCN: float_mode = 192
      5 ; GCN: enable_dx10_clamp = 1
      6 ; GCN: enable_ieee_mode = 1
        ; Default-mode case for attribute group #0, which selects target-cpu
        ; "kaveri" and sets no target-features. The checks above expect
        ; float_mode 192 with dx10 clamp and IEEE mode both enabled.
        ; The body stores 0.0 through a float and a double addrspace(1) pointer;
        ; the checks inspect only the three mode fields, not the stores
        ; (presumably the stores just give the kernel a body -- confirm).
      7 define amdgpu_kernel void @test_default_ci(float addrspace(1)* %out0, double addrspace(1)* %out1) #0 {
      8   store float 0.0, float addrspace(1)* %out0
      9   store double 0.0, double addrspace(1)* %out1
     10   ret void
     11 }
     12 
     13 ; GCN-LABEL: {{^}}test_default_vi:
     14 ; GCN: float_mode = 192
     15 ; GCN: enable_dx10_clamp = 1
     16 ; GCN: enable_ieee_mode = 1
        ; Default-mode case for attribute group #1, which selects target-cpu
        ; "fiji" and sets no target-features. The expected mode fields are
        ; identical to the "kaveri" default test: float_mode 192, dx10 clamp
        ; enabled, IEEE mode enabled.
        ; The body stores 0.0 through a float and a double addrspace(1) pointer;
        ; only the three mode fields are checked.
     17 define amdgpu_kernel void @test_default_vi(float addrspace(1)* %out0, double addrspace(1)* %out1) #1 {
     18   store float 0.0, float addrspace(1)* %out0
     19   store double 0.0, double addrspace(1)* %out1
     20   ret void
     21 }
     22 
     23 ; GCN-LABEL: {{^}}test_f64_denormals:
     24 ; GCN: float_mode = 192
     25 ; GCN: enable_dx10_clamp = 1
     26 ; GCN: enable_ieee_mode = 1
        ; Attribute group #2 explicitly requests
        ; "-fp32-denormals,+fp64-fp16-denormals". The expected float_mode (192)
        ; is the same value the two default-CPU tests in this file expect.
        ; No target-cpu is set by this attribute group.
        ; The body stores 0.0 through a float and a double addrspace(1) pointer;
        ; only the three mode fields are checked.
     27 define amdgpu_kernel void @test_f64_denormals(float addrspace(1)* %out0, double addrspace(1)* %out1) #2 {
     28   store float 0.0, float addrspace(1)* %out0
     29   store double 0.0, double addrspace(1)* %out1
     30   ret void
     31 }
     32 
     33 ; GCN-LABEL: {{^}}test_f32_denormals:
     34 ; GCN: float_mode = 48
     35 ; GCN: enable_dx10_clamp = 1
     36 ; GCN: enable_ieee_mode = 1
        ; Attribute group #3 requests "+fp32-denormals,-fp64-fp16-denormals",
        ; the inverse of the feature string used by test_f64_denormals.
        ; The expected float_mode changes to 48; dx10 clamp and IEEE mode are
        ; still expected to be enabled.
        ; The body stores 0.0 through a float and a double addrspace(1) pointer;
        ; only the three mode fields are checked.
     37 define amdgpu_kernel void @test_f32_denormals(float addrspace(1)* %out0, double addrspace(1)* %out1) #3 {
     38   store float 0.0, float addrspace(1)* %out0
     39   store double 0.0, double addrspace(1)* %out1
     40   ret void
     41 }
     42 
     43 ; GCN-LABEL: {{^}}test_f32_f64_denormals:
     44 ; GCN: float_mode = 240
     45 ; GCN: enable_dx10_clamp = 1
     46 ; GCN: enable_ieee_mode = 1
        ; Attribute group #4 requests "+fp32-denormals,+fp64-fp16-denormals",
        ; i.e. both denormal features on. The expected float_mode (240) equals
        ; the sum of the fp32-only value (48) and the fp64/fp16-only value (192)
        ; expected by the sibling tests in this file.
        ; The body stores 0.0 through a float and a double addrspace(1) pointer;
        ; only the three mode fields are checked.
     47 define amdgpu_kernel void @test_f32_f64_denormals(float addrspace(1)* %out0, double addrspace(1)* %out1) #4 {
     48   store float 0.0, float addrspace(1)* %out0
     49   store double 0.0, double addrspace(1)* %out1
     50   ret void
     51 }
     52 
     53 ; GCN-LABEL: {{^}}test_no_denormals:
     54 ; GCN: float_mode = 0
     55 ; GCN: enable_dx10_clamp = 1
     56 ; GCN: enable_ieee_mode = 1
        ; Attribute group #5 requests "-fp32-denormals,-fp64-fp16-denormals",
        ; i.e. both denormal features off. The expected float_mode is 0, while
        ; dx10 clamp and IEEE mode are still expected to be enabled.
        ; The body stores 0.0 through a float and a double addrspace(1) pointer;
        ; only the three mode fields are checked.
     57 define amdgpu_kernel void @test_no_denormals(float addrspace(1)* %out0, double addrspace(1)* %out1) #5 {
     58   store float 0.0, float addrspace(1)* %out0
     59   store double 0.0, double addrspace(1)* %out1
     60   ret void
     61 }
     62 
     63 ; GCN-LABEL: {{^}}test_no_dx10_clamp_vi:
     64 ; GCN: float_mode = 192
     65 ; GCN: enable_dx10_clamp = 0
     66 ; GCN: enable_ieee_mode = 1
        ; Attribute group #6 selects target-cpu "fiji" and adds the
        ; "-dx10-clamp" feature. Compared with test_default_vi (same CPU, no
        ; feature override) the only expected difference is
        ; enable_dx10_clamp = 0; float_mode stays 192 and IEEE mode stays on.
        ; The body stores 0.0 through a float and a double addrspace(1) pointer;
        ; only the three mode fields are checked.
     67 define amdgpu_kernel void @test_no_dx10_clamp_vi(float addrspace(1)* %out0, double addrspace(1)* %out1) #6 {
     68   store float 0.0, float addrspace(1)* %out0
     69   store double 0.0, double addrspace(1)* %out1
     70   ret void
     71 }
     72 
     73 attributes #0 = { nounwind "target-cpu"="kaveri" } ; used by test_default_ci: CPU only, no target-features override
     74 attributes #1 = { nounwind "target-cpu"="fiji" } ; used by test_default_vi: CPU only, no target-features override
     75 attributes #2 = { nounwind "target-features"="-fp32-denormals,+fp64-fp16-denormals" } ; used by test_f64_denormals: fp32 denormals off, fp64/fp16 on
     76 attributes #3 = { nounwind "target-features"="+fp32-denormals,-fp64-fp16-denormals" } ; used by test_f32_denormals: fp32 denormals on, fp64/fp16 off
     77 attributes #4 = { nounwind "target-features"="+fp32-denormals,+fp64-fp16-denormals" } ; used by test_f32_f64_denormals: both denormal features on
     78 attributes #5 = { nounwind "target-features"="-fp32-denormals,-fp64-fp16-denormals" } ; used by test_no_denormals: both denormal features off
     79 attributes #6 = { nounwind "target-cpu"="fiji" "target-features"="-dx10-clamp" } ; used by test_no_dx10_clamp_vi: fiji with dx10 clamp disabled
     80