1 ; RUN: llc -mtriple=amdgcn--amdhsa -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s 2 3 ; GCN-LABEL: {{^}}test_default_ci: 4 ; GCN: float_mode = 192 5 ; GCN: enable_dx10_clamp = 1 6 ; GCN: enable_ieee_mode = 1 7 define amdgpu_kernel void @test_default_ci(float addrspace(1)* %out0, double addrspace(1)* %out1) #0 { 8 store float 0.0, float addrspace(1)* %out0 9 store double 0.0, double addrspace(1)* %out1 10 ret void 11 } 12 13 ; GCN-LABEL: {{^}}test_default_vi: 14 ; GCN: float_mode = 192 15 ; GCN: enable_dx10_clamp = 1 16 ; GCN: enable_ieee_mode = 1 17 define amdgpu_kernel void @test_default_vi(float addrspace(1)* %out0, double addrspace(1)* %out1) #1 { 18 store float 0.0, float addrspace(1)* %out0 19 store double 0.0, double addrspace(1)* %out1 20 ret void 21 } 22 23 ; GCN-LABEL: {{^}}test_f64_denormals: 24 ; GCN: float_mode = 192 25 ; GCN: enable_dx10_clamp = 1 26 ; GCN: enable_ieee_mode = 1 27 define amdgpu_kernel void @test_f64_denormals(float addrspace(1)* %out0, double addrspace(1)* %out1) #2 { 28 store float 0.0, float addrspace(1)* %out0 29 store double 0.0, double addrspace(1)* %out1 30 ret void 31 } 32 33 ; GCN-LABEL: {{^}}test_f32_denormals: 34 ; GCN: float_mode = 48 35 ; GCN: enable_dx10_clamp = 1 36 ; GCN: enable_ieee_mode = 1 37 define amdgpu_kernel void @test_f32_denormals(float addrspace(1)* %out0, double addrspace(1)* %out1) #3 { 38 store float 0.0, float addrspace(1)* %out0 39 store double 0.0, double addrspace(1)* %out1 40 ret void 41 } 42 43 ; GCN-LABEL: {{^}}test_f32_f64_denormals: 44 ; GCN: float_mode = 240 45 ; GCN: enable_dx10_clamp = 1 46 ; GCN: enable_ieee_mode = 1 47 define amdgpu_kernel void @test_f32_f64_denormals(float addrspace(1)* %out0, double addrspace(1)* %out1) #4 { 48 store float 0.0, float addrspace(1)* %out0 49 store double 0.0, double addrspace(1)* %out1 50 ret void 51 } 52 53 ; GCN-LABEL: {{^}}test_no_denormals: 54 ; GCN: float_mode = 0 55 ; GCN: enable_dx10_clamp = 1 56 ; GCN: enable_ieee_mode = 1 57 define amdgpu_kernel void @test_no_denormals(float addrspace(1)* %out0, double addrspace(1)* %out1) #5 { 58 store float 0.0, float addrspace(1)* %out0 59 store double 0.0, double addrspace(1)* %out1 60 ret void 61 } 62 63 ; GCN-LABEL: {{^}}test_no_dx10_clamp_vi: 64 ; GCN: float_mode = 192 65 ; GCN: enable_dx10_clamp = 0 66 ; GCN: enable_ieee_mode = 1 67 define amdgpu_kernel void @test_no_dx10_clamp_vi(float addrspace(1)* %out0, double addrspace(1)* %out1) #6 { 68 store float 0.0, float addrspace(1)* %out0 69 store double 0.0, double addrspace(1)* %out1 70 ret void 71 } 72 73 attributes #0 = { nounwind "target-cpu"="kaveri" } 74 attributes #1 = { nounwind "target-cpu"="fiji" } 75 attributes #2 = { nounwind "target-features"="-fp32-denormals,+fp64-fp16-denormals" } 76 attributes #3 = { nounwind "target-features"="+fp32-denormals,-fp64-fp16-denormals" } 77 attributes #4 = { nounwind "target-features"="+fp32-denormals,+fp64-fp16-denormals" } 78 attributes #5 = { nounwind "target-features"="-fp32-denormals,-fp64-fp16-denormals" } 79 attributes #6 = { nounwind "target-cpu"="fiji" "target-features"="-dx10-clamp" } 80