1 ; RUN: opt -S -instcombine %s -o - | FileCheck %s 2 target datalayout = "e-p:32:32:32-p1:64:64:64-p2:8:8:8-p3:16:16:16-p4:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:32" 3 4 @g = addrspace(3) global i32 89 5 6 @const_zero_i8_as1 = addrspace(1) constant i8 0 7 @const_zero_i32_as1 = addrspace(1) constant i32 0 8 9 @const_zero_i8_as2 = addrspace(2) constant i8 0 10 @const_zero_i32_as2 = addrspace(2) constant i32 0 11 12 @const_zero_i8_as3 = addrspace(3) constant i8 0 13 @const_zero_i32_as3 = addrspace(3) constant i32 0 14 15 ; Test constant folding of inttoptr (ptrtoint constantexpr) 16 ; The intermediate integer size is the same as the pointer size 17 define i32 addrspace(3)* @test_constant_fold_inttoptr_as_pointer_same_size() { 18 ; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_same_size( 19 ; CHECK-NEXT: ret i32 addrspace(3)* @const_zero_i32_as3 20 %x = ptrtoint i32 addrspace(3)* @const_zero_i32_as3 to i32 21 %y = inttoptr i32 %x to i32 addrspace(3)* 22 ret i32 addrspace(3)* %y 23 } 24 25 ; The intermediate integer size is larger than the pointer size 26 define i32 addrspace(2)* @test_constant_fold_inttoptr_as_pointer_smaller() { 27 ; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_smaller( 28 ; CHECK-NEXT: ret i32 addrspace(2)* @const_zero_i32_as2 29 %x = ptrtoint i32 addrspace(2)* @const_zero_i32_as2 to i16 30 %y = inttoptr i16 %x to i32 addrspace(2)* 31 ret i32 addrspace(2)* %y 32 } 33 34 ; Different address spaces that are the same size, but they are 35 ; different so nothing should happen 36 define i32 addrspace(4)* @test_constant_fold_inttoptr_as_pointer_smaller_different_as() { 37 ; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_smaller_different_as( 38 ; CHECK-NEXT: ret i32 addrspace(4)* inttoptr (i16 ptrtoint (i32 addrspace(3)* @const_zero_i32_as3 to i16) to i32 addrspace(4)*) 39 %x = ptrtoint i32 addrspace(3)* @const_zero_i32_as3 to i16 40 %y = inttoptr i16 %x to i32 addrspace(4)* 41 ret i32 addrspace(4)* %y 42 } 43 44 ; Make sure we don't introduce a bitcast between different sized 45 ; address spaces when folding this 46 define i32 addrspace(2)* @test_constant_fold_inttoptr_as_pointer_smaller_different_size_as() { 47 ; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_smaller_different_size_as( 48 ; CHECK-NEXT: ret i32 addrspace(2)* inttoptr (i32 ptrtoint (i32 addrspace(3)* @const_zero_i32_as3 to i32) to i32 addrspace(2)*) 49 %x = ptrtoint i32 addrspace(3)* @const_zero_i32_as3 to i32 50 %y = inttoptr i32 %x to i32 addrspace(2)* 51 ret i32 addrspace(2)* %y 52 } 53 54 ; The intermediate integer size is too small, nothing should happen 55 define i32 addrspace(3)* @test_constant_fold_inttoptr_as_pointer_larger() { 56 ; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_larger( 57 ; CHECK-NEXT: ret i32 addrspace(3)* inttoptr (i8 ptrtoint (i32 addrspace(3)* @const_zero_i32_as3 to i8) to i32 addrspace(3)*) 58 %x = ptrtoint i32 addrspace(3)* @const_zero_i32_as3 to i8 59 %y = inttoptr i8 %x to i32 addrspace(3)* 60 ret i32 addrspace(3)* %y 61 } 62 63 define i8 @const_fold_ptrtoint() { 64 ; CHECK-LABEL: @const_fold_ptrtoint( 65 ; CHECK-NEXT: ret i8 4 66 ret i8 ptrtoint (i32 addrspace(2)* inttoptr (i4 4 to i32 addrspace(2)*) to i8) 67 } 68 69 ; Test that mask happens when the destination pointer is smaller than 70 ; the original 71 define i8 @const_fold_ptrtoint_mask() { 72 ; CHECK-LABEL: @const_fold_ptrtoint_mask( 73 ; CHECK-NEXT: ret i8 1 74 ret i8 ptrtoint (i32 addrspace(3)* inttoptr (i32 257 to i32 addrspace(3)*) to i8) 75 } 76 77 ; Address space 0 is too small for the correct mask, should mask with 78 ; 64-bits instead of 32 79 define i64 @const_fold_ptrtoint_mask_small_as0() { 80 ; CHECK-LABEL: @const_fold_ptrtoint_mask_small_as0( 81 ; CHECK: ret i64 -1 82 ret i64 ptrtoint (i32 addrspace(1)* inttoptr (i128 -1 to i32 addrspace(1)*) to i64) 83 } 84 85 define i32 addrspace(3)* @const_inttoptr() { 86 ; CHECK-LABEL: @const_inttoptr( 87 ; CHECK-NEXT: ret i32 addrspace(3)* inttoptr (i16 4 to i32 addrspace(3)*) 88 %p = inttoptr i16 4 to i32 addrspace(3)* 89 ret i32 addrspace(3)* %p 90 } 91 92 define i16 @const_ptrtoint() { 93 ; CHECK-LABEL: @const_ptrtoint( 94 ; CHECK-NEXT: ret i16 ptrtoint (i32 addrspace(3)* @g to i16) 95 %i = ptrtoint i32 addrspace(3)* @g to i16 96 ret i16 %i 97 } 98 99 define i16 @const_inttoptr_ptrtoint() { 100 ; CHECK-LABEL: @const_inttoptr_ptrtoint( 101 ; CHECK-NEXT: ret i16 9 102 ret i16 ptrtoint (i32 addrspace(3)* inttoptr (i16 9 to i32 addrspace(3)*) to i16) 103 } 104 105 define i1 @constant_fold_cmp_constantexpr_inttoptr() { 106 ; CHECK-LABEL: @constant_fold_cmp_constantexpr_inttoptr( 107 ; CHECK-NEXT: ret i1 true 108 %x = icmp eq i32 addrspace(3)* inttoptr (i16 0 to i32 addrspace(3)*), null 109 ret i1 %x 110 } 111 112 define i1 @constant_fold_inttoptr_null(i16 %i) { 113 ; CHECK-LABEL: @constant_fold_inttoptr_null( 114 ; CHECK-NEXT: ret i1 false 115 %x = icmp eq i32 addrspace(3)* inttoptr (i16 99 to i32 addrspace(3)*), inttoptr (i16 0 to i32 addrspace(3)*) 116 ret i1 %x 117 } 118 119 define i1 @constant_fold_ptrtoint_null() { 120 ; CHECK-LABEL: @constant_fold_ptrtoint_null( 121 ; CHECK-NEXT: ret i1 false 122 %x = icmp eq i16 ptrtoint (i32 addrspace(3)* @g to i16), ptrtoint (i32 addrspace(3)* null to i16) 123 ret i1 %x 124 } 125 126 define i1 @constant_fold_ptrtoint_null_2() { 127 ; CHECK-LABEL: @constant_fold_ptrtoint_null_2( 128 ; CHECK-NEXT: ret i1 false 129 %x = icmp eq i16 ptrtoint (i32 addrspace(3)* null to i16), ptrtoint (i32 addrspace(3)* @g to i16) 130 ret i1 %x 131 } 132 133 define i1 @constant_fold_ptrtoint() { 134 ; CHECK-LABEL: @constant_fold_ptrtoint( 135 ; CHECK-NEXT: ret i1 true 136 %x = icmp eq i16 ptrtoint (i32 addrspace(3)* @g to i16), ptrtoint (i32 addrspace(3)* @g to i16) 137 ret i1 %x 138 } 139 140 define i1 @constant_fold_inttoptr() { 141 ; CHECK-LABEL: @constant_fold_inttoptr( 142 ; CHECK-NEXT: ret i1 false 143 %x = icmp eq i32 addrspace(3)* inttoptr (i16 99 to i32 addrspace(3)*), inttoptr (i16 27 to i32 addrspace(3)*) 144 ret i1 %x 145 } 146 147 @g_float_as3 = addrspace(3) global float zeroinitializer 148 @g_v4f_as3 = addrspace(3) global <4 x float> zeroinitializer 149 150 define float @constant_fold_bitcast_ftoi_load() { 151 ; CHECK-LABEL: @constant_fold_bitcast_ftoi_load( 152 ; CHECK: load float addrspace(3)* bitcast (i32 addrspace(3)* @g to float addrspace(3)*), align 4 153 %a = load float addrspace(3)* bitcast (i32 addrspace(3)* @g to float addrspace(3)*), align 4 154 ret float %a 155 } 156 157 define i32 @constant_fold_bitcast_itof_load() { 158 ; CHECK-LABEL: @constant_fold_bitcast_itof_load( 159 ; CHECK: load i32 addrspace(3)* bitcast (float addrspace(3)* @g_float_as3 to i32 addrspace(3)*), align 4 160 %a = load i32 addrspace(3)* bitcast (float addrspace(3)* @g_float_as3 to i32 addrspace(3)*), align 4 161 ret i32 %a 162 } 163 164 define <4 x i32> @constant_fold_bitcast_vector_as() { 165 ; CHECK-LABEL: @constant_fold_bitcast_vector_as( 166 ; CHECK: load <4 x float> addrspace(3)* @g_v4f_as3, align 16 167 ; CHECK: bitcast <4 x float> %1 to <4 x i32> 168 %a = load <4 x i32> addrspace(3)* bitcast (<4 x float> addrspace(3)* @g_v4f_as3 to <4 x i32> addrspace(3)*), align 4 169 ret <4 x i32> %a 170 } 171 172 @i32_array_as3 = addrspace(3) global [10 x i32] zeroinitializer 173 174 define i32 @test_cast_gep_small_indices_as() { 175 ; CHECK-LABEL: @test_cast_gep_small_indices_as( 176 ; CHECK: load i32 addrspace(3)* getelementptr inbounds ([10 x i32] addrspace(3)* @i32_array_as3, i16 0, i16 0), align 16 177 %p = getelementptr [10 x i32] addrspace(3)* @i32_array_as3, i7 0, i7 0 178 %x = load i32 addrspace(3)* %p, align 4 179 ret i32 %x 180 } 181 182 %struct.foo = type { float, float, [4 x i32], i32 addrspace(3)* } 183 184 @constant_fold_global_ptr = addrspace(3) global %struct.foo { 185 float 0.0, 186 float 0.0, 187 [4 x i32] zeroinitializer, 188 i32 addrspace(3)* getelementptr ([10 x i32] addrspace(3)* @i32_array_as3, i64 0, i64 0) 189 } 190 191 define i32 @test_cast_gep_large_indices_as() { 192 ; CHECK-LABEL: @test_cast_gep_large_indices_as( 193 ; CHECK: load i32 addrspace(3)* getelementptr inbounds ([10 x i32] addrspace(3)* @i32_array_as3, i16 0, i16 0), align 16 194 %p = getelementptr [10 x i32] addrspace(3)* @i32_array_as3, i64 0, i64 0 195 %x = load i32 addrspace(3)* %p, align 4 196 ret i32 %x 197 } 198 199 define i32 @test_constant_cast_gep_struct_indices_as() { 200 ; CHECK-LABEL: @test_constant_cast_gep_struct_indices_as( 201 ; CHECK: load i32 addrspace(3)* getelementptr inbounds (%struct.foo addrspace(3)* @constant_fold_global_ptr, i16 0, i32 2, i16 2), align 8 202 %x = getelementptr %struct.foo addrspace(3)* @constant_fold_global_ptr, i18 0, i32 2, i12 2 203 %y = load i32 addrspace(3)* %x, align 4 204 ret i32 %y 205 } 206 207 @constant_data_as3 = addrspace(3) constant [5 x i32] [i32 1, i32 2, i32 3, i32 4, i32 5] 208 209 define i32 @test_read_data_from_global_as3() { 210 ; CHECK-LABEL: @test_read_data_from_global_as3( 211 ; CHECK-NEXT: ret i32 2 212 %x = getelementptr [5 x i32] addrspace(3)* @constant_data_as3, i32 0, i32 1 213 %y = load i32 addrspace(3)* %x, align 4 214 ret i32 %y 215 } 216 217 @a = addrspace(1) constant i32 9 218 @b = addrspace(1) constant i32 23 219 @c = addrspace(1) constant i32 34 220 @d = addrspace(1) constant i32 99 221 222 @ptr_array = addrspace(2) constant [4 x i32 addrspace(1)*] [ i32 addrspace(1)* @a, i32 addrspace(1)* @b, i32 addrspace(1)* @c, i32 addrspace(1)* @d] 223 @indirect = addrspace(0) constant i32 addrspace(1)* addrspace(2)* getelementptr inbounds ([4 x i32 addrspace(1)*] addrspace(2)* @ptr_array, i1 0, i32 2) 224 225 define i32 @constant_through_array_as_ptrs() { 226 ; CHECK-LABEL: @constant_through_array_as_ptrs( 227 ; CHECK-NEXT: ret i32 34 228 %p = load i32 addrspace(1)* addrspace(2)* addrspace(0)* @indirect, align 4 229 %a = load i32 addrspace(1)* addrspace(2)* %p, align 4 230 %b = load i32 addrspace(1)* %a, align 4 231 ret i32 %b 232 } 233 234 @shared_mem = external addrspace(3) global [0 x i8] 235 236 define float @canonicalize_addrspacecast(i32 %i) { 237 ; CHECK-LABEL: @canonicalize_addrspacecast 238 ; CHECK-NEXT: getelementptr inbounds float* addrspacecast (float addrspace(3)* bitcast ([0 x i8] addrspace(3)* @shared_mem to float addrspace(3)*) to float*), i32 %i 239 %p = getelementptr inbounds float* addrspacecast ([0 x i8] addrspace(3)* @shared_mem to float*), i32 %i 240 %v = load float* %p 241 ret float %v 242 } 243