; RUN: llc < %s -relocation-model=static -mcpu=yonah | FileCheck %s

; The double argument is at 4(esp) which is 16-byte aligned, but we
; are required to read in extra bytes of memory in order to fold the
; load. Bad Things may happen when reading/processing undefined bytes,
; so don't fold the load.
; PR22371 / http://reviews.llvm.org/D7474

target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:64:64-v128:128:128-a0:0:64-f80:128:128"
target triple = "i686-apple-darwin8"
@G = external global double

; @test calls fabs on two doubles: one loaded from the global @G (the load is
; marked align 16) and one loaded volatile from field 0 of the byval struct %z
; (align 8). It stores the first result through %P, then stores the sum of
; both results through %P.
;
; The directives at the end of the body expect, in order: a movsd from G into
; an xmm register, an andpd whose pattern starts with an %xmm operand, a movsd
; from 4(%esp) into an xmm register, and another such andpd. In other words,
; each double is loaded with its own movsd before the andpd (presumably the
; lowering of the fabs calls) instead of being folded into it as a memory
; operand.
define void @test({ double, double }* byval %z, double* %P) nounwind {
entry:
  %tmp3 = load double, double* @G, align 16  ; <double> [#uses=1]
  %tmp4 = tail call double @fabs( double %tmp3 ) readnone  ; <double> [#uses=1]
  store volatile double %tmp4, double* %P
  ; Address of the first double inside the byval argument.
  %tmp = getelementptr { double, double }, { double, double }* %z, i32 0, i32 0  ; <double*> [#uses=1]
  %tmp1 = load volatile double, double* %tmp, align 8  ; <double> [#uses=1]
  %tmp2 = tail call double @fabs( double %tmp1 ) readnone  ; <double> [#uses=1]
  %tmp6 = fadd double %tmp4, %tmp2  ; <double> [#uses=1]
  store volatile double %tmp6, double* %P, align 8
  ret void

; CHECK-LABEL: test:
; CHECK: movsd {{.*}}G, %xmm{{.*}}
; CHECK: andpd %xmm{{.*}}, %xmm{{.*}}
; CHECK: movsd 4(%esp), %xmm{{.*}}
; CHECK: andpd %xmm{{.*}}, %xmm{{.*}}


}

; @test2 has an empty body but carries alignstack(16); the expected output
; contains an andl of %esp with the immediate -16.
define void @test2() alignstack(16) nounwind {
entry:
; CHECK-LABEL: test2:
; CHECK: andl{{.*}}$-16, %esp
  ret void
}

; Use a call to force a spill.
; @test3 carries alignstack(32); the expected output contains an andl of %esp
; with the immediate -32. The vector arguments are multiplied after the call
; to @test2.
define <2 x double> @test3(<2 x double> %x, <2 x double> %y) alignstack(32) nounwind {
entry:
; CHECK-LABEL: test3:
; CHECK: andl{{.*}}$-32, %esp
  call void @test2()
  %A = fmul <2 x double> %x, %y
  ret <2 x double> %A
}

; External declaration of fabs, called twice by @test.
declare double @fabs(double)

; The pointer is already known aligned, so and x,-16 is eliminable.
; @test4 allocates a 2048-byte buffer with align 16, converts its address to
; an i32, masks that value with -16 and returns it. The directives after the
; ret expect no text matching "and" between the test4 label and the ret in the
; generated output.
define i32 @test4() nounwind {
entry:
  %buffer = alloca [2048 x i8], align 16
  %0 = ptrtoint [2048 x i8]* %buffer to i32
  ; Masking with -16 clears the low four bits of the address.
  %and = and i32 %0, -16
  ret i32 %and
; CHECK-LABEL: test4:
; CHECK-NOT: and
; CHECK: ret
}