blob: 04bae023984f13b13871b4470685d8e6b2993821 [file] [log] [blame]
Bill Wendling810417d2013-08-01 21:42:05 +00001; RUN: llc < %s -relocation-model=static -mcpu=yonah | FileCheck %s
Chris Lattnerf6480ec2008-01-26 19:45:50 +00002
Sanjay Patelbd08b6b2015-02-17 20:08:21 +00003; The double argument is at 4(esp) which is 16-byte aligned, but we
4; are required to read in extra bytes of memory in order to fold the
5; load. Bad Things may happen when reading/processing undefined bytes,
6; so don't fold the load.
7; PR22371 / http://reviews.llvm.org/D7474
Chris Lattnerf6480ec2008-01-26 19:45:50 +00008
; Module-level setup: a little-endian data layout with 32-bit pointers, the
; i686-apple-darwin8 target triple, and the external double @G read by @test.
9target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:64:64-v128:128:128-a0:0:64-f80:128:128"
10target triple = "i686-apple-darwin8"
11@G = external global double
12
; @test takes a byval { double, double } aggregate %z and a double pointer %P.
; It loads @G (align 16), takes fabs of it and volatile-stores the result to
; %P; it then volatile-loads the first field of %z, takes fabs of that, adds
; the two fabs results, and volatile-stores the sum to %P.
; The directives at the end of the body expect each fabs to appear as a movsd
; load into an xmm register followed by a register-to-register andpd, with the
; byval field read from 4(%esp) rather than folded into the andpd.
Chris Lattner18ca2172011-02-13 22:25:43 +000013define void @test({ double, double }* byval %z, double* %P) nounwind {
Chris Lattnerf6480ec2008-01-26 19:45:50 +000014entry:
David Blaikie7a1e2bf2015-02-27 21:17:42 +000015 %tmp3 = load double, double* @G, align 16 ; <double> [#uses=1]
Bob Wilson664b48c2012-08-03 23:29:17 +000016 %tmp4 = tail call double @fabs( double %tmp3 ) readnone ; <double> [#uses=1]
Chris Lattnerec474ed2011-11-27 06:54:59 +000017 store volatile double %tmp4, double* %P
David Blaikie80b000c2015-02-27 19:29:02 +000018 %tmp = getelementptr { double, double }, { double, double }* %z, i32 0, i32 0 ; <double*> [#uses=1]
David Blaikie7a1e2bf2015-02-27 21:17:42 +000019 %tmp1 = load volatile double, double* %tmp, align 8 ; <double> [#uses=1]
Bob Wilson664b48c2012-08-03 23:29:17 +000020 %tmp2 = tail call double @fabs( double %tmp1 ) readnone ; <double> [#uses=1]
Dan Gohman84cf78f2009-06-04 22:49:04 +000021 %tmp6 = fadd double %tmp4, %tmp2 ; <double> [#uses=1]
Chris Lattnerec474ed2011-11-27 06:54:59 +000022 store volatile double %tmp6, double* %P, align 8
Chris Lattnerf6480ec2008-01-26 19:45:50 +000023 ret void
Sanjay Patelbd08b6b2015-02-17 20:08:21 +000024
25; CHECK-LABEL: test:
26; CHECK: movsd {{.*}}G, %xmm{{.*}}
27; CHECK: andpd %xmm{{.*}}, %xmm{{.*}}
28; CHECK: movsd 4(%esp), %xmm{{.*}}
29; CHECK: andpd %xmm{{.*}}, %xmm{{.*}}
30
31
Chris Lattnerf6480ec2008-01-26 19:45:50 +000032}
33
; @test2 is an empty function whose only notable property is alignstack(16).
; The directives in its body expect an andl with $-16 applied to %esp.
Chris Lattner18ca2172011-02-13 22:25:43 +000034define void @test2() alignstack(16) nounwind {
Charles Davisfafdc892010-02-19 18:17:13 +000035entry:
Sanjay Patelbd08b6b2015-02-17 20:08:21 +000036; CHECK-LABEL: test2:
37; CHECK: andl{{.*}}$-16, %esp
Charles Davisfafdc892010-02-19 18:17:13 +000038 ret void
39}
40
41; Use a call to force a spill.
; @test3 is marked alignstack(32). It calls @test2 and then returns the
; element-wise product of its two <2 x double> arguments. The directives in
; its body expect an andl with $-32 applied to %esp.
Chris Lattner18ca2172011-02-13 22:25:43 +000042define <2 x double> @test3(<2 x double> %x, <2 x double> %y) alignstack(32) nounwind {
Charles Davisfafdc892010-02-19 18:17:13 +000043entry:
Sanjay Patelbd08b6b2015-02-17 20:08:21 +000044; CHECK-LABEL: test3:
45; CHECK: andl{{.*}}$-32, %esp
Charles Davisfafdc892010-02-19 18:17:13 +000046 call void @test2()
Dan Gohman0b79c7d2010-05-03 22:36:46 +000047 %A = fmul <2 x double> %x, %y
Charles Davisfafdc892010-02-19 18:17:13 +000048 ret <2 x double> %A
49}
50
; External fabs(double); @test calls it twice with the readnone attribute.
Chris Lattnerf6480ec2008-01-26 19:45:50 +000051declare double @fabs(double)
Charles Davisfafdc892010-02-19 18:17:13 +000052
Chris Lattner18ca2172011-02-13 22:25:43 +000053; The pointer is already known to be 16-byte aligned, so the "and x, -16" can be eliminated.
; @test4 allocates a [2048 x i8] buffer with align 16, converts its address to
; i32, masks that value with -16, and returns the result. The directives at
; the end of the body require that no "and" is emitted before the ret.
54define i32 @test4() nounwind {
55entry:
56 %buffer = alloca [2048 x i8], align 16
57 %0 = ptrtoint [2048 x i8]* %buffer to i32
58 %and = and i32 %0, -16
59 ret i32 %and
Stephen Lin5fc363e2013-07-13 20:38:47 +000060; CHECK-LABEL: test4:
Chris Lattner18ca2172011-02-13 22:25:43 +000061; CHECK-NOT: and
62; CHECK: ret
63}
Charles Davis3ff19ce2016-04-09 23:34:42 +000064
; Aggregate wrapping a single [16 x i8] array; @test5 receives it byval.
65%struct.sixteen = type { [16 x i8] }
66
67; Accessing stack parameters shouldn't assume stack alignment. Here we should
68; emit two 8-byte loads, followed by two 8-byte stores.
; @test5 is an x86_stdcallcc function taking a %struct.sixteen byval with
; align 4 and using attribute group #0. It copies the 16 argument bytes into a
; local align-1 alloca via llvm.memcpy (alignment operand 1, final i1 operand
; true, i.e. the volatile flag of this five-operand memcpy form), bracketed by
; lifetime.start / lifetime.end markers on the local buffer.
; The directives at the end of the body expect an "and" followed by four
; consecutive movsd instructions.
69define x86_stdcallcc void @test5(%struct.sixteen* byval nocapture readonly align 4 %s) #0 {
70 %d.sroa.0 = alloca [16 x i8], align 1
71 %1 = getelementptr inbounds [16 x i8], [16 x i8]* %d.sroa.0, i32 0, i32 0
72 call void @llvm.lifetime.start(i64 16, i8* %1)
73 %2 = getelementptr inbounds %struct.sixteen, %struct.sixteen* %s, i32 0, i32 0, i32 0
74 call void @llvm.memcpy.p0i8.p0i8.i32(i8* %1, i8* %2, i32 16, i32 1, i1 true)
75 call void @llvm.lifetime.end(i64 16, i8* %1)
76 ret void
77; CHECK-LABEL: test5:
78; CHECK: and
79; CHECK-NEXT: movsd
80; CHECK-NEXT: movsd
81; CHECK-NEXT: movsd
82; CHECK-NEXT: movsd
83}
84
; Declarations of the intrinsics called by @test5: the lifetime markers and
; the i32-length memcpy with explicit alignment and volatile operands.
85declare void @llvm.lifetime.start(i64, i8* nocapture) argmemonly nounwind
86
87declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture readonly, i32, i32, i1) argmemonly nounwind
88
89declare void @llvm.lifetime.end(i64, i8* nocapture) argmemonly nounwind
90
; Attribute group #0, referenced by @test5: nounwind, a 16-byte stack
; alignment request, and the string attributes that disable frame-pointer
; elimination.
91attributes #0 = { nounwind alignstack=16 "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" }