; RUN: llc < %s -relocation-model=static -mcpu=yonah | FileCheck %s

; Rationale for the expectations in @test:
; The double argument is at 4(esp) which is 16-byte aligned, but we
; are required to read in extra bytes of memory in order to fold the
; load. Bad Things may happen when reading/processing undefined bytes,
; so don't fold the load.
; PR22371 / http://reviews.llvm.org/D7474

target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:64:64-v128:128:128-a0:0:64-f80:128:128"
target triple = "i686-apple-darwin8"

; External double that @test loads with an explicit 16-byte alignment.
@G = external global double
| 12 | |
; Takes fabs of two doubles: one loaded from the global @G (align 16) and one
; loaded (volatile) from the first field of the byval struct argument %z.
; The expectations below require each value to be brought into an XMM register
; with movsd and then masked with a register-register andpd, i.e. neither load
; is folded into the andpd as a memory operand.
define void @test({ double, double }* byval %z, double* %P) nounwind {
entry:
  ; fabs(@G), stored through %P.
  %tmp3 = load double, double* @G, align 16
  %tmp4 = tail call double @fabs( double %tmp3 ) readnone
  store volatile double %tmp4, double* %P

  ; fabs(%z.0): the byval argument lives on the stack (matched as 4(%esp)).
  %tmp = getelementptr { double, double }, { double, double }* %z, i32 0, i32 0
  %tmp1 = load volatile double, double* %tmp, align 8
  %tmp2 = tail call double @fabs( double %tmp1 ) readnone

  ; Sum of both absolute values, stored through %P.
  %tmp6 = fadd double %tmp4, %tmp2
  store volatile double %tmp6, double* %P, align 8
  ret void

; CHECK-LABEL: test:
; CHECK: movsd {{.*}}G, %xmm{{.*}}
; CHECK: andpd %xmm{{.*}}, %xmm{{.*}}
; CHECK: movsd 4(%esp), %xmm{{.*}}
; CHECK: andpd %xmm{{.*}}, %xmm{{.*}}
}
| 33 | |
; An otherwise empty function carrying alignstack(16): the generated code is
; expected to mask %esp with -16.
define void @test2() alignstack(16) nounwind {
entry:
; CHECK-LABEL: test2:
; CHECK: andl{{.*}}$-16, %esp
  ret void
}
| 40 | |
; Use a call to force a spill.
; The function carries alignstack(32), so the generated code is expected to
; mask %esp with -32. Both vector arguments are used after the call to @test2.
define <2 x double> @test3(<2 x double> %x, <2 x double> %y) alignstack(32) nounwind {
entry:
; CHECK-LABEL: test3:
; CHECK: andl{{.*}}$-32, %esp
  call void @test2()
  %A = fmul <2 x double> %x, %y
  ret <2 x double> %A
}
| 50 | |
; Absolute-value routine called by @test.
declare double @fabs(double)
Charles Davis | fafdc89 | 2010-02-19 18:17:13 +0000 | [diff] [blame] | 52 | |
; The pointer is already known aligned, so and x,-16 is eliminable.
; %buffer is allocated with align 16, so masking its address with -16 is a
; no-op; the expectations require that no "and" appears before the return.
define i32 @test4() nounwind {
entry:
  %buffer = alloca [2048 x i8], align 16
  %0 = ptrtoint [2048 x i8]* %buffer to i32
  %and = and i32 %0, -16
  ret i32 %and
; CHECK-LABEL: test4:
; CHECK-NOT: and
; CHECK: ret
}
Charles Davis | 3ff19ce | 2016-04-09 23:34:42 +0000 | [diff] [blame^] | 64 | |
; 16-byte aggregate passed byval to @test5.
%struct.sixteen = type { [16 x i8] }

; Accessing stack parameters shouldn't assume stack alignment. Here we should
; emit two 8-byte loads, followed by two 8-byte stores.
; The byval argument is only 4-byte aligned and the local copy is 1-byte
; aligned, while attribute group #0 requests a 16-byte aligned stack.
define x86_stdcallcc void @test5(%struct.sixteen* byval nocapture readonly align 4 %s) #0 {
  %d.sroa.0 = alloca [16 x i8], align 1
  %1 = getelementptr inbounds [16 x i8], [16 x i8]* %d.sroa.0, i32 0, i32 0
  call void @llvm.lifetime.start(i64 16, i8* %1)
  %2 = getelementptr inbounds %struct.sixteen, %struct.sixteen* %s, i32 0, i32 0, i32 0
  ; Volatile (i1 true) 16-byte copy with alignment 1 from the argument into the local.
  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %1, i8* %2, i32 16, i32 1, i1 true)
  call void @llvm.lifetime.end(i64 16, i8* %1)
  ret void
; CHECK-LABEL: test5:
; CHECK: and
; CHECK: movsd
; CHECK-NEXT: movsd
; CHECK-NEXT: movsd
; CHECK-NEXT: movsd
}
| 84 | |
; Intrinsics called by @test5.
declare void @llvm.lifetime.start(i64, i8* nocapture) argmemonly nounwind

declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture readonly, i32, i32, i1) argmemonly nounwind

declare void @llvm.lifetime.end(i64, i8* nocapture) argmemonly nounwind

; Attribute group applied to @test5: 16-byte stack alignment with the
; frame-pointer-elimination string attributes set as shown.
attributes #0 = { nounwind alignstack=16 "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" }