| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc < %s -mtriple=i686-apple-darwin -mattr=+sse2 | FileCheck %s |
| ; PR1501 |
| |
; foo: returns the float sum of sitofp(x[i]) * y[i] for i = 0 .. %c-1, or 0.0
; when %c is 0.
; The loop bound %umax is a select between 1 and %c keyed on (%c == 0). The
; autogenerated assertions below expect the loop exit test to be emitted as an
; unsigned compare (cmpl + jb) of the counter against the same register that
; was tested for zero at entry, and the result to be returned by storing xmm0
; to the stack and reloading it with flds.
; NOTE(review): the PR1501 tag at the top of the file presumably refers to
; this select/exit-compare pattern -- confirm against the bug report.
| define float @foo(i32* %x, float* %y, i32 %c) nounwind { |
| ; CHECK-LABEL: foo: |
| ; CHECK: ## %bb.0: ## %entry |
| ; CHECK-NEXT: pushl %esi |
| ; CHECK-NEXT: pushl %eax |
| ; CHECK-NEXT: movl {{[0-9]+}}(%esp), %eax |
| ; CHECK-NEXT: testl %eax, %eax |
| ; CHECK-NEXT: je LBB0_1 |
| ; CHECK-NEXT: ## %bb.2: ## %bb.preheader |
| ; CHECK-NEXT: movl {{[0-9]+}}(%esp), %ecx |
| ; CHECK-NEXT: movl {{[0-9]+}}(%esp), %edx |
| ; CHECK-NEXT: xorps %xmm0, %xmm0 |
| ; CHECK-NEXT: xorl %esi, %esi |
| ; CHECK-NEXT: .p2align 4, 0x90 |
| ; CHECK-NEXT: LBB0_3: ## %bb |
| ; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1 |
| ; CHECK-NEXT: xorps %xmm1, %xmm1 |
| ; CHECK-NEXT: cvtsi2ssl (%edx,%esi,4), %xmm1 |
| ; CHECK-NEXT: mulss (%ecx,%esi,4), %xmm1 |
| ; CHECK-NEXT: addss %xmm1, %xmm0 |
| ; CHECK-NEXT: incl %esi |
| ; CHECK-NEXT: cmpl %eax, %esi |
| ; CHECK-NEXT: jb LBB0_3 |
| ; CHECK-NEXT: jmp LBB0_4 |
| ; CHECK-NEXT: LBB0_1: |
| ; CHECK-NEXT: xorps %xmm0, %xmm0 |
| ; CHECK-NEXT: LBB0_4: ## %bb23 |
| ; CHECK-NEXT: movss %xmm0, (%esp) |
| ; CHECK-NEXT: flds (%esp) |
| ; CHECK-NEXT: addl $4, %esp |
| ; CHECK-NEXT: popl %esi |
| ; CHECK-NEXT: retl |
; Entry: skip the loop entirely when %c is zero; bb23 then yields 0.0.
| entry: |
| %tmp2132 = icmp eq i32 %c, 0 ; <i1> [#uses=2] |
| br i1 %tmp2132, label %bb23, label %bb.preheader |
| |
; Preheader: only reached when %tmp2132 is false, so the select below
; evaluates to %c on this path.
| bb.preheader: ; preds = %entry |
| %umax = select i1 %tmp2132, i32 1, i32 %c ; <i32> [#uses=1] |
| br label %bb |
| |
; Loop body: %i.0.reg2mem.0 counts up from 0 and %res.0.reg2mem.0 carries the
; running sum. Each iteration adds y[i] * (float)x[i] and exits once i+1
; equals %umax.
| bb: ; preds = %bb, %bb.preheader |
| %i.0.reg2mem.0 = phi i32 [ 0, %bb.preheader ], [ %indvar.next, %bb ] ; <i32> [#uses=3] |
| %res.0.reg2mem.0 = phi float [ 0.000000e+00, %bb.preheader ], [ %tmp14, %bb ] ; <float> [#uses=1] |
| %tmp3 = getelementptr i32, i32* %x, i32 %i.0.reg2mem.0 ; <i32*> [#uses=1] |
| %tmp4 = load i32, i32* %tmp3, align 4 ; <i32> [#uses=1] |
| %tmp45 = sitofp i32 %tmp4 to float ; <float> [#uses=1] |
| %tmp8 = getelementptr float, float* %y, i32 %i.0.reg2mem.0 ; <float*> [#uses=1] |
| %tmp9 = load float, float* %tmp8, align 4 ; <float> [#uses=1] |
| %tmp11 = fmul float %tmp9, %tmp45 ; <float> [#uses=1] |
| %tmp14 = fadd float %tmp11, %res.0.reg2mem.0 ; <float> [#uses=2] |
| %indvar.next = add i32 %i.0.reg2mem.0, 1 ; <i32> [#uses=2] |
| %exitcond = icmp eq i32 %indvar.next, %umax ; <i1> [#uses=1] |
| br i1 %exitcond, label %bb23, label %bb |
| |
; Merge point: 0.0 when arriving from the early exit in entry, otherwise the
; final accumulated sum from the loop.
| bb23: ; preds = %bb, %entry |
| %res.0.reg2mem.1 = phi float [ 0.000000e+00, %entry ], [ %tmp14, %bb ] ; <float> [#uses=1] |
| ret float %res.0.reg2mem.1 |
| } |