| ; RUN: opt -passes='loop-vectorize' -force-vector-width=2 %s -S -debug 2>&1 | FileCheck %s |
| |
| ; REQUIRES: asserts |
| |
| target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128" |
| |
| ; FIXME |
| ; Test case for PR47751. Make sure the runtime check includes a required |
| ; addition of the size of the element type (a pointer) for the end bound. |
| |
| define void @test(i64 %arg, i32 %arg1, ptr %base) { |
| ; CHECK: LAA: Adding RT check for range: |
| ; CHECK-NEXT: Start: ((8 * (zext i32 (-1 + %arg1)<nsw> to i64))<nuw><nsw> + (8 * (1 smin %arg)) + (-8 * %arg) + %base) |
| ; CHECK-SAME: End: (8 + (8 * (zext i32 (-1 + %arg1)<nsw> to i64))<nuw><nsw> + %base) |
| ; CHECK-NEXT: LAA: Adding RT check for range: |
| ; CHECK-NEXT: Start: ((8 * (1 smin %arg)) + %base) |
| ; CHECK-SAME: End: (8 + (8 * %arg) + %base) |
| |
| ; CHECK: vector.body |
| |
| entry: |
| br label %loop |
| |
| loop: |
| %iv.1 = phi i64 [ %arg, %entry ], [ %iv.1.next, %loop ] |
| %iv.2 = phi i32 [ %arg1, %entry ], [ %iv.2.next, %loop ] |
| %iv.2.next = add nsw i32 %iv.2, -1 |
| %iv.2.ext = zext i32 %iv.2.next to i64 |
| %idx.1 = getelementptr inbounds ptr, ptr %base, i64 %iv.2.ext |
| %v.1 = load ptr, ptr %idx.1, align 8 |
| %idx.2 = getelementptr inbounds ptr, ptr %base, i64 %iv.1 |
| %v.2 = load ptr, ptr %idx.2, align 8 |
| store ptr %v.2, ptr %idx.1, align 8 |
| store ptr %v.1, ptr %idx.2, align 8 |
| %tmp11 = icmp sgt i64 %iv.1, 1 |
| %iv.1.next = add nsw i64 %iv.1, -1 |
| br i1 %tmp11, label %loop, label %exit |
| |
| exit: ; preds = %bb3 |
| ret void |
| } |