| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --function-signature |
| ; RUN: opt < %s -basic-aa -globals-aa -memcpyopt -S -verify-memoryssa | FileCheck %s |
| |
| target datalayout = "e" |
| |
| ; External callee used by the tests below. Its pointer parameter carries no |
| ; nocapture attribute. |
| declare void @foo(i8*) |
| ; Intrinsics used by the tests. Each declares its pointer operands nocapture. |
| declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i1) nounwind |
| declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) |
| declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) |
| |
| ; Check that the transformation isn't applied if the called function can |
| ; capture the pointer argument (i.e. the nocapture attribute isn't present). |
| ; @foo is called on %ptr2 before the memcpy and on %ptr1 after it; the |
| ; expected output keeps both calls and the memcpy exactly as in the input. |
| define void @test() { |
| ; CHECK-LABEL: define {{[^@]+}}@test() { |
| ; CHECK-NEXT: [[PTR1:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: [[PTR2:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: call void @foo(i8* [[PTR2]]) |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[PTR1]], i8* [[PTR2]], i32 1, i1 false) |
| ; CHECK-NEXT: call void @foo(i8* [[PTR1]]) |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr1 = alloca i8 |
| %ptr2 = alloca i8 |
| call void @foo(i8* %ptr2) |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr1, i8* %ptr2, i32 1, i1 false) |
| call void @foo(i8* %ptr1) |
| ret void |
| } |
| |
| ; Same as @test, but with a bitcasted argument: the allocas are [2 x i8] and |
| ; reach @foo and the memcpy (size 2) through i8* bitcasts. The expected |
| ; output is again identical to the input. |
| define void @test_bitcast() { |
| ; CHECK-LABEL: define {{[^@]+}}@test_bitcast() { |
| ; CHECK-NEXT: [[PTR1:%.*]] = alloca [2 x i8], align 1 |
| ; CHECK-NEXT: [[PTR2:%.*]] = alloca [2 x i8], align 1 |
| ; CHECK-NEXT: [[PTR1_CAST:%.*]] = bitcast [2 x i8]* [[PTR1]] to i8* |
| ; CHECK-NEXT: [[PTR2_CAST:%.*]] = bitcast [2 x i8]* [[PTR2]] to i8* |
| ; CHECK-NEXT: call void @foo(i8* [[PTR2_CAST]]) |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[PTR1_CAST]], i8* [[PTR2_CAST]], i32 2, i1 false) |
| ; CHECK-NEXT: call void @foo(i8* [[PTR1_CAST]]) |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr1 = alloca [2 x i8] |
| %ptr2 = alloca [2 x i8] |
| %ptr1.cast = bitcast [2 x i8]* %ptr1 to i8* |
| %ptr2.cast = bitcast [2 x i8]* %ptr2 to i8* |
| call void @foo(i8* %ptr2.cast) |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr1.cast, i8* %ptr2.cast, i32 2, i1 false) |
| call void @foo(i8* %ptr1.cast) |
| ret void |
| } |
| |
| ; Lifetime of %ptr2 ends before the potential use of the capture in the second |
| ; call. The expected output drops the memcpy and passes %ptr1 to the first |
| ; @foo call in place of %ptr2; the lifetime markers on %ptr2 remain. |
| define void @test_lifetime_end() { |
| ; CHECK-LABEL: define {{[^@]+}}@test_lifetime_end() { |
| ; CHECK-NEXT: [[PTR1:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: [[PTR2:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: call void @llvm.lifetime.start.p0i8(i64 1, i8* [[PTR2]]) |
| ; CHECK-NEXT: call void @foo(i8* [[PTR1]]) |
| ; CHECK-NEXT: call void @llvm.lifetime.end.p0i8(i64 1, i8* [[PTR2]]) |
| ; CHECK-NEXT: call void @foo(i8* [[PTR1]]) |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr1 = alloca i8 |
| %ptr2 = alloca i8 |
| call void @llvm.lifetime.start.p0i8(i64 1, i8* %ptr2) |
| call void @foo(i8* %ptr2) |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr1, i8* %ptr2, i32 1, i1 false) |
| call void @llvm.lifetime.end.p0i8(i64 1, i8* %ptr2) |
| call void @foo(i8* %ptr1) |
| ret void |
| } |
| |
| ; Lifetime of %ptr2 does not end, because of size mismatch: lifetime.end is |
| ; called with size 0, whereas lifetime.start uses size 1 for the i8 alloca. |
| ; The expected output is identical to the input (memcpy kept). |
| define void @test_lifetime_not_end() { |
| ; CHECK-LABEL: define {{[^@]+}}@test_lifetime_not_end() { |
| ; CHECK-NEXT: [[PTR1:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: [[PTR2:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: call void @llvm.lifetime.start.p0i8(i64 1, i8* [[PTR2]]) |
| ; CHECK-NEXT: call void @foo(i8* [[PTR2]]) |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[PTR1]], i8* [[PTR2]], i32 1, i1 false) |
| ; CHECK-NEXT: call void @llvm.lifetime.end.p0i8(i64 0, i8* [[PTR2]]) |
| ; CHECK-NEXT: call void @foo(i8* [[PTR1]]) |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr1 = alloca i8 |
| %ptr2 = alloca i8 |
| call void @llvm.lifetime.start.p0i8(i64 1, i8* %ptr2) |
| call void @foo(i8* %ptr2) |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr1, i8* %ptr2, i32 1, i1 false) |
| call void @llvm.lifetime.end.p0i8(i64 0, i8* %ptr2) |
| call void @foo(i8* %ptr1) |
| ret void |
| } |
| |
| ; Lifetime of %ptr2 ends before any potential use of the capture because we |
| ; return from the function. The expected output drops the memcpy and calls |
| ; @foo on %ptr1 instead of %ptr2. |
| define void @test_function_end() { |
| ; CHECK-LABEL: define {{[^@]+}}@test_function_end() { |
| ; CHECK-NEXT: [[PTR1:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: [[PTR2:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: call void @foo(i8* [[PTR1]]) |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr1 = alloca i8 |
| %ptr2 = alloca i8 |
| call void @foo(i8* %ptr2) |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr1, i8* %ptr2, i32 1, i1 false) |
| ret void |
| } |
| |
| ; A potential use of the capture occurs in a later block, can't be optimized. |
| ; The second @foo call (on %ptr1) lives in %next, which is reached by the |
| ; unconditional branch that follows the memcpy. |
| define void @test_terminator() { |
| ; CHECK-LABEL: define {{[^@]+}}@test_terminator() { |
| ; CHECK-NEXT: [[PTR1:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: [[PTR2:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: call void @foo(i8* [[PTR2]]) |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[PTR1]], i8* [[PTR2]], i32 1, i1 false) |
| ; CHECK-NEXT: br label [[NEXT:%.*]] |
| ; CHECK: next: |
| ; CHECK-NEXT: call void @foo(i8* [[PTR1]]) |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr1 = alloca i8 |
| %ptr2 = alloca i8 |
| call void @foo(i8* %ptr2) |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr1, i8* %ptr2, i32 1, i1 false) |
| br label %next |
| |
| next: |
| call void @foo(i8* %ptr1) |
| ret void |
| } |
| |
| ; This case can be optimized, but would require a scan across multiple blocks |
| ; and is currently not performed. %next contains only the return, yet the |
| ; expected output still keeps the memcpy and the @foo call on %ptr2. |
| define void @test_terminator2() { |
| ; CHECK-LABEL: define {{[^@]+}}@test_terminator2() { |
| ; CHECK-NEXT: [[PTR1:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: [[PTR2:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: call void @foo(i8* [[PTR2]]) |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[PTR1]], i8* [[PTR2]], i32 1, i1 false) |
| ; CHECK-NEXT: br label [[NEXT:%.*]] |
| ; CHECK: next: |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr1 = alloca i8 |
| %ptr2 = alloca i8 |
| call void @foo(i8* %ptr2) |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr1, i8* %ptr2, i32 1, i1 false) |
| br label %next |
| |
| next: |
| ret void |
| } |
| |
| ; External function whose pointer parameter has no nocapture attribute; it is |
| ; called on the memcpy destination in @test_dest_captured_before_alloca. |
| declare void @capture(i8*) |
| |
| ; This case should not be optimized, because dest is captured before the call: |
| ; %ptr1 is handed to @capture ahead of the argmemonly call to @foo on %ptr2. |
| ; The expected output keeps the memcpy and leaves @foo operating on %ptr2. |
| define void @test_dest_captured_before_alloca() { |
| ; CHECK-LABEL: define {{[^@]+}}@test_dest_captured_before_alloca() { |
| ; CHECK-NEXT: [[PTR1:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: [[PTR2:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: call void @capture(i8* [[PTR1]]) |
| ; CHECK-NEXT: call void @foo(i8* [[PTR2]]) #[[ATTR2:[0-9]+]] |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[PTR1]], i8* [[PTR2]], i32 1, i1 false) |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr1 = alloca i8 |
| %ptr2 = alloca i8 |
| call void @capture(i8* %ptr1) |
| call void @foo(i8* %ptr2) argmemonly |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr1, i8* %ptr2, i32 1, i1 false) |
| ret void |
| } |
| |
| |
| ; Internal i8 global initialised to 0. It is the memcpy destination in |
| ; @test_dest_captured_before_global and the comparison operand in @icmp_g. |
| @g = internal global i8 0 |
| |
| ; This case should not be optimized, because @g is captured before the call |
| ; (being a global) and @icmp_g might depend on its identity. @icmp_g compares |
| ; its argument against @g, so the expected output keeps passing %ptr to it |
| ; and keeps the memcpy into @g. |
| define void @test_dest_captured_before_global() { |
| ; CHECK-LABEL: define {{[^@]+}}@test_dest_captured_before_global() { |
| ; CHECK-NEXT: [[PTR:%.*]] = alloca i8, align 1 |
| ; CHECK-NEXT: call void @icmp_g(i8* [[PTR]]) |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* @g, i8* [[PTR]], i32 1, i1 false) |
| ; CHECK-NEXT: ret void |
| ; |
| %ptr = alloca i8 |
| call void @icmp_g(i8* %ptr) |
| call void @llvm.memcpy.p0i8.p0i8.i32(i8* @g, i8* %ptr, i32 1, i1 false) |
| ret void |
| } |
| |
| ; Helper called by @test_dest_captured_before_global: compares %p with the |
| ; address of @g and stores 1 through %p when they are equal, 2 otherwise. |
| ; Its result therefore differs depending on whether it is handed @g itself. |
| define void @icmp_g(i8* %p) { |
| ; CHECK-LABEL: define {{[^@]+}}@icmp_g |
| ; CHECK-SAME: (i8* [[P:%.*]]) { |
| ; CHECK-NEXT: [[C:%.*]] = icmp eq i8* [[P]], @g |
| ; CHECK-NEXT: br i1 [[C]], label [[IF:%.*]], label [[ELSE:%.*]] |
| ; CHECK: if: |
| ; CHECK-NEXT: store i8 1, i8* [[P]], align 1 |
| ; CHECK-NEXT: ret void |
| ; CHECK: else: |
| ; CHECK-NEXT: store i8 2, i8* [[P]], align 1 |
| ; CHECK-NEXT: ret void |
| ; |
| %c = icmp eq i8* %p, @g |
| br i1 %c, label %if, label %else |
| |
| if: |
| store i8 1, i8* %p |
| ret void |
| |
| else: |
| store i8 2, i8* %p |
| ret void |
| } |