blob: b6f7b1fd1685e345ab3dbbf20e2a87e79c2d992b [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -passes=sroa -S | FileCheck %s
declare void @callee(ptr nocapture readonly %p)
define i32 @simple() {
; CHECK-LABEL: @simple(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: ret i32 0
;
%a = alloca i32
store i32 0, ptr %a
call void @callee(ptr %a)
%l1 = load i32, ptr %a
ret i32 %l1
}
define i32 @smallbig() {
; CHECK-LABEL: @smallbig(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i8 0, ptr [[A]], align 1
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[L1:%.*]] = load i32, ptr [[A]], align 4
; CHECK-NEXT: ret i32 [[L1]]
;
%a = alloca i32
store i8 0, ptr %a
call void @callee(ptr %a)
%l1 = load i32, ptr %a
ret i32 %l1
}
define i32 @twoalloc() {
; CHECK-LABEL: @twoalloc(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[R:%.*]] = add i32 0, 1
; CHECK-NEXT: ret i32 [[R]]
;
%a = alloca {i32, i32}
store i32 0, ptr %a
%b = getelementptr i32, ptr %a, i32 1
store i32 1, ptr %b
call void @callee(ptr %a)
%l1 = load i32, ptr %a
%l2 = load i32, ptr %b
%r = add i32 %l1, %l2
ret i32 %r
}
define i32 @twostore() {
; CHECK-LABEL: @twostore(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 1, ptr [[A]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: store i32 2, ptr [[A]], align 4
; CHECK-NEXT: ret i32 2
;
%a = alloca i32
store i32 1, ptr %a
call void @callee(ptr %a)
store i32 2, ptr %a
%l = load i32, ptr %a
ret i32 %l
}
define float @differenttype() {
; CHECK-LABEL: @differenttype(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[L2:%.*]] = load float, ptr [[B]], align 4
; CHECK-NEXT: ret float [[L2]]
;
%a = alloca {i32, i32}
%b = getelementptr i32, ptr %a, i32 1
store i32 1, ptr %b
call void @callee(ptr %a)
%l2 = load float, ptr %b
ret float %l2
}
define i32 @twoalloc_store64(i64 %x) {
; CHECK-LABEL: @twoalloc_store64(
; CHECK-NEXT: [[A:%.*]] = alloca i64, align 8
; CHECK-NEXT: store i64 [[X:%.*]], ptr [[A]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[L1:%.*]] = load i32, ptr [[A]], align 4
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: [[L2:%.*]] = load i32, ptr [[B]], align 4
; CHECK-NEXT: ret i32 [[L2]]
;
%a = alloca i64
store i64 %x, ptr %a
call void @callee(ptr %a)
%l1 = load i32, ptr %a
%b = getelementptr i32, ptr %a, i32 1
%l2 = load i32, ptr %b
ret i32 %l2
}
define i32 @twocalls() {
; CHECK-LABEL: @twocalls(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[R:%.*]] = add i32 0, 1
; CHECK-NEXT: ret i32 [[R]]
;
%a = alloca {i32, i32}
store i32 0, ptr %a
%b = getelementptr i32, ptr %a, i32 1
store i32 1, ptr %b
call void @callee(ptr %a)
%l1 = load i32, ptr %a
call void @callee(ptr %a)
%l2 = load i32, ptr %b
%r = add i32 %l1, %l2
ret i32 %r
}
define i32 @volatile() {
; CHECK-LABEL: @volatile(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store volatile i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[L1:%.*]] = load volatile i32, ptr [[A]], align 4
; CHECK-NEXT: [[L2:%.*]] = load i32, ptr [[B]], align 4
; CHECK-NEXT: [[R:%.*]] = add i32 [[L1]], [[L2]]
; CHECK-NEXT: ret i32 [[R]]
;
%a = alloca {i32, i32}
store i32 0, ptr %a
%b = getelementptr i32, ptr %a, i32 1
store volatile i32 1, ptr %b
call void @callee(ptr %a)
%l1 = load volatile i32, ptr %a
%l2 = load i32, ptr %b
%r = add i32 %l1, %l2
ret i32 %r
}
define i32 @atomic() {
; CHECK-LABEL: @atomic(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[L1:%.*]] = load atomic i32, ptr [[A]] seq_cst, align 4
; CHECK-NEXT: [[R:%.*]] = add i32 [[L1]], 1
; CHECK-NEXT: ret i32 [[R]]
;
%a = alloca {i32, i32}
store i32 0, ptr %a
%b = getelementptr i32, ptr %a, i32 1
store i32 1, ptr %b
call void @callee(ptr %a)
%l1 = load atomic i32, ptr %a seq_cst, align 4
%l2 = load i32, ptr %b
%r = add i32 %l1, %l2
ret i32 %r
}
define i32 @notdominating() {
; CHECK-LABEL: @notdominating(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: store i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[R:%.*]] = add i32 undef, undef
; CHECK-NEXT: ret i32 [[R]]
;
%a = alloca {i32, i32}
%b = getelementptr i32, ptr %a, i32 1
%l1 = load i32, ptr %a
%l2 = load i32, ptr %b
store i32 0, ptr %a
store i32 1, ptr %b
call void @callee(ptr %a)
%r = add i32 %l1, %l2
ret i32 %r
}
declare void @callee_notreadonly(ptr %p)
define i32 @notreadonly() {
; CHECK-LABEL: @notreadonly(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee_notreadonly(ptr [[A]])
; CHECK-NEXT: [[L1:%.*]] = load i32, ptr [[A]], align 4
; CHECK-NEXT: [[L2:%.*]] = load i32, ptr [[B]], align 4
; CHECK-NEXT: [[R:%.*]] = add i32 [[L1]], [[L2]]
; CHECK-NEXT: ret i32 [[R]]
;
%a = alloca {i32, i32}
store i32 0, ptr %a
%b = getelementptr i32, ptr %a, i32 1
store i32 1, ptr %b
call void @callee_notreadonly(ptr %a)
%l1 = load i32, ptr %a
%l2 = load i32, ptr %b
%r = add i32 %l1, %l2
ret i32 %r
}
declare void @callee_multiuse(ptr nocapture readonly %p, ptr nocapture readonly %q)
define i32 @multiuse() {
; CHECK-LABEL: @multiuse(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee_multiuse(ptr [[A]], ptr [[A]])
; CHECK-NEXT: [[R:%.*]] = add i32 0, 1
; CHECK-NEXT: ret i32 [[R]]
;
%a = alloca {i32, i32}
store i32 0, ptr %a
%b = getelementptr i32, ptr %a, i32 1
store i32 1, ptr %b
call void @callee_multiuse(ptr %a, ptr %a)
%l1 = load i32, ptr %a
%l2 = load i32, ptr %b
%r = add i32 %l1, %l2
ret i32 %r
}
define i32 @memcpyed(ptr %src) {
; CHECK-LABEL: @memcpyed(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr [[A]], ptr [[SRC:%.*]], i64 4, i1 false)
; CHECK-NEXT: [[L1:%.*]] = load i32, ptr [[A]], align 4
; CHECK-NEXT: ret i32 [[L1]]
;
%a = alloca i32
store i32 0, ptr %a
call void @callee(ptr %a)
call void @llvm.memcpy.p0.p0.i64(ptr %a, ptr %src, i64 4, i1 false)
%l1 = load i32, ptr %a
ret i32 %l1
}
define ptr @memcpyedsplit(ptr %src) {
; CHECK-LABEL: @memcpyedsplit(
; CHECK-NEXT: [[A:%.*]] = alloca { i64, i64 }, align 8
; CHECK-NEXT: store i8 1, ptr [[A]], align 1
; CHECK-NEXT: [[B:%.*]] = getelementptr i64, ptr [[A]], i32 1
; CHECK-NEXT: store ptr null, ptr [[B]], align 8
; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr [[A]], ptr [[SRC:%.*]], i64 16, i1 false)
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[L1:%.*]] = load ptr, ptr [[B]], align 8
; CHECK-NEXT: ret ptr [[L1]]
;
%a = alloca { i64, i64 }
store i8 1, ptr %a
%b = getelementptr i64, ptr %a, i32 1
store ptr null, ptr %b
call void @llvm.memcpy.p0.p0.i64(ptr %a, ptr %src, i64 16, i1 false)
call void @callee(ptr %a)
%l1 = load ptr, ptr %b
ret ptr %l1
}
; This struct contains padding bits. The load should not be replaced by poison.
%struct.LoadImmediateInfo = type { i32 }
define void @incompletestruct(i1 %b, i1 %c) {
; CHECK-LABEL: @incompletestruct(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[LII:%.*]] = alloca [[STRUCT_LOADIMMEDIATEINFO:%.*]], align 4
; CHECK-NEXT: call void @llvm.lifetime.start.p0(ptr nonnull [[LII]])
; CHECK-NEXT: [[BF_CLEAR4:%.*]] = and i32 undef, -262144
; CHECK-NEXT: [[BF_SET5:%.*]] = select i1 [[B:%.*]], i32 196608, i32 131072
; CHECK-NEXT: [[BF_SET12:%.*]] = or disjoint i32 [[BF_SET5]], [[BF_CLEAR4]]
; CHECK-NEXT: store i32 [[BF_SET12]], ptr [[LII]], align 4
; CHECK-NEXT: call void @callee(ptr [[LII]])
; CHECK-NEXT: call void @llvm.lifetime.end.p0(ptr nonnull [[LII]])
; CHECK-NEXT: ret void
;
entry:
%LII = alloca %struct.LoadImmediateInfo, align 4
call void @llvm.lifetime.start.p0(ptr nonnull %LII)
%bf.load = load i32, ptr %LII, align 4
%bf.clear4 = and i32 %bf.load, -262144
%bf.set5 = select i1 %b, i32 196608, i32 131072
%bf.set12 = or disjoint i32 %bf.set5, %bf.clear4
store i32 %bf.set12, ptr %LII, align 4
call void @callee(ptr %LII)
call void @llvm.lifetime.end.p0(ptr nonnull %LII)
ret void
}
define void @incompletestruct_bb(i1 %b, i1 %c) {
; CHECK-LABEL: @incompletestruct_bb(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[LII:%.*]] = alloca [[STRUCT_LOADIMMEDIATEINFO:%.*]], align 4
; CHECK-NEXT: br i1 [[C:%.*]], label [[IF_THEN:%.*]], label [[IF_END:%.*]]
; CHECK: if.then:
; CHECK-NEXT: call void @llvm.lifetime.start.p0(ptr nonnull [[LII]])
; CHECK-NEXT: [[BF_CLEAR4:%.*]] = and i32 undef, -262144
; CHECK-NEXT: [[BF_SET5:%.*]] = select i1 [[B:%.*]], i32 196608, i32 131072
; CHECK-NEXT: [[BF_SET12:%.*]] = or disjoint i32 [[BF_SET5]], [[BF_CLEAR4]]
; CHECK-NEXT: store i32 [[BF_SET12]], ptr [[LII]], align 4
; CHECK-NEXT: call void @callee(ptr [[LII]])
; CHECK-NEXT: call void @llvm.lifetime.end.p0(ptr nonnull [[LII]])
; CHECK-NEXT: br label [[IF_END]]
; CHECK: if.end:
; CHECK-NEXT: ret void
;
entry:
%LII = alloca %struct.LoadImmediateInfo, align 4
br i1 %c, label %if.then, label %if.end
if.then: ; preds = %entry
call void @llvm.lifetime.start.p0(ptr nonnull %LII)
%bf.load = load i32, ptr %LII, align 4
%bf.clear4 = and i32 %bf.load, -262144
%bf.set5 = select i1 %b, i32 196608, i32 131072
%bf.set12 = or disjoint i32 %bf.set5, %bf.clear4
store i32 %bf.set12, ptr %LII, align 4
call void @callee(ptr %LII)
call void @llvm.lifetime.end.p0(ptr nonnull %LII)
br label %if.end
if.end: ; preds = %if.then, %entry
ret void
}
define i32 @sixteenload() {
; CHECK-LABEL: @sixteenload(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[A1:%.*]] = add i32 0, 0
; CHECK-NEXT: [[A2:%.*]] = add i32 [[A1]], 0
; CHECK-NEXT: ret i32 [[A2]]
;
%a = alloca i32
store i32 0, ptr %a
call void @callee(ptr %a)
%l1 = load i32, ptr %a
%l2 = load i32, ptr %a
%l3 = load i32, ptr %a
%l4 = load i32, ptr %a
%l5 = load i32, ptr %a
%l6 = load i32, ptr %a
%l7 = load i32, ptr %a
%l8 = load i32, ptr %a
%l9 = load i32, ptr %a
%l10 = load i32, ptr %a
%l11 = load i32, ptr %a
%l12 = load i32, ptr %a
%l13 = load i32, ptr %a
%l14 = load i32, ptr %a
%l15 = load i32, ptr %a
%l16 = load i32, ptr %a
%a1 = add i32 %l1, %l2
%a2 = add i32 %a1, %l3
ret i32 %a2
}
define i32 @testcallalloca() {
; CHECK-LABEL: @testcallalloca(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void [[A]]()
; CHECK-NEXT: [[L1:%.*]] = load i32, ptr [[A]], align 4
; CHECK-NEXT: ret i32 [[L1]]
;
%a = alloca i32
store i32 0, ptr %a
call void %a()
%l1 = load i32, ptr %a
ret i32 %l1
}
declare void @callee_byval(ptr byval(i32) %p)
define i32 @simple_byval() {
; CHECK-LABEL: @simple_byval(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void @callee_byval(ptr [[A]])
; CHECK-NEXT: ret i32 0
;
%a = alloca i32
store i32 0, ptr %a
call void @callee_byval(ptr %a)
%l1 = load i32, ptr %a
ret i32 %l1
}
declare void @callee_address_only_capture(ptr readonly captures(address) %p)
define i32 @address_only_capture() {
; CHECK-LABEL: @address_only_capture(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void @callee_address_only_capture(ptr [[A]])
; CHECK-NEXT: ret i32 0
;
%a = alloca i32
store i32 0, ptr %a
call void @callee_address_only_capture(ptr %a)
%l1 = load i32, ptr %a
ret i32 %l1
}
declare void @callee_read_only_capture(ptr readonly captures(address, read_provenance) %p)
define i32 @read_only_capture() {
; CHECK-LABEL: @read_only_capture(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void @callee_read_only_capture(ptr [[A]])
; CHECK-NEXT: ret i32 0
;
%a = alloca i32
store i32 0, ptr %a
call void @callee_read_only_capture(ptr %a)
%l1 = load i32, ptr %a
ret i32 %l1
}
declare void @callee_provenance_only_capture(ptr readonly captures(provenance) %p)
; Should not be transformed, as write-provenance is captured.
define i32 @provenance_only_capture() {
; CHECK-LABEL: @provenance_only_capture(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void @callee_provenance_only_capture(ptr [[A]])
; CHECK-NEXT: [[L1:%.*]] = load i32, ptr [[A]], align 4
; CHECK-NEXT: ret i32 [[L1]]
;
%a = alloca i32
store i32 0, ptr %a
call void @callee_provenance_only_capture(ptr %a)
%l1 = load i32, ptr %a
ret i32 %l1
}
define i32 @simple_with_lifetimes() {
; CHECK-LABEL: @simple_with_lifetimes(
; CHECK-NEXT: [[A:%.*]] = alloca i32, align 4
; CHECK-NEXT: call void @llvm.lifetime.start.p0(ptr [[A]])
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: call void @llvm.lifetime.end.p0(ptr [[A]])
; CHECK-NEXT: ret i32 0
;
%a = alloca i32
call void @llvm.lifetime.start(ptr %a)
store i32 0, ptr %a
call void @callee(ptr %a)
%l1 = load i32, ptr %a
call void @llvm.lifetime.end(ptr %a)
ret i32 %l1
}
define i32 @twoalloc_with_lifetimes() {
; CHECK-LABEL: @twoalloc_with_lifetimes(
; CHECK-NEXT: [[A:%.*]] = alloca { i32, i32 }, align 8
; CHECK-NEXT: call void @llvm.lifetime.start.p0(ptr [[A]])
; CHECK-NEXT: store i32 0, ptr [[A]], align 4
; CHECK-NEXT: [[B:%.*]] = getelementptr i32, ptr [[A]], i32 1
; CHECK-NEXT: store i32 1, ptr [[B]], align 4
; CHECK-NEXT: call void @callee(ptr [[A]])
; CHECK-NEXT: [[R:%.*]] = add i32 0, 1
; CHECK-NEXT: call void @llvm.lifetime.end.p0(ptr [[A]])
; CHECK-NEXT: ret i32 [[R]]
;
%a = alloca {i32, i32}
call void @llvm.lifetime.start(ptr %a)
store i32 0, ptr %a
%b = getelementptr i32, ptr %a, i32 1
store i32 1, ptr %b
call void @callee(ptr %a)
%l1 = load i32, ptr %a
%l2 = load i32, ptr %b
%r = add i32 %l1, %l2
call void @llvm.lifetime.end(ptr %a)
ret i32 %r
}
declare void @use.i32(i32)
; We can promote the %i load, even though there is an unknown offset load
; in the loop. It is sufficient that we know all stores.
define void @load_dyn_offset(ptr %ary) {
; CHECK-LABEL: @load_dyn_offset(
; CHECK-NEXT: [[A:%.*]] = alloca { i64, [4 x i32] }, align 8
; CHECK-NEXT: store i64 0, ptr [[A]], align 4
; CHECK-NEXT: [[GEP:%.*]] = getelementptr i8, ptr [[A]], i64 8
; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr [[GEP]], ptr [[ARY:%.*]], i64 16, i1 false)
; CHECK-NEXT: br label [[LOOP:%.*]]
; CHECK: loop:
; CHECK-NEXT: [[I:%.*]] = phi i64 [ [[I_NEXT:%.*]], [[LOOP]] ], [ 0, [[TMP0:%.*]] ]
; CHECK-NEXT: [[I_NEXT]] = add i64 [[I]], 1
; CHECK-NEXT: store i64 [[I_NEXT]], ptr [[A]], align 4
; CHECK-NEXT: [[GEP_I:%.*]] = getelementptr i32, ptr [[GEP]], i64 [[I]]
; CHECK-NEXT: [[VAL:%.*]] = load i32, ptr [[GEP_I]], align 4
; CHECK-NEXT: call void @use.i32(i32 [[VAL]])
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i64 [[I_NEXT]], 6
; CHECK-NEXT: br i1 [[CMP]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK: exit:
; CHECK-NEXT: ret void
;
%a = alloca {i64, [4 x i32]}
store i64 0, ptr %a
%gep = getelementptr i8, ptr %a, i64 8
call void @llvm.memcpy(ptr %gep, ptr %ary, i64 16, i1 false)
br label %loop
loop:
%i = load i64, ptr %a
%i.next = add i64 %i, 1
store i64 %i.next, ptr %a
%gep.i = getelementptr i32, ptr %gep, i64 %i
%val = load i32, ptr %gep.i
call void @use.i32(i32 %val)
%cmp = icmp eq i64 %i.next, 6
br i1 %cmp, label %exit, label %loop
exit:
ret void
}
; Same as previous test, but with an unknown-offset store. We can't promote in
; that case.
define void @store_dyn_offset(ptr %ary) {
; CHECK-LABEL: @store_dyn_offset(
; CHECK-NEXT: [[A:%.*]] = alloca { i64, [4 x i32] }, align 8
; CHECK-NEXT: store i64 0, ptr [[A]], align 4
; CHECK-NEXT: [[GEP:%.*]] = getelementptr i8, ptr [[A]], i64 8
; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr [[GEP]], ptr [[ARY:%.*]], i64 16, i1 false)
; CHECK-NEXT: br label [[LOOP:%.*]]
; CHECK: loop:
; CHECK-NEXT: [[I:%.*]] = load i64, ptr [[A]], align 4
; CHECK-NEXT: [[I_NEXT:%.*]] = add i64 [[I]], 1
; CHECK-NEXT: store i64 [[I_NEXT]], ptr [[A]], align 4
; CHECK-NEXT: [[GEP_I:%.*]] = getelementptr i32, ptr [[GEP]], i64 [[I]]
; CHECK-NEXT: [[I_TRUNC:%.*]] = trunc i64 [[I]] to i32
; CHECK-NEXT: store i32 [[I_TRUNC]], ptr [[GEP_I]], align 4
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i64 [[I_NEXT]], 6
; CHECK-NEXT: br i1 [[CMP]], label [[EXIT:%.*]], label [[LOOP]]
; CHECK: exit:
; CHECK-NEXT: ret void
;
%a = alloca {i64, [4 x i32]}
store i64 0, ptr %a
%gep = getelementptr i8, ptr %a, i64 8
call void @llvm.memcpy(ptr %gep, ptr %ary, i64 16, i1 false)
br label %loop
loop:
%i = load i64, ptr %a
%i.next = add i64 %i, 1
store i64 %i.next, ptr %a
%gep.i = getelementptr i32, ptr %gep, i64 %i
%i.trunc = trunc i64 %i to i32
store i32 %i.trunc, ptr %gep.i
%cmp = icmp eq i64 %i.next, 6
br i1 %cmp, label %exit, label %loop
exit:
ret void
}
declare void @llvm.memcpy.p0.p0.i64(ptr, ptr, i64, i1)