blob: 4f3ff2d1ea0f4c3c7ee92e35a3b7dfcc397e57cc [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -passes='separate-const-offset-from-gep<lower-gep>' \
; RUN: -reassociate-geps-verify-no-dead-code -S | FileCheck %s
; All functions in this module are compiled for the amdgcn-amd-amdhsa triple.
target triple = "amdgcn-amd-amdhsa"
; Packed layout, so there is no padding between the fields: 3 x i32 (12 bytes)
; followed by 8 x i64 (64 bytes), i.e. 76 bytes per element.
%struct.Packed = type <{ [3 x i32], [8 x i64] }> ; <> means packed
; 1024 packed structs (1024 * 76 = 77824 bytes) in address space 3, declared
; with byte alignment only.
@packed_struct_array = addrspace(3) global [1024 x %struct.Packed] poison, align 1
; Verifies we can emit a correct uglygep if the address is not naturally
; aligned. This should not produce a no-op bitcast with opaque
; pointers.
; Returns the address of the i64 at
;   packed_struct_array[%i + 1].<field 1>[%j + 3]
; computed by a single four-index GEP.
;
; The expected output lowers that GEP to a chain of i8 GEPs:
;   - the leading i64 0 index is truncated to i32 and scaled by 77824
;     (1024 * 76, the size of the whole array),
;   - %i is scaled by 76 (one %struct.Packed),
;   - %j is shifted left by 3 (one i64),
;   - the constant parts are folded into one trailing byte offset of
;     112 = 76 (the "+ 1" element) + 12 (offset of field 1) + 24 (the "+ 3" i64s).
define ptr addrspace(3) @packed_struct(i32 %i, i32 %j) {
; CHECK-LABEL: @packed_struct(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[IDXPROM:%.*]] = trunc i64 0 to i32
; CHECK-NEXT: [[TMP0:%.*]] = mul i32 [[IDXPROM]], 77824
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr i8, ptr addrspace(3) @packed_struct_array, i32 [[TMP0]]
; CHECK-NEXT: [[TMP1:%.*]] = mul i32 [[I:%.*]], 76
; CHECK-NEXT: [[UGLYGEP3:%.*]] = getelementptr i8, ptr addrspace(3) [[UGLYGEP]], i32 [[TMP1]]
; CHECK-NEXT: [[TMP2:%.*]] = shl i32 [[J:%.*]], 3
; CHECK-NEXT: [[UGLYGEP4:%.*]] = getelementptr i8, ptr addrspace(3) [[UGLYGEP3]], i32 [[TMP2]]
; CHECK-NEXT: [[UGLYGEP5:%.*]] = getelementptr i8, ptr addrspace(3) [[UGLYGEP4]], i32 112
; CHECK-NEXT: ret ptr addrspace(3) [[UGLYGEP5]]
;
entry:
; Both variable indices carry a constant addend; neither add appears in the
; expected output, only the combined byte offset does.
%add = add nsw i32 %j, 3
%add1 = add nsw i32 %i, 1
; Index list: array base (i64 0), struct element (%add1), field 1, i64 slot (%add).
%arrayidx3 = getelementptr inbounds [1024 x %struct.Packed], ptr addrspace(3) @packed_struct_array, i64 0, i32 %add1, i32 1, i32 %add
ret ptr addrspace(3) %arrayidx3
}
; Three consecutive i32 fields; the expected output of the tests using this
; type relies on a 12-byte element with fields at byte offsets 0, 4 and 8.
%struct = type { i32, i32, i32 }
; Loads field 1 of %ptr[%idx]; if it is negative, also loads field 2 of the
; same element and returns the sum, otherwise returns 0.
;
; The two GEPs share the variable index %idx and differ only in the constant
; field index. The expected output lowers each of them, in its own block, to
; "%idx * 12" applied as an i8 GEP followed by a second i8 GEP carrying the
; constant field offset (4 for field 1, 8 for field 2). The loads gain an
; explicit "align 4".
define i32 @test1(ptr %ptr, i64 %idx) {
; CHECK-LABEL: @test1(
; CHECK-NEXT: [[TMP1:%.*]] = mul i64 [[IDX:%.*]], 12
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr i8, ptr [[PTR:%.*]], i64 [[TMP1]]
; CHECK-NEXT: [[UGLYGEP1:%.*]] = getelementptr i8, ptr [[UGLYGEP]], i64 4
; CHECK-NEXT: [[LV_1:%.*]] = load i32, ptr [[UGLYGEP1]], align 4
; CHECK-NEXT: [[C:%.*]] = icmp slt i32 [[LV_1]], 0
; CHECK-NEXT: br i1 [[C]], label [[THEN:%.*]], label [[ELSE:%.*]]
; CHECK: then:
; CHECK-NEXT: [[TMP2:%.*]] = mul i64 [[IDX]], 12
; CHECK-NEXT: [[UGLYGEP2:%.*]] = getelementptr i8, ptr [[PTR]], i64 [[TMP2]]
; CHECK-NEXT: [[UGLYGEP3:%.*]] = getelementptr i8, ptr [[UGLYGEP2]], i64 8
; CHECK-NEXT: [[LV_2:%.*]] = load i32, ptr [[UGLYGEP3]], align 4
; CHECK-NEXT: [[RES:%.*]] = add i32 [[LV_1]], [[LV_2]]
; CHECK-NEXT: ret i32 [[RES]]
; CHECK: else:
; CHECK-NEXT: ret i32 0
;
; Address of field 1 of element %idx.
%gep.1 = getelementptr %struct, ptr %ptr, i64 %idx, i32 1
%lv.1 = load i32, ptr %gep.1
%c = icmp slt i32 %lv.1, 0
br i1 %c, label %then, label %else
then:
; Address of field 2 of the same element, computed in a different block.
%gep.2 = getelementptr %struct, ptr %ptr, i64 %idx, i32 2
%lv.2 = load i32, ptr %gep.2
%res = add i32 %lv.1, %lv.2
ret i32 %res
else:
ret i32 0
}
; Same control flow and GEP shapes as @test1, but %ptr lives in address
; space 7 (presumably the AMDGPU buffer fat pointer address space, going by
; the function name -- confirm against the target documentation).
;
; In the expected output the i64 index is first truncated to i32, and the
; scaling multiply and every i8 GEP offset are i32. The truncation is emitted
; once per lowered GEP, so it appears in both the entry block and "then".
define i32 @test1_fatptr(ptr addrspace(7) %ptr, i64 %idx) {
; CHECK-LABEL: @test1_fatptr(
; CHECK-NEXT: [[IDXPROM:%.*]] = trunc i64 [[IDX:%.*]] to i32
; CHECK-NEXT: [[TMP1:%.*]] = mul i32 [[IDXPROM]], 12
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr i8, ptr addrspace(7) [[PTR:%.*]], i32 [[TMP1]]
; CHECK-NEXT: [[UGLYGEP1:%.*]] = getelementptr i8, ptr addrspace(7) [[UGLYGEP]], i32 4
; CHECK-NEXT: [[LV_1:%.*]] = load i32, ptr addrspace(7) [[UGLYGEP1]], align 4
; CHECK-NEXT: [[C:%.*]] = icmp slt i32 [[LV_1]], 0
; CHECK-NEXT: br i1 [[C]], label [[THEN:%.*]], label [[ELSE:%.*]]
; CHECK: then:
; CHECK-NEXT: [[IDXPROM2:%.*]] = trunc i64 [[IDX]] to i32
; CHECK-NEXT: [[TMP2:%.*]] = mul i32 [[IDXPROM2]], 12
; CHECK-NEXT: [[UGLYGEP3:%.*]] = getelementptr i8, ptr addrspace(7) [[PTR]], i32 [[TMP2]]
; CHECK-NEXT: [[UGLYGEP4:%.*]] = getelementptr i8, ptr addrspace(7) [[UGLYGEP3]], i32 8
; CHECK-NEXT: [[LV_2:%.*]] = load i32, ptr addrspace(7) [[UGLYGEP4]], align 4
; CHECK-NEXT: [[RES:%.*]] = add i32 [[LV_1]], [[LV_2]]
; CHECK-NEXT: ret i32 [[RES]]
; CHECK: else:
; CHECK-NEXT: ret i32 0
;
; Address of field 1 of element %idx; note the index is written as i64 here.
%gep.1 = getelementptr %struct, ptr addrspace(7) %ptr, i64 %idx, i32 1
%lv.1 = load i32, ptr addrspace(7) %gep.1
%c = icmp slt i32 %lv.1, 0
br i1 %c, label %then, label %else
then:
; Address of field 2 of the same element.
%gep.2 = getelementptr %struct, ptr addrspace(7) %ptr, i64 %idx, i32 2
%lv.2 = load i32, ptr addrspace(7) %gep.2
%res = add i32 %lv.1, %lv.2
ret i32 %res
else:
ret i32 0
}
; Test lowerToSingleIndexGEPs
; With rem = foo() srem 5, iterates k = 0..99 and, whenever (k*5 - rem) is
; unsigned-less-than 512, stores 1.0 to the float at %p[(rem + 511) - k*5].
;
; The GEP index has the shape sext((A + C) - B): the constant 511 is added in
; the entry block, the subtraction happens in cond.true. The expected output
; moves the constant into its own i8 GEP of 2044 bytes (511 * 4) and applies
; the remaining variable part as ((sext(rem) - sext(k*5)) << 2) in a second
; i8 GEP. %add, %sub2 and %idxprom no longer appear.
;
; NOTE(review): in the expected output the base operand of the 2044-byte GEP
; is bound by a fresh wildcard capture, so it is not pinned to the %p
; argument -- confirm this is intended.
define void @test_A_sub_B_add_ConstantInt(ptr %p) {
; CHECK-LABEL: @test_A_sub_B_add_ConstantInt(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[TMP0:%.*]] = tail call i32 @foo()
; CHECK-NEXT: [[REM:%.*]] = srem i32 [[TMP0]], 5
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
; CHECK: for.body:
; CHECK-NEXT: [[K:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[COND_END:%.*]] ]
; CHECK-NEXT: [[MUL:%.*]] = mul nuw nsw i32 [[K]], 5
; CHECK-NEXT: [[SUB1:%.*]] = sub nsw i32 [[MUL]], [[REM]]
; CHECK-NEXT: [[CMP26:%.*]] = icmp ult i32 [[SUB1]], 512
; CHECK-NEXT: br i1 [[CMP26]], label [[COND_TRUE:%.*]], label [[COND_END]]
; CHECK: cond.true:
; CHECK-NEXT: [[TMP1:%.*]] = sext i32 [[MUL]] to i64
; CHECK-NEXT: [[TMP2:%.*]] = sext i32 [[REM]] to i64
; CHECK-NEXT: [[SUB22:%.*]] = sub i64 [[TMP2]], [[TMP1]]
; CHECK-NEXT: [[TMP3:%.*]] = shl i64 [[SUB22]], 2
; CHECK-NEXT: [[UGLYGEP4:%.*]] = getelementptr i8, ptr [[UGLYGEP3:%.*]], i64 2044
; CHECK-NEXT: [[UGLYGEP5:%.*]] = getelementptr i8, ptr [[UGLYGEP4]], i64 [[TMP3]]
; CHECK-NEXT: store float 1.000000e+00, ptr [[UGLYGEP5]], align 4
; CHECK-NEXT: br label [[COND_END]]
; CHECK: cond.end:
; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[K]], 1
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp ne i32 [[INC]], 100
; CHECK-NEXT: br i1 [[EXITCOND]], label [[FOR_BODY]], label [[FOR_END:%.*]]
; CHECK: for.end:
; CHECK-NEXT: ret void
;
entry:
%0 = tail call i32 @foo()
%rem = srem i32 %0, 5
; A + C: the constant that the pass is expected to extract from the index.
%add = add nsw i32 %rem , 511
br label %for.body
for.body:
%k = phi i32 [ 0, %entry ], [ %inc, %cond.end ]
%mul = mul nuw nsw i32 %k, 5
%sub1 = sub nsw i32 %mul, %rem
; Guard for the store below.
%cmp26 = icmp ult i32 %sub1, 512
br i1 %cmp26, label %cond.true, label %cond.end
cond.true:
; (A + C) - B, sign-extended and used as the single GEP index.
%sub2 = sub nsw i32 %add, %mul
%idxprom = sext i32 %sub2 to i64
%arryidx = getelementptr inbounds float, ptr %p, i64 %idxprom
store float 1.0, ptr %arryidx, align 4
br label %cond.end
cond.end:
%inc = add nuw nsw i32 %k, 1
; Leaves the loop once %inc reaches 100.
%exitcond = icmp ne i32 %inc, 100
br i1 %exitcond, label %for.body, label %for.end
for.end:
ret void
}
; 1024 x i32 (4096 bytes) global in the default address space, used as a GEP
; base pointer.
@extern_array = global [1024 x i32] poison, align 16
; Test lowerToSingleIndexGEPs with a global variable pointer
; Same loop and index computation as @test_A_sub_B_add_ConstantInt, but the
; GEP base is the global @extern_array instead of the argument; %p is unused.
;
; The expected output applies the extracted constant directly to the global
; as "getelementptr inbounds i8, ptr @extern_array, i64 2044" (511 * 4) and
; then adds the variable byte offset ((sext(rem) - sext(k*5)) << 2) with a
; second i8 GEP that has no inbounds flag.
define void @test_A_sub_B_add_ConstantInt_gv_baseptr(ptr %p) {
; CHECK-LABEL: @test_A_sub_B_add_ConstantInt_gv_baseptr(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[TMP0:%.*]] = tail call i32 @foo()
; CHECK-NEXT: [[REM:%.*]] = srem i32 [[TMP0]], 5
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
; CHECK: for.body:
; CHECK-NEXT: [[K:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[COND_END:%.*]] ]
; CHECK-NEXT: [[MUL:%.*]] = mul nuw nsw i32 [[K]], 5
; CHECK-NEXT: [[SUB1:%.*]] = sub nsw i32 [[MUL]], [[REM]]
; CHECK-NEXT: [[CMP26:%.*]] = icmp ult i32 [[SUB1]], 512
; CHECK-NEXT: br i1 [[CMP26]], label [[COND_TRUE:%.*]], label [[COND_END]]
; CHECK: cond.true:
; CHECK-NEXT: [[TMP1:%.*]] = sext i32 [[MUL]] to i64
; CHECK-NEXT: [[TMP2:%.*]] = sext i32 [[REM]] to i64
; CHECK-NEXT: [[SUB22:%.*]] = sub i64 [[TMP2]], [[TMP1]]
; CHECK-NEXT: [[TMP3:%.*]] = shl i64 [[SUB22]], 2
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr inbounds i8, ptr @extern_array, i64 2044
; CHECK-NEXT: [[UGLYGEP3:%.*]] = getelementptr i8, ptr [[UGLYGEP]], i64 [[TMP3]]
; CHECK-NEXT: store float 1.000000e+00, ptr [[UGLYGEP3]], align 4
; CHECK-NEXT: br label [[COND_END]]
; CHECK: cond.end:
; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[K]], 1
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp ne i32 [[INC]], 100
; CHECK-NEXT: br i1 [[EXITCOND]], label [[FOR_BODY]], label [[FOR_END:%.*]]
; CHECK: for.end:
; CHECK-NEXT: ret void
;
entry:
%0 = tail call i32 @foo()
%rem = srem i32 %0, 5
; A + C: the constant that the pass is expected to extract from the index.
%add = add nsw i32 %rem , 511
br label %for.body
for.body:
%k = phi i32 [ 0, %entry ], [ %inc, %cond.end ]
%mul = mul nuw nsw i32 %k, 5
%sub1 = sub nsw i32 %mul, %rem
%cmp26 = icmp ult i32 %sub1, 512
br i1 %cmp26, label %cond.true, label %cond.end
cond.true:
; (A + C) - B, sign-extended and used to index the global as an array of float.
%sub2 = sub nsw i32 %add, %mul
%idxprom = sext i32 %sub2 to i64
%arryidx = getelementptr inbounds float, ptr @extern_array, i64 %idxprom
store float 1.0, ptr %arryidx, align 4
br label %cond.end
cond.end:
%inc = add nuw nsw i32 %k, 1
%exitcond = icmp ne i32 %inc, 100
br i1 %exitcond, label %for.body, label %for.end
for.end:
ret void
}
; Test lowerToSingleIndexGEPs with a constant-data (null) base pointer
; Same loop and index computation as @test_A_sub_B_add_ConstantInt, but the
; function takes no arguments and the GEP base is the constant null.
;
; The expected output applies the extracted constant directly to null as
; "getelementptr inbounds i8, ptr null, i64 2044" (511 * 4) and then adds the
; variable byte offset ((sext(rem) - sext(k*5)) << 2) with a second i8 GEP
; that has no inbounds flag.
define void @test_A_sub_B_add_ConstantInt_null_basptr() {
; CHECK-LABEL: @test_A_sub_B_add_ConstantInt_null_basptr(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[TMP0:%.*]] = tail call i32 @foo()
; CHECK-NEXT: [[REM:%.*]] = srem i32 [[TMP0]], 5
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
; CHECK: for.body:
; CHECK-NEXT: [[K:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[COND_END:%.*]] ]
; CHECK-NEXT: [[MUL:%.*]] = mul nuw nsw i32 [[K]], 5
; CHECK-NEXT: [[SUB1:%.*]] = sub nsw i32 [[MUL]], [[REM]]
; CHECK-NEXT: [[CMP26:%.*]] = icmp ult i32 [[SUB1]], 512
; CHECK-NEXT: br i1 [[CMP26]], label [[COND_TRUE:%.*]], label [[COND_END]]
; CHECK: cond.true:
; CHECK-NEXT: [[TMP1:%.*]] = sext i32 [[MUL]] to i64
; CHECK-NEXT: [[TMP2:%.*]] = sext i32 [[REM]] to i64
; CHECK-NEXT: [[SUB22:%.*]] = sub i64 [[TMP2]], [[TMP1]]
; CHECK-NEXT: [[TMP3:%.*]] = shl i64 [[SUB22]], 2
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr inbounds i8, ptr null, i64 2044
; CHECK-NEXT: [[UGLYGEP3:%.*]] = getelementptr i8, ptr [[UGLYGEP]], i64 [[TMP3]]
; CHECK-NEXT: store float 1.000000e+00, ptr [[UGLYGEP3]], align 4
; CHECK-NEXT: br label [[COND_END]]
; CHECK: cond.end:
; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[K]], 1
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp ne i32 [[INC]], 100
; CHECK-NEXT: br i1 [[EXITCOND]], label [[FOR_BODY]], label [[FOR_END:%.*]]
; CHECK: for.end:
; CHECK-NEXT: ret void
;
entry:
%0 = tail call i32 @foo()
%rem = srem i32 %0, 5
; A + C: the constant that the pass is expected to extract from the index.
%add = add nsw i32 %rem , 511
br label %for.body
for.body:
%k = phi i32 [ 0, %entry ], [ %inc, %cond.end ]
%mul = mul nuw nsw i32 %k, 5
%sub1 = sub nsw i32 %mul, %rem
%cmp26 = icmp ult i32 %sub1, 512
br i1 %cmp26, label %cond.true, label %cond.end
cond.true:
; (A + C) - B, sign-extended and used as a float index off a null base.
%sub2 = sub nsw i32 %add, %mul
%idxprom = sext i32 %sub2 to i64
%arryidx = getelementptr inbounds float, ptr null, i64 %idxprom
store float 1.0, ptr %arryidx, align 4
br label %cond.end
cond.end:
%inc = add nuw nsw i32 %k, 1
%exitcond = icmp ne i32 %inc, 100
br i1 %exitcond, label %for.body, label %for.end
for.end:
ret void
}
; External function with no body in this module; the lowerToSingleIndexGEPs
; tests call it to obtain an i32 whose value is not known at compile time.
declare i32 @foo()
; Kernel over two address-space-1 pointers. In outline:
;   n = arg[arg2]
;   acc = 0
;   if (n > 0)
;     i = 0
;     do {
;       if (arg[i srem arg2] > 100) arg1[i] = 0
;       acc += arg[i] + arg1[i + 1]
;       i += 1
;     } while (i != n)
;   arg1[arg2] = acc
;
; Only the GEP indexed by sext(i + 1) (%tmp27) has a constant to extract. The
; expected output rewrites it as an i8 GEP off %arg1 by (sext(i) << 2)
; followed by an i8 GEP of 4 bytes; it emits a new sext of %tmp13 for this
; instead of reusing %tmp19, and %tmp26 disappears. Every other GEP in the
; function is expected to stay as written.
define amdgpu_kernel void @multi_use_in_loop(ptr addrspace(1) nocapture readonly %arg, ptr addrspace(1) nocapture %arg1, i32 %arg2) {
; CHECK-LABEL: @multi_use_in_loop(
; CHECK-NEXT: bb:
; CHECK-NEXT: [[TMP:%.*]] = sext i32 [[ARG2:%.*]] to i64
; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds i32, ptr addrspace(1) [[ARG:%.*]], i64 [[TMP]]
; CHECK-NEXT: [[TMP4:%.*]] = load i32, ptr addrspace(1) [[TMP3]], align 4
; CHECK-NEXT: [[TMP5:%.*]] = icmp sgt i32 [[TMP4]], 0
; CHECK-NEXT: br i1 [[TMP5]], label [[BB6:%.*]], label [[BB8:%.*]]
; CHECK: bb6:
; CHECK-NEXT: br label [[BB11:%.*]]
; CHECK: bb7:
; CHECK-NEXT: br label [[BB8]]
; CHECK: bb8:
; CHECK-NEXT: [[TMP9:%.*]] = phi i32 [ 0, [[BB:%.*]] ], [ [[TMP30:%.*]], [[BB7:%.*]] ]
; CHECK-NEXT: [[TMP10:%.*]] = getelementptr inbounds i32, ptr addrspace(1) [[ARG1:%.*]], i64 [[TMP]]
; CHECK-NEXT: store i32 [[TMP9]], ptr addrspace(1) [[TMP10]], align 4
; CHECK-NEXT: ret void
; CHECK: bb11:
; CHECK-NEXT: [[TMP12:%.*]] = phi i32 [ [[TMP30]], [[BB22:%.*]] ], [ 0, [[BB6]] ]
; CHECK-NEXT: [[TMP13:%.*]] = phi i32 [ [[TMP25:%.*]], [[BB22]] ], [ 0, [[BB6]] ]
; CHECK-NEXT: [[TMP14:%.*]] = srem i32 [[TMP13]], [[ARG2]]
; CHECK-NEXT: [[TMP15:%.*]] = sext i32 [[TMP14]] to i64
; CHECK-NEXT: [[TMP16:%.*]] = getelementptr inbounds i32, ptr addrspace(1) [[ARG]], i64 [[TMP15]]
; CHECK-NEXT: [[TMP17:%.*]] = load i32, ptr addrspace(1) [[TMP16]], align 4
; CHECK-NEXT: [[TMP18:%.*]] = icmp sgt i32 [[TMP17]], 100
; CHECK-NEXT: [[TMP19:%.*]] = sext i32 [[TMP13]] to i64
; CHECK-NEXT: br i1 [[TMP18]], label [[BB20:%.*]], label [[BB22]]
; CHECK: bb20:
; CHECK-NEXT: [[TMP21:%.*]] = getelementptr inbounds i32, ptr addrspace(1) [[ARG1]], i64 [[TMP19]]
; CHECK-NEXT: store i32 0, ptr addrspace(1) [[TMP21]], align 4
; CHECK-NEXT: br label [[BB22]]
; CHECK: bb22:
; CHECK-NEXT: [[TMP23:%.*]] = getelementptr inbounds i32, ptr addrspace(1) [[ARG]], i64 [[TMP19]]
; CHECK-NEXT: [[TMP24:%.*]] = load i32, ptr addrspace(1) [[TMP23]], align 4
; CHECK-NEXT: [[TMP25]] = add nuw nsw i32 [[TMP13]], 1
; CHECK-NEXT: [[TMP0:%.*]] = sext i32 [[TMP13]] to i64
; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[TMP0]], 2
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr i8, ptr addrspace(1) [[ARG1]], i64 [[TMP1]]
; CHECK-NEXT: [[UGLYGEP2:%.*]] = getelementptr i8, ptr addrspace(1) [[UGLYGEP]], i64 4
; CHECK-NEXT: [[TMP28:%.*]] = load i32, ptr addrspace(1) [[UGLYGEP2]], align 4
; CHECK-NEXT: [[TMP29:%.*]] = add i32 [[TMP24]], [[TMP12]]
; CHECK-NEXT: [[TMP30]] = add i32 [[TMP29]], [[TMP28]]
; CHECK-NEXT: [[TMP31:%.*]] = icmp eq i32 [[TMP25]], [[TMP4]]
; CHECK-NEXT: br i1 [[TMP31]], label [[BB7]], label [[BB11]]
;
bb:
; Load the trip count n = arg[arg2] and skip the loop unless n > 0.
%tmp = sext i32 %arg2 to i64
%tmp3 = getelementptr inbounds i32, ptr addrspace(1) %arg, i64 %tmp
%tmp4 = load i32, ptr addrspace(1) %tmp3, align 4
%tmp5 = icmp sgt i32 %tmp4, 0
br i1 %tmp5, label %bb6, label %bb8
bb6: ; preds = %bb
br label %bb11
bb7: ; preds = %bb22
br label %bb8
bb8: ; preds = %bb7, %bb
; Exit block: write the accumulated sum (0 if the loop was skipped) to arg1[arg2].
%tmp9 = phi i32 [ 0, %bb ], [ %tmp30, %bb7 ]
%tmp10 = getelementptr inbounds i32, ptr addrspace(1) %arg1, i64 %tmp
store i32 %tmp9, ptr addrspace(1) %tmp10, align 4
ret void
bb11: ; preds = %bb22, %bb6
; Loop header: %tmp12 is the running sum, %tmp13 the induction variable i.
%tmp12 = phi i32 [ %tmp30, %bb22 ], [ 0, %bb6 ]
%tmp13 = phi i32 [ %tmp25, %bb22 ], [ 0, %bb6 ]
%tmp14 = srem i32 %tmp13, %arg2
%tmp15 = sext i32 %tmp14 to i64
%tmp16 = getelementptr inbounds i32, ptr addrspace(1) %arg, i64 %tmp15
%tmp17 = load i32, ptr addrspace(1) %tmp16, align 4
%tmp18 = icmp sgt i32 %tmp17, 100
; sext(i) is shared by the GEPs in bb20 and bb22.
%tmp19 = sext i32 %tmp13 to i64
br i1 %tmp18, label %bb20, label %bb22
bb20: ; preds = %bb11
%tmp21 = getelementptr inbounds i32, ptr addrspace(1) %arg1, i64 %tmp19
store i32 0, ptr addrspace(1) %tmp21, align 4
br label %bb22
bb22: ; preds = %bb20, %bb11
%tmp23 = getelementptr inbounds i32, ptr addrspace(1) %arg, i64 %tmp19
%tmp24 = load i32, ptr addrspace(1) %tmp23, align 4
%tmp25 = add nuw nsw i32 %tmp13, 1
; arg1[i + 1]: the only GEP here whose index contains a constant addend.
%tmp26 = sext i32 %tmp25 to i64
%tmp27 = getelementptr inbounds i32, ptr addrspace(1) %arg1, i64 %tmp26
%tmp28 = load i32, ptr addrspace(1) %tmp27, align 4
%tmp29 = add i32 %tmp24, %tmp12
%tmp30 = add i32 %tmp29, %tmp28
; Leave the loop when i + 1 equals the loaded trip count.
%tmp31 = icmp eq i32 %tmp25, %tmp4
br i1 %tmp31, label %bb7, label %bb11
}
; External 4096 x i32 array in address space 1; it has no initializer in this
; module.
@extern_array_1 = external addrspace(1) global [4096 x i32], align 16
; Lists @extern_array_1, cast to the default address space, in llvm.used.
@llvm.used = appending global [1 x ptr] [ptr addrspacecast (ptr addrspace(1) @extern_array_1 to ptr) ]
; Stores 0 to @extern_array_1 twice and returns; no GEP is involved.
; The expected output is the same two stores, with an explicit "align 4".
; Presumably this exists so that @extern_array_1 also has users in a function
; other than the kernel that indexes it -- verify against the pass source.
define void @use_in_other_func() {
; CHECK-LABEL: @use_in_other_func(
; CHECK-NEXT: store i32 0, ptr addrspace(1) @extern_array_1, align 4
; CHECK-NEXT: store i32 0, ptr addrspace(1) @extern_array_1, align 4
; CHECK-NEXT: ret void
;
store i32 0, ptr addrspace(1) @extern_array_1
store i32 0, ptr addrspace(1) @extern_array_1
ret void
}
; Variant of @multi_use_in_loop in which every GEP except the first uses the
; global @extern_array_1 as its base. In outline (G = @extern_array_1):
;   n = arg[arg2]
;   acc = 0
;   if (n > 0)
;     i = 0
;     do {
;       if (G[i srem arg2] > 100) G[i] = 0
;       acc += G[i] + G[i + 1]
;       i += 1
;     } while (i != n)
;   G[arg2] = acc
;
; Only the GEP indexed by sext(i + 1) (%tmp27) has a constant to extract. In
; the expected output the constant is applied to the global first
; ("getelementptr i8, ptr addrspace(1) @extern_array_1, i64 4") and the
; variable byte offset (sext(i) << 2) is added by a second i8 GEP. Every
; other GEP is expected to stay as written.
define amdgpu_kernel void @multi_use_in_loop_global_base_address(ptr addrspace(1) nocapture readonly %arg, i32 %arg2) {
; CHECK-LABEL: @multi_use_in_loop_global_base_address(
; CHECK-NEXT: bb:
; CHECK-NEXT: [[TMP:%.*]] = sext i32 [[ARG2:%.*]] to i64
; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds i32, ptr addrspace(1) [[ARG:%.*]], i64 [[TMP]]
; CHECK-NEXT: [[TMP4:%.*]] = load i32, ptr addrspace(1) [[TMP3]], align 4
; CHECK-NEXT: [[TMP5:%.*]] = icmp sgt i32 [[TMP4]], 0
; CHECK-NEXT: br i1 [[TMP5]], label [[BB6:%.*]], label [[BB8:%.*]]
; CHECK: bb6:
; CHECK-NEXT: br label [[BB11:%.*]]
; CHECK: bb7:
; CHECK-NEXT: br label [[BB8]]
; CHECK: bb8:
; CHECK-NEXT: [[TMP9:%.*]] = phi i32 [ 0, [[BB:%.*]] ], [ [[TMP30:%.*]], [[BB7:%.*]] ]
; CHECK-NEXT: [[TMP10:%.*]] = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 [[TMP]]
; CHECK-NEXT: store i32 [[TMP9]], ptr addrspace(1) [[TMP10]], align 4
; CHECK-NEXT: ret void
; CHECK: bb11:
; CHECK-NEXT: [[TMP12:%.*]] = phi i32 [ [[TMP30]], [[BB22:%.*]] ], [ 0, [[BB6]] ]
; CHECK-NEXT: [[TMP13:%.*]] = phi i32 [ [[TMP25:%.*]], [[BB22]] ], [ 0, [[BB6]] ]
; CHECK-NEXT: [[TMP14:%.*]] = srem i32 [[TMP13]], [[ARG2]]
; CHECK-NEXT: [[TMP15:%.*]] = sext i32 [[TMP14]] to i64
; CHECK-NEXT: [[TMP16:%.*]] = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 [[TMP15]]
; CHECK-NEXT: [[TMP17:%.*]] = load i32, ptr addrspace(1) [[TMP16]], align 4
; CHECK-NEXT: [[TMP18:%.*]] = icmp sgt i32 [[TMP17]], 100
; CHECK-NEXT: [[TMP19:%.*]] = sext i32 [[TMP13]] to i64
; CHECK-NEXT: br i1 [[TMP18]], label [[BB20:%.*]], label [[BB22]]
; CHECK: bb20:
; CHECK-NEXT: [[TMP21:%.*]] = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 [[TMP19]]
; CHECK-NEXT: store i32 0, ptr addrspace(1) [[TMP21]], align 4
; CHECK-NEXT: br label [[BB22]]
; CHECK: bb22:
; CHECK-NEXT: [[TMP23:%.*]] = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 [[TMP19]]
; CHECK-NEXT: [[TMP24:%.*]] = load i32, ptr addrspace(1) [[TMP23]], align 4
; CHECK-NEXT: [[TMP25]] = add nuw nsw i32 [[TMP13]], 1
; CHECK-NEXT: [[TMP0:%.*]] = sext i32 [[TMP13]] to i64
; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[TMP0]], 2
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr i8, ptr addrspace(1) @extern_array_1, i64 4
; CHECK-NEXT: [[UGLYGEP2:%.*]] = getelementptr i8, ptr addrspace(1) [[UGLYGEP]], i64 [[TMP1]]
; CHECK-NEXT: [[TMP28:%.*]] = load i32, ptr addrspace(1) [[UGLYGEP2]], align 4
; CHECK-NEXT: [[TMP29:%.*]] = add i32 [[TMP24]], [[TMP12]]
; CHECK-NEXT: [[TMP30]] = add i32 [[TMP29]], [[TMP28]]
; CHECK-NEXT: [[TMP31:%.*]] = icmp eq i32 [[TMP25]], [[TMP4]]
; CHECK-NEXT: br i1 [[TMP31]], label [[BB7]], label [[BB11]]
;
bb:
; Load the trip count n = arg[arg2] and skip the loop unless n > 0.
%tmp = sext i32 %arg2 to i64
%tmp3 = getelementptr inbounds i32, ptr addrspace(1) %arg, i64 %tmp
%tmp4 = load i32, ptr addrspace(1) %tmp3, align 4
%tmp5 = icmp sgt i32 %tmp4, 0
br i1 %tmp5, label %bb6, label %bb8
bb6: ; preds = %bb
br label %bb11
bb7: ; preds = %bb22
br label %bb8
bb8: ; preds = %bb7, %bb
; Exit block: write the accumulated sum (0 if the loop was skipped) to G[arg2].
%tmp9 = phi i32 [ 0, %bb ], [ %tmp30, %bb7 ]
%tmp10 = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 %tmp
store i32 %tmp9, ptr addrspace(1) %tmp10, align 4
ret void
bb11: ; preds = %bb22, %bb6
; Loop header: %tmp12 is the running sum, %tmp13 the induction variable i.
%tmp12 = phi i32 [ %tmp30, %bb22 ], [ 0, %bb6 ]
%tmp13 = phi i32 [ %tmp25, %bb22 ], [ 0, %bb6 ]
%tmp14 = srem i32 %tmp13, %arg2
%tmp15 = sext i32 %tmp14 to i64
%tmp16 = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 %tmp15
%tmp17 = load i32, ptr addrspace(1) %tmp16, align 4
%tmp18 = icmp sgt i32 %tmp17, 100
; sext(i) is shared by the GEPs in bb20 and bb22.
%tmp19 = sext i32 %tmp13 to i64
br i1 %tmp18, label %bb20, label %bb22
bb20: ; preds = %bb11
%tmp21 = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 %tmp19
store i32 0, ptr addrspace(1) %tmp21, align 4
br label %bb22
bb22: ; preds = %bb20, %bb11
%tmp23 = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 %tmp19
%tmp24 = load i32, ptr addrspace(1) %tmp23, align 4
%tmp25 = add nuw nsw i32 %tmp13, 1
; G[i + 1]: the only GEP here whose index contains a constant addend.
%tmp26 = sext i32 %tmp25 to i64
%tmp27 = getelementptr inbounds i32, ptr addrspace(1) @extern_array_1, i64 %tmp26
%tmp28 = load i32, ptr addrspace(1) %tmp27, align 4
%tmp29 = add i32 %tmp24, %tmp12
%tmp30 = add i32 %tmp29, %tmp28
; Leave the loop when i + 1 equals the loaded trip count.
%tmp31 = icmp eq i32 %tmp25, %tmp4
br i1 %tmp31, label %bb7, label %bb11
}