blob: 90e56c1166edfd96d926a12c8af34b9231615225 [file] [log] [blame]
// RUN: mlir-opt %s --pass-pipeline="builtin.module(llvm.func(mem2reg{region-simplify=false}))" --split-input-file | FileCheck %s
// CHECK-LABEL: llvm.func @default_value
llvm.func @default_value() -> i32 {
// CHECK: %[[UNDEF:.*]] = llvm.mlir.undef : i32
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%2 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i32
// CHECK: llvm.return %[[UNDEF]] : i32
llvm.return %2 : i32
}
// -----
// CHECK-LABEL: llvm.func @store_of_ptr
llvm.func @store_of_ptr() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(4 : i32) : i32
%2 = llvm.mlir.zero : !llvm.ptr
// CHECK: %[[ALLOCA:.*]] = llvm.alloca
%3 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
// CHECK: llvm.store %{{.*}}, %[[ALLOCA]]
llvm.store %1, %3 {alignment = 4 : i64} : i32, !llvm.ptr
// CHECK: llvm.store %[[ALLOCA]], %{{.*}}
llvm.store %3, %2 {alignment = 8 : i64} : !llvm.ptr, !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @unreachable
llvm.func @unreachable() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(0 : i32) : i32
// CHECK-NOT: = llvm.alloca
%2 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.return
// CHECK: ^{{.*}}:
// CHECK-NEXT: llvm.return
^bb1: // no predecessors
llvm.store %1, %2 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @unreachable_in_loop
// CHECK-NOT: = llvm.alloca
llvm.func @unreachable_in_loop() -> i32 {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(6 : i32) : i32
%2 = llvm.mlir.constant(5 : i32) : i32
%3 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.store %1, %3 {alignment = 4 : i64} : i32, !llvm.ptr
// CHECK: llvm.br ^[[LOOP:.*]]
llvm.br ^bb1
// CHECK: ^[[LOOP]]:
^bb1: // 2 preds: ^bb0, ^bb3
// CHECK-NEXT: llvm.br ^[[ENDOFLOOP:.*]]
llvm.store %2, %3 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb3
// CHECK: ^[[UNREACHABLE:.*]]:
^bb2: // no predecessors
// CHECK-NEXT: llvm.br ^[[ENDOFLOOP]]
llvm.br ^bb3
// CHECK: ^[[ENDOFLOOP]]:
^bb3: // 2 preds: ^bb1, ^bb2
// CHECK-NEXT: llvm.br ^[[LOOP]]
llvm.br ^bb1
}
// -----
// CHECK-LABEL: llvm.func @branching
// CHECK-NOT: = llvm.alloca
llvm.func @branching(%arg0: i1, %arg1: i1) -> i32 {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(2 : i32) : i32
%2 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
// CHECK: llvm.cond_br %{{.*}}, ^[[BB2:.*]](%{{.*}} : i32), ^{{.*}}
llvm.cond_br %arg0, ^bb2, ^bb1
^bb1: // pred: ^bb0
llvm.store %1, %2 {alignment = 4 : i64} : i32, !llvm.ptr
// CHECK: llvm.cond_br %{{.*}}, ^[[BB2]](%{{.*}} : i32), ^[[BB2]](%{{.*}} : i32)
llvm.cond_br %arg1, ^bb2, ^bb2
// CHECK: ^[[BB2]](%[[V3:.*]]: i32):
^bb2: // 3 preds: ^bb0, ^bb1, ^bb1
%3 = llvm.load %2 {alignment = 4 : i64} : !llvm.ptr -> i32
// CHECK: llvm.return %[[V3]] : i32
llvm.return %3 : i32
}
// -----
// CHECK-LABEL: llvm.func @recursive_alloca
// CHECK-NOT: = llvm.alloca
llvm.func @recursive_alloca() -> i32 {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(0 : i32) : i32
%2 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%3 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%4 = llvm.alloca %0 x !llvm.ptr {alignment = 8 : i64} : (i32) -> !llvm.ptr
llvm.store %1, %3 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.store %3, %4 {alignment = 8 : i64} : !llvm.ptr, !llvm.ptr
%5 = llvm.load %4 {alignment = 8 : i64} : !llvm.ptr -> !llvm.ptr
%6 = llvm.load %5 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.store %6, %2 {alignment = 4 : i64} : i32, !llvm.ptr
%7 = llvm.load %2 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.return %7 : i32
}
// -----
// CHECK-LABEL: llvm.func @reset_in_branch
// CHECK-NOT: = llvm.alloca
// CHECK-NOT: ^{{.*}}({{.*}}):
llvm.func @reset_in_branch(%arg0: i32, %arg1: i1) {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(true) : i1
%2 = llvm.mlir.constant(false) : i1
%3 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.store %arg0, %3 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.cond_br %arg1, ^bb1, ^bb2
^bb1: // pred: ^bb0
llvm.store %arg0, %3 {alignment = 4 : i64} : i32, !llvm.ptr
%4 = llvm.load %3 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.call @reset_in_branch(%4, %2) : (i32, i1) -> ()
llvm.br ^bb3
^bb2: // pred: ^bb0
%5 = llvm.load %3 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.call @reset_in_branch(%5, %1) : (i32, i1) -> ()
llvm.br ^bb3
^bb3: // 2 preds: ^bb1, ^bb2
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @intertwined_alloca
// CHECK-NOT: = llvm.alloca
llvm.func @intertwined_alloca(%arg0: !llvm.ptr, %arg1: i32) {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(0 : i32) : i32
%2 = llvm.alloca %0 x !llvm.ptr {alignment = 8 : i64} : (i32) -> !llvm.ptr
%3 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%4 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%5 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%6 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.store %arg0, %2 {alignment = 8 : i64} : !llvm.ptr, !llvm.ptr
llvm.store %arg1, %3 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.store %1, %4 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb1
^bb1: // 2 preds: ^bb0, ^bb4
%7 = llvm.load %3 {alignment = 4 : i64} : !llvm.ptr -> i32
%8 = llvm.add %7, %0 : i32
%9 = llvm.load %4 {alignment = 4 : i64} : !llvm.ptr -> i32
%10 = llvm.icmp "sgt" %8, %9 : i32
%11 = llvm.zext %10 : i1 to i32
llvm.cond_br %10, ^bb2, ^bb5
^bb2: // pred: ^bb1
%12 = llvm.load %6 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.store %12, %5 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.store %1, %6 {alignment = 4 : i64} : i32, !llvm.ptr
%13 = llvm.load %4 {alignment = 4 : i64} : !llvm.ptr -> i32
%14 = llvm.icmp "sgt" %13, %1 : i32
%15 = llvm.zext %14 : i1 to i32
llvm.cond_br %14, ^bb3, ^bb4
^bb3: // pred: ^bb2
%16 = llvm.load %2 {alignment = 8 : i64} : !llvm.ptr -> !llvm.ptr
%17 = llvm.load %4 {alignment = 4 : i64} : !llvm.ptr -> i32
%18 = llvm.sub %17, %0 : i32
%19 = llvm.getelementptr %16[%18] : (!llvm.ptr, i32) -> !llvm.ptr, i8
%20 = llvm.load %5 {alignment = 4 : i64} : !llvm.ptr -> i32
%21 = llvm.trunc %20 : i32 to i8
llvm.store %21, %19 {alignment = 1 : i64} : i8, !llvm.ptr
llvm.br ^bb4
^bb4: // 2 preds: ^bb2, ^bb3
%22 = llvm.load %4 {alignment = 4 : i64} : !llvm.ptr -> i32
%23 = llvm.add %22, %0 : i32
llvm.store %23, %4 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb1
^bb5: // pred: ^bb1
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @complex_cf
// CHECK-NOT: = llvm.alloca
llvm.func @complex_cf(%arg0: i32, ...) {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(false) : i1
%2 = llvm.mlir.constant(0 : i32) : i32
%3 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.cond_br %1, ^bb1, ^bb2
^bb1: // pred: ^bb0
llvm.br ^bb2
^bb2: // 2 preds: ^bb0, ^bb1
llvm.store %2, %3 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb3
^bb3: // 2 preds: ^bb2, ^bb16
llvm.cond_br %1, ^bb4, ^bb17
^bb4: // pred: ^bb3
llvm.cond_br %1, ^bb5, ^bb14
^bb5: // pred: ^bb4
llvm.cond_br %1, ^bb7, ^bb6
^bb6: // pred: ^bb5
llvm.br ^bb7
^bb7: // 2 preds: ^bb5, ^bb6
llvm.cond_br %1, ^bb9, ^bb8
^bb8: // pred: ^bb7
llvm.br ^bb9
^bb9: // 2 preds: ^bb7, ^bb8
llvm.cond_br %1, ^bb11, ^bb10
^bb10: // pred: ^bb9
llvm.br ^bb11
^bb11: // 2 preds: ^bb9, ^bb10
llvm.cond_br %1, ^bb12, ^bb13
^bb12: // pred: ^bb11
llvm.br ^bb13
^bb13: // 2 preds: ^bb11, ^bb12
llvm.br ^bb14
^bb14: // 2 preds: ^bb4, ^bb13
llvm.cond_br %1, ^bb15, ^bb16
^bb15: // pred: ^bb14
llvm.br ^bb16
^bb16: // 2 preds: ^bb14, ^bb15
llvm.br ^bb3
^bb17: // pred: ^bb3
llvm.br ^bb20
^bb18: // no predecessors
%4 = llvm.load %3 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.br ^bb24
^bb19: // no predecessors
llvm.br ^bb20
^bb20: // 2 preds: ^bb17, ^bb19
llvm.cond_br %1, ^bb21, ^bb22
^bb21: // pred: ^bb20
llvm.br ^bb23
^bb22: // pred: ^bb20
llvm.br ^bb23
^bb23: // 2 preds: ^bb21, ^bb22
llvm.br ^bb24
^bb24: // 2 preds: ^bb18, ^bb23
llvm.br ^bb26
^bb25: // no predecessors
llvm.br ^bb26
^bb26: // 2 preds: ^bb24, ^bb25
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @llvm_crash
llvm.func @llvm_crash() -> i32 {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(0 : i32) : i32
%2 = llvm.mlir.addressof @j : !llvm.ptr
%3 = llvm.mlir.constant(0 : i8) : i8
// CHECK-NOT: = llvm.alloca
// CHECK: %[[VOLATILE_ALLOCA:.*]] = llvm.alloca
// CHECK-NOT: = llvm.alloca
%4 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%5 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%6 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
%7 = llvm.bitcast %1 : i32 to i32
// CHECK: llvm.store volatile %{{.*}}, %[[VOLATILE_ALLOCA]]
llvm.store volatile %1, %5 {alignment = 4 : i64} : i32, !llvm.ptr
%8 = llvm.call @_setjmp(%2) : (!llvm.ptr) -> i32
%9 = llvm.icmp "ne" %8, %1 : i32
%10 = llvm.zext %9 : i1 to i8
%11 = llvm.icmp "ne" %10, %3 : i8
llvm.cond_br %11, ^bb1, ^bb2
^bb1: // pred: ^bb0
// CHECK: = llvm.load volatile %[[VOLATILE_ALLOCA]]
%12 = llvm.load volatile %5 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.store %12, %6 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb3
^bb2: // pred: ^bb0
// CHECK: llvm.store volatile %{{.*}}, %[[VOLATILE_ALLOCA]]
llvm.store volatile %0, %5 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.call @g() : () -> ()
llvm.store %1, %6 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb3
^bb3: // 2 preds: ^bb1, ^bb2
%13 = llvm.load %6 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.store %13, %4 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb4
^bb4: // pred: ^bb3
%14 = llvm.load %4 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.return %14 : i32
}
llvm.mlir.global external @j() {addr_space = 0 : i32} : !llvm.array<1 x struct<"struct.__jmp_buf_tag", (array<6 x i32>, i32, struct<"struct.__sigset_t", (array<32 x i32>)>)>>
llvm.func @_setjmp(!llvm.ptr) -> i32 attributes {passthrough = ["returns_twice"]}
llvm.func @g()
// -----
// CHECK-LABEL: llvm.func amdgpu_kernelcc @addrspace_discard
// CHECK-NOT: = llvm.alloca
llvm.func amdgpu_kernelcc @addrspace_discard() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(2 : i64) : i64
%2 = llvm.alloca %0 x i8 {alignment = 8 : i64} : (i32) -> !llvm.ptr<5>
%3 = llvm.addrspacecast %2 : !llvm.ptr<5> to !llvm.ptr
llvm.intr.lifetime.start 2, %3 : !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @ignore_atomic
// CHECK-SAME: (%[[ARG0:.*]]: i32) -> i32
llvm.func @ignore_atomic(%arg0: i32) -> i32 {
// CHECK-NOT: = llvm.alloca
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.store %arg0, %1 atomic seq_cst {alignment = 4 : i64} : i32, !llvm.ptr
%2 = llvm.load %1 atomic seq_cst {alignment = 4 : i64} : !llvm.ptr -> i32
// CHECK: llvm.return %[[ARG0]] : i32
llvm.return %2 : i32
}
// -----
// CHECK: llvm.func @landing_pad
// CHECK-NOT: = llvm.alloca
llvm.func @landing_pad() -> i32 attributes {personality = @__gxx_personality_v0} {
// CHECK-NOT: = llvm.alloca
// CHECK: %[[UNDEF:.*]] = llvm.mlir.undef : i32
// CHECK-NOT: = llvm.alloca
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
// CHECK: %[[V2:.*]] = llvm.invoke
%2 = llvm.invoke @landing_padf() to ^bb1 unwind ^bb3 : () -> i32
// CHECK: ^{{.*}}:
^bb1:// pred: ^bb0
llvm.store %2, %1 {alignment = 4 : i64} : i32, !llvm.ptr
// CHECK: llvm.br ^[[BB2:.*]](%[[V2]] : i32)
llvm.br ^bb2
// CHECK: ^[[BB2]]([[V3:.*]]: i32):
^bb2:// 2 preds: ^bb1, ^bb3
%3 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i32
// CHECK: llvm.return [[V3]] : i32
llvm.return %3 : i32
// CHECK: ^{{.*}}:
^bb3:// pred: ^bb0
%4 = llvm.landingpad cleanup : !llvm.struct<(ptr, i32)>
// CHECK: llvm.br ^[[BB2:.*]](%[[UNDEF]] : i32)
llvm.br ^bb2
}
llvm.func @landing_padf() -> i32
llvm.func @__gxx_personality_v0(...) -> i32
// -----
// CHECK-LABEL: llvm.func @unreachable_defines
llvm.func @unreachable_defines() -> i32 {
// CHECK-NOT: = llvm.alloca
// CHECK: %[[UNDEF:.*]] = llvm.mlir.undef : i32
// CHECK-NOT: = llvm.alloca
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.br ^bb1
^bb1: // 2 preds: ^bb0, ^bb2
%2 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i32
// CHECK: llvm.return %[[UNDEF]] : i32
llvm.return %2 : i32
^bb2: // no predecessors
%3 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.store %3, %1 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb1
}
// -----
// CHECK-LABEL: llvm.func @unreachable_jumps_to_merge_point
// CHECK-NOT: = llvm.alloca
llvm.func @unreachable_jumps_to_merge_point(%arg0: i1) -> i32 {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(6 : i32) : i32
%2 = llvm.mlir.constant(5 : i32) : i32
%3 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.cond_br %arg0, ^bb1, ^bb2
^bb1: // 2 preds: ^bb0, ^bb4
llvm.store %1, %3 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb4
^bb2: // pred: ^bb0
llvm.store %2, %3 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.br ^bb4
^bb3: // no predecessors
llvm.br ^bb4
^bb4: // 3 preds: ^bb1, ^bb2, ^bb3
%4 = llvm.load %3 {alignment = 4 : i64} : !llvm.ptr -> i32
llvm.return %4 : i32
}
// -----
// CHECK-LABEL: llvm.func @ignore_lifetime
// CHECK-NOT: = llvm.alloca
llvm.func @ignore_lifetime() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.intr.lifetime.start 2, %1 : !llvm.ptr
llvm.store %0, %1 {alignment = 4 : i64} : i32, !llvm.ptr
llvm.intr.lifetime.end 2, %1 : !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @ignore_discardable_tree
// CHECK-NOT: = llvm.alloca
llvm.func @ignore_discardable_tree() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(0 : i16) : i16
%2 = llvm.mlir.constant(0 : i8) : i8
%3 = llvm.mlir.undef : !llvm.struct<(i8, i16)>
%4 = llvm.insertvalue %2, %3[0] : !llvm.struct<(i8, i16)>
%5 = llvm.insertvalue %1, %4[1] : !llvm.struct<(i8, i16)>
%6 = llvm.alloca %0 x !llvm.struct<(i8, i16)> {alignment = 8 : i64} : (i32) -> !llvm.ptr
%7 = llvm.getelementptr %6[0, 0] : (!llvm.ptr) -> !llvm.ptr, !llvm.struct<(i8, i16)>
llvm.intr.lifetime.start 2, %7 : !llvm.ptr
llvm.store %5, %6 {alignment = 2 : i64} : !llvm.struct<(i8, i16)>, !llvm.ptr
llvm.intr.lifetime.end 2, %7 : !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @store_load_forward
llvm.func @store_load_forward() -> i32 {
// CHECK-NOT: = llvm.alloca
%0 = llvm.mlir.constant(1 : i32) : i32
// CHECK: %[[RES:.*]] = llvm.mlir.constant(0 : i32) : i32
%1 = llvm.mlir.constant(0 : i32) : i32
%2 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.store %1, %2 {alignment = 4 : i64} : i32, !llvm.ptr
%3 = llvm.load %2 {alignment = 4 : i64} : !llvm.ptr -> i32
// CHECK: llvm.return %[[RES]] : i32
llvm.return %3 : i32
}
// -----
// CHECK-LABEL: llvm.func @store_load_wrong_type
llvm.func @store_load_wrong_type() -> i16 {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(0 : i32) : i32
// CHECK: = llvm.alloca
%2 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
llvm.store %1, %2 {alignment = 4 : i64} : i32, !llvm.ptr
%3 = llvm.load %2 {alignment = 2 : i64} : !llvm.ptr -> i16
llvm.return %3 : i16
}
// -----
// CHECK-LABEL: llvm.func @merge_point_cycle
llvm.func @merge_point_cycle() {
// CHECK: %[[UNDEF:.*]] = llvm.mlir.undef : i32
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(7 : i32) : i32
%2 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
// CHECK: llvm.br ^[[BB1:.*]](%[[UNDEF]] : i32)
llvm.br ^bb1
// CHECK: ^[[BB1]](%[[BARG:.*]]: i32):
^bb1: // 2 preds: ^bb0, ^bb1
%3 = llvm.load %2 {alignment = 4 : i64} : !llvm.ptr -> i32
// CHECK: = llvm.call @use(%[[BARG]])
%4 = llvm.call @use(%3) : (i32) -> i1
// CHECK: %[[DEF:.*]] = llvm.call @def
%5 = llvm.call @def(%1) : (i32) -> i32
llvm.store %5, %2 {alignment = 4 : i64} : i32, !llvm.ptr
// CHECK: llvm.cond_br %{{.*}}, ^[[BB1]](%[[DEF]] : i32), ^{{.*}}
llvm.cond_br %4, ^bb1, ^bb2
^bb2: // pred: ^bb1
llvm.return
}
llvm.func @def(i32) -> i32
llvm.func @use(i32) -> i1
// -----
// CHECK-LABEL: llvm.func @no_unnecessary_arguments
llvm.func @no_unnecessary_arguments() {
// CHECK: %[[UNDEF:.*]] = llvm.mlir.undef : i32
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.alloca %0 x i32 {alignment = 4 : i64} : (i32) -> !llvm.ptr
// CHECK: llvm.br ^[[BB1:.*]]
llvm.br ^bb1
// CHECK: ^[[BB1]]:
^bb1: // 2 preds: ^bb0, ^bb1
%2 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i32
// CHECK: = llvm.call @use(%[[UNDEF]])
%3 = llvm.call @use(%2) : (i32) -> i1
// CHECK: llvm.cond_br %{{.*}}, ^[[BB1]], ^{{.*}}
llvm.cond_br %3, ^bb1, ^bb2
^bb2: // pred: ^bb1
llvm.return
}
llvm.func @use(i32) -> i1
// -----
// CHECK-LABEL: llvm.func @discardable_use_tree
// CHECK-NOT: = llvm.alloca
llvm.func @discardable_use_tree() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(2 : i64) : i64
%2 = llvm.alloca %0 x i8 {alignment = 8 : i64} : (i32) -> !llvm.ptr
%3 = llvm.bitcast %2 : !llvm.ptr to !llvm.ptr
%4 = llvm.bitcast %3 : !llvm.ptr to !llvm.ptr
llvm.intr.lifetime.start 2, %3 : !llvm.ptr
llvm.intr.lifetime.start 2, %4 : !llvm.ptr
%5 = llvm.intr.invariant.start 2, %3 : !llvm.ptr
llvm.intr.invariant.end %5, 2, %3 : !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @non_discardable_use_tree
llvm.func @non_discardable_use_tree() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(2 : i64) : i64
// CHECK: = llvm.alloca
%2 = llvm.alloca %0 x i8 {alignment = 8 : i64} : (i32) -> !llvm.ptr
%3 = llvm.bitcast %2 : !llvm.ptr to !llvm.ptr
%4 = llvm.bitcast %3 : !llvm.ptr to !llvm.ptr
llvm.intr.lifetime.start 2, %3 : !llvm.ptr
llvm.intr.lifetime.start 2, %4 : !llvm.ptr
llvm.call @use(%4) : (!llvm.ptr) -> i1
llvm.return
}
llvm.func @use(!llvm.ptr) -> i1
// -----
// CHECK-LABEL: llvm.func @trivial_get_element_ptr
// CHECK-NOT: = llvm.alloca
llvm.func @trivial_get_element_ptr() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(2 : i64) : i64
%2 = llvm.alloca %0 x i8 {alignment = 8 : i64} : (i32) -> !llvm.ptr
%3 = llvm.bitcast %2 : !llvm.ptr to !llvm.ptr
%4 = llvm.getelementptr %3[0] : (!llvm.ptr) -> !llvm.ptr, i8
llvm.intr.lifetime.start 2, %3 : !llvm.ptr
llvm.intr.lifetime.start 2, %4 : !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @nontrivial_get_element_ptr
llvm.func @nontrivial_get_element_ptr() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(2 : i64) : i64
// CHECK: = llvm.alloca
%2 = llvm.alloca %0 x i8 {alignment = 8 : i64} : (i32) -> !llvm.ptr
%4 = llvm.getelementptr %2[1] : (!llvm.ptr) -> !llvm.ptr, i8
llvm.intr.lifetime.start 2, %2 : !llvm.ptr
llvm.intr.lifetime.start 2, %4 : !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @dynamic_get_element_ptr
llvm.func @dynamic_get_element_ptr() {
%0 = llvm.mlir.constant(1 : i32) : i32
%1 = llvm.mlir.constant(2 : i64) : i64
// CHECK: = llvm.alloca
%2 = llvm.alloca %0 x i8 {alignment = 8 : i64} : (i32) -> !llvm.ptr
%3 = llvm.bitcast %2 : !llvm.ptr to !llvm.ptr
%4 = llvm.getelementptr %3[%0] : (!llvm.ptr, i32) -> !llvm.ptr, i8
llvm.intr.lifetime.start 2, %3 : !llvm.ptr
llvm.intr.lifetime.start 2, %4 : !llvm.ptr
llvm.return
}
// -----
// CHECK-LABEL: llvm.func @live_cycle
// CHECK-SAME: (%[[ARG0:.*]]: i64, %{{.*}}: i1, %[[ARG2:.*]]: i64) -> i64
llvm.func @live_cycle(%arg0: i64, %arg1: i1, %arg2: i64) -> i64 {
%0 = llvm.mlir.constant(1 : i32) : i32
// CHECK-NOT: = llvm.alloca
%1 = llvm.alloca %0 x i64 {alignment = 8 : i64} : (i32) -> !llvm.ptr
llvm.store %arg2, %1 {alignment = 4 : i64} : i64, !llvm.ptr
// CHECK: llvm.cond_br %{{.*}}, ^[[BB1:.*]](%[[ARG2]] : i64), ^[[BB2:.*]](%[[ARG2]] : i64)
llvm.cond_br %arg1, ^bb1, ^bb2
// CHECK: ^[[BB1]](%[[V1:.*]]: i64):
^bb1:
%2 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i64
// CHECK: llvm.call @use(%[[V1]])
llvm.call @use(%2) : (i64) -> ()
llvm.store %arg0, %1 {alignment = 4 : i64} : i64, !llvm.ptr
// CHECK: llvm.br ^[[BB2]](%[[ARG0]] : i64)
llvm.br ^bb2
// CHECK: ^[[BB2]](%[[V2:.*]]: i64):
^bb2:
// CHECK: llvm.br ^[[BB1]](%[[V2]] : i64)
llvm.br ^bb1
}
llvm.func @use(i64)
// -----
// This test should no longer be an issue once promotion within subregions
// is supported.
// CHECK-LABEL: llvm.func @subregion_block_promotion
// CHECK-SAME: (%[[ARG0:.*]]: i64, %[[ARG1:.*]]: i64) -> i64
llvm.func @subregion_block_promotion(%arg0: i64, %arg1: i64) -> i64 {
%0 = llvm.mlir.constant(1 : i32) : i32
// CHECK: %[[ALLOCA:.*]] = llvm.alloca
%1 = llvm.alloca %0 x i64 {alignment = 8 : i64} : (i32) -> !llvm.ptr
// CHECK: llvm.store %[[ARG1]], %[[ALLOCA]]
llvm.store %arg1, %1 {alignment = 4 : i64} : i64, !llvm.ptr
// CHECK: scf.execute_region {
scf.execute_region {
// CHECK: llvm.store %[[ARG0]], %[[ALLOCA]]
llvm.store %arg0, %1 {alignment = 4 : i64} : i64, !llvm.ptr
scf.yield
}
// CHECK: }
// CHECK: %[[RES:.*]] = llvm.load %[[ALLOCA]]
%2 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i64
// CHECK: llvm.return %[[RES]] : i64
llvm.return %2 : i64
}
// -----
// CHECK-LABEL: llvm.func @subregion_simple_transitive_promotion
// CHECK-SAME: (%[[ARG0:.*]]: i64, %[[ARG1:.*]]: i64) -> i64
llvm.func @subregion_simple_transitive_promotion(%arg0: i64, %arg1: i64) -> i64 {
%0 = llvm.mlir.constant(1 : i32) : i32
// CHECK-NOT: = llvm.alloca
%1 = llvm.alloca %0 x i64 {alignment = 8 : i64} : (i32) -> !llvm.ptr
llvm.store %arg1, %1 {alignment = 4 : i64} : i64, !llvm.ptr
%2 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i64
// CHECK: scf.execute_region {
scf.execute_region {
// CHECK: llvm.call @use(%[[ARG1]])
llvm.call @use(%2) : (i64) -> ()
scf.yield
}
// CHECK: }
// CHECK: llvm.return %[[ARG1]] : i64
llvm.return %2 : i64
}
llvm.func @use(i64)
// -----
// This behavior is specific to the LLVM dialect, because LLVM semantics are
// that reaching an alloca multiple times allocates on the stack multiple
// times. Promoting an alloca that is reached multiple times could lead to
// changes in observable behavior. Thus only allocas in the entry block are
// promoted.
// CHECK-LABEL: llvm.func @no_inner_alloca_promotion
// CHECK-SAME: (%[[ARG:.*]]: i64) -> i64
llvm.func @no_inner_alloca_promotion(%arg: i64) -> i64 {
%0 = llvm.mlir.constant(1 : i32) : i32
llvm.br ^bb1
^bb1:
// CHECK: %[[ALLOCA:.*]] = llvm.alloca
%1 = llvm.alloca %0 x i64 {alignment = 8 : i64} : (i32) -> !llvm.ptr
// CHECK: llvm.store %[[ARG]], %[[ALLOCA]]
llvm.store %arg, %1 {alignment = 4 : i64} : i64, !llvm.ptr
// CHECK: %[[RES:.*]] = llvm.load %[[ALLOCA]]
%2 = llvm.load %1 {alignment = 4 : i64} : !llvm.ptr -> i64
// CHECK: llvm.return %[[RES]] : i64
llvm.return %2 : i64
}
// -----
// CHECK-LABEL: @transitive_reaching_def
llvm.func @transitive_reaching_def() -> !llvm.ptr {
%0 = llvm.mlir.constant(1 : i32) : i32
// CHECK-NOT: alloca
%1 = llvm.alloca %0 x !llvm.ptr {alignment = 8 : i64} : (i32) -> !llvm.ptr
%2 = llvm.load %1 {alignment = 8 : i64} : !llvm.ptr -> !llvm.ptr
llvm.store %2, %1 {alignment = 8 : i64} : !llvm.ptr, !llvm.ptr
%3 = llvm.load %1 {alignment = 8 : i64} : !llvm.ptr -> !llvm.ptr
llvm.return %3 : !llvm.ptr
}