| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 6 |
| ; RUN: llc -mtriple=riscv64 -mattr=+m -O2 < %s | FileCheck %s -check-prefix=RV64 |
| ; RUN: llc -mtriple=riscv32 -mattr=+m -O2 < %s | FileCheck %s -check-prefix=RV32 |
| |
| ; Test that very large outgoing call frames in functions with variable-sized |
| ; objects get proper stack probing. The outgoing args are large enough to force |
| ; the PROBED_STACKALLOC path, which must be expanded in a non-entry block. |
| |
| define void @f(i64 %n) #0 { |
| ; RV64-LABEL: f: |
| ; RV64: # %bb.0: # %entry |
| ; RV64-NEXT: addi sp, sp, -16 |
| ; RV64-NEXT: .cfi_def_cfa_offset 16 |
| ; RV64-NEXT: sd zero, 0(sp) |
| ; RV64-NEXT: sd ra, 8(sp) # 8-byte Folded Spill |
| ; RV64-NEXT: sd s0, 0(sp) # 8-byte Folded Spill |
| ; RV64-NEXT: .cfi_offset ra, -8 |
| ; RV64-NEXT: .cfi_offset s0, -16 |
| ; RV64-NEXT: addi s0, sp, 16 |
| ; RV64-NEXT: .cfi_def_cfa s0, 0 |
| ; RV64-NEXT: slli a0, a0, 2 |
| ; RV64-NEXT: addi a0, a0, 15 |
| ; RV64-NEXT: andi a0, a0, -16 |
| ; RV64-NEXT: sub a0, sp, a0 |
| ; RV64-NEXT: lui a1, 1 |
| ; RV64-NEXT: .LBB0_1: # %entry |
| ; RV64-NEXT: # =>This Inner Loop Header: Depth=1 |
| ; RV64-NEXT: sub sp, sp, a1 |
| ; RV64-NEXT: sd zero, 0(sp) |
| ; RV64-NEXT: bltu a0, sp, .LBB0_1 |
| ; RV64-NEXT: # %bb.2: # %entry |
| ; RV64-NEXT: mv sp, a0 |
| ; RV64-NEXT: lui a1, 5 |
| ; RV64-NEXT: sub t1, sp, a1 |
| ; RV64-NEXT: lui t2, 1 |
| ; RV64-NEXT: .LBB0_3: # %entry |
| ; RV64-NEXT: # =>This Inner Loop Header: Depth=1 |
| ; RV64-NEXT: sub sp, sp, t2 |
| ; RV64-NEXT: sd zero, 0(sp) |
| ; RV64-NEXT: bne sp, t1, .LBB0_3 |
| ; RV64-NEXT: # %bb.4: # %entry |
| ; RV64-NEXT: addi sp, sp, -2048 |
| ; RV64-NEXT: addi sp, sp, -1424 |
| ; RV64-NEXT: sd zero, 0(sp) |
| ; RV64-NEXT: call g |
| ; RV64-NEXT: lui a0, 6 |
| ; RV64-NEXT: addi a0, a0, -624 |
| ; RV64-NEXT: add sp, sp, a0 |
| ; RV64-NEXT: addi sp, s0, -16 |
| ; RV64-NEXT: .cfi_def_cfa sp, 16 |
| ; RV64-NEXT: ld ra, 8(sp) # 8-byte Folded Reload |
| ; RV64-NEXT: ld s0, 0(sp) # 8-byte Folded Reload |
| ; RV64-NEXT: .cfi_restore ra |
| ; RV64-NEXT: .cfi_restore s0 |
| ; RV64-NEXT: addi sp, sp, 16 |
| ; RV64-NEXT: .cfi_def_cfa_offset 0 |
| ; RV64-NEXT: ret |
| ; |
| ; RV32-LABEL: f: |
| ; RV32: # %bb.0: # %entry |
| ; RV32-NEXT: addi sp, sp, -16 |
| ; RV32-NEXT: .cfi_def_cfa_offset 16 |
| ; RV32-NEXT: sw zero, 0(sp) |
| ; RV32-NEXT: sw ra, 12(sp) # 4-byte Folded Spill |
| ; RV32-NEXT: sw s0, 8(sp) # 4-byte Folded Spill |
| ; RV32-NEXT: .cfi_offset ra, -4 |
| ; RV32-NEXT: .cfi_offset s0, -8 |
| ; RV32-NEXT: addi s0, sp, 16 |
| ; RV32-NEXT: .cfi_def_cfa s0, 0 |
| ; RV32-NEXT: slli a0, a0, 2 |
| ; RV32-NEXT: addi a0, a0, 15 |
| ; RV32-NEXT: andi a0, a0, -16 |
| ; RV32-NEXT: sub a0, sp, a0 |
| ; RV32-NEXT: lui a1, 1 |
| ; RV32-NEXT: .LBB0_1: # %entry |
| ; RV32-NEXT: # =>This Inner Loop Header: Depth=1 |
| ; RV32-NEXT: sub sp, sp, a1 |
| ; RV32-NEXT: sw zero, 0(sp) |
| ; RV32-NEXT: bltu a0, sp, .LBB0_1 |
| ; RV32-NEXT: # %bb.2: # %entry |
| ; RV32-NEXT: mv sp, a0 |
| ; RV32-NEXT: lui a1, 5 |
| ; RV32-NEXT: sub t1, sp, a1 |
| ; RV32-NEXT: lui t2, 1 |
| ; RV32-NEXT: .LBB0_3: # %entry |
| ; RV32-NEXT: # =>This Inner Loop Header: Depth=1 |
| ; RV32-NEXT: sub sp, sp, t2 |
| ; RV32-NEXT: sw zero, 0(sp) |
| ; RV32-NEXT: bne sp, t1, .LBB0_3 |
| ; RV32-NEXT: # %bb.4: # %entry |
| ; RV32-NEXT: addi sp, sp, -2048 |
| ; RV32-NEXT: addi sp, sp, -1456 |
| ; RV32-NEXT: sw zero, 0(sp) |
| ; RV32-NEXT: call g |
| ; RV32-NEXT: lui a0, 6 |
| ; RV32-NEXT: addi a0, a0, -592 |
| ; RV32-NEXT: add sp, sp, a0 |
| ; RV32-NEXT: addi sp, s0, -16 |
| ; RV32-NEXT: .cfi_def_cfa sp, 16 |
| ; RV32-NEXT: lw ra, 12(sp) # 4-byte Folded Reload |
| ; RV32-NEXT: lw s0, 8(sp) # 4-byte Folded Reload |
| ; RV32-NEXT: .cfi_restore ra |
| ; RV32-NEXT: .cfi_restore s0 |
| ; RV32-NEXT: addi sp, sp, 16 |
| ; RV32-NEXT: .cfi_def_cfa_offset 0 |
| ; RV32-NEXT: ret |
| entry: |
| %v = alloca i32, i64 %n |
| call void @g(ptr %v, [3000 x i64] poison) |
| ret void |
| } |
| |
| declare void @g(ptr, [3000 x i64]) |
| |
| attributes #0 = { "probe-stack"="inline-asm" } |