blob: 6001e6040a74175cb05d03b2d752b83fd7b65900 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals
; RUN: opt -passes=tailcallelim -S %s -o - | FileCheck %s --check-prefixes=CHECK,ENABLED
; RUN: opt -passes=tailcallelim -tre-disable-entrycount-recompute -S %s -o - | FileCheck %s --check-prefixes=CHECK,DISABLED
; Test that tail call elimination correctly adjusts function entry counts
; when eliminating tail recursive calls.
; Basic test: eliminate a tail call and adjust entry count
define i32 @test_basic_entry_count_adjustment(i32 %n) !prof !0 {
; CHECK-LABEL: @test_basic_entry_count_adjustment(
; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[TAILRECURSE:%.*]]
; CHECK: tailrecurse:
; CHECK-NEXT: [[N_TR:%.*]] = phi i32 [ [[N:%.*]], [[ENTRY:%.*]] ], [ [[SUB:%.*]], [[IF_THEN:%.*]] ]
; CHECK-NEXT: [[CMP:%.*]] = icmp sgt i32 [[N_TR]], 0
; CHECK-NEXT: br i1 [[CMP]], label [[IF_THEN]], label [[IF_ELSE:%.*]], !prof [[PROF1:![0-9]+]]
; CHECK: if.then:
; CHECK-NEXT: [[SUB]] = sub i32 [[N_TR]], 1
; CHECK-NEXT: br label [[TAILRECURSE]]
; CHECK: if.else:
; CHECK-NEXT: ret i32 0
;
entry:
%cmp = icmp sgt i32 %n, 0
br i1 %cmp, label %if.then, label %if.else, !prof !1
if.then: ; preds = %entry
%sub = sub i32 %n, 1
%call = tail call i32 @test_basic_entry_count_adjustment(i32 %sub)
ret i32 %call
if.else: ; preds = %entry
ret i32 0
}
; Test multiple tail calls in different blocks with different frequencies
define i32 @test_multiple_blocks_entry_count(i32 %n, i32 %flag) !prof !2 {
; CHECK-LABEL: @test_multiple_blocks_entry_count(
; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[TAILRECURSE:%.*]]
; CHECK: tailrecurse:
; CHECK-NEXT: [[N_TR:%.*]] = phi i32 [ [[N:%.*]], [[ENTRY:%.*]] ], [ [[SUB1:%.*]], [[BLOCK1:%.*]] ], [ [[SUB2:%.*]], [[BLOCK2:%.*]] ]
; CHECK-NEXT: [[CMP:%.*]] = icmp sgt i32 [[N_TR]], 0
; CHECK-NEXT: br i1 [[CMP]], label [[CHECK_FLAG:%.*]], label [[BASE_CASE:%.*]], !prof [[PROF3:![0-9]+]]
; CHECK: check.flag:
; CHECK-NEXT: [[CMP_FLAG:%.*]] = icmp eq i32 [[FLAG:%.*]], 1
; CHECK-NEXT: br i1 [[CMP_FLAG]], label [[BLOCK1]], label [[BLOCK2]], !prof [[PROF4:![0-9]+]]
; CHECK: block1:
; CHECK-NEXT: [[SUB1]] = sub i32 [[N_TR]], 1
; CHECK-NEXT: br label [[TAILRECURSE]]
; CHECK: block2:
; CHECK-NEXT: [[SUB2]] = sub i32 [[N_TR]], 2
; CHECK-NEXT: br label [[TAILRECURSE]]
; CHECK: base.case:
; CHECK-NEXT: ret i32 1
;
entry:
%cmp = icmp sgt i32 %n, 0
br i1 %cmp, label %check.flag, label %base.case, !prof !3
check.flag:
%cmp.flag = icmp eq i32 %flag, 1
br i1 %cmp.flag, label %block1, label %block2, !prof !4
block1: ; preds = %check.flag
%sub1 = sub i32 %n, 1
%call1 = tail call i32 @test_multiple_blocks_entry_count(i32 %sub1, i32 %flag)
ret i32 %call1
block2: ; preds = %check.flag
%sub2 = sub i32 %n, 2
%call2 = tail call i32 @test_multiple_blocks_entry_count(i32 %sub2, i32 %flag)
ret i32 %call2
base.case: ; preds = %entry
ret i32 1
}
define i32 @test_no_entry_count(i32 %n) {
; CHECK-LABEL: @test_no_entry_count(
; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[TAILRECURSE:%.*]]
; CHECK: tailrecurse:
; CHECK-NEXT: [[N_TR:%.*]] = phi i32 [ [[N:%.*]], [[ENTRY:%.*]] ], [ [[SUB:%.*]], [[IF_THEN:%.*]] ]
; CHECK-NEXT: [[CMP:%.*]] = icmp sgt i32 [[N_TR]], 0
; CHECK-NEXT: br i1 [[CMP]], label [[IF_THEN]], label [[IF_ELSE:%.*]]
; CHECK: if.then:
; CHECK-NEXT: [[SUB]] = sub i32 [[N_TR]], 1
; CHECK-NEXT: br label [[TAILRECURSE]]
; CHECK: if.else:
; CHECK-NEXT: ret i32 0
;
entry:
%cmp = icmp sgt i32 %n, 0
br i1 %cmp, label %if.then, label %if.else
if.then: ; preds = %entry
%sub = sub i32 %n, 1
%call = tail call i32 @test_no_entry_count(i32 %sub)
ret i32 %call
if.else: ; preds = %entry
ret i32 0
}
; Function entry count metadata
!0 = !{!"function_entry_count", i64 1000}
!1 = !{!"branch_weights", i32 800, i32 200}
!2 = !{!"function_entry_count", i64 2000}
!3 = !{!"branch_weights", i32 3, i32 1}
!4 = !{!"branch_weights", i32 100, i32 900}
;.
; ENABLED: [[META0:![0-9]+]] = !{!"function_entry_count", i64 200}
; ENABLED: [[PROF1]] = !{!"branch_weights", i32 800, i32 200}
; ENABLED: [[META2:![0-9]+]] = !{!"function_entry_count", i64 500}
; ENABLED: [[PROF3]] = !{!"branch_weights", i32 3, i32 1}
; ENABLED: [[PROF4]] = !{!"branch_weights", i32 100, i32 900}
;.
; DISABLED: [[META0:![0-9]+]] = !{!"function_entry_count", i64 1000}
; DISABLED: [[PROF1]] = !{!"branch_weights", i32 800, i32 200}
; DISABLED: [[META2:![0-9]+]] = !{!"function_entry_count", i64 2000}
; DISABLED: [[PROF3]] = !{!"branch_weights", i32 3, i32 1}
; DISABLED: [[PROF4]] = !{!"branch_weights", i32 100, i32 900}
;.