| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py |
| ; RUN: opt -passes="ipsccp<func-spec>" -funcspec-max-clones=0 -funcspec-min-function-size=14 -S < %s | FileCheck %s --check-prefix=NONE |
| ; RUN: opt -passes="ipsccp<func-spec>" -funcspec-max-clones=1 -funcspec-min-function-size=14 -S < %s | FileCheck %s --check-prefix=ONE |
| ; RUN: opt -passes="ipsccp<func-spec>" -funcspec-max-clones=2 -funcspec-min-function-size=14 -S < %s | FileCheck %s --check-prefix=TWO |
| ; RUN: opt -passes="ipsccp<func-spec>" -funcspec-max-clones=3 -funcspec-min-function-size=14 -S < %s | FileCheck %s --check-prefix=THREE |
| |
| ; Make sure that we iterate correctly after sorting the specializations: |
| ; FnSpecialization: Specializations for function compute |
| ; FnSpecialization: Gain = 608 |
| ; FnSpecialization: FormalArg = binop1, ActualArg = power |
| ; FnSpecialization: FormalArg = binop2, ActualArg = mul |
| ; FnSpecialization: Gain = 982 |
| ; FnSpecialization: FormalArg = binop1, ActualArg = plus |
| ; FnSpecialization: FormalArg = binop2, ActualArg = minus |
| ; FnSpecialization: Gain = 795 |
| ; FnSpecialization: FormalArg = binop1, ActualArg = minus |
| ; FnSpecialization: FormalArg = binop2, ActualArg = power |
| |
| define i64 @main(i64 %x, i64 %y, i1 %flag) { |
| ; NONE-LABEL: @main( |
| ; NONE-NEXT: entry: |
| ; NONE-NEXT: br i1 [[FLAG:%.*]], label [[PLUS:%.*]], label [[MINUS:%.*]] |
| ; NONE: plus: |
| ; NONE-NEXT: [[TMP0:%.*]] = call i64 @compute(i64 [[X:%.*]], i64 [[Y:%.*]], ptr @power, ptr @mul) |
| ; NONE-NEXT: br label [[MERGE:%.*]] |
| ; NONE: minus: |
| ; NONE-NEXT: [[TMP1:%.*]] = call i64 @compute(i64 [[X]], i64 [[Y]], ptr @plus, ptr @minus) |
| ; NONE-NEXT: br label [[MERGE]] |
| ; NONE: merge: |
| ; NONE-NEXT: [[TMP2:%.*]] = phi i64 [ [[TMP0]], [[PLUS]] ], [ [[TMP1]], [[MINUS]] ] |
| ; NONE-NEXT: [[TMP3:%.*]] = call i64 @compute(i64 [[TMP2]], i64 42, ptr @minus, ptr @power) |
| ; NONE-NEXT: ret i64 [[TMP3]] |
| ; |
| ; ONE-LABEL: @main( |
| ; ONE-NEXT: entry: |
| ; ONE-NEXT: br i1 [[FLAG:%.*]], label [[PLUS:%.*]], label [[MINUS:%.*]] |
| ; ONE: plus: |
| ; ONE-NEXT: [[TMP0:%.*]] = call i64 @compute(i64 [[X:%.*]], i64 [[Y:%.*]], ptr @power, ptr @mul) |
| ; ONE-NEXT: br label [[MERGE:%.*]] |
| ; ONE: minus: |
| ; ONE-NEXT: [[TMP1:%.*]] = call i64 @compute.specialized.1(i64 [[X]], i64 [[Y]], ptr @plus, ptr @minus) |
| ; ONE-NEXT: br label [[MERGE]] |
| ; ONE: merge: |
| ; ONE-NEXT: [[TMP2:%.*]] = phi i64 [ [[TMP0]], [[PLUS]] ], [ [[TMP1]], [[MINUS]] ] |
| ; ONE-NEXT: [[TMP3:%.*]] = call i64 @compute(i64 [[TMP2]], i64 42, ptr @minus, ptr @power) |
| ; ONE-NEXT: ret i64 [[TMP3]] |
| ; |
| ; TWO-LABEL: @main( |
| ; TWO-NEXT: entry: |
| ; TWO-NEXT: br i1 [[FLAG:%.*]], label [[PLUS:%.*]], label [[MINUS:%.*]] |
| ; TWO: plus: |
| ; TWO-NEXT: [[TMP0:%.*]] = call i64 @compute(i64 [[X:%.*]], i64 [[Y:%.*]], ptr @power, ptr @mul) |
| ; TWO-NEXT: br label [[MERGE:%.*]] |
| ; TWO: minus: |
| ; TWO-NEXT: [[TMP1:%.*]] = call i64 @compute.specialized.2(i64 [[X]], i64 [[Y]], ptr @plus, ptr @minus) |
| ; TWO-NEXT: br label [[MERGE]] |
| ; TWO: merge: |
| ; TWO-NEXT: [[TMP2:%.*]] = phi i64 [ [[TMP0]], [[PLUS]] ], [ [[TMP1]], [[MINUS]] ] |
| ; TWO-NEXT: [[TMP3:%.*]] = call i64 @compute.specialized.1(i64 [[TMP2]], i64 42, ptr @minus, ptr @power) |
| ; TWO-NEXT: ret i64 [[TMP3]] |
| ; |
| ; THREE-LABEL: @main( |
| ; THREE-NEXT: entry: |
| ; THREE-NEXT: br i1 [[FLAG:%.*]], label [[PLUS:%.*]], label [[MINUS:%.*]] |
| ; THREE: plus: |
| ; THREE-NEXT: [[TMP0:%.*]] = call i64 @compute.specialized.1(i64 [[X:%.*]], i64 [[Y:%.*]], ptr @power, ptr @mul) |
| ; THREE-NEXT: br label [[MERGE:%.*]] |
| ; THREE: minus: |
| ; THREE-NEXT: [[TMP1:%.*]] = call i64 @compute.specialized.2(i64 [[X]], i64 [[Y]], ptr @plus, ptr @minus) |
| ; THREE-NEXT: br label [[MERGE]] |
| ; THREE: merge: |
| ; THREE-NEXT: [[TMP2:%.*]] = phi i64 [ [[TMP0]], [[PLUS]] ], [ [[TMP1]], [[MINUS]] ] |
| ; THREE-NEXT: [[TMP3:%.*]] = call i64 @compute.specialized.3(i64 [[TMP2]], i64 42, ptr @minus, ptr @power) |
| ; THREE-NEXT: ret i64 [[TMP3]] |
| ; |
| entry: |
| br i1 %flag, label %plus, label %minus |
| |
| plus: |
| %tmp0 = call i64 @compute(i64 %x, i64 %y, ptr @power, ptr @mul) |
| br label %merge |
| |
| minus: |
| %tmp1 = call i64 @compute(i64 %x, i64 %y, ptr @plus, ptr @minus) |
| br label %merge |
| |
| merge: |
| %tmp2 = phi i64 [ %tmp0, %plus ], [ %tmp1, %minus] |
| %tmp3 = call i64 @compute(i64 %tmp2, i64 42, ptr @minus, ptr @power) |
| ret i64 %tmp3 |
| } |
| |
| ; THREE-NOT: define internal i64 @compute |
| ; |
| ; THREE-LABEL: define internal i64 @compute.specialized.1(i64 %x, i64 %y, ptr %binop1, ptr %binop2) { |
| ; THREE-NEXT: entry: |
| ; THREE-NEXT: [[TMP0:%.+]] = call i64 @power(i64 %x, i64 %y) |
| ; THREE-NEXT: [[TMP1:%.+]] = call i64 @mul(i64 %x, i64 %y) |
| ; THREE-NEXT: [[TMP2:%.+]] = add i64 [[TMP0]], [[TMP1]] |
| ; THREE-NEXT: [[TMP3:%.+]] = sdiv i64 [[TMP2]], %x |
| ; THREE-NEXT: [[TMP4:%.+]] = sub i64 [[TMP3]], %y |
| ; THREE-NEXT: [[TMP5:%.+]] = mul i64 [[TMP4]], 2 |
| ; THREE-NEXT: ret i64 [[TMP5]] |
| ; THREE-NEXT: } |
| ; |
| ; THREE-LABEL: define internal i64 @compute.specialized.2(i64 %x, i64 %y, ptr %binop1, ptr %binop2) { |
| ; THREE-NEXT: entry: |
| ; THREE-NEXT: [[TMP0:%.+]] = call i64 @plus(i64 %x, i64 %y) |
| ; THREE-NEXT: [[TMP1:%.+]] = call i64 @minus(i64 %x, i64 %y) |
| ; THREE-NEXT: [[TMP2:%.+]] = add i64 [[TMP0]], [[TMP1]] |
| ; THREE-NEXT: [[TMP3:%.+]] = sdiv i64 [[TMP2]], %x |
| ; THREE-NEXT: [[TMP4:%.+]] = sub i64 [[TMP3]], %y |
| ; THREE-NEXT: [[TMP5:%.+]] = mul i64 [[TMP4]], 2 |
| ; THREE-NEXT: ret i64 [[TMP5]] |
| ; THREE-NEXT: } |
| ; |
| ; THREE-LABEL: define internal i64 @compute.specialized.3(i64 %x, i64 %y, ptr %binop1, ptr %binop2) { |
| ; THREE-NEXT: entry: |
| ; THREE-NEXT: [[TMP0:%.+]] = call i64 @minus(i64 %x, i64 %y) |
| ; THREE-NEXT: [[TMP1:%.+]] = call i64 @power(i64 %x, i64 %y) |
| ; THREE-NEXT: [[TMP2:%.+]] = add i64 [[TMP0]], [[TMP1]] |
| ; THREE-NEXT: [[TMP3:%.+]] = sdiv i64 [[TMP2]], %x |
| ; THREE-NEXT: [[TMP4:%.+]] = sub i64 [[TMP3]], %y |
| ; THREE-NEXT: [[TMP5:%.+]] = mul i64 [[TMP4]], 2 |
| ; THREE-NEXT: ret i64 [[TMP5]] |
| ; THREE-NEXT: } |
| ; |
| define internal i64 @compute(i64 %x, i64 %y, ptr %binop1, ptr %binop2) { |
| entry: |
| %tmp0 = call i64 %binop1(i64 %x, i64 %y) |
| %tmp1 = call i64 %binop2(i64 %x, i64 %y) |
| %add = add i64 %tmp0, %tmp1 |
| %div = sdiv i64 %add, %x |
| %sub = sub i64 %div, %y |
| %mul = mul i64 %sub, 2 |
| ret i64 %mul |
| } |
| |
| define internal i64 @plus(i64 %x, i64 %y) { |
| entry: |
| %tmp0 = add i64 %x, %y |
| ret i64 %tmp0 |
| } |
| |
| define internal i64 @minus(i64 %x, i64 %y) { |
| entry: |
| %tmp0 = sub i64 %x, %y |
| ret i64 %tmp0 |
| } |
| |
| define internal i64 @mul(i64 %x, i64 %n) { |
| entry: |
| %cmp6 = icmp sgt i64 %n, 1 |
| br i1 %cmp6, label %for.body, label %for.cond.cleanup |
| |
| for.cond.cleanup: ; preds = %for.body, %entry |
| %x.addr.0.lcssa = phi i64 [ %x, %entry ], [ %add, %for.body ] |
| ret i64 %x.addr.0.lcssa |
| |
| for.body: ; preds = %entry, %for.body |
| %indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 1, %entry ] |
| %x.addr.07 = phi i64 [ %add, %for.body ], [ %x, %entry ] |
| %add = shl nsw i64 %x.addr.07, 1 |
| %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1 |
| %exitcond.not = icmp eq i64 %indvars.iv.next, %n |
| br i1 %exitcond.not, label %for.cond.cleanup, label %for.body |
| } |
| |
| define internal i64 @power(i64 %x, i64 %n) { |
| entry: |
| %cmp6 = icmp sgt i64 %n, 1 |
| br i1 %cmp6, label %for.body, label %for.cond.cleanup |
| |
| for.cond.cleanup: ; preds = %for.body, %entry |
| %x.addr.0.lcssa = phi i64 [ %x, %entry ], [ %mul, %for.body ] |
| ret i64 %x.addr.0.lcssa |
| |
| for.body: ; preds = %entry, %for.body |
| %indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 1, %entry ] |
| %x.addr.07 = phi i64 [ %mul, %for.body ], [ %x, %entry ] |
| %mul = mul nsw i64 %x.addr.07, %x.addr.07 |
| %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1 |
| %exitcond.not = icmp eq i64 %indvars.iv.next, %n |
| br i1 %exitcond.not, label %for.cond.cleanup, label %for.body |
| } |