; test/Transforms/LoopStrengthReduce/X86/lsr-filtering-scaledreg.ll - llvm - Git at Google

 ; RUN: opt < %s -loop-reduce -lsr-filter-same-scaled-reg=true -mtriple=x86_64-unknown-linux-gnu -S | FileCheck %s

 ; Data layout for the module: little-endian ("e"), ELF-style name mangling ("m:e"),
 ; i64 aligned to 64 bits, f80 aligned to 128 bits, native integer widths of
 ; 8/16/32/64 bits, and a 128-bit stack alignment ("S128").
 target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"

 ; Aggregate type of @global. @foo only reads the i64 fields at indices 3 and 4.
 %struct.ham = type { i8, i8, [5 x i32], i64, i64, i64 }

 ; Externally defined instance of %struct.ham; @foo loads two of its fields to
 ; compute the starting pointer of its first loop.
 @global = external local_unnamed_addr global %struct.ham, align 8

 ; Reduced input for the loop-strength-reduction pass run with
 ; -lsr-filter-same-scaled-reg=true. The function takes no arguments and contains
 ; two loops (bb9/bb12 and bb24); no block ends in a ret.
 define void @foo() local_unnamed_addr {
 bb:
   ; Read field 3 of @global and keep only bits 8..10 (1792 == 0x700).
   %tmp = load i64, i64* getelementptr inbounds (%struct.ham, %struct.ham* @global, i64 0, i32 3), align 8
   %tmp1 = and i64 %tmp, 1792
   ; Add field 4 of @global to the masked value.
   %tmp2 = load i64, i64* getelementptr inbounds (%struct.ham, %struct.ham* @global, i64 0, i32 4), align 8
   %tmp3 = add i64 %tmp1, %tmp2
   ; Base pointer, loaded through a null i8** (presumably an artifact of test
   ; reduction -- TODO confirm).
   %tmp4 = load i8*, i8** null, align 8
   ; Same address as %tmp4 (offset 0); only used by the %tmp30 compare in bb24.
   %tmp5 = getelementptr inbounds i8, i8* %tmp4, i64 0
   ; %tmp7 = %tmp4 - %tmp3: initial value of the first pointer induction variable.
   %tmp6 = sub i64 0, %tmp3
   %tmp7 = getelementptr inbounds i8, i8* %tmp4, i64 %tmp6
   ; Null pointer: initial value of the second pointer induction variable.
   %tmp8 = inttoptr i64 0 to i8*
   br label %bb9

 ; Without filtering non-optimal formulae that share the same ScaledReg and Scale,
 ; the strategy of narrowing the LSR search space by picking a winner register
 ; would generate only one lsr.iv and a suboptimal result.
 ; The FileCheck directives below require the optimized bb9 to start with two
 ; consecutive i8* phi nodes.
 ; CHECK-LABEL: @foo(
 ; CHECK: bb9:
 ; CHECK-NEXT: = phi i8*
 ; CHECK-NEXT: = phi i8*

 bb9:                                              ; preds = %bb12, %bb
   ; Two pointer induction variables; bb12 advances each of them by 16 bytes.
   %tmp10 = phi i8* [ %tmp7, %bb ], [ %tmp16, %bb12 ]
   %tmp11 = phi i8* [ %tmp8, %bb ], [ %tmp17, %bb12 ]
   ; The condition is the constant false, so the bb12 successor is always taken.
   br i1 false, label %bb18, label %bb12

 bb12:                                             ; preds = %bb9
   ; Load an i64 from %tmp10 + 8 with byte alignment; the loaded value is unused.
   %tmp13 = getelementptr inbounds i8, i8* %tmp10, i64 8
   %tmp14 = bitcast i8* %tmp13 to i64*
   %tmp15 = load i64, i64* %tmp14, align 1
   ; Step both pointers by 16 bytes for the next iteration.
   %tmp16 = getelementptr inbounds i8, i8* %tmp10, i64 16
   %tmp17 = getelementptr inbounds i8, i8* %tmp11, i64 16
   br label %bb9

 bb18:                                             ; preds = %bb9
   ; Unsigned compare against null: true when %tmp11 is non-null.
   %tmp19 = icmp ugt i8* %tmp11, null
   ; Start the second loop at the current pointers when %tmp19 is true,
   ; otherwise 8 bytes past them.
   %tmp20 = getelementptr inbounds i8, i8* %tmp10, i64 8
   %tmp21 = getelementptr inbounds i8, i8* %tmp11, i64 8
   %tmp22 = select i1 %tmp19, i8* %tmp10, i8* %tmp20
   %tmp23 = select i1 %tmp19, i8* %tmp11, i8* %tmp21
   br label %bb24

 bb24:                                             ; preds = %bb24, %bb18
   ; Byte-at-a-time copy: load from %tmp25, store to %tmp26, advance both by 1.
   %tmp25 = phi i8* [ %tmp27, %bb24 ], [ %tmp22, %bb18 ]
   %tmp26 = phi i8* [ %tmp29, %bb24 ], [ %tmp23, %bb18 ]
   %tmp27 = getelementptr inbounds i8, i8* %tmp25, i64 1
   %tmp28 = load i8, i8* %tmp25, align 1
   %tmp29 = getelementptr inbounds i8, i8* %tmp26, i64 1
   store i8 %tmp28, i8* %tmp26, align 1
   ; The compare result is never used; the back edge below is unconditional.
   %tmp30 = icmp eq i8* %tmp29, %tmp5
   br label %bb24
 }
	; RUN: opt < %s -loop-reduce -lsr-filter-same-scaled-reg=true -mtriple=x86_64-unknown-linux-gnu -S | FileCheck %s

	; NOTE(review): the datalayout, type and global below repeat declarations that
	; already appear earlier in this file -- looks like an extraction duplicate;
	; confirm which copy should be kept.
	; Data layout: little-endian ("e"), ELF-style name mangling ("m:e"), i64 aligned
	; to 64 bits, f80 aligned to 128 bits, native integer widths of 8/16/32/64 bits,
	; and a 128-bit stack alignment ("S128").
	target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"

	; Aggregate type of @global. @foo only reads the i64 fields at indices 3 and 4.
	%struct.ham = type { i8, i8, [5 x i32], i64, i64, i64 }

	; Externally defined instance of %struct.ham read by @foo.
	@global = external local_unnamed_addr global %struct.ham, align 8

	; Reduced input for the loop-strength-reduction pass run with
	; -lsr-filter-same-scaled-reg=true. The function takes no arguments and contains
	; two loops (bb9/bb12 and bb24); no block ends in a ret.
	; NOTE(review): a function named @foo is also defined earlier in this file --
	; looks like an extraction duplicate; confirm which copy should be kept.
	define void @foo() local_unnamed_addr {
	bb:
	  ; Read field 3 of @global and keep only bits 8..10 (1792 == 0x700).
	  %tmp = load i64, i64* getelementptr inbounds (%struct.ham, %struct.ham* @global, i64 0, i32 3), align 8
	  %tmp1 = and i64 %tmp, 1792
	  ; Add field 4 of @global to the masked value.
	  %tmp2 = load i64, i64* getelementptr inbounds (%struct.ham, %struct.ham* @global, i64 0, i32 4), align 8
	  %tmp3 = add i64 %tmp1, %tmp2
	  ; %tmp4 is used as an i8* GEP base below, so it must be loaded as a pointer
	  ; (i8*) through an i8** rather than as a plain i8 value.
	  %tmp4 = load i8*, i8** null, align 8
	  ; Same address as %tmp4 (offset 0); only used by the %tmp30 compare in bb24.
	  %tmp5 = getelementptr inbounds i8, i8* %tmp4, i64 0
	  ; %tmp7 = %tmp4 - %tmp3: initial value of the first pointer induction variable.
	  %tmp6 = sub i64 0, %tmp3
	  %tmp7 = getelementptr inbounds i8, i8* %tmp4, i64 %tmp6
	  ; Null pointer: initial value of the second pointer induction variable.
	  %tmp8 = inttoptr i64 0 to i8*
	  br label %bb9

	; Without filtering non-optimal formulae that share the same ScaledReg and Scale,
	; the strategy of narrowing the LSR search space by picking a winner register
	; would generate only one lsr.iv and a suboptimal result.
	; The FileCheck directives below require the optimized bb9 to start with two
	; consecutive i8* phi nodes.
	; CHECK-LABEL: @foo(
	; CHECK: bb9:
	; CHECK-NEXT: = phi i8*
	; CHECK-NEXT: = phi i8*

	bb9: ; preds = %bb12, %bb
	  ; Two pointer induction variables; bb12 advances each of them by 16 bytes.
	  %tmp10 = phi i8* [ %tmp7, %bb ], [ %tmp16, %bb12 ]
	  %tmp11 = phi i8* [ %tmp8, %bb ], [ %tmp17, %bb12 ]
	  ; The condition is the constant false, so the bb12 successor is always taken.
	  br i1 false, label %bb18, label %bb12

	bb12: ; preds = %bb9
	  ; Load an i64 from %tmp10 + 8 with byte alignment; the loaded value is unused.
	  %tmp13 = getelementptr inbounds i8, i8* %tmp10, i64 8
	  %tmp14 = bitcast i8* %tmp13 to i64*
	  %tmp15 = load i64, i64* %tmp14, align 1
	  ; Step both pointers by 16 bytes for the next iteration.
	  %tmp16 = getelementptr inbounds i8, i8* %tmp10, i64 16
	  %tmp17 = getelementptr inbounds i8, i8* %tmp11, i64 16
	  br label %bb9

	bb18: ; preds = %bb9
	  ; Unsigned compare against null: true when %tmp11 is non-null.
	  %tmp19 = icmp ugt i8* %tmp11, null
	  ; Start the second loop at the current pointers when %tmp19 is true,
	  ; otherwise 8 bytes past them.
	  %tmp20 = getelementptr inbounds i8, i8* %tmp10, i64 8
	  %tmp21 = getelementptr inbounds i8, i8* %tmp11, i64 8
	  %tmp22 = select i1 %tmp19, i8* %tmp10, i8* %tmp20
	  %tmp23 = select i1 %tmp19, i8* %tmp11, i8* %tmp21
	  br label %bb24

	bb24: ; preds = %bb24, %bb18
	  ; Byte-at-a-time copy: load from %tmp25, store to %tmp26, advance both by 1.
	  %tmp25 = phi i8* [ %tmp27, %bb24 ], [ %tmp22, %bb18 ]
	  %tmp26 = phi i8* [ %tmp29, %bb24 ], [ %tmp23, %bb18 ]
	  %tmp27 = getelementptr inbounds i8, i8* %tmp25, i64 1
	  %tmp28 = load i8, i8* %tmp25, align 1
	  %tmp29 = getelementptr inbounds i8, i8* %tmp26, i64 1
	  store i8 %tmp28, i8* %tmp26, align 1
	  ; The compare result is never used; the back edge below is unconditional.
	  %tmp30 = icmp eq i8* %tmp29, %tmp5
	  br label %bb24
	}