test/Transforms/InstCombine/redundant-right-shift-input-masking.ll - llvm-project/llvm - Git at Google

 ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
 ; RUN: opt < %s -passes=instcombine -S | FileCheck %s

 ; If we have:
 ;   (data & (-1 << nbits)) outer>> nbits
 ; Or
 ;   ((data inner>> nbits) << nbits) outer>> nbits
 ; The mask is redundant, and can be dropped:
 ;   data outer>> nbits
 ; This is valid for both lshr and ashr in both positions and any combination.
 ; We must *not* preserve 'exact' on that final right-shift.

 define i32 @t0_lshr(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t0_lshr(
 ; CHECK-NEXT:    [[T0:%.*]] = shl i32 -1, [[NBITS:%.*]]
 ; CHECK-NEXT:    [[T1:%.*]] = and i32 [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    [[T2:%.*]] = lshr exact i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = shl i32 -1, %nbits
   %t1 = and i32 %t0, %data
   %t2 = lshr exact i32 %t1, %nbits ; while there, test that we *don't* propagate 'exact'
   ret i32 %t2
 }
 define i32 @t1_sshr(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t1_sshr(
 ; CHECK-NEXT:    [[T0:%.*]] = shl i32 -1, [[NBITS:%.*]]
 ; CHECK-NEXT:    [[T1:%.*]] = and i32 [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    [[T2:%.*]] = ashr exact i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = shl i32 -1, %nbits
   %t1 = and i32 %t0, %data
   %t2 = ashr exact i32 %t1, %nbits ; while there, test that we *don't* propagate 'exact'
   ret i32 %t2
 }

 ; Vectors

 define <4 x i32> @t2_vec(<4 x i32> %data, <4 x i32> %nbits) {
 ; CHECK-LABEL: @t2_vec(
 ; CHECK-NEXT:    [[T0:%.*]] = shl <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>, [[NBITS:%.*]]
 ; CHECK-NEXT:    [[T1:%.*]] = and <4 x i32> [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    [[T2:%.*]] = lshr <4 x i32> [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret <4 x i32> [[T2]]
 ;
   %t0 = shl <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>, %nbits
   %t1 = and <4 x i32> %t0, %data
   %t2 = lshr <4 x i32> %t1, %nbits
   ret <4 x i32> %t2
 }

 define <4 x i32> @t3_vec_undef(<4 x i32> %data, <4 x i32> %nbits) {
 ; CHECK-LABEL: @t3_vec_undef(
 ; CHECK-NEXT:    [[T0:%.*]] = shl <4 x i32> <i32 -1, i32 -1, i32 undef, i32 -1>, [[NBITS:%.*]]
 ; CHECK-NEXT:    [[T1:%.*]] = and <4 x i32> [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    [[T2:%.*]] = lshr <4 x i32> [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret <4 x i32> [[T2]]
 ;
   %t0 = shl <4 x i32> <i32 -1, i32 -1, i32 undef, i32 -1>, %nbits
   %t1 = and <4 x i32> %t0, %data
   %t2 = lshr <4 x i32> %t1, %nbits
   ret <4 x i32> %t2
 }

 ; Extra uses

 declare void @use32(i32)

 define i32 @t4_extrause0(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t4_extrause0(
 ; CHECK-NEXT:    [[T0:%.*]] = shl i32 -1, [[NBITS:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T0]])
 ; CHECK-NEXT:    [[T1:%.*]] = and i32 [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = shl i32 -1, %nbits
   call void @use32(i32 %t0)
   %t1 = and i32 %t0, %data
   %t2 = lshr i32 %t1, %nbits
   ret i32 %t2
 }

 define i32 @t5_extrause1(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t5_extrause1(
 ; CHECK-NEXT:    [[T0:%.*]] = shl i32 -1, [[NBITS:%.*]]
 ; CHECK-NEXT:    [[T1:%.*]] = and i32 [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T1]])
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = shl i32 -1, %nbits
   %t1 = and i32 %t0, %data
   call void @use32(i32 %t1)
   %t2 = lshr i32 %t1, %nbits
   ret i32 %t2
 }

 define i32 @t6_extrause2(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t6_extrause2(
 ; CHECK-NEXT:    [[T0:%.*]] = shl i32 -1, [[NBITS:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T0]])
 ; CHECK-NEXT:    [[T1:%.*]] = and i32 [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T1]])
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = shl i32 -1, %nbits
   call void @use32(i32 %t0)
   %t1 = and i32 %t0, %data
   call void @use32(i32 %t1)
   %t2 = lshr i32 %t1, %nbits
   ret i32 %t2
 }

 ; Non-canonical mask pattern. Let's just test a single case with all-extra uses.

 define i32 @t7_noncanonical_lshr_lshr_extrauses(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t7_noncanonical_lshr_lshr_extrauses(
 ; CHECK-NEXT:    [[T0:%.*]] = lshr i32 [[DATA:%.*]], [[NBITS:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T0]])
 ; CHECK-NEXT:    [[T1:%.*]] = shl i32 [[T0]], [[NBITS]]
 ; CHECK-NEXT:    call void @use32(i32 [[T1]])
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = lshr i32 %data, %nbits
   call void @use32(i32 %t0)
   %t1 = shl i32 %t0, %nbits
   call void @use32(i32 %t1)
   %t2 = lshr i32 %t1, %nbits
   ret i32 %t2
 }

 define i32 @t8_noncanonical_lshr_ashr_extrauses(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t8_noncanonical_lshr_ashr_extrauses(
 ; CHECK-NEXT:    [[T0:%.*]] = lshr i32 [[DATA:%.*]], [[NBITS:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T0]])
 ; CHECK-NEXT:    [[T1:%.*]] = shl i32 [[T0]], [[NBITS]]
 ; CHECK-NEXT:    call void @use32(i32 [[T1]])
 ; CHECK-NEXT:    [[T2:%.*]] = ashr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = lshr i32 %data, %nbits
   call void @use32(i32 %t0)
   %t1 = shl i32 %t0, %nbits
   call void @use32(i32 %t1)
   %t2 = ashr i32 %t1, %nbits
   ret i32 %t2
 }

 define i32 @t9_noncanonical_ashr_lshr_extrauses(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t9_noncanonical_ashr_lshr_extrauses(
 ; CHECK-NEXT:    [[T0:%.*]] = ashr i32 [[DATA:%.*]], [[NBITS:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T0]])
 ; CHECK-NEXT:    [[T1:%.*]] = shl i32 [[T0]], [[NBITS]]
 ; CHECK-NEXT:    call void @use32(i32 [[T1]])
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = ashr i32 %data, %nbits
   call void @use32(i32 %t0)
   %t1 = shl i32 %t0, %nbits
   call void @use32(i32 %t1)
   %t2 = lshr i32 %t1, %nbits
   ret i32 %t2
 }

 define i32 @t10_noncanonical_ashr_ashr_extrauses(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @t10_noncanonical_ashr_ashr_extrauses(
 ; CHECK-NEXT:    [[T0:%.*]] = ashr i32 [[DATA:%.*]], [[NBITS:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T0]])
 ; CHECK-NEXT:    [[T1:%.*]] = shl i32 [[T0]], [[NBITS]]
 ; CHECK-NEXT:    call void @use32(i32 [[T1]])
 ; CHECK-NEXT:    [[T2:%.*]] = ashr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = ashr i32 %data, %nbits
   call void @use32(i32 %t0)
   %t1 = shl i32 %t0, %nbits
   call void @use32(i32 %t1)
   %t2 = ashr i32 %t1, %nbits
   ret i32 %t2
 }

 ; Commutativity

 declare i32 @gen32()

 define i32 @t11_commutative(i32 %nbits) {
 ; CHECK-LABEL: @t11_commutative(
 ; CHECK-NEXT:    [[DATA:%.*]] = call i32 @gen32()
 ; CHECK-NEXT:    [[T0:%.*]] = shl i32 -1, [[NBITS:%.*]]
 ; CHECK-NEXT:    [[T1:%.*]] = and i32 [[DATA]], [[T0]]
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %data = call i32 @gen32()
   %t0 = shl i32 -1, %nbits
   %t1 = and i32 %data, %t0 ; swapped
   %t2 = lshr i32 %t1, %nbits
   ret i32 %t2
 }

 ; Negative tests

 define i32 @n12(i32 %data, i32 %nbits) {
 ; CHECK-LABEL: @n12(
 ; CHECK-NEXT:    [[T0:%.*]] = shl i32 2147483647, [[NBITS:%.*]]
 ; CHECK-NEXT:    [[T1:%.*]] = and i32 [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = shl i32 2147483647, %nbits ; must be shifting -1
   %t1 = and i32 %t0, %data
   %t2 = lshr i32 %t1, %nbits
   ret i32 %t2
 }

 define i32 @n13(i32 %data, i32 %nbits0, i32 %nbits1) {
 ; CHECK-LABEL: @n13(
 ; CHECK-NEXT:    [[T0:%.*]] = shl i32 -1, [[NBITS0:%.*]]
 ; CHECK-NEXT:    [[T1:%.*]] = and i32 [[T0]], [[DATA:%.*]]
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS1:%.*]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = shl i32 -1, %nbits0
   %t1 = and i32 %t0, %data
   %t2 = lshr i32 %t1, %nbits1 ; different shift amounts
   ret i32 %t2
 }

 define i32 @n14(i32 %data, i32 %nbits0, i32 %nbits1, i32 %nbits2) {
 ; CHECK-LABEL: @n14(
 ; CHECK-NEXT:    [[T0:%.*]] = lshr i32 [[DATA:%.*]], [[NBITS0:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T0]])
 ; CHECK-NEXT:    [[T1:%.*]] = shl i32 [[T0]], [[NBITS1:%.*]]
 ; CHECK-NEXT:    call void @use32(i32 [[T1]])
 ; CHECK-NEXT:    [[T2:%.*]] = lshr i32 [[T1]], [[NBITS2:%.*]]
 ; CHECK-NEXT:    ret i32 [[T2]]
 ;
   %t0 = lshr i32 %data, %nbits0
   call void @use32(i32 %t0)
   %t1 = shl i32 %t0, %nbits1 ; different shift amounts
   call void @use32(i32 %t1)
   %t2 = lshr i32 %t1, %nbits2 ; different shift amounts
   ret i32 %t2
 }
	; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
	; RUN: opt < %s -passes=instcombine -S \| FileCheck %s

	; If we have:
	; (data & (-1 << nbits)) outer>> nbits
	; Or
	; ((data inner>> nbits) << nbits) outer>> nbits
	; The mask is redundant, and can be dropped:
	; data outer>> nbits
	; This is valid for both lshr and ashr in both positions and any combination.
	; We must not preserve 'exact' on that final right-shift.

	define i32 @t0_lshr(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t0_lshr(
	; CHECK-NEXT: [[T0:%.]] = shl i32 -1, [[NBITS:%.]]
	; CHECK-NEXT: [[T1:%.]] = and i32 [[T0]], [[DATA:%.]]
	; CHECK-NEXT: [[T2:%.*]] = lshr exact i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = shl i32 -1, %nbits
	%t1 = and i32 %t0, %data
	%t2 = lshr exact i32 %t1, %nbits ; while there, test that we don't propagate 'exact'
	ret i32 %t2
	}
	define i32 @t1_sshr(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t1_sshr(
	; CHECK-NEXT: [[T0:%.]] = shl i32 -1, [[NBITS:%.]]
	; CHECK-NEXT: [[T1:%.]] = and i32 [[T0]], [[DATA:%.]]
	; CHECK-NEXT: [[T2:%.*]] = ashr exact i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = shl i32 -1, %nbits
	%t1 = and i32 %t0, %data
	%t2 = ashr exact i32 %t1, %nbits ; while there, test that we don't propagate 'exact'
	ret i32 %t2
	}

	; Vectors

	define <4 x i32> @t2_vec(<4 x i32> %data, <4 x i32> %nbits) {
	; CHECK-LABEL: @t2_vec(
	; CHECK-NEXT: [[T0:%.]] = shl <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>, [[NBITS:%.]]
	; CHECK-NEXT: [[T1:%.]] = and <4 x i32> [[T0]], [[DATA:%.]]
	; CHECK-NEXT: [[T2:%.*]] = lshr <4 x i32> [[T1]], [[NBITS]]
	; CHECK-NEXT: ret <4 x i32> [[T2]]
	;
	%t0 = shl <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>, %nbits
	%t1 = and <4 x i32> %t0, %data
	%t2 = lshr <4 x i32> %t1, %nbits
	ret <4 x i32> %t2
	}

	define <4 x i32> @t3_vec_undef(<4 x i32> %data, <4 x i32> %nbits) {
	; CHECK-LABEL: @t3_vec_undef(
	; CHECK-NEXT: [[T0:%.]] = shl <4 x i32> <i32 -1, i32 -1, i32 undef, i32 -1>, [[NBITS:%.]]
	; CHECK-NEXT: [[T1:%.]] = and <4 x i32> [[T0]], [[DATA:%.]]
	; CHECK-NEXT: [[T2:%.*]] = lshr <4 x i32> [[T1]], [[NBITS]]
	; CHECK-NEXT: ret <4 x i32> [[T2]]
	;
	%t0 = shl <4 x i32> <i32 -1, i32 -1, i32 undef, i32 -1>, %nbits
	%t1 = and <4 x i32> %t0, %data
	%t2 = lshr <4 x i32> %t1, %nbits
	ret <4 x i32> %t2
	}

	; Extra uses

	declare void @use32(i32)

	define i32 @t4_extrause0(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t4_extrause0(
	; CHECK-NEXT: [[T0:%.]] = shl i32 -1, [[NBITS:%.]]
	; CHECK-NEXT: call void @use32(i32 [[T0]])
	; CHECK-NEXT: [[T1:%.]] = and i32 [[T0]], [[DATA:%.]]
	; CHECK-NEXT: [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = shl i32 -1, %nbits
	call void @use32(i32 %t0)
	%t1 = and i32 %t0, %data
	%t2 = lshr i32 %t1, %nbits
	ret i32 %t2
	}

	define i32 @t5_extrause1(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t5_extrause1(
	; CHECK-NEXT: [[T0:%.]] = shl i32 -1, [[NBITS:%.]]
	; CHECK-NEXT: [[T1:%.]] = and i32 [[T0]], [[DATA:%.]]
	; CHECK-NEXT: call void @use32(i32 [[T1]])
	; CHECK-NEXT: [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = shl i32 -1, %nbits
	%t1 = and i32 %t0, %data
	call void @use32(i32 %t1)
	%t2 = lshr i32 %t1, %nbits
	ret i32 %t2
	}

	define i32 @t6_extrause2(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t6_extrause2(
	; CHECK-NEXT: [[T0:%.]] = shl i32 -1, [[NBITS:%.]]
	; CHECK-NEXT: call void @use32(i32 [[T0]])
	; CHECK-NEXT: [[T1:%.]] = and i32 [[T0]], [[DATA:%.]]
	; CHECK-NEXT: call void @use32(i32 [[T1]])
	; CHECK-NEXT: [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = shl i32 -1, %nbits
	call void @use32(i32 %t0)
	%t1 = and i32 %t0, %data
	call void @use32(i32 %t1)
	%t2 = lshr i32 %t1, %nbits
	ret i32 %t2
	}

	; Non-canonical mask pattern. Let's just test a single case with all-extra uses.

	define i32 @t7_noncanonical_lshr_lshr_extrauses(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t7_noncanonical_lshr_lshr_extrauses(
	; CHECK-NEXT: [[T0:%.]] = lshr i32 [[DATA:%.]], [[NBITS:%.*]]
	; CHECK-NEXT: call void @use32(i32 [[T0]])
	; CHECK-NEXT: [[T1:%.*]] = shl i32 [[T0]], [[NBITS]]
	; CHECK-NEXT: call void @use32(i32 [[T1]])
	; CHECK-NEXT: [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = lshr i32 %data, %nbits
	call void @use32(i32 %t0)
	%t1 = shl i32 %t0, %nbits
	call void @use32(i32 %t1)
	%t2 = lshr i32 %t1, %nbits
	ret i32 %t2
	}

	define i32 @t8_noncanonical_lshr_ashr_extrauses(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t8_noncanonical_lshr_ashr_extrauses(
	; CHECK-NEXT: [[T0:%.]] = lshr i32 [[DATA:%.]], [[NBITS:%.*]]
	; CHECK-NEXT: call void @use32(i32 [[T0]])
	; CHECK-NEXT: [[T1:%.*]] = shl i32 [[T0]], [[NBITS]]
	; CHECK-NEXT: call void @use32(i32 [[T1]])
	; CHECK-NEXT: [[T2:%.*]] = ashr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = lshr i32 %data, %nbits
	call void @use32(i32 %t0)
	%t1 = shl i32 %t0, %nbits
	call void @use32(i32 %t1)
	%t2 = ashr i32 %t1, %nbits
	ret i32 %t2
	}

	define i32 @t9_noncanonical_ashr_lshr_extrauses(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t9_noncanonical_ashr_lshr_extrauses(
	; CHECK-NEXT: [[T0:%.]] = ashr i32 [[DATA:%.]], [[NBITS:%.*]]
	; CHECK-NEXT: call void @use32(i32 [[T0]])
	; CHECK-NEXT: [[T1:%.*]] = shl i32 [[T0]], [[NBITS]]
	; CHECK-NEXT: call void @use32(i32 [[T1]])
	; CHECK-NEXT: [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = ashr i32 %data, %nbits
	call void @use32(i32 %t0)
	%t1 = shl i32 %t0, %nbits
	call void @use32(i32 %t1)
	%t2 = lshr i32 %t1, %nbits
	ret i32 %t2
	}

	define i32 @t10_noncanonical_ashr_ashr_extrauses(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @t10_noncanonical_ashr_ashr_extrauses(
	; CHECK-NEXT: [[T0:%.]] = ashr i32 [[DATA:%.]], [[NBITS:%.*]]
	; CHECK-NEXT: call void @use32(i32 [[T0]])
	; CHECK-NEXT: [[T1:%.*]] = shl i32 [[T0]], [[NBITS]]
	; CHECK-NEXT: call void @use32(i32 [[T1]])
	; CHECK-NEXT: [[T2:%.*]] = ashr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = ashr i32 %data, %nbits
	call void @use32(i32 %t0)
	%t1 = shl i32 %t0, %nbits
	call void @use32(i32 %t1)
	%t2 = ashr i32 %t1, %nbits
	ret i32 %t2
	}

	; Commutativity

	declare i32 @gen32()

	define i32 @t11_commutative(i32 %nbits) {
	; CHECK-LABEL: @t11_commutative(
	; CHECK-NEXT: [[DATA:%.*]] = call i32 @gen32()
	; CHECK-NEXT: [[T0:%.]] = shl i32 -1, [[NBITS:%.]]
	; CHECK-NEXT: [[T1:%.*]] = and i32 [[DATA]], [[T0]]
	; CHECK-NEXT: [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%data = call i32 @gen32()
	%t0 = shl i32 -1, %nbits
	%t1 = and i32 %data, %t0 ; swapped
	%t2 = lshr i32 %t1, %nbits
	ret i32 %t2
	}

	; Negative tests

	define i32 @n12(i32 %data, i32 %nbits) {
	; CHECK-LABEL: @n12(
	; CHECK-NEXT: [[T0:%.]] = shl i32 2147483647, [[NBITS:%.]]
	; CHECK-NEXT: [[T1:%.]] = and i32 [[T0]], [[DATA:%.]]
	; CHECK-NEXT: [[T2:%.*]] = lshr i32 [[T1]], [[NBITS]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = shl i32 2147483647, %nbits ; must be shifting -1
	%t1 = and i32 %t0, %data
	%t2 = lshr i32 %t1, %nbits
	ret i32 %t2
	}

	define i32 @n13(i32 %data, i32 %nbits0, i32 %nbits1) {
	; CHECK-LABEL: @n13(
	; CHECK-NEXT: [[T0:%.]] = shl i32 -1, [[NBITS0:%.]]
	; CHECK-NEXT: [[T1:%.]] = and i32 [[T0]], [[DATA:%.]]
	; CHECK-NEXT: [[T2:%.]] = lshr i32 [[T1]], [[NBITS1:%.]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = shl i32 -1, %nbits0
	%t1 = and i32 %t0, %data
	%t2 = lshr i32 %t1, %nbits1 ; different shift amounts
	ret i32 %t2
	}

	define i32 @n14(i32 %data, i32 %nbits0, i32 %nbits1, i32 %nbits2) {
	; CHECK-LABEL: @n14(
	; CHECK-NEXT: [[T0:%.]] = lshr i32 [[DATA:%.]], [[NBITS0:%.*]]
	; CHECK-NEXT: call void @use32(i32 [[T0]])
	; CHECK-NEXT: [[T1:%.]] = shl i32 [[T0]], [[NBITS1:%.]]
	; CHECK-NEXT: call void @use32(i32 [[T1]])
	; CHECK-NEXT: [[T2:%.]] = lshr i32 [[T1]], [[NBITS2:%.]]
	; CHECK-NEXT: ret i32 [[T2]]
	;
	%t0 = lshr i32 %data, %nbits0
	call void @use32(i32 %t0)
	%t1 = shl i32 %t0, %nbits1 ; different shift amounts
	call void @use32(i32 %t1)
	%t2 = lshr i32 %t1, %nbits2 ; different shift amounts
	ret i32 %t2
	}