| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py |
| ; RUN: opt < %s -passes=instcombine -S | FileCheck %s |
| |
| target datalayout = "n8:16:32" |
| |
| ; Given pattern: |
| ; (trunc (x << Q) to iDst) << K |
| ; we should rewrite it as |
| ; (trunc (x << (Q+K)) to iDst) iff (Q+K) u< iDst |
| ; This is only valid for shl. |
| ; THIS FOLD DOES *NOT* REQUIRE ANY 'nuw'/`nsw` FLAGS! |
| |
| ; Basic scalar test |
| |
| define i16 @t0(i32 %x, i16 %y) { |
| ; CHECK-LABEL: @t0( |
| ; CHECK-NEXT: [[X_TR:%.*]] = trunc i32 [[X:%.*]] to i16 |
| ; CHECK-NEXT: [[T5:%.*]] = shl i16 [[X_TR]], 8 |
| ; CHECK-NEXT: ret i16 [[T5]] |
| ; |
| %t0 = sub i16 32, %y |
| %t1 = zext i16 %t0 to i32 |
| %t2 = shl i32 %x, %t1 |
| %t3 = trunc i32 %t2 to i16 |
| %t4 = add i16 %y, -24 |
| %t5 = shl i16 %t3, %t4 |
| ret i16 %t5 |
| } |
| |
| define <2 x i16> @t1_vec_splat(<2 x i32> %x, <2 x i16> %y) { |
| ; CHECK-LABEL: @t1_vec_splat( |
| ; CHECK-NEXT: [[X_TR:%.*]] = trunc <2 x i32> [[X:%.*]] to <2 x i16> |
| ; CHECK-NEXT: [[T5:%.*]] = shl <2 x i16> [[X_TR]], <i16 8, i16 8> |
| ; CHECK-NEXT: ret <2 x i16> [[T5]] |
| ; |
| %t0 = sub <2 x i16> <i16 32, i16 32>, %y |
| %t1 = zext <2 x i16> %t0 to <2 x i32> |
| %t2 = shl <2 x i32> %x, %t1 |
| %t3 = trunc <2 x i32> %t2 to <2 x i16> |
| %t4 = add <2 x i16> %y, <i16 -24, i16 -24> |
| %t5 = shl <2 x i16> %t3, %t4 |
| ret <2 x i16> %t5 |
| } |
| |
| define <2 x i16> @t2_vec_nonsplat(<2 x i32> %x, <2 x i16> %y) { |
| ; CHECK-LABEL: @t2_vec_nonsplat( |
| ; CHECK-NEXT: [[TMP1:%.*]] = shl <2 x i32> [[X:%.*]], <i32 8, i32 30> |
| ; CHECK-NEXT: [[T5:%.*]] = trunc <2 x i32> [[TMP1]] to <2 x i16> |
| ; CHECK-NEXT: ret <2 x i16> [[T5]] |
| ; |
| %t0 = sub <2 x i16> <i16 32, i16 30>, %y |
| %t1 = zext <2 x i16> %t0 to <2 x i32> |
| %t2 = shl <2 x i32> %x, %t1 |
| %t3 = trunc <2 x i32> %t2 to <2 x i16> |
| %t4 = add <2 x i16> %y, <i16 -24, i16 0> |
| %t5 = shl <2 x i16> %t3, %t4 |
| ret <2 x i16> %t5 |
| } |
| |
| ; Basic vector tests |
| |
| define <3 x i16> @t3_vec_nonsplat_poison0(<3 x i32> %x, <3 x i16> %y) { |
| ; CHECK-LABEL: @t3_vec_nonsplat_poison0( |
| ; CHECK-NEXT: [[X_TR:%.*]] = trunc <3 x i32> [[X:%.*]] to <3 x i16> |
| ; CHECK-NEXT: [[T5:%.*]] = shl <3 x i16> [[X_TR]], <i16 8, i16 poison, i16 8> |
| ; CHECK-NEXT: ret <3 x i16> [[T5]] |
| ; |
| %t0 = sub <3 x i16> <i16 32, i16 poison, i16 32>, %y |
| %t1 = zext <3 x i16> %t0 to <3 x i32> |
| %t2 = shl <3 x i32> %x, %t1 |
| %t3 = trunc <3 x i32> %t2 to <3 x i16> |
| %t4 = add <3 x i16> %y, <i16 -24, i16 -24, i16 -24> |
| %t5 = shl <3 x i16> %t3, %t4 |
| ret <3 x i16> %t5 |
| } |
| |
| define <3 x i16> @t4_vec_nonsplat_poison1(<3 x i32> %x, <3 x i16> %y) { |
| ; CHECK-LABEL: @t4_vec_nonsplat_poison1( |
| ; CHECK-NEXT: [[X_TR:%.*]] = trunc <3 x i32> [[X:%.*]] to <3 x i16> |
| ; CHECK-NEXT: [[T5:%.*]] = shl <3 x i16> [[X_TR]], <i16 8, i16 poison, i16 8> |
| ; CHECK-NEXT: ret <3 x i16> [[T5]] |
| ; |
| %t0 = sub <3 x i16> <i16 32, i16 32, i16 32>, %y |
| %t1 = zext <3 x i16> %t0 to <3 x i32> |
| %t2 = shl <3 x i32> %x, %t1 |
| %t3 = trunc <3 x i32> %t2 to <3 x i16> |
| %t4 = add <3 x i16> %y, <i16 -24, i16 poison, i16 -24> |
| %t5 = shl <3 x i16> %t3, %t4 |
| ret <3 x i16> %t5 |
| } |
| |
| define <3 x i16> @t5_vec_nonsplat_poison1(<3 x i32> %x, <3 x i16> %y) { |
| ; CHECK-LABEL: @t5_vec_nonsplat_poison1( |
| ; CHECK-NEXT: [[X_TR:%.*]] = trunc <3 x i32> [[X:%.*]] to <3 x i16> |
| ; CHECK-NEXT: [[T5:%.*]] = shl <3 x i16> [[X_TR]], <i16 8, i16 poison, i16 8> |
| ; CHECK-NEXT: ret <3 x i16> [[T5]] |
| ; |
| %t0 = sub <3 x i16> <i16 32, i16 poison, i16 32>, %y |
| %t1 = zext <3 x i16> %t0 to <3 x i32> |
| %t2 = shl <3 x i32> %x, %t1 |
| %t3 = trunc <3 x i32> %t2 to <3 x i16> |
| %t4 = add <3 x i16> %y, <i16 -24, i16 poison, i16 -24> |
| %t5 = shl <3 x i16> %t3, %t4 |
| ret <3 x i16> %t5 |
| } |
| |
| ; One-use tests |
| |
| declare void @use16(i16) |
| declare void @use32(i32) |
| |
| define i16 @t6_extrause0(i32 %x, i16 %y) { |
| ; CHECK-LABEL: @t6_extrause0( |
| ; CHECK-NEXT: [[T0:%.*]] = sub i16 32, [[Y:%.*]] |
| ; CHECK-NEXT: [[T1:%.*]] = zext i16 [[T0]] to i32 |
| ; CHECK-NEXT: [[T2:%.*]] = shl i32 [[X:%.*]], [[T1]] |
| ; CHECK-NEXT: [[T3:%.*]] = trunc i32 [[T2]] to i16 |
| ; CHECK-NEXT: call void @use16(i16 [[T3]]) |
| ; CHECK-NEXT: [[X_TR:%.*]] = trunc i32 [[X]] to i16 |
| ; CHECK-NEXT: [[T5:%.*]] = shl i16 [[X_TR]], 8 |
| ; CHECK-NEXT: ret i16 [[T5]] |
| ; |
| %t0 = sub i16 32, %y |
| %t1 = zext i16 %t0 to i32 |
| %t2 = shl i32 %x, %t1 |
| %t3 = trunc i32 %t2 to i16 |
| %t4 = add i16 %y, -24 |
| call void @use16(i16 %t3) |
| %t5 = shl i16 %t3, %t4 |
| ret i16 %t5 |
| } |
| |
| define i16 @t7_extrause1(i32 %x, i16 %y) { |
| ; CHECK-LABEL: @t7_extrause1( |
| ; CHECK-NEXT: [[T4:%.*]] = add i16 [[Y:%.*]], -24 |
| ; CHECK-NEXT: call void @use16(i16 [[T4]]) |
| ; CHECK-NEXT: [[X_TR:%.*]] = trunc i32 [[X:%.*]] to i16 |
| ; CHECK-NEXT: [[T5:%.*]] = shl i16 [[X_TR]], 8 |
| ; CHECK-NEXT: ret i16 [[T5]] |
| ; |
| %t0 = sub i16 32, %y |
| %t1 = zext i16 %t0 to i32 |
| %t2 = shl i32 %x, %t1 |
| %t3 = trunc i32 %t2 to i16 |
| %t4 = add i16 %y, -24 |
| call void @use16(i16 %t4) |
| %t5 = shl i16 %t3, %t4 |
| ret i16 %t5 |
| } |
| |
| define i16 @t8_extrause2(i32 %x, i16 %y) { |
| ; CHECK-LABEL: @t8_extrause2( |
| ; CHECK-NEXT: [[T0:%.*]] = sub i16 32, [[Y:%.*]] |
| ; CHECK-NEXT: [[T1:%.*]] = zext i16 [[T0]] to i32 |
| ; CHECK-NEXT: [[T2:%.*]] = shl i32 [[X:%.*]], [[T1]] |
| ; CHECK-NEXT: [[T3:%.*]] = trunc i32 [[T2]] to i16 |
| ; CHECK-NEXT: [[T4:%.*]] = add i16 [[Y]], -24 |
| ; CHECK-NEXT: call void @use16(i16 [[T3]]) |
| ; CHECK-NEXT: call void @use16(i16 [[T4]]) |
| ; CHECK-NEXT: [[T5:%.*]] = shl i16 [[T3]], [[T4]] |
| ; CHECK-NEXT: ret i16 [[T5]] |
| ; |
| %t0 = sub i16 32, %y |
| %t1 = zext i16 %t0 to i32 |
| %t2 = shl i32 %x, %t1 |
| %t3 = trunc i32 %t2 to i16 |
| %t4 = add i16 %y, -24 |
| call void @use16(i16 %t3) |
| call void @use16(i16 %t4) |
| %t5 = shl i16 %t3, %t4 |
| ret i16 %t5 |
| } |
| |
| ; No 'nuw'/'nsw' flags are to be propagated! |
| ; But we can't test that, such IR does not reach that code. |
| |
| ; Negative tests |
| |
| ; Can't fold, total shift would be 32 |
| define i16 @n11(i32 %x, i16 %y) { |
| ; CHECK-LABEL: @n11( |
| ; CHECK-NEXT: [[T0:%.*]] = sub i16 30, [[Y:%.*]] |
| ; CHECK-NEXT: [[T1:%.*]] = zext i16 [[T0]] to i32 |
| ; CHECK-NEXT: [[T2:%.*]] = shl i32 [[X:%.*]], [[T1]] |
| ; CHECK-NEXT: [[T3:%.*]] = trunc i32 [[T2]] to i16 |
| ; CHECK-NEXT: [[T4:%.*]] = add i16 [[Y]], -31 |
| ; CHECK-NEXT: [[T5:%.*]] = shl i16 [[T3]], [[T4]] |
| ; CHECK-NEXT: ret i16 [[T5]] |
| ; |
| %t0 = sub i16 30, %y |
| %t1 = zext i16 %t0 to i32 |
| %t2 = shl i32 %x, %t1 |
| %t3 = trunc i32 %t2 to i16 |
| %t4 = add i16 %y, -31 |
| %t5 = shl i16 %t3, %t4 |
| ret i16 %t5 |
| } |
| |
| ; Bit width mismatch of shift amount |
| |
| @Y32 = global i32 42 |
| @Y16 = global i16 42 |
| define i16 @t01(i32 %x) { |
| ; CHECK-LABEL: @t01( |
| ; CHECK-NEXT: [[T0:%.*]] = shl i32 [[X:%.*]], ptrtoint (ptr @Y32 to i32) |
| ; CHECK-NEXT: [[T1:%.*]] = trunc i32 [[T0]] to i16 |
| ; CHECK-NEXT: [[T2:%.*]] = shl i16 [[T1]], ptrtoint (ptr @Y16 to i16) |
| ; CHECK-NEXT: ret i16 [[T2]] |
| ; |
| %t0 = shl i32 %x, ptrtoint (ptr @Y32 to i32) |
| %t1 = trunc i32 %t0 to i16 |
| %t2 = shl i16 %t1, ptrtoint (ptr @Y16 to i16) |
| ret i16 %t2 |
| } |
| |
| define i16 @shl_tr_shl_constant_shift_amount_uses(i32 %x) { |
| ; CHECK-LABEL: @shl_tr_shl_constant_shift_amount_uses( |
| ; CHECK-NEXT: [[SHL:%.*]] = shl i32 [[X:%.*]], 3 |
| ; CHECK-NEXT: call void @use32(i32 [[SHL]]) |
| ; CHECK-NEXT: [[TR:%.*]] = trunc i32 [[SHL]] to i16 |
| ; CHECK-NEXT: call void @use16(i16 [[TR]]) |
| ; CHECK-NEXT: [[R:%.*]] = shl i16 [[TR]], 4 |
| ; CHECK-NEXT: ret i16 [[R]] |
| ; |
| %shl = shl i32 %x, 3 |
| call void @use32(i32 %shl) |
| %tr = trunc i32 %shl to i16 |
| call void @use16(i16 %tr) |
| %r = shl i16 %tr, 4 |
| ret i16 %r |
| } |
| |
| ; This would infinite loop because we did not process the |
| ; poison shift before trying to fold shift-of-shift. To reach |
| ; the problematic transform, it needs a datalayout to specify |
| ; that the narrow types are legal, but i64 is not. |
| |
| define i1 @PR51657(i64 %x, i1 %c1) { |
| ; CHECK-LABEL: @PR51657( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: br i1 [[C1:%.*]], label [[COND_FALSE:%.*]], label [[COND_END:%.*]] |
| ; CHECK: cond.false: |
| ; CHECK-NEXT: br label [[COND_END]] |
| ; CHECK: cond.end: |
| ; CHECK-NEXT: ret i1 true |
| ; |
| entry: |
| br i1 %c1, label %cond.false, label %cond.end |
| |
| cond.false: |
| %shl = shl i64 %x, 64 |
| %conv26 = trunc i64 %shl to i32 |
| %t1 = trunc i64 %shl to i8 |
| br label %cond.end |
| |
| cond.end: |
| %cond = phi i32 [ %conv26, %cond.false ], [ 0, %entry ] |
| %t2 = phi i8 [ %t1, %cond.false ], [ 0, %entry ] |
| %conv27 = sext i8 %t2 to i32 |
| %eq = icmp eq i32 %cond, %conv27 |
| ret i1 %eq |
| } |
| |
| |
| define i16 @extra_use_on_first_shift(i32 %x) { |
| ; CHECK-LABEL: @extra_use_on_first_shift( |
| ; CHECK-NEXT: [[A:%.*]] = ashr i32 [[X:%.*]], 3 |
| ; CHECK-NEXT: call void @use32(i32 [[A]]) |
| ; CHECK-NEXT: [[TR:%.*]] = trunc i32 [[A]] to i16 |
| ; CHECK-NEXT: [[SH:%.*]] = lshr i16 [[TR]], 6 |
| ; CHECK-NEXT: ret i16 [[SH]] |
| ; |
| %a = ashr i32 %x, 3 |
| call void @use32(i32 %a) |
| %tr = trunc i32 %a to i16 |
| %sh = lshr i16 %tr, 6 |
| ret i16 %sh |
| } |