| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6 |
| ; RUN: opt %s -passes=gvn -S -enable-gvn-memdep=false | FileCheck %s |
| ; RUN: opt %s -passes=gvn -S -enable-gvn-memdep=true | FileCheck %s |
| |
| ; Check that a repeated call to the llvm.x86.avx2.gather.d.ps.256 intrinsic is |
| ; not eliminated by GVN when a store sits between the two calls, both with and |
| ; without memory dependence info (see the two RUN lines). |
| target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| ; Function Attrs: nounwind readonly |
| ; Declaration of the gather intrinsic exercised by @foo1. It takes, in order: |
| ; <8 x float>, ptr, <8 x i32>, <8 x float>, i8, and returns <8 x float>. |
| ; NOTE(review): the operand roles are presumably pass-through value, base |
| ; pointer, per-lane indices, per-lane mask and scale -- confirm against the |
| ; intrinsic's definition. |
| ; Attribute group #0 is not defined within the lines shown here; per the |
| ; comment above it is expected to be "nounwind readonly". |
| declare <8 x float> @llvm.x86.avx2.gather.d.ps.256(<8 x float>, ptr, <8 x i32>, <8 x float>, i8) #0 |
| |
| ; Function Attrs: nounwind |
| ; @foo1 issues the same gather call twice with identical operands, with a |
| ; one-byte store placed between the two calls, and returns the lane-wise sum |
| ; of both results. The FileCheck assertions below expect both calls (and the |
| ; store) to still be present after GVN. |
| ; %t2.ptr is declared in the signature but never referenced in the body. |
| define <8 x float> @foo1(ptr noalias readonly %arr.ptr, ptr noalias readonly %vix.ptr, ptr noalias %t2.ptr) #1 { |
| ; CHECK-LABEL: define <8 x float> @foo1( |
| ; CHECK-SAME: ptr noalias readonly [[ARR_PTR:%.*]], ptr noalias readonly [[VIX_PTR:%.*]], ptr noalias [[T2_PTR:%.*]]) { |
| ; CHECK-NEXT: [[ALLOCAS:.*:]] |
| ; CHECK-NEXT: [[VIX:%.*]] = load <8 x i32>, ptr [[VIX_PTR]], align 4 |
| ; CHECK-NEXT: [[T1_PTR:%.*]] = getelementptr i8, ptr [[ARR_PTR]], i8 4 |
| ; CHECK-NEXT: [[V1:%.*]] = tail call <8 x float> @llvm.x86.avx2.gather.d.ps.256(<8 x float> undef, ptr [[ARR_PTR]], <8 x i32> [[VIX]], <8 x float> splat (float 0xFFFFFFFFE0000000), i8 1) |
| ; CHECK-NEXT: store i8 1, ptr [[T1_PTR]], align 4 |
| ; CHECK-NEXT: [[V2:%.*]] = tail call <8 x float> @llvm.x86.avx2.gather.d.ps.256(<8 x float> undef, ptr [[ARR_PTR]], <8 x i32> [[VIX]], <8 x float> splat (float 0xFFFFFFFFE0000000), i8 1) |
| ; CHECK-NEXT: [[RES:%.*]] = fadd <8 x float> [[V1]], [[V2]] |
| ; CHECK-NEXT: ret <8 x float> [[RES]] |
| ; |
| allocas: |
| ; Index vector shared by both gather calls. |
| %vix = load <8 x i32>, ptr %vix.ptr, align 4 |
| ; Address 4 bytes past %arr.ptr; it is derived from the same base pointer |
| ; that is passed to the gathers. |
| %t1.ptr = getelementptr i8, ptr %arr.ptr, i8 4 |
| |
| ; First gather: undef first operand, base %arr.ptr, indices %vix. |
| ; NOTE(review): 0xFFFFFFFFE0000000 appears to be the all-ones float bit |
| ; pattern, i.e. a mask selecting every lane, and the trailing i8 1 is |
| ; presumably the scale -- confirm against the intrinsic's definition. |
| %v1 = tail call <8 x float> @llvm.x86.avx2.gather.d.ps.256(<8 x float> undef, ptr %arr.ptr, <8 x i32> %vix, <8 x float> <float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000>, i8 1) #2 |
| ; Store between the two gathers. Presumably this write may overlap memory |
| ; the gather reads, which is why the second call must not be folded into |
| ; the first. |
| store i8 1, ptr %t1.ptr, align 4 |
| |
| ; Second gather: operands are identical to the first call. |
| %v2 = tail call <8 x float> @llvm.x86.avx2.gather.d.ps.256(<8 x float> undef, ptr %arr.ptr, <8 x i32> %vix, <8 x float> <float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000>, i8 1) #2 |
| ; Using both results keeps each call live. |
| %res = fadd <8 x float> %v1, %v2 |
| |
| ret <8 x float> %res |
| } |