| ; RUN: opt -S -dxil-resource-access -mtriple=dxil %s | FileCheck %s |
| ; |
| ; Test for when we have indices into both the array and the vector: ie, s[1][3] |
| |
| ; cbuffer CB : register(b0) { |
| ; uint4 s[3]; // offset 0, size 16 * 3 |
| ; } |
| %__cblayout_CB = type <{ [2 x <4 x i32>] }> |
| |
| @CB.cb = local_unnamed_addr global target("dx.CBuffer", %__cblayout_CB) poison |
| |
| ; CHECK: define void @f |
| define void @f(ptr %dst) { |
| entry: |
| %CB.cb_h = tail call target("dx.CBuffer", %__cblayout_CB) @llvm.dx.resource.handlefromimplicitbinding(i32 1, i32 0, i32 1, i32 0, ptr null) |
| store target("dx.CBuffer", %__cblayout_CB) %CB.cb_h, ptr @CB.cb, align 4 |
| |
| ; CHECK: [[CB:%.*]] = load target("dx.CBuffer", %__cblayout_CB), ptr @CB.cb |
| %CB.cb = load target("dx.CBuffer", %__cblayout_CB), ptr @CB.cb, align 4 |
| |
| ;; s[1][3] |
| ; |
| ; CHECK: [[LOAD:%.*]] = call { i32, i32, i32, i32 } @llvm.dx.resource.load.cbufferrow.4.{{.*}}(target("dx.CBuffer", %__cblayout_CB) [[CB]], i32 1) |
| ; CHECK: [[X:%.*]] = extractvalue { i32, i32, i32, i32 } [[LOAD]], 3 |
| ; CHECK: store i32 [[X]], ptr %dst |
| %i8_ptr = call ptr addrspace(2) @llvm.dx.resource.getpointer(target("dx.CBuffer", %__cblayout_CB) %CB.cb, i32 0) |
| %i8_gep = getelementptr inbounds nuw i8, ptr addrspace(2) %i8_ptr, i32 28 |
| %i8_vecext = load i32, ptr addrspace(2) %i8_gep, align 4 |
| store i32 %i8_vecext, ptr %dst, align 4 |
| |
| ;; s[2].w |
| ; |
| ; CHECK: [[LOAD:%.*]] = call { i32, i32, i32, i32 } @llvm.dx.resource.load.cbufferrow.4.{{.*}}(target("dx.CBuffer", %__cblayout_CB) [[CB]], i32 2) |
| ; CHECK: [[X:%.*]] = extractvalue { i32, i32, i32, i32 } [[LOAD]], 3 |
| ;; |
| ;; It would be nice to avoid the redundant vector creation here, but that's |
| ;; outside of the scope of this pass. |
| ;; |
| ; CHECK: [[X_VEC:%.*]] = insertelement <4 x i32> {{%.*}}, i32 [[X]], i32 3 |
| ; CHECK: [[X_EXT:%.*]] = extractelement <4 x i32> [[X_VEC]], i32 3 |
| ; CHECK: store i32 [[X_EXT]], ptr %dst |
| %typed_ptr = call ptr addrspace(2) @llvm.dx.resource.getpointer(target("dx.CBuffer", %__cblayout_CB) %CB.cb, i32 0) |
| %typed_gep = getelementptr <4 x i32>, ptr addrspace(2) %typed_ptr, i32 2 |
| %typed_load = load <4 x i32>, ptr addrspace(2) %typed_gep, align 16 |
| %typed_vecext = extractelement <4 x i32> %typed_load, i32 3 |
| store i32 %typed_vecext, ptr %dst, align 4 |
| |
| ret void |
| } |