blob: 615fc5ea07eca9cd252739c060fe3fb32da8509a [file] [log] [blame]
; RUN: opt -S -dxil-resource-access -mtriple=dxil %s | FileCheck %s
;
; Test for when we have indices into both the array and the vector: ie, s[1][3]
; cbuffer CB : register(b0) {
; uint4 s[3]; // offset 0, size 16 * 3
; }
%__cblayout_CB = type <{ [2 x <4 x i32>] }>
@CB.cb = local_unnamed_addr global target("dx.CBuffer", %__cblayout_CB) poison
; CHECK: define void @f
define void @f(ptr %dst) {
entry:
%CB.cb_h = tail call target("dx.CBuffer", %__cblayout_CB) @llvm.dx.resource.handlefromimplicitbinding(i32 1, i32 0, i32 1, i32 0, ptr null)
store target("dx.CBuffer", %__cblayout_CB) %CB.cb_h, ptr @CB.cb, align 4
; CHECK: [[CB:%.*]] = load target("dx.CBuffer", %__cblayout_CB), ptr @CB.cb
%CB.cb = load target("dx.CBuffer", %__cblayout_CB), ptr @CB.cb, align 4
;; s[1][3]
;
; CHECK: [[LOAD:%.*]] = call { i32, i32, i32, i32 } @llvm.dx.resource.load.cbufferrow.4.{{.*}}(target("dx.CBuffer", %__cblayout_CB) [[CB]], i32 1)
; CHECK: [[X:%.*]] = extractvalue { i32, i32, i32, i32 } [[LOAD]], 3
; CHECK: store i32 [[X]], ptr %dst
%i8_ptr = call ptr addrspace(2) @llvm.dx.resource.getpointer(target("dx.CBuffer", %__cblayout_CB) %CB.cb, i32 0)
%i8_gep = getelementptr inbounds nuw i8, ptr addrspace(2) %i8_ptr, i32 28
%i8_vecext = load i32, ptr addrspace(2) %i8_gep, align 4
store i32 %i8_vecext, ptr %dst, align 4
;; s[2].w
;
; CHECK: [[LOAD:%.*]] = call { i32, i32, i32, i32 } @llvm.dx.resource.load.cbufferrow.4.{{.*}}(target("dx.CBuffer", %__cblayout_CB) [[CB]], i32 2)
; CHECK: [[X:%.*]] = extractvalue { i32, i32, i32, i32 } [[LOAD]], 3
;;
;; It would be nice to avoid the redundant vector creation here, but that's
;; outside of the scope of this pass.
;;
; CHECK: [[X_VEC:%.*]] = insertelement <4 x i32> {{%.*}}, i32 [[X]], i32 3
; CHECK: [[X_EXT:%.*]] = extractelement <4 x i32> [[X_VEC]], i32 3
; CHECK: store i32 [[X_EXT]], ptr %dst
%typed_ptr = call ptr addrspace(2) @llvm.dx.resource.getpointer(target("dx.CBuffer", %__cblayout_CB) %CB.cb, i32 0)
%typed_gep = getelementptr <4 x i32>, ptr addrspace(2) %typed_ptr, i32 2
%typed_load = load <4 x i32>, ptr addrspace(2) %typed_gep, align 16
%typed_vecext = extractelement <4 x i32> %typed_load, i32 3
store i32 %typed_vecext, ptr %dst, align 4
ret void
}