blob: 4095347d786243fdf8ff6eb4edb3b075f3a09cdb [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-promote-alloca < %s | FileCheck %s
; Check that types where the store/allocation sizes don't match the type size
; don't crash.
define <7 x i9> @load_elem_i9_access_7xi9() {
; CHECK-LABEL: @load_elem_i9_access_7xi9(
; CHECK-NEXT: [[P:%.*]] = alloca <16 x i9>, align 1, addrspace(5)
; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4
; CHECK-NEXT: [[L:%.*]] = load <7 x i9>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <7 x i9> [[L]]
;
%p = alloca <16 x i9>, align 1, addrspace(5)
%g = getelementptr i8, ptr addrspace(5) %p, i64 4
%l = load <7 x i9>, ptr addrspace(5) %g, align 1
ret <7 x i9> %l
}
define <8 x i1> @load_elem_i1_access_8xi1() {
; CHECK-LABEL: @load_elem_i1_access_8xi1(
; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5)
; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4
; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <8 x i1> [[L]]
;
%p = alloca <16 x i1>, align 1, addrspace(5)
%g = getelementptr i8, ptr addrspace(5) %p, i64 4
%l = load <8 x i1>, ptr addrspace(5) %g, align 1
ret <8 x i1> %l
}
define <3 x i1> @load_elem_i1_access_3xi1() {
; CHECK-LABEL: @load_elem_i1_access_3xi1(
; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5)
; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4
; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <3 x i1> [[L]]
;
%p = alloca <16 x i1>, align 1, addrspace(5)
%g = getelementptr i8, ptr addrspace(5) %p, i64 4
%l = load <3 x i1>, ptr addrspace(5) %g, align 1
ret <3 x i1> %l
}
define <3 x i1> @load_elem_i8_access_3xi1() {
; CHECK-LABEL: @load_elem_i8_access_3xi1(
; CHECK-NEXT: [[P:%.*]] = alloca <8 x i8>, align 1, addrspace(5)
; CHECK-NEXT: store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) [[P]], align 1
; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1
; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <3 x i1> [[L]]
;
%p = alloca <8 x i8>, align 1, addrspace(5)
store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1
%g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1
%l = load <3 x i1>, ptr addrspace(5) %g, align 1
ret <3 x i1> %l
}
; This one is actually not problematic.
define <8 x i1> @load_elem_i8_access_8xi1() {
; CHECK-LABEL: @load_elem_i8_access_8xi1(
; CHECK-NEXT: [[P:%.*]] = freeze <8 x i8> poison
; CHECK-NEXT: ret <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>
;
%p = alloca <8 x i8>, align 1, addrspace(5)
store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1
%g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1
%l = load <8 x i1>, ptr addrspace(5) %g, align 1
ret <8 x i1> %l
}
define <8 x i1> @storeload_elem_i1_access_8xi1() {
; CHECK-LABEL: @storeload_elem_i1_access_8xi1(
; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5)
; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4
; CHECK-NEXT: store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <8 x i1> [[L]]
;
%p = alloca <16 x i1>, align 1, addrspace(5)
%g = getelementptr i8, ptr addrspace(5) %p, i64 4
store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) %g, align 1
%l = load <8 x i1>, ptr addrspace(5) %g, align 1
ret <8 x i1> %l
}
define <3 x i1> @storeload_elem_i1_access_3xi1() {
; CHECK-LABEL: @storeload_elem_i1_access_3xi1(
; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5)
; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4
; CHECK-NEXT: store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <3 x i1> [[L]]
;
%p = alloca <16 x i1>, align 1, addrspace(5)
%g = getelementptr i8, ptr addrspace(5) %p, i64 4
store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) %g, align 1
%l = load <3 x i1>, ptr addrspace(5) %g, align 1
ret <3 x i1> %l
}
define <3 x i1> @storeload_elem_i8_access_3xi1() {
; CHECK-LABEL: @storeload_elem_i8_access_3xi1(
; CHECK-NEXT: [[P:%.*]] = alloca <8 x i8>, align 1, addrspace(5)
; CHECK-NEXT: store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) [[P]], align 1
; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1
; CHECK-NEXT: store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <3 x i1> [[L]]
;
%p = alloca <8 x i8>, align 1, addrspace(5)
store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1
%g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1
store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) %g, align 1
%l = load <3 x i1>, ptr addrspace(5) %g, align 1
ret <3 x i1> %l
}
; This one is actually not problematic.
define <8 x i1> @storeload_elem_i8_access_8xi1() {
; CHECK-LABEL: @storeload_elem_i8_access_8xi1(
; CHECK-NEXT: [[P:%.*]] = freeze <8 x i8> poison
; CHECK-NEXT: ret <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>
;
%p = alloca <8 x i8>, align 1, addrspace(5)
store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1
%g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1
store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) %g, align 1
%l = load <8 x i1>, ptr addrspace(5) %g, align 1
ret <8 x i1> %l
}
define <8 x i1> @array_of_vec_elem_i1_access_8xi1() {
; CHECK-LABEL: @array_of_vec_elem_i1_access_8xi1(
; CHECK-NEXT: [[P:%.*]] = alloca [2 x <16 x i1>], align 1, addrspace(5)
; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4
; CHECK-NEXT: store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <8 x i1> [[L]]
;
%p = alloca [2 x <16 x i1>], align 1, addrspace(5)
%g = getelementptr i8, ptr addrspace(5) %p, i64 4
store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) %g, align 1
%l = load <8 x i1>, ptr addrspace(5) %g, align 1
ret <8 x i1> %l
}
define <3 x i1> @array_of_vec_elem_i1_access_3xi1() {
; CHECK-LABEL: @array_of_vec_elem_i1_access_3xi1(
; CHECK-NEXT: [[P:%.*]] = alloca [2 x <16 x i1>], align 1, addrspace(5)
; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4
; CHECK-NEXT: store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <3 x i1> [[L]]
;
%p = alloca [2 x <16 x i1>], align 1, addrspace(5)
%g = getelementptr i8, ptr addrspace(5) %p, i64 4
store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) %g, align 1
%l = load <3 x i1>, ptr addrspace(5) %g, align 1
ret <3 x i1> %l
}
define <3 x i1> @array_of_vec_elem_i8_access_3xi1() {
; CHECK-LABEL: @array_of_vec_elem_i8_access_3xi1(
; CHECK-NEXT: [[P:%.*]] = alloca [2 x <8 x i8>], align 1, addrspace(5)
; CHECK-NEXT: store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) [[P]], align 1
; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1
; CHECK-NEXT: store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1
; CHECK-NEXT: ret <3 x i1> [[L]]
;
%p = alloca [2 x <8 x i8>], align 1, addrspace(5)
store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1
%g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1
store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) %g, align 1
%l = load <3 x i1>, ptr addrspace(5) %g, align 1
ret <3 x i1> %l
}
; This one is actually not problematic.
define <8 x i1> @array_of_vec_elem_i8_access_8xi1() {
; CHECK-LABEL: @array_of_vec_elem_i8_access_8xi1(
; CHECK-NEXT: [[P:%.*]] = freeze <16 x i8> poison
; CHECK-NEXT: [[TMP1:%.*]] = insertelement <16 x i8> [[P]], i8 1, i32 0
; CHECK-NEXT: [[TMP2:%.*]] = insertelement <16 x i8> [[TMP1]], i8 2, i32 1
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <16 x i8> [[TMP2]], i8 3, i32 2
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <16 x i8> [[TMP3]], i8 4, i32 3
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <16 x i8> [[TMP4]], i8 5, i32 4
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <16 x i8> [[TMP5]], i8 6, i32 5
; CHECK-NEXT: [[TMP7:%.*]] = insertelement <16 x i8> [[TMP6]], i8 7, i32 6
; CHECK-NEXT: [[TMP8:%.*]] = insertelement <16 x i8> [[TMP7]], i8 8, i32 7
; CHECK-NEXT: [[TMP9:%.*]] = insertelement <16 x i8> [[TMP8]], i8 5, i32 4
; CHECK-NEXT: ret <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>
;
%p = alloca [2 x <8 x i8>], align 1, addrspace(5)
store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1
%g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1
store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) %g, align 1
%l = load <8 x i1>, ptr addrspace(5) %g, align 1
ret <8 x i1> %l
}