| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py |
| ; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-promote-alloca < %s | FileCheck %s |
| |
| ; Check that types where the store/allocation sizes don't match the type size |
| ; don't crash. |
| |
| |
| define <7 x i9> @load_elem_i9_access_7xi9() { |
| ; CHECK-LABEL: @load_elem_i9_access_7xi9( |
| ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i9>, align 1, addrspace(5) |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 |
| ; CHECK-NEXT: [[L:%.*]] = load <7 x i9>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <7 x i9> [[L]] |
| ; |
| %p = alloca <16 x i9>, align 1, addrspace(5) |
| %g = getelementptr i8, ptr addrspace(5) %p, i64 4 |
| %l = load <7 x i9>, ptr addrspace(5) %g, align 1 |
| ret <7 x i9> %l |
| } |
| |
| define <8 x i1> @load_elem_i1_access_8xi1() { |
| ; CHECK-LABEL: @load_elem_i1_access_8xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5) |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 |
| ; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <8 x i1> [[L]] |
| ; |
| %p = alloca <16 x i1>, align 1, addrspace(5) |
| %g = getelementptr i8, ptr addrspace(5) %p, i64 4 |
| %l = load <8 x i1>, ptr addrspace(5) %g, align 1 |
| ret <8 x i1> %l |
| } |
| |
| define <3 x i1> @load_elem_i1_access_3xi1() { |
| ; CHECK-LABEL: @load_elem_i1_access_3xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5) |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 |
| ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <3 x i1> [[L]] |
| ; |
| %p = alloca <16 x i1>, align 1, addrspace(5) |
| %g = getelementptr i8, ptr addrspace(5) %p, i64 4 |
| %l = load <3 x i1>, ptr addrspace(5) %g, align 1 |
| ret <3 x i1> %l |
| } |
| |
| define <3 x i1> @load_elem_i8_access_3xi1() { |
| ; CHECK-LABEL: @load_elem_i8_access_3xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca <8 x i8>, align 1, addrspace(5) |
| ; CHECK-NEXT: store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) [[P]], align 1 |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1 |
| ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <3 x i1> [[L]] |
| ; |
| %p = alloca <8 x i8>, align 1, addrspace(5) |
| store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1 |
| %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 |
| %l = load <3 x i1>, ptr addrspace(5) %g, align 1 |
| ret <3 x i1> %l |
| } |
| |
| ; This one is actually not problematic. |
| define <8 x i1> @load_elem_i8_access_8xi1() { |
| ; CHECK-LABEL: @load_elem_i8_access_8xi1( |
| ; CHECK-NEXT: [[P:%.*]] = freeze <8 x i8> poison |
| ; CHECK-NEXT: ret <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false> |
| ; |
| %p = alloca <8 x i8>, align 1, addrspace(5) |
| store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1 |
| %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 |
| %l = load <8 x i1>, ptr addrspace(5) %g, align 1 |
| ret <8 x i1> %l |
| } |
| |
| define <8 x i1> @storeload_elem_i1_access_8xi1() { |
| ; CHECK-LABEL: @storeload_elem_i1_access_8xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5) |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 |
| ; CHECK-NEXT: store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <8 x i1> [[L]] |
| ; |
| %p = alloca <16 x i1>, align 1, addrspace(5) |
| %g = getelementptr i8, ptr addrspace(5) %p, i64 4 |
| store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) %g, align 1 |
| %l = load <8 x i1>, ptr addrspace(5) %g, align 1 |
| ret <8 x i1> %l |
| } |
| |
| define <3 x i1> @storeload_elem_i1_access_3xi1() { |
| ; CHECK-LABEL: @storeload_elem_i1_access_3xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5) |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 |
| ; CHECK-NEXT: store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <3 x i1> [[L]] |
| ; |
| %p = alloca <16 x i1>, align 1, addrspace(5) |
| %g = getelementptr i8, ptr addrspace(5) %p, i64 4 |
| store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) %g, align 1 |
| %l = load <3 x i1>, ptr addrspace(5) %g, align 1 |
| ret <3 x i1> %l |
| } |
| |
| define <3 x i1> @storeload_elem_i8_access_3xi1() { |
| ; CHECK-LABEL: @storeload_elem_i8_access_3xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca <8 x i8>, align 1, addrspace(5) |
| ; CHECK-NEXT: store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) [[P]], align 1 |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1 |
| ; CHECK-NEXT: store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <3 x i1> [[L]] |
| ; |
| %p = alloca <8 x i8>, align 1, addrspace(5) |
| store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1 |
| %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 |
| store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) %g, align 1 |
| %l = load <3 x i1>, ptr addrspace(5) %g, align 1 |
| ret <3 x i1> %l |
| } |
| |
| ; This one is actually not problematic. |
| define <8 x i1> @storeload_elem_i8_access_8xi1() { |
| ; CHECK-LABEL: @storeload_elem_i8_access_8xi1( |
| ; CHECK-NEXT: [[P:%.*]] = freeze <8 x i8> poison |
| ; CHECK-NEXT: ret <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false> |
| ; |
| %p = alloca <8 x i8>, align 1, addrspace(5) |
| store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1 |
| %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 |
| store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) %g, align 1 |
| %l = load <8 x i1>, ptr addrspace(5) %g, align 1 |
| ret <8 x i1> %l |
| } |
| |
| define <8 x i1> @array_of_vec_elem_i1_access_8xi1() { |
| ; CHECK-LABEL: @array_of_vec_elem_i1_access_8xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca [2 x <16 x i1>], align 1, addrspace(5) |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 |
| ; CHECK-NEXT: store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <8 x i1> [[L]] |
| ; |
| %p = alloca [2 x <16 x i1>], align 1, addrspace(5) |
| %g = getelementptr i8, ptr addrspace(5) %p, i64 4 |
| store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) %g, align 1 |
| %l = load <8 x i1>, ptr addrspace(5) %g, align 1 |
| ret <8 x i1> %l |
| } |
| |
| define <3 x i1> @array_of_vec_elem_i1_access_3xi1() { |
| ; CHECK-LABEL: @array_of_vec_elem_i1_access_3xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca [2 x <16 x i1>], align 1, addrspace(5) |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 |
| ; CHECK-NEXT: store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <3 x i1> [[L]] |
| ; |
| %p = alloca [2 x <16 x i1>], align 1, addrspace(5) |
| %g = getelementptr i8, ptr addrspace(5) %p, i64 4 |
| store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) %g, align 1 |
| %l = load <3 x i1>, ptr addrspace(5) %g, align 1 |
| ret <3 x i1> %l |
| } |
| |
| define <3 x i1> @array_of_vec_elem_i8_access_3xi1() { |
| ; CHECK-LABEL: @array_of_vec_elem_i8_access_3xi1( |
| ; CHECK-NEXT: [[P:%.*]] = alloca [2 x <8 x i8>], align 1, addrspace(5) |
| ; CHECK-NEXT: store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) [[P]], align 1 |
| ; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1 |
| ; CHECK-NEXT: store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 |
| ; CHECK-NEXT: ret <3 x i1> [[L]] |
| ; |
| %p = alloca [2 x <8 x i8>], align 1, addrspace(5) |
| store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1 |
| %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 |
| store <3 x i1> <i1 true, i1 false, i1 true>, ptr addrspace(5) %g, align 1 |
| %l = load <3 x i1>, ptr addrspace(5) %g, align 1 |
| ret <3 x i1> %l |
| } |
| |
| ; This one is actually not problematic. |
| define <8 x i1> @array_of_vec_elem_i8_access_8xi1() { |
| ; CHECK-LABEL: @array_of_vec_elem_i8_access_8xi1( |
| ; CHECK-NEXT: [[P:%.*]] = freeze <16 x i8> poison |
| ; CHECK-NEXT: [[TMP1:%.*]] = insertelement <16 x i8> [[P]], i8 1, i32 0 |
| ; CHECK-NEXT: [[TMP2:%.*]] = insertelement <16 x i8> [[TMP1]], i8 2, i32 1 |
| ; CHECK-NEXT: [[TMP3:%.*]] = insertelement <16 x i8> [[TMP2]], i8 3, i32 2 |
| ; CHECK-NEXT: [[TMP4:%.*]] = insertelement <16 x i8> [[TMP3]], i8 4, i32 3 |
| ; CHECK-NEXT: [[TMP5:%.*]] = insertelement <16 x i8> [[TMP4]], i8 5, i32 4 |
| ; CHECK-NEXT: [[TMP6:%.*]] = insertelement <16 x i8> [[TMP5]], i8 6, i32 5 |
| ; CHECK-NEXT: [[TMP7:%.*]] = insertelement <16 x i8> [[TMP6]], i8 7, i32 6 |
| ; CHECK-NEXT: [[TMP8:%.*]] = insertelement <16 x i8> [[TMP7]], i8 8, i32 7 |
| ; CHECK-NEXT: [[TMP9:%.*]] = insertelement <16 x i8> [[TMP8]], i8 5, i32 4 |
| ; CHECK-NEXT: ret <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false> |
| ; |
| %p = alloca [2 x <8 x i8>], align 1, addrspace(5) |
| store <8 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, ptr addrspace(5) %p, align 1 |
| %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 |
| store <8 x i1> <i1 true, i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false>, ptr addrspace(5) %g, align 1 |
| %l = load <8 x i1>, ptr addrspace(5) %g, align 1 |
| ret <8 x i1> %l |
| } |