| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5 |
| ; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -loop-reduce %s | FileCheck %s |
| |
| ; Test for assert resulting from inconsistent isLegalAddressingMode |
| ; answers when the address space was dropped from the query. |
| |
| %0 = type { i32, double, i32, float } |
| |
| |
| define amdgpu_kernel void @lsr_crash_preserve_addrspace_unknown_type() #0 { |
| ; CHECK-LABEL: define amdgpu_kernel void @lsr_crash_preserve_addrspace_unknown_type( |
| ; CHECK-SAME: ) #[[ATTR0:[0-9]+]] { |
| ; CHECK-NEXT: [[BB:.*]]: |
| ; CHECK-NEXT: br label %[[BB1:.*]] |
| ; CHECK: [[BB1]]: |
| ; CHECK-NEXT: [[TMP:%.*]] = phi ptr addrspace(3) [ undef, %[[BB]] ], [ [[TMP18:%.*]], %[[BB17:.*]] ] |
| ; CHECK-NEXT: [[SCEVGEP1:%.*]] = getelementptr i8, ptr addrspace(3) [[TMP]], i32 8 |
| ; CHECK-NEXT: [[TMP3:%.*]] = load double, ptr addrspace(3) [[SCEVGEP1]], align 8 |
| ; CHECK-NEXT: br label %[[BB4:.*]] |
| ; CHECK: [[BB4]]: |
| ; CHECK-NEXT: br i1 false, label %[[BB8:.*]], label %[[BB5:.*]] |
| ; CHECK: [[BB5]]: |
| ; CHECK-NEXT: unreachable |
| ; CHECK: [[BB8]]: |
| ; CHECK-NEXT: [[TMP10:%.*]] = load i32, ptr addrspace(3) [[TMP]], align 4 |
| ; CHECK-NEXT: [[TMP11:%.*]] = icmp eq i32 0, [[TMP10]] |
| ; CHECK-NEXT: br i1 [[TMP11]], label %[[BB12:.*]], label %[[BB17]] |
| ; CHECK: [[BB12]]: |
| ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr addrspace(3) [[TMP]], i32 16 |
| ; CHECK-NEXT: [[TMP14:%.*]] = load i32, ptr addrspace(3) [[SCEVGEP]], align 4 |
| ; CHECK-NEXT: [[TMP15:%.*]] = icmp eq i32 0, [[TMP14]] |
| ; CHECK-NEXT: br i1 [[TMP15]], label %[[BB16:.*]], label %[[BB17]] |
| ; CHECK: [[BB16]]: |
| ; CHECK-NEXT: unreachable |
| ; CHECK: [[BB17]]: |
| ; CHECK-NEXT: [[TMP18]] = getelementptr inbounds [[TMP0:%.*]], ptr addrspace(3) [[TMP]], i64 2 |
| ; CHECK-NEXT: br label %[[BB1]] |
| ; |
| bb: |
| br label %bb1 |
| |
| bb1: ; preds = %bb17, %bb |
| %tmp = phi ptr addrspace(3) [ undef, %bb ], [ %tmp18, %bb17 ] |
| %tmp2 = getelementptr inbounds %0, ptr addrspace(3) %tmp, i64 0, i32 1 |
| %tmp3 = load double, ptr addrspace(3) %tmp2, align 8 |
| br label %bb4 |
| |
| bb4: ; preds = %bb1 |
| br i1 false, label %bb8, label %bb5 |
| |
| bb5: ; preds = %bb4 |
| unreachable |
| |
| bb8: ; preds = %bb4 |
| %tmp10 = load i32, ptr addrspace(3) %tmp, align 4 |
| %tmp11 = icmp eq i32 0, %tmp10 |
| br i1 %tmp11, label %bb12, label %bb17 |
| |
| bb12: ; preds = %bb8 |
| %tmp13 = getelementptr inbounds %0, ptr addrspace(3) %tmp, i64 0, i32 2 |
| %tmp14 = load i32, ptr addrspace(3) %tmp13, align 4 |
| %tmp15 = icmp eq i32 0, %tmp14 |
| br i1 %tmp15, label %bb16, label %bb17 |
| |
| bb16: ; preds = %bb12 |
| unreachable |
| |
| bb17: ; preds = %bb12, %bb8 |
| %tmp18 = getelementptr inbounds %0, ptr addrspace(3) %tmp, i64 2 |
| br label %bb1 |
| } |
| |
| define void @lsr_crash_preserve_addrspace_unknown_type2(ptr addrspace(5) %array, ptr addrspace(3) %array2) { |
| ; CHECK-LABEL: define void @lsr_crash_preserve_addrspace_unknown_type2( |
| ; CHECK-SAME: ptr addrspace(5) [[ARRAY:%.*]], ptr addrspace(3) [[ARRAY2:%.*]]) { |
| ; CHECK-NEXT: [[ENTRY:.*]]: |
| ; CHECK-NEXT: br label %[[FOR_BODY:.*]] |
| ; CHECK: [[FOR_BODY]]: |
| ; CHECK-NEXT: [[J:%.*]] = phi i32 [ [[ADD:%.*]], %[[FOR_INC:.*]] ], [ 0, %[[ENTRY]] ] |
| ; CHECK-NEXT: [[IDX:%.*]] = getelementptr i8, ptr addrspace(5) [[ARRAY]], i32 [[J]] |
| ; CHECK-NEXT: [[IDX1:%.*]] = getelementptr i8, ptr addrspace(3) [[ARRAY2]], i32 [[J]] |
| ; CHECK-NEXT: [[T:%.*]] = getelementptr i8, ptr addrspace(5) [[ARRAY]], i32 [[J]] |
| ; CHECK-NEXT: [[N8:%.*]] = load i8, ptr addrspace(5) [[T]], align 4 |
| ; CHECK-NEXT: [[N7:%.*]] = getelementptr i8, ptr addrspace(5) [[T]], i32 42 |
| ; CHECK-NEXT: [[N9:%.*]] = load i8, ptr addrspace(5) [[N7]], align 4 |
| ; CHECK-NEXT: [[CMP:%.*]] = icmp sgt i32 [[J]], 42 |
| ; CHECK-NEXT: br i1 [[CMP]], label %[[IF_THEN17:.*]], label %[[FOR_INC]] |
| ; CHECK: [[IF_THEN17]]: |
| ; CHECK-NEXT: call void @llvm.memcpy.p5.p3.i64(ptr addrspace(5) [[IDX]], ptr addrspace(3) [[IDX1]], i64 42, i1 false) |
| ; CHECK-NEXT: call void @llvm.memmove.p5.p3.i64(ptr addrspace(5) [[IDX]], ptr addrspace(3) [[IDX1]], i64 42, i1 false) |
| ; CHECK-NEXT: call void @llvm.memset.p5.i64(ptr addrspace(5) [[IDX]], i8 42, i64 42, i1 false) |
| ; CHECK-NEXT: br label %[[FOR_INC]] |
| ; CHECK: [[FOR_INC]]: |
| ; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i1 [[CMP]], true |
| ; CHECK-NEXT: [[ADD]] = add nuw nsw i32 [[J]], 1 |
| ; CHECK-NEXT: br i1 [[EXITCOND]], label %[[END:.*]], label %[[FOR_BODY]] |
| ; CHECK: [[END]]: |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| br label %for.body |
| |
| for.body: ; preds = %entry, %for.inc |
| %j = phi i32 [ %add, %for.inc ], [ 0, %entry ] |
| %idx = getelementptr inbounds i8, ptr addrspace(5) %array, i32 %j |
| %idx1 = getelementptr inbounds i8, ptr addrspace(3) %array2, i32 %j |
| %t = getelementptr inbounds i8, ptr addrspace(5) %array, i32 %j |
| %n8 = load i8, ptr addrspace(5) %t, align 4 |
| %n7 = getelementptr inbounds i8, ptr addrspace(5) %t, i32 42 |
| %n9 = load i8, ptr addrspace(5) %n7, align 4 |
| %cmp = icmp sgt i32 %j, 42 |
| %add = add nuw nsw i32 %j, 1 |
| br i1 %cmp, label %if.then17, label %for.inc |
| |
| if.then17: ; preds = %for.body |
| call void @llvm.memcpy.p5.p5.i64(ptr addrspace(5) %idx, ptr addrspace(3) %idx1, i64 42, i1 false) |
| call void @llvm.memmove.p5.p5.i64(ptr addrspace(5) %idx, ptr addrspace(3) %idx1, i64 42, i1 false) |
| call void @llvm.memset.p5.i64(ptr addrspace(5) %idx, i8 42, i64 42, i1 false) |
| br label %for.inc |
| |
| for.inc: ; preds = %for.body, %if.then17 |
| %exitcond = icmp eq i1 %cmp, 1 |
| br i1 %exitcond, label %end, label %for.body |
| |
| end: ; preds = %for.inc |
| ret void |
| } |
| |
| declare void @llvm.memcpy.p5.p5.i64(ptr addrspace(5), ptr addrspace(3), i64, i1) |
| declare void @llvm.memmove.p5.p5.i64(ptr addrspace(5), ptr addrspace(3), i64, i1) |
| declare void @llvm.memset.p5.i64(ptr addrspace(5), i8, i64, i1) |
| |
| attributes #0 = { nounwind } |
| attributes #1 = { nounwind readnone } |