blob: 3787452db194373d2088af5508801d8c8594808b [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -mtriple=amdgcn -passes=instcombine -S | FileCheck %s --check-prefixes=CHECK,DEFAULT
; RUN: opt < %s -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -passes=instcombine -S | FileCheck %s --check-prefixes=CHECK,GFX9
; RUN: opt < %s -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1010 -passes=instcombine -S | FileCheck %s --check-prefixes=CHECK,GFX10
; RUN: opt < %s -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 -passes=instcombine -S | FileCheck %s --check-prefixes=CHECK,GFX11
; Test that the m0 operand is folded to poison for message types that don't use it.
; For the default target (no mcpu), conflicting encodings (IDs 2, 3) should NOT be folded.
; MSG_INTERRUPT (1) DOES use m0 - should NOT be folded
define void @test_sendmsg_interrupt(i32 %val) {
; CHECK-LABEL: @test_sendmsg_interrupt(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 1, i32 [[VAL:%.*]])
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 1, i32 %val)
ret void
}
; MSG_GS (2) + GS_OP_EMIT (2 << 4) DOES use m0 (pre-GFX11) - should NOT be folded
; On GFX11+ this is MSG_HS_TESSFACTOR which also uses m0 - should NOT be folded
; On default target, this should NOT be folded (conflicting encoding)
define void @test_sendmsg_gs_emit(i32 %val) {
; DEFAULT-LABEL: @test_sendmsg_gs_emit(
; DEFAULT-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 34, i32 [[VAL:%.*]])
; DEFAULT-NEXT: ret void
;
; GFX9-LABEL: @test_sendmsg_gs_emit(
; GFX9-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 34, i32 [[VAL:%.*]])
; GFX9-NEXT: ret void
;
; GFX10-LABEL: @test_sendmsg_gs_emit(
; GFX10-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 34, i32 [[VAL:%.*]])
; GFX10-NEXT: ret void
;
; GFX11-LABEL: @test_sendmsg_gs_emit(
; GFX11-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 34, i32 [[VAL:%.*]])
; GFX11-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 34, i32 %val)
ret void
}
; MSG_GS_DONE (3) DOES use m0 (pre-GFX11) - should NOT be folded
; On GFX11+ this is ID_DEALLOC_VGPRS which doesn't use m0
; On default target, this should NOT be folded (conflicting encoding)
define void @test_sendmsg_gs_done(i32 %val) {
; DEFAULT-LABEL: @test_sendmsg_gs_done(
; DEFAULT-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 3, i32 [[VAL:%.*]])
; DEFAULT-NEXT: ret void
;
; GFX9-LABEL: @test_sendmsg_gs_done(
; GFX9-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 3, i32 [[VAL:%.*]])
; GFX9-NEXT: ret void
;
; GFX10-LABEL: @test_sendmsg_gs_done(
; GFX10-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 3, i32 [[VAL:%.*]])
; GFX10-NEXT: ret void
;
; GFX11-LABEL: @test_sendmsg_gs_done(
; GFX11-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 3, i32 poison)
; GFX11-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 3, i32 %val)
ret void
}
; MSG_SAVEWAVE (4) doesn't use m0 (GFX8-GFX10)
define void @test_sendmsg_savewave(i32 %val) {
; CHECK-LABEL: @test_sendmsg_savewave(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 4, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 4, i32 %val)
ret void
}
; MSG_STALL_WAVE_GEN (5) doesn't use m0 (GFX9-GFX11)
define void @test_sendmsg_stall_wave_gen(i32 %val) {
; CHECK-LABEL: @test_sendmsg_stall_wave_gen(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 5, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 5, i32 %val)
ret void
}
; MSG_HALT_WAVES (6) doesn't use m0 (GFX9-GFX11)
define void @test_sendmsg_halt_waves(i32 %val) {
; CHECK-LABEL: @test_sendmsg_halt_waves(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 6, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 6, i32 %val)
ret void
}
; MSG_ORDERED_PS_DONE (7) doesn't use m0 (GFX9-GFX10)
define void @test_sendmsg_ordered_ps_done(i32 %val) {
; CHECK-LABEL: @test_sendmsg_ordered_ps_done(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 7, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 7, i32 %val)
ret void
}
; MSG_EARLY_PRIM_DEALLOC (8) doesn't use m0 (GFX9 only)
define void @test_sendmsg_early_prim_dealloc(i32 %val) {
; CHECK-LABEL: @test_sendmsg_early_prim_dealloc(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 8, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 8, i32 %val)
ret void
}
; MSG_GS_ALLOC_REQ (9) DOES use m0 - should NOT be folded
define void @test_sendmsg_gs_alloc_req(i32 %val) {
; CHECK-LABEL: @test_sendmsg_gs_alloc_req(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 9, i32 [[VAL:%.*]])
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 9, i32 %val)
ret void
}
; MSG_GET_DOORBELL (10) doesn't use m0 (GFX9-GFX10)
define void @test_sendmsg_get_doorbell(i32 %val) {
; CHECK-LABEL: @test_sendmsg_get_doorbell(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 10, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 10, i32 %val)
ret void
}
; MSG_GET_DDID (11) doesn't use m0 (GFX10 only)
define void @test_sendmsg_get_ddid(i32 %val) {
; CHECK-LABEL: @test_sendmsg_get_ddid(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 11, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 11, i32 %val)
ret void
}
; MSG_SYSMSG (15) doesn't use m0
define void @test_sendmsg_sysmsg(i32 %val) {
; CHECK-LABEL: @test_sendmsg_sysmsg(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 15, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 15, i32 %val)
ret void
}
; Test sendmsghalt as well - MSG_INTERRUPT (1) DOES use m0 - should NOT be folded
define void @test_sendmsghalt_interrupt(i32 %val) {
; CHECK-LABEL: @test_sendmsghalt_interrupt(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsghalt(i32 1, i32 [[VAL:%.*]])
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsghalt(i32 1, i32 %val)
ret void
}
; Test sendmsghalt - MSG_GS_ALLOC_REQ (9) DOES use m0 - should NOT be folded
define void @test_sendmsghalt_gs_alloc_req(i32 %val) {
; CHECK-LABEL: @test_sendmsghalt_gs_alloc_req(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsghalt(i32 9, i32 [[VAL:%.*]])
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsghalt(i32 9, i32 %val)
ret void
}
; m0 already poison - should be a no-op
define void @test_sendmsg_already_poison() {
; CHECK-LABEL: @test_sendmsg_already_poison(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 1, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 1, i32 poison)
ret void
}
; Test that noundef attribute is dropped when folding to poison
; Using MSG_SAVEWAVE (4) which doesn't use m0
define void @test_sendmsg_noundef(i32 noundef %val) {
; CHECK-LABEL: @test_sendmsg_noundef(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 4, i32 poison)
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 4, i32 noundef %val)
ret void
}
; Test unknown message ID - should NOT be folded (future-proofing)
define void @test_sendmsg_unknown_id(i32 %val) {
; CHECK-LABEL: @test_sendmsg_unknown_id(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 14, i32 [[VAL:%.*]])
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 14, i32 %val)
ret void
}
; Test MSG_HS_TESSFACTOR (2) on GFX11+ - DOES use m0, should NOT be folded
; On pre-GFX11, this is MSG_GS which also uses m0
define void @test_sendmsg_hs_tessfactor(i32 %val) {
; CHECK-LABEL: @test_sendmsg_hs_tessfactor(
; CHECK-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 2, i32 [[VAL:%.*]])
; CHECK-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 2, i32 %val)
ret void
}
; Test MSG_DEALLOC_VGPRS (3) on GFX11+ - doesn't use m0
; On default target, this should NOT be folded (conflicting encoding with MSG_GS_DONE)
define void @test_sendmsg_dealloc_vgprs(i32 %val) {
; DEFAULT-LABEL: @test_sendmsg_dealloc_vgprs(
; DEFAULT-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 3, i32 [[VAL:%.*]])
; DEFAULT-NEXT: ret void
;
; GFX9-LABEL: @test_sendmsg_dealloc_vgprs(
; GFX9-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 3, i32 [[VAL:%.*]])
; GFX9-NEXT: ret void
;
; GFX10-LABEL: @test_sendmsg_dealloc_vgprs(
; GFX10-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 3, i32 [[VAL:%.*]])
; GFX10-NEXT: ret void
;
; GFX11-LABEL: @test_sendmsg_dealloc_vgprs(
; GFX11-NEXT: call void @llvm.amdgcn.s.sendmsg(i32 3, i32 poison)
; GFX11-NEXT: ret void
;
call void @llvm.amdgcn.s.sendmsg(i32 3, i32 %val)
ret void
}
declare void @llvm.amdgcn.s.sendmsg(i32 immarg, i32)
declare void @llvm.amdgcn.s.sendmsghalt(i32 immarg, i32)