| # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py |
| # RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx900 -run-pass=legalizer %s -o - | FileCheck -check-prefix=GFX9 %s |
| # RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx1200 -mattr=-real-true16 -run-pass=legalizer %s -o - | FileCheck -check-prefixes=GFX12 %s |
| |
| --- |
| # Scalar s16 G_FMINIMUM whose operands are truncated from $vgpr0 and $vgpr1. |
| # GFX9 checks expect G_FMINNUM_IEEE, then a G_FCMP floatpred(ord) on the |
| # original operands selecting between that result and the constant |
| # `half 0xH7E00`. |
| # GFX12 checks expect the s16 G_FMINIMUM to remain in the output as-is. |
| name: test_fminimum_f16 |
| body: | |
| bb.0: |
| liveins: $vgpr0, $vgpr1 |
| |
| ; GFX9-LABEL: name: test_fminimum_f16 |
| ; GFX9: liveins: $vgpr0, $vgpr1 |
| ; GFX9-NEXT: {{ $}} |
| ; GFX9-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX9-NEXT: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32) |
| ; GFX9-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX9-NEXT: [[TRUNC1:%[0-9]+]]:_(s16) = G_TRUNC [[COPY1]](s32) |
| ; GFX9-NEXT: [[FMINNUM_IEEE:%[0-9]+]]:_(s16) = G_FMINNUM_IEEE [[TRUNC]], [[TRUNC1]] |
| ; GFX9-NEXT: [[FCMP:%[0-9]+]]:_(s1) = G_FCMP floatpred(ord), [[TRUNC]](s16), [[TRUNC1]] |
| ; GFX9-NEXT: [[C:%[0-9]+]]:_(s16) = G_FCONSTANT half 0xH7E00 |
| ; GFX9-NEXT: [[SELECT:%[0-9]+]]:_(s16) = G_SELECT [[FCMP]](s1), [[FMINNUM_IEEE]], [[C]] |
| ; GFX9-NEXT: [[COPY2:%[0-9]+]]:_(s16) = COPY [[SELECT]](s16) |
| ; GFX9-NEXT: [[ANYEXT:%[0-9]+]]:_(s32) = G_ANYEXT [[COPY2]](s16) |
| ; GFX9-NEXT: $vgpr0 = COPY [[ANYEXT]](s32) |
| ; GFX9-NEXT: SI_RETURN implicit $vgpr0 |
| ; |
| ; GFX12-LABEL: name: test_fminimum_f16 |
| ; GFX12: liveins: $vgpr0, $vgpr1 |
| ; GFX12-NEXT: {{ $}} |
| ; GFX12-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX12-NEXT: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32) |
| ; GFX12-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX12-NEXT: [[TRUNC1:%[0-9]+]]:_(s16) = G_TRUNC [[COPY1]](s32) |
| ; GFX12-NEXT: [[FMINIMUM:%[0-9]+]]:_(s16) = G_FMINIMUM [[TRUNC]], [[TRUNC1]] |
| ; GFX12-NEXT: [[ANYEXT:%[0-9]+]]:_(s32) = G_ANYEXT [[FMINIMUM]](s16) |
| ; GFX12-NEXT: $vgpr0 = COPY [[ANYEXT]](s32) |
| ; GFX12-NEXT: SI_RETURN implicit $vgpr0 |
| %0:_(s32) = COPY $vgpr0 |
| %1:_(s16) = G_TRUNC %0(s32) |
| %2:_(s32) = COPY $vgpr1 |
| %3:_(s16) = G_TRUNC %2(s32) |
| %4:_(s16) = G_FMINIMUM %1, %3 |
| %5:_(s32) = G_ANYEXT %4(s16) |
| $vgpr0 = COPY %5(s32) |
| SI_RETURN implicit $vgpr0 |
| ... |
| --- |
| # Scalar s32 G_FMINIMUM on $vgpr0 and $vgpr1. |
| # GFX9 checks expect G_FMINNUM_IEEE, then a G_FCMP floatpred(ord) on the same |
| # operands selecting between that result and the constant |
| # `float 0x7FF8000000000000`. |
| # GFX12 checks expect the s32 G_FMINIMUM to remain in the output as-is. |
| name: test_fminimum_f32 |
| body: | |
| bb.0: |
| liveins: $vgpr0, $vgpr1 |
| |
| ; GFX9-LABEL: name: test_fminimum_f32 |
| ; GFX9: liveins: $vgpr0, $vgpr1 |
| ; GFX9-NEXT: {{ $}} |
| ; GFX9-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX9-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX9-NEXT: [[FMINNUM_IEEE:%[0-9]+]]:_(s32) = G_FMINNUM_IEEE [[COPY]], [[COPY1]] |
| ; GFX9-NEXT: [[FCMP:%[0-9]+]]:_(s1) = G_FCMP floatpred(ord), [[COPY]](s32), [[COPY1]] |
| ; GFX9-NEXT: [[C:%[0-9]+]]:_(s32) = G_FCONSTANT float 0x7FF8000000000000 |
| ; GFX9-NEXT: [[SELECT:%[0-9]+]]:_(s32) = G_SELECT [[FCMP]](s1), [[FMINNUM_IEEE]], [[C]] |
| ; GFX9-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY [[SELECT]](s32) |
| ; GFX9-NEXT: $vgpr0 = COPY [[COPY2]](s32) |
| ; GFX9-NEXT: SI_RETURN implicit $vgpr0 |
| ; |
| ; GFX12-LABEL: name: test_fminimum_f32 |
| ; GFX12: liveins: $vgpr0, $vgpr1 |
| ; GFX12-NEXT: {{ $}} |
| ; GFX12-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX12-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX12-NEXT: [[FMINIMUM:%[0-9]+]]:_(s32) = G_FMINIMUM [[COPY]], [[COPY1]] |
| ; GFX12-NEXT: $vgpr0 = COPY [[FMINIMUM]](s32) |
| ; GFX12-NEXT: SI_RETURN implicit $vgpr0 |
| %0:_(s32) = COPY $vgpr0 |
| %1:_(s32) = COPY $vgpr1 |
| %2:_(s32) = G_FMINIMUM %0, %1 |
| $vgpr0 = COPY %2(s32) |
| SI_RETURN implicit $vgpr0 |
| ... |
| --- |
| # Scalar s64 G_FMINIMUM on the register pairs $vgpr0_vgpr1 and $vgpr2_vgpr3. |
| # GFX9 checks expect G_FMINNUM_IEEE, then a G_FCMP floatpred(ord) on the same |
| # operands selecting between that result and the constant |
| # `double 0x7FF8000000000000`. |
| # GFX12 checks expect the s64 G_FMINIMUM to remain in the output as-is. |
| name: test_fminimum_f64 |
| body: | |
| bb.0: |
| liveins: $vgpr0_vgpr1, $vgpr2_vgpr3 |
| |
| ; GFX9-LABEL: name: test_fminimum_f64 |
| ; GFX9: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3 |
| ; GFX9-NEXT: {{ $}} |
| ; GFX9-NEXT: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1 |
| ; GFX9-NEXT: [[COPY1:%[0-9]+]]:_(s64) = COPY $vgpr2_vgpr3 |
| ; GFX9-NEXT: [[FMINNUM_IEEE:%[0-9]+]]:_(s64) = G_FMINNUM_IEEE [[COPY]], [[COPY1]] |
| ; GFX9-NEXT: [[FCMP:%[0-9]+]]:_(s1) = G_FCMP floatpred(ord), [[COPY]](s64), [[COPY1]] |
| ; GFX9-NEXT: [[C:%[0-9]+]]:_(s64) = G_FCONSTANT double 0x7FF8000000000000 |
| ; GFX9-NEXT: [[SELECT:%[0-9]+]]:_(s64) = G_SELECT [[FCMP]](s1), [[FMINNUM_IEEE]], [[C]] |
| ; GFX9-NEXT: [[COPY2:%[0-9]+]]:_(s64) = COPY [[SELECT]](s64) |
| ; GFX9-NEXT: $vgpr0_vgpr1 = COPY [[COPY2]](s64) |
| ; GFX9-NEXT: SI_RETURN implicit $vgpr0_vgpr1 |
| ; |
| ; GFX12-LABEL: name: test_fminimum_f64 |
| ; GFX12: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3 |
| ; GFX12-NEXT: {{ $}} |
| ; GFX12-NEXT: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1 |
| ; GFX12-NEXT: [[COPY1:%[0-9]+]]:_(s64) = COPY $vgpr2_vgpr3 |
| ; GFX12-NEXT: [[FMINIMUM:%[0-9]+]]:_(s64) = G_FMINIMUM [[COPY]], [[COPY1]] |
| ; GFX12-NEXT: $vgpr0_vgpr1 = COPY [[FMINIMUM]](s64) |
| ; GFX12-NEXT: SI_RETURN implicit $vgpr0_vgpr1 |
| %0:_(s64) = COPY $vgpr0_vgpr1 |
| %1:_(s64) = COPY $vgpr2_vgpr3 |
| %2:_(s64) = G_FMINIMUM %0, %1 |
| $vgpr0_vgpr1 = COPY %2(s64) |
| SI_RETURN implicit $vgpr0_vgpr1 |
| ... |
| --- |
| # Packed <2 x s16> G_FMINIMUM on $vgpr0 and $vgpr1. |
| # GFX9 checks expect one <2 x s16> G_FMINNUM_IEEE, while the ordered compare |
| # and select are done per s16 element: each vector is split with |
| # G_BITCAST / G_LSHR by 16 / G_TRUNC, the two G_SELECTs pick between the |
| # min element and `half 0xH7E00`, and G_BUILD_VECTOR reassembles the result. |
| # GFX12 checks expect the <2 x s16> G_FMINIMUM to remain in the output as-is. |
| name: test_fminimum_v2f16 |
| body: | |
| bb.0: |
| liveins: $vgpr0, $vgpr1 |
| |
| ; GFX9-LABEL: name: test_fminimum_v2f16 |
| ; GFX9: liveins: $vgpr0, $vgpr1 |
| ; GFX9-NEXT: {{ $}} |
| ; GFX9-NEXT: [[COPY:%[0-9]+]]:_(<2 x s16>) = COPY $vgpr0 |
| ; GFX9-NEXT: [[COPY1:%[0-9]+]]:_(<2 x s16>) = COPY $vgpr1 |
| ; GFX9-NEXT: [[FMINNUM_IEEE:%[0-9]+]]:_(<2 x s16>) = G_FMINNUM_IEEE [[COPY]], [[COPY1]] |
| ; GFX9-NEXT: [[BITCAST:%[0-9]+]]:_(s32) = G_BITCAST [[COPY]](<2 x s16>) |
| ; GFX9-NEXT: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[BITCAST]](s32) |
| ; GFX9-NEXT: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 16 |
| ; GFX9-NEXT: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[BITCAST]], [[C]](s32) |
| ; GFX9-NEXT: [[TRUNC1:%[0-9]+]]:_(s16) = G_TRUNC [[LSHR]](s32) |
| ; GFX9-NEXT: [[BITCAST1:%[0-9]+]]:_(s32) = G_BITCAST [[COPY1]](<2 x s16>) |
| ; GFX9-NEXT: [[TRUNC2:%[0-9]+]]:_(s16) = G_TRUNC [[BITCAST1]](s32) |
| ; GFX9-NEXT: [[LSHR1:%[0-9]+]]:_(s32) = G_LSHR [[BITCAST1]], [[C]](s32) |
| ; GFX9-NEXT: [[TRUNC3:%[0-9]+]]:_(s16) = G_TRUNC [[LSHR1]](s32) |
| ; GFX9-NEXT: [[FCMP:%[0-9]+]]:_(s1) = G_FCMP floatpred(ord), [[TRUNC]](s16), [[TRUNC2]] |
| ; GFX9-NEXT: [[FCMP1:%[0-9]+]]:_(s1) = G_FCMP floatpred(ord), [[TRUNC1]](s16), [[TRUNC3]] |
| ; GFX9-NEXT: [[C1:%[0-9]+]]:_(s16) = G_FCONSTANT half 0xH7E00 |
| ; GFX9-NEXT: [[BITCAST2:%[0-9]+]]:_(s32) = G_BITCAST [[FMINNUM_IEEE]](<2 x s16>) |
| ; GFX9-NEXT: [[TRUNC4:%[0-9]+]]:_(s16) = G_TRUNC [[BITCAST2]](s32) |
| ; GFX9-NEXT: [[LSHR2:%[0-9]+]]:_(s32) = G_LSHR [[BITCAST2]], [[C]](s32) |
| ; GFX9-NEXT: [[TRUNC5:%[0-9]+]]:_(s16) = G_TRUNC [[LSHR2]](s32) |
| ; GFX9-NEXT: [[SELECT:%[0-9]+]]:_(s16) = G_SELECT [[FCMP]](s1), [[TRUNC4]], [[C1]] |
| ; GFX9-NEXT: [[SELECT1:%[0-9]+]]:_(s16) = G_SELECT [[FCMP1]](s1), [[TRUNC5]], [[C1]] |
| ; GFX9-NEXT: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s16>) = G_BUILD_VECTOR [[SELECT]](s16), [[SELECT1]](s16) |
| ; GFX9-NEXT: [[COPY2:%[0-9]+]]:_(<2 x s16>) = COPY [[BUILD_VECTOR]](<2 x s16>) |
| ; GFX9-NEXT: $vgpr0 = COPY [[COPY2]](<2 x s16>) |
| ; GFX9-NEXT: SI_RETURN implicit $vgpr0 |
| ; |
| ; GFX12-LABEL: name: test_fminimum_v2f16 |
| ; GFX12: liveins: $vgpr0, $vgpr1 |
| ; GFX12-NEXT: {{ $}} |
| ; GFX12-NEXT: [[COPY:%[0-9]+]]:_(<2 x s16>) = COPY $vgpr0 |
| ; GFX12-NEXT: [[COPY1:%[0-9]+]]:_(<2 x s16>) = COPY $vgpr1 |
| ; GFX12-NEXT: [[FMINIMUM:%[0-9]+]]:_(<2 x s16>) = G_FMINIMUM [[COPY]], [[COPY1]] |
| ; GFX12-NEXT: $vgpr0 = COPY [[FMINIMUM]](<2 x s16>) |
| ; GFX12-NEXT: SI_RETURN implicit $vgpr0 |
| %0:_(<2 x s16>) = COPY $vgpr0 |
| %1:_(<2 x s16>) = COPY $vgpr1 |
| %2:_(<2 x s16>) = G_FMINIMUM %0, %1 |
| $vgpr0 = COPY %2(<2 x s16>) |
| SI_RETURN implicit $vgpr0 |
| ... |
| --- |
| # <2 x s32> G_FMINIMUM whose operands are built from ($vgpr0, $vgpr1) and |
| # ($vgpr2, $vgpr3); the result is unmerged back into $vgpr0 and $vgpr1. |
| # Both prefixes expect the vector op to be split into two s32 operations and |
| # the G_BUILD_VECTOR / G_UNMERGE_VALUES to disappear from the output. |
| # GFX9 checks expect a G_FMINNUM_IEEE + G_FCMP floatpred(ord) + G_SELECT |
| # sequence per element, both sharing one `float 0x7FF8000000000000` constant. |
| # GFX12 checks expect two s32 G_FMINIMUM instructions. |
| name: test_fminimum_v2f32 |
| body: | |
| bb.0: |
| liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3 |
| |
| ; GFX9-LABEL: name: test_fminimum_v2f32 |
| ; GFX9: liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3 |
| ; GFX9-NEXT: {{ $}} |
| ; GFX9-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX9-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX9-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY $vgpr2 |
| ; GFX9-NEXT: [[COPY3:%[0-9]+]]:_(s32) = COPY $vgpr3 |
| ; GFX9-NEXT: [[FMINNUM_IEEE:%[0-9]+]]:_(s32) = G_FMINNUM_IEEE [[COPY]], [[COPY2]] |
| ; GFX9-NEXT: [[FCMP:%[0-9]+]]:_(s1) = G_FCMP floatpred(ord), [[COPY]](s32), [[COPY2]] |
| ; GFX9-NEXT: [[C:%[0-9]+]]:_(s32) = G_FCONSTANT float 0x7FF8000000000000 |
| ; GFX9-NEXT: [[SELECT:%[0-9]+]]:_(s32) = G_SELECT [[FCMP]](s1), [[FMINNUM_IEEE]], [[C]] |
| ; GFX9-NEXT: [[COPY4:%[0-9]+]]:_(s32) = COPY [[SELECT]](s32) |
| ; GFX9-NEXT: [[FMINNUM_IEEE1:%[0-9]+]]:_(s32) = G_FMINNUM_IEEE [[COPY1]], [[COPY3]] |
| ; GFX9-NEXT: [[FCMP1:%[0-9]+]]:_(s1) = G_FCMP floatpred(ord), [[COPY1]](s32), [[COPY3]] |
| ; GFX9-NEXT: [[SELECT1:%[0-9]+]]:_(s32) = G_SELECT [[FCMP1]](s1), [[FMINNUM_IEEE1]], [[C]] |
| ; GFX9-NEXT: [[COPY5:%[0-9]+]]:_(s32) = COPY [[SELECT1]](s32) |
| ; GFX9-NEXT: $vgpr0 = COPY [[COPY4]](s32) |
| ; GFX9-NEXT: $vgpr1 = COPY [[COPY5]](s32) |
| ; GFX9-NEXT: SI_RETURN implicit $vgpr0, implicit $vgpr1 |
| ; |
| ; GFX12-LABEL: name: test_fminimum_v2f32 |
| ; GFX12: liveins: $vgpr0, $vgpr1, $vgpr2, $vgpr3 |
| ; GFX12-NEXT: {{ $}} |
| ; GFX12-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX12-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX12-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY $vgpr2 |
| ; GFX12-NEXT: [[COPY3:%[0-9]+]]:_(s32) = COPY $vgpr3 |
| ; GFX12-NEXT: [[FMINIMUM:%[0-9]+]]:_(s32) = G_FMINIMUM [[COPY]], [[COPY2]] |
| ; GFX12-NEXT: [[FMINIMUM1:%[0-9]+]]:_(s32) = G_FMINIMUM [[COPY1]], [[COPY3]] |
| ; GFX12-NEXT: $vgpr0 = COPY [[FMINIMUM]](s32) |
| ; GFX12-NEXT: $vgpr1 = COPY [[FMINIMUM1]](s32) |
| ; GFX12-NEXT: SI_RETURN implicit $vgpr0, implicit $vgpr1 |
| %0:_(s32) = COPY $vgpr0 |
| %1:_(s32) = COPY $vgpr1 |
| %2:_(<2 x s32>) = G_BUILD_VECTOR %0(s32), %1(s32) |
| %3:_(s32) = COPY $vgpr2 |
| %4:_(s32) = COPY $vgpr3 |
| %5:_(<2 x s32>) = G_BUILD_VECTOR %3(s32), %4(s32) |
| %6:_(<2 x s32>) = G_FMINIMUM %2, %5 |
| %7:_(s32), %8:_(s32) = G_UNMERGE_VALUES %6(<2 x s32>) |
| $vgpr0 = COPY %7(s32) |
| $vgpr1 = COPY %8(s32) |
| SI_RETURN implicit $vgpr0, implicit $vgpr1 |
| ... |
| --- |
| # Scalar s32 G_FMINIMUM carrying the `nsz` flag. |
| # GFX9 checks expect the same G_FMINNUM_IEEE / G_FCMP floatpred(ord) / |
| # G_SELECT sequence as the unflagged s32 case; none of the expected |
| # instructions carries `nsz`. |
| # GFX12 checks expect the G_FMINIMUM to remain with its `nsz` flag intact. |
| name: test_fminimum_nsz_f32 |
| body: | |
| bb.0: |
| liveins: $vgpr0, $vgpr1 |
| |
| ; GFX9-LABEL: name: test_fminimum_nsz_f32 |
| ; GFX9: liveins: $vgpr0, $vgpr1 |
| ; GFX9-NEXT: {{ $}} |
| ; GFX9-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX9-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX9-NEXT: [[FMINNUM_IEEE:%[0-9]+]]:_(s32) = G_FMINNUM_IEEE [[COPY]], [[COPY1]] |
| ; GFX9-NEXT: [[FCMP:%[0-9]+]]:_(s1) = G_FCMP floatpred(ord), [[COPY]](s32), [[COPY1]] |
| ; GFX9-NEXT: [[C:%[0-9]+]]:_(s32) = G_FCONSTANT float 0x7FF8000000000000 |
| ; GFX9-NEXT: [[SELECT:%[0-9]+]]:_(s32) = G_SELECT [[FCMP]](s1), [[FMINNUM_IEEE]], [[C]] |
| ; GFX9-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY [[SELECT]](s32) |
| ; GFX9-NEXT: $vgpr0 = COPY [[COPY2]](s32) |
| ; GFX9-NEXT: SI_RETURN implicit $vgpr0 |
| ; |
| ; GFX12-LABEL: name: test_fminimum_nsz_f32 |
| ; GFX12: liveins: $vgpr0, $vgpr1 |
| ; GFX12-NEXT: {{ $}} |
| ; GFX12-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX12-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX12-NEXT: [[FMINIMUM:%[0-9]+]]:_(s32) = nsz G_FMINIMUM [[COPY]], [[COPY1]] |
| ; GFX12-NEXT: $vgpr0 = COPY [[FMINIMUM]](s32) |
| ; GFX12-NEXT: SI_RETURN implicit $vgpr0 |
| %0:_(s32) = COPY $vgpr0 |
| %1:_(s32) = COPY $vgpr1 |
| %2:_(s32) = nsz G_FMINIMUM %0, %1 |
| $vgpr0 = COPY %2(s32) |
| SI_RETURN implicit $vgpr0 |
| ... |
| --- |
| # Scalar s32 G_FMINIMUM carrying the `nnan` flag. |
| # GFX9 checks expect only a G_FMINNUM_IEEE: unlike the unflagged s32 case, |
| # no G_FCMP / G_FCONSTANT / G_SELECT is expected, and the expected |
| # G_FMINNUM_IEEE is printed without `nnan`. |
| # GFX12 checks expect the G_FMINIMUM to remain with its `nnan` flag intact. |
| name: test_fminimum_nnan_f32 |
| body: | |
| bb.0: |
| liveins: $vgpr0, $vgpr1 |
| |
| ; GFX9-LABEL: name: test_fminimum_nnan_f32 |
| ; GFX9: liveins: $vgpr0, $vgpr1 |
| ; GFX9-NEXT: {{ $}} |
| ; GFX9-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX9-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX9-NEXT: [[FMINNUM_IEEE:%[0-9]+]]:_(s32) = G_FMINNUM_IEEE [[COPY]], [[COPY1]] |
| ; GFX9-NEXT: [[COPY2:%[0-9]+]]:_(s32) = COPY [[FMINNUM_IEEE]](s32) |
| ; GFX9-NEXT: $vgpr0 = COPY [[COPY2]](s32) |
| ; GFX9-NEXT: SI_RETURN implicit $vgpr0 |
| ; |
| ; GFX12-LABEL: name: test_fminimum_nnan_f32 |
| ; GFX12: liveins: $vgpr0, $vgpr1 |
| ; GFX12-NEXT: {{ $}} |
| ; GFX12-NEXT: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0 |
| ; GFX12-NEXT: [[COPY1:%[0-9]+]]:_(s32) = COPY $vgpr1 |
| ; GFX12-NEXT: [[FMINIMUM:%[0-9]+]]:_(s32) = nnan G_FMINIMUM [[COPY]], [[COPY1]] |
| ; GFX12-NEXT: $vgpr0 = COPY [[FMINIMUM]](s32) |
| ; GFX12-NEXT: SI_RETURN implicit $vgpr0 |
| %0:_(s32) = COPY $vgpr0 |
| %1:_(s32) = COPY $vgpr1 |
| %2:_(s32) = nnan G_FMINIMUM %0, %1 |
| $vgpr0 = COPY %2(s32) |
| SI_RETURN implicit $vgpr0 |
| ... |
| |