blob: 4df4f8aff56a974506161efdaf77514b1854be3a [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=powerpc64le -mcpu=pwr9 < %s | FileCheck %s
define float @frem32(float %a, float %b) {
; CHECK-LABEL: frem32:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: mflr 0
; CHECK-NEXT: std 0, 16(1)
; CHECK-NEXT: stdu 1, -32(1)
; CHECK-NEXT: .cfi_def_cfa_offset 32
; CHECK-NEXT: .cfi_offset lr, 16
; CHECK-NEXT: bl fmodf
; CHECK-NEXT: nop
; CHECK-NEXT: addi 1, 1, 32
; CHECK-NEXT: ld 0, 16(1)
; CHECK-NEXT: mtlr 0
; CHECK-NEXT: blr
entry:
%rem = frem fast float %a, %b
ret float %rem
}
define double @frem64(double %a, double %b) {
; CHECK-LABEL: frem64:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: mflr 0
; CHECK-NEXT: std 0, 16(1)
; CHECK-NEXT: stdu 1, -32(1)
; CHECK-NEXT: .cfi_def_cfa_offset 32
; CHECK-NEXT: .cfi_offset lr, 16
; CHECK-NEXT: bl fmod
; CHECK-NEXT: nop
; CHECK-NEXT: addi 1, 1, 32
; CHECK-NEXT: ld 0, 16(1)
; CHECK-NEXT: mtlr 0
; CHECK-NEXT: blr
entry:
%rem = frem fast double %a, %b
ret double %rem
}
define <4 x float> @frem4x32(<4 x float> %a, <4 x float> %b) {
; CHECK-LABEL: frem4x32:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: mflr 0
; CHECK-NEXT: std 0, 16(1)
; CHECK-NEXT: stdu 1, -96(1)
; CHECK-NEXT: .cfi_def_cfa_offset 96
; CHECK-NEXT: .cfi_offset lr, 16
; CHECK-NEXT: .cfi_offset v28, -64
; CHECK-NEXT: .cfi_offset v29, -48
; CHECK-NEXT: .cfi_offset v30, -32
; CHECK-NEXT: .cfi_offset v31, -16
; CHECK-NEXT: xxsldwi 0, 34, 34, 3
; CHECK-NEXT: stxv 60, 32(1) # 16-byte Folded Spill
; CHECK-NEXT: xscvspdpn 1, 0
; CHECK-NEXT: xxsldwi 0, 35, 35, 3
; CHECK-NEXT: stxv 61, 48(1) # 16-byte Folded Spill
; CHECK-NEXT: stxv 62, 64(1) # 16-byte Folded Spill
; CHECK-NEXT: stxv 63, 80(1) # 16-byte Folded Spill
; CHECK-NEXT: xscvspdpn 2, 0
; CHECK-NEXT: vmr 31, 3
; CHECK-NEXT: vmr 30, 2
; CHECK-NEXT: bl fmodf
; CHECK-NEXT: nop
; CHECK-NEXT: xxsldwi 0, 62, 62, 1
; CHECK-NEXT: xscpsgndp 61, 1, 1
; CHECK-NEXT: xscvspdpn 1, 0
; CHECK-NEXT: xxsldwi 0, 63, 63, 1
; CHECK-NEXT: xscvspdpn 2, 0
; CHECK-NEXT: bl fmodf
; CHECK-NEXT: nop
; CHECK-NEXT: # kill: def $f1 killed $f1 def $vsl1
; CHECK-NEXT: xxmrghd 0, 1, 61
; CHECK-NEXT: xscvspdpn 1, 62
; CHECK-NEXT: xscvspdpn 2, 63
; CHECK-NEXT: xvcvdpsp 60, 0
; CHECK-NEXT: bl fmodf
; CHECK-NEXT: nop
; CHECK-NEXT: xxswapd 0, 62
; CHECK-NEXT: xscpsgndp 61, 1, 1
; CHECK-NEXT: xscvspdpn 1, 0
; CHECK-NEXT: xxswapd 0, 63
; CHECK-NEXT: xscvspdpn 2, 0
; CHECK-NEXT: bl fmodf
; CHECK-NEXT: nop
; CHECK-NEXT: # kill: def $f1 killed $f1 def $vsl1
; CHECK-NEXT: xxmrghd 0, 61, 1
; CHECK-NEXT: lxv 63, 80(1) # 16-byte Folded Reload
; CHECK-NEXT: lxv 62, 64(1) # 16-byte Folded Reload
; CHECK-NEXT: lxv 61, 48(1) # 16-byte Folded Reload
; CHECK-NEXT: xvcvdpsp 34, 0
; CHECK-NEXT: vmrgew 2, 2, 28
; CHECK-NEXT: lxv 60, 32(1) # 16-byte Folded Reload
; CHECK-NEXT: addi 1, 1, 96
; CHECK-NEXT: ld 0, 16(1)
; CHECK-NEXT: mtlr 0
; CHECK-NEXT: blr
entry:
%rem = frem fast <4 x float> %a, %b
ret <4 x float> %rem
}
define <2 x double> @frem2x64(<2 x double> %a, <2 x double> %b) {
; CHECK-LABEL: frem2x64:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: mflr 0
; CHECK-NEXT: std 0, 16(1)
; CHECK-NEXT: stdu 1, -80(1)
; CHECK-NEXT: .cfi_def_cfa_offset 80
; CHECK-NEXT: .cfi_offset lr, 16
; CHECK-NEXT: .cfi_offset v29, -48
; CHECK-NEXT: .cfi_offset v30, -32
; CHECK-NEXT: .cfi_offset v31, -16
; CHECK-NEXT: stxv 62, 48(1) # 16-byte Folded Spill
; CHECK-NEXT: stxv 63, 64(1) # 16-byte Folded Spill
; CHECK-NEXT: vmr 31, 3
; CHECK-NEXT: xscpsgndp 2, 63, 63
; CHECK-NEXT: vmr 30, 2
; CHECK-NEXT: xscpsgndp 1, 62, 62
; CHECK-NEXT: stxv 61, 32(1) # 16-byte Folded Spill
; CHECK-NEXT: bl fmod
; CHECK-NEXT: nop
; CHECK-NEXT: xscpsgndp 61, 1, 1
; CHECK-NEXT: xxswapd 1, 62
; CHECK-NEXT: xxswapd 2, 63
; CHECK-NEXT: # kill: def $f1 killed $f1 killed $vsl1
; CHECK-NEXT: # kill: def $f2 killed $f2 killed $vsl2
; CHECK-NEXT: bl fmod
; CHECK-NEXT: nop
; CHECK-NEXT: # kill: def $f1 killed $f1 def $vsl1
; CHECK-NEXT: xxmrghd 34, 61, 1
; CHECK-NEXT: lxv 63, 64(1) # 16-byte Folded Reload
; CHECK-NEXT: lxv 62, 48(1) # 16-byte Folded Reload
; CHECK-NEXT: lxv 61, 32(1) # 16-byte Folded Reload
; CHECK-NEXT: addi 1, 1, 80
; CHECK-NEXT: ld 0, 16(1)
; CHECK-NEXT: mtlr 0
; CHECK-NEXT: blr
entry:
%rem = frem fast <2 x double> %a, %b
ret <2 x double> %rem
}