blob: 550a2b54b2dea7d24b7139293d394c599f6ad592 [file] [log] [blame] [edit]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=hexagon -hexagon-bit=false < %s | FileCheck %s
define bfloat @load_scalar_bf(ptr %addr) {
; CHECK-LABEL: load_scalar_bf:
; CHECK: .cfi_startproc
; CHECK-NEXT: // %bb.0: // %entry
; CHECK-NEXT: {
; CHECK-NEXT: [[REG:r[0-9]+]] = memuh(r0+#0)
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: r0 = aslh([[REG]])
; CHECK-NEXT: jumpr r31
; CHECK-NEXT: }
entry:
%0 = load bfloat, ptr %addr, align 2
ret bfloat %0
}
define void @store_scalar_bf(bfloat %v, ptr %addr) {
; CHECK-LABEL: store_scalar_bf:
; CHECK: .cfi_startproc
; CHECK-NEXT: // %bb.0: // %entry
; CHECK-NEXT: {
; CHECK-NEXT: [[R_A:r[0-9]+]] = ##131071
; CHECK-NEXT: [[R_B:r[0-9]+]] = ##32768
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R_C:r[0-9]+]] = ##65535
; CHECK-NEXT: [[R_D:r[0-9]+]] = asrh(r0)
; CHECK-NEXT: [[R_A]] = and(r0,[[R_A]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[P0:p[0-9]+]] = sfclass(r0,#16)
; CHECK-NEXT: [[R_E:r[0-9]+]] = and(r0,[[R_B]])
; CHECK-NEXT: [[P1:p[0-9]+]] = cmp.eq([[R_A]],[[R_B]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: r0 = add(r0,[[R_E]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: r0 = asrh(r0)
; CHECK-NEXT: if ([[P1]]) [[R_B]] = and([[R_D]],[[R_C]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: if (![[P1]]) [[R_B]] = and(r0,[[R_C]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: if ([[P0]]) [[R_B]] = ##32767
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: jumpr r31
; CHECK-NEXT: memh(r1+#0) = [[R_B]]
; CHECK-NEXT: }
entry:
store bfloat %v, ptr %addr, align 2
ret void
}
define bfloat @sum(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: sum:
; CHECK: .cfi_startproc
; CHECK-NEXT: // %bb.0: // %entry
; CHECK-NEXT: {
; CHECK-NEXT: [[R3:r[0-9]+]] = ##32768
; CHECK-NEXT: [[R4:r[0-9]+]] = ##131071
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R2:r[0-9]+]] = ##65535
; CHECK-NEXT: [[R6:r[0-9]+]] = and(r0,[[R3]])
; CHECK-NEXT: [[R5:r[0-9]+]] = and(r0,[[R4]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R8:r[0-9]+]] = and(r1,[[R3]])
; CHECK-NEXT: [[R7:r[0-9]+]] = and(r1,[[R4]])
; CHECK-NEXT: [[R6]] = add(r0,[[R6]])
; CHECK-NEXT: [[P0:p[0-9]+]] = cmp.eq([[R5]],[[R3]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R5]] = asrh(r0)
; CHECK-NEXT: [[P1:p[0-9]+]] = cmp.eq([[R7]],[[R3]])
; CHECK-NEXT: [[R7]] = asrh(r1)
; CHECK-NEXT: [[R8]] = add(r1,[[R8]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R6]] = asrh([[R6]])
; CHECK-NEXT: if ([[P0]]) [[R5]] = and([[R5]],[[R2]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[P0]] = sfclass(r0,#16)
; CHECK-NEXT: if (![[P0]]) [[R5]] = and([[R6]],[[R2]])
; CHECK-NEXT: [[R6]] = asrh([[R8]])
; CHECK-NEXT: if ([[P1]]) [[R7]] = and([[R7]],[[R2]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[P1]] = sfclass(r1,#16)
; CHECK-NEXT: [[R0:r[0-9]+]] = #32767
; CHECK-NEXT: if (![[P1]]) [[R7]] = and([[R6]],[[R2]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: if ([[P0]]) [[R5]] = add([[R0]],#0)
; CHECK-NEXT: if ([[P1]]) [[R7]] = add([[R0]],#0)
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R6]] = aslh([[R7]])
; CHECK-NEXT: [[R5]] = aslh([[R5]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R1:r[0-9]+]] = sfadd([[R5]],[[R6]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R5]] = and([[R1]],[[R3]])
; CHECK-NEXT: [[R4]] = and([[R1]],[[R4]])
; CHECK-NEXT: [[R6]] = asrh([[R1]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[P0]] = cmp.eq([[R4]],[[R3]])
; CHECK-NEXT: [[R5]] = add([[R1]],[[R5]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R3]] = asrh([[R5]])
; CHECK-NEXT: if ([[P0]]) [[R4]] = and([[R6]],[[R2]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[P0]] = sfclass([[R1]],#16)
; CHECK-NEXT: if (![[P0]]) [[R4]] = and([[R3]],[[R2]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: if ([[P0]]) [[R4]] = add([[R0]],#0)
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: r0 = aslh([[R4]])
; CHECK-NEXT: jumpr r31
; CHECK-NEXT: }
entry:
%add = fadd bfloat %a, %b
ret bfloat %add
}
; Function Attrs: noinline nounwind optnone
define dso_local i32 @double_bf16(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: double_bf16:
; CHECK: .cfi_startproc
; CHECK-NEXT: // %bb.0: // %entry
; CHECK-NEXT: {
; CHECK-NEXT: [[PAIR_A:r[0-9]+:[0-9]+]] = convert_sf2df(r0)
; CHECK-NEXT: [[PAIR_B:r[0-9]+:[0-9]+]] = convert_sf2df(r1)
; CHECK-NEXT: [[SP:r[0-9]+]] = add([[SP]],#-16)
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[RESULT:r[0-9]+:[0-9]+]] = dfadd([[PAIR_A]],[[PAIR_B]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: memd([[SP]]+#8) = [[RESULT]]
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[TMP:r[0-9]+]] = convert_df2sf([[RESULT]])
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[TMP1:r[0-9]+]] = lsr([[TMP]],#16)
; CHECK-NEXT: [[R0:r[0-9]+]] = and([[TMP]],##-65536)
; CHECK-NEXT: memh([[SP]]+#6) = [[TMP1]].new
; CHECK-NEXT: }
; CHECK-NEXT: {
; CHECK-NEXT: [[R0]] = convert_sf2w([[R0]]):chop
; CHECK-NEXT: jumpr r31
; CHECK-NEXT: [[SP]] = add([[SP]],#16)
; CHECK-NEXT: }
entry:
%c = alloca double, align 8
%d = alloca bfloat, align 2
%conv = fpext bfloat %a to double
%conv1 = fpext bfloat %b to double
%add = fadd double %conv, %conv1
store double %add, ptr %c, align 8
%2 = load double, ptr %c, align 8
%conv2 = fptrunc double %2 to bfloat
store bfloat %conv2, ptr %d, align 2
%3 = load bfloat, ptr %d, align 2
%conv3 = fptosi bfloat %3 to i32
ret i32 %conv3
}