| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc -mtriple=hexagon -hexagon-bit=false < %s | FileCheck %s |
| |
| define bfloat @load_scalar_bf(ptr %addr) { |
| ; CHECK-LABEL: load_scalar_bf: |
| ; CHECK: .cfi_startproc |
| ; CHECK-NEXT: // %bb.0: // %entry |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[REG:r[0-9]+]] = memuh(r0+#0) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: r0 = aslh([[REG]]) |
| ; CHECK-NEXT: jumpr r31 |
| ; CHECK-NEXT: } |
| |
| entry: |
| %0 = load bfloat, ptr %addr, align 2 |
| ret bfloat %0 |
| } |
| |
| define void @store_scalar_bf(bfloat %v, ptr %addr) { |
| ; CHECK-LABEL: store_scalar_bf: |
| ; CHECK: .cfi_startproc |
| ; CHECK-NEXT: // %bb.0: // %entry |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R_A:r[0-9]+]] = ##131071 |
| ; CHECK-NEXT: [[R_B:r[0-9]+]] = ##32768 |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R_C:r[0-9]+]] = ##65535 |
| ; CHECK-NEXT: [[R_D:r[0-9]+]] = asrh(r0) |
| ; CHECK-NEXT: [[R_A]] = and(r0,[[R_A]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[P0:p[0-9]+]] = sfclass(r0,#16) |
| ; CHECK-NEXT: [[R_E:r[0-9]+]] = and(r0,[[R_B]]) |
| ; CHECK-NEXT: [[P1:p[0-9]+]] = cmp.eq([[R_A]],[[R_B]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: r0 = add(r0,[[R_E]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: r0 = asrh(r0) |
| ; CHECK-NEXT: if ([[P1]]) [[R_B]] = and([[R_D]],[[R_C]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: if (![[P1]]) [[R_B]] = and(r0,[[R_C]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: if ([[P0]]) [[R_B]] = ##32767 |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: jumpr r31 |
| ; CHECK-NEXT: memh(r1+#0) = [[R_B]] |
| ; CHECK-NEXT: } |
| |
| entry: |
| store bfloat %v, ptr %addr, align 2 |
| ret void |
| } |
| |
| define bfloat @sum(bfloat %a, bfloat %b) #0 { |
| ; CHECK-LABEL: sum: |
| ; CHECK: .cfi_startproc |
| ; CHECK-NEXT: // %bb.0: // %entry |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R3:r[0-9]+]] = ##32768 |
| ; CHECK-NEXT: [[R4:r[0-9]+]] = ##131071 |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R2:r[0-9]+]] = ##65535 |
| ; CHECK-NEXT: [[R6:r[0-9]+]] = and(r0,[[R3]]) |
| ; CHECK-NEXT: [[R5:r[0-9]+]] = and(r0,[[R4]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R8:r[0-9]+]] = and(r1,[[R3]]) |
| ; CHECK-NEXT: [[R7:r[0-9]+]] = and(r1,[[R4]]) |
| ; CHECK-NEXT: [[R6]] = add(r0,[[R6]]) |
| ; CHECK-NEXT: [[P0:p[0-9]+]] = cmp.eq([[R5]],[[R3]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R5]] = asrh(r0) |
| ; CHECK-NEXT: [[P1:p[0-9]+]] = cmp.eq([[R7]],[[R3]]) |
| ; CHECK-NEXT: [[R7]] = asrh(r1) |
| ; CHECK-NEXT: [[R8]] = add(r1,[[R8]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R6]] = asrh([[R6]]) |
| ; CHECK-NEXT: if ([[P0]]) [[R5]] = and([[R5]],[[R2]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[P0]] = sfclass(r0,#16) |
| ; CHECK-NEXT: if (![[P0]]) [[R5]] = and([[R6]],[[R2]]) |
| ; CHECK-NEXT: [[R6]] = asrh([[R8]]) |
| ; CHECK-NEXT: if ([[P1]]) [[R7]] = and([[R7]],[[R2]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[P1]] = sfclass(r1,#16) |
| ; CHECK-NEXT: [[R0:r[0-9]+]] = #32767 |
| ; CHECK-NEXT: if (![[P1]]) [[R7]] = and([[R6]],[[R2]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: if ([[P0]]) [[R5]] = add([[R0]],#0) |
| ; CHECK-NEXT: if ([[P1]]) [[R7]] = add([[R0]],#0) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R6]] = aslh([[R7]]) |
| ; CHECK-NEXT: [[R5]] = aslh([[R5]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R1:r[0-9]+]] = sfadd([[R5]],[[R6]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R5]] = and([[R1]],[[R3]]) |
| ; CHECK-NEXT: [[R4]] = and([[R1]],[[R4]]) |
| ; CHECK-NEXT: [[R6]] = asrh([[R1]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[P0]] = cmp.eq([[R4]],[[R3]]) |
| ; CHECK-NEXT: [[R5]] = add([[R1]],[[R5]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R3]] = asrh([[R5]]) |
| ; CHECK-NEXT: if ([[P0]]) [[R4]] = and([[R6]],[[R2]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[P0]] = sfclass([[R1]],#16) |
| ; CHECK-NEXT: if (![[P0]]) [[R4]] = and([[R3]],[[R2]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: if ([[P0]]) [[R4]] = add([[R0]],#0) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: r0 = aslh([[R4]]) |
| ; CHECK-NEXT: jumpr r31 |
| ; CHECK-NEXT: } |
| |
| entry: |
| %add = fadd bfloat %a, %b |
| ret bfloat %add |
| } |
| |
| ; Function Attrs: noinline nounwind optnone |
| define dso_local i32 @double_bf16(bfloat %a, bfloat %b) #0 { |
| ; CHECK-LABEL: double_bf16: |
| ; CHECK: .cfi_startproc |
| ; CHECK-NEXT: // %bb.0: // %entry |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[PAIR_A:r[0-9]+:[0-9]+]] = convert_sf2df(r0) |
| ; CHECK-NEXT: [[PAIR_B:r[0-9]+:[0-9]+]] = convert_sf2df(r1) |
| ; CHECK-NEXT: [[SP:r[0-9]+]] = add([[SP]],#-16) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[RESULT:r[0-9]+:[0-9]+]] = dfadd([[PAIR_A]],[[PAIR_B]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: memd([[SP]]+#8) = [[RESULT]] |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[TMP:r[0-9]+]] = convert_df2sf([[RESULT]]) |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[TMP1:r[0-9]+]] = lsr([[TMP]],#16) |
| ; CHECK-NEXT: [[R0:r[0-9]+]] = and([[TMP]],##-65536) |
| ; CHECK-NEXT: memh([[SP]]+#6) = [[TMP1]].new |
| ; CHECK-NEXT: } |
| ; CHECK-NEXT: { |
| ; CHECK-NEXT: [[R0]] = convert_sf2w([[R0]]):chop |
| ; CHECK-NEXT: jumpr r31 |
| ; CHECK-NEXT: [[SP]] = add([[SP]],#16) |
| ; CHECK-NEXT: } |
| |
| entry: |
| %c = alloca double, align 8 |
| %d = alloca bfloat, align 2 |
| %conv = fpext bfloat %a to double |
| %conv1 = fpext bfloat %b to double |
| %add = fadd double %conv, %conv1 |
| store double %add, ptr %c, align 8 |
| %2 = load double, ptr %c, align 8 |
| %conv2 = fptrunc double %2 to bfloat |
| store bfloat %conv2, ptr %d, align 2 |
| %3 = load bfloat, ptr %d, align 2 |
| %conv3 = fptosi bfloat %3 to i32 |
| ret i32 %conv3 |
| } |