; blob: d1d7d92adc05ae3cdc7d99fe5ad7ccf64aa441b1 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
; RUN: llc -mtriple=aarch64-gnu-linux < %s | FileCheck -check-prefixes=CHECK %s
; Scalar half case: calls @llvm.sincospi.f16 and returns both struct elements.
; The expected code extends the argument to single precision (fcvt s0, h0),
; makes one call to sincospif with two stack addresses in x0/x1 (sp+12 and
; sp+8), reloads both stored floats with a single ldp, and narrows each one
; back to half precision before returning.
define { half, half } @test_sincospi_f16(half %a) {
; CHECK-LABEL: test_sincospi_f16:
; CHECK: // %bb.0:
; CHECK-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 16
; CHECK-NEXT: .cfi_offset w30, -16
; CHECK-NEXT: fcvt s0, h0
; CHECK-NEXT: add x0, sp, #12
; CHECK-NEXT: add x1, sp, #8
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldp s1, s0, [sp, #8]
; CHECK-NEXT: fcvt h0, s0
; CHECK-NEXT: fcvt h1, s1
; CHECK-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-NEXT: ret
%result = call { half, half } @llvm.sincospi.f16(half %a)
ret { half, half } %result
}
; Same intrinsic call as the plain f16 test, but only element 0 of the returned
; struct is used. The expected code still calls sincospif with both stack
; addresses, then reloads only the slot whose address was passed in x0
; (sp+12) and narrows that value to half precision.
define half @test_sincospi_f16_only_use_sin(half %a) {
; CHECK-LABEL: test_sincospi_f16_only_use_sin:
; CHECK: // %bb.0:
; CHECK-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 16
; CHECK-NEXT: .cfi_offset w30, -16
; CHECK-NEXT: fcvt s0, h0
; CHECK-NEXT: add x0, sp, #12
; CHECK-NEXT: add x1, sp, #8
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldr s0, [sp, #12]
; CHECK-NEXT: fcvt h0, s0
; CHECK-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-NEXT: ret
%result = call { half, half } @llvm.sincospi.f16(half %a)
%result.0 = extractvalue { half, half } %result, 0
ret half %result.0
}
; Same intrinsic call as the plain f16 test, but only element 1 of the returned
; struct is used. The expected code still calls sincospif with both stack
; addresses, then reloads only the slot whose address was passed in x1
; (sp+8) and narrows that value to half precision.
define half @test_sincospi_f16_only_use_cos(half %a) {
; CHECK-LABEL: test_sincospi_f16_only_use_cos:
; CHECK: // %bb.0:
; CHECK-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 16
; CHECK-NEXT: .cfi_offset w30, -16
; CHECK-NEXT: fcvt s0, h0
; CHECK-NEXT: add x0, sp, #12
; CHECK-NEXT: add x1, sp, #8
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldr s0, [sp, #8]
; CHECK-NEXT: fcvt h0, s0
; CHECK-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-NEXT: ret
%result = call { half, half } @llvm.sincospi.f16(half %a)
%result.1 = extractvalue { half, half } %result, 1
ret half %result.1
}
; <2 x half> case. The expected code spills the input as a full q register and
; makes four scalar sincospif calls, one each for half lanes 1, 0, 2 and 3
; (in that order), every call extending its lane to single precision first and
; using its own pair of stack slots. After the last call the eight stored
; floats are reloaded, narrowed to half precision and inserted lane by lane:
; values from the x0 slots go into v0 and values from the x1 slots into v1.
; NOTE(review): four calls for a two-element vector presumably reflects the
; operand being widened to four half lanes during legalization - confirm.
define { <2 x half>, <2 x half> } @test_sincospi_v2f16(<2 x half> %a) {
; CHECK-LABEL: test_sincospi_v2f16:
; CHECK: // %bb.0:
; CHECK-NEXT: sub sp, sp, #64
; CHECK-NEXT: str x30, [sp, #48] // 8-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 64
; CHECK-NEXT: .cfi_offset w30, -16
; CHECK-NEXT: // kill: def $d0 killed $d0 def $q0
; CHECK-NEXT: mov h1, v0.h[1]
; CHECK-NEXT: str q0, [sp] // 16-byte Folded Spill
; CHECK-NEXT: add x0, sp, #36
; CHECK-NEXT: add x1, sp, #32
; CHECK-NEXT: fcvt s0, h1
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldr q0, [sp] // 16-byte Folded Reload
; CHECK-NEXT: add x0, sp, #28
; CHECK-NEXT: add x1, sp, #24
; CHECK-NEXT: fcvt s0, h0
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldr q0, [sp] // 16-byte Folded Reload
; CHECK-NEXT: add x0, sp, #44
; CHECK-NEXT: add x1, sp, #40
; CHECK-NEXT: mov h0, v0.h[2]
; CHECK-NEXT: fcvt s0, h0
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldr q0, [sp] // 16-byte Folded Reload
; CHECK-NEXT: add x0, sp, #60
; CHECK-NEXT: add x1, sp, #56
; CHECK-NEXT: mov h0, v0.h[3]
; CHECK-NEXT: fcvt s0, h0
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldp s2, s0, [sp, #32]
; CHECK-NEXT: ldr x30, [sp, #48] // 8-byte Folded Reload
; CHECK-NEXT: ldp s3, s1, [sp, #24]
; CHECK-NEXT: fcvt h4, s0
; CHECK-NEXT: fcvt h2, s2
; CHECK-NEXT: fcvt h0, s1
; CHECK-NEXT: fcvt h1, s3
; CHECK-NEXT: ldp s5, s3, [sp, #40]
; CHECK-NEXT: fcvt h3, s3
; CHECK-NEXT: mov v0.h[1], v4.h[0]
; CHECK-NEXT: fcvt h4, s5
; CHECK-NEXT: mov v1.h[1], v2.h[0]
; CHECK-NEXT: ldp s5, s2, [sp, #56]
; CHECK-NEXT: mov v0.h[2], v3.h[0]
; CHECK-NEXT: fcvt h2, s2
; CHECK-NEXT: fcvt h3, s5
; CHECK-NEXT: mov v1.h[2], v4.h[0]
; CHECK-NEXT: mov v0.h[3], v2.h[0]
; CHECK-NEXT: mov v1.h[3], v3.h[0]
; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
; CHECK-NEXT: // kill: def $d1 killed $d1 killed $q1
; CHECK-NEXT: add sp, sp, #64
; CHECK-NEXT: ret
%result = call { <2 x half>, <2 x half> } @llvm.sincospi.v2f16(<2 x half> %a)
ret { <2 x half>, <2 x half> } %result
}
; Scalar float case: calls @llvm.sincospi.f32 and returns both struct elements.
; The expected code needs no conversions: one call to sincospif with stack
; addresses sp+12 (x0) and sp+8 (x1), then a single ldp that reloads the two
; stored floats into s1 (from sp+8) and s0 (from sp+12).
define { float, float } @test_sincospi_f32(float %a) {
; CHECK-LABEL: test_sincospi_f32:
; CHECK: // %bb.0:
; CHECK-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 16
; CHECK-NEXT: .cfi_offset w30, -16
; CHECK-NEXT: add x0, sp, #12
; CHECK-NEXT: add x1, sp, #8
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldp s1, s0, [sp, #8]
; CHECK-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-NEXT: ret
%result = call { float, float } @llvm.sincospi.f32(float %a)
ret { float, float } %result
}
; <3 x float> case. The expected code spills the input vector and makes three
; scalar sincospif calls, for lanes 0, 1 and 2, each with its own pair of stack
; slots. The slot addresses for lanes 1 and 2 are also kept in x19-x22 (which
; are saved on entry and restored before returning), so that after the final
; call the lane-0 results are reloaded with ldp and the remaining results are
; inserted straight from memory with ld1 lane loads into v0 and v1.
define { <3 x float>, <3 x float> } @test_sincospi_v3f32(<3 x float> %a) {
; CHECK-LABEL: test_sincospi_v3f32:
; CHECK: // %bb.0:
; CHECK-NEXT: sub sp, sp, #80
; CHECK-NEXT: str x30, [sp, #32] // 8-byte Folded Spill
; CHECK-NEXT: stp x22, x21, [sp, #48] // 16-byte Folded Spill
; CHECK-NEXT: stp x20, x19, [sp, #64] // 16-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 80
; CHECK-NEXT: .cfi_offset w19, -8
; CHECK-NEXT: .cfi_offset w20, -16
; CHECK-NEXT: .cfi_offset w21, -24
; CHECK-NEXT: .cfi_offset w22, -32
; CHECK-NEXT: .cfi_offset w30, -48
; CHECK-NEXT: add x0, sp, #20
; CHECK-NEXT: add x1, sp, #16
; CHECK-NEXT: str q0, [sp] // 16-byte Folded Spill
; CHECK-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldr q0, [sp] // 16-byte Folded Reload
; CHECK-NEXT: add x0, sp, #28
; CHECK-NEXT: add x1, sp, #24
; CHECK-NEXT: add x19, sp, #28
; CHECK-NEXT: add x20, sp, #24
; CHECK-NEXT: mov s0, v0.s[1]
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldr q0, [sp] // 16-byte Folded Reload
; CHECK-NEXT: add x0, sp, #44
; CHECK-NEXT: add x1, sp, #40
; CHECK-NEXT: add x21, sp, #44
; CHECK-NEXT: add x22, sp, #40
; CHECK-NEXT: mov s0, v0.s[2]
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldp s1, s0, [sp, #16]
; CHECK-NEXT: ldr x30, [sp, #32] // 8-byte Folded Reload
; CHECK-NEXT: ld1 { v0.s }[1], [x19]
; CHECK-NEXT: ld1 { v1.s }[1], [x20]
; CHECK-NEXT: ldp x20, x19, [sp, #64] // 16-byte Folded Reload
; CHECK-NEXT: ld1 { v0.s }[2], [x21]
; CHECK-NEXT: ld1 { v1.s }[2], [x22]
; CHECK-NEXT: ldp x22, x21, [sp, #48] // 16-byte Folded Reload
; CHECK-NEXT: add sp, sp, #80
; CHECK-NEXT: ret
%result = call { <3 x float>, <3 x float> } @llvm.sincospi.v3f32(<3 x float> %a)
ret { <3 x float>, <3 x float> } %result
}
; <2 x float> case. The expected code spills the input as a full q register and
; makes two scalar sincospif calls, for lane 0 (slots sp+44 / sp+40) and lane 1
; (slots sp+28 / sp+24). The lane-1 slot addresses are also kept in x19/x20
; (saved on entry, restored before returning); after the second call the
; lane-0 results are reloaded with ldp and the lane-1 results are inserted
; from memory with ld1 lane loads into v0 and v1.
define { <2 x float>, <2 x float> } @test_sincospi_v2f32(<2 x float> %a) {
; CHECK-LABEL: test_sincospi_v2f32:
; CHECK: // %bb.0:
; CHECK-NEXT: sub sp, sp, #64
; CHECK-NEXT: str x30, [sp, #32] // 8-byte Folded Spill
; CHECK-NEXT: stp x20, x19, [sp, #48] // 16-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 64
; CHECK-NEXT: .cfi_offset w19, -8
; CHECK-NEXT: .cfi_offset w20, -16
; CHECK-NEXT: .cfi_offset w30, -32
; CHECK-NEXT: // kill: def $d0 killed $d0 def $q0
; CHECK-NEXT: add x0, sp, #44
; CHECK-NEXT: add x1, sp, #40
; CHECK-NEXT: str q0, [sp] // 16-byte Folded Spill
; CHECK-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldr q0, [sp] // 16-byte Folded Reload
; CHECK-NEXT: add x0, sp, #28
; CHECK-NEXT: add x1, sp, #24
; CHECK-NEXT: add x19, sp, #28
; CHECK-NEXT: add x20, sp, #24
; CHECK-NEXT: mov s0, v0.s[1]
; CHECK-NEXT: bl sincospif
; CHECK-NEXT: ldp s1, s0, [sp, #40]
; CHECK-NEXT: ldr x30, [sp, #32] // 8-byte Folded Reload
; CHECK-NEXT: ld1 { v0.s }[1], [x19]
; CHECK-NEXT: ld1 { v1.s }[1], [x20]
; CHECK-NEXT: ldp x20, x19, [sp, #48] // 16-byte Folded Reload
; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
; CHECK-NEXT: // kill: def $d1 killed $d1 killed $q1
; CHECK-NEXT: add sp, sp, #64
; CHECK-NEXT: ret
%result = call { <2 x float>, <2 x float> } @llvm.sincospi.v2f32(<2 x float> %a)
ret { <2 x float>, <2 x float> } %result
}
; Scalar double case: calls @llvm.sincospi.f64 and returns both struct
; elements. The expected code calls sincospi (no "f" suffix) with stack
; addresses sp+24 (x0) and sp+8 (x1), then reloads the two stored doubles with
; separate ldr instructions into d0 (from sp+24) and d1 (from sp+8).
define { double, double } @test_sincospi_f64(double %a) {
; CHECK-LABEL: test_sincospi_f64:
; CHECK: // %bb.0:
; CHECK-NEXT: sub sp, sp, #32
; CHECK-NEXT: str x30, [sp, #16] // 8-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 32
; CHECK-NEXT: .cfi_offset w30, -16
; CHECK-NEXT: add x0, sp, #24
; CHECK-NEXT: add x1, sp, #8
; CHECK-NEXT: bl sincospi
; CHECK-NEXT: ldr d0, [sp, #24]
; CHECK-NEXT: ldr d1, [sp, #8]
; CHECK-NEXT: ldr x30, [sp, #16] // 8-byte Folded Reload
; CHECK-NEXT: add sp, sp, #32
; CHECK-NEXT: ret
%result = call { double, double } @llvm.sincospi.f64(double %a)
ret { double, double } %result
}
; <2 x double> case. The expected code spills the input vector and makes two
; scalar sincospi calls, for lane 0 (slots sp+56 / sp+40) and lane 1 (slots
; sp+32 / sp+24). The lane-1 slot addresses are also kept in x19/x20 (saved on
; entry, restored before returning); after the second call the lane-0 results
; are reloaded with ldr into d0/d1 and the lane-1 results are inserted from
; memory with ld1 lane loads into v0 and v1.
define { <2 x double>, <2 x double> } @test_sincospi_v2f64(<2 x double> %a) {
; CHECK-LABEL: test_sincospi_v2f64:
; CHECK: // %bb.0:
; CHECK-NEXT: sub sp, sp, #80
; CHECK-NEXT: str x30, [sp, #48] // 8-byte Folded Spill
; CHECK-NEXT: stp x20, x19, [sp, #64] // 16-byte Folded Spill
; CHECK-NEXT: .cfi_def_cfa_offset 80
; CHECK-NEXT: .cfi_offset w19, -8
; CHECK-NEXT: .cfi_offset w20, -16
; CHECK-NEXT: .cfi_offset w30, -32
; CHECK-NEXT: add x0, sp, #56
; CHECK-NEXT: add x1, sp, #40
; CHECK-NEXT: str q0, [sp] // 16-byte Folded Spill
; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
; CHECK-NEXT: bl sincospi
; CHECK-NEXT: ldr q0, [sp] // 16-byte Folded Reload
; CHECK-NEXT: add x0, sp, #32
; CHECK-NEXT: add x1, sp, #24
; CHECK-NEXT: add x19, sp, #32
; CHECK-NEXT: add x20, sp, #24
; CHECK-NEXT: mov d0, v0.d[1]
; CHECK-NEXT: bl sincospi
; CHECK-NEXT: ldr d0, [sp, #56]
; CHECK-NEXT: ldr d1, [sp, #40]
; CHECK-NEXT: ldr x30, [sp, #48] // 8-byte Folded Reload
; CHECK-NEXT: ld1 { v0.d }[1], [x19]
; CHECK-NEXT: ld1 { v1.d }[1], [x20]
; CHECK-NEXT: ldp x20, x19, [sp, #64] // 16-byte Folded Reload
; CHECK-NEXT: add sp, sp, #80
; CHECK-NEXT: ret
%result = call { <2 x double>, <2 x double> } @llvm.sincospi.v2f64(<2 x double> %a)
ret { <2 x double>, <2 x double> } %result
}