blob: 7998fb6b5eaacf1b828357961d04691a01c90327 [file] [log] [blame] [edit]
//===---- CIRGenBuiltinAArch64.cpp - Emit CIR for AArch64 builtins --------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This contains code to emit ARM64 Builtin calls as CIR or a function call
// to be later resolved.
//
//===----------------------------------------------------------------------===//
#include "CIRGenBuilder.h"
#include "CIRGenFunction.h"
#include "clang/Basic/TargetBuiltins.h"
#include "clang/CIR/MissingFeatures.h"
// TODO(cir): once all builtins are covered, decide whether we still
// need to use LLVM intrinsics or if there's a better approach to follow. Right
// now the intrinsics are reused to make it convenient to encode all thousands
// of them and passing down to LLVM lowering.
#include "llvm/IR/Intrinsics.h"
#include "llvm/IR/IntrinsicsAArch64.h"
#include "mlir/IR/Value.h"
#include "clang/AST/GlobalDecl.h"
#include "clang/Basic/Builtins.h"
using namespace clang;
using namespace clang::CIRGen;
using namespace llvm;
/// Create a cir::LLVMIntrinsicCallOp and hand back its result.
///
/// \param builder  Builder used to create the op.
/// \param loc      Location attached to the new op.
/// \param str      Intrinsic name, stored on the op as a string attribute.
/// \param resTy    Result type of the call.
/// \param op       Remaining arguments, perfectly forwarded to
///                 cir::LLVMIntrinsicCallOp::create (the call operands).
/// \returns The result value of the created op.
template <typename... Operands>
static mlir::Value emitIntrinsicCallOp(CIRGenBuilderTy &builder,
                                       mlir::Location loc, const StringRef str,
                                       const mlir::Type &resTy,
                                       Operands &&...op) {
  auto nameAttr = builder.getStringAttr(str);
  auto callOp = cir::LLVMIntrinsicCallOp::create(
      builder, loc, nameAttr, resTy, std::forward<Operands>(op)...);
  return callOp.getResult();
}
/// Generate `vscale * scalingFactor`.
///
/// Emits a call to the "vscale" intrinsic with result type \p cirTy and
/// multiplies it, via the builder's createNUWAMul helper, by \p scalingFactor
/// materialised with getUInt64.
///
/// The builder is taken by reference, matching emitIntrinsicCallOp, so that a
/// call does not copy the whole builder object.
///
/// \param loc            Location attached to the emitted operations.
/// \param builder        Builder used to create the operations.
/// \param cirTy          Result type of the "vscale" intrinsic call.
/// \param scalingFactor  Constant multiplier applied to vscale.
/// \returns The value of the multiplication.
static mlir::Value genVscaleTimesFactor(mlir::Location loc,
                                        CIRGenBuilderTy &builder,
                                        mlir::Type cirTy,
                                        int32_t scalingFactor) {
  mlir::Value vscale = emitIntrinsicCallOp(builder, loc, "vscale", cirTy);
  return builder.createNUWAMul(loc, vscale,
                               builder.getUInt64(scalingFactor, loc));
}
// Memo flag for the sortedness check of aarch64SVEIntrinsicMap. It is passed by
// reference to findARMVectorIntrinsicInMap, which (when NDEBUG is not defined)
// asserts that the table is sorted on the first lookup and then sets this flag
// so the check is not repeated.
static bool aarch64SVEIntrinsicsProvenSorted = false;
namespace {
/// One row of an AArch64 builtin lookup table.
///
/// Rows are ordered by builtinID alone; both comparison operators below exist
/// so the table can be sorted-checked (row vs. row) and binary-searched with a
/// bare builtin ID (row vs. ID).
struct AArch64BuiltinInfo {
  unsigned builtinID;     // Clang builtin ID; the only ordering key.
  unsigned llvmIntrinsic; // LLVM intrinsic ID; 0 when the row records none.
  uint64_t typeModifier;  // Raw flag bits; wrapped in SVETypeFlags by users.

  /// Row-vs-row ordering by builtin ID.
  bool operator<(const AArch64BuiltinInfo &other) const {
    return builtinID < other.builtinID;
  }

  /// Row-vs-ID ordering, used when searching for a specific builtin ID.
  bool operator<(unsigned id) const { return builtinID < id; }
};
} // end anonymous namespace
// Row builders for aarch64SVEIntrinsicMap (presumably the spellings used by the
// entries in arm_sve_builtin_cg.inc -- confirm against the generated file).
// SVEMAP1 produces a row that names an LLVM intrinsic for the builtin.
#define SVEMAP1(NameBase, llvmIntrinsic, TypeModifier) \
{SVE::BI__builtin_sve_##NameBase, Intrinsic::llvmIntrinsic, TypeModifier}
// SVEMAP2 produces a row with no LLVM intrinsic (llvmIntrinsic == 0).
#define SVEMAP2(NameBase, TypeModifier) \
{SVE::BI__builtin_sve_##NameBase, 0, TypeModifier}
// SVE builtin table, populated from the included .inc file. Lookups go through
// findARMVectorIntrinsicInMap, which binary-searches by builtinID and asserts
// (when NDEBUG is not defined) that the rows are sorted.
static const AArch64BuiltinInfo aarch64SVEIntrinsicMap[] = {
#define GET_SVE_LLVM_INTRINSIC_MAP
#include "clang/Basic/arm_sve_builtin_cg.inc"
#undef GET_SVE_LLVM_INTRINSIC_MAP
};
/// Look up \p builtinID in \p intrinsicMap, which must be sorted by builtinID.
///
/// \param intrinsicMap     Table to search.
/// \param builtinID        Builtin ID to find.
/// \param mapProvenSorted  Caller-owned memo flag. When NDEBUG is not defined
///                         and the flag is false, the table's sortedness is
///                         asserted and the flag is set to true.
/// \returns A pointer to the matching row, or nullptr if there is none.
static const AArch64BuiltinInfo *
findARMVectorIntrinsicInMap(ArrayRef<AArch64BuiltinInfo> intrinsicMap,
                            unsigned builtinID, bool &mapProvenSorted) {
#ifndef NDEBUG
  // Validate the ordering only once per table; the flag remembers the result.
  if (!mapProvenSorted) {
    assert(llvm::is_sorted(intrinsicMap));
    mapProvenSorted = true;
  }
#endif

  // First row whose builtinID is not less than the one requested.
  const AArch64BuiltinInfo *candidate =
      llvm::lower_bound(intrinsicMap, builtinID);
  const bool isMatch =
      candidate != intrinsicMap.end() && candidate->builtinID == builtinID;
  return isMatch ? candidate : nullptr;
}
bool CIRGenFunction::getAArch64SVEProcessedOperands(
unsigned builtinID, const CallExpr *expr, SmallVectorImpl<mlir::Value> &ops,
SVETypeFlags typeFlags) {
// Find out if any arguments are required to be integer constant expressions.
unsigned iceArguments = 0;
ASTContext::GetBuiltinTypeError error;
getContext().GetBuiltinType(builtinID, error, &iceArguments);
assert(error == ASTContext::GE_None && "Should not codegen an error");
for (unsigned i = 0, e = expr->getNumArgs(); i != e; i++) {
bool isIce = iceArguments & (1 << i);
mlir::Value arg = emitScalarExpr(expr->getArg(i));
if (isIce) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
}
// FIXME: Handle types like svint16x2_t, which are currently incorrectly
// converted to i32. These should be treated as structs and unpacked.
ops.push_back(arg);
}
return true;
}
std::optional<mlir::Value>
CIRGenFunction::emitAArch64SVEBuiltinExpr(unsigned builtinID,
const CallExpr *expr) {
if (builtinID >= SVE::BI__builtin_sve_reinterpret_s8_s8 &&
builtinID <= SVE::BI__builtin_sve_reinterpret_f64_f64_x4) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
assert(!cir::MissingFeatures::aarch64SVEIntrinsics());
auto *builtinIntrInfo = findARMVectorIntrinsicInMap(
aarch64SVEIntrinsicMap, builtinID, aarch64SVEIntrinsicsProvenSorted);
// The operands of the builtin call
llvm::SmallVector<mlir::Value> ops;
SVETypeFlags typeFlags(builtinIntrInfo->typeModifier);
if (!CIRGenFunction::getAArch64SVEProcessedOperands(builtinID, expr, ops,
typeFlags))
return mlir::Value{};
if (typeFlags.isLoad() || typeFlags.isStore() || typeFlags.isGatherLoad() ||
typeFlags.isScatterStore() || typeFlags.isPrefetch() ||
typeFlags.isGatherPrefetch() || typeFlags.isStructLoad() ||
typeFlags.isStructStore() || typeFlags.isTupleSet() ||
typeFlags.isTupleGet() || typeFlags.isTupleCreate() ||
typeFlags.isUndef())
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
mlir::Location loc = getLoc(expr->getExprLoc());
if (builtinIntrInfo->llvmIntrinsic != 0) {
std::string llvmIntrName(Intrinsic::getBaseName(
(llvm::Intrinsic::ID)builtinIntrInfo->llvmIntrinsic));
llvmIntrName.erase(0, /*std::strlen(".llvm")=*/5);
return emitIntrinsicCallOp(builder, loc, llvmIntrName,
convertType(expr->getType()),
mlir::ValueRange{ops});
}
switch (builtinID) {
default:
return std::nullopt;
case SVE::BI__builtin_sve_svreinterpret_b:
case SVE::BI__builtin_sve_svreinterpret_c:
case SVE::BI__builtin_sve_svpsel_lane_b8:
case SVE::BI__builtin_sve_svpsel_lane_b16:
case SVE::BI__builtin_sve_svpsel_lane_b32:
case SVE::BI__builtin_sve_svpsel_lane_b64:
case SVE::BI__builtin_sve_svpsel_lane_c8:
case SVE::BI__builtin_sve_svpsel_lane_c16:
case SVE::BI__builtin_sve_svpsel_lane_c32:
case SVE::BI__builtin_sve_svpsel_lane_c64:
case SVE::BI__builtin_sve_svmov_b_z:
case SVE::BI__builtin_sve_svnot_b_z:
case SVE::BI__builtin_sve_svmovlb_u16:
case SVE::BI__builtin_sve_svmovlb_u32:
case SVE::BI__builtin_sve_svmovlb_u64:
case SVE::BI__builtin_sve_svmovlb_s16:
case SVE::BI__builtin_sve_svmovlb_s32:
case SVE::BI__builtin_sve_svmovlb_s64:
case SVE::BI__builtin_sve_svmovlt_u16:
case SVE::BI__builtin_sve_svmovlt_u32:
case SVE::BI__builtin_sve_svmovlt_u64:
case SVE::BI__builtin_sve_svmovlt_s16:
case SVE::BI__builtin_sve_svmovlt_s32:
case SVE::BI__builtin_sve_svmovlt_s64:
case SVE::BI__builtin_sve_svpmullt_u16:
case SVE::BI__builtin_sve_svpmullt_u64:
case SVE::BI__builtin_sve_svpmullt_n_u16:
case SVE::BI__builtin_sve_svpmullt_n_u64:
case SVE::BI__builtin_sve_svpmullb_u16:
case SVE::BI__builtin_sve_svpmullb_u64:
case SVE::BI__builtin_sve_svpmullb_n_u16:
case SVE::BI__builtin_sve_svpmullb_n_u64:
case SVE::BI__builtin_sve_svdup_n_b8:
case SVE::BI__builtin_sve_svdup_n_b16:
case SVE::BI__builtin_sve_svdup_n_b32:
case SVE::BI__builtin_sve_svdup_n_b64:
case SVE::BI__builtin_sve_svdupq_n_b8:
case SVE::BI__builtin_sve_svdupq_n_b16:
case SVE::BI__builtin_sve_svdupq_n_b32:
case SVE::BI__builtin_sve_svdupq_n_b64:
case SVE::BI__builtin_sve_svdupq_n_u8:
case SVE::BI__builtin_sve_svdupq_n_s8:
case SVE::BI__builtin_sve_svdupq_n_u64:
case SVE::BI__builtin_sve_svdupq_n_f64:
case SVE::BI__builtin_sve_svdupq_n_s64:
case SVE::BI__builtin_sve_svdupq_n_u16:
case SVE::BI__builtin_sve_svdupq_n_f16:
case SVE::BI__builtin_sve_svdupq_n_bf16:
case SVE::BI__builtin_sve_svdupq_n_s16:
case SVE::BI__builtin_sve_svdupq_n_u32:
case SVE::BI__builtin_sve_svdupq_n_f32:
case SVE::BI__builtin_sve_svdupq_n_s32:
case SVE::BI__builtin_sve_svpfalse_b:
case SVE::BI__builtin_sve_svpfalse_c:
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
case SVE::BI__builtin_sve_svlen_u8:
case SVE::BI__builtin_sve_svlen_s8:
return genVscaleTimesFactor(loc, builder, convertType(expr->getType()), 16);
case SVE::BI__builtin_sve_svlen_u16:
case SVE::BI__builtin_sve_svlen_s16:
case SVE::BI__builtin_sve_svlen_f16:
case SVE::BI__builtin_sve_svlen_bf16:
return genVscaleTimesFactor(loc, builder, convertType(expr->getType()), 8);
case SVE::BI__builtin_sve_svlen_u32:
case SVE::BI__builtin_sve_svlen_s32:
case SVE::BI__builtin_sve_svlen_f32:
return genVscaleTimesFactor(loc, builder, convertType(expr->getType()), 4);
case SVE::BI__builtin_sve_svlen_u64:
case SVE::BI__builtin_sve_svlen_s64:
case SVE::BI__builtin_sve_svlen_f64:
return genVscaleTimesFactor(loc, builder, convertType(expr->getType()), 2);
case SVE::BI__builtin_sve_svtbl2_u8:
case SVE::BI__builtin_sve_svtbl2_s8:
case SVE::BI__builtin_sve_svtbl2_u16:
case SVE::BI__builtin_sve_svtbl2_s16:
case SVE::BI__builtin_sve_svtbl2_u32:
case SVE::BI__builtin_sve_svtbl2_s32:
case SVE::BI__builtin_sve_svtbl2_u64:
case SVE::BI__builtin_sve_svtbl2_s64:
case SVE::BI__builtin_sve_svtbl2_f16:
case SVE::BI__builtin_sve_svtbl2_bf16:
case SVE::BI__builtin_sve_svtbl2_f32:
case SVE::BI__builtin_sve_svtbl2_f64:
case SVE::BI__builtin_sve_svset_neonq_s8:
case SVE::BI__builtin_sve_svset_neonq_s16:
case SVE::BI__builtin_sve_svset_neonq_s32:
case SVE::BI__builtin_sve_svset_neonq_s64:
case SVE::BI__builtin_sve_svset_neonq_u8:
case SVE::BI__builtin_sve_svset_neonq_u16:
case SVE::BI__builtin_sve_svset_neonq_u32:
case SVE::BI__builtin_sve_svset_neonq_u64:
case SVE::BI__builtin_sve_svset_neonq_f16:
case SVE::BI__builtin_sve_svset_neonq_f32:
case SVE::BI__builtin_sve_svset_neonq_f64:
case SVE::BI__builtin_sve_svset_neonq_bf16:
case SVE::BI__builtin_sve_svget_neonq_s8:
case SVE::BI__builtin_sve_svget_neonq_s16:
case SVE::BI__builtin_sve_svget_neonq_s32:
case SVE::BI__builtin_sve_svget_neonq_s64:
case SVE::BI__builtin_sve_svget_neonq_u8:
case SVE::BI__builtin_sve_svget_neonq_u16:
case SVE::BI__builtin_sve_svget_neonq_u32:
case SVE::BI__builtin_sve_svget_neonq_u64:
case SVE::BI__builtin_sve_svget_neonq_f16:
case SVE::BI__builtin_sve_svget_neonq_f32:
case SVE::BI__builtin_sve_svget_neonq_f64:
case SVE::BI__builtin_sve_svget_neonq_bf16:
case SVE::BI__builtin_sve_svdup_neonq_s8:
case SVE::BI__builtin_sve_svdup_neonq_s16:
case SVE::BI__builtin_sve_svdup_neonq_s32:
case SVE::BI__builtin_sve_svdup_neonq_s64:
case SVE::BI__builtin_sve_svdup_neonq_u8:
case SVE::BI__builtin_sve_svdup_neonq_u16:
case SVE::BI__builtin_sve_svdup_neonq_u32:
case SVE::BI__builtin_sve_svdup_neonq_u64:
case SVE::BI__builtin_sve_svdup_neonq_f16:
case SVE::BI__builtin_sve_svdup_neonq_f32:
case SVE::BI__builtin_sve_svdup_neonq_f64:
case SVE::BI__builtin_sve_svdup_neonq_bf16:
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
// Unreachable: All cases in the switch above return.
}
/// Emit CIR for a call to an AArch64 SME builtin.
///
/// No SME builtin is lowered yet: every call is diagnosed as not yet
/// implemented.
///
/// \param builtinID  ID of the SME builtin; used to name it in the diagnostic.
/// \param expr       The call expression; its source range locates the
///                   diagnostic.
/// \returns Always a null mlir::Value.
std::optional<mlir::Value>
CIRGenFunction::emitAArch64SMEBuiltinExpr(unsigned builtinID,
                                          const CallExpr *expr) {
  assert(!cir::MissingFeatures::aarch64SMEIntrinsics());

  const std::string diagText =
      std::string("unimplemented AArch64 builtin call: ") +
      getContext().BuiltinInfo.getName(builtinID);
  cgm.errorNYI(expr->getSourceRange(), diagText);

  return mlir::Value{};
}
// NEON builtins that are equivalent, for codegen, to another builtin. Each
// entry is {builtin ID, ID of the builtin it is equivalent to}.
static const std::pair<unsigned, unsigned> neonEquivalentIntrinsicMap[] = {
    // splat*_bf16 -> splat*_v
    {NEON::BI__builtin_neon_splat_lane_bf16,
     NEON::BI__builtin_neon_splat_lane_v},
    {NEON::BI__builtin_neon_splat_laneq_bf16,
     NEON::BI__builtin_neon_splat_laneq_v},
    {NEON::BI__builtin_neon_splatq_lane_bf16,
     NEON::BI__builtin_neon_splatq_lane_v},
    {NEON::BI__builtin_neon_splatq_laneq_bf16,
     NEON::BI__builtin_neon_splatq_laneq_v},

    // *_f16 -> *_v
    {NEON::BI__builtin_neon_vabd_f16, NEON::BI__builtin_neon_vabd_v},
    {NEON::BI__builtin_neon_vabdq_f16, NEON::BI__builtin_neon_vabdq_v},
    {NEON::BI__builtin_neon_vabs_f16, NEON::BI__builtin_neon_vabs_v},
    {NEON::BI__builtin_neon_vabsq_f16, NEON::BI__builtin_neon_vabsq_v},
    {NEON::BI__builtin_neon_vcage_f16, NEON::BI__builtin_neon_vcage_v},
    {NEON::BI__builtin_neon_vcageq_f16, NEON::BI__builtin_neon_vcageq_v},
    {NEON::BI__builtin_neon_vcagt_f16, NEON::BI__builtin_neon_vcagt_v},
    {NEON::BI__builtin_neon_vcagtq_f16, NEON::BI__builtin_neon_vcagtq_v},
    {NEON::BI__builtin_neon_vcale_f16, NEON::BI__builtin_neon_vcale_v},
    {NEON::BI__builtin_neon_vcaleq_f16, NEON::BI__builtin_neon_vcaleq_v},
    {NEON::BI__builtin_neon_vcalt_f16, NEON::BI__builtin_neon_vcalt_v},
    {NEON::BI__builtin_neon_vcaltq_f16, NEON::BI__builtin_neon_vcaltq_v},
    {NEON::BI__builtin_neon_vceqz_f16, NEON::BI__builtin_neon_vceqz_v},
    {NEON::BI__builtin_neon_vceqzq_f16, NEON::BI__builtin_neon_vceqzq_v},
    {NEON::BI__builtin_neon_vcgez_f16, NEON::BI__builtin_neon_vcgez_v},
    {NEON::BI__builtin_neon_vcgezq_f16, NEON::BI__builtin_neon_vcgezq_v},
    {NEON::BI__builtin_neon_vcgtz_f16, NEON::BI__builtin_neon_vcgtz_v},
    {NEON::BI__builtin_neon_vcgtzq_f16, NEON::BI__builtin_neon_vcgtzq_v},
    {NEON::BI__builtin_neon_vclez_f16, NEON::BI__builtin_neon_vclez_v},
    {NEON::BI__builtin_neon_vclezq_f16, NEON::BI__builtin_neon_vclezq_v},
    {NEON::BI__builtin_neon_vcltz_f16, NEON::BI__builtin_neon_vcltz_v},
    {NEON::BI__builtin_neon_vcltzq_f16, NEON::BI__builtin_neon_vcltzq_v},
    {NEON::BI__builtin_neon_vfma_f16, NEON::BI__builtin_neon_vfma_v},
    {NEON::BI__builtin_neon_vfma_lane_f16, NEON::BI__builtin_neon_vfma_lane_v},
    {NEON::BI__builtin_neon_vfma_laneq_f16,
     NEON::BI__builtin_neon_vfma_laneq_v},
    {NEON::BI__builtin_neon_vfmaq_f16, NEON::BI__builtin_neon_vfmaq_v},
    {NEON::BI__builtin_neon_vfmaq_lane_f16,
     NEON::BI__builtin_neon_vfmaq_lane_v},
    {NEON::BI__builtin_neon_vfmaq_laneq_f16,
     NEON::BI__builtin_neon_vfmaq_laneq_v},

    // vld*_bf16 -> vld*_v
    {NEON::BI__builtin_neon_vld1_bf16_x2, NEON::BI__builtin_neon_vld1_x2_v},
    {NEON::BI__builtin_neon_vld1_bf16_x3, NEON::BI__builtin_neon_vld1_x3_v},
    {NEON::BI__builtin_neon_vld1_bf16_x4, NEON::BI__builtin_neon_vld1_x4_v},
    {NEON::BI__builtin_neon_vld1_bf16, NEON::BI__builtin_neon_vld1_v},
    {NEON::BI__builtin_neon_vld1_dup_bf16, NEON::BI__builtin_neon_vld1_dup_v},
    {NEON::BI__builtin_neon_vld1_lane_bf16, NEON::BI__builtin_neon_vld1_lane_v},
    {NEON::BI__builtin_neon_vld1q_bf16_x2, NEON::BI__builtin_neon_vld1q_x2_v},
    {NEON::BI__builtin_neon_vld1q_bf16_x3, NEON::BI__builtin_neon_vld1q_x3_v},
    {NEON::BI__builtin_neon_vld1q_bf16_x4, NEON::BI__builtin_neon_vld1q_x4_v},
    {NEON::BI__builtin_neon_vld1q_bf16, NEON::BI__builtin_neon_vld1q_v},
    {NEON::BI__builtin_neon_vld1q_dup_bf16, NEON::BI__builtin_neon_vld1q_dup_v},
    {NEON::BI__builtin_neon_vld1q_lane_bf16,
     NEON::BI__builtin_neon_vld1q_lane_v},
    {NEON::BI__builtin_neon_vld2_bf16, NEON::BI__builtin_neon_vld2_v},
    {NEON::BI__builtin_neon_vld2_dup_bf16, NEON::BI__builtin_neon_vld2_dup_v},
    {NEON::BI__builtin_neon_vld2_lane_bf16, NEON::BI__builtin_neon_vld2_lane_v},
    {NEON::BI__builtin_neon_vld2q_bf16, NEON::BI__builtin_neon_vld2q_v},
    {NEON::BI__builtin_neon_vld2q_dup_bf16, NEON::BI__builtin_neon_vld2q_dup_v},
    {NEON::BI__builtin_neon_vld2q_lane_bf16,
     NEON::BI__builtin_neon_vld2q_lane_v},
    {NEON::BI__builtin_neon_vld3_bf16, NEON::BI__builtin_neon_vld3_v},
    {NEON::BI__builtin_neon_vld3_dup_bf16, NEON::BI__builtin_neon_vld3_dup_v},
    {NEON::BI__builtin_neon_vld3_lane_bf16, NEON::BI__builtin_neon_vld3_lane_v},
    {NEON::BI__builtin_neon_vld3q_bf16, NEON::BI__builtin_neon_vld3q_v},
    {NEON::BI__builtin_neon_vld3q_dup_bf16, NEON::BI__builtin_neon_vld3q_dup_v},
    {NEON::BI__builtin_neon_vld3q_lane_bf16,
     NEON::BI__builtin_neon_vld3q_lane_v},
    {NEON::BI__builtin_neon_vld4_bf16, NEON::BI__builtin_neon_vld4_v},
    {NEON::BI__builtin_neon_vld4_dup_bf16, NEON::BI__builtin_neon_vld4_dup_v},
    {NEON::BI__builtin_neon_vld4_lane_bf16, NEON::BI__builtin_neon_vld4_lane_v},
    {NEON::BI__builtin_neon_vld4q_bf16, NEON::BI__builtin_neon_vld4q_v},
    {NEON::BI__builtin_neon_vld4q_dup_bf16, NEON::BI__builtin_neon_vld4q_dup_v},
    {NEON::BI__builtin_neon_vld4q_lane_bf16,
     NEON::BI__builtin_neon_vld4q_lane_v},

    // *_f16 -> *_v (continued)
    {NEON::BI__builtin_neon_vmax_f16, NEON::BI__builtin_neon_vmax_v},
    {NEON::BI__builtin_neon_vmaxnm_f16, NEON::BI__builtin_neon_vmaxnm_v},
    {NEON::BI__builtin_neon_vmaxnmq_f16, NEON::BI__builtin_neon_vmaxnmq_v},
    {NEON::BI__builtin_neon_vmaxq_f16, NEON::BI__builtin_neon_vmaxq_v},
    {NEON::BI__builtin_neon_vmin_f16, NEON::BI__builtin_neon_vmin_v},
    {NEON::BI__builtin_neon_vminnm_f16, NEON::BI__builtin_neon_vminnm_v},
    {NEON::BI__builtin_neon_vminnmq_f16, NEON::BI__builtin_neon_vminnmq_v},
    {NEON::BI__builtin_neon_vminq_f16, NEON::BI__builtin_neon_vminq_v},
    {NEON::BI__builtin_neon_vmulx_f16, NEON::BI__builtin_neon_vmulx_v},
    {NEON::BI__builtin_neon_vmulxq_f16, NEON::BI__builtin_neon_vmulxq_v},
    {NEON::BI__builtin_neon_vpadd_f16, NEON::BI__builtin_neon_vpadd_v},
    {NEON::BI__builtin_neon_vpaddq_f16, NEON::BI__builtin_neon_vpaddq_v},
    {NEON::BI__builtin_neon_vpmax_f16, NEON::BI__builtin_neon_vpmax_v},
    {NEON::BI__builtin_neon_vpmaxnm_f16, NEON::BI__builtin_neon_vpmaxnm_v},
    {NEON::BI__builtin_neon_vpmaxnmq_f16, NEON::BI__builtin_neon_vpmaxnmq_v},
    {NEON::BI__builtin_neon_vpmaxq_f16, NEON::BI__builtin_neon_vpmaxq_v},
    {NEON::BI__builtin_neon_vpmin_f16, NEON::BI__builtin_neon_vpmin_v},
    {NEON::BI__builtin_neon_vpminnm_f16, NEON::BI__builtin_neon_vpminnm_v},
    {NEON::BI__builtin_neon_vpminnmq_f16, NEON::BI__builtin_neon_vpminnmq_v},
    {NEON::BI__builtin_neon_vpminq_f16, NEON::BI__builtin_neon_vpminq_v},
    {NEON::BI__builtin_neon_vrecpe_f16, NEON::BI__builtin_neon_vrecpe_v},
    {NEON::BI__builtin_neon_vrecpeq_f16, NEON::BI__builtin_neon_vrecpeq_v},
    {NEON::BI__builtin_neon_vrecps_f16, NEON::BI__builtin_neon_vrecps_v},
    {NEON::BI__builtin_neon_vrecpsq_f16, NEON::BI__builtin_neon_vrecpsq_v},
    {NEON::BI__builtin_neon_vrnd_f16, NEON::BI__builtin_neon_vrnd_v},
    {NEON::BI__builtin_neon_vrnda_f16, NEON::BI__builtin_neon_vrnda_v},
    {NEON::BI__builtin_neon_vrndaq_f16, NEON::BI__builtin_neon_vrndaq_v},
    {NEON::BI__builtin_neon_vrndi_f16, NEON::BI__builtin_neon_vrndi_v},
    {NEON::BI__builtin_neon_vrndiq_f16, NEON::BI__builtin_neon_vrndiq_v},
    {NEON::BI__builtin_neon_vrndm_f16, NEON::BI__builtin_neon_vrndm_v},
    {NEON::BI__builtin_neon_vrndmq_f16, NEON::BI__builtin_neon_vrndmq_v},
    {NEON::BI__builtin_neon_vrndn_f16, NEON::BI__builtin_neon_vrndn_v},
    {NEON::BI__builtin_neon_vrndnq_f16, NEON::BI__builtin_neon_vrndnq_v},
    {NEON::BI__builtin_neon_vrndp_f16, NEON::BI__builtin_neon_vrndp_v},
    {NEON::BI__builtin_neon_vrndpq_f16, NEON::BI__builtin_neon_vrndpq_v},
    {NEON::BI__builtin_neon_vrndq_f16, NEON::BI__builtin_neon_vrndq_v},
    {NEON::BI__builtin_neon_vrndx_f16, NEON::BI__builtin_neon_vrndx_v},
    {NEON::BI__builtin_neon_vrndxq_f16, NEON::BI__builtin_neon_vrndxq_v},
    {NEON::BI__builtin_neon_vrsqrte_f16, NEON::BI__builtin_neon_vrsqrte_v},
    {NEON::BI__builtin_neon_vrsqrteq_f16, NEON::BI__builtin_neon_vrsqrteq_v},
    {NEON::BI__builtin_neon_vrsqrts_f16, NEON::BI__builtin_neon_vrsqrts_v},
    {NEON::BI__builtin_neon_vrsqrtsq_f16, NEON::BI__builtin_neon_vrsqrtsq_v},
    {NEON::BI__builtin_neon_vsqrt_f16, NEON::BI__builtin_neon_vsqrt_v},
    {NEON::BI__builtin_neon_vsqrtq_f16, NEON::BI__builtin_neon_vsqrtq_v},

    // vst*_bf16 -> vst*_v
    {NEON::BI__builtin_neon_vst1_bf16_x2, NEON::BI__builtin_neon_vst1_x2_v},
    {NEON::BI__builtin_neon_vst1_bf16_x3, NEON::BI__builtin_neon_vst1_x3_v},
    {NEON::BI__builtin_neon_vst1_bf16_x4, NEON::BI__builtin_neon_vst1_x4_v},
    {NEON::BI__builtin_neon_vst1_bf16, NEON::BI__builtin_neon_vst1_v},
    {NEON::BI__builtin_neon_vst1_lane_bf16, NEON::BI__builtin_neon_vst1_lane_v},
    {NEON::BI__builtin_neon_vst1q_bf16_x2, NEON::BI__builtin_neon_vst1q_x2_v},
    {NEON::BI__builtin_neon_vst1q_bf16_x3, NEON::BI__builtin_neon_vst1q_x3_v},
    {NEON::BI__builtin_neon_vst1q_bf16_x4, NEON::BI__builtin_neon_vst1q_x4_v},
    {NEON::BI__builtin_neon_vst1q_bf16, NEON::BI__builtin_neon_vst1q_v},
    {NEON::BI__builtin_neon_vst1q_lane_bf16,
     NEON::BI__builtin_neon_vst1q_lane_v},
    {NEON::BI__builtin_neon_vst2_bf16, NEON::BI__builtin_neon_vst2_v},
    {NEON::BI__builtin_neon_vst2_lane_bf16, NEON::BI__builtin_neon_vst2_lane_v},
    {NEON::BI__builtin_neon_vst2q_bf16, NEON::BI__builtin_neon_vst2q_v},
    {NEON::BI__builtin_neon_vst2q_lane_bf16,
     NEON::BI__builtin_neon_vst2q_lane_v},
    {NEON::BI__builtin_neon_vst3_bf16, NEON::BI__builtin_neon_vst3_v},
    {NEON::BI__builtin_neon_vst3_lane_bf16, NEON::BI__builtin_neon_vst3_lane_v},
    {NEON::BI__builtin_neon_vst3q_bf16, NEON::BI__builtin_neon_vst3q_v},
    {NEON::BI__builtin_neon_vst3q_lane_bf16,
     NEON::BI__builtin_neon_vst3q_lane_v},
    {NEON::BI__builtin_neon_vst4_bf16, NEON::BI__builtin_neon_vst4_v},
    {NEON::BI__builtin_neon_vst4_lane_bf16, NEON::BI__builtin_neon_vst4_lane_v},
    {NEON::BI__builtin_neon_vst4q_bf16, NEON::BI__builtin_neon_vst4q_v},
    {NEON::BI__builtin_neon_vst4q_lane_bf16,
     NEON::BI__builtin_neon_vst4q_lane_v},

    // The mangling rules give vldap1(q)_lane and vstl1(q)_lane one ID per
    // element type, but codegen is the same for all of them. The s64 variant
    // is arbitrarily chosen as the canonical one.
    {NEON::BI__builtin_neon_vldap1_lane_u64,
     NEON::BI__builtin_neon_vldap1_lane_s64},
    {NEON::BI__builtin_neon_vldap1_lane_f64,
     NEON::BI__builtin_neon_vldap1_lane_s64},
    {NEON::BI__builtin_neon_vldap1_lane_p64,
     NEON::BI__builtin_neon_vldap1_lane_s64},
    {NEON::BI__builtin_neon_vldap1q_lane_u64,
     NEON::BI__builtin_neon_vldap1q_lane_s64},
    {NEON::BI__builtin_neon_vldap1q_lane_f64,
     NEON::BI__builtin_neon_vldap1q_lane_s64},
    {NEON::BI__builtin_neon_vldap1q_lane_p64,
     NEON::BI__builtin_neon_vldap1q_lane_s64},
    {NEON::BI__builtin_neon_vstl1_lane_u64,
     NEON::BI__builtin_neon_vstl1_lane_s64},
    {NEON::BI__builtin_neon_vstl1_lane_f64,
     NEON::BI__builtin_neon_vstl1_lane_s64},
    {NEON::BI__builtin_neon_vstl1_lane_p64,
     NEON::BI__builtin_neon_vstl1_lane_s64},
    {NEON::BI__builtin_neon_vstl1q_lane_u64,
     NEON::BI__builtin_neon_vstl1q_lane_s64},
    {NEON::BI__builtin_neon_vstl1q_lane_f64,
     NEON::BI__builtin_neon_vstl1q_lane_s64},
    {NEON::BI__builtin_neon_vstl1q_lane_p64,
     NEON::BI__builtin_neon_vstl1q_lane_s64},
};
std::optional<mlir::Value>
CIRGenFunction::emitAArch64BuiltinExpr(unsigned builtinID, const CallExpr *expr,
ReturnValueSlot returnValue,
llvm::Triple::ArchType arch) {
if (builtinID >= clang::AArch64::FirstSVEBuiltin &&
builtinID <= clang::AArch64::LastSVEBuiltin)
return emitAArch64SVEBuiltinExpr(builtinID, expr);
if (builtinID >= clang::AArch64::FirstSMEBuiltin &&
builtinID <= clang::AArch64::LastSMEBuiltin)
return emitAArch64SMEBuiltinExpr(builtinID, expr);
if (builtinID == Builtin::BI__builtin_cpu_supports) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
switch (builtinID) {
default:
break;
case clang::AArch64::BI__builtin_arm_nop:
case clang::AArch64::BI__builtin_arm_yield:
case clang::AArch64::BI__yield:
case clang::AArch64::BI__builtin_arm_wfe:
case clang::AArch64::BI__wfe:
case clang::AArch64::BI__builtin_arm_wfi:
case clang::AArch64::BI__wfi:
case clang::AArch64::BI__builtin_arm_sev:
case clang::AArch64::BI__sev:
case clang::AArch64::BI__builtin_arm_sevl:
case clang::AArch64::BI__sevl:
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_trap) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_get_sme_state) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_rbit) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_rbit64) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_clz ||
builtinID == clang::AArch64::BI__builtin_arm_clz64) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_cls) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_cls64) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_rint32zf ||
builtinID == clang::AArch64::BI__builtin_arm_rint32z) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_rint64zf ||
builtinID == clang::AArch64::BI__builtin_arm_rint64z) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_rint32xf ||
builtinID == clang::AArch64::BI__builtin_arm_rint32x) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_rint64xf ||
builtinID == clang::AArch64::BI__builtin_arm_rint64x) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_jcvt) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_ld64b ||
builtinID == clang::AArch64::BI__builtin_arm_st64b ||
builtinID == clang::AArch64::BI__builtin_arm_st64bv ||
builtinID == clang::AArch64::BI__builtin_arm_st64bv0) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_rndr ||
builtinID == clang::AArch64::BI__builtin_arm_rndrrs) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__clear_cache) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if ((builtinID == clang::AArch64::BI__builtin_arm_ldrex ||
builtinID == clang::AArch64::BI__builtin_arm_ldaex) &&
getContext().getTypeSize(expr->getType()) == 128) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_ldrex ||
builtinID == clang::AArch64::BI__builtin_arm_ldaex) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if ((builtinID == clang::AArch64::BI__builtin_arm_strex ||
builtinID == clang::AArch64::BI__builtin_arm_stlex) &&
getContext().getTypeSize(expr->getArg(0)->getType()) == 128) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_strex ||
builtinID == clang::AArch64::BI__builtin_arm_stlex) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__getReg) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__break) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_clrex) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI_ReadWriteBarrier) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
// CRC32
Intrinsic::ID crcIntrinsicID = Intrinsic::not_intrinsic;
switch (builtinID) {
case clang::AArch64::BI__builtin_arm_crc32b:
crcIntrinsicID = Intrinsic::aarch64_crc32b;
break;
case clang::AArch64::BI__builtin_arm_crc32cb:
crcIntrinsicID = Intrinsic::aarch64_crc32cb;
break;
case clang::AArch64::BI__builtin_arm_crc32h:
crcIntrinsicID = Intrinsic::aarch64_crc32h;
break;
case clang::AArch64::BI__builtin_arm_crc32ch:
crcIntrinsicID = Intrinsic::aarch64_crc32ch;
break;
case clang::AArch64::BI__builtin_arm_crc32w:
crcIntrinsicID = Intrinsic::aarch64_crc32w;
break;
case clang::AArch64::BI__builtin_arm_crc32cw:
crcIntrinsicID = Intrinsic::aarch64_crc32cw;
break;
case clang::AArch64::BI__builtin_arm_crc32d:
crcIntrinsicID = Intrinsic::aarch64_crc32x;
break;
case clang::AArch64::BI__builtin_arm_crc32cd:
crcIntrinsicID = Intrinsic::aarch64_crc32cx;
break;
}
if (crcIntrinsicID != Intrinsic::not_intrinsic) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
// Memory Operations (MOPS)
if (builtinID == AArch64::BI__builtin_arm_mops_memset_tag) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
// Memory Tagging Extensions (MTE) Intrinsics
Intrinsic::ID mteIntrinsicID = Intrinsic::not_intrinsic;
switch (builtinID) {
case clang::AArch64::BI__builtin_arm_irg:
mteIntrinsicID = Intrinsic::aarch64_irg;
break;
case clang::AArch64::BI__builtin_arm_addg:
mteIntrinsicID = Intrinsic::aarch64_addg;
break;
case clang::AArch64::BI__builtin_arm_gmi:
mteIntrinsicID = Intrinsic::aarch64_gmi;
break;
case clang::AArch64::BI__builtin_arm_ldg:
mteIntrinsicID = Intrinsic::aarch64_ldg;
break;
case clang::AArch64::BI__builtin_arm_stg:
mteIntrinsicID = Intrinsic::aarch64_stg;
break;
case clang::AArch64::BI__builtin_arm_subp:
mteIntrinsicID = Intrinsic::aarch64_subp;
break;
}
if (mteIntrinsicID != Intrinsic::not_intrinsic) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_arm_rsr ||
builtinID == clang::AArch64::BI__builtin_arm_rsr64 ||
builtinID == clang::AArch64::BI__builtin_arm_rsr128 ||
builtinID == clang::AArch64::BI__builtin_arm_rsrp ||
builtinID == clang::AArch64::BI__builtin_arm_wsr ||
builtinID == clang::AArch64::BI__builtin_arm_wsr64 ||
builtinID == clang::AArch64::BI__builtin_arm_wsr128 ||
builtinID == clang::AArch64::BI__builtin_arm_wsrp) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI_ReadStatusReg ||
builtinID == clang::AArch64::BI_WriteStatusReg ||
builtinID == clang::AArch64::BI__sys) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI_AddressOfReturnAddress) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__builtin_sponentry) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == clang::AArch64::BI__mulh ||
builtinID == clang::AArch64::BI__umulh) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI__writex18byte ||
builtinID == AArch64::BI__writex18word ||
builtinID == AArch64::BI__writex18dword ||
builtinID == AArch64::BI__writex18qword) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI__readx18byte ||
builtinID == AArch64::BI__readx18word ||
builtinID == AArch64::BI__readx18dword ||
builtinID == AArch64::BI__readx18qword) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI__addx18byte ||
builtinID == AArch64::BI__addx18word ||
builtinID == AArch64::BI__addx18dword ||
builtinID == AArch64::BI__addx18qword ||
builtinID == AArch64::BI__incx18byte ||
builtinID == AArch64::BI__incx18word ||
builtinID == AArch64::BI__incx18dword ||
builtinID == AArch64::BI__incx18qword) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI_CopyDoubleFromInt64 ||
builtinID == AArch64::BI_CopyFloatFromInt32 ||
builtinID == AArch64::BI_CopyInt32FromFloat ||
builtinID == AArch64::BI_CopyInt64FromDouble) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI_CountLeadingOnes ||
builtinID == AArch64::BI_CountLeadingOnes64 ||
builtinID == AArch64::BI_CountLeadingZeros ||
builtinID == AArch64::BI_CountLeadingZeros64) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI_CountLeadingSigns ||
builtinID == AArch64::BI_CountLeadingSigns64) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI_CountOneBits ||
builtinID == AArch64::BI_CountOneBits64) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI__prefetch) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == AArch64::BI__hlt) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
if (builtinID == NEON::BI__builtin_neon_vcvth_bf16_f32) {
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
// Handle MSVC intrinsics before argument evaluation to prevent double
// evaluation.
assert(!cir::MissingFeatures::msvcBuiltins());
// Some intrinsics are equivalent to others; for those, use the base intrinsic ID.
auto it = llvm::find_if(neonEquivalentIntrinsicMap, [builtinID](auto &p) {
return p.first == builtinID;
});
if (it != end(neonEquivalentIntrinsicMap))
builtinID = it->second;
// Find out if any arguments are required to be integer constant
// expressions.
assert(!cir::MissingFeatures::handleBuiltinICEArguments());
assert(!cir::MissingFeatures::neonSISDIntrinsics());
// Handle non-overloaded intrinsics first.
switch (builtinID) {
default:
break;
case NEON::BI__builtin_neon_vabsh_f16:
case NEON::BI__builtin_neon_vaddq_p128:
case NEON::BI__builtin_neon_vldrq_p128:
case NEON::BI__builtin_neon_vstrq_p128:
case NEON::BI__builtin_neon_vcvts_f32_u32:
case NEON::BI__builtin_neon_vcvtd_f64_u64:
case NEON::BI__builtin_neon_vcvts_f32_s32:
case NEON::BI__builtin_neon_vcvtd_f64_s64:
case NEON::BI__builtin_neon_vcvth_f16_u16:
case NEON::BI__builtin_neon_vcvth_f16_u32:
case NEON::BI__builtin_neon_vcvth_f16_u64:
case NEON::BI__builtin_neon_vcvth_f16_s16:
case NEON::BI__builtin_neon_vcvth_f16_s32:
case NEON::BI__builtin_neon_vcvth_f16_s64:
case NEON::BI__builtin_neon_vcvtah_u16_f16:
case NEON::BI__builtin_neon_vcvtmh_u16_f16:
case NEON::BI__builtin_neon_vcvtnh_u16_f16:
case NEON::BI__builtin_neon_vcvtph_u16_f16:
case NEON::BI__builtin_neon_vcvth_u16_f16:
case NEON::BI__builtin_neon_vcvtah_s16_f16:
case NEON::BI__builtin_neon_vcvtmh_s16_f16:
case NEON::BI__builtin_neon_vcvtnh_s16_f16:
case NEON::BI__builtin_neon_vcvtph_s16_f16:
case NEON::BI__builtin_neon_vcvth_s16_f16:
case NEON::BI__builtin_neon_vcaleh_f16:
case NEON::BI__builtin_neon_vcalth_f16:
case NEON::BI__builtin_neon_vcageh_f16:
case NEON::BI__builtin_neon_vcagth_f16:
case NEON::BI__builtin_neon_vcvth_n_s16_f16:
case NEON::BI__builtin_neon_vcvth_n_u16_f16:
case NEON::BI__builtin_neon_vcvth_n_f16_s16:
case NEON::BI__builtin_neon_vcvth_n_f16_u16:
case NEON::BI__builtin_neon_vpaddd_s64:
case NEON::BI__builtin_neon_vpaddd_f64:
case NEON::BI__builtin_neon_vpadds_f32:
case NEON::BI__builtin_neon_vceqzd_s64:
case NEON::BI__builtin_neon_vceqzd_f64:
case NEON::BI__builtin_neon_vceqzs_f32:
case NEON::BI__builtin_neon_vceqzh_f16:
case NEON::BI__builtin_neon_vcgezd_s64:
case NEON::BI__builtin_neon_vcgezd_f64:
case NEON::BI__builtin_neon_vcgezs_f32:
case NEON::BI__builtin_neon_vcgezh_f16:
case NEON::BI__builtin_neon_vclezd_s64:
case NEON::BI__builtin_neon_vclezd_f64:
case NEON::BI__builtin_neon_vclezs_f32:
case NEON::BI__builtin_neon_vclezh_f16:
case NEON::BI__builtin_neon_vcgtzd_s64:
case NEON::BI__builtin_neon_vcgtzd_f64:
case NEON::BI__builtin_neon_vcgtzs_f32:
case NEON::BI__builtin_neon_vcgtzh_f16:
case NEON::BI__builtin_neon_vcltzd_s64:
case NEON::BI__builtin_neon_vcltzd_f64:
case NEON::BI__builtin_neon_vcltzs_f32:
case NEON::BI__builtin_neon_vcltzh_f16:
case NEON::BI__builtin_neon_vceqzd_u64:
case NEON::BI__builtin_neon_vceqd_f64:
case NEON::BI__builtin_neon_vcled_f64:
case NEON::BI__builtin_neon_vcltd_f64:
case NEON::BI__builtin_neon_vcged_f64:
case NEON::BI__builtin_neon_vcgtd_f64:
case NEON::BI__builtin_neon_vceqs_f32:
case NEON::BI__builtin_neon_vcles_f32:
case NEON::BI__builtin_neon_vclts_f32:
case NEON::BI__builtin_neon_vcges_f32:
case NEON::BI__builtin_neon_vcgts_f32:
case NEON::BI__builtin_neon_vceqh_f16:
case NEON::BI__builtin_neon_vcleh_f16:
case NEON::BI__builtin_neon_vclth_f16:
case NEON::BI__builtin_neon_vcgeh_f16:
case NEON::BI__builtin_neon_vcgth_f16:
case NEON::BI__builtin_neon_vceqd_s64:
case NEON::BI__builtin_neon_vceqd_u64:
case NEON::BI__builtin_neon_vcgtd_s64:
case NEON::BI__builtin_neon_vcgtd_u64:
case NEON::BI__builtin_neon_vcltd_s64:
case NEON::BI__builtin_neon_vcltd_u64:
case NEON::BI__builtin_neon_vcged_u64:
case NEON::BI__builtin_neon_vcged_s64:
case NEON::BI__builtin_neon_vcled_u64:
case NEON::BI__builtin_neon_vcled_s64:
case NEON::BI__builtin_neon_vtstd_s64:
case NEON::BI__builtin_neon_vtstd_u64:
case NEON::BI__builtin_neon_vset_lane_i8:
case NEON::BI__builtin_neon_vset_lane_i16:
case NEON::BI__builtin_neon_vset_lane_i32:
case NEON::BI__builtin_neon_vset_lane_i64:
case NEON::BI__builtin_neon_vset_lane_bf16:
case NEON::BI__builtin_neon_vset_lane_f32:
case NEON::BI__builtin_neon_vsetq_lane_i8:
case NEON::BI__builtin_neon_vsetq_lane_i16:
case NEON::BI__builtin_neon_vsetq_lane_i32:
case NEON::BI__builtin_neon_vsetq_lane_i64:
case NEON::BI__builtin_neon_vsetq_lane_bf16:
case NEON::BI__builtin_neon_vsetq_lane_f32:
case NEON::BI__builtin_neon_vset_lane_f64:
case NEON::BI__builtin_neon_vset_lane_mf8:
case NEON::BI__builtin_neon_vsetq_lane_mf8:
case NEON::BI__builtin_neon_vsetq_lane_f64:
case NEON::BI__builtin_neon_vget_lane_i8:
case NEON::BI__builtin_neon_vdupb_lane_i8:
case NEON::BI__builtin_neon_vgetq_lane_i8:
case NEON::BI__builtin_neon_vdupb_laneq_i8:
case NEON::BI__builtin_neon_vget_lane_mf8:
case NEON::BI__builtin_neon_vdupb_lane_mf8:
case NEON::BI__builtin_neon_vgetq_lane_mf8:
case NEON::BI__builtin_neon_vdupb_laneq_mf8:
case NEON::BI__builtin_neon_vget_lane_i16:
case NEON::BI__builtin_neon_vduph_lane_i16:
case NEON::BI__builtin_neon_vgetq_lane_i16:
case NEON::BI__builtin_neon_vduph_laneq_i16:
case NEON::BI__builtin_neon_vget_lane_i32:
case NEON::BI__builtin_neon_vdups_lane_i32:
case NEON::BI__builtin_neon_vdups_lane_f32:
case NEON::BI__builtin_neon_vgetq_lane_i32:
case NEON::BI__builtin_neon_vdups_laneq_i32:
case NEON::BI__builtin_neon_vget_lane_i64:
case NEON::BI__builtin_neon_vdupd_lane_i64:
case NEON::BI__builtin_neon_vdupd_lane_f64:
case NEON::BI__builtin_neon_vgetq_lane_i64:
case NEON::BI__builtin_neon_vdupd_laneq_i64:
case NEON::BI__builtin_neon_vget_lane_f32:
case NEON::BI__builtin_neon_vget_lane_f64:
case NEON::BI__builtin_neon_vgetq_lane_f32:
case NEON::BI__builtin_neon_vdups_laneq_f32:
case NEON::BI__builtin_neon_vgetq_lane_f64:
case NEON::BI__builtin_neon_vdupd_laneq_f64:
case NEON::BI__builtin_neon_vaddh_f16:
case NEON::BI__builtin_neon_vsubh_f16:
case NEON::BI__builtin_neon_vmulh_f16:
case NEON::BI__builtin_neon_vdivh_f16:
case NEON::BI__builtin_neon_vfmah_f16:
case NEON::BI__builtin_neon_vfmsh_f16:
case NEON::BI__builtin_neon_vaddd_s64:
case NEON::BI__builtin_neon_vaddd_u64:
case NEON::BI__builtin_neon_vsubd_s64:
case NEON::BI__builtin_neon_vsubd_u64:
case NEON::BI__builtin_neon_vqdmlalh_s16:
case NEON::BI__builtin_neon_vqdmlslh_s16:
case NEON::BI__builtin_neon_vqshlud_n_s64:
case NEON::BI__builtin_neon_vqshld_n_u64:
case NEON::BI__builtin_neon_vqshld_n_s64:
case NEON::BI__builtin_neon_vrshrd_n_u64:
case NEON::BI__builtin_neon_vrshrd_n_s64:
case NEON::BI__builtin_neon_vrsrad_n_u64:
case NEON::BI__builtin_neon_vrsrad_n_s64:
case NEON::BI__builtin_neon_vshld_n_s64:
case NEON::BI__builtin_neon_vshld_n_u64:
case NEON::BI__builtin_neon_vshrd_n_s64:
case NEON::BI__builtin_neon_vshrd_n_u64:
case NEON::BI__builtin_neon_vsrad_n_s64:
case NEON::BI__builtin_neon_vsrad_n_u64:
case NEON::BI__builtin_neon_vqdmlalh_lane_s16:
case NEON::BI__builtin_neon_vqdmlalh_laneq_s16:
case NEON::BI__builtin_neon_vqdmlslh_lane_s16:
case NEON::BI__builtin_neon_vqdmlslh_laneq_s16:
case NEON::BI__builtin_neon_vqdmlals_s32:
case NEON::BI__builtin_neon_vqdmlsls_s32:
case NEON::BI__builtin_neon_vqdmlals_lane_s32:
case NEON::BI__builtin_neon_vqdmlals_laneq_s32:
case NEON::BI__builtin_neon_vqdmlsls_lane_s32:
case NEON::BI__builtin_neon_vqdmlsls_laneq_s32:
case NEON::BI__builtin_neon_vget_lane_bf16:
case NEON::BI__builtin_neon_vduph_lane_bf16:
case NEON::BI__builtin_neon_vduph_lane_f16:
case NEON::BI__builtin_neon_vgetq_lane_bf16:
case NEON::BI__builtin_neon_vduph_laneq_bf16:
case NEON::BI__builtin_neon_vduph_laneq_f16:
case NEON::BI__builtin_neon_vcvt_bf16_f32:
case NEON::BI__builtin_neon_vcvtq_low_bf16_f32:
case NEON::BI__builtin_neon_vcvtq_high_bf16_f32:
case clang::AArch64::BI_InterlockedAdd:
case clang::AArch64::BI_InterlockedAdd_acq:
case clang::AArch64::BI_InterlockedAdd_rel:
case clang::AArch64::BI_InterlockedAdd_nf:
case clang::AArch64::BI_InterlockedAdd64:
case clang::AArch64::BI_InterlockedAdd64_acq:
case clang::AArch64::BI_InterlockedAdd64_rel:
case clang::AArch64::BI_InterlockedAdd64_nf:
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
// Not all intrinsics handled by the common case work for AArch64 yet, so only
// defer to common code if it's been added to our special map.
assert(!cir::MissingFeatures::aarch64SIMDIntrinsics());
assert(!cir::MissingFeatures::aarch64TblBuiltinExpr());
switch (builtinID) {
default:
return std::nullopt;
case NEON::BI__builtin_neon_vbsl_v:
case NEON::BI__builtin_neon_vbslq_v:
case NEON::BI__builtin_neon_vfma_lane_v:
case NEON::BI__builtin_neon_vfmaq_lane_v:
case NEON::BI__builtin_neon_vfma_laneq_v:
case NEON::BI__builtin_neon_vfmaq_laneq_v:
case NEON::BI__builtin_neon_vfmah_lane_f16:
case NEON::BI__builtin_neon_vfmas_lane_f32:
case NEON::BI__builtin_neon_vfmah_laneq_f16:
case NEON::BI__builtin_neon_vfmas_laneq_f32:
case NEON::BI__builtin_neon_vfmad_lane_f64:
case NEON::BI__builtin_neon_vfmad_laneq_f64:
case NEON::BI__builtin_neon_vmull_v:
case NEON::BI__builtin_neon_vmax_v:
case NEON::BI__builtin_neon_vmaxq_v:
case NEON::BI__builtin_neon_vmaxh_f16:
case NEON::BI__builtin_neon_vmin_v:
case NEON::BI__builtin_neon_vminq_v:
case NEON::BI__builtin_neon_vminh_f16:
case NEON::BI__builtin_neon_vabd_v:
case NEON::BI__builtin_neon_vabdq_v:
case NEON::BI__builtin_neon_vpadal_v:
case NEON::BI__builtin_neon_vpadalq_v:
case NEON::BI__builtin_neon_vpmin_v:
case NEON::BI__builtin_neon_vpminq_v:
case NEON::BI__builtin_neon_vpmax_v:
case NEON::BI__builtin_neon_vpmaxq_v:
case NEON::BI__builtin_neon_vminnm_v:
case NEON::BI__builtin_neon_vminnmq_v:
case NEON::BI__builtin_neon_vminnmh_f16:
case NEON::BI__builtin_neon_vmaxnm_v:
case NEON::BI__builtin_neon_vmaxnmq_v:
case NEON::BI__builtin_neon_vmaxnmh_f16:
case NEON::BI__builtin_neon_vrecpss_f32:
case NEON::BI__builtin_neon_vrecpsd_f64:
case NEON::BI__builtin_neon_vrecpsh_f16:
case NEON::BI__builtin_neon_vqshrun_n_v:
case NEON::BI__builtin_neon_vqrshrun_n_v:
case NEON::BI__builtin_neon_vqshrn_n_v:
case NEON::BI__builtin_neon_vrshrn_n_v:
case NEON::BI__builtin_neon_vqrshrn_n_v:
case NEON::BI__builtin_neon_vrndah_f16:
case NEON::BI__builtin_neon_vrnda_v:
case NEON::BI__builtin_neon_vrndaq_v:
case NEON::BI__builtin_neon_vrndih_f16:
case NEON::BI__builtin_neon_vrndmh_f16:
case NEON::BI__builtin_neon_vrndm_v:
case NEON::BI__builtin_neon_vrndmq_v:
case NEON::BI__builtin_neon_vrndnh_f16:
case NEON::BI__builtin_neon_vrndn_v:
case NEON::BI__builtin_neon_vrndnq_v:
case NEON::BI__builtin_neon_vrndns_f32:
case NEON::BI__builtin_neon_vrndph_f16:
case NEON::BI__builtin_neon_vrndp_v:
case NEON::BI__builtin_neon_vrndpq_v:
case NEON::BI__builtin_neon_vrndxh_f16:
case NEON::BI__builtin_neon_vrndx_v:
case NEON::BI__builtin_neon_vrndxq_v:
case NEON::BI__builtin_neon_vrndh_f16:
case NEON::BI__builtin_neon_vrnd32x_f32:
case NEON::BI__builtin_neon_vrnd32xq_f32:
case NEON::BI__builtin_neon_vrnd32x_f64:
case NEON::BI__builtin_neon_vrnd32xq_f64:
case NEON::BI__builtin_neon_vrnd32z_f32:
case NEON::BI__builtin_neon_vrnd32zq_f32:
case NEON::BI__builtin_neon_vrnd32z_f64:
case NEON::BI__builtin_neon_vrnd32zq_f64:
case NEON::BI__builtin_neon_vrnd64x_f32:
case NEON::BI__builtin_neon_vrnd64xq_f32:
case NEON::BI__builtin_neon_vrnd64x_f64:
case NEON::BI__builtin_neon_vrnd64xq_f64:
case NEON::BI__builtin_neon_vrnd64z_f32:
case NEON::BI__builtin_neon_vrnd64zq_f32:
case NEON::BI__builtin_neon_vrnd64z_f64:
case NEON::BI__builtin_neon_vrnd64zq_f64:
case NEON::BI__builtin_neon_vrnd_v:
case NEON::BI__builtin_neon_vrndq_v:
case NEON::BI__builtin_neon_vcvt_f64_v:
case NEON::BI__builtin_neon_vcvtq_f64_v:
case NEON::BI__builtin_neon_vcvt_f64_f32:
case NEON::BI__builtin_neon_vcvt_f32_f64:
case NEON::BI__builtin_neon_vcvt_s32_v:
case NEON::BI__builtin_neon_vcvt_u32_v:
case NEON::BI__builtin_neon_vcvt_s64_v:
case NEON::BI__builtin_neon_vcvt_u64_v:
case NEON::BI__builtin_neon_vcvt_s16_f16:
case NEON::BI__builtin_neon_vcvt_u16_f16:
case NEON::BI__builtin_neon_vcvtq_s32_v:
case NEON::BI__builtin_neon_vcvtq_u32_v:
case NEON::BI__builtin_neon_vcvtq_s64_v:
case NEON::BI__builtin_neon_vcvtq_u64_v:
case NEON::BI__builtin_neon_vcvtq_s16_f16:
case NEON::BI__builtin_neon_vcvtq_u16_f16:
case NEON::BI__builtin_neon_vcvta_s16_f16:
case NEON::BI__builtin_neon_vcvta_u16_f16:
case NEON::BI__builtin_neon_vcvta_s32_v:
case NEON::BI__builtin_neon_vcvtaq_s16_f16:
case NEON::BI__builtin_neon_vcvtaq_s32_v:
case NEON::BI__builtin_neon_vcvta_u32_v:
case NEON::BI__builtin_neon_vcvtaq_u16_f16:
case NEON::BI__builtin_neon_vcvtaq_u32_v:
case NEON::BI__builtin_neon_vcvta_s64_v:
case NEON::BI__builtin_neon_vcvtaq_s64_v:
case NEON::BI__builtin_neon_vcvta_u64_v:
case NEON::BI__builtin_neon_vcvtaq_u64_v:
case NEON::BI__builtin_neon_vcvtm_s16_f16:
case NEON::BI__builtin_neon_vcvtm_s32_v:
case NEON::BI__builtin_neon_vcvtmq_s16_f16:
case NEON::BI__builtin_neon_vcvtmq_s32_v:
case NEON::BI__builtin_neon_vcvtm_u16_f16:
case NEON::BI__builtin_neon_vcvtm_u32_v:
case NEON::BI__builtin_neon_vcvtmq_u16_f16:
case NEON::BI__builtin_neon_vcvtmq_u32_v:
case NEON::BI__builtin_neon_vcvtm_s64_v:
case NEON::BI__builtin_neon_vcvtmq_s64_v:
case NEON::BI__builtin_neon_vcvtm_u64_v:
case NEON::BI__builtin_neon_vcvtmq_u64_v:
case NEON::BI__builtin_neon_vcvtn_s16_f16:
case NEON::BI__builtin_neon_vcvtn_s32_v:
case NEON::BI__builtin_neon_vcvtnq_s16_f16:
case NEON::BI__builtin_neon_vcvtnq_s32_v:
case NEON::BI__builtin_neon_vcvtn_u16_f16:
case NEON::BI__builtin_neon_vcvtn_u32_v:
case NEON::BI__builtin_neon_vcvtnq_u16_f16:
case NEON::BI__builtin_neon_vcvtnq_u32_v:
case NEON::BI__builtin_neon_vcvtn_s64_v:
case NEON::BI__builtin_neon_vcvtnq_s64_v:
case NEON::BI__builtin_neon_vcvtn_u64_v:
case NEON::BI__builtin_neon_vcvtnq_u64_v:
case NEON::BI__builtin_neon_vcvtp_s16_f16:
case NEON::BI__builtin_neon_vcvtp_s32_v:
case NEON::BI__builtin_neon_vcvtpq_s16_f16:
case NEON::BI__builtin_neon_vcvtpq_s32_v:
case NEON::BI__builtin_neon_vcvtp_u16_f16:
case NEON::BI__builtin_neon_vcvtp_u32_v:
case NEON::BI__builtin_neon_vcvtpq_u16_f16:
case NEON::BI__builtin_neon_vcvtpq_u32_v:
case NEON::BI__builtin_neon_vcvtp_s64_v:
case NEON::BI__builtin_neon_vcvtpq_s64_v:
case NEON::BI__builtin_neon_vcvtp_u64_v:
case NEON::BI__builtin_neon_vcvtpq_u64_v:
case NEON::BI__builtin_neon_vmulx_v:
case NEON::BI__builtin_neon_vmulxq_v:
case NEON::BI__builtin_neon_vmulxh_lane_f16:
case NEON::BI__builtin_neon_vmulxh_laneq_f16:
case NEON::BI__builtin_neon_vmul_lane_v:
case NEON::BI__builtin_neon_vmul_laneq_v:
case NEON::BI__builtin_neon_vnegd_s64:
case NEON::BI__builtin_neon_vnegh_f16:
case NEON::BI__builtin_neon_vpmaxnm_v:
case NEON::BI__builtin_neon_vpmaxnmq_v:
case NEON::BI__builtin_neon_vpminnm_v:
case NEON::BI__builtin_neon_vpminnmq_v:
case NEON::BI__builtin_neon_vsqrth_f16:
case NEON::BI__builtin_neon_vsqrt_v:
case NEON::BI__builtin_neon_vsqrtq_v:
case NEON::BI__builtin_neon_vrbit_v:
case NEON::BI__builtin_neon_vrbitq_v:
case NEON::BI__builtin_neon_vmaxv_f16:
case NEON::BI__builtin_neon_vmaxvq_f16:
case NEON::BI__builtin_neon_vminv_f16:
case NEON::BI__builtin_neon_vminvq_f16:
case NEON::BI__builtin_neon_vmaxnmv_f16:
case NEON::BI__builtin_neon_vmaxnmvq_f16:
case NEON::BI__builtin_neon_vminnmv_f16:
case NEON::BI__builtin_neon_vminnmvq_f16:
case NEON::BI__builtin_neon_vmul_n_f64:
case NEON::BI__builtin_neon_vaddlv_u8:
case NEON::BI__builtin_neon_vaddlv_u16:
case NEON::BI__builtin_neon_vaddlvq_u8:
case NEON::BI__builtin_neon_vaddlvq_u16:
case NEON::BI__builtin_neon_vaddlv_s8:
case NEON::BI__builtin_neon_vaddlv_s16:
case NEON::BI__builtin_neon_vaddlvq_s8:
case NEON::BI__builtin_neon_vaddlvq_s16:
case NEON::BI__builtin_neon_vsri_n_v:
case NEON::BI__builtin_neon_vsriq_n_v:
case NEON::BI__builtin_neon_vsli_n_v:
case NEON::BI__builtin_neon_vsliq_n_v:
case NEON::BI__builtin_neon_vsra_n_v:
case NEON::BI__builtin_neon_vsraq_n_v:
case NEON::BI__builtin_neon_vrsra_n_v:
case NEON::BI__builtin_neon_vrsraq_n_v:
case NEON::BI__builtin_neon_vld1_v:
case NEON::BI__builtin_neon_vld1q_v:
case NEON::BI__builtin_neon_vst1_v:
case NEON::BI__builtin_neon_vst1q_v:
case NEON::BI__builtin_neon_vld1_lane_v:
case NEON::BI__builtin_neon_vld1q_lane_v:
case NEON::BI__builtin_neon_vldap1_lane_s64:
case NEON::BI__builtin_neon_vldap1q_lane_s64:
case NEON::BI__builtin_neon_vld1_dup_v:
case NEON::BI__builtin_neon_vld1q_dup_v:
case NEON::BI__builtin_neon_vst1_lane_v:
case NEON::BI__builtin_neon_vst1q_lane_v:
case NEON::BI__builtin_neon_vstl1_lane_s64:
case NEON::BI__builtin_neon_vstl1q_lane_s64:
case NEON::BI__builtin_neon_vld2_v:
case NEON::BI__builtin_neon_vld2q_v:
case NEON::BI__builtin_neon_vld3_v:
case NEON::BI__builtin_neon_vld3q_v:
case NEON::BI__builtin_neon_vld4_v:
case NEON::BI__builtin_neon_vld4q_v:
case NEON::BI__builtin_neon_vld2_dup_v:
case NEON::BI__builtin_neon_vld2q_dup_v:
case NEON::BI__builtin_neon_vld3_dup_v:
case NEON::BI__builtin_neon_vld3q_dup_v:
case NEON::BI__builtin_neon_vld4_dup_v:
case NEON::BI__builtin_neon_vld4q_dup_v:
case NEON::BI__builtin_neon_vld2_lane_v:
case NEON::BI__builtin_neon_vld2q_lane_v:
case NEON::BI__builtin_neon_vld3_lane_v:
case NEON::BI__builtin_neon_vld3q_lane_v:
case NEON::BI__builtin_neon_vld4_lane_v:
case NEON::BI__builtin_neon_vld4q_lane_v:
case NEON::BI__builtin_neon_vst2_v:
case NEON::BI__builtin_neon_vst2q_v:
case NEON::BI__builtin_neon_vst2_lane_v:
case NEON::BI__builtin_neon_vst2q_lane_v:
case NEON::BI__builtin_neon_vst3_v:
case NEON::BI__builtin_neon_vst3q_v:
case NEON::BI__builtin_neon_vst3_lane_v:
case NEON::BI__builtin_neon_vst3q_lane_v:
case NEON::BI__builtin_neon_vst4_v:
case NEON::BI__builtin_neon_vst4q_v:
case NEON::BI__builtin_neon_vst4_lane_v:
case NEON::BI__builtin_neon_vst4q_lane_v:
case NEON::BI__builtin_neon_vtrn_v:
case NEON::BI__builtin_neon_vtrnq_v:
case NEON::BI__builtin_neon_vuzp_v:
case NEON::BI__builtin_neon_vuzpq_v:
case NEON::BI__builtin_neon_vzip_v:
case NEON::BI__builtin_neon_vzipq_v:
case NEON::BI__builtin_neon_vqtbl1q_v:
case NEON::BI__builtin_neon_vqtbl2q_v:
case NEON::BI__builtin_neon_vqtbl3q_v:
case NEON::BI__builtin_neon_vqtbl4q_v:
case NEON::BI__builtin_neon_vqtbx1q_v:
case NEON::BI__builtin_neon_vqtbx2q_v:
case NEON::BI__builtin_neon_vqtbx3q_v:
case NEON::BI__builtin_neon_vqtbx4q_v:
case NEON::BI__builtin_neon_vsqadd_v:
case NEON::BI__builtin_neon_vsqaddq_v:
case NEON::BI__builtin_neon_vuqadd_v:
case NEON::BI__builtin_neon_vuqaddq_v:
case NEON::BI__builtin_neon_vluti2_laneq_mf8:
case NEON::BI__builtin_neon_vluti2_laneq_bf16:
case NEON::BI__builtin_neon_vluti2_laneq_f16:
case NEON::BI__builtin_neon_vluti2_laneq_p16:
case NEON::BI__builtin_neon_vluti2_laneq_p8:
case NEON::BI__builtin_neon_vluti2_laneq_s16:
case NEON::BI__builtin_neon_vluti2_laneq_s8:
case NEON::BI__builtin_neon_vluti2_laneq_u16:
case NEON::BI__builtin_neon_vluti2_laneq_u8:
case NEON::BI__builtin_neon_vluti2q_laneq_mf8:
case NEON::BI__builtin_neon_vluti2q_laneq_bf16:
case NEON::BI__builtin_neon_vluti2q_laneq_f16:
case NEON::BI__builtin_neon_vluti2q_laneq_p16:
case NEON::BI__builtin_neon_vluti2q_laneq_p8:
case NEON::BI__builtin_neon_vluti2q_laneq_s16:
case NEON::BI__builtin_neon_vluti2q_laneq_s8:
case NEON::BI__builtin_neon_vluti2q_laneq_u16:
case NEON::BI__builtin_neon_vluti2q_laneq_u8:
case NEON::BI__builtin_neon_vluti2_lane_mf8:
case NEON::BI__builtin_neon_vluti2_lane_bf16:
case NEON::BI__builtin_neon_vluti2_lane_f16:
case NEON::BI__builtin_neon_vluti2_lane_p16:
case NEON::BI__builtin_neon_vluti2_lane_p8:
case NEON::BI__builtin_neon_vluti2_lane_s16:
case NEON::BI__builtin_neon_vluti2_lane_s8:
case NEON::BI__builtin_neon_vluti2_lane_u16:
case NEON::BI__builtin_neon_vluti2_lane_u8:
case NEON::BI__builtin_neon_vluti2q_lane_mf8:
case NEON::BI__builtin_neon_vluti2q_lane_bf16:
case NEON::BI__builtin_neon_vluti2q_lane_f16:
case NEON::BI__builtin_neon_vluti2q_lane_p16:
case NEON::BI__builtin_neon_vluti2q_lane_p8:
case NEON::BI__builtin_neon_vluti2q_lane_s16:
case NEON::BI__builtin_neon_vluti2q_lane_s8:
case NEON::BI__builtin_neon_vluti2q_lane_u16:
case NEON::BI__builtin_neon_vluti2q_lane_u8:
case NEON::BI__builtin_neon_vluti4q_lane_mf8:
case NEON::BI__builtin_neon_vluti4q_lane_p8:
case NEON::BI__builtin_neon_vluti4q_lane_s8:
case NEON::BI__builtin_neon_vluti4q_lane_u8:
case NEON::BI__builtin_neon_vluti4q_laneq_mf8:
case NEON::BI__builtin_neon_vluti4q_laneq_p8:
case NEON::BI__builtin_neon_vluti4q_laneq_s8:
case NEON::BI__builtin_neon_vluti4q_laneq_u8:
case NEON::BI__builtin_neon_vluti4q_lane_bf16_x2:
case NEON::BI__builtin_neon_vluti4q_lane_f16_x2:
case NEON::BI__builtin_neon_vluti4q_lane_p16_x2:
case NEON::BI__builtin_neon_vluti4q_lane_s16_x2:
case NEON::BI__builtin_neon_vluti4q_lane_u16_x2:
case NEON::BI__builtin_neon_vluti4q_laneq_bf16_x2:
case NEON::BI__builtin_neon_vluti4q_laneq_f16_x2:
case NEON::BI__builtin_neon_vluti4q_laneq_p16_x2:
case NEON::BI__builtin_neon_vluti4q_laneq_s16_x2:
case NEON::BI__builtin_neon_vluti4q_laneq_u16_x2:
case NEON::BI__builtin_neon_vmmlaq_f16_mf8_fpm:
case NEON::BI__builtin_neon_vmmlaq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vcvt1_low_bf16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt1_bf16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt1_high_bf16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt2_low_bf16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt2_bf16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt2_high_bf16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt1_low_f16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt1_f16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt1_high_f16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt2_low_f16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt2_f16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt2_high_f16_mf8_fpm:
case NEON::BI__builtin_neon_vcvt_mf8_f32_fpm:
case NEON::BI__builtin_neon_vcvt_mf8_f16_fpm:
case NEON::BI__builtin_neon_vcvtq_mf8_f16_fpm:
case NEON::BI__builtin_neon_vcvt_high_mf8_f32_fpm:
case NEON::BI__builtin_neon_vdot_f16_mf8_fpm:
case NEON::BI__builtin_neon_vdotq_f16_mf8_fpm:
case NEON::BI__builtin_neon_vdot_lane_f16_mf8_fpm:
case NEON::BI__builtin_neon_vdotq_lane_f16_mf8_fpm:
case NEON::BI__builtin_neon_vdot_laneq_f16_mf8_fpm:
case NEON::BI__builtin_neon_vdotq_laneq_f16_mf8_fpm:
case NEON::BI__builtin_neon_vdot_f32_mf8_fpm:
case NEON::BI__builtin_neon_vdotq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vdot_lane_f32_mf8_fpm:
case NEON::BI__builtin_neon_vdotq_lane_f32_mf8_fpm:
case NEON::BI__builtin_neon_vdot_laneq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vdotq_laneq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlalbq_f16_mf8_fpm:
case NEON::BI__builtin_neon_vmlaltq_f16_mf8_fpm:
case NEON::BI__builtin_neon_vmlallbbq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlallbtq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlalltbq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlallttq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlalbq_lane_f16_mf8_fpm:
case NEON::BI__builtin_neon_vmlalbq_laneq_f16_mf8_fpm:
case NEON::BI__builtin_neon_vmlaltq_lane_f16_mf8_fpm:
case NEON::BI__builtin_neon_vmlaltq_laneq_f16_mf8_fpm:
case NEON::BI__builtin_neon_vmlallbbq_lane_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlallbbq_laneq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlallbtq_lane_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlallbtq_laneq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlalltbq_lane_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlalltbq_laneq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlallttq_lane_f32_mf8_fpm:
case NEON::BI__builtin_neon_vmlallttq_laneq_f32_mf8_fpm:
case NEON::BI__builtin_neon_vamin_f16:
case NEON::BI__builtin_neon_vaminq_f16:
case NEON::BI__builtin_neon_vamin_f32:
case NEON::BI__builtin_neon_vaminq_f32:
case NEON::BI__builtin_neon_vaminq_f64:
case NEON::BI__builtin_neon_vamax_f16:
case NEON::BI__builtin_neon_vamaxq_f16:
case NEON::BI__builtin_neon_vamax_f32:
case NEON::BI__builtin_neon_vamaxq_f32:
case NEON::BI__builtin_neon_vamaxq_f64:
case NEON::BI__builtin_neon_vscale_f16:
case NEON::BI__builtin_neon_vscaleq_f16:
case NEON::BI__builtin_neon_vscale_f32:
case NEON::BI__builtin_neon_vscaleq_f32:
case NEON::BI__builtin_neon_vscaleq_f64:
cgm.errorNYI(expr->getSourceRange(),
std::string("unimplemented AArch64 builtin call: ") +
getContext().BuiltinInfo.getName(builtinID));
return mlir::Value{};
}
// Unreachable: All cases in the switch above return.
}