| //===-- MipsSEISelDAGToDAG.cpp - A Dag to Dag Inst Selector for MipsSE ----===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // Subclass of MipsDAGToDAGISel specialized for mips32/64. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "MipsSEISelDAGToDAG.h" |
| #include "MCTargetDesc/MipsBaseInfo.h" |
| #include "Mips.h" |
| #include "MipsAnalyzeImmediate.h" |
| #include "MipsMachineFunction.h" |
| #include "MipsRegisterInfo.h" |
| #include "llvm/CodeGen/MachineConstantPool.h" |
| #include "llvm/CodeGen/MachineFrameInfo.h" |
| #include "llvm/CodeGen/MachineFunction.h" |
| #include "llvm/CodeGen/MachineInstrBuilder.h" |
| #include "llvm/CodeGen/MachineRegisterInfo.h" |
| #include "llvm/CodeGen/SelectionDAGNodes.h" |
| #include "llvm/IR/CFG.h" |
| #include "llvm/IR/Dominators.h" |
| #include "llvm/IR/GlobalValue.h" |
| #include "llvm/IR/Instructions.h" |
| #include "llvm/IR/Intrinsics.h" |
| #include "llvm/IR/IntrinsicsMips.h" |
| #include "llvm/IR/Type.h" |
| #include "llvm/Support/Debug.h" |
| #include "llvm/Support/ErrorHandling.h" |
| #include "llvm/Support/raw_ostream.h" |
| #include "llvm/Target/TargetMachine.h" |
| using namespace llvm; |
| |
| #define DEBUG_TYPE "mips-isel" |
| |
| bool MipsSEDAGToDAGISel::runOnMachineFunction(MachineFunction &MF) { |
| Subtarget = &static_cast<const MipsSubtarget &>(MF.getSubtarget()); |
| if (Subtarget->inMips16Mode()) |
| return false; |
| return MipsDAGToDAGISel::runOnMachineFunction(MF); |
| } |
| |
| void MipsSEDAGToDAGISel::getAnalysisUsage(AnalysisUsage &AU) const { |
| AU.addRequired<DominatorTreeWrapperPass>(); |
| SelectionDAGISel::getAnalysisUsage(AU); |
| } |
| |
| void MipsSEDAGToDAGISel::addDSPCtrlRegOperands(bool IsDef, MachineInstr &MI, |
| MachineFunction &MF) { |
| MachineInstrBuilder MIB(MF, &MI); |
| unsigned Mask = MI.getOperand(1).getImm(); |
| unsigned Flag = |
| IsDef ? RegState::ImplicitDefine : RegState::Implicit | RegState::Undef; |
| |
| if (Mask & 1) |
| MIB.addReg(Mips::DSPPos, Flag); |
| |
| if (Mask & 2) |
| MIB.addReg(Mips::DSPSCount, Flag); |
| |
| if (Mask & 4) |
| MIB.addReg(Mips::DSPCarry, Flag); |
| |
| if (Mask & 8) |
| MIB.addReg(Mips::DSPOutFlag, Flag); |
| |
| if (Mask & 16) |
| MIB.addReg(Mips::DSPCCond, Flag); |
| |
| if (Mask & 32) |
| MIB.addReg(Mips::DSPEFI, Flag); |
| } |
| |
| unsigned MipsSEDAGToDAGISel::getMSACtrlReg(const SDValue RegIdx) const { |
| uint64_t RegNum = cast<ConstantSDNode>(RegIdx)->getZExtValue(); |
| return Mips::MSACtrlRegClass.getRegister(RegNum); |
| } |
| |
| bool MipsSEDAGToDAGISel::replaceUsesWithZeroReg(MachineRegisterInfo *MRI, |
| const MachineInstr& MI) { |
| unsigned DstReg = 0, ZeroReg = 0; |
| |
| // Check if MI is "addiu $dst, $zero, 0" or "daddiu $dst, $zero, 0". |
| if ((MI.getOpcode() == Mips::ADDiu) && |
| (MI.getOperand(1).getReg() == Mips::ZERO) && |
| (MI.getOperand(2).isImm()) && |
| (MI.getOperand(2).getImm() == 0)) { |
| DstReg = MI.getOperand(0).getReg(); |
| ZeroReg = Mips::ZERO; |
| } else if ((MI.getOpcode() == Mips::DADDiu) && |
| (MI.getOperand(1).getReg() == Mips::ZERO_64) && |
| (MI.getOperand(2).isImm()) && |
| (MI.getOperand(2).getImm() == 0)) { |
| DstReg = MI.getOperand(0).getReg(); |
| ZeroReg = Mips::ZERO_64; |
| } |
| |
| if (!DstReg) |
| return false; |
| |
| // Replace uses with ZeroReg. |
| for (MachineRegisterInfo::use_iterator U = MRI->use_begin(DstReg), |
| E = MRI->use_end(); U != E;) { |
| MachineOperand &MO = *U; |
| unsigned OpNo = U.getOperandNo(); |
| MachineInstr *MI = MO.getParent(); |
| ++U; |
| |
| // Do not replace if it is a phi's operand or is tied to def operand. |
| if (MI->isPHI() || MI->isRegTiedToDefOperand(OpNo) || MI->isPseudo()) |
| continue; |
| |
| // Also, we have to check that the register class of the operand |
| // contains the zero register. |
| if (!MRI->getRegClass(MO.getReg())->contains(ZeroReg)) |
| continue; |
| |
| MO.setReg(ZeroReg); |
| } |
| |
| return true; |
| } |
| |
| void MipsSEDAGToDAGISel::emitMCountABI(MachineInstr &MI, MachineBasicBlock &MBB, |
| MachineFunction &MF) { |
| MachineInstrBuilder MIB(MF, &MI); |
| if (!Subtarget->isABI_O32()) { // N32, N64 |
| // Save current return address. |
| BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::OR64)) |
| .addDef(Mips::AT_64) |
| .addUse(Mips::RA_64, RegState::Undef) |
| .addUse(Mips::ZERO_64); |
| // Stops instruction above from being removed later on. |
| MIB.addUse(Mips::AT_64, RegState::Implicit); |
| } else { // O32 |
| // Save current return address. |
| BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::OR)) |
| .addDef(Mips::AT) |
| .addUse(Mips::RA, RegState::Undef) |
| .addUse(Mips::ZERO); |
| // _mcount pops 2 words from stack. |
| BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::ADDiu)) |
| .addDef(Mips::SP) |
| .addUse(Mips::SP) |
| .addImm(-8); |
| // Stops first instruction above from being removed later on. |
| MIB.addUse(Mips::AT, RegState::Implicit); |
| } |
| } |
| |
| void MipsSEDAGToDAGISel::processFunctionAfterISel(MachineFunction &MF) { |
| MF.getInfo<MipsFunctionInfo>()->initGlobalBaseReg(MF); |
| |
| MachineRegisterInfo *MRI = &MF.getRegInfo(); |
| |
| for (auto &MBB: MF) { |
| for (auto &MI: MBB) { |
| switch (MI.getOpcode()) { |
| case Mips::RDDSP: |
| addDSPCtrlRegOperands(false, MI, MF); |
| break; |
| case Mips::WRDSP: |
| addDSPCtrlRegOperands(true, MI, MF); |
| break; |
| case Mips::BuildPairF64_64: |
| case Mips::ExtractElementF64_64: |
| if (!Subtarget->useOddSPReg()) { |
| MI.addOperand(MachineOperand::CreateReg(Mips::SP, false, true)); |
| break; |
| } |
| LLVM_FALLTHROUGH; |
| case Mips::BuildPairF64: |
| case Mips::ExtractElementF64: |
| if (Subtarget->isABI_FPXX() && !Subtarget->hasMTHC1()) |
| MI.addOperand(MachineOperand::CreateReg(Mips::SP, false, true)); |
| break; |
| case Mips::JAL: |
| case Mips::JAL_MM: |
| if (MI.getOperand(0).isGlobal() && |
| MI.getOperand(0).getGlobal()->getGlobalIdentifier() == "_mcount") |
| emitMCountABI(MI, MBB, MF); |
| break; |
| case Mips::JALRPseudo: |
| case Mips::JALR64Pseudo: |
| case Mips::JALR16_MM: |
| if (MI.getOperand(2).isMCSymbol() && |
| MI.getOperand(2).getMCSymbol()->getName() == "_mcount") |
| emitMCountABI(MI, MBB, MF); |
| break; |
| case Mips::JALR: |
| if (MI.getOperand(3).isMCSymbol() && |
| MI.getOperand(3).getMCSymbol()->getName() == "_mcount") |
| emitMCountABI(MI, MBB, MF); |
| break; |
| default: |
| replaceUsesWithZeroReg(MRI, MI); |
| } |
| } |
| } |
| } |
| |
| void MipsSEDAGToDAGISel::selectAddE(SDNode *Node, const SDLoc &DL) const { |
| SDValue InFlag = Node->getOperand(2); |
| unsigned Opc = InFlag.getOpcode(); |
| SDValue LHS = Node->getOperand(0), RHS = Node->getOperand(1); |
| EVT VT = LHS.getValueType(); |
| |
| // In the base case, we can rely on the carry bit from the addsc |
| // instruction. |
| if (Opc == ISD::ADDC) { |
| SDValue Ops[3] = {LHS, RHS, InFlag}; |
| CurDAG->SelectNodeTo(Node, Mips::ADDWC, VT, MVT::Glue, Ops); |
| return; |
| } |
| |
| assert(Opc == ISD::ADDE && "ISD::ADDE not in a chain of ADDE nodes!"); |
| |
| // The more complex case is when there is a chain of ISD::ADDE nodes like: |
| // (adde (adde (adde (addc a b) c) d) e). |
| // |
| // The addwc instruction does not write to the carry bit, instead it writes |
| // to bit 20 of the dsp control register. To match this series of nodes, each |
| // intermediate adde node must be expanded to write the carry bit before the |
| // addition. |
| |
| // Start by reading the overflow field for addsc and moving the value to the |
| // carry field. The usage of 1 here with MipsISD::RDDSP / Mips::WRDSP |
| // corresponds to reading/writing the entire control register to/from a GPR. |
| |
| SDValue CstOne = CurDAG->getTargetConstant(1, DL, MVT::i32); |
| |
| SDValue OuFlag = CurDAG->getTargetConstant(20, DL, MVT::i32); |
| |
| SDNode *DSPCtrlField = CurDAG->getMachineNode(Mips::RDDSP, DL, MVT::i32, |
| MVT::Glue, CstOne, InFlag); |
| |
| SDNode *Carry = CurDAG->getMachineNode( |
| Mips::EXT, DL, MVT::i32, SDValue(DSPCtrlField, 0), OuFlag, CstOne); |
| |
| SDValue Ops[4] = {SDValue(DSPCtrlField, 0), |
| CurDAG->getTargetConstant(6, DL, MVT::i32), CstOne, |
| SDValue(Carry, 0)}; |
| SDNode *DSPCFWithCarry = CurDAG->getMachineNode(Mips::INS, DL, MVT::i32, Ops); |
| |
| // My reading of the MIPS DSP 3.01 specification isn't as clear as I |
| // would like about whether bit 20 always gets overwritten by addwc. |
| // Hence take an extremely conservative view and presume it's sticky. We |
| // therefore need to clear it. |
| |
| SDValue Zero = CurDAG->getRegister(Mips::ZERO, MVT::i32); |
| |
| SDValue InsOps[4] = {Zero, OuFlag, CstOne, SDValue(DSPCFWithCarry, 0)}; |
| SDNode *DSPCtrlFinal = |
| CurDAG->getMachineNode(Mips::INS, DL, MVT::i32, InsOps); |
| |
| SDNode *WrDSP = CurDAG->getMachineNode(Mips::WRDSP, DL, MVT::Glue, |
| SDValue(DSPCtrlFinal, 0), CstOne); |
| |
| SDValue Operands[3] = {LHS, RHS, SDValue(WrDSP, 0)}; |
| CurDAG->SelectNodeTo(Node, Mips::ADDWC, VT, MVT::Glue, Operands); |
| } |
| |
| /// Match frameindex |
| bool MipsSEDAGToDAGISel::selectAddrFrameIndex(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (FrameIndexSDNode *FIN = dyn_cast<FrameIndexSDNode>(Addr)) { |
| EVT ValTy = Addr.getValueType(); |
| |
| Base = CurDAG->getTargetFrameIndex(FIN->getIndex(), ValTy); |
| Offset = CurDAG->getTargetConstant(0, SDLoc(Addr), ValTy); |
| return true; |
| } |
| return false; |
| } |
| |
| /// Match frameindex+offset and frameindex|offset |
| bool MipsSEDAGToDAGISel::selectAddrFrameIndexOffset( |
| SDValue Addr, SDValue &Base, SDValue &Offset, unsigned OffsetBits, |
| unsigned ShiftAmount = 0) const { |
| if (CurDAG->isBaseWithConstantOffset(Addr)) { |
| ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Addr.getOperand(1)); |
| if (isIntN(OffsetBits + ShiftAmount, CN->getSExtValue())) { |
| EVT ValTy = Addr.getValueType(); |
| |
| // If the first operand is a FI, get the TargetFI Node |
| if (FrameIndexSDNode *FIN = |
| dyn_cast<FrameIndexSDNode>(Addr.getOperand(0))) |
| Base = CurDAG->getTargetFrameIndex(FIN->getIndex(), ValTy); |
| else { |
| Base = Addr.getOperand(0); |
| // If base is a FI, additional offset calculation is done in |
| // eliminateFrameIndex, otherwise we need to check the alignment |
| const Align Alignment(1ULL << ShiftAmount); |
| if (!isAligned(Alignment, CN->getZExtValue())) |
| return false; |
| } |
| |
| Offset = CurDAG->getTargetConstant(CN->getZExtValue(), SDLoc(Addr), |
| ValTy); |
| return true; |
| } |
| } |
| return false; |
| } |
| |
| /// ComplexPattern used on MipsInstrInfo |
| /// Used on Mips Load/Store instructions |
| bool MipsSEDAGToDAGISel::selectAddrRegImm(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| // if Address is FI, get the TargetFrameIndex. |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| // on PIC code Load GA |
| if (Addr.getOpcode() == MipsISD::Wrapper) { |
| Base = Addr.getOperand(0); |
| Offset = Addr.getOperand(1); |
| return true; |
| } |
| |
| if (!TM.isPositionIndependent()) { |
| if ((Addr.getOpcode() == ISD::TargetExternalSymbol || |
| Addr.getOpcode() == ISD::TargetGlobalAddress)) |
| return false; |
| } |
| |
| // Addresses of the form FI+const or FI|const |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 16)) |
| return true; |
| |
| // Operand is a result from an ADD. |
| if (Addr.getOpcode() == ISD::ADD) { |
| // When loading from constant pools, load the lower address part in |
| // the instruction itself. Example, instead of: |
| // lui $2, %hi($CPI1_0) |
| // addiu $2, $2, %lo($CPI1_0) |
| // lwc1 $f0, 0($2) |
| // Generate: |
| // lui $2, %hi($CPI1_0) |
| // lwc1 $f0, %lo($CPI1_0)($2) |
| if (Addr.getOperand(1).getOpcode() == MipsISD::Lo || |
| Addr.getOperand(1).getOpcode() == MipsISD::GPRel) { |
| SDValue Opnd0 = Addr.getOperand(1).getOperand(0); |
| if (isa<ConstantPoolSDNode>(Opnd0) || isa<GlobalAddressSDNode>(Opnd0) || |
| isa<JumpTableSDNode>(Opnd0)) { |
| Base = Addr.getOperand(0); |
| Offset = Opnd0; |
| return true; |
| } |
| } |
| } |
| |
| return false; |
| } |
| |
| /// ComplexPattern used on MipsInstrInfo |
| /// Used on Mips Load/Store instructions |
| bool MipsSEDAGToDAGISel::selectAddrDefault(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| Base = Addr; |
| Offset = CurDAG->getTargetConstant(0, SDLoc(Addr), Addr.getValueType()); |
| return true; |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddr(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| return selectAddrRegImm(Addr, Base, Offset) || |
| selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| bool MipsSEDAGToDAGISel::selectAddrRegImm9(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 9)) |
| return true; |
| |
| return false; |
| } |
| |
| /// Used on microMIPS LWC2, LDC2, SWC2 and SDC2 instructions (11-bit offset) |
| bool MipsSEDAGToDAGISel::selectAddrRegImm11(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 11)) |
| return true; |
| |
| return false; |
| } |
| |
| /// Used on microMIPS Load/Store unaligned instructions (12-bit offset) |
| bool MipsSEDAGToDAGISel::selectAddrRegImm12(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 12)) |
| return true; |
| |
| return false; |
| } |
| |
| bool MipsSEDAGToDAGISel::selectAddrRegImm16(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 16)) |
| return true; |
| |
| return false; |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddr11MM(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| return selectAddrRegImm11(Addr, Base, Offset) || |
| selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddr12MM(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| return selectAddrRegImm12(Addr, Base, Offset) || |
| selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddr16MM(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| return selectAddrRegImm16(Addr, Base, Offset) || |
| selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddrLSL2MM(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 7)) { |
| if (isa<FrameIndexSDNode>(Base)) |
| return false; |
| |
| if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Offset)) { |
| unsigned CnstOff = CN->getZExtValue(); |
| return (CnstOff == (CnstOff & 0x3c)); |
| } |
| |
| return false; |
| } |
| |
| // For all other cases where "lw" would be selected, don't select "lw16" |
| // because it would result in additional instructions to prepare operands. |
| if (selectAddrRegImm(Addr, Base, Offset)) |
| return false; |
| |
| return selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddrSImm10(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10)) |
| return true; |
| |
| return selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl1(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 1)) |
| return true; |
| |
| return selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl2(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 2)) |
| return true; |
| |
| return selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl3(SDValue Addr, SDValue &Base, |
| SDValue &Offset) const { |
| if (selectAddrFrameIndex(Addr, Base, Offset)) |
| return true; |
| |
| if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 3)) |
| return true; |
| |
| return selectAddrDefault(Addr, Base, Offset); |
| } |
| |
| // Select constant vector splats. |
| // |
| // Returns true and sets Imm if: |
| // * MSA is enabled |
| // * N is a ISD::BUILD_VECTOR representing a constant splat |
| bool MipsSEDAGToDAGISel::selectVSplat(SDNode *N, APInt &Imm, |
| unsigned MinSizeInBits) const { |
| if (!Subtarget->hasMSA()) |
| return false; |
| |
| BuildVectorSDNode *Node = dyn_cast<BuildVectorSDNode>(N); |
| |
| if (!Node) |
| return false; |
| |
| APInt SplatValue, SplatUndef; |
| unsigned SplatBitSize; |
| bool HasAnyUndefs; |
| |
| if (!Node->isConstantSplat(SplatValue, SplatUndef, SplatBitSize, HasAnyUndefs, |
| MinSizeInBits, !Subtarget->isLittle())) |
| return false; |
| |
| Imm = SplatValue; |
| |
| return true; |
| } |
| |
| // Select constant vector splats. |
| // |
| // In addition to the requirements of selectVSplat(), this function returns |
| // true and sets Imm if: |
| // * The splat value is the same width as the elements of the vector |
| // * The splat value fits in an integer with the specified signed-ness and |
| // width. |
| // |
| // This function looks through ISD::BITCAST nodes. |
| // TODO: This might not be appropriate for big-endian MSA since BITCAST is |
| // sometimes a shuffle in big-endian mode. |
| // |
| // It's worth noting that this function is not used as part of the selection |
| // of ldi.[bhwd] since it does not permit using the wrong-typed ldi.[bhwd] |
| // instruction to achieve the desired bit pattern. ldi.[bhwd] is selected in |
| // MipsSEDAGToDAGISel::selectNode. |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatCommon(SDValue N, SDValue &Imm, bool Signed, |
| unsigned ImmBitSize) const { |
| APInt ImmValue; |
| EVT EltTy = N->getValueType(0).getVectorElementType(); |
| |
| if (N->getOpcode() == ISD::BITCAST) |
| N = N->getOperand(0); |
| |
| if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) && |
| ImmValue.getBitWidth() == EltTy.getSizeInBits()) { |
| |
| if (( Signed && ImmValue.isSignedIntN(ImmBitSize)) || |
| (!Signed && ImmValue.isIntN(ImmBitSize))) { |
| Imm = CurDAG->getTargetConstant(ImmValue, SDLoc(N), EltTy); |
| return true; |
| } |
| } |
| |
| return false; |
| } |
| |
| // Select constant vector splats. |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatUimm1(SDValue N, SDValue &Imm) const { |
| return selectVSplatCommon(N, Imm, false, 1); |
| } |
| |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatUimm2(SDValue N, SDValue &Imm) const { |
| return selectVSplatCommon(N, Imm, false, 2); |
| } |
| |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatUimm3(SDValue N, SDValue &Imm) const { |
| return selectVSplatCommon(N, Imm, false, 3); |
| } |
| |
| // Select constant vector splats. |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatUimm4(SDValue N, SDValue &Imm) const { |
| return selectVSplatCommon(N, Imm, false, 4); |
| } |
| |
| // Select constant vector splats. |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatUimm5(SDValue N, SDValue &Imm) const { |
| return selectVSplatCommon(N, Imm, false, 5); |
| } |
| |
| // Select constant vector splats. |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatUimm6(SDValue N, SDValue &Imm) const { |
| return selectVSplatCommon(N, Imm, false, 6); |
| } |
| |
| // Select constant vector splats. |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatUimm8(SDValue N, SDValue &Imm) const { |
| return selectVSplatCommon(N, Imm, false, 8); |
| } |
| |
| // Select constant vector splats. |
| bool MipsSEDAGToDAGISel:: |
| selectVSplatSimm5(SDValue N, SDValue &Imm) const { |
| return selectVSplatCommon(N, Imm, true, 5); |
| } |
| |
| // Select constant vector splats whose value is a power of 2. |
| // |
| // In addition to the requirements of selectVSplat(), this function returns |
| // true and sets Imm if: |
| // * The splat value is the same width as the elements of the vector |
| // * The splat value is a power of two. |
| // |
| // This function looks through ISD::BITCAST nodes. |
| // TODO: This might not be appropriate for big-endian MSA since BITCAST is |
| // sometimes a shuffle in big-endian mode. |
| bool MipsSEDAGToDAGISel::selectVSplatUimmPow2(SDValue N, SDValue &Imm) const { |
| APInt ImmValue; |
| EVT EltTy = N->getValueType(0).getVectorElementType(); |
| |
| if (N->getOpcode() == ISD::BITCAST) |
| N = N->getOperand(0); |
| |
| if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) && |
| ImmValue.getBitWidth() == EltTy.getSizeInBits()) { |
| int32_t Log2 = ImmValue.exactLogBase2(); |
| |
| if (Log2 != -1) { |
| Imm = CurDAG->getTargetConstant(Log2, SDLoc(N), EltTy); |
| return true; |
| } |
| } |
| |
| return false; |
| } |
| |
| // Select constant vector splats whose value only has a consecutive sequence |
| // of left-most bits set (e.g. 0b11...1100...00). |
| // |
| // In addition to the requirements of selectVSplat(), this function returns |
| // true and sets Imm if: |
| // * The splat value is the same width as the elements of the vector |
| // * The splat value is a consecutive sequence of left-most bits. |
| // |
| // This function looks through ISD::BITCAST nodes. |
| // TODO: This might not be appropriate for big-endian MSA since BITCAST is |
| // sometimes a shuffle in big-endian mode. |
| bool MipsSEDAGToDAGISel::selectVSplatMaskL(SDValue N, SDValue &Imm) const { |
| APInt ImmValue; |
| EVT EltTy = N->getValueType(0).getVectorElementType(); |
| |
| if (N->getOpcode() == ISD::BITCAST) |
| N = N->getOperand(0); |
| |
| if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) && |
| ImmValue.getBitWidth() == EltTy.getSizeInBits()) { |
| // Extract the run of set bits starting with bit zero from the bitwise |
| // inverse of ImmValue, and test that the inverse of this is the same |
| // as the original value. |
| if (ImmValue == ~(~ImmValue & ~(~ImmValue + 1))) { |
| |
| Imm = CurDAG->getTargetConstant(ImmValue.countPopulation() - 1, SDLoc(N), |
| EltTy); |
| return true; |
| } |
| } |
| |
| return false; |
| } |
| |
| // Select constant vector splats whose value only has a consecutive sequence |
| // of right-most bits set (e.g. 0b00...0011...11). |
| // |
| // In addition to the requirements of selectVSplat(), this function returns |
| // true and sets Imm if: |
| // * The splat value is the same width as the elements of the vector |
| // * The splat value is a consecutive sequence of right-most bits. |
| // |
| // This function looks through ISD::BITCAST nodes. |
| // TODO: This might not be appropriate for big-endian MSA since BITCAST is |
| // sometimes a shuffle in big-endian mode. |
| bool MipsSEDAGToDAGISel::selectVSplatMaskR(SDValue N, SDValue &Imm) const { |
| APInt ImmValue; |
| EVT EltTy = N->getValueType(0).getVectorElementType(); |
| |
| if (N->getOpcode() == ISD::BITCAST) |
| N = N->getOperand(0); |
| |
| if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) && |
| ImmValue.getBitWidth() == EltTy.getSizeInBits()) { |
| // Extract the run of set bits starting with bit zero, and test that the |
| // result is the same as the original value |
| if (ImmValue == (ImmValue & ~(ImmValue + 1))) { |
| Imm = CurDAG->getTargetConstant(ImmValue.countPopulation() - 1, SDLoc(N), |
| EltTy); |
| return true; |
| } |
| } |
| |
| return false; |
| } |
| |
| bool MipsSEDAGToDAGISel::selectVSplatUimmInvPow2(SDValue N, |
| SDValue &Imm) const { |
| APInt ImmValue; |
| EVT EltTy = N->getValueType(0).getVectorElementType(); |
| |
| if (N->getOpcode() == ISD::BITCAST) |
| N = N->getOperand(0); |
| |
| if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) && |
| ImmValue.getBitWidth() == EltTy.getSizeInBits()) { |
| int32_t Log2 = (~ImmValue).exactLogBase2(); |
| |
| if (Log2 != -1) { |
| Imm = CurDAG->getTargetConstant(Log2, SDLoc(N), EltTy); |
| return true; |
| } |
| } |
| |
| return false; |
| } |
| |
| bool MipsSEDAGToDAGISel::trySelect(SDNode *Node) { |
| unsigned Opcode = Node->getOpcode(); |
| SDLoc DL(Node); |
| |
| /// |
| // Instruction Selection not handled by the auto-generated |
| // tablegen selection should be handled here. |
| /// |
| switch(Opcode) { |
| default: break; |
| |
| case Mips::PseudoD_SELECT_I: |
| case Mips::PseudoD_SELECT_I64: { |
| MVT VT = Subtarget->isGP64bit() ? MVT::i64 : MVT::i32; |
| SDValue cond = Node->getOperand(0); |
| SDValue Hi1 = Node->getOperand(1); |
| SDValue Lo1 = Node->getOperand(2); |
| SDValue Hi2 = Node->getOperand(3); |
| SDValue Lo2 = Node->getOperand(4); |
| |
| SDValue ops[] = {cond, Hi1, Lo1, Hi2, Lo2}; |
| EVT NodeTys[] = {VT, VT}; |
| ReplaceNode(Node, CurDAG->getMachineNode(Subtarget->isGP64bit() |
| ? Mips::PseudoD_SELECT_I64 |
| : Mips::PseudoD_SELECT_I, |
| DL, NodeTys, ops)); |
| return true; |
| } |
| |
| case ISD::ADDE: { |
| selectAddE(Node, DL); |
| return true; |
| } |
| |
| case ISD::ConstantFP: { |
| auto *CN = cast<ConstantFPSDNode>(Node); |
| if (Node->getValueType(0) == MVT::f64 && CN->isExactlyValue(+0.0)) { |
| if (Subtarget->isGP64bit()) { |
| SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL, |
| Mips::ZERO_64, MVT::i64); |
| ReplaceNode(Node, |
| CurDAG->getMachineNode(Mips::DMTC1, DL, MVT::f64, Zero)); |
| } else if (Subtarget->isFP64bit()) { |
| SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL, |
| Mips::ZERO, MVT::i32); |
| ReplaceNode(Node, CurDAG->getMachineNode(Mips::BuildPairF64_64, DL, |
| MVT::f64, Zero, Zero)); |
| } else { |
| SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL, |
| Mips::ZERO, MVT::i32); |
| ReplaceNode(Node, CurDAG->getMachineNode(Mips::BuildPairF64, DL, |
| MVT::f64, Zero, Zero)); |
| } |
| return true; |
| } |
| break; |
| } |
| |
| case ISD::Constant: { |
| auto *CN = cast<ConstantSDNode>(Node); |
| int64_t Imm = CN->getSExtValue(); |
| unsigned Size = CN->getValueSizeInBits(0); |
| |
| if (isInt<32>(Imm)) |
| break; |
| |
| MipsAnalyzeImmediate AnalyzeImm; |
| |
| const MipsAnalyzeImmediate::InstSeq &Seq = |
| AnalyzeImm.Analyze(Imm, Size, false); |
| |
| MipsAnalyzeImmediate::InstSeq::const_iterator Inst = Seq.begin(); |
| SDLoc DL(CN); |
| SDNode *RegOpnd; |
| SDValue ImmOpnd = CurDAG->getTargetConstant(SignExtend64<16>(Inst->ImmOpnd), |
| DL, MVT::i64); |
| |
| // The first instruction can be a LUi which is different from other |
| // instructions (ADDiu, ORI and SLL) in that it does not have a register |
| // operand. |
| if (Inst->Opc == Mips::LUi64) |
| RegOpnd = CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64, ImmOpnd); |
| else |
| RegOpnd = |
| CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64, |
| CurDAG->getRegister(Mips::ZERO_64, MVT::i64), |
| ImmOpnd); |
| |
| // The remaining instructions in the sequence are handled here. |
| for (++Inst; Inst != Seq.end(); ++Inst) { |
| ImmOpnd = CurDAG->getTargetConstant(SignExtend64<16>(Inst->ImmOpnd), DL, |
| MVT::i64); |
| RegOpnd = CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64, |
| SDValue(RegOpnd, 0), ImmOpnd); |
| } |
| |
| ReplaceNode(Node, RegOpnd); |
| return true; |
| } |
| |
| case ISD::INTRINSIC_W_CHAIN: { |
| const unsigned IntrinsicOpcode = |
| cast<ConstantSDNode>(Node->getOperand(1))->getZExtValue(); |
| switch (IntrinsicOpcode) { |
| default: |
| break; |
| |
| case Intrinsic::mips_cfcmsa: { |
| SDValue ChainIn = Node->getOperand(0); |
| SDValue RegIdx = Node->getOperand(2); |
| SDValue Reg = CurDAG->getCopyFromReg(ChainIn, DL, |
| getMSACtrlReg(RegIdx), MVT::i32); |
| ReplaceNode(Node, Reg.getNode()); |
| return true; |
| } |
| case Intrinsic::mips_ldr_d: |
| case Intrinsic::mips_ldr_w: { |
| unsigned Op = (IntrinsicOpcode == Intrinsic::mips_ldr_d) ? Mips::LDR_D |
| : Mips::LDR_W; |
| |
| SDLoc DL(Node); |
| assert(Node->getNumOperands() == 4 && "Unexpected number of operands."); |
| const SDValue &Chain = Node->getOperand(0); |
| const SDValue &Intrinsic = Node->getOperand(1); |
| const SDValue &Pointer = Node->getOperand(2); |
| const SDValue &Constant = Node->getOperand(3); |
| |
| assert(Chain.getValueType() == MVT::Other); |
| (void)Intrinsic; |
| assert(Intrinsic.getOpcode() == ISD::TargetConstant && |
| Constant.getOpcode() == ISD::Constant && |
| "Invalid instruction operand."); |
| |
| // Convert Constant to TargetConstant. |
| const ConstantInt *Val = |
| cast<ConstantSDNode>(Constant)->getConstantIntValue(); |
| SDValue Imm = |
| CurDAG->getTargetConstant(*Val, DL, Constant.getValueType()); |
| |
| SmallVector<SDValue, 3> Ops{Pointer, Imm, Chain}; |
| |
| assert(Node->getNumValues() == 2); |
| assert(Node->getValueType(0).is128BitVector()); |
| assert(Node->getValueType(1) == MVT::Other); |
| SmallVector<EVT, 2> ResTys{Node->getValueType(0), Node->getValueType(1)}; |
| |
| ReplaceNode(Node, CurDAG->getMachineNode(Op, DL, ResTys, Ops)); |
| |
| return true; |
| } |
| } |
| break; |
| } |
| |
| case ISD::INTRINSIC_WO_CHAIN: { |
| switch (cast<ConstantSDNode>(Node->getOperand(0))->getZExtValue()) { |
| default: |
| break; |
| |
| case Intrinsic::mips_move_v: |
| // Like an assignment but will always produce a move.v even if |
| // unnecessary. |
| ReplaceNode(Node, CurDAG->getMachineNode(Mips::MOVE_V, DL, |
| Node->getValueType(0), |
| Node->getOperand(1))); |
| return true; |
| } |
| break; |
| } |
| |
| case ISD::INTRINSIC_VOID: { |
| const unsigned IntrinsicOpcode = |
| cast<ConstantSDNode>(Node->getOperand(1))->getZExtValue(); |
| switch (IntrinsicOpcode) { |
| default: |
| break; |
| |
| case Intrinsic::mips_ctcmsa: { |
| SDValue ChainIn = Node->getOperand(0); |
| SDValue RegIdx = Node->getOperand(2); |
| SDValue Value = Node->getOperand(3); |
| SDValue ChainOut = CurDAG->getCopyToReg(ChainIn, DL, |
| getMSACtrlReg(RegIdx), Value); |
| ReplaceNode(Node, ChainOut.getNode()); |
| return true; |
| } |
| case Intrinsic::mips_str_d: |
| case Intrinsic::mips_str_w: { |
| unsigned Op = (IntrinsicOpcode == Intrinsic::mips_str_d) ? Mips::STR_D |
| : Mips::STR_W; |
| |
| SDLoc DL(Node); |
| assert(Node->getNumOperands() == 5 && "Unexpected number of operands."); |
| const SDValue &Chain = Node->getOperand(0); |
| const SDValue &Intrinsic = Node->getOperand(1); |
| const SDValue &Vec = Node->getOperand(2); |
| const SDValue &Pointer = Node->getOperand(3); |
| const SDValue &Constant = Node->getOperand(4); |
| |
| assert(Chain.getValueType() == MVT::Other); |
| (void)Intrinsic; |
| assert(Intrinsic.getOpcode() == ISD::TargetConstant && |
| Constant.getOpcode() == ISD::Constant && |
| "Invalid instruction operand."); |
| |
| // Convert Constant to TargetConstant. |
| const ConstantInt *Val = |
| cast<ConstantSDNode>(Constant)->getConstantIntValue(); |
| SDValue Imm = |
| CurDAG->getTargetConstant(*Val, DL, Constant.getValueType()); |
| |
| SmallVector<SDValue, 4> Ops{Vec, Pointer, Imm, Chain}; |
| |
| assert(Node->getNumValues() == 1); |
| assert(Node->getValueType(0) == MVT::Other); |
| SmallVector<EVT, 1> ResTys{Node->getValueType(0)}; |
| |
| ReplaceNode(Node, CurDAG->getMachineNode(Op, DL, ResTys, Ops)); |
| return true; |
| } |
| } |
| break; |
| } |
| |
| // Manually match MipsISD::Ins nodes to get the correct instruction. It has |
| // to be done in this fashion so that we respect the differences between |
| // dins and dinsm, as the difference is that the size operand has the range |
| // 0 < size <= 32 for dins while dinsm has the range 2 <= size <= 64 which |
| // means SelectionDAGISel would have to test all the operands at once to |
| // match the instruction. |
| case MipsISD::Ins: { |
| |
| // Validating the node operands. |
| if (Node->getValueType(0) != MVT::i32 && Node->getValueType(0) != MVT::i64) |
| return false; |
| |
| if (Node->getNumOperands() != 4) |
| return false; |
| |
| if (Node->getOperand(1)->getOpcode() != ISD::Constant || |
| Node->getOperand(2)->getOpcode() != ISD::Constant) |
| return false; |
| |
| MVT ResTy = Node->getSimpleValueType(0); |
| uint64_t Pos = Node->getConstantOperandVal(1); |
| uint64_t Size = Node->getConstantOperandVal(2); |
| |
| // Size has to be >0 for 'ins', 'dins' and 'dinsu'. |
| if (!Size) |
| return false; |
| |
| if (Pos + Size > 64) |
| return false; |
| |
| if (ResTy != MVT::i32 && ResTy != MVT::i64) |
| return false; |
| |
| unsigned Opcode = 0; |
| if (ResTy == MVT::i32) { |
| if (Pos + Size <= 32) |
| Opcode = Mips::INS; |
| } else { |
| if (Pos + Size <= 32) |
| Opcode = Mips::DINS; |
| else if (Pos < 32 && 1 < Size) |
| Opcode = Mips::DINSM; |
| else |
| Opcode = Mips::DINSU; |
| } |
| |
| if (Opcode) { |
| SDValue Ops[4] = { |
| Node->getOperand(0), CurDAG->getTargetConstant(Pos, DL, MVT::i32), |
| CurDAG->getTargetConstant(Size, DL, MVT::i32), Node->getOperand(3)}; |
| |
| ReplaceNode(Node, CurDAG->getMachineNode(Opcode, DL, ResTy, Ops)); |
| return true; |
| } |
| |
| return false; |
| } |
| |
| case MipsISD::ThreadPointer: { |
| EVT PtrVT = getTargetLowering()->getPointerTy(CurDAG->getDataLayout()); |
| unsigned RdhwrOpc, DestReg; |
| |
| if (PtrVT == MVT::i32) { |
| RdhwrOpc = Mips::RDHWR; |
| DestReg = Mips::V1; |
| } else { |
| RdhwrOpc = Mips::RDHWR64; |
| DestReg = Mips::V1_64; |
| } |
| |
| SDNode *Rdhwr = |
| CurDAG->getMachineNode(RdhwrOpc, DL, Node->getValueType(0), MVT::Glue, |
| CurDAG->getRegister(Mips::HWR29, MVT::i32), |
| CurDAG->getTargetConstant(0, DL, MVT::i32)); |
| SDValue Chain = CurDAG->getCopyToReg(CurDAG->getEntryNode(), DL, DestReg, |
| SDValue(Rdhwr, 0), SDValue(Rdhwr, 1)); |
| SDValue ResNode = CurDAG->getCopyFromReg(Chain, DL, DestReg, PtrVT, |
| Chain.getValue(1)); |
| ReplaceNode(Node, ResNode.getNode()); |
| return true; |
| } |
| |
| case ISD::BUILD_VECTOR: { |
| // Select appropriate ldi.[bhwd] instructions for constant splats of |
| // 128-bit when MSA is enabled. Fixup any register class mismatches that |
| // occur as a result. |
| // |
| // This allows the compiler to use a wider range of immediates than would |
| // otherwise be allowed. If, for example, v4i32 could only use ldi.h then |
| // it would not be possible to load { 0x01010101, 0x01010101, 0x01010101, |
| // 0x01010101 } without using a constant pool. This would be sub-optimal |
| // when // 'ldi.b wd, 1' is capable of producing that bit-pattern in the |
| // same set/ of registers. Similarly, ldi.h isn't capable of producing { |
| // 0x00000000, 0x00000001, 0x00000000, 0x00000001 } but 'ldi.d wd, 1' can. |
| |
| const MipsABIInfo &ABI = |
| static_cast<const MipsTargetMachine &>(TM).getABI(); |
| |
| BuildVectorSDNode *BVN = cast<BuildVectorSDNode>(Node); |
| APInt SplatValue, SplatUndef; |
| unsigned SplatBitSize; |
| bool HasAnyUndefs; |
| unsigned LdiOp; |
| EVT ResVecTy = BVN->getValueType(0); |
| EVT ViaVecTy; |
| |
| if (!Subtarget->hasMSA() || !BVN->getValueType(0).is128BitVector()) |
| return false; |
| |
| if (!BVN->isConstantSplat(SplatValue, SplatUndef, SplatBitSize, |
| HasAnyUndefs, 8, |
| !Subtarget->isLittle())) |
| return false; |
| |
| switch (SplatBitSize) { |
| default: |
| return false; |
| case 8: |
| LdiOp = Mips::LDI_B; |
| ViaVecTy = MVT::v16i8; |
| break; |
| case 16: |
| LdiOp = Mips::LDI_H; |
| ViaVecTy = MVT::v8i16; |
| break; |
| case 32: |
| LdiOp = Mips::LDI_W; |
| ViaVecTy = MVT::v4i32; |
| break; |
| case 64: |
| LdiOp = Mips::LDI_D; |
| ViaVecTy = MVT::v2i64; |
| break; |
| } |
| |
| SDNode *Res = nullptr; |
| |
| // If we have a signed 10 bit integer, we can splat it directly. |
| // |
| // If we have something bigger we can synthesize the value into a GPR and |
| // splat from there. |
| if (SplatValue.isSignedIntN(10)) { |
| SDValue Imm = CurDAG->getTargetConstant(SplatValue, DL, |
| ViaVecTy.getVectorElementType()); |
| |
| Res = CurDAG->getMachineNode(LdiOp, DL, ViaVecTy, Imm); |
| } else if (SplatValue.isSignedIntN(16) && |
| ((ABI.IsO32() && SplatBitSize < 64) || |
| (ABI.IsN32() || ABI.IsN64()))) { |
| // Only handle signed 16 bit values when the element size is GPR width. |
| // MIPS64 can handle all the cases but MIPS32 would need to handle |
| // negative cases specifically here. Instead, handle those cases as |
| // 64bit values. |
| |
| bool Is32BitSplat = ABI.IsO32() || SplatBitSize < 64; |
| const unsigned ADDiuOp = Is32BitSplat ? Mips::ADDiu : Mips::DADDiu; |
| const MVT SplatMVT = Is32BitSplat ? MVT::i32 : MVT::i64; |
| SDValue ZeroVal = CurDAG->getRegister( |
| Is32BitSplat ? Mips::ZERO : Mips::ZERO_64, SplatMVT); |
| |
| const unsigned FILLOp = |
| SplatBitSize == 16 |
| ? Mips::FILL_H |
| : (SplatBitSize == 32 ? Mips::FILL_W |
| : (SplatBitSize == 64 ? Mips::FILL_D : 0)); |
| |
| assert(FILLOp != 0 && "Unknown FILL Op for splat synthesis!"); |
| assert((!ABI.IsO32() || (FILLOp != Mips::FILL_D)) && |
| "Attempting to use fill.d on MIPS32!"); |
| |
| const unsigned Lo = SplatValue.getLoBits(16).getZExtValue(); |
| SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, SplatMVT); |
| |
| Res = CurDAG->getMachineNode(ADDiuOp, DL, SplatMVT, ZeroVal, LoVal); |
| Res = CurDAG->getMachineNode(FILLOp, DL, ViaVecTy, SDValue(Res, 0)); |
| |
| } else if (SplatValue.isSignedIntN(32) && SplatBitSize == 32) { |
| // Only handle the cases where the splat size agrees with the size |
| // of the SplatValue here. |
| const unsigned Lo = SplatValue.getLoBits(16).getZExtValue(); |
| const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue(); |
| SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32); |
| |
| SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32); |
| SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32); |
| |
| if (Hi) |
| Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal); |
| |
| if (Lo) |
| Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32, |
| Hi ? SDValue(Res, 0) : ZeroVal, LoVal); |
| |
| assert((Hi || Lo) && "Zero case reached 32 bit case splat synthesis!"); |
| Res = |
| CurDAG->getMachineNode(Mips::FILL_W, DL, MVT::v4i32, SDValue(Res, 0)); |
| |
| } else if (SplatValue.isSignedIntN(32) && SplatBitSize == 64 && |
| (ABI.IsN32() || ABI.IsN64())) { |
| // N32 and N64 can perform some tricks that O32 can't for signed 32 bit |
| // integers due to having 64bit registers. lui will cause the necessary |
| // zero/sign extension. |
| const unsigned Lo = SplatValue.getLoBits(16).getZExtValue(); |
| const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue(); |
| SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32); |
| |
| SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32); |
| SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32); |
| |
| if (Hi) |
| Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal); |
| |
| if (Lo) |
| Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32, |
| Hi ? SDValue(Res, 0) : ZeroVal, LoVal); |
| |
| Res = CurDAG->getMachineNode( |
| Mips::SUBREG_TO_REG, DL, MVT::i64, |
| CurDAG->getTargetConstant(((Hi >> 15) & 0x1), DL, MVT::i64), |
| SDValue(Res, 0), |
| CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64)); |
| |
| Res = |
| CurDAG->getMachineNode(Mips::FILL_D, DL, MVT::v2i64, SDValue(Res, 0)); |
| |
| } else if (SplatValue.isSignedIntN(64)) { |
| // If we have a 64 bit Splat value, we perform a similar sequence to the |
| // above: |
| // |
| // MIPS32: MIPS64: |
| // lui $res, %highest(val) lui $res, %highest(val) |
| // ori $res, $res, %higher(val) ori $res, $res, %higher(val) |
| // lui $res2, %hi(val) lui $res2, %hi(val) |
| // ori $res2, %res2, %lo(val) ori $res2, %res2, %lo(val) |
| // $res3 = fill $res2 dinsu $res, $res2, 0, 32 |
| // $res4 = insert.w $res3[1], $res fill.d $res |
| // splat.d $res4, 0 |
| // |
| // The ability to use dinsu is guaranteed as MSA requires MIPSR5. |
| // This saves having to materialize the value by shifts and ors. |
| // |
| // FIXME: Implement the preferred sequence for MIPS64R6: |
| // |
| // MIPS64R6: |
| // ori $res, $zero, %lo(val) |
| // daui $res, $res, %hi(val) |
| // dahi $res, $res, %higher(val) |
| // dati $res, $res, %highest(cal) |
| // fill.d $res |
| // |
| |
| const unsigned Lo = SplatValue.getLoBits(16).getZExtValue(); |
| const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue(); |
| const unsigned Higher = SplatValue.lshr(32).getLoBits(16).getZExtValue(); |
| const unsigned Highest = SplatValue.lshr(48).getLoBits(16).getZExtValue(); |
| |
| SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32); |
| SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32); |
| SDValue HigherVal = CurDAG->getTargetConstant(Higher, DL, MVT::i32); |
| SDValue HighestVal = CurDAG->getTargetConstant(Highest, DL, MVT::i32); |
| SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32); |
| |
| // Independent of whether we're targeting MIPS64 or not, the basic |
| // operations are the same. Also, directly use the $zero register if |
| // the 16 bit chunk is zero. |
| // |
| // For optimization purposes we always synthesize the splat value as |
| // an i32 value, then if we're targetting MIPS64, use SUBREG_TO_REG |
| // just before combining the values with dinsu to produce an i64. This |
| // enables SelectionDAG to aggressively share components of splat values |
| // where possible. |
| // |
| // FIXME: This is the general constant synthesis problem. This code |
| // should be factored out into a class shared between all the |
| // classes that need it. Specifically, for a splat size of 64 |
| // bits that's a negative number we can do better than LUi/ORi |
| // for the upper 32bits. |
| |
| if (Hi) |
| Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal); |
| |
| if (Lo) |
| Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32, |
| Hi ? SDValue(Res, 0) : ZeroVal, LoVal); |
| |
| SDNode *HiRes; |
| if (Highest) |
| HiRes = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HighestVal); |
| |
| if (Higher) |
| HiRes = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32, |
| Highest ? SDValue(HiRes, 0) : ZeroVal, |
| HigherVal); |
| |
| |
| if (ABI.IsO32()) { |
| Res = CurDAG->getMachineNode(Mips::FILL_W, DL, MVT::v4i32, |
| (Hi || Lo) ? SDValue(Res, 0) : ZeroVal); |
| |
| Res = CurDAG->getMachineNode( |
| Mips::INSERT_W, DL, MVT::v4i32, SDValue(Res, 0), |
| (Highest || Higher) ? SDValue(HiRes, 0) : ZeroVal, |
| CurDAG->getTargetConstant(1, DL, MVT::i32)); |
| |
| const TargetLowering *TLI = getTargetLowering(); |
| const TargetRegisterClass *RC = |
| TLI->getRegClassFor(ViaVecTy.getSimpleVT()); |
| |
| Res = CurDAG->getMachineNode( |
| Mips::COPY_TO_REGCLASS, DL, ViaVecTy, SDValue(Res, 0), |
| CurDAG->getTargetConstant(RC->getID(), DL, MVT::i32)); |
| |
| Res = CurDAG->getMachineNode( |
| Mips::SPLATI_D, DL, MVT::v2i64, SDValue(Res, 0), |
| CurDAG->getTargetConstant(0, DL, MVT::i32)); |
| } else if (ABI.IsN64() || ABI.IsN32()) { |
| |
| SDValue Zero64Val = CurDAG->getRegister(Mips::ZERO_64, MVT::i64); |
| const bool HiResNonZero = Highest || Higher; |
| const bool ResNonZero = Hi || Lo; |
| |
| if (HiResNonZero) |
| HiRes = CurDAG->getMachineNode( |
| Mips::SUBREG_TO_REG, DL, MVT::i64, |
| CurDAG->getTargetConstant(((Highest >> 15) & 0x1), DL, MVT::i64), |
| SDValue(HiRes, 0), |
| CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64)); |
| |
| if (ResNonZero) |
| Res = CurDAG->getMachineNode( |
| Mips::SUBREG_TO_REG, DL, MVT::i64, |
| CurDAG->getTargetConstant(((Hi >> 15) & 0x1), DL, MVT::i64), |
| SDValue(Res, 0), |
| CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64)); |
| |
| // We have 3 cases: |
| // The HiRes is nonzero but Res is $zero => dsll32 HiRes, 0 |
| // The Res is nonzero but HiRes is $zero => dinsu Res, $zero, 32, 32 |
| // Both are non zero => dinsu Res, HiRes, 32, 32 |
| // |
| // The obvious "missing" case is when both are zero, but that case is |
| // handled by the ldi case. |
| if (ResNonZero) { |
| IntegerType *Int32Ty = |
| IntegerType::get(MF->getFunction().getContext(), 32); |
| const ConstantInt *Const32 = ConstantInt::get(Int32Ty, 32); |
| SDValue Ops[4] = {HiResNonZero ? SDValue(HiRes, 0) : Zero64Val, |
| CurDAG->getConstant(*Const32, DL, MVT::i32), |
| CurDAG->getConstant(*Const32, DL, MVT::i32), |
| SDValue(Res, 0)}; |
| |
| Res = CurDAG->getMachineNode(Mips::DINSU, DL, MVT::i64, Ops); |
| } else if (HiResNonZero) { |
| Res = CurDAG->getMachineNode( |
| Mips::DSLL32, DL, MVT::i64, SDValue(HiRes, 0), |
| CurDAG->getTargetConstant(0, DL, MVT::i32)); |
| } else |
| llvm_unreachable( |
| "Zero splat value handled by non-zero 64bit splat synthesis!"); |
| |
| Res = CurDAG->getMachineNode(Mips::FILL_D, DL, MVT::v2i64, |
| SDValue(Res, 0)); |
| } else |
| llvm_unreachable("Unknown ABI in MipsISelDAGToDAG!"); |
| |
| } else |
| return false; |
| |
| if (ResVecTy != ViaVecTy) { |
| // If LdiOp is writing to a different register class to ResVecTy, then |
| // fix it up here. This COPY_TO_REGCLASS should never cause a move.v |
| // since the source and destination register sets contain the same |
| // registers. |
| const TargetLowering *TLI = getTargetLowering(); |
| MVT ResVecTySimple = ResVecTy.getSimpleVT(); |
| const TargetRegisterClass *RC = TLI->getRegClassFor(ResVecTySimple); |
| Res = CurDAG->getMachineNode(Mips::COPY_TO_REGCLASS, DL, |
| ResVecTy, SDValue(Res, 0), |
| CurDAG->getTargetConstant(RC->getID(), DL, |
| MVT::i32)); |
| } |
| |
| ReplaceNode(Node, Res); |
| return true; |
| } |
| |
| } |
| |
| return false; |
| } |
| |
| bool MipsSEDAGToDAGISel:: |
| SelectInlineAsmMemoryOperand(const SDValue &Op, unsigned ConstraintID, |
| std::vector<SDValue> &OutOps) { |
| SDValue Base, Offset; |
| |
| switch(ConstraintID) { |
| default: |
| llvm_unreachable("Unexpected asm memory constraint"); |
| // All memory constraints can at least accept raw pointers. |
| case InlineAsm::Constraint_m: |
| case InlineAsm::Constraint_o: |
| if (selectAddrRegImm16(Op, Base, Offset)) { |
| OutOps.push_back(Base); |
| OutOps.push_back(Offset); |
| return false; |
| } |
| OutOps.push_back(Op); |
| OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32)); |
| return false; |
| case InlineAsm::Constraint_R: |
| // The 'R' constraint is supposed to be much more complicated than this. |
| // However, it's becoming less useful due to architectural changes and |
| // ought to be replaced by other constraints such as 'ZC'. |
| // For now, support 9-bit signed offsets which is supportable by all |
| // subtargets for all instructions. |
| if (selectAddrRegImm9(Op, Base, Offset)) { |
| OutOps.push_back(Base); |
| OutOps.push_back(Offset); |
| return false; |
| } |
| OutOps.push_back(Op); |
| OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32)); |
| return false; |
| case InlineAsm::Constraint_ZC: |
| // ZC matches whatever the pref, ll, and sc instructions can handle for the |
| // given subtarget. |
| if (Subtarget->inMicroMipsMode()) { |
| // On microMIPS, they can handle 12-bit offsets. |
| if (selectAddrRegImm12(Op, Base, Offset)) { |
| OutOps.push_back(Base); |
| OutOps.push_back(Offset); |
| return false; |
| } |
| } else if (Subtarget->hasMips32r6()) { |
| // On MIPS32r6/MIPS64r6, they can only handle 9-bit offsets. |
| if (selectAddrRegImm9(Op, Base, Offset)) { |
| OutOps.push_back(Base); |
| OutOps.push_back(Offset); |
| return false; |
| } |
| } else if (selectAddrRegImm16(Op, Base, Offset)) { |
| // Prior to MIPS32r6/MIPS64r6, they can handle 16-bit offsets. |
| OutOps.push_back(Base); |
| OutOps.push_back(Offset); |
| return false; |
| } |
| // In all cases, 0-bit offsets are acceptable. |
| OutOps.push_back(Op); |
| OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32)); |
| return false; |
| } |
| return true; |
| } |
| |
| FunctionPass *llvm::createMipsSEISelDag(MipsTargetMachine &TM, |
| CodeGenOpt::Level OptLevel) { |
| return new MipsSEDAGToDAGISel(TM, OptLevel); |
| } |