utils/TableGen/CodeEmitterGen.cpp - llvm-project/llvm - Git at Google

 //===- CodeEmitterGen.cpp - Code Emitter Generator ------------------------===//
 //
 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 // See https://llvm.org/LICENSE.txt for license information.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//
 //
 // CodeEmitterGen uses the descriptions of instructions and their fields to
 // construct an automated code emitter: a function that, given a MachineInstr,
 // returns the (currently, 32-bit unsigned) value of the instruction.
 //
 //===----------------------------------------------------------------------===//

 #include "CodeGenHwModes.h"
 #include "CodeGenInstruction.h"
 #include "CodeGenTarget.h"
 #include "InfoByHwMode.h"
 #include "VarLenCodeEmitterGen.h"
 #include "llvm/ADT/APInt.h"
 #include "llvm/ADT/ArrayRef.h"
 #include "llvm/ADT/StringExtras.h"
 #include "llvm/Support/Casting.h"
 #include "llvm/Support/raw_ostream.h"
 #include "llvm/TableGen/Error.h"
 #include "llvm/TableGen/Record.h"
 #include "llvm/TableGen/TableGenBackend.h"
 #include <cstdint>
 #include <map>
 #include <set>
 #include <string>
 #include <utility>
 #include <vector>

 using namespace llvm;

 namespace {

 class CodeEmitterGen {
   RecordKeeper &Records;

 public:
   CodeEmitterGen(RecordKeeper &R) : Records(R) {}

   void run(raw_ostream &o);

 private:
   int getVariableBit(const std::string &VarName, BitsInit *BI, int bit);
   std::string getInstructionCase(Record *R, CodeGenTarget &Target);
   std::string getInstructionCaseForEncoding(Record *R, Record *EncodingDef,
                                             CodeGenTarget &Target);
   bool addCodeToMergeInOperand(Record *R, BitsInit *BI,
                                const std::string &VarName,
                                std::string &Case, CodeGenTarget &Target);

   void emitInstructionBaseValues(
       raw_ostream &o, ArrayRef<const CodeGenInstruction *> NumberedInstructions,
       CodeGenTarget &Target, int HwMode = -1);
   unsigned BitWidth = 0u;
   bool UseAPInt = false;
 };

 // If the VarBitInit at position 'bit' matches the specified variable then
 // return the variable bit position.  Otherwise return -1.
 int CodeEmitterGen::getVariableBit(const std::string &VarName,
                                    BitsInit *BI, int bit) {
   if (VarBitInit *VBI = dyn_cast<VarBitInit>(BI->getBit(bit))) {
     if (VarInit *VI = dyn_cast<VarInit>(VBI->getBitVar()))
       if (VI->getName() == VarName)
         return VBI->getBitNum();
   } else if (VarInit *VI = dyn_cast<VarInit>(BI->getBit(bit))) {
     if (VI->getName() == VarName)
       return 0;
   }

   return -1;
 }

 // Returns true if it succeeds, false if an error.
 bool CodeEmitterGen::addCodeToMergeInOperand(Record *R, BitsInit *BI,
                                              const std::string &VarName,
                                              std::string &Case,
                                              CodeGenTarget &Target) {
   CodeGenInstruction &CGI = Target.getInstruction(R);

   // Determine if VarName actually contributes to the Inst encoding.
   int bit = BI->getNumBits()-1;

   // Scan for a bit that this contributed to.
   for (; bit >= 0; ) {
     if (getVariableBit(VarName, BI, bit) != -1)
       break;

     --bit;
   }

   // If we found no bits, ignore this value, otherwise emit the call to get the
   // operand encoding.
   if (bit < 0)
     return true;

   // If the operand matches by name, reference according to that
   // operand number. Non-matching operands are assumed to be in
   // order.
   unsigned OpIdx;
   std::pair<unsigned, unsigned> SubOp;
   if (CGI.Operands.hasSubOperandAlias(VarName, SubOp)) {
     OpIdx = CGI.Operands[SubOp.first].MIOperandNo + SubOp.second;
   } else if (CGI.Operands.hasOperandNamed(VarName, OpIdx)) {
     // Get the machine operand number for the indicated operand.
     OpIdx = CGI.Operands[OpIdx].MIOperandNo;
   } else {
     PrintError(R, Twine("No operand named ") + VarName + " in record " + R->getName());
     return false;
   }

   if (CGI.Operands.isFlatOperandNotEmitted(OpIdx)) {
     PrintError(R, "Operand " + VarName + " used but also marked as not emitted!");
     return false;
   }

   std::pair<unsigned, unsigned> SO = CGI.Operands.getSubOperandNumber(OpIdx);
   std::string &EncoderMethodName =
       CGI.Operands[SO.first].EncoderMethodNames[SO.second];

   if (UseAPInt)
     Case += "      op.clearAllBits();\n";

   Case += "      // op: " + VarName + "\n";

   // If the source operand has a custom encoder, use it.
   if (!EncoderMethodName.empty()) {
     if (UseAPInt) {
       Case += "      " + EncoderMethodName + "(MI, " + utostr(OpIdx);
       Case += ", op";
     } else {
       Case += "      op = " + EncoderMethodName + "(MI, " + utostr(OpIdx);
     }
     Case += ", Fixups, STI);\n";
   } else {
     if (UseAPInt) {
       Case += "      getMachineOpValue(MI, MI.getOperand(" + utostr(OpIdx) + ")";
       Case += ", op, Fixups, STI";
     } else {
       Case += "      op = getMachineOpValue(MI, MI.getOperand(" + utostr(OpIdx) + ")";
       Case += ", Fixups, STI";
     }
     Case += ");\n";
   }

   // Precalculate the number of lits this variable contributes to in the
   // operand. If there is a single lit (consecutive range of bits) we can use a
   // destructive sequence on APInt that reduces memory allocations.
   int numOperandLits = 0;
   for (int tmpBit = bit; tmpBit >= 0;) {
     int varBit = getVariableBit(VarName, BI, tmpBit);

     // If this bit isn't from a variable, skip it.
     if (varBit == -1) {
       --tmpBit;
       continue;
     }

     // Figure out the consecutive range of bits covered by this operand, in
     // order to generate better encoding code.
     int beginVarBit = varBit;
     int N = 1;
     for (--tmpBit; tmpBit >= 0;) {
       varBit = getVariableBit(VarName, BI, tmpBit);
       if (varBit == -1 || varBit != (beginVarBit - N))
         break;
       ++N;
       --tmpBit;
     }
     ++numOperandLits;
   }

   for (; bit >= 0; ) {
     int varBit = getVariableBit(VarName, BI, bit);

     // If this bit isn't from a variable, skip it.
     if (varBit == -1) {
       --bit;
       continue;
     }

     // Figure out the consecutive range of bits covered by this operand, in
     // order to generate better encoding code.
     int beginInstBit = bit;
     int beginVarBit = varBit;
     int N = 1;
     for (--bit; bit >= 0;) {
       varBit = getVariableBit(VarName, BI, bit);
       if (varBit == -1 || varBit != (beginVarBit - N)) break;
       ++N;
       --bit;
     }

     std::string maskStr;
     int opShift;

     unsigned loBit = beginVarBit - N + 1;
     unsigned hiBit = loBit + N;
     unsigned loInstBit = beginInstBit - N + 1;
     if (UseAPInt) {
       std::string extractStr;
       if (N >= 64) {
         extractStr = "op.extractBits(" + itostr(hiBit - loBit) + ", " +
                      itostr(loBit) + ")";
         Case += "      Value.insertBits(" + extractStr + ", " +
                 itostr(loInstBit) + ");\n";
       } else {
         extractStr = "op.extractBitsAsZExtValue(" + itostr(hiBit - loBit) +
                      ", " + itostr(loBit) + ")";
         Case += "      Value.insertBits(" + extractStr + ", " +
                 itostr(loInstBit) + ", " + itostr(hiBit - loBit) + ");\n";
       }
     } else {
       uint64_t opMask = ~(uint64_t)0 >> (64 - N);
       opShift = beginVarBit - N + 1;
       opMask <<= opShift;
       maskStr = "UINT64_C(" + utostr(opMask) + ")";
       opShift = beginInstBit - beginVarBit;

       if (numOperandLits == 1) {
         Case += "      op &= " + maskStr + ";\n";
         if (opShift > 0) {
           Case += "      op <<= " + itostr(opShift) + ";\n";
         } else if (opShift < 0) {
           Case += "      op >>= " + itostr(-opShift) + ";\n";
         }
         Case += "      Value |= op;\n";
       } else {
         if (opShift > 0) {
           Case += "      Value |= (op & " + maskStr + ") << " +
                   itostr(opShift) + ";\n";
         } else if (opShift < 0) {
           Case += "      Value |= (op & " + maskStr + ") >> " +
                   itostr(-opShift) + ";\n";
         } else {
           Case += "      Value |= (op & " + maskStr + ");\n";
         }
       }
     }
   }
   return true;
 }

 std::string CodeEmitterGen::getInstructionCase(Record *R,
                                                CodeGenTarget &Target) {
   std::string Case;
   if (const RecordVal *RV = R->getValue("EncodingInfos")) {
     if (auto *DI = dyn_cast_or_null<DefInit>(RV->getValue())) {
       const CodeGenHwModes &HWM = Target.getHwModes();
       EncodingInfoByHwMode EBM(DI->getDef(), HWM);
       Case += "      switch (HwMode) {\n";
       Case += "      default: llvm_unreachable(\"Unhandled HwMode\");\n";
       for (auto &KV : EBM) {
         Case += "      case " + itostr(KV.first) + ": {\n";
         Case += getInstructionCaseForEncoding(R, KV.second, Target);
         Case += "      break;\n";
         Case += "      }\n";
       }
       Case += "      }\n";
       return Case;
     }
   }
   return getInstructionCaseForEncoding(R, R, Target);
 }

 std::string CodeEmitterGen::getInstructionCaseForEncoding(Record *R, Record *EncodingDef,
                                                           CodeGenTarget &Target) {
   std::string Case;
   BitsInit *BI = EncodingDef->getValueAsBitsInit("Inst");

   // Loop over all of the fields in the instruction, determining which are the
   // operands to the instruction.
   bool Success = true;
   for (const RecordVal &RV : EncodingDef->getValues()) {
     // Ignore fixed fields in the record, we're looking for values like:
     //    bits<5> RST = { ?, ?, ?, ?, ? };
     if (RV.isNonconcreteOK() || RV.getValue()->isComplete())
       continue;

     Success &=
         addCodeToMergeInOperand(R, BI, std::string(RV.getName()),
                                 Case, Target);
   }

   if (!Success) {
     // Dump the record, so we can see what's going on...
     std::string E;
     raw_string_ostream S(E);
     S << "Dumping record for previous error:\n";
     S << *R;
     PrintNote(E);
   }

   StringRef PostEmitter = R->getValueAsString("PostEncoderMethod");
   if (!PostEmitter.empty()) {
     Case += "      Value = ";
     Case += PostEmitter;
     Case += "(MI, Value";
     Case += ", STI";
     Case += ");\n";
   }

   return Case;
 }

 static void emitInstBits(raw_ostream &OS, const APInt &Bits) {
   for (unsigned I = 0; I < Bits.getNumWords(); ++I)
     OS << ((I > 0) ? ", " : "") << "UINT64_C(" << utostr(Bits.getRawData()[I])
        << ")";
 }

 void CodeEmitterGen::emitInstructionBaseValues(
     raw_ostream &o, ArrayRef<const CodeGenInstruction *> NumberedInstructions,
     CodeGenTarget &Target, int HwMode) {
   const CodeGenHwModes &HWM = Target.getHwModes();
   if (HwMode == -1)
     o << "  static const uint64_t InstBits[] = {\n";
   else
     o << "  static const uint64_t InstBits_" << HWM.getMode(HwMode).Name
       << "[] = {\n";

   for (const CodeGenInstruction *CGI : NumberedInstructions) {
     Record *R = CGI->TheDef;

     if (R->getValueAsString("Namespace") == "TargetOpcode" ||
         R->getValueAsBit("isPseudo")) {
       o << "    "; emitInstBits(o, APInt(BitWidth, 0)); o << ",\n";
       continue;
     }

     Record *EncodingDef = R;
     if (const RecordVal *RV = R->getValue("EncodingInfos")) {
       if (auto *DI = dyn_cast_or_null<DefInit>(RV->getValue())) {
         EncodingInfoByHwMode EBM(DI->getDef(), HWM);
         if (EBM.hasMode(HwMode))
           EncodingDef = EBM.get(HwMode);
       }
     }
     BitsInit *BI = EncodingDef->getValueAsBitsInit("Inst");

     // Start by filling in fixed values.
     APInt Value(BitWidth, 0);
     for (unsigned i = 0, e = BI->getNumBits(); i != e; ++i) {
       if (auto *B = dyn_cast<BitInit>(BI->getBit(i)); B && B->getValue())
         Value.setBit(i);
     }
     o << "    ";
     emitInstBits(o, Value);
     o << "," << '\t' << "// " << R->getName() << "\n";
   }
   o << "    UINT64_C(0)\n  };\n";
 }

 void CodeEmitterGen::run(raw_ostream &o) {
   emitSourceFileHeader("Machine Code Emitter", o);

   CodeGenTarget Target(Records);
   std::vector<Record*> Insts = Records.getAllDerivedDefinitions("Instruction");

   // For little-endian instruction bit encodings, reverse the bit order
   Target.reverseBitsForLittleEndianEncoding();

   ArrayRef<const CodeGenInstruction*> NumberedInstructions =
     Target.getInstructionsByEnumValue();

   if (any_of(NumberedInstructions, [](const CodeGenInstruction *CGI) {
         Record *R = CGI->TheDef;
         return R->getValue("Inst") && isa<DagInit>(R->getValueInit("Inst"));
       })) {
     emitVarLenCodeEmitter(Records, o);
   } else {
     const CodeGenHwModes &HWM = Target.getHwModes();
     // The set of HwModes used by instruction encodings.
     std::set<unsigned> HwModes;
     BitWidth = 0;
     for (const CodeGenInstruction *CGI : NumberedInstructions) {
       Record *R = CGI->TheDef;
       if (R->getValueAsString("Namespace") == "TargetOpcode" ||
           R->getValueAsBit("isPseudo"))
         continue;

       if (const RecordVal *RV = R->getValue("EncodingInfos")) {
         if (DefInit *DI = dyn_cast_or_null<DefInit>(RV->getValue())) {
           EncodingInfoByHwMode EBM(DI->getDef(), HWM);
           for (auto &KV : EBM) {
             BitsInit *BI = KV.second->getValueAsBitsInit("Inst");
             BitWidth = std::max(BitWidth, BI->getNumBits());
             HwModes.insert(KV.first);
           }
           continue;
         }
       }
       BitsInit *BI = R->getValueAsBitsInit("Inst");
       BitWidth = std::max(BitWidth, BI->getNumBits());
     }
     UseAPInt = BitWidth > 64;

     // Emit function declaration
     if (UseAPInt) {
       o << "void " << Target.getName()
         << "MCCodeEmitter::getBinaryCodeForInstr(const MCInst &MI,\n"
         << "    SmallVectorImpl<MCFixup> &Fixups,\n"
         << "    APInt &Inst,\n"
         << "    APInt &Scratch,\n"
         << "    const MCSubtargetInfo &STI) const {\n";
     } else {
       o << "uint64_t " << Target.getName();
       o << "MCCodeEmitter::getBinaryCodeForInstr(const MCInst &MI,\n"
         << "    SmallVectorImpl<MCFixup> &Fixups,\n"
         << "    const MCSubtargetInfo &STI) const {\n";
     }

     // Emit instruction base values
     if (HwModes.empty()) {
       emitInstructionBaseValues(o, NumberedInstructions, Target, -1);
     } else {
       for (unsigned HwMode : HwModes)
         emitInstructionBaseValues(o, NumberedInstructions, Target, (int)HwMode);
     }

     if (!HwModes.empty()) {
       o << "  const uint64_t *InstBits;\n";
       o << "  unsigned HwMode = STI.getHwMode();\n";
       o << "  switch (HwMode) {\n";
       o << "  default: llvm_unreachable(\"Unknown hardware mode!\"); break;\n";
       for (unsigned I : HwModes) {
         o << "  case " << I << ": InstBits = InstBits_" << HWM.getMode(I).Name
           << "; break;\n";
       }
       o << "  };\n";
     }

     // Map to accumulate all the cases.
     std::map<std::string, std::vector<std::string>> CaseMap;

     // Construct all cases statement for each opcode
     for (Record *R : Insts) {
       if (R->getValueAsString("Namespace") == "TargetOpcode" ||
           R->getValueAsBit("isPseudo"))
         continue;
       std::string InstName =
           (R->getValueAsString("Namespace") + "::" + R->getName()).str();
       std::string Case = getInstructionCase(R, Target);

       CaseMap[Case].push_back(std::move(InstName));
     }

     // Emit initial function code
     if (UseAPInt) {
       int NumWords = APInt::getNumWords(BitWidth);
       o << "  const unsigned opcode = MI.getOpcode();\n"
         << "  if (Scratch.getBitWidth() != " << BitWidth << ")\n"
         << "    Scratch = Scratch.zext(" << BitWidth << ");\n"
         << "  Inst = APInt(" << BitWidth << ", ArrayRef(InstBits + opcode * "
         << NumWords << ", " << NumWords << "));\n"
         << "  APInt &Value = Inst;\n"
         << "  APInt &op = Scratch;\n"
         << "  switch (opcode) {\n";
     } else {
       o << "  const unsigned opcode = MI.getOpcode();\n"
         << "  uint64_t Value = InstBits[opcode];\n"
         << "  uint64_t op = 0;\n"
         << "  (void)op;  // suppress warning\n"
         << "  switch (opcode) {\n";
     }

     // Emit each case statement
     std::map<std::string, std::vector<std::string>>::iterator IE, EE;
     for (IE = CaseMap.begin(), EE = CaseMap.end(); IE != EE; ++IE) {
       const std::string &Case = IE->first;
       std::vector<std::string> &InstList = IE->second;

       for (int i = 0, N = InstList.size(); i < N; i++) {
         if (i)
           o << "\n";
         o << "    case " << InstList[i] << ":";
       }
       o << " {\n";
       o << Case;
       o << "      break;\n"
         << "    }\n";
     }

     // Default case: unhandled opcode
     o << "  default:\n"
       << "    std::string msg;\n"
       << "    raw_string_ostream Msg(msg);\n"
       << "    Msg << \"Not supported instr: \" << MI;\n"
       << "    report_fatal_error(Msg.str().c_str());\n"
       << "  }\n";
     if (UseAPInt)
       o << "  Inst = Value;\n";
     else
       o << "  return Value;\n";
     o << "}\n\n";
   }
 }

 } // end anonymous namespace

 static TableGen::Emitter::OptClass<CodeEmitterGen>
     X("gen-emitter", "Generate machine code emitter");
	//===- CodeEmitterGen.cpp - Code Emitter Generator ------------------------===//
	//
	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
	// See https://llvm.org/LICENSE.txt for license information.
	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
	//
	//===----------------------------------------------------------------------===//
	//
	// CodeEmitterGen uses the descriptions of instructions and their fields to
	// construct an automated code emitter: a function that, given a MachineInstr,
	// returns the (currently, 32-bit unsigned) value of the instruction.
	//
	//===----------------------------------------------------------------------===//

	#include "CodeGenHwModes.h"
	#include "CodeGenInstruction.h"
	#include "CodeGenTarget.h"
	#include "InfoByHwMode.h"
	#include "VarLenCodeEmitterGen.h"
	#include "llvm/ADT/APInt.h"
	#include "llvm/ADT/ArrayRef.h"
	#include "llvm/ADT/StringExtras.h"
	#include "llvm/Support/Casting.h"
	#include "llvm/Support/raw_ostream.h"
	#include "llvm/TableGen/Error.h"
	#include "llvm/TableGen/Record.h"
	#include "llvm/TableGen/TableGenBackend.h"
	#include <cstdint>
	#include <map>
	#include <set>
	#include <string>
	#include <utility>
	#include <vector>

	using namespace llvm;

	namespace {

	class CodeEmitterGen {
	RecordKeeper &Records;

	public:
	CodeEmitterGen(RecordKeeper &R) : Records(R) {}

	void run(raw_ostream &o);

	private:
	int getVariableBit(const std::string &VarName, BitsInit *BI, int bit);
	std::string getInstructionCase(Record *R, CodeGenTarget &Target);
	std::string getInstructionCaseForEncoding(Record R, Record EncodingDef,
	CodeGenTarget &Target);
	bool addCodeToMergeInOperand(Record R, BitsInit BI,
	const std::string &VarName,
	std::string &Case, CodeGenTarget &Target);

	void emitInstructionBaseValues(
	raw_ostream &o, ArrayRef<const CodeGenInstruction *> NumberedInstructions,
	CodeGenTarget &Target, int HwMode = -1);
	unsigned BitWidth = 0u;
	bool UseAPInt = false;
	};

	// If the VarBitInit at position 'bit' matches the specified variable then
	// return the variable bit position. Otherwise return -1.
	int CodeEmitterGen::getVariableBit(const std::string &VarName,
	BitsInit *BI, int bit) {
	if (VarBitInit *VBI = dyn_cast<VarBitInit>(BI->getBit(bit))) {
	if (VarInit *VI = dyn_cast<VarInit>(VBI->getBitVar()))
	if (VI->getName() == VarName)
	return VBI->getBitNum();
	} else if (VarInit *VI = dyn_cast<VarInit>(BI->getBit(bit))) {
	if (VI->getName() == VarName)
	return 0;
	}

	return -1;
	}

	// Returns true if it succeeds, false if an error.
	bool CodeEmitterGen::addCodeToMergeInOperand(Record R, BitsInit BI,
	const std::string &VarName,
	std::string &Case,
	CodeGenTarget &Target) {
	CodeGenInstruction &CGI = Target.getInstruction(R);

	// Determine if VarName actually contributes to the Inst encoding.
	int bit = BI->getNumBits()-1;

	// Scan for a bit that this contributed to.
	for (; bit >= 0; ) {
	if (getVariableBit(VarName, BI, bit) != -1)
	break;

	--bit;
	}

	// If we found no bits, ignore this value, otherwise emit the call to get the
	// operand encoding.
	if (bit < 0)
	return true;

	// If the operand matches by name, reference according to that
	// operand number. Non-matching operands are assumed to be in
	// order.
	unsigned OpIdx;
	std::pair<unsigned, unsigned> SubOp;
	if (CGI.Operands.hasSubOperandAlias(VarName, SubOp)) {
	OpIdx = CGI.Operands[SubOp.first].MIOperandNo + SubOp.second;
	} else if (CGI.Operands.hasOperandNamed(VarName, OpIdx)) {
	// Get the machine operand number for the indicated operand.
	OpIdx = CGI.Operands[OpIdx].MIOperandNo;
	} else {
	PrintError(R, Twine("No operand named ") + VarName + " in record " + R->getName());
	return false;
	}

	if (CGI.Operands.isFlatOperandNotEmitted(OpIdx)) {
	PrintError(R, "Operand " + VarName + " used but also marked as not emitted!");
	return false;
	}

	std::pair<unsigned, unsigned> SO = CGI.Operands.getSubOperandNumber(OpIdx);
	std::string &EncoderMethodName =
	CGI.Operands[SO.first].EncoderMethodNames[SO.second];

	if (UseAPInt)
	Case += " op.clearAllBits();\n";

	Case += " // op: " + VarName + "\n";

	// If the source operand has a custom encoder, use it.
	if (!EncoderMethodName.empty()) {
	if (UseAPInt) {
	Case += " " + EncoderMethodName + "(MI, " + utostr(OpIdx);
	Case += ", op";
	} else {
	Case += " op = " + EncoderMethodName + "(MI, " + utostr(OpIdx);
	}
	Case += ", Fixups, STI);\n";
	} else {
	if (UseAPInt) {
	Case += " getMachineOpValue(MI, MI.getOperand(" + utostr(OpIdx) + ")";
	Case += ", op, Fixups, STI";
	} else {
	Case += " op = getMachineOpValue(MI, MI.getOperand(" + utostr(OpIdx) + ")";
	Case += ", Fixups, STI";
	}
	Case += ");\n";
	}

	// Precalculate the number of lits this variable contributes to in the
	// operand. If there is a single lit (consecutive range of bits) we can use a
	// destructive sequence on APInt that reduces memory allocations.
	int numOperandLits = 0;
	for (int tmpBit = bit; tmpBit >= 0;) {
	int varBit = getVariableBit(VarName, BI, tmpBit);

	// If this bit isn't from a variable, skip it.
	if (varBit == -1) {
	--tmpBit;
	continue;
	}

	// Figure out the consecutive range of bits covered by this operand, in
	// order to generate better encoding code.
	int beginVarBit = varBit;
	int N = 1;
	for (--tmpBit; tmpBit >= 0;) {
	varBit = getVariableBit(VarName, BI, tmpBit);
	if (varBit == -1 \|\| varBit != (beginVarBit - N))
	break;
	++N;
	--tmpBit;
	}
	++numOperandLits;
	}

	for (; bit >= 0; ) {
	int varBit = getVariableBit(VarName, BI, bit);

	// If this bit isn't from a variable, skip it.
	if (varBit == -1) {
	--bit;
	continue;
	}

	// Figure out the consecutive range of bits covered by this operand, in
	// order to generate better encoding code.
	int beginInstBit = bit;
	int beginVarBit = varBit;
	int N = 1;
	for (--bit; bit >= 0;) {
	varBit = getVariableBit(VarName, BI, bit);
	if (varBit == -1 \|\| varBit != (beginVarBit - N)) break;
	++N;
	--bit;
	}

	std::string maskStr;
	int opShift;

	unsigned loBit = beginVarBit - N + 1;
	unsigned hiBit = loBit + N;
	unsigned loInstBit = beginInstBit - N + 1;
	if (UseAPInt) {
	std::string extractStr;
	if (N >= 64) {
	extractStr = "op.extractBits(" + itostr(hiBit - loBit) + ", " +
	itostr(loBit) + ")";
	Case += " Value.insertBits(" + extractStr + ", " +
	itostr(loInstBit) + ");\n";
	} else {
	extractStr = "op.extractBitsAsZExtValue(" + itostr(hiBit - loBit) +
	", " + itostr(loBit) + ")";
	Case += " Value.insertBits(" + extractStr + ", " +
	itostr(loInstBit) + ", " + itostr(hiBit - loBit) + ");\n";
	}
	} else {
	uint64_t opMask = ~(uint64_t)0 >> (64 - N);
	opShift = beginVarBit - N + 1;
	opMask <<= opShift;
	maskStr = "UINT64_C(" + utostr(opMask) + ")";
	opShift = beginInstBit - beginVarBit;

	if (numOperandLits == 1) {
	Case += " op &= " + maskStr + ";\n";
	if (opShift > 0) {
	Case += " op <<= " + itostr(opShift) + ";\n";
	} else if (opShift < 0) {
	Case += " op >>= " + itostr(-opShift) + ";\n";
	}
	Case += " Value \|= op;\n";
	} else {
	if (opShift > 0) {
	Case += " Value \|= (op & " + maskStr + ") << " +
	itostr(opShift) + ";\n";
	} else if (opShift < 0) {
	Case += " Value \|= (op & " + maskStr + ") >> " +
	itostr(-opShift) + ";\n";
	} else {
	Case += " Value \|= (op & " + maskStr + ");\n";
	}
	}
	}
	}
	return true;
	}

	std::string CodeEmitterGen::getInstructionCase(Record *R,
	CodeGenTarget &Target) {
	std::string Case;
	if (const RecordVal *RV = R->getValue("EncodingInfos")) {
	if (auto *DI = dyn_cast_or_null<DefInit>(RV->getValue())) {
	const CodeGenHwModes &HWM = Target.getHwModes();
	EncodingInfoByHwMode EBM(DI->getDef(), HWM);
	Case += " switch (HwMode) {\n";
	Case += " default: llvm_unreachable(\"Unhandled HwMode\");\n";
	for (auto &KV : EBM) {
	Case += " case " + itostr(KV.first) + ": {\n";
	Case += getInstructionCaseForEncoding(R, KV.second, Target);
	Case += " break;\n";
	Case += " }\n";
	}
	Case += " }\n";
	return Case;
	}
	}
	return getInstructionCaseForEncoding(R, R, Target);
	}

	std::string CodeEmitterGen::getInstructionCaseForEncoding(Record R, Record EncodingDef,
	CodeGenTarget &Target) {
	std::string Case;
	BitsInit *BI = EncodingDef->getValueAsBitsInit("Inst");

	// Loop over all of the fields in the instruction, determining which are the
	// operands to the instruction.
	bool Success = true;
	for (const RecordVal &RV : EncodingDef->getValues()) {
	// Ignore fixed fields in the record, we're looking for values like:
	// bits<5> RST = { ?, ?, ?, ?, ? };
	if (RV.isNonconcreteOK() \|\| RV.getValue()->isComplete())
	continue;

	Success &=
	addCodeToMergeInOperand(R, BI, std::string(RV.getName()),
	Case, Target);
	}

	if (!Success) {
	// Dump the record, so we can see what's going on...
	std::string E;
	raw_string_ostream S(E);
	S << "Dumping record for previous error:\n";
	S << *R;
	PrintNote(E);
	}

	StringRef PostEmitter = R->getValueAsString("PostEncoderMethod");
	if (!PostEmitter.empty()) {
	Case += " Value = ";
	Case += PostEmitter;
	Case += "(MI, Value";
	Case += ", STI";
	Case += ");\n";
	}

	return Case;
	}

	static void emitInstBits(raw_ostream &OS, const APInt &Bits) {
	for (unsigned I = 0; I < Bits.getNumWords(); ++I)
	OS << ((I > 0) ? ", " : "") << "UINT64_C(" << utostr(Bits.getRawData()[I])
	<< ")";
	}

	void CodeEmitterGen::emitInstructionBaseValues(
	raw_ostream &o, ArrayRef<const CodeGenInstruction *> NumberedInstructions,
	CodeGenTarget &Target, int HwMode) {
	const CodeGenHwModes &HWM = Target.getHwModes();
	if (HwMode == -1)
	o << " static const uint64_t InstBits[] = {\n";
	else
	o << " static const uint64_t InstBits_" << HWM.getMode(HwMode).Name
	<< "[] = {\n";

	for (const CodeGenInstruction *CGI : NumberedInstructions) {
	Record *R = CGI->TheDef;

	if (R->getValueAsString("Namespace") == "TargetOpcode" \|\|
	R->getValueAsBit("isPseudo")) {
	o << " "; emitInstBits(o, APInt(BitWidth, 0)); o << ",\n";
	continue;
	}

	Record *EncodingDef = R;
	if (const RecordVal *RV = R->getValue("EncodingInfos")) {
	if (auto *DI = dyn_cast_or_null<DefInit>(RV->getValue())) {
	EncodingInfoByHwMode EBM(DI->getDef(), HWM);
	if (EBM.hasMode(HwMode))
	EncodingDef = EBM.get(HwMode);
	}
	}
	BitsInit *BI = EncodingDef->getValueAsBitsInit("Inst");

	// Start by filling in fixed values.
	APInt Value(BitWidth, 0);
	for (unsigned i = 0, e = BI->getNumBits(); i != e; ++i) {
	if (auto *B = dyn_cast<BitInit>(BI->getBit(i)); B && B->getValue())
	Value.setBit(i);
	}
	o << " ";
	emitInstBits(o, Value);
	o << "," << '\t' << "// " << R->getName() << "\n";
	}
	o << " UINT64_C(0)\n };\n";
	}

	void CodeEmitterGen::run(raw_ostream &o) {
	emitSourceFileHeader("Machine Code Emitter", o);

	CodeGenTarget Target(Records);
	std::vector<Record*> Insts = Records.getAllDerivedDefinitions("Instruction");

	// For little-endian instruction bit encodings, reverse the bit order
	Target.reverseBitsForLittleEndianEncoding();

	ArrayRef<const CodeGenInstruction*> NumberedInstructions =
	Target.getInstructionsByEnumValue();

	if (any_of(NumberedInstructions, [](const CodeGenInstruction *CGI) {
	Record *R = CGI->TheDef;
	return R->getValue("Inst") && isa<DagInit>(R->getValueInit("Inst"));
	})) {
	emitVarLenCodeEmitter(Records, o);
	} else {
	const CodeGenHwModes &HWM = Target.getHwModes();
	// The set of HwModes used by instruction encodings.
	std::set<unsigned> HwModes;
	BitWidth = 0;
	for (const CodeGenInstruction *CGI : NumberedInstructions) {
	Record *R = CGI->TheDef;
	if (R->getValueAsString("Namespace") == "TargetOpcode" \|\|
	R->getValueAsBit("isPseudo"))
	continue;

	if (const RecordVal *RV = R->getValue("EncodingInfos")) {
	if (DefInit *DI = dyn_cast_or_null<DefInit>(RV->getValue())) {
	EncodingInfoByHwMode EBM(DI->getDef(), HWM);
	for (auto &KV : EBM) {
	BitsInit *BI = KV.second->getValueAsBitsInit("Inst");
	BitWidth = std::max(BitWidth, BI->getNumBits());
	HwModes.insert(KV.first);
	}
	continue;
	}
	}
	BitsInit *BI = R->getValueAsBitsInit("Inst");
	BitWidth = std::max(BitWidth, BI->getNumBits());
	}
	UseAPInt = BitWidth > 64;

	// Emit function declaration
	if (UseAPInt) {
	o << "void " << Target.getName()
	<< "MCCodeEmitter::getBinaryCodeForInstr(const MCInst &MI,\n"
	<< " SmallVectorImpl<MCFixup> &Fixups,\n"
	<< " APInt &Inst,\n"
	<< " APInt &Scratch,\n"
	<< " const MCSubtargetInfo &STI) const {\n";
	} else {
	o << "uint64_t " << Target.getName();
	o << "MCCodeEmitter::getBinaryCodeForInstr(const MCInst &MI,\n"
	<< " SmallVectorImpl<MCFixup> &Fixups,\n"
	<< " const MCSubtargetInfo &STI) const {\n";
	}

	// Emit instruction base values
	if (HwModes.empty()) {
	emitInstructionBaseValues(o, NumberedInstructions, Target, -1);
	} else {
	for (unsigned HwMode : HwModes)
	emitInstructionBaseValues(o, NumberedInstructions, Target, (int)HwMode);
	}

	if (!HwModes.empty()) {
	o << " const uint64_t *InstBits;\n";
	o << " unsigned HwMode = STI.getHwMode();\n";
	o << " switch (HwMode) {\n";
	o << " default: llvm_unreachable(\"Unknown hardware mode!\"); break;\n";
	for (unsigned I : HwModes) {
	o << " case " << I << ": InstBits = InstBits_" << HWM.getMode(I).Name
	<< "; break;\n";
	}
	o << " };\n";
	}

	// Map to accumulate all the cases.
	std::map<std::string, std::vector<std::string>> CaseMap;

	// Construct all cases statement for each opcode
	for (Record *R : Insts) {
	if (R->getValueAsString("Namespace") == "TargetOpcode" \|\|
	R->getValueAsBit("isPseudo"))
	continue;
	std::string InstName =
	(R->getValueAsString("Namespace") + "::" + R->getName()).str();
	std::string Case = getInstructionCase(R, Target);

	CaseMap[Case].push_back(std::move(InstName));
	}

	// Emit initial function code
	if (UseAPInt) {
	int NumWords = APInt::getNumWords(BitWidth);
	o << " const unsigned opcode = MI.getOpcode();\n"
	<< " if (Scratch.getBitWidth() != " << BitWidth << ")\n"
	<< " Scratch = Scratch.zext(" << BitWidth << ");\n"
	<< " Inst = APInt(" << BitWidth << ", ArrayRef(InstBits + opcode * "
	<< NumWords << ", " << NumWords << "));\n"
	<< " APInt &Value = Inst;\n"
	<< " APInt &op = Scratch;\n"
	<< " switch (opcode) {\n";
	} else {
	o << " const unsigned opcode = MI.getOpcode();\n"
	<< " uint64_t Value = InstBits[opcode];\n"
	<< " uint64_t op = 0;\n"
	<< " (void)op; // suppress warning\n"
	<< " switch (opcode) {\n";
	}

	// Emit each case statement
	std::map<std::string, std::vector<std::string>>::iterator IE, EE;
	for (IE = CaseMap.begin(), EE = CaseMap.end(); IE != EE; ++IE) {
	const std::string &Case = IE->first;
	std::vector<std::string> &InstList = IE->second;

	for (int i = 0, N = InstList.size(); i < N; i++) {
	if (i)
	o << "\n";
	o << " case " << InstList[i] << ":";
	}
	o << " {\n";
	o << Case;
	o << " break;\n"
	<< " }\n";
	}

	// Default case: unhandled opcode
	o << " default:\n"
	<< " std::string msg;\n"
	<< " raw_string_ostream Msg(msg);\n"
	<< " Msg << \"Not supported instr: \" << MI;\n"
	<< " report_fatal_error(Msg.str().c_str());\n"
	<< " }\n";
	if (UseAPInt)
	o << " Inst = Value;\n";
	else
	o << " return Value;\n";
	o << "}\n\n";
	}
	}

	} // end anonymous namespace

	static TableGen::Emitter::OptClass<CodeEmitterGen>
	X("gen-emitter", "Generate machine code emitter");