| //===------------ FixedLenDecoderEmitter.cpp - Decoder Generator ----------===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // It contains the tablegen backend that emits the decoder functions for |
| // targets with fixed length instruction set. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "CodeGenInstruction.h" |
| #include "CodeGenTarget.h" |
| #include "llvm/ADT/APInt.h" |
| #include "llvm/ADT/ArrayRef.h" |
| #include "llvm/ADT/CachedHashString.h" |
| #include "llvm/ADT/SmallString.h" |
| #include "llvm/ADT/SetVector.h" |
| #include "llvm/ADT/STLExtras.h" |
| #include "llvm/ADT/StringExtras.h" |
| #include "llvm/ADT/StringRef.h" |
| #include "llvm/MC/MCFixedLenDisassembler.h" |
| #include "llvm/Support/Casting.h" |
| #include "llvm/Support/Debug.h" |
| #include "llvm/Support/ErrorHandling.h" |
| #include "llvm/Support/FormattedStream.h" |
| #include "llvm/Support/LEB128.h" |
| #include "llvm/Support/raw_ostream.h" |
| #include "llvm/TableGen/Error.h" |
| #include "llvm/TableGen/Record.h" |
| #include <algorithm> |
| #include <cassert> |
| #include <cstddef> |
| #include <cstdint> |
| #include <map> |
| #include <memory> |
| #include <set> |
| #include <string> |
| #include <utility> |
| #include <vector> |
| |
| using namespace llvm; |
| |
| #define DEBUG_TYPE "decoder-emitter" |
| |
| namespace { |
| |
| struct EncodingField { |
| unsigned Base, Width, Offset; |
| EncodingField(unsigned B, unsigned W, unsigned O) |
| : Base(B), Width(W), Offset(O) { } |
| }; |
| |
| struct OperandInfo { |
| std::vector<EncodingField> Fields; |
| std::string Decoder; |
| bool HasCompleteDecoder; |
| |
| OperandInfo(std::string D, bool HCD) |
| : Decoder(std::move(D)), HasCompleteDecoder(HCD) {} |
| |
| void addField(unsigned Base, unsigned Width, unsigned Offset) { |
| Fields.push_back(EncodingField(Base, Width, Offset)); |
| } |
| |
| unsigned numFields() const { return Fields.size(); } |
| |
| typedef std::vector<EncodingField>::const_iterator const_iterator; |
| |
| const_iterator begin() const { return Fields.begin(); } |
| const_iterator end() const { return Fields.end(); } |
| }; |
| |
| typedef std::vector<uint8_t> DecoderTable; |
| typedef uint32_t DecoderFixup; |
| typedef std::vector<DecoderFixup> FixupList; |
| typedef std::vector<FixupList> FixupScopeList; |
| typedef SmallSetVector<CachedHashString, 16> PredicateSet; |
| typedef SmallSetVector<CachedHashString, 16> DecoderSet; |
| struct DecoderTableInfo { |
| DecoderTable Table; |
| FixupScopeList FixupStack; |
| PredicateSet Predicates; |
| DecoderSet Decoders; |
| }; |
| |
| class FixedLenDecoderEmitter { |
| ArrayRef<const CodeGenInstruction *> NumberedInstructions; |
| |
| public: |
| // Defaults preserved here for documentation, even though they aren't |
| // strictly necessary given the way that this is currently being called. |
| FixedLenDecoderEmitter(RecordKeeper &R, std::string PredicateNamespace, |
| std::string GPrefix = "if (", |
| std::string GPostfix = " == MCDisassembler::Fail)", |
| std::string ROK = "MCDisassembler::Success", |
| std::string RFail = "MCDisassembler::Fail", |
| std::string L = "") |
| : Target(R), PredicateNamespace(std::move(PredicateNamespace)), |
| GuardPrefix(std::move(GPrefix)), GuardPostfix(std::move(GPostfix)), |
| ReturnOK(std::move(ROK)), ReturnFail(std::move(RFail)), |
| Locals(std::move(L)) {} |
| |
| // Emit the decoder state machine table. |
| void emitTable(formatted_raw_ostream &o, DecoderTable &Table, |
| unsigned Indentation, unsigned BitWidth, |
| StringRef Namespace) const; |
| void emitPredicateFunction(formatted_raw_ostream &OS, |
| PredicateSet &Predicates, |
| unsigned Indentation) const; |
| void emitDecoderFunction(formatted_raw_ostream &OS, |
| DecoderSet &Decoders, |
| unsigned Indentation) const; |
| |
| // run - Output the code emitter |
| void run(raw_ostream &o); |
| |
| private: |
| CodeGenTarget Target; |
| |
| public: |
| std::string PredicateNamespace; |
| std::string GuardPrefix, GuardPostfix; |
| std::string ReturnOK, ReturnFail; |
| std::string Locals; |
| }; |
| |
| } // end anonymous namespace |
| |
| // The set (BIT_TRUE, BIT_FALSE, BIT_UNSET) represents a ternary logic system |
| // for a bit value. |
| // |
| // BIT_UNFILTERED is used as the init value for a filter position. It is used |
| // only for filter processings. |
| typedef enum { |
| BIT_TRUE, // '1' |
| BIT_FALSE, // '0' |
| BIT_UNSET, // '?' |
| BIT_UNFILTERED // unfiltered |
| } bit_value_t; |
| |
| static bool ValueSet(bit_value_t V) { |
| return (V == BIT_TRUE || V == BIT_FALSE); |
| } |
| |
| static bool ValueNotSet(bit_value_t V) { |
| return (V == BIT_UNSET); |
| } |
| |
| static int Value(bit_value_t V) { |
| return ValueNotSet(V) ? -1 : (V == BIT_FALSE ? 0 : 1); |
| } |
| |
| static bit_value_t bitFromBits(const BitsInit &bits, unsigned index) { |
| if (BitInit *bit = dyn_cast<BitInit>(bits.getBit(index))) |
| return bit->getValue() ? BIT_TRUE : BIT_FALSE; |
| |
| // The bit is uninitialized. |
| return BIT_UNSET; |
| } |
| |
| // Prints the bit value for each position. |
| static void dumpBits(raw_ostream &o, const BitsInit &bits) { |
| for (unsigned index = bits.getNumBits(); index > 0; --index) { |
| switch (bitFromBits(bits, index - 1)) { |
| case BIT_TRUE: |
| o << "1"; |
| break; |
| case BIT_FALSE: |
| o << "0"; |
| break; |
| case BIT_UNSET: |
| o << "_"; |
| break; |
| default: |
| llvm_unreachable("unexpected return value from bitFromBits"); |
| } |
| } |
| } |
| |
| static BitsInit &getBitsField(const Record &def, StringRef str) { |
| BitsInit *bits = def.getValueAsBitsInit(str); |
| return *bits; |
| } |
| |
| // Representation of the instruction to work on. |
| typedef std::vector<bit_value_t> insn_t; |
| |
| namespace { |
| |
| class FilterChooser; |
| |
| /// Filter - Filter works with FilterChooser to produce the decoding tree for |
| /// the ISA. |
| /// |
| /// It is useful to think of a Filter as governing the switch stmts of the |
| /// decoding tree in a certain level. Each case stmt delegates to an inferior |
| /// FilterChooser to decide what further decoding logic to employ, or in another |
| /// words, what other remaining bits to look at. The FilterChooser eventually |
| /// chooses a best Filter to do its job. |
| /// |
| /// This recursive scheme ends when the number of Opcodes assigned to the |
| /// FilterChooser becomes 1 or if there is a conflict. A conflict happens when |
| /// the Filter/FilterChooser combo does not know how to distinguish among the |
| /// Opcodes assigned. |
| /// |
| /// An example of a conflict is |
| /// |
| /// Conflict: |
| /// 111101000.00........00010000.... |
| /// 111101000.00........0001........ |
| /// 1111010...00........0001........ |
| /// 1111010...00.................... |
| /// 1111010......................... |
| /// 1111............................ |
| /// ................................ |
| /// VST4q8a 111101000_00________00010000____ |
| /// VST4q8b 111101000_00________00010000____ |
| /// |
| /// The Debug output shows the path that the decoding tree follows to reach the |
| /// the conclusion that there is a conflict. VST4q8a is a vst4 to double-spaced |
| /// even registers, while VST4q8b is a vst4 to double-spaced odd registers. |
| /// |
| /// The encoding info in the .td files does not specify this meta information, |
| /// which could have been used by the decoder to resolve the conflict. The |
| /// decoder could try to decode the even/odd register numbering and assign to |
| /// VST4q8a or VST4q8b, but for the time being, the decoder chooses the "a" |
| /// version and return the Opcode since the two have the same Asm format string. |
| class Filter { |
| protected: |
| const FilterChooser *Owner;// points to the FilterChooser who owns this filter |
| unsigned StartBit; // the starting bit position |
| unsigned NumBits; // number of bits to filter |
| bool Mixed; // a mixed region contains both set and unset bits |
| |
| // Map of well-known segment value to the set of uid's with that value. |
| std::map<uint64_t, std::vector<unsigned>> FilteredInstructions; |
| |
| // Set of uid's with non-constant segment values. |
| std::vector<unsigned> VariableInstructions; |
| |
| // Map of well-known segment value to its delegate. |
| std::map<unsigned, std::unique_ptr<const FilterChooser>> FilterChooserMap; |
| |
| // Number of instructions which fall under FilteredInstructions category. |
| unsigned NumFiltered; |
| |
| // Keeps track of the last opcode in the filtered bucket. |
| unsigned LastOpcFiltered; |
| |
| public: |
| Filter(Filter &&f); |
| Filter(FilterChooser &owner, unsigned startBit, unsigned numBits, bool mixed); |
| |
| ~Filter() = default; |
| |
| unsigned getNumFiltered() const { return NumFiltered; } |
| |
| unsigned getSingletonOpc() const { |
| assert(NumFiltered == 1); |
| return LastOpcFiltered; |
| } |
| |
| // Return the filter chooser for the group of instructions without constant |
| // segment values. |
| const FilterChooser &getVariableFC() const { |
| assert(NumFiltered == 1); |
| assert(FilterChooserMap.size() == 1); |
| return *(FilterChooserMap.find((unsigned)-1)->second); |
| } |
| |
| // Divides the decoding task into sub tasks and delegates them to the |
| // inferior FilterChooser's. |
| // |
| // A special case arises when there's only one entry in the filtered |
| // instructions. In order to unambiguously decode the singleton, we need to |
| // match the remaining undecoded encoding bits against the singleton. |
| void recurse(); |
| |
| // Emit table entries to decode instructions given a segment or segments of |
| // bits. |
| void emitTableEntry(DecoderTableInfo &TableInfo) const; |
| |
| // Returns the number of fanout produced by the filter. More fanout implies |
| // the filter distinguishes more categories of instructions. |
| unsigned usefulness() const; |
| }; // end class Filter |
| |
| } // end anonymous namespace |
| |
| // These are states of our finite state machines used in FilterChooser's |
| // filterProcessor() which produces the filter candidates to use. |
| typedef enum { |
| ATTR_NONE, |
| ATTR_FILTERED, |
| ATTR_ALL_SET, |
| ATTR_ALL_UNSET, |
| ATTR_MIXED |
| } bitAttr_t; |
| |
| /// FilterChooser - FilterChooser chooses the best filter among a set of Filters |
| /// in order to perform the decoding of instructions at the current level. |
| /// |
| /// Decoding proceeds from the top down. Based on the well-known encoding bits |
| /// of instructions available, FilterChooser builds up the possible Filters that |
| /// can further the task of decoding by distinguishing among the remaining |
| /// candidate instructions. |
| /// |
| /// Once a filter has been chosen, it is called upon to divide the decoding task |
| /// into sub-tasks and delegates them to its inferior FilterChoosers for further |
| /// processings. |
| /// |
| /// It is useful to think of a Filter as governing the switch stmts of the |
| /// decoding tree. And each case is delegated to an inferior FilterChooser to |
| /// decide what further remaining bits to look at. |
| namespace { |
| |
| class FilterChooser { |
| protected: |
| friend class Filter; |
| |
| // Vector of codegen instructions to choose our filter. |
| ArrayRef<const CodeGenInstruction *> AllInstructions; |
| |
| // Vector of uid's for this filter chooser to work on. |
| const std::vector<unsigned> &Opcodes; |
| |
| // Lookup table for the operand decoding of instructions. |
| const std::map<unsigned, std::vector<OperandInfo>> &Operands; |
| |
| // Vector of candidate filters. |
| std::vector<Filter> Filters; |
| |
| // Array of bit values passed down from our parent. |
| // Set to all BIT_UNFILTERED's for Parent == NULL. |
| std::vector<bit_value_t> FilterBitValues; |
| |
| // Links to the FilterChooser above us in the decoding tree. |
| const FilterChooser *Parent; |
| |
| // Index of the best filter from Filters. |
| int BestIndex; |
| |
| // Width of instructions |
| unsigned BitWidth; |
| |
| // Parent emitter |
| const FixedLenDecoderEmitter *Emitter; |
| |
| public: |
| FilterChooser(ArrayRef<const CodeGenInstruction *> Insts, |
| const std::vector<unsigned> &IDs, |
| const std::map<unsigned, std::vector<OperandInfo>> &Ops, |
| unsigned BW, |
| const FixedLenDecoderEmitter *E) |
| : AllInstructions(Insts), Opcodes(IDs), Operands(Ops), |
| FilterBitValues(BW, BIT_UNFILTERED), Parent(nullptr), BestIndex(-1), |
| BitWidth(BW), Emitter(E) { |
| doFilter(); |
| } |
| |
| FilterChooser(ArrayRef<const CodeGenInstruction *> Insts, |
| const std::vector<unsigned> &IDs, |
| const std::map<unsigned, std::vector<OperandInfo>> &Ops, |
| const std::vector<bit_value_t> &ParentFilterBitValues, |
| const FilterChooser &parent) |
| : AllInstructions(Insts), Opcodes(IDs), Operands(Ops), |
| FilterBitValues(ParentFilterBitValues), Parent(&parent), BestIndex(-1), |
| BitWidth(parent.BitWidth), Emitter(parent.Emitter) { |
| doFilter(); |
| } |
| |
| FilterChooser(const FilterChooser &) = delete; |
| void operator=(const FilterChooser &) = delete; |
| |
| unsigned getBitWidth() const { return BitWidth; } |
| |
| protected: |
| // Populates the insn given the uid. |
| void insnWithID(insn_t &Insn, unsigned Opcode) const { |
| BitsInit &Bits = getBitsField(*AllInstructions[Opcode]->TheDef, "Inst"); |
| |
| // We may have a SoftFail bitmask, which specifies a mask where an encoding |
| // may differ from the value in "Inst" and yet still be valid, but the |
| // disassembler should return SoftFail instead of Success. |
| // |
| // This is used for marking UNPREDICTABLE instructions in the ARM world. |
| BitsInit *SFBits = |
| AllInstructions[Opcode]->TheDef->getValueAsBitsInit("SoftFail"); |
| |
| for (unsigned i = 0; i < BitWidth; ++i) { |
| if (SFBits && bitFromBits(*SFBits, i) == BIT_TRUE) |
| Insn.push_back(BIT_UNSET); |
| else |
| Insn.push_back(bitFromBits(Bits, i)); |
| } |
| } |
| |
| // Returns the record name. |
| const StringRef nameWithID(unsigned Opcode) const { |
| return AllInstructions[Opcode]->TheDef->getName(); |
| } |
| |
| // Populates the field of the insn given the start position and the number of |
| // consecutive bits to scan for. |
| // |
| // Returns false if there exists any uninitialized bit value in the range. |
| // Returns true, otherwise. |
| bool fieldFromInsn(uint64_t &Field, insn_t &Insn, unsigned StartBit, |
| unsigned NumBits) const; |
| |
| /// dumpFilterArray - dumpFilterArray prints out debugging info for the given |
| /// filter array as a series of chars. |
| void dumpFilterArray(raw_ostream &o, |
| const std::vector<bit_value_t> & filter) const; |
| |
| /// dumpStack - dumpStack traverses the filter chooser chain and calls |
| /// dumpFilterArray on each filter chooser up to the top level one. |
| void dumpStack(raw_ostream &o, const char *prefix) const; |
| |
| Filter &bestFilter() { |
| assert(BestIndex != -1 && "BestIndex not set"); |
| return Filters[BestIndex]; |
| } |
| |
| bool PositionFiltered(unsigned i) const { |
| return ValueSet(FilterBitValues[i]); |
| } |
| |
| // Calculates the island(s) needed to decode the instruction. |
| // This returns a lit of undecoded bits of an instructions, for example, |
| // Inst{20} = 1 && Inst{3-0} == 0b1111 represents two islands of yet-to-be |
| // decoded bits in order to verify that the instruction matches the Opcode. |
| unsigned getIslands(std::vector<unsigned> &StartBits, |
| std::vector<unsigned> &EndBits, |
| std::vector<uint64_t> &FieldVals, |
| const insn_t &Insn) const; |
| |
| // Emits code to check the Predicates member of an instruction are true. |
| // Returns true if predicate matches were emitted, false otherwise. |
| bool emitPredicateMatch(raw_ostream &o, unsigned &Indentation, |
| unsigned Opc) const; |
| |
| bool doesOpcodeNeedPredicate(unsigned Opc) const; |
| unsigned getPredicateIndex(DecoderTableInfo &TableInfo, StringRef P) const; |
| void emitPredicateTableEntry(DecoderTableInfo &TableInfo, |
| unsigned Opc) const; |
| |
| void emitSoftFailTableEntry(DecoderTableInfo &TableInfo, |
| unsigned Opc) const; |
| |
| // Emits table entries to decode the singleton. |
| void emitSingletonTableEntry(DecoderTableInfo &TableInfo, |
| unsigned Opc) const; |
| |
| // Emits code to decode the singleton, and then to decode the rest. |
| void emitSingletonTableEntry(DecoderTableInfo &TableInfo, |
| const Filter &Best) const; |
| |
| void emitBinaryParser(raw_ostream &o, unsigned &Indentation, |
| const OperandInfo &OpInfo, |
| bool &OpHasCompleteDecoder) const; |
| |
| void emitDecoder(raw_ostream &OS, unsigned Indentation, unsigned Opc, |
| bool &HasCompleteDecoder) const; |
| unsigned getDecoderIndex(DecoderSet &Decoders, unsigned Opc, |
| bool &HasCompleteDecoder) const; |
| |
| // Assign a single filter and run with it. |
| void runSingleFilter(unsigned startBit, unsigned numBit, bool mixed); |
| |
| // reportRegion is a helper function for filterProcessor to mark a region as |
| // eligible for use as a filter region. |
| void reportRegion(bitAttr_t RA, unsigned StartBit, unsigned BitIndex, |
| bool AllowMixed); |
| |
| // FilterProcessor scans the well-known encoding bits of the instructions and |
| // builds up a list of candidate filters. It chooses the best filter and |
| // recursively descends down the decoding tree. |
| bool filterProcessor(bool AllowMixed, bool Greedy = true); |
| |
| // Decides on the best configuration of filter(s) to use in order to decode |
| // the instructions. A conflict of instructions may occur, in which case we |
| // dump the conflict set to the standard error. |
| void doFilter(); |
| |
| public: |
| // emitTableEntries - Emit state machine entries to decode our share of |
| // instructions. |
| void emitTableEntries(DecoderTableInfo &TableInfo) const; |
| }; |
| |
| } // end anonymous namespace |
| |
| /////////////////////////// |
| // // |
| // Filter Implementation // |
| // // |
| /////////////////////////// |
| |
| Filter::Filter(Filter &&f) |
| : Owner(f.Owner), StartBit(f.StartBit), NumBits(f.NumBits), Mixed(f.Mixed), |
| FilteredInstructions(std::move(f.FilteredInstructions)), |
| VariableInstructions(std::move(f.VariableInstructions)), |
| FilterChooserMap(std::move(f.FilterChooserMap)), NumFiltered(f.NumFiltered), |
| LastOpcFiltered(f.LastOpcFiltered) { |
| } |
| |
| Filter::Filter(FilterChooser &owner, unsigned startBit, unsigned numBits, |
| bool mixed) |
| : Owner(&owner), StartBit(startBit), NumBits(numBits), Mixed(mixed) { |
| assert(StartBit + NumBits - 1 < Owner->BitWidth); |
| |
| NumFiltered = 0; |
| LastOpcFiltered = 0; |
| |
| for (unsigned i = 0, e = Owner->Opcodes.size(); i != e; ++i) { |
| insn_t Insn; |
| |
| // Populates the insn given the uid. |
| Owner->insnWithID(Insn, Owner->Opcodes[i]); |
| |
| uint64_t Field; |
| // Scans the segment for possibly well-specified encoding bits. |
| bool ok = Owner->fieldFromInsn(Field, Insn, StartBit, NumBits); |
| |
| if (ok) { |
| // The encoding bits are well-known. Lets add the uid of the |
| // instruction into the bucket keyed off the constant field value. |
| LastOpcFiltered = Owner->Opcodes[i]; |
| FilteredInstructions[Field].push_back(LastOpcFiltered); |
| ++NumFiltered; |
| } else { |
| // Some of the encoding bit(s) are unspecified. This contributes to |
| // one additional member of "Variable" instructions. |
| VariableInstructions.push_back(Owner->Opcodes[i]); |
| } |
| } |
| |
| assert((FilteredInstructions.size() + VariableInstructions.size() > 0) |
| && "Filter returns no instruction categories"); |
| } |
| |
| // Divides the decoding task into sub tasks and delegates them to the |
| // inferior FilterChooser's. |
| // |
| // A special case arises when there's only one entry in the filtered |
| // instructions. In order to unambiguously decode the singleton, we need to |
| // match the remaining undecoded encoding bits against the singleton. |
| void Filter::recurse() { |
| // Starts by inheriting our parent filter chooser's filter bit values. |
| std::vector<bit_value_t> BitValueArray(Owner->FilterBitValues); |
| |
| if (!VariableInstructions.empty()) { |
| // Conservatively marks each segment position as BIT_UNSET. |
| for (unsigned bitIndex = 0; bitIndex < NumBits; ++bitIndex) |
| BitValueArray[StartBit + bitIndex] = BIT_UNSET; |
| |
| // Delegates to an inferior filter chooser for further processing on this |
| // group of instructions whose segment values are variable. |
| FilterChooserMap.insert( |
| std::make_pair(-1U, llvm::make_unique<FilterChooser>( |
| Owner->AllInstructions, VariableInstructions, |
| Owner->Operands, BitValueArray, *Owner))); |
| } |
| |
| // No need to recurse for a singleton filtered instruction. |
| // See also Filter::emit*(). |
| if (getNumFiltered() == 1) { |
| assert(FilterChooserMap.size() == 1); |
| return; |
| } |
| |
| // Otherwise, create sub choosers. |
| for (const auto &Inst : FilteredInstructions) { |
| |
| // Marks all the segment positions with either BIT_TRUE or BIT_FALSE. |
| for (unsigned bitIndex = 0; bitIndex < NumBits; ++bitIndex) { |
| if (Inst.first & (1ULL << bitIndex)) |
| BitValueArray[StartBit + bitIndex] = BIT_TRUE; |
| else |
| BitValueArray[StartBit + bitIndex] = BIT_FALSE; |
| } |
| |
| // Delegates to an inferior filter chooser for further processing on this |
| // category of instructions. |
| FilterChooserMap.insert(std::make_pair( |
| Inst.first, llvm::make_unique<FilterChooser>( |
| Owner->AllInstructions, Inst.second, |
| Owner->Operands, BitValueArray, *Owner))); |
| } |
| } |
| |
| static void resolveTableFixups(DecoderTable &Table, const FixupList &Fixups, |
| uint32_t DestIdx) { |
| // Any NumToSkip fixups in the current scope can resolve to the |
| // current location. |
| for (FixupList::const_reverse_iterator I = Fixups.rbegin(), |
| E = Fixups.rend(); |
| I != E; ++I) { |
| // Calculate the distance from the byte following the fixup entry byte |
| // to the destination. The Target is calculated from after the 16-bit |
| // NumToSkip entry itself, so subtract two from the displacement here |
| // to account for that. |
| uint32_t FixupIdx = *I; |
| uint32_t Delta = DestIdx - FixupIdx - 3; |
| // Our NumToSkip entries are 24-bits. Make sure our table isn't too |
| // big. |
| assert(Delta < (1u << 24)); |
| Table[FixupIdx] = (uint8_t)Delta; |
| Table[FixupIdx + 1] = (uint8_t)(Delta >> 8); |
| Table[FixupIdx + 2] = (uint8_t)(Delta >> 16); |
| } |
| } |
| |
| // Emit table entries to decode instructions given a segment or segments |
| // of bits. |
| void Filter::emitTableEntry(DecoderTableInfo &TableInfo) const { |
| TableInfo.Table.push_back(MCD::OPC_ExtractField); |
| TableInfo.Table.push_back(StartBit); |
| TableInfo.Table.push_back(NumBits); |
| |
| // A new filter entry begins a new scope for fixup resolution. |
| TableInfo.FixupStack.emplace_back(); |
| |
| DecoderTable &Table = TableInfo.Table; |
| |
| size_t PrevFilter = 0; |
| bool HasFallthrough = false; |
| for (auto &Filter : FilterChooserMap) { |
| // Field value -1 implies a non-empty set of variable instructions. |
| // See also recurse(). |
| if (Filter.first == (unsigned)-1) { |
| HasFallthrough = true; |
| |
| // Each scope should always have at least one filter value to check |
| // for. |
| assert(PrevFilter != 0 && "empty filter set!"); |
| FixupList &CurScope = TableInfo.FixupStack.back(); |
| // Resolve any NumToSkip fixups in the current scope. |
| resolveTableFixups(Table, CurScope, Table.size()); |
| CurScope.clear(); |
| PrevFilter = 0; // Don't re-process the filter's fallthrough. |
| } else { |
| Table.push_back(MCD::OPC_FilterValue); |
| // Encode and emit the value to filter against. |
| uint8_t Buffer[16]; |
| unsigned Len = encodeULEB128(Filter.first, Buffer); |
| Table.insert(Table.end(), Buffer, Buffer + Len); |
| // Reserve space for the NumToSkip entry. We'll backpatch the value |
| // later. |
| PrevFilter = Table.size(); |
| Table.push_back(0); |
| Table.push_back(0); |
| Table.push_back(0); |
| } |
| |
| // We arrive at a category of instructions with the same segment value. |
| // Now delegate to the sub filter chooser for further decodings. |
| // The case may fallthrough, which happens if the remaining well-known |
| // encoding bits do not match exactly. |
| Filter.second->emitTableEntries(TableInfo); |
| |
| // Now that we've emitted the body of the handler, update the NumToSkip |
| // of the filter itself to be able to skip forward when false. Subtract |
| // two as to account for the width of the NumToSkip field itself. |
| if (PrevFilter) { |
| uint32_t NumToSkip = Table.size() - PrevFilter - 3; |
| assert(NumToSkip < (1u << 24) && "disassembler decoding table too large!"); |
| Table[PrevFilter] = (uint8_t)NumToSkip; |
| Table[PrevFilter + 1] = (uint8_t)(NumToSkip >> 8); |
| Table[PrevFilter + 2] = (uint8_t)(NumToSkip >> 16); |
| } |
| } |
| |
| // Any remaining unresolved fixups bubble up to the parent fixup scope. |
| assert(TableInfo.FixupStack.size() > 1 && "fixup stack underflow!"); |
| FixupScopeList::iterator Source = TableInfo.FixupStack.end() - 1; |
| FixupScopeList::iterator Dest = Source - 1; |
| Dest->insert(Dest->end(), Source->begin(), Source->end()); |
| TableInfo.FixupStack.pop_back(); |
| |
| // If there is no fallthrough, then the final filter should get fixed |
| // up according to the enclosing scope rather than the current position. |
| if (!HasFallthrough) |
| TableInfo.FixupStack.back().push_back(PrevFilter); |
| } |
| |
| // Returns the number of fanout produced by the filter. More fanout implies |
| // the filter distinguishes more categories of instructions. |
| unsigned Filter::usefulness() const { |
| if (!VariableInstructions.empty()) |
| return FilteredInstructions.size(); |
| else |
| return FilteredInstructions.size() + 1; |
| } |
| |
| ////////////////////////////////// |
| // // |
| // Filterchooser Implementation // |
| // // |
| ////////////////////////////////// |
| |
| // Emit the decoder state machine table. |
| void FixedLenDecoderEmitter::emitTable(formatted_raw_ostream &OS, |
| DecoderTable &Table, |
| unsigned Indentation, |
| unsigned BitWidth, |
| StringRef Namespace) const { |
| OS.indent(Indentation) << "static const uint8_t DecoderTable" << Namespace |
| << BitWidth << "[] = {\n"; |
| |
| Indentation += 2; |
| |
| // FIXME: We may be able to use the NumToSkip values to recover |
| // appropriate indentation levels. |
| DecoderTable::const_iterator I = Table.begin(); |
| DecoderTable::const_iterator E = Table.end(); |
| while (I != E) { |
| assert (I < E && "incomplete decode table entry!"); |
| |
| uint64_t Pos = I - Table.begin(); |
| OS << "/* " << Pos << " */"; |
| OS.PadToColumn(12); |
| |
| switch (*I) { |
| default: |
| PrintFatalError("invalid decode table opcode"); |
| case MCD::OPC_ExtractField: { |
| ++I; |
| unsigned Start = *I++; |
| unsigned Len = *I++; |
| OS.indent(Indentation) << "MCD::OPC_ExtractField, " << Start << ", " |
| << Len << ", // Inst{"; |
| if (Len > 1) |
| OS << (Start + Len - 1) << "-"; |
| OS << Start << "} ...\n"; |
| break; |
| } |
| case MCD::OPC_FilterValue: { |
| ++I; |
| OS.indent(Indentation) << "MCD::OPC_FilterValue, "; |
| // The filter value is ULEB128 encoded. |
| while (*I >= 128) |
| OS << (unsigned)*I++ << ", "; |
| OS << (unsigned)*I++ << ", "; |
| |
| // 24-bit numtoskip value. |
| uint8_t Byte = *I++; |
| uint32_t NumToSkip = Byte; |
| OS << (unsigned)Byte << ", "; |
| Byte = *I++; |
| OS << (unsigned)Byte << ", "; |
| NumToSkip |= Byte << 8; |
| Byte = *I++; |
| OS << utostr(Byte) << ", "; |
| NumToSkip |= Byte << 16; |
| OS << "// Skip to: " << ((I - Table.begin()) + NumToSkip) << "\n"; |
| break; |
| } |
| case MCD::OPC_CheckField: { |
| ++I; |
| unsigned Start = *I++; |
| unsigned Len = *I++; |
| OS.indent(Indentation) << "MCD::OPC_CheckField, " << Start << ", " |
| << Len << ", ";// << Val << ", " << NumToSkip << ",\n"; |
| // ULEB128 encoded field value. |
| for (; *I >= 128; ++I) |
| OS << (unsigned)*I << ", "; |
| OS << (unsigned)*I++ << ", "; |
| // 24-bit numtoskip value. |
| uint8_t Byte = *I++; |
| uint32_t NumToSkip = Byte; |
| OS << (unsigned)Byte << ", "; |
| Byte = *I++; |
| OS << (unsigned)Byte << ", "; |
| NumToSkip |= Byte << 8; |
| Byte = *I++; |
| OS << utostr(Byte) << ", "; |
| NumToSkip |= Byte << 16; |
| OS << "// Skip to: " << ((I - Table.begin()) + NumToSkip) << "\n"; |
| break; |
| } |
| case MCD::OPC_CheckPredicate: { |
| ++I; |
| OS.indent(Indentation) << "MCD::OPC_CheckPredicate, "; |
| for (; *I >= 128; ++I) |
| OS << (unsigned)*I << ", "; |
| OS << (unsigned)*I++ << ", "; |
| |
| // 24-bit numtoskip value. |
| uint8_t Byte = *I++; |
| uint32_t NumToSkip = Byte; |
| OS << (unsigned)Byte << ", "; |
| Byte = *I++; |
| OS << (unsigned)Byte << ", "; |
| NumToSkip |= Byte << 8; |
| Byte = *I++; |
| OS << utostr(Byte) << ", "; |
| NumToSkip |= Byte << 16; |
| OS << "// Skip to: " << ((I - Table.begin()) + NumToSkip) << "\n"; |
| break; |
| } |
| case MCD::OPC_Decode: |
| case MCD::OPC_TryDecode: { |
| bool IsTry = *I == MCD::OPC_TryDecode; |
| ++I; |
| // Extract the ULEB128 encoded Opcode to a buffer. |
| uint8_t Buffer[16], *p = Buffer; |
| while ((*p++ = *I++) >= 128) |
| assert((p - Buffer) <= (ptrdiff_t)sizeof(Buffer) |
| && "ULEB128 value too large!"); |
| // Decode the Opcode value. |
| unsigned Opc = decodeULEB128(Buffer); |
| OS.indent(Indentation) << "MCD::OPC_" << (IsTry ? "Try" : "") |
| << "Decode, "; |
| for (p = Buffer; *p >= 128; ++p) |
| OS << (unsigned)*p << ", "; |
| OS << (unsigned)*p << ", "; |
| |
| // Decoder index. |
| for (; *I >= 128; ++I) |
| OS << (unsigned)*I << ", "; |
| OS << (unsigned)*I++ << ", "; |
| |
| if (!IsTry) { |
| OS << "// Opcode: " |
| << NumberedInstructions[Opc]->TheDef->getName() << "\n"; |
| break; |
| } |
| |
| // Fallthrough for OPC_TryDecode. |
| |
| // 24-bit numtoskip value. |
| uint8_t Byte = *I++; |
| uint32_t NumToSkip = Byte; |
| OS << (unsigned)Byte << ", "; |
| Byte = *I++; |
| OS << (unsigned)Byte << ", "; |
| NumToSkip |= Byte << 8; |
| Byte = *I++; |
| OS << utostr(Byte) << ", "; |
| NumToSkip |= Byte << 16; |
| |
| OS << "// Opcode: " |
| << NumberedInstructions[Opc]->TheDef->getName() |
| << ", skip to: " << ((I - Table.begin()) + NumToSkip) << "\n"; |
| break; |
| } |
| case MCD::OPC_SoftFail: { |
| ++I; |
| OS.indent(Indentation) << "MCD::OPC_SoftFail"; |
| // Positive mask |
| uint64_t Value = 0; |
| unsigned Shift = 0; |
| do { |
| OS << ", " << (unsigned)*I; |
| Value += (*I & 0x7f) << Shift; |
| Shift += 7; |
| } while (*I++ >= 128); |
| if (Value > 127) { |
| OS << " /* 0x"; |
| OS.write_hex(Value); |
| OS << " */"; |
| } |
| // Negative mask |
| Value = 0; |
| Shift = 0; |
| do { |
| OS << ", " << (unsigned)*I; |
| Value += (*I & 0x7f) << Shift; |
| Shift += 7; |
| } while (*I++ >= 128); |
| if (Value > 127) { |
| OS << " /* 0x"; |
| OS.write_hex(Value); |
| OS << " */"; |
| } |
| OS << ",\n"; |
| break; |
| } |
| case MCD::OPC_Fail: { |
| ++I; |
| OS.indent(Indentation) << "MCD::OPC_Fail,\n"; |
| break; |
| } |
| } |
| } |
| OS.indent(Indentation) << "0\n"; |
| |
| Indentation -= 2; |
| |
| OS.indent(Indentation) << "};\n\n"; |
| } |
| |
| void FixedLenDecoderEmitter:: |
| emitPredicateFunction(formatted_raw_ostream &OS, PredicateSet &Predicates, |
| unsigned Indentation) const { |
| // The predicate function is just a big switch statement based on the |
| // input predicate index. |
| OS.indent(Indentation) << "static bool checkDecoderPredicate(unsigned Idx, " |
| << "const FeatureBitset& Bits) {\n"; |
| Indentation += 2; |
| if (!Predicates.empty()) { |
| OS.indent(Indentation) << "switch (Idx) {\n"; |
| OS.indent(Indentation) << "default: llvm_unreachable(\"Invalid index!\");\n"; |
| unsigned Index = 0; |
| for (const auto &Predicate : Predicates) { |
| OS.indent(Indentation) << "case " << Index++ << ":\n"; |
| OS.indent(Indentation+2) << "return (" << Predicate << ");\n"; |
| } |
| OS.indent(Indentation) << "}\n"; |
| } else { |
| // No case statement to emit |
| OS.indent(Indentation) << "llvm_unreachable(\"Invalid index!\");\n"; |
| } |
| Indentation -= 2; |
| OS.indent(Indentation) << "}\n\n"; |
| } |
| |
| void FixedLenDecoderEmitter:: |
| emitDecoderFunction(formatted_raw_ostream &OS, DecoderSet &Decoders, |
| unsigned Indentation) const { |
| // The decoder function is just a big switch statement based on the |
| // input decoder index. |
| OS.indent(Indentation) << "template<typename InsnType>\n"; |
| OS.indent(Indentation) << "static DecodeStatus decodeToMCInst(DecodeStatus S," |
| << " unsigned Idx, InsnType insn, MCInst &MI,\n"; |
| OS.indent(Indentation) << " uint64_t " |
| << "Address, const void *Decoder, bool &DecodeComplete) {\n"; |
| Indentation += 2; |
| OS.indent(Indentation) << "DecodeComplete = true;\n"; |
| OS.indent(Indentation) << "InsnType tmp;\n"; |
| OS.indent(Indentation) << "switch (Idx) {\n"; |
| OS.indent(Indentation) << "default: llvm_unreachable(\"Invalid index!\");\n"; |
| unsigned Index = 0; |
| for (const auto &Decoder : Decoders) { |
| OS.indent(Indentation) << "case " << Index++ << ":\n"; |
| OS << Decoder; |
| OS.indent(Indentation+2) << "return S;\n"; |
| } |
| OS.indent(Indentation) << "}\n"; |
| Indentation -= 2; |
| OS.indent(Indentation) << "}\n\n"; |
| } |
| |
| // Populates the field of the insn given the start position and the number of |
| // consecutive bits to scan for. |
| // |
| // Returns false if and on the first uninitialized bit value encountered. |
| // Returns true, otherwise. |
| bool FilterChooser::fieldFromInsn(uint64_t &Field, insn_t &Insn, |
| unsigned StartBit, unsigned NumBits) const { |
| Field = 0; |
| |
| for (unsigned i = 0; i < NumBits; ++i) { |
| if (Insn[StartBit + i] == BIT_UNSET) |
| return false; |
| |
| if (Insn[StartBit + i] == BIT_TRUE) |
| Field = Field | (1ULL << i); |
| } |
| |
| return true; |
| } |
| |
| /// dumpFilterArray - dumpFilterArray prints out debugging info for the given |
| /// filter array as a series of chars. |
| void FilterChooser::dumpFilterArray(raw_ostream &o, |
| const std::vector<bit_value_t> &filter) const { |
| for (unsigned bitIndex = BitWidth; bitIndex > 0; bitIndex--) { |
| switch (filter[bitIndex - 1]) { |
| case BIT_UNFILTERED: |
| o << "."; |
| break; |
| case BIT_UNSET: |
| o << "_"; |
| break; |
| case BIT_TRUE: |
| o << "1"; |
| break; |
| case BIT_FALSE: |
| o << "0"; |
| break; |
| } |
| } |
| } |
| |
| /// dumpStack - dumpStack traverses the filter chooser chain and calls |
| /// dumpFilterArray on each filter chooser up to the top level one. |
| void FilterChooser::dumpStack(raw_ostream &o, const char *prefix) const { |
| const FilterChooser *current = this; |
| |
| while (current) { |
| o << prefix; |
| dumpFilterArray(o, current->FilterBitValues); |
| o << '\n'; |
| current = current->Parent; |
| } |
| } |
| |
| // Calculates the island(s) needed to decode the instruction. |
| // This returns a list of undecoded bits of an instructions, for example, |
| // Inst{20} = 1 && Inst{3-0} == 0b1111 represents two islands of yet-to-be |
| // decoded bits in order to verify that the instruction matches the Opcode. |
| unsigned FilterChooser::getIslands(std::vector<unsigned> &StartBits, |
| std::vector<unsigned> &EndBits, |
| std::vector<uint64_t> &FieldVals, |
| const insn_t &Insn) const { |
| unsigned Num, BitNo; |
| Num = BitNo = 0; |
| |
| uint64_t FieldVal = 0; |
| |
| // 0: Init |
| // 1: Water (the bit value does not affect decoding) |
| // 2: Island (well-known bit value needed for decoding) |
| int State = 0; |
| int Val = -1; |
| |
| for (unsigned i = 0; i < BitWidth; ++i) { |
| Val = Value(Insn[i]); |
| bool Filtered = PositionFiltered(i); |
| switch (State) { |
| default: llvm_unreachable("Unreachable code!"); |
| case 0: |
| case 1: |
| if (Filtered || Val == -1) |
| State = 1; // Still in Water |
| else { |
| State = 2; // Into the Island |
| BitNo = 0; |
| StartBits.push_back(i); |
| FieldVal = Val; |
| } |
| break; |
| case 2: |
| if (Filtered || Val == -1) { |
| State = 1; // Into the Water |
| EndBits.push_back(i - 1); |
| FieldVals.push_back(FieldVal); |
| ++Num; |
| } else { |
| State = 2; // Still in Island |
| ++BitNo; |
| FieldVal = FieldVal | Val << BitNo; |
| } |
| break; |
| } |
| } |
| // If we are still in Island after the loop, do some housekeeping. |
| if (State == 2) { |
| EndBits.push_back(BitWidth - 1); |
| FieldVals.push_back(FieldVal); |
| ++Num; |
| } |
| |
| assert(StartBits.size() == Num && EndBits.size() == Num && |
| FieldVals.size() == Num); |
| return Num; |
| } |
| |
| void FilterChooser::emitBinaryParser(raw_ostream &o, unsigned &Indentation, |
| const OperandInfo &OpInfo, |
| bool &OpHasCompleteDecoder) const { |
| const std::string &Decoder = OpInfo.Decoder; |
| |
| if (OpInfo.numFields() != 1) |
| o.indent(Indentation) << "tmp = 0;\n"; |
| |
| for (const EncodingField &EF : OpInfo) { |
| o.indent(Indentation) << "tmp "; |
| if (OpInfo.numFields() != 1) o << '|'; |
| o << "= fieldFromInstruction" |
| << "(insn, " << EF.Base << ", " << EF.Width << ')'; |
| if (OpInfo.numFields() != 1 || EF.Offset != 0) |
| o << " << " << EF.Offset; |
| o << ";\n"; |
| } |
| |
| if (Decoder != "") { |
| OpHasCompleteDecoder = OpInfo.HasCompleteDecoder; |
| o.indent(Indentation) << Emitter->GuardPrefix << Decoder |
| << "(MI, tmp, Address, Decoder)" |
| << Emitter->GuardPostfix |
| << " { " << (OpHasCompleteDecoder ? "" : "DecodeComplete = false; ") |
| << "return MCDisassembler::Fail; }\n"; |
| } else { |
| OpHasCompleteDecoder = true; |
| o.indent(Indentation) << "MI.addOperand(MCOperand::createImm(tmp));\n"; |
| } |
| } |
| |
| void FilterChooser::emitDecoder(raw_ostream &OS, unsigned Indentation, |
| unsigned Opc, bool &HasCompleteDecoder) const { |
| HasCompleteDecoder = true; |
| |
| for (const auto &Op : Operands.find(Opc)->second) { |
| // If a custom instruction decoder was specified, use that. |
| if (Op.numFields() == 0 && !Op.Decoder.empty()) { |
| HasCompleteDecoder = Op.HasCompleteDecoder; |
| OS.indent(Indentation) << Emitter->GuardPrefix << Op.Decoder |
| << "(MI, insn, Address, Decoder)" |
| << Emitter->GuardPostfix |
| << " { " << (HasCompleteDecoder ? "" : "DecodeComplete = false; ") |
| << "return MCDisassembler::Fail; }\n"; |
| break; |
| } |
| |
| bool OpHasCompleteDecoder; |
| emitBinaryParser(OS, Indentation, Op, OpHasCompleteDecoder); |
| if (!OpHasCompleteDecoder) |
| HasCompleteDecoder = false; |
| } |
| } |
| |
| unsigned FilterChooser::getDecoderIndex(DecoderSet &Decoders, |
| unsigned Opc, |
| bool &HasCompleteDecoder) const { |
| // Build up the predicate string. |
| SmallString<256> Decoder; |
| // FIXME: emitDecoder() function can take a buffer directly rather than |
| // a stream. |
| raw_svector_ostream S(Decoder); |
| unsigned I = 4; |
| emitDecoder(S, I, Opc, HasCompleteDecoder); |
| |
| // Using the full decoder string as the key value here is a bit |
| // heavyweight, but is effective. If the string comparisons become a |
| // performance concern, we can implement a mangling of the predicate |
| // data easily enough with a map back to the actual string. That's |
| // overkill for now, though. |
| |
| // Make sure the predicate is in the table. |
| Decoders.insert(CachedHashString(Decoder)); |
| // Now figure out the index for when we write out the table. |
| DecoderSet::const_iterator P = find(Decoders, Decoder.str()); |
| return (unsigned)(P - Decoders.begin()); |
| } |
| |
| static void emitSinglePredicateMatch(raw_ostream &o, StringRef str, |
| const std::string &PredicateNamespace) { |
| if (str[0] == '!') |
| o << "!Bits[" << PredicateNamespace << "::" |
| << str.slice(1,str.size()) << "]"; |
| else |
| o << "Bits[" << PredicateNamespace << "::" << str << "]"; |
| } |
| |
| bool FilterChooser::emitPredicateMatch(raw_ostream &o, unsigned &Indentation, |
| unsigned Opc) const { |
| ListInit *Predicates = |
| AllInstructions[Opc]->TheDef->getValueAsListInit("Predicates"); |
| bool IsFirstEmission = true; |
| for (unsigned i = 0; i < Predicates->size(); ++i) { |
| Record *Pred = Predicates->getElementAsRecord(i); |
| if (!Pred->getValue("AssemblerMatcherPredicate")) |
| continue; |
| |
| StringRef P = Pred->getValueAsString("AssemblerCondString"); |
| |
| if (P.empty()) |
| continue; |
| |
| if (!IsFirstEmission) |
| o << " && "; |
| |
| std::pair<StringRef, StringRef> pairs = P.split(','); |
| while (!pairs.second.empty()) { |
| emitSinglePredicateMatch(o, pairs.first, Emitter->PredicateNamespace); |
| o << " && "; |
| pairs = pairs.second.split(','); |
| } |
| emitSinglePredicateMatch(o, pairs.first, Emitter->PredicateNamespace); |
| IsFirstEmission = false; |
| } |
| return !Predicates->empty(); |
| } |
| |
| bool FilterChooser::doesOpcodeNeedPredicate(unsigned Opc) const { |
| ListInit *Predicates = |
| AllInstructions[Opc]->TheDef->getValueAsListInit("Predicates"); |
| for (unsigned i = 0; i < Predicates->size(); ++i) { |
| Record *Pred = Predicates->getElementAsRecord(i); |
| if (!Pred->getValue("AssemblerMatcherPredicate")) |
| continue; |
| |
| StringRef P = Pred->getValueAsString("AssemblerCondString"); |
| |
| if (P.empty()) |
| continue; |
| |
| return true; |
| } |
| return false; |
| } |
| |
| unsigned FilterChooser::getPredicateIndex(DecoderTableInfo &TableInfo, |
| StringRef Predicate) const { |
| // Using the full predicate string as the key value here is a bit |
| // heavyweight, but is effective. If the string comparisons become a |
| // performance concern, we can implement a mangling of the predicate |
| // data easily enough with a map back to the actual string. That's |
| // overkill for now, though. |
| |
| // Make sure the predicate is in the table. |
| TableInfo.Predicates.insert(CachedHashString(Predicate)); |
| // Now figure out the index for when we write out the table. |
| PredicateSet::const_iterator P = find(TableInfo.Predicates, Predicate); |
| return (unsigned)(P - TableInfo.Predicates.begin()); |
| } |
| |
| void FilterChooser::emitPredicateTableEntry(DecoderTableInfo &TableInfo, |
| unsigned Opc) const { |
| if (!doesOpcodeNeedPredicate(Opc)) |
| return; |
| |
| // Build up the predicate string. |
| SmallString<256> Predicate; |
| // FIXME: emitPredicateMatch() functions can take a buffer directly rather |
| // than a stream. |
| raw_svector_ostream PS(Predicate); |
| unsigned I = 0; |
| emitPredicateMatch(PS, I, Opc); |
| |
| // Figure out the index into the predicate table for the predicate just |
| // computed. |
| unsigned PIdx = getPredicateIndex(TableInfo, PS.str()); |
| SmallString<16> PBytes; |
| raw_svector_ostream S(PBytes); |
| encodeULEB128(PIdx, S); |
| |
| TableInfo.Table.push_back(MCD::OPC_CheckPredicate); |
| // Predicate index |
| for (unsigned i = 0, e = PBytes.size(); i != e; ++i) |
| TableInfo.Table.push_back(PBytes[i]); |
| // Push location for NumToSkip backpatching. |
| TableInfo.FixupStack.back().push_back(TableInfo.Table.size()); |
| TableInfo.Table.push_back(0); |
| TableInfo.Table.push_back(0); |
| TableInfo.Table.push_back(0); |
| } |
| |
| void FilterChooser::emitSoftFailTableEntry(DecoderTableInfo &TableInfo, |
| unsigned Opc) const { |
| BitsInit *SFBits = |
| AllInstructions[Opc]->TheDef->getValueAsBitsInit("SoftFail"); |
| if (!SFBits) return; |
| BitsInit *InstBits = AllInstructions[Opc]->TheDef->getValueAsBitsInit("Inst"); |
| |
| APInt PositiveMask(BitWidth, 0ULL); |
| APInt NegativeMask(BitWidth, 0ULL); |
| for (unsigned i = 0; i < BitWidth; ++i) { |
| bit_value_t B = bitFromBits(*SFBits, i); |
| bit_value_t IB = bitFromBits(*InstBits, i); |
| |
| if (B != BIT_TRUE) continue; |
| |
| switch (IB) { |
| case BIT_FALSE: |
| // The bit is meant to be false, so emit a check to see if it is true. |
| PositiveMask.setBit(i); |
| break; |
| case BIT_TRUE: |
| // The bit is meant to be true, so emit a check to see if it is false. |
| NegativeMask.setBit(i); |
| break; |
| default: |
| // The bit is not set; this must be an error! |
| StringRef Name = AllInstructions[Opc]->TheDef->getName(); |
| errs() << "SoftFail Conflict: bit SoftFail{" << i << "} in " << Name |
| << " is set but Inst{" << i << "} is unset!\n" |
| << " - You can only mark a bit as SoftFail if it is fully defined" |
| << " (1/0 - not '?') in Inst\n"; |
| return; |
| } |
| } |
| |
| bool NeedPositiveMask = PositiveMask.getBoolValue(); |
| bool NeedNegativeMask = NegativeMask.getBoolValue(); |
| |
| if (!NeedPositiveMask && !NeedNegativeMask) |
| return; |
| |
| TableInfo.Table.push_back(MCD::OPC_SoftFail); |
| |
| SmallString<16> MaskBytes; |
| raw_svector_ostream S(MaskBytes); |
| if (NeedPositiveMask) { |
| encodeULEB128(PositiveMask.getZExtValue(), S); |
| for (unsigned i = 0, e = MaskBytes.size(); i != e; ++i) |
| TableInfo.Table.push_back(MaskBytes[i]); |
| } else |
| TableInfo.Table.push_back(0); |
| if (NeedNegativeMask) { |
| MaskBytes.clear(); |
| encodeULEB128(NegativeMask.getZExtValue(), S); |
| for (unsigned i = 0, e = MaskBytes.size(); i != e; ++i) |
| TableInfo.Table.push_back(MaskBytes[i]); |
| } else |
| TableInfo.Table.push_back(0); |
| } |
| |
| // Emits table entries to decode the singleton. |
| void FilterChooser::emitSingletonTableEntry(DecoderTableInfo &TableInfo, |
| unsigned Opc) const { |
| std::vector<unsigned> StartBits; |
| std::vector<unsigned> EndBits; |
| std::vector<uint64_t> FieldVals; |
| insn_t Insn; |
| insnWithID(Insn, Opc); |
| |
| // Look for islands of undecoded bits of the singleton. |
| getIslands(StartBits, EndBits, FieldVals, Insn); |
| |
| unsigned Size = StartBits.size(); |
| |
| // Emit the predicate table entry if one is needed. |
| emitPredicateTableEntry(TableInfo, Opc); |
| |
| // Check any additional encoding fields needed. |
| for (unsigned I = Size; I != 0; --I) { |
| unsigned NumBits = EndBits[I-1] - StartBits[I-1] + 1; |
| TableInfo.Table.push_back(MCD::OPC_CheckField); |
| TableInfo.Table.push_back(StartBits[I-1]); |
| TableInfo.Table.push_back(NumBits); |
| uint8_t Buffer[16], *p; |
| encodeULEB128(FieldVals[I-1], Buffer); |
| for (p = Buffer; *p >= 128 ; ++p) |
| TableInfo.Table.push_back(*p); |
| TableInfo.Table.push_back(*p); |
| // Push location for NumToSkip backpatching. |
| TableInfo.FixupStack.back().push_back(TableInfo.Table.size()); |
| // The fixup is always 24-bits, so go ahead and allocate the space |
| // in the table so all our relative position calculations work OK even |
| // before we fully resolve the real value here. |
| TableInfo.Table.push_back(0); |
| TableInfo.Table.push_back(0); |
| TableInfo.Table.push_back(0); |
| } |
| |
| // Check for soft failure of the match. |
| emitSoftFailTableEntry(TableInfo, Opc); |
| |
| bool HasCompleteDecoder; |
| unsigned DIdx = getDecoderIndex(TableInfo.Decoders, Opc, HasCompleteDecoder); |
| |
| // Produce OPC_Decode or OPC_TryDecode opcode based on the information |
| // whether the instruction decoder is complete or not. If it is complete |
| // then it handles all possible values of remaining variable/unfiltered bits |
| // and for any value can determine if the bitpattern is a valid instruction |
| // or not. This means OPC_Decode will be the final step in the decoding |
| // process. If it is not complete, then the Fail return code from the |
| // decoder method indicates that additional processing should be done to see |
| // if there is any other instruction that also matches the bitpattern and |
| // can decode it. |
| TableInfo.Table.push_back(HasCompleteDecoder ? MCD::OPC_Decode : |
| MCD::OPC_TryDecode); |
| uint8_t Buffer[16], *p; |
| encodeULEB128(Opc, Buffer); |
| for (p = Buffer; *p >= 128 ; ++p) |
| TableInfo.Table.push_back(*p); |
| TableInfo.Table.push_back(*p); |
| |
| SmallString<16> Bytes; |
| raw_svector_ostream S(Bytes); |
| encodeULEB128(DIdx, S); |
| |
| // Decoder index |
| for (unsigned i = 0, e = Bytes.size(); i != e; ++i) |
| TableInfo.Table.push_back(Bytes[i]); |
| |
| if (!HasCompleteDecoder) { |
| // Push location for NumToSkip backpatching. |
| TableInfo.FixupStack.back().push_back(TableInfo.Table.size()); |
| // Allocate the space for the fixup. |
| TableInfo.Table.push_back(0); |
| TableInfo.Table.push_back(0); |
| TableInfo.Table.push_back(0); |
| } |
| } |
| |
| // Emits table entries to decode the singleton, and then to decode the rest. |
| void FilterChooser::emitSingletonTableEntry(DecoderTableInfo &TableInfo, |
| const Filter &Best) const { |
| unsigned Opc = Best.getSingletonOpc(); |
| |
| // complex singletons need predicate checks from the first singleton |
| // to refer forward to the variable filterchooser that follows. |
| TableInfo.FixupStack.emplace_back(); |
| |
| emitSingletonTableEntry(TableInfo, Opc); |
| |
| resolveTableFixups(TableInfo.Table, TableInfo.FixupStack.back(), |
| TableInfo.Table.size()); |
| TableInfo.FixupStack.pop_back(); |
| |
| Best.getVariableFC().emitTableEntries(TableInfo); |
| } |
| |
| // Assign a single filter and run with it. Top level API client can initialize |
| // with a single filter to start the filtering process. |
| void FilterChooser::runSingleFilter(unsigned startBit, unsigned numBit, |
| bool mixed) { |
| Filters.clear(); |
| Filters.emplace_back(*this, startBit, numBit, true); |
| BestIndex = 0; // Sole Filter instance to choose from. |
| bestFilter().recurse(); |
| } |
| |
| // reportRegion is a helper function for filterProcessor to mark a region as |
| // eligible for use as a filter region. |
| void FilterChooser::reportRegion(bitAttr_t RA, unsigned StartBit, |
| unsigned BitIndex, bool AllowMixed) { |
| if (RA == ATTR_MIXED && AllowMixed) |
| Filters.emplace_back(*this, StartBit, BitIndex - StartBit, true); |
| else if (RA == ATTR_ALL_SET && !AllowMixed) |
| Filters.emplace_back(*this, StartBit, BitIndex - StartBit, false); |
| } |
| |
| // FilterProcessor scans the well-known encoding bits of the instructions and |
| // builds up a list of candidate filters. It chooses the best filter and |
| // recursively descends down the decoding tree. |
| bool FilterChooser::filterProcessor(bool AllowMixed, bool Greedy) { |
| Filters.clear(); |
| BestIndex = -1; |
| unsigned numInstructions = Opcodes.size(); |
| |
| assert(numInstructions && "Filter created with no instructions"); |
| |
| // No further filtering is necessary. |
| if (numInstructions == 1) |
| return true; |
| |
| // Heuristics. See also doFilter()'s "Heuristics" comment when num of |
| // instructions is 3. |
| if (AllowMixed && !Greedy) { |
| assert(numInstructions == 3); |
| |
| for (unsigned i = 0; i < Opcodes.size(); ++i) { |
| std::vector<unsigned> StartBits; |
| std::vector<unsigned> EndBits; |
| std::vector<uint64_t> FieldVals; |
| insn_t Insn; |
| |
| insnWithID(Insn, Opcodes[i]); |
| |
| // Look for islands of undecoded bits of any instruction. |
| if (getIslands(StartBits, EndBits, FieldVals, Insn) > 0) { |
| // Found an instruction with island(s). Now just assign a filter. |
| runSingleFilter(StartBits[0], EndBits[0] - StartBits[0] + 1, true); |
| return true; |
| } |
| } |
| } |
| |
| unsigned BitIndex; |
| |
| // We maintain BIT_WIDTH copies of the bitAttrs automaton. |
| // The automaton consumes the corresponding bit from each |
| // instruction. |
| // |
| // Input symbols: 0, 1, and _ (unset). |
| // States: NONE, FILTERED, ALL_SET, ALL_UNSET, and MIXED. |
| // Initial state: NONE. |
| // |
| // (NONE) ------- [01] -> (ALL_SET) |
| // (NONE) ------- _ ----> (ALL_UNSET) |
| // (ALL_SET) ---- [01] -> (ALL_SET) |
| // (ALL_SET) ---- _ ----> (MIXED) |
| // (ALL_UNSET) -- [01] -> (MIXED) |
| // (ALL_UNSET) -- _ ----> (ALL_UNSET) |
| // (MIXED) ------ . ----> (MIXED) |
| // (FILTERED)---- . ----> (FILTERED) |
| |
| std::vector<bitAttr_t> bitAttrs; |
| |
| // FILTERED bit positions provide no entropy and are not worthy of pursuing. |
| // Filter::recurse() set either BIT_TRUE or BIT_FALSE for each position. |
| for (BitIndex = 0; BitIndex < BitWidth; ++BitIndex) |
| if (FilterBitValues[BitIndex] == BIT_TRUE || |
| FilterBitValues[BitIndex] == BIT_FALSE) |
| bitAttrs.push_back(ATTR_FILTERED); |
| else |
| bitAttrs.push_back(ATTR_NONE); |
| |
| for (unsigned InsnIndex = 0; InsnIndex < numInstructions; ++InsnIndex) { |
| insn_t insn; |
| |
| insnWithID(insn, Opcodes[InsnIndex]); |
| |
| for (BitIndex = 0; BitIndex < BitWidth; ++BitIndex) { |
| switch (bitAttrs[BitIndex]) { |
| case ATTR_NONE: |
| if (insn[BitIndex] == BIT_UNSET) |
| bitAttrs[BitIndex] = ATTR_ALL_UNSET; |
| else |
| bitAttrs[BitIndex] = ATTR_ALL_SET; |
| break; |
| case ATTR_ALL_SET: |
| if (insn[BitIndex] == BIT_UNSET) |
| bitAttrs[BitIndex] = ATTR_MIXED; |
| break; |
| case ATTR_ALL_UNSET: |
| if (insn[BitIndex] != BIT_UNSET) |
| bitAttrs[BitIndex] = ATTR_MIXED; |
| break; |
| case ATTR_MIXED: |
| case ATTR_FILTERED: |
| break; |
| } |
| } |
| } |
| |
| // The regionAttr automaton consumes the bitAttrs automatons' state, |
| // lowest-to-highest. |
| // |
| // Input symbols: F(iltered), (all_)S(et), (all_)U(nset), M(ixed) |
| // States: NONE, ALL_SET, MIXED |
| // Initial state: NONE |
| // |
| // (NONE) ----- F --> (NONE) |
| // (NONE) ----- S --> (ALL_SET) ; and set region start |
| // (NONE) ----- U --> (NONE) |
| // (NONE) ----- M --> (MIXED) ; and set region start |
| // (ALL_SET) -- F --> (NONE) ; and report an ALL_SET region |
| // (ALL_SET) -- S --> (ALL_SET) |
| // (ALL_SET) -- U --> (NONE) ; and report an ALL_SET region |
| // (ALL_SET) -- M --> (MIXED) ; and report an ALL_SET region |
| // (MIXED) ---- F --> (NONE) ; and report a MIXED region |
| // (MIXED) ---- S --> (ALL_SET) ; and report a MIXED region |
| // (MIXED) ---- U --> (NONE) ; and report a MIXED region |
| // (MIXED) ---- M --> (MIXED) |
| |
| bitAttr_t RA = ATTR_NONE; |
| unsigned StartBit = 0; |
| |
| for (BitIndex = 0; BitIndex < BitWidth; ++BitIndex) { |
| bitAttr_t bitAttr = bitAttrs[BitIndex]; |
| |
| assert(bitAttr != ATTR_NONE && "Bit without attributes"); |
| |
| switch (RA) { |
| case ATTR_NONE: |
| switch (bitAttr) { |
| case ATTR_FILTERED: |
| break; |
| case ATTR_ALL_SET: |
| StartBit = BitIndex; |
| RA = ATTR_ALL_SET; |
| break; |
| case ATTR_ALL_UNSET: |
| break; |
| case ATTR_MIXED: |
| StartBit = BitIndex; |
| RA = ATTR_MIXED; |
| break; |
| default: |
| llvm_unreachable("Unexpected bitAttr!"); |
| } |
| break; |
| case ATTR_ALL_SET: |
| switch (bitAttr) { |
| case ATTR_FILTERED: |
| reportRegion(RA, StartBit, BitIndex, AllowMixed); |
| RA = ATTR_NONE; |
| break; |
| case ATTR_ALL_SET: |
| break; |
| case ATTR_ALL_UNSET: |
| reportRegion(RA, StartBit, BitIndex, AllowMixed); |
| RA = ATTR_NONE; |
| break; |
| case ATTR_MIXED: |
| reportRegion(RA, StartBit, BitIndex, AllowMixed); |
| StartBit = BitIndex; |
| RA = ATTR_MIXED; |
| break; |
| default: |
| llvm_unreachable("Unexpected bitAttr!"); |
| } |
| break; |
| case ATTR_MIXED: |
| switch (bitAttr) { |
| case ATTR_FILTERED: |
| reportRegion(RA, StartBit, BitIndex, AllowMixed); |
| StartBit = BitIndex; |
| RA = ATTR_NONE; |
| break; |
| case ATTR_ALL_SET: |
| reportRegion(RA, StartBit, BitIndex, AllowMixed); |
| StartBit = BitIndex; |
| RA = ATTR_ALL_SET; |
| break; |
| case ATTR_ALL_UNSET: |
| reportRegion(RA, StartBit, BitIndex, AllowMixed); |
| RA = ATTR_NONE; |
| break; |
| case ATTR_MIXED: |
| break; |
| default: |
| llvm_unreachable("Unexpected bitAttr!"); |
| } |
| break; |
| case ATTR_ALL_UNSET: |
| llvm_unreachable("regionAttr state machine has no ATTR_UNSET state"); |
| case ATTR_FILTERED: |
| llvm_unreachable("regionAttr state machine has no ATTR_FILTERED state"); |
| } |
| } |
| |
| // At the end, if we're still in ALL_SET or MIXED states, report a region |
| switch (RA) { |
| case ATTR_NONE: |
| break; |
| case ATTR_FILTERED: |
| break; |
| case ATTR_ALL_SET: |
| reportRegion(RA, StartBit, BitIndex, AllowMixed); |
| break; |
| case ATTR_ALL_UNSET: |
| break; |
| case ATTR_MIXED: |
| reportRegion(RA, StartBit, BitIndex, AllowMixed); |
| break; |
| } |
| |
| // We have finished with the filter processings. Now it's time to choose |
| // the best performing filter. |
| BestIndex = 0; |
| bool AllUseless = true; |
| unsigned BestScore = 0; |
| |
| for (unsigned i = 0, e = Filters.size(); i != e; ++i) { |
| unsigned Usefulness = Filters[i].usefulness(); |
| |
| if (Usefulness) |
| AllUseless = false; |
| |
| if (Usefulness > BestScore) { |
| BestIndex = i; |
| BestScore = Usefulness; |
| } |
| } |
| |
| if (!AllUseless) |
| bestFilter().recurse(); |
| |
| return !AllUseless; |
| } // end of FilterChooser::filterProcessor(bool) |
| |
| // Decides on the best configuration of filter(s) to use in order to decode |
| // the instructions. A conflict of instructions may occur, in which case we |
| // dump the conflict set to the standard error. |
| void FilterChooser::doFilter() { |
| unsigned Num = Opcodes.size(); |
| assert(Num && "FilterChooser created with no instructions"); |
| |
| // Try regions of consecutive known bit values first. |
| if (filterProcessor(false)) |
| return; |
| |
| // Then regions of mixed bits (both known and unitialized bit values allowed). |
| if (filterProcessor(true)) |
| return; |
| |
| // Heuristics to cope with conflict set {t2CMPrs, t2SUBSrr, t2SUBSrs} where |
| // no single instruction for the maximum ATTR_MIXED region Inst{14-4} has a |
| // well-known encoding pattern. In such case, we backtrack and scan for the |
| // the very first consecutive ATTR_ALL_SET region and assign a filter to it. |
| if (Num == 3 && filterProcessor(true, false)) |
| return; |
| |
| // If we come to here, the instruction decoding has failed. |
| // Set the BestIndex to -1 to indicate so. |
| BestIndex = -1; |
| } |
| |
| // emitTableEntries - Emit state machine entries to decode our share of |
| // instructions. |
| void FilterChooser::emitTableEntries(DecoderTableInfo &TableInfo) const { |
| if (Opcodes.size() == 1) { |
| // There is only one instruction in the set, which is great! |
| // Call emitSingletonDecoder() to see whether there are any remaining |
| // encodings bits. |
| emitSingletonTableEntry(TableInfo, Opcodes[0]); |
| return; |
| } |
| |
| // Choose the best filter to do the decodings! |
| if (BestIndex != -1) { |
| const Filter &Best = Filters[BestIndex]; |
| if (Best.getNumFiltered() == 1) |
| emitSingletonTableEntry(TableInfo, Best); |
| else |
| Best.emitTableEntry(TableInfo); |
| return; |
| } |
| |
| // We don't know how to decode these instructions! Dump the |
| // conflict set and bail. |
| |
| // Print out useful conflict information for postmortem analysis. |
| errs() << "Decoding Conflict:\n"; |
| |
| dumpStack(errs(), "\t\t"); |
| |
| for (unsigned i = 0; i < Opcodes.size(); ++i) { |
| errs() << '\t' << nameWithID(Opcodes[i]) << " "; |
| dumpBits(errs(), |
| getBitsField(*AllInstructions[Opcodes[i]]->TheDef, "Inst")); |
| errs() << '\n'; |
| } |
| } |
| |
| static std::string findOperandDecoderMethod(TypedInit *TI) { |
| std::string Decoder; |
| |
| Record *Record = cast<DefInit>(TI)->getDef(); |
| |
| RecordVal *DecoderString = Record->getValue("DecoderMethod"); |
| StringInit *String = DecoderString ? |
| dyn_cast<StringInit>(DecoderString->getValue()) : nullptr; |
| if (String) { |
| Decoder = String->getValue(); |
| if (!Decoder.empty()) |
| return Decoder; |
| } |
| |
| if (Record->isSubClassOf("RegisterOperand")) |
| Record = Record->getValueAsDef("RegClass"); |
| |
| if (Record->isSubClassOf("RegisterClass")) { |
| Decoder = "Decode" + Record->getName().str() + "RegisterClass"; |
| } else if (Record->isSubClassOf("PointerLikeRegClass")) { |
| Decoder = "DecodePointerLikeRegClass" + |
| utostr(Record->getValueAsInt("RegClassKind")); |
| } |
| |
| return Decoder; |
| } |
| |
| static bool populateInstruction(CodeGenTarget &Target, |
| const CodeGenInstruction &CGI, unsigned Opc, |
| std::map<unsigned, std::vector<OperandInfo>> &Operands){ |
| const Record &Def = *CGI.TheDef; |
| // If all the bit positions are not specified; do not decode this instruction. |
| // We are bound to fail! For proper disassembly, the well-known encoding bits |
| // of the instruction must be fully specified. |
| |
| BitsInit &Bits = getBitsField(Def, "Inst"); |
| if (Bits.allInComplete()) return false; |
| |
| std::vector<OperandInfo> InsnOperands; |
| |
| // If the instruction has specified a custom decoding hook, use that instead |
| // of trying to auto-generate the decoder. |
| StringRef InstDecoder = Def.getValueAsString("DecoderMethod"); |
| if (InstDecoder != "") { |
| bool HasCompleteInstDecoder = Def.getValueAsBit("hasCompleteDecoder"); |
| InsnOperands.push_back(OperandInfo(InstDecoder, HasCompleteInstDecoder)); |
| Operands[Opc] = InsnOperands; |
| return true; |
| } |
| |
| // Generate a description of the operand of the instruction that we know |
| // how to decode automatically. |
| // FIXME: We'll need to have a way to manually override this as needed. |
| |
| // Gather the outputs/inputs of the instruction, so we can find their |
| // positions in the encoding. This assumes for now that they appear in the |
| // MCInst in the order that they're listed. |
| std::vector<std::pair<Init*, StringRef>> InOutOperands; |
| DagInit *Out = Def.getValueAsDag("OutOperandList"); |
| DagInit *In = Def.getValueAsDag("InOperandList"); |
| for (unsigned i = 0; i < Out->getNumArgs(); ++i) |
| InOutOperands.push_back(std::make_pair(Out->getArg(i), |
| Out->getArgNameStr(i))); |
| for (unsigned i = 0; i < In->getNumArgs(); ++i) |
| InOutOperands.push_back(std::make_pair(In->getArg(i), |
| In->getArgNameStr(i))); |
| |
| // Search for tied operands, so that we can correctly instantiate |
| // operands that are not explicitly represented in the encoding. |
| std::map<std::string, std::string> TiedNames; |
| for (unsigned i = 0; i < CGI.Operands.size(); ++i) { |
| int tiedTo = CGI.Operands[i].getTiedRegister(); |
| if (tiedTo != -1) { |
| std::pair<unsigned, unsigned> SO = |
| CGI.Operands.getSubOperandNumber(tiedTo); |
| TiedNames[InOutOperands[i].second] = InOutOperands[SO.first].second; |
| TiedNames[InOutOperands[SO.first].second] = InOutOperands[i].second; |
| } |
| } |
| |
| std::map<std::string, std::vector<OperandInfo>> NumberedInsnOperands; |
| std::set<std::string> NumberedInsnOperandsNoTie; |
| if (Target.getInstructionSet()-> |
| getValueAsBit("decodePositionallyEncodedOperands")) { |
| const std::vector<RecordVal> &Vals = Def.getValues(); |
| unsigned NumberedOp = 0; |
| |
| std::set<unsigned> NamedOpIndices; |
| if (Target.getInstructionSet()-> |
| getValueAsBit("noNamedPositionallyEncodedOperands")) |
| // Collect the set of operand indices that might correspond to named |
| // operand, and skip these when assigning operands based on position. |
| for (unsigned i = 0, e = Vals.size(); i != e; ++i) { |
| unsigned OpIdx; |
| if (!CGI.Operands.hasOperandNamed(Vals[i].getName(), OpIdx)) |
| continue; |
| |
| NamedOpIndices.insert(OpIdx); |
| } |
| |
| for (unsigned i = 0, e = Vals.size(); i != e; ++i) { |
| // Ignore fixed fields in the record, we're looking for values like: |
| // bits<5> RST = { ?, ?, ?, ?, ? }; |
| if (Vals[i].getPrefix() || Vals[i].getValue()->isComplete()) |
| continue; |
| |
| // Determine if Vals[i] actually contributes to the Inst encoding. |
| unsigned bi = 0; |
| for (; bi < Bits.getNumBits(); ++bi) { |
| VarInit *Var = nullptr; |
| VarBitInit *BI = dyn_cast<VarBitInit>(Bits.getBit(bi)); |
| if (BI) |
| Var = dyn_cast<VarInit>(BI->getBitVar()); |
| else |
| Var = dyn_cast<VarInit>(Bits.getBit(bi)); |
| |
| if (Var && Var->getName() == Vals[i].getName()) |
| break; |
| } |
| |
| if (bi == Bits.getNumBits()) |
| continue; |
| |
| // Skip variables that correspond to explicitly-named operands. |
| unsigned OpIdx; |
| if (CGI.Operands.hasOperandNamed(Vals[i].getName(), OpIdx)) |
| continue; |
| |
| // Get the bit range for this operand: |
| unsigned bitStart = bi++, bitWidth = 1; |
| for (; bi < Bits.getNumBits(); ++bi) { |
| VarInit *Var = nullptr; |
| VarBitInit *BI = dyn_cast<VarBitInit>(Bits.getBit(bi)); |
| if (BI) |
| Var = dyn_cast<VarInit>(BI->getBitVar()); |
| else |
| Var = dyn_cast<VarInit>(Bits.getBit(bi)); |
| |
| if (!Var) |
| break; |
| |
| if (Var->getName() != Vals[i].getName()) |
| break; |
| |
| ++bitWidth; |
| } |
| |
| unsigned NumberOps = CGI.Operands.size(); |
| while (NumberedOp < NumberOps && |
| (CGI.Operands.isFlatOperandNotEmitted(NumberedOp) || |
| (!NamedOpIndices.empty() && NamedOpIndices.count( |
| CGI.Operands.getSubOperandNumber(NumberedOp).first)))) |
| ++NumberedOp; |
| |
| OpIdx = NumberedOp++; |
| |
| // OpIdx now holds the ordered operand number of Vals[i]. |
| std::pair<unsigned, unsigned> SO = |
| CGI.Operands.getSubOperandNumber(OpIdx); |
| const std::string &Name = CGI.Operands[SO.first].Name; |
| |
| LLVM_DEBUG(dbgs() << "Numbered operand mapping for " << Def.getName() |
| << ": " << Name << "(" << SO.first << ", " << SO.second |
| << ") => " << Vals[i].getName() << "\n"); |
| |
| std::string Decoder; |
| Record *TypeRecord = CGI.Operands[SO.first].Rec; |
| |
| RecordVal *DecoderString = TypeRecord->getValue("DecoderMethod"); |
| StringInit *String = DecoderString ? |
| dyn_cast<StringInit>(DecoderString->getValue()) : nullptr; |
| if (String && String->getValue() != "") |
| Decoder = String->getValue(); |
| |
| if (Decoder == "" && |
| CGI.Operands[SO.first].MIOperandInfo && |
| CGI.Operands[SO.first].MIOperandInfo->getNumArgs()) { |
| Init *Arg = CGI.Operands[SO.first].MIOperandInfo-> |
| getArg(SO.second); |
| if (DefInit *DI = cast<DefInit>(Arg)) |
| TypeRecord = DI->getDef(); |
| } |
| |
| bool isReg = false; |
| if (TypeRecord->isSubClassOf("RegisterOperand")) |
| TypeRecord = TypeRecord->getValueAsDef("RegClass"); |
| if (TypeRecord->isSubClassOf("RegisterClass")) { |
| Decoder = "Decode" + TypeRecord->getName().str() + "RegisterClass"; |
| isReg = true; |
| } else if (TypeRecord->isSubClassOf("PointerLikeRegClass")) { |
| Decoder = "DecodePointerLikeRegClass" + |
| utostr(TypeRecord->getValueAsInt("RegClassKind")); |
| isReg = true; |
| } |
| |
| DecoderString = TypeRecord->getValue("DecoderMethod"); |
| String = DecoderString ? |
| dyn_cast<StringInit>(DecoderString->getValue()) : nullptr; |
| if (!isReg && String && String->getValue() != "") |
| Decoder = String->getValue(); |
| |
| RecordVal *HasCompleteDecoderVal = |
| TypeRecord->getValue("hasCompleteDecoder"); |
| BitInit *HasCompleteDecoderBit = HasCompleteDecoderVal ? |
| dyn_cast<BitInit>(HasCompleteDecoderVal->getValue()) : nullptr; |
| bool HasCompleteDecoder = HasCompleteDecoderBit ? |
| HasCompleteDecoderBit->getValue() : true; |
| |
| OperandInfo OpInfo(Decoder, HasCompleteDecoder); |
| OpInfo.addField(bitStart, bitWidth, 0); |
| |
| NumberedInsnOperands[Name].push_back(OpInfo); |
| |
| // FIXME: For complex operands with custom decoders we can't handle tied |
| // sub-operands automatically. Skip those here and assume that this is |
| // fixed up elsewhere. |
| if (CGI.Operands[SO.first].MIOperandInfo && |
| CGI.Operands[SO.first].MIOperandInfo->getNumArgs() > 1 && |
| String && String->getValue() != "") |
| NumberedInsnOperandsNoTie.insert(Name); |
| } |
| } |
| |
| // For each operand, see if we can figure out where it is encoded. |
| for (const auto &Op : InOutOperands) { |
| if (!NumberedInsnOperands[Op.second].empty()) { |
| InsnOperands.insert(InsnOperands.end(), |
| NumberedInsnOperands[Op.second].begin(), |
| NumberedInsnOperands[Op.second].end()); |
| continue; |
| } |
| if (!NumberedInsnOperands[TiedNames[Op.second]].empty()) { |
| if (!NumberedInsnOperandsNoTie.count(TiedNames[Op.second])) { |
| // Figure out to which (sub)operand we're tied. |
| unsigned i = CGI.Operands.getOperandNamed(TiedNames[Op.second]); |
| int tiedTo = CGI.Operands[i].getTiedRegister(); |
| if (tiedTo == -1) { |
| i = CGI.Operands.getOperandNamed(Op.second); |
| tiedTo = CGI.Operands[i].getTiedRegister(); |
| } |
| |
| if (tiedTo != -1) { |
| std::pair<unsigned, unsigned> SO = |
| CGI.Operands.getSubOperandNumber(tiedTo); |
| |
| InsnOperands.push_back(NumberedInsnOperands[TiedNames[Op.second]] |
| [SO.second]); |
| } |
| } |
| continue; |
| } |
| |
| TypedInit *TI = cast<TypedInit>(Op.first); |
| |
| // At this point, we can locate the decoder field, but we need to know how |
| // to interpret it. As a first step, require the target to provide |
| // callbacks for decoding register classes. |
| std::string Decoder = findOperandDecoderMethod(TI); |
| Record *TypeRecord = cast<DefInit>(TI)->getDef(); |
| |
| RecordVal *HasCompleteDecoderVal = |
| TypeRecord->getValue("hasCompleteDecoder"); |
| BitInit *HasCompleteDecoderBit = HasCompleteDecoderVal ? |
| dyn_cast<BitInit>(HasCompleteDecoderVal->getValue()) : nullptr; |
| bool HasCompleteDecoder = HasCompleteDecoderBit ? |
| HasCompleteDecoderBit->getValue() : true; |
| |
| OperandInfo OpInfo(Decoder, HasCompleteDecoder); |
| unsigned Base = ~0U; |
| unsigned Width = 0; |
| unsigned Offset = 0; |
| |
| for (unsigned bi = 0; bi < Bits.getNumBits(); ++bi) { |
| VarInit *Var = nullptr; |
| VarBitInit *BI = dyn_cast<VarBitInit>(Bits.getBit(bi)); |
| if (BI) |
| Var = dyn_cast<VarInit>(BI->getBitVar()); |
| else |
| Var = dyn_cast<VarInit>(Bits.getBit(bi)); |
| |
| if (!Var) { |
| if (Base != ~0U) { |
| OpInfo.addField(Base, Width, Offset); |
| Base = ~0U; |
| Width = 0; |
| Offset = 0; |
| } |
| continue; |
| } |
| |
| if (Var->getName() != Op.second && |
| Var->getName() != TiedNames[Op.second]) { |
| if (Base != ~0U) { |
| OpInfo.addField(Base, Width, Offset); |
| Base = ~0U; |
| Width = 0; |
| Offset = 0; |
| } |
| continue; |
| } |
| |
| if (Base == ~0U) { |
| Base = bi; |
| Width = 1; |
| Offset = BI ? BI->getBitNum() : 0; |
| } else if (BI && BI->getBitNum() != Offset + Width) { |
| OpInfo.addField(Base, Width, Offset); |
| Base = bi; |
| Width = 1; |
| Offset = BI->getBitNum(); |
| } else { |
| ++Width; |
| } |
| } |
| |
| if (Base != ~0U) |
| OpInfo.addField(Base, Width, Offset); |
| |
| if (OpInfo.numFields() > 0) |
| InsnOperands.push_back(OpInfo); |
| } |
| |
| Operands[Opc] = InsnOperands; |
| |
| #if 0 |
| LLVM_DEBUG({ |
| // Dumps the instruction encoding bits. |
| dumpBits(errs(), Bits); |
| |
| errs() << '\n'; |
| |
| // Dumps the list of operand info. |
| for (unsigned i = 0, e = CGI.Operands.size(); i != e; ++i) { |
| const CGIOperandList::OperandInfo &Info = CGI.Operands[i]; |
| const std::string &OperandName = Info.Name; |
| const Record &OperandDef = *Info.Rec; |
| |
| errs() << "\t" << OperandName << " (" << OperandDef.getName() << ")\n"; |
| } |
| }); |
| #endif |
| |
| return true; |
| } |
| |
| // emitFieldFromInstruction - Emit the templated helper function |
| // fieldFromInstruction(). |
| // On Windows we make sure that this function is not inlined when |
| // using the VS compiler. It has a bug which causes the function |
| // to be optimized out in some circustances. See llvm.org/pr38292 |
| static void emitFieldFromInstruction(formatted_raw_ostream &OS) { |
| OS << "// Helper function for extracting fields from encoded instructions.\n" |
| << "template<typename InsnType>\n" |
| << "#if defined(_MSC_VER) && !defined(__clang__)\n" |
| << "__declspec(noinline)\n" |
| << "#endif\n" |
| << "static InsnType fieldFromInstruction(InsnType insn, unsigned startBit,\n" |
| << " unsigned numBits) {\n" |
| << " assert(startBit + numBits <= (sizeof(InsnType)*8) &&\n" |
| << " \"Instruction field out of bounds!\");\n" |
| << " InsnType fieldMask;\n" |
| << " if (numBits == sizeof(InsnType)*8)\n" |
| << " fieldMask = (InsnType)(-1LL);\n" |
| << " else\n" |
| << " fieldMask = (((InsnType)1 << numBits) - 1) << startBit;\n" |
| << " return (insn & fieldMask) >> startBit;\n" |
| << "}\n\n"; |
| } |
| |
| // emitDecodeInstruction - Emit the templated helper function |
| // decodeInstruction(). |
| static void emitDecodeInstruction(formatted_raw_ostream &OS) { |
| OS << "template<typename InsnType>\n" |
| << "static DecodeStatus decodeInstruction(const uint8_t DecodeTable[], " |
| "MCInst &MI,\n" |
| << " InsnType insn, uint64_t " |
| "Address,\n" |
| << " const void *DisAsm,\n" |
| << " const MCSubtargetInfo &STI) {\n" |
| << " const FeatureBitset& Bits = STI.getFeatureBits();\n" |
| << "\n" |
| << " const uint8_t *Ptr = DecodeTable;\n" |
| << " uint32_t CurFieldValue = 0;\n" |
| << " DecodeStatus S = MCDisassembler::Success;\n" |
| << " while (true) {\n" |
| << " ptrdiff_t Loc = Ptr - DecodeTable;\n" |
| << " switch (*Ptr) {\n" |
| << " default:\n" |
| << " errs() << Loc << \": Unexpected decode table opcode!\\n\";\n" |
| << " return MCDisassembler::Fail;\n" |
| << " case MCD::OPC_ExtractField: {\n" |
| << " unsigned Start = *++Ptr;\n" |
| << " unsigned Len = *++Ptr;\n" |
| << " ++Ptr;\n" |
| << " CurFieldValue = fieldFromInstruction(insn, Start, Len);\n" |
| << " LLVM_DEBUG(dbgs() << Loc << \": OPC_ExtractField(\" << Start << " |
| "\", \"\n" |
| << " << Len << \"): \" << CurFieldValue << \"\\n\");\n" |
| << " break;\n" |
| << " }\n" |
| << " case MCD::OPC_FilterValue: {\n" |
| << " // Decode the field value.\n" |
| << " unsigned Len;\n" |
| << " InsnType Val = decodeULEB128(++Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << " // NumToSkip is a plain 24-bit integer.\n" |
| << " unsigned NumToSkip = *Ptr++;\n" |
| << " NumToSkip |= (*Ptr++) << 8;\n" |
| << " NumToSkip |= (*Ptr++) << 16;\n" |
| << "\n" |
| << " // Perform the filter operation.\n" |
| << " if (Val != CurFieldValue)\n" |
| << " Ptr += NumToSkip;\n" |
| << " LLVM_DEBUG(dbgs() << Loc << \": OPC_FilterValue(\" << Val << " |
| "\", \" << NumToSkip\n" |
| << " << \"): \" << ((Val != CurFieldValue) ? \"FAIL:\" " |
| ": \"PASS:\")\n" |
| << " << \" continuing at \" << (Ptr - DecodeTable) << " |
| "\"\\n\");\n" |
| << "\n" |
| << " break;\n" |
| << " }\n" |
| << " case MCD::OPC_CheckField: {\n" |
| << " unsigned Start = *++Ptr;\n" |
| << " unsigned Len = *++Ptr;\n" |
| << " InsnType FieldValue = fieldFromInstruction(insn, Start, Len);\n" |
| << " // Decode the field value.\n" |
| << " uint32_t ExpectedValue = decodeULEB128(++Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << " // NumToSkip is a plain 24-bit integer.\n" |
| << " unsigned NumToSkip = *Ptr++;\n" |
| << " NumToSkip |= (*Ptr++) << 8;\n" |
| << " NumToSkip |= (*Ptr++) << 16;\n" |
| << "\n" |
| << " // If the actual and expected values don't match, skip.\n" |
| << " if (ExpectedValue != FieldValue)\n" |
| << " Ptr += NumToSkip;\n" |
| << " LLVM_DEBUG(dbgs() << Loc << \": OPC_CheckField(\" << Start << " |
| "\", \"\n" |
| << " << Len << \", \" << ExpectedValue << \", \" << " |
| "NumToSkip\n" |
| << " << \"): FieldValue = \" << FieldValue << \", " |
| "ExpectedValue = \"\n" |
| << " << ExpectedValue << \": \"\n" |
| << " << ((ExpectedValue == FieldValue) ? \"PASS\\n\" : " |
| "\"FAIL\\n\"));\n" |
| << " break;\n" |
| << " }\n" |
| << " case MCD::OPC_CheckPredicate: {\n" |
| << " unsigned Len;\n" |
| << " // Decode the Predicate Index value.\n" |
| << " unsigned PIdx = decodeULEB128(++Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << " // NumToSkip is a plain 24-bit integer.\n" |
| << " unsigned NumToSkip = *Ptr++;\n" |
| << " NumToSkip |= (*Ptr++) << 8;\n" |
| << " NumToSkip |= (*Ptr++) << 16;\n" |
| << " // Check the predicate.\n" |
| << " bool Pred;\n" |
| << " if (!(Pred = checkDecoderPredicate(PIdx, Bits)))\n" |
| << " Ptr += NumToSkip;\n" |
| << " (void)Pred;\n" |
| << " LLVM_DEBUG(dbgs() << Loc << \": OPC_CheckPredicate(\" << PIdx " |
| "<< \"): \"\n" |
| << " << (Pred ? \"PASS\\n\" : \"FAIL\\n\"));\n" |
| << "\n" |
| << " break;\n" |
| << " }\n" |
| << " case MCD::OPC_Decode: {\n" |
| << " unsigned Len;\n" |
| << " // Decode the Opcode value.\n" |
| << " unsigned Opc = decodeULEB128(++Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << " unsigned DecodeIdx = decodeULEB128(Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << "\n" |
| << " MI.clear();\n" |
| << " MI.setOpcode(Opc);\n" |
| << " bool DecodeComplete;\n" |
| << " S = decodeToMCInst(S, DecodeIdx, insn, MI, Address, DisAsm, " |
| "DecodeComplete);\n" |
| << " assert(DecodeComplete);\n" |
| << "\n" |
| << " LLVM_DEBUG(dbgs() << Loc << \": OPC_Decode: opcode \" << Opc\n" |
| << " << \", using decoder \" << DecodeIdx << \": \"\n" |
| << " << (S != MCDisassembler::Fail ? \"PASS\" : " |
| "\"FAIL\") << \"\\n\");\n" |
| << " return S;\n" |
| << " }\n" |
| << " case MCD::OPC_TryDecode: {\n" |
| << " unsigned Len;\n" |
| << " // Decode the Opcode value.\n" |
| << " unsigned Opc = decodeULEB128(++Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << " unsigned DecodeIdx = decodeULEB128(Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << " // NumToSkip is a plain 24-bit integer.\n" |
| << " unsigned NumToSkip = *Ptr++;\n" |
| << " NumToSkip |= (*Ptr++) << 8;\n" |
| << " NumToSkip |= (*Ptr++) << 16;\n" |
| << "\n" |
| << " // Perform the decode operation.\n" |
| << " MCInst TmpMI;\n" |
| << " TmpMI.setOpcode(Opc);\n" |
| << " bool DecodeComplete;\n" |
| << " S = decodeToMCInst(S, DecodeIdx, insn, TmpMI, Address, DisAsm, " |
| "DecodeComplete);\n" |
| << " LLVM_DEBUG(dbgs() << Loc << \": OPC_TryDecode: opcode \" << " |
| "Opc\n" |
| << " << \", using decoder \" << DecodeIdx << \": \");\n" |
| << "\n" |
| << " if (DecodeComplete) {\n" |
| << " // Decoding complete.\n" |
| << " LLVM_DEBUG(dbgs() << (S != MCDisassembler::Fail ? \"PASS\" : " |
| "\"FAIL\") << \"\\n\");\n" |
| << " MI = TmpMI;\n" |
| << " return S;\n" |
| << " } else {\n" |
| << " assert(S == MCDisassembler::Fail);\n" |
| << " // If the decoding was incomplete, skip.\n" |
| << " Ptr += NumToSkip;\n" |
| << " LLVM_DEBUG(dbgs() << \"FAIL: continuing at \" << (Ptr - " |
| "DecodeTable) << \"\\n\");\n" |
| << " // Reset decode status. This also drops a SoftFail status " |
| "that could be\n" |
| << " // set before the decode attempt.\n" |
| << " S = MCDisassembler::Success;\n" |
| << " }\n" |
| << " break;\n" |
| << " }\n" |
| << " case MCD::OPC_SoftFail: {\n" |
| << " // Decode the mask values.\n" |
| << " unsigned Len;\n" |
| << " InsnType PositiveMask = decodeULEB128(++Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << " InsnType NegativeMask = decodeULEB128(Ptr, &Len);\n" |
| << " Ptr += Len;\n" |
| << " bool Fail = (insn & PositiveMask) || (~insn & NegativeMask);\n" |
| << " if (Fail)\n" |
| << " S = MCDisassembler::SoftFail;\n" |
| << " LLVM_DEBUG(dbgs() << Loc << \": OPC_SoftFail: \" << (Fail ? " |
| "\"FAIL\\n\":\"PASS\\n\"));\n" |
| << " break;\n" |
| << " }\n" |
| << " case MCD::OPC_Fail: {\n" |
| << " LLVM_DEBUG(dbgs() << Loc << \": OPC_Fail\\n\");\n" |
| << " return MCDisassembler::Fail;\n" |
| << " }\n" |
| << " }\n" |
| << " }\n" |
| << " llvm_unreachable(\"bogosity detected in disassembler state " |
| "machine!\");\n" |
| << "}\n\n"; |
| } |
| |
| // Emits disassembler code for instruction decoding. |
| void FixedLenDecoderEmitter::run(raw_ostream &o) { |
| formatted_raw_ostream OS(o); |
| OS << "#include \"llvm/MC/MCInst.h\"\n"; |
| OS << "#include \"llvm/Support/Debug.h\"\n"; |
| OS << "#include \"llvm/Support/DataTypes.h\"\n"; |
| OS << "#include \"llvm/Support/LEB128.h\"\n"; |
| OS << "#include \"llvm/Support/raw_ostream.h\"\n"; |
| OS << "#include <assert.h>\n"; |
| OS << '\n'; |
| OS << "namespace llvm {\n\n"; |
| |
| emitFieldFromInstruction(OS); |
| |
| Target.reverseBitsForLittleEndianEncoding(); |
| |
| // Parameterize the decoders based on namespace and instruction width. |
| NumberedInstructions = Target.getInstructionsByEnumValue(); |
| std::map<std::pair<std::string, unsigned>, |
| std::vector<unsigned>> OpcMap; |
| std::map<unsigned, std::vector<OperandInfo>> Operands; |
| |
| for (unsigned i = 0; i < NumberedInstructions.size(); ++i) { |
| const CodeGenInstruction *Inst = NumberedInstructions[i]; |
| const Record *Def = Inst->TheDef; |
| unsigned Size = Def->getValueAsInt("Size"); |
| if (Def->getValueAsString("Namespace") == "TargetOpcode" || |
| Def->getValueAsBit("isPseudo") || |
| Def->getValueAsBit("isAsmParserOnly") || |
| Def->getValueAsBit("isCodeGenOnly")) |
| continue; |
| |
| StringRef DecoderNamespace = Def->getValueAsString("DecoderNamespace"); |
| |
| if (Size) { |
| if (populateInstruction(Target, *Inst, i, Operands)) { |
| OpcMap[std::make_pair(DecoderNamespace, Size)].push_back(i); |
| } |
| } |
| } |
| |
| DecoderTableInfo TableInfo; |
| for (const auto &Opc : OpcMap) { |
| // Emit the decoder for this namespace+width combination. |
| FilterChooser FC(NumberedInstructions, Opc.second, Operands, |
| 8*Opc.first.second, this); |
| |
| // The decode table is cleared for each top level decoder function. The |
| // predicates and decoders themselves, however, are shared across all |
| // decoders to give more opportunities for uniqueing. |
| TableInfo.Table.clear(); |
| TableInfo.FixupStack.clear(); |
| TableInfo.Table.reserve(16384); |
| TableInfo.FixupStack.emplace_back(); |
| FC.emitTableEntries(TableInfo); |
| // Any NumToSkip fixups in the top level scope can resolve to the |
| // OPC_Fail at the end of the table. |
| assert(TableInfo.FixupStack.size() == 1 && "fixup stack phasing error!"); |
| // Resolve any NumToSkip fixups in the current scope. |
| resolveTableFixups(TableInfo.Table, TableInfo.FixupStack.back(), |
| TableInfo.Table.size()); |
| TableInfo.FixupStack.clear(); |
| |
| TableInfo.Table.push_back(MCD::OPC_Fail); |
| |
| // Print the table to the output stream. |
| emitTable(OS, TableInfo.Table, 0, FC.getBitWidth(), Opc.first.first); |
| OS.flush(); |
| } |
| |
| // Emit the predicate function. |
| emitPredicateFunction(OS, TableInfo.Predicates, 0); |
| |
| // Emit the decoder function. |
| emitDecoderFunction(OS, TableInfo.Decoders, 0); |
| |
| // Emit the main entry point for the decoder, decodeInstruction(). |
| emitDecodeInstruction(OS); |
| |
| OS << "\n} // End llvm namespace\n"; |
| } |
| |
| namespace llvm { |
| |
| void EmitFixedLenDecoder(RecordKeeper &RK, raw_ostream &OS, |
| const std::string &PredicateNamespace, |
| const std::string &GPrefix, |
| const std::string &GPostfix, const std::string &ROK, |
| const std::string &RFail, const std::string &L) { |
| FixedLenDecoderEmitter(RK, PredicateNamespace, GPrefix, GPostfix, |
| ROK, RFail, L).run(OS); |
| } |
| |
| } // end namespace llvm |