| //===-EDToken.h - LLVM Enhanced Disassembler --------------------*- C++ -*-===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file defines the interface for the Enhanced Disassembly library's token |
| // class. The token is responsible for vending information about the token, |
| // such as its type and logical value. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #ifndef LLVM_EDTOKEN_H |
| #define LLVM_EDTOKEN_H |
| |
| #include "llvm/ADT/StringRef.h" |
| #include "llvm/Support/DataTypes.h" |
| #include <string> |
| #include <vector> |
| |
| namespace llvm { |
| |
| struct EDDisassembler; |
| |
| /// EDToken - Encapsulates a single token, which can provide a string |
| /// representation of itself or interpret itself in various ways, depending |
| /// on the token type. |
| struct EDToken { |
| enum tokenType { |
| kTokenWhitespace, |
| kTokenOpcode, |
| kTokenLiteral, |
| kTokenRegister, |
| kTokenPunctuation |
| }; |
| |
| /// The parent disassembler |
| EDDisassembler &Disassembler; |
| |
| /// The token's string representation |
| llvm::StringRef Str; |
| /// The token's string representation, but in a form suitable for export |
| std::string PermStr; |
| /// The type of the token, as exposed through the external API |
| enum tokenType Type; |
| /// The type of the token, as recorded by the syntax-specific tokenizer |
| uint64_t LocalType; |
| /// The operand corresponding to the token, or (unsigned int)-1 if not |
| /// part of an operand. |
| int OperandID; |
| |
| /// The sign if the token is a literal (1 if negative, 0 otherwise) |
| bool LiteralSign; |
| /// The absolute value if the token is a literal |
| uint64_t LiteralAbsoluteValue; |
| /// The LLVM register ID if the token is a register name |
| unsigned RegisterID; |
| |
| /// Constructor - Initializes an EDToken with the information common to all |
| /// tokens |
| /// |
| /// @arg str - The string corresponding to the token |
| /// @arg type - The token's type as exposed through the public API |
| /// @arg localType - The token's type as recorded by the tokenizer |
| /// @arg disassembler - The disassembler responsible for the token |
| EDToken(llvm::StringRef str, |
| enum tokenType type, |
| uint64_t localType, |
| EDDisassembler &disassembler); |
| |
| /// makeLiteral - Adds the information specific to a literal |
| /// @arg sign - The sign of the literal (1 if negative, 0 |
| /// otherwise) |
| /// |
| /// @arg absoluteValue - The absolute value of the literal |
| void makeLiteral(bool sign, uint64_t absoluteValue); |
| /// makeRegister - Adds the information specific to a register |
| /// |
| /// @arg registerID - The LLVM register ID |
| void makeRegister(unsigned registerID); |
| |
| /// setOperandID - Links the token to a numbered operand |
| /// |
| /// @arg operandID - The operand ID to link to |
| void setOperandID(int operandID); |
| |
| ~EDToken(); |
| |
| /// type - Returns the public type of the token |
| enum tokenType type() const; |
| /// localType - Returns the tokenizer-specific type of the token |
| uint64_t localType() const; |
| /// string - Returns the string representation of the token |
| llvm::StringRef string() const; |
| /// operandID - Returns the operand ID of the token |
| int operandID() const; |
| |
| /// literalSign - Returns the sign of the token |
| /// (1 if negative, 0 if positive or unsigned, -1 if it is not a literal) |
| int literalSign() const; |
| /// literalAbsoluteValue - Retrieves the absolute value of the token, and |
| /// returns -1 if the token is not a literal |
| /// @arg value - A reference to a value that is filled in with the absolute |
| /// value, if it is valid |
| int literalAbsoluteValue(uint64_t &value) const; |
| /// registerID - Retrieves the register ID of the token, and returns -1 if the |
| /// token is not a register |
| /// |
| /// @arg registerID - A reference to a value that is filled in with the |
| /// register ID, if it is valid |
| int registerID(unsigned ®isterID) const; |
| |
| /// tokenize - Tokenizes a string using the platform- and syntax-specific |
| /// tokenizer, and returns 0 on success (-1 on failure) |
| /// |
| /// @arg tokens - A vector that will be filled in with pointers to |
| /// allocated tokens |
| /// @arg str - The string, as outputted by the AsmPrinter |
| /// @arg operandOrder - The order of the operands from the operandFlags array |
| /// as they appear in str |
| /// @arg disassembler - The disassembler for the desired target and |
| // assembly syntax |
| static int tokenize(std::vector<EDToken*> &tokens, |
| std::string &str, |
| const signed char *operandOrder, |
| EDDisassembler &disassembler); |
| |
| /// getString - Directs a character pointer to the string, returning 0 on |
| /// success (-1 on failure) |
| /// @arg buf - A reference to a pointer that is set to point to the string. |
| /// The string is still owned by the token. |
| int getString(const char*& buf); |
| }; |
| |
| } // end namespace llvm |
| #endif |