diff options
| author | Chandler Carruth <chandlerc@gmail.com> | 2018-08-16 23:11:05 +0000 | 
|---|---|---|
| committer | Chandler Carruth <chandlerc@gmail.com> | 2018-08-16 23:11:05 +0000 | 
| commit | 75ca6be1c11c8084e86a2f44d150699fc9965363 (patch) | |
| tree | cdcad1a49bdafabac386f175b356120a5170fc51 /llvm/lib/CodeGen/MIRParser | |
| parent | 103018e9d99f008bc5dbe956bc978342b26e3658 (diff) | |
| download | bcm5719-llvm-75ca6be1c11c8084e86a2f44d150699fc9965363.tar.gz bcm5719-llvm-75ca6be1c11c8084e86a2f44d150699fc9965363.zip | |
[x86/MIR] Implement support for pre- and post-instruction symbols, as
well as MIR parsing support for `MCSymbol` `MachineOperand`s.
The only real way to test pre- and post-instruction symbol support is to
use them in operands, so I ended up implementing that within the patch
as well. I can split out the operand support if folks really want but it
doesn't really seem worth it.
The functional implementation of pre- and post-instruction symbols is
now *completely trivial*. Two tiny bits of code in the (misnamed)
AsmPrinter. It should be completely target independent as well. We emit
these exactly the same way as we emit basic block labels. Most of the
code here is to give full dumping, MIR printing, and MIR parsing support
so that we can write useful tests.
The MIR parsing of MC symbol operands still isn't 100%, as it forces the
symbols to be non-temporary and non-local symbols with names. However,
those names often can encode most (if not all) of the special semantics
desired, and unnamed symbols seem especially annoying to serialize and
de-serialize. While this isn't perfect or full support, it seems plenty
to write tests that exercise usage of these kinds of operands.
The MIR support for pre-and post-instruction symbols was quite
straightforward. I chose to print them out in an as-if-operand syntax
similar to debug locations as this seemed the cleanest way and let me
use nice introducer tokens rather than inventing more magic punctuation
like we use for memoperands.
However, supporting MIR-based parsing of these symbols caused me to
change the design of the symbol support to allow setting arbitrary
symbols. Without this, I don't see any reasonable way to test things
with MIR.
Differential Revision: https://reviews.llvm.org/D50833
llvm-svn: 339962
Diffstat (limited to 'llvm/lib/CodeGen/MIRParser')
| -rw-r--r-- | llvm/lib/CodeGen/MIRParser/MILexer.cpp | 51 | ||||
| -rw-r--r-- | llvm/lib/CodeGen/MIRParser/MILexer.h | 3 | ||||
| -rw-r--r-- | llvm/lib/CodeGen/MIRParser/MIParser.cpp | 67 | 
3 files changed, 117 insertions, 4 deletions
| diff --git a/llvm/lib/CodeGen/MIRParser/MILexer.cpp b/llvm/lib/CodeGen/MIRParser/MILexer.cpp index da05c9a2278..400e0981a16 100644 --- a/llvm/lib/CodeGen/MIRParser/MILexer.cpp +++ b/llvm/lib/CodeGen/MIRParser/MILexer.cpp @@ -245,6 +245,8 @@ static MIToken::TokenKind getIdentifierKind(StringRef Identifier) {        .Case("successors", MIToken::kw_successors)        .Case("floatpred", MIToken::kw_floatpred)        .Case("intpred", MIToken::kw_intpred) +      .Case("pre-instr-symbol", MIToken::kw_pre_instr_symbol) +      .Case("post-instr-symbol", MIToken::kw_post_instr_symbol)        .Default(MIToken::Identifier);  } @@ -460,6 +462,53 @@ static Cursor maybeLexExternalSymbol(Cursor C, MIToken &Token,                   ErrorCallback);  } +static Cursor maybeLexMCSymbol(Cursor C, MIToken &Token, +                               ErrorCallbackType ErrorCallback) { +  const StringRef Rule = "<mcsymbol "; +  if (!C.remaining().startswith(Rule)) +    return None; +  auto Start = C; +  C.advance(Rule.size()); + +  // Try a simple unquoted name. +  if (C.peek() != '"') { +    while (isIdentifierChar(C.peek())) +      C.advance(); +    StringRef String = Start.upto(C).drop_front(Rule.size()); +    if (C.peek() != '>') { +      ErrorCallback(C.location(), +                    "expected the '<mcsymbol ...' to be closed by a '>'"); +      Token.reset(MIToken::Error, Start.remaining()); +      return Start; +    } +    C.advance(); + +    Token.reset(MIToken::MCSymbol, Start.upto(C)).setStringValue(String); +    return C; +  } + +  // Otherwise lex out a quoted name. +  Cursor R = lexStringConstant(C, ErrorCallback); +  if (!R) { +    ErrorCallback(C.location(), +                  "unable to parse quoted string from opening quote"); +    Token.reset(MIToken::Error, Start.remaining()); +    return Start; +  } +  StringRef String = Start.upto(R).drop_front(Rule.size()); +  if (R.peek() != '>') { +    ErrorCallback(R.location(), +                  "expected the '<mcsymbol ...' to be closed by a '>'"); +    Token.reset(MIToken::Error, Start.remaining()); +    return Start; +  } +  R.advance(); + +  Token.reset(MIToken::MCSymbol, Start.upto(R)) +      .setOwnedStringValue(unescapeQuotedString(String)); +  return R; +} +  static bool isValidHexFloatingPointPrefix(char C) {    return C == 'H' || C == 'K' || C == 'L' || C == 'M';  } @@ -657,6 +706,8 @@ StringRef llvm::lexMIToken(StringRef Source, MIToken &Token,      return R.remaining();    if (Cursor R = maybeLexExternalSymbol(C, Token, ErrorCallback))      return R.remaining(); +  if (Cursor R = maybeLexMCSymbol(C, Token, ErrorCallback)) +    return R.remaining();    if (Cursor R = maybeLexHexadecimalLiteral(C, Token))      return R.remaining();    if (Cursor R = maybeLexNumericalLiteral(C, Token)) diff --git a/llvm/lib/CodeGen/MIRParser/MILexer.h b/llvm/lib/CodeGen/MIRParser/MILexer.h index e21c71532f7..94b460e9ac2 100644 --- a/llvm/lib/CodeGen/MIRParser/MILexer.h +++ b/llvm/lib/CodeGen/MIRParser/MILexer.h @@ -113,6 +113,8 @@ struct MIToken {      kw_successors,      kw_floatpred,      kw_intpred, +    kw_pre_instr_symbol, +    kw_post_instr_symbol,      // Named metadata keywords      md_tbaa, @@ -132,6 +134,7 @@ struct MIToken {      NamedGlobalValue,      GlobalValue,      ExternalSymbol, +    MCSymbol,      // Other tokens      IntegerLiteral, diff --git a/llvm/lib/CodeGen/MIRParser/MIParser.cpp b/llvm/lib/CodeGen/MIRParser/MIParser.cpp index 86d4a380ac7..956f6eceb82 100644 --- a/llvm/lib/CodeGen/MIRParser/MIParser.cpp +++ b/llvm/lib/CodeGen/MIRParser/MIParser.cpp @@ -54,6 +54,7 @@  #include "llvm/IR/Value.h"  #include "llvm/IR/ValueSymbolTable.h"  #include "llvm/MC/LaneBitmask.h" +#include "llvm/MC/MCContext.h"  #include "llvm/MC/MCDwarf.h"  #include "llvm/MC/MCInstrDesc.h"  #include "llvm/MC/MCRegisterInfo.h" @@ -221,6 +222,7 @@ public:    bool parseSubRegisterIndexOperand(MachineOperand &Dest);    bool parseJumpTableIndexOperand(MachineOperand &Dest);    bool parseExternalSymbolOperand(MachineOperand &Dest); +  bool parseMCSymbolOperand(MachineOperand &Dest);    bool parseMDNode(MDNode *&Node);    bool parseDIExpression(MDNode *&Expr);    bool parseMetadataOperand(MachineOperand &Dest); @@ -250,6 +252,7 @@ public:    bool parseOptionalScope(LLVMContext &Context, SyncScope::ID &SSID);    bool parseOptionalAtomicOrdering(AtomicOrdering &Order);    bool parseMachineMemoryOperand(MachineMemOperand *&Dest); +  bool parsePreOrPostInstrSymbol(MCSymbol *&Symbol);  private:    /// Convert the integer literal in the current token into an unsigned integer. @@ -346,6 +349,9 @@ private:    /// Return true if the name isn't a name of a target MMO flag.    bool getMMOTargetFlag(StringRef Name, MachineMemOperand::Flags &Flag); +  /// Get or create an MCSymbol for a given name. +  MCSymbol *getOrCreateMCSymbol(StringRef Name); +    /// parseStringConstant    ///   ::= StringConstant    bool parseStringConstant(std::string &Result); @@ -737,7 +743,9 @@ bool MIParser::parse(MachineInstr *&MI) {      return true;    // Parse the remaining machine operands. -  while (!Token.isNewlineOrEOF() && Token.isNot(MIToken::kw_debug_location) && +  while (!Token.isNewlineOrEOF() && Token.isNot(MIToken::kw_pre_instr_symbol) && +         Token.isNot(MIToken::kw_post_instr_symbol) && +         Token.isNot(MIToken::kw_debug_location) &&           Token.isNot(MIToken::coloncolon) && Token.isNot(MIToken::lbrace)) {      auto Loc = Token.location();      Optional<unsigned> TiedDefIdx; @@ -753,6 +761,15 @@ bool MIParser::parse(MachineInstr *&MI) {      lex();    } +  MCSymbol *PreInstrSymbol = nullptr; +  if (Token.is(MIToken::kw_pre_instr_symbol)) +    if (parsePreOrPostInstrSymbol(PreInstrSymbol)) +      return true; +  MCSymbol *PostInstrSymbol = nullptr; +  if (Token.is(MIToken::kw_post_instr_symbol)) +    if (parsePreOrPostInstrSymbol(PostInstrSymbol)) +      return true; +    DebugLoc DebugLocation;    if (Token.is(MIToken::kw_debug_location)) {      lex(); @@ -795,9 +812,12 @@ bool MIParser::parse(MachineInstr *&MI) {      MI->addOperand(MF, Operand.Operand);    if (assignRegisterTies(*MI, Operands))      return true; -  if (MemOperands.empty()) -    return false; -  MI->setMemRefs(MF, MemOperands); +  if (PreInstrSymbol) +    MI->setPreInstrSymbol(MF, PreInstrSymbol); +  if (PostInstrSymbol) +    MI->setPostInstrSymbol(MF, PostInstrSymbol); +  if (!MemOperands.empty()) +    MI->setMemRefs(MF, MemOperands);    return false;  } @@ -1570,6 +1590,16 @@ bool MIParser::parseExternalSymbolOperand(MachineOperand &Dest) {    return false;  } +bool MIParser::parseMCSymbolOperand(MachineOperand &Dest) { +  assert(Token.is(MIToken::MCSymbol)); +  MCSymbol *Symbol = getOrCreateMCSymbol(Token.stringValue()); +  lex(); +  Dest = MachineOperand::CreateMCSymbol(Symbol); +  if (parseOperandsOffset(Dest)) +    return true; +  return false; +} +  bool MIParser::parseSubRegisterIndexOperand(MachineOperand &Dest) {    assert(Token.is(MIToken::SubRegisterIndex));    StringRef Name = Token.stringValue(); @@ -2047,6 +2077,8 @@ bool MIParser::parseMachineOperand(MachineOperand &Dest,      return parseJumpTableIndexOperand(Dest);    case MIToken::ExternalSymbol:      return parseExternalSymbolOperand(Dest); +  case MIToken::MCSymbol: +    return parseMCSymbolOperand(Dest);    case MIToken::SubRegisterIndex:      return parseSubRegisterIndexOperand(Dest);    case MIToken::md_diexpr: @@ -2526,6 +2558,24 @@ bool MIParser::parseMachineMemoryOperand(MachineMemOperand *&Dest) {    return false;  } +bool MIParser::parsePreOrPostInstrSymbol(MCSymbol *&Symbol) { +  assert((Token.is(MIToken::kw_pre_instr_symbol) || +          Token.is(MIToken::kw_post_instr_symbol)) && +         "Invalid token for a pre- post-instruction symbol!"); +  lex(); +  if (Token.isNot(MIToken::MCSymbol)) +    return error("expected a symbol after 'pre-instr-symbol'"); +  Symbol = getOrCreateMCSymbol(Token.stringValue()); +  lex(); +  if (Token.isNewlineOrEOF() || Token.is(MIToken::coloncolon) || +      Token.is(MIToken::lbrace)) +    return false; +  if (Token.isNot(MIToken::comma)) +    return error("expected ',' before the next machine operand"); +  lex(); +  return false; +} +  void MIParser::initNames2InstrOpCodes() {    if (!Names2InstrOpCodes.empty())      return; @@ -2756,6 +2806,15 @@ bool MIParser::getMMOTargetFlag(StringRef Name,    return false;  } +MCSymbol *MIParser::getOrCreateMCSymbol(StringRef Name) { +  // FIXME: Currently we can't recognize temporary or local symbols and call all +  // of the appropriate forms to create them. However, this handles basic cases +  // well as most of the special aspects are recognized by a prefix on their +  // name, and the input names should already be unique. For test cases, keeping +  // the symbol name out of the symbol table isn't terribly important. +  return MF.getContext().getOrCreateSymbol(Name); +} +  bool MIParser::parseStringConstant(std::string &Result) {    if (Token.isNot(MIToken::StringConstant))      return error("expected string constant"); | 

