doxygen/AsmLexer_8cpp_source.html

//===- AsmLexer.cpp - Lexer for Assembly Files ----------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This class implements the lexer for assembly files.

//

//===----------------------------------------------------------------------===//


#include "llvm/MC/MCParser/AsmLexer.h"

#include "llvm/ADT/APInt.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/ADT/StringExtras.h"

#include "llvm/ADT/StringRef.h"

#include "llvm/MC/MCAsmInfo.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/SMLoc.h"

#include "llvm/Support/SaveAndRestore.h"

#include "llvm/Support/raw_ostream.h"

#include <cassert>

#include <cctype>

#include <cstdio>

#include <cstring>

#include <string>


using namespace llvm;


/// Returns the source location of the first character of this token's text.
SMLoc AsmToken::getLoc() const {
  const char *Begin = Str.data();
  return SMLoc::getFromPointer(Begin);
}


/// Returns the source location one past the last character of this token's
/// text.
SMLoc AsmToken::getEndLoc() const {
  const char *PastEnd = Str.data() + Str.size();
  return SMLoc::getFromPointer(PastEnd);
}


/// Returns the range running from getLoc() to getEndLoc().
SMRange AsmToken::getLocRange() const {
  const SMLoc Begin = getLoc();
  const SMLoc End = getEndLoc();
  return SMRange(Begin, End);
}


/// Writes a debug description of this token to \p OS.
///
/// The output is a kind label, followed by the raw token text for Identifier,
/// Integer, Real and String tokens, and finally the token text once more in
/// escaped form, wrapped as ` ("...")`.
void AsmToken::dump(raw_ostream &OS) const {
  const char *Label = nullptr; // Text identifying the token kind.
  bool EchoText = false;       // Whether the raw text follows the label.

  switch (Kind) {
  case AsmToken::Error:
    Label = "error";
    break;
  case AsmToken::Identifier:
    Label = "identifier: ";
    EchoText = true;
    break;
  case AsmToken::Integer:
    Label = "int: ";
    EchoText = true;
    break;
  case AsmToken::Real:
    Label = "real: ";
    EchoText = true;
    break;
  case AsmToken::String:
    Label = "string: ";
    EchoText = true;
    break;

    // clang-format off
  case AsmToken::Amp:                Label = "Amp"; break;
  case AsmToken::AmpAmp:             Label = "AmpAmp"; break;
  case AsmToken::At:                 Label = "At"; break;
  case AsmToken::BackSlash:          Label = "BackSlash"; break;
  case AsmToken::BigNum:             Label = "BigNum"; break;
  case AsmToken::Caret:              Label = "Caret"; break;
  case AsmToken::Colon:              Label = "Colon"; break;
  case AsmToken::Comma:              Label = "Comma"; break;
  case AsmToken::Comment:            Label = "Comment"; break;
  case AsmToken::Dollar:             Label = "Dollar"; break;
  case AsmToken::Dot:                Label = "Dot"; break;
  case AsmToken::EndOfStatement:     Label = "EndOfStatement"; break;
  case AsmToken::Eof:                Label = "Eof"; break;
  case AsmToken::Equal:              Label = "Equal"; break;
  case AsmToken::EqualEqual:         Label = "EqualEqual"; break;
  case AsmToken::Exclaim:            Label = "Exclaim"; break;
  case AsmToken::ExclaimEqual:       Label = "ExclaimEqual"; break;
  case AsmToken::Greater:            Label = "Greater"; break;
  case AsmToken::GreaterEqual:       Label = "GreaterEqual"; break;
  case AsmToken::GreaterGreater:     Label = "GreaterGreater"; break;
  case AsmToken::Hash:               Label = "Hash"; break;
  case AsmToken::HashDirective:      Label = "HashDirective"; break;
  case AsmToken::LBrac:              Label = "LBrac"; break;
  case AsmToken::LCurly:             Label = "LCurly"; break;
  case AsmToken::LParen:             Label = "LParen"; break;
  case AsmToken::Less:               Label = "Less"; break;
  case AsmToken::LessEqual:          Label = "LessEqual"; break;
  case AsmToken::LessGreater:        Label = "LessGreater"; break;
  case AsmToken::LessLess:           Label = "LessLess"; break;
  case AsmToken::Minus:              Label = "Minus"; break;
  case AsmToken::MinusGreater:       Label = "MinusGreater"; break;
  case AsmToken::Percent:            Label = "Percent"; break;
  case AsmToken::Pipe:               Label = "Pipe"; break;
  case AsmToken::PipePipe:           Label = "PipePipe"; break;
  case AsmToken::Plus:               Label = "Plus"; break;
  case AsmToken::Question:           Label = "Question"; break;
  case AsmToken::RBrac:              Label = "RBrac"; break;
  case AsmToken::RCurly:             Label = "RCurly"; break;
  case AsmToken::RParen:             Label = "RParen"; break;
  case AsmToken::Slash:              Label = "Slash"; break;
  case AsmToken::Space:              Label = "Space"; break;
  case AsmToken::Star:               Label = "Star"; break;
  case AsmToken::Tilde:              Label = "Tilde"; break;
    // clang-format on
  }

  // A kind value not matched above prints no label at all.
  if (Label)
    OS << Label;
  if (EchoText)
    OS << getString();

  // Always finish with the escaped token string.
  OS << " (\"";
  OS.write_escaped(getString());
  OS << "\")";
}


/// Builds a lexer configured from \p MAI and seeds the current-token list with
/// an empty Space token.
AsmLexer::AsmLexer(const MCAsmInfo &MAI) : MAI(MAI) {
  // '@' is only accepted inside identifiers when it does not begin the
  // target's comment string and the target uses '@' for specifiers. (True for
  // COFF targets, should be false for ELF targets.) @specifier parsing
  // currently relies on '@' being part of the token.
  const bool CommentStartsWithAt =
      StringRef(MAI.getCommentString()).starts_with("@");
  AllowAtInIdentifier = !CommentStartsWithAt && MAI.useAtForSpecifier();

  LexMotorolaIntegers = MAI.shouldUseMotorolaIntegers();

  CurTok.emplace_back(AsmToken::Space, StringRef());
}


/// Points the lexer at \p Buf.
///
/// \param Buf  Text to lex. `*Buf.end()` must be readable and equal to '\0'.
/// \param ptr  Position to start lexing from; when null, lexing starts at the
///             beginning of \p Buf.
/// \param EndStatementAtEOF  Stored in the member of the same name.
void AsmLexer::setBuffer(StringRef Buf, const char *ptr,
                         bool EndStatementAtEOF) {
  // The scanning routines dereference CurPtr without bounds checks and rely
  // on this terminator to stop.
  assert(*Buf.end() == '\0' &&
         "Buffer provided to AsmLexer lacks null terminator.");

  CurBuf = Buf;
  CurPtr = ptr ? ptr : CurBuf.begin();
  TokStart = nullptr;
  this->EndStatementAtEOF = EndStatementAtEOF;
}


/// ReturnError - Record \p Msg as the lexer error at \p Loc and hand back an
/// AsmToken::Error token whose text spans from \p Loc to the current lex
/// position.
AsmToken AsmLexer::ReturnError(const char *Loc, const std::string &Msg) {
  SetError(SMLoc::getFromPointer(Loc), Msg);

  const StringRef Offending(Loc, CurPtr - Loc);
  return AsmToken(AsmToken::Error, Offending);
}


/// Consumes and returns the next character as a non-negative value, or returns
/// EOF (without advancing) once CurPtr has reached the end of the buffer.
int AsmLexer::getNextChar() {
  if (CurPtr != CurBuf.end()) {
    const unsigned char Next = static_cast<unsigned char>(*CurPtr);
    ++CurPtr;
    return Next;
  }
  return EOF;
}


/// Returns the next character as a non-negative value without consuming it, or
/// EOF when CurPtr is at the end of the buffer.
int AsmLexer::peekNextChar() {
  const bool AtEnd = CurPtr == CurBuf.end();
  return AtEnd ? EOF : static_cast<unsigned char>(*CurPtr);
}


/// Finishes lexing a decimal floating-point literal and returns it as a Real
/// token spanning from TokStart to the final CurPtr.
///
/// On entry the integral digits and the dot have been consumed; any prefix of
/// the fractional digits may have been consumed as well. A '+' or '-' directly
/// after the fraction is reported as an error.
AsmToken AsmLexer::LexFloatLiteral() {
  const auto SkipDecimalDigits = [this] {
    while (isDigit(*CurPtr))
      ++CurPtr;
  };
  const auto AtSign = [this] { return *CurPtr == '+' || *CurPtr == '-'; };

  // Remainder of the fractional part.
  SkipDecimalDigits();

  if (AtSign())
    return ReturnError(CurPtr, "invalid sign in float literal");

  // Optional exponent: [eE][+-]?[0-9]*
  const bool HasExponent = *CurPtr == 'E' || *CurPtr == 'e';
  if (HasExponent) {
    ++CurPtr;
    if (AtSign())
      ++CurPtr;
    SkipDecimalDigits();
  }

  const StringRef Text(TokStart, CurPtr - TokStart);
  return AsmToken(AsmToken::Real, Text);
}


/// LexHexFloatLiteral lexes the tail of a hexadecimal floating-point constant,
/// essentially (.[0-9a-fA-F]*)?[pP][+-]?[0-9]+, and checks that enough digits
/// are present for the constant to be valid.
///
/// The "0x[0-9a-fA-F]*" integer part has been consumed by the caller;
/// \p NoIntDigits tells us whether that part contained no digits at all.
/// Returns a Real token on success and an Error token otherwise.
AsmToken AsmLexer::LexHexFloatLiteral(bool NoIntDigits) {
  assert((*CurPtr == 'p' || *CurPtr == 'P' || *CurPtr == '.') &&
         "unexpected parse state in floating hex");

  // Optional fractional part.
  bool HasFracDigits = false;
  if (*CurPtr == '.') {
    const char *const AfterDot = ++CurPtr;
    while (isHexDigit(*CurPtr))
      ++CurPtr;
    HasFracDigits = CurPtr != AfterDot;
  }

  // The significand needs a digit on at least one side of the dot.
  if (NoIntDigits && !HasFracDigits)
    return ReturnError(TokStart, "invalid hexadecimal floating-point constant: "
                                 "expected at least one significand digit");

  // The exponent marker is mandatory.
  const bool AtExponent = *CurPtr == 'p' || *CurPtr == 'P';
  if (!AtExponent)
    return ReturnError(TokStart, "invalid hexadecimal floating-point constant: "
                                 "expected exponent part 'p'");
  ++CurPtr;

  if (*CurPtr == '-' || *CurPtr == '+')
    ++CurPtr;

  // Exponent digits are decimal, not hexadecimal.
  const char *const FirstExpDigit = CurPtr;
  while (isDigit(*CurPtr))
    ++CurPtr;

  if (FirstExpDigit == CurPtr)
    return ReturnError(TokStart, "invalid hexadecimal floating-point constant: "
                                 "expected at least one exponent digit");

  const StringRef Text(TokStart, CurPtr - TokStart);
  return AsmToken(AsmToken::Real, Text);
}


/// LexIdentifier: [a-zA-Z_$.@?][a-zA-Z0-9_$.@#?]*


/// Returns true if \p C may appear inside an identifier: alphanumerics, '_',
/// '$', '.', '?', plus '@' when \p AllowAt and '#' when \p AllowHash.
static bool isIdentifierChar(char C, bool AllowAt, bool AllowHash) {
  switch (C) {
  case '_':
  case '$':
  case '.':
  case '?':
    return true;
  case '@':
    return AllowAt;
  case '#':
    return AllowHash;
  default:
    return isAlnum(C);
  }
}


/// Lexes an identifier whose first character has already been consumed.
///
/// Also handles two look-alikes: text such as ".5" or ".5e3" is handed to
/// LexFloatLiteral(), and a lone "." is returned as a Dot token.
AsmToken AsmLexer::LexIdentifier() {
  const auto IsIdentChar = [this](char C) {
    return isIdentifierChar(C, AllowAtInIdentifier, AllowHashInIdentifier);
  };

  // A dot followed by a digit may be a float (".1243") or an identifier
  // (".1243foo"); decide by what follows the digit run.
  const bool LooksLikeFraction = CurPtr[-1] == '.' && isDigit(*CurPtr);
  if (LooksLikeFraction) {
    while (isDigit(*CurPtr))
      ++CurPtr;

    const char Next = *CurPtr;
    if (Next == 'e' || Next == 'E' || !IsIdentChar(Next))
      return LexFloatLiteral();
  }

  while (IsIdentChar(*CurPtr))
    ++CurPtr;

  const size_t Length = CurPtr - TokStart;

  // A single '.' on its own is punctuation, not an identifier.
  if (Length == 1 && TokStart[0] == '.')
    return AsmToken(AsmToken::Dot, StringRef(TokStart, 1));

  return AsmToken(AsmToken::Identifier, StringRef(TokStart, Length));
}


/// LexSlash: called after a '/' has been consumed. Produces one of:
///   Slash:            /
///   C-style comment:  /* ... */   (Comment token)
///   Line comment:     // ...      (delegated to LexLineComment)
/// The two comment forms are only recognised when the target allows additional
/// comments. An unclosed /* yields an Error token.
AsmToken AsmLexer::LexSlash() {
  const auto PlainSlash = [this] {
    IsAtStartOfStatement = false;
    return AsmToken(AsmToken::Slash, StringRef(TokStart, 1));
  };

  if (!MAI.shouldAllowAdditionalComments())
    return PlainSlash();

  if (*CurPtr == '/') {
    ++CurPtr;
    return LexLineComment();
  }

  if (*CurPtr != '*')
    return PlainSlash();

  // Block comment.
  IsAtStartOfStatement = false;
  ++CurPtr; // Step over the '*'.
  const char *const CommentTextStart = CurPtr;

  while (CurPtr != CurBuf.end()) {
    const char Consumed = *CurPtr++;
    if (Consumed != '*' || *CurPtr != '/')
      continue;

    // CurPtr is on the '/' of the closing "*/". Report the text between the
    // delimiters to the consumer, if there is one.
    if (CommentConsumer) {
      const StringRef CommentText(CommentTextStart,
                                  CurPtr - 1 - CommentTextStart);
      CommentConsumer->HandleComment(SMLoc::getFromPointer(CommentTextStart),
                                     CommentText);
    }

    ++CurPtr; // Step over the '/'.
    return AsmToken(AsmToken::Comment, StringRef(TokStart, CurPtr - TokStart));
  }

  return ReturnError(TokStart, "unterminated comment");
}


/// LexLineComment: Comment: #[^\n]*
///                        : //[^\n]*
///
/// Called with CurPtr just past the comment introducer. Consumes the rest of
/// the line together with its terminator ("\n", "\r" or "\r\n") and returns an
/// EndOfStatement token. If a CommentConsumer is installed, it receives the
/// comment text without the line terminator.
AsmToken AsmLexer::LexLineComment() {
  // Mark this as an end of statement with a body of the comment. While it
  // would be nicer to leave this as two tokens, backwards compatibility with
  // TargetParsers makes keeping this in this form better.
  const char *CommentTextStart = CurPtr;
  int CurChar = getNextChar();
  while (CurChar != '\n' && CurChar != '\r' && CurChar != EOF)
    CurChar = getNextChar();

  // getNextChar() steps past a line terminator but leaves CurPtr where it is
  // at EOF. Only back up over the terminator when one was actually read.
  // Otherwise a comment that ends at EOF would lose its last character, and
  // an empty comment at EOF would yield a negative length that wraps around
  // when converted to StringRef's size type.
  const char *CommentTextEnd = (CurChar == EOF) ? CurPtr : CurPtr - 1;

  // Treat "\r\n" as a single line terminator.
  if (CurChar == '\r' && CurPtr != CurBuf.end() && *CurPtr == '\n')
    ++CurPtr;

  // If we have a CommentConsumer, notify it about the comment.
  if (CommentConsumer) {
    CommentConsumer->HandleComment(
        SMLoc::getFromPointer(CommentTextStart),
        StringRef(CommentTextStart, CommentTextEnd - CommentTextStart));
  }

  IsAtStartOfLine = true;
  // This is a whole line comment. leave newline
  if (IsAtStartOfStatement)
    return AsmToken(AsmToken::EndOfStatement,
                    StringRef(TokStart, CurPtr - TokStart));
  IsAtStartOfStatement = true;

  // NOTE(review): this token text stops one character before CurPtr even when
  // the comment ended at EOF rather than at a newline. Left unchanged because
  // parsers may depend on the existing token extents; confirm before altering.
  return AsmToken(AsmToken::EndOfStatement,
                  StringRef(TokStart, CurPtr - 1 - TokStart));
}


/// Advances \p CurPtr past an integer type suffix, if one is present.
///
/// Recognised shapes (in any letter case) are U, L, LL, UL and ULL: at most
/// one 'u' followed by at most two 'l' characters.
static void SkipIgnoredIntegerSuffix(const char *&CurPtr) {
  const char *Cursor = CurPtr;

  if (*Cursor == 'u' || *Cursor == 'U')
    ++Cursor;

  for (int Remaining = 2; Remaining > 0; --Remaining) {
    if (*Cursor != 'l' && *Cursor != 'L')
      break;
    ++Cursor;
  }

  CurPtr = Cursor;
}


// Scans the digit run starting at CurPtr and decides its radix.
//
// When LexHex is set and the run of hex digits is immediately followed by
// [hH], the number is hexadecimal (possibly with leading zeroes): CurPtr is
// left pointing at the 'h' and 16 is returned. Otherwise CurPtr is left at the
// first character that is not a decimal digit and DefaultRadix is returned.
static unsigned doHexLookAhead(const char *&CurPtr, unsigned DefaultRadix,
                               bool LexHex) {
  const char *Scan = CurPtr;

  // Phase 1: the leading decimal digits.
  while (isDigit(*Scan))
    ++Scan;
  const char *const DecimalEnd = Scan;

  // Phase 2: only when an 'h' suffix is possible, continue over hex digits.
  if (LexHex) {
    while (isHexDigit(*Scan))
      ++Scan;

    if (*Scan == 'h' || *Scan == 'H') {
      CurPtr = Scan;
      return 16;
    }
  }

  CurPtr = DecimalEnd;
  return DefaultRadix;
}


/// Returns a pointer to the first character at or after \p CurPtr whose
/// hexDigitValue() is not below \p DefaultRadix. Despite the name, that is one
/// past the last digit of the run.
static const char *findLastDigit(const char *CurPtr, unsigned DefaultRadix) {
  const char *End = CurPtr;
  for (; hexDigitValue(*End) < DefaultRadix; ++End) {
  }
  return End;
}


/// Wraps \p Value in a token with text \p Ref: an Integer token when
/// `Value.isIntN(64)` holds, otherwise a BigNum token.
static AsmToken intToken(StringRef Ref, APInt &Value) {
  const AsmToken::TokenKind Kind =
      Value.isIntN(64) ? AsmToken::Integer : AsmToken::BigNum;
  return AsmToken(Kind, Ref, Value);
}


/// Returns the word used for \p Radix in diagnostics: "binary", "octal",
/// "decimal" or "hexadecimal" for 2, 8, 10 and 16, and "base-N" for any other
/// value N.
static std::string radixName(unsigned Radix) {
  if (Radix == 2)
    return "binary";
  if (Radix == 8)
    return "octal";
  if (Radix == 10)
    return "decimal";
  if (Radix == 16)
    return "hexadecimal";

  std::string Name = "base-";
  Name += std::to_string(Radix);
  return Name;
}


/// LexDigit: First character is [0-9].

///   Local Label: [0-9][:]

///   Forward/Backward Label: [0-9][fb]

///   Binary integer: 0b[01]+

///   Octal integer: 0[0-7]+

///   Hex integer: 0x[0-9a-fA-F]+ or [0x]?[0-9][0-9a-fA-F]*[hH]

///   Decimal integer: [1-9][0-9]*

///
/// The first character of the literal has already been consumed and is read
/// back as CurPtr[-1]. Besides a digit it may be '$' or '%' when Motorola
/// integers are enabled. The flavours are tried in this order: MASM literals
/// with a radix suffix, MASM default-radix literals, Motorola hex/binary,
/// decimal (or float), "0b" binary, "0x" hex (or hex float), and finally
/// octal / 'h'-suffixed hex. Returns an Integer or BigNum token (see
/// intToken), a Real token, or an Error token.
AsmToken AsmLexer::LexDigit() {

  // MASM-flavor binary integer: [01]+[yY] (if DefaultRadix < 16, [bByY])

  // MASM-flavor octal integer: [0-7]+[oOqQ]

  // MASM-flavor decimal integer: [0-9]+[tT] (if DefaultRadix < 16, [dDtT])

  // MASM-flavor hexadecimal integer: [0-9][0-9a-fA-F]*[hH]

  if (LexMasmIntegers && isdigit(CurPtr[-1])) {

    // Track the first character that is not a valid binary / decimal digit.
    // They are used below to recognise a trailing 'b' or 'd' acting as a
    // radix suffix rather than as a hex digit.
    const char *FirstNonBinary =

        (CurPtr[-1] != '0' && CurPtr[-1] != '1') ? CurPtr - 1 : nullptr;

    const char *FirstNonDecimal =

        (CurPtr[-1] < '0' || CurPtr[-1] > '9') ? CurPtr - 1 : nullptr;

    // Remembered so the scan can be undone if no radix suffix is found.
    const char *OldCurPtr = CurPtr;

    while (isHexDigit(*CurPtr)) {

      switch (*CurPtr) {

      default:

        if (!FirstNonDecimal) {

          FirstNonDecimal = CurPtr;

        }

        [[fallthrough]];

      case '9':

      case '8':

      case '7':

      case '6':

      case '5':

      case '4':

      case '3':

      case '2':

        if (!FirstNonBinary) {

          FirstNonBinary = CurPtr;

        }

        break;

      case '1':

      case '0':

        break;

      }

      ++CurPtr;

    }

    if (*CurPtr == '.') {

      // MASM float literals (other than hex floats) always contain a ".", and

      // are always written in decimal.

      ++CurPtr;

      return LexFloatLiteral();

    }


    // A hex-digit run followed by [rR] is returned as a Real token when
    // LexMasmHexFloats is set.
    if (LexMasmHexFloats && (*CurPtr == 'r' || *CurPtr == 'R')) {

      ++CurPtr;

      return AsmToken(AsmToken::Real, StringRef(TokStart, CurPtr - TokStart));

    }


    // Radix stays 0 when no radix suffix is recognised.
    unsigned Radix = 0;

    if (*CurPtr == 'h' || *CurPtr == 'H') {

      // hexadecimal number

      ++CurPtr;

      Radix = 16;

    } else if (*CurPtr == 't' || *CurPtr == 'T') {

      // decimal number

      ++CurPtr;

      Radix = 10;

    } else if (*CurPtr == 'o' || *CurPtr == 'O' || *CurPtr == 'q' ||

               *CurPtr == 'Q') {

      // octal number

      ++CurPtr;

      Radix = 8;

    } else if (*CurPtr == 'y' || *CurPtr == 'Y') {

      // binary number

      ++CurPtr;

      Radix = 2;

    } else if (FirstNonDecimal && FirstNonDecimal + 1 == CurPtr &&

               DefaultRadix < 14 &&

               (*FirstNonDecimal == 'd' || *FirstNonDecimal == 'D')) {

      // The only non-decimal character is a final 'd': decimal suffix. It was
      // already consumed by the hex-digit scan above.
      Radix = 10;

    } else if (FirstNonBinary && FirstNonBinary + 1 == CurPtr &&

               DefaultRadix < 12 &&

               (*FirstNonBinary == 'b' || *FirstNonBinary == 'B')) {

      // The only non-binary character is a final 'b': binary suffix. It was
      // already consumed by the hex-digit scan above.
      Radix = 2;

    }


    if (Radix) {

      StringRef Result(TokStart, CurPtr - TokStart);

      APInt Value(128, 0, true);


      // Result ends with the radix suffix character; drop it before parsing.
      if (Result.drop_back().getAsInteger(Radix, Value))

        return ReturnError(TokStart, "invalid " + radixName(Radix) + " number");


      // MSVC accepts and ignores type suffices on integer literals.

      SkipIgnoredIntegerSuffix(CurPtr);


      return intToken(Result, Value);

    }


    // default-radix integers, or floating point numbers, fall through

    CurPtr = OldCurPtr;

  }


  // MASM default-radix integers: [0-9a-fA-F]+

  // (All other integer literals have a radix specifier.)

  if (LexMasmIntegers && UseMasmDefaultRadix) {

    CurPtr = findLastDigit(CurPtr, 16);

    StringRef Result(TokStart, CurPtr - TokStart);


    APInt Value(128, 0, true);

    if (Result.getAsInteger(DefaultRadix, Value)) {

      return ReturnError(TokStart,

                         "invalid " + radixName(DefaultRadix) + " number");

    }


    return intToken(Result, Value);

  }


  // Motorola hex integers: $[0-9a-fA-F]+

  if (LexMotorolaIntegers && CurPtr[-1] == '$') {

    const char *NumStart = CurPtr;

    while (isHexDigit(CurPtr[0]))

      ++CurPtr;


    // Only the digits after '$' are parsed; the token text includes the '$'.
    APInt Result(128, 0);

    if (StringRef(NumStart, CurPtr - NumStart).getAsInteger(16, Result))

      return ReturnError(TokStart, "invalid hexadecimal number");


    return intToken(StringRef(TokStart, CurPtr - TokStart), Result);

  }


  // Motorola binary integers: %[01]+

  if (LexMotorolaIntegers && CurPtr[-1] == '%') {

    const char *NumStart = CurPtr;

    while (*CurPtr == '0' || *CurPtr == '1')

      ++CurPtr;


    // Only the digits after '%' are parsed; the token text includes the '%'.
    APInt Result(128, 0);

    if (StringRef(NumStart, CurPtr - NumStart).getAsInteger(2, Result))

      return ReturnError(TokStart, "invalid binary number");


    return intToken(StringRef(TokStart, CurPtr - TokStart), Result);

  }


  // Decimal integer: [1-9][0-9]*

  // HLASM-flavour decimal integer: [0-9][0-9]*

  // FIXME: Later on, support for fb for HLASM has to be added in

  // as they probably would be needed for asm goto

  // Taken for HLASM, for a first character other than '0', or for a '0' that
  // is immediately followed by '.'.
  if (LexHLASMIntegers || CurPtr[-1] != '0' || CurPtr[0] == '.') {

    unsigned Radix = doHexLookAhead(CurPtr, 10, LexMasmIntegers);


    if (!LexHLASMIntegers) {

      bool IsHex = Radix == 16;

      // Check for floating point literals.

      if (!IsHex && (*CurPtr == '.' || *CurPtr == 'e' || *CurPtr == 'E')) {

        if (*CurPtr == '.')

          ++CurPtr;

        return LexFloatLiteral();

      }

    }


    StringRef Result(TokStart, CurPtr - TokStart);


    APInt Value(128, 0, true);

    if (Result.getAsInteger(Radix, Value))

      return ReturnError(TokStart, "invalid " + radixName(Radix) + " number");


    if (!LexHLASMIntegers)

      // The darwin/x86 (and x86-64) assembler accepts and ignores type

      // suffices on integer literals.

      SkipIgnoredIntegerSuffix(CurPtr);


    return intToken(Result, Value);

  }


  // From here on the first character is '0' (and not followed by '.').
  if (!LexMasmIntegers && ((*CurPtr == 'b') || (*CurPtr == 'B'))) {

    ++CurPtr;

    // See if we actually have "0b" as part of something like "jmp 0b\n"

    if (!isDigit(CurPtr[0])) {

      // Un-consume the 'b' and return the integer 0 for the lone "0".
      --CurPtr;

      StringRef Result(TokStart, CurPtr - TokStart);

      return AsmToken(AsmToken::Integer, Result, 0);

    }

    const char *NumStart = CurPtr;

    while (CurPtr[0] == '0' || CurPtr[0] == '1')

      ++CurPtr;


    // Requires at least one binary digit.

    if (CurPtr == NumStart)

      return ReturnError(TokStart, "invalid binary number");


    StringRef Result(TokStart, CurPtr - TokStart);


    APInt Value(128, 0, true);

    // substr(2) skips the "0b" prefix.
    if (Result.substr(2).getAsInteger(2, Value))

      return ReturnError(TokStart, "invalid binary number");


    // The darwin/x86 (and x86-64) assembler accepts and ignores ULL and LL

    // suffixes on integer literals.

    SkipIgnoredIntegerSuffix(CurPtr);


    return intToken(Result, Value);

  }


  if ((*CurPtr == 'x') || (*CurPtr == 'X')) {

    ++CurPtr;

    const char *NumStart = CurPtr;

    while (isHexDigit(CurPtr[0]))

      ++CurPtr;


    // "0x.0p0" is valid, and "0x0p0" (but not "0xp0" for example, which will be

    // diagnosed by LexHexFloatLiteral).

    if (CurPtr[0] == '.' || CurPtr[0] == 'p' || CurPtr[0] == 'P')

      return LexHexFloatLiteral(NumStart == CurPtr);


    // Otherwise requires at least one hex digit.

    if (CurPtr == NumStart)

      return ReturnError(CurPtr-2, "invalid hexadecimal number");


    APInt Result(128, 0);

    // Radix 0 is passed here together with text that still has its "0x"
    // prefix.
    if (StringRef(TokStart, CurPtr - TokStart).getAsInteger(0, Result))

      return ReturnError(TokStart, "invalid hexadecimal number");


    // Consume the optional [hH].

    if (LexMasmIntegers && (*CurPtr == 'h' || *CurPtr == 'H'))

      ++CurPtr;


    // The darwin/x86 (and x86-64) assembler accepts and ignores ULL and LL

    // suffixes on integer literals.

    SkipIgnoredIntegerSuffix(CurPtr);


    return intToken(StringRef(TokStart, CurPtr - TokStart), Result);

  }


  // Either octal or hexadecimal.

  APInt Value(128, 0, true);

  unsigned Radix = doHexLookAhead(CurPtr, 8, LexMasmIntegers);

  StringRef Result(TokStart, CurPtr - TokStart);

  if (Result.getAsInteger(Radix, Value))

    return ReturnError(TokStart, "invalid " + radixName(Radix) + " number");


  // Consume the [hH].

  if (Radix == 16)

    ++CurPtr;


  // The darwin/x86 (and x86-64) assembler accepts and ignores ULL and LL

  // suffixes on integer literals.

  SkipIgnoredIntegerSuffix(CurPtr);


  return intToken(Result, Value);

}


/// LexSingleQuote: called after an opening ' has been consumed.
///
///   - HLASM strings: always an error.
///   - MASM strings: lexes a single-quoted String token in which '' stands
///     for an escaped quote.
///   - Otherwise: lexes a character constant such as 'b' or '\n' and returns
///     it as an Integer token.
AsmToken AsmLexer::LexSingleQuote() {
  int CurChar = getNextChar();

  if (LexHLASMStrings)
    return ReturnError(TokStart, "invalid usage of character literals");

  if (LexMasmStrings) {
    for (;;) {
      if (CurChar == EOF)
        return ReturnError(TokStart, "unterminated string constant");

      if (CurChar == '\'') {
        // A quote that is not doubled closes the string.
        if (peekNextChar() != '\'')
          break;
        // Doubled quote: swallow the second one and keep going.
        (void)getNextChar();
      }
      CurChar = getNextChar();
    }
    return AsmToken(AsmToken::String, StringRef(TokStart, CurPtr - TokStart));
  }

  // Character constant: an optional backslash, one character, closing quote.
  if (CurChar == '\\')
    CurChar = getNextChar();

  if (CurChar == EOF)
    return ReturnError(TokStart, "unterminated single quote");

  const int Closing = getNextChar();
  if (Closing != '\'')
    return ReturnError(TokStart, "single quote way too long");

  // 'c' is basically just an integral constant.
  const StringRef Res(TokStart, CurPtr - TokStart);
  long long Value;

  if (!Res.starts_with("\'\\")) {
    Value = TokStart[1];
  } else {
    // Translate the character following the backslash; characters without a
    // special meaning stand for themselves.
    const char Escaped = Res[2];
    switch (Escaped) {
    case 't':
      Value = '\t';
      break;
    case 'n':
      Value = '\n';
      break;
    case 'b':
      Value = '\b';
      break;
    case 'f':
      Value = '\f';
      break;
    case 'r':
      Value = '\r';
      break;
    default:
      Value = Escaped;
      break;
    }
  }

  return AsmToken(AsmToken::Integer, Res, Value);
}


/// LexQuote: called after an opening " has been consumed. Lexes through the
/// closing quote and returns the whole literal, quotes included, as a String
/// token.
///
///   - HLASM strings: always an error.
///   - MASM strings: "" inside the literal stands for an escaped quote.
///   - Otherwise: a backslash makes the following character part of the
///     string, so \" does not terminate it.
AsmToken AsmLexer::LexQuote() {
  int CurChar = getNextChar();

  if (LexHLASMStrings)
    return ReturnError(TokStart, "invalid usage of string literals");

  if (LexMasmStrings) {
    for (;;) {
      if (CurChar == EOF)
        return ReturnError(TokStart, "unterminated string constant");

      if (CurChar == '"') {
        // A quote that is not doubled closes the string.
        if (peekNextChar() != '"')
          break;
        // Doubled quote: swallow the second one and keep going.
        (void)getNextChar();
      }
      CurChar = getNextChar();
    }
    return AsmToken(AsmToken::String, StringRef(TokStart, CurPtr - TokStart));
  }

  for (;;) {
    if (CurChar == '"')
      break;

    // Allow \", etc.: step onto the escaped character so that it is skipped
    // below without being examined.
    if (CurChar == '\\')
      CurChar = getNextChar();

    if (CurChar == EOF)
      return ReturnError(TokStart, "unterminated string constant");

    CurChar = getNextChar();
  }

  return AsmToken(AsmToken::String, StringRef(TokStart, CurPtr - TokStart));
}


/// Advances CurPtr to the end of the current statement and returns the text
/// that was skipped. Scanning stops, without consuming, at the start of a
/// comment, at a statement separator, at '\n' or '\r', or at the end of the
/// buffer. TokStart is set to the starting position.
StringRef AsmLexer::LexUntilEndOfStatement() {
  TokStart = CurPtr;

  for (;;) {
    // Start of a line comment or an end-of-statement marker.
    if (isAtStartOfComment(CurPtr) || isAtStatementSeparator(CurPtr))
      break;
    if (*CurPtr == '\n' || *CurPtr == '\r' || CurPtr == CurBuf.end())
      break;
    ++CurPtr;
  }

  return StringRef(TokStart, CurPtr - TokStart);
}


/// Advances CurPtr up to (not past) the next '\n' or '\r', or to the end of
/// the buffer, and returns the text that was skipped. TokStart is set to the
/// starting position.
StringRef AsmLexer::LexUntilEndOfLine() {
  TokStart = CurPtr;

  for (;;) {
    const bool AtLineBreak = *CurPtr == '\n' || *CurPtr == '\r';
    if (AtLineBreak || CurPtr == CurBuf.end())
      break;
    ++CurPtr;
  }

  return StringRef(TokStart, CurPtr - TokStart);
}


/// Lexes up to Buf.size() upcoming tokens into \p Buf without disturbing the
/// lexer: position, line/statement flags and the recorded error are all put
/// back before returning.
///
/// \param Buf              Receives the peeked tokens.
/// \param ShouldSkipSpace  Value used for SkipSpace while peeking.
/// \returns The number of tokens written. Lexing stops early after an Eof
///          token, which is included in the count.
size_t AsmLexer::peekTokens(MutableArrayRef<AsmToken> Buf,
                            bool ShouldSkipSpace) {
  // Lexer state touched by LexToken(); restored automatically on scope exit.
  SaveAndRestore SavedTokenStart(TokStart);
  SaveAndRestore SavedCurPtr(CurPtr);
  SaveAndRestore SavedAtStartOfLine(IsAtStartOfLine);
  SaveAndRestore SavedAtStartOfStatement(IsAtStartOfStatement);
  SaveAndRestore SavedSkipSpace(SkipSpace, ShouldSkipSpace);
  SaveAndRestore SavedIsPeeking(IsPeeking, true);

  // The error state has no RAII guard, so it is saved and restored by hand.
  std::string SavedErr = getErr();
  SMLoc SavedErrLoc = getErrLoc();

  size_t ReadCount = 0;
  while (ReadCount < Buf.size()) {
    AsmToken Token = LexToken();
    Buf[ReadCount] = Token;
    ++ReadCount;

    if (Token.is(AsmToken::Eof))
      break;
  }

  SetError(SavedErrLoc, SavedErr);
  return ReadCount;
}


/// Returns true if the text at \p Ptr begins a line comment according to the
/// target's comment string. For HLASM this can only be true at the start of a
/// statement.
bool AsmLexer::isAtStartOfComment(const char *Ptr) {
  if (MAI.isHLASM() && !IsAtStartOfStatement)
    return false;

  StringRef CommentString = MAI.getCommentString();

  // Matching the first character is enough for a one-character comment
  // string, and also when the second character is '#', so that a single '#'
  // preprocessor-style comment still counts in the "##" case.
  const bool FirstCharDecides =
      CommentString.size() == 1 || CommentString[1] == '#';
  if (FirstCharDecides)
    return Ptr[0] == CommentString[0];

  // Otherwise the whole comment string has to match.
  return strncmp(Ptr, CommentString.data(), CommentString.size()) == 0;
}


/// Returns true if the text at \p Ptr starts with the target's statement
/// separator string.
bool AsmLexer::isAtStatementSeparator(const char *Ptr) {
  const char *Separator = MAI.getSeparatorString();
  const size_t SeparatorLen = strlen(Separator);
  return strncmp(Ptr, Separator, SeparatorLen) == 0;
}


/// Lexes and returns the next token starting at CurPtr.
///
/// Sets TokStart to the start of the token and keeps IsAtStartOfLine and
/// IsAtStartOfStatement up to date. Comments, statement separators and the
/// implicit end of statement at EOF are checked first; everything else is
/// dispatched on the first character, with multi-character tokens delegated
/// to the Lex* helpers. Unknown characters produce an Error token.
AsmToken AsmLexer::LexToken() {

  TokStart = CurPtr;

  // This always consumes at least one character.

  int CurChar = getNextChar();


  // Skipped while peeking, which keeps the peekTokens() call below from
  // re-entering this block.
  if (!IsPeeking && CurChar == '#' && IsAtStartOfStatement) {

    // If this starts with a '#', this may be a cpp

    // hash directive and otherwise a line comment.

    AsmToken TokenBuf[2];

    MutableArrayRef<AsmToken> Buf(TokenBuf, 2);

    size_t num = peekTokens(Buf, true);

    // There cannot be a space preceding this

    if (IsAtStartOfLine && num == 2 && TokenBuf[0].is(AsmToken::Integer) &&

        TokenBuf[1].is(AsmToken::String)) {

      CurPtr = TokStart; // reset curPtr;

      StringRef s = LexUntilEndOfLine();

      // Push the two peeked tokens back (in reverse order) via UnLex.
      UnLex(TokenBuf[1]);

      UnLex(TokenBuf[0]);

      return AsmToken(AsmToken::HashDirective, s);

    }


    if (MAI.shouldAllowAdditionalComments())

      return LexLineComment();

  }


  if (isAtStartOfComment(TokStart)) {

    StringRef CommentString = MAI.getCommentString();

    // For multi-char comment strings, advance CurPtr only if we matched the

    // full string. This stops us from accidentally eating the newline if the

    // current line ends in a single comment char.

    if (CommentString.size() > 1 &&

        StringRef(TokStart, CommentString.size()) == CommentString) {

      // One character was already consumed by getNextChar() above.
      CurPtr += CommentString.size() - 1;

    }

    return LexLineComment();

  }


  if (isAtStatementSeparator(TokStart)) {

    // One character was already consumed by getNextChar() above.
    CurPtr += strlen(MAI.getSeparatorString()) - 1;

    IsAtStartOfLine = true;

    IsAtStartOfStatement = true;

    return AsmToken(AsmToken::EndOfStatement,

                    StringRef(TokStart, strlen(MAI.getSeparatorString())));

  }


  // If we're missing a newline at EOF, make sure we still get an

  // EndOfStatement token before the Eof token.

  if (CurChar == EOF && !IsAtStartOfStatement && EndStatementAtEOF) {

    IsAtStartOfLine = true;

    IsAtStartOfStatement = true;

    return AsmToken(AsmToken::EndOfStatement, StringRef(TokStart, 0));

  }

  // By default a token ends the "start of line/statement" state; the cases
  // below that must not change IsAtStartOfStatement (whitespace, '/') put the
  // saved value back.
  IsAtStartOfLine = false;

  bool OldIsAtStartOfStatement = IsAtStartOfStatement;

  IsAtStartOfStatement = false;

  switch (CurChar) {

  default:

    // Handle identifier: [a-zA-Z_.$@#?][a-zA-Z0-9_.$@#?]*

    // Whether or not the lexer accepts '$', '@', '#' and '?' at the start of

    // an identifier is target-dependent. These characters are handled in the

    // respective switch cases.

    if (isalpha(CurChar) || CurChar == '_' || CurChar == '.')

      return LexIdentifier();


    // Unknown character, emit an error.

    return ReturnError(TokStart, "invalid character in input");

  case EOF:

    if (EndStatementAtEOF) {

      IsAtStartOfLine = true;

      IsAtStartOfStatement = true;

    }

    return AsmToken(AsmToken::Eof, StringRef(TokStart, 0));

  // A NUL character is handled together with spaces and tabs.
  case 0:

  case ' ':

  case '\t':

    IsAtStartOfStatement = OldIsAtStartOfStatement;

    while (*CurPtr == ' ' || *CurPtr == '\t')

      CurPtr++;

    if (SkipSpace)

      return LexToken(); // Ignore whitespace.

    else

      return AsmToken(AsmToken::Space, StringRef(TokStart, CurPtr - TokStart));

  case '\r': {

    IsAtStartOfLine = true;

    IsAtStartOfStatement = true;

    // If this is a CR followed by LF, treat that as one token.

    if (CurPtr != CurBuf.end() && *CurPtr == '\n')

      ++CurPtr;

    return AsmToken(AsmToken::EndOfStatement,

                    StringRef(TokStart, CurPtr - TokStart));

  }

  case '\n':

    IsAtStartOfLine = true;

    IsAtStartOfStatement = true;

    return AsmToken(AsmToken::EndOfStatement, StringRef(TokStart, 1));

  case ':': return AsmToken(AsmToken::Colon, StringRef(TokStart, 1));

  case '+': return AsmToken(AsmToken::Plus, StringRef(TokStart, 1));

  case '~': return AsmToken(AsmToken::Tilde, StringRef(TokStart, 1));

  case '(': return AsmToken(AsmToken::LParen, StringRef(TokStart, 1));

  case ')': return AsmToken(AsmToken::RParen, StringRef(TokStart, 1));

  case '[': return AsmToken(AsmToken::LBrac, StringRef(TokStart, 1));

  case ']': return AsmToken(AsmToken::RBrac, StringRef(TokStart, 1));

  case '{': return AsmToken(AsmToken::LCurly, StringRef(TokStart, 1));

  case '}': return AsmToken(AsmToken::RCurly, StringRef(TokStart, 1));

  case '*': return AsmToken(AsmToken::Star, StringRef(TokStart, 1));

  case ',': return AsmToken(AsmToken::Comma, StringRef(TokStart, 1));

  case '$': {

    // '$' is tried as a Motorola hex literal first, then as the start of an
    // identifier, and is otherwise plain punctuation.
    if (LexMotorolaIntegers && isHexDigit(*CurPtr))

      return LexDigit();

    if (MAI.doesAllowDollarAtStartOfIdentifier())

      return LexIdentifier();

    return AsmToken(AsmToken::Dollar, StringRef(TokStart, 1));

  }

  case '@':

    if (MAI.doesAllowAtAtStartOfIdentifier())

      return LexIdentifier();

    return AsmToken(AsmToken::At, StringRef(TokStart, 1));

  case '#':

    if (MAI.isHLASM())

      return LexIdentifier();

    return AsmToken(AsmToken::Hash, StringRef(TokStart, 1));

  case '?':

    if (MAI.doesAllowQuestionAtStartOfIdentifier())

      return LexIdentifier();

    return AsmToken(AsmToken::Question, StringRef(TokStart, 1));

  case '\\': return AsmToken(AsmToken::BackSlash, StringRef(TokStart, 1));

  case '=':

    if (*CurPtr == '=') {

      ++CurPtr;

      return AsmToken(AsmToken::EqualEqual, StringRef(TokStart, 2));

    }

    return AsmToken(AsmToken::Equal, StringRef(TokStart, 1));

  case '-':

    if (*CurPtr == '>') {

      ++CurPtr;

      return AsmToken(AsmToken::MinusGreater, StringRef(TokStart, 2));

    }

    return AsmToken(AsmToken::Minus, StringRef(TokStart, 1));

  case '|':

    if (*CurPtr == '|') {

      ++CurPtr;

      return AsmToken(AsmToken::PipePipe, StringRef(TokStart, 2));

    }

    return AsmToken(AsmToken::Pipe, StringRef(TokStart, 1));

  case '^': return AsmToken(AsmToken::Caret, StringRef(TokStart, 1));

  case '&':

    if (*CurPtr == '&') {

      ++CurPtr;

      return AsmToken(AsmToken::AmpAmp, StringRef(TokStart, 2));

    }

    return AsmToken(AsmToken::Amp, StringRef(TokStart, 1));

  case '!':

    if (*CurPtr == '=') {

      ++CurPtr;

      return AsmToken(AsmToken::ExclaimEqual, StringRef(TokStart, 2));

    }

    return AsmToken(AsmToken::Exclaim, StringRef(TokStart, 1));

  case '%':

    // '%' followed by a binary digit is a Motorola binary literal when
    // Motorola integers are enabled.
    if (LexMotorolaIntegers && (*CurPtr == '0' || *CurPtr == '1')) {

      return LexDigit();

    }

    return AsmToken(AsmToken::Percent, StringRef(TokStart, 1));

  case '/':

    // LexSlash() decides how IsAtStartOfStatement changes, so hand it the
    // value from before this token.
    IsAtStartOfStatement = OldIsAtStartOfStatement;

    return LexSlash();

  case '\'': return LexSingleQuote();

  case '"': return LexQuote();

  case '0': case '1': case '2': case '3': case '4':

  case '5': case '6': case '7': case '8': case '9':

    return LexDigit();

  case '<':

    switch (*CurPtr) {

    case '<':

      ++CurPtr;

      return AsmToken(AsmToken::LessLess, StringRef(TokStart, 2));

    case '=':

      ++CurPtr;

      return AsmToken(AsmToken::LessEqual, StringRef(TokStart, 2));

    case '>':

      ++CurPtr;

      return AsmToken(AsmToken::LessGreater, StringRef(TokStart, 2));

    default:

      return AsmToken(AsmToken::Less, StringRef(TokStart, 1));

    }

  case '>':

    switch (*CurPtr) {

    case '>':

      ++CurPtr;

      return AsmToken(AsmToken::GreaterGreater, StringRef(TokStart, 2));

    case '=':

      ++CurPtr;

      return AsmToken(AsmToken::GreaterEqual, StringRef(TokStart, 2));

    default:

      return AsmToken(AsmToken::Greater, StringRef(TokStart, 1));

    }


  // TODO: Quoted identifiers (objc methods etc)

  // local labels: [0-9][:]

  // Forward/backward labels: [0-9][fb]

  // Integers, fp constants, character constants.

  }

}

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

APInt.h
This file implements a class to represent arbitrary precision integral constant values and operations...

ArrayRef.h

radixName
static std::string radixName(unsigned Radix)
Definition AsmLexer.cpp:387

SkipIgnoredIntegerSuffix
static void SkipIgnoredIntegerSuffix(const char *&CurPtr)
Definition AsmLexer.cpp:337

doHexLookAhead
static unsigned doHexLookAhead(const char *&CurPtr, unsigned DefaultRadix, bool LexHex)
Definition AsmLexer.cpp:349

intToken
static AsmToken intToken(StringRef Ref, APInt &Value)
Definition AsmLexer.cpp:381

findLastDigit
static const char * findLastDigit(const char *CurPtr, unsigned DefaultRadix)
Definition AsmLexer.cpp:374

AsmLexer.h

Compiler.h

MCAsmInfo.h

isIdentifierChar
static bool isIdentifierChar(char C)
Return true if the given character satisfies the following regular expression: [-a-zA-Z$._0-9].
Definition MILexer.cpp:118

SMLoc.h

SaveAndRestore.h
This file provides utility classes that use RAII to save and restore values.

StringExtras.h
This file contains some functions that are useful when dealing with strings.

StringRef.h

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::ArrayRef::size
size_t size() const
size - Get the array size.
Definition ArrayRef.h:142

llvm::AsmLexer::AsmLexer
LLVM_ABI AsmLexer(const MCAsmInfo &MAI)
Definition AsmLexer.cpp:110

llvm::AsmLexer::UnLex
void UnLex(AsmToken const &Token)
Definition AsmLexer.h:106

llvm::AsmLexer::is
bool is(AsmToken::TokenKind K) const
Check if the current token has kind K.
Definition AsmLexer.h:147

llvm::AsmLexer::getErrLoc
SMLoc getErrLoc()
Get the current error location.
Definition AsmLexer.h:138

llvm::AsmLexer::getErr
const std::string & getErr()
Get the current error string.
Definition AsmLexer.h:141

llvm::AsmLexer::LexUntilEndOfStatement
LLVM_ABI StringRef LexUntilEndOfStatement()
Definition AsmLexer.cpp:748

llvm::AsmLexer::setBuffer
LLVM_ABI void setBuffer(StringRef Buf, const char *ptr=nullptr, bool EndStatementAtEOF=true)
Set buffer to be lexed.
Definition AsmLexer.cpp:120

llvm::AsmLexer::peekTokens
LLVM_ABI size_t peekTokens(MutableArrayRef< AsmToken > Buf, bool ShouldSkipSpace=true)
Look ahead an arbitrary number of tokens.
Definition AsmLexer.cpp:768

llvm::AsmToken
Target independent representation for an assembler token.
Definition MCAsmMacro.h:22

llvm::AsmToken::getLoc
LLVM_ABI SMLoc getLoc() const
Definition AsmLexer.cpp:31

llvm::AsmToken::getString
StringRef getString() const
Get the string for the current token, this includes all characters (for example, the quotes on strings) in the token.
Definition MCAsmMacro.h:103

llvm::AsmToken::is
bool is(TokenKind K) const
Definition MCAsmMacro.h:75

llvm::AsmToken::getEndLoc
LLVM_ABI SMLoc getEndLoc() const
Definition AsmLexer.cpp:33

llvm::AsmToken::dump
LLVM_ABI void dump(raw_ostream &OS) const
Definition AsmLexer.cpp:39

llvm::AsmToken::Comment
@ Comment
Definition MCAsmMacro.h:40

llvm::AsmToken::Greater
@ Greater
Definition MCAsmMacro.h:55

llvm::AsmToken::Minus
@ Minus
Definition MCAsmMacro.h:46

llvm::AsmToken::Eof
@ Eof
Definition MCAsmMacro.h:26

llvm::AsmToken::Tilde
@ Tilde
Definition MCAsmMacro.h:46

llvm::AsmToken::String
@ String
Definition MCAsmMacro.h:30

llvm::AsmToken::Error
@ Error
Definition MCAsmMacro.h:26

llvm::AsmToken::Space
@ Space
Definition MCAsmMacro.h:45

llvm::AsmToken::Integer
@ Integer
Definition MCAsmMacro.h:33

llvm::AsmToken::RBrac
@ RBrac
Definition MCAsmMacro.h:49

llvm::AsmToken::Colon
@ Colon
Definition MCAsmMacro.h:44

llvm::AsmToken::LessLess
@ LessLess
Definition MCAsmMacro.h:54

llvm::AsmToken::Percent
@ Percent
Definition MCAsmMacro.h:53

llvm::AsmToken::LBrac
@ LBrac
Definition MCAsmMacro.h:49

llvm::AsmToken::BackSlash
@ BackSlash
Definition MCAsmMacro.h:48

llvm::AsmToken::Caret
@ Caret
Definition MCAsmMacro.h:52

llvm::AsmToken::RCurly
@ RCurly
Definition MCAsmMacro.h:49

llvm::AsmToken::LessEqual
@ LessEqual
Definition MCAsmMacro.h:54

llvm::AsmToken::At
@ At
Definition MCAsmMacro.h:55

llvm::AsmToken::AmpAmp
@ AmpAmp
Definition MCAsmMacro.h:53

llvm::AsmToken::GreaterEqual
@ GreaterEqual
Definition MCAsmMacro.h:55

llvm::AsmToken::HashDirective
@ HashDirective
Definition MCAsmMacro.h:41

llvm::AsmToken::Question
@ Question
Definition MCAsmMacro.h:50

llvm::AsmToken::LessGreater
@ LessGreater
Definition MCAsmMacro.h:54

llvm::AsmToken::Pipe
@ Pipe
Definition MCAsmMacro.h:52

llvm::AsmToken::Hash
@ Hash
Definition MCAsmMacro.h:53

llvm::AsmToken::Identifier
@ Identifier
Definition MCAsmMacro.h:29

llvm::AsmToken::Amp
@ Amp
Definition MCAsmMacro.h:53

llvm::AsmToken::LParen
@ LParen
Definition MCAsmMacro.h:49

llvm::AsmToken::Star
@ Star
Definition MCAsmMacro.h:50

llvm::AsmToken::BigNum
@ BigNum
Definition MCAsmMacro.h:34

llvm::AsmToken::EqualEqual
@ EqualEqual
Definition MCAsmMacro.h:50

llvm::AsmToken::Less
@ Less
Definition MCAsmMacro.h:54

llvm::AsmToken::LCurly
@ LCurly
Definition MCAsmMacro.h:49

llvm::AsmToken::Slash
@ Slash
Definition MCAsmMacro.h:47

llvm::AsmToken::RParen
@ RParen
Definition MCAsmMacro.h:49

llvm::AsmToken::GreaterGreater
@ GreaterGreater
Definition MCAsmMacro.h:55

llvm::AsmToken::PipePipe
@ PipePipe
Definition MCAsmMacro.h:52

llvm::AsmToken::Equal
@ Equal
Definition MCAsmMacro.h:50

llvm::AsmToken::Dollar
@ Dollar
Definition MCAsmMacro.h:50

llvm::AsmToken::MinusGreater
@ MinusGreater
Definition MCAsmMacro.h:55

llvm::AsmToken::Comma
@ Comma
Definition MCAsmMacro.h:50

llvm::AsmToken::Plus
@ Plus
Definition MCAsmMacro.h:46

llvm::AsmToken::Real
@ Real
Definition MCAsmMacro.h:37

llvm::AsmToken::ExclaimEqual
@ ExclaimEqual
Definition MCAsmMacro.h:53

llvm::AsmToken::EndOfStatement
@ EndOfStatement
Definition MCAsmMacro.h:43

llvm::AsmToken::Dot
@ Dot
Definition MCAsmMacro.h:50

llvm::AsmToken::Exclaim
@ Exclaim
Definition MCAsmMacro.h:53

llvm::AsmToken::getLocRange
LLVM_ABI SMRange getLocRange() const
Definition AsmLexer.cpp:37

llvm::MCAsmInfo
This class is intended to be used as a base class for asm properties and features specific to the target.
Definition MCAsmInfo.h:64

llvm::MCAsmInfo::isHLASM
bool isHLASM() const
Definition MCAsmInfo.h:520

llvm::MCAsmInfo::getCommentString
StringRef getCommentString() const
Definition MCAsmInfo.h:538

llvm::MCAsmInfo::getSeparatorString
const char * getSeparatorString() const
Definition MCAsmInfo.h:533

llvm::MutableArrayRef
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memory), i.e. a start pointer and a length.
Definition ArrayRef.h:298

llvm::SMLoc
Represents a location in source code.
Definition SMLoc.h:22

llvm::SMLoc::getFromPointer
static SMLoc getFromPointer(const char *Ptr)
Definition SMLoc.h:35

llvm::SMRange
Represents a range in source code.
Definition SMLoc.h:47

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55

llvm::StringRef::starts_with
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
Definition StringRef.h:261

llvm::StringRef::size
constexpr size_t size() const
size - Get the string size.
Definition StringRef.h:146

llvm::StringRef::data
constexpr const char * data() const
data - Get a pointer to the start of the string (which may not be null terminated).
Definition StringRef.h:140

llvm::StringRef::end
iterator end() const
Definition StringRef.h:114

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53

llvm::raw_ostream::write_escaped
raw_ostream & write_escaped(StringRef Str, bool UseHexEscapes=false)
Output Str, turning '\', '\t', '\n', '"', and anything that doesn't satisfy llvm::isPrint into an escape sequence.
Definition raw_ostream.cpp:158

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::Loc
Definition DwarfDebug.h:129

llvm::ms_demangle::QualifierMangleMode::Result
@ Result
Definition MicrosoftDemangle.h:132

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::Value
FunctionAddr VTableAddr Value
Definition InstrProf.h:137

llvm::hexDigitValue
unsigned hexDigitValue(char C)
Interpret the given character C as a hexadecimal digit and return its value.
Definition StringExtras.h:81

llvm::isDigit
bool isDigit(char C)
Checks if character C is one of the 10 decimal digits.
Definition StringExtras.h:106

llvm::isAlnum
bool isAlnum(char C)
Checks whether character C is either a decimal digit or an uppercase or lowercase letter as classified by the "C" locale.
Definition StringExtras.h:122

llvm::MutableArrayRef
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >

llvm::ModRefInfo::Ref
@ Ref
The access may reference the value stored in memory.
Definition ModRef.h:32

llvm::isHexDigit
bool isHexDigit(char C)
Checks if character C is a hexadecimal numeric character.
Definition StringExtras.h:109

raw_ostream.h

llvm::SaveAndRestore
A utility class that uses RAII to save and restore the value of a variable.
Definition SaveAndRestore.h:23