|
|
//===-- llvm/MC/MCAsmLexer.h - Abstract Asm Lexer Interface -----*- C++ -*-===//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
#ifndef LLVM_MC_MCPARSER_MCASMLEXER_H
#define LLVM_MC_MCPARSER_MCASMLEXER_H
#include "llvm/ADT/StringRef.h"
#include "llvm/Support/Compiler.h"
#include "llvm/Support/DataTypes.h"
#include "llvm/Support/SMLoc.h"
namespace llvm {
/// AsmToken - Target independent representation for an assembler token.
class AsmToken { public: enum TokenKind { // Markers
Eof, Error,
// String values.
Identifier, String,
// Integer values.
Integer,
// Real values.
Real,
// No-value.
EndOfStatement, Colon, Space, Plus, Minus, Tilde, Slash, // '/'
BackSlash, // '\'
LParen, RParen, LBrac, RBrac, LCurly, RCurly, Star, Dot, Comma, Dollar, Equal, EqualEqual,
Pipe, PipePipe, Caret, Amp, AmpAmp, Exclaim, ExclaimEqual, Percent, Hash, Less, LessEqual, LessLess, LessGreater, Greater, GreaterEqual, GreaterGreater, At };
private: TokenKind Kind;
/// A reference to the entire token contents; this is always a pointer into
/// a memory buffer owned by the source manager.
StringRef Str;
int64_t IntVal;
public: AsmToken() {} AsmToken(TokenKind _Kind, StringRef _Str, int64_t _IntVal = 0) : Kind(_Kind), Str(_Str), IntVal(_IntVal) {}
TokenKind getKind() const { return Kind; } bool is(TokenKind K) const { return Kind == K; } bool isNot(TokenKind K) const { return Kind != K; }
SMLoc getLoc() const; SMLoc getEndLoc() const;
/// getStringContents - Get the contents of a string token (without quotes).
StringRef getStringContents() const { assert(Kind == String && "This token isn't a string!"); return Str.slice(1, Str.size() - 1); }
/// getIdentifier - Get the identifier string for the current token, which
/// should be an identifier or a string. This gets the portion of the string
/// which should be used as the identifier, e.g., it does not include the
/// quotes on strings.
StringRef getIdentifier() const { if (Kind == Identifier) return getString(); return getStringContents(); }
/// getString - Get the string for the current token, this includes all
/// characters (for example, the quotes on strings) in the token.
///
/// The returned StringRef points into the source manager's memory buffer, and
/// is safe to store across calls to Lex().
StringRef getString() const { return Str; }
// FIXME: Don't compute this in advance, it makes every token larger, and is
// also not generally what we want (it is nicer for recovery etc. to lex 123br
// as a single token, then diagnose as an invalid number).
int64_t getIntVal() const { assert(Kind == Integer && "This token isn't an integer!"); return IntVal; } };
/// MCAsmLexer - Generic assembler lexer interface, for use by target specific
/// assembly lexers.
class MCAsmLexer { /// The current token, stored in the base class for faster access.
AsmToken CurTok;
/// The location and description of the current error
SMLoc ErrLoc; std::string Err;
MCAsmLexer(const MCAsmLexer &) LLVM_DELETED_FUNCTION; void operator=(const MCAsmLexer &) LLVM_DELETED_FUNCTION; protected: // Can only create subclasses.
const char *TokStart; bool SkipSpace;
MCAsmLexer();
virtual AsmToken LexToken() = 0;
void SetError(const SMLoc &errLoc, const std::string &err) { ErrLoc = errLoc; Err = err; }
public: virtual ~MCAsmLexer();
/// Lex - Consume the next token from the input stream and return it.
///
/// The lexer will continuosly return the end-of-file token once the end of
/// the main input file has been reached.
const AsmToken &Lex() { return CurTok = LexToken(); }
virtual StringRef LexUntilEndOfStatement() = 0;
/// getLoc - Get the current source location.
SMLoc getLoc() const;
/// getTok - Get the current (last) lexed token.
const AsmToken &getTok() { return CurTok; }
/// getErrLoc - Get the current error location
const SMLoc &getErrLoc() { return ErrLoc; }
/// getErr - Get the current error string
const std::string &getErr() { return Err; }
/// getKind - Get the kind of current token.
AsmToken::TokenKind getKind() const { return CurTok.getKind(); }
/// is - Check if the current token has kind \p K.
bool is(AsmToken::TokenKind K) const { return CurTok.is(K); }
/// isNot - Check if the current token has kind \p K.
bool isNot(AsmToken::TokenKind K) const { return CurTok.isNot(K); }
/// setSkipSpace - Set whether spaces should be ignored by the lexer
void setSkipSpace(bool val) { SkipSpace = val; } };
} // End llvm namespace
#endif
|