llvm-project/llvm/tools/llvm-mc/AsmLexer.h

119 lines
3.0 KiB
C
Raw Normal View History

2009-06-21 15:19:10 +08:00
//===- AsmLexer.h - Lexer for Assembly Files --------------------*- C++ -*-===//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This class declares the lexer for assembly files.
//
//===----------------------------------------------------------------------===//
#ifndef ASMLEXER_H
#define ASMLEXER_H
#include "llvm/Support/DataTypes.h"
#include <string>
#include <cassert>
namespace llvm {
class MemoryBuffer;
class SourceMgr;
class SMLoc;
namespace asmtok {
enum TokKind {
// Markers
Eof, Error,
2009-06-22 03:56:35 +08:00
// String values.
2009-06-21 15:19:10 +08:00
Identifier,
Register,
2009-06-22 03:56:35 +08:00
String,
// Integer values.
2009-06-21 15:19:10 +08:00
IntVal,
2009-06-22 03:56:35 +08:00
// No-value.
EndOfStatement,
2009-06-21 15:19:10 +08:00
Colon,
Plus, Minus, Tilde,
Slash, // '/'
LParen, RParen,
Star, Comma, Dollar, Equal, EqualEqual,
Pipe, PipePipe, Caret,
Amp, AmpAmp, Exclaim, ExclaimEqual, Percent,
Less, LessEqual, LessLess, LessGreater,
Greater, GreaterEqual, GreaterGreater
2009-06-21 15:19:10 +08:00
};
}
/// AsmLexer - Lexer class for assembly files.
class AsmLexer {
SourceMgr &SrcMgr;
const char *CurPtr;
const MemoryBuffer *CurBuf;
// A llvm::StringSet<>, which provides uniqued and null-terminated strings.
void *TheStringSet;
2009-06-21 15:19:10 +08:00
// Information about the current token.
const char *TokStart;
asmtok::TokKind CurKind;
const char *CurStrVal; // This is valid for Identifier.
2009-06-21 15:19:10 +08:00
int64_t CurIntVal;
/// CurBuffer - This is the current buffer index we're lexing from as managed
/// by the SourceMgr object.
int CurBuffer;
void operator=(const AsmLexer&); // DO NOT IMPLEMENT
AsmLexer(const AsmLexer&); // DO NOT IMPLEMENT
2009-06-21 15:19:10 +08:00
public:
AsmLexer(SourceMgr &SrcMgr);
~AsmLexer();
2009-06-21 15:19:10 +08:00
asmtok::TokKind Lex() {
return CurKind = LexToken();
}
asmtok::TokKind getKind() const { return CurKind; }
bool is(asmtok::TokKind K) const { return CurKind == K; }
bool isNot(asmtok::TokKind K) const { return CurKind != K; }
2009-06-21 15:19:10 +08:00
const char *getCurStrVal() const {
2009-06-22 03:56:35 +08:00
assert((CurKind == asmtok::Identifier || CurKind == asmtok::Register ||
CurKind == asmtok::String) &&
2009-06-21 15:19:10 +08:00
"This token doesn't have a string value");
return CurStrVal;
}
int64_t getCurIntVal() const {
assert(CurKind == asmtok::IntVal && "This token isn't an integer");
return CurIntVal;
}
SMLoc getLoc() const;
void PrintMessage(SMLoc Loc, const std::string &Msg, const char *Type) const;
2009-06-21 15:19:10 +08:00
private:
int getNextChar();
asmtok::TokKind ReturnError(const char *Loc, const std::string &Msg);
2009-06-21 15:19:10 +08:00
/// LexToken - Read the next token and return its code.
asmtok::TokKind LexToken();
asmtok::TokKind LexIdentifier();
asmtok::TokKind LexPercent();
asmtok::TokKind LexSlash();
asmtok::TokKind LexLineComment();
asmtok::TokKind LexDigit();
2009-06-22 03:56:35 +08:00
asmtok::TokKind LexQuote();
2009-06-21 15:19:10 +08:00
};
} // end namespace llvm
#endif