2007-11-18 16:46:26 +08:00
|
|
|
//===- LLLexer.h - Lexer for LLVM Assembly Files ----------------*- C++ -*-===//
|
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
2007-12-30 04:36:04 +08:00
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
2007-11-18 16:46:26 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This class represents the Lexer for .ll files.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2014-08-14 00:26:38 +08:00
|
|
|
#ifndef LLVM_LIB_ASMPARSER_LLLEXER_H
|
|
|
|
#define LLVM_LIB_ASMPARSER_LLLEXER_H
|
2007-11-18 16:46:26 +08:00
|
|
|
|
2009-01-02 15:01:27 +08:00
|
|
|
#include "LLToken.h"
|
|
|
|
#include "llvm/ADT/APFloat.h"
|
2012-12-04 15:12:27 +08:00
|
|
|
#include "llvm/ADT/APSInt.h"
|
2009-07-03 07:08:13 +08:00
|
|
|
#include "llvm/Support/SourceMgr.h"
|
2009-01-03 06:49:28 +08:00
|
|
|
#include <string>
|
2007-11-18 16:46:26 +08:00
|
|
|
|
|
|
|
namespace llvm {
|
|
|
|
class MemoryBuffer;
|
2009-01-02 15:01:27 +08:00
|
|
|
class Type;
|
2009-07-03 06:46:18 +08:00
|
|
|
class SMDiagnostic;
|
2009-08-12 01:45:13 +08:00
|
|
|
class LLVMContext;
|
2009-01-03 06:46:48 +08:00
|
|
|
|
2013-09-12 02:05:11 +08:00
|
|
|
class LLLexer {
|
2007-11-18 16:46:26 +08:00
|
|
|
const char *CurPtr;
|
2014-08-19 06:28:28 +08:00
|
|
|
StringRef CurBuf;
|
2009-07-03 06:46:18 +08:00
|
|
|
SMDiagnostic &ErrorInfo;
|
2009-07-03 07:08:13 +08:00
|
|
|
SourceMgr &SM;
|
2009-07-08 02:44:11 +08:00
|
|
|
LLVMContext &Context;
|
2009-01-02 15:01:27 +08:00
|
|
|
|
|
|
|
// Information about the current token.
|
2007-11-18 16:46:26 +08:00
|
|
|
const char *TokStart;
|
2009-01-02 15:01:27 +08:00
|
|
|
lltok::Kind CurKind;
|
|
|
|
std::string StrVal;
|
|
|
|
unsigned UIntVal;
|
Land the long talked about "type system rewrite" patch. This
patch brings numerous advantages to LLVM. One way to look at it
is through diffstat:
109 files changed, 3005 insertions(+), 5906 deletions(-)
Removing almost 3K lines of code is a good thing. Other advantages
include:
1. Value::getType() is a simple load that can be CSE'd, not a mutating
union-find operation.
2. Types a uniqued and never move once created, defining away PATypeHolder.
3. Structs can be "named" now, and their name is part of the identity that
uniques them. This means that the compiler doesn't merge them structurally
which makes the IR much less confusing.
4. Now that there is no way to get a cycle in a type graph without a named
struct type, "upreferences" go away.
5. Type refinement is completely gone, which should make LTO much MUCH faster
in some common cases with C++ code.
6. Types are now generally immutable, so we can use "Type *" instead
"const Type *" everywhere.
Downsides of this patch are that it removes some functions from the C API,
so people using those will have to upgrade to (not yet added) new API.
"LLVM 3.0" is the right time to do this.
There are still some cleanups pending after this, this patch is large enough
as-is.
llvm-svn: 134829
2011-07-10 01:41:24 +08:00
|
|
|
Type *TyVal;
|
2009-01-02 15:01:27 +08:00
|
|
|
APFloat APFloatVal;
|
|
|
|
APSInt APSIntVal;
|
2009-01-03 06:46:48 +08:00
|
|
|
|
2018-06-26 21:56:49 +08:00
|
|
|
// When false (default), an identifier ending in ':' is a label token.
|
|
|
|
// When true, the ':' is treated as a separate token.
|
|
|
|
bool IgnoreColonInIdentifiers;
|
|
|
|
|
2007-11-18 16:46:26 +08:00
|
|
|
public:
|
2014-08-19 06:28:28 +08:00
|
|
|
explicit LLLexer(StringRef StartBuf, SourceMgr &SM, SMDiagnostic &,
|
2009-07-08 02:44:11 +08:00
|
|
|
LLVMContext &C);
|
2007-11-18 16:46:26 +08:00
|
|
|
|
2009-01-02 15:01:27 +08:00
|
|
|
lltok::Kind Lex() {
|
|
|
|
return CurKind = LexToken();
|
|
|
|
}
|
|
|
|
|
2009-07-03 07:08:13 +08:00
|
|
|
typedef SMLoc LocTy;
|
|
|
|
LocTy getLoc() const { return SMLoc::getFromPointer(TokStart); }
|
2009-01-02 15:01:27 +08:00
|
|
|
lltok::Kind getKind() const { return CurKind; }
|
2010-04-01 12:53:22 +08:00
|
|
|
const std::string &getStrVal() const { return StrVal; }
|
Land the long talked about "type system rewrite" patch. This
patch brings numerous advantages to LLVM. One way to look at it
is through diffstat:
109 files changed, 3005 insertions(+), 5906 deletions(-)
Removing almost 3K lines of code is a good thing. Other advantages
include:
1. Value::getType() is a simple load that can be CSE'd, not a mutating
union-find operation.
2. Types a uniqued and never move once created, defining away PATypeHolder.
3. Structs can be "named" now, and their name is part of the identity that
uniques them. This means that the compiler doesn't merge them structurally
which makes the IR much less confusing.
4. Now that there is no way to get a cycle in a type graph without a named
struct type, "upreferences" go away.
5. Type refinement is completely gone, which should make LTO much MUCH faster
in some common cases with C++ code.
6. Types are now generally immutable, so we can use "Type *" instead
"const Type *" everywhere.
Downsides of this patch are that it removes some functions from the C API,
so people using those will have to upgrade to (not yet added) new API.
"LLVM 3.0" is the right time to do this.
There are still some cleanups pending after this, this patch is large enough
as-is.
llvm-svn: 134829
2011-07-10 01:41:24 +08:00
|
|
|
Type *getTyVal() const { return TyVal; }
|
2009-01-02 15:01:27 +08:00
|
|
|
unsigned getUIntVal() const { return UIntVal; }
|
|
|
|
const APSInt &getAPSIntVal() const { return APSIntVal; }
|
|
|
|
const APFloat &getAPFloatVal() const { return APFloatVal; }
|
|
|
|
|
2018-06-26 21:56:49 +08:00
|
|
|
void setIgnoreColonInIdentifiers(bool val) {
|
|
|
|
IgnoreColonInIdentifiers = val;
|
|
|
|
}
|
2009-01-03 06:46:48 +08:00
|
|
|
|
2018-07-12 10:03:53 +08:00
|
|
|
bool Error(LocTy ErrorLoc, const Twine &Msg) const;
|
2010-09-28 01:42:11 +08:00
|
|
|
bool Error(const Twine &Msg) const { return Error(getLoc(), Msg); }
|
2014-04-06 06:42:53 +08:00
|
|
|
|
|
|
|
void Warning(LocTy WarningLoc, const Twine &Msg) const;
|
|
|
|
void Warning(const Twine &Msg) const { return Warning(getLoc(), Msg); }
|
|
|
|
|
2007-11-18 16:46:26 +08:00
|
|
|
private:
|
2009-01-02 15:01:27 +08:00
|
|
|
lltok::Kind LexToken();
|
|
|
|
|
2007-11-18 16:46:26 +08:00
|
|
|
int getNextChar();
|
|
|
|
void SkipLineComment();
|
2011-06-05 02:16:26 +08:00
|
|
|
lltok::Kind ReadString(lltok::Kind kind);
|
|
|
|
bool ReadVarName();
|
|
|
|
|
2009-01-02 15:01:27 +08:00
|
|
|
lltok::Kind LexIdentifier();
|
|
|
|
lltok::Kind LexDigitOrNegative();
|
|
|
|
lltok::Kind LexPositive();
|
|
|
|
lltok::Kind LexAt();
|
2014-06-28 02:19:56 +08:00
|
|
|
lltok::Kind LexDollar();
|
2009-12-30 12:56:59 +08:00
|
|
|
lltok::Kind LexExclaim();
|
2009-01-02 15:01:27 +08:00
|
|
|
lltok::Kind LexPercent();
|
2018-05-26 10:34:13 +08:00
|
|
|
lltok::Kind LexUIntID(lltok::Kind Token);
|
2014-12-10 08:43:17 +08:00
|
|
|
lltok::Kind LexVar(lltok::Kind Var, lltok::Kind VarID);
|
2009-01-02 15:01:27 +08:00
|
|
|
lltok::Kind LexQuote();
|
|
|
|
lltok::Kind Lex0x();
|
2013-02-06 14:52:58 +08:00
|
|
|
lltok::Kind LexHash();
|
2018-05-26 10:34:13 +08:00
|
|
|
lltok::Kind LexCaret();
|
2009-01-03 06:46:48 +08:00
|
|
|
|
2009-01-02 15:01:27 +08:00
|
|
|
uint64_t atoull(const char *Buffer, const char *End);
|
|
|
|
uint64_t HexIntToVal(const char *Buffer, const char *End);
|
|
|
|
void HexToIntPair(const char *Buffer, const char *End, uint64_t Pair[2]);
|
2018-07-12 10:03:53 +08:00
|
|
|
void FP80HexToIntPair(const char *Buffer, const char *End, uint64_t Pair[2]);
|
2007-11-18 16:46:26 +08:00
|
|
|
};
|
|
|
|
} // end namespace llvm
|
|
|
|
|
|
|
|
#endif
|