123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146 |
- //===- LLLexer.cpp - Lexer for .ll Files ----------------------------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // Implement the Lexer for .ll files.
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/AsmParser/LLLexer.h"
- #include "llvm/ADT/APInt.h"
- #include "llvm/ADT/STLExtras.h"
- #include "llvm/ADT/StringExtras.h"
- #include "llvm/ADT/Twine.h"
- #include "llvm/IR/DerivedTypes.h"
- #include "llvm/IR/Instruction.h"
- #include "llvm/Support/ErrorHandling.h"
- #include "llvm/Support/SourceMgr.h"
- #include <cassert>
- #include <cctype>
- #include <cstdio>
- using namespace llvm;
- bool LLLexer::Error(LocTy ErrorLoc, const Twine &Msg) const {
- ErrorInfo = SM.GetMessage(ErrorLoc, SourceMgr::DK_Error, Msg);
- return true;
- }
- void LLLexer::Warning(LocTy WarningLoc, const Twine &Msg) const {
- SM.PrintMessage(WarningLoc, SourceMgr::DK_Warning, Msg);
- }
- //===----------------------------------------------------------------------===//
- // Helper functions.
- //===----------------------------------------------------------------------===//
- // atoull - Convert an ascii string of decimal digits into the unsigned long
- // long representation... this does not have to do input error checking,
- // because we know that the input will be matched by a suitable regex...
- //
- uint64_t LLLexer::atoull(const char *Buffer, const char *End) {
- uint64_t Result = 0;
- for (; Buffer != End; Buffer++) {
- uint64_t OldRes = Result;
- Result *= 10;
- Result += *Buffer-'0';
- if (Result < OldRes) { // Uh, oh, overflow detected!!!
- Error("constant bigger than 64 bits detected!");
- return 0;
- }
- }
- return Result;
- }
- uint64_t LLLexer::HexIntToVal(const char *Buffer, const char *End) {
- uint64_t Result = 0;
- for (; Buffer != End; ++Buffer) {
- uint64_t OldRes = Result;
- Result *= 16;
- Result += hexDigitValue(*Buffer);
- if (Result < OldRes) { // Uh, oh, overflow detected!!!
- Error("constant bigger than 64 bits detected!");
- return 0;
- }
- }
- return Result;
- }
- void LLLexer::HexToIntPair(const char *Buffer, const char *End,
- uint64_t Pair[2]) {
- Pair[0] = 0;
- if (End - Buffer >= 16) {
- for (int i = 0; i < 16; i++, Buffer++) {
- assert(Buffer != End);
- Pair[0] *= 16;
- Pair[0] += hexDigitValue(*Buffer);
- }
- }
- Pair[1] = 0;
- for (int i = 0; i < 16 && Buffer != End; i++, Buffer++) {
- Pair[1] *= 16;
- Pair[1] += hexDigitValue(*Buffer);
- }
- if (Buffer != End)
- Error("constant bigger than 128 bits detected!");
- }
- /// FP80HexToIntPair - translate an 80 bit FP80 number (20 hexits) into
- /// { low64, high16 } as usual for an APInt.
- void LLLexer::FP80HexToIntPair(const char *Buffer, const char *End,
- uint64_t Pair[2]) {
- Pair[1] = 0;
- for (int i=0; i<4 && Buffer != End; i++, Buffer++) {
- assert(Buffer != End);
- Pair[1] *= 16;
- Pair[1] += hexDigitValue(*Buffer);
- }
- Pair[0] = 0;
- for (int i = 0; i < 16 && Buffer != End; i++, Buffer++) {
- Pair[0] *= 16;
- Pair[0] += hexDigitValue(*Buffer);
- }
- if (Buffer != End)
- Error("constant bigger than 128 bits detected!");
- }
- // UnEscapeLexed - Run through the specified buffer and change \xx codes to the
- // appropriate character.
- static void UnEscapeLexed(std::string &Str) {
- if (Str.empty()) return;
- char *Buffer = &Str[0], *EndBuffer = Buffer+Str.size();
- char *BOut = Buffer;
- for (char *BIn = Buffer; BIn != EndBuffer; ) {
- if (BIn[0] == '\\') {
- if (BIn < EndBuffer-1 && BIn[1] == '\\') {
- *BOut++ = '\\'; // Two \ becomes one
- BIn += 2;
- } else if (BIn < EndBuffer-2 &&
- isxdigit(static_cast<unsigned char>(BIn[1])) &&
- isxdigit(static_cast<unsigned char>(BIn[2]))) {
- *BOut = hexDigitValue(BIn[1]) * 16 + hexDigitValue(BIn[2]);
- BIn += 3; // Skip over handled chars
- ++BOut;
- } else {
- *BOut++ = *BIn++;
- }
- } else {
- *BOut++ = *BIn++;
- }
- }
- Str.resize(BOut-Buffer);
- }
- /// isLabelChar - Return true for [-a-zA-Z$._0-9].
- static bool isLabelChar(char C) {
- return isalnum(static_cast<unsigned char>(C)) || C == '-' || C == '$' ||
- C == '.' || C == '_';
- }
- /// isLabelTail - Return true if this pointer points to a valid end of a label.
- static const char *isLabelTail(const char *CurPtr) {
- while (true) {
- if (CurPtr[0] == ':') return CurPtr+1;
- if (!isLabelChar(CurPtr[0])) return nullptr;
- ++CurPtr;
- }
- }
- //===----------------------------------------------------------------------===//
- // Lexer definition.
- //===----------------------------------------------------------------------===//
- LLLexer::LLLexer(StringRef StartBuf, SourceMgr &SM, SMDiagnostic &Err,
- LLVMContext &C)
- : CurBuf(StartBuf), ErrorInfo(Err), SM(SM), Context(C), APFloatVal(0.0),
- IgnoreColonInIdentifiers(false) {
- CurPtr = CurBuf.begin();
- }
- int LLLexer::getNextChar() {
- char CurChar = *CurPtr++;
- switch (CurChar) {
- default: return (unsigned char)CurChar;
- case 0:
- // A nul character in the stream is either the end of the current buffer or
- // a random nul in the file. Disambiguate that here.
- if (CurPtr-1 != CurBuf.end())
- return 0; // Just whitespace.
- // Otherwise, return end of file.
- --CurPtr; // Another call to lex will return EOF again.
- return EOF;
- }
- }
- lltok::Kind LLLexer::LexToken() {
- while (true) {
- TokStart = CurPtr;
- int CurChar = getNextChar();
- switch (CurChar) {
- default:
- // Handle letters: [a-zA-Z_]
- if (isalpha(static_cast<unsigned char>(CurChar)) || CurChar == '_')
- return LexIdentifier();
- return lltok::Error;
- case EOF: return lltok::Eof;
- case 0:
- case ' ':
- case '\t':
- case '\n':
- case '\r':
- // Ignore whitespace.
- continue;
- case '+': return LexPositive();
- case '@': return LexAt();
- case '$': return LexDollar();
- case '%': return LexPercent();
- case '"': return LexQuote();
- case '.':
- if (const char *Ptr = isLabelTail(CurPtr)) {
- CurPtr = Ptr;
- StrVal.assign(TokStart, CurPtr-1);
- return lltok::LabelStr;
- }
- if (CurPtr[0] == '.' && CurPtr[1] == '.') {
- CurPtr += 2;
- return lltok::dotdotdot;
- }
- return lltok::Error;
- case ';':
- SkipLineComment();
- continue;
- case '!': return LexExclaim();
- case '^':
- return LexCaret();
- case ':':
- return lltok::colon;
- case '#': return LexHash();
- case '0': case '1': case '2': case '3': case '4':
- case '5': case '6': case '7': case '8': case '9':
- case '-':
- return LexDigitOrNegative();
- case '=': return lltok::equal;
- case '[': return lltok::lsquare;
- case ']': return lltok::rsquare;
- case '{': return lltok::lbrace;
- case '}': return lltok::rbrace;
- case '<': return lltok::less;
- case '>': return lltok::greater;
- case '(': return lltok::lparen;
- case ')': return lltok::rparen;
- case ',': return lltok::comma;
- case '*': return lltok::star;
- case '|': return lltok::bar;
- }
- }
- }
- void LLLexer::SkipLineComment() {
- while (true) {
- if (CurPtr[0] == '\n' || CurPtr[0] == '\r' || getNextChar() == EOF)
- return;
- }
- }
- /// Lex all tokens that start with an @ character.
- /// GlobalVar @\"[^\"]*\"
- /// GlobalVar @[-a-zA-Z$._][-a-zA-Z$._0-9]*
- /// GlobalVarID @[0-9]+
- lltok::Kind LLLexer::LexAt() {
- return LexVar(lltok::GlobalVar, lltok::GlobalID);
- }
- lltok::Kind LLLexer::LexDollar() {
- if (const char *Ptr = isLabelTail(TokStart)) {
- CurPtr = Ptr;
- StrVal.assign(TokStart, CurPtr - 1);
- return lltok::LabelStr;
- }
- // Handle DollarStringConstant: $\"[^\"]*\"
- if (CurPtr[0] == '"') {
- ++CurPtr;
- while (true) {
- int CurChar = getNextChar();
- if (CurChar == EOF) {
- Error("end of file in COMDAT variable name");
- return lltok::Error;
- }
- if (CurChar == '"') {
- StrVal.assign(TokStart + 2, CurPtr - 1);
- UnEscapeLexed(StrVal);
- if (StringRef(StrVal).find_first_of(0) != StringRef::npos) {
- Error("Null bytes are not allowed in names");
- return lltok::Error;
- }
- return lltok::ComdatVar;
- }
- }
- }
- // Handle ComdatVarName: $[-a-zA-Z$._][-a-zA-Z$._0-9]*
- if (ReadVarName())
- return lltok::ComdatVar;
- return lltok::Error;
- }
- /// ReadString - Read a string until the closing quote.
- lltok::Kind LLLexer::ReadString(lltok::Kind kind) {
- const char *Start = CurPtr;
- while (true) {
- int CurChar = getNextChar();
- if (CurChar == EOF) {
- Error("end of file in string constant");
- return lltok::Error;
- }
- if (CurChar == '"') {
- StrVal.assign(Start, CurPtr-1);
- UnEscapeLexed(StrVal);
- return kind;
- }
- }
- }
- /// ReadVarName - Read the rest of a token containing a variable name.
- bool LLLexer::ReadVarName() {
- const char *NameStart = CurPtr;
- if (isalpha(static_cast<unsigned char>(CurPtr[0])) ||
- CurPtr[0] == '-' || CurPtr[0] == '$' ||
- CurPtr[0] == '.' || CurPtr[0] == '_') {
- ++CurPtr;
- while (isalnum(static_cast<unsigned char>(CurPtr[0])) ||
- CurPtr[0] == '-' || CurPtr[0] == '$' ||
- CurPtr[0] == '.' || CurPtr[0] == '_')
- ++CurPtr;
- StrVal.assign(NameStart, CurPtr);
- return true;
- }
- return false;
- }
- // Lex an ID: [0-9]+. On success, the ID is stored in UIntVal and Token is
- // returned, otherwise the Error token is returned.
- lltok::Kind LLLexer::LexUIntID(lltok::Kind Token) {
- if (!isdigit(static_cast<unsigned char>(CurPtr[0])))
- return lltok::Error;
- for (++CurPtr; isdigit(static_cast<unsigned char>(CurPtr[0])); ++CurPtr)
- /*empty*/;
- uint64_t Val = atoull(TokStart + 1, CurPtr);
- if ((unsigned)Val != Val)
- Error("invalid value number (too large)!");
- UIntVal = unsigned(Val);
- return Token;
- }
- lltok::Kind LLLexer::LexVar(lltok::Kind Var, lltok::Kind VarID) {
- // Handle StringConstant: \"[^\"]*\"
- if (CurPtr[0] == '"') {
- ++CurPtr;
- while (true) {
- int CurChar = getNextChar();
- if (CurChar == EOF) {
- Error("end of file in global variable name");
- return lltok::Error;
- }
- if (CurChar == '"') {
- StrVal.assign(TokStart+2, CurPtr-1);
- UnEscapeLexed(StrVal);
- if (StringRef(StrVal).find_first_of(0) != StringRef::npos) {
- Error("Null bytes are not allowed in names");
- return lltok::Error;
- }
- return Var;
- }
- }
- }
- // Handle VarName: [-a-zA-Z$._][-a-zA-Z$._0-9]*
- if (ReadVarName())
- return Var;
- // Handle VarID: [0-9]+
- return LexUIntID(VarID);
- }
- /// Lex all tokens that start with a % character.
- /// LocalVar ::= %\"[^\"]*\"
- /// LocalVar ::= %[-a-zA-Z$._][-a-zA-Z$._0-9]*
- /// LocalVarID ::= %[0-9]+
- lltok::Kind LLLexer::LexPercent() {
- return LexVar(lltok::LocalVar, lltok::LocalVarID);
- }
- /// Lex all tokens that start with a " character.
- /// QuoteLabel "[^"]+":
- /// StringConstant "[^"]*"
- lltok::Kind LLLexer::LexQuote() {
- lltok::Kind kind = ReadString(lltok::StringConstant);
- if (kind == lltok::Error || kind == lltok::Eof)
- return kind;
- if (CurPtr[0] == ':') {
- ++CurPtr;
- if (StringRef(StrVal).find_first_of(0) != StringRef::npos) {
- Error("Null bytes are not allowed in names");
- kind = lltok::Error;
- } else {
- kind = lltok::LabelStr;
- }
- }
- return kind;
- }
- /// Lex all tokens that start with a ! character.
- /// !foo
- /// !
- lltok::Kind LLLexer::LexExclaim() {
- // Lex a metadata name as a MetadataVar.
- if (isalpha(static_cast<unsigned char>(CurPtr[0])) ||
- CurPtr[0] == '-' || CurPtr[0] == '$' ||
- CurPtr[0] == '.' || CurPtr[0] == '_' || CurPtr[0] == '\\') {
- ++CurPtr;
- while (isalnum(static_cast<unsigned char>(CurPtr[0])) ||
- CurPtr[0] == '-' || CurPtr[0] == '$' ||
- CurPtr[0] == '.' || CurPtr[0] == '_' || CurPtr[0] == '\\')
- ++CurPtr;
- StrVal.assign(TokStart+1, CurPtr); // Skip !
- UnEscapeLexed(StrVal);
- return lltok::MetadataVar;
- }
- return lltok::exclaim;
- }
- /// Lex all tokens that start with a ^ character.
- /// SummaryID ::= ^[0-9]+
- lltok::Kind LLLexer::LexCaret() {
- // Handle SummaryID: ^[0-9]+
- return LexUIntID(lltok::SummaryID);
- }
- /// Lex all tokens that start with a # character.
- /// AttrGrpID ::= #[0-9]+
- lltok::Kind LLLexer::LexHash() {
- // Handle AttrGrpID: #[0-9]+
- return LexUIntID(lltok::AttrGrpID);
- }
- /// Lex a label, integer type, keyword, or hexadecimal integer constant.
- /// Label [-a-zA-Z$._0-9]+:
- /// IntegerType i[0-9]+
- /// Keyword sdiv, float, ...
- /// HexIntConstant [us]0x[0-9A-Fa-f]+
- lltok::Kind LLLexer::LexIdentifier() {
- const char *StartChar = CurPtr;
- const char *IntEnd = CurPtr[-1] == 'i' ? nullptr : StartChar;
- const char *KeywordEnd = nullptr;
- for (; isLabelChar(*CurPtr); ++CurPtr) {
- // If we decide this is an integer, remember the end of the sequence.
- if (!IntEnd && !isdigit(static_cast<unsigned char>(*CurPtr)))
- IntEnd = CurPtr;
- if (!KeywordEnd && !isalnum(static_cast<unsigned char>(*CurPtr)) &&
- *CurPtr != '_')
- KeywordEnd = CurPtr;
- }
- // If we stopped due to a colon, unless we were directed to ignore it,
- // this really is a label.
- if (!IgnoreColonInIdentifiers && *CurPtr == ':') {
- StrVal.assign(StartChar-1, CurPtr++);
- return lltok::LabelStr;
- }
- // Otherwise, this wasn't a label. If this was valid as an integer type,
- // return it.
- if (!IntEnd) IntEnd = CurPtr;
- if (IntEnd != StartChar) {
- CurPtr = IntEnd;
- uint64_t NumBits = atoull(StartChar, CurPtr);
- if (NumBits < IntegerType::MIN_INT_BITS ||
- NumBits > IntegerType::MAX_INT_BITS) {
- Error("bitwidth for integer type out of range!");
- return lltok::Error;
- }
- TyVal = IntegerType::get(Context, NumBits);
- return lltok::Type;
- }
- // Otherwise, this was a letter sequence. See which keyword this is.
- if (!KeywordEnd) KeywordEnd = CurPtr;
- CurPtr = KeywordEnd;
- --StartChar;
- StringRef Keyword(StartChar, CurPtr - StartChar);
- #define KEYWORD(STR) \
- do { \
- if (Keyword == #STR) \
- return lltok::kw_##STR; \
- } while (false)
- KEYWORD(true); KEYWORD(false);
- KEYWORD(declare); KEYWORD(define);
- KEYWORD(global); KEYWORD(constant);
- KEYWORD(dso_local);
- KEYWORD(dso_preemptable);
- KEYWORD(private);
- KEYWORD(internal);
- KEYWORD(available_externally);
- KEYWORD(linkonce);
- KEYWORD(linkonce_odr);
- KEYWORD(weak); // Use as a linkage, and a modifier for "cmpxchg".
- KEYWORD(weak_odr);
- KEYWORD(appending);
- KEYWORD(dllimport);
- KEYWORD(dllexport);
- KEYWORD(common);
- KEYWORD(default);
- KEYWORD(hidden);
- KEYWORD(protected);
- KEYWORD(unnamed_addr);
- KEYWORD(local_unnamed_addr);
- KEYWORD(externally_initialized);
- KEYWORD(extern_weak);
- KEYWORD(external);
- KEYWORD(thread_local);
- KEYWORD(localdynamic);
- KEYWORD(initialexec);
- KEYWORD(localexec);
- KEYWORD(zeroinitializer);
- KEYWORD(undef);
- KEYWORD(null);
- KEYWORD(none);
- KEYWORD(poison);
- KEYWORD(to);
- KEYWORD(caller);
- KEYWORD(within);
- KEYWORD(from);
- KEYWORD(tail);
- KEYWORD(musttail);
- KEYWORD(notail);
- KEYWORD(target);
- KEYWORD(triple);
- KEYWORD(source_filename);
- KEYWORD(unwind);
- KEYWORD(datalayout);
- KEYWORD(volatile);
- KEYWORD(atomic);
- KEYWORD(unordered);
- KEYWORD(monotonic);
- KEYWORD(acquire);
- KEYWORD(release);
- KEYWORD(acq_rel);
- KEYWORD(seq_cst);
- KEYWORD(syncscope);
- KEYWORD(nnan);
- KEYWORD(ninf);
- KEYWORD(nsz);
- KEYWORD(arcp);
- KEYWORD(contract);
- KEYWORD(reassoc);
- KEYWORD(afn);
- KEYWORD(fast);
- KEYWORD(nuw);
- KEYWORD(nsw);
- KEYWORD(exact);
- KEYWORD(inbounds);
- KEYWORD(inrange);
- KEYWORD(addrspace);
- KEYWORD(section);
- KEYWORD(partition);
- KEYWORD(alias);
- KEYWORD(ifunc);
- KEYWORD(module);
- KEYWORD(asm);
- KEYWORD(sideeffect);
- KEYWORD(inteldialect);
- KEYWORD(gc);
- KEYWORD(prefix);
- KEYWORD(prologue);
- KEYWORD(no_sanitize_address);
- KEYWORD(no_sanitize_hwaddress);
- KEYWORD(sanitize_address_dyninit);
- KEYWORD(ccc);
- KEYWORD(fastcc);
- KEYWORD(coldcc);
- KEYWORD(cfguard_checkcc);
- KEYWORD(x86_stdcallcc);
- KEYWORD(x86_fastcallcc);
- KEYWORD(x86_thiscallcc);
- KEYWORD(x86_vectorcallcc);
- KEYWORD(arm_apcscc);
- KEYWORD(arm_aapcscc);
- KEYWORD(arm_aapcs_vfpcc);
- KEYWORD(aarch64_vector_pcs);
- KEYWORD(aarch64_sve_vector_pcs);
- KEYWORD(aarch64_sme_preservemost_from_x0);
- KEYWORD(aarch64_sme_preservemost_from_x2);
- KEYWORD(msp430_intrcc);
- KEYWORD(avr_intrcc);
- KEYWORD(avr_signalcc);
- KEYWORD(ptx_kernel);
- KEYWORD(ptx_device);
- KEYWORD(spir_kernel);
- KEYWORD(spir_func);
- KEYWORD(intel_ocl_bicc);
- KEYWORD(x86_64_sysvcc);
- KEYWORD(win64cc);
- KEYWORD(x86_regcallcc);
- KEYWORD(webkit_jscc);
- KEYWORD(swiftcc);
- KEYWORD(swifttailcc);
- KEYWORD(anyregcc);
- KEYWORD(preserve_mostcc);
- KEYWORD(preserve_allcc);
- KEYWORD(ghccc);
- KEYWORD(x86_intrcc);
- KEYWORD(hhvmcc);
- KEYWORD(hhvm_ccc);
- KEYWORD(cxx_fast_tlscc);
- KEYWORD(amdgpu_vs);
- KEYWORD(amdgpu_ls);
- KEYWORD(amdgpu_hs);
- KEYWORD(amdgpu_es);
- KEYWORD(amdgpu_gs);
- KEYWORD(amdgpu_ps);
- KEYWORD(amdgpu_cs);
- KEYWORD(amdgpu_kernel);
- KEYWORD(amdgpu_gfx);
- KEYWORD(tailcc);
- KEYWORD(cc);
- KEYWORD(c);
- KEYWORD(attributes);
- KEYWORD(sync);
- KEYWORD(async);
- #define GET_ATTR_NAMES
- #define ATTRIBUTE_ENUM(ENUM_NAME, DISPLAY_NAME) \
- KEYWORD(DISPLAY_NAME);
- #include "llvm/IR/Attributes.inc"
- KEYWORD(read);
- KEYWORD(write);
- KEYWORD(readwrite);
- KEYWORD(argmem);
- KEYWORD(inaccessiblemem);
- KEYWORD(argmemonly);
- KEYWORD(inaccessiblememonly);
- KEYWORD(inaccessiblemem_or_argmemonly);
- KEYWORD(type);
- KEYWORD(opaque);
- KEYWORD(comdat);
- // Comdat types
- KEYWORD(any);
- KEYWORD(exactmatch);
- KEYWORD(largest);
- KEYWORD(nodeduplicate);
- KEYWORD(samesize);
- KEYWORD(eq); KEYWORD(ne); KEYWORD(slt); KEYWORD(sgt); KEYWORD(sle);
- KEYWORD(sge); KEYWORD(ult); KEYWORD(ugt); KEYWORD(ule); KEYWORD(uge);
- KEYWORD(oeq); KEYWORD(one); KEYWORD(olt); KEYWORD(ogt); KEYWORD(ole);
- KEYWORD(oge); KEYWORD(ord); KEYWORD(uno); KEYWORD(ueq); KEYWORD(une);
- KEYWORD(xchg); KEYWORD(nand); KEYWORD(max); KEYWORD(min); KEYWORD(umax);
- KEYWORD(umin); KEYWORD(fmax); KEYWORD(fmin);
- KEYWORD(uinc_wrap);
- KEYWORD(udec_wrap);
- KEYWORD(vscale);
- KEYWORD(x);
- KEYWORD(blockaddress);
- KEYWORD(dso_local_equivalent);
- KEYWORD(no_cfi);
- // Metadata types.
- KEYWORD(distinct);
- // Use-list order directives.
- KEYWORD(uselistorder);
- KEYWORD(uselistorder_bb);
- KEYWORD(personality);
- KEYWORD(cleanup);
- KEYWORD(catch);
- KEYWORD(filter);
- // Summary index keywords.
- KEYWORD(path);
- KEYWORD(hash);
- KEYWORD(gv);
- KEYWORD(guid);
- KEYWORD(name);
- KEYWORD(summaries);
- KEYWORD(flags);
- KEYWORD(blockcount);
- KEYWORD(linkage);
- KEYWORD(visibility);
- KEYWORD(notEligibleToImport);
- KEYWORD(live);
- KEYWORD(dsoLocal);
- KEYWORD(canAutoHide);
- KEYWORD(function);
- KEYWORD(insts);
- KEYWORD(funcFlags);
- KEYWORD(readNone);
- KEYWORD(readOnly);
- KEYWORD(noRecurse);
- KEYWORD(returnDoesNotAlias);
- KEYWORD(noInline);
- KEYWORD(alwaysInline);
- KEYWORD(noUnwind);
- KEYWORD(mayThrow);
- KEYWORD(hasUnknownCall);
- KEYWORD(mustBeUnreachable);
- KEYWORD(calls);
- KEYWORD(callee);
- KEYWORD(params);
- KEYWORD(param);
- KEYWORD(hotness);
- KEYWORD(unknown);
- KEYWORD(critical);
- KEYWORD(relbf);
- KEYWORD(variable);
- KEYWORD(vTableFuncs);
- KEYWORD(virtFunc);
- KEYWORD(aliasee);
- KEYWORD(refs);
- KEYWORD(typeIdInfo);
- KEYWORD(typeTests);
- KEYWORD(typeTestAssumeVCalls);
- KEYWORD(typeCheckedLoadVCalls);
- KEYWORD(typeTestAssumeConstVCalls);
- KEYWORD(typeCheckedLoadConstVCalls);
- KEYWORD(vFuncId);
- KEYWORD(offset);
- KEYWORD(args);
- KEYWORD(typeid);
- KEYWORD(typeidCompatibleVTable);
- KEYWORD(summary);
- KEYWORD(typeTestRes);
- KEYWORD(kind);
- KEYWORD(unsat);
- KEYWORD(byteArray);
- KEYWORD(inline);
- KEYWORD(single);
- KEYWORD(allOnes);
- KEYWORD(sizeM1BitWidth);
- KEYWORD(alignLog2);
- KEYWORD(sizeM1);
- KEYWORD(bitMask);
- KEYWORD(inlineBits);
- KEYWORD(vcall_visibility);
- KEYWORD(wpdResolutions);
- KEYWORD(wpdRes);
- KEYWORD(indir);
- KEYWORD(singleImpl);
- KEYWORD(branchFunnel);
- KEYWORD(singleImplName);
- KEYWORD(resByArg);
- KEYWORD(byArg);
- KEYWORD(uniformRetVal);
- KEYWORD(uniqueRetVal);
- KEYWORD(virtualConstProp);
- KEYWORD(info);
- KEYWORD(byte);
- KEYWORD(bit);
- KEYWORD(varFlags);
- KEYWORD(callsites);
- KEYWORD(clones);
- KEYWORD(stackIds);
- KEYWORD(allocs);
- KEYWORD(versions);
- KEYWORD(memProf);
- KEYWORD(notcold);
- KEYWORD(notcoldandcold);
- #undef KEYWORD
- // Keywords for types.
- #define TYPEKEYWORD(STR, LLVMTY) \
- do { \
- if (Keyword == STR) { \
- TyVal = LLVMTY; \
- return lltok::Type; \
- } \
- } while (false)
- TYPEKEYWORD("void", Type::getVoidTy(Context));
- TYPEKEYWORD("half", Type::getHalfTy(Context));
- TYPEKEYWORD("bfloat", Type::getBFloatTy(Context));
- TYPEKEYWORD("float", Type::getFloatTy(Context));
- TYPEKEYWORD("double", Type::getDoubleTy(Context));
- TYPEKEYWORD("x86_fp80", Type::getX86_FP80Ty(Context));
- TYPEKEYWORD("fp128", Type::getFP128Ty(Context));
- TYPEKEYWORD("ppc_fp128", Type::getPPC_FP128Ty(Context));
- TYPEKEYWORD("label", Type::getLabelTy(Context));
- TYPEKEYWORD("metadata", Type::getMetadataTy(Context));
- TYPEKEYWORD("x86_mmx", Type::getX86_MMXTy(Context));
- TYPEKEYWORD("x86_amx", Type::getX86_AMXTy(Context));
- TYPEKEYWORD("token", Type::getTokenTy(Context));
- if (Keyword == "ptr") {
- if (Context.supportsTypedPointers()) {
- Warning("ptr type is only supported in -opaque-pointers mode");
- return lltok::Error;
- }
- TyVal = PointerType::getUnqual(Context);
- return lltok::Type;
- }
- #undef TYPEKEYWORD
- // Keywords for instructions.
- #define INSTKEYWORD(STR, Enum) \
- do { \
- if (Keyword == #STR) { \
- UIntVal = Instruction::Enum; \
- return lltok::kw_##STR; \
- } \
- } while (false)
- INSTKEYWORD(fneg, FNeg);
- INSTKEYWORD(add, Add); INSTKEYWORD(fadd, FAdd);
- INSTKEYWORD(sub, Sub); INSTKEYWORD(fsub, FSub);
- INSTKEYWORD(mul, Mul); INSTKEYWORD(fmul, FMul);
- INSTKEYWORD(udiv, UDiv); INSTKEYWORD(sdiv, SDiv); INSTKEYWORD(fdiv, FDiv);
- INSTKEYWORD(urem, URem); INSTKEYWORD(srem, SRem); INSTKEYWORD(frem, FRem);
- INSTKEYWORD(shl, Shl); INSTKEYWORD(lshr, LShr); INSTKEYWORD(ashr, AShr);
- INSTKEYWORD(and, And); INSTKEYWORD(or, Or); INSTKEYWORD(xor, Xor);
- INSTKEYWORD(icmp, ICmp); INSTKEYWORD(fcmp, FCmp);
- INSTKEYWORD(phi, PHI);
- INSTKEYWORD(call, Call);
- INSTKEYWORD(trunc, Trunc);
- INSTKEYWORD(zext, ZExt);
- INSTKEYWORD(sext, SExt);
- INSTKEYWORD(fptrunc, FPTrunc);
- INSTKEYWORD(fpext, FPExt);
- INSTKEYWORD(uitofp, UIToFP);
- INSTKEYWORD(sitofp, SIToFP);
- INSTKEYWORD(fptoui, FPToUI);
- INSTKEYWORD(fptosi, FPToSI);
- INSTKEYWORD(inttoptr, IntToPtr);
- INSTKEYWORD(ptrtoint, PtrToInt);
- INSTKEYWORD(bitcast, BitCast);
- INSTKEYWORD(addrspacecast, AddrSpaceCast);
- INSTKEYWORD(select, Select);
- INSTKEYWORD(va_arg, VAArg);
- INSTKEYWORD(ret, Ret);
- INSTKEYWORD(br, Br);
- INSTKEYWORD(switch, Switch);
- INSTKEYWORD(indirectbr, IndirectBr);
- INSTKEYWORD(invoke, Invoke);
- INSTKEYWORD(resume, Resume);
- INSTKEYWORD(unreachable, Unreachable);
- INSTKEYWORD(callbr, CallBr);
- INSTKEYWORD(alloca, Alloca);
- INSTKEYWORD(load, Load);
- INSTKEYWORD(store, Store);
- INSTKEYWORD(cmpxchg, AtomicCmpXchg);
- INSTKEYWORD(atomicrmw, AtomicRMW);
- INSTKEYWORD(fence, Fence);
- INSTKEYWORD(getelementptr, GetElementPtr);
- INSTKEYWORD(extractelement, ExtractElement);
- INSTKEYWORD(insertelement, InsertElement);
- INSTKEYWORD(shufflevector, ShuffleVector);
- INSTKEYWORD(extractvalue, ExtractValue);
- INSTKEYWORD(insertvalue, InsertValue);
- INSTKEYWORD(landingpad, LandingPad);
- INSTKEYWORD(cleanupret, CleanupRet);
- INSTKEYWORD(catchret, CatchRet);
- INSTKEYWORD(catchswitch, CatchSwitch);
- INSTKEYWORD(catchpad, CatchPad);
- INSTKEYWORD(cleanuppad, CleanupPad);
- INSTKEYWORD(freeze, Freeze);
- #undef INSTKEYWORD
- #define DWKEYWORD(TYPE, TOKEN) \
- do { \
- if (Keyword.startswith("DW_" #TYPE "_")) { \
- StrVal.assign(Keyword.begin(), Keyword.end()); \
- return lltok::TOKEN; \
- } \
- } while (false)
- DWKEYWORD(TAG, DwarfTag);
- DWKEYWORD(ATE, DwarfAttEncoding);
- DWKEYWORD(VIRTUALITY, DwarfVirtuality);
- DWKEYWORD(LANG, DwarfLang);
- DWKEYWORD(CC, DwarfCC);
- DWKEYWORD(OP, DwarfOp);
- DWKEYWORD(MACINFO, DwarfMacinfo);
- #undef DWKEYWORD
- if (Keyword.startswith("DIFlag")) {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::DIFlag;
- }
- if (Keyword.startswith("DISPFlag")) {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::DISPFlag;
- }
- if (Keyword.startswith("CSK_")) {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::ChecksumKind;
- }
- if (Keyword == "NoDebug" || Keyword == "FullDebug" ||
- Keyword == "LineTablesOnly" || Keyword == "DebugDirectivesOnly") {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::EmissionKind;
- }
- if (Keyword == "GNU" || Keyword == "None" || Keyword == "Default") {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::NameTableKind;
- }
- // Check for [us]0x[0-9A-Fa-f]+ which are Hexadecimal constant generated by
- // the CFE to avoid forcing it to deal with 64-bit numbers.
- if ((TokStart[0] == 'u' || TokStart[0] == 's') &&
- TokStart[1] == '0' && TokStart[2] == 'x' &&
- isxdigit(static_cast<unsigned char>(TokStart[3]))) {
- int len = CurPtr-TokStart-3;
- uint32_t bits = len * 4;
- StringRef HexStr(TokStart + 3, len);
- if (!all_of(HexStr, isxdigit)) {
- // Bad token, return it as an error.
- CurPtr = TokStart+3;
- return lltok::Error;
- }
- APInt Tmp(bits, HexStr, 16);
- uint32_t activeBits = Tmp.getActiveBits();
- if (activeBits > 0 && activeBits < bits)
- Tmp = Tmp.trunc(activeBits);
- APSIntVal = APSInt(Tmp, TokStart[0] == 'u');
- return lltok::APSInt;
- }
- // If this is "cc1234", return this as just "cc".
- if (TokStart[0] == 'c' && TokStart[1] == 'c') {
- CurPtr = TokStart+2;
- return lltok::kw_cc;
- }
- // Finally, if this isn't known, return an error.
- CurPtr = TokStart+1;
- return lltok::Error;
- }
- /// Lex all tokens that start with a 0x prefix, knowing they match and are not
- /// labels.
- /// HexFPConstant 0x[0-9A-Fa-f]+
- /// HexFP80Constant 0xK[0-9A-Fa-f]+
- /// HexFP128Constant 0xL[0-9A-Fa-f]+
- /// HexPPC128Constant 0xM[0-9A-Fa-f]+
- /// HexHalfConstant 0xH[0-9A-Fa-f]+
- /// HexBFloatConstant 0xR[0-9A-Fa-f]+
- lltok::Kind LLLexer::Lex0x() {
- CurPtr = TokStart + 2;
- char Kind;
- if ((CurPtr[0] >= 'K' && CurPtr[0] <= 'M') || CurPtr[0] == 'H' ||
- CurPtr[0] == 'R') {
- Kind = *CurPtr++;
- } else {
- Kind = 'J';
- }
- if (!isxdigit(static_cast<unsigned char>(CurPtr[0]))) {
- // Bad token, return it as an error.
- CurPtr = TokStart+1;
- return lltok::Error;
- }
- while (isxdigit(static_cast<unsigned char>(CurPtr[0])))
- ++CurPtr;
- if (Kind == 'J') {
- // HexFPConstant - Floating point constant represented in IEEE format as a
- // hexadecimal number for when exponential notation is not precise enough.
- // Half, BFloat, Float, and double only.
- APFloatVal = APFloat(APFloat::IEEEdouble(),
- APInt(64, HexIntToVal(TokStart + 2, CurPtr)));
- return lltok::APFloat;
- }
- uint64_t Pair[2];
- switch (Kind) {
- default: llvm_unreachable("Unknown kind!");
- case 'K':
- // F80HexFPConstant - x87 long double in hexadecimal format (10 bytes)
- FP80HexToIntPair(TokStart+3, CurPtr, Pair);
- APFloatVal = APFloat(APFloat::x87DoubleExtended(), APInt(80, Pair));
- return lltok::APFloat;
- case 'L':
- // F128HexFPConstant - IEEE 128-bit in hexadecimal format (16 bytes)
- HexToIntPair(TokStart+3, CurPtr, Pair);
- APFloatVal = APFloat(APFloat::IEEEquad(), APInt(128, Pair));
- return lltok::APFloat;
- case 'M':
- // PPC128HexFPConstant - PowerPC 128-bit in hexadecimal format (16 bytes)
- HexToIntPair(TokStart+3, CurPtr, Pair);
- APFloatVal = APFloat(APFloat::PPCDoubleDouble(), APInt(128, Pair));
- return lltok::APFloat;
- case 'H':
- APFloatVal = APFloat(APFloat::IEEEhalf(),
- APInt(16,HexIntToVal(TokStart+3, CurPtr)));
- return lltok::APFloat;
- case 'R':
- // Brain floating point
- APFloatVal = APFloat(APFloat::BFloat(),
- APInt(16, HexIntToVal(TokStart + 3, CurPtr)));
- return lltok::APFloat;
- }
- }
- /// Lex tokens for a label or a numeric constant, possibly starting with -.
- /// Label [-a-zA-Z$._0-9]+:
- /// NInteger -[0-9]+
- /// FPConstant [-+]?[0-9]+[.][0-9]*([eE][-+]?[0-9]+)?
- /// PInteger [0-9]+
- /// HexFPConstant 0x[0-9A-Fa-f]+
- /// HexFP80Constant 0xK[0-9A-Fa-f]+
- /// HexFP128Constant 0xL[0-9A-Fa-f]+
- /// HexPPC128Constant 0xM[0-9A-Fa-f]+
- lltok::Kind LLLexer::LexDigitOrNegative() {
- // If the letter after the negative is not a number, this is probably a label.
- if (!isdigit(static_cast<unsigned char>(TokStart[0])) &&
- !isdigit(static_cast<unsigned char>(CurPtr[0]))) {
- // Okay, this is not a number after the -, it's probably a label.
- if (const char *End = isLabelTail(CurPtr)) {
- StrVal.assign(TokStart, End-1);
- CurPtr = End;
- return lltok::LabelStr;
- }
- return lltok::Error;
- }
- // At this point, it is either a label, int or fp constant.
- // Skip digits, we have at least one.
- for (; isdigit(static_cast<unsigned char>(CurPtr[0])); ++CurPtr)
- /*empty*/;
- // Check if this is a fully-numeric label:
- if (isdigit(TokStart[0]) && CurPtr[0] == ':') {
- uint64_t Val = atoull(TokStart, CurPtr);
- ++CurPtr; // Skip the colon.
- if ((unsigned)Val != Val)
- Error("invalid value number (too large)!");
- UIntVal = unsigned(Val);
- return lltok::LabelID;
- }
- // Check to see if this really is a string label, e.g. "-1:".
- if (isLabelChar(CurPtr[0]) || CurPtr[0] == ':') {
- if (const char *End = isLabelTail(CurPtr)) {
- StrVal.assign(TokStart, End-1);
- CurPtr = End;
- return lltok::LabelStr;
- }
- }
- // If the next character is a '.', then it is a fp value, otherwise its
- // integer.
- if (CurPtr[0] != '.') {
- if (TokStart[0] == '0' && TokStart[1] == 'x')
- return Lex0x();
- APSIntVal = APSInt(StringRef(TokStart, CurPtr - TokStart));
- return lltok::APSInt;
- }
- ++CurPtr;
- // Skip over [0-9]*([eE][-+]?[0-9]+)?
- while (isdigit(static_cast<unsigned char>(CurPtr[0]))) ++CurPtr;
- if (CurPtr[0] == 'e' || CurPtr[0] == 'E') {
- if (isdigit(static_cast<unsigned char>(CurPtr[1])) ||
- ((CurPtr[1] == '-' || CurPtr[1] == '+') &&
- isdigit(static_cast<unsigned char>(CurPtr[2])))) {
- CurPtr += 2;
- while (isdigit(static_cast<unsigned char>(CurPtr[0]))) ++CurPtr;
- }
- }
- APFloatVal = APFloat(APFloat::IEEEdouble(),
- StringRef(TokStart, CurPtr - TokStart));
- return lltok::APFloat;
- }
- /// Lex a floating point constant starting with +.
- /// FPConstant [-+]?[0-9]+[.][0-9]*([eE][-+]?[0-9]+)?
- lltok::Kind LLLexer::LexPositive() {
- // If the letter after the negative is a number, this is probably not a
- // label.
- if (!isdigit(static_cast<unsigned char>(CurPtr[0])))
- return lltok::Error;
- // Skip digits.
- for (++CurPtr; isdigit(static_cast<unsigned char>(CurPtr[0])); ++CurPtr)
- /*empty*/;
- // At this point, we need a '.'.
- if (CurPtr[0] != '.') {
- CurPtr = TokStart+1;
- return lltok::Error;
- }
- ++CurPtr;
- // Skip over [0-9]*([eE][-+]?[0-9]+)?
- while (isdigit(static_cast<unsigned char>(CurPtr[0]))) ++CurPtr;
- if (CurPtr[0] == 'e' || CurPtr[0] == 'E') {
- if (isdigit(static_cast<unsigned char>(CurPtr[1])) ||
- ((CurPtr[1] == '-' || CurPtr[1] == '+') &&
- isdigit(static_cast<unsigned char>(CurPtr[2])))) {
- CurPtr += 2;
- while (isdigit(static_cast<unsigned char>(CurPtr[0]))) ++CurPtr;
- }
- }
- APFloatVal = APFloat(APFloat::IEEEdouble(),
- StringRef(TokStart, CurPtr - TokStart));
- return lltok::APFloat;
- }
|