12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193 |
- //===- LLLexer.cpp - Lexer for .ll Files ----------------------------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // Implement the Lexer for .ll files.
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/AsmParser/LLLexer.h"
- #include "llvm/ADT/APInt.h"
- #include "llvm/ADT/STLExtras.h"
- #include "llvm/ADT/StringExtras.h"
- #include "llvm/ADT/Twine.h"
- #include "llvm/IR/DerivedTypes.h"
- #include "llvm/IR/Instruction.h"
- #include "llvm/Support/ErrorHandling.h"
- #include "llvm/Support/SourceMgr.h"
- #include <cassert>
- #include <cctype>
- #include <cstdio>
- using namespace llvm;
- bool LLLexer::Error(LocTy ErrorLoc, const Twine &Msg) const {
- ErrorInfo = SM.GetMessage(ErrorLoc, SourceMgr::DK_Error, Msg);
- return true;
- }
- void LLLexer::Warning(LocTy WarningLoc, const Twine &Msg) const {
- SM.PrintMessage(WarningLoc, SourceMgr::DK_Warning, Msg);
- }
- //===----------------------------------------------------------------------===//
- // Helper functions.
- //===----------------------------------------------------------------------===//
- // atoull - Convert an ascii string of decimal digits into the unsigned long
- // long representation... this does not have to do input error checking,
- // because we know that the input will be matched by a suitable regex...
- //
- uint64_t LLLexer::atoull(const char *Buffer, const char *End) {
- uint64_t Result = 0;
- for (; Buffer != End; Buffer++) {
- uint64_t OldRes = Result;
- Result *= 10;
- Result += *Buffer-'0';
- if (Result < OldRes) { // Uh, oh, overflow detected!!!
- Error("constant bigger than 64 bits detected!");
- return 0;
- }
- }
- return Result;
- }
- uint64_t LLLexer::HexIntToVal(const char *Buffer, const char *End) {
- uint64_t Result = 0;
- for (; Buffer != End; ++Buffer) {
- uint64_t OldRes = Result;
- Result *= 16;
- Result += hexDigitValue(*Buffer);
- if (Result < OldRes) { // Uh, oh, overflow detected!!!
- Error("constant bigger than 64 bits detected!");
- return 0;
- }
- }
- return Result;
- }
- void LLLexer::HexToIntPair(const char *Buffer, const char *End,
- uint64_t Pair[2]) {
- Pair[0] = 0;
- if (End - Buffer >= 16) {
- for (int i = 0; i < 16; i++, Buffer++) {
- assert(Buffer != End);
- Pair[0] *= 16;
- Pair[0] += hexDigitValue(*Buffer);
- }
- }
- Pair[1] = 0;
- for (int i = 0; i < 16 && Buffer != End; i++, Buffer++) {
- Pair[1] *= 16;
- Pair[1] += hexDigitValue(*Buffer);
- }
- if (Buffer != End)
- Error("constant bigger than 128 bits detected!");
- }
- /// FP80HexToIntPair - translate an 80 bit FP80 number (20 hexits) into
- /// { low64, high16 } as usual for an APInt.
- void LLLexer::FP80HexToIntPair(const char *Buffer, const char *End,
- uint64_t Pair[2]) {
- Pair[1] = 0;
- for (int i=0; i<4 && Buffer != End; i++, Buffer++) {
- assert(Buffer != End);
- Pair[1] *= 16;
- Pair[1] += hexDigitValue(*Buffer);
- }
- Pair[0] = 0;
- for (int i = 0; i < 16 && Buffer != End; i++, Buffer++) {
- Pair[0] *= 16;
- Pair[0] += hexDigitValue(*Buffer);
- }
- if (Buffer != End)
- Error("constant bigger than 128 bits detected!");
- }
- // UnEscapeLexed - Run through the specified buffer and change \xx codes to the
- // appropriate character.
- static void UnEscapeLexed(std::string &Str) {
- if (Str.empty()) return;
- char *Buffer = &Str[0], *EndBuffer = Buffer+Str.size();
- char *BOut = Buffer;
- for (char *BIn = Buffer; BIn != EndBuffer; ) {
- if (BIn[0] == '\\') {
- if (BIn < EndBuffer-1 && BIn[1] == '\\') {
- *BOut++ = '\\'; // Two \ becomes one
- BIn += 2;
- } else if (BIn < EndBuffer-2 &&
- isxdigit(static_cast<unsigned char>(BIn[1])) &&
- isxdigit(static_cast<unsigned char>(BIn[2]))) {
- *BOut = hexDigitValue(BIn[1]) * 16 + hexDigitValue(BIn[2]);
- BIn += 3; // Skip over handled chars
- ++BOut;
- } else {
- *BOut++ = *BIn++;
- }
- } else {
- *BOut++ = *BIn++;
- }
- }
- Str.resize(BOut-Buffer);
- }
- /// isLabelChar - Return true for [-a-zA-Z$._0-9].
- static bool isLabelChar(char C) {
- return isalnum(static_cast<unsigned char>(C)) || C == '-' || C == '$' ||
- C == '.' || C == '_';
- }
- /// isLabelTail - Return true if this pointer points to a valid end of a label.
- static const char *isLabelTail(const char *CurPtr) {
- while (true) {
- if (CurPtr[0] == ':') return CurPtr+1;
- if (!isLabelChar(CurPtr[0])) return nullptr;
- ++CurPtr;
- }
- }
- //===----------------------------------------------------------------------===//
- // Lexer definition.
- //===----------------------------------------------------------------------===//
- LLLexer::LLLexer(StringRef StartBuf, SourceMgr &SM, SMDiagnostic &Err,
- LLVMContext &C)
- : CurBuf(StartBuf), ErrorInfo(Err), SM(SM), Context(C), APFloatVal(0.0),
- IgnoreColonInIdentifiers(false) {
- CurPtr = CurBuf.begin();
- }
- int LLLexer::getNextChar() {
- char CurChar = *CurPtr++;
- switch (CurChar) {
- default: return (unsigned char)CurChar;
- case 0:
- // A nul character in the stream is either the end of the current buffer or
- // a random nul in the file. Disambiguate that here.
- if (CurPtr-1 != CurBuf.end())
- return 0; // Just whitespace.
- // Otherwise, return end of file.
- --CurPtr; // Another call to lex will return EOF again.
- return EOF;
- }
- }
- lltok::Kind LLLexer::LexToken() {
- while (true) {
- TokStart = CurPtr;
- int CurChar = getNextChar();
- switch (CurChar) {
- default:
- // Handle letters: [a-zA-Z_]
- if (isalpha(static_cast<unsigned char>(CurChar)) || CurChar == '_')
- return LexIdentifier();
- return lltok::Error;
- case EOF: return lltok::Eof;
- case 0:
- case ' ':
- case '\t':
- case '\n':
- case '\r':
- // Ignore whitespace.
- continue;
- case '+': return LexPositive();
- case '@': return LexAt();
- case '$': return LexDollar();
- case '%': return LexPercent();
- case '"': return LexQuote();
- case '.':
- if (const char *Ptr = isLabelTail(CurPtr)) {
- CurPtr = Ptr;
- StrVal.assign(TokStart, CurPtr-1);
- return lltok::LabelStr;
- }
- if (CurPtr[0] == '.' && CurPtr[1] == '.') {
- CurPtr += 2;
- return lltok::dotdotdot;
- }
- return lltok::Error;
- case ';':
- SkipLineComment();
- continue;
- case '!': return LexExclaim();
- case '^':
- return LexCaret();
- case ':':
- return lltok::colon;
- case '#': return LexHash();
- case '0': case '1': case '2': case '3': case '4':
- case '5': case '6': case '7': case '8': case '9':
- case '-':
- return LexDigitOrNegative();
- case '=': return lltok::equal;
- case '[': return lltok::lsquare;
- case ']': return lltok::rsquare;
- case '{': return lltok::lbrace;
- case '}': return lltok::rbrace;
- case '<': return lltok::less;
- case '>': return lltok::greater;
- case '(': return lltok::lparen;
- case ')': return lltok::rparen;
- case ',': return lltok::comma;
- case '*': return lltok::star;
- case '|': return lltok::bar;
- }
- }
- }
- void LLLexer::SkipLineComment() {
- while (true) {
- if (CurPtr[0] == '\n' || CurPtr[0] == '\r' || getNextChar() == EOF)
- return;
- }
- }
- /// Lex all tokens that start with an @ character.
- /// GlobalVar @\"[^\"]*\"
- /// GlobalVar @[-a-zA-Z$._][-a-zA-Z$._0-9]*
- /// GlobalVarID @[0-9]+
- lltok::Kind LLLexer::LexAt() {
- return LexVar(lltok::GlobalVar, lltok::GlobalID);
- }
- lltok::Kind LLLexer::LexDollar() {
- if (const char *Ptr = isLabelTail(TokStart)) {
- CurPtr = Ptr;
- StrVal.assign(TokStart, CurPtr - 1);
- return lltok::LabelStr;
- }
- // Handle DollarStringConstant: $\"[^\"]*\"
- if (CurPtr[0] == '"') {
- ++CurPtr;
- while (true) {
- int CurChar = getNextChar();
- if (CurChar == EOF) {
- Error("end of file in COMDAT variable name");
- return lltok::Error;
- }
- if (CurChar == '"') {
- StrVal.assign(TokStart + 2, CurPtr - 1);
- UnEscapeLexed(StrVal);
- if (StringRef(StrVal).find_first_of(0) != StringRef::npos) {
- Error("Null bytes are not allowed in names");
- return lltok::Error;
- }
- return lltok::ComdatVar;
- }
- }
- }
- // Handle ComdatVarName: $[-a-zA-Z$._][-a-zA-Z$._0-9]*
- if (ReadVarName())
- return lltok::ComdatVar;
- return lltok::Error;
- }
- /// ReadString - Read a string until the closing quote.
- lltok::Kind LLLexer::ReadString(lltok::Kind kind) {
- const char *Start = CurPtr;
- while (true) {
- int CurChar = getNextChar();
- if (CurChar == EOF) {
- Error("end of file in string constant");
- return lltok::Error;
- }
- if (CurChar == '"') {
- StrVal.assign(Start, CurPtr-1);
- UnEscapeLexed(StrVal);
- return kind;
- }
- }
- }
- /// ReadVarName - Read the rest of a token containing a variable name.
- bool LLLexer::ReadVarName() {
- const char *NameStart = CurPtr;
- if (isalpha(static_cast<unsigned char>(CurPtr[0])) ||
- CurPtr[0] == '-' || CurPtr[0] == '$' ||
- CurPtr[0] == '.' || CurPtr[0] == '_') {
- ++CurPtr;
- while (isalnum(static_cast<unsigned char>(CurPtr[0])) ||
- CurPtr[0] == '-' || CurPtr[0] == '$' ||
- CurPtr[0] == '.' || CurPtr[0] == '_')
- ++CurPtr;
- StrVal.assign(NameStart, CurPtr);
- return true;
- }
- return false;
- }
- // Lex an ID: [0-9]+. On success, the ID is stored in UIntVal and Token is
- // returned, otherwise the Error token is returned.
- lltok::Kind LLLexer::LexUIntID(lltok::Kind Token) {
- if (!isdigit(static_cast<unsigned char>(CurPtr[0])))
- return lltok::Error;
- for (++CurPtr; isdigit(static_cast<unsigned char>(CurPtr[0])); ++CurPtr)
- /*empty*/;
- uint64_t Val = atoull(TokStart + 1, CurPtr);
- if ((unsigned)Val != Val)
- Error("invalid value number (too large)!");
- UIntVal = unsigned(Val);
- return Token;
- }
- lltok::Kind LLLexer::LexVar(lltok::Kind Var, lltok::Kind VarID) {
- // Handle StringConstant: \"[^\"]*\"
- if (CurPtr[0] == '"') {
- ++CurPtr;
- while (true) {
- int CurChar = getNextChar();
- if (CurChar == EOF) {
- Error("end of file in global variable name");
- return lltok::Error;
- }
- if (CurChar == '"') {
- StrVal.assign(TokStart+2, CurPtr-1);
- UnEscapeLexed(StrVal);
- if (StringRef(StrVal).find_first_of(0) != StringRef::npos) {
- Error("Null bytes are not allowed in names");
- return lltok::Error;
- }
- return Var;
- }
- }
- }
- // Handle VarName: [-a-zA-Z$._][-a-zA-Z$._0-9]*
- if (ReadVarName())
- return Var;
- // Handle VarID: [0-9]+
- return LexUIntID(VarID);
- }
- /// Lex all tokens that start with a % character.
- /// LocalVar ::= %\"[^\"]*\"
- /// LocalVar ::= %[-a-zA-Z$._][-a-zA-Z$._0-9]*
- /// LocalVarID ::= %[0-9]+
- lltok::Kind LLLexer::LexPercent() {
- return LexVar(lltok::LocalVar, lltok::LocalVarID);
- }
- /// Lex all tokens that start with a " character.
- /// QuoteLabel "[^"]+":
- /// StringConstant "[^"]*"
- lltok::Kind LLLexer::LexQuote() {
- lltok::Kind kind = ReadString(lltok::StringConstant);
- if (kind == lltok::Error || kind == lltok::Eof)
- return kind;
- if (CurPtr[0] == ':') {
- ++CurPtr;
- if (StringRef(StrVal).find_first_of(0) != StringRef::npos) {
- Error("Null bytes are not allowed in names");
- kind = lltok::Error;
- } else {
- kind = lltok::LabelStr;
- }
- }
- return kind;
- }
- /// Lex all tokens that start with a ! character.
- /// !foo
- /// !
- lltok::Kind LLLexer::LexExclaim() {
- // Lex a metadata name as a MetadataVar.
- if (isalpha(static_cast<unsigned char>(CurPtr[0])) ||
- CurPtr[0] == '-' || CurPtr[0] == '$' ||
- CurPtr[0] == '.' || CurPtr[0] == '_' || CurPtr[0] == '\\') {
- ++CurPtr;
- while (isalnum(static_cast<unsigned char>(CurPtr[0])) ||
- CurPtr[0] == '-' || CurPtr[0] == '$' ||
- CurPtr[0] == '.' || CurPtr[0] == '_' || CurPtr[0] == '\\')
- ++CurPtr;
- StrVal.assign(TokStart+1, CurPtr); // Skip !
- UnEscapeLexed(StrVal);
- return lltok::MetadataVar;
- }
- return lltok::exclaim;
- }
- /// Lex all tokens that start with a ^ character.
- /// SummaryID ::= ^[0-9]+
- lltok::Kind LLLexer::LexCaret() {
- // Handle SummaryID: ^[0-9]+
- return LexUIntID(lltok::SummaryID);
- }
- /// Lex all tokens that start with a # character.
- /// AttrGrpID ::= #[0-9]+
- lltok::Kind LLLexer::LexHash() {
- // Handle AttrGrpID: #[0-9]+
- return LexUIntID(lltok::AttrGrpID);
- }
- /// Lex a label, integer type, keyword, or hexadecimal integer constant.
- /// Label [-a-zA-Z$._0-9]+:
- /// IntegerType i[0-9]+
- /// Keyword sdiv, float, ...
- /// HexIntConstant [us]0x[0-9A-Fa-f]+
- lltok::Kind LLLexer::LexIdentifier() {
- const char *StartChar = CurPtr;
- const char *IntEnd = CurPtr[-1] == 'i' ? nullptr : StartChar;
- const char *KeywordEnd = nullptr;
- for (; isLabelChar(*CurPtr); ++CurPtr) {
- // If we decide this is an integer, remember the end of the sequence.
- if (!IntEnd && !isdigit(static_cast<unsigned char>(*CurPtr)))
- IntEnd = CurPtr;
- if (!KeywordEnd && !isalnum(static_cast<unsigned char>(*CurPtr)) &&
- *CurPtr != '_')
- KeywordEnd = CurPtr;
- }
- // If we stopped due to a colon, unless we were directed to ignore it,
- // this really is a label.
- if (!IgnoreColonInIdentifiers && *CurPtr == ':') {
- StrVal.assign(StartChar-1, CurPtr++);
- return lltok::LabelStr;
- }
- // Otherwise, this wasn't a label. If this was valid as an integer type,
- // return it.
- if (!IntEnd) IntEnd = CurPtr;
- if (IntEnd != StartChar) {
- CurPtr = IntEnd;
- uint64_t NumBits = atoull(StartChar, CurPtr);
- if (NumBits < IntegerType::MIN_INT_BITS ||
- NumBits > IntegerType::MAX_INT_BITS) {
- Error("bitwidth for integer type out of range!");
- return lltok::Error;
- }
- TyVal = IntegerType::get(Context, NumBits);
- return lltok::Type;
- }
- // Otherwise, this was a letter sequence. See which keyword this is.
- if (!KeywordEnd) KeywordEnd = CurPtr;
- CurPtr = KeywordEnd;
- --StartChar;
- StringRef Keyword(StartChar, CurPtr - StartChar);
- #define KEYWORD(STR) \
- do { \
- if (Keyword == #STR) \
- return lltok::kw_##STR; \
- } while (false)
- KEYWORD(true); KEYWORD(false);
- KEYWORD(declare); KEYWORD(define);
- KEYWORD(global); KEYWORD(constant);
- KEYWORD(dso_local);
- KEYWORD(dso_preemptable);
- KEYWORD(private);
- KEYWORD(internal);
- KEYWORD(available_externally);
- KEYWORD(linkonce);
- KEYWORD(linkonce_odr);
- KEYWORD(weak); // Use as a linkage, and a modifier for "cmpxchg".
- KEYWORD(weak_odr);
- KEYWORD(appending);
- KEYWORD(dllimport);
- KEYWORD(dllexport);
- KEYWORD(common);
- KEYWORD(default);
- KEYWORD(hidden);
- KEYWORD(protected);
- KEYWORD(unnamed_addr);
- KEYWORD(local_unnamed_addr);
- KEYWORD(externally_initialized);
- KEYWORD(extern_weak);
- KEYWORD(external);
- KEYWORD(thread_local);
- KEYWORD(localdynamic);
- KEYWORD(initialexec);
- KEYWORD(localexec);
- KEYWORD(zeroinitializer);
- KEYWORD(undef);
- KEYWORD(null);
- KEYWORD(none);
- KEYWORD(poison);
- KEYWORD(to);
- KEYWORD(caller);
- KEYWORD(within);
- KEYWORD(from);
- KEYWORD(tail);
- KEYWORD(musttail);
- KEYWORD(notail);
- KEYWORD(target);
- KEYWORD(triple);
- KEYWORD(source_filename);
- KEYWORD(unwind);
- KEYWORD(datalayout);
- KEYWORD(volatile);
- KEYWORD(atomic);
- KEYWORD(unordered);
- KEYWORD(monotonic);
- KEYWORD(acquire);
- KEYWORD(release);
- KEYWORD(acq_rel);
- KEYWORD(seq_cst);
- KEYWORD(syncscope);
- KEYWORD(nnan);
- KEYWORD(ninf);
- KEYWORD(nsz);
- KEYWORD(arcp);
- KEYWORD(contract);
- KEYWORD(reassoc);
- KEYWORD(afn);
- KEYWORD(fast);
- KEYWORD(nuw);
- KEYWORD(nsw);
- KEYWORD(exact);
- KEYWORD(inbounds);
- KEYWORD(inrange);
- KEYWORD(align);
- KEYWORD(addrspace);
- KEYWORD(section);
- KEYWORD(partition);
- KEYWORD(alias);
- KEYWORD(ifunc);
- KEYWORD(module);
- KEYWORD(asm);
- KEYWORD(sideeffect);
- KEYWORD(alignstack);
- KEYWORD(inteldialect);
- KEYWORD(gc);
- KEYWORD(prefix);
- KEYWORD(prologue);
- KEYWORD(ccc);
- KEYWORD(fastcc);
- KEYWORD(coldcc);
- KEYWORD(cfguard_checkcc);
- KEYWORD(x86_stdcallcc);
- KEYWORD(x86_fastcallcc);
- KEYWORD(x86_thiscallcc);
- KEYWORD(x86_vectorcallcc);
- KEYWORD(arm_apcscc);
- KEYWORD(arm_aapcscc);
- KEYWORD(arm_aapcs_vfpcc);
- KEYWORD(aarch64_vector_pcs);
- KEYWORD(aarch64_sve_vector_pcs);
- KEYWORD(msp430_intrcc);
- KEYWORD(avr_intrcc);
- KEYWORD(avr_signalcc);
- KEYWORD(ptx_kernel);
- KEYWORD(ptx_device);
- KEYWORD(spir_kernel);
- KEYWORD(spir_func);
- KEYWORD(intel_ocl_bicc);
- KEYWORD(x86_64_sysvcc);
- KEYWORD(win64cc);
- KEYWORD(x86_regcallcc);
- KEYWORD(webkit_jscc);
- KEYWORD(swiftcc);
- KEYWORD(swifttailcc);
- KEYWORD(anyregcc);
- KEYWORD(preserve_mostcc);
- KEYWORD(preserve_allcc);
- KEYWORD(ghccc);
- KEYWORD(x86_intrcc);
- KEYWORD(hhvmcc);
- KEYWORD(hhvm_ccc);
- KEYWORD(cxx_fast_tlscc);
- KEYWORD(amdgpu_vs);
- KEYWORD(amdgpu_ls);
- KEYWORD(amdgpu_hs);
- KEYWORD(amdgpu_es);
- KEYWORD(amdgpu_gs);
- KEYWORD(amdgpu_ps);
- KEYWORD(amdgpu_cs);
- KEYWORD(amdgpu_kernel);
- KEYWORD(amdgpu_gfx);
- KEYWORD(tailcc);
- KEYWORD(cc);
- KEYWORD(c);
- KEYWORD(attributes);
- KEYWORD(alwaysinline);
- KEYWORD(allocsize);
- KEYWORD(argmemonly);
- KEYWORD(builtin);
- KEYWORD(byval);
- KEYWORD(inalloca);
- KEYWORD(cold);
- KEYWORD(convergent);
- KEYWORD(dereferenceable);
- KEYWORD(dereferenceable_or_null);
- KEYWORD(disable_sanitizer_instrumentation);
- KEYWORD(elementtype);
- KEYWORD(inaccessiblememonly);
- KEYWORD(inaccessiblemem_or_argmemonly);
- KEYWORD(inlinehint);
- KEYWORD(inreg);
- KEYWORD(jumptable);
- KEYWORD(minsize);
- KEYWORD(naked);
- KEYWORD(nest);
- KEYWORD(noalias);
- KEYWORD(nobuiltin);
- KEYWORD(nocallback);
- KEYWORD(nocapture);
- KEYWORD(noduplicate);
- KEYWORD(nofree);
- KEYWORD(noimplicitfloat);
- KEYWORD(noinline);
- KEYWORD(norecurse);
- KEYWORD(nonlazybind);
- KEYWORD(nomerge);
- KEYWORD(nonnull);
- KEYWORD(noprofile);
- KEYWORD(noredzone);
- KEYWORD(noreturn);
- KEYWORD(nosync);
- KEYWORD(nocf_check);
- KEYWORD(noundef);
- KEYWORD(nounwind);
- KEYWORD(nosanitize_coverage);
- KEYWORD(null_pointer_is_valid);
- KEYWORD(optforfuzzing);
- KEYWORD(optnone);
- KEYWORD(optsize);
- KEYWORD(preallocated);
- KEYWORD(readnone);
- KEYWORD(readonly);
- KEYWORD(returned);
- KEYWORD(returns_twice);
- KEYWORD(signext);
- KEYWORD(speculatable);
- KEYWORD(sret);
- KEYWORD(ssp);
- KEYWORD(sspreq);
- KEYWORD(sspstrong);
- KEYWORD(strictfp);
- KEYWORD(safestack);
- KEYWORD(shadowcallstack);
- KEYWORD(sanitize_address);
- KEYWORD(sanitize_hwaddress);
- KEYWORD(sanitize_memtag);
- KEYWORD(sanitize_thread);
- KEYWORD(sanitize_memory);
- KEYWORD(speculative_load_hardening);
- KEYWORD(swifterror);
- KEYWORD(swiftself);
- KEYWORD(swiftasync);
- KEYWORD(uwtable);
- KEYWORD(vscale_range);
- KEYWORD(willreturn);
- KEYWORD(writeonly);
- KEYWORD(zeroext);
- KEYWORD(immarg);
- KEYWORD(byref);
- KEYWORD(mustprogress);
- KEYWORD(type);
- KEYWORD(opaque);
- KEYWORD(comdat);
- // Comdat types
- KEYWORD(any);
- KEYWORD(exactmatch);
- KEYWORD(largest);
- KEYWORD(nodeduplicate);
- KEYWORD(samesize);
- KEYWORD(eq); KEYWORD(ne); KEYWORD(slt); KEYWORD(sgt); KEYWORD(sle);
- KEYWORD(sge); KEYWORD(ult); KEYWORD(ugt); KEYWORD(ule); KEYWORD(uge);
- KEYWORD(oeq); KEYWORD(one); KEYWORD(olt); KEYWORD(ogt); KEYWORD(ole);
- KEYWORD(oge); KEYWORD(ord); KEYWORD(uno); KEYWORD(ueq); KEYWORD(une);
- KEYWORD(xchg); KEYWORD(nand); KEYWORD(max); KEYWORD(min); KEYWORD(umax);
- KEYWORD(umin);
- KEYWORD(vscale);
- KEYWORD(x);
- KEYWORD(blockaddress);
- KEYWORD(dso_local_equivalent);
- KEYWORD(no_cfi);
- // Metadata types.
- KEYWORD(distinct);
- // Use-list order directives.
- KEYWORD(uselistorder);
- KEYWORD(uselistorder_bb);
- KEYWORD(personality);
- KEYWORD(cleanup);
- KEYWORD(catch);
- KEYWORD(filter);
- // Summary index keywords.
- KEYWORD(path);
- KEYWORD(hash);
- KEYWORD(gv);
- KEYWORD(guid);
- KEYWORD(name);
- KEYWORD(summaries);
- KEYWORD(flags);
- KEYWORD(blockcount);
- KEYWORD(linkage);
- KEYWORD(visibility);
- KEYWORD(notEligibleToImport);
- KEYWORD(live);
- KEYWORD(dsoLocal);
- KEYWORD(canAutoHide);
- KEYWORD(function);
- KEYWORD(insts);
- KEYWORD(funcFlags);
- KEYWORD(readNone);
- KEYWORD(readOnly);
- KEYWORD(noRecurse);
- KEYWORD(returnDoesNotAlias);
- KEYWORD(noInline);
- KEYWORD(alwaysInline);
- KEYWORD(noUnwind);
- KEYWORD(mayThrow);
- KEYWORD(hasUnknownCall);
- KEYWORD(mustBeUnreachable);
- KEYWORD(calls);
- KEYWORD(callee);
- KEYWORD(params);
- KEYWORD(param);
- KEYWORD(hotness);
- KEYWORD(unknown);
- KEYWORD(hot);
- KEYWORD(critical);
- KEYWORD(relbf);
- KEYWORD(variable);
- KEYWORD(vTableFuncs);
- KEYWORD(virtFunc);
- KEYWORD(aliasee);
- KEYWORD(refs);
- KEYWORD(typeIdInfo);
- KEYWORD(typeTests);
- KEYWORD(typeTestAssumeVCalls);
- KEYWORD(typeCheckedLoadVCalls);
- KEYWORD(typeTestAssumeConstVCalls);
- KEYWORD(typeCheckedLoadConstVCalls);
- KEYWORD(vFuncId);
- KEYWORD(offset);
- KEYWORD(args);
- KEYWORD(typeid);
- KEYWORD(typeidCompatibleVTable);
- KEYWORD(summary);
- KEYWORD(typeTestRes);
- KEYWORD(kind);
- KEYWORD(unsat);
- KEYWORD(byteArray);
- KEYWORD(inline);
- KEYWORD(single);
- KEYWORD(allOnes);
- KEYWORD(sizeM1BitWidth);
- KEYWORD(alignLog2);
- KEYWORD(sizeM1);
- KEYWORD(bitMask);
- KEYWORD(inlineBits);
- KEYWORD(vcall_visibility);
- KEYWORD(wpdResolutions);
- KEYWORD(wpdRes);
- KEYWORD(indir);
- KEYWORD(singleImpl);
- KEYWORD(branchFunnel);
- KEYWORD(singleImplName);
- KEYWORD(resByArg);
- KEYWORD(byArg);
- KEYWORD(uniformRetVal);
- KEYWORD(uniqueRetVal);
- KEYWORD(virtualConstProp);
- KEYWORD(info);
- KEYWORD(byte);
- KEYWORD(bit);
- KEYWORD(varFlags);
- #undef KEYWORD
- // Keywords for types.
- #define TYPEKEYWORD(STR, LLVMTY) \
- do { \
- if (Keyword == STR) { \
- TyVal = LLVMTY; \
- return lltok::Type; \
- } \
- } while (false)
- TYPEKEYWORD("void", Type::getVoidTy(Context));
- TYPEKEYWORD("half", Type::getHalfTy(Context));
- TYPEKEYWORD("bfloat", Type::getBFloatTy(Context));
- TYPEKEYWORD("float", Type::getFloatTy(Context));
- TYPEKEYWORD("double", Type::getDoubleTy(Context));
- TYPEKEYWORD("x86_fp80", Type::getX86_FP80Ty(Context));
- TYPEKEYWORD("fp128", Type::getFP128Ty(Context));
- TYPEKEYWORD("ppc_fp128", Type::getPPC_FP128Ty(Context));
- TYPEKEYWORD("label", Type::getLabelTy(Context));
- TYPEKEYWORD("metadata", Type::getMetadataTy(Context));
- TYPEKEYWORD("x86_mmx", Type::getX86_MMXTy(Context));
- TYPEKEYWORD("x86_amx", Type::getX86_AMXTy(Context));
- TYPEKEYWORD("token", Type::getTokenTy(Context));
- if (Keyword == "ptr") {
- if (Context.supportsTypedPointers()) {
- Warning("ptr type is only supported in -opaque-pointers mode");
- return lltok::Error;
- }
- TyVal = PointerType::getUnqual(Context);
- return lltok::Type;
- }
- #undef TYPEKEYWORD
- // Keywords for instructions.
- #define INSTKEYWORD(STR, Enum) \
- do { \
- if (Keyword == #STR) { \
- UIntVal = Instruction::Enum; \
- return lltok::kw_##STR; \
- } \
- } while (false)
- INSTKEYWORD(fneg, FNeg);
- INSTKEYWORD(add, Add); INSTKEYWORD(fadd, FAdd);
- INSTKEYWORD(sub, Sub); INSTKEYWORD(fsub, FSub);
- INSTKEYWORD(mul, Mul); INSTKEYWORD(fmul, FMul);
- INSTKEYWORD(udiv, UDiv); INSTKEYWORD(sdiv, SDiv); INSTKEYWORD(fdiv, FDiv);
- INSTKEYWORD(urem, URem); INSTKEYWORD(srem, SRem); INSTKEYWORD(frem, FRem);
- INSTKEYWORD(shl, Shl); INSTKEYWORD(lshr, LShr); INSTKEYWORD(ashr, AShr);
- INSTKEYWORD(and, And); INSTKEYWORD(or, Or); INSTKEYWORD(xor, Xor);
- INSTKEYWORD(icmp, ICmp); INSTKEYWORD(fcmp, FCmp);
- INSTKEYWORD(phi, PHI);
- INSTKEYWORD(call, Call);
- INSTKEYWORD(trunc, Trunc);
- INSTKEYWORD(zext, ZExt);
- INSTKEYWORD(sext, SExt);
- INSTKEYWORD(fptrunc, FPTrunc);
- INSTKEYWORD(fpext, FPExt);
- INSTKEYWORD(uitofp, UIToFP);
- INSTKEYWORD(sitofp, SIToFP);
- INSTKEYWORD(fptoui, FPToUI);
- INSTKEYWORD(fptosi, FPToSI);
- INSTKEYWORD(inttoptr, IntToPtr);
- INSTKEYWORD(ptrtoint, PtrToInt);
- INSTKEYWORD(bitcast, BitCast);
- INSTKEYWORD(addrspacecast, AddrSpaceCast);
- INSTKEYWORD(select, Select);
- INSTKEYWORD(va_arg, VAArg);
- INSTKEYWORD(ret, Ret);
- INSTKEYWORD(br, Br);
- INSTKEYWORD(switch, Switch);
- INSTKEYWORD(indirectbr, IndirectBr);
- INSTKEYWORD(invoke, Invoke);
- INSTKEYWORD(resume, Resume);
- INSTKEYWORD(unreachable, Unreachable);
- INSTKEYWORD(callbr, CallBr);
- INSTKEYWORD(alloca, Alloca);
- INSTKEYWORD(load, Load);
- INSTKEYWORD(store, Store);
- INSTKEYWORD(cmpxchg, AtomicCmpXchg);
- INSTKEYWORD(atomicrmw, AtomicRMW);
- INSTKEYWORD(fence, Fence);
- INSTKEYWORD(getelementptr, GetElementPtr);
- INSTKEYWORD(extractelement, ExtractElement);
- INSTKEYWORD(insertelement, InsertElement);
- INSTKEYWORD(shufflevector, ShuffleVector);
- INSTKEYWORD(extractvalue, ExtractValue);
- INSTKEYWORD(insertvalue, InsertValue);
- INSTKEYWORD(landingpad, LandingPad);
- INSTKEYWORD(cleanupret, CleanupRet);
- INSTKEYWORD(catchret, CatchRet);
- INSTKEYWORD(catchswitch, CatchSwitch);
- INSTKEYWORD(catchpad, CatchPad);
- INSTKEYWORD(cleanuppad, CleanupPad);
- INSTKEYWORD(freeze, Freeze);
- #undef INSTKEYWORD
- #define DWKEYWORD(TYPE, TOKEN) \
- do { \
- if (Keyword.startswith("DW_" #TYPE "_")) { \
- StrVal.assign(Keyword.begin(), Keyword.end()); \
- return lltok::TOKEN; \
- } \
- } while (false)
- DWKEYWORD(TAG, DwarfTag);
- DWKEYWORD(ATE, DwarfAttEncoding);
- DWKEYWORD(VIRTUALITY, DwarfVirtuality);
- DWKEYWORD(LANG, DwarfLang);
- DWKEYWORD(CC, DwarfCC);
- DWKEYWORD(OP, DwarfOp);
- DWKEYWORD(MACINFO, DwarfMacinfo);
- #undef DWKEYWORD
- if (Keyword.startswith("DIFlag")) {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::DIFlag;
- }
- if (Keyword.startswith("DISPFlag")) {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::DISPFlag;
- }
- if (Keyword.startswith("CSK_")) {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::ChecksumKind;
- }
- if (Keyword == "NoDebug" || Keyword == "FullDebug" ||
- Keyword == "LineTablesOnly" || Keyword == "DebugDirectivesOnly") {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::EmissionKind;
- }
- if (Keyword == "GNU" || Keyword == "None" || Keyword == "Default") {
- StrVal.assign(Keyword.begin(), Keyword.end());
- return lltok::NameTableKind;
- }
- // Check for [us]0x[0-9A-Fa-f]+ which are Hexadecimal constant generated by
- // the CFE to avoid forcing it to deal with 64-bit numbers.
- if ((TokStart[0] == 'u' || TokStart[0] == 's') &&
- TokStart[1] == '0' && TokStart[2] == 'x' &&
- isxdigit(static_cast<unsigned char>(TokStart[3]))) {
- int len = CurPtr-TokStart-3;
- uint32_t bits = len * 4;
- StringRef HexStr(TokStart + 3, len);
- if (!all_of(HexStr, isxdigit)) {
- // Bad token, return it as an error.
- CurPtr = TokStart+3;
- return lltok::Error;
- }
- APInt Tmp(bits, HexStr, 16);
- uint32_t activeBits = Tmp.getActiveBits();
- if (activeBits > 0 && activeBits < bits)
- Tmp = Tmp.trunc(activeBits);
- APSIntVal = APSInt(Tmp, TokStart[0] == 'u');
- return lltok::APSInt;
- }
- // If this is "cc1234", return this as just "cc".
- if (TokStart[0] == 'c' && TokStart[1] == 'c') {
- CurPtr = TokStart+2;
- return lltok::kw_cc;
- }
- // Finally, if this isn't known, return an error.
- CurPtr = TokStart+1;
- return lltok::Error;
- }
- /// Lex all tokens that start with a 0x prefix, knowing they match and are not
- /// labels.
- /// HexFPConstant 0x[0-9A-Fa-f]+
- /// HexFP80Constant 0xK[0-9A-Fa-f]+
- /// HexFP128Constant 0xL[0-9A-Fa-f]+
- /// HexPPC128Constant 0xM[0-9A-Fa-f]+
- /// HexHalfConstant 0xH[0-9A-Fa-f]+
- /// HexBFloatConstant 0xR[0-9A-Fa-f]+
- lltok::Kind LLLexer::Lex0x() {
- CurPtr = TokStart + 2;
- char Kind;
- if ((CurPtr[0] >= 'K' && CurPtr[0] <= 'M') || CurPtr[0] == 'H' ||
- CurPtr[0] == 'R') {
- Kind = *CurPtr++;
- } else {
- Kind = 'J';
- }
- if (!isxdigit(static_cast<unsigned char>(CurPtr[0]))) {
- // Bad token, return it as an error.
- CurPtr = TokStart+1;
- return lltok::Error;
- }
- while (isxdigit(static_cast<unsigned char>(CurPtr[0])))
- ++CurPtr;
- if (Kind == 'J') {
- // HexFPConstant - Floating point constant represented in IEEE format as a
- // hexadecimal number for when exponential notation is not precise enough.
- // Half, BFloat, Float, and double only.
- APFloatVal = APFloat(APFloat::IEEEdouble(),
- APInt(64, HexIntToVal(TokStart + 2, CurPtr)));
- return lltok::APFloat;
- }
- uint64_t Pair[2];
- switch (Kind) {
- default: llvm_unreachable("Unknown kind!");
- case 'K':
- // F80HexFPConstant - x87 long double in hexadecimal format (10 bytes)
- FP80HexToIntPair(TokStart+3, CurPtr, Pair);
- APFloatVal = APFloat(APFloat::x87DoubleExtended(), APInt(80, Pair));
- return lltok::APFloat;
- case 'L':
- // F128HexFPConstant - IEEE 128-bit in hexadecimal format (16 bytes)
- HexToIntPair(TokStart+3, CurPtr, Pair);
- APFloatVal = APFloat(APFloat::IEEEquad(), APInt(128, Pair));
- return lltok::APFloat;
- case 'M':
- // PPC128HexFPConstant - PowerPC 128-bit in hexadecimal format (16 bytes)
- HexToIntPair(TokStart+3, CurPtr, Pair);
- APFloatVal = APFloat(APFloat::PPCDoubleDouble(), APInt(128, Pair));
- return lltok::APFloat;
- case 'H':
- APFloatVal = APFloat(APFloat::IEEEhalf(),
- APInt(16,HexIntToVal(TokStart+3, CurPtr)));
- return lltok::APFloat;
- case 'R':
- // Brain floating point
- APFloatVal = APFloat(APFloat::BFloat(),
- APInt(16, HexIntToVal(TokStart + 3, CurPtr)));
- return lltok::APFloat;
- }
- }
- /// Lex tokens for a label or a numeric constant, possibly starting with -.
- /// Label [-a-zA-Z$._0-9]+:
- /// NInteger -[0-9]+
- /// FPConstant [-+]?[0-9]+[.][0-9]*([eE][-+]?[0-9]+)?
- /// PInteger [0-9]+
- /// HexFPConstant 0x[0-9A-Fa-f]+
- /// HexFP80Constant 0xK[0-9A-Fa-f]+
- /// HexFP128Constant 0xL[0-9A-Fa-f]+
- /// HexPPC128Constant 0xM[0-9A-Fa-f]+
- lltok::Kind LLLexer::LexDigitOrNegative() {
- // If the letter after the negative is not a number, this is probably a label.
- if (!isdigit(static_cast<unsigned char>(TokStart[0])) &&
- !isdigit(static_cast<unsigned char>(CurPtr[0]))) {
- // Okay, this is not a number after the -, it's probably a label.
- if (const char *End = isLabelTail(CurPtr)) {
- StrVal.assign(TokStart, End-1);
- CurPtr = End;
- return lltok::LabelStr;
- }
- return lltok::Error;
- }
- // At this point, it is either a label, int or fp constant.
- // Skip digits, we have at least one.
- for (; isdigit(static_cast<unsigned char>(CurPtr[0])); ++CurPtr)
- /*empty*/;
- // Check if this is a fully-numeric label:
- if (isdigit(TokStart[0]) && CurPtr[0] == ':') {
- uint64_t Val = atoull(TokStart, CurPtr);
- ++CurPtr; // Skip the colon.
- if ((unsigned)Val != Val)
- Error("invalid value number (too large)!");
- UIntVal = unsigned(Val);
- return lltok::LabelID;
- }
- // Check to see if this really is a string label, e.g. "-1:".
- if (isLabelChar(CurPtr[0]) || CurPtr[0] == ':') {
- if (const char *End = isLabelTail(CurPtr)) {
- StrVal.assign(TokStart, End-1);
- CurPtr = End;
- return lltok::LabelStr;
- }
- }
- // If the next character is a '.', then it is a fp value, otherwise its
- // integer.
- if (CurPtr[0] != '.') {
- if (TokStart[0] == '0' && TokStart[1] == 'x')
- return Lex0x();
- APSIntVal = APSInt(StringRef(TokStart, CurPtr - TokStart));
- return lltok::APSInt;
- }
- ++CurPtr;
- // Skip over [0-9]*([eE][-+]?[0-9]+)?
- while (isdigit(static_cast<unsigned char>(CurPtr[0]))) ++CurPtr;
- if (CurPtr[0] == 'e' || CurPtr[0] == 'E') {
- if (isdigit(static_cast<unsigned char>(CurPtr[1])) ||
- ((CurPtr[1] == '-' || CurPtr[1] == '+') &&
- isdigit(static_cast<unsigned char>(CurPtr[2])))) {
- CurPtr += 2;
- while (isdigit(static_cast<unsigned char>(CurPtr[0]))) ++CurPtr;
- }
- }
- APFloatVal = APFloat(APFloat::IEEEdouble(),
- StringRef(TokStart, CurPtr - TokStart));
- return lltok::APFloat;
- }
- /// Lex a floating point constant starting with +.
- /// FPConstant [-+]?[0-9]+[.][0-9]*([eE][-+]?[0-9]+)?
- lltok::Kind LLLexer::LexPositive() {
- // If the letter after the negative is a number, this is probably not a
- // label.
- if (!isdigit(static_cast<unsigned char>(CurPtr[0])))
- return lltok::Error;
- // Skip digits.
- for (++CurPtr; isdigit(static_cast<unsigned char>(CurPtr[0])); ++CurPtr)
- /*empty*/;
- // At this point, we need a '.'.
- if (CurPtr[0] != '.') {
- CurPtr = TokStart+1;
- return lltok::Error;
- }
- ++CurPtr;
- // Skip over [0-9]*([eE][-+]?[0-9]+)?
- while (isdigit(static_cast<unsigned char>(CurPtr[0]))) ++CurPtr;
- if (CurPtr[0] == 'e' || CurPtr[0] == 'E') {
- if (isdigit(static_cast<unsigned char>(CurPtr[1])) ||
- ((CurPtr[1] == '-' || CurPtr[1] == '+') &&
- isdigit(static_cast<unsigned char>(CurPtr[2])))) {
- CurPtr += 2;
- while (isdigit(static_cast<unsigned char>(CurPtr[0]))) ++CurPtr;
- }
- }
- APFloatVal = APFloat(APFloat::IEEEdouble(),
- StringRef(TokStart, CurPtr - TokStart));
- return lltok::APFloat;
- }
|