123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476 |
- //===- BitstreamReader.cpp - BitstreamReader implementation ---------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/Bitstream/BitstreamReader.h"
- #include "llvm/ADT/StringRef.h"
- #include <cassert>
- #include <string>
- using namespace llvm;
- //===----------------------------------------------------------------------===//
- // BitstreamCursor implementation
- //===----------------------------------------------------------------------===//
- /// Having read the ENTER_SUBBLOCK abbrevid, enter the block.
- Error BitstreamCursor::EnterSubBlock(unsigned BlockID, unsigned *NumWordsP) {
- // Save the current block's state on BlockScope.
- BlockScope.push_back(Block(CurCodeSize));
- BlockScope.back().PrevAbbrevs.swap(CurAbbrevs);
- // Add the abbrevs specific to this block to the CurAbbrevs list.
- if (BlockInfo) {
- if (const BitstreamBlockInfo::BlockInfo *Info =
- BlockInfo->getBlockInfo(BlockID)) {
- llvm::append_range(CurAbbrevs, Info->Abbrevs);
- }
- }
- // Get the codesize of this block.
- Expected<uint32_t> MaybeVBR = ReadVBR(bitc::CodeLenWidth);
- if (!MaybeVBR)
- return MaybeVBR.takeError();
- CurCodeSize = MaybeVBR.get();
- if (CurCodeSize > MaxChunkSize)
- return llvm::createStringError(
- std::errc::illegal_byte_sequence,
- "can't read more than %zu at a time, trying to read %u", +MaxChunkSize,
- CurCodeSize);
- SkipToFourByteBoundary();
- Expected<word_t> MaybeNum = Read(bitc::BlockSizeWidth);
- if (!MaybeNum)
- return MaybeNum.takeError();
- word_t NumWords = MaybeNum.get();
- if (NumWordsP)
- *NumWordsP = NumWords;
- if (CurCodeSize == 0)
- return llvm::createStringError(
- std::errc::illegal_byte_sequence,
- "can't enter sub-block: current code size is 0");
- if (AtEndOfStream())
- return llvm::createStringError(
- std::errc::illegal_byte_sequence,
- "can't enter sub block: already at end of stream");
- return Error::success();
- }
- static Expected<uint64_t> readAbbreviatedField(BitstreamCursor &Cursor,
- const BitCodeAbbrevOp &Op) {
- assert(!Op.isLiteral() && "Not to be used with literals!");
- // Decode the value as we are commanded.
- switch (Op.getEncoding()) {
- case BitCodeAbbrevOp::Array:
- case BitCodeAbbrevOp::Blob:
- llvm_unreachable("Should not reach here");
- case BitCodeAbbrevOp::Fixed:
- assert((unsigned)Op.getEncodingData() <= Cursor.MaxChunkSize);
- return Cursor.Read((unsigned)Op.getEncodingData());
- case BitCodeAbbrevOp::VBR:
- assert((unsigned)Op.getEncodingData() <= Cursor.MaxChunkSize);
- return Cursor.ReadVBR64((unsigned)Op.getEncodingData());
- case BitCodeAbbrevOp::Char6:
- if (Expected<unsigned> Res = Cursor.Read(6))
- return BitCodeAbbrevOp::DecodeChar6(Res.get());
- else
- return Res.takeError();
- }
- llvm_unreachable("invalid abbreviation encoding");
- }
- /// skipRecord - Read the current record and discard it.
- Expected<unsigned> BitstreamCursor::skipRecord(unsigned AbbrevID) {
- // Skip unabbreviated records by reading past their entries.
- if (AbbrevID == bitc::UNABBREV_RECORD) {
- Expected<uint32_t> MaybeCode = ReadVBR(6);
- if (!MaybeCode)
- return MaybeCode.takeError();
- unsigned Code = MaybeCode.get();
- Expected<uint32_t> MaybeVBR = ReadVBR(6);
- if (!MaybeVBR)
- return MaybeVBR.get();
- unsigned NumElts = MaybeVBR.get();
- for (unsigned i = 0; i != NumElts; ++i)
- if (Expected<uint64_t> Res = ReadVBR64(6))
- ; // Skip!
- else
- return Res.takeError();
- return Code;
- }
- const BitCodeAbbrev *Abbv = getAbbrev(AbbrevID);
- const BitCodeAbbrevOp &CodeOp = Abbv->getOperandInfo(0);
- unsigned Code;
- if (CodeOp.isLiteral())
- Code = CodeOp.getLiteralValue();
- else {
- if (CodeOp.getEncoding() == BitCodeAbbrevOp::Array ||
- CodeOp.getEncoding() == BitCodeAbbrevOp::Blob)
- return llvm::createStringError(
- std::errc::illegal_byte_sequence,
- "Abbreviation starts with an Array or a Blob");
- Expected<uint64_t> MaybeCode = readAbbreviatedField(*this, CodeOp);
- if (!MaybeCode)
- return MaybeCode.takeError();
- Code = MaybeCode.get();
- }
- for (unsigned i = 1, e = Abbv->getNumOperandInfos(); i < e; ++i) {
- const BitCodeAbbrevOp &Op = Abbv->getOperandInfo(i);
- if (Op.isLiteral())
- continue;
- if (Op.getEncoding() != BitCodeAbbrevOp::Array &&
- Op.getEncoding() != BitCodeAbbrevOp::Blob) {
- if (Expected<uint64_t> MaybeField = readAbbreviatedField(*this, Op))
- continue;
- else
- return MaybeField.takeError();
- }
- if (Op.getEncoding() == BitCodeAbbrevOp::Array) {
- // Array case. Read the number of elements as a vbr6.
- Expected<uint32_t> MaybeNum = ReadVBR(6);
- if (!MaybeNum)
- return MaybeNum.takeError();
- unsigned NumElts = MaybeNum.get();
- // Get the element encoding.
- assert(i+2 == e && "array op not second to last?");
- const BitCodeAbbrevOp &EltEnc = Abbv->getOperandInfo(++i);
- // Read all the elements.
- // Decode the value as we are commanded.
- switch (EltEnc.getEncoding()) {
- default:
- report_fatal_error("Array element type can't be an Array or a Blob");
- case BitCodeAbbrevOp::Fixed:
- assert((unsigned)EltEnc.getEncodingData() <= MaxChunkSize);
- if (Error Err =
- JumpToBit(GetCurrentBitNo() + static_cast<uint64_t>(NumElts) *
- EltEnc.getEncodingData()))
- return std::move(Err);
- break;
- case BitCodeAbbrevOp::VBR:
- assert((unsigned)EltEnc.getEncodingData() <= MaxChunkSize);
- for (; NumElts; --NumElts)
- if (Expected<uint64_t> Res =
- ReadVBR64((unsigned)EltEnc.getEncodingData()))
- ; // Skip!
- else
- return Res.takeError();
- break;
- case BitCodeAbbrevOp::Char6:
- if (Error Err = JumpToBit(GetCurrentBitNo() + NumElts * 6))
- return std::move(Err);
- break;
- }
- continue;
- }
- assert(Op.getEncoding() == BitCodeAbbrevOp::Blob);
- // Blob case. Read the number of bytes as a vbr6.
- Expected<uint32_t> MaybeNum = ReadVBR(6);
- if (!MaybeNum)
- return MaybeNum.takeError();
- unsigned NumElts = MaybeNum.get();
- SkipToFourByteBoundary(); // 32-bit alignment
- // Figure out where the end of this blob will be including tail padding.
- const size_t NewEnd = GetCurrentBitNo() + alignTo(NumElts, 4) * 8;
- // If this would read off the end of the bitcode file, just set the
- // record to empty and return.
- if (!canSkipToPos(NewEnd/8)) {
- skipToEnd();
- break;
- }
- // Skip over the blob.
- if (Error Err = JumpToBit(NewEnd))
- return std::move(Err);
- }
- return Code;
- }
- Expected<unsigned> BitstreamCursor::readRecord(unsigned AbbrevID,
- SmallVectorImpl<uint64_t> &Vals,
- StringRef *Blob) {
- if (AbbrevID == bitc::UNABBREV_RECORD) {
- Expected<uint32_t> MaybeCode = ReadVBR(6);
- if (!MaybeCode)
- return MaybeCode.takeError();
- uint32_t Code = MaybeCode.get();
- Expected<uint32_t> MaybeNumElts = ReadVBR(6);
- if (!MaybeNumElts)
- return MaybeNumElts.takeError();
- uint32_t NumElts = MaybeNumElts.get();
- Vals.reserve(Vals.size() + NumElts);
- for (unsigned i = 0; i != NumElts; ++i)
- if (Expected<uint64_t> MaybeVal = ReadVBR64(6))
- Vals.push_back(MaybeVal.get());
- else
- return MaybeVal.takeError();
- return Code;
- }
- const BitCodeAbbrev *Abbv = getAbbrev(AbbrevID);
- // Read the record code first.
- assert(Abbv->getNumOperandInfos() != 0 && "no record code in abbreviation?");
- const BitCodeAbbrevOp &CodeOp = Abbv->getOperandInfo(0);
- unsigned Code;
- if (CodeOp.isLiteral())
- Code = CodeOp.getLiteralValue();
- else {
- if (CodeOp.getEncoding() == BitCodeAbbrevOp::Array ||
- CodeOp.getEncoding() == BitCodeAbbrevOp::Blob)
- report_fatal_error("Abbreviation starts with an Array or a Blob");
- if (Expected<uint64_t> MaybeCode = readAbbreviatedField(*this, CodeOp))
- Code = MaybeCode.get();
- else
- return MaybeCode.takeError();
- }
- for (unsigned i = 1, e = Abbv->getNumOperandInfos(); i != e; ++i) {
- const BitCodeAbbrevOp &Op = Abbv->getOperandInfo(i);
- if (Op.isLiteral()) {
- Vals.push_back(Op.getLiteralValue());
- continue;
- }
- if (Op.getEncoding() != BitCodeAbbrevOp::Array &&
- Op.getEncoding() != BitCodeAbbrevOp::Blob) {
- if (Expected<uint64_t> MaybeVal = readAbbreviatedField(*this, Op))
- Vals.push_back(MaybeVal.get());
- else
- return MaybeVal.takeError();
- continue;
- }
- if (Op.getEncoding() == BitCodeAbbrevOp::Array) {
- // Array case. Read the number of elements as a vbr6.
- Expected<uint32_t> MaybeNumElts = ReadVBR(6);
- if (!MaybeNumElts)
- return MaybeNumElts.takeError();
- uint32_t NumElts = MaybeNumElts.get();
- Vals.reserve(Vals.size() + NumElts);
- // Get the element encoding.
- if (i + 2 != e)
- report_fatal_error("Array op not second to last");
- const BitCodeAbbrevOp &EltEnc = Abbv->getOperandInfo(++i);
- if (!EltEnc.isEncoding())
- report_fatal_error(
- "Array element type has to be an encoding of a type");
- // Read all the elements.
- switch (EltEnc.getEncoding()) {
- default:
- report_fatal_error("Array element type can't be an Array or a Blob");
- case BitCodeAbbrevOp::Fixed:
- for (; NumElts; --NumElts)
- if (Expected<SimpleBitstreamCursor::word_t> MaybeVal =
- Read((unsigned)EltEnc.getEncodingData()))
- Vals.push_back(MaybeVal.get());
- else
- return MaybeVal.takeError();
- break;
- case BitCodeAbbrevOp::VBR:
- for (; NumElts; --NumElts)
- if (Expected<uint64_t> MaybeVal =
- ReadVBR64((unsigned)EltEnc.getEncodingData()))
- Vals.push_back(MaybeVal.get());
- else
- return MaybeVal.takeError();
- break;
- case BitCodeAbbrevOp::Char6:
- for (; NumElts; --NumElts)
- if (Expected<SimpleBitstreamCursor::word_t> MaybeVal = Read(6))
- Vals.push_back(BitCodeAbbrevOp::DecodeChar6(MaybeVal.get()));
- else
- return MaybeVal.takeError();
- }
- continue;
- }
- assert(Op.getEncoding() == BitCodeAbbrevOp::Blob);
- // Blob case. Read the number of bytes as a vbr6.
- Expected<uint32_t> MaybeNumElts = ReadVBR(6);
- if (!MaybeNumElts)
- return MaybeNumElts.takeError();
- uint32_t NumElts = MaybeNumElts.get();
- SkipToFourByteBoundary(); // 32-bit alignment
- // Figure out where the end of this blob will be including tail padding.
- size_t CurBitPos = GetCurrentBitNo();
- const size_t NewEnd = CurBitPos + alignTo(NumElts, 4) * 8;
- // If this would read off the end of the bitcode file, just set the
- // record to empty and return.
- if (!canSkipToPos(NewEnd/8)) {
- Vals.append(NumElts, 0);
- skipToEnd();
- break;
- }
- // Otherwise, inform the streamer that we need these bytes in memory. Skip
- // over tail padding first, in case jumping to NewEnd invalidates the Blob
- // pointer.
- if (Error Err = JumpToBit(NewEnd))
- return std::move(Err);
- const char *Ptr = (const char *)getPointerToBit(CurBitPos, NumElts);
- // If we can return a reference to the data, do so to avoid copying it.
- if (Blob) {
- *Blob = StringRef(Ptr, NumElts);
- } else {
- // Otherwise, unpack into Vals with zero extension.
- auto *UPtr = reinterpret_cast<const unsigned char *>(Ptr);
- Vals.append(UPtr, UPtr + NumElts);
- }
- }
- return Code;
- }
- Error BitstreamCursor::ReadAbbrevRecord() {
- auto Abbv = std::make_shared<BitCodeAbbrev>();
- Expected<uint32_t> MaybeNumOpInfo = ReadVBR(5);
- if (!MaybeNumOpInfo)
- return MaybeNumOpInfo.takeError();
- unsigned NumOpInfo = MaybeNumOpInfo.get();
- for (unsigned i = 0; i != NumOpInfo; ++i) {
- Expected<word_t> MaybeIsLiteral = Read(1);
- if (!MaybeIsLiteral)
- return MaybeIsLiteral.takeError();
- bool IsLiteral = MaybeIsLiteral.get();
- if (IsLiteral) {
- Expected<uint64_t> MaybeOp = ReadVBR64(8);
- if (!MaybeOp)
- return MaybeOp.takeError();
- Abbv->Add(BitCodeAbbrevOp(MaybeOp.get()));
- continue;
- }
- Expected<word_t> MaybeEncoding = Read(3);
- if (!MaybeEncoding)
- return MaybeEncoding.takeError();
- BitCodeAbbrevOp::Encoding E =
- (BitCodeAbbrevOp::Encoding)MaybeEncoding.get();
- if (BitCodeAbbrevOp::hasEncodingData(E)) {
- Expected<uint64_t> MaybeData = ReadVBR64(5);
- if (!MaybeData)
- return MaybeData.takeError();
- uint64_t Data = MaybeData.get();
- // As a special case, handle fixed(0) (i.e., a fixed field with zero bits)
- // and vbr(0) as a literal zero. This is decoded the same way, and avoids
- // a slow path in Read() to have to handle reading zero bits.
- if ((E == BitCodeAbbrevOp::Fixed || E == BitCodeAbbrevOp::VBR) &&
- Data == 0) {
- Abbv->Add(BitCodeAbbrevOp(0));
- continue;
- }
- if ((E == BitCodeAbbrevOp::Fixed || E == BitCodeAbbrevOp::VBR) &&
- Data > MaxChunkSize)
- report_fatal_error(
- "Fixed or VBR abbrev record with size > MaxChunkData");
- Abbv->Add(BitCodeAbbrevOp(E, Data));
- } else
- Abbv->Add(BitCodeAbbrevOp(E));
- }
- if (Abbv->getNumOperandInfos() == 0)
- report_fatal_error("Abbrev record with no operands");
- CurAbbrevs.push_back(std::move(Abbv));
- return Error::success();
- }
- Expected<Optional<BitstreamBlockInfo>>
- BitstreamCursor::ReadBlockInfoBlock(bool ReadBlockInfoNames) {
- if (llvm::Error Err = EnterSubBlock(bitc::BLOCKINFO_BLOCK_ID))
- return std::move(Err);
- BitstreamBlockInfo NewBlockInfo;
- SmallVector<uint64_t, 64> Record;
- BitstreamBlockInfo::BlockInfo *CurBlockInfo = nullptr;
- // Read all the records for this module.
- while (true) {
- Expected<BitstreamEntry> MaybeEntry =
- advanceSkippingSubblocks(AF_DontAutoprocessAbbrevs);
- if (!MaybeEntry)
- return MaybeEntry.takeError();
- BitstreamEntry Entry = MaybeEntry.get();
- switch (Entry.Kind) {
- case llvm::BitstreamEntry::SubBlock: // Handled for us already.
- case llvm::BitstreamEntry::Error:
- return None;
- case llvm::BitstreamEntry::EndBlock:
- return std::move(NewBlockInfo);
- case llvm::BitstreamEntry::Record:
- // The interesting case.
- break;
- }
- // Read abbrev records, associate them with CurBID.
- if (Entry.ID == bitc::DEFINE_ABBREV) {
- if (!CurBlockInfo) return None;
- if (Error Err = ReadAbbrevRecord())
- return std::move(Err);
- // ReadAbbrevRecord installs the abbrev in CurAbbrevs. Move it to the
- // appropriate BlockInfo.
- CurBlockInfo->Abbrevs.push_back(std::move(CurAbbrevs.back()));
- CurAbbrevs.pop_back();
- continue;
- }
- // Read a record.
- Record.clear();
- Expected<unsigned> MaybeBlockInfo = readRecord(Entry.ID, Record);
- if (!MaybeBlockInfo)
- return MaybeBlockInfo.takeError();
- switch (MaybeBlockInfo.get()) {
- default:
- break; // Default behavior, ignore unknown content.
- case bitc::BLOCKINFO_CODE_SETBID:
- if (Record.size() < 1)
- return None;
- CurBlockInfo = &NewBlockInfo.getOrCreateBlockInfo((unsigned)Record[0]);
- break;
- case bitc::BLOCKINFO_CODE_BLOCKNAME: {
- if (!CurBlockInfo)
- return None;
- if (!ReadBlockInfoNames)
- break; // Ignore name.
- CurBlockInfo->Name = std::string(Record.begin(), Record.end());
- break;
- }
- case bitc::BLOCKINFO_CODE_SETRECORDNAME: {
- if (!CurBlockInfo) return None;
- if (!ReadBlockInfoNames)
- break; // Ignore name.
- CurBlockInfo->RecordNames.emplace_back(
- (unsigned)Record[0], std::string(Record.begin() + 1, Record.end()));
- break;
- }
- }
- }
- }
|