123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235 |
- //===-- DataExtractor.cpp -------------------------------------------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/Support/DataExtractor.h"
- #include "llvm/Support/Errc.h"
- #include "llvm/Support/ErrorHandling.h"
- #include "llvm/Support/LEB128.h"
- #include "llvm/Support/SwapByteOrder.h"
- using namespace llvm;
- bool DataExtractor::prepareRead(uint64_t Offset, uint64_t Size,
- Error *E) const {
- if (isValidOffsetForDataOfSize(Offset, Size))
- return true;
- if (E) {
- if (Offset <= Data.size())
- *E = createStringError(
- errc::illegal_byte_sequence,
- "unexpected end of data at offset 0x%zx while reading [0x%" PRIx64
- ", 0x%" PRIx64 ")",
- Data.size(), Offset, Offset + Size);
- else
- *E = createStringError(errc::invalid_argument,
- "offset 0x%" PRIx64
- " is beyond the end of data at 0x%zx",
- Offset, Data.size());
- }
- return false;
- }
- static bool isError(Error *E) { return E && *E; }
- template <typename T>
- T DataExtractor::getU(uint64_t *offset_ptr, Error *Err) const {
- ErrorAsOutParameter ErrAsOut(Err);
- T val = 0;
- if (isError(Err))
- return val;
- uint64_t offset = *offset_ptr;
- if (!prepareRead(offset, sizeof(T), Err))
- return val;
- std::memcpy(&val, &Data.data()[offset], sizeof(val));
- if (sys::IsLittleEndianHost != IsLittleEndian)
- sys::swapByteOrder(val);
- // Advance the offset
- *offset_ptr += sizeof(val);
- return val;
- }
- template <typename T>
- T *DataExtractor::getUs(uint64_t *offset_ptr, T *dst, uint32_t count,
- Error *Err) const {
- ErrorAsOutParameter ErrAsOut(Err);
- if (isError(Err))
- return nullptr;
- uint64_t offset = *offset_ptr;
- if (!prepareRead(offset, sizeof(*dst) * count, Err))
- return nullptr;
- for (T *value_ptr = dst, *end = dst + count; value_ptr != end;
- ++value_ptr, offset += sizeof(*dst))
- *value_ptr = getU<T>(offset_ptr, Err);
- // Advance the offset
- *offset_ptr = offset;
- // Return a non-NULL pointer to the converted data as an indicator of
- // success
- return dst;
- }
- uint8_t DataExtractor::getU8(uint64_t *offset_ptr, llvm::Error *Err) const {
- return getU<uint8_t>(offset_ptr, Err);
- }
- uint8_t *DataExtractor::getU8(uint64_t *offset_ptr, uint8_t *dst,
- uint32_t count) const {
- return getUs<uint8_t>(offset_ptr, dst, count, nullptr);
- }
- uint8_t *DataExtractor::getU8(Cursor &C, uint8_t *Dst, uint32_t Count) const {
- return getUs<uint8_t>(&C.Offset, Dst, Count, &C.Err);
- }
- uint16_t DataExtractor::getU16(uint64_t *offset_ptr, llvm::Error *Err) const {
- return getU<uint16_t>(offset_ptr, Err);
- }
- uint16_t *DataExtractor::getU16(uint64_t *offset_ptr, uint16_t *dst,
- uint32_t count) const {
- return getUs<uint16_t>(offset_ptr, dst, count, nullptr);
- }
- uint32_t DataExtractor::getU24(uint64_t *OffsetPtr, Error *Err) const {
- uint24_t ExtractedVal = getU<uint24_t>(OffsetPtr, Err);
- // The 3 bytes are in the correct byte order for the host.
- return ExtractedVal.getAsUint32(sys::IsLittleEndianHost);
- }
- uint32_t DataExtractor::getU32(uint64_t *offset_ptr, llvm::Error *Err) const {
- return getU<uint32_t>(offset_ptr, Err);
- }
- uint32_t *DataExtractor::getU32(uint64_t *offset_ptr, uint32_t *dst,
- uint32_t count) const {
- return getUs<uint32_t>(offset_ptr, dst, count, nullptr);
- }
- uint64_t DataExtractor::getU64(uint64_t *offset_ptr, llvm::Error *Err) const {
- return getU<uint64_t>(offset_ptr, Err);
- }
- uint64_t *DataExtractor::getU64(uint64_t *offset_ptr, uint64_t *dst,
- uint32_t count) const {
- return getUs<uint64_t>(offset_ptr, dst, count, nullptr);
- }
- uint64_t DataExtractor::getUnsigned(uint64_t *offset_ptr, uint32_t byte_size,
- llvm::Error *Err) const {
- switch (byte_size) {
- case 1:
- return getU8(offset_ptr, Err);
- case 2:
- return getU16(offset_ptr, Err);
- case 4:
- return getU32(offset_ptr, Err);
- case 8:
- return getU64(offset_ptr, Err);
- }
- llvm_unreachable("getUnsigned unhandled case!");
- }
- int64_t
- DataExtractor::getSigned(uint64_t *offset_ptr, uint32_t byte_size) const {
- switch (byte_size) {
- case 1:
- return (int8_t)getU8(offset_ptr);
- case 2:
- return (int16_t)getU16(offset_ptr);
- case 4:
- return (int32_t)getU32(offset_ptr);
- case 8:
- return (int64_t)getU64(offset_ptr);
- }
- llvm_unreachable("getSigned unhandled case!");
- }
- StringRef DataExtractor::getCStrRef(uint64_t *OffsetPtr, Error *Err) const {
- ErrorAsOutParameter ErrAsOut(Err);
- if (isError(Err))
- return StringRef();
- uint64_t Start = *OffsetPtr;
- StringRef::size_type Pos = Data.find('\0', Start);
- if (Pos != StringRef::npos) {
- *OffsetPtr = Pos + 1;
- return StringRef(Data.data() + Start, Pos - Start);
- }
- if (Err)
- *Err = createStringError(errc::illegal_byte_sequence,
- "no null terminated string at offset 0x%" PRIx64,
- Start);
- return StringRef();
- }
- StringRef DataExtractor::getFixedLengthString(uint64_t *OffsetPtr,
- uint64_t Length,
- StringRef TrimChars) const {
- StringRef Bytes(getBytes(OffsetPtr, Length));
- return Bytes.trim(TrimChars);
- }
- StringRef DataExtractor::getBytes(uint64_t *OffsetPtr, uint64_t Length,
- Error *Err) const {
- ErrorAsOutParameter ErrAsOut(Err);
- if (isError(Err))
- return StringRef();
- if (!prepareRead(*OffsetPtr, Length, Err))
- return StringRef();
- StringRef Result = Data.substr(*OffsetPtr, Length);
- *OffsetPtr += Length;
- return Result;
- }
- template <typename T>
- static T getLEB128(StringRef Data, uint64_t *OffsetPtr, Error *Err,
- T (&Decoder)(const uint8_t *p, unsigned *n,
- const uint8_t *end, const char **error)) {
- ArrayRef<uint8_t> Bytes = arrayRefFromStringRef(Data);
- assert(*OffsetPtr <= Bytes.size());
- ErrorAsOutParameter ErrAsOut(Err);
- if (isError(Err))
- return T();
- const char *error;
- unsigned bytes_read;
- T result =
- Decoder(Bytes.data() + *OffsetPtr, &bytes_read, Bytes.end(), &error);
- if (error) {
- if (Err)
- *Err = createStringError(errc::illegal_byte_sequence,
- "unable to decode LEB128 at offset 0x%8.8" PRIx64
- ": %s",
- *OffsetPtr, error);
- return T();
- }
- *OffsetPtr += bytes_read;
- return result;
- }
- uint64_t DataExtractor::getULEB128(uint64_t *offset_ptr, Error *Err) const {
- return getLEB128(Data, offset_ptr, Err, decodeULEB128);
- }
- int64_t DataExtractor::getSLEB128(uint64_t *offset_ptr, Error *Err) const {
- return getLEB128(Data, offset_ptr, Err, decodeSLEB128);
- }
- void DataExtractor::skip(Cursor &C, uint64_t Length) const {
- ErrorAsOutParameter ErrAsOut(&C.Err);
- if (isError(&C.Err))
- return;
- if (prepareRead(C.Offset, Length, &C.Err))
- C.Offset += Length;
- }
|