//===-- DataExtractor.cpp -------------------------------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "llvm/Support/DataExtractor.h" #include "llvm/Support/Errc.h" #include "llvm/Support/ErrorHandling.h" #include "llvm/Support/Host.h" #include "llvm/Support/LEB128.h" #include "llvm/Support/SwapByteOrder.h" using namespace llvm; bool DataExtractor::prepareRead(uint64_t Offset, uint64_t Size, Error *E) const { if (isValidOffsetForDataOfSize(Offset, Size)) return true; if (E) { if (Offset <= Data.size()) *E = createStringError( errc::illegal_byte_sequence, "unexpected end of data at offset 0x%zx while reading [0x%" PRIx64 ", 0x%" PRIx64 ")", Data.size(), Offset, Offset + Size); else *E = createStringError(errc::invalid_argument, "offset 0x%" PRIx64 " is beyond the end of data at 0x%zx", Offset, Data.size()); } return false; } static bool isError(Error *E) { return E && *E; } template T DataExtractor::getU(uint64_t *offset_ptr, Error *Err) const { ErrorAsOutParameter ErrAsOut(Err); T val = 0; if (isError(Err)) return val; uint64_t offset = *offset_ptr; if (!prepareRead(offset, sizeof(T), Err)) return val; std::memcpy(&val, &Data.data()[offset], sizeof(val)); if (sys::IsLittleEndianHost != IsLittleEndian) sys::swapByteOrder(val); // Advance the offset *offset_ptr += sizeof(val); return val; } template T *DataExtractor::getUs(uint64_t *offset_ptr, T *dst, uint32_t count, Error *Err) const { ErrorAsOutParameter ErrAsOut(Err); if (isError(Err)) return nullptr; uint64_t offset = *offset_ptr; if (!prepareRead(offset, sizeof(*dst) * count, Err)) return nullptr; for (T *value_ptr = dst, *end = dst + count; value_ptr != end; ++value_ptr, offset += sizeof(*dst)) *value_ptr = getU(offset_ptr, Err); // Advance the offset *offset_ptr = offset; // Return a non-NULL pointer to the converted data as an indicator of // success return dst; } uint8_t DataExtractor::getU8(uint64_t *offset_ptr, llvm::Error *Err) const { return getU(offset_ptr, Err); } uint8_t *DataExtractor::getU8(uint64_t *offset_ptr, uint8_t *dst, uint32_t count) const { return getUs(offset_ptr, dst, count, nullptr); } uint8_t *DataExtractor::getU8(Cursor &C, uint8_t *Dst, uint32_t Count) const { return getUs(&C.Offset, Dst, Count, &C.Err); } uint16_t DataExtractor::getU16(uint64_t *offset_ptr, llvm::Error *Err) const { return getU(offset_ptr, Err); } uint16_t *DataExtractor::getU16(uint64_t *offset_ptr, uint16_t *dst, uint32_t count) const { return getUs(offset_ptr, dst, count, nullptr); } uint32_t DataExtractor::getU24(uint64_t *OffsetPtr, Error *Err) const { uint24_t ExtractedVal = getU(OffsetPtr, Err); // The 3 bytes are in the correct byte order for the host. return ExtractedVal.getAsUint32(sys::IsLittleEndianHost); } uint32_t DataExtractor::getU32(uint64_t *offset_ptr, llvm::Error *Err) const { return getU(offset_ptr, Err); } uint32_t *DataExtractor::getU32(uint64_t *offset_ptr, uint32_t *dst, uint32_t count) const { return getUs(offset_ptr, dst, count, nullptr); } uint64_t DataExtractor::getU64(uint64_t *offset_ptr, llvm::Error *Err) const { return getU(offset_ptr, Err); } uint64_t *DataExtractor::getU64(uint64_t *offset_ptr, uint64_t *dst, uint32_t count) const { return getUs(offset_ptr, dst, count, nullptr); } uint64_t DataExtractor::getUnsigned(uint64_t *offset_ptr, uint32_t byte_size, llvm::Error *Err) const { switch (byte_size) { case 1: return getU8(offset_ptr, Err); case 2: return getU16(offset_ptr, Err); case 4: return getU32(offset_ptr, Err); case 8: return getU64(offset_ptr, Err); } llvm_unreachable("getUnsigned unhandled case!"); } int64_t DataExtractor::getSigned(uint64_t *offset_ptr, uint32_t byte_size) const { switch (byte_size) { case 1: return (int8_t)getU8(offset_ptr); case 2: return (int16_t)getU16(offset_ptr); case 4: return (int32_t)getU32(offset_ptr); case 8: return (int64_t)getU64(offset_ptr); } llvm_unreachable("getSigned unhandled case!"); } StringRef DataExtractor::getCStrRef(uint64_t *OffsetPtr, Error *Err) const { ErrorAsOutParameter ErrAsOut(Err); if (isError(Err)) return StringRef(); uint64_t Start = *OffsetPtr; StringRef::size_type Pos = Data.find('\0', Start); if (Pos != StringRef::npos) { *OffsetPtr = Pos + 1; return StringRef(Data.data() + Start, Pos - Start); } if (Err) *Err = createStringError(errc::illegal_byte_sequence, "no null terminated string at offset 0x%" PRIx64, Start); return StringRef(); } StringRef DataExtractor::getFixedLengthString(uint64_t *OffsetPtr, uint64_t Length, StringRef TrimChars) const { StringRef Bytes(getBytes(OffsetPtr, Length)); return Bytes.trim(TrimChars); } StringRef DataExtractor::getBytes(uint64_t *OffsetPtr, uint64_t Length, Error *Err) const { ErrorAsOutParameter ErrAsOut(Err); if (isError(Err)) return StringRef(); if (!prepareRead(*OffsetPtr, Length, Err)) return StringRef(); StringRef Result = Data.substr(*OffsetPtr, Length); *OffsetPtr += Length; return Result; } template static T getLEB128(StringRef Data, uint64_t *OffsetPtr, Error *Err, T (&Decoder)(const uint8_t *p, unsigned *n, const uint8_t *end, const char **error)) { ArrayRef Bytes = arrayRefFromStringRef(Data); assert(*OffsetPtr <= Bytes.size()); ErrorAsOutParameter ErrAsOut(Err); if (isError(Err)) return T(); const char *error; unsigned bytes_read; T result = Decoder(Bytes.data() + *OffsetPtr, &bytes_read, Bytes.end(), &error); if (error) { if (Err) *Err = createStringError(errc::illegal_byte_sequence, "unable to decode LEB128 at offset 0x%8.8" PRIx64 ": %s", *OffsetPtr, error); return T(); } *OffsetPtr += bytes_read; return result; } uint64_t DataExtractor::getULEB128(uint64_t *offset_ptr, Error *Err) const { return getLEB128(Data, offset_ptr, Err, decodeULEB128); } int64_t DataExtractor::getSLEB128(uint64_t *offset_ptr, Error *Err) const { return getLEB128(Data, offset_ptr, Err, decodeSLEB128); } void DataExtractor::skip(Cursor &C, uint64_t Length) const { ErrorAsOutParameter ErrAsOut(&C.Err); if (isError(&C.Err)) return; if (prepareRead(C.Offset, Length, &C.Err)) C.Offset += Length; }