diff options
Diffstat (limited to 'llvm/lib/Support/DataExtractor.cpp')
-rw-r--r-- | llvm/lib/Support/DataExtractor.cpp | 164 |
1 files changed, 91 insertions, 73 deletions
diff --git a/llvm/lib/Support/DataExtractor.cpp b/llvm/lib/Support/DataExtractor.cpp index a98297cdb35f2..133d674275e8c 100644 --- a/llvm/lib/Support/DataExtractor.cpp +++ b/llvm/lib/Support/DataExtractor.cpp @@ -15,29 +15,40 @@ using namespace llvm; -static void unexpectedEndReached(Error *E) { - if (E) - *E = createStringError(errc::illegal_byte_sequence, - "unexpected end of data"); +bool DataExtractor::prepareRead(uint64_t Offset, uint64_t Size, + Error *E) const { + if (isValidOffsetForDataOfSize(Offset, Size)) + return true; + if (E) { + if (Offset <= Data.size()) + *E = createStringError( + errc::illegal_byte_sequence, + "unexpected end of data at offset 0x%zx while reading [0x%" PRIx64 + ", 0x%" PRIx64 ")", + Data.size(), Offset, Offset + Size); + else + *E = createStringError(errc::invalid_argument, + "offset 0x%" PRIx64 + " is beyond the end of data at 0x%zx", + Offset, Data.size()); + } + return false; } static bool isError(Error *E) { return E && *E; } template <typename T> -static T getU(uint64_t *offset_ptr, const DataExtractor *de, - bool isLittleEndian, const char *Data, llvm::Error *Err) { +T DataExtractor::getU(uint64_t *offset_ptr, Error *Err) const { ErrorAsOutParameter ErrAsOut(Err); T val = 0; if (isError(Err)) return val; uint64_t offset = *offset_ptr; - if (!de->isValidOffsetForDataOfSize(offset, sizeof(T))) { - unexpectedEndReached(Err); + if (!prepareRead(offset, sizeof(T), Err)) return val; - } - std::memcpy(&val, &Data[offset], sizeof(val)); - if (sys::IsLittleEndianHost != isLittleEndian) + std::memcpy(&val, &Data.data()[offset], sizeof(val)); + if (sys::IsLittleEndianHost != IsLittleEndian) sys::swapByteOrder(val); // Advance the offset @@ -46,22 +57,19 @@ static T getU(uint64_t *offset_ptr, const DataExtractor *de, } template <typename T> -static T *getUs(uint64_t *offset_ptr, T *dst, uint32_t count, - const DataExtractor *de, bool isLittleEndian, const char *Data, - llvm::Error *Err) { +T *DataExtractor::getUs(uint64_t *offset_ptr, T *dst, uint32_t count, + Error *Err) const { ErrorAsOutParameter ErrAsOut(Err); if (isError(Err)) return nullptr; uint64_t offset = *offset_ptr; - if (!de->isValidOffsetForDataOfSize(offset, sizeof(*dst) * count)) { - unexpectedEndReached(Err); + if (!prepareRead(offset, sizeof(*dst) * count, Err)) return nullptr; - } for (T *value_ptr = dst, *end = dst + count; value_ptr != end; ++value_ptr, offset += sizeof(*dst)) - *value_ptr = getU<T>(offset_ptr, de, isLittleEndian, Data, Err); + *value_ptr = getU<T>(offset_ptr, Err); // Advance the offset *offset_ptr = offset; // Return a non-NULL pointer to the converted data as an indicator of @@ -70,55 +78,49 @@ static T *getUs(uint64_t *offset_ptr, T *dst, uint32_t count, } uint8_t DataExtractor::getU8(uint64_t *offset_ptr, llvm::Error *Err) const { - return getU<uint8_t>(offset_ptr, this, IsLittleEndian, Data.data(), Err); + return getU<uint8_t>(offset_ptr, Err); } -uint8_t * -DataExtractor::getU8(uint64_t *offset_ptr, uint8_t *dst, uint32_t count) const { - return getUs<uint8_t>(offset_ptr, dst, count, this, IsLittleEndian, - Data.data(), nullptr); +uint8_t *DataExtractor::getU8(uint64_t *offset_ptr, uint8_t *dst, + uint32_t count) const { + return getUs<uint8_t>(offset_ptr, dst, count, nullptr); } uint8_t *DataExtractor::getU8(Cursor &C, uint8_t *Dst, uint32_t Count) const { - return getUs<uint8_t>(&C.Offset, Dst, Count, this, IsLittleEndian, - Data.data(), &C.Err); + return getUs<uint8_t>(&C.Offset, Dst, Count, &C.Err); } uint16_t DataExtractor::getU16(uint64_t *offset_ptr, llvm::Error *Err) const { - return getU<uint16_t>(offset_ptr, this, IsLittleEndian, Data.data(), Err); + return getU<uint16_t>(offset_ptr, Err); } uint16_t *DataExtractor::getU16(uint64_t *offset_ptr, uint16_t *dst, uint32_t count) const { - return getUs<uint16_t>(offset_ptr, dst, count, this, IsLittleEndian, - Data.data(), nullptr); + return getUs<uint16_t>(offset_ptr, dst, count, nullptr); } -uint32_t DataExtractor::getU24(uint64_t *offset_ptr) const { - uint24_t ExtractedVal = - getU<uint24_t>(offset_ptr, this, IsLittleEndian, Data.data(), nullptr); +uint32_t DataExtractor::getU24(uint64_t *OffsetPtr, Error *Err) const { + uint24_t ExtractedVal = getU<uint24_t>(OffsetPtr, Err); // The 3 bytes are in the correct byte order for the host. return ExtractedVal.getAsUint32(sys::IsLittleEndianHost); } uint32_t DataExtractor::getU32(uint64_t *offset_ptr, llvm::Error *Err) const { - return getU<uint32_t>(offset_ptr, this, IsLittleEndian, Data.data(), Err); + return getU<uint32_t>(offset_ptr, Err); } uint32_t *DataExtractor::getU32(uint64_t *offset_ptr, uint32_t *dst, uint32_t count) const { - return getUs<uint32_t>(offset_ptr, dst, count, this, IsLittleEndian, - Data.data(), nullptr); + return getUs<uint32_t>(offset_ptr, dst, count, nullptr); } uint64_t DataExtractor::getU64(uint64_t *offset_ptr, llvm::Error *Err) const { - return getU<uint64_t>(offset_ptr, this, IsLittleEndian, Data.data(), Err); + return getU<uint64_t>(offset_ptr, Err); } uint64_t *DataExtractor::getU64(uint64_t *offset_ptr, uint64_t *dst, uint32_t count) const { - return getUs<uint64_t>(offset_ptr, dst, count, this, IsLittleEndian, - Data.data(), nullptr); + return getUs<uint64_t>(offset_ptr, dst, count, nullptr); } uint64_t DataExtractor::getUnsigned(uint64_t *offset_ptr, uint32_t byte_size, @@ -151,59 +153,77 @@ DataExtractor::getSigned(uint64_t *offset_ptr, uint32_t byte_size) const { llvm_unreachable("getSigned unhandled case!"); } -const char *DataExtractor::getCStr(uint64_t *offset_ptr) const { - uint64_t offset = *offset_ptr; - StringRef::size_type pos = Data.find('\0', offset); - if (pos != StringRef::npos) { - *offset_ptr = pos + 1; - return Data.data() + offset; - } - return nullptr; -} +StringRef DataExtractor::getCStrRef(uint64_t *OffsetPtr, Error *Err) const { + ErrorAsOutParameter ErrAsOut(Err); + if (isError(Err)) + return StringRef(); -StringRef DataExtractor::getCStrRef(uint64_t *offset_ptr) const { - uint64_t Start = *offset_ptr; + uint64_t Start = *OffsetPtr; StringRef::size_type Pos = Data.find('\0', Start); if (Pos != StringRef::npos) { - *offset_ptr = Pos + 1; + *OffsetPtr = Pos + 1; return StringRef(Data.data() + Start, Pos - Start); } + if (Err) + *Err = createStringError(errc::illegal_byte_sequence, + "no null terminated string at offset 0x%" PRIx64, + Start); return StringRef(); } -uint64_t DataExtractor::getULEB128(uint64_t *offset_ptr, - llvm::Error *Err) const { - assert(*offset_ptr <= Data.size()); +StringRef DataExtractor::getFixedLengthString(uint64_t *OffsetPtr, + uint64_t Length, + StringRef TrimChars) const { + StringRef Bytes(getBytes(OffsetPtr, Length)); + return Bytes.trim(TrimChars); +} + +StringRef DataExtractor::getBytes(uint64_t *OffsetPtr, uint64_t Length, + Error *Err) const { ErrorAsOutParameter ErrAsOut(Err); if (isError(Err)) - return 0; + return StringRef(); + + if (!prepareRead(*OffsetPtr, Length, Err)) + return StringRef(); + + StringRef Result = Data.substr(*OffsetPtr, Length); + *OffsetPtr += Length; + return Result; +} + +template <typename T> +static T getLEB128(StringRef Data, uint64_t *OffsetPtr, Error *Err, + T (&Decoder)(const uint8_t *p, unsigned *n, + const uint8_t *end, const char **error)) { + ArrayRef<uint8_t> Bytes = arrayRefFromStringRef(Data); + assert(*OffsetPtr <= Bytes.size()); + ErrorAsOutParameter ErrAsOut(Err); + if (isError(Err)) + return T(); const char *error; unsigned bytes_read; - uint64_t result = decodeULEB128( - reinterpret_cast<const uint8_t *>(Data.data() + *offset_ptr), &bytes_read, - reinterpret_cast<const uint8_t *>(Data.data() + Data.size()), &error); + T result = + Decoder(Bytes.data() + *OffsetPtr, &bytes_read, Bytes.end(), &error); if (error) { if (Err) - *Err = createStringError(errc::illegal_byte_sequence, error); - return 0; + *Err = createStringError(errc::illegal_byte_sequence, + "unable to decode LEB128 at offset 0x%8.8" PRIx64 + ": %s", + *OffsetPtr, error); + return T(); } - *offset_ptr += bytes_read; + *OffsetPtr += bytes_read; return result; } -int64_t DataExtractor::getSLEB128(uint64_t *offset_ptr) const { - assert(*offset_ptr <= Data.size()); +uint64_t DataExtractor::getULEB128(uint64_t *offset_ptr, Error *Err) const { + return getLEB128(Data, offset_ptr, Err, decodeULEB128); +} - const char *error; - unsigned bytes_read; - int64_t result = decodeSLEB128( - reinterpret_cast<const uint8_t *>(Data.data() + *offset_ptr), &bytes_read, - reinterpret_cast<const uint8_t *>(Data.data() + Data.size()), &error); - if (error) - return 0; - *offset_ptr += bytes_read; - return result; +int64_t DataExtractor::getSLEB128(uint64_t *offset_ptr, Error *Err) const { + return getLEB128(Data, offset_ptr, Err, decodeSLEB128); } void DataExtractor::skip(Cursor &C, uint64_t Length) const { @@ -211,8 +231,6 @@ void DataExtractor::skip(Cursor &C, uint64_t Length) const { if (isError(&C.Err)) return; - if (isValidOffsetForDataOfSize(C.Offset, Length)) + if (prepareRead(C.Offset, Length, &C.Err)) C.Offset += Length; - else - unexpectedEndReached(&C.Err); } |