237 lines
7.2 KiB
C++
237 lines
7.2 KiB
C++
|
//===-- DataExtractor.cpp -------------------------------------------------===//
|
||
|
//
|
||
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||
|
// See https://llvm.org/LICENSE.txt for license information.
|
||
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||
|
//
|
||
|
//===----------------------------------------------------------------------===//
|
||
|
|
||
|
#include "llvm/Support/DataExtractor.h"
|
||
|
#include "llvm/Support/Errc.h"
|
||
|
#include "llvm/Support/ErrorHandling.h"
|
||
|
#include "llvm/Support/Host.h"
|
||
|
#include "llvm/Support/LEB128.h"
|
||
|
#include "llvm/Support/SwapByteOrder.h"
|
||
|
|
||
|
using namespace llvm;
|
||
|
|
||
|
bool DataExtractor::prepareRead(uint64_t Offset, uint64_t Size,
|
||
|
Error *E) const {
|
||
|
if (isValidOffsetForDataOfSize(Offset, Size))
|
||
|
return true;
|
||
|
if (E) {
|
||
|
if (Offset <= Data.size())
|
||
|
*E = createStringError(
|
||
|
errc::illegal_byte_sequence,
|
||
|
"unexpected end of data at offset 0x%zx while reading [0x%" PRIx64
|
||
|
", 0x%" PRIx64 ")",
|
||
|
Data.size(), Offset, Offset + Size);
|
||
|
else
|
||
|
*E = createStringError(errc::invalid_argument,
|
||
|
"offset 0x%" PRIx64
|
||
|
" is beyond the end of data at 0x%zx",
|
||
|
Offset, Data.size());
|
||
|
}
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
static bool isError(Error *E) { return E && *E; }
|
||
|
|
||
|
template <typename T>
|
||
|
T DataExtractor::getU(uint64_t *offset_ptr, Error *Err) const {
|
||
|
ErrorAsOutParameter ErrAsOut(Err);
|
||
|
T val = 0;
|
||
|
if (isError(Err))
|
||
|
return val;
|
||
|
|
||
|
uint64_t offset = *offset_ptr;
|
||
|
if (!prepareRead(offset, sizeof(T), Err))
|
||
|
return val;
|
||
|
std::memcpy(&val, &Data.data()[offset], sizeof(val));
|
||
|
if (sys::IsLittleEndianHost != IsLittleEndian)
|
||
|
sys::swapByteOrder(val);
|
||
|
|
||
|
// Advance the offset
|
||
|
*offset_ptr += sizeof(val);
|
||
|
return val;
|
||
|
}
|
||
|
|
||
|
template <typename T>
|
||
|
T *DataExtractor::getUs(uint64_t *offset_ptr, T *dst, uint32_t count,
|
||
|
Error *Err) const {
|
||
|
ErrorAsOutParameter ErrAsOut(Err);
|
||
|
if (isError(Err))
|
||
|
return nullptr;
|
||
|
|
||
|
uint64_t offset = *offset_ptr;
|
||
|
|
||
|
if (!prepareRead(offset, sizeof(*dst) * count, Err))
|
||
|
return nullptr;
|
||
|
for (T *value_ptr = dst, *end = dst + count; value_ptr != end;
|
||
|
++value_ptr, offset += sizeof(*dst))
|
||
|
*value_ptr = getU<T>(offset_ptr, Err);
|
||
|
// Advance the offset
|
||
|
*offset_ptr = offset;
|
||
|
// Return a non-NULL pointer to the converted data as an indicator of
|
||
|
// success
|
||
|
return dst;
|
||
|
}
|
||
|
|
||
|
uint8_t DataExtractor::getU8(uint64_t *offset_ptr, llvm::Error *Err) const {
|
||
|
return getU<uint8_t>(offset_ptr, Err);
|
||
|
}
|
||
|
|
||
|
uint8_t *DataExtractor::getU8(uint64_t *offset_ptr, uint8_t *dst,
|
||
|
uint32_t count) const {
|
||
|
return getUs<uint8_t>(offset_ptr, dst, count, nullptr);
|
||
|
}
|
||
|
|
||
|
uint8_t *DataExtractor::getU8(Cursor &C, uint8_t *Dst, uint32_t Count) const {
|
||
|
return getUs<uint8_t>(&C.Offset, Dst, Count, &C.Err);
|
||
|
}
|
||
|
|
||
|
uint16_t DataExtractor::getU16(uint64_t *offset_ptr, llvm::Error *Err) const {
|
||
|
return getU<uint16_t>(offset_ptr, Err);
|
||
|
}
|
||
|
|
||
|
uint16_t *DataExtractor::getU16(uint64_t *offset_ptr, uint16_t *dst,
|
||
|
uint32_t count) const {
|
||
|
return getUs<uint16_t>(offset_ptr, dst, count, nullptr);
|
||
|
}
|
||
|
|
||
|
uint32_t DataExtractor::getU24(uint64_t *OffsetPtr, Error *Err) const {
|
||
|
uint24_t ExtractedVal = getU<uint24_t>(OffsetPtr, Err);
|
||
|
// The 3 bytes are in the correct byte order for the host.
|
||
|
return ExtractedVal.getAsUint32(sys::IsLittleEndianHost);
|
||
|
}
|
||
|
|
||
|
uint32_t DataExtractor::getU32(uint64_t *offset_ptr, llvm::Error *Err) const {
|
||
|
return getU<uint32_t>(offset_ptr, Err);
|
||
|
}
|
||
|
|
||
|
uint32_t *DataExtractor::getU32(uint64_t *offset_ptr, uint32_t *dst,
|
||
|
uint32_t count) const {
|
||
|
return getUs<uint32_t>(offset_ptr, dst, count, nullptr);
|
||
|
}
|
||
|
|
||
|
uint64_t DataExtractor::getU64(uint64_t *offset_ptr, llvm::Error *Err) const {
|
||
|
return getU<uint64_t>(offset_ptr, Err);
|
||
|
}
|
||
|
|
||
|
uint64_t *DataExtractor::getU64(uint64_t *offset_ptr, uint64_t *dst,
|
||
|
uint32_t count) const {
|
||
|
return getUs<uint64_t>(offset_ptr, dst, count, nullptr);
|
||
|
}
|
||
|
|
||
|
uint64_t DataExtractor::getUnsigned(uint64_t *offset_ptr, uint32_t byte_size,
|
||
|
llvm::Error *Err) const {
|
||
|
switch (byte_size) {
|
||
|
case 1:
|
||
|
return getU8(offset_ptr, Err);
|
||
|
case 2:
|
||
|
return getU16(offset_ptr, Err);
|
||
|
case 4:
|
||
|
return getU32(offset_ptr, Err);
|
||
|
case 8:
|
||
|
return getU64(offset_ptr, Err);
|
||
|
}
|
||
|
llvm_unreachable("getUnsigned unhandled case!");
|
||
|
}
|
||
|
|
||
|
int64_t
|
||
|
DataExtractor::getSigned(uint64_t *offset_ptr, uint32_t byte_size) const {
|
||
|
switch (byte_size) {
|
||
|
case 1:
|
||
|
return (int8_t)getU8(offset_ptr);
|
||
|
case 2:
|
||
|
return (int16_t)getU16(offset_ptr);
|
||
|
case 4:
|
||
|
return (int32_t)getU32(offset_ptr);
|
||
|
case 8:
|
||
|
return (int64_t)getU64(offset_ptr);
|
||
|
}
|
||
|
llvm_unreachable("getSigned unhandled case!");
|
||
|
}
|
||
|
|
||
|
StringRef DataExtractor::getCStrRef(uint64_t *OffsetPtr, Error *Err) const {
|
||
|
ErrorAsOutParameter ErrAsOut(Err);
|
||
|
if (isError(Err))
|
||
|
return StringRef();
|
||
|
|
||
|
uint64_t Start = *OffsetPtr;
|
||
|
StringRef::size_type Pos = Data.find('\0', Start);
|
||
|
if (Pos != StringRef::npos) {
|
||
|
*OffsetPtr = Pos + 1;
|
||
|
return StringRef(Data.data() + Start, Pos - Start);
|
||
|
}
|
||
|
if (Err)
|
||
|
*Err = createStringError(errc::illegal_byte_sequence,
|
||
|
"no null terminated string at offset 0x%" PRIx64,
|
||
|
Start);
|
||
|
return StringRef();
|
||
|
}
|
||
|
|
||
|
StringRef DataExtractor::getFixedLengthString(uint64_t *OffsetPtr,
|
||
|
uint64_t Length,
|
||
|
StringRef TrimChars) const {
|
||
|
StringRef Bytes(getBytes(OffsetPtr, Length));
|
||
|
return Bytes.trim(TrimChars);
|
||
|
}
|
||
|
|
||
|
StringRef DataExtractor::getBytes(uint64_t *OffsetPtr, uint64_t Length,
|
||
|
Error *Err) const {
|
||
|
ErrorAsOutParameter ErrAsOut(Err);
|
||
|
if (isError(Err))
|
||
|
return StringRef();
|
||
|
|
||
|
if (!prepareRead(*OffsetPtr, Length, Err))
|
||
|
return StringRef();
|
||
|
|
||
|
StringRef Result = Data.substr(*OffsetPtr, Length);
|
||
|
*OffsetPtr += Length;
|
||
|
return Result;
|
||
|
}
|
||
|
|
||
|
template <typename T>
|
||
|
static T getLEB128(StringRef Data, uint64_t *OffsetPtr, Error *Err,
|
||
|
T (&Decoder)(const uint8_t *p, unsigned *n,
|
||
|
const uint8_t *end, const char **error)) {
|
||
|
ArrayRef<uint8_t> Bytes = arrayRefFromStringRef(Data);
|
||
|
assert(*OffsetPtr <= Bytes.size());
|
||
|
ErrorAsOutParameter ErrAsOut(Err);
|
||
|
if (isError(Err))
|
||
|
return T();
|
||
|
|
||
|
const char *error;
|
||
|
unsigned bytes_read;
|
||
|
T result =
|
||
|
Decoder(Bytes.data() + *OffsetPtr, &bytes_read, Bytes.end(), &error);
|
||
|
if (error) {
|
||
|
if (Err)
|
||
|
*Err = createStringError(errc::illegal_byte_sequence,
|
||
|
"unable to decode LEB128 at offset 0x%8.8" PRIx64
|
||
|
": %s",
|
||
|
*OffsetPtr, error);
|
||
|
return T();
|
||
|
}
|
||
|
*OffsetPtr += bytes_read;
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
uint64_t DataExtractor::getULEB128(uint64_t *offset_ptr, Error *Err) const {
|
||
|
return getLEB128(Data, offset_ptr, Err, decodeULEB128);
|
||
|
}
|
||
|
|
||
|
int64_t DataExtractor::getSLEB128(uint64_t *offset_ptr, Error *Err) const {
|
||
|
return getLEB128(Data, offset_ptr, Err, decodeSLEB128);
|
||
|
}
|
||
|
|
||
|
void DataExtractor::skip(Cursor &C, uint64_t Length) const {
|
||
|
ErrorAsOutParameter ErrAsOut(&C.Err);
|
||
|
if (isError(&C.Err))
|
||
|
return;
|
||
|
|
||
|
if (prepareRead(C.Offset, Length, &C.Err))
|
||
|
C.Offset += Length;
|
||
|
}
|