236 lines
		
	
	
		
			7.2 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			236 lines
		
	
	
		
			7.2 KiB
		
	
	
	
		
			C++
		
	
	
	
//===-- DataExtractor.cpp -------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
 | |
| 
 | |
| #include "llvm/Support/DataExtractor.h"
 | |
| #include "llvm/Support/Errc.h"
 | |
| #include "llvm/Support/ErrorHandling.h"
 | |
| #include "llvm/Support/LEB128.h"
 | |
| #include "llvm/Support/SwapByteOrder.h"
 | |
| 
 | |
| using namespace llvm;
 | |
| 
 | |
| bool DataExtractor::prepareRead(uint64_t Offset, uint64_t Size,
 | |
|                                 Error *E) const {
 | |
|   if (isValidOffsetForDataOfSize(Offset, Size))
 | |
|     return true;
 | |
|   if (E) {
 | |
|     if (Offset <= Data.size())
 | |
|       *E = createStringError(
 | |
|           errc::illegal_byte_sequence,
 | |
|           "unexpected end of data at offset 0x%zx while reading [0x%" PRIx64
 | |
|           ", 0x%" PRIx64 ")",
 | |
|           Data.size(), Offset, Offset + Size);
 | |
|     else
 | |
|       *E = createStringError(errc::invalid_argument,
 | |
|                              "offset 0x%" PRIx64
 | |
|                              " is beyond the end of data at 0x%zx",
 | |
|                              Offset, Data.size());
 | |
|   }
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| static bool isError(Error *E) { return E && *E; }
 | |
| 
 | |
| template <typename T>
 | |
| T DataExtractor::getU(uint64_t *offset_ptr, Error *Err) const {
 | |
|   ErrorAsOutParameter ErrAsOut(Err);
 | |
|   T val = 0;
 | |
|   if (isError(Err))
 | |
|     return val;
 | |
| 
 | |
|   uint64_t offset = *offset_ptr;
 | |
|   if (!prepareRead(offset, sizeof(T), Err))
 | |
|     return val;
 | |
|   std::memcpy(&val, &Data.data()[offset], sizeof(val));
 | |
|   if (sys::IsLittleEndianHost != IsLittleEndian)
 | |
|     sys::swapByteOrder(val);
 | |
| 
 | |
|   // Advance the offset
 | |
|   *offset_ptr += sizeof(val);
 | |
|   return val;
 | |
| }
 | |
| 
 | |
| template <typename T>
 | |
| T *DataExtractor::getUs(uint64_t *offset_ptr, T *dst, uint32_t count,
 | |
|                         Error *Err) const {
 | |
|   ErrorAsOutParameter ErrAsOut(Err);
 | |
|   if (isError(Err))
 | |
|     return nullptr;
 | |
| 
 | |
|   uint64_t offset = *offset_ptr;
 | |
| 
 | |
|   if (!prepareRead(offset, sizeof(*dst) * count, Err))
 | |
|     return nullptr;
 | |
|   for (T *value_ptr = dst, *end = dst + count; value_ptr != end;
 | |
|        ++value_ptr, offset += sizeof(*dst))
 | |
|     *value_ptr = getU<T>(offset_ptr, Err);
 | |
|   // Advance the offset
 | |
|   *offset_ptr = offset;
 | |
|   // Return a non-NULL pointer to the converted data as an indicator of
 | |
|   // success
 | |
|   return dst;
 | |
| }
 | |
| 
 | |
| uint8_t DataExtractor::getU8(uint64_t *offset_ptr, llvm::Error *Err) const {
 | |
|   return getU<uint8_t>(offset_ptr, Err);
 | |
| }
 | |
| 
 | |
| uint8_t *DataExtractor::getU8(uint64_t *offset_ptr, uint8_t *dst,
 | |
|                               uint32_t count) const {
 | |
|   return getUs<uint8_t>(offset_ptr, dst, count, nullptr);
 | |
| }
 | |
| 
 | |
| uint8_t *DataExtractor::getU8(Cursor &C, uint8_t *Dst, uint32_t Count) const {
 | |
|   return getUs<uint8_t>(&C.Offset, Dst, Count, &C.Err);
 | |
| }
 | |
| 
 | |
| uint16_t DataExtractor::getU16(uint64_t *offset_ptr, llvm::Error *Err) const {
 | |
|   return getU<uint16_t>(offset_ptr, Err);
 | |
| }
 | |
| 
 | |
| uint16_t *DataExtractor::getU16(uint64_t *offset_ptr, uint16_t *dst,
 | |
|                                 uint32_t count) const {
 | |
|   return getUs<uint16_t>(offset_ptr, dst, count, nullptr);
 | |
| }
 | |
| 
 | |
| uint32_t DataExtractor::getU24(uint64_t *OffsetPtr, Error *Err) const {
 | |
|   uint24_t ExtractedVal = getU<uint24_t>(OffsetPtr, Err);
 | |
|   // The 3 bytes are in the correct byte order for the host.
 | |
|   return ExtractedVal.getAsUint32(sys::IsLittleEndianHost);
 | |
| }
 | |
| 
 | |
| uint32_t DataExtractor::getU32(uint64_t *offset_ptr, llvm::Error *Err) const {
 | |
|   return getU<uint32_t>(offset_ptr, Err);
 | |
| }
 | |
| 
 | |
| uint32_t *DataExtractor::getU32(uint64_t *offset_ptr, uint32_t *dst,
 | |
|                                 uint32_t count) const {
 | |
|   return getUs<uint32_t>(offset_ptr, dst, count, nullptr);
 | |
| }
 | |
| 
 | |
| uint64_t DataExtractor::getU64(uint64_t *offset_ptr, llvm::Error *Err) const {
 | |
|   return getU<uint64_t>(offset_ptr, Err);
 | |
| }
 | |
| 
 | |
| uint64_t *DataExtractor::getU64(uint64_t *offset_ptr, uint64_t *dst,
 | |
|                                 uint32_t count) const {
 | |
|   return getUs<uint64_t>(offset_ptr, dst, count, nullptr);
 | |
| }
 | |
| 
 | |
| uint64_t DataExtractor::getUnsigned(uint64_t *offset_ptr, uint32_t byte_size,
 | |
|                                     llvm::Error *Err) const {
 | |
|   switch (byte_size) {
 | |
|   case 1:
 | |
|     return getU8(offset_ptr, Err);
 | |
|   case 2:
 | |
|     return getU16(offset_ptr, Err);
 | |
|   case 4:
 | |
|     return getU32(offset_ptr, Err);
 | |
|   case 8:
 | |
|     return getU64(offset_ptr, Err);
 | |
|   }
 | |
|   llvm_unreachable("getUnsigned unhandled case!");
 | |
| }
 | |
| 
 | |
| int64_t
 | |
| DataExtractor::getSigned(uint64_t *offset_ptr, uint32_t byte_size) const {
 | |
|   switch (byte_size) {
 | |
|   case 1:
 | |
|     return (int8_t)getU8(offset_ptr);
 | |
|   case 2:
 | |
|     return (int16_t)getU16(offset_ptr);
 | |
|   case 4:
 | |
|     return (int32_t)getU32(offset_ptr);
 | |
|   case 8:
 | |
|     return (int64_t)getU64(offset_ptr);
 | |
|   }
 | |
|   llvm_unreachable("getSigned unhandled case!");
 | |
| }
 | |
| 
 | |
| StringRef DataExtractor::getCStrRef(uint64_t *OffsetPtr, Error *Err) const {
 | |
|   ErrorAsOutParameter ErrAsOut(Err);
 | |
|   if (isError(Err))
 | |
|     return StringRef();
 | |
| 
 | |
|   uint64_t Start = *OffsetPtr;
 | |
|   StringRef::size_type Pos = Data.find('\0', Start);
 | |
|   if (Pos != StringRef::npos) {
 | |
|     *OffsetPtr = Pos + 1;
 | |
|     return StringRef(Data.data() + Start, Pos - Start);
 | |
|   }
 | |
|   if (Err)
 | |
|     *Err = createStringError(errc::illegal_byte_sequence,
 | |
|                              "no null terminated string at offset 0x%" PRIx64,
 | |
|                              Start);
 | |
|   return StringRef();
 | |
| }
 | |
| 
 | |
| StringRef DataExtractor::getFixedLengthString(uint64_t *OffsetPtr,
 | |
|                                               uint64_t Length,
 | |
|                                               StringRef TrimChars) const {
 | |
|   StringRef Bytes(getBytes(OffsetPtr, Length));
 | |
|   return Bytes.trim(TrimChars);
 | |
| }
 | |
| 
 | |
| StringRef DataExtractor::getBytes(uint64_t *OffsetPtr, uint64_t Length,
 | |
|                                   Error *Err) const {
 | |
|   ErrorAsOutParameter ErrAsOut(Err);
 | |
|   if (isError(Err))
 | |
|     return StringRef();
 | |
| 
 | |
|   if (!prepareRead(*OffsetPtr, Length, Err))
 | |
|     return StringRef();
 | |
| 
 | |
|   StringRef Result = Data.substr(*OffsetPtr, Length);
 | |
|   *OffsetPtr += Length;
 | |
|   return Result;
 | |
| }
 | |
| 
 | |
| template <typename T>
 | |
| static T getLEB128(StringRef Data, uint64_t *OffsetPtr, Error *Err,
 | |
|                    T (&Decoder)(const uint8_t *p, unsigned *n,
 | |
|                                 const uint8_t *end, const char **error)) {
 | |
|   ArrayRef<uint8_t> Bytes = arrayRefFromStringRef(Data);
 | |
|   assert(*OffsetPtr <= Bytes.size());
 | |
|   ErrorAsOutParameter ErrAsOut(Err);
 | |
|   if (isError(Err))
 | |
|     return T();
 | |
| 
 | |
|   const char *error;
 | |
|   unsigned bytes_read;
 | |
|   T result =
 | |
|       Decoder(Bytes.data() + *OffsetPtr, &bytes_read, Bytes.end(), &error);
 | |
|   if (error) {
 | |
|     if (Err)
 | |
|       *Err = createStringError(errc::illegal_byte_sequence,
 | |
|                                "unable to decode LEB128 at offset 0x%8.8" PRIx64
 | |
|                                ": %s",
 | |
|                                *OffsetPtr, error);
 | |
|     return T();
 | |
|   }
 | |
|   *OffsetPtr += bytes_read;
 | |
|   return result;
 | |
| }
 | |
| 
 | |
| uint64_t DataExtractor::getULEB128(uint64_t *offset_ptr, Error *Err) const {
 | |
|   return getLEB128(Data, offset_ptr, Err, decodeULEB128);
 | |
| }
 | |
| 
 | |
| int64_t DataExtractor::getSLEB128(uint64_t *offset_ptr, Error *Err) const {
 | |
|   return getLEB128(Data, offset_ptr, Err, decodeSLEB128);
 | |
| }
 | |
| 
 | |
| void DataExtractor::skip(Cursor &C, uint64_t Length) const {
 | |
|   ErrorAsOutParameter ErrAsOut(&C.Err);
 | |
|   if (isError(&C.Err))
 | |
|     return;
 | |
| 
 | |
|   if (prepareRead(C.Offset, Length, &C.Err))
 | |
|     C.Offset += Length;
 | |
| }
 |