blob: a98297cdb35f2c198d7223e69ad17b37083bde32 [file] [log] [blame]
//===-- DataExtractor.cpp -------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
8
9#include "llvm/Support/DataExtractor.h"
Pavel Labathb1f29ce2019-08-27 11:24:08 +000010#include "llvm/Support/Errc.h"
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000011#include "llvm/Support/ErrorHandling.h"
12#include "llvm/Support/Host.h"
David Blaikie8242f352019-06-24 20:43:36 +000013#include "llvm/Support/LEB128.h"
Pavel Labathb1f29ce2019-08-27 11:24:08 +000014#include "llvm/Support/SwapByteOrder.h"
15
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000016using namespace llvm;
17
Pavel Labathb1f29ce2019-08-27 11:24:08 +000018static void unexpectedEndReached(Error *E) {
19 if (E)
20 *E = createStringError(errc::illegal_byte_sequence,
21 "unexpected end of data");
22}
23
24static bool isError(Error *E) { return E && *E; }
25
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000026template <typename T>
Igor Kudrinf5f35c52019-08-06 10:47:20 +000027static T getU(uint64_t *offset_ptr, const DataExtractor *de,
Pavel Labathb1f29ce2019-08-27 11:24:08 +000028 bool isLittleEndian, const char *Data, llvm::Error *Err) {
29 ErrorAsOutParameter ErrAsOut(Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000030 T val = 0;
Pavel Labathb1f29ce2019-08-27 11:24:08 +000031 if (isError(Err))
32 return val;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000033
Pavel Labathb1f29ce2019-08-27 11:24:08 +000034 uint64_t offset = *offset_ptr;
35 if (!de->isValidOffsetForDataOfSize(offset, sizeof(T))) {
36 unexpectedEndReached(Err);
37 return val;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000038 }
Pavel Labathb1f29ce2019-08-27 11:24:08 +000039 std::memcpy(&val, &Data[offset], sizeof(val));
40 if (sys::IsLittleEndianHost != isLittleEndian)
41 sys::swapByteOrder(val);
42
43 // Advance the offset
44 *offset_ptr += sizeof(val);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000045 return val;
46}
47
48template <typename T>
Igor Kudrinf5f35c52019-08-06 10:47:20 +000049static T *getUs(uint64_t *offset_ptr, T *dst, uint32_t count,
Pavel Labathb1f29ce2019-08-27 11:24:08 +000050 const DataExtractor *de, bool isLittleEndian, const char *Data,
51 llvm::Error *Err) {
52 ErrorAsOutParameter ErrAsOut(Err);
53 if (isError(Err))
54 return nullptr;
55
Igor Kudrinf5f35c52019-08-06 10:47:20 +000056 uint64_t offset = *offset_ptr;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000057
Pavel Labathb1f29ce2019-08-27 11:24:08 +000058 if (!de->isValidOffsetForDataOfSize(offset, sizeof(*dst) * count)) {
59 unexpectedEndReached(Err);
60 return nullptr;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000061 }
Pavel Labathb1f29ce2019-08-27 11:24:08 +000062 for (T *value_ptr = dst, *end = dst + count; value_ptr != end;
63 ++value_ptr, offset += sizeof(*dst))
64 *value_ptr = getU<T>(offset_ptr, de, isLittleEndian, Data, Err);
65 // Advance the offset
66 *offset_ptr = offset;
67 // Return a non-NULL pointer to the converted data as an indicator of
68 // success
69 return dst;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000070}
71
Pavel Labathb1f29ce2019-08-27 11:24:08 +000072uint8_t DataExtractor::getU8(uint64_t *offset_ptr, llvm::Error *Err) const {
73 return getU<uint8_t>(offset_ptr, this, IsLittleEndian, Data.data(), Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000074}
75
76uint8_t *
Igor Kudrinf5f35c52019-08-06 10:47:20 +000077DataExtractor::getU8(uint64_t *offset_ptr, uint8_t *dst, uint32_t count) const {
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000078 return getUs<uint8_t>(offset_ptr, dst, count, this, IsLittleEndian,
Pavel Labathb1f29ce2019-08-27 11:24:08 +000079 Data.data(), nullptr);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000080}
81
Pavel Labathb1f29ce2019-08-27 11:24:08 +000082uint8_t *DataExtractor::getU8(Cursor &C, uint8_t *Dst, uint32_t Count) const {
83 return getUs<uint8_t>(&C.Offset, Dst, Count, this, IsLittleEndian,
84 Data.data(), &C.Err);
85}
86
87uint16_t DataExtractor::getU16(uint64_t *offset_ptr, llvm::Error *Err) const {
88 return getU<uint16_t>(offset_ptr, this, IsLittleEndian, Data.data(), Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000089}
90
Igor Kudrinf5f35c52019-08-06 10:47:20 +000091uint16_t *DataExtractor::getU16(uint64_t *offset_ptr, uint16_t *dst,
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000092 uint32_t count) const {
93 return getUs<uint16_t>(offset_ptr, dst, count, this, IsLittleEndian,
Pavel Labathb1f29ce2019-08-27 11:24:08 +000094 Data.data(), nullptr);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +000095}
96
Igor Kudrinf5f35c52019-08-06 10:47:20 +000097uint32_t DataExtractor::getU24(uint64_t *offset_ptr) const {
Wolfgang Pieb258927e2017-06-21 19:37:44 +000098 uint24_t ExtractedVal =
Pavel Labathb1f29ce2019-08-27 11:24:08 +000099 getU<uint24_t>(offset_ptr, this, IsLittleEndian, Data.data(), nullptr);
Wolfgang Pieb258927e2017-06-21 19:37:44 +0000100 // The 3 bytes are in the correct byte order for the host.
101 return ExtractedVal.getAsUint32(sys::IsLittleEndianHost);
102}
103
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000104uint32_t DataExtractor::getU32(uint64_t *offset_ptr, llvm::Error *Err) const {
105 return getU<uint32_t>(offset_ptr, this, IsLittleEndian, Data.data(), Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000106}
107
Igor Kudrinf5f35c52019-08-06 10:47:20 +0000108uint32_t *DataExtractor::getU32(uint64_t *offset_ptr, uint32_t *dst,
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000109 uint32_t count) const {
110 return getUs<uint32_t>(offset_ptr, dst, count, this, IsLittleEndian,
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000111 Data.data(), nullptr);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000112}
113
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000114uint64_t DataExtractor::getU64(uint64_t *offset_ptr, llvm::Error *Err) const {
115 return getU<uint64_t>(offset_ptr, this, IsLittleEndian, Data.data(), Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000116}
117
Igor Kudrinf5f35c52019-08-06 10:47:20 +0000118uint64_t *DataExtractor::getU64(uint64_t *offset_ptr, uint64_t *dst,
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000119 uint32_t count) const {
120 return getUs<uint64_t>(offset_ptr, dst, count, this, IsLittleEndian,
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000121 Data.data(), nullptr);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000122}
123
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000124uint64_t DataExtractor::getUnsigned(uint64_t *offset_ptr, uint32_t byte_size,
125 llvm::Error *Err) const {
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000126 switch (byte_size) {
127 case 1:
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000128 return getU8(offset_ptr, Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000129 case 2:
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000130 return getU16(offset_ptr, Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000131 case 4:
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000132 return getU32(offset_ptr, Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000133 case 8:
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000134 return getU64(offset_ptr, Err);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000135 }
136 llvm_unreachable("getUnsigned unhandled case!");
137}
138
139int64_t
Igor Kudrinf5f35c52019-08-06 10:47:20 +0000140DataExtractor::getSigned(uint64_t *offset_ptr, uint32_t byte_size) const {
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000141 switch (byte_size) {
142 case 1:
143 return (int8_t)getU8(offset_ptr);
144 case 2:
145 return (int16_t)getU16(offset_ptr);
146 case 4:
147 return (int32_t)getU32(offset_ptr);
148 case 8:
149 return (int64_t)getU64(offset_ptr);
150 }
151 llvm_unreachable("getSigned unhandled case!");
152}
153
Igor Kudrinf5f35c52019-08-06 10:47:20 +0000154const char *DataExtractor::getCStr(uint64_t *offset_ptr) const {
155 uint64_t offset = *offset_ptr;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000156 StringRef::size_type pos = Data.find('\0', offset);
157 if (pos != StringRef::npos) {
158 *offset_ptr = pos + 1;
159 return Data.data() + offset;
160 }
Craig Topperc10719f2014-04-07 04:17:22 +0000161 return nullptr;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000162}
163
Igor Kudrinf5f35c52019-08-06 10:47:20 +0000164StringRef DataExtractor::getCStrRef(uint64_t *offset_ptr) const {
165 uint64_t Start = *offset_ptr;
Paul Robinsonba1c9152017-05-02 17:37:32 +0000166 StringRef::size_type Pos = Data.find('\0', Start);
167 if (Pos != StringRef::npos) {
Igor Kudrinf5f35c52019-08-06 10:47:20 +0000168 *offset_ptr = Pos + 1;
Paul Robinsonba1c9152017-05-02 17:37:32 +0000169 return StringRef(Data.data() + Start, Pos - Start);
170 }
171 return StringRef();
172}
173
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000174uint64_t DataExtractor::getULEB128(uint64_t *offset_ptr,
175 llvm::Error *Err) const {
David Blaikie8242f352019-06-24 20:43:36 +0000176 assert(*offset_ptr <= Data.size());
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000177 ErrorAsOutParameter ErrAsOut(Err);
178 if (isError(Err))
179 return 0;
David Blaikie8242f352019-06-24 20:43:36 +0000180
181 const char *error;
182 unsigned bytes_read;
183 uint64_t result = decodeULEB128(
184 reinterpret_cast<const uint8_t *>(Data.data() + *offset_ptr), &bytes_read,
185 reinterpret_cast<const uint8_t *>(Data.data() + Data.size()), &error);
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000186 if (error) {
187 if (Err)
188 *Err = createStringError(errc::illegal_byte_sequence, error);
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000189 return 0;
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000190 }
David Blaikie8242f352019-06-24 20:43:36 +0000191 *offset_ptr += bytes_read;
192 return result;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000193}
194
Igor Kudrinf5f35c52019-08-06 10:47:20 +0000195int64_t DataExtractor::getSLEB128(uint64_t *offset_ptr) const {
David Blaikief895e1b2019-06-24 23:45:18 +0000196 assert(*offset_ptr <= Data.size());
197
198 const char *error;
199 unsigned bytes_read;
200 int64_t result = decodeSLEB128(
201 reinterpret_cast<const uint8_t *>(Data.data() + *offset_ptr), &bytes_read,
202 reinterpret_cast<const uint8_t *>(Data.data() + Data.size()), &error);
203 if (error)
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000204 return 0;
David Blaikief895e1b2019-06-24 23:45:18 +0000205 *offset_ptr += bytes_read;
206 return result;
Benjamin Kramer88a1d9f2011-09-13 19:42:16 +0000207}
Pavel Labathb1f29ce2019-08-27 11:24:08 +0000208
209void DataExtractor::skip(Cursor &C, uint64_t Length) const {
210 ErrorAsOutParameter ErrAsOut(&C.Err);
211 if (isError(&C.Err))
212 return;
213
214 if (isValidOffsetForDataOfSize(C.Offset, Length))
215 C.Offset += Length;
216 else
217 unexpectedEndReached(&C.Err);
218}