/src/WasmEdge/lib/loader/filemgr.cpp
Line | Count | Source (jump to first uncovered line) |
1 | | // SPDX-License-Identifier: Apache-2.0 |
2 | | // SPDX-FileCopyrightText: 2019-2024 Second State INC |
3 | | |
4 | | #include "loader/filemgr.h" |
5 | | |
6 | | #include <algorithm> |
7 | | #include <iterator> |
8 | | |
9 | | // Error logging of file manager need to be handled in caller. |
10 | | |
11 | | namespace WasmEdge { |
12 | | |
13 | | // Set path to file manager. See "include/loader/filemgr.h". |
14 | 0 | Expect<void> FileMgr::setPath(const std::filesystem::path &FilePath) { |
15 | 0 | reset(); |
16 | 0 | std::error_code ErrCode; |
17 | 0 | Size = std::filesystem::file_size(FilePath, ErrCode); |
18 | 0 | if (likely(!ErrCode)) { |
19 | 0 | if (!MMap::supported()) { |
20 | 0 | Size = 0; |
21 | 0 | Status = ErrCode::Value::IllegalPath; |
22 | 0 | return Unexpect(Status); |
23 | 0 | } |
24 | 0 | FileMap.emplace(FilePath); |
25 | 0 | if (auto *Pointer = FileMap->address(); likely(Pointer)) { |
26 | 0 | Data = reinterpret_cast<const Byte *>(Pointer); |
27 | 0 | Status = ErrCode::Value::Success; |
28 | 0 | } else { |
29 | | // File size is 0, mmap failed. |
30 | | // Will get 'UnexpectedEnd' error while the first reading. |
31 | 0 | FileMap.reset(); |
32 | 0 | } |
33 | 0 | return {}; |
34 | 0 | } |
35 | 0 | Size = 0; |
36 | 0 | Status = ErrCode::Value::IllegalPath; |
37 | 0 | return Unexpect(Status); |
38 | 0 | } |
39 | | |
40 | | // Set code data. See "include/loader/filemgr.h". |
41 | 9.30k | Expect<void> FileMgr::setCode(Span<const Byte> CodeData) { |
42 | 9.30k | reset(); |
43 | 9.30k | Data = CodeData.data(); |
44 | 9.30k | Size = CodeData.size(); |
45 | 9.30k | Status = ErrCode::Value::Success; |
46 | 9.30k | return {}; |
47 | 9.30k | } |
48 | | |
49 | | // Set code data. See "include/loader/filemgr.h". |
50 | 0 | Expect<void> FileMgr::setCode(std::vector<Byte> CodeData) { |
51 | 0 | reset(); |
52 | | // Tell GCC 14 that DataHolder has no data. |
53 | | // Fix the false positive warning, |
54 | | // which is reported by GCC 14 with `maybe-uninitialized` |
55 | 0 | assuming(!DataHolder); |
56 | | |
57 | 0 | DataHolder.emplace(std::move(CodeData)); |
58 | 0 | Data = DataHolder->data(); |
59 | 0 | Size = DataHolder->size(); |
60 | 0 | Status = ErrCode::Value::Success; |
61 | 0 | return {}; |
62 | 0 | } |
63 | | |
64 | | // Read one byte. See "include/loader/filemgr.h". |
65 | 9.13M | Expect<Byte> FileMgr::readByte() { |
66 | 9.13M | if (unlikely(Status != ErrCode::Value::Success)) { |
67 | 0 | return Unexpect(Status); |
68 | 0 | } |
69 | | // Set the flag to the start offset. |
70 | 9.13M | LastPos = Pos; |
71 | | // Check if exceed the data boundary and section boundary. |
72 | 9.13M | EXPECTED_TRY(testRead(1)); |
73 | 9.12M | return Data[Pos++]; |
74 | 9.13M | } |
75 | | |
76 | | // Read number of bytes. See "include/loader/filemgr.h". |
77 | 67.1k | Expect<std::vector<Byte>> FileMgr::readBytes(size_t SizeToRead) { |
78 | | // Set the flag to the start offset. |
79 | 67.1k | LastPos = Pos; |
80 | | // Read bytes into vector. |
81 | 67.1k | std::vector<Byte> Buf(SizeToRead); |
82 | 67.1k | EXPECTED_TRY(readBytes(Buf)); |
83 | 67.0k | return Buf; |
84 | 67.1k | } |
85 | | |
86 | | // Decode and read an unsigned int. See "include/loader/filemgr.h". |
87 | 1.78M | Expect<uint32_t> FileMgr::readU32() { |
88 | 1.78M | if (unlikely(Status != ErrCode::Value::Success)) { |
89 | 0 | return Unexpect(Status); |
90 | 0 | } |
91 | | // Set the flag to the start offset. |
92 | 1.78M | LastPos = Pos; |
93 | | |
94 | | // Read and decode U32. |
95 | 1.78M | uint32_t Result = 0; |
96 | 1.78M | uint32_t Offset = 0; |
97 | 1.78M | Byte Byte = 0x80; |
98 | 4.10M | while (Byte & 0x80) { |
99 | 2.32M | if (unlikely(Offset >= 32)) { |
100 | 10 | Status = ErrCode::Value::IntegerTooLong; |
101 | 10 | return Unexpect(Status); |
102 | 10 | } |
103 | 2.32M | EXPECTED_TRY(testRead(1)); |
104 | 2.32M | Byte = Data[Pos++]; |
105 | 2.32M | Result |= (Byte & UINT32_C(0x7F)) << Offset; |
106 | 2.32M | if (Offset == 28 && unlikely((Byte & UINT32_C(0x70)) != 0)) { |
107 | 53 | Status = ErrCode::Value::IntegerTooLarge; |
108 | 53 | return Unexpect(Status); |
109 | 53 | } |
110 | 2.32M | Offset += 7; |
111 | 2.32M | } |
112 | 1.78M | return Result; |
113 | 1.78M | } |
114 | | |
115 | | // Decode and read an unsigned long long int. See "include/loader/filemgr.h". |
116 | 0 | Expect<uint64_t> FileMgr::readU64() { |
117 | 0 | if (Status != ErrCode::Value::Success) { |
118 | 0 | return Unexpect(Status); |
119 | 0 | } |
120 | | // Set the flag to the start offset. |
121 | 0 | LastPos = Pos; |
122 | | |
123 | | // Read and decode U64. |
124 | 0 | uint64_t Result = 0; |
125 | 0 | uint64_t Offset = 0; |
126 | 0 | Byte Byte = 0x80; |
127 | 0 | while (Byte & 0x80) { |
128 | 0 | if (unlikely(Offset >= 64)) { |
129 | 0 | Status = ErrCode::Value::IntegerTooLong; |
130 | 0 | return Unexpect(Status); |
131 | 0 | } |
132 | 0 | EXPECTED_TRY(testRead(1)); |
133 | 0 | Byte = Data[Pos++]; |
134 | 0 | Result |= (Byte & UINT64_C(0x7F)) << Offset; |
135 | 0 | if (Offset == 63 && unlikely((Byte & UINT32_C(0x7E)) != 0)) { |
136 | 0 | Status = ErrCode::Value::IntegerTooLarge; |
137 | 0 | return Unexpect(Status); |
138 | 0 | } |
139 | 0 | Offset += 7; |
140 | 0 | } |
141 | 0 | return Result; |
142 | 0 | } |
143 | | |
144 | 2.46M | template <typename RetType, size_t N> Expect<RetType> FileMgr::readSN() { |
145 | 2.46M | static_assert(N >= 8, "The N of S_N must have at least length of a byte"); |
146 | 2.46M | static_assert(8 * sizeof(RetType) >= N, |
147 | 2.46M | "RetType cannot hold the full range of S_N"); |
148 | 2.46M | static_assert(std::is_signed_v<RetType>, |
149 | 2.46M | "RetType of S_N must be signed type"); |
150 | | |
151 | 2.46M | if (Status != ErrCode::Value::Success) { |
152 | 0 | return Unexpect(Status); |
153 | 0 | } |
154 | | // Set the flag to the start offset. |
155 | 2.46M | LastPos = Pos; |
156 | | |
157 | | // Read and decode S_N. |
158 | 2.46M | RetType Result = 0; |
159 | 2.46M | size_t Offset = 0; |
160 | 2.46M | size_t RemainingBits = N; |
161 | 2.69M | while (true) { |
162 | 2.69M | if (RemainingBits <= 0) { |
163 | 0 | Status = ErrCode::Value::IntegerTooLong; |
164 | 0 | return Unexpect(Status); |
165 | 0 | } |
166 | | |
167 | | // In the rest logic, RemainingBits must be at least 1. |
168 | 2.69M | EXPECTED_TRY(testRead(1)); |
169 | 2.69M | WasmEdge::Byte Byte = Data[Pos++]; |
170 | | |
171 | 2.69M | const WasmEdge::Byte HighestBitMask = 1 << 7; |
172 | 2.69M | const WasmEdge::Byte SecondHighestBitMask = 1 << 6; |
173 | 2.69M | if (Byte & HighestBitMask) { |
174 | | // The byte has leading 1. It contains 7 bits payload. |
175 | | |
176 | 230k | if (unlikely(RemainingBits < 7)) { |
177 | 47 | Status = ErrCode::Value::IntegerTooLong; |
178 | 47 | return Unexpect(Status); |
179 | 47 | } |
180 | | |
181 | 229k | std::make_unsigned_t<RetType> Payload = |
182 | 229k | Byte & (~HighestBitMask); // & 0b01111111 |
183 | 229k | Result |= (Payload << Offset); |
184 | 229k | Offset += 7; |
185 | 229k | RemainingBits -= 7; |
186 | 2.46M | } else { |
187 | | // The byte has leading 0. It will be the last byte. |
188 | | |
189 | | // The number of bits that take effect in the byte. Since RemainingBits |
190 | | // must be at least 1, EffectiveBits also must be at least 1. It is also |
191 | | // at most 7. |
192 | 2.46M | size_t EffectiveBits = RemainingBits < 7 ? RemainingBits : 7; |
193 | 2.46M | std::make_unsigned_t<RetType> Payload = Byte; |
194 | 2.46M | if (Byte & SecondHighestBitMask) { |
195 | | // The byte is signed. |
196 | 1.86M | if (Byte >= (1 << 7) - (1 << (EffectiveBits - 1))) { |
197 | 1.86M | Payload -= (1 << 7); |
198 | 1.86M | } else { |
199 | 15 | Status = ErrCode::Value::IntegerTooLarge; |
200 | 15 | return Unexpect(Status); |
201 | 15 | } |
202 | 1.86M | } else { |
203 | | // The byte is unsigned. |
204 | 592k | if (Byte >= (1 << (EffectiveBits - 1))) { |
205 | 19 | Status = ErrCode::Value::IntegerTooLarge; |
206 | 19 | return Unexpect(Status); |
207 | 19 | } |
208 | 592k | } |
209 | 2.45M | Result |= (Payload << Offset); |
210 | 2.45M | break; |
211 | 2.46M | } |
212 | 2.69M | } |
213 | | |
214 | 2.45M | return Result; |
215 | 2.46M | } cxx20::expected<long, WasmEdge::ErrCode> WasmEdge::FileMgr::readSN<long, 33ul>() Line | Count | Source | 144 | 293k | template <typename RetType, size_t N> Expect<RetType> FileMgr::readSN() { | 145 | 293k | static_assert(N >= 8, "The N of S_N must have at least length of a byte"); | 146 | 293k | static_assert(8 * sizeof(RetType) >= N, | 147 | 293k | "RetType cannot hold the full range of S_N"); | 148 | 293k | static_assert(std::is_signed_v<RetType>, | 149 | 293k | "RetType of S_N must be signed type"); | 150 | | | 151 | 293k | if (Status != ErrCode::Value::Success) { | 152 | 0 | return Unexpect(Status); | 153 | 0 | } | 154 | | // Set the flag to the start offset. | 155 | 293k | LastPos = Pos; | 156 | | | 157 | | // Read and decode S_N. | 158 | 293k | RetType Result = 0; | 159 | 293k | size_t Offset = 0; | 160 | 293k | size_t RemainingBits = N; | 161 | 303k | while (true) { | 162 | 303k | if (RemainingBits <= 0) { | 163 | 0 | Status = ErrCode::Value::IntegerTooLong; | 164 | 0 | return Unexpect(Status); | 165 | 0 | } | 166 | | | 167 | | // In the rest logic, RemainingBits must be at least 1. | 168 | 303k | EXPECTED_TRY(testRead(1)); | 169 | 303k | WasmEdge::Byte Byte = Data[Pos++]; | 170 | | | 171 | 303k | const WasmEdge::Byte HighestBitMask = 1 << 7; | 172 | 303k | const WasmEdge::Byte SecondHighestBitMask = 1 << 6; | 173 | 303k | if (Byte & HighestBitMask) { | 174 | | // The byte has leading 1. It contains 7 bits payload. | 175 | | | 176 | 9.33k | if (unlikely(RemainingBits < 7)) { | 177 | 19 | Status = ErrCode::Value::IntegerTooLong; | 178 | 19 | return Unexpect(Status); | 179 | 19 | } | 180 | | | 181 | 9.31k | std::make_unsigned_t<RetType> Payload = | 182 | 9.31k | Byte & (~HighestBitMask); // & 0b01111111 | 183 | 9.31k | Result |= (Payload << Offset); | 184 | 9.31k | Offset += 7; | 185 | 9.31k | RemainingBits -= 7; | 186 | 293k | } else { | 187 | | // The byte has leading 0. It will be the last byte. | 188 | | | 189 | | // The number of bits that take effect in the byte. Since RemainingBits | 190 | | // must be at least 1, EffectiveBits also must be at least 1. It is also | 191 | | // at most 7. | 192 | 293k | size_t EffectiveBits = RemainingBits < 7 ? RemainingBits : 7; | 193 | 293k | std::make_unsigned_t<RetType> Payload = Byte; | 194 | 293k | if (Byte & SecondHighestBitMask) { | 195 | | // The byte is signed. | 196 | 112k | if (Byte >= (1 << 7) - (1 << (EffectiveBits - 1))) { | 197 | 112k | Payload -= (1 << 7); | 198 | 112k | } else { | 199 | 4 | Status = ErrCode::Value::IntegerTooLarge; | 200 | 4 | return Unexpect(Status); | 201 | 4 | } | 202 | 181k | } else { | 203 | | // The byte is unsigned. | 204 | 181k | if (Byte >= (1 << (EffectiveBits - 1))) { | 205 | 6 | Status = ErrCode::Value::IntegerTooLarge; | 206 | 6 | return Unexpect(Status); | 207 | 6 | } | 208 | 181k | } | 209 | 293k | Result |= (Payload << Offset); | 210 | 293k | break; | 211 | 293k | } | 212 | 303k | } | 213 | | | 214 | 293k | return Result; | 215 | 293k | } |
cxx20::expected<int, WasmEdge::ErrCode> WasmEdge::FileMgr::readSN<int, 32ul>() Line | Count | Source | 144 | 1.92M | template <typename RetType, size_t N> Expect<RetType> FileMgr::readSN() { | 145 | 1.92M | static_assert(N >= 8, "The N of S_N must have at least length of a byte"); | 146 | 1.92M | static_assert(8 * sizeof(RetType) >= N, | 147 | 1.92M | "RetType cannot hold the full range of S_N"); | 148 | 1.92M | static_assert(std::is_signed_v<RetType>, | 149 | 1.92M | "RetType of S_N must be signed type"); | 150 | | | 151 | 1.92M | if (Status != ErrCode::Value::Success) { | 152 | 0 | return Unexpect(Status); | 153 | 0 | } | 154 | | // Set the flag to the start offset. | 155 | 1.92M | LastPos = Pos; | 156 | | | 157 | | // Read and decode S_N. | 158 | 1.92M | RetType Result = 0; | 159 | 1.92M | size_t Offset = 0; | 160 | 1.92M | size_t RemainingBits = N; | 161 | 2.05M | while (true) { | 162 | 2.05M | if (RemainingBits <= 0) { | 163 | 0 | Status = ErrCode::Value::IntegerTooLong; | 164 | 0 | return Unexpect(Status); | 165 | 0 | } | 166 | | | 167 | | // In the rest logic, RemainingBits must be at least 1. | 168 | 2.05M | EXPECTED_TRY(testRead(1)); | 169 | 2.05M | WasmEdge::Byte Byte = Data[Pos++]; | 170 | | | 171 | 2.05M | const WasmEdge::Byte HighestBitMask = 1 << 7; | 172 | 2.05M | const WasmEdge::Byte SecondHighestBitMask = 1 << 6; | 173 | 2.05M | if (Byte & HighestBitMask) { | 174 | | // The byte has leading 1. It contains 7 bits payload. | 175 | | | 176 | 129k | if (unlikely(RemainingBits < 7)) { | 177 | 12 | Status = ErrCode::Value::IntegerTooLong; | 178 | 12 | return Unexpect(Status); | 179 | 12 | } | 180 | | | 181 | 129k | std::make_unsigned_t<RetType> Payload = | 182 | 129k | Byte & (~HighestBitMask); // & 0b01111111 | 183 | 129k | Result |= (Payload << Offset); | 184 | 129k | Offset += 7; | 185 | 129k | RemainingBits -= 7; | 186 | 1.92M | } else { | 187 | | // The byte has leading 0. It will be the last byte. | 188 | | | 189 | | // The number of bits that take effect in the byte. Since RemainingBits | 190 | | // must be at least 1, EffectiveBits also must be at least 1. It is also | 191 | | // at most 7. | 192 | 1.92M | size_t EffectiveBits = RemainingBits < 7 ? RemainingBits : 7; | 193 | 1.92M | std::make_unsigned_t<RetType> Payload = Byte; | 194 | 1.92M | if (Byte & SecondHighestBitMask) { | 195 | | // The byte is signed. | 196 | 1.52M | if (Byte >= (1 << 7) - (1 << (EffectiveBits - 1))) { | 197 | 1.52M | Payload -= (1 << 7); | 198 | 1.52M | } else { | 199 | 5 | Status = ErrCode::Value::IntegerTooLarge; | 200 | 5 | return Unexpect(Status); | 201 | 5 | } | 202 | 1.52M | } else { | 203 | | // The byte is unsigned. | 204 | 392k | if (Byte >= (1 << (EffectiveBits - 1))) { | 205 | 5 | Status = ErrCode::Value::IntegerTooLarge; | 206 | 5 | return Unexpect(Status); | 207 | 5 | } | 208 | 392k | } | 209 | 1.92M | Result |= (Payload << Offset); | 210 | 1.92M | break; | 211 | 1.92M | } | 212 | 2.05M | } | 213 | | | 214 | 1.92M | return Result; | 215 | 1.92M | } |
cxx20::expected<long, WasmEdge::ErrCode> WasmEdge::FileMgr::readSN<long, 64ul>() Line | Count | Source | 144 | 244k | template <typename RetType, size_t N> Expect<RetType> FileMgr::readSN() { | 145 | 244k | static_assert(N >= 8, "The N of S_N must have at least length of a byte"); | 146 | 244k | static_assert(8 * sizeof(RetType) >= N, | 147 | 244k | "RetType cannot hold the full range of S_N"); | 148 | 244k | static_assert(std::is_signed_v<RetType>, | 149 | 244k | "RetType of S_N must be signed type"); | 150 | | | 151 | 244k | if (Status != ErrCode::Value::Success) { | 152 | 0 | return Unexpect(Status); | 153 | 0 | } | 154 | | // Set the flag to the start offset. | 155 | 244k | LastPos = Pos; | 156 | | | 157 | | // Read and decode S_N. | 158 | 244k | RetType Result = 0; | 159 | 244k | size_t Offset = 0; | 160 | 244k | size_t RemainingBits = N; | 161 | 335k | while (true) { | 162 | 335k | if (RemainingBits <= 0) { | 163 | 0 | Status = ErrCode::Value::IntegerTooLong; | 164 | 0 | return Unexpect(Status); | 165 | 0 | } | 166 | | | 167 | | // In the rest logic, RemainingBits must be at least 1. | 168 | 335k | EXPECTED_TRY(testRead(1)); | 169 | 335k | WasmEdge::Byte Byte = Data[Pos++]; | 170 | | | 171 | 335k | const WasmEdge::Byte HighestBitMask = 1 << 7; | 172 | 335k | const WasmEdge::Byte SecondHighestBitMask = 1 << 6; | 173 | 335k | if (Byte & HighestBitMask) { | 174 | | // The byte has leading 1. It contains 7 bits payload. | 175 | | | 176 | 90.8k | if (unlikely(RemainingBits < 7)) { | 177 | 16 | Status = ErrCode::Value::IntegerTooLong; | 178 | 16 | return Unexpect(Status); | 179 | 16 | } | 180 | | | 181 | 90.8k | std::make_unsigned_t<RetType> Payload = | 182 | 90.8k | Byte & (~HighestBitMask); // & 0b01111111 | 183 | 90.8k | Result |= (Payload << Offset); | 184 | 90.8k | Offset += 7; | 185 | 90.8k | RemainingBits -= 7; | 186 | 244k | } else { | 187 | | // The byte has leading 0. It will be the last byte. | 188 | | | 189 | | // The number of bits that take effect in the byte. Since RemainingBits | 190 | | // must be at least 1, EffectiveBits also must be at least 1. It is also | 191 | | // at most 7. | 192 | 244k | size_t EffectiveBits = RemainingBits < 7 ? RemainingBits : 7; | 193 | 244k | std::make_unsigned_t<RetType> Payload = Byte; | 194 | 244k | if (Byte & SecondHighestBitMask) { | 195 | | // The byte is signed. | 196 | 225k | if (Byte >= (1 << 7) - (1 << (EffectiveBits - 1))) { | 197 | 225k | Payload -= (1 << 7); | 198 | 225k | } else { | 199 | 6 | Status = ErrCode::Value::IntegerTooLarge; | 200 | 6 | return Unexpect(Status); | 201 | 6 | } | 202 | 225k | } else { | 203 | | // The byte is unsigned. | 204 | 19.0k | if (Byte >= (1 << (EffectiveBits - 1))) { | 205 | 8 | Status = ErrCode::Value::IntegerTooLarge; | 206 | 8 | return Unexpect(Status); | 207 | 8 | } | 208 | 19.0k | } | 209 | 244k | Result |= (Payload << Offset); | 210 | 244k | break; | 211 | 244k | } | 212 | 335k | } | 213 | | | 214 | 244k | return Result; | 215 | 244k | } |
|
216 | | |
217 | 293k | Expect<int64_t> FileMgr::readS33() { return readSN<int64_t, 33>(); } |
218 | | |
219 | | // Decode and read a signed int. See "include/loader/filemgr.h". |
220 | 1.92M | Expect<int32_t> FileMgr::readS32() { return readSN<int32_t, 32>(); } |
221 | | |
222 | | // Decode and read a signed long long int. See "include/loader/filemgr.h". |
223 | 244k | Expect<int64_t> FileMgr::readS64() { return readSN<int64_t, 64>(); } |
224 | | |
225 | | // Copy bytes to a float. See "include/loader/filemgr.h". |
226 | 35.2k | Expect<float> FileMgr::readF32() { |
227 | 35.2k | if (Status != ErrCode::Value::Success) { |
228 | 0 | return Unexpect(Status); |
229 | 0 | } |
230 | | // Set the flag to the start offset. |
231 | 35.2k | LastPos = Pos; |
232 | | |
233 | 35.2k | uint32_t Buf = 0; |
234 | 35.2k | Byte Byte = 0x00; |
235 | | // Check if exceed the data boundary and section boundary. |
236 | 35.2k | EXPECTED_TRY(testRead(4)); |
237 | 176k | for (uint32_t I = 0; I < 4; I++) { |
238 | 140k | Byte = Data[Pos++]; |
239 | 140k | Buf |= (Byte & UINT32_C(0xFF)) << (I * UINT32_C(8)); |
240 | 140k | } |
241 | 35.2k | float Result; |
242 | 35.2k | static_assert(sizeof(Buf) == sizeof(Result)); |
243 | 35.2k | std::memcpy(&Result, &Buf, sizeof(Result)); |
244 | 35.2k | return Result; |
245 | 35.2k | } |
246 | | |
247 | | // Copy bytes to a double. See "include/loader/filemgr.h". |
248 | 15.4k | Expect<double> FileMgr::readF64() { |
249 | 15.4k | if (Status != ErrCode::Value::Success) { |
250 | 0 | return Unexpect(Status); |
251 | 0 | } |
252 | | // Set the flag to the start offset. |
253 | 15.4k | LastPos = Pos; |
254 | | |
255 | 15.4k | uint64_t Buf = 0; |
256 | 15.4k | Byte Byte = 0x00; |
257 | | // Check if exceed the data boundary and section boundary. |
258 | 15.4k | EXPECTED_TRY(testRead(8)); |
259 | 139k | for (uint32_t I = 0; I < 8; I++) { |
260 | 123k | Byte = Data[Pos++]; |
261 | 123k | Buf |= (Byte & UINT64_C(0xFF)) << (I * UINT64_C(8)); |
262 | 123k | } |
263 | 15.4k | double Result; |
264 | 15.4k | static_assert(sizeof(Buf) == sizeof(Result)); |
265 | 15.4k | std::memcpy(&Result, &Buf, sizeof(Result)); |
266 | 15.4k | return Result; |
267 | 15.4k | } |
268 | | |
269 | | // Read a vector of bytes. See "include/loader/filemgr.h". |
270 | 89.3k | Expect<std::string> FileMgr::readName() { |
271 | 89.3k | if (unlikely(Status != ErrCode::Value::Success)) { |
272 | 0 | return Unexpect(Status); |
273 | 0 | } |
274 | | // If UTF-8 validation or readU32() or readBytes() failed, the last succeeded |
275 | | // reading offset will be at the start of `Name`. |
276 | 89.3k | LastPos = Pos; |
277 | | |
278 | | // Read the name size. |
279 | 89.3k | EXPECTED_TRY(uint32_t SizeToRead, readU32()); |
280 | | |
281 | | // Check if string length exceed the data boundary. |
282 | 89.2k | if (auto Res = testRead(SizeToRead); unlikely(!Res)) { |
283 | 55 | return Unexpect(ErrCode::Value::LengthOutOfBounds); |
284 | 55 | } |
285 | | |
286 | | // Read the UTF-8 bytes. |
287 | 89.2k | std::string Str(SizeToRead, '\0'); |
288 | 89.2k | EXPECTED_TRY( |
289 | 89.2k | readBytes(Span<Byte>(reinterpret_cast<Byte *>(Str.data()), Str.size()))); |
290 | | |
291 | | // UTF-8 validation. |
292 | 89.2k | bool Valid = true; |
293 | 446k | for (uint32_t I = 0; I < Str.size() && Valid; ++I) { |
294 | 357k | char C = Str.data()[I]; |
295 | 357k | uint32_t N = 0; |
296 | 357k | if ((C & '\x80') == 0) { |
297 | | // 0xxxxxxx, 7 bits UCS, ASCII |
298 | 343k | N = 0; |
299 | 343k | } else if ((C & '\xE0') == '\xC0') { |
300 | | // 110xxxxx, 11 bits UCS, U+80 to U+7FF |
301 | 3.36k | N = 1; |
302 | 9.96k | } else if ((C & '\xF0') == '\xE0') { |
303 | | // 1110xxxx, 16 bits UCS, U+800 to U+D7FF and U+E000 to U+FFFF |
304 | 6.81k | N = 2; |
305 | 6.81k | } else if ((C & '\xF8') == '\xF0') { |
306 | | // 11110xxx, 21 bits UCS, U+10000 to U+10FFFF |
307 | 3.09k | N = 3; |
308 | 3.09k | } else { |
309 | 60 | Valid = false; |
310 | 60 | } |
311 | | |
312 | | // Need to have N more bytes |
313 | 357k | if (I + N >= Str.size()) { |
314 | 18 | Valid = false; |
315 | 18 | } |
316 | | // Invalid ranges |
317 | 357k | if (N == 1 && (C & '\xDE') == '\xC0') { |
318 | | // 11 bits UCS, U+0 to U+80, FAIL |
319 | 2 | Valid = false; |
320 | 357k | } else if (N == 2 && |
321 | 357k | ((C == '\xE0' && (Str.data()[I + 1] & '\xA0') == '\x80') || |
322 | | // 16 bits UCS, U+0 to U+7FF, FAIL |
323 | 6.81k | (C == '\xED' && (Str.data()[I + 1] & '\xA0') == '\xA0') |
324 | | // 16 bits UCS, U+D800 to U+DFFF, FAIL |
325 | 6.81k | )) { |
326 | 4 | Valid = false; |
327 | 357k | } else if (N == 3 && |
328 | 357k | ((C == '\xF0' && (Str.data()[I + 1] & '\xB0') == '\x80') || |
329 | | // 21 bits UCS, U+0 to U+FFFF, FAIL |
330 | 3.09k | (C == '\xF4' && (Str.data()[I + 1] & '\xB0') != '\x80') || |
331 | | // 21 bits UCS, U+110000 to U+13FFFF, FAIL |
332 | 3.09k | (C != '\xF4' && (C & '\xF4') == '\xF4') |
333 | | // 21 bits UCS, U+140000 to U+1FFFFF, FAIL |
334 | 3.09k | )) { |
335 | 14 | Valid = false; |
336 | 14 | } |
337 | | |
338 | 383k | for (uint32_t J = 0; J < N && Valid; ++J) { |
339 | | // N bytes needs to match 10xxxxxx |
340 | 26.1k | if ((Str.data()[I + J + 1] & '\xC0') != '\x80') { |
341 | 46 | Valid = false; |
342 | 46 | } |
343 | 26.1k | } |
344 | 357k | I += N; |
345 | 357k | } |
346 | | |
347 | 89.2k | if (!Valid) { |
348 | 143 | Status = ErrCode::Value::MalformedUTF8; |
349 | 143 | return Unexpect(Status); |
350 | 143 | } |
351 | 89.0k | return Str; |
352 | 89.2k | } |
353 | | |
354 | | // Peek one byte. See "include/loader/filemgr.h". |
355 | 145k | Expect<Byte> FileMgr::peekByte() { |
356 | 145k | EXPECTED_TRY(Byte B, readByte()); |
357 | 145k | Pos--; |
358 | 145k | return B; |
359 | 145k | } |
360 | | |
361 | | // Get the file header type. See "include/loader/filemgr.h". |
362 | 9.30k | FileMgr::FileHeader FileMgr::getHeaderType() { |
363 | 9.30k | if (Size >= 4) { |
364 | 9.27k | Byte WASMMagic[] = {0x00, 0x61, 0x73, 0x6D}; |
365 | 9.27k | Byte ELFMagic[] = {0x7F, 0x45, 0x4C, 0x46}; |
366 | 9.27k | Byte MAC32agic[] = {0xCE, 0xFA, 0xED, 0xFE}; |
367 | 9.27k | Byte MAC64agic[] = {0xCF, 0xFA, 0xED, 0xFE}; |
368 | 9.27k | if (std::equal(WASMMagic, WASMMagic + 4, Data)) { |
369 | 9.19k | return FileMgr::FileHeader::Wasm; |
370 | 9.19k | } else if (std::equal(ELFMagic, ELFMagic + 4, Data)) { |
371 | 1 | return FileMgr::FileHeader::ELF; |
372 | 81 | } else if (std::equal(MAC32agic, MAC32agic + 4, Data)) { |
373 | 1 | return FileMgr::FileHeader::MachO_32; |
374 | 80 | } else if (std::equal(MAC64agic, MAC64agic + 4, Data)) { |
375 | 1 | return FileMgr::FileHeader::MachO_64; |
376 | 1 | } |
377 | 9.27k | } |
378 | 111 | if (Size >= 2) { |
379 | 109 | Byte DLLMagic[] = {0x4D, 0x5A}; |
380 | 109 | if (std::equal(DLLMagic, DLLMagic + 2, Data)) { |
381 | 1 | return FileMgr::FileHeader::DLL; |
382 | 1 | } |
383 | 109 | } |
384 | 110 | return FileMgr::FileHeader::Unknown; |
385 | 111 | } |
386 | | |
387 | | // Jump a section. See "include/loader/filemgr.h". |
388 | 0 | Expect<void> FileMgr::jumpContent() { |
389 | 0 | if (unlikely(Status != ErrCode::Value::Success)) { |
390 | 0 | return Unexpect(Status); |
391 | 0 | } |
392 | | // Set the flag to the start offset. |
393 | 0 | LastPos = Pos; |
394 | | // Read the section size. |
395 | 0 | EXPECTED_TRY(uint32_t SecSize, readU32()); |
396 | | // Jump the content. |
397 | 0 | EXPECTED_TRY(testRead(SecSize)); |
398 | 0 | Pos += SecSize; |
399 | 0 | return {}; |
400 | 0 | } |
401 | | |
402 | | // Helper function for reading number of bytes. See "include/loader/filemgr.h". |
403 | 156k | Expect<void> FileMgr::readBytes(Span<Byte> Buffer) { |
404 | 156k | if (unlikely(Status != ErrCode::Value::Success)) { |
405 | 0 | return Unexpect(Status); |
406 | 0 | } |
407 | | // The adjustment of `LastPos` should be handled by caller. |
408 | 156k | auto SizeToRead = Buffer.size(); |
409 | 156k | if (likely(SizeToRead > 0)) { |
410 | | // Check if exceed the data boundary. |
411 | 54.9k | EXPECTED_TRY(testRead(SizeToRead)); |
412 | 54.9k | std::copy_n(Data + Pos, SizeToRead, Buffer.begin()); |
413 | 54.9k | Pos += SizeToRead; |
414 | 54.9k | } |
415 | 156k | return {}; |
416 | 156k | } |
417 | | |
418 | | // Helper function for checking boundary. See "include/loader/filemgr.h". |
419 | 14.3M | Expect<void> FileMgr::testRead(uint64_t Read) { |
420 | | // Check if exceed the data boundary |
421 | 14.3M | if (unlikely(getRemainSize() < Read)) { |
422 | 6.53k | Pos = Size; |
423 | 6.53k | LastPos = Pos; |
424 | 6.53k | Status = ErrCode::Value::UnexpectedEnd; |
425 | 6.53k | return Unexpect(Status); |
426 | 6.53k | } |
427 | 14.3M | return {}; |
428 | 14.3M | } |
429 | | |
430 | | } // namespace WasmEdge |