/Users/eugenesiegel/btc/bitcoin/src/util/asmap.cpp
Line | Count | Source (jump to first uncovered line) |
1 | | // Copyright (c) 2019-2022 The Bitcoin Core developers |
2 | | // Distributed under the MIT software license, see the accompanying |
3 | | // file COPYING or http://www.opensource.org/licenses/mit-license.php. |
4 | | |
5 | | #include <util/asmap.h> |
6 | | |
7 | | #include <clientversion.h> |
8 | | #include <logging.h> |
9 | | #include <serialize.h> |
10 | | #include <streams.h> |
11 | | #include <util/fs.h> |
12 | | |
13 | | #include <algorithm> |
14 | | #include <bit> |
15 | | #include <cassert> |
16 | | #include <cstdio> |
17 | | #include <utility> |
18 | | #include <vector> |
19 | | |
20 | | namespace { |
21 | | |
22 | | constexpr uint32_t INVALID = 0xFFFFFFFF; |
23 | | |
24 | | uint32_t DecodeBits(std::vector<bool>::const_iterator& bitpos, const std::vector<bool>::const_iterator& endpos, uint8_t minval, const std::vector<uint8_t> &bit_sizes) |
25 | 0 | { |
26 | 0 | uint32_t val = minval; |
27 | 0 | bool bit; |
28 | 0 | for (std::vector<uint8_t>::const_iterator bit_sizes_it = bit_sizes.begin(); |
29 | 0 | bit_sizes_it != bit_sizes.end(); ++bit_sizes_it) { |
30 | 0 | if (bit_sizes_it + 1 != bit_sizes.end()) { |
31 | 0 | if (bitpos == endpos) break; |
32 | 0 | bit = *bitpos; |
33 | 0 | bitpos++; |
34 | 0 | } else { |
35 | 0 | bit = 0; |
36 | 0 | } |
37 | 0 | if (bit) { |
38 | 0 | val += (1 << *bit_sizes_it); |
39 | 0 | } else { |
40 | 0 | for (int b = 0; b < *bit_sizes_it; b++) { |
41 | 0 | if (bitpos == endpos) return INVALID; // Reached EOF in mantissa |
42 | 0 | bit = *bitpos; |
43 | 0 | bitpos++; |
44 | 0 | val += bit << (*bit_sizes_it - 1 - b); |
45 | 0 | } |
46 | 0 | return val; |
47 | 0 | } |
48 | 0 | } |
49 | 0 | return INVALID; // Reached EOF in exponent |
50 | 0 | } |
51 | | |
52 | | enum class Instruction : uint32_t |
53 | | { |
54 | | RETURN = 0, |
55 | | JUMP = 1, |
56 | | MATCH = 2, |
57 | | DEFAULT = 3, |
58 | | }; |
59 | | |
60 | | const std::vector<uint8_t> TYPE_BIT_SIZES{0, 0, 1}; |
61 | | Instruction DecodeType(std::vector<bool>::const_iterator& bitpos, const std::vector<bool>::const_iterator& endpos) |
62 | 0 | { |
63 | 0 | return Instruction(DecodeBits(bitpos, endpos, 0, TYPE_BIT_SIZES)); |
64 | 0 | } |
65 | | |
66 | | const std::vector<uint8_t> ASN_BIT_SIZES{15, 16, 17, 18, 19, 20, 21, 22, 23, 24}; |
67 | | uint32_t DecodeASN(std::vector<bool>::const_iterator& bitpos, const std::vector<bool>::const_iterator& endpos) |
68 | 0 | { |
69 | 0 | return DecodeBits(bitpos, endpos, 1, ASN_BIT_SIZES); |
70 | 0 | } |
71 | | |
72 | | |
73 | | const std::vector<uint8_t> MATCH_BIT_SIZES{1, 2, 3, 4, 5, 6, 7, 8}; |
74 | | uint32_t DecodeMatch(std::vector<bool>::const_iterator& bitpos, const std::vector<bool>::const_iterator& endpos) |
75 | 0 | { |
76 | 0 | return DecodeBits(bitpos, endpos, 2, MATCH_BIT_SIZES); |
77 | 0 | } |
78 | | |
79 | | |
80 | | const std::vector<uint8_t> JUMP_BIT_SIZES{5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30}; |
81 | | uint32_t DecodeJump(std::vector<bool>::const_iterator& bitpos, const std::vector<bool>::const_iterator& endpos) |
82 | 0 | { |
83 | 0 | return DecodeBits(bitpos, endpos, 17, JUMP_BIT_SIZES); |
84 | 0 | } |
85 | | |
86 | | } |
87 | | |
88 | | uint32_t Interpret(const std::vector<bool> &asmap, const std::vector<bool> &ip) |
89 | 0 | { |
90 | 0 | std::vector<bool>::const_iterator pos = asmap.begin(); |
91 | 0 | const std::vector<bool>::const_iterator endpos = asmap.end(); |
92 | 0 | uint8_t bits = ip.size(); |
93 | 0 | uint32_t default_asn = 0; |
94 | 0 | uint32_t jump, match, matchlen; |
95 | 0 | Instruction opcode; |
96 | 0 | while (pos != endpos) { |
97 | 0 | opcode = DecodeType(pos, endpos); |
98 | 0 | if (opcode == Instruction::RETURN) { |
99 | 0 | default_asn = DecodeASN(pos, endpos); |
100 | 0 | if (default_asn == INVALID) break; // ASN straddles EOF |
101 | 0 | return default_asn; |
102 | 0 | } else if (opcode == Instruction::JUMP) { |
103 | 0 | jump = DecodeJump(pos, endpos); |
104 | 0 | if (jump == INVALID) break; // Jump offset straddles EOF |
105 | 0 | if (bits == 0) break; // No input bits left |
106 | 0 | if (int64_t{jump} >= int64_t{endpos - pos}) break; // Jumping past EOF |
107 | 0 | if (ip[ip.size() - bits]) { |
108 | 0 | pos += jump; |
109 | 0 | } |
110 | 0 | bits--; |
111 | 0 | } else if (opcode == Instruction::MATCH) { |
112 | 0 | match = DecodeMatch(pos, endpos); |
113 | 0 | if (match == INVALID) break; // Match bits straddle EOF |
114 | 0 | matchlen = std::bit_width(match) - 1; |
115 | 0 | if (bits < matchlen) break; // Not enough input bits |
116 | 0 | for (uint32_t bit = 0; bit < matchlen; bit++) { |
117 | 0 | if ((ip[ip.size() - bits]) != ((match >> (matchlen - 1 - bit)) & 1)) { |
118 | 0 | return default_asn; |
119 | 0 | } |
120 | 0 | bits--; |
121 | 0 | } |
122 | 0 | } else if (opcode == Instruction::DEFAULT) { |
123 | 0 | default_asn = DecodeASN(pos, endpos); |
124 | 0 | if (default_asn == INVALID) break; // ASN straddles EOF |
125 | 0 | } else { |
126 | 0 | break; // Instruction straddles EOF |
127 | 0 | } |
128 | 0 | } |
129 | 0 | assert(false); // Reached EOF without RETURN, or aborted (see any of the breaks above) - should have been caught by SanityCheckASMap below |
130 | 0 | return 0; // 0 is not a valid ASN |
131 | 0 | } |
132 | | |
133 | | bool SanityCheckASMap(const std::vector<bool>& asmap, int bits) |
134 | 0 | { |
135 | 0 | const std::vector<bool>::const_iterator begin = asmap.begin(), endpos = asmap.end(); |
136 | 0 | std::vector<bool>::const_iterator pos = begin; |
137 | 0 | std::vector<std::pair<uint32_t, int>> jumps; // All future positions we may jump to (bit offset in asmap -> bits to consume left) |
138 | 0 | jumps.reserve(bits); |
139 | 0 | Instruction prevopcode = Instruction::JUMP; |
140 | 0 | bool had_incomplete_match = false; |
141 | 0 | while (pos != endpos) { |
142 | 0 | uint32_t offset = pos - begin; |
143 | 0 | if (!jumps.empty() && offset >= jumps.back().first) return false; // There was a jump into the middle of the previous instruction |
144 | 0 | Instruction opcode = DecodeType(pos, endpos); |
145 | 0 | if (opcode == Instruction::RETURN) { |
146 | 0 | if (prevopcode == Instruction::DEFAULT) return false; // There should not be any RETURN immediately after a DEFAULT (could be combined into just RETURN) |
147 | 0 | uint32_t asn = DecodeASN(pos, endpos); |
148 | 0 | if (asn == INVALID) return false; // ASN straddles EOF |
149 | 0 | if (jumps.empty()) { |
150 | | // Nothing to execute anymore |
151 | 0 | if (endpos - pos > 7) return false; // Excessive padding |
152 | 0 | while (pos != endpos) { |
153 | 0 | if (*pos) return false; // Nonzero padding bit |
154 | 0 | ++pos; |
155 | 0 | } |
156 | 0 | return true; // Sanely reached EOF |
157 | 0 | } else { |
158 | | // Continue by pretending we jumped to the next instruction |
159 | 0 | offset = pos - begin; |
160 | 0 | if (offset != jumps.back().first) return false; // Unreachable code |
161 | 0 | bits = jumps.back().second; // Restore the number of bits we would have had left after this jump |
162 | 0 | jumps.pop_back(); |
163 | 0 | prevopcode = Instruction::JUMP; |
164 | 0 | } |
165 | 0 | } else if (opcode == Instruction::JUMP) { |
166 | 0 | uint32_t jump = DecodeJump(pos, endpos); |
167 | 0 | if (jump == INVALID) return false; // Jump offset straddles EOF |
168 | 0 | if (int64_t{jump} > int64_t{endpos - pos}) return false; // Jump out of range |
169 | 0 | if (bits == 0) return false; // Consuming bits past the end of the input |
170 | 0 | --bits; |
171 | 0 | uint32_t jump_offset = pos - begin + jump; |
172 | 0 | if (!jumps.empty() && jump_offset >= jumps.back().first) return false; // Intersecting jumps |
173 | 0 | jumps.emplace_back(jump_offset, bits); |
174 | 0 | prevopcode = Instruction::JUMP; |
175 | 0 | } else if (opcode == Instruction::MATCH) { |
176 | 0 | uint32_t match = DecodeMatch(pos, endpos); |
177 | 0 | if (match == INVALID) return false; // Match bits straddle EOF |
178 | 0 | int matchlen = std::bit_width(match) - 1; |
179 | 0 | if (prevopcode != Instruction::MATCH) had_incomplete_match = false; |
180 | 0 | if (matchlen < 8 && had_incomplete_match) return false; // Within a sequence of matches only at most one should be incomplete |
181 | 0 | had_incomplete_match = (matchlen < 8); |
182 | 0 | if (bits < matchlen) return false; // Consuming bits past the end of the input |
183 | 0 | bits -= matchlen; |
184 | 0 | prevopcode = Instruction::MATCH; |
185 | 0 | } else if (opcode == Instruction::DEFAULT) { |
186 | 0 | if (prevopcode == Instruction::DEFAULT) return false; // There should not be two successive DEFAULTs (they could be combined into one) |
187 | 0 | uint32_t asn = DecodeASN(pos, endpos); |
188 | 0 | if (asn == INVALID) return false; // ASN straddles EOF |
189 | 0 | prevopcode = Instruction::DEFAULT; |
190 | 0 | } else { |
191 | 0 | return false; // Instruction straddles EOF |
192 | 0 | } |
193 | 0 | } |
194 | 0 | return false; // Reached EOF without RETURN instruction |
195 | 0 | } |
196 | | |
197 | | std::vector<bool> DecodeAsmap(fs::path path) |
198 | 0 | { |
199 | 0 | std::vector<bool> bits; |
200 | 0 | FILE *filestr = fsbridge::fopen(path, "rb"); |
201 | 0 | AutoFile file{filestr}; |
202 | 0 | if (file.IsNull()) { |
203 | 0 | LogPrintf("Failed to open asmap file from disk\n"); Line | Count | Source | 266 | 0 | #define LogPrintf(...) LogInfo(__VA_ARGS__) Line | Count | Source | 261 | 0 | #define LogInfo(...) LogPrintLevel_(BCLog::LogFlags::ALL, BCLog::Level::Info, __VA_ARGS__) Line | Count | Source | 255 | 0 | #define LogPrintLevel_(category, level, ...) LogPrintFormatInternal(__func__, __FILE__, __LINE__, category, level, __VA_ARGS__) |
|
|
|
204 | 0 | return bits; |
205 | 0 | } |
206 | 0 | file.seek(0, SEEK_END); |
207 | 0 | int length = file.tell(); |
208 | 0 | LogPrintf("Opened asmap file %s (%d bytes) from disk\n", fs::quoted(fs::PathToString(path)), length); Line | Count | Source | 266 | 0 | #define LogPrintf(...) LogInfo(__VA_ARGS__) Line | Count | Source | 261 | 0 | #define LogInfo(...) LogPrintLevel_(BCLog::LogFlags::ALL, BCLog::Level::Info, __VA_ARGS__) Line | Count | Source | 255 | 0 | #define LogPrintLevel_(category, level, ...) LogPrintFormatInternal(__func__, __FILE__, __LINE__, category, level, __VA_ARGS__) |
|
|
|
209 | 0 | file.seek(0, SEEK_SET); |
210 | 0 | uint8_t cur_byte; |
211 | 0 | for (int i = 0; i < length; ++i) { |
212 | 0 | file >> cur_byte; |
213 | 0 | for (int bit = 0; bit < 8; ++bit) { |
214 | 0 | bits.push_back((cur_byte >> bit) & 1); |
215 | 0 | } |
216 | 0 | } |
217 | 0 | if (!SanityCheckASMap(bits, 128)) { |
218 | 0 | LogPrintf("Sanity check of asmap file %s failed\n", fs::quoted(fs::PathToString(path))); Line | Count | Source | 266 | 0 | #define LogPrintf(...) LogInfo(__VA_ARGS__) Line | Count | Source | 261 | 0 | #define LogInfo(...) LogPrintLevel_(BCLog::LogFlags::ALL, BCLog::Level::Info, __VA_ARGS__) Line | Count | Source | 255 | 0 | #define LogPrintLevel_(category, level, ...) LogPrintFormatInternal(__func__, __FILE__, __LINE__, category, level, __VA_ARGS__) |
|
|
|
219 | 0 | return {}; |
220 | 0 | } |
221 | 0 | return bits; |
222 | 0 | } |
223 | | |