-
Notifications
You must be signed in to change notification settings - Fork 302
/
Copy pathfuzzer.cpp
385 lines (309 loc) · 13.6 KB
/
fuzzer.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
// evmone-fuzzer: LibFuzzer based testing tool for EVMC-compatible EVM implementations.
// Copyright 2019 The evmone Authors.
// SPDX-License-Identifier: Apache-2.0
#include <evmc/mocked_host.hpp>
#include <evmone/evmone.h>
#include <test/utils/bytecode.hpp>
#include <test/utils/utils.hpp>
#include <cstring>
#include <iostream>
#include <limits>
inline std::ostream& operator<<(std::ostream& os, const evmc_address& addr)
{
return os << hex({addr.bytes, sizeof(addr.bytes)});
}
inline std::ostream& operator<<(std::ostream& os, const evmc_bytes32& v)
{
return os << hex({v.bytes, sizeof(v.bytes)});
}
/// Writes a byte view to the stream as the result of hex() applied to it.
inline std::ostream& operator<<(std::ostream& os, const bytes_view& v)
{
    const auto text = hex(v);
    return os << text;
}
/// Checks a condition and, when it does not hold, prints a diagnostic to stderr and traps.
///
/// @param cond      The evaluated condition.
/// @param cond_str  The source text of the condition (used only in the diagnostic).
/// @param file      The source file name reported in the diagnostic.
/// @param line      The source line reported in the diagnostic.
[[clang::always_inline]] inline void assert_true(
    bool cond, const char* cond_str, const char* file, int line)
{
    // Nothing to report when the condition holds.
    if (cond)
        return;

    std::cerr << "ASSERTION FAILED: \"" << cond_str << "\"\n\tin " << file << ":" << line
              << std::endl;
    __builtin_trap();
}

#define ASSERT(COND) assert_true(COND, #COND, __FILE__, __LINE__)
/// Checks that two values compare equal and, when they do not, prints both the compared
/// expressions and their values to stderr and traps.
///
/// Both types must be comparable with `==` and streamable to std::ostream.
///
/// @param a      Left-hand value.
/// @param b      Right-hand value.
/// @param a_str  The source text of the left-hand expression.
/// @param b_str  The source text of the right-hand expression.
/// @param file   The source file name reported in the diagnostic.
/// @param line   The source line reported in the diagnostic.
template <typename T1, typename T2>
[[clang::always_inline]] inline void assert_eq(
    const T1& a, const T2& b, const char* a_str, const char* b_str, const char* file, int line)
{
    // Equal values need no diagnostic.
    if (a == b)
        return;

    std::cerr << "ASSERTION FAILED: \"" << a_str << " == " << b_str << "\"\n\twith " << a
              << " != " << b << "\n\tin " << file << ":" << line << std::endl;
    __builtin_trap();
}

#define ASSERT_EQ(A, B) assert_eq(A, B, #A, #B, __FILE__, __LINE__)
/// Value of the PRINT environment variable, or null when it is not set.
/// A non-null value makes the fuzzer entry point dump each decoded input to stdout.
static auto print_input = std::getenv("PRINT");
/// The reference VM: evmone Baseline
static auto ref_vm = evmc::VM{evmc_create_evmone()};
/// The VMs under test. Each one is executed with the same input as the reference VM
/// and its results are compared against the reference results.
static evmc::VM external_vms[] = {
// evmone created with the "advanced" option set (empty option value).
evmc::VM{evmc_create_evmone(), {{"advanced", ""}}},
};
/// Mocked host used by the fuzzer. It extends evmc::MockedHost by adjusting the result of
/// every call made through the host so that the gas left and the create address vary
/// with the fuzz input.
class FuzzHost : public evmc::MockedHost
{
public:
    /// Selects how much gas a call reports as left:
    /// 0 - no gas, 1 - the whole gas of the message, otherwise msg.gas / (factor + 3).
    uint8_t gas_left_factor = 0;

    /// Produces the call result: takes the result of MockedHost::call(), overrides its
    /// gas_left according to gas_left_factor and, for CREATE/CREATE2 messages, fills the
    /// create address from the beginning of the output.
    ///
    /// @param msg  The message of the call requested by the VM.
    /// @return The adjusted call result.
    evmc::Result call(const evmc_message& msg) noexcept override
    {
        auto result = MockedHost::call(msg);

        // Set gas_left.
        if (gas_left_factor == 0)
            result.gas_left = 0;
        else if (gas_left_factor == 1)
            result.gas_left = msg.gas;
        else
            result.gas_left = msg.gas / (gas_left_factor + 3);

        if (msg.kind == EVMC_CREATE || msg.kind == EVMC_CREATE2)
        {
            // Use the output to fill the create address.
            // We still keep the output to check if VM is going to ignore it.
            const auto copy_size = std::min(sizeof(result.create_address), result.output_size);

            // Passing a null pointer to memcpy is undefined behavior even for a zero size,
            // so skip the copy when there is no output to copy from.
            if (result.output_data != nullptr && copy_size != 0)
                std::memcpy(result.create_address.bytes, result.output_data, copy_size);
        }
        return result;
    }
};
/// The newest "old" EVM revision. Lower priority.
static constexpr auto old_rev = EVMC_SPURIOUS_DRAGON;
/// The additional gas limit cap for "old" EVM revisions.
static constexpr auto old_rev_max_gas = 500000;
/// A single decoded fuzzing case: the EVM revision, the message to execute and the host.
///
/// A default-constructed object is the "invalid input" marker: its message gas is -1
/// and it converts to false.
struct fuzz_input
{
    evmc_revision rev{};
    evmc_message msg{};
    FuzzHost host;

    /// Creates invalid input.
    fuzz_input() noexcept
    {
        msg.gas = -1;
    }

    /// Tells whether the input is valid, i.e. the gas does not hold the -1 marker.
    explicit operator bool() const noexcept
    {
        const bool is_invalid = (msg.gas == -1);
        return !is_invalid;
    }
};
/// Expands one byte into a 32-byte value with a chosen bit pattern.
///
/// Meaning of the bits of `b`:
/// - bits 7-6: select the length of the trailing byte region: 1, 8, 16 or 32 bytes,
/// - bit 5: when set, every byte of the region is set to 0xff,
/// - bit 4: selects the byte to be XOR-ed with the 4-bit payload: when set, the byte
///   directly preceding the region (the last byte when the region spans the whole value)
///   receives the payload in its low nibble; otherwise the first byte of the region
///   receives it in its high nibble,
/// - bits 3-0: the payload.
inline evmc::uint256be generate_interesting_value(uint8_t b) noexcept
{
    const auto length_selector = (b >> 6) & 0b11;
    const bool fill_region = ((b >> 5) & 0b1) != 0;
    const bool mark_before_region = ((b >> 4) & 0b1) != 0;
    const auto payload = b & 0b1111;

    evmc::uint256be result{};
    constexpr auto total = sizeof(result);

    const size_t region = (length_selector != 0) ? (size_t{1} << (length_selector + 2)) : 1;
    const auto region_begin = total - region;

    if (fill_region)
    {
        for (size_t offset = 0; offset < region; ++offset)
            result.bytes[region_begin + offset] = 0xff;
    }

    if (mark_before_region)
    {
        // The modulo makes a full-size region wrap to the last byte.
        const auto index = total - region % total - 1;
        result.bytes[index] ^= payload;
    }
    else
    {
        result.bytes[region_begin] ^= payload << 4;
    }

    return result;
}
/// Expands one byte into an address with a chosen bit pattern.
///
/// Meaning of the bits of `b`:
/// - bits 7-6: select the length of the trailing byte region: 1, 2, 4 or 20 bytes,
/// - bit 5: when set, every byte of the region is set to 0xff,
/// - bit 4: selects the byte to be XOR-ed with the 4-bit payload: when set, the byte
///   directly preceding the region (the last byte when the region spans the whole address)
///   receives the payload in its low nibble; otherwise the first byte of the region
///   receives it in its high nibble,
/// - bits 3-0: the payload.
inline evmc::address generate_interesting_address(uint8_t b) noexcept
{
    const auto length_selector = (b >> 6) & 0b11;
    const bool fill_region = ((b >> 5) & 0b1) != 0;
    const bool mark_before_region = ((b >> 4) & 0b1) != 0;
    const auto payload = b & 0b1111;

    evmc::address result{};
    constexpr auto total = sizeof(result);

    const size_t region = (length_selector == 3) ? size_t{20} : (size_t{1} << length_selector);
    const auto region_begin = total - region;

    if (fill_region)
    {
        for (size_t offset = 0; offset < region; ++offset)
            result.bytes[region_begin + offset] = 0xff;
    }

    if (mark_before_region)
    {
        // The modulo makes a full-size region wrap to the last byte.
        const auto index = total - region % total - 1;
        result.bytes[index] ^= payload;
    }
    else
    {
        result.bytes[region_begin] ^= payload << 4;
    }

    return result;
}
/// Maps a 2-bit selector to one of four call depths: 0, 1, 1023 or 1024.
/// Only the two lowest bits of the argument are used.
inline int generate_depth(uint8_t x_2bits) noexcept
{
    const bool high_bit = (x_2bits & 0b10) != 0;
    const bool low_bit = (x_2bits & 0b01) != 0;

    const int base = high_bit ? 1023 : 0;
    const int step = low_bit ? 1 : 0;
    return base + step;
}
/// Derives the block number from an 8-bit value by scaling it by 97.
/// The result is kept fairly small on purpose because the block number affects blockhash().
inline int expand_block_number(uint8_t x) noexcept
{
    constexpr int multiplier = 97;
    return multiplier * x;
}
/// Derives the block timestamp from an 8-bit value: values below 255 are scaled by 16777619,
/// and 255 maps to the maximum int64_t value.
inline int64_t expand_block_timestamp(uint8_t x) noexcept
{
    // TODO: If timestamp is -1 Aleth and evmone disagrees how to convert it to uint256.
    if (x == 255)
        return std::numeric_limits<int64_t>::max();

    constexpr int64_t multiplier = 16777619;
    return multiplier * x;
}
/// Derives the block gas limit from an 8-bit value: 0 stays 0, any other value divides
/// the maximum int64_t value.
inline int64_t expand_block_gas_limit(uint8_t x) noexcept
{
    // Zero is handled separately to avoid the division by zero.
    if (x == 0)
        return 0;

    constexpr auto max_gas_limit = std::numeric_limits<int64_t>::max();
    return max_gas_limit / x;
}
/// Decodes a raw fuzzer buffer into an execution request: EVM revision, message and host state.
///
/// Layout of `data`:
/// - bytes 0-23: fixed-size header; every field below is derived from its bytes,
/// - the following `input_size_16bits` bytes: the message input,
/// - all remaining bytes: the code of the recipient account.
///
/// @param data       The fuzzer-provided bytes. The message input and the mocked call output
///                   of the result point into this buffer.
/// @param data_size  The number of bytes available at `data`.
/// @return The populated input, or the invalid input (converts to false) when the buffer is
///         shorter than the header or does not contain the declared amount of message input.
fuzz_input populate_input(const uint8_t* data, size_t data_size) noexcept
{
auto in = fuzz_input{};
constexpr auto min_required_size = 24;
if (data_size < min_required_size)
return in;
// Byte 0 packs four fields: revision (4 bits), message kind (1 bit), static flag (1 bit)
// and depth selector (2 bits).
const auto rev_4bits = data[0] >> 4;
const auto kind_1bit = (data[0] >> 3) & 0b1;
const auto static_1bit = (data[0] >> 2) & 0b1;
const auto depth_2bits = uint8_t(data[0] & 0b11);
const auto gas_24bits = (data[1] << 16) | (data[2] << 8) | data[3]; // Max 16777215 (2^24 - 1).
const auto input_size_16bits = unsigned(data[4] << 8) | data[5];
const auto destination_8bits = data[6];
const auto sender_8bits = data[7];
const auto value_8bits = data[8];
const auto create2_salt_8bits = data[9];
const auto tx_gas_price_8bits = data[10];
const auto tx_origin_8bits = data[11];
const auto block_coinbase_8bits = data[12];
const auto block_number_8bits = data[13];
const auto block_timestamp_8bits = data[14];
const auto block_gas_limit_8bits = data[15];
const auto block_prev_randao_8bits = data[16];
const auto chainid_8bits = data[17];
const auto account_balance_8bits = data[18];
const auto account_storage_key1_8bits = data[19];
const auto account_storage_key2_8bits = data[20];
const auto account_codehash_8bits = data[21];
// TODO: Add another account?
// Only the high nibble of byte 22 and the low nibble of byte 23 are used.
const auto call_result_status_4bits = data[22] >> 4;
const auto call_result_gas_left_factor_4bits = uint8_t(data[23] & 0b1111);
// Skip the header: from now on `data` points to the message input.
data += min_required_size;
data_size -= min_required_size;
if (data_size < input_size_16bits) // Not enough data for input.
return in;
// Revisions above the latest stable one are clamped to the latest stable one.
in.rev = (rev_4bits > EVMC_LATEST_STABLE_REVISION) ? EVMC_LATEST_STABLE_REVISION :
static_cast<evmc_revision>(rev_4bits);
// The message kind should not matter but this 1 bit was free.
in.msg.kind = kind_1bit ? EVMC_CREATE : EVMC_CALL;
in.msg.flags = static_1bit ? EVMC_STATIC : 0;
in.msg.depth = generate_depth(depth_2bits);
// Set the gas limit. For old revisions cap the gas limit more because:
// - they are less priority,
// - pre Tangerine Whistle calls are extremely cheap and it is easy to find slow running units.
// Assigning the gas also overwrites the -1 marker, which makes the input valid.
in.msg.gas = in.rev <= old_rev ? std::min(gas_24bits, old_rev_max_gas) : gas_24bits;
in.msg.recipient = generate_interesting_address(destination_8bits);
in.msg.sender = generate_interesting_address(sender_8bits);
in.msg.input_size = input_size_16bits;
in.msg.input_data = data;
in.msg.value = generate_interesting_value(value_8bits);
// Should be ignored by VMs.
in.msg.create2_salt = generate_interesting_value(create2_salt_8bits);
// Skip the message input: from now on `data` points to the code.
data += in.msg.input_size;
data_size -= in.msg.input_size;
in.host.tx_context.tx_gas_price = generate_interesting_value(tx_gas_price_8bits);
in.host.tx_context.tx_origin = generate_interesting_address(tx_origin_8bits);
in.host.tx_context.block_coinbase = generate_interesting_address(block_coinbase_8bits);
in.host.tx_context.block_number = expand_block_number(block_number_8bits);
in.host.tx_context.block_timestamp = expand_block_timestamp(block_timestamp_8bits);
in.host.tx_context.block_gas_limit = expand_block_gas_limit(block_gas_limit_8bits);
in.host.tx_context.block_prev_randao = generate_interesting_value(block_prev_randao_8bits);
in.host.tx_context.chain_id = generate_interesting_value(chainid_8bits);
// The only account set up in the host is the recipient of the message.
auto& account = in.host.accounts[in.msg.recipient];
account.balance = generate_interesting_value(account_balance_8bits);
const auto storage_key1 = generate_interesting_value(account_storage_key1_8bits);
const auto storage_key2 = generate_interesting_value(account_storage_key2_8bits);
// Three storage entries are written in this order: the zero key, key1 and key2.
account.storage[{}] = storage_key2;
account.storage[storage_key1] = storage_key2;
// Add dirty value as if it has been already modified in this transaction.
account.storage[storage_key2] = {storage_key1, storage_key2};
account.codehash = generate_interesting_value(account_codehash_8bits);
account.code = {data, data_size}; // Use remaining data as code.
in.host.call_result.status_code = static_cast<evmc_status_code>(call_result_status_4bits);
in.host.gas_left_factor = call_result_gas_left_factor_4bits;
// Use 3/5 of the input from the end as the potential call output.
const auto offset = in.msg.input_size * 2 / 5;
in.host.call_result.output_data = &in.msg.input_data[offset];
in.host.call_result.output_size = in.msg.input_size - offset;
return in;
}
inline auto hex(const evmc_address& addr) noexcept
{
return hex({addr.bytes, sizeof(addr)});
}
/// Validates a status code returned by a VM and reduces it to one of the comparable values.
///
/// Traps when the status code is negative. Status codes up to EVMC_REVERT are returned
/// unchanged; every greater one is reported as EVMC_FAILURE.
inline evmc_status_code check_and_normalize(evmc_status_code status) noexcept
{
    ASSERT(status >= 0);

    if (status > EVMC_REVERT)
        return EVMC_FAILURE;
    return status;
}
/// The fuzzer entry point: executes one input on the reference VM and on every external VM
/// and traps (via ASSERT / ASSERT_EQ) on the first observed difference.
///
/// Compared are: the normalized status code, the gas left, the output and - unless the
/// reference execution ended with EVMC_FAILURE - the calls, logs, blockhash queries and
/// selfdestructs recorded by the hosts.
///
/// @param data       The raw fuzzer input, decoded by populate_input().
/// @param data_size  The size of the raw fuzzer input.
/// @return Always 0. Inputs rejected by populate_input() are skipped without execution.
extern "C" int LLVMFuzzerTestOneInput(const uint8_t* data, size_t data_size) noexcept
{
auto in = populate_input(data, data_size);
if (!in)
return 0;
auto ref_host = in.host; // Copy Host.
// The code is taken from the reference host's copy of the recipient account
// and is reused for the executions on all VMs.
const auto& code = ref_host.accounts[in.msg.recipient].code;
// Optional dump of the decoded input, enabled by the PRINT environment variable.
if (print_input != nullptr)
{
std::cout << "rev: " << int{in.rev} << "\n";
std::cout << "depth: " << int{in.msg.depth} << "\n";
std::cout << "code: " << hex(code) << "\n";
std::cout << "decoded: " << decode(code) << "\n";
std::cout << "input: " << hex({in.msg.input_data, in.msg.input_size}) << "\n";
std::cout << "account: " << hex(in.msg.recipient) << "\n";
std::cout << "caller: " << hex(in.msg.sender) << "\n";
std::cout << "value: " << in.msg.value << "\n";
std::cout << "gas: " << in.msg.gas << "\n";
std::cout << "balance: " << in.host.accounts[in.msg.recipient].balance << "\n";
std::cout << "coinbase: " << in.host.tx_context.block_coinbase << "\n";
std::cout << "prevrandao: " << in.host.tx_context.block_prev_randao << "\n";
std::cout << "timestamp: " << in.host.tx_context.block_timestamp << "\n";
std::cout << "chainid: " << in.host.tx_context.chain_id << "\n";
}
const auto ref_res = ref_vm.execute(ref_host, in.rev, in.msg, code.data(), code.size());
const auto ref_status = check_and_normalize(ref_res.status_code);
// A failed execution is expected to report no gas left.
if (ref_status == EVMC_FAILURE)
ASSERT_EQ(ref_res.gas_left, 0);
for (auto& vm : external_vms)
{
// Every VM gets a fresh copy of the host, so what it records can be compared
// with what the reference host has recorded.
auto host = in.host; // Copy Host.
const auto res = vm.execute(host, in.rev, in.msg, code.data(), code.size());
const auto status = check_and_normalize(res.status_code);
ASSERT_EQ(status, ref_status);
ASSERT_EQ(res.gas_left, ref_res.gas_left);
ASSERT_EQ(bytes_view(res.output_data, res.output_size),
bytes_view(ref_res.output_data, ref_res.output_size));
// The host interactions are compared only if the reference execution has not failed.
if (ref_status != EVMC_FAILURE)
{
ASSERT_EQ(ref_host.recorded_calls.size(), host.recorded_calls.size());
// Compare the recorded calls field by field, in the order they were made.
for (size_t i = 0; i < ref_host.recorded_calls.size(); ++i)
{
const auto& m1 = ref_host.recorded_calls[i];
const auto& m2 = host.recorded_calls[i];
ASSERT_EQ(m1.kind, m2.kind);
ASSERT_EQ(m1.flags, m2.flags);
ASSERT_EQ(m1.depth, m2.depth);
ASSERT_EQ(m1.gas, m2.gas);
ASSERT_EQ(evmc::address{m1.recipient}, evmc::address{m2.recipient});
ASSERT_EQ(evmc::address{m1.sender}, evmc::address{m2.sender});
ASSERT_EQ(bytes_view(m1.input_data, m1.input_size),
bytes_view(m2.input_data, m2.input_size));
ASSERT_EQ(evmc::uint256be{m1.value}, evmc::uint256be{m2.value});
ASSERT_EQ(evmc::bytes32{m1.create2_salt}, evmc::bytes32{m2.create2_salt});
}
// The four-iterator std::equal also reports a mismatch when the lengths differ.
ASSERT(std::equal(ref_host.recorded_logs.begin(), ref_host.recorded_logs.end(),
host.recorded_logs.begin(), host.recorded_logs.end()));
ASSERT_EQ(ref_host.recorded_blockhashes.size(), host.recorded_blockhashes.size());
ASSERT(std::equal(ref_host.recorded_blockhashes.begin(),
ref_host.recorded_blockhashes.end(), host.recorded_blockhashes.begin(),
host.recorded_blockhashes.end()));
ASSERT(std::equal(ref_host.recorded_selfdestructs.begin(),
ref_host.recorded_selfdestructs.end(), host.recorded_selfdestructs.begin(),
host.recorded_selfdestructs.end()));
// TODO: Enable account accesses check. Currently this is not possible because Aleth
// is doing additional unnecessary account existence checks in calls.
// ASSERT(std::equal(ref_host.recorded_account_accesses.begin(),
// ref_host.recorded_account_accesses.end(), host.recorded_account_accesses.begin(),
// host.recorded_account_accesses.end()));
}
}
return 0;
}