mirror of
https://github.com/AFLplusplus/AFLplusplus.git
synced 2025-06-17 20:28:08 +00:00
lots of fixes
This commit is contained in:
@ -3,4 +3,4 @@ cmplog: only add tokens that were found to fit?
|
|||||||
create from thin air if no good seed after a cycle and dict large enough?
|
create from thin air if no good seed after a cycle and dict large enough?
|
||||||
(static u32 no_of_struct_inputs;)
|
(static u32 no_of_struct_inputs;)
|
||||||
|
|
||||||
splicing -> check if whitespace/token is needed
|
splicing -> check if whitespace/token is needed
|
||||||
|
@ -38,8 +38,10 @@ typedef struct my_mutator {
|
|||||||
|
|
||||||
} my_mutator_t;
|
} my_mutator_t;
|
||||||
|
|
||||||
#define DEBUG \
|
#undef DEBUGF
|
||||||
|
#define DEBUGF \
|
||||||
if (unlikely(debug)) fprintf
|
if (unlikely(debug)) fprintf
|
||||||
|
#define IFDEBUG if (unlikely(debug))
|
||||||
|
|
||||||
static afl_state *afl_ptr;
|
static afl_state *afl_ptr;
|
||||||
static int debug = AUTOTOKENS_DEBUG;
|
static int debug = AUTOTOKENS_DEBUG;
|
||||||
@ -57,12 +59,12 @@ static unordered_map<u32, vector<u32> *> id_mapping;
|
|||||||
static unordered_map<string, u32> token_to_id;
|
static unordered_map<string, u32> token_to_id;
|
||||||
static unordered_map<u32, string> id_to_token;
|
static unordered_map<u32, string> id_to_token;
|
||||||
static string whitespace = AUTOTOKENS_WHITESPACE;
|
static string whitespace = AUTOTOKENS_WHITESPACE;
|
||||||
|
static string output;
|
||||||
static regex *regex_comment_custom;
|
static regex *regex_comment_custom;
|
||||||
static regex regex_comment_star("/\\*([:print:]|\n)*?\\*/",
|
static regex regex_comment_star("/\\*([:print:]|\n)*?\\*/",
|
||||||
regex::multiline | regex::optimize);
|
regex::multiline | regex::optimize);
|
||||||
static regex regex_word("[A-Za-z0-9_$.-]+", regex::optimize);
|
static regex regex_word("[A-Za-z0-9_$.-]+", regex::optimize);
|
||||||
static regex regex_whitespace(R"([ \t]+)", regex::optimize);
|
static regex regex_whitespace(R"([ \t]+)", regex::optimize);
|
||||||
static regex regex_string("\"[[:print:]]*?\"|'[[:print:]]*?'", regex::optimize);
|
|
||||||
static vector<u32> *s; // the structure of the currently selected input
|
static vector<u32> *s; // the structure of the currently selected input
|
||||||
|
|
||||||
u32 good_whitespace_or_singleval() {
|
u32 good_whitespace_or_singleval() {
|
||||||
@ -104,7 +106,7 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
MAX(AUTOTOKENS_CHANGE_MIN,
|
MAX(AUTOTOKENS_CHANGE_MIN,
|
||||||
MIN(m_size >> 3, HAVOC_CYCLES * afl_ptr->queue_cur->perf_score *
|
MIN(m_size >> 3, HAVOC_CYCLES * afl_ptr->queue_cur->perf_score *
|
||||||
afl_ptr->havoc_div / 256));
|
afl_ptr->havoc_div / 256));
|
||||||
// DEBUG(stderr, "structure size: %lu, rounds: %u \n", m.size(), rounds);
|
// DEBUGF(stderr, "structure size: %lu, rounds: %u \n", m.size(), rounds);
|
||||||
|
|
||||||
#if AUTOTOKENS_SPLICE_DISABLE == 1
|
#if AUTOTOKENS_SPLICE_DISABLE == 1
|
||||||
#define AUTOTOKENS_MUT_MAX 12
|
#define AUTOTOKENS_MUT_MAX 12
|
||||||
@ -112,7 +114,7 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
#define AUTOTOKENS_MUT_MAX 14
|
#define AUTOTOKENS_MUT_MAX 14
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
u32 max_rand = AUTOTOKENS_MUT_MAX;
|
u32 max_rand = AUTOTOKENS_MUT_MAX, new_item, pos;
|
||||||
|
|
||||||
for (i = 0; i < rounds; ++i) {
|
for (i = 0; i < rounds; ++i) {
|
||||||
|
|
||||||
@ -122,8 +124,8 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
case 0 ... 7: /* fall through */
|
case 0 ... 7: /* fall through */
|
||||||
{
|
{
|
||||||
|
|
||||||
u32 pos = rand_below(afl_ptr, m_size);
|
pos = rand_below(afl_ptr, m_size);
|
||||||
u32 cur_item = m[pos], new_item;
|
u32 cur_item = m[pos];
|
||||||
do {
|
do {
|
||||||
|
|
||||||
new_item = rand_below(afl_ptr, current_id);
|
new_item = rand_below(afl_ptr, current_id);
|
||||||
@ -135,7 +137,7 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
((whitespace_ids < new_item && whitespace_ids >= cur_item) ||
|
((whitespace_ids < new_item && whitespace_ids >= cur_item) ||
|
||||||
(whitespace_ids >= new_item && whitespace_ids < cur_item)))));
|
(whitespace_ids >= new_item && whitespace_ids < cur_item)))));
|
||||||
|
|
||||||
DEBUG(stderr, "MUT: %u -> %u\n", cur_item, new_item);
|
DEBUGF(stderr, "MUT: %u -> %u\n", cur_item, new_item);
|
||||||
m[pos] = new_item;
|
m[pos] = new_item;
|
||||||
break;
|
break;
|
||||||
|
|
||||||
@ -144,7 +146,6 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
/* INSERT (m_size +1 so we insert also after last place) */
|
/* INSERT (m_size +1 so we insert also after last place) */
|
||||||
case 8 ... 9: {
|
case 8 ... 9: {
|
||||||
|
|
||||||
u32 new_item;
|
|
||||||
do {
|
do {
|
||||||
|
|
||||||
new_item = rand_below(afl_ptr, current_id);
|
new_item = rand_below(afl_ptr, current_id);
|
||||||
@ -154,7 +155,7 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
u32 pos = rand_below(afl_ptr, m_size + 1);
|
u32 pos = rand_below(afl_ptr, m_size + 1);
|
||||||
m.insert(m.begin() + pos, new_item);
|
m.insert(m.begin() + pos, new_item);
|
||||||
++m_size;
|
++m_size;
|
||||||
DEBUG(stderr, "INS: %u at %u\n", new_item, pos);
|
DEBUGF(stderr, "INS: %u at %u\n", new_item, pos);
|
||||||
|
|
||||||
if (likely(!alternative_tokenize)) {
|
if (likely(!alternative_tokenize)) {
|
||||||
|
|
||||||
@ -212,7 +213,8 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
m.insert(m.begin() + dst_off, src->begin() + src_off,
|
m.insert(m.begin() + dst_off, src->begin() + src_off,
|
||||||
src->begin() + src_off + n);
|
src->begin() + src_off + n);
|
||||||
m_size += n;
|
m_size += n;
|
||||||
DEBUG(stderr, "SPLICE-INS: %u at %u\n", n, dst_off);
|
DEBUGF(stderr, "SPLICE-INS: %u at %u\n", n, dst_off);
|
||||||
|
|
||||||
break;
|
break;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -231,13 +233,36 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
copy(src->begin() + src_off, src->begin() + src_off + n,
|
copy(src->begin() + src_off, src->begin() + src_off + n,
|
||||||
m.begin() + dst_off);
|
m.begin() + dst_off);
|
||||||
|
|
||||||
DEBUG(stderr, "SPLICE-MUT: %u at %u\n", n, dst_off);
|
DEBUGF(stderr, "SPLICE-MUT: %u at %u\n", n, dst_off);
|
||||||
break;
|
break;
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (likely(!alternative_tokenize)) {
|
||||||
|
|
||||||
|
// do we need a whitespace/token at the beginning?
|
||||||
|
if (dst_off && id_to_token[m[dst_off - 1]].size() > 1 &&
|
||||||
|
id_to_token[m[dst_off]].size() > 1) {
|
||||||
|
|
||||||
|
m.insert(m.begin() + dst_off, good_whitespace_or_singleval());
|
||||||
|
++m_size;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
// do we need a whitespace/token at the end?
|
||||||
|
if (dst_off + n < m_size &&
|
||||||
|
id_to_token[m[dst_off + n - 1]].size() > 1 &&
|
||||||
|
id_to_token[m[dst_off + n]].size() > 1) {
|
||||||
|
|
||||||
|
m.insert(m.begin() + dst_off + n, good_whitespace_or_singleval());
|
||||||
|
++m_size;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
break;
|
break;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -249,11 +274,32 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
|
|
||||||
if (m_size > 8) {
|
if (m_size > 8) {
|
||||||
|
|
||||||
m.erase(m.begin() + rand_below(afl_ptr, m_size));
|
do {
|
||||||
--m_size;
|
|
||||||
|
pos = rand_below(afl_ptr, m_size);
|
||||||
|
|
||||||
|
} while (unlikely(pos < whitespace_ids));
|
||||||
|
|
||||||
|
// if what we delete will result in a missing whitespace/token,
|
||||||
|
// instead of deleting we switch the item to a whitespace or token.
|
||||||
|
if (likely(!alternative_tokenize) && pos && pos < m_size &&
|
||||||
|
id_to_token[m[pos - 1]].size() > 1 &&
|
||||||
|
id_to_token[m[pos + 1]].size() > 1) {
|
||||||
|
|
||||||
|
m[pos] = good_whitespace_or_singleval();
|
||||||
|
|
||||||
|
} else {
|
||||||
|
|
||||||
|
m.erase(m.begin() + pos);
|
||||||
|
--m_size;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
} else {
|
} else {
|
||||||
|
|
||||||
|
// if the data is already too small do not try to make it smaller
|
||||||
|
// again this run.
|
||||||
|
|
||||||
max_rand = AUTOTOKENS_MUT_MAX - 2;
|
max_rand = AUTOTOKENS_MUT_MAX - 2;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -262,14 +308,12 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// TODO: add full line insert splice, replace splace, delete
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
string output;
|
u32 m_size_1 = m_size - 1;
|
||||||
u32 m_size_1 = m_size - 1;
|
output = "";
|
||||||
|
|
||||||
for (i = 0; i < m_size; ++i) {
|
for (i = 0; i < m_size; ++i) {
|
||||||
|
|
||||||
@ -282,31 +326,108 @@ extern "C" size_t afl_custom_fuzz(my_mutator_t *data, u8 *buf, size_t buf_size,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
u32 mutated_size = output.size();
|
u32 mutated_size = (u32)output.size();
|
||||||
u8 *mutated_out = (u8 *)afl_realloc((void **)out_buf, mutated_size);
|
u8 *mutated_out = (u8 *)output.data();
|
||||||
|
|
||||||
if (unlikely(!mutated_out)) {
|
if (unlikely(mutated_size > max_size)) { mutated_size = max_size; }
|
||||||
|
|
||||||
*out_buf = NULL;
|
IFDEBUG {
|
||||||
return 0;
|
|
||||||
|
|
||||||
}
|
DEBUGF(stderr, "MUTATED to %u bytes:\n", mutated_size);
|
||||||
|
|
||||||
if (unlikely(debug)) {
|
|
||||||
|
|
||||||
DEBUG(stderr, "MUTATED to %u bytes:\n", mutated_size);
|
|
||||||
fwrite(output.data(), 1, mutated_size, stderr);
|
fwrite(output.data(), 1, mutated_size, stderr);
|
||||||
DEBUG(stderr, "\n---\n");
|
DEBUGF(stderr, "\n---\n");
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
memcpy(mutated_out, output.data(), mutated_size);
|
|
||||||
*out_buf = mutated_out;
|
*out_buf = mutated_out;
|
||||||
++fuzz_count;
|
++fuzz_count;
|
||||||
return mutated_size;
|
return mutated_size;
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* I get f*cking stack overflow using C++ regex with a regex of
|
||||||
|
"\"[[:print:]]*?\"" if this matches a long string even with regex::optimize
|
||||||
|
enabled :-( */
|
||||||
|
u8 my_search_string(string::const_iterator cur, string::const_iterator ende,
|
||||||
|
string::const_iterator *match_begin,
|
||||||
|
string::const_iterator *match_end) {
|
||||||
|
|
||||||
|
string::const_iterator start = cur, found_begin;
|
||||||
|
u8 quote_type = 0;
|
||||||
|
|
||||||
|
while (cur < ende) {
|
||||||
|
|
||||||
|
switch (*cur) {
|
||||||
|
|
||||||
|
case '"': {
|
||||||
|
|
||||||
|
if (cur == start || *(cur - 1) != '\\') {
|
||||||
|
|
||||||
|
if (!quote_type) {
|
||||||
|
|
||||||
|
found_begin = cur;
|
||||||
|
quote_type = 1;
|
||||||
|
|
||||||
|
} else if (quote_type == 1) {
|
||||||
|
|
||||||
|
*match_begin = found_begin;
|
||||||
|
*match_end = cur + 1;
|
||||||
|
return 1;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
break;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
case '\'': {
|
||||||
|
|
||||||
|
if (cur == start || *(cur - 1) != '\\') {
|
||||||
|
|
||||||
|
if (!quote_type) {
|
||||||
|
|
||||||
|
found_begin = cur;
|
||||||
|
quote_type = 2;
|
||||||
|
|
||||||
|
} else if (quote_type == 2) {
|
||||||
|
|
||||||
|
*match_begin = found_begin;
|
||||||
|
*match_end = cur + 1;
|
||||||
|
return 1;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
break;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
case '\n':
|
||||||
|
case '\r':
|
||||||
|
case 0: {
|
||||||
|
|
||||||
|
quote_type = 0;
|
||||||
|
break;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
default:
|
||||||
|
if (unlikely(quote_type && !isprint(*cur))) { quote_type = 0; }
|
||||||
|
break;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
++cur;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
return 0;
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
/* We are not using afl_custom_queue_new_entry() because not every corpus entry
|
/* We are not using afl_custom_queue_new_entry() because not every corpus entry
|
||||||
will be necessarily fuzzed. so we use afl_custom_queue_get() instead */
|
will be necessarily fuzzed. so we use afl_custom_queue_get() instead */
|
||||||
|
|
||||||
@ -321,7 +442,7 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
(only_fav && !afl_ptr->queue_cur->favored)) {
|
(only_fav && !afl_ptr->queue_cur->favored)) {
|
||||||
|
|
||||||
s = NULL;
|
s = NULL;
|
||||||
DEBUG(stderr, "cmplog not ascii or only_fav and not favorite\n");
|
DEBUGF(stderr, "cmplog not ascii or only_fav and not favorite\n");
|
||||||
return 0;
|
return 0;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -356,7 +477,7 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
}
|
}
|
||||||
|
|
||||||
++extras_cnt;
|
++extras_cnt;
|
||||||
DEBUG(stderr, "Added from dictionary: \"%s\"\n", ptr);
|
DEBUGF(stderr, "Added from dictionary: \"%s\"\n", ptr);
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -385,7 +506,7 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
}
|
}
|
||||||
|
|
||||||
++a_extras_cnt;
|
++a_extras_cnt;
|
||||||
DEBUG(stderr, "Added from auto dictionary: \"%s\"\n", ptr);
|
DEBUGF(stderr, "Added from auto dictionary: \"%s\"\n", ptr);
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -415,7 +536,7 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
fclose(fp);
|
fclose(fp);
|
||||||
file_mapping[fn] = structure; // NULL ptr so we don't read the file again
|
file_mapping[fn] = structure; // NULL ptr so we don't read the file again
|
||||||
s = NULL;
|
s = NULL;
|
||||||
DEBUG(stderr, "Too short (%lu) %s\n", len, filename);
|
DEBUGF(stderr, "Too short (%lu) %s\n", len, filename);
|
||||||
return 0;
|
return 0;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -443,14 +564,14 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
file_mapping[fn] = NULL;
|
file_mapping[fn] = NULL;
|
||||||
s = NULL;
|
s = NULL;
|
||||||
DEBUG(stderr, "Not text (%lu) %s\n", len, filename);
|
DEBUGF(stderr, "Not text (%lu) %s\n", len, filename);
|
||||||
return 0;
|
return 0;
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// DEBUG(stderr, "Read %lu bytes for %s\nBefore comment trim:\n%s\n",
|
// DEBUGF(stderr, "Read %lu bytes for %s\nBefore comment trim:\n%s\n",
|
||||||
// input.size(), filename, input.c_str());
|
// input.size(), filename, input.c_str());
|
||||||
|
|
||||||
if (regex_comment_custom) {
|
if (regex_comment_custom) {
|
||||||
@ -463,15 +584,15 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
DEBUG(stderr, "After replace %lu bytes for %s\n%s\n", input.size(),
|
DEBUGF(stderr, "After replace %lu bytes for %s\n%s\n", input.size(),
|
||||||
filename, input.c_str());
|
filename, input.c_str());
|
||||||
|
|
||||||
u32 spaces = count(input.begin(), input.end(), ' ');
|
u32 spaces = count(input.begin(), input.end(), ' ');
|
||||||
u32 tabs = count(input.begin(), input.end(), '\t');
|
u32 tabs = count(input.begin(), input.end(), '\t');
|
||||||
u32 linefeeds = count(input.begin(), input.end(), '\n');
|
u32 linefeeds = count(input.begin(), input.end(), '\n');
|
||||||
bool ends_with_linefeed = input[input.length() - 1] == '\n';
|
bool ends_with_linefeed = input[input.length() - 1] == '\n';
|
||||||
DEBUG(stderr, "spaces=%u tabs=%u linefeeds=%u ends=%u\n", spaces, tabs,
|
DEBUGF(stderr, "spaces=%u tabs=%u linefeeds=%u ends=%u\n", spaces, tabs,
|
||||||
linefeeds, ends_with_linefeed);
|
linefeeds, ends_with_linefeed);
|
||||||
all_spaces += spaces;
|
all_spaces += spaces;
|
||||||
all_tabs += tabs;
|
all_tabs += tabs;
|
||||||
all_lf += linefeeds;
|
all_lf += linefeeds;
|
||||||
@ -479,25 +600,28 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
// now extract all tokens
|
// now extract all tokens
|
||||||
vector<string> tokens;
|
vector<string> tokens;
|
||||||
smatch match;
|
string::const_iterator cur = input.begin(), ende = input.end(), found, prev,
|
||||||
string::const_iterator cur = input.begin(), ende = input.end(), found, prev;
|
match_begin, match_end;
|
||||||
|
|
||||||
DEBUG(stderr, "START!\n");
|
DEBUGF(stderr, "START!\n");
|
||||||
|
|
||||||
if (likely(!alternative_tokenize)) {
|
if (likely(!alternative_tokenize)) {
|
||||||
|
|
||||||
while (regex_search(cur, ende, match, regex_string,
|
while (my_search_string(cur, ende, &match_begin, &match_end)) {
|
||||||
regex_constants::match_any |
|
|
||||||
regex_constants::match_not_null |
|
|
||||||
regex_constants::match_continuous)) {
|
|
||||||
|
|
||||||
prev = cur;
|
prev = cur;
|
||||||
found = match[0].first;
|
found = match_begin;
|
||||||
cur = match[0].second;
|
cur = match_end;
|
||||||
DEBUG(stderr,
|
|
||||||
"string %s found at start %lu offset %lu continue at %lu\n",
|
IFDEBUG {
|
||||||
match[0].str().c_str(), prev - input.begin(), match.position(),
|
|
||||||
cur - input.begin());
|
string foo(match_begin, match_end);
|
||||||
|
DEBUGF(stderr,
|
||||||
|
"string %s found at start %lu offset %lu continue at %lu\n",
|
||||||
|
foo.c_str(), prev - input.begin(), found - prev,
|
||||||
|
cur - input.begin());
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
if (prev < found) { // there are items between search start and find
|
if (prev < found) { // there are items between search start and find
|
||||||
while (prev < found) {
|
while (prev < found) {
|
||||||
@ -512,8 +636,8 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
}
|
}
|
||||||
|
|
||||||
tokens.push_back(std::string(start, prev));
|
tokens.push_back(std::string(start, prev));
|
||||||
DEBUG(stderr, "WHITESPACE %ld \"%s\"\n", prev - start,
|
DEBUGF(stderr, "WHITESPACE %ld \"%s\"\n", prev - start,
|
||||||
tokens[tokens.size() - 1].c_str());
|
tokens[tokens.size() - 1].c_str());
|
||||||
|
|
||||||
} else if (isalnum(*prev) || *prev == '$' || *prev == '_') {
|
} else if (isalnum(*prev) || *prev == '$' || *prev == '_') {
|
||||||
|
|
||||||
@ -525,14 +649,14 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
tokens.push_back(std::string(start, prev));
|
tokens.push_back(string(start, prev));
|
||||||
DEBUG(stderr, "IDENTIFIER %ld \"%s\"\n", prev - start,
|
DEBUGF(stderr, "IDENTIFIER %ld \"%s\"\n", prev - start,
|
||||||
tokens[tokens.size() - 1].c_str());
|
tokens[tokens.size() - 1].c_str());
|
||||||
|
|
||||||
} else {
|
} else {
|
||||||
|
|
||||||
tokens.push_back(std::string(prev, prev + 1));
|
tokens.push_back(string(prev, prev + 1));
|
||||||
DEBUG(stderr, "OTHER \"%c\"\n", *prev);
|
DEBUGF(stderr, "OTHER \"%c\"\n", *prev);
|
||||||
++prev;
|
++prev;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -541,11 +665,12 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (match[0].length() > 0) { tokens.push_back(match[0]); }
|
tokens.push_back(string(match_begin, match_end));
|
||||||
|
DEBUGF(stderr, "TOK: %s\n", tokens[tokens.size() - 1].c_str());
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
DEBUG(stderr, "AFTER all strings\n");
|
DEBUGF(stderr, "AFTER all strings\n");
|
||||||
|
|
||||||
if (cur < ende) {
|
if (cur < ende) {
|
||||||
|
|
||||||
@ -561,8 +686,8 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
}
|
}
|
||||||
|
|
||||||
tokens.push_back(std::string(start, cur));
|
tokens.push_back(std::string(start, cur));
|
||||||
DEBUG(stderr, "WHITESPACE %ld \"%s\"\n", cur - start,
|
DEBUGF(stderr, "WHITESPACE %ld \"%s\"\n", cur - start,
|
||||||
tokens[tokens.size() - 1].c_str());
|
tokens[tokens.size() - 1].c_str());
|
||||||
|
|
||||||
} else if (isalnum(*cur) || *cur == '$' || *cur == '_') {
|
} else if (isalnum(*cur) || *cur == '$' || *cur == '_') {
|
||||||
|
|
||||||
@ -575,13 +700,13 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
}
|
}
|
||||||
|
|
||||||
tokens.push_back(std::string(start, cur));
|
tokens.push_back(std::string(start, cur));
|
||||||
DEBUG(stderr, "IDENTIFIER %ld \"%s\"\n", cur - start,
|
DEBUGF(stderr, "IDENTIFIER %ld \"%s\"\n", cur - start,
|
||||||
tokens[tokens.size() - 1].c_str());
|
tokens[tokens.size() - 1].c_str());
|
||||||
|
|
||||||
} else {
|
} else {
|
||||||
|
|
||||||
tokens.push_back(std::string(cur, cur + 1));
|
tokens.push_back(std::string(cur, cur + 1));
|
||||||
DEBUG(stderr, "OTHER \"%c\"\n", *cur);
|
DEBUGF(stderr, "OTHER \"%c\"\n", *cur);
|
||||||
++cur;
|
++cur;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -593,19 +718,21 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
} else {
|
} else {
|
||||||
|
|
||||||
// alternative tokenize
|
// alternative tokenize
|
||||||
|
while (my_search_string(cur, ende, &match_begin, &match_end)) {
|
||||||
while (regex_search(cur, ende, match, regex_string,
|
|
||||||
regex_constants::match_any |
|
|
||||||
regex_constants::match_not_null |
|
|
||||||
regex_constants::match_continuous)) {
|
|
||||||
|
|
||||||
prev = cur;
|
prev = cur;
|
||||||
found = match[0].first;
|
found = match_begin;
|
||||||
cur = match[0].second;
|
cur = match_end;
|
||||||
DEBUG(stderr,
|
IFDEBUG {
|
||||||
"string %s found at start %lu offset %lu continue at %lu\n",
|
|
||||||
match[0].str().c_str(), prev - input.begin(), match.position(),
|
string foo(match_begin, match_end);
|
||||||
cur - input.begin());
|
DEBUGF(stderr,
|
||||||
|
"string %s found at start %lu offset %lu continue at %lu\n",
|
||||||
|
foo.c_str(), prev - input.begin(), found - prev,
|
||||||
|
cur - input.begin());
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
if (prev < found) { // there are items between search start and find
|
if (prev < found) { // there are items between search start and find
|
||||||
sregex_token_iterator it{prev, found, regex_whitespace, -1};
|
sregex_token_iterator it{prev, found, regex_whitespace, -1};
|
||||||
vector<std::string> tokenized{it, {}};
|
vector<std::string> tokenized{it, {}};
|
||||||
@ -619,10 +746,10 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
tokenized.end());
|
tokenized.end());
|
||||||
tokens.reserve(tokens.size() + tokenized.size() * 2 + 1);
|
tokens.reserve(tokens.size() + tokenized.size() * 2 + 1);
|
||||||
|
|
||||||
if (unlikely(debug)) {
|
IFDEBUG {
|
||||||
|
|
||||||
DEBUG(stderr, "tokens: %lu input size: %lu\n", tokenized.size(),
|
DEBUGF(stderr, "tokens1: %lu input size: %lu\n", tokenized.size(),
|
||||||
input.size());
|
input.size());
|
||||||
for (auto x : tokenized) {
|
for (auto x : tokenized) {
|
||||||
|
|
||||||
cerr << x << endl;
|
cerr << x << endl;
|
||||||
@ -636,10 +763,7 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
string::const_iterator c = token.begin(), e = token.end(), f, p;
|
string::const_iterator c = token.begin(), e = token.end(), f, p;
|
||||||
smatch m;
|
smatch m;
|
||||||
|
|
||||||
while (regex_search(c, e, m, regex_word,
|
while (regex_search(c, e, m, regex_word)) {
|
||||||
regex_constants::match_any |
|
|
||||||
regex_constants::match_not_null |
|
|
||||||
regex_constants::match_continuous)) {
|
|
||||||
|
|
||||||
p = c;
|
p = c;
|
||||||
f = m[0].first;
|
f = m[0].first;
|
||||||
@ -649,10 +773,10 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
// there are items between search start and find
|
// there are items between search start and find
|
||||||
while (p < f) {
|
while (p < f) {
|
||||||
|
|
||||||
if (unlikely(debug)) {
|
IFDEBUG {
|
||||||
|
|
||||||
string foo(p, p + 1);
|
string foo(p, p + 1);
|
||||||
DEBUG(stderr, "before string: \"%s\"\n", foo.c_str());
|
DEBUGF(stderr, "before string: \"%s\"\n", foo.c_str());
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -661,20 +785,21 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
IFDEBUG {
|
||||||
string foo(p, f);
|
|
||||||
DEBUG(stderr, "before string: \"%s\"\n",
|
string foo(p, f);
|
||||||
foo.c_str()); tokens.push_back(std::string(p, f));
|
DEBUGF(stderr, "before string: \"%s\"\n", foo.c_str());
|
||||||
*/
|
tokens.push_back(std::string(p, f));
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
DEBUG(
|
DEBUGF(stderr,
|
||||||
stderr,
|
"SUBstring \"%s\" found at start %lu offset %lu continue "
|
||||||
"SUBstring \"%s\" found at start %lu offset %lu continue at "
|
"at %lu\n",
|
||||||
"%lu\n",
|
m[0].str().c_str(), p - input.begin(), m.position(),
|
||||||
m[0].str().c_str(), p - input.begin(), m.position(),
|
c - token.begin());
|
||||||
c - token.begin());
|
|
||||||
tokens.push_back(m[0].str());
|
tokens.push_back(m[0].str());
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -683,10 +808,10 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
while (c < e) {
|
while (c < e) {
|
||||||
|
|
||||||
if (unlikely(debug)) {
|
IFDEBUG {
|
||||||
|
|
||||||
string foo(c, c + 1);
|
string foo(c, c + 1);
|
||||||
DEBUG(stderr, "after string: \"%s\"\n", foo.c_str());
|
DEBUGF(stderr, "after string: \"%s\"\n", foo.c_str());
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -695,17 +820,14 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
IFDEBUG {
|
||||||
if (unlikely(debug)) {
|
|
||||||
|
|
||||||
string foo(c, e);
|
string foo(c, e);
|
||||||
DEBUG(stderr, "after string: \"%s\"\n",
|
DEBUGF(stderr, "after string: \"%s\"\n", foo.c_str());
|
||||||
foo.c_str());
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
tokens.push_back(std::string(c, e));
|
tokens.push_back(std::string(c, e));
|
||||||
*/
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -713,7 +835,7 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (match[0].length() > 0) { tokens.push_back(match[0]); }
|
tokens.push_back(string(match_begin, match_end));
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -727,10 +849,10 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
tokenized.end());
|
tokenized.end());
|
||||||
tokens.reserve(tokens.size() + tokenized.size() * 2 + 1);
|
tokens.reserve(tokens.size() + tokenized.size() * 2 + 1);
|
||||||
|
|
||||||
if (unlikely(debug)) {
|
IFDEBUG {
|
||||||
|
|
||||||
DEBUG(stderr, "tokens: %lu input size: %lu\n", tokenized.size(),
|
DEBUGF(stderr, "tokens2: %lu input size: %lu\n", tokenized.size(),
|
||||||
input.size());
|
input.size());
|
||||||
for (auto x : tokenized) {
|
for (auto x : tokenized) {
|
||||||
|
|
||||||
cerr << x << endl;
|
cerr << x << endl;
|
||||||
@ -744,10 +866,7 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
string::const_iterator c = token.begin(), e = token.end(), f, p;
|
string::const_iterator c = token.begin(), e = token.end(), f, p;
|
||||||
smatch m;
|
smatch m;
|
||||||
|
|
||||||
while (regex_search(c, e, m, regex_word,
|
while (regex_search(c, e, m, regex_word)) {
|
||||||
regex_constants::match_any |
|
|
||||||
regex_constants::match_not_null |
|
|
||||||
regex_constants::match_continuous)) {
|
|
||||||
|
|
||||||
p = c;
|
p = c;
|
||||||
f = m[0].first;
|
f = m[0].first;
|
||||||
@ -757,10 +876,10 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
// there are items between search start and find
|
// there are items between search start and find
|
||||||
while (p < f) {
|
while (p < f) {
|
||||||
|
|
||||||
if (unlikely(debug)) {
|
IFDEBUG {
|
||||||
|
|
||||||
string foo(p, p + 1);
|
string foo(p, p + 1);
|
||||||
DEBUG(stderr, "before string: \"%s\"\n", foo.c_str());
|
DEBUGF(stderr, "before string: \"%s\"\n", foo.c_str());
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -769,25 +888,22 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
IFDEBUG {
|
||||||
if (unlikely(debug)) {
|
|
||||||
|
|
||||||
string foo(p, f);
|
string foo(p, f);
|
||||||
DEBUG(stderr, "before string: \"%s\"\n",
|
DEBUGF(stderr, "before string: \"%s\"\n", foo.c_str());
|
||||||
foo.c_str());
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
tokens.push_back(std::string(p, f));
|
tokens.push_back(std::string(p, f));
|
||||||
*/
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
DEBUG(stderr,
|
DEBUGF(stderr,
|
||||||
"SUB2string \"%s\" found at start %lu offset %lu continue at "
|
"SUB2string \"%s\" found at start %lu offset %lu continue "
|
||||||
"%lu\n",
|
"at %lu\n",
|
||||||
m[0].str().c_str(), p - input.begin(), m.position(),
|
m[0].str().c_str(), p - input.begin(), m.position(),
|
||||||
c - token.begin());
|
c - token.begin());
|
||||||
tokens.push_back(m[0].str());
|
tokens.push_back(m[0].str());
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -796,10 +912,10 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
while (c < e) {
|
while (c < e) {
|
||||||
|
|
||||||
if (unlikely(debug)) {
|
IFDEBUG {
|
||||||
|
|
||||||
string foo(c, c + 1);
|
string foo(c, c + 1);
|
||||||
DEBUG(stderr, "after string: \"%s\"\n", foo.c_str());
|
DEBUGF(stderr, "after string: \"%s\"\n", foo.c_str());
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -808,16 +924,14 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
IFDEBUG {
|
||||||
if (unlikely(debug)) {
|
|
||||||
|
|
||||||
string foo(c, e);
|
string foo(c, e);
|
||||||
DEBUG(stderr, "after string: \"%s\"\n", foo.c_str());
|
DEBUGF(stderr, "after string: \"%s\"\n", foo.c_str());
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
tokens.push_back(std::string(c, e));
|
tokens.push_back(std::string(c, e));
|
||||||
*/
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -827,22 +941,22 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (unlikely(debug)) {
|
IFDEBUG {
|
||||||
|
|
||||||
DEBUG(stderr, "DUMPING TOKENS:\n");
|
DEBUGF(stderr, "DUMPING TOKENS:\n");
|
||||||
u32 size_1 = tokens.size() - 1;
|
u32 size_1 = tokens.size() - 1;
|
||||||
for (u32 i = 0; i < tokens.size(); ++i) {
|
for (u32 i = 0; i < tokens.size(); ++i) {
|
||||||
|
|
||||||
DEBUG(stderr, "%s", tokens[i].c_str());
|
DEBUGF(stderr, "%s", tokens[i].c_str());
|
||||||
if (unlikely(alternative_tokenize && i < size_1)) {
|
if (unlikely(alternative_tokenize && i < size_1)) {
|
||||||
|
|
||||||
DEBUG(stderr, "%s", whitespace.c_str());
|
DEBUGF(stderr, "%s", whitespace.c_str());
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
DEBUG(stderr, "---------------------------\n");
|
DEBUGF(stderr, "---------------------------\n");
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -850,7 +964,7 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
|
|
||||||
file_mapping[fn] = NULL;
|
file_mapping[fn] = NULL;
|
||||||
s = NULL;
|
s = NULL;
|
||||||
DEBUG(stderr, "too few tokens\n");
|
DEBUGF(stderr, "too few tokens\n");
|
||||||
return 0;
|
return 0;
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -886,21 +1000,23 @@ extern "C" unsigned char afl_custom_queue_get(void *data,
|
|||||||
all_structure_items += structure->size();
|
all_structure_items += structure->size();
|
||||||
|
|
||||||
// we are done!
|
// we are done!
|
||||||
DEBUG(stderr, "DONE! We have %lu tokens in the structure\n",
|
DEBUGF(stderr, "DONE! We have %lu tokens in the structure\n",
|
||||||
structure->size());
|
structure->size());
|
||||||
|
|
||||||
} else {
|
}
|
||||||
|
|
||||||
|
else {
|
||||||
|
|
||||||
if (entry->second == NULL) {
|
if (entry->second == NULL) {
|
||||||
|
|
||||||
DEBUG(stderr, "Skipping %s\n", filename);
|
DEBUGF(stderr, "Skipping %s\n", filename);
|
||||||
s = NULL;
|
s = NULL;
|
||||||
return 0;
|
return 0;
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
s = entry->second;
|
s = entry->second;
|
||||||
DEBUG(stderr, "OK %s\n", filename);
|
DEBUGF(stderr, "OK %s\n", filename);
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -150,6 +150,7 @@ def deinit(): # optional for Python
|
|||||||
sense to use it. You would only skip this if `post_process` is used to fix
|
sense to use it. You would only skip this if `post_process` is used to fix
|
||||||
checksums etc. so if you are using it, e.g., as a post processing library.
|
checksums etc. so if you are using it, e.g., as a post processing library.
|
||||||
Note that a length > 0 *must* be returned!
|
Note that a length > 0 *must* be returned!
|
||||||
|
The returned output buffer is under **your** memory management!
|
||||||
|
|
||||||
- `describe` (optional):
|
- `describe` (optional):
|
||||||
|
|
||||||
|
@ -844,15 +844,16 @@ struct custom_mutator {
|
|||||||
/**
|
/**
|
||||||
* Perform custom mutations on a given input
|
* Perform custom mutations on a given input
|
||||||
*
|
*
|
||||||
* (Optional for now. Required in the future)
|
* (Optional)
|
||||||
*
|
*
|
||||||
* @param data pointer returned in afl_custom_init by this custom mutator
|
* Getting an add_buf can be skipped by using afl_custom_splice_optout().
|
||||||
|
*
|
||||||
|
* @param[in] data Pointer returned in afl_custom_init by this custom mutator
|
||||||
* @param[in] buf Pointer to the input data to be mutated and the mutated
|
* @param[in] buf Pointer to the input data to be mutated and the mutated
|
||||||
* output
|
* output
|
||||||
* @param[in] buf_size Size of the input/output data
|
* @param[in] buf_size Size of the input/output data
|
||||||
* @param[out] out_buf the new buffer. We may reuse *buf if large enough.
|
* @param[out] out_buf The new buffer, under your memory mgmt.
|
||||||
* *out_buf = NULL is treated as FATAL.
|
* @param[in] add_buf Buffer containing an additional test case (splicing)
|
||||||
* @param[in] add_buf Buffer containing the additional test case
|
|
||||||
* @param[in] add_buf_size Size of the additional test case
|
* @param[in] add_buf_size Size of the additional test case
|
||||||
* @param[in] max_size Maximum size of the mutated output. The mutation must
|
* @param[in] max_size Maximum size of the mutated output. The mutation must
|
||||||
* not produce data larger than max_size.
|
* not produce data larger than max_size.
|
||||||
|
@ -564,8 +564,7 @@ u8 fuzz_one_original(afl_state_t *afl) {
|
|||||||
if (afl->cmplog_lvl == 3 ||
|
if (afl->cmplog_lvl == 3 ||
|
||||||
(afl->cmplog_lvl == 2 && afl->queue_cur->tc_ref) ||
|
(afl->cmplog_lvl == 2 && afl->queue_cur->tc_ref) ||
|
||||||
afl->queue_cur->favored ||
|
afl->queue_cur->favored ||
|
||||||
!(afl->fsrv.total_execs % afl->queued_items) ||
|
get_cur_time() - afl->last_find_time > 600000) { // 600 seconds
|
||||||
get_cur_time() - afl->last_find_time > 300000) { // 300 seconds
|
|
||||||
|
|
||||||
if (input_to_state_stage(afl, in_buf, out_buf, len)) {
|
if (input_to_state_stage(afl, in_buf, out_buf, len)) {
|
||||||
|
|
||||||
|
Reference in New Issue
Block a user