2020-02-20 05:11:08 +01:00
|
|
|
/*
 * fuzzing driver
 *
 * Copyright Red Hat Inc., 2019
 *
 * Authors:
 *  Alexander Bulekov <alxndr@bu.edu>
 *
 * This work is licensed under the terms of the GNU GPL, version 2 or later.
 * See the COPYING file in the top-level directory.
 *
 */
|
|
|
|
|
|
|
|
#include "qemu/osdep.h"
|
|
|
|
|
|
|
|
#include <wordexp.h>
|
|
|
|
|
2020-10-28 12:36:57 +01:00
|
|
|
#include "qemu/datadir.h"
|
2020-02-20 05:11:08 +01:00
|
|
|
#include "sysemu/qtest.h"
|
|
|
|
#include "sysemu/runstate.h"
|
|
|
|
#include "sysemu/sysemu.h"
|
|
|
|
#include "qemu/main-loop.h"
|
2020-07-08 22:01:04 +02:00
|
|
|
#include "qemu/rcu.h"
|
2020-08-04 20:00:40 +02:00
|
|
|
#include "tests/qtest/libqos/libqtest.h"
|
2020-02-20 05:11:08 +01:00
|
|
|
#include "tests/qtest/libqos/qgraph.h"
|
|
|
|
#include "fuzz.h"
|
|
|
|
|
|
|
|
/* Upper bound on the main_loop_wait() iterations done by flush_events() */
#define MAX_EVENT_LOOPS 10
|
|
|
|
|
|
|
|
typedef struct FuzzTargetState {
|
|
|
|
FuzzTarget *target;
|
|
|
|
QSLIST_ENTRY(FuzzTargetState) target_list;
|
|
|
|
} FuzzTargetState;
|
|
|
|
|
|
|
|
/* List head type for the chain of registered FuzzTargetState entries */
typedef QSLIST_HEAD(, FuzzTargetState) FuzzTargetList;
|
|
|
|
|
|
|
|
/* Architecture name handed to qtest_inproc_init() by qtest_setup() */
static const char *fuzz_arch = TARGET_NAME;
|
|
|
|
|
|
|
|
/*
 * All registered targets. Allocated on first use by fuzz_add_target();
 * usage() and fuzz_get_target() abort if it is still NULL.
 */
static FuzzTargetList *fuzz_target_list;
|
|
|
|
/*
 * Target selected by LLVMFuzzerInitialize(); its callbacks are invoked from
 * the LLVMFuzzer* entry points in this file.
 */
static FuzzTarget *fuzz_target;
|
|
|
|
/*
 * QTestState returned by qtest_setup() in LLVMFuzzerInitialize(); passed to
 * the selected target's pre_fuzz() and fuzz() callbacks.
 */
static QTestState *fuzz_qts;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * Run main_loop_wait(false) for as long as the default GLib main context
 * (NULL) reports pending events, but never more than MAX_EVENT_LOOPS times.
 *
 * @s is not used by this function.
 */
void flush_events(QTestState *s)
{
    int remaining;

    for (remaining = MAX_EVENT_LOOPS;
         g_main_context_pending(NULL) && remaining > 0;
         remaining--) {
        main_loop_wait(false);
    }
}
|
|
|
|
|
|
|
|
static QTestState *qtest_setup(void)
|
|
|
|
{
|
|
|
|
qtest_server_set_send_handler(&qtest_client_inproc_recv, &fuzz_qts);
|
|
|
|
return qtest_inproc_init(&fuzz_qts, false, fuzz_arch,
|
|
|
|
&qtest_server_inproc_recv);
|
|
|
|
}
|
|
|
|
|
|
|
|
void fuzz_add_target(const FuzzTarget *target)
|
|
|
|
{
|
|
|
|
FuzzTargetState *tmp;
|
|
|
|
FuzzTargetState *target_state;
|
|
|
|
if (!fuzz_target_list) {
|
|
|
|
fuzz_target_list = g_new0(FuzzTargetList, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
QSLIST_FOREACH(tmp, fuzz_target_list, target_list) {
|
|
|
|
if (g_strcmp0(tmp->target->name, target->name) == 0) {
|
|
|
|
fprintf(stderr, "Error: Fuzz target name %s already in use\n",
|
|
|
|
target->name);
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
target_state = g_new0(FuzzTargetState, 1);
|
|
|
|
target_state->target = g_new0(FuzzTarget, 1);
|
|
|
|
*(target_state->target) = *target;
|
|
|
|
QSLIST_INSERT_HEAD(fuzz_target_list, target_state, target_list);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
static void usage(char *path)
|
|
|
|
{
|
|
|
|
printf("Usage: %s --fuzz-target=FUZZ_TARGET [LIBFUZZER ARGUMENTS]\n", path);
|
|
|
|
printf("where FUZZ_TARGET is one of:\n");
|
|
|
|
FuzzTargetState *tmp;
|
|
|
|
if (!fuzz_target_list) {
|
|
|
|
fprintf(stderr, "Fuzz target list not initialized\n");
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
QSLIST_FOREACH(tmp, fuzz_target_list, target_list) {
|
|
|
|
printf(" * %s : %s\n", tmp->target->name,
|
|
|
|
tmp->target->description);
|
|
|
|
}
|
2020-05-30 00:14:49 +02:00
|
|
|
printf("Alternatively, add -target-FUZZ_TARGET to the executable name\n\n"
|
|
|
|
"Set the environment variable FUZZ_SERIALIZE_QTEST=1 to serialize\n"
|
|
|
|
"QTest commands into an ASCII protocol. Useful for building crash\n"
|
2020-05-30 00:14:50 +02:00
|
|
|
"reproducers, but slows down execution.\n\n"
|
|
|
|
"Set the environment variable QTEST_LOG=1 to log all qtest commands"
|
|
|
|
"\n");
|
2020-02-20 05:11:08 +01:00
|
|
|
exit(0);
|
|
|
|
}
|
|
|
|
|
|
|
|
static FuzzTarget *fuzz_get_target(char* name)
|
|
|
|
{
|
|
|
|
FuzzTargetState *tmp;
|
|
|
|
if (!fuzz_target_list) {
|
|
|
|
fprintf(stderr, "Fuzz target list not initialized\n");
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
QSLIST_FOREACH(tmp, fuzz_target_list, target_list) {
|
|
|
|
if (strcmp(tmp->target->name, name) == 0) {
|
|
|
|
return tmp->target;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-10-23 17:07:36 +02:00
|
|
|
/* Sometimes called by libfuzzer to mutate two inputs into one */
|
|
|
|
size_t LLVMFuzzerCustomCrossOver(const uint8_t *data1, size_t size1,
|
|
|
|
const uint8_t *data2, size_t size2,
|
|
|
|
uint8_t *out, size_t max_out_size,
|
|
|
|
unsigned int seed)
|
|
|
|
{
|
|
|
|
if (fuzz_target->crossover) {
|
|
|
|
return fuzz_target->crossover(data1, size1, data2, size2, out,
|
|
|
|
max_out_size, seed);
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-02-20 05:11:08 +01:00
|
|
|
/* Executed for each fuzzing-input */
|
|
|
|
int LLVMFuzzerTestOneInput(const unsigned char *Data, size_t Size)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* Do the pre-fuzz-initialization before the first fuzzing iteration,
|
|
|
|
* instead of before the actual fuzz loop. This is needed since libfuzzer
|
|
|
|
* may fork off additional workers, prior to the fuzzing loop, and if
|
|
|
|
* pre_fuzz() sets up e.g. shared memory, this should be done for the
|
|
|
|
* individual worker processes
|
|
|
|
*/
|
|
|
|
static int pre_fuzz_done;
|
|
|
|
if (!pre_fuzz_done && fuzz_target->pre_fuzz) {
|
|
|
|
fuzz_target->pre_fuzz(fuzz_qts);
|
|
|
|
pre_fuzz_done = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
fuzz_target->fuzz(fuzz_qts, Data, Size);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Executed once, prior to fuzzing */
|
|
|
|
int LLVMFuzzerInitialize(int *argc, char ***argv, char ***envp)
|
|
|
|
{
|
|
|
|
|
|
|
|
char *target_name;
|
2020-08-18 12:11:02 +02:00
|
|
|
const char *bindir;
|
|
|
|
char *datadir;
|
2020-05-30 00:14:49 +02:00
|
|
|
bool serialize = false;
|
2020-02-20 05:11:08 +01:00
|
|
|
|
|
|
|
/* Initialize qgraph and modules */
|
|
|
|
qos_graph_init();
|
|
|
|
module_call_init(MODULE_INIT_FUZZ_TARGET);
|
|
|
|
module_call_init(MODULE_INIT_QOM);
|
|
|
|
module_call_init(MODULE_INIT_LIBQOS);
|
|
|
|
|
2020-08-31 13:58:10 +02:00
|
|
|
qemu_init_exec_dir(**argv);
|
2020-04-21 20:22:30 +02:00
|
|
|
target_name = strstr(**argv, "-target-");
|
|
|
|
if (target_name) { /* The binary name specifies the target */
|
|
|
|
target_name += strlen("-target-");
|
2020-05-12 05:01:30 +02:00
|
|
|
/*
|
|
|
|
* With oss-fuzz, the executable is kept in the root of a directory (we
|
|
|
|
* cannot assume the path). All data (including bios binaries) must be
|
|
|
|
* in the same dir, or a subdir. Thus, we cannot place the pc-bios so
|
|
|
|
* that it would be in exec_dir/../pc-bios.
|
|
|
|
* As a workaround, oss-fuzz allows us to use argv[0] to get the
|
|
|
|
* location of the executable. Using this we add exec_dir/pc-bios to
|
|
|
|
* the datadirs.
|
|
|
|
*/
|
2020-08-31 13:58:10 +02:00
|
|
|
bindir = qemu_get_exec_dir();
|
2020-07-17 18:35:23 +02:00
|
|
|
datadir = g_build_filename(bindir, "pc-bios", NULL);
|
|
|
|
if (g_file_test(datadir, G_FILE_TEST_IS_DIR)) {
|
|
|
|
qemu_add_data_dir(datadir);
|
2020-08-18 11:57:56 +02:00
|
|
|
} else {
|
|
|
|
g_free(datadir);
|
|
|
|
}
|
2020-04-21 20:22:30 +02:00
|
|
|
} else if (*argc > 1) { /* The target is specified as an argument */
|
|
|
|
target_name = (*argv)[1];
|
|
|
|
if (!strstr(target_name, "--fuzz-target=")) {
|
|
|
|
usage(**argv);
|
|
|
|
}
|
|
|
|
target_name += strlen("--fuzz-target=");
|
|
|
|
} else {
|
2020-02-20 05:11:08 +01:00
|
|
|
usage(**argv);
|
|
|
|
}
|
|
|
|
|
2020-05-30 00:14:49 +02:00
|
|
|
/* Should we always serialize qtest commands? */
|
|
|
|
if (getenv("FUZZ_SERIALIZE_QTEST")) {
|
|
|
|
serialize = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
fuzz_qtest_set_serialize(serialize);
|
|
|
|
|
2020-02-20 05:11:08 +01:00
|
|
|
/* Identify the fuzz target */
|
|
|
|
fuzz_target = fuzz_get_target(target_name);
|
|
|
|
if (!fuzz_target) {
|
|
|
|
usage(**argv);
|
|
|
|
}
|
|
|
|
|
|
|
|
fuzz_qts = qtest_setup();
|
|
|
|
|
|
|
|
if (fuzz_target->pre_vm_init) {
|
|
|
|
fuzz_target->pre_vm_init();
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Run QEMU's softmmu main with the fuzz-target dependent arguments */
|
2020-07-14 19:46:16 +02:00
|
|
|
GString *cmd_line = fuzz_target->get_init_cmdline(fuzz_target);
|
2020-08-19 08:10:56 +02:00
|
|
|
g_string_append_printf(cmd_line, " %s -qtest /dev/null ",
|
|
|
|
getenv("QTEST_LOG") ? "" : "-qtest-log none");
|
2020-02-20 05:11:08 +01:00
|
|
|
|
|
|
|
/* Split the runcmd into an argv and argc */
|
|
|
|
wordexp_t result;
|
2020-07-14 19:46:16 +02:00
|
|
|
wordexp(cmd_line->str, &result, 0);
|
|
|
|
g_string_free(cmd_line, true);
|
2020-02-20 05:11:08 +01:00
|
|
|
|
|
|
|
qemu_init(result.we_wordc, result.we_wordv, NULL);
|
|
|
|
|
2020-06-18 18:05:16 +02:00
|
|
|
/* re-enable the rcu atfork, which was previously disabled in qemu_init */
|
|
|
|
rcu_enable_atfork();
|
|
|
|
|
fuzz: Disable QEMU's SIG{INT,HUP,TERM} handlers
Prior to this patch, the only way I found to terminate the fuzzer was
either to:
1. Explicitly specify the number of fuzzer runs with the -runs= flag
2. SIGKILL the process with "pkill -9 qemu-fuzz-*" or similar
In addition to being annoying to deal with, SIGKILLing the process skips
over any exit handlers(e.g. registered with atexit()). This is bad,
since some fuzzers might create temporary files that should ideally be
removed on exit using an exit handler. The only way to achieve a clean
exit now is to specify -runs=N , but the desired "N" is tricky to
identify prior to fuzzing.
Why doesn't the process exit with standard SIGINT,SIGHUP,SIGTERM
signals? QEMU installs its own handlers for these signals in
os-posix.c:os_setup_signal_handling, which notify the main loop that an
exit was requested. The fuzzer, however, does not run qemu_main_loop,
which performs the main_loop_should_exit() check. This means that the
fuzzer effectively ignores these signals. As we don't really care about
cleanly stopping the disposable fuzzer "VM", this patch uninstalls
QEMU's signal handlers. Thus, we can stop the fuzzer with
SIG{INT,HUP,TERM} and the fuzzing code can optionally use atexit() to
clean up temporary files/resources.
Reviewed-by: Darren Kenny <darren.kenny@oracle.com>
Signed-off-by: Alexander Bulekov <alxndr@bu.edu>
Message-Id: <20201014142157.46028-1-alxndr@bu.edu>
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
2020-10-14 16:21:57 +02:00
|
|
|
/*
|
|
|
|
* Disable QEMU's signal handlers, since we manually control the main_loop,
|
|
|
|
* and don't check for main_loop_should_exit
|
|
|
|
*/
|
|
|
|
signal(SIGINT, SIG_DFL);
|
|
|
|
signal(SIGHUP, SIG_DFL);
|
|
|
|
signal(SIGTERM, SIG_DFL);
|
|
|
|
|
2020-02-20 05:11:08 +01:00
|
|
|
return 0;
|
|
|
|
}
|