qga: add --retry-path option for re-initializing channel on failure

This adds an option to instruct the agent to periodically attempt
re-opening the communication channel after a channel error has
occurred. The main use-case for this is providing an OS-independent
way of allowing the agent to survive situations like hotplug/unplug of
the communication channel, or initial guest set up where the agent may
be installed/started prior to the installation of the channel device's
driver.

There are nicer ways of implementing this functionality via things
like systemd services, but this option is useful for platforms like
*BSD/w32.

Currently a channel error will result in the GSource for that channel
being removed from the GMainLoop, but the main loop continuing to run.
That behavior results in a dead loop when --retry-path isn't set, and
prevents us from knowing when to attempt re-opening the channel when
it is set, so we also force the loop to exit as part of this patch.

Signed-off-by: Michael Roth <mdroth@linux.vnet.ibm.com>
This commit is contained in:
Michael Roth 2018-10-07 14:02:20 +03:00
parent d88495a864
commit d951fadad6
1 changed files with 54 additions and 8 deletions

View File

@ -58,6 +58,7 @@
#endif #endif
#define QGA_SENTINEL_BYTE 0xFF #define QGA_SENTINEL_BYTE 0xFF
#define QGA_CONF_DEFAULT CONFIG_QEMU_CONFDIR G_DIR_SEPARATOR_S "qemu-ga.conf" #define QGA_CONF_DEFAULT CONFIG_QEMU_CONFDIR G_DIR_SEPARATOR_S "qemu-ga.conf"
#define QGA_RETRY_INTERVAL 5
static struct { static struct {
const char *state_dir; const char *state_dir;
@ -98,6 +99,7 @@ struct GAState {
GAPersistentState pstate; GAPersistentState pstate;
GAConfig *config; GAConfig *config;
int socket_activation; int socket_activation;
bool force_exit;
}; };
struct GAState *ga_state; struct GAState *ga_state;
@ -120,6 +122,7 @@ DWORD WINAPI service_ctrl_handler(DWORD ctrl, DWORD type, LPVOID data,
VOID WINAPI service_main(DWORD argc, TCHAR *argv[]); VOID WINAPI service_main(DWORD argc, TCHAR *argv[]);
#endif #endif
static int run_agent(GAState *s); static int run_agent(GAState *s);
static void stop_agent(GAState *s, bool requested);
static void static void
init_dfl_pathnames(void) init_dfl_pathnames(void)
@ -168,9 +171,7 @@ static void quit_handler(int sig)
} }
g_debug("received signal num %d, quitting", sig); g_debug("received signal num %d, quitting", sig);
if (g_main_loop_is_running(ga_state->main_loop)) { stop_agent(ga_state, true);
g_main_loop_quit(ga_state->main_loop);
}
} }
#ifndef _WIN32 #ifndef _WIN32
@ -255,6 +256,10 @@ QEMU_COPYRIGHT "\n"
" to list available RPCs)\n" " to list available RPCs)\n"
" -D, --dump-conf dump a qemu-ga config file based on current config\n" " -D, --dump-conf dump a qemu-ga config file based on current config\n"
" options / command-line parameters to stdout\n" " options / command-line parameters to stdout\n"
" -r, --retry-path attempt re-opening path if it's unavailable or closed\n"
" due to an error which may be recoverable in the future\n"
" (virtio-serial driver re-install, serial device hot\n"
" plug/unplug, etc.)\n"
" -h, --help display this help and exit\n" " -h, --help display this help and exit\n"
"\n" "\n"
QEMU_HELP_BOTTOM "\n" QEMU_HELP_BOTTOM "\n"
@ -614,6 +619,7 @@ static gboolean channel_event_cb(GIOCondition condition, gpointer data)
switch (status) { switch (status) {
case G_IO_STATUS_ERROR: case G_IO_STATUS_ERROR:
g_warning("error reading channel"); g_warning("error reading channel");
stop_agent(s, false);
return false; return false;
case G_IO_STATUS_NORMAL: case G_IO_STATUS_NORMAL:
buf[count] = 0; buf[count] = 0;
@ -927,6 +933,7 @@ struct GAConfig {
int daemonize; int daemonize;
GLogLevelFlags log_level; GLogLevelFlags log_level;
int dumpconf; int dumpconf;
bool retry_path;
}; };
static void config_load(GAConfig *config) static void config_load(GAConfig *config)
@ -976,6 +983,10 @@ static void config_load(GAConfig *config)
/* enable all log levels */ /* enable all log levels */
config->log_level = G_LOG_LEVEL_MASK; config->log_level = G_LOG_LEVEL_MASK;
} }
if (g_key_file_has_key(keyfile, "general", "retry-path", NULL)) {
config->retry_path =
g_key_file_get_boolean(keyfile, "general", "retry-path", &gerr);
}
if (g_key_file_has_key(keyfile, "general", "blacklist", NULL)) { if (g_key_file_has_key(keyfile, "general", "blacklist", NULL)) {
config->bliststr = config->bliststr =
g_key_file_get_string(keyfile, "general", "blacklist", &gerr); g_key_file_get_string(keyfile, "general", "blacklist", &gerr);
@ -1037,6 +1048,8 @@ static void config_dump(GAConfig *config)
g_key_file_set_string(keyfile, "general", "statedir", config->state_dir); g_key_file_set_string(keyfile, "general", "statedir", config->state_dir);
g_key_file_set_boolean(keyfile, "general", "verbose", g_key_file_set_boolean(keyfile, "general", "verbose",
config->log_level == G_LOG_LEVEL_MASK); config->log_level == G_LOG_LEVEL_MASK);
g_key_file_set_boolean(keyfile, "general", "retry-path",
config->retry_path);
tmp = list_join(config->blacklist, ','); tmp = list_join(config->blacklist, ',');
g_key_file_set_string(keyfile, "general", "blacklist", tmp); g_key_file_set_string(keyfile, "general", "blacklist", tmp);
g_free(tmp); g_free(tmp);
@ -1055,7 +1068,7 @@ static void config_dump(GAConfig *config)
static void config_parse(GAConfig *config, int argc, char **argv) static void config_parse(GAConfig *config, int argc, char **argv)
{ {
const char *sopt = "hVvdm:p:l:f:F::b:s:t:D"; const char *sopt = "hVvdm:p:l:f:F::b:s:t:Dr";
int opt_ind = 0, ch; int opt_ind = 0, ch;
const struct option lopt[] = { const struct option lopt[] = {
{ "help", 0, NULL, 'h' }, { "help", 0, NULL, 'h' },
@ -1075,6 +1088,7 @@ static void config_parse(GAConfig *config, int argc, char **argv)
{ "service", 1, NULL, 's' }, { "service", 1, NULL, 's' },
#endif #endif
{ "statedir", 1, NULL, 't' }, { "statedir", 1, NULL, 't' },
{ "retry-path", 0, NULL, 'r' },
{ NULL, 0, NULL, 0 } { NULL, 0, NULL, 0 }
}; };
@ -1119,6 +1133,9 @@ static void config_parse(GAConfig *config, int argc, char **argv)
case 'D': case 'D':
config->dumpconf = 1; config->dumpconf = 1;
break; break;
case 'r':
config->retry_path = true;
break;
case 'b': { case 'b': {
if (is_help_option(optarg)) { if (is_help_option(optarg)) {
qmp_for_each_command(&ga_commands, ga_print_cmd, NULL); qmp_for_each_command(&ga_commands, ga_print_cmd, NULL);
@ -1322,9 +1339,6 @@ static void cleanup_agent(GAState *s)
ga_command_state_free(s->command_state); ga_command_state_free(s->command_state);
json_message_parser_destroy(&s->parser); json_message_parser_destroy(&s->parser);
} }
if (s->channel) {
ga_channel_free(s->channel);
}
g_free(s->pstate_filepath); g_free(s->pstate_filepath);
g_free(s->state_filepath_isfrozen); g_free(s->state_filepath_isfrozen);
if (s->main_loop) { if (s->main_loop) {
@ -1334,7 +1348,7 @@ static void cleanup_agent(GAState *s)
ga_state = NULL; ga_state = NULL;
} }
static int run_agent(GAState *s) static int run_agent_once(GAState *s)
{ {
if (!channel_init(s, s->config->method, s->config->channel_path, if (!channel_init(s, s->config->method, s->config->channel_path,
s->socket_activation ? FIRST_SOCKET_ACTIVATION_FD : -1)) { s->socket_activation ? FIRST_SOCKET_ACTIVATION_FD : -1)) {
@ -1344,9 +1358,41 @@ static int run_agent(GAState *s)
g_main_loop_run(ga_state->main_loop); g_main_loop_run(ga_state->main_loop);
if (s->channel) {
ga_channel_free(s->channel);
}
return EXIT_SUCCESS; return EXIT_SUCCESS;
} }
static int run_agent(GAState *s)
{
int ret = EXIT_SUCCESS;
s->force_exit = false;
do {
ret = run_agent_once(s);
if (s->config->retry_path && !s->force_exit) {
g_warning("agent stopped unexpectedly, restarting...");
sleep(QGA_RETRY_INTERVAL);
}
} while (s->config->retry_path && !s->force_exit);
return ret;
}
static void stop_agent(GAState *s, bool requested)
{
if (!s->force_exit) {
s->force_exit = requested;
}
if (g_main_loop_is_running(s->main_loop)) {
g_main_loop_quit(s->main_loop);
}
}
int main(int argc, char **argv) int main(int argc, char **argv)
{ {
int ret = EXIT_SUCCESS; int ret = EXIT_SUCCESS;