X-Git-Url: http://git.tuebingen.mpg.de/?p=dss.git;a=blobdiff_plain;f=dss.c;h=07a60425170ddab063ee6071d4901993a9db8c62;hp=c64156188bc753f7ee264f7434db1e254bbbc8f2;hb=05e75054398c9d39f62f8c4b9be7b874a2019a3c;hpb=31638f52b0fe420f4881dca4afdecf7132d1ab91 diff --git a/dss.c b/dss.c index c641561..07a6042 100644 --- a/dss.c +++ b/dss.c @@ -45,6 +45,8 @@ static int signal_pipe; static pid_t create_pid; /** Whether the pre-create-hook/rsync/post-create-hook is currently stopped. */ static int create_process_stopped; +/** How many times in a row the rsync command failed. */ +static int num_consecutive_rsync_errors; /** Process id of current pre-remove/rm/post-remove process. */ static pid_t remove_pid; /** When the next snapshot is due. */ @@ -125,6 +127,7 @@ static void dump_dss_config(const char *msg) "reference_snapshot: %s\n" "snapshot_creation_status: %s\n" "snapshot_removal_status: %s\n" + "num_consecutive_rsync_errors: %d\n" , (int) getpid(), logfile? conf.logfile_arg : "stderr", @@ -135,7 +138,8 @@ static void dump_dss_config(const char *msg) name_of_reference_snapshot? name_of_reference_snapshot : "(none)", hook_status_description[snapshot_creation_status], - hook_status_description[snapshot_removal_status] + hook_status_description[snapshot_removal_status], + num_consecutive_rsync_errors ); if (create_pid != 0) fprintf(log, @@ -844,23 +848,23 @@ static int handle_rsync_exit(int status) es = WEXITSTATUS(status); /* * Restart rsync on non-fatal errors: - * 12: Error in rsync protocol data stream - * 13: Errors with program diagnostics + * 24: Partial transfer due to vanished source files */ - if (es == 12 || es == 13) { - DSS_WARNING_LOG(("rsync process %d returned %d -- restarting\n", - (int)create_pid, es)); + if (es != 0 && es != 24) { + DSS_WARNING_LOG(("rsync exit code %d, error count %d\n", + es, ++num_consecutive_rsync_errors)); + if (num_consecutive_rsync_errors > conf.max_rsync_errors_arg) { + ret = -E_TOO_MANY_RSYNC_ERRORS; + snapshot_creation_status = HS_READY; + goto out; + } + DSS_WARNING_LOG(("restarting rsync process\n")); snapshot_creation_status = HS_NEEDS_RESTART; next_snapshot_time = get_current_time() + 60; ret = 1; goto out; } - if (es != 0 && es != 23 && es != 24) { - DSS_ERROR_LOG(("rsync process %d returned %d\n", (int)create_pid, es)); - ret = -E_BAD_EXIT_CODE; - snapshot_creation_status = HS_READY; - goto out; - } + num_consecutive_rsync_errors = 0; ret = rename_incomplete_snapshot(current_snapshot_creation_time); if (ret < 0) goto out;