rgw: RGWMetaSyncShardControlCR retries with backoff on all error codes

author Casey Bodley <cbodley@redhat.com>

Mon, 20 Feb 2017 21:00:01 +0000 (16:00 -0500)

committer Nathan Cutler <ncutler@suse.com>

Wed, 8 Mar 2017 14:09:32 +0000 (15:09 +0100)
author Casey Bodley <cbodley@redhat.com>
Mon, 20 Feb 2017 21:00:01 +0000 (16:00 -0500)
committer Nathan Cutler <ncutler@suse.com>
Wed, 8 Mar 2017 14:09:32 +0000 (15:09 +0100)
diff --git a/src/rgw/rgw_sync.cc b/src/rgw/rgw_sync.cc

index 3128a18e455a46dba3aed0eefe799ca08ed68a2c..45605a1ea8cf60c6cb22ad9451c39e6df66947c2 100644 (file)
--- a/src/rgw/rgw_sync.cc
+++ b/src/rgw/rgw_sync.cc
@@ -1557,6 +1557,7 @@ public:
            ldout(sync_env->cct, 10) << *this << ": failed to fetch more log entries, retcode=" << retcode << dendl;
            yield lease_cr->go_down();
            drain_all();
+          *reset_backoff = false; // back off and try again later
            return retcode;
          }
          *reset_backoff = true; /* if we got to this point, all systems function */
@@ -1566,6 +1567,13 @@ public:
            yield call(new RGWReadMDLogEntriesCR(sync_env, mdlog, shard_id,
                                                 &max_marker, INCREMENTAL_MAX_ENTRIES,
                                                 &log_entries, &truncated));
+          if (retcode < 0) {
+            ldout(sync_env->cct, 10) << *this << ": failed to list mdlog entries, retcode=" << retcode << dendl;
+            yield lease_cr->go_down();
+            drain_all();
+            *reset_backoff = false; // back off and try again later
+            return retcode;
+          }
            for (log_iter = log_entries.begin(); log_iter != log_entries.end(); ++log_iter) {
              if (!period_marker.empty() && period_marker < log_iter->id) {
                done_with_period = true;
@@ -1636,12 +1644,13 @@ class RGWMetaSyncShardControlCR : public RGWBackoffControlCR
    rgw_meta_sync_marker sync_marker;
    const std::string period_marker;
  
+  static constexpr bool exit_on_error = false; // retry on all errors
  public:
    RGWMetaSyncShardControlCR(RGWMetaSyncEnv *_sync_env, const rgw_bucket& _pool,
                              const std::string& period, RGWMetadataLog* mdlog,
                              uint32_t _shard_id, const rgw_meta_sync_marker& _marker,
                              std::string&& period_marker)
-    : RGWBackoffControlCR(_sync_env->cct, true), sync_env(_sync_env),
+    : RGWBackoffControlCR(_sync_env->cct, exit_on_error), sync_env(_sync_env),
        pool(_pool), period(period), mdlog(mdlog), shard_id(_shard_id),
        sync_marker(_marker), period_marker(std::move(period_marker)) {}
author	Casey Bodley <cbodley@redhat.com>
	Mon, 20 Feb 2017 21:00:01 +0000 (16:00 -0500)
committer	Nathan Cutler <ncutler@suse.com>
	Wed, 8 Mar 2017 14:09:32 +0000 (15:09 +0100)