osd: Always send EC messages to all shards following error.

author Alex Ainscow <aainscow@uk.ibm.com>

Mon, 14 Jul 2025 22:57:49 +0000 (23:57 +0100)

committer Jon <jonathan.bailey1@ibm.com>

Fri, 3 Oct 2025 13:31:24 +0000 (14:31 +0100)
author Alex Ainscow <aainscow@uk.ibm.com>
Mon, 14 Jul 2025 22:57:49 +0000 (23:57 +0100)
committer Jon <jonathan.bailey1@ibm.com>
Fri, 3 Oct 2025 13:31:24 +0000 (14:31 +0100)
diff --git a/src/osd/ECCommon.cc b/src/osd/ECCommon.cc

index b81bb5ffc6e8808df2a6b9a73c849d264d59a835..34304f932f969fc2840e056f22de4ad9af464071 100644 (file)
--- a/src/osd/ECCommon.cc
+++ b/src/osd/ECCommon.cc
@@ -791,12 +791,15 @@ void ECCommon::RMWPipeline::cache_ready(Op &op) {
       * As such we must never skip a transaction completely.  Note that if
       * should_send is false, then an empty transaction is sent.
       */
-    if (should_send && op.skip_transaction(pending_roll_forward, shard, transaction)) {
+    if (!next_write_all_shards && should_send && op.skip_transaction(pending_roll_forward, shard, transaction)) {
        // Must be an empty transaction
        ceph_assert(transaction.empty());
        dout(20) << __func__ << " Skipping transaction for shard " << shard << dendl;
        continue;
      }
+    if (!should_send || transaction.empty()) {
+      dout(20) << __func__ << " Sending empty transaction for shard " << shard << dendl;
+    }
      op.pending_commits++;
      const pg_stat_t &stats =
          (should_send || !backfill_shards.contains(pg_shard))
@@ -845,6 +848,8 @@ void ECCommon::RMWPipeline::cache_ready(Op &op) {
      }
    }
  
+  next_write_all_shards = false;
+
    if (!messages.empty()) {
      get_parent()->send_message_osd_cluster(messages, get_osdmap_epoch());
    }
@@ -956,6 +961,7 @@ void ECCommon::RMWPipeline::on_change() {
    tid_to_op_map.clear();
    oid_to_version.clear();
    waiting_commit.clear();
+  next_write_all_shards = false;
  }
  
  void ECCommon::RMWPipeline::on_change2() {
@@ -963,5 +969,6 @@ void ECCommon::RMWPipeline::on_change2() {
  }
  
  void ECCommon::RMWPipeline::call_write_ordered(std::function<void(void)> &&cb) {
+  next_write_all_shards = true;
    extent_cache.add_on_write(std::move(cb));
  }
 \ No newline at end of file
diff --git a/src/osd/ECCommon.h b/src/osd/ECCommon.h

index b564acbf7b38d6ec1373007f29da141bd7ee8d5b..2a4dc63de67976b398bf1cb2c91a30830d8a0413 100644 (file)
--- a/src/osd/ECCommon.h
+++ b/src/osd/ECCommon.h
@@ -612,6 +612,7 @@ struct ECCommon {
      ECCommon &ec_backend;
      ECExtentCache extent_cache;
      uint64_t ec_pdw_write_mode;
+    bool next_write_all_shards = false;
  
      RMWPipeline(CephContext *cct,
                  ceph::ErasureCodeInterfaceRef ec_impl,
author	Alex Ainscow <aainscow@uk.ibm.com>
	Mon, 14 Jul 2025 22:57:49 +0000 (23:57 +0100)
committer	Jon <jonathan.bailey1@ibm.com>
	Fri, 3 Oct 2025 13:31:24 +0000 (14:31 +0100)
src/osd/ECCommon.cc		patch | blob | history
src/osd/ECCommon.h		patch | blob | history