osd/osd_types: use appropriate cost value for PullOp

author Sridhar Seshasayee <sseshasa@redhat.com>

Fri, 3 Feb 2023 12:12:46 +0000 (17:42 +0530)

committer Sridhar Seshasayee <sseshasa@redhat.com>

Mon, 8 May 2023 09:16:24 +0000 (14:46 +0530)
author Sridhar Seshasayee <sseshasa@redhat.com>
Fri, 3 Feb 2023 12:12:46 +0000 (17:42 +0530)
committer Sridhar Seshasayee <sseshasa@redhat.com>
Mon, 8 May 2023 09:16:24 +0000 (14:46 +0530)
diff --git a/src/osd/osd_types.cc b/src/osd/osd_types.cc

index bd8cac4ddcc57b93407c1414aa989d37ee975f81..829646809c5c00219d5d285fbcfedfbd9eafc47d 100644 (file)
--- a/src/osd/osd_types.cc
+++ b/src/osd/osd_types.cc
@@ -15,6 +15,7 @@
   *
   */
  
+#include <algorithm>
  #include <list>
  #include <map>
  #include <ostream>
@@ -6779,8 +6780,20 @@ ostream& operator<<(ostream& out, const PullOp &op)
  
  uint64_t PullOp::cost(CephContext *cct) const
  {
-  return cct->_conf->osd_push_per_object_cost +
-    cct->_conf->osd_recovery_max_chunk;
+  if (cct->_conf->osd_op_queue == "mclock_scheduler") {
+    return std::clamp<uint64_t>(
+      recovery_progress.estimate_remaining_data_to_recover(recovery_info),
+      1,
+      cct->_conf->osd_recovery_max_chunk);
+  } else {
+    /* We retain this legacy behavior for WeightedPriorityQueue. It seems to
+     * require very large costs for several messages in order to do any
+     * meaningful amount of throttling.  This branch should be removed after
+     * Reef.
+     */
+    return cct->_conf->osd_push_per_object_cost +
+      cct->_conf->osd_recovery_max_chunk;
+  }
  }
  
  // -- PushOp --
diff --git a/src/osd/osd_types.h b/src/osd/osd_types.h

index 0d0e743fc8c8b0f5aadd7327a0603ed8bf0a8f0f..e36fb17056f3d77f795f6d7a27b3d8e91d17f58a 100644 (file)
--- a/src/osd/osd_types.h
+++ b/src/osd/osd_types.h
@@ -6061,6 +6061,11 @@ struct ObjectRecoveryProgress {
        omap_complete;
    }
  
+  uint64_t estimate_remaining_data_to_recover(const ObjectRecoveryInfo& info) const {
+    // Overestimates in case of clones, but avoids traversing copy_subset; saturates at 0 (no unsigned wrap)
+    return info.size > data_recovered_to ? info.size - data_recovered_to : 0;
+  }
+
    static void generate_test_instances(std::list<ObjectRecoveryProgress*>& o);
    void encode(ceph::buffer::list &bl) const;
    void decode(ceph::buffer::list::const_iterator &bl);
author	Sridhar Seshasayee <sseshasa@redhat.com>
	Fri, 3 Feb 2023 12:12:46 +0000 (17:42 +0530)
committer	Sridhar Seshasayee <sseshasa@redhat.com>
	Mon, 8 May 2023 09:16:24 +0000 (14:46 +0530)
src/osd/osd_types.cc		patch \| blob \| history
src/osd/osd_types.h		patch \| blob \| history