blk/KernelDevice: Introduce a cap on the number of pending discards

author Joshua Baergen <jbaergen@digitalocean.com>

Wed, 18 Dec 2024 17:27:58 +0000 (10:27 -0700)

committer Joshua Baergen <jbaergen@digitalocean.com>

Fri, 24 Jan 2025 17:13:37 +0000 (10:13 -0700)
author Joshua Baergen <jbaergen@digitalocean.com>
Wed, 18 Dec 2024 17:27:58 +0000 (10:27 -0700)
committer Joshua Baergen <jbaergen@digitalocean.com>
Fri, 24 Jan 2025 17:13:37 +0000 (10:13 -0700)
diff --git a/src/blk/kernel/KernelDevice.cc b/src/blk/kernel/KernelDevice.cc

index 72921e6d9f08bf2fa9317a0e78547ec1a581207c..a073c39334bf0055220c5490a6e045023560fb7b 100644 (file)
--- a/src/blk/kernel/KernelDevice.cc
+++ b/src/blk/kernel/KernelDevice.cc
@@ -815,14 +815,21 @@ void KernelDevice::_discard_thread(uint64_t tid)
  
  // this is private and is expected that the caller checks that discard
  // threads are running via _discard_started()
-void KernelDevice::_queue_discard(interval_set<uint64_t> &to_release)
+bool KernelDevice::_queue_discard(interval_set<uint64_t> &to_release)
  {
    if (to_release.empty())
-    return;
+    return false;
+
+  auto max_pending = cct->_conf->bdev_async_discard_max_pending;
  
    std::lock_guard l(discard_lock);
+
+  if (max_pending > 0 && discard_queued.num_intervals() >= max_pending)
+    return false;
+
    discard_queued.insert(to_release);
    discard_cond.notify_one();
+  return true;
  }
  
  // return true only if discard was queued, so caller won't have to do
@@ -833,8 +840,7 @@ bool KernelDevice::try_discard(interval_set<uint64_t> &to_release, bool async)
      return false;
  
    if (async && _discard_started()) {
-    _queue_discard(to_release);
-    return true;
+    return _queue_discard(to_release);
    } else {
      for (auto p = to_release.begin(); p != to_release.end(); ++p) {
        _discard(p.get_start(), p.get_len());
diff --git a/src/blk/kernel/KernelDevice.h b/src/blk/kernel/KernelDevice.h

index ac555cdd3daf37dc2afe994f83ee377d3ccde613..c8a7b8d96a2a877441400885aa2a506b5aa5e90f 100644 (file)
--- a/src/blk/kernel/KernelDevice.h
+++ b/src/blk/kernel/KernelDevice.h
@@ -93,7 +93,7 @@ private:
  
    void _aio_thread();
    void _discard_thread(uint64_t tid);
-  void _queue_discard(interval_set<uint64_t> &to_release);
+  bool _queue_discard(interval_set<uint64_t> &to_release);
    bool try_discard(interval_set<uint64_t> &to_release, bool async = true) override;
  
    int _aio_start();
diff --git a/src/common/options/global.yaml.in b/src/common/options/global.yaml.in

index 04da93ccbec57737e4ed05c89cc047063e1c386d..b9e7db4f6e297659aa7d03b28eb5785151f538fd 100644 (file)
--- a/src/common/options/global.yaml.in
+++ b/src/common/options/global.yaml.in
@@ -4114,6 +4114,23 @@ options:
    - runtime
    see_also:
    - bdev_enable_discard
+  - bdev_async_discard_max_pending
+- name: bdev_async_discard_max_pending
+  desc: maximum number of pending discards
+  long_desc: The maximum number of pending async discards that can be queued and not yet claimed by
+    an async discard thread. Once the queue is full, new discards are not issued and their blocks
+    are freed back to the allocator immediately instead. This is useful if you have a device with
+    slow discard performance that can't keep up with a consistently high write workload. 0 means
+    'unlimited'.
+  type: uint
+  level: advanced
+  default: 1000000
+  min: 0
+  with_legacy: true
+  flags:
+  - runtime
+  see_also:
+  - bdev_async_discard_threads
  - name: bdev_flock_retry_interval
    type: float
    level: advanced
author	Joshua Baergen <jbaergen@digitalocean.com>
	Wed, 18 Dec 2024 17:27:58 +0000 (10:27 -0700)
committer	Joshua Baergen <jbaergen@digitalocean.com>
	Fri, 24 Jan 2025 17:13:37 +0000 (10:13 -0700)
src/blk/kernel/KernelDevice.cc		patch \| blob \| history
src/blk/kernel/KernelDevice.h		patch \| blob \| history
src/common/options/global.yaml.in		patch \| blob \| history