git-server-git.apps.pok.os.sepia.ceph.com Git - ceph.git/commitdiff
mgr/prometheus: Log collection issues
author: Boris Ranto <branto@redhat.com>
Wed, 25 Nov 2020 09:32:35 +0000 (10:32 +0100)
committer: Boris Ranto <branto@redhat.com>
Mon, 30 Nov 2020 10:37:27 +0000 (11:37 +0100)
Log any issues encountered during the data collection and continue to
collect the data anyway (after a sleep).

Signed-off-by: Boris Ranto <branto@redhat.com>
(cherry picked from commit 28a5c13bf993679e3098d73df27ded249f34dc99)

src/pybind/mgr/prometheus/module.py

index e58a9b8df2b1ee020880939b0f8387d2ce7b2233..02157f215e3bb798523e094af1d774f0ecff17f5 100644 (file)
@@ -190,7 +190,15 @@ class MetricCollectionThread(threading.Thread):
             self.mod.log.debug('collecting cache in thread')
             if self.mod.have_mon_connection():
                 start_time = time.time()
-                data = self.mod.collect()
+
+                try:
+                    data = self.mod.collect()
+                except Exception as e:
+                    # Log any issues encountered during the data collection and continue
+                    self.mod.log.exception("failed to collect metrics:")
+                    time.sleep(self.mod.scrape_interval)
+                    continue
+
                 duration = time.time() - start_time
                 
                 sleep_time = self.mod.scrape_interval - duration