Re: [PATCH v2] ceph: add min/max latency support for read/write/metadata metrics

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On 2020/3/17 1:25, Jeff Layton wrote:
On Mon, 2020-03-16 at 11:52 -0400, xiubli@xxxxxxxxxx wrote:
From: Xiubo Li <xiubli@xxxxxxxxxx>

These will be very useful to help diagnose problems.

URL: https://tracker.ceph.com/issues/44533
Signed-off-by: Xiubo Li <xiubli@xxxxxxxxxx>
---

Changed in V2:
- switch spin lock to cmpxchg

  fs/ceph/debugfs.c    | 26 ++++++++++++++++----
  fs/ceph/mds_client.c |  9 +++++++
  fs/ceph/metric.h     | 69 +++++++++++++++++++++++++++++++++++++++++++++++++++-
  3 files changed, 98 insertions(+), 6 deletions(-)

diff --git a/fs/ceph/debugfs.c b/fs/ceph/debugfs.c
index 60f3e307..bcf7215 100644
--- a/fs/ceph/debugfs.c
+++ b/fs/ceph/debugfs.c
@@ -130,27 +130,43 @@ static int metric_show(struct seq_file *s, void *p)
  	struct ceph_mds_client *mdsc = fsc->mdsc;
  	int i, nr_caps = 0;
  	s64 total, sum, avg = 0;
+	unsigned long min, max;
- seq_printf(s, "item total sum_lat(us) avg_lat(us)\n");
-	seq_printf(s, "-----------------------------------------------------\n");
+	seq_printf(s, "item          total       sum_lat(us)     avg_lat(us)     min_lat(us)     max_lat(us)\n");
+	seq_printf(s, "-------------------------------------------------------------------------------------\n");
total = percpu_counter_sum(&mdsc->metric.total_reads);
  	sum = percpu_counter_sum(&mdsc->metric.read_latency_sum);
  	sum = jiffies_to_usecs(sum);
  	avg = total ? sum / total : 0;
-	seq_printf(s, "%-14s%-12lld%-16lld%lld\n", "read", total, sum, avg);
+	min = atomic_long_read(&mdsc->metric.read_latency_min);
+	min = jiffies_to_usecs(min == ULONG_MAX ? 0 : min);
+	max = atomic_long_read(&mdsc->metric.read_latency_max);
+	max = jiffies_to_usecs(max);
+	seq_printf(s, "%-14s%-12lld%-16lld%-16lld%-16ld%ld\n", "read",
+		   total, sum, avg, min, max);
total = percpu_counter_sum(&mdsc->metric.total_writes);
  	sum = percpu_counter_sum(&mdsc->metric.write_latency_sum);
  	sum = jiffies_to_usecs(sum);
  	avg = total ? sum / total : 0;
-	seq_printf(s, "%-14s%-12lld%-16lld%lld\n", "write", total, sum, avg);
+	min = atomic_long_read(&mdsc->metric.write_latency_min);
+	min = jiffies_to_usecs(min == ULONG_MAX ? 0 : min);
+	max = atomic_long_read(&mdsc->metric.write_latency_max);
+	max = jiffies_to_usecs(max);
+	seq_printf(s, "%-14s%-12lld%-16lld%-16lld%-16ld%ld\n", "write",
+		   total, sum, avg, min, max);
total = percpu_counter_sum(&mdsc->metric.total_metadatas);
  	sum = percpu_counter_sum(&mdsc->metric.metadata_latency_sum);
  	sum = jiffies_to_usecs(sum);
  	avg = total ? sum / total : 0;
-	seq_printf(s, "%-14s%-12lld%-16lld%lld\n", "metadata", total, sum, avg);
+	min = atomic_long_read(&mdsc->metric.metadata_latency_min);
+	min = jiffies_to_usecs(min == ULONG_MAX ? 0 : min);
+	max = atomic_long_read(&mdsc->metric.metadata_latency_max);
+	max = jiffies_to_usecs(max);
+	seq_printf(s, "%-14s%-12lld%-16lld%-16lld%-16ld%ld\n", "metadata",
+		   total, sum, avg, min, max);
seq_printf(s, "\n");
  	seq_printf(s, "item          total           miss            hit\n");
diff --git a/fs/ceph/mds_client.c b/fs/ceph/mds_client.c
index 5c03ed3..7844aa6 100644
--- a/fs/ceph/mds_client.c
+++ b/fs/ceph/mds_client.c
@@ -4358,6 +4358,9 @@ static int ceph_mdsc_metric_init(struct ceph_client_metric *metric)
  	if (ret)
  		goto err_read_latency_sum;
+ atomic_long_set(&metric->read_latency_min, ULONG_MAX);
+	atomic_long_set(&metric->read_latency_max, 0);
+
  	ret = percpu_counter_init(&metric->total_writes, 0, GFP_KERNEL);
  	if (ret)
  		goto err_total_writes;
@@ -4366,6 +4369,9 @@ static int ceph_mdsc_metric_init(struct ceph_client_metric *metric)
  	if (ret)
  		goto err_write_latency_sum;
+ atomic_long_set(&metric->write_latency_min, ULONG_MAX);
+	atomic_long_set(&metric->write_latency_max, 0);
+
  	ret = percpu_counter_init(&metric->total_metadatas, 0, GFP_KERNEL);
  	if (ret)
  		goto err_total_metadatas;
@@ -4374,6 +4380,9 @@ static int ceph_mdsc_metric_init(struct ceph_client_metric *metric)
  	if (ret)
  		goto err_metadata_latency_sum;
+ atomic_long_set(&metric->metadata_latency_min, ULONG_MAX);
+	atomic_long_set(&metric->metadata_latency_max, 0);
+
  	return 0;
err_metadata_latency_sum:
diff --git a/fs/ceph/metric.h b/fs/ceph/metric.h
index faba142..a399201 100644
--- a/fs/ceph/metric.h
+++ b/fs/ceph/metric.h
@@ -2,6 +2,10 @@
  #ifndef _FS_CEPH_MDS_METRIC_H
  #define _FS_CEPH_MDS_METRIC_H
+#include <linux/atomic.h>
+#include <linux/percpu.h>
+#include <linux/spinlock.h>
+
  /* This is the global metrics */
  struct ceph_client_metric {
  	atomic64_t            total_dentries;
@@ -13,12 +17,18 @@ struct ceph_client_metric {
struct percpu_counter total_reads;
  	struct percpu_counter read_latency_sum;
+	atomic_long_t read_latency_min;
+	atomic_long_t read_latency_max;
struct percpu_counter total_writes;
  	struct percpu_counter write_latency_sum;
+	atomic_long_t write_latency_min;
+	atomic_long_t write_latency_max;
struct percpu_counter total_metadatas;
  	struct percpu_counter metadata_latency_sum;
+	atomic_long_t metadata_latency_min;
+	atomic_long_t metadata_latency_max;
  };
static inline void ceph_update_cap_hit(struct ceph_client_metric *m)
@@ -36,11 +46,30 @@ static inline void ceph_update_read_latency(struct ceph_client_metric *m,
  					    unsigned long r_end,
  					    int rc)
  {
+	unsigned long lat = r_end - r_start;
+	unsigned long cur, old;
+
  	if (rc < 0 && rc != -ENOENT && rc != -ETIMEDOUT)
  		return;
percpu_counter_inc(&m->total_reads);
-	percpu_counter_add(&m->read_latency_sum, r_end - r_start);
+	percpu_counter_add(&m->read_latency_sum, lat);
+
+	cur = atomic_long_read(&m->read_latency_min);
+	do {
+		old = cur;
+		if (likely(lat > old))
+			break;
+		cur = atomic_long_cmpxchg(&m->read_latency_min, old, lat);
+	} while (cur != old);
+
+	cur = atomic_long_read(&m->read_latency_max);
+	do {
+		old = cur;
+		if (likely(lat < old))
This should probably be (lat <= old). After all, there's no need to do
the cmpxchg if nothing would change anyway.

All these loops look pretty similar too. Maybe you could add a pair of
helper functions for this (one for min and one for max)?

Yeah, both make sense.

Will fix it.

Thanks.


+			break;
+		cur = atomic_long_cmpxchg(&m->read_latency_max, old, lat);
+	} while (cur != old);
  }
static inline void ceph_update_write_latency(struct ceph_client_metric *m,
@@ -48,11 +77,30 @@ static inline void ceph_update_write_latency(struct ceph_client_metric *m,
  					     unsigned long r_end,
  					     int rc)
  {
+	unsigned long lat = r_end - r_start;
+	unsigned long cur, old;
+
  	if (rc && rc != -ETIMEDOUT)
  		return;
percpu_counter_inc(&m->total_writes);
  	percpu_counter_add(&m->write_latency_sum, r_end - r_start);
+
+	cur = atomic_long_read(&m->write_latency_min);
+	do {
+		old = cur;
+		if (likely(lat > old))
+			break;
+		cur = atomic_long_cmpxchg(&m->write_latency_min, old, lat);
+	} while (cur != old);
+
+	cur = atomic_long_read(&m->write_latency_max);
+	do {
+		old = cur;
+		if (likely(lat < old))
+			break;
+		cur = atomic_long_cmpxchg(&m->write_latency_max, old, lat);
+	} while (cur != old);
  }
static inline void ceph_update_metadata_latency(struct ceph_client_metric *m,
@@ -60,10 +108,29 @@ static inline void ceph_update_metadata_latency(struct ceph_client_metric *m,
  						unsigned long r_end,
  						int rc)
  {
+	unsigned long lat = r_end - r_start;
+	unsigned long cur, old;
+
  	if (rc && rc != -ENOENT)
  		return;
percpu_counter_inc(&m->total_metadatas);
  	percpu_counter_add(&m->metadata_latency_sum, r_end - r_start);
+
+	cur = atomic_long_read(&m->metadata_latency_min);
+	do {
+		old = cur;
+		if (likely(lat > old))
+			break;
+		cur = atomic_long_cmpxchg(&m->metadata_latency_min, old, lat);
+	} while (cur != old);
+
+	cur = atomic_long_read(&m->metadata_latency_max);
+	do {
+		old = cur;
+		if (likely(lat < old))
+			break;
+		cur = atomic_long_cmpxchg(&m->metadata_latency_max, old, lat);
+	} while (cur != old);
  }
  #endif /* _FS_CEPH_MDS_METRIC_H */





[Index of Archives]     [CEPH Users]     [Ceph Large]     [Ceph Dev]     [Information on CEPH]     [Linux BTRFS]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]

  Powered by Linux