block: add scalable completion tracking of requests

For legacy block, we simply track them in the request queue. For blk-mq, we track them on a per-sw queue basis, which we can then sum up through the hardware queues and finally to a per device state. The stats are tracked in, roughly, 0.1s interval windows. Add sysfs files to display the stats. The feature is off by default, to avoid any extra overhead. In-kernel users of it can turn it on by setting QUEUE_FLAG_STATS in the queue flags. We currently don't turn it on if someone just reads any of the stats files, that is something we could add as well. Signed-off-by: Jens Axboe <axboe@fb.com>
author: Jens Axboe <axboe@fb.com> 2016-11-07 21:32:37 -0700
committer: Jens Axboe <axboe@fb.com> 2016-11-10 13:53:26 -0700
commit: cf43e6be865a582ba66ee4747ae27a0513f6bba1 (patch)
tree: 53b71dd2f456e4880428683631fd09c9dc0747a5 /block/blk-mq.c
parent: ebc4ff661fbe76781c6b16dfb7b754a5d5073f8e (diff)
download: talos-obmc-linux-cf43e6be865a582ba66ee4747ae27a0513f6bba1.tar.gz
talos-obmc-linux-cf43e6be865a582ba66ee4747ae27a0513f6bba1.zip
1 files changed, 25 insertions, 0 deletions
diff --git a/block/blk-mq.c b/block/blk-mq.c
index 6f5cb3f3dcac..19795886d46e 100644
--- a/block/blk-mq.c
+++ b/block/blk-mq.c
@@ -30,6 +30,7 @@
 #include "blk.h"
 #include "blk-mq.h"
 #include "blk-mq-tag.h"
+#include "blk-stat.h"
 
 static DEFINE_MUTEX(all_q_mutex);
 static LIST_HEAD(all_q_list);
@@ -403,10 +404,27 @@ static void blk_mq_ipi_complete_request(struct request *rq)
 	put_cpu();
 }
 
+static void blk_mq_stat_add(struct request *rq)
+{
+	if (rq->rq_flags & RQF_STATS) {
+		/*
+		 * We could rq->mq_ctx here, but there's less of a risk
+		 * of races if we have the completion event add the stats
+		 * to the local software queue.
+		 */
+		struct blk_mq_ctx *ctx;
+
+		ctx = __blk_mq_get_ctx(rq->q, raw_smp_processor_id());
+		blk_stat_add(&ctx->stat[rq_data_dir(rq)], rq);
+	}
+}
+
 static void __blk_mq_complete_request(struct request *rq)
 {
 	struct request_queue *q = rq->q;
 
+	blk_mq_stat_add(rq);
+
 	if (!q->softirq_done_fn)
 		blk_mq_end_request(rq, rq->errors);
 	else
@@ -450,6 +468,11 @@ void blk_mq_start_request(struct request *rq)
 	if (unlikely(blk_bidi_rq(rq)))
 		rq->next_rq->resid_len = blk_rq_bytes(rq->next_rq);
 
+	if (test_bit(QUEUE_FLAG_STATS, &q->queue_flags)) {
+		blk_stat_set_issue_time(&rq->issue_stat);
+		rq->rq_flags |= RQF_STATS;
+	}
+
 	blk_add_timer(rq);
 
 	/*
@@ -1784,6 +1807,8 @@ static void blk_mq_init_cpu_queues(struct request_queue *q,
 		spin_lock_init(&__ctx->lock);
 		INIT_LIST_HEAD(&__ctx->rq_list);
 		__ctx->queue = q;
+		blk_stat_init(&__ctx->stat[BLK_STAT_READ]);
+		blk_stat_init(&__ctx->stat[BLK_STAT_WRITE]);
 
 		/* If the cpu isn't online, the cpu is mapped to first hctx */
 		if (!cpu_online(i))
author	Jens Axboe <axboe@fb.com>	2016-11-07 21:32:37 -0700
committer	Jens Axboe <axboe@fb.com>	2016-11-10 13:53:26 -0700
commit	cf43e6be865a582ba66ee4747ae27a0513f6bba1 (patch)
tree	53b71dd2f456e4880428683631fd09c9dc0747a5 /block/blk-mq.c
parent	ebc4ff661fbe76781c6b16dfb7b754a5d5073f8e (diff)
download	talos-obmc-linux-cf43e6be865a582ba66ee4747ae27a0513f6bba1.tar.gz talos-obmc-linux-cf43e6be865a582ba66ee4747ae27a0513f6bba1.zip