| #include <linux/kernel.h> |
| #include <linux/module.h> |
| #include <linux/backing-dev.h> |
| #include <linux/bio.h> |
| #include <linux/blkdev.h> |
| #include <linux/mm.h> |
| #include <linux/init.h> |
| #include <linux/slab.h> |
| #include <linux/workqueue.h> |
| #include <linux/smp.h> |
| |
| #include <linux/blk-mq.h> |
| #include "blk-mq.h" |
| #include "blk-mq-tag.h" |
| |
/*
 * kobject release callback used by every kobj_type declared in this file.
 * The body is empty: this callback itself frees nothing.
 */
static void blk_mq_sysfs_release(struct kobject *kobj)
{
	/* nothing to release here */
}
| |
| struct blk_mq_ctx_sysfs_entry { |
| struct attribute attr; |
| ssize_t (*show)(struct blk_mq_ctx *, char *); |
| ssize_t (*store)(struct blk_mq_ctx *, const char *, size_t); |
| }; |
| |
| struct blk_mq_hw_ctx_sysfs_entry { |
| struct attribute attr; |
| ssize_t (*show)(struct blk_mq_hw_ctx *, char *); |
| ssize_t (*store)(struct blk_mq_hw_ctx *, const char *, size_t); |
| }; |
| |
| static ssize_t blk_mq_sysfs_show(struct kobject *kobj, struct attribute *attr, |
| char *page) |
| { |
| struct blk_mq_ctx_sysfs_entry *entry; |
| struct blk_mq_ctx *ctx; |
| struct request_queue *q; |
| ssize_t res; |
| |
| entry = container_of(attr, struct blk_mq_ctx_sysfs_entry, attr); |
| ctx = container_of(kobj, struct blk_mq_ctx, kobj); |
| q = ctx->queue; |
| |
| if (!entry->show) |
| return -EIO; |
| |
| res = -ENOENT; |
| mutex_lock(&q->sysfs_lock); |
| if (!blk_queue_dying(q)) |
| res = entry->show(ctx, page); |
| mutex_unlock(&q->sysfs_lock); |
| return res; |
| } |
| |
| static ssize_t blk_mq_sysfs_store(struct kobject *kobj, struct attribute *attr, |
| const char *page, size_t length) |
| { |
| struct blk_mq_ctx_sysfs_entry *entry; |
| struct blk_mq_ctx *ctx; |
| struct request_queue *q; |
| ssize_t res; |
| |
| entry = container_of(attr, struct blk_mq_ctx_sysfs_entry, attr); |
| ctx = container_of(kobj, struct blk_mq_ctx, kobj); |
| q = ctx->queue; |
| |
| if (!entry->store) |
| return -EIO; |
| |
| res = -ENOENT; |
| mutex_lock(&q->sysfs_lock); |
| if (!blk_queue_dying(q)) |
| res = entry->store(ctx, page, length); |
| mutex_unlock(&q->sysfs_lock); |
| return res; |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_show(struct kobject *kobj, |
| struct attribute *attr, char *page) |
| { |
| struct blk_mq_hw_ctx_sysfs_entry *entry; |
| struct blk_mq_hw_ctx *hctx; |
| struct request_queue *q; |
| ssize_t res; |
| |
| entry = container_of(attr, struct blk_mq_hw_ctx_sysfs_entry, attr); |
| hctx = container_of(kobj, struct blk_mq_hw_ctx, kobj); |
| q = hctx->queue; |
| |
| if (!entry->show) |
| return -EIO; |
| |
| res = -ENOENT; |
| mutex_lock(&q->sysfs_lock); |
| if (!blk_queue_dying(q)) |
| res = entry->show(hctx, page); |
| mutex_unlock(&q->sysfs_lock); |
| return res; |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_store(struct kobject *kobj, |
| struct attribute *attr, const char *page, |
| size_t length) |
| { |
| struct blk_mq_hw_ctx_sysfs_entry *entry; |
| struct blk_mq_hw_ctx *hctx; |
| struct request_queue *q; |
| ssize_t res; |
| |
| entry = container_of(attr, struct blk_mq_hw_ctx_sysfs_entry, attr); |
| hctx = container_of(kobj, struct blk_mq_hw_ctx, kobj); |
| q = hctx->queue; |
| |
| if (!entry->store) |
| return -EIO; |
| |
| res = -ENOENT; |
| mutex_lock(&q->sysfs_lock); |
| if (!blk_queue_dying(q)) |
| res = entry->store(hctx, page, length); |
| mutex_unlock(&q->sysfs_lock); |
| return res; |
| } |
| |
| static ssize_t blk_mq_sysfs_dispatched_show(struct blk_mq_ctx *ctx, char *page) |
| { |
| return sprintf(page, "%lu %lu\n", ctx->rq_dispatched[1], |
| ctx->rq_dispatched[0]); |
| } |
| |
| static ssize_t blk_mq_sysfs_merged_show(struct blk_mq_ctx *ctx, char *page) |
| { |
| return sprintf(page, "%lu\n", ctx->rq_merged); |
| } |
| |
| static ssize_t blk_mq_sysfs_completed_show(struct blk_mq_ctx *ctx, char *page) |
| { |
| return sprintf(page, "%lu %lu\n", ctx->rq_completed[1], |
| ctx->rq_completed[0]); |
| } |
| |
| static ssize_t sysfs_list_show(char *page, struct list_head *list, char *msg) |
| { |
| struct request *rq; |
| int len = snprintf(page, PAGE_SIZE - 1, "%s:\n", msg); |
| |
| list_for_each_entry(rq, list, queuelist) { |
| const int rq_len = 2 * sizeof(rq) + 2; |
| |
| /* if the output will be truncated */ |
| if (PAGE_SIZE - 1 < len + rq_len) { |
| /* backspacing if it can't hold '\t...\n' */ |
| if (PAGE_SIZE - 1 < len + 5) |
| len -= rq_len; |
| len += snprintf(page + len, PAGE_SIZE - 1 - len, |
| "\t...\n"); |
| break; |
| } |
| len += snprintf(page + len, PAGE_SIZE - 1 - len, |
| "\t%p\n", rq); |
| } |
| |
| return len; |
| } |
| |
| static ssize_t blk_mq_sysfs_rq_list_show(struct blk_mq_ctx *ctx, char *page) |
| { |
| ssize_t ret; |
| |
| spin_lock(&ctx->lock); |
| ret = sysfs_list_show(page, &ctx->rq_list, "CTX pending"); |
| spin_unlock(&ctx->lock); |
| |
| return ret; |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_poll_show(struct blk_mq_hw_ctx *hctx, char *page) |
| { |
| return sprintf(page, "considered=%lu, invoked=%lu, success=%lu\n", |
| hctx->poll_considered, hctx->poll_invoked, |
| hctx->poll_success); |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_poll_store(struct blk_mq_hw_ctx *hctx, |
| const char *page, size_t size) |
| { |
| hctx->poll_considered = hctx->poll_invoked = hctx->poll_success = 0; |
| |
| return size; |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_queued_show(struct blk_mq_hw_ctx *hctx, |
| char *page) |
| { |
| return sprintf(page, "%lu\n", hctx->queued); |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_run_show(struct blk_mq_hw_ctx *hctx, char *page) |
| { |
| return sprintf(page, "%lu\n", hctx->run); |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_dispatched_show(struct blk_mq_hw_ctx *hctx, |
| char *page) |
| { |
| char *start_page = page; |
| int i; |
| |
| page += sprintf(page, "%8u\t%lu\n", 0U, hctx->dispatched[0]); |
| |
| for (i = 1; i < BLK_MQ_MAX_DISPATCH_ORDER - 1; i++) { |
| unsigned int d = 1U << (i - 1); |
| |
| page += sprintf(page, "%8u\t%lu\n", d, hctx->dispatched[i]); |
| } |
| |
| page += sprintf(page, "%8u+\t%lu\n", 1U << (i - 1), |
| hctx->dispatched[i]); |
| return page - start_page; |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_rq_list_show(struct blk_mq_hw_ctx *hctx, |
| char *page) |
| { |
| ssize_t ret; |
| |
| spin_lock(&hctx->lock); |
| ret = sysfs_list_show(page, &hctx->dispatch, "HCTX pending"); |
| spin_unlock(&hctx->lock); |
| |
| return ret; |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_tags_show(struct blk_mq_hw_ctx *hctx, char *page) |
| { |
| return blk_mq_tag_sysfs_show(hctx->tags, page); |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_active_show(struct blk_mq_hw_ctx *hctx, char *page) |
| { |
| return sprintf(page, "%u\n", atomic_read(&hctx->nr_active)); |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_cpus_show(struct blk_mq_hw_ctx *hctx, char *page) |
| { |
| unsigned int i, first = 1; |
| ssize_t ret = 0; |
| |
| for_each_cpu(i, hctx->cpumask) { |
| if (first) |
| ret += sprintf(ret + page, "%u", i); |
| else |
| ret += sprintf(ret + page, ", %u", i); |
| |
| first = 0; |
| } |
| |
| ret += sprintf(ret + page, "\n"); |
| return ret; |
| } |
| |
| static void blk_mq_stat_clear(struct blk_mq_hw_ctx *hctx) |
| { |
| struct blk_mq_ctx *ctx; |
| unsigned int i; |
| |
| hctx_for_each_ctx(hctx, ctx, i) { |
| blk_stat_init(&ctx->stat[BLK_STAT_READ]); |
| blk_stat_init(&ctx->stat[BLK_STAT_WRITE]); |
| } |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_stat_store(struct blk_mq_hw_ctx *hctx, |
| const char *page, size_t count) |
| { |
| blk_mq_stat_clear(hctx); |
| return count; |
| } |
| |
| static ssize_t print_stat(char *page, struct blk_rq_stat *stat, const char *pre) |
| { |
| return sprintf(page, "%s samples=%llu, mean=%lld, min=%lld, max=%lld\n", |
| pre, (long long) stat->nr_samples, |
| (long long) stat->mean, (long long) stat->min, |
| (long long) stat->max); |
| } |
| |
| static ssize_t blk_mq_hw_sysfs_stat_show(struct blk_mq_hw_ctx *hctx, char *page) |
| { |
| struct blk_rq_stat stat[2]; |
| ssize_t ret; |
| |
| blk_stat_init(&stat[BLK_STAT_READ]); |
| blk_stat_init(&stat[BLK_STAT_WRITE]); |
| |
| blk_hctx_stat_get(hctx, stat); |
| |
| ret = print_stat(page, &stat[BLK_STAT_READ], "read :"); |
| ret += print_stat(page + ret, &stat[BLK_STAT_WRITE], "write:"); |
| return ret; |
| } |
| |
| static struct blk_mq_ctx_sysfs_entry blk_mq_sysfs_dispatched = { |
| .attr = {.name = "dispatched", .mode = S_IRUGO }, |
| .show = blk_mq_sysfs_dispatched_show, |
| }; |
| static struct blk_mq_ctx_sysfs_entry blk_mq_sysfs_merged = { |
| .attr = {.name = "merged", .mode = S_IRUGO }, |
| .show = blk_mq_sysfs_merged_show, |
| }; |
| static struct blk_mq_ctx_sysfs_entry blk_mq_sysfs_completed = { |
| .attr = {.name = "completed", .mode = S_IRUGO }, |
| .show = blk_mq_sysfs_completed_show, |
| }; |
| static struct blk_mq_ctx_sysfs_entry blk_mq_sysfs_rq_list = { |
| .attr = {.name = "rq_list", .mode = S_IRUGO }, |
| .show = blk_mq_sysfs_rq_list_show, |
| }; |
| |
| static struct attribute *default_ctx_attrs[] = { |
| &blk_mq_sysfs_dispatched.attr, |
| &blk_mq_sysfs_merged.attr, |
| &blk_mq_sysfs_completed.attr, |
| &blk_mq_sysfs_rq_list.attr, |
| NULL, |
| }; |
| |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_queued = { |
| .attr = {.name = "queued", .mode = S_IRUGO }, |
| .show = blk_mq_hw_sysfs_queued_show, |
| }; |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_run = { |
| .attr = {.name = "run", .mode = S_IRUGO }, |
| .show = blk_mq_hw_sysfs_run_show, |
| }; |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_dispatched = { |
| .attr = {.name = "dispatched", .mode = S_IRUGO }, |
| .show = blk_mq_hw_sysfs_dispatched_show, |
| }; |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_active = { |
| .attr = {.name = "active", .mode = S_IRUGO }, |
| .show = blk_mq_hw_sysfs_active_show, |
| }; |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_pending = { |
| .attr = {.name = "pending", .mode = S_IRUGO }, |
| .show = blk_mq_hw_sysfs_rq_list_show, |
| }; |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_tags = { |
| .attr = {.name = "tags", .mode = S_IRUGO }, |
| .show = blk_mq_hw_sysfs_tags_show, |
| }; |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_cpus = { |
| .attr = {.name = "cpu_list", .mode = S_IRUGO }, |
| .show = blk_mq_hw_sysfs_cpus_show, |
| }; |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_poll = { |
| .attr = {.name = "io_poll", .mode = S_IWUSR | S_IRUGO }, |
| .show = blk_mq_hw_sysfs_poll_show, |
| .store = blk_mq_hw_sysfs_poll_store, |
| }; |
| static struct blk_mq_hw_ctx_sysfs_entry blk_mq_hw_sysfs_stat = { |
| .attr = {.name = "stats", .mode = S_IRUGO | S_IWUSR }, |
| .show = blk_mq_hw_sysfs_stat_show, |
| .store = blk_mq_hw_sysfs_stat_store, |
| }; |
| |
| static struct attribute *default_hw_ctx_attrs[] = { |
| &blk_mq_hw_sysfs_queued.attr, |
| &blk_mq_hw_sysfs_run.attr, |
| &blk_mq_hw_sysfs_dispatched.attr, |
| &blk_mq_hw_sysfs_pending.attr, |
| &blk_mq_hw_sysfs_tags.attr, |
| &blk_mq_hw_sysfs_cpus.attr, |
| &blk_mq_hw_sysfs_active.attr, |
| &blk_mq_hw_sysfs_poll.attr, |
| &blk_mq_hw_sysfs_stat.attr, |
| NULL, |
| }; |
| |
| static const struct sysfs_ops blk_mq_sysfs_ops = { |
| .show = blk_mq_sysfs_show, |
| .store = blk_mq_sysfs_store, |
| }; |
| |
| static const struct sysfs_ops blk_mq_hw_sysfs_ops = { |
| .show = blk_mq_hw_sysfs_show, |
| .store = blk_mq_hw_sysfs_store, |
| }; |
| |
| static struct kobj_type blk_mq_ktype = { |
| .sysfs_ops = &blk_mq_sysfs_ops, |
| .release = blk_mq_sysfs_release, |
| }; |
| |
| static struct kobj_type blk_mq_ctx_ktype = { |
| .sysfs_ops = &blk_mq_sysfs_ops, |
| .default_attrs = default_ctx_attrs, |
| .release = blk_mq_sysfs_release, |
| }; |
| |
| static struct kobj_type blk_mq_hw_ktype = { |
| .sysfs_ops = &blk_mq_hw_sysfs_ops, |
| .default_attrs = default_hw_ctx_attrs, |
| .release = blk_mq_sysfs_release, |
| }; |
| |
| static void blk_mq_unregister_hctx(struct blk_mq_hw_ctx *hctx) |
| { |
| struct blk_mq_ctx *ctx; |
| int i; |
| |
| if (!hctx->nr_ctx) |
| return; |
| |
| hctx_for_each_ctx(hctx, ctx, i) |
| kobject_del(&ctx->kobj); |
| |
| kobject_del(&hctx->kobj); |
| } |
| |
| static int blk_mq_register_hctx(struct blk_mq_hw_ctx *hctx) |
| { |
| struct request_queue *q = hctx->queue; |
| struct blk_mq_ctx *ctx; |
| int i, ret; |
| |
| if (!hctx->nr_ctx) |
| return 0; |
| |
| ret = kobject_add(&hctx->kobj, &q->mq_kobj, "%u", hctx->queue_num); |
| if (ret) |
| return ret; |
| |
| hctx_for_each_ctx(hctx, ctx, i) { |
| ret = kobject_add(&ctx->kobj, &hctx->kobj, "cpu%u", ctx->cpu); |
| if (ret) |
| break; |
| } |
| |
| return ret; |
| } |
| |
| static void __blk_mq_unregister_dev(struct device *dev, struct request_queue *q) |
| { |
| struct blk_mq_hw_ctx *hctx; |
| struct blk_mq_ctx *ctx; |
| int i, j; |
| |
| queue_for_each_hw_ctx(q, hctx, i) { |
| blk_mq_unregister_hctx(hctx); |
| |
| hctx_for_each_ctx(hctx, ctx, j) |
| kobject_put(&ctx->kobj); |
| |
| kobject_put(&hctx->kobj); |
| } |
| |
| kobject_uevent(&q->mq_kobj, KOBJ_REMOVE); |
| kobject_del(&q->mq_kobj); |
| kobject_put(&q->mq_kobj); |
| |
| kobject_put(&dev->kobj); |
| |
| q->mq_sysfs_init_done = false; |
| } |
| |
/*
 * Remove the blk-mq sysfs hierarchy of @q from @dev.
 * Wraps __blk_mq_unregister_dev() in a blk-mq hotplug disable/enable pair.
 */
void blk_mq_unregister_dev(struct device *dev, struct request_queue *q)
{
	blk_mq_disable_hotplug();

	__blk_mq_unregister_dev(dev, q);

	blk_mq_enable_hotplug();
}
| |
| void blk_mq_hctx_kobj_init(struct blk_mq_hw_ctx *hctx) |
| { |
| kobject_init(&hctx->kobj, &blk_mq_hw_ktype); |
| } |
| |
| static void blk_mq_sysfs_init(struct request_queue *q) |
| { |
| struct blk_mq_ctx *ctx; |
| int cpu; |
| |
| kobject_init(&q->mq_kobj, &blk_mq_ktype); |
| |
| for_each_possible_cpu(cpu) { |
| ctx = per_cpu_ptr(q->queue_ctx, cpu); |
| kobject_init(&ctx->kobj, &blk_mq_ctx_ktype); |
| } |
| } |
| |
| int blk_mq_register_dev(struct device *dev, struct request_queue *q) |
| { |
| struct blk_mq_hw_ctx *hctx; |
| int ret, i; |
| |
| blk_mq_disable_hotplug(); |
| |
| blk_mq_sysfs_init(q); |
| |
| ret = kobject_add(&q->mq_kobj, kobject_get(&dev->kobj), "%s", "mq"); |
| if (ret < 0) |
| goto out; |
| |
| kobject_uevent(&q->mq_kobj, KOBJ_ADD); |
| |
| queue_for_each_hw_ctx(q, hctx, i) { |
| ret = blk_mq_register_hctx(hctx); |
| if (ret) |
| break; |
| } |
| |
| if (ret) |
| __blk_mq_unregister_dev(dev, q); |
| else |
| q->mq_sysfs_init_done = true; |
| out: |
| blk_mq_enable_hotplug(); |
| |
| return ret; |
| } |
| EXPORT_SYMBOL_GPL(blk_mq_register_dev); |
| |
| void blk_mq_sysfs_unregister(struct request_queue *q) |
| { |
| struct blk_mq_hw_ctx *hctx; |
| int i; |
| |
| if (!q->mq_sysfs_init_done) |
| return; |
| |
| queue_for_each_hw_ctx(q, hctx, i) |
| blk_mq_unregister_hctx(hctx); |
| } |
| |
| int blk_mq_sysfs_register(struct request_queue *q) |
| { |
| struct blk_mq_hw_ctx *hctx; |
| int i, ret = 0; |
| |
| if (!q->mq_sysfs_init_done) |
| return ret; |
| |
| queue_for_each_hw_ctx(q, hctx, i) { |
| ret = blk_mq_register_hctx(hctx); |
| if (ret) |
| break; |
| } |
| |
| return ret; |
| } |