blk-mq: add ->init_request and ->exit_request methods
authorChristoph Hellwig <hch@lst.de>
Tue, 15 Apr 2014 19:59:10 +0000 (13:59 -0600)
committerJens Axboe <axboe@fb.com>
Tue, 15 Apr 2014 20:03:03 +0000 (14:03 -0600)
The current blk_mq_init_commands/blk_mq_free_commands interface has a
two problems:

 1) Because only the constructor is passed to blk_mq_init_commands there
    is no easy way to clean up when a comman initialization failed.  The
    current code simply leaks the allocations done in the constructor.

 2) There is no good place to call blk_mq_free_commands: before
    blk_cleanup_queue there is no guarantee that all outstanding
    commands have completed, so we can't free them yet.  After
    blk_cleanup_queue the queue has usually been freed.  This can be
    worked around by grabbing an unconditional reference before calling
    blk_cleanup_queue and dropping it after blk_mq_free_commands is
    done, although that's not exatly pretty and driver writers are
    guaranteed to get it wrong sooner or later.

Both issues are easily fixed by making the request constructor and
destructor normal blk_mq_ops methods.

Signed-off-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Jens Axboe <axboe@fb.com>
block/blk-mq.c
drivers/block/virtio_blk.c
include/linux/blk-mq.h

index e644feec068c258b7b1fce66a34f1821209543e5..48d2d8495f5e5d3b0e91f391556aa752ce86d94f 100644 (file)
@@ -1031,74 +1031,20 @@ static void blk_mq_hctx_notify(void *data, unsigned long action,
        blk_mq_put_ctx(ctx);
 }
 
-static int blk_mq_init_hw_commands(struct blk_mq_hw_ctx *hctx,
-                                  int (*init)(void *, struct blk_mq_hw_ctx *,
-                                       struct request *, unsigned int),
-                                  void *data)
+static void blk_mq_free_rq_map(struct blk_mq_hw_ctx *hctx, void *driver_data)
 {
-       unsigned int i;
-       int ret = 0;
-
-       for (i = 0; i < hctx->queue_depth; i++) {
-               struct request *rq = hctx->rqs[i];
-
-               ret = init(data, hctx, rq, i);
-               if (ret)
-                       break;
-       }
-
-       return ret;
-}
-
-int blk_mq_init_commands(struct request_queue *q,
-                        int (*init)(void *, struct blk_mq_hw_ctx *,
-                                       struct request *, unsigned int),
-                        void *data)
-{
-       struct blk_mq_hw_ctx *hctx;
-       unsigned int i;
-       int ret = 0;
-
-       queue_for_each_hw_ctx(q, hctx, i) {
-               ret = blk_mq_init_hw_commands(hctx, init, data);
-               if (ret)
-                       break;
-       }
-
-       return ret;
-}
-EXPORT_SYMBOL(blk_mq_init_commands);
-
-static void blk_mq_free_hw_commands(struct blk_mq_hw_ctx *hctx,
-                                   void (*free)(void *, struct blk_mq_hw_ctx *,
-                                       struct request *, unsigned int),
-                                   void *data)
-{
-       unsigned int i;
+       struct page *page;
 
-       for (i = 0; i < hctx->queue_depth; i++) {
-               struct request *rq = hctx->rqs[i];
+       if (hctx->rqs && hctx->queue->mq_ops->exit_request) {
+               int i;
 
-               free(data, hctx, rq, i);
+               for (i = 0; i < hctx->queue_depth; i++) {
+                       if (!hctx->rqs[i])
+                               continue;
+                       hctx->queue->mq_ops->exit_request(driver_data, hctx,
+                                                         hctx->rqs[i], i);
+               }
        }
-}
-
-void blk_mq_free_commands(struct request_queue *q,
-                         void (*free)(void *, struct blk_mq_hw_ctx *,
-                                       struct request *, unsigned int),
-                         void *data)
-{
-       struct blk_mq_hw_ctx *hctx;
-       unsigned int i;
-
-       queue_for_each_hw_ctx(q, hctx, i)
-               blk_mq_free_hw_commands(hctx, free, data);
-}
-EXPORT_SYMBOL(blk_mq_free_commands);
-
-static void blk_mq_free_rq_map(struct blk_mq_hw_ctx *hctx)
-{
-       struct page *page;
 
        while (!list_empty(&hctx->page_list)) {
                page = list_first_entry(&hctx->page_list, struct page, lru);
@@ -1123,10 +1069,12 @@ static size_t order_to_size(unsigned int order)
 }
 
 static int blk_mq_init_rq_map(struct blk_mq_hw_ctx *hctx,
-                             unsigned int reserved_tags, int node)
+               struct blk_mq_reg *reg, void *driver_data, int node)
 {
+       unsigned int reserved_tags = reg->reserved_tags;
        unsigned int i, j, entries_per_page, max_order = 4;
        size_t rq_size, left;
+       int error;
 
        INIT_LIST_HEAD(&hctx->page_list);
 
@@ -1175,14 +1123,23 @@ static int blk_mq_init_rq_map(struct blk_mq_hw_ctx *hctx,
                for (j = 0; j < to_do; j++) {
                        hctx->rqs[i] = p;
                        blk_rq_init(hctx->queue, hctx->rqs[i]);
+                       if (reg->ops->init_request) {
+                               error = reg->ops->init_request(driver_data,
+                                               hctx, hctx->rqs[i], i);
+                               if (error)
+                                       goto err_rq_map;
+                       }
+
                        p += rq_size;
                        i++;
                }
        }
 
-       if (i < (reserved_tags + BLK_MQ_TAG_MIN))
+       if (i < (reserved_tags + BLK_MQ_TAG_MIN)) {
+               error = -ENOMEM;
                goto err_rq_map;
-       else if (i != hctx->queue_depth) {
+       }
+       if (i != hctx->queue_depth) {
                hctx->queue_depth = i;
                pr_warn("%s: queue depth set to %u because of low memory\n",
                                        __func__, i);
@@ -1190,12 +1147,14 @@ static int blk_mq_init_rq_map(struct blk_mq_hw_ctx *hctx,
 
        hctx->tags = blk_mq_init_tags(hctx->queue_depth, reserved_tags, node);
        if (!hctx->tags) {
-err_rq_map:
-               blk_mq_free_rq_map(hctx);
-               return -ENOMEM;
+               error = -ENOMEM;
+               goto err_rq_map;
        }
 
        return 0;
+err_rq_map:
+       blk_mq_free_rq_map(hctx, driver_data);
+       return error;
 }
 
 static int blk_mq_init_hw_queues(struct request_queue *q,
@@ -1228,7 +1187,7 @@ static int blk_mq_init_hw_queues(struct request_queue *q,
                                                blk_mq_hctx_notify, hctx);
                blk_mq_register_cpu_notifier(&hctx->cpu_notifier);
 
-               if (blk_mq_init_rq_map(hctx, reg->reserved_tags, node))
+               if (blk_mq_init_rq_map(hctx, reg, driver_data, node))
                        break;
 
                /*
@@ -1268,7 +1227,7 @@ static int blk_mq_init_hw_queues(struct request_queue *q,
                        reg->ops->exit_hctx(hctx, j);
 
                blk_mq_unregister_cpu_notifier(&hctx->cpu_notifier);
-               blk_mq_free_rq_map(hctx);
+               blk_mq_free_rq_map(hctx, driver_data);
                kfree(hctx->ctxs);
        }
 
@@ -1455,7 +1414,7 @@ void blk_mq_free_queue(struct request_queue *q)
        queue_for_each_hw_ctx(q, hctx, i) {
                kfree(hctx->ctx_map);
                kfree(hctx->ctxs);
-               blk_mq_free_rq_map(hctx);
+               blk_mq_free_rq_map(hctx, q->queuedata);
                blk_mq_unregister_cpu_notifier(&hctx->cpu_notifier);
                if (q->mq_ops->exit_hctx)
                        q->mq_ops->exit_hctx(hctx, i);
index c7d02bc9d945cf590931d479ff552b65a75fc3b3..d06206abd340e27f302b423a9c788f322d078def 100644 (file)
@@ -480,11 +480,22 @@ static const struct device_attribute dev_attr_cache_type_rw =
        __ATTR(cache_type, S_IRUGO|S_IWUSR,
               virtblk_cache_type_show, virtblk_cache_type_store);
 
+static int virtblk_init_request(void *data, struct blk_mq_hw_ctx *hctx,
+               struct request *rq, unsigned int nr)
+{
+       struct virtio_blk *vblk = data;
+       struct virtblk_req *vbr = blk_mq_rq_to_pdu(rq);
+
+       sg_init_table(vbr->sg, vblk->sg_elems);
+       return 0;
+}
+
 static struct blk_mq_ops virtio_mq_ops = {
        .queue_rq       = virtio_queue_rq,
        .map_queue      = blk_mq_map_queue,
        .alloc_hctx     = blk_mq_alloc_single_hw_queue,
        .free_hctx      = blk_mq_free_single_hw_queue,
+       .init_request   = virtblk_init_request,
        .complete       = virtblk_request_done,
 };
 
@@ -497,16 +508,6 @@ static struct blk_mq_reg virtio_mq_reg = {
 };
 module_param_named(queue_depth, virtio_mq_reg.queue_depth, uint, 0444);
 
-static int virtblk_init_vbr(void *data, struct blk_mq_hw_ctx *hctx,
-                            struct request *rq, unsigned int nr)
-{
-       struct virtio_blk *vblk = data;
-       struct virtblk_req *vbr = blk_mq_rq_to_pdu(rq);
-
-       sg_init_table(vbr->sg, vblk->sg_elems);
-       return 0;
-}
-
 static int virtblk_probe(struct virtio_device *vdev)
 {
        struct virtio_blk *vblk;
@@ -577,8 +578,6 @@ static int virtblk_probe(struct virtio_device *vdev)
                goto out_put_disk;
        }
 
-       blk_mq_init_commands(q, virtblk_init_vbr, vblk);
-
        q->queuedata = vblk;
 
        virtblk_name_format("vd", index, vblk->disk->disk_name, DISK_NAME_LEN);
index b6ee48740458232d9e0ce56edffd0195e833ab4d..29c1a6e83814b319d9a241cc0965c507c054756c 100644 (file)
@@ -67,6 +67,10 @@ typedef struct blk_mq_hw_ctx *(alloc_hctx_fn)(struct blk_mq_reg *,unsigned int);
 typedef void (free_hctx_fn)(struct blk_mq_hw_ctx *, unsigned int);
 typedef int (init_hctx_fn)(struct blk_mq_hw_ctx *, void *, unsigned int);
 typedef void (exit_hctx_fn)(struct blk_mq_hw_ctx *, unsigned int);
+typedef int (init_request_fn)(void *, struct blk_mq_hw_ctx *,
+               struct request *, unsigned int);
+typedef void (exit_request_fn)(void *, struct blk_mq_hw_ctx *,
+               struct request *, unsigned int);
 
 struct blk_mq_ops {
        /*
@@ -99,6 +103,14 @@ struct blk_mq_ops {
         */
        init_hctx_fn            *init_hctx;
        exit_hctx_fn            *exit_hctx;
+
+       /*
+        * Called for every command allocated by the block layer to allow
+        * the driver to set up driver specific data.
+        * Ditto for exit/teardown.
+        */
+       init_request_fn         *init_request;
+       exit_request_fn         *exit_request;
 };
 
 enum {
@@ -118,8 +130,6 @@ enum {
 struct request_queue *blk_mq_init_queue(struct blk_mq_reg *, void *);
 int blk_mq_register_disk(struct gendisk *);
 void blk_mq_unregister_disk(struct gendisk *);
-int blk_mq_init_commands(struct request_queue *, int (*init)(void *data, struct blk_mq_hw_ctx *, struct request *, unsigned int), void *data);
-void blk_mq_free_commands(struct request_queue *, void (*free)(void *data, struct blk_mq_hw_ctx *, struct request *, unsigned int), void *data);
 
 void blk_mq_flush_plug_list(struct blk_plug *plug, bool from_schedule);