nvme-rdma: support separate queue maps for read and write
author	Sagi Grimberg <sagi@grimberg.me>
	Wed, 12 Dec 2018 07:38:58 +0000 (23:38 -0800)
committer	Christoph Hellwig <hch@lst.de>
	Thu, 13 Dec 2018 08:59:10 +0000 (09:59 +0100)
Allow NVMF_OPT_NR_WRITE_QUEUES to describe additional write queues.  In
addition, implement .map_queues to apply two separate queue maps for the
read and write queue sets.

Note that with the separate queue map, HCTX_TYPE_READ will always use
nr_io_queues and HCTX_TYPE_DEFAULT will use nr_write_queues.
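
To illustrate the note above, here is a minimal user-space sketch (not part of
the patch) that follows the same queue-layout arithmetic as the code below; the
nr_io_queues and nr_write_queues values are hypothetical examples.

/*
 * Illustrative sketch only: shows how the two blk-mq queue maps divide
 * the RDMA I/O queues when separate write queues are requested.
 */
#include <stdio.h>

int main(void)
{
	unsigned int nr_io_queues = 4;		/* read queues -> HCTX_TYPE_READ */
	unsigned int nr_write_queues = 2;	/* write queues -> HCTX_TYPE_DEFAULT */

	/* +1 accounts for the admin queue, as in nvme_rdma_create_ctrl() */
	unsigned int queue_count = nr_io_queues + nr_write_queues + 1;

	if (nr_write_queues) {
		/* separate read/write queues: writes first, reads follow */
		printf("HCTX_TYPE_DEFAULT: queues [0..%u)\n", nr_write_queues);
		printf("HCTX_TYPE_READ:    queues [%u..%u)\n",
		       nr_write_queues, nr_write_queues + nr_io_queues);
	} else {
		/* mixed read/write queues: both maps cover the same range */
		printf("both maps: queues [0..%u)\n", nr_io_queues);
	}
	printf("controller queue_count (including admin queue): %u\n", queue_count);
	return 0;
}

With these example values, HCTX_TYPE_DEFAULT covers hardware contexts 0-1 and
HCTX_TYPE_READ covers 2-5, matching the queue_offset/nr_queues assignments made
in nvme_rdma_map_queues() below.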

Signed-off-by: Sagi Grimberg <sagi@grimberg.me>
Signed-off-by: Christoph Hellwig <hch@lst.de>
drivers/nvme/host/rdma.c

index 5057d5ab5aaae58c3ca4c6369b0ec26f52ce0a6f..ed726da77b5b48f2ecab2e8830ef35a279a9d830 100644
@@ -645,6 +645,8 @@ static int nvme_rdma_alloc_io_queues(struct nvme_rdma_ctrl *ctrl)
        nr_io_queues = min_t(unsigned int, nr_io_queues,
                                ibdev->num_comp_vectors);
 
+       nr_io_queues += min(opts->nr_write_queues, num_online_cpus());
+
        ret = nvme_set_queue_count(&ctrl->ctrl, &nr_io_queues);
        if (ret)
                return ret;
@@ -714,6 +716,7 @@ static struct blk_mq_tag_set *nvme_rdma_alloc_tagset(struct nvme_ctrl *nctrl,
                set->driver_data = ctrl;
                set->nr_hw_queues = nctrl->queue_count - 1;
                set->timeout = NVME_IO_TIMEOUT;
+               set->nr_maps = 2 /* default + read */;
        }
 
        ret = blk_mq_alloc_tag_set(set);
@@ -1751,7 +1754,25 @@ static int nvme_rdma_map_queues(struct blk_mq_tag_set *set)
 {
        struct nvme_rdma_ctrl *ctrl = set->driver_data;
 
-       return blk_mq_rdma_map_queues(&set->map[0], ctrl->device->dev, 0);
+       set->map[HCTX_TYPE_DEFAULT].queue_offset = 0;
+       set->map[HCTX_TYPE_READ].nr_queues = ctrl->ctrl.opts->nr_io_queues;
+       if (ctrl->ctrl.opts->nr_write_queues) {
+               /* separate read/write queues */
+               set->map[HCTX_TYPE_DEFAULT].nr_queues =
+                               ctrl->ctrl.opts->nr_write_queues;
+               set->map[HCTX_TYPE_READ].queue_offset =
+                               ctrl->ctrl.opts->nr_write_queues;
+       } else {
+               /* mixed read/write queues */
+               set->map[HCTX_TYPE_DEFAULT].nr_queues =
+                               ctrl->ctrl.opts->nr_io_queues;
+               set->map[HCTX_TYPE_READ].queue_offset = 0;
+       }
+       blk_mq_rdma_map_queues(&set->map[HCTX_TYPE_DEFAULT],
+                       ctrl->device->dev, 0);
+       blk_mq_rdma_map_queues(&set->map[HCTX_TYPE_READ],
+                       ctrl->device->dev, 0);
+       return 0;
 }
 
 static const struct blk_mq_ops nvme_rdma_mq_ops = {
@@ -1906,7 +1927,7 @@ static struct nvme_ctrl *nvme_rdma_create_ctrl(struct device *dev,
        INIT_WORK(&ctrl->err_work, nvme_rdma_error_recovery_work);
        INIT_WORK(&ctrl->ctrl.reset_work, nvme_rdma_reset_ctrl_work);
 
-       ctrl->ctrl.queue_count = opts->nr_io_queues + 1; /* +1 for admin queue */
+       ctrl->ctrl.queue_count = opts->nr_io_queues + opts->nr_write_queues + 1;
        ctrl->ctrl.sqsize = opts->queue_size - 1;
        ctrl->ctrl.kato = opts->kato;
 
@@ -1957,7 +1978,8 @@ static struct nvmf_transport_ops nvme_rdma_transport = {
        .module         = THIS_MODULE,
        .required_opts  = NVMF_OPT_TRADDR,
        .allowed_opts   = NVMF_OPT_TRSVCID | NVMF_OPT_RECONNECT_DELAY |
-                         NVMF_OPT_HOST_TRADDR | NVMF_OPT_CTRL_LOSS_TMO,
+                         NVMF_OPT_HOST_TRADDR | NVMF_OPT_CTRL_LOSS_TMO |
+                         NVMF_OPT_NR_WRITE_QUEUES,
        .create_ctrl    = nvme_rdma_create_ctrl,
 };