blk-mq: introduce BLK_STS_DEV_RESOURCE

author Ming Lei <ming.lei@redhat.com>

Wed, 27 Nov 2019 20:18:13 +0000 (17:18 -0300)

committer Marcelo Henrique Cerri <marcelo.cerri@canonical.com>

Fri, 17 Jan 2020 17:23:12 +0000 (14:23 -0300)
author Ming Lei <ming.lei@redhat.com>
Wed, 27 Nov 2019 20:18:13 +0000 (17:18 -0300)
committer Marcelo Henrique Cerri <marcelo.cerri@canonical.com>
Fri, 17 Jan 2020 17:23:12 +0000 (14:23 -0300)
diff --git a/block/blk-core.c b/block/blk-core.c

index 1ae88e0a7ed4dde83f28f61e46ae6dea4d8c89b9..30a3cb2eca5a14a53685697da75ded6621d1ef5d 100644 (file)
--- a/block/blk-core.c
+++ b/block/blk-core.c
@@ -143,6 +143,7 @@ static const struct {
         [BLK_STS_MEDIUM]        = { -ENODATA,   "critical medium" },
         [BLK_STS_PROTECTION]    = { -EILSEQ,    "protection" },
         [BLK_STS_RESOURCE]      = { -ENOMEM,    "kernel resource" },
+       [BLK_STS_DEV_RESOURCE]  = { -EBUSY,     "device resource" },
         [BLK_STS_AGAIN]         = { -EAGAIN,    "nonblocking retry" },
  
         /* device mapper special case, should not leak out: */
diff --git a/block/blk-mq.c b/block/blk-mq.c

index 9e2650020281640e65058d309a802fcc5bd6d6f5..6e2014cd5101e9865eb30f79318ed3570b40a373 100644 (file)
--- a/block/blk-mq.c
+++ b/block/blk-mq.c
@@ -1121,6 +1121,8 @@ static bool blk_mq_mark_tag_wait(struct blk_mq_hw_ctx **hctx,
         }
  }
  
+#define BLK_MQ_RESOURCE_DELAY  3               /* ms units */
+
  bool blk_mq_dispatch_rq_list(struct request_queue *q, struct list_head *list,
                              bool got_budget)
  {
@@ -1128,6 +1130,7 @@ bool blk_mq_dispatch_rq_list(struct request_queue *q, struct list_head *list,
         struct request *rq, *nxt;
         bool no_tag = false;
         int errors, queued;
+       blk_status_t ret = BLK_STS_OK;
  
         if (list_empty(list))
                 return false;
@@ -1140,7 +1143,6 @@ bool blk_mq_dispatch_rq_list(struct request_queue *q, struct list_head *list,
         errors = queued = 0;
         do {
                 struct blk_mq_queue_data bd;
-               blk_status_t ret;
  
                 rq = list_first_entry(list, struct request, queuelist);
  
@@ -1184,7 +1186,7 @@ bool blk_mq_dispatch_rq_list(struct request_queue *q, struct list_head *list,
                 }
  
                 ret = q->mq_ops->queue_rq(hctx, &bd);
-               if (ret == BLK_STS_RESOURCE) {
+               if (ret == BLK_STS_RESOURCE || ret == BLK_STS_DEV_RESOURCE) {
                         /*
                          * If an I/O scheduler has been configured and we got a
                          * driver tag for the next request already, free it
@@ -1215,6 +1217,8 @@ bool blk_mq_dispatch_rq_list(struct request_queue *q, struct list_head *list,
          * that is where we will continue on next queue run.
          */
         if (!list_empty(list)) {
+               bool needs_restart;
+
                 spin_lock(&hctx->lock);
                 list_splice_init(list, &hctx->dispatch);
                 spin_unlock(&hctx->lock);
@@ -1238,10 +1242,17 @@ bool blk_mq_dispatch_rq_list(struct request_queue *q, struct list_head *list,
                  * - Some but not all block drivers stop a queue before
                  *   returning BLK_STS_RESOURCE. Two exceptions are scsi-mq
                  *   and dm-rq.
+                *
+                * If the driver returns BLK_STS_RESOURCE and the SCHED_RESTART
+                * bit is set, run the queue after a delay to avoid IO stalls
+                * that could otherwise occur if the queue is idle.
                  */
-               if (!blk_mq_sched_needs_restart(hctx) ||
+               needs_restart = blk_mq_sched_needs_restart(hctx);
+               if (!needs_restart ||
                     (no_tag && list_empty_careful(&hctx->dispatch_wait.entry)))
                         blk_mq_run_hw_queue(hctx, true);
+               else if (needs_restart && (ret == BLK_STS_RESOURCE))
+                       blk_mq_delay_run_hw_queue(hctx, BLK_MQ_RESOURCE_DELAY);
         }
  
         return (queued + errors) != 0;
@@ -1722,6 +1733,7 @@ static blk_status_t __blk_mq_issue_directly(struct blk_mq_hw_ctx *hctx,
                 *cookie = new_cookie;
                 break;
         case BLK_STS_RESOURCE:
+       case BLK_STS_DEV_RESOURCE:
                 __blk_mq_requeue_request(rq);
                 break;
         default:
@@ -1784,7 +1796,7 @@ static void blk_mq_try_issue_directly(struct blk_mq_hw_ctx *hctx,
         hctx_lock(hctx, &srcu_idx);
  
         ret = __blk_mq_try_issue_directly(hctx, rq, cookie, false);
-       if (ret == BLK_STS_RESOURCE)
+       if (ret == BLK_STS_RESOURCE || ret == BLK_STS_DEV_RESOURCE)
                 blk_mq_sched_insert_request(rq, false, true, false);
         else if (ret != BLK_STS_OK)
                 blk_mq_end_request(rq, ret);
diff --git a/drivers/block/null_blk.c b/drivers/block/null_blk.c

index b7d9528c3b9d512d773cd05219ced3515f88f940..79b896f07b010d96b284bdd1722686fca4aadda9 100644 (file)
--- a/drivers/block/null_blk.c
+++ b/drivers/block/null_blk.c
@@ -1239,7 +1239,7 @@ static blk_status_t null_handle_cmd(struct nullb_cmd *cmd)
                                 return BLK_STS_OK;
                         } else
                                 /* requeue request */
-                               return BLK_STS_RESOURCE;
+                               return BLK_STS_DEV_RESOURCE;
                 }
         }
  
diff --git a/drivers/block/virtio_blk.c b/drivers/block/virtio_blk.c

index 8767401f75e0420823942c48e6c22b2c24c71655..78dbaab476334a864a0ac8c98a76880440ec6ca3 100644 (file)
--- a/drivers/block/virtio_blk.c
+++ b/drivers/block/virtio_blk.c
@@ -276,7 +276,7 @@ static blk_status_t virtio_queue_rq(struct blk_mq_hw_ctx *hctx,
                 /* Out of mem doesn't actually happen, since we fall back
                  * to direct descriptors */
                 if (err == -ENOMEM || err == -ENOSPC)
-                       return BLK_STS_RESOURCE;
+                       return BLK_STS_DEV_RESOURCE;
                 return BLK_STS_IOERR;
         }
  
diff --git a/drivers/block/xen-blkfront.c b/drivers/block/xen-blkfront.c

index 32ac5f551e55f22cdc4c14b7321007cfd939156b..a98f78b9c4c6eb74c9a7f23d7ccde1236f9daddc 100644 (file)
--- a/drivers/block/xen-blkfront.c
+++ b/drivers/block/xen-blkfront.c
@@ -912,7 +912,7 @@ out_err:
  out_busy:
         blk_mq_stop_hw_queue(hctx);
         spin_unlock_irqrestore(&rinfo->ring_lock, flags);
-       return BLK_STS_RESOURCE;
+       return BLK_STS_DEV_RESOURCE;
  }
  
  static void blkif_complete_rq(struct request *rq)
diff --git a/drivers/md/dm-rq.c b/drivers/md/dm-rq.c

index 134cd855ba35a39364bf9881529976ce31da227d..2af020c6bea2dc513b92f8a5f71821a38d21f22e 100644 (file)
--- a/drivers/md/dm-rq.c
+++ b/drivers/md/dm-rq.c
@@ -404,7 +404,7 @@ static blk_status_t dm_dispatch_clone_request(struct request *clone, struct requ
  
         clone->start_time = jiffies;
         r = blk_insert_cloned_request(clone->q, clone);
-       if (r != BLK_STS_OK && r != BLK_STS_RESOURCE)
+       if (r != BLK_STS_OK && r != BLK_STS_RESOURCE && r != BLK_STS_DEV_RESOURCE)
                 /* must complete clone in terms of original request */
                 dm_complete_request(rq, r);
         return r;
@@ -496,7 +496,7 @@ check_again:
                 trace_block_rq_remap(clone->q, clone, disk_devt(dm_disk(md)),
                                      blk_rq_pos(rq));
                 ret = dm_dispatch_clone_request(clone, rq);
-               if (ret == BLK_STS_RESOURCE) {
+               if (ret == BLK_STS_RESOURCE || ret == BLK_STS_DEV_RESOURCE) {
                         blk_rq_unprep_clone(clone);
                         tio->ti->type->release_clone_rq(clone, &tio->info);
                         tio->clone = NULL;
@@ -771,7 +771,6 @@ static blk_status_t dm_mq_queue_rq(struct blk_mq_hw_ctx *hctx,
                 /* Undo dm_start_request() before requeuing */
                 rq_end_stats(md, rq);
                 rq_completed(md, rq_data_dir(rq), false);
-               blk_mq_delay_run_hw_queue(hctx, 100/*ms*/);
                 return BLK_STS_RESOURCE;
         }
  
diff --git a/drivers/nvme/host/fc.c b/drivers/nvme/host/fc.c

index 25356a55cae2591cb413696c750c63194c99c499..636765f6d394f9b5334338f0f5099848879cd317 100644 (file)
--- a/drivers/nvme/host/fc.c
+++ b/drivers/nvme/host/fc.c
@@ -35,8 +35,6 @@ enum nvme_fc_queue_flags {
         NVME_FC_Q_LIVE,
  };
  
-#define NVMEFC_QUEUE_DELAY     3               /* ms units */
-
  #define NVME_FC_DEFAULT_DEV_LOSS_TMO   60      /* seconds */
  
  struct nvme_fc_queue {
@@ -2231,7 +2229,7 @@ nvme_fc_start_fcp_op(struct nvme_fc_ctrl *ctrl, struct nvme_fc_queue *queue,
          * the target device is present
          */
         if (ctrl->rport->remoteport.port_state != FC_OBJSTATE_ONLINE)
-               goto busy;
+               return BLK_STS_RESOURCE;
  
         if (!nvme_fc_ctrl_get(ctrl))
                 return BLK_STS_IOERR;
@@ -2311,16 +2309,10 @@ nvme_fc_start_fcp_op(struct nvme_fc_ctrl *ctrl, struct nvme_fc_queue *queue,
                                 ret != -EBUSY)
                         return BLK_STS_IOERR;
  
-               goto busy;
+               return BLK_STS_RESOURCE;
         }
  
         return BLK_STS_OK;
-
-busy:
-       if (!(op->flags & FCOP_FLAGS_AEN) && queue->hctx)
-               blk_mq_delay_run_hw_queue(queue->hctx, NVMEFC_QUEUE_DELAY);
-
-       return BLK_STS_RESOURCE;
  }
  
  static inline blk_status_t nvme_fc_is_ready(struct nvme_fc_queue *queue,
diff --git a/drivers/scsi/scsi_lib.c b/drivers/scsi/scsi_lib.c

index 9e37ba09ddefc66e306d69d1ddbafc46f54f38bf..df8cbe8998829322e68c3c200a4810b86d31b502 100644 (file)
--- a/drivers/scsi/scsi_lib.c
+++ b/drivers/scsi/scsi_lib.c
@@ -2069,9 +2069,9 @@ out_put_budget:
         case BLK_STS_OK:
                 break;
         case BLK_STS_RESOURCE:
-               if (atomic_read(&sdev->device_busy) == 0 &&
-                   !scsi_device_blocked(sdev))
-                       blk_mq_delay_run_hw_queue(hctx, SCSI_QUEUE_DELAY);
+               if (atomic_read(&sdev->device_busy) ||
+                   scsi_device_blocked(sdev))
+                       ret = BLK_STS_DEV_RESOURCE;
                 break;
         default:
                 if (unlikely(!scsi_device_online(sdev)))
diff --git a/include/linux/blk_types.h b/include/linux/blk_types.h

index 3c1b51f67914b18f2e1777f771704b94320ec873..297978a0e48677819418b1703766dd1a1541ecb1 100644 (file)
--- a/include/linux/blk_types.h
+++ b/include/linux/blk_types.h
@@ -44,6 +44,24 @@ typedef u8 __bitwise blk_status_t;
  
  #define BLK_STS_AGAIN          ((__force blk_status_t)12)
  
+/*
+ * BLK_STS_DEV_RESOURCE is returned from the driver to the block layer if
+ * device related resources are unavailable, but the driver can guarantee
+ * that the queue will be rerun in the future once resources become
+ * available again. This is typically the case for device specific
+ * resources that are consumed for IO. If the driver fails allocating these
+ * resources, we know that inflight (or pending) IO will free these
+ * resources upon completion.
+ *
+ * This is different from BLK_STS_RESOURCE in that it explicitly references
+ * a device specific resource. For resources of wider scope, allocation
+ * failure can happen without having pending IO. This means that we can't
+ * rely on request completions freeing these resources, as IO may not be in
+ * flight. Examples of that are kernel memory allocations, DMA mappings, or
+ * any other system wide resources.
+ */
+#define BLK_STS_DEV_RESOURCE   ((__force blk_status_t)13)
+
  struct blk_issue_stat {
         u64 stat;
  };
author	Ming Lei <ming.lei@redhat.com>
	Wed, 27 Nov 2019 20:18:13 +0000 (17:18 -0300)
committer	Marcelo Henrique Cerri <marcelo.cerri@canonical.com>
	Fri, 17 Jan 2020 17:23:12 +0000 (14:23 -0300)
block/blk-core.c		patch \| blob \| blame \| history
block/blk-mq.c		patch \| blob \| blame \| history
drivers/block/null_blk.c		patch \| blob \| blame \| history
drivers/block/virtio_blk.c		patch \| blob \| blame \| history
drivers/block/xen-blkfront.c		patch \| blob \| blame \| history
drivers/md/dm-rq.c		patch \| blob \| blame \| history
drivers/nvme/host/fc.c		patch \| blob \| blame \| history
drivers/scsi/scsi_lib.c		patch \| blob \| blame \| history
include/linux/blk_types.h		patch \| blob \| blame \| history