blk-mq: move hctx lock/unlock into a helper
diff --git a/block/blk-mq.c b/block/blk-mq.c
index 7384bb7335331a6eeb514c54624a24f07ac87e81..da42485cb39d954c475a078db62967e9a47772e7 100644
@@ -580,6 +580,22 @@ static void __blk_mq_complete_request(struct request *rq)
        put_cpu();
 }
 
+static void hctx_unlock(struct blk_mq_hw_ctx *hctx, int srcu_idx)
+{
+       if (!(hctx->flags & BLK_MQ_F_BLOCKING))
+               rcu_read_unlock();
+       else
+               srcu_read_unlock(hctx->queue_rq_srcu, srcu_idx);
+}
+
+static void hctx_lock(struct blk_mq_hw_ctx *hctx, int *srcu_idx)
+{
+       if (!(hctx->flags & BLK_MQ_F_BLOCKING))
+               rcu_read_lock();
+       else
+               *srcu_idx = srcu_read_lock(hctx->queue_rq_srcu);
+}
+
 /**
  * blk_mq_complete_request - end I/O on a request
  * @rq:                the request being processed
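
The two helpers above hide the RCU-vs-SRCU choice behind one call pair: non-blocking hctxs use plain rcu_read_lock()/rcu_read_unlock(), while BLK_MQ_F_BLOCKING hctxs take a sleepable SRCU read lock on hctx->queue_rq_srcu. A minimal sketch of how a dispatch-side caller is expected to pair them (example_dispatch() is illustrative, not part of this patch):

static void example_dispatch(struct blk_mq_hw_ctx *hctx)
{
	int srcu_idx;

	/* sleeping is only legal for BLK_MQ_F_BLOCKING hctxs */
	might_sleep_if(hctx->flags & BLK_MQ_F_BLOCKING);

	hctx_lock(hctx, &srcu_idx);
	/* ... work that must not race with queue quiesce ... */
	hctx_unlock(hctx, srcu_idx);
}

The srcu_idx value written by hctx_lock() must be handed back unchanged to hctx_unlock(); for non-blocking hctxs it is simply left unused.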
@@ -1266,17 +1282,11 @@ static void __blk_mq_run_hw_queue(struct blk_mq_hw_ctx *hctx)
         */
        WARN_ON_ONCE(in_interrupt());
 
-       if (!(hctx->flags & BLK_MQ_F_BLOCKING)) {
-               rcu_read_lock();
-               blk_mq_sched_dispatch_requests(hctx);
-               rcu_read_unlock();
-       } else {
-               might_sleep();
+       might_sleep_if(hctx->flags & BLK_MQ_F_BLOCKING);
 
-               srcu_idx = srcu_read_lock(hctx->queue_rq_srcu);
-               blk_mq_sched_dispatch_requests(hctx);
-               srcu_read_unlock(hctx->queue_rq_srcu, srcu_idx);
-       }
+       hctx_lock(hctx, &srcu_idx);
+       blk_mq_sched_dispatch_requests(hctx);
+       hctx_unlock(hctx, srcu_idx);
 }
 
 static inline int blk_mq_first_mapped_cpu(struct blk_mq_hw_ctx *hctx)
@@ -1363,7 +1373,23 @@ EXPORT_SYMBOL(blk_mq_delay_run_hw_queue);
 
 bool blk_mq_run_hw_queue(struct blk_mq_hw_ctx *hctx, bool async)
 {
-       if (blk_mq_hctx_has_pending(hctx)) {
+       int srcu_idx;
+       bool need_run;
+
+       /*
+        * When the queue is quiesced we may be switching the io scheduler,
+        * updating nr_hw_queues, or similar; the queue can't be run any
+        * more, and even blk_mq_hctx_has_pending() can't be called safely.
+        *
+        * The queue will be rerun by blk_mq_unquiesce_queue() if it is
+        * quiesced.
+        */
+       hctx_lock(hctx, &srcu_idx);
+       need_run = !blk_queue_quiesced(hctx->queue) &&
+               blk_mq_hctx_has_pending(hctx);
+       hctx_unlock(hctx, srcu_idx);
+
+       if (need_run) {
                __blk_mq_delay_run_hw_queue(hctx, async, 0);
                return true;
        }
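
The quiesce check above only works because it sits inside hctx_lock()/hctx_unlock(): the quiesce side first marks the queue quiesced and then waits for an RCU/SRCU grace period per hctx, so any reader that saw the queue as unquiesced has already left its critical section by the time the wait returns. A simplified sketch of that counterpart, assuming it mirrors this kernel's blk_mq_quiesce_queue() (example_quiesce() is illustrative, not part of this patch):

static void example_quiesce(struct request_queue *q)
{
	struct blk_mq_hw_ctx *hctx;
	unsigned int i;
	bool rcu = false;

	blk_mq_quiesce_queue_nowait(q);	/* set QUEUE_FLAG_QUIESCED */

	/* wait out every reader still inside hctx_lock()/hctx_unlock() */
	queue_for_each_hw_ctx(q, hctx, i) {
		if (hctx->flags & BLK_MQ_F_BLOCKING)
			synchronize_srcu(hctx->queue_rq_srcu);
		else
			rcu = true;
	}
	if (rcu)
		synchronize_rcu();
}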
@@ -1673,7 +1699,7 @@ static blk_qc_t request_to_qc_t(struct blk_mq_hw_ctx *hctx, struct request *rq)
 
 static void __blk_mq_try_issue_directly(struct blk_mq_hw_ctx *hctx,
                                        struct request *rq,
-                                       blk_qc_t *cookie, bool may_sleep)
+                                       blk_qc_t *cookie)
 {
        struct request_queue *q = rq->q;
        struct blk_mq_queue_data bd = {
@@ -1723,25 +1749,20 @@ static void __blk_mq_try_issue_directly(struct blk_mq_hw_ctx *hctx,
        }
 
 insert:
-       blk_mq_sched_insert_request(rq, false, run_queue, false, may_sleep);
+       blk_mq_sched_insert_request(rq, false, run_queue, false,
+                                       hctx->flags & BLK_MQ_F_BLOCKING);
 }
 
 static void blk_mq_try_issue_directly(struct blk_mq_hw_ctx *hctx,
                struct request *rq, blk_qc_t *cookie)
 {
-       if (!(hctx->flags & BLK_MQ_F_BLOCKING)) {
-               rcu_read_lock();
-               __blk_mq_try_issue_directly(hctx, rq, cookie, false);
-               rcu_read_unlock();
-       } else {
-               unsigned int srcu_idx;
+       int srcu_idx;
 
-               might_sleep();
+       might_sleep_if(hctx->flags & BLK_MQ_F_BLOCKING);
 
-               srcu_idx = srcu_read_lock(hctx->queue_rq_srcu);
-               __blk_mq_try_issue_directly(hctx, rq, cookie, true);
-               srcu_read_unlock(hctx->queue_rq_srcu, srcu_idx);
-       }
+       hctx_lock(hctx, &srcu_idx);
+       __blk_mq_try_issue_directly(hctx, rq, cookie);
+       hctx_unlock(hctx, srcu_idx);
 }
 
 static blk_qc_t blk_mq_make_request(struct request_queue *q, struct bio *bio)
@@ -2081,12 +2102,7 @@ static void blk_mq_exit_hctx(struct request_queue *q,
        if (set->ops->exit_hctx)
                set->ops->exit_hctx(hctx, hctx_idx);
 
-       if (hctx->flags & BLK_MQ_F_BLOCKING)
-               cleanup_srcu_struct(hctx->queue_rq_srcu);
-
        blk_mq_remove_cpuhp(hctx);
-       blk_free_flush_queue(hctx->fq);
-       sbitmap_free(&hctx->ctx_map);
 }
 
 static void blk_mq_exit_hw_queues(struct request_queue *q,
@@ -2127,12 +2143,12 @@ static int blk_mq_init_hctx(struct request_queue *q,
         * runtime
         */
        hctx->ctxs = kmalloc_array_node(nr_cpu_ids, sizeof(void *),
-                                       GFP_KERNEL, node);
+                       GFP_NOIO | __GFP_NOWARN | __GFP_NORETRY, node);
        if (!hctx->ctxs)
                goto unregister_cpu_notifier;
 
-       if (sbitmap_init_node(&hctx->ctx_map, nr_cpu_ids, ilog2(8), GFP_KERNEL,
-                             node))
+       if (sbitmap_init_node(&hctx->ctx_map, nr_cpu_ids, ilog2(8),
+                               GFP_NOIO | __GFP_NOWARN | __GFP_NORETRY, node))
                goto free_ctxs;
 
        hctx->nr_ctx = 0;
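
The allocation hunks in this area switch from GFP_KERNEL to GFP_NOIO | __GFP_NOWARN | __GFP_NORETRY: GFP_NOIO keeps memory reclaim from issuing new block I/O while we allocate inside the block layer, __GFP_NORETRY makes the allocator fail fast instead of retrying hard, and __GFP_NOWARN suppresses the failure splat because every caller already unwinds on NULL. A minimal sketch of the pattern (example_alloc_hctx() is illustrative, not from this patch):

static struct blk_mq_hw_ctx *example_alloc_hctx(int node)
{
	struct blk_mq_hw_ctx *hctx;

	/* fail fast, stay silent, never recurse into block I/O */
	hctx = kzalloc_node(sizeof(*hctx),
			    GFP_NOIO | __GFP_NOWARN | __GFP_NORETRY, node);
	if (!hctx)
		return NULL;	/* caller unwinds; no warning is emitted */

	return hctx;
}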
@@ -2147,7 +2163,8 @@ static int blk_mq_init_hctx(struct request_queue *q,
        if (blk_mq_sched_init_hctx(q, hctx, hctx_idx))
                goto exit_hctx;
 
-       hctx->fq = blk_alloc_flush_queue(q, hctx->numa_node, set->cmd_size);
+       hctx->fq = blk_alloc_flush_queue(q, hctx->numa_node, set->cmd_size,
+                       GFP_NOIO | __GFP_NOWARN | __GFP_NORETRY);
        if (!hctx->fq)
                goto sched_exit_hctx;
 
@@ -2164,7 +2181,7 @@ static int blk_mq_init_hctx(struct request_queue *q,
        return 0;
 
  free_fq:
-       kfree(hctx->fq);
+       blk_free_flush_queue(hctx->fq);
  sched_exit_hctx:
        blk_mq_sched_exit_hctx(q, hctx, hctx_idx);
  exit_hctx:
@@ -2468,12 +2485,14 @@ static void blk_mq_realloc_hw_ctxs(struct blk_mq_tag_set *set,
 
                node = blk_mq_hw_queue_to_node(q->mq_map, i);
                hctxs[i] = kzalloc_node(blk_mq_hw_ctx_size(set),
-                                       GFP_KERNEL, node);
+                               GFP_NOIO | __GFP_NOWARN | __GFP_NORETRY,
+                               node);
                if (!hctxs[i])
                        break;
 
-               if (!zalloc_cpumask_var_node(&hctxs[i]->cpumask, GFP_KERNEL,
-                                               node)) {
+               if (!zalloc_cpumask_var_node(&hctxs[i]->cpumask,
+                                       GFP_NOIO | __GFP_NOWARN | __GFP_NORETRY,
+                                       node)) {
                        kfree(hctxs[i]);
                        hctxs[i] = NULL;
                        break;
@@ -2595,7 +2614,8 @@ err_exit:
 }
 EXPORT_SYMBOL(blk_mq_init_allocated_queue);
 
-void blk_mq_free_queue(struct request_queue *q)
+/* tags can _not_ be used after returning from blk_mq_exit_queue */
+void blk_mq_exit_queue(struct request_queue *q)
 {
        struct blk_mq_tag_set   *set = q->tag_set;
 
@@ -2808,6 +2828,7 @@ int blk_mq_update_nr_requests(struct request_queue *q, unsigned int nr)
                return 0;
 
        blk_mq_freeze_queue(q);
+       blk_mq_quiesce_queue(q);
 
        ret = 0;
        queue_for_each_hw_ctx(q, hctx, i) {
@@ -2831,6 +2852,7 @@ int blk_mq_update_nr_requests(struct request_queue *q, unsigned int nr)
        if (!ret)
                q->nr_requests = nr;
 
+       blk_mq_unquiesce_queue(q);
        blk_mq_unfreeze_queue(q);
 
        return ret;
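
The final two hunks bracket the nr_requests update with a quiesce in addition to the existing freeze: freezing drains in-flight requests and blocks new ones, while quiescing also stops the hw queues from being run, so resizing the tag depth cannot race with dispatch. A minimal sketch of the resulting bracketing (update_tag_depths() is a hypothetical stand-in for the per-hctx resize loop):

static int example_update_nr_requests(struct request_queue *q, unsigned int nr)
{
	int ret;

	blk_mq_freeze_queue(q);		/* drain and block incoming requests */
	blk_mq_quiesce_queue(q);	/* stop the hw queues from being run */

	ret = update_tag_depths(q, nr);	/* hypothetical per-hctx resize */

	blk_mq_unquiesce_queue(q);
	blk_mq_unfreeze_queue(q);

	return ret;
}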