blk-mq: make sure hctx->next_cpu is set correctly

author Ming Lei <ming.lei@redhat.com>

Wed, 17 Jan 2018 16:41:51 +0000 (00:41 +0800)

committer Jens Axboe <axboe@kernel.dk>

Wed, 17 Jan 2018 16:46:26 +0000 (09:46 -0700)
author Ming Lei <ming.lei@redhat.com>
Wed, 17 Jan 2018 16:41:51 +0000 (00:41 +0800)
committer Jens Axboe <axboe@kernel.dk>
Wed, 17 Jan 2018 16:46:26 +0000 (09:46 -0700)
diff --git a/block/blk-mq.c b/block/blk-mq.c

index c8f62e6be6b6acf183e86ffe2594be0c9076c2d4..3bd41f1066ee13db678c9b7b53300f576301c1cc 100644 (file)
--- a/block/blk-mq.c
+++ b/block/blk-mq.c
@@ -1319,21 +1319,47 @@ static void __blk_mq_run_hw_queue(struct blk_mq_hw_ctx *hctx)
   */
  static int blk_mq_hctx_next_cpu(struct blk_mq_hw_ctx *hctx)
  {
+       bool tried = false;
+
         if (hctx->queue->nr_hw_queues == 1)
                 return WORK_CPU_UNBOUND;
  
         if (--hctx->next_cpu_batch <= 0) {
                 int next_cpu;
-
+select_cpu:
                 next_cpu = cpumask_next_and(hctx->next_cpu, hctx->cpumask,
                                 cpu_online_mask);
                 if (next_cpu >= nr_cpu_ids)
                         next_cpu = cpumask_first_and(hctx->cpumask,cpu_online_mask);
  
-               hctx->next_cpu = next_cpu;
+               /*
+                * No online CPU was found, so make sure hctx->next_cpu is
+                * still set correctly to avoid breaking the workqueue.
+                */
+               if (next_cpu >= nr_cpu_ids)
+                       hctx->next_cpu = cpumask_first(hctx->cpumask);
+               else
+                       hctx->next_cpu = next_cpu;
                 hctx->next_cpu_batch = BLK_MQ_CPU_WORK_BATCH;
         }
  
+       /*
+        * Do unbound schedule if we can't find an online CPU for this hctx;
+        * this should only happen in the path of handling CPU DEAD.
+        */
+       if (!cpu_online(hctx->next_cpu)) {
+               if (!tried) {
+                       tried = true;
+                       goto select_cpu;
+               }
+
+               /*
+                * Make sure to re-select the CPU next time, once CPUs
+                * in hctx->cpumask become online again.
+                */
+               hctx->next_cpu_batch = 1;
+               return WORK_CPU_UNBOUND;
+       }
         return hctx->next_cpu;
  }
author	Ming Lei <ming.lei@redhat.com>
	Wed, 17 Jan 2018 16:41:51 +0000 (00:41 +0800)
committer	Jens Axboe <axboe@kernel.dk>
	Wed, 17 Jan 2018 16:46:26 +0000 (09:46 -0700)