workqueue: Fix missing kfree(rescuer) in destroy_workqueue()
diff --git a/kernel/workqueue.c b/kernel/workqueue.c
index 43d18cb46308385865d14ce40906c4646d378063..fb7e133e89ced4986214ebc2934f29312089ab2f 100644
--- a/kernel/workqueue.c
+++ b/kernel/workqueue.c
@@ -48,6 +48,7 @@
 #include <linux/moduleparam.h>
 #include <linux/uaccess.h>
 #include <linux/sched/isolation.h>
+#include <linux/nmi.h>
 
 #include "workqueue_internal.h"
 
@@ -1603,6 +1604,40 @@ bool mod_delayed_work_on(int cpu, struct workqueue_struct *wq,
 }
 EXPORT_SYMBOL_GPL(mod_delayed_work_on);
 
+static void rcu_work_rcufn(struct rcu_head *rcu)
+{
+       struct rcu_work *rwork = container_of(rcu, struct rcu_work, rcu);
+
+       /* read the comment in __queue_work() */
+       local_irq_disable();
+       __queue_work(WORK_CPU_UNBOUND, rwork->wq, &rwork->work);
+       local_irq_enable();
+}
+
+/**
+ * queue_rcu_work - queue work after a RCU grace period
+ * @wq: workqueue to use
+ * @rwork: work to queue
+ *
+ * Return: %false if @rwork was already pending, %true otherwise.  Note
+ * that a full RCU grace period is guaranteed only after a %true return.
+ * While @rwork is guaranteed to be executed after a %false return, the
+ * execution may happen before a full RCU grace period has passed.
+ */
+bool queue_rcu_work(struct workqueue_struct *wq, struct rcu_work *rwork)
+{
+       struct work_struct *work = &rwork->work;
+
+       if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
+               rwork->wq = wq;
+               call_rcu(&rwork->rcu, rcu_work_rcufn);
+               return true;
+       }
+
+       return false;
+}
+EXPORT_SYMBOL(queue_rcu_work);
+
 /**
  * worker_enter_idle - enter idle state
  * @worker: worker which is entering idle state
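
For orientation, a minimal usage sketch of the new interface. It assumes the
struct rcu_work / INIT_RCU_WORK() / to_rcu_work() definitions that the same
series adds to include/linux/workqueue.h; all other names are illustrative
only, not part of this diff:

    /* illustrative only */
    struct my_obj {
            struct rcu_work rwork;
            /* ... payload ... */
    };

    static void my_obj_free_fn(struct work_struct *work)
    {
            struct my_obj *obj = container_of(to_rcu_work(work),
                                              struct my_obj, rwork);

            kfree(obj);     /* all pre-existing RCU readers have finished */
    }

    /* after unlinking obj from all RCU-visible structures */
    INIT_RCU_WORK(&obj->rwork, my_obj_free_fn);
    queue_rcu_work(system_wq, &obj->rwork);     /* runs after a grace period */
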
@@ -2364,8 +2399,14 @@ repeat:
                         */
                        if (need_to_create_worker(pool)) {
                                spin_lock(&wq_mayday_lock);
-                               get_pwq(pwq);
-                               list_move_tail(&pwq->mayday_node, &wq->maydays);
+                               /*
+                                * Queue iff we aren't racing destruction
+                                * and somebody else hasn't queued it already.
+                                */
+                               if (wq->rescuer && list_empty(&pwq->mayday_node)) {
+                                       get_pwq(pwq);
+                                       list_add_tail(&pwq->mayday_node, &wq->maydays);
+                               }
                                spin_unlock(&wq_mayday_lock);
                        }
                }
@@ -2604,6 +2645,9 @@ void flush_workqueue(struct workqueue_struct *wq)
        if (WARN_ON(!wq_online))
                return;
 
+       lock_map_acquire(&wq->lockdep_map);
+       lock_map_release(&wq->lockdep_map);
+
        mutex_lock(&wq->mutex);
 
        /*
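
The acquire/release pair added above gives lockdep a dependency on the
workqueue being flushed, so a flush that can deadlock gets reported even when
it happens not to deadlock at runtime. A sketch of the kind of cycle it is
meant to catch, with illustrative names that are not part of this diff:

    /* illustrative only: lockdep can now flag this self-flush */
    static void my_work_fn(struct work_struct *work)
    {
            /*
             * This item runs on my_wq; waiting here for my_wq to drain can
             * never finish, because the flush also waits for this item.
             */
            flush_workqueue(my_wq);
    }
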
@@ -2795,7 +2839,8 @@ reflush:
 }
 EXPORT_SYMBOL_GPL(drain_workqueue);
 
-static bool start_flush_work(struct work_struct *work, struct wq_barrier *barr)
+static bool start_flush_work(struct work_struct *work, struct wq_barrier *barr,
+                            bool from_cancel)
 {
        struct worker *worker = NULL;
        struct worker_pool *pool;
@@ -2837,7 +2882,8 @@ static bool start_flush_work(struct work_struct *work, struct wq_barrier *barr)
         * workqueues the deadlock happens when the rescuer stalls, blocking
         * forward progress.
         */
-       if (pwq->wq->saved_max_active == 1 || pwq->wq->rescuer) {
+       if (!from_cancel &&
+           (pwq->wq->saved_max_active == 1 || pwq->wq->rescuer)) {
                lock_map_acquire(&pwq->wq->lockdep_map);
                lock_map_release(&pwq->wq->lockdep_map);
        }
@@ -2848,6 +2894,30 @@ already_gone:
        return false;
 }
 
+static bool __flush_work(struct work_struct *work, bool from_cancel)
+{
+       struct wq_barrier barr;
+
+       if (WARN_ON(!wq_online))
+               return false;
+
+       if (WARN_ON(!work->func))
+               return false;
+
+       if (!from_cancel) {
+               lock_map_acquire(&work->lockdep_map);
+               lock_map_release(&work->lockdep_map);
+       }
+
+       if (start_flush_work(work, &barr, from_cancel)) {
+               wait_for_completion(&barr.done);
+               destroy_work_on_stack(&barr.work);
+               return true;
+       } else {
+               return false;
+       }
+}
+
 /**
  * flush_work - wait for a work to finish executing the last queueing instance
  * @work: the work to flush
@@ -2861,18 +2931,7 @@ already_gone:
  */
 bool flush_work(struct work_struct *work)
 {
-       struct wq_barrier barr;
-
-       if (WARN_ON(!wq_online))
-               return false;
-
-       if (start_flush_work(work, &barr)) {
-               wait_for_completion(&barr.done);
-               destroy_work_on_stack(&barr.work);
-               return true;
-       } else {
-               return false;
-       }
+       return __flush_work(work, false);
 }
 EXPORT_SYMBOL_GPL(flush_work);
 
@@ -2938,7 +2997,7 @@ static bool __cancel_work_timer(struct work_struct *work, bool is_dwork)
         * isn't executing.
         */
        if (wq_online)
-               flush_work(work);
+               __flush_work(work, true);
 
        clear_work_data(work);
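
Passing from_cancel=true here skips the workqueue-level lockdep annotation in
start_flush_work(): cancel_work_sync() only waits for this one work item (and
PENDING is held, so it cannot requeue itself), so it never depends on the rest
of the workqueue the way a plain flush_work() can. A sketch of a safe pattern
that previously produced a false-positive lockdep report, with illustrative
names not taken from this diff:

    /* illustrative only */
    static void work_a_fn(struct work_struct *work)
    {
            /*
             * work_a and work_b share an ordered workqueue.  Cancelling
             * work_b from here is safe: it is either still pending (and is
             * simply dequeued) or not queued at all, and we never wait on
             * the whole workqueue, which would include ourselves.
             */
            cancel_work_sync(&work_b);
    }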
 
@@ -3000,6 +3059,26 @@ bool flush_delayed_work(struct delayed_work *dwork)
 }
 EXPORT_SYMBOL(flush_delayed_work);
 
+/**
+ * flush_rcu_work - wait for an rwork to finish executing the last queueing
+ * @rwork: the rcu work to flush
+ *
+ * Return:
+ * %true if flush_rcu_work() waited for the work to finish execution,
+ * %false if it was already idle.
+ */
+bool flush_rcu_work(struct rcu_work *rwork)
+{
+       if (test_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(&rwork->work))) {
+               rcu_barrier();
+               flush_work(&rwork->work);
+               return true;
+       } else {
+               return flush_work(&rwork->work);
+       }
+}
+EXPORT_SYMBOL(flush_rcu_work);
+
 static bool __cancel_work(struct work_struct *work, bool is_dwork)
 {
        unsigned long flags;
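
A short sketch of how the queue_rcu_work()/flush_rcu_work() pair is intended
to be used together (illustrative names, not part of this diff):

    /* illustrative only */
    static struct rcu_work reclaim_rwork;     /* INIT_RCU_WORK()'d at init */

    /* after retiring old entries: reclaim once readers have drained */
    queue_rcu_work(system_wq, &reclaim_rwork);

    /* on teardown: waits for both the grace period and the work itself */
    flush_rcu_work(&reclaim_rwork);
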
@@ -4067,9 +4146,29 @@ void destroy_workqueue(struct workqueue_struct *wq)
        struct pool_workqueue *pwq;
        int node;
 
+       /*
+        * Remove it from sysfs first so that sanity check failure doesn't
+        * lead to sysfs name conflicts.
+        */
+       workqueue_sysfs_unregister(wq);
+
        /* drain it before proceeding with destruction */
        drain_workqueue(wq);
 
+       /* kill rescuer, if sanity checks fail, leave it w/o rescuer */
+       if (wq->rescuer) {
+               struct worker *rescuer = wq->rescuer;
+
+               /* this prevents new queueing */
+               spin_lock_irq(&wq_mayday_lock);
+               wq->rescuer = NULL;
+               spin_unlock_irq(&wq_mayday_lock);
+
+               /* rescuer will empty maydays list before exiting */
+               kthread_stop(rescuer->task);
+               kfree(rescuer);
+       }
+
        /* sanity checks */
        mutex_lock(&wq->mutex);
        for_each_pwq(pwq, wq) {
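
The ordering above is what makes the kfree(rescuer) added by this commit safe:
unpublish wq->rescuer under wq_mayday_lock (pairing with the wq->rescuer check
added to the rescuer's mayday re-queue path earlier in this diff), let
kthread_stop() wait for the rescuer to drain the mayday list and exit, and
only then free its state. In generic terms (illustrative names only):

    /* illustrative only: the general shape of this teardown */
    spin_lock_irq(&publish_lock);
    shared->helper = NULL;          /* queueing paths can no longer find it */
    spin_unlock_irq(&publish_lock);

    kthread_stop(helper->task);     /* returns only after the thread exits */
    kfree(helper);                  /* nothing can reference it any more */
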
@@ -4101,11 +4200,6 @@ void destroy_workqueue(struct workqueue_struct *wq)
        list_del_rcu(&wq->list);
        mutex_unlock(&wq_pool_mutex);
 
-       workqueue_sysfs_unregister(wq);
-
-       if (wq->rescuer)
-               kthread_stop(wq->rescuer->task);
-
        if (!(wq->flags & WQ_UNBOUND)) {
                /*
                 * The base ref is never dropped on per-cpu pwqs.  Directly
@@ -4167,6 +4261,22 @@ void workqueue_set_max_active(struct workqueue_struct *wq, int max_active)
 }
 EXPORT_SYMBOL_GPL(workqueue_set_max_active);
 
+/**
+ * current_work - retrieve %current task's work struct
+ *
+ * Determine if %current task is a workqueue worker and what it's working on.
+ * Useful to find out the context that the %current task is running in.
+ *
+ * Return: work struct if %current task is a workqueue worker, %NULL otherwise.
+ */
+struct work_struct *current_work(void)
+{
+       struct worker *worker = current_wq_worker();
+
+       return worker ? worker->current_work : NULL;
+}
+EXPORT_SYMBOL(current_work);
+
 /**
  * current_is_workqueue_rescuer - is %current workqueue rescuer?
  *
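
A typical use of the new helper (illustrative names, not part of this diff):
deciding whether a synchronous cancel or flush is safe, which it is not if the
current context happens to be that very work item.

    /* illustrative only */
    static void my_teardown(void)
    {
            /* cancelling ourselves synchronously would wait forever */
            if (current_work() != &my_work)
                    cancel_work_sync(&my_work);
    }
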
@@ -4366,7 +4476,8 @@ static void show_pwq(struct pool_workqueue *pwq)
        pr_info("  pwq %d:", pool->id);
        pr_cont_pool_info(pool);
 
-       pr_cont(" active=%d/%d%s\n", pwq->nr_active, pwq->max_active,
+       pr_cont(" active=%d/%d refcnt=%d%s\n",
+               pwq->nr_active, pwq->max_active, pwq->refcnt,
                !list_empty(&pwq->mayday_node) ? " MAYDAY" : "");
 
        hash_for_each(pool->busy_hash, bkt, worker, hentry) {
@@ -4463,6 +4574,12 @@ void show_workqueue_state(void)
                        if (pwq->nr_active || !list_empty(&pwq->delayed_works))
                                show_pwq(pwq);
                        spin_unlock_irqrestore(&pwq->pool->lock, flags);
+                       /*
+                        * We could be printing a lot from atomic context, e.g.
+                        * sysrq-t -> show_workqueue_state(). Avoid triggering
+                        * hard lockup.
+                        */
+                       touch_nmi_watchdog();
                }
        }
 
@@ -4490,6 +4607,12 @@ void show_workqueue_state(void)
                pr_cont("\n");
        next_pool:
                spin_unlock_irqrestore(&pool->lock, flags);
+               /*
+                * We could be printing a lot from atomic context, e.g.
+                * sysrq-t -> show_workqueue_state(). Avoid triggering
+                * hard lockup.
+                */
+               touch_nmi_watchdog();
        }
 
        rcu_read_unlock_sched();
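
Both touch_nmi_watchdog() calls above follow the same rule, which applies to
any long diagnostic loop that runs with interrupts off: pet the hard-lockup
detector between iterations. A minimal sketch with illustrative names:

    /* illustrative only */
    spin_lock_irqsave(&dump_lock, flags);
    list_for_each_entry(item, &long_list, node) {
            dump_one(item);             /* may printk() a great deal */
            touch_nmi_watchdog();       /* keep the NMI watchdog quiet */
    }
    spin_unlock_irqrestore(&dump_lock, flags);
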
@@ -5297,7 +5420,7 @@ int workqueue_sysfs_register(struct workqueue_struct *wq)
 
        ret = device_register(&wq_dev->dev);
        if (ret) {
-               kfree(wq_dev);
+               put_device(&wq_dev->dev);
                wq->wq_dev = NULL;
                return ret;
        }
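
This follows the standard driver-core rule: once device_register() has run,
the embedded kobject owns the object's lifetime, so the error path must drop
the reference with put_device(), which ends up invoking the ->release()
callback, rather than kfree()ing behind the refcount's back. A sketch of the
rule with hypothetical names:

    /* illustrative only -- hypothetical driver code, not from this diff */
    foo = kzalloc(sizeof(*foo), GFP_KERNEL);
    if (!foo)
            return -ENOMEM;

    foo->dev.release = foo_release;      /* kfree()s foo */
    dev_set_name(&foo->dev, "foo0");

    ret = device_register(&foo->dev);
    if (ret) {
            put_device(&foo->dev);       /* NOT kfree(foo) */
            return ret;
    }
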
@@ -5428,7 +5551,7 @@ static void wq_watchdog_timer_fn(struct timer_list *unused)
        mod_timer(&wq_watchdog_timer, jiffies + thresh);
 }
 
-void wq_watchdog_touch(int cpu)
+notrace void wq_watchdog_touch(int cpu)
 {
        if (cpu >= 0)
                per_cpu(wq_watchdog_touched_cpu, cpu) = jiffies;