workqueue: fix ordered workqueues in NUMA setups

author Tejun Heo <tj@kernel.org>

Thu, 5 Sep 2013 16:30:04 +0000 (12:30 -0400)

committer Tejun Heo <tj@kernel.org>

Fri, 22 Nov 2013 23:14:02 +0000 (18:14 -0500)
author Tejun Heo <tj@kernel.org>
Thu, 5 Sep 2013 16:30:04 +0000 (12:30 -0400)
committer Tejun Heo <tj@kernel.org>
Fri, 22 Nov 2013 23:14:02 +0000 (18:14 -0500)
diff --git a/kernel/workqueue.c b/kernel/workqueue.c

index f894242..bbb5e98 100644 (file)
--- a/kernel/workqueue.c
+++ b/kernel/workqueue.c
@@ -305,6 +305,9 @@ static DEFINE_HASHTABLE(unbound_pool_hash, UNBOUND_POOL_HASH_ORDER);
  /* I: attributes used when instantiating standard unbound pools on demand */
  static struct workqueue_attrs *unbound_std_wq_attrs[NR_STD_WORKER_POOLS];
  
+/* I: attributes used when instantiating ordered pools on demand */
+static struct workqueue_attrs *ordered_wq_attrs[NR_STD_WORKER_POOLS];
+
  struct workqueue_struct *system_wq __read_mostly;
  EXPORT_SYMBOL(system_wq);
  struct workqueue_struct *system_highpri_wq __read_mostly;
@@ -4107,7 +4110,7 @@ out_unlock:
  static int alloc_and_link_pwqs(struct workqueue_struct *wq)
  {
         bool highpri = wq->flags & WQ_HIGHPRI;
-       int cpu;
+       int cpu, ret;
  
         if (!(wq->flags & WQ_UNBOUND)) {
                 wq->cpu_pwqs = alloc_percpu(struct pool_workqueue);
@@ -4127,6 +4130,13 @@ static int alloc_and_link_pwqs(struct workqueue_struct *wq)
                         mutex_unlock(&wq->mutex);
                 }
                 return 0;
+       } else if (wq->flags & __WQ_ORDERED) {
+               ret = apply_workqueue_attrs(wq, ordered_wq_attrs[highpri]);
+               /* there should only be single pwq for ordering guarantee */
+               WARN(!ret && (wq->pwqs.next != &wq->dfl_pwq->pwqs_node ||
+                             wq->pwqs.prev != &wq->dfl_pwq->pwqs_node),
+                    "ordering guarantee broken for workqueue %s\n", wq->name);
+               return ret;
         } else {
                 return apply_workqueue_attrs(wq, unbound_std_wq_attrs[highpri]);
         }
@@ -5052,13 +5062,23 @@ static int __init init_workqueues(void)
                 }
         }
  
-       /* create default unbound wq attrs */
+       /* create default unbound and ordered wq attrs */
         for (i = 0; i < NR_STD_WORKER_POOLS; i++) {
                 struct workqueue_attrs *attrs;
  
                 BUG_ON(!(attrs = alloc_workqueue_attrs(GFP_KERNEL)));
                 attrs->nice = std_nice[i];
                 unbound_std_wq_attrs[i] = attrs;
+
+               /*
+                * An ordered wq should have only one pwq as ordering is
+                * guaranteed by max_active which is enforced by pwqs.
+                * Turn off NUMA so that dfl_pwq is used for all nodes.
+                */
+               BUG_ON(!(attrs = alloc_workqueue_attrs(GFP_KERNEL)));
+               attrs->nice = std_nice[i];
+               attrs->no_numa = true;
+               ordered_wq_attrs[i] = attrs;
         }
  
         system_wq = alloc_workqueue("events", 0, 0);
author	Tejun Heo <tj@kernel.org>
	Thu, 5 Sep 2013 16:30:04 +0000 (12:30 -0400)
committer	Tejun Heo <tj@kernel.org>
	Fri, 22 Nov 2013 23:14:02 +0000 (18:14 -0500)