On Wed, Oct 14, 2015 at 09:43:21AM +0200, Daniel Wagner wrote:
> From: Paul Gortmaker <paul.gortma...@windriver.com>
> 
> As of commit dae6e64d2bcfd4b06304ab864c7e3a4f6b5fedf4 ("rcu: Introduce
> proper blocking to no-CBs kthreads GP waits") the RCU subsystem started
> making use of wait queues.
> 
> Here we convert all additions of RCU wait queues to use simple wait queues,
> since they don't need the extra overhead of the full wait queue features.
> 
> Originally this was done for RT kernels[1], since we would get things like...
> 
>   BUG: sleeping function called from invalid context at kernel/rtmutex.c:659
>   in_atomic(): 1, irqs_disabled(): 1, pid: 8, name: rcu_preempt
>   Pid: 8, comm: rcu_preempt Not tainted
>   Call Trace:
>    [<ffffffff8106c8d0>] __might_sleep+0xd0/0xf0
>    [<ffffffff817d77b4>] rt_spin_lock+0x24/0x50
>    [<ffffffff8106fcf6>] __wake_up+0x36/0x70
>    [<ffffffff810c4542>] rcu_gp_kthread+0x4d2/0x680
>    [<ffffffff8105f910>] ? __init_waitqueue_head+0x50/0x50
>    [<ffffffff810c4070>] ? rcu_gp_fqs+0x80/0x80
>    [<ffffffff8105eabb>] kthread+0xdb/0xe0
>    [<ffffffff8106b912>] ? finish_task_switch+0x52/0x100
>    [<ffffffff817e0754>] kernel_thread_helper+0x4/0x10
>    [<ffffffff8105e9e0>] ? __init_kthread_worker+0x60/0x60
>    [<ffffffff817e0750>] ? gs_change+0xb/0xb
> 
> ...and hence simple wait queues were deployed on RT out of necessity
> (as simple wait uses a raw lock), but mainline might as well take
> advantage of the more streamline support as well.
> 
> [1] This is a carry forward of work from v3.10-rt; the original conversion
> was by Thomas on an earlier -rt version, and Sebastian extended it to
> additional post-3.10 added RCU waiters; here I've added a commit log and
> unified the RCU changes into one, and uprev'd it to match mainline RCU.
> 
> Signed-off-by: Paul Gortmaker <paul.gortma...@windriver.com>
> Signed-off-by: Daniel Wagner <daniel.wag...@bmw-carit.de>
> Cc: Thomas Gleixner <t...@linutronix.de>
> Cc: Sebastian Andrzej Siewior <bige...@linutronix.de>
> Cc: Paul E. McKenney <paul...@linux.vnet.ibm.com>
> Cc: Steven Rostedt <rost...@goodmis.org>
> Cc: linux-kernel@vger.kernel.org

One comment below on an unneeded fix.  I will try queueing these for
testing.

                                                        Thanx, Paul

> ---
>  kernel/rcu/tree.c        | 13 +++++++------
>  kernel/rcu/tree.h        |  7 ++++---
>  kernel/rcu/tree_plugin.h | 18 +++++++++---------
>  3 files changed, 20 insertions(+), 18 deletions(-)
> 
> diff --git a/kernel/rcu/tree.c b/kernel/rcu/tree.c
> index 775d36c..f1c80aa 100644
> --- a/kernel/rcu/tree.c
> +++ b/kernel/rcu/tree.c
> @@ -1589,7 +1589,7 @@ static void rcu_gp_kthread_wake(struct rcu_state *rsp)
>           !READ_ONCE(rsp->gp_flags) ||
>           !rsp->gp_kthread)
>               return;
> -     wake_up(&rsp->gp_wq);
> +     swake_up(&rsp->gp_wq);
>  }
> 
>  /*
> @@ -2057,7 +2057,7 @@ static int __noreturn rcu_gp_kthread(void *arg)
>                                              READ_ONCE(rsp->gpnum),
>                                              TPS("reqwait"));
>                       rsp->gp_state = RCU_GP_WAIT_GPS;
> -                     wait_event_interruptible(rsp->gp_wq,
> +                     swait_event_interruptible(rsp->gp_wq,
>                                                READ_ONCE(rsp->gp_flags) &
>                                                RCU_GP_FLAG_INIT);
>                       rsp->gp_state = RCU_GP_DONE_GPS;
> @@ -2087,7 +2087,7 @@ static int __noreturn rcu_gp_kthread(void *arg)
>                                              READ_ONCE(rsp->gpnum),
>                                              TPS("fqswait"));
>                       rsp->gp_state = RCU_GP_WAIT_FQS;
> -                     ret = wait_event_interruptible_timeout(rsp->gp_wq,
> +                     ret = swait_event_interruptible_timeout(rsp->gp_wq,
>                                       rcu_gp_fqs_check_wake(rsp, &gf), j);
>                       rsp->gp_state = RCU_GP_DOING_FQS;
>                       /* Locking provides needed memory barriers. */
> @@ -2210,7 +2210,7 @@ static void rcu_report_qs_rsp(struct rcu_state *rsp, 
> unsigned long flags)
>       WARN_ON_ONCE(!rcu_gp_in_progress(rsp));
>       WRITE_ONCE(rsp->gp_flags, READ_ONCE(rsp->gp_flags) | RCU_GP_FLAG_FQS);
>       raw_spin_unlock_irqrestore(&rcu_get_root(rsp)->lock, flags);
> -     rcu_gp_kthread_wake(rsp);
> +     swake_up(&rsp->gp_wq);  /* Memory barrier implied by swake_up() path. */
>  }
> 
>  /*
> @@ -2871,7 +2871,7 @@ static void force_quiescent_state(struct rcu_state *rsp)
>       }
>       WRITE_ONCE(rsp->gp_flags, READ_ONCE(rsp->gp_flags) | RCU_GP_FLAG_FQS);
>       raw_spin_unlock_irqrestore(&rnp_old->lock, flags);
> -     rcu_gp_kthread_wake(rsp);
> +     swake_up(&rsp->gp_wq); /* Memory barrier implied by swake_up() path. */
>  }
> 
>  /*
> @@ -4178,7 +4178,8 @@ static void __init rcu_init_one(struct rcu_state *rsp,
>               }
>       }
> 
> -     init_waitqueue_head(&rsp->gp_wq);
> +     rsp->rda = rda;

This is initialized at compile time in current mainline, so the above
statement is not needed.

But now that you mention it, the second parameter to rcu_init_one() is
a bit pointless these days.  I have queued a patch eliminating it,
which should not conflict with our patch.

> +     init_swait_queue_head(&rsp->gp_wq);
>       rnp = rsp->level[rcu_num_lvls - 1];
>       for_each_possible_cpu(i) {
>               while (i > rnp->grphi)
> diff --git a/kernel/rcu/tree.h b/kernel/rcu/tree.h
> index 2e991f8..6aa3776 100644
> --- a/kernel/rcu/tree.h
> +++ b/kernel/rcu/tree.h
> @@ -27,6 +27,7 @@
>  #include <linux/threads.h>
>  #include <linux/cpumask.h>
>  #include <linux/seqlock.h>
> +#include <linux/swait.h>
>  #include <linux/stop_machine.h>
> 
>  /*
> @@ -244,7 +245,7 @@ struct rcu_node {
>                               /* Refused to boost: not sure why, though. */
>                               /*  This can happen due to race conditions. */
>  #ifdef CONFIG_RCU_NOCB_CPU
> -     wait_queue_head_t nocb_gp_wq[2];
> +     struct swait_queue_head nocb_gp_wq[2];
>                               /* Place for rcu_nocb_kthread() to wait GP. */
>  #endif /* #ifdef CONFIG_RCU_NOCB_CPU */
>       int need_future_gp[2];
> @@ -388,7 +389,7 @@ struct rcu_data {
>       atomic_long_t nocb_q_count_lazy; /*  invocation (all stages). */
>       struct rcu_head *nocb_follower_head; /* CBs ready to invoke. */
>       struct rcu_head **nocb_follower_tail;
> -     wait_queue_head_t nocb_wq;      /* For nocb kthreads to sleep on. */
> +     struct swait_queue_head nocb_wq; /* For nocb kthreads to sleep on. */
>       struct task_struct *nocb_kthread;
>       int nocb_defer_wakeup;          /* Defer wakeup of nocb_kthread. */
> 
> @@ -475,7 +476,7 @@ struct rcu_state {
>       unsigned long gpnum;                    /* Current gp number. */
>       unsigned long completed;                /* # of last completed gp. */
>       struct task_struct *gp_kthread;         /* Task for grace periods. */
> -     wait_queue_head_t gp_wq;                /* Where GP task waits. */
> +     struct swait_queue_head gp_wq;          /* Where GP task waits. */
>       short gp_flags;                         /* Commands for GP task. */
>       short gp_state;                         /* GP kthread sleep state. */
> 
> diff --git a/kernel/rcu/tree_plugin.h b/kernel/rcu/tree_plugin.h
> index b2bf396..545acdf 100644
> --- a/kernel/rcu/tree_plugin.h
> +++ b/kernel/rcu/tree_plugin.h
> @@ -1779,7 +1779,7 @@ early_param("rcu_nocb_poll", parse_rcu_nocb_poll);
>   */
>  static void rcu_nocb_gp_cleanup(struct rcu_state *rsp, struct rcu_node *rnp)
>  {
> -     wake_up_all(&rnp->nocb_gp_wq[rnp->completed & 0x1]);
> +     swake_up_all(&rnp->nocb_gp_wq[rnp->completed & 0x1]);
>  }
> 
>  /*
> @@ -1797,8 +1797,8 @@ static void rcu_nocb_gp_set(struct rcu_node *rnp, int 
> nrq)
> 
>  static void rcu_init_one_nocb(struct rcu_node *rnp)
>  {
> -     init_waitqueue_head(&rnp->nocb_gp_wq[0]);
> -     init_waitqueue_head(&rnp->nocb_gp_wq[1]);
> +     init_swait_queue_head(&rnp->nocb_gp_wq[0]);
> +     init_swait_queue_head(&rnp->nocb_gp_wq[1]);
>  }
> 
>  #ifndef CONFIG_RCU_NOCB_CPU_ALL
> @@ -1823,7 +1823,7 @@ static void wake_nocb_leader(struct rcu_data *rdp, bool 
> force)
>       if (READ_ONCE(rdp_leader->nocb_leader_sleep) || force) {
>               /* Prior smp_mb__after_atomic() orders against prior enqueue. */
>               WRITE_ONCE(rdp_leader->nocb_leader_sleep, false);
> -             wake_up(&rdp_leader->nocb_wq);
> +             swake_up(&rdp_leader->nocb_wq);
>       }
>  }
> 
> @@ -2036,7 +2036,7 @@ static void rcu_nocb_wait_gp(struct rcu_data *rdp)
>        */
>       trace_rcu_future_gp(rnp, rdp, c, TPS("StartWait"));
>       for (;;) {
> -             wait_event_interruptible(
> +             swait_event_interruptible(
>                       rnp->nocb_gp_wq[c & 0x1],
>                       (d = ULONG_CMP_GE(READ_ONCE(rnp->completed), c)));
>               if (likely(d))
> @@ -2064,7 +2064,7 @@ wait_again:
>       /* Wait for callbacks to appear. */
>       if (!rcu_nocb_poll) {
>               trace_rcu_nocb_wake(my_rdp->rsp->name, my_rdp->cpu, "Sleep");
> -             wait_event_interruptible(my_rdp->nocb_wq,
> +             swait_event_interruptible(my_rdp->nocb_wq,
>                               !READ_ONCE(my_rdp->nocb_leader_sleep));
>               /* Memory barrier handled by smp_mb() calls below and repoll. */
>       } else if (firsttime) {
> @@ -2139,7 +2139,7 @@ wait_again:
>                        * List was empty, wake up the follower.
>                        * Memory barriers supplied by atomic_long_add().
>                        */
> -                     wake_up(&rdp->nocb_wq);
> +                     swake_up(&rdp->nocb_wq);
>               }
>       }
> 
> @@ -2160,7 +2160,7 @@ static void nocb_follower_wait(struct rcu_data *rdp)
>               if (!rcu_nocb_poll) {
>                       trace_rcu_nocb_wake(rdp->rsp->name, rdp->cpu,
>                                           "FollowerSleep");
> -                     wait_event_interruptible(rdp->nocb_wq,
> +                     swait_event_interruptible(rdp->nocb_wq,
>                                                
> READ_ONCE(rdp->nocb_follower_head));
>               } else if (firsttime) {
>                       /* Don't drown trace log with "Poll"! */
> @@ -2319,7 +2319,7 @@ void __init rcu_init_nohz(void)
>  static void __init rcu_boot_init_nocb_percpu_data(struct rcu_data *rdp)
>  {
>       rdp->nocb_tail = &rdp->nocb_head;
> -     init_waitqueue_head(&rdp->nocb_wq);
> +     init_swait_queue_head(&rdp->nocb_wq);
>       rdp->nocb_follower_tail = &rdp->nocb_follower_head;
>  }
> 
> -- 
> 2.4.3
> 

--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

Reply via email to