// SPDX-License-Identifier: GPL-2.0+
/*
- ------ * Read-Copy Update mechanism for mutual exclusion
+ ++++++ * Read-Copy Update mechanism for mutual exclusion (tree-based version)
*
* Copyright IBM Corporation, 2008
*
*
* and inputs from Rusty Russell, Andrea Arcangeli and Andi Kleen.
static void invoke_rcu_core(void);
static void rcu_report_exp_rdp(struct rcu_data *rdp);
static void sync_sched_exp_online_cleanup(int cpu);
++++ +++static void check_cb_ovld_locked(struct rcu_data *rdp, struct rcu_node *rnp);
/* rcuc/rcub kthread realtime priority */
static int kthread_prio = IS_ENABLED(CONFIG_RCU_BOOST) ? 1 : 0;
{
int old;
int new;
+ ++++++ int new_old;
struct rcu_data *rdp = &per_cpu(rcu_data, cpu);
+ ++++++ new_old = atomic_read(&rdp->dynticks);
do {
- ------ old = atomic_read(&rdp->dynticks);
+ ++++++ old = new_old;
if (old & RCU_DYNTICK_CTRL_CTR)
return false;
new = old | RCU_DYNTICK_CTRL_MASK;
- ------ } while (atomic_cmpxchg(&rdp->dynticks, old, new) != old);
+ ++++++ new_old = atomic_cmpxchg(&rdp->dynticks, old, new);
+ ++++++ } while (new_old != old);
return true;
}
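/*
 * A side note on the reworked loop above, as a minimal sketch of the idiom
 * (compute() stands in for whatever new value is being derived):
 * atomic_cmpxchg() returns the value that was actually present, so a failed
 * exchange already supplies the fresh value for the next pass and no extra
 * atomic_read() is needed inside the loop.
 *
 *	new_old = atomic_read(&v);
 *	do {
 *		old = new_old;
 *		new = compute(old);
 *		new_old = atomic_cmpxchg(&v, old, new);
 *	} while (new_old != old);
 */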
static long qhimark = DEFAULT_RCU_QHIMARK;
#define DEFAULT_RCU_QLOMARK 100 /* Once only this many pending, use blimit. */
static long qlowmark = DEFAULT_RCU_QLOMARK;
++++ +++#define DEFAULT_RCU_QOVLD_MULT 2
++++ +++#define DEFAULT_RCU_QOVLD (DEFAULT_RCU_QOVLD_MULT * DEFAULT_RCU_QHIMARK)
++++ +++static long qovld = DEFAULT_RCU_QOVLD; /* If this many pending, hammer QS. */
++++ +++static long qovld_calc = -1; /* No pre-initialization lock acquisitions! */
module_param(blimit, long, 0444);
module_param(qhimark, long, 0444);
module_param(qlowmark, long, 0444);
++++ +++module_param(qovld, long, 0444);
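/*
 * A usage sketch for the new qovld knob (assuming the "rcutree." prefix that
 * this file's module parameters are documented under): booting with
 *
 *	rcutree.qovld=-1
 *
 * keeps the wildcard value, so rcu_init() later computes
 *
 *	qovld_calc = DEFAULT_RCU_QOVLD_MULT * qhimark;	// twice qhimark
 *
 * while rcutree.qovld=0 leaves qovld_calc at zero, which makes
 * check_cb_ovld_locked() return early and disables overload checking.
 */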
static ulong jiffies_till_first_fqs = ULONG_MAX;
static ulong jiffies_till_next_fqs = ULONG_MAX;
incby = 1;
} else if (tick_nohz_full_cpu(rdp->cpu) &&
rdp->dynticks_nmi_nesting == DYNTICK_IRQ_NONIDLE &&
- ------ READ_ONCE(rdp->rcu_urgent_qs) && !rdp->rcu_forced_tick) {
+ ++++++ READ_ONCE(rdp->rcu_urgent_qs) &&
+ ++++++ !READ_ONCE(rdp->rcu_forced_tick)) {
raw_spin_lock_rcu_node(rdp->mynode);
// Recheck under lock.
if (rdp->rcu_urgent_qs && !rdp->rcu_forced_tick) {
- ------ rdp->rcu_forced_tick = true;
+ ++++++ WRITE_ONCE(rdp->rcu_forced_tick, true);
tick_dep_set_cpu(rdp->cpu, TICK_DEP_BIT_RCU);
}
raw_spin_unlock_rcu_node(rdp->mynode);
WRITE_ONCE(rdp->rcu_need_heavy_qs, false);
if (tick_nohz_full_cpu(rdp->cpu) && rdp->rcu_forced_tick) {
tick_dep_clear_cpu(rdp->cpu, TICK_DEP_BIT_RCU);
- ------ rdp->rcu_forced_tick = false;
+ ++++++ WRITE_ONCE(rdp->rcu_forced_tick, false);
}
}
rnhqp = &per_cpu(rcu_data.rcu_need_heavy_qs, rdp->cpu);
if (!READ_ONCE(*rnhqp) &&
(time_after(jiffies, rcu_state.gp_start + jtsq * 2) ||
---- --- time_after(jiffies, rcu_state.jiffies_resched))) {
++++ +++ time_after(jiffies, rcu_state.jiffies_resched) ||
++++ +++ rcu_state.cbovld)) {
WRITE_ONCE(*rnhqp, true);
/* Store rcu_need_heavy_qs before rcu_urgent_qs. */
smp_store_release(ruqp, true);
* So hit them over the head with the resched_cpu() hammer!
*/
if (tick_nohz_full_cpu(rdp->cpu) &&
---- --- time_after(jiffies,
---- --- READ_ONCE(rdp->last_fqs_resched) + jtsq * 3)) {
++++ +++ (time_after(jiffies, READ_ONCE(rdp->last_fqs_resched) + jtsq * 3) ||
++++ +++ rcu_state.cbovld)) {
WRITE_ONCE(*ruqp, true);
resched_cpu(rdp->cpu);
WRITE_ONCE(rdp->last_fqs_resched, jiffies);
static void trace_rcu_this_gp(struct rcu_node *rnp, struct rcu_data *rdp,
unsigned long gp_seq_req, const char *s)
{
- ------ trace_rcu_future_grace_period(rcu_state.name, rnp->gp_seq, gp_seq_req,
- ------ rnp->level, rnp->grplo, rnp->grphi, s);
+ ++++++ trace_rcu_future_grace_period(rcu_state.name, READ_ONCE(rnp->gp_seq),
+ ++++++ gp_seq_req, rnp->level,
+ ++++++ rnp->grplo, rnp->grphi, s);
}
/*
TPS("Prestarted"));
goto unlock_out;
}
- ------ rnp->gp_seq_needed = gp_seq_req;
+ ++++++ WRITE_ONCE(rnp->gp_seq_needed, gp_seq_req);
if (rcu_seq_state(rcu_seq_current(&rnp->gp_seq))) {
/*
* We just marked the leaf or internal node, and a
}
trace_rcu_this_gp(rnp, rdp, gp_seq_req, TPS("Startedroot"));
WRITE_ONCE(rcu_state.gp_flags, rcu_state.gp_flags | RCU_GP_FLAG_INIT);
- ------ rcu_state.gp_req_activity = jiffies;
- ------ if (!rcu_state.gp_kthread) {
+ ++++++ WRITE_ONCE(rcu_state.gp_req_activity, jiffies);
+ ++++++ if (!READ_ONCE(rcu_state.gp_kthread)) {
trace_rcu_this_gp(rnp, rdp, gp_seq_req, TPS("NoGPkthread"));
goto unlock_out;
}
- ------ trace_rcu_grace_period(rcu_state.name, READ_ONCE(rcu_state.gp_seq), TPS("newreq"));
+ ++++++ trace_rcu_grace_period(rcu_state.name, rcu_state.gp_seq, TPS("newreq"));
ret = true; /* Caller must wake GP kthread. */
unlock_out:
/* Push furthest requested GP to leaf node and rcu_data structure. */
if (ULONG_CMP_LT(gp_seq_req, rnp->gp_seq_needed)) {
- ------ rnp_start->gp_seq_needed = rnp->gp_seq_needed;
- ------ rdp->gp_seq_needed = rnp->gp_seq_needed;
+ ++++++ WRITE_ONCE(rnp_start->gp_seq_needed, rnp->gp_seq_needed);
+ ++++++ WRITE_ONCE(rdp->gp_seq_needed, rnp->gp_seq_needed);
}
if (rnp != rnp_start)
raw_spin_unlock_rcu_node(rnp);
}
/*
- ------ * Awaken the grace-period kthread. Don't do a self-awaken (unless in
- ------ * an interrupt or softirq handler), and don't bother awakening when there
- ------ * is nothing for the grace-period kthread to do (as in several CPUs raced
- ------ * to awaken, and we lost), and finally don't try to awaken a kthread that
- ------ * has not yet been created. If all those checks are passed, track some
- ------ * debug information and awaken.
+ ++++++ * Awaken the grace-period kthread. Don't do a self-awaken (unless in an
+ ++++++ * interrupt or softirq handler, in which case we just might immediately
+ ++++++ * sleep upon return, resulting in a grace-period hang), and don't bother
+ ++++++ * awakening when there is nothing for the grace-period kthread to do
+ ++++++ * (as in several CPUs raced to awaken, and we lost), and finally don't try
+ ++++++ * to awaken a kthread that has not yet been created. If all those checks
+ ++++++ * are passed, track some debug information and awaken.
*
* So why do the self-wakeup when in an interrupt or softirq handler
* in the grace-period kthread's context? Because the kthread might have
*/
static void rcu_gp_kthread_wake(void)
{
- ------ if ((current == rcu_state.gp_kthread &&
- ------ !in_irq() && !in_serving_softirq()) ||
- ------ !READ_ONCE(rcu_state.gp_flags) ||
- ------ !rcu_state.gp_kthread)
+ ++++++ struct task_struct *t = READ_ONCE(rcu_state.gp_kthread);
+ ++++++
+ ++++++ if ((current == t && !in_irq() && !in_serving_softirq()) ||
+ ++++++ !READ_ONCE(rcu_state.gp_flags) || !t)
return;
WRITE_ONCE(rcu_state.gp_wake_time, jiffies);
WRITE_ONCE(rcu_state.gp_wake_seq, READ_ONCE(rcu_state.gp_seq));
rcu_lockdep_assert_cblist_protected(rdp);
c = rcu_seq_snap(&rcu_state.gp_seq);
- ------ if (!rdp->gpwrap && ULONG_CMP_GE(rdp->gp_seq_needed, c)) {
+ ++++++ if (!READ_ONCE(rdp->gpwrap) && ULONG_CMP_GE(rdp->gp_seq_needed, c)) {
/* Old request still live, so mark recent callbacks. */
(void)rcu_segcblist_accelerate(&rdp->cblist, c);
return;
static bool __note_gp_changes(struct rcu_node *rnp, struct rcu_data *rdp)
{
bool ret = false;
---- --- bool need_gp;
++++ +++ bool need_qs;
const bool offloaded = IS_ENABLED(CONFIG_RCU_NOCB_CPU) &&
rcu_segcblist_is_offloaded(&rdp->cblist);
unlikely(READ_ONCE(rdp->gpwrap))) {
if (!offloaded)
ret = rcu_advance_cbs(rnp, rdp); /* Advance CBs. */
++++ +++ rdp->core_needs_qs = false;
trace_rcu_grace_period(rcu_state.name, rdp->gp_seq, TPS("cpuend"));
} else {
if (!offloaded)
ret = rcu_accelerate_cbs(rnp, rdp); /* Recent CBs. */
++++ +++ if (rdp->core_needs_qs)
++++ +++ rdp->core_needs_qs = !!(rnp->qsmask & rdp->grpmask);
}
/* Now handle the beginnings of any new-to-this-CPU grace periods. */
* go looking for one.
*/
trace_rcu_grace_period(rcu_state.name, rnp->gp_seq, TPS("cpustart"));
---- --- need_gp = !!(rnp->qsmask & rdp->grpmask);
---- --- rdp->cpu_no_qs.b.norm = need_gp;
---- --- rdp->core_needs_qs = need_gp;
++++ +++ need_qs = !!(rnp->qsmask & rdp->grpmask);
++++ +++ rdp->cpu_no_qs.b.norm = need_qs;
++++ +++ rdp->core_needs_qs = need_qs;
zero_cpu_stall_ticks(rdp);
}
rdp->gp_seq = rnp->gp_seq; /* Remember new grace-period state. */
if (ULONG_CMP_LT(rdp->gp_seq_needed, rnp->gp_seq_needed) || rdp->gpwrap)
- ------ rdp->gp_seq_needed = rnp->gp_seq_needed;
+ ++++++ WRITE_ONCE(rdp->gp_seq_needed, rnp->gp_seq_needed);
WRITE_ONCE(rdp->gpwrap, false);
rcu_gpnum_ovf(rnp, rdp);
return ret;
WRITE_ONCE(rcu_state.jiffies_kick_kthreads,
jiffies + (j ? 3 * j : 2));
}
- ------ trace_rcu_grace_period(rcu_state.name,
- ------ READ_ONCE(rcu_state.gp_seq),
+ ++++++ trace_rcu_grace_period(rcu_state.name, rcu_state.gp_seq,
TPS("fqswait"));
rcu_state.gp_state = RCU_GP_WAIT_FQS;
ret = swait_event_idle_timeout_exclusive(
/* If time for quiescent-state forcing, do it. */
if (ULONG_CMP_GE(jiffies, rcu_state.jiffies_force_qs) ||
(gf & RCU_GP_FLAG_FQS)) {
- ------ trace_rcu_grace_period(rcu_state.name,
- ------ READ_ONCE(rcu_state.gp_seq),
+ ++++++ trace_rcu_grace_period(rcu_state.name, rcu_state.gp_seq,
TPS("fqsstart"));
rcu_gp_fqs(first_gp_fqs);
first_gp_fqs = false;
- ------ trace_rcu_grace_period(rcu_state.name,
- ------ READ_ONCE(rcu_state.gp_seq),
+ ++++++ trace_rcu_grace_period(rcu_state.name, rcu_state.gp_seq,
TPS("fqsend"));
cond_resched_tasks_rcu_qs();
WRITE_ONCE(rcu_state.gp_activity, jiffies);
cond_resched_tasks_rcu_qs();
WRITE_ONCE(rcu_state.gp_activity, jiffies);
WARN_ON(signal_pending(current));
- ------ trace_rcu_grace_period(rcu_state.name,
- ------ READ_ONCE(rcu_state.gp_seq),
+ ++++++ trace_rcu_grace_period(rcu_state.name, rcu_state.gp_seq,
TPS("fqswaitsig"));
ret = 1; /* Keep old FQS timing. */
j = jiffies;
*/
static void rcu_gp_cleanup(void)
{
---- --- unsigned long gp_duration;
++++ +++ int cpu;
bool needgp = false;
++++ +++ unsigned long gp_duration;
unsigned long new_gp_seq;
bool offloaded;
struct rcu_data *rdp;
needgp = __note_gp_changes(rnp, rdp) || needgp;
/* smp_mb() provided by prior unlock-lock pair. */
needgp = rcu_future_gp_cleanup(rnp) || needgp;
++++ +++ // Reset overload indication for CPUs no longer overloaded
++++ +++ if (rcu_is_leaf_node(rnp))
++++ +++ for_each_leaf_node_cpu_mask(rnp, cpu, rnp->cbovldmask) {
++++ +++ rdp = per_cpu_ptr(&rcu_data, cpu);
++++ +++ check_cb_ovld_locked(rdp, rnp);
++++ +++ }
sq = rcu_nocb_gp_get(rnp);
raw_spin_unlock_irq_rcu_node(rnp);
rcu_nocb_gp_cleanup(sq);
rcu_segcblist_is_offloaded(&rdp->cblist);
if ((offloaded || !rcu_accelerate_cbs(rnp, rdp)) && needgp) {
WRITE_ONCE(rcu_state.gp_flags, RCU_GP_FLAG_INIT);
- ------ rcu_state.gp_req_activity = jiffies;
+ ++++++ WRITE_ONCE(rcu_state.gp_req_activity, jiffies);
trace_rcu_grace_period(rcu_state.name,
- ------ READ_ONCE(rcu_state.gp_seq),
+ ++++++ rcu_state.gp_seq,
TPS("newreq"));
} else {
WRITE_ONCE(rcu_state.gp_flags,
/* Handle grace-period start. */
for (;;) {
- ------ trace_rcu_grace_period(rcu_state.name,
- ------ READ_ONCE(rcu_state.gp_seq),
+ ++++++ trace_rcu_grace_period(rcu_state.name, rcu_state.gp_seq,
TPS("reqwait"));
rcu_state.gp_state = RCU_GP_WAIT_GPS;
swait_event_idle_exclusive(rcu_state.gp_wq,
cond_resched_tasks_rcu_qs();
WRITE_ONCE(rcu_state.gp_activity, jiffies);
WARN_ON(signal_pending(current));
- ------ trace_rcu_grace_period(rcu_state.name,
- ------ READ_ONCE(rcu_state.gp_seq),
+ ++++++ trace_rcu_grace_period(rcu_state.name, rcu_state.gp_seq,
TPS("reqwaitsig"));
}
WARN_ON_ONCE(oldmask); /* Any child must be all zeroed! */
WARN_ON_ONCE(!rcu_is_leaf_node(rnp) &&
rcu_preempt_blocked_readers_cgp(rnp));
- ------ rnp->qsmask &= ~mask;
+ ++++++ WRITE_ONCE(rnp->qsmask, rnp->qsmask & ~mask);
trace_rcu_quiescent_state_report(rcu_state.name, rnp->gp_seq,
mask, rnp->qsmask, rnp->level,
rnp->grplo, rnp->grphi,
rnp_c = rnp;
rnp = rnp->parent;
raw_spin_lock_irqsave_rcu_node(rnp, flags);
- ------ oldmask = rnp_c->qsmask;
+ ++++++ oldmask = READ_ONCE(rnp_c->qsmask);
}
/*
return;
}
mask = rdp->grpmask;
++++ +++ if (rdp->cpu == smp_processor_id())
++++ +++ rdp->core_needs_qs = false;
if ((rnp->qsmask & mask) == 0) {
raw_spin_unlock_irqrestore_rcu_node(rnp, flags);
} else {
return 0;
blkd = !!(rnp->qsmask & rdp->grpmask);
- ------ trace_rcu_grace_period(rcu_state.name, rnp->gp_seq,
+ ++++++ trace_rcu_grace_period(rcu_state.name, READ_ONCE(rnp->gp_seq),
blkd ? TPS("cpuofl") : TPS("cpuofl-bgp"));
return 0;
}
struct rcu_data *rdp;
struct rcu_node *rnp;
++++ +++ rcu_state.cbovld = rcu_state.cbovldnext;
++++ +++ rcu_state.cbovldnext = false;
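// Here ->cbovld becomes the overload summary accumulated during the
// previous scan, while ->cbovldnext is re-accumulated below (one |= per
// leaf rcu_node) so that the next pass sees a fresh summary.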
rcu_for_each_leaf_node(rnp) {
cond_resched_tasks_rcu_qs();
mask = 0;
raw_spin_lock_irqsave_rcu_node(rnp, flags);
++++ +++ rcu_state.cbovldnext |= !!rnp->cbovldmask;
if (rnp->qsmask == 0) {
if (!IS_ENABLED(CONFIG_PREEMPT_RCU) ||
rcu_preempt_blocked_readers_cgp(rnp)) {
}
/*
---- --- * Helper function for call_rcu() and friends. The cpu argument will
---- --- * normally be -1, indicating "currently running CPU". It may specify
---- --- * a CPU only if that CPU is a no-CBs CPU. Currently, only rcu_barrier()
---- --- * is expected to specify a CPU.
++++ +++ * Check and if necessary update the leaf rcu_node structure's
++++ +++ * ->cbovldmask bit corresponding to the current CPU based on that CPU's
++++ +++ * number of queued RCU callbacks. The caller must hold the leaf rcu_node
++++ +++ * structure's ->lock.
+ */
++++ +++static void check_cb_ovld_locked(struct rcu_data *rdp, struct rcu_node *rnp)
++++ +++{
++++ +++ raw_lockdep_assert_held_rcu_node(rnp);
++++ +++ if (qovld_calc <= 0)
++++ +++ return; // Early boot and wildcard value set.
++++ +++ if (rcu_segcblist_n_cbs(&rdp->cblist) >= qovld_calc)
++++ +++ WRITE_ONCE(rnp->cbovldmask, rnp->cbovldmask | rdp->grpmask);
++++ +++ else
++++ +++ WRITE_ONCE(rnp->cbovldmask, rnp->cbovldmask & ~rdp->grpmask);
++++ +++}
++++ +++
++++ +++/*
++++ +++ * Check and if necessary update the leaf rcu_node structure's
++++ +++ * ->cbovldmask bit corresponding to the current CPU based on that CPU's
++++ +++ * number of queued RCU callbacks. No locks need be held, but the
++++ +++ * caller must have disabled interrupts.
++++ +++ *
++++ +++ * Note that this function ignores the possibility that there are a lot
++++ +++ * of callbacks all of which have already seen the end of their respective
++++ +++ * grace periods. This omission is due to the need for no-CBs CPUs to
++++ +++ * be holding ->nocb_lock to do this check, which is too heavy for a
++++ +++ * common-case operation.
+ ++ +++ */
++++ +++static void check_cb_ovld(struct rcu_data *rdp)
++++ +++{
++++ +++ struct rcu_node *const rnp = rdp->mynode;
++++ +++
++++ +++ if (qovld_calc <= 0 ||
++++ +++ ((rcu_segcblist_n_cbs(&rdp->cblist) >= qovld_calc) ==
++++ +++ !!(READ_ONCE(rnp->cbovldmask) & rdp->grpmask)))
++++ +++ return; // Early boot wildcard value or already set correctly.
++++ +++ raw_spin_lock_rcu_node(rnp);
++++ +++ check_cb_ovld_locked(rdp, rnp);
++++ +++ raw_spin_unlock_rcu_node(rnp);
++++ +++}
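/*
 * The function above is an instance of the usual lockless-precheck pattern:
 * figure out the desired state of the ->cbovldmask bit without the lock and
 * acquire ->lock only when that bit actually needs to change.  A minimal
 * sketch of the shape:
 *
 *	bool want = rcu_segcblist_n_cbs(&rdp->cblist) >= qovld_calc;
 *	bool have = !!(READ_ONCE(rnp->cbovldmask) & rdp->grpmask);
 *
 *	if (want == have)
 *		return;				// nothing to change, lock avoided
 *	raw_spin_lock_rcu_node(rnp);
 *	check_cb_ovld_locked(rdp, rnp);		// recheck and update under ->lock
 *	raw_spin_unlock_rcu_node(rnp);
 */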
++++ +++
++++ +++/* Helper function for call_rcu() and friends. */
static void
__call_rcu(struct rcu_head *head, rcu_callback_t func)
{
rcu_segcblist_init(&rdp->cblist);
}
++++ +++ check_cb_ovld(rdp);
if (rcu_nocb_try_bypass(rdp, head, &was_alldone, flags))
return; // Enqueued onto ->nocb_bypass, so just leave.
---- --- /* If we get here, rcu_nocb_try_bypass() acquired ->nocb_lock. */
++++ +++ // If no-CBs CPU gets here, rcu_nocb_try_bypass() acquired ->nocb_lock.
rcu_segcblist_enqueue(&rdp->cblist, head);
if (__is_kfree_rcu_offset((unsigned long)func))
trace_rcu_kfree_callback(rcu_state.name, head,
#define KFREE_DRAIN_JIFFIES (HZ / 50)
#define KFREE_N_BATCHES 2
++ +++++/*
++ +++++ * This macro defines how many entries the "records" array
++ +++++ * will contain. It is chosen so that the size of the
++ +++++ * kfree_rcu_bulk_data structure is exactly one page.
++ +++++ */
++ +++++#define KFREE_BULK_MAX_ENTR ((PAGE_SIZE / sizeof(void *)) - 3)
++ +++++
++ +++++/**
++ +++++ * struct kfree_rcu_bulk_data - single block to store kfree_rcu() pointers
++ +++++ * @nr_records: Number of active pointers in the array
++ +++++ * @records: Array of the kfree_rcu() pointers
++ +++++ * @next: Next bulk object in the block chain
++ +++++ * @head_free_debug: For debug, when CONFIG_DEBUG_OBJECTS_RCU_HEAD is set
++ +++++ */
++ +++++struct kfree_rcu_bulk_data {
++ +++++ unsigned long nr_records;
++ +++++ void *records[KFREE_BULK_MAX_ENTR];
++ +++++ struct kfree_rcu_bulk_data *next;
++ +++++ struct rcu_head *head_free_debug;
++ +++++};
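/*
 * Worked example of the sizing above, assuming a 64-bit kernel with 4 KiB
 * pages: the three non-array fields (nr_records, next, head_free_debug)
 * account for the "- 3", so
 *
 *	KFREE_BULK_MAX_ENTR = PAGE_SIZE / sizeof(void *) - 3
 *	                    = 4096 / 8 - 3 = 509
 *
 * and sizeof(struct kfree_rcu_bulk_data) = (509 + 3) * 8 = 4096 bytes, which
 * is exactly what the WARN_ON_ONCE() in kfree_call_rcu_add_ptr_to_bulk()
 * checks against PAGE_SIZE.
 */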
++ +++++
/**
* struct kfree_rcu_cpu_work - single batch of kfree_rcu() requests
* @rcu_work: Let queue_rcu_work() invoke workqueue handler after grace period
* @head_free: List of kfree_rcu() objects waiting for a grace period
++ +++++ * @bhead_free: Bulk-List of kfree_rcu() objects waiting for a grace period
* @krcp: Pointer to @kfree_rcu_cpu structure
*/
struct kfree_rcu_cpu_work {
struct rcu_work rcu_work;
struct rcu_head *head_free;
++ +++++ struct kfree_rcu_bulk_data *bhead_free;
struct kfree_rcu_cpu *krcp;
};
/**
* struct kfree_rcu_cpu - batch up kfree_rcu() requests for RCU grace period
* @head: List of kfree_rcu() objects not yet waiting for a grace period
++ +++++ * @bhead: Bulk-List of kfree_rcu() objects not yet waiting for a grace period
++ +++++ * @bcached: Keeps at most one block cached for later reuse when building chains of blocks
* @krw_arr: Array of batches of kfree_rcu() objects waiting for a grace period
* @lock: Synchronize access to this structure
* @monitor_work: Promote @head to @head_free after KFREE_DRAIN_JIFFIES
*/
struct kfree_rcu_cpu {
struct rcu_head *head;
++ +++++ struct kfree_rcu_bulk_data *bhead;
++ +++++ struct kfree_rcu_bulk_data *bcached;
struct kfree_rcu_cpu_work krw_arr[KFREE_N_BATCHES];
spinlock_t lock;
struct delayed_work monitor_work;
static DEFINE_PER_CPU(struct kfree_rcu_cpu, krc);
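/*
 * A rough per-CPU data-flow sketch tying the structures above together:
 *
 *	kfree_call_rcu()
 *	  -> krcp->bhead (bulk blocks) or krcp->head (emergency singles)
 *	       -> queue_kfree_rcu_work(): detach onto a free channel of one
 *	          krw_arr[] batch (->bhead_free / ->head_free), queue_rcu_work()
 *	            -> kfree_rcu_work() after a grace period:
 *	               kfree_bulk() the blocks, kfree() the singles.
 */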
++ +++++static __always_inline void
++ +++++debug_rcu_head_unqueue_bulk(struct rcu_head *head)
++ +++++{
++ +++++#ifdef CONFIG_DEBUG_OBJECTS_RCU_HEAD
++ +++++ for (; head; head = head->next)
++ +++++ debug_rcu_head_unqueue(head);
++ +++++#endif
++ +++++}
++ +++++
/*
* This function is invoked in workqueue context after a grace period.
-- ----- * It frees all the objects queued on ->head_free.
++ +++++ * It frees all the objects queued on ->bhead_free or ->head_free.
*/
static void kfree_rcu_work(struct work_struct *work)
{
unsigned long flags;
struct rcu_head *head, *next;
++ +++++ struct kfree_rcu_bulk_data *bhead, *bnext;
struct kfree_rcu_cpu *krcp;
struct kfree_rcu_cpu_work *krwp;
spin_lock_irqsave(&krcp->lock, flags);
head = krwp->head_free;
krwp->head_free = NULL;
++ +++++ bhead = krwp->bhead_free;
++ +++++ krwp->bhead_free = NULL;
spin_unlock_irqrestore(&krcp->lock, flags);
-- ----- // List "head" is now private, so traverse locklessly.
++ +++++ /* "bhead" is now private, so traverse locklessly. */
++ +++++ for (; bhead; bhead = bnext) {
++ +++++ bnext = bhead->next;
++ +++++
++ +++++ debug_rcu_head_unqueue_bulk(bhead->head_free_debug);
++ +++++
++ +++++ rcu_lock_acquire(&rcu_callback_map);
++ +++++ trace_rcu_invoke_kfree_bulk_callback(rcu_state.name,
++ +++++ bhead->nr_records, bhead->records);
++ +++++
++ +++++ kfree_bulk(bhead->nr_records, bhead->records);
++ +++++ rcu_lock_release(&rcu_callback_map);
++ +++++
++ +++++ if (cmpxchg(&krcp->bcached, NULL, bhead))
++ +++++ free_page((unsigned long) bhead);
++ +++++
++ +++++ cond_resched_tasks_rcu_qs();
++ +++++ }
++ +++++
++ +++++ /*
++ +++++ * This is the emergency case only. It can happen under low-memory
++ +++++ * conditions, when an allocation fails and so the "bulk" path
++ +++++ * temporarily cannot be used.
++ +++++ */
for (; head; head = next) {
unsigned long offset = (unsigned long)head->func;
next = head->next;
-- ----- // Potentially optimize with kfree_bulk in future.
debug_rcu_head_unqueue(head);
rcu_lock_acquire(&rcu_callback_map);
trace_rcu_invoke_kfree_callback(rcu_state.name, head, offset);
-- ----- if (!WARN_ON_ONCE(!__is_kfree_rcu_offset(offset))) {
-- ----- /* Could be optimized with kfree_bulk() in future. */
++ +++++ if (!WARN_ON_ONCE(!__is_kfree_rcu_offset(offset)))
kfree((void *)head - offset);
-- ----- }
rcu_lock_release(&rcu_callback_map);
cond_resched_tasks_rcu_qs();
*/
static inline bool queue_kfree_rcu_work(struct kfree_rcu_cpu *krcp)
{
++ +++++ struct kfree_rcu_cpu_work *krwp;
++ +++++ bool queued = false;
int i;
-- ----- struct kfree_rcu_cpu_work *krwp = NULL;
lockdep_assert_held(&krcp->lock);
-- ----- for (i = 0; i < KFREE_N_BATCHES; i++)
-- ----- if (!krcp->krw_arr[i].head_free) {
-- ----- krwp = &(krcp->krw_arr[i]);
-- ----- break;
-- ----- }
-- ----- // If a previous RCU batch is in progress, we cannot immediately
-- ----- // queue another one, so return false to tell caller to retry.
-- ----- if (!krwp)
-- ----- return false;
++ +++++ for (i = 0; i < KFREE_N_BATCHES; i++) {
++ +++++ krwp = &(krcp->krw_arr[i]);
-- ----- krwp->head_free = krcp->head;
-- ----- krcp->head = NULL;
-- ----- INIT_RCU_WORK(&krwp->rcu_work, kfree_rcu_work);
-- ----- queue_rcu_work(system_wq, &krwp->rcu_work);
-- ----- return true;
++ +++++ /*
++ +++++ * Try to detach bhead or head and attach it to the corresponding
++ +++++ * free channel, if that channel is available. A previous RCU
++ +++++ * batch may still be in progress, in which case another one
++ +++++ * cannot be queued immediately, so false is returned to tell
++ +++++ * the caller to retry.
++ +++++ */
++ +++++ if ((krcp->bhead && !krwp->bhead_free) ||
++ +++++ (krcp->head && !krwp->head_free)) {
++ +++++ /* Channel 1. */
++ +++++ if (!krwp->bhead_free) {
++ +++++ krwp->bhead_free = krcp->bhead;
++ +++++ krcp->bhead = NULL;
++ +++++ }
++ +++++
++ +++++ /* Channel 2. */
++ +++++ if (!krwp->head_free) {
++ +++++ krwp->head_free = krcp->head;
++ +++++ krcp->head = NULL;
++ +++++ }
++ +++++
++ +++++ /*
++ +++++ * There is one work item per batch, so each batch provides two
++ +++++ * "free channels" that it can handle: "bhead_free" and "head_free".
++ +++++ * The work item may already be pending when the two channels are
++ +++++ * detached one after the other.
++ +++++ */
++ +++++ queue_rcu_work(system_wq, &krwp->rcu_work);
++ +++++ queued = true;
++ +++++ }
++ +++++ }
++ +++++
++ +++++ return queued;
}
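/*
 * With KFREE_N_BATCHES == 2, the loop above lets one batch sit waiting for
 * its grace period while the other accepts the next detach.  Rough timeline:
 *
 *	t0: batch 0 takes ->bhead/->head and its work is queued  (in flight)
 *	t1: further kfree_rcu() requests accumulate on krcp->bhead
 *	t2: batch 1's channels are free, so the next drain detaches onto it
 *	t3: only if every batch's matching channel is still busy (or there is
 *	    nothing to detach) does "queued" stay false, making the caller retry.
 */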
static inline void kfree_rcu_drain_unlock(struct kfree_rcu_cpu *krcp,
spin_unlock_irqrestore(&krcp->lock, flags);
}
++ +++++static inline bool
++ +++++kfree_call_rcu_add_ptr_to_bulk(struct kfree_rcu_cpu *krcp,
++ +++++ struct rcu_head *head, rcu_callback_t func)
++ +++++{
++ +++++ struct kfree_rcu_bulk_data *bnode;
++ +++++
++ +++++ if (unlikely(!krcp->initialized))
++ +++++ return false;
++ +++++
++ +++++ lockdep_assert_held(&krcp->lock);
++ +++++
++ +++++ /* Check if a new block is required. */
++ +++++ if (!krcp->bhead ||
++ +++++ krcp->bhead->nr_records == KFREE_BULK_MAX_ENTR) {
++ +++++ bnode = xchg(&krcp->bcached, NULL);
++ +++++ if (!bnode) {
++ +++++ WARN_ON_ONCE(sizeof(struct kfree_rcu_bulk_data) > PAGE_SIZE);
++ +++++
++ +++++ bnode = (struct kfree_rcu_bulk_data *)
++ +++++ __get_free_page(GFP_NOWAIT | __GFP_NOWARN);
++ +++++ }
++ +++++
++ +++++ /* Switch to emergency path. */
++ +++++ if (unlikely(!bnode))
++ +++++ return false;
++ +++++
++ +++++ /* Initialize the new block. */
++ +++++ bnode->nr_records = 0;
++ +++++ bnode->next = krcp->bhead;
++ +++++ bnode->head_free_debug = NULL;
++ +++++
++ +++++ /* Attach it to the head. */
++ +++++ krcp->bhead = bnode;
++ +++++ }
++ +++++
++ +++++#ifdef CONFIG_DEBUG_OBJECTS_RCU_HEAD
++ +++++ head->func = func;
++ +++++ head->next = krcp->bhead->head_free_debug;
++ +++++ krcp->bhead->head_free_debug = head;
++ +++++#endif
++ +++++
++ +++++ /* Finally insert. */
++ +++++ krcp->bhead->records[krcp->bhead->nr_records++] =
++ +++++ (void *) head - (unsigned long) func;
++ +++++
++ +++++ return true;
++ +++++}
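/*
 * The ->bcached field used above is a single-slot page cache shared between
 * the freeing and allocating paths, built from two lock-free operations:
 *
 *	producer (kfree_rcu_work):
 *		if (cmpxchg(&krcp->bcached, NULL, bhead))	// slot taken?
 *			free_page((unsigned long) bhead);	// yes, really free
 *
 *	consumer (kfree_call_rcu_add_ptr_to_bulk):
 *		bnode = xchg(&krcp->bcached, NULL);		// grab it, if any
 *
 * At most one block is retained per CPU, bounding the memory held back while
 * still avoiding __get_free_page() in the common case.
 */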
++ +++++
/*
-- ----- * Queue a request for lazy invocation of kfree() after a grace period.
++ +++++ * Queue a request for lazy invocation of kfree_bulk()/kfree() after a grace
++ +++++ * period. Note that two paths are maintained: the main one uses the
++ +++++ * kfree_bulk() interface, and the emergency one is used only when the main
++ +++++ * path temporarily cannot be used due to memory pressure.
*
* Each kfree_call_rcu() request is added to a batch. The batch will be drained
-- ----- * every KFREE_DRAIN_JIFFIES number of jiffies. All the objects in the batch
-- ----- * will be kfree'd in workqueue context. This allows us to:
-- ----- *
-- ----- * 1. Batch requests together to reduce the number of grace periods during
-- ----- * heavy kfree_rcu() load.
-- ----- *
-- ----- * 2. It makes it possible to use kfree_bulk() on a large number of
-- ----- * kfree_rcu() requests thus reducing cache misses and the per-object
-- ----- * overhead of kfree().
++ +++++ * every KFREE_DRAIN_JIFFIES number of jiffies. All the objects in the batch
++ +++++ * will be freed in workqueue context. This allows us to batch requests
++ +++++ * together to reduce the number of grace periods during heavy kfree_rcu()
++ +++++ * load.
*/
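/*
 * Caller-side sketch (hypothetical struct and field names): kfree_call_rcu()
 * below is normally reached through the kfree_rcu() wrapper, which encodes
 * the offset of the rcu_head within the enclosing object as the "func"
 * argument; __is_kfree_rcu_offset() relies on that encoding.
 *
 *	struct foo {
 *		int data;
 *		struct rcu_head rh;
 *	};
 *
 *	static void release_foo(struct foo *p)
 *	{
 *		kfree_rcu(p, rh);	// frees *p after a grace period
 *	}
 */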
void kfree_call_rcu(struct rcu_head *head, rcu_callback_t func)
{
__func__, head);
goto unlock_return;
}
-- ----- head->func = func;
-- ----- head->next = krcp->head;
-- ----- krcp->head = head;
++ +++++
++ +++++ /*
++ +++++ * Under high memory pressure GFP_NOWAIT can fail, in which
++ +++++ * case the emergency path is used instead.
++ +++++ */
++ +++++ if (unlikely(!kfree_call_rcu_add_ptr_to_bulk(krcp, head, func))) {
++ +++++ head->func = func;
++ +++++ head->next = krcp->head;
++ +++++ krcp->head = head;
++ +++++ }
// Set timer to drain after KFREE_DRAIN_JIFFIES.
if (rcu_scheduler_active == RCU_SCHEDULER_RUNNING &&
/*
* RCU callback function for rcu_barrier(). If we are last, wake
* up the task executing rcu_barrier().
+ ++++++ *
+ ++++++ * Note that the value of rcu_state.barrier_sequence must be captured
+ ++++++ * before the atomic_dec_and_test(). Otherwise, if this CPU is not last,
+ ++++++ * other CPUs might count the value down to zero before this CPU gets
+ ++++++ * around to invoking rcu_barrier_trace(), which might result in bogus
+ ++++++ * data from the next instance of rcu_barrier().
*/
static void rcu_barrier_callback(struct rcu_head *rhp)
{
+ ++++++ unsigned long __maybe_unused s = rcu_state.barrier_sequence;
+ ++++++
if (atomic_dec_and_test(&rcu_state.barrier_cpu_count)) {
- ------ rcu_barrier_trace(TPS("LastCB"), -1,
- ------ rcu_state.barrier_sequence);
+ ++++++ rcu_barrier_trace(TPS("LastCB"), -1, s);
complete(&rcu_state.barrier_completion);
} else {
- ------ rcu_barrier_trace(TPS("CB"), -1, rcu_state.barrier_sequence);
+ ++++++ rcu_barrier_trace(TPS("CB"), -1, s);
}
}
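/*
 * A concrete interleaving (hypothetical CPU numbering) showing why the early
 * snapshot of ->barrier_sequence matters:
 *
 *	CPU 0: s = rcu_state.barrier_sequence;		// snapshot taken
 *	CPU 0: atomic_dec_and_test() -> false		// not the last CPU
 *	CPU 1: atomic_dec_and_test() -> true, complete()	// rcu_barrier() returns
 *	CPU 2: starts the next rcu_barrier(), advancing ->barrier_sequence
 *	CPU 0: rcu_barrier_trace(TPS("CB"), -1, s);	// still traces the old value
 *
 * Without the snapshot, CPU 0's trace could report the next instance's
 * sequence number.
 */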
/*
* Called with preemption disabled, and from cross-cpu IRQ context.
*/
- ------static void rcu_barrier_func(void *unused)
+ ++++++static void rcu_barrier_func(void *cpu_in)
{
- ------ struct rcu_data *rdp = raw_cpu_ptr(&rcu_data);
+ ++++++ uintptr_t cpu = (uintptr_t)cpu_in;
+ ++++++ struct rcu_data *rdp = per_cpu_ptr(&rcu_data, cpu);
rcu_barrier_trace(TPS("IRQ"), -1, rcu_state.barrier_sequence);
rdp->barrier_head.func = rcu_barrier_callback;
*/
void rcu_barrier(void)
{
- ------ int cpu;
+ ++++++ uintptr_t cpu;
struct rcu_data *rdp;
unsigned long s = rcu_seq_snap(&rcu_state.barrier_sequence);
rcu_barrier_trace(TPS("Inc1"), -1, rcu_state.barrier_sequence);
/*
- ------ * Initialize the count to one rather than to zero in order to
- ------ * avoid a too-soon return to zero in case of a short grace period
- ------ * (or preemption of this task). Exclude CPU-hotplug operations
- ------ * to ensure that no offline CPU has callbacks queued.
+ ++++++ * Initialize the count to two rather than to zero in order
+ ++++++ * to avoid a too-soon return to zero in case of an immediate
+ ++++++ * invocation of the just-enqueued callback (or preemption of
+ ++++++ * this task). Exclude CPU-hotplug operations to ensure that no
+ ++++++ * offline non-offloaded CPU has callbacks queued.
*/
init_completion(&rcu_state.barrier_completion);
- ------ atomic_set(&rcu_state.barrier_cpu_count, 1);
+ ++++++ atomic_set(&rcu_state.barrier_cpu_count, 2);
get_online_cpus();
/*
*/
for_each_possible_cpu(cpu) {
rdp = per_cpu_ptr(&rcu_data, cpu);
- ------ if (!cpu_online(cpu) &&
+ ++++++ if (cpu_is_offline(cpu) &&
!rcu_segcblist_is_offloaded(&rdp->cblist))
continue;
- ------ if (rcu_segcblist_n_cbs(&rdp->cblist)) {
+ ++++++ if (rcu_segcblist_n_cbs(&rdp->cblist) && cpu_online(cpu)) {
rcu_barrier_trace(TPS("OnlineQ"), cpu,
rcu_state.barrier_sequence);
- ------ smp_call_function_single(cpu, rcu_barrier_func, NULL, 1);
+ ++++++ smp_call_function_single(cpu, rcu_barrier_func, (void *)cpu, 1);
+ ++++++ } else if (rcu_segcblist_n_cbs(&rdp->cblist) &&
+ ++++++ cpu_is_offline(cpu)) {
+ ++++++ rcu_barrier_trace(TPS("OfflineNoCBQ"), cpu,
+ ++++++ rcu_state.barrier_sequence);
+ ++++++ local_irq_disable();
+ ++++++ rcu_barrier_func((void *)cpu);
+ ++++++ local_irq_enable();
+ ++++++ } else if (cpu_is_offline(cpu)) {
+ ++++++ rcu_barrier_trace(TPS("OfflineNoCBNoQ"), cpu,
+ ++++++ rcu_state.barrier_sequence);
} else {
rcu_barrier_trace(TPS("OnlineNQ"), cpu,
rcu_state.barrier_sequence);
* Now that we have an rcu_barrier_callback() callback on each
* CPU, and thus each counted, remove the initial count.
*/
- ------ if (atomic_dec_and_test(&rcu_state.barrier_cpu_count))
+ ++++++ if (atomic_sub_and_test(2, &rcu_state.barrier_cpu_count))
complete(&rcu_state.barrier_completion);
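/*
 * Bookkeeping sketch for ->barrier_cpu_count (with N the number of CPUs that
 * end up with an rcu_barrier_callback() queued; the enqueue paths, not shown
 * here, increment the count once per queued callback):
 *
 *	atomic_set(..., 2);		// guard against premature zero
 *	N x atomic_inc(...)		// one per entrained callback
 *	atomic_sub_and_test(2, ...)	// drop the guard (true only if N == 0)
 *	N x atomic_dec_and_test(...)	// callbacks; the last one complete()s
 *
 * The count can reach zero only after the guard of two is removed and every
 * queued callback has run, so rcu_barrier() cannot return early.
 */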
/* Wait for all rcu_barrier_callback() callbacks to be invoked. */
rnp = rdp->mynode;
raw_spin_lock_rcu_node(rnp); /* irqs already disabled. */
rdp->beenonline = true; /* We have now been online. */
- ------ rdp->gp_seq = rnp->gp_seq;
- ------ rdp->gp_seq_needed = rnp->gp_seq;
+ ++++++ rdp->gp_seq = READ_ONCE(rnp->gp_seq);
+ ++++++ rdp->gp_seq_needed = rdp->gp_seq;
rdp->cpu_no_qs.b.norm = true;
rdp->core_needs_qs = false;
rdp->rcu_iw_pending = false;
- ------ rdp->rcu_iw_gp_seq = rnp->gp_seq - 1;
+ ++++++ rdp->rcu_iw_gp_seq = rdp->gp_seq - 1;
trace_rcu_grace_period(rcu_state.name, rdp->gp_seq, TPS("cpuonl"));
raw_spin_unlock_irqrestore_rcu_node(rnp, flags);
rcu_prepare_kthreads(cpu);
rnp = rdp->mynode;
mask = rdp->grpmask;
raw_spin_lock_irqsave_rcu_node(rnp, flags);
- ------ rnp->qsmaskinitnext |= mask;
+ ++++++ WRITE_ONCE(rnp->qsmaskinitnext, rnp->qsmaskinitnext | mask);
oldmask = rnp->expmaskinitnext;
rnp->expmaskinitnext |= mask;
oldmask ^= rnp->expmaskinitnext;
rcu_report_qs_rnp(mask, rnp, rnp->gp_seq, flags);
raw_spin_lock_irqsave_rcu_node(rnp, flags);
}
- ------ rnp->qsmaskinitnext &= ~mask;
+ ++++++ WRITE_ONCE(rnp->qsmaskinitnext, rnp->qsmaskinitnext & ~mask);
raw_spin_unlock_irqrestore_rcu_node(rnp, flags);
raw_spin_unlock(&rcu_state.ofl_lock);
}
rnp = rcu_get_root();
raw_spin_lock_irqsave_rcu_node(rnp, flags);
- ------ rcu_state.gp_kthread = t;
+ ++++++ WRITE_ONCE(rcu_state.gp_activity, jiffies);
+ ++++++ WRITE_ONCE(rcu_state.gp_req_activity, jiffies);
+ ++++++ // Reset .gp_activity and .gp_req_activity before setting .gp_kthread.
+ ++++++ smp_store_release(&rcu_state.gp_kthread, t); /* ^^^ */
raw_spin_unlock_irqrestore_rcu_node(rnp, flags);
wake_up_process(t);
rcu_spawn_nocb_kthreads();
struct kfree_rcu_cpu *krcp = per_cpu_ptr(&krc, cpu);
spin_lock_init(&krcp->lock);
-- ----- for (i = 0; i < KFREE_N_BATCHES; i++)
++ +++++ for (i = 0; i < KFREE_N_BATCHES; i++) {
++ +++++ INIT_RCU_WORK(&krcp->krw_arr[i].rcu_work, kfree_rcu_work);
krcp->krw_arr[i].krcp = krcp;
++ +++++ }
++ +++++
INIT_DELAYED_WORK(&krcp->monitor_work, kfree_rcu_monitor);
krcp->initialized = true;
}
rcu_par_gp_wq = alloc_workqueue("rcu_par_gp", WQ_MEM_RECLAIM, 0);
WARN_ON(!rcu_par_gp_wq);
srcu_init();
++++ +++
++++ +++ /* Fill in default value for rcutree.qovld boot parameter. */
++++ +++ /* -After- the rcu_node ->lock fields are initialized! */
++++ +++ if (qovld < 0)
++++ +++ qovld_calc = DEFAULT_RCU_QOVLD_MULT * qhimark;
++++ +++ else
++++ +++ qovld_calc = qovld;
}
#include "tree_stall.h"