Merge tag 'sched-core-2021-02-17' of git://git.kernel.org/pub/scm/linux/kernel/git...

author Linus Torvalds <torvalds@linux-foundation.org>
Sun, 21 Feb 2021 20:35:04 +0000 (12:35 -0800)
committer Linus Torvalds <torvalds@linux-foundation.org>
Sun, 21 Feb 2021 20:35:04 +0000 (12:35 -0800)
diff --cc Documentation/admin-guide/kernel-parameters.txt
Simple merge
diff --cc arch/Kconfig
Simple merge
diff --cc arch/powerpc/platforms/cell/spufs/sched.c
Simple merge
diff --cc arch/x86/Kconfig
Simple merge
diff --cc include/asm-generic/vmlinux.lds.h
Simple merge
diff --cc include/linux/rcupdate.h

index ebd8dcc,36c2119..bd04f72
--- 1/include/linux/rcupdate.h
--- 2/include/linux/rcupdate.h
+++ b/include/linux/rcupdate.h
@@@ -112,12 -110,10 +112,14 @@@ static inline void rcu_user_exit(void) 
   
   #ifdef CONFIG_RCU_NOCB_CPU
   void rcu_init_nohz(void);
+ +int rcu_nocb_cpu_offload(int cpu);
+ +int rcu_nocb_cpu_deoffload(int cpu);
+ void rcu_nocb_flush_deferred_wakeup(void);
   #else /* #ifdef CONFIG_RCU_NOCB_CPU */
   static inline void rcu_init_nohz(void) { }
+ +static inline int rcu_nocb_cpu_offload(int cpu) { return -EINVAL; }
+ +static inline int rcu_nocb_cpu_deoffload(int cpu) { return 0; }
+ static inline void rcu_nocb_flush_deferred_wakeup(void) { }
   #endif /* #else #ifdef CONFIG_RCU_NOCB_CPU */
   
   /**
diff --cc init/Kconfig
Simple merge
diff --cc kernel/events/core.c
Simple merge
diff --cc kernel/locking/rtmutex.c
Simple merge
diff --cc kernel/rcu/tree.c
Simple merge
diff --cc kernel/rcu/tree.h
Simple merge
diff --cc kernel/rcu/tree_plugin.h

index 231a0c6,cdc1b76..2d60377
--- 1/kernel/rcu/tree_plugin.h
--- 2/kernel/rcu/tree_plugin.h
+++ b/kernel/rcu/tree_plugin.h
@@@ -2280,201 -2186,19 +2285,208 @@@ static void do_nocb_deferred_wakeup_tim
    * This means we do an inexact common-case check.  Note that if
    * we miss, ->nocb_timer will eventually clean things up.
    */
- static void do_nocb_deferred_wakeup(struct rcu_data *rdp)
+ static bool do_nocb_deferred_wakeup(struct rcu_data *rdp)
   {
         if (rcu_nocb_need_deferred_wakeup(rdp))
-               do_nocb_deferred_wakeup_common(rdp);
+               return do_nocb_deferred_wakeup_common(rdp);
+       return false;
+ }
+ 
+ void rcu_nocb_flush_deferred_wakeup(void)
+ {
+       do_nocb_deferred_wakeup(this_cpu_ptr(&rcu_data));
   }
+ EXPORT_SYMBOL_GPL(rcu_nocb_flush_deferred_wakeup);
   
+ +static int rdp_offload_toggle(struct rcu_data *rdp,
+ +                             bool offload, unsigned long flags)
+ +      __releases(rdp->nocb_lock) /* the nocb lock is dropped in here, restoring @flags */
+ +{
+ +      struct rcu_segcblist *cblist = &rdp->cblist;
+ +      struct rcu_data *rdp_gp = rdp->nocb_gp_rdp;
+ +      bool wake_gp = false;
+ +
+ +      rcu_segcblist_offload(cblist, offload);
+ +
+ +      if (rdp->nocb_cb_sleep)
+ +              rdp->nocb_cb_sleep = false;
+ +      rcu_nocb_unlock_irqrestore(rdp, flags);
+ +
+ +      /*
+ +       * Ignore the former value of nocb_cb_sleep and force a wake-up, as it
+ +       * could have been spuriously set to false already.
+ +       */
+ +      swake_up_one(&rdp->nocb_cb_wq);
+ +
+ +      raw_spin_lock_irqsave(&rdp_gp->nocb_gp_lock, flags); /* @flags is reused for this lock */
+ +      if (rdp_gp->nocb_gp_sleep) {
+ +              rdp_gp->nocb_gp_sleep = false;
+ +              wake_gp = true;
+ +      }
+ +      raw_spin_unlock_irqrestore(&rdp_gp->nocb_gp_lock, flags);
+ +
+ +      if (wake_gp) /* wake only after nocb_gp_lock has been dropped */
+ +              wake_up_process(rdp_gp->nocb_gp_kthread);
+ +
+ +      return 0; /* no failure path: always 0 */
+ +}
+ +
+ +static int __rcu_nocb_rdp_deoffload(struct rcu_data *rdp) /* -EBUSY or rdp_offload_toggle()'s result */
+ +{
+ +      struct rcu_segcblist *cblist = &rdp->cblist;
+ +      unsigned long flags;
+ +      int ret;
+ +
+ +      pr_info("De-offloading %d\n", rdp->cpu);
+ +
+ +      rcu_nocb_lock_irqsave(rdp, flags);
+ +      /*
+ +       * If offloaded work is still pending, the offline CPU won't
+ +       * help much in handling it.
+ +       */
+ +      if (cpu_is_offline(rdp->cpu) && !rcu_segcblist_empty(&rdp->cblist)) {
+ +              rcu_nocb_unlock_irqrestore(rdp, flags);
+ +              return -EBUSY;
+ +      }
+ +
+ +      ret = rdp_offload_toggle(rdp, false, flags); /* also releases the nocb lock taken above */
+ +      swait_event_exclusive(rdp->nocb_state_wq,
+ +                            !rcu_segcblist_test_flags(cblist, SEGCBLIST_KTHREAD_CB |
+ +                                                      SEGCBLIST_KTHREAD_GP));
+ +      rcu_nocb_lock_irqsave(rdp, flags);
+ +      /* Make sure the nocb timer won't stay around */
+ +      WRITE_ONCE(rdp->nocb_defer_wakeup, RCU_NOCB_WAKE_OFF);
+ +      rcu_nocb_unlock_irqrestore(rdp, flags);
+ +      del_timer_sync(&rdp->nocb_timer);
+ +
+ +      /*
+ +       * Flush bypass. While IRQs are disabled and once we set
+ +       * SEGCBLIST_SOFTIRQ_ONLY, no callback is supposed to be
+ +       * enqueued on bypass.
+ +       */
+ +      rcu_nocb_lock_irqsave(rdp, flags);
+ +      rcu_nocb_flush_bypass(rdp, NULL, jiffies);
+ +      rcu_segcblist_set_flags(cblist, SEGCBLIST_SOFTIRQ_ONLY);
+ +      /*
+ +       * With SEGCBLIST_SOFTIRQ_ONLY, we can't use
+ +       * rcu_nocb_unlock_irqrestore() anymore. Theoretically we
+ +       * could set SEGCBLIST_SOFTIRQ_ONLY with cb unlocked and IRQs
+ +       * disabled now, but let's be paranoid.
+ +       */
+ +      raw_spin_unlock_irqrestore(&rdp->nocb_lock, flags);
+ +
+ +      return ret;
+ +}
+ +
+ +static long rcu_nocb_rdp_deoffload(void *arg) /* work_on_cpu() callback; @arg is the rdp */
+ +{
+ +      struct rcu_data *rdp = arg;
+ +
+ +      WARN_ON_ONCE(rdp->cpu != raw_smp_processor_id()); /* expected to run on the rdp's own CPU */
+ +      return __rcu_nocb_rdp_deoffload(rdp);
+ +}
+ +
+ +int rcu_nocb_cpu_deoffload(int cpu) /* 0 on success or if @cpu is not offloaded, else an error */
+ +{
+ +      struct rcu_data *rdp = per_cpu_ptr(&rcu_data, cpu);
+ +      int ret = 0;
+ +
+ +      if (rdp == rdp->nocb_gp_rdp) { /* rdp is its own GP leader: refused for now */
+ +              pr_info("Can't deoffload an rdp GP leader (yet)\n");
+ +              return -EINVAL;
+ +      }
+ +      mutex_lock(&rcu_state.barrier_mutex);
+ +      cpus_read_lock();
+ +      if (rcu_segcblist_is_offloaded(&rdp->cblist)) { /* otherwise nothing to do, ret stays 0 */
+ +              if (cpu_online(cpu)) /* online: run the de-offload on @cpu itself */
+ +                      ret = work_on_cpu(cpu, rcu_nocb_rdp_deoffload, rdp);
+ +              else /* offline: call the helper directly from the current CPU */
+ +                      ret = __rcu_nocb_rdp_deoffload(rdp);
+ +              if (!ret) /* success: drop @cpu from rcu_nocb_mask */
+ +                      cpumask_clear_cpu(cpu, rcu_nocb_mask);
+ +      }
+ +      cpus_read_unlock();
+ +      mutex_unlock(&rcu_state.barrier_mutex);
+ +
+ +      return ret;
+ +}
+ +EXPORT_SYMBOL_GPL(rcu_nocb_cpu_deoffload);
+ +
+ +static int __rcu_nocb_rdp_offload(struct rcu_data *rdp) /* -EINVAL or rdp_offload_toggle()'s result */
+ +{
+ +      struct rcu_segcblist *cblist = &rdp->cblist;
+ +      unsigned long flags;
+ +      int ret;
+ +
+ +      /*
+ +       * For now we only support re-offload, i.e. the rdp must have been
+ +       * offloaded on boot first.
+ +       */
+ +      if (!rdp->nocb_gp_rdp)
+ +              return -EINVAL;
+ +
+ +      pr_info("Offloading %d\n", rdp->cpu);
+ +      /*
+ +       * Can't use rcu_nocb_lock_irqsave() while we are in
+ +       * SEGCBLIST_SOFTIRQ_ONLY mode.
+ +       */
+ +      raw_spin_lock_irqsave(&rdp->nocb_lock, flags);
+ +      /* Re-enable nocb timer */
+ +      WRITE_ONCE(rdp->nocb_defer_wakeup, RCU_NOCB_WAKE_NOT);
+ +      /*
+ +       * We didn't take the nocb lock while working on the
+ +       * rdp->cblist in SEGCBLIST_SOFTIRQ_ONLY mode.
+ +       * Every modification previously made to
+ +       * rdp->cblist must be visible remotely to the nocb kthreads
+ +       * upon wake-up, after they read the cblist flags.
+ +       *
+ +       * The layout against nocb_lock enforces that ordering:
+ +       *
+ +       *  __rcu_nocb_rdp_offload()   nocb_cb_wait()/nocb_gp_wait()
+ +       * -------------------------   ----------------------------
+ +       *      WRITE callbacks           rcu_nocb_lock()
+ +       *      rcu_nocb_lock()           READ flags
+ +       *      WRITE flags               READ callbacks
+ +       *      rcu_nocb_unlock()         rcu_nocb_unlock()
+ +       */
+ +      ret = rdp_offload_toggle(rdp, true, flags); /* also releases rdp->nocb_lock */
+ +      swait_event_exclusive(rdp->nocb_state_wq,
+ +                            rcu_segcblist_test_flags(cblist, SEGCBLIST_KTHREAD_CB) &&
+ +                            rcu_segcblist_test_flags(cblist, SEGCBLIST_KTHREAD_GP));
+ +
+ +      return ret;
+ +}
+ +
+ +static long rcu_nocb_rdp_offload(void *arg) /* work_on_cpu() callback; @arg is the rdp */
+ +{
+ +      struct rcu_data *rdp = arg;
+ +
+ +      WARN_ON_ONCE(rdp->cpu != raw_smp_processor_id()); /* expected to run on the rdp's own CPU */
+ +      return __rcu_nocb_rdp_offload(rdp);
+ +}
+ +
+ +int rcu_nocb_cpu_offload(int cpu) /* 0 on success or if @cpu is already offloaded, else an error */
+ +{
+ +      struct rcu_data *rdp = per_cpu_ptr(&rcu_data, cpu);
+ +      int ret = 0;
+ +
+ +      mutex_lock(&rcu_state.barrier_mutex);
+ +      cpus_read_lock();
+ +      if (!rcu_segcblist_is_offloaded(&rdp->cblist)) { /* otherwise nothing to do, ret stays 0 */
+ +              if (cpu_online(cpu)) /* online: run the offload on @cpu itself */
+ +                      ret = work_on_cpu(cpu, rcu_nocb_rdp_offload, rdp);
+ +              else /* offline: call the helper directly from the current CPU */
+ +                      ret = __rcu_nocb_rdp_offload(rdp);
+ +              if (!ret) /* success: add @cpu to rcu_nocb_mask */
+ +                      cpumask_set_cpu(cpu, rcu_nocb_mask);
+ +      }
+ +      cpus_read_unlock();
+ +      mutex_unlock(&rcu_state.barrier_mutex);
+ +
+ +      return ret;
+ +}
+ +EXPORT_SYMBOL_GPL(rcu_nocb_cpu_offload);
+ +
   void __init rcu_init_nohz(void)
   {
         int cpu;
diff --cc kernel/sched/core.c
Simple merge
author	Linus Torvalds <torvalds@linux-foundation.org>
	Sun, 21 Feb 2021 20:35:04 +0000 (12:35 -0800)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Sun, 21 Feb 2021 20:35:04 +0000 (12:35 -0800)
		1	2
Documentation/admin-guide/kernel-parameters.txt	patch \|	diff1 \|	diff2 \|	blob \| history
arch/Kconfig	patch \|	diff1 \|	diff2 \|	blob \| history
arch/powerpc/platforms/cell/spufs/sched.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/Kconfig	patch \|	diff1 \|	diff2 \|	blob \| history
include/asm-generic/vmlinux.lds.h	patch \|	diff1 \|	diff2 \|	blob \| history
include/linux/rcupdate.h	patch \|	diff1 \|	diff2 \|	blob \| history
init/Kconfig	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/events/core.c	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/locking/rtmutex.c	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/rcu/tree.c	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/rcu/tree.h	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/rcu/tree_plugin.h	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/sched/core.c	patch \|	diff1 \|	diff2 \|	blob \| history