On Mon, Jun 15, 2026 at 09:55:16AM +0530, Vishal Chourasia wrote:
> On large idle systems, changing system-wide SMT level using the sysfs
> control interface still takes approximately 40-55 minutes. Changing SMT
> levels is an user triggered operation generally done when systems are
> fairly idle. This causes users to be blocked from doing other subsequent
> work.
> 
> Analyzing the collected profile data during SMT level switch, showed
> that CPU hotplug machinery was blocked on synchronize_rcu() calls.
> 
> Expedite RCU grace periods for the entire duration of triggered SMT
> switch operation via the sysfs control interface. Individual CPU hotplug
> operations via the online/offline interface are not affected.
> 
> On a PPC64 system with 400 CPUs:
> 
>   SMT8 to SMT1:
>     before:  1m14s
>     after:   3.2s   (~23x faster)
> 
>   SMT1 to SMT8:
>     before:  2m27s
>     after:   2.5s   (~58x faster)
> 
> On a large config system with 1920 CPUs, completion time improves from
> ~1 hour to 5-6 minutes.
> 
> Tested-by: Samir <[email protected]>
> Reviewed-by: Shrikanth Hegde <[email protected]>
> Signed-off-by: Vishal Chourasia <[email protected]>

>From an RCU viewpoint:

Reviewed-by: Paul E. McKenney <[email protected]>

I am guessing that you will be taking this up some other path, but if
you would like it to to via RCU, please let me know.

                                                        Thanx, Paul

> ---
>  include/linux/rcupdate.h | 8 ++++++++
>  kernel/cpu.c             | 4 ++++
>  kernel/rcu/rcu.h         | 4 ----
>  3 files changed, 12 insertions(+), 4 deletions(-)
> 
> diff --git a/include/linux/rcupdate.h b/include/linux/rcupdate.h
> index bfa765132de8..b6bccf131f1c 100644
> --- a/include/linux/rcupdate.h
> +++ b/include/linux/rcupdate.h
> @@ -1178,6 +1178,14 @@ rcu_head_after_call_rcu(struct rcu_head *rhp, 
> rcu_callback_t f)
>  extern int rcu_expedited;
>  extern int rcu_normal;
>  
> +#ifdef CONFIG_TINY_RCU
> +static inline void rcu_expedite_gp(void) { }
> +static inline void rcu_unexpedite_gp(void) { }
> +#else
> +void rcu_expedite_gp(void);
> +void rcu_unexpedite_gp(void);
> +#endif
> +
>  DEFINE_LOCK_GUARD_0(rcu, rcu_read_lock(), rcu_read_unlock())
>  DECLARE_LOCK_GUARD_0_ATTRS(rcu, __acquires_shared(RCU), 
> __releases_shared(RCU))
>  
> diff --git a/kernel/cpu.c b/kernel/cpu.c
> index bc4f7a9ba64e..6351da9dffdc 100644
> --- a/kernel/cpu.c
> +++ b/kernel/cpu.c
> @@ -2658,6 +2658,7 @@ int cpuhp_smt_disable(enum cpuhp_smt_control ctrlval)
>       int cpu, ret = 0;
>  
>       cpu_maps_update_begin();
> +     rcu_expedite_gp();
>       for_each_online_cpu(cpu) {
>               if (topology_is_primary_thread(cpu))
>                       continue;
> @@ -2687,6 +2688,7 @@ int cpuhp_smt_disable(enum cpuhp_smt_control ctrlval)
>       }
>       if (!ret)
>               cpu_smt_control = ctrlval;
> +     rcu_unexpedite_gp();
>       cpu_maps_update_done();
>       return ret;
>  }
> @@ -2704,6 +2706,7 @@ int cpuhp_smt_enable(void)
>       int cpu, ret = 0;
>  
>       cpu_maps_update_begin();
> +     rcu_expedite_gp();
>       cpu_smt_control = CPU_SMT_ENABLED;
>       for_each_present_cpu(cpu) {
>               /* Skip online CPUs and CPUs on offline nodes */
> @@ -2717,6 +2720,7 @@ int cpuhp_smt_enable(void)
>               /* See comment in cpuhp_smt_disable() */
>               cpuhp_online_cpu_device(cpu);
>       }
> +     rcu_unexpedite_gp();
>       cpu_maps_update_done();
>       return ret;
>  }
> diff --git a/kernel/rcu/rcu.h b/kernel/rcu/rcu.h
> index fa6d30ce73d1..d6a63ee60bc0 100644
> --- a/kernel/rcu/rcu.h
> +++ b/kernel/rcu/rcu.h
> @@ -521,8 +521,6 @@ do {                                                      
>                 \
>  static inline bool rcu_gp_is_normal(void) { return true; }
>  static inline bool rcu_gp_is_expedited(void) { return false; }
>  static inline bool rcu_async_should_hurry(void) { return false; }
> -static inline void rcu_expedite_gp(void) { }
> -static inline void rcu_unexpedite_gp(void) { }
>  static inline void rcu_async_hurry(void) { }
>  static inline void rcu_async_relax(void) { }
>  static inline bool rcu_cpu_online(int cpu) { return true; }
> @@ -530,8 +528,6 @@ static inline bool rcu_cpu_online(int cpu) { return true; 
> }
>  bool rcu_gp_is_normal(void);     /* Internal RCU use. */
>  bool rcu_gp_is_expedited(void);  /* Internal RCU use. */
>  bool rcu_async_should_hurry(void);  /* Internal RCU use. */
> -void rcu_expedite_gp(void);
> -void rcu_unexpedite_gp(void);
>  void rcu_async_hurry(void);
>  void rcu_async_relax(void);
>  void rcupdate_announce_bootup_oddness(void);
> -- 
> 2.54.0
> 

Reply via email to