110462d6fSPaul E. McKenney // SPDX-License-Identifier: GPL-2.0+ 210462d6fSPaul E. McKenney /* 310462d6fSPaul E. McKenney * RCU CPU stall warnings for normal RCU grace periods 410462d6fSPaul E. McKenney * 510462d6fSPaul E. McKenney * Copyright IBM Corporation, 2019 610462d6fSPaul E. McKenney * 710462d6fSPaul E. McKenney * Author: Paul E. McKenney <paulmck@linux.ibm.com> 810462d6fSPaul E. McKenney */ 910462d6fSPaul E. McKenney 10e23344c2SPaul E. McKenney ////////////////////////////////////////////////////////////////////////////// 11e23344c2SPaul E. McKenney // 12e23344c2SPaul E. McKenney // Controlling CPU stall warnings, including delay calculation. 1310462d6fSPaul E. McKenney 1432255d51SPaul E. McKenney /* panic() on RCU Stall sysctl. */ 1532255d51SPaul E. McKenney int sysctl_panic_on_rcu_stall __read_mostly; 1632255d51SPaul E. McKenney 1710462d6fSPaul E. McKenney #ifdef CONFIG_PROVE_RCU 1810462d6fSPaul E. McKenney #define RCU_STALL_DELAY_DELTA (5 * HZ) 1910462d6fSPaul E. McKenney #else 2010462d6fSPaul E. McKenney #define RCU_STALL_DELAY_DELTA 0 2110462d6fSPaul E. McKenney #endif 2210462d6fSPaul E. McKenney 23e23344c2SPaul E. McKenney /* Limit-check stall timeouts specified at boottime and runtime. */ 2410462d6fSPaul E. McKenney int rcu_jiffies_till_stall_check(void) 2510462d6fSPaul E. McKenney { 2610462d6fSPaul E. McKenney int till_stall_check = READ_ONCE(rcu_cpu_stall_timeout); 2710462d6fSPaul E. McKenney 2810462d6fSPaul E. McKenney /* 2910462d6fSPaul E. McKenney * Limit check must be consistent with the Kconfig limits 3010462d6fSPaul E. McKenney * for CONFIG_RCU_CPU_STALL_TIMEOUT. 3110462d6fSPaul E. McKenney */ 3210462d6fSPaul E. McKenney if (till_stall_check < 3) { 3310462d6fSPaul E. McKenney WRITE_ONCE(rcu_cpu_stall_timeout, 3); 3410462d6fSPaul E. McKenney till_stall_check = 3; 3510462d6fSPaul E. McKenney } else if (till_stall_check > 300) { 3610462d6fSPaul E. McKenney WRITE_ONCE(rcu_cpu_stall_timeout, 300); 3710462d6fSPaul E. McKenney till_stall_check = 300; 3810462d6fSPaul E. McKenney } 3910462d6fSPaul E. McKenney return till_stall_check * HZ + RCU_STALL_DELAY_DELTA; 4010462d6fSPaul E. McKenney } 4110462d6fSPaul E. McKenney EXPORT_SYMBOL_GPL(rcu_jiffies_till_stall_check); 4210462d6fSPaul E. McKenney 43e23344c2SPaul E. McKenney /* Don't do RCU CPU stall warnings during long sysrq printouts. */ 4410462d6fSPaul E. McKenney void rcu_sysrq_start(void) 4510462d6fSPaul E. McKenney { 4610462d6fSPaul E. McKenney if (!rcu_cpu_stall_suppress) 4710462d6fSPaul E. McKenney rcu_cpu_stall_suppress = 2; 4810462d6fSPaul E. McKenney } 4910462d6fSPaul E. McKenney 5010462d6fSPaul E. McKenney void rcu_sysrq_end(void) 5110462d6fSPaul E. McKenney { 5210462d6fSPaul E. McKenney if (rcu_cpu_stall_suppress == 2) 5310462d6fSPaul E. McKenney rcu_cpu_stall_suppress = 0; 5410462d6fSPaul E. McKenney } 5510462d6fSPaul E. McKenney 56e23344c2SPaul E. McKenney /* Don't print RCU CPU stall warnings during a kernel panic. */ 5710462d6fSPaul E. McKenney static int rcu_panic(struct notifier_block *this, unsigned long ev, void *ptr) 5810462d6fSPaul E. McKenney { 5910462d6fSPaul E. McKenney rcu_cpu_stall_suppress = 1; 6010462d6fSPaul E. McKenney return NOTIFY_DONE; 6110462d6fSPaul E. McKenney } 6210462d6fSPaul E. McKenney 6310462d6fSPaul E. McKenney static struct notifier_block rcu_panic_block = { 6410462d6fSPaul E. McKenney .notifier_call = rcu_panic, 6510462d6fSPaul E. McKenney }; 6610462d6fSPaul E. McKenney 6710462d6fSPaul E. McKenney static int __init check_cpu_stall_init(void) 6810462d6fSPaul E. McKenney { 6910462d6fSPaul E. McKenney atomic_notifier_chain_register(&panic_notifier_list, &rcu_panic_block); 7010462d6fSPaul E. McKenney return 0; 7110462d6fSPaul E. McKenney } 7210462d6fSPaul E. McKenney early_initcall(check_cpu_stall_init); 733fc3d170SPaul E. McKenney 74e23344c2SPaul E. McKenney /* If so specified via sysctl, panic, yielding cleaner stall-warning output. */ 75e23344c2SPaul E. McKenney static void panic_on_rcu_stall(void) 76e23344c2SPaul E. McKenney { 77e23344c2SPaul E. McKenney if (sysctl_panic_on_rcu_stall) 78e23344c2SPaul E. McKenney panic("RCU Stall\n"); 79e23344c2SPaul E. McKenney } 80e23344c2SPaul E. McKenney 81e23344c2SPaul E. McKenney /** 82e23344c2SPaul E. McKenney * rcu_cpu_stall_reset - prevent further stall warnings in current grace period 83e23344c2SPaul E. McKenney * 84e23344c2SPaul E. McKenney * Set the stall-warning timeout way off into the future, thus preventing 85e23344c2SPaul E. McKenney * any RCU CPU stall-warning messages from appearing in the current set of 86e23344c2SPaul E. McKenney * RCU grace periods. 87e23344c2SPaul E. McKenney * 88e23344c2SPaul E. McKenney * The caller must disable hard irqs. 89e23344c2SPaul E. McKenney */ 90e23344c2SPaul E. McKenney void rcu_cpu_stall_reset(void) 91e23344c2SPaul E. McKenney { 92e23344c2SPaul E. McKenney WRITE_ONCE(rcu_state.jiffies_stall, jiffies + ULONG_MAX / 2); 93e23344c2SPaul E. McKenney } 94e23344c2SPaul E. McKenney 95e23344c2SPaul E. McKenney ////////////////////////////////////////////////////////////////////////////// 96e23344c2SPaul E. McKenney // 97e23344c2SPaul E. McKenney // Interaction with RCU grace periods 98e23344c2SPaul E. McKenney 99e23344c2SPaul E. McKenney /* Start of new grace period, so record stall time (and forcing times). */ 100e23344c2SPaul E. McKenney static void record_gp_stall_check_time(void) 101e23344c2SPaul E. McKenney { 102e23344c2SPaul E. McKenney unsigned long j = jiffies; 103e23344c2SPaul E. McKenney unsigned long j1; 104e23344c2SPaul E. McKenney 10559881bcdSPaul E. McKenney WRITE_ONCE(rcu_state.gp_start, j); 106e23344c2SPaul E. McKenney j1 = rcu_jiffies_till_stall_check(); 107e23344c2SPaul E. McKenney /* Record ->gp_start before ->jiffies_stall. */ 108e23344c2SPaul E. McKenney smp_store_release(&rcu_state.jiffies_stall, j + j1); /* ^^^ */ 109e23344c2SPaul E. McKenney rcu_state.jiffies_resched = j + j1 / 2; 110e23344c2SPaul E. McKenney rcu_state.n_force_qs_gpstart = READ_ONCE(rcu_state.n_force_qs); 111e23344c2SPaul E. McKenney } 112e23344c2SPaul E. McKenney 113e23344c2SPaul E. McKenney /* Zero ->ticks_this_gp and snapshot the number of RCU softirq handlers. */ 114e23344c2SPaul E. McKenney static void zero_cpu_stall_ticks(struct rcu_data *rdp) 115e23344c2SPaul E. McKenney { 116e23344c2SPaul E. McKenney rdp->ticks_this_gp = 0; 117e23344c2SPaul E. McKenney rdp->softirq_snap = kstat_softirqs_cpu(RCU_SOFTIRQ, smp_processor_id()); 118e23344c2SPaul E. McKenney WRITE_ONCE(rdp->last_fqs_resched, jiffies); 119e23344c2SPaul E. McKenney } 120e23344c2SPaul E. McKenney 121e23344c2SPaul E. McKenney /* 122e23344c2SPaul E. McKenney * If too much time has passed in the current grace period, and if 123e23344c2SPaul E. McKenney * so configured, go kick the relevant kthreads. 124e23344c2SPaul E. McKenney */ 125e23344c2SPaul E. McKenney static void rcu_stall_kick_kthreads(void) 126e23344c2SPaul E. McKenney { 127e23344c2SPaul E. McKenney unsigned long j; 128e23344c2SPaul E. McKenney 129e23344c2SPaul E. McKenney if (!rcu_kick_kthreads) 130e23344c2SPaul E. McKenney return; 131e23344c2SPaul E. McKenney j = READ_ONCE(rcu_state.jiffies_kick_kthreads); 132e23344c2SPaul E. McKenney if (time_after(jiffies, j) && rcu_state.gp_kthread && 133e23344c2SPaul E. McKenney (rcu_gp_in_progress() || READ_ONCE(rcu_state.gp_flags))) { 134e23344c2SPaul E. McKenney WARN_ONCE(1, "Kicking %s grace-period kthread\n", 135e23344c2SPaul E. McKenney rcu_state.name); 136e23344c2SPaul E. McKenney rcu_ftrace_dump(DUMP_ALL); 137e23344c2SPaul E. McKenney wake_up_process(rcu_state.gp_kthread); 138e23344c2SPaul E. McKenney WRITE_ONCE(rcu_state.jiffies_kick_kthreads, j + HZ); 139e23344c2SPaul E. McKenney } 140e23344c2SPaul E. McKenney } 141e23344c2SPaul E. McKenney 1427ac1907cSPaul E. McKenney /* 1437ac1907cSPaul E. McKenney * Handler for the irq_work request posted about halfway into the RCU CPU 1447ac1907cSPaul E. McKenney * stall timeout, and used to detect excessive irq disabling. Set state 1457ac1907cSPaul E. McKenney * appropriately, but just complain if there is unexpected state on entry. 1467ac1907cSPaul E. McKenney */ 1477ac1907cSPaul E. McKenney static void rcu_iw_handler(struct irq_work *iwp) 1487ac1907cSPaul E. McKenney { 1497ac1907cSPaul E. McKenney struct rcu_data *rdp; 1507ac1907cSPaul E. McKenney struct rcu_node *rnp; 1517ac1907cSPaul E. McKenney 1527ac1907cSPaul E. McKenney rdp = container_of(iwp, struct rcu_data, rcu_iw); 1537ac1907cSPaul E. McKenney rnp = rdp->mynode; 1547ac1907cSPaul E. McKenney raw_spin_lock_rcu_node(rnp); 1557ac1907cSPaul E. McKenney if (!WARN_ON_ONCE(!rdp->rcu_iw_pending)) { 1567ac1907cSPaul E. McKenney rdp->rcu_iw_gp_seq = rnp->gp_seq; 1577ac1907cSPaul E. McKenney rdp->rcu_iw_pending = false; 1587ac1907cSPaul E. McKenney } 1597ac1907cSPaul E. McKenney raw_spin_unlock_rcu_node(rnp); 1607ac1907cSPaul E. McKenney } 1617ac1907cSPaul E. McKenney 162e23344c2SPaul E. McKenney ////////////////////////////////////////////////////////////////////////////// 163e23344c2SPaul E. McKenney // 164e23344c2SPaul E. McKenney // Printing RCU CPU stall warnings 165e23344c2SPaul E. McKenney 166c130d2dcSLai Jiangshan #ifdef CONFIG_PREEMPT_RCU 1673fc3d170SPaul E. McKenney 1683fc3d170SPaul E. McKenney /* 1693fc3d170SPaul E. McKenney * Dump detailed information for all tasks blocking the current RCU 1703fc3d170SPaul E. McKenney * grace period on the specified rcu_node structure. 1713fc3d170SPaul E. McKenney */ 1723fc3d170SPaul E. McKenney static void rcu_print_detail_task_stall_rnp(struct rcu_node *rnp) 1733fc3d170SPaul E. McKenney { 1743fc3d170SPaul E. McKenney unsigned long flags; 1753fc3d170SPaul E. McKenney struct task_struct *t; 1763fc3d170SPaul E. McKenney 1773fc3d170SPaul E. McKenney raw_spin_lock_irqsave_rcu_node(rnp, flags); 1783fc3d170SPaul E. McKenney if (!rcu_preempt_blocked_readers_cgp(rnp)) { 1793fc3d170SPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rnp, flags); 1803fc3d170SPaul E. McKenney return; 1813fc3d170SPaul E. McKenney } 1823fc3d170SPaul E. McKenney t = list_entry(rnp->gp_tasks->prev, 1833fc3d170SPaul E. McKenney struct task_struct, rcu_node_entry); 1843fc3d170SPaul E. McKenney list_for_each_entry_continue(t, &rnp->blkd_tasks, rcu_node_entry) { 1853fc3d170SPaul E. McKenney /* 1863fc3d170SPaul E. McKenney * We could be printing a lot while holding a spinlock. 1873fc3d170SPaul E. McKenney * Avoid triggering hard lockup. 1883fc3d170SPaul E. McKenney */ 1893fc3d170SPaul E. McKenney touch_nmi_watchdog(); 1903fc3d170SPaul E. McKenney sched_show_task(t); 1913fc3d170SPaul E. McKenney } 1923fc3d170SPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rnp, flags); 1933fc3d170SPaul E. McKenney } 1943fc3d170SPaul E. McKenney 1953fc3d170SPaul E. McKenney /* 1963fc3d170SPaul E. McKenney * Scan the current list of tasks blocked within RCU read-side critical 1973fc3d170SPaul E. McKenney * sections, printing out the tid of each. 1983fc3d170SPaul E. McKenney */ 1993fc3d170SPaul E. McKenney static int rcu_print_task_stall(struct rcu_node *rnp) 2003fc3d170SPaul E. McKenney { 2013fc3d170SPaul E. McKenney struct task_struct *t; 2023fc3d170SPaul E. McKenney int ndetected = 0; 2033fc3d170SPaul E. McKenney 2043fc3d170SPaul E. McKenney if (!rcu_preempt_blocked_readers_cgp(rnp)) 2053fc3d170SPaul E. McKenney return 0; 20621d0d79aSPaul E. McKenney pr_err("\tTasks blocked on level-%d rcu_node (CPUs %d-%d):", 20721d0d79aSPaul E. McKenney rnp->level, rnp->grplo, rnp->grphi); 2083fc3d170SPaul E. McKenney t = list_entry(rnp->gp_tasks->prev, 2093fc3d170SPaul E. McKenney struct task_struct, rcu_node_entry); 2103fc3d170SPaul E. McKenney list_for_each_entry_continue(t, &rnp->blkd_tasks, rcu_node_entry) { 2113fc3d170SPaul E. McKenney pr_cont(" P%d", t->pid); 2123fc3d170SPaul E. McKenney ndetected++; 2133fc3d170SPaul E. McKenney } 21421d0d79aSPaul E. McKenney pr_cont("\n"); 2153fc3d170SPaul E. McKenney return ndetected; 2163fc3d170SPaul E. McKenney } 2173fc3d170SPaul E. McKenney 218c130d2dcSLai Jiangshan #else /* #ifdef CONFIG_PREEMPT_RCU */ 2193fc3d170SPaul E. McKenney 2203fc3d170SPaul E. McKenney /* 2213fc3d170SPaul E. McKenney * Because preemptible RCU does not exist, we never have to check for 2223fc3d170SPaul E. McKenney * tasks blocked within RCU read-side critical sections. 2233fc3d170SPaul E. McKenney */ 22421d0d79aSPaul E. McKenney static void rcu_print_detail_task_stall_rnp(struct rcu_node *rnp) 2253fc3d170SPaul E. McKenney { 2263fc3d170SPaul E. McKenney } 2273fc3d170SPaul E. McKenney 2283fc3d170SPaul E. McKenney /* 2293fc3d170SPaul E. McKenney * Because preemptible RCU does not exist, we never have to check for 2303fc3d170SPaul E. McKenney * tasks blocked within RCU read-side critical sections. 2313fc3d170SPaul E. McKenney */ 2323fc3d170SPaul E. McKenney static int rcu_print_task_stall(struct rcu_node *rnp) 2333fc3d170SPaul E. McKenney { 2343fc3d170SPaul E. McKenney return 0; 2353fc3d170SPaul E. McKenney } 236c130d2dcSLai Jiangshan #endif /* #else #ifdef CONFIG_PREEMPT_RCU */ 23732255d51SPaul E. McKenney 23832255d51SPaul E. McKenney /* 23932255d51SPaul E. McKenney * Dump stacks of all tasks running on stalled CPUs. First try using 24032255d51SPaul E. McKenney * NMIs, but fall back to manual remote stack tracing on architectures 24132255d51SPaul E. McKenney * that don't support NMI-based stack dumps. The NMI-triggered stack 24232255d51SPaul E. McKenney * traces are more accurate because they are printed by the target CPU. 24332255d51SPaul E. McKenney */ 24432255d51SPaul E. McKenney static void rcu_dump_cpu_stacks(void) 24532255d51SPaul E. McKenney { 24632255d51SPaul E. McKenney int cpu; 24732255d51SPaul E. McKenney unsigned long flags; 24832255d51SPaul E. McKenney struct rcu_node *rnp; 24932255d51SPaul E. McKenney 25032255d51SPaul E. McKenney rcu_for_each_leaf_node(rnp) { 25132255d51SPaul E. McKenney raw_spin_lock_irqsave_rcu_node(rnp, flags); 25232255d51SPaul E. McKenney for_each_leaf_node_possible_cpu(rnp, cpu) 25332255d51SPaul E. McKenney if (rnp->qsmask & leaf_node_cpu_bit(rnp, cpu)) 25432255d51SPaul E. McKenney if (!trigger_single_cpu_backtrace(cpu)) 25532255d51SPaul E. McKenney dump_cpu_task(cpu); 25632255d51SPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rnp, flags); 25732255d51SPaul E. McKenney } 25832255d51SPaul E. McKenney } 25932255d51SPaul E. McKenney 26059b73a27SPaul E. McKenney #ifdef CONFIG_RCU_FAST_NO_HZ 26159b73a27SPaul E. McKenney 26259b73a27SPaul E. McKenney static void print_cpu_stall_fast_no_hz(char *cp, int cpu) 26359b73a27SPaul E. McKenney { 26459b73a27SPaul E. McKenney struct rcu_data *rdp = &per_cpu(rcu_data, cpu); 26559b73a27SPaul E. McKenney 26677a40f97SJoel Fernandes (Google) sprintf(cp, "last_accelerate: %04lx/%04lx dyntick_enabled: %d", 26759b73a27SPaul E. McKenney rdp->last_accelerate & 0xffff, jiffies & 0xffff, 26877a40f97SJoel Fernandes (Google) !!rdp->tick_nohz_enabled_snap); 26959b73a27SPaul E. McKenney } 27059b73a27SPaul E. McKenney 27159b73a27SPaul E. McKenney #else /* #ifdef CONFIG_RCU_FAST_NO_HZ */ 27259b73a27SPaul E. McKenney 27359b73a27SPaul E. McKenney static void print_cpu_stall_fast_no_hz(char *cp, int cpu) 27459b73a27SPaul E. McKenney { 27559b73a27SPaul E. McKenney *cp = '\0'; 27659b73a27SPaul E. McKenney } 27759b73a27SPaul E. McKenney 27859b73a27SPaul E. McKenney #endif /* #else #ifdef CONFIG_RCU_FAST_NO_HZ */ 27959b73a27SPaul E. McKenney 280e2167b38SLai Jiangshan static const char * const gp_state_names[] = { 281e2167b38SLai Jiangshan [RCU_GP_IDLE] = "RCU_GP_IDLE", 282e2167b38SLai Jiangshan [RCU_GP_WAIT_GPS] = "RCU_GP_WAIT_GPS", 283e2167b38SLai Jiangshan [RCU_GP_DONE_GPS] = "RCU_GP_DONE_GPS", 284e2167b38SLai Jiangshan [RCU_GP_ONOFF] = "RCU_GP_ONOFF", 285e2167b38SLai Jiangshan [RCU_GP_INIT] = "RCU_GP_INIT", 286e2167b38SLai Jiangshan [RCU_GP_WAIT_FQS] = "RCU_GP_WAIT_FQS", 287e2167b38SLai Jiangshan [RCU_GP_DOING_FQS] = "RCU_GP_DOING_FQS", 288e2167b38SLai Jiangshan [RCU_GP_CLEANUP] = "RCU_GP_CLEANUP", 289e2167b38SLai Jiangshan [RCU_GP_CLEANED] = "RCU_GP_CLEANED", 290e2167b38SLai Jiangshan }; 291e2167b38SLai Jiangshan 292e2167b38SLai Jiangshan /* 293e2167b38SLai Jiangshan * Convert a ->gp_state value to a character string. 294e2167b38SLai Jiangshan */ 295e2167b38SLai Jiangshan static const char *gp_state_getname(short gs) 296e2167b38SLai Jiangshan { 297e2167b38SLai Jiangshan if (gs < 0 || gs >= ARRAY_SIZE(gp_state_names)) 298e2167b38SLai Jiangshan return "???"; 299e2167b38SLai Jiangshan return gp_state_names[gs]; 300e2167b38SLai Jiangshan } 301e2167b38SLai Jiangshan 302*88375825SPaul E. McKenney /* Is the RCU grace-period kthread being starved of CPU time? */ 303*88375825SPaul E. McKenney static bool rcu_is_gp_kthread_starving(unsigned long *jp) 304*88375825SPaul E. McKenney { 305*88375825SPaul E. McKenney unsigned long j = jiffies - READ_ONCE(rcu_state.gp_activity); 306*88375825SPaul E. McKenney 307*88375825SPaul E. McKenney if (jp) 308*88375825SPaul E. McKenney *jp = j; 309*88375825SPaul E. McKenney return j > 2 * HZ; 310*88375825SPaul E. McKenney } 311*88375825SPaul E. McKenney 31259b73a27SPaul E. McKenney /* 31359b73a27SPaul E. McKenney * Print out diagnostic information for the specified stalled CPU. 31459b73a27SPaul E. McKenney * 31559b73a27SPaul E. McKenney * If the specified CPU is aware of the current RCU grace period, then 31659b73a27SPaul E. McKenney * print the number of scheduling clock interrupts the CPU has taken 31759b73a27SPaul E. McKenney * during the time that it has been aware. Otherwise, print the number 31859b73a27SPaul E. McKenney * of RCU grace periods that this CPU is ignorant of, for example, "1" 31959b73a27SPaul E. McKenney * if the CPU was aware of the previous grace period. 32059b73a27SPaul E. McKenney * 32159b73a27SPaul E. McKenney * Also print out idle and (if CONFIG_RCU_FAST_NO_HZ) idle-entry info. 32259b73a27SPaul E. McKenney */ 32359b73a27SPaul E. McKenney static void print_cpu_stall_info(int cpu) 32459b73a27SPaul E. McKenney { 32559b73a27SPaul E. McKenney unsigned long delta; 326*88375825SPaul E. McKenney bool falsepositive; 32759b73a27SPaul E. McKenney char fast_no_hz[72]; 32859b73a27SPaul E. McKenney struct rcu_data *rdp = per_cpu_ptr(&rcu_data, cpu); 32959b73a27SPaul E. McKenney char *ticks_title; 33059b73a27SPaul E. McKenney unsigned long ticks_value; 33159b73a27SPaul E. McKenney 33259b73a27SPaul E. McKenney /* 33359b73a27SPaul E. McKenney * We could be printing a lot while holding a spinlock. Avoid 33459b73a27SPaul E. McKenney * triggering hard lockup. 33559b73a27SPaul E. McKenney */ 33659b73a27SPaul E. McKenney touch_nmi_watchdog(); 33759b73a27SPaul E. McKenney 33859b73a27SPaul E. McKenney ticks_value = rcu_seq_ctr(rcu_state.gp_seq - rdp->gp_seq); 33959b73a27SPaul E. McKenney if (ticks_value) { 34059b73a27SPaul E. McKenney ticks_title = "GPs behind"; 34159b73a27SPaul E. McKenney } else { 34259b73a27SPaul E. McKenney ticks_title = "ticks this GP"; 34359b73a27SPaul E. McKenney ticks_value = rdp->ticks_this_gp; 34459b73a27SPaul E. McKenney } 34559b73a27SPaul E. McKenney print_cpu_stall_fast_no_hz(fast_no_hz, cpu); 34659b73a27SPaul E. McKenney delta = rcu_seq_ctr(rdp->mynode->gp_seq - rdp->rcu_iw_gp_seq); 347*88375825SPaul E. McKenney falsepositive = rcu_is_gp_kthread_starving(NULL) && 348*88375825SPaul E. McKenney rcu_dynticks_in_eqs(rcu_dynticks_snap(rdp)); 349*88375825SPaul E. McKenney pr_err("\t%d-%c%c%c%c: (%lu %s) idle=%03x/%ld/%#lx softirq=%u/%u fqs=%ld %s%s\n", 35059b73a27SPaul E. McKenney cpu, 35159b73a27SPaul E. McKenney "O."[!!cpu_online(cpu)], 35259b73a27SPaul E. McKenney "o."[!!(rdp->grpmask & rdp->mynode->qsmaskinit)], 35359b73a27SPaul E. McKenney "N."[!!(rdp->grpmask & rdp->mynode->qsmaskinitnext)], 35459b73a27SPaul E. McKenney !IS_ENABLED(CONFIG_IRQ_WORK) ? '?' : 35559b73a27SPaul E. McKenney rdp->rcu_iw_pending ? (int)min(delta, 9UL) + '0' : 35659b73a27SPaul E. McKenney "!."[!delta], 35759b73a27SPaul E. McKenney ticks_value, ticks_title, 35859b73a27SPaul E. McKenney rcu_dynticks_snap(rdp) & 0xfff, 35959b73a27SPaul E. McKenney rdp->dynticks_nesting, rdp->dynticks_nmi_nesting, 36059b73a27SPaul E. McKenney rdp->softirq_snap, kstat_softirqs_cpu(RCU_SOFTIRQ, cpu), 361*88375825SPaul E. McKenney data_race(rcu_state.n_force_qs) - rcu_state.n_force_qs_gpstart, 362*88375825SPaul E. McKenney fast_no_hz, 363*88375825SPaul E. McKenney falsepositive ? " (false positive?)" : ""); 36459b73a27SPaul E. McKenney } 36559b73a27SPaul E. McKenney 366e23344c2SPaul E. McKenney /* Complain about starvation of grace-period kthread. */ 367e23344c2SPaul E. McKenney static void rcu_check_gp_kthread_starvation(void) 36859b73a27SPaul E. McKenney { 369e23344c2SPaul E. McKenney struct task_struct *gpk = rcu_state.gp_kthread; 370e23344c2SPaul E. McKenney unsigned long j; 371e23344c2SPaul E. McKenney 372*88375825SPaul E. McKenney if (rcu_is_gp_kthread_starving(&j)) { 373e23344c2SPaul E. McKenney pr_err("%s kthread starved for %ld jiffies! g%ld f%#x %s(%d) ->state=%#lx ->cpu=%d\n", 374e23344c2SPaul E. McKenney rcu_state.name, j, 375e23344c2SPaul E. McKenney (long)rcu_seq_current(&rcu_state.gp_seq), 376e23344c2SPaul E. McKenney READ_ONCE(rcu_state.gp_flags), 377e23344c2SPaul E. McKenney gp_state_getname(rcu_state.gp_state), rcu_state.gp_state, 378e23344c2SPaul E. McKenney gpk ? gpk->state : ~0, gpk ? task_cpu(gpk) : -1); 379e23344c2SPaul E. McKenney if (gpk) { 380*88375825SPaul E. McKenney pr_err("\tUnless %s kthread gets sufficient CPU time, OOM is now expected behavior.\n", rcu_state.name); 381e23344c2SPaul E. McKenney pr_err("RCU grace-period kthread stack dump:\n"); 382e23344c2SPaul E. McKenney sched_show_task(gpk); 383e23344c2SPaul E. McKenney wake_up_process(gpk); 384e23344c2SPaul E. McKenney } 385e23344c2SPaul E. McKenney } 38659b73a27SPaul E. McKenney } 38759b73a27SPaul E. McKenney 38832255d51SPaul E. McKenney static void print_other_cpu_stall(unsigned long gp_seq) 38932255d51SPaul E. McKenney { 39032255d51SPaul E. McKenney int cpu; 39132255d51SPaul E. McKenney unsigned long flags; 39232255d51SPaul E. McKenney unsigned long gpa; 39332255d51SPaul E. McKenney unsigned long j; 39432255d51SPaul E. McKenney int ndetected = 0; 39521d0d79aSPaul E. McKenney struct rcu_node *rnp; 39632255d51SPaul E. McKenney long totqlen = 0; 39732255d51SPaul E. McKenney 39832255d51SPaul E. McKenney /* Kick and suppress, if so configured. */ 39932255d51SPaul E. McKenney rcu_stall_kick_kthreads(); 40058c53360SPaul E. McKenney if (rcu_stall_is_suppressed()) 40132255d51SPaul E. McKenney return; 40232255d51SPaul E. McKenney 40332255d51SPaul E. McKenney /* 40432255d51SPaul E. McKenney * OK, time to rat on our buddy... 40532255d51SPaul E. McKenney * See Documentation/RCU/stallwarn.txt for info on how to debug 40632255d51SPaul E. McKenney * RCU CPU stall warnings. 40732255d51SPaul E. McKenney */ 40840e69ac7SPaul E. McKenney pr_err("INFO: %s detected stalls on CPUs/tasks:\n", rcu_state.name); 40932255d51SPaul E. McKenney rcu_for_each_leaf_node(rnp) { 41032255d51SPaul E. McKenney raw_spin_lock_irqsave_rcu_node(rnp, flags); 41132255d51SPaul E. McKenney ndetected += rcu_print_task_stall(rnp); 41232255d51SPaul E. McKenney if (rnp->qsmask != 0) { 41332255d51SPaul E. McKenney for_each_leaf_node_possible_cpu(rnp, cpu) 41432255d51SPaul E. McKenney if (rnp->qsmask & leaf_node_cpu_bit(rnp, cpu)) { 41532255d51SPaul E. McKenney print_cpu_stall_info(cpu); 41632255d51SPaul E. McKenney ndetected++; 41732255d51SPaul E. McKenney } 41832255d51SPaul E. McKenney } 41932255d51SPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rnp, flags); 42032255d51SPaul E. McKenney } 42132255d51SPaul E. McKenney 42232255d51SPaul E. McKenney for_each_possible_cpu(cpu) 42332255d51SPaul E. McKenney totqlen += rcu_get_n_cbs_cpu(cpu); 42440e69ac7SPaul E. McKenney pr_cont("\t(detected by %d, t=%ld jiffies, g=%ld, q=%lu)\n", 42532255d51SPaul E. McKenney smp_processor_id(), (long)(jiffies - rcu_state.gp_start), 42632255d51SPaul E. McKenney (long)rcu_seq_current(&rcu_state.gp_seq), totqlen); 42732255d51SPaul E. McKenney if (ndetected) { 42832255d51SPaul E. McKenney rcu_dump_cpu_stacks(); 42932255d51SPaul E. McKenney 43032255d51SPaul E. McKenney /* Complain about tasks blocking the grace period. */ 43121d0d79aSPaul E. McKenney rcu_for_each_leaf_node(rnp) 43221d0d79aSPaul E. McKenney rcu_print_detail_task_stall_rnp(rnp); 43332255d51SPaul E. McKenney } else { 43432255d51SPaul E. McKenney if (rcu_seq_current(&rcu_state.gp_seq) != gp_seq) { 43532255d51SPaul E. McKenney pr_err("INFO: Stall ended before state dump start\n"); 43632255d51SPaul E. McKenney } else { 43732255d51SPaul E. McKenney j = jiffies; 43832255d51SPaul E. McKenney gpa = READ_ONCE(rcu_state.gp_activity); 43932255d51SPaul E. McKenney pr_err("All QSes seen, last %s kthread activity %ld (%ld-%ld), jiffies_till_next_fqs=%ld, root ->qsmask %#lx\n", 44032255d51SPaul E. McKenney rcu_state.name, j - gpa, j, gpa, 44132255d51SPaul E. McKenney READ_ONCE(jiffies_till_next_fqs), 44232255d51SPaul E. McKenney rcu_get_root()->qsmask); 44332255d51SPaul E. McKenney /* In this case, the current CPU might be at fault. */ 44432255d51SPaul E. McKenney sched_show_task(current); 44532255d51SPaul E. McKenney } 44632255d51SPaul E. McKenney } 44732255d51SPaul E. McKenney /* Rewrite if needed in case of slow consoles. */ 44832255d51SPaul E. McKenney if (ULONG_CMP_GE(jiffies, READ_ONCE(rcu_state.jiffies_stall))) 44932255d51SPaul E. McKenney WRITE_ONCE(rcu_state.jiffies_stall, 45032255d51SPaul E. McKenney jiffies + 3 * rcu_jiffies_till_stall_check() + 3); 45132255d51SPaul E. McKenney 45232255d51SPaul E. McKenney rcu_check_gp_kthread_starvation(); 45332255d51SPaul E. McKenney 45432255d51SPaul E. McKenney panic_on_rcu_stall(); 45532255d51SPaul E. McKenney 45632255d51SPaul E. McKenney rcu_force_quiescent_state(); /* Kick them all. */ 45732255d51SPaul E. McKenney } 45832255d51SPaul E. McKenney 45932255d51SPaul E. McKenney static void print_cpu_stall(void) 46032255d51SPaul E. McKenney { 46132255d51SPaul E. McKenney int cpu; 46232255d51SPaul E. McKenney unsigned long flags; 46332255d51SPaul E. McKenney struct rcu_data *rdp = this_cpu_ptr(&rcu_data); 46432255d51SPaul E. McKenney struct rcu_node *rnp = rcu_get_root(); 46532255d51SPaul E. McKenney long totqlen = 0; 46632255d51SPaul E. McKenney 46732255d51SPaul E. McKenney /* Kick and suppress, if so configured. */ 46832255d51SPaul E. McKenney rcu_stall_kick_kthreads(); 46958c53360SPaul E. McKenney if (rcu_stall_is_suppressed()) 47032255d51SPaul E. McKenney return; 47132255d51SPaul E. McKenney 47232255d51SPaul E. McKenney /* 47332255d51SPaul E. McKenney * OK, time to rat on ourselves... 47432255d51SPaul E. McKenney * See Documentation/RCU/stallwarn.txt for info on how to debug 47532255d51SPaul E. McKenney * RCU CPU stall warnings. 47632255d51SPaul E. McKenney */ 47740e69ac7SPaul E. McKenney pr_err("INFO: %s self-detected stall on CPU\n", rcu_state.name); 47832255d51SPaul E. McKenney raw_spin_lock_irqsave_rcu_node(rdp->mynode, flags); 47932255d51SPaul E. McKenney print_cpu_stall_info(smp_processor_id()); 48032255d51SPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rdp->mynode, flags); 48132255d51SPaul E. McKenney for_each_possible_cpu(cpu) 48232255d51SPaul E. McKenney totqlen += rcu_get_n_cbs_cpu(cpu); 48340e69ac7SPaul E. McKenney pr_cont("\t(t=%lu jiffies g=%ld q=%lu)\n", 48432255d51SPaul E. McKenney jiffies - rcu_state.gp_start, 48532255d51SPaul E. McKenney (long)rcu_seq_current(&rcu_state.gp_seq), totqlen); 48632255d51SPaul E. McKenney 48732255d51SPaul E. McKenney rcu_check_gp_kthread_starvation(); 48832255d51SPaul E. McKenney 48932255d51SPaul E. McKenney rcu_dump_cpu_stacks(); 49032255d51SPaul E. McKenney 49132255d51SPaul E. McKenney raw_spin_lock_irqsave_rcu_node(rnp, flags); 49232255d51SPaul E. McKenney /* Rewrite if needed in case of slow consoles. */ 49332255d51SPaul E. McKenney if (ULONG_CMP_GE(jiffies, READ_ONCE(rcu_state.jiffies_stall))) 49432255d51SPaul E. McKenney WRITE_ONCE(rcu_state.jiffies_stall, 49532255d51SPaul E. McKenney jiffies + 3 * rcu_jiffies_till_stall_check() + 3); 49632255d51SPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rnp, flags); 49732255d51SPaul E. McKenney 49832255d51SPaul E. McKenney panic_on_rcu_stall(); 49932255d51SPaul E. McKenney 50032255d51SPaul E. McKenney /* 50132255d51SPaul E. McKenney * Attempt to revive the RCU machinery by forcing a context switch. 50232255d51SPaul E. McKenney * 50332255d51SPaul E. McKenney * A context switch would normally allow the RCU state machine to make 50432255d51SPaul E. McKenney * progress and it could be we're stuck in kernel space without context 50532255d51SPaul E. McKenney * switches for an entirely unreasonable amount of time. 50632255d51SPaul E. McKenney */ 50732255d51SPaul E. McKenney set_tsk_need_resched(current); 50832255d51SPaul E. McKenney set_preempt_need_resched(); 50932255d51SPaul E. McKenney } 51032255d51SPaul E. McKenney 51132255d51SPaul E. McKenney static void check_cpu_stall(struct rcu_data *rdp) 51232255d51SPaul E. McKenney { 51332255d51SPaul E. McKenney unsigned long gs1; 51432255d51SPaul E. McKenney unsigned long gs2; 51532255d51SPaul E. McKenney unsigned long gps; 51632255d51SPaul E. McKenney unsigned long j; 51732255d51SPaul E. McKenney unsigned long jn; 51832255d51SPaul E. McKenney unsigned long js; 51932255d51SPaul E. McKenney struct rcu_node *rnp; 52032255d51SPaul E. McKenney 52158c53360SPaul E. McKenney if ((rcu_stall_is_suppressed() && !rcu_kick_kthreads) || 52232255d51SPaul E. McKenney !rcu_gp_in_progress()) 52332255d51SPaul E. McKenney return; 52432255d51SPaul E. McKenney rcu_stall_kick_kthreads(); 52532255d51SPaul E. McKenney j = jiffies; 52632255d51SPaul E. McKenney 52732255d51SPaul E. McKenney /* 52832255d51SPaul E. McKenney * Lots of memory barriers to reject false positives. 52932255d51SPaul E. McKenney * 53032255d51SPaul E. McKenney * The idea is to pick up rcu_state.gp_seq, then 53132255d51SPaul E. McKenney * rcu_state.jiffies_stall, then rcu_state.gp_start, and finally 53232255d51SPaul E. McKenney * another copy of rcu_state.gp_seq. These values are updated in 53332255d51SPaul E. McKenney * the opposite order with memory barriers (or equivalent) during 53432255d51SPaul E. McKenney * grace-period initialization and cleanup. Now, a false positive 53532255d51SPaul E. McKenney * can occur if we get an new value of rcu_state.gp_start and a old 53632255d51SPaul E. McKenney * value of rcu_state.jiffies_stall. But given the memory barriers, 53732255d51SPaul E. McKenney * the only way that this can happen is if one grace period ends 53832255d51SPaul E. McKenney * and another starts between these two fetches. This is detected 53932255d51SPaul E. McKenney * by comparing the second fetch of rcu_state.gp_seq with the 54032255d51SPaul E. McKenney * previous fetch from rcu_state.gp_seq. 54132255d51SPaul E. McKenney * 54232255d51SPaul E. McKenney * Given this check, comparisons of jiffies, rcu_state.jiffies_stall, 54332255d51SPaul E. McKenney * and rcu_state.gp_start suffice to forestall false positives. 54432255d51SPaul E. McKenney */ 54532255d51SPaul E. McKenney gs1 = READ_ONCE(rcu_state.gp_seq); 54632255d51SPaul E. McKenney smp_rmb(); /* Pick up ->gp_seq first... */ 54732255d51SPaul E. McKenney js = READ_ONCE(rcu_state.jiffies_stall); 54832255d51SPaul E. McKenney smp_rmb(); /* ...then ->jiffies_stall before the rest... */ 54932255d51SPaul E. McKenney gps = READ_ONCE(rcu_state.gp_start); 55032255d51SPaul E. McKenney smp_rmb(); /* ...and finally ->gp_start before ->gp_seq again. */ 55132255d51SPaul E. McKenney gs2 = READ_ONCE(rcu_state.gp_seq); 55232255d51SPaul E. McKenney if (gs1 != gs2 || 55332255d51SPaul E. McKenney ULONG_CMP_LT(j, js) || 55432255d51SPaul E. McKenney ULONG_CMP_GE(gps, js)) 55532255d51SPaul E. McKenney return; /* No stall or GP completed since entering function. */ 55632255d51SPaul E. McKenney rnp = rdp->mynode; 55732255d51SPaul E. McKenney jn = jiffies + 3 * rcu_jiffies_till_stall_check() + 3; 55832255d51SPaul E. McKenney if (rcu_gp_in_progress() && 55932255d51SPaul E. McKenney (READ_ONCE(rnp->qsmask) & rdp->grpmask) && 56032255d51SPaul E. McKenney cmpxchg(&rcu_state.jiffies_stall, js, jn) == js) { 56132255d51SPaul E. McKenney 56232255d51SPaul E. McKenney /* We haven't checked in, so go dump stack. */ 56332255d51SPaul E. McKenney print_cpu_stall(); 564cdc694b2SPaul E. McKenney if (rcu_cpu_stall_ftrace_dump) 565cdc694b2SPaul E. McKenney rcu_ftrace_dump(DUMP_ALL); 56632255d51SPaul E. McKenney 56732255d51SPaul E. McKenney } else if (rcu_gp_in_progress() && 56832255d51SPaul E. McKenney ULONG_CMP_GE(j, js + RCU_STALL_RAT_DELAY) && 56932255d51SPaul E. McKenney cmpxchg(&rcu_state.jiffies_stall, js, jn) == js) { 57032255d51SPaul E. McKenney 57132255d51SPaul E. McKenney /* They had a few time units to dump stack, so complain. */ 57232255d51SPaul E. McKenney print_other_cpu_stall(gs2); 573cdc694b2SPaul E. McKenney if (rcu_cpu_stall_ftrace_dump) 574cdc694b2SPaul E. McKenney rcu_ftrace_dump(DUMP_ALL); 57532255d51SPaul E. McKenney } 57632255d51SPaul E. McKenney } 577b51bcbbfSPaul E. McKenney 578b51bcbbfSPaul E. McKenney ////////////////////////////////////////////////////////////////////////////// 579b51bcbbfSPaul E. McKenney // 580b51bcbbfSPaul E. McKenney // RCU forward-progress mechanisms, including of callback invocation. 581b51bcbbfSPaul E. McKenney 582b51bcbbfSPaul E. McKenney 583b51bcbbfSPaul E. McKenney /* 584b51bcbbfSPaul E. McKenney * Show the state of the grace-period kthreads. 585b51bcbbfSPaul E. McKenney */ 586b51bcbbfSPaul E. McKenney void show_rcu_gp_kthreads(void) 587b51bcbbfSPaul E. McKenney { 588b51bcbbfSPaul E. McKenney int cpu; 589b51bcbbfSPaul E. McKenney unsigned long j; 590b51bcbbfSPaul E. McKenney unsigned long ja; 591b51bcbbfSPaul E. McKenney unsigned long jr; 592b51bcbbfSPaul E. McKenney unsigned long jw; 593b51bcbbfSPaul E. McKenney struct rcu_data *rdp; 594b51bcbbfSPaul E. McKenney struct rcu_node *rnp; 5955648d659SPaul E. McKenney struct task_struct *t = READ_ONCE(rcu_state.gp_kthread); 596b51bcbbfSPaul E. McKenney 597b51bcbbfSPaul E. McKenney j = jiffies; 598b51bcbbfSPaul E. McKenney ja = j - READ_ONCE(rcu_state.gp_activity); 599b51bcbbfSPaul E. McKenney jr = j - READ_ONCE(rcu_state.gp_req_activity); 600b51bcbbfSPaul E. McKenney jw = j - READ_ONCE(rcu_state.gp_wake_time); 601b51bcbbfSPaul E. McKenney pr_info("%s: wait state: %s(%d) ->state: %#lx delta ->gp_activity %lu ->gp_req_activity %lu ->gp_wake_time %lu ->gp_wake_seq %ld ->gp_seq %ld ->gp_seq_needed %ld ->gp_flags %#x\n", 602b51bcbbfSPaul E. McKenney rcu_state.name, gp_state_getname(rcu_state.gp_state), 6035648d659SPaul E. McKenney rcu_state.gp_state, t ? t->state : 0x1ffffL, 604b51bcbbfSPaul E. McKenney ja, jr, jw, (long)READ_ONCE(rcu_state.gp_wake_seq), 605b51bcbbfSPaul E. McKenney (long)READ_ONCE(rcu_state.gp_seq), 606b51bcbbfSPaul E. McKenney (long)READ_ONCE(rcu_get_root()->gp_seq_needed), 607b51bcbbfSPaul E. McKenney READ_ONCE(rcu_state.gp_flags)); 608b51bcbbfSPaul E. McKenney rcu_for_each_node_breadth_first(rnp) { 6098ff37290SPaul E. McKenney if (ULONG_CMP_GE(READ_ONCE(rcu_state.gp_seq), 6108ff37290SPaul E. McKenney READ_ONCE(rnp->gp_seq_needed))) 611b51bcbbfSPaul E. McKenney continue; 612b51bcbbfSPaul E. McKenney pr_info("\trcu_node %d:%d ->gp_seq %ld ->gp_seq_needed %ld\n", 6138ff37290SPaul E. McKenney rnp->grplo, rnp->grphi, (long)READ_ONCE(rnp->gp_seq), 6148ff37290SPaul E. McKenney (long)READ_ONCE(rnp->gp_seq_needed)); 615b51bcbbfSPaul E. McKenney if (!rcu_is_leaf_node(rnp)) 616b51bcbbfSPaul E. McKenney continue; 617b51bcbbfSPaul E. McKenney for_each_leaf_node_possible_cpu(rnp, cpu) { 618b51bcbbfSPaul E. McKenney rdp = per_cpu_ptr(&rcu_data, cpu); 619a5b89501SPaul E. McKenney if (READ_ONCE(rdp->gpwrap) || 6208ff37290SPaul E. McKenney ULONG_CMP_GE(READ_ONCE(rcu_state.gp_seq), 6218ff37290SPaul E. McKenney READ_ONCE(rdp->gp_seq_needed))) 622b51bcbbfSPaul E. McKenney continue; 623b51bcbbfSPaul E. McKenney pr_info("\tcpu %d ->gp_seq_needed %ld\n", 6248ff37290SPaul E. McKenney cpu, (long)READ_ONCE(rdp->gp_seq_needed)); 625b51bcbbfSPaul E. McKenney } 626b51bcbbfSPaul E. McKenney } 627f7a81b12SPaul E. McKenney for_each_possible_cpu(cpu) { 628f7a81b12SPaul E. McKenney rdp = per_cpu_ptr(&rcu_data, cpu); 629f7a81b12SPaul E. McKenney if (rcu_segcblist_is_offloaded(&rdp->cblist)) 630f7a81b12SPaul E. McKenney show_rcu_nocb_state(rdp); 631f7a81b12SPaul E. McKenney } 632b51bcbbfSPaul E. McKenney /* sched_show_task(rcu_state.gp_kthread); */ 633b51bcbbfSPaul E. McKenney } 634b51bcbbfSPaul E. McKenney EXPORT_SYMBOL_GPL(show_rcu_gp_kthreads); 635b51bcbbfSPaul E. McKenney 636b51bcbbfSPaul E. McKenney /* 637b51bcbbfSPaul E. McKenney * This function checks for grace-period requests that fail to motivate 638b51bcbbfSPaul E. McKenney * RCU to come out of its idle mode. 639b51bcbbfSPaul E. McKenney */ 640b51bcbbfSPaul E. McKenney static void rcu_check_gp_start_stall(struct rcu_node *rnp, struct rcu_data *rdp, 641b51bcbbfSPaul E. McKenney const unsigned long gpssdelay) 642b51bcbbfSPaul E. McKenney { 643b51bcbbfSPaul E. McKenney unsigned long flags; 644b51bcbbfSPaul E. McKenney unsigned long j; 645b51bcbbfSPaul E. McKenney struct rcu_node *rnp_root = rcu_get_root(); 646b51bcbbfSPaul E. McKenney static atomic_t warned = ATOMIC_INIT(0); 647b51bcbbfSPaul E. McKenney 648b51bcbbfSPaul E. McKenney if (!IS_ENABLED(CONFIG_PROVE_RCU) || rcu_gp_in_progress() || 6498ff37290SPaul E. McKenney ULONG_CMP_GE(READ_ONCE(rnp_root->gp_seq), 6505648d659SPaul E. McKenney READ_ONCE(rnp_root->gp_seq_needed)) || 6515648d659SPaul E. McKenney !smp_load_acquire(&rcu_state.gp_kthread)) // Get stable kthread. 652b51bcbbfSPaul E. McKenney return; 653b51bcbbfSPaul E. McKenney j = jiffies; /* Expensive access, and in common case don't get here. */ 654b51bcbbfSPaul E. McKenney if (time_before(j, READ_ONCE(rcu_state.gp_req_activity) + gpssdelay) || 655b51bcbbfSPaul E. McKenney time_before(j, READ_ONCE(rcu_state.gp_activity) + gpssdelay) || 656b51bcbbfSPaul E. McKenney atomic_read(&warned)) 657b51bcbbfSPaul E. McKenney return; 658b51bcbbfSPaul E. McKenney 659b51bcbbfSPaul E. McKenney raw_spin_lock_irqsave_rcu_node(rnp, flags); 660b51bcbbfSPaul E. McKenney j = jiffies; 661b51bcbbfSPaul E. McKenney if (rcu_gp_in_progress() || 6628ff37290SPaul E. McKenney ULONG_CMP_GE(READ_ONCE(rnp_root->gp_seq), 6638ff37290SPaul E. McKenney READ_ONCE(rnp_root->gp_seq_needed)) || 664b51bcbbfSPaul E. McKenney time_before(j, READ_ONCE(rcu_state.gp_req_activity) + gpssdelay) || 665b51bcbbfSPaul E. McKenney time_before(j, READ_ONCE(rcu_state.gp_activity) + gpssdelay) || 666b51bcbbfSPaul E. McKenney atomic_read(&warned)) { 667b51bcbbfSPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rnp, flags); 668b51bcbbfSPaul E. McKenney return; 669b51bcbbfSPaul E. McKenney } 670b51bcbbfSPaul E. McKenney /* Hold onto the leaf lock to make others see warned==1. */ 671b51bcbbfSPaul E. McKenney 672b51bcbbfSPaul E. McKenney if (rnp_root != rnp) 673b51bcbbfSPaul E. McKenney raw_spin_lock_rcu_node(rnp_root); /* irqs already disabled. */ 674b51bcbbfSPaul E. McKenney j = jiffies; 675b51bcbbfSPaul E. McKenney if (rcu_gp_in_progress() || 6768ff37290SPaul E. McKenney ULONG_CMP_GE(READ_ONCE(rnp_root->gp_seq), 6778ff37290SPaul E. McKenney READ_ONCE(rnp_root->gp_seq_needed)) || 6788ff37290SPaul E. McKenney time_before(j, READ_ONCE(rcu_state.gp_req_activity) + gpssdelay) || 6798ff37290SPaul E. McKenney time_before(j, READ_ONCE(rcu_state.gp_activity) + gpssdelay) || 680b51bcbbfSPaul E. McKenney atomic_xchg(&warned, 1)) { 6813ae976a7SNeeraj Upadhyay if (rnp_root != rnp) 6823ae976a7SNeeraj Upadhyay /* irqs remain disabled. */ 6833ae976a7SNeeraj Upadhyay raw_spin_unlock_rcu_node(rnp_root); 684b51bcbbfSPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rnp, flags); 685b51bcbbfSPaul E. McKenney return; 686b51bcbbfSPaul E. McKenney } 687b51bcbbfSPaul E. McKenney WARN_ON(1); 688b51bcbbfSPaul E. McKenney if (rnp_root != rnp) 689b51bcbbfSPaul E. McKenney raw_spin_unlock_rcu_node(rnp_root); 690b51bcbbfSPaul E. McKenney raw_spin_unlock_irqrestore_rcu_node(rnp, flags); 691b51bcbbfSPaul E. McKenney show_rcu_gp_kthreads(); 692b51bcbbfSPaul E. McKenney } 693b51bcbbfSPaul E. McKenney 694b51bcbbfSPaul E. McKenney /* 695b51bcbbfSPaul E. McKenney * Do a forward-progress check for rcutorture. This is normally invoked 696b51bcbbfSPaul E. McKenney * due to an OOM event. The argument "j" gives the time period during 697b51bcbbfSPaul E. McKenney * which rcutorture would like progress to have been made. 698b51bcbbfSPaul E. McKenney */ 699b51bcbbfSPaul E. McKenney void rcu_fwd_progress_check(unsigned long j) 700b51bcbbfSPaul E. McKenney { 701b51bcbbfSPaul E. McKenney unsigned long cbs; 702b51bcbbfSPaul E. McKenney int cpu; 703b51bcbbfSPaul E. McKenney unsigned long max_cbs = 0; 704b51bcbbfSPaul E. McKenney int max_cpu = -1; 705b51bcbbfSPaul E. McKenney struct rcu_data *rdp; 706b51bcbbfSPaul E. McKenney 707b51bcbbfSPaul E. McKenney if (rcu_gp_in_progress()) { 708b51bcbbfSPaul E. McKenney pr_info("%s: GP age %lu jiffies\n", 709b51bcbbfSPaul E. McKenney __func__, jiffies - rcu_state.gp_start); 710b51bcbbfSPaul E. McKenney show_rcu_gp_kthreads(); 711b51bcbbfSPaul E. McKenney } else { 712b51bcbbfSPaul E. McKenney pr_info("%s: Last GP end %lu jiffies ago\n", 713b51bcbbfSPaul E. McKenney __func__, jiffies - rcu_state.gp_end); 714b51bcbbfSPaul E. McKenney preempt_disable(); 715b51bcbbfSPaul E. McKenney rdp = this_cpu_ptr(&rcu_data); 716b51bcbbfSPaul E. McKenney rcu_check_gp_start_stall(rdp->mynode, rdp, j); 717b51bcbbfSPaul E. McKenney preempt_enable(); 718b51bcbbfSPaul E. McKenney } 719b51bcbbfSPaul E. McKenney for_each_possible_cpu(cpu) { 720b51bcbbfSPaul E. McKenney cbs = rcu_get_n_cbs_cpu(cpu); 721b51bcbbfSPaul E. McKenney if (!cbs) 722b51bcbbfSPaul E. McKenney continue; 723b51bcbbfSPaul E. McKenney if (max_cpu < 0) 724b51bcbbfSPaul E. McKenney pr_info("%s: callbacks", __func__); 725b51bcbbfSPaul E. McKenney pr_cont(" %d: %lu", cpu, cbs); 726b51bcbbfSPaul E. McKenney if (cbs <= max_cbs) 727b51bcbbfSPaul E. McKenney continue; 728b51bcbbfSPaul E. McKenney max_cbs = cbs; 729b51bcbbfSPaul E. McKenney max_cpu = cpu; 730b51bcbbfSPaul E. McKenney } 731b51bcbbfSPaul E. McKenney if (max_cpu >= 0) 732b51bcbbfSPaul E. McKenney pr_cont("\n"); 733b51bcbbfSPaul E. McKenney } 734b51bcbbfSPaul E. McKenney EXPORT_SYMBOL_GPL(rcu_fwd_progress_check); 735b51bcbbfSPaul E. McKenney 736b51bcbbfSPaul E. McKenney /* Commandeer a sysrq key to dump RCU's tree. */ 737b51bcbbfSPaul E. McKenney static bool sysrq_rcu; 738b51bcbbfSPaul E. McKenney module_param(sysrq_rcu, bool, 0444); 739b51bcbbfSPaul E. McKenney 740b51bcbbfSPaul E. McKenney /* Dump grace-period-request information due to commandeered sysrq. */ 741b51bcbbfSPaul E. McKenney static void sysrq_show_rcu(int key) 742b51bcbbfSPaul E. McKenney { 743b51bcbbfSPaul E. McKenney show_rcu_gp_kthreads(); 744b51bcbbfSPaul E. McKenney } 745b51bcbbfSPaul E. McKenney 746b51bcbbfSPaul E. McKenney static struct sysrq_key_op sysrq_rcudump_op = { 747b51bcbbfSPaul E. McKenney .handler = sysrq_show_rcu, 748b51bcbbfSPaul E. McKenney .help_msg = "show-rcu(y)", 749b51bcbbfSPaul E. McKenney .action_msg = "Show RCU tree", 750b51bcbbfSPaul E. McKenney .enable_mask = SYSRQ_ENABLE_DUMP, 751b51bcbbfSPaul E. McKenney }; 752b51bcbbfSPaul E. McKenney 753b51bcbbfSPaul E. McKenney static int __init rcu_sysrq_init(void) 754b51bcbbfSPaul E. McKenney { 755b51bcbbfSPaul E. McKenney if (sysrq_rcu) 756b51bcbbfSPaul E. McKenney return register_sysrq_key('y', &sysrq_rcudump_op); 757b51bcbbfSPaul E. McKenney return 0; 758b51bcbbfSPaul E. McKenney } 759b51bcbbfSPaul E. McKenney early_initcall(rcu_sysrq_init); 760