Re: [PATCH RT 0/2][RFC] fix RCU stall warning on ARM

From: Frank Rowand
Date: Tue Dec 04 2012 - 23:52:40 EST



This patch should __not__ be committed to the RT_PREEMPT tree.

Test scaffolding to force printing of rcu detected stall. Each time the
specified value is echoed into the proc file, the routine to be tested
will be called one time, from the context it would normally be called from.

# test print_cpu_stall()
echo 1 > /proc/sys/kernel/zzz_debug_print_stall_once

# test print_other_cpu_stall()
echo 2 > /proc/sys/kernel/zzz_debug_print_stall_once


Signed-off-by: Frank Rowand <frank.rowand@xxxxxxxxxxx>
---
kernel/rcutree.c | 26 26 + 0 - 0 !
kernel/sysctl.c | 11 11 + 0 - 0 !
2 files changed, 37 insertions(+)

Index: b/kernel/rcutree.c
===================================================================
--- a/kernel/rcutree.c
+++ b/kernel/rcutree.c
@@ -738,6 +738,7 @@ static void record_gp_stall_check_time(s
rsp->jiffies_stall = jiffies + jiffies_till_stall_check();
}

+int zzz_debug_print_other_cpu_stall;
static void print_other_cpu_stall(struct rcu_state *rsp)
{
int cpu;
@@ -750,10 +751,12 @@ static void print_other_cpu_stall(struct

raw_spin_lock_irqsave(&rnp->lock, flags);
delta = jiffies - rsp->jiffies_stall;
+if (!zzz_debug_print_other_cpu_stall) {
if (delta < RCU_STALL_RAT_DELAY || !rcu_gp_in_progress(rsp)) {
raw_spin_unlock_irqrestore(&rnp->lock, flags);
return;
}
+}
rsp->jiffies_stall = jiffies + 3 * jiffies_till_stall_check() + 3;
raw_spin_unlock_irqrestore(&rnp->lock, flags);

@@ -792,6 +795,10 @@ static void print_other_cpu_stall(struct
ndetected += rcu_print_task_stall(rnp);
raw_spin_unlock_irqrestore(&rnp->lock, flags);

+if (zzz_debug_print_other_cpu_stall) {
+ ndetected += 1;
+}
+
print_cpu_stall_info_end();
printk(KERN_CONT "(detected by %d, t=%ld jiffies)\n",
smp_processor_id(), (long)(jiffies - rsp->gp_start));
@@ -843,6 +850,7 @@ static void print_cpu_stall(struct rcu_s
set_need_resched(); /* kick ourselves to get things going. */
}

+int zzz_debug_print_stall_once;
static void check_cpu_stall(struct rcu_state *rsp, struct rcu_data *rdp)
{
unsigned long j;
@@ -851,6 +859,24 @@ static void check_cpu_stall(struct rcu_s

if (rcu_cpu_stall_suppress)
return;
+
+ if (zzz_debug_print_stall_once) {
+ int tmp = zzz_debug_print_stall_once;
+ zzz_debug_print_stall_once = 0;
+ if (tmp & 0x1) {
+ pr_crit("\n\n***** DEBUG -- test print_cpu_stall():\n\n");
+ print_cpu_stall(rsp);
+ }
+ if (tmp & 0x2) {
+ pr_crit("\n\n***** DEBUG -- test print_other_cpu_stall():\n\n");
+ zzz_debug_print_other_cpu_stall = 1;
+ print_other_cpu_stall(rsp);
+ zzz_debug_print_other_cpu_stall = 0;
+ }
+
+ return;
+ }
+
j = ACCESS_ONCE(jiffies);
js = ACCESS_ONCE(rsp->jiffies_stall);
rnp = rdp->mynode;
Index: b/kernel/sysctl.c
===================================================================
--- a/kernel/sysctl.c
+++ b/kernel/sysctl.c
@@ -132,6 +132,8 @@ static int one_hundred = 100;
static int ten_thousand = 10000;
#endif

+extern int zzz_debug_print_stall_once;
+
/* this is needed for the proc_doulongvec_minmax of vm_dirty_bytes */
static unsigned long dirty_bytes_min = 2 * PAGE_SIZE;

@@ -1000,6 +1002,15 @@ static struct ctl_table kern_table[] = {
.proc_handler = proc_dointvec,
},
#endif
+#ifdef CONFIG_SMP
+ {
+ .procname = "zzz_debug_print_stall_once",
+ .data = &zzz_debug_print_stall_once,
+ .maxlen = sizeof(int),
+ .mode = 0644,
+ .proc_handler = &proc_dointvec,
+ },
+#endif
{ }
};


--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/