Merge tag 'v3.15' into next

Linux 3.15
author: Paul Moore <pmoore@redhat.com> 2014-06-17 17:30:23 -0400
committer: Paul Moore <pmoore@redhat.com> 2014-06-17 17:30:23 -0400
commit: 170b5910d9fbea79de1bb40df22eda5f98250c0c (patch)
tree: ca9560e878d2842d45c6f99077d0d8b8f8b0f9ba /arch/x86/kernel/cpu/perf_event_p4.c
parent: 47dd0b76ace953bd2c0479076db0d3e3b9594003 (diff)
parent: 1860e379875dfe7271c649058aeddffe5afd9d0d (diff)
1 files changed, 33 insertions, 1 deletions
diff --git a/arch/x86/kernel/cpu/perf_event_p4.c b/arch/x86/kernel/cpu/perf_event_p4.c
index 3486e666035..5d466b7d860 100644
--- a/arch/x86/kernel/cpu/perf_event_p4.c
+++ b/arch/x86/kernel/cpu/perf_event_p4.c
@@ -1257,7 +1257,24 @@ again:
 			pass++;
 			goto again;
 		}
-
+		/*
+		 * Perf does test runs to see if a whole group can be assigned
+		 * together successfully.  There can be multiple rounds of this.
+		 * Unfortunately, p4_pmu_swap_config_ts touches the hwc->config
+		 * bits, such that the next round of group assignments will
+		 * cause the above p4_should_swap_ts to pass instead of fail.
+		 * This leads to counters exclusive to thread0 being used by
+		 * thread1.
+		 *
+		 * Solve this with a cheap hack, reset the idx back to -1 to
+		 * force a new lookup (p4_next_cntr) to get the right counter
+		 * for the right thread.
+		 *
+		 * This probably doesn't comply with the general spirit of how
+		 * perf wants to work, but P4 is special. :-(
+		 */
+		if (p4_should_swap_ts(hwc->config, cpu))
+			hwc->idx = -1;
 		p4_pmu_swap_config_ts(hwc, cpu);
 		if (assign)
 			assign[i] = cntr_idx;
@@ -1322,6 +1339,7 @@ static __initconst const struct x86_pmu p4_pmu = {
 __init int p4_pmu_init(void)
 {
 	unsigned int low, high;
+	int i, reg;
 
 	/* If we get stripped -- indexing fails */
 	BUILD_BUG_ON(ARCH_P4_MAX_CCCR > INTEL_PMC_MAX_GENERIC);
@@ -1340,5 +1358,19 @@ __init int p4_pmu_init(void)
 
 	x86_pmu = p4_pmu;
 
+	/*
+	 * Even though the counters are configured to interrupt a particular
+	 * logical processor when an overflow happens, testing has shown that
+	 * on kdump kernels (which use a single cpu), thread1's counter
+	 * continues to run and will report an NMI on thread0.  Due to the
+	 * overflow bug, this leads to a stream of unknown NMIs.
+	 *
+	 * Solve this by zero'ing out the registers to mimic a reset.
+	 */
+	for (i = 0; i < x86_pmu.num_counters; i++) {
+		reg = x86_pmu_config_addr(i);
+		wrmsrl_safe(reg, 0ULL);
+	}
+
 	return 0;
 }
author	Paul Moore <pmoore@redhat.com>	2014-06-17 17:30:23 -0400
committer	Paul Moore <pmoore@redhat.com>	2014-06-17 17:30:23 -0400
commit	170b5910d9fbea79de1bb40df22eda5f98250c0c (patch)
tree	ca9560e878d2842d45c6f99077d0d8b8f8b0f9ba /arch/x86/kernel/cpu/perf_event_p4.c
parent	47dd0b76ace953bd2c0479076db0d3e3b9594003 (diff)
parent	1860e379875dfe7271c649058aeddffe5afd9d0d (diff)