
Merge branch 'perf-core-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/linux-2.6-tip

* 'perf-core-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/linux-2.6-tip: (163 commits)
  tracing: Fix compile issue for trace_sched_wakeup.c
  [S390] hardirq: remove pointless header file includes
  [IA64] Move local_softirq_pending() definition
  perf, powerpc: Fix power_pmu_event_init to not use event->ctx
  ftrace: Remove recursion between recordmcount and scripts/mod/empty
  jump_label: Add COND_STMT(), reducer wrappery
  perf: Optimize sw events
  perf: Use jump_labels to optimize the scheduler hooks
  jump_label: Add atomic_t interface
  jump_label: Use more consistent naming
  perf, hw_breakpoint: Fix crash in hw_breakpoint creation
  perf: Find task before event alloc
  perf: Fix task refcount bugs
  perf: Fix group moving
  irq_work: Add generic hardirq context callbacks
  perf_events: Fix transaction recovery in group_sched_in()
  perf_events: Fix bogus AMD64 generic TLB events
  perf_events: Fix bogus context time tracking
  tracing: Remove parent recording in latency tracer graph options
  tracing: Use one prologue for the preempt irqs off tracer function tracers
  ...
Linus Torvalds 14 years ago
parent
commit
5d70f79b5e
100 changed files with 2781 additions and 1601 deletions
  1. +5 -3  Documentation/kprobes.txt
  2. +11 -0  Makefile
  3. +3 -0  arch/Kconfig
  4. +1 -0  arch/alpha/Kconfig
  5. +0 -5  arch/alpha/include/asm/perf_event.h
  6. +86 -42  arch/alpha/kernel/perf_event.c
  7. +15 -15  arch/alpha/kernel/time.c
  8. +1 -0  arch/arm/Kconfig
  9. +0 -12  arch/arm/include/asm/perf_event.h
  10. +102 -110  arch/arm/kernel/perf_event.c
  11. +4 -0  arch/arm/oprofile/Makefile
  12. +6 -305  arch/arm/oprofile/common.c
  13. +1 -0  arch/frv/Kconfig
  14. +1 -1  arch/frv/lib/Makefile
  15. +0 -19  arch/frv/lib/perf_event.c
  16. +5 -6  arch/ia64/include/asm/hardirq.h
  17. +1 -0  arch/parisc/Kconfig
  18. +1 -2  arch/parisc/include/asm/perf_event.h
  19. +1 -0  arch/powerpc/Kconfig
  20. +1 -1  arch/powerpc/include/asm/paca.h
  21. +25 -61  arch/powerpc/kernel/perf_callchain.c
  22. +102 -64  arch/powerpc/kernel/perf_event.c
  23. +90 -58  arch/powerpc/kernel/perf_event_fsl_emb.c
  24. +21 -21  arch/powerpc/kernel/time.c
  25. +1 -0  arch/s390/Kconfig
  26. +0 -4  arch/s390/include/asm/hardirq.h
  27. +1 -2  arch/s390/include/asm/perf_event.h
  28. +14 -0  arch/sh/Kconfig
  29. +0 -7  arch/sh/include/asm/perf_event.h
  30. +4 -46  arch/sh/kernel/perf_callchain.c
  31. +112 -47  arch/sh/kernel/perf_event.c
  32. +4 -0  arch/sh/oprofile/Makefile
  33. +23 -92  arch/sh/oprofile/common.c
  34. +0 -33  arch/sh/oprofile/op_impl.h
  35. +3 -0  arch/sparc/Kconfig
  36. +32 -0  arch/sparc/include/asm/jump_label.h
  37. +0 -4  arch/sparc/include/asm/perf_event.h
  38. +2 -0  arch/sparc/kernel/Makefile
  39. +47 -0  arch/sparc/kernel/jump_label.c
  40. +6 -0  arch/sparc/kernel/module.c
  41. +4 -4  arch/sparc/kernel/pcr.c
  42. +123 -117  arch/sparc/kernel/perf_event.c
  43. +8 -0  arch/x86/Kconfig
  44. +11 -0  arch/x86/include/asm/alternative.h
  45. +2 -2  arch/x86/include/asm/entry_arch.h
  46. +1 -1  arch/x86/include/asm/hardirq.h
  47. +1 -1  arch/x86/include/asm/hw_irq.h
  48. +2 -2  arch/x86/include/asm/irq_vectors.h
  49. +37 -0  arch/x86/include/asm/jump_label.h
  50. +22 -30  arch/x86/include/asm/perf_event_p4.h
  51. +2 -1  arch/x86/kernel/Makefile
  52. +68 -3  arch/x86/kernel/alternative.c
  53. +123 -157  arch/x86/kernel/cpu/perf_event.c
  54. +2 -2  arch/x86/kernel/cpu/perf_event_amd.c
  55. +4 -4  arch/x86/kernel/cpu/perf_event_intel.c
  56. +7 -6  arch/x86/kernel/cpu/perf_event_intel_ds.c
  57. +268 -24  arch/x86/kernel/cpu/perf_event_p4.c
  58. +3 -3  arch/x86/kernel/entry_64.S
  59. +1 -62  arch/x86/kernel/ftrace.c
  60. +4 -4  arch/x86/kernel/irq.c
  61. +30 -0  arch/x86/kernel/irq_work.c
  62. +3 -3  arch/x86/kernel/irqinit.c
  63. +50 -0  arch/x86/kernel/jump_label.c
  64. +5 -9  arch/x86/kernel/kprobes.c
  65. +3 -0  arch/x86/kernel/module.c
  66. +6 -0  arch/x86/kernel/setup.c
  67. +4 -0  arch/x86/mm/fault.c
  68. +2 -0  arch/x86/mm/kmemcheck/kmemcheck.c
  69. +59 -11  arch/x86/oprofile/backtrace.c
  70. +1 -8  arch/x86/oprofile/nmi_int.c
  71. +8 -24  drivers/oprofile/oprof.c
  72. +1 -1  drivers/oprofile/oprof.h
  73. +5 -2  drivers/oprofile/oprofile_files.c
  74. +328 -0  drivers/oprofile/oprofile_perf.c
  75. +20 -34  drivers/oprofile/oprofilefs.c
  76. +1 -1  include/asm-generic/hardirq.h
  77. +10 -0  include/asm-generic/vmlinux.lds.h
  78. +21 -18  include/linux/dynamic_debug.h
  79. +4 -4  include/linux/ftrace_event.h
  80. +7 -1  include/linux/interrupt.h
  81. +20 -0  include/linux/irq_work.h
  82. +74 -0  include/linux/jump_label.h
  83. +44 -0  include/linux/jump_label_ref.h
  84. +4 -1  include/linux/module.h
  85. +7 -0  include/linux/oprofile.h
  86. +9 -0  include/linux/percpu.h
  87. +138 -74  include/linux/perf_event.h
  88. +8 -1  include/linux/sched.h
  89. +8 -2  include/linux/stop_machine.h
  90. +4 -1  include/linux/tracepoint.h
  91. +24 -2  include/trace/events/irq.h
  92. +23 -2  include/trace/events/napi.h
  93. +82 -0  include/trace/events/net.h
  94. +87 -3  include/trace/events/power.h
  95. +17 -0  include/trace/events/skb.h
  96. +8 -0  init/Kconfig
  97. +3 -1  kernel/Makefile
  98. +1 -3  kernel/exit.c
  99. +63 -12  kernel/hw_breakpoint.c
  100. +164 -0  kernel/irq_work.c

+ 5 - 3
Documentation/kprobes.txt

@@ -542,9 +542,11 @@ Kprobes does not use mutexes or allocate memory except during
 registration and unregistration.
 
 Probe handlers are run with preemption disabled.  Depending on the
-architecture, handlers may also run with interrupts disabled.  In any
-case, your handler should not yield the CPU (e.g., by attempting to
-acquire a semaphore).
+architecture and optimization state, handlers may also run with
+interrupts disabled (e.g., kretprobe handlers and optimized kprobe
+handlers run without interrupt disabled on x86/x86-64).  In any case,
+your handler should not yield the CPU (e.g., by attempting to acquire
+a semaphore).
 
 Since a return probe is implemented by replacing the return
 address with the trampoline's address, stack backtraces and calls
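
A probe handler that obeys the rule above therefore has to finish without sleeping or taking any lock that can sleep. As a minimal, self-contained sketch (the probed symbol and message are arbitrary examples, not part of this commit):

	#include <linux/kprobes.h>
	#include <linux/module.h>

	static struct kprobe kp = {
		.symbol_name = "do_fork",	/* example target; any probeable symbol works */
	};

	/* Runs with preemption disabled (and possibly interrupts disabled, per the
	 * text above): no mutexes, no GFP_KERNEL allocations, no yielding here. */
	static int handler_pre(struct kprobe *p, struct pt_regs *regs)
	{
		pr_info("kprobe hit at %p\n", p->addr);
		return 0;
	}

	static int __init kprobe_example_init(void)
	{
		kp.pre_handler = handler_pre;
		return register_kprobe(&kp);
	}

	static void __exit kprobe_example_exit(void)
	{
		unregister_kprobe(&kp);
	}

	module_init(kprobe_example_init);
	module_exit(kprobe_example_exit);
	MODULE_LICENSE("GPL");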

+ 11 - 0
Makefile

@@ -568,6 +568,12 @@ endif
 
 ifdef CONFIG_FUNCTION_TRACER
 KBUILD_CFLAGS	+= -pg
+ifdef CONFIG_DYNAMIC_FTRACE
+	ifdef CONFIG_HAVE_C_RECORDMCOUNT
+		BUILD_C_RECORDMCOUNT := y
+		export BUILD_C_RECORDMCOUNT
+	endif
+endif
 endif
 
 # We trigger additional mismatches with less inlining
@@ -591,6 +597,11 @@ KBUILD_CFLAGS	+= $(call cc-option,-fno-strict-overflow)
 # conserve stack if available
 KBUILD_CFLAGS   += $(call cc-option,-fconserve-stack)
 
+# check for 'asm goto'
+ifeq ($(shell $(CONFIG_SHELL) $(srctree)/scripts/gcc-goto.sh $(CC)), y)
+	KBUILD_CFLAGS += -DCC_HAVE_ASM_GOTO
+endif
+
 # Add user supplied CPPFLAGS, AFLAGS and CFLAGS as the last assignments
 # But warn user when we do so
 warn-assign = \
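
The gcc-goto.sh probe only sets CC_HAVE_ASM_GOTO when the compiler accepts the 'asm goto' construct that the jump-label work in this series builds on. As an illustration only (this is not the kernel's actual macro), 'asm goto' lets inline assembly name C labels as possible branch targets, which is what allows a run-time-patchable no-op to stand in for a conditional:

	/* Hypothetical sketch of an asm-goto-based "is this enabled?" test. */
	static inline int feature_enabled(void)
	{
	#ifdef CC_HAVE_ASM_GOTO
		asm goto("nop"			/* patched to a jump at run time */
			 : : : : yes);
		return 0;
	yes:
		return 1;
	#else
		return 0;			/* compiler lacks asm goto */
	#endif
	}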

+ 3 - 0
arch/Kconfig

@@ -158,4 +158,7 @@ config HAVE_PERF_EVENTS_NMI
 	  subsystem.  Also has support for calculating CPU cycle events
 	  to determine how many clock cycles in a given period.
 
+config HAVE_ARCH_JUMP_LABEL
+	bool
+
 source "kernel/gcov/Kconfig"

+ 1 - 0
arch/alpha/Kconfig

@@ -9,6 +9,7 @@ config ALPHA
 	select HAVE_IDE
 	select HAVE_OPROFILE
 	select HAVE_SYSCALL_WRAPPERS
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 	select HAVE_DMA_ATTRS
 	help

+ 0 - 5
arch/alpha/include/asm/perf_event.h

@@ -1,11 +1,6 @@
 #ifndef __ASM_ALPHA_PERF_EVENT_H
 #define __ASM_ALPHA_PERF_EVENT_H
 
-/* Alpha only supports software events through this interface. */
-extern void set_perf_event_pending(void);
-
-#define PERF_EVENT_INDEX_OFFSET 0
-
 #ifdef CONFIG_PERF_EVENTS
 extern void init_hw_perf_events(void);
 #else

+ 86 - 42
arch/alpha/kernel/perf_event.c

@@ -307,7 +307,7 @@ again:
 			     new_raw_count) != prev_raw_count)
 		goto again;
 
-	delta = (new_raw_count  - (prev_raw_count & alpha_pmu->pmc_count_mask[idx])) + ovf;
+	delta = (new_raw_count - (prev_raw_count & alpha_pmu->pmc_count_mask[idx])) + ovf;
 
 	/* It is possible on very rare occasions that the PMC has overflowed
 	 * but the interrupt is yet to come.  Detect and fix this situation.
@@ -402,14 +402,13 @@ static void maybe_change_configuration(struct cpu_hw_events *cpuc)
 		struct hw_perf_event *hwc = &pe->hw;
 		int idx = hwc->idx;
 
-		if (cpuc->current_idx[j] != PMC_NO_INDEX) {
-			cpuc->idx_mask |= (1<<cpuc->current_idx[j]);
-			continue;
+		if (cpuc->current_idx[j] == PMC_NO_INDEX) {
+			alpha_perf_event_set_period(pe, hwc, idx);
+			cpuc->current_idx[j] = idx;
 		}
 
-		alpha_perf_event_set_period(pe, hwc, idx);
-		cpuc->current_idx[j] = idx;
-		cpuc->idx_mask |= (1<<cpuc->current_idx[j]);
+		if (!(hwc->state & PERF_HES_STOPPED))
+			cpuc->idx_mask |= (1<<cpuc->current_idx[j]);
 	}
 	cpuc->config = cpuc->event[0]->hw.config_base;
 }
@@ -420,12 +419,13 @@ static void maybe_change_configuration(struct cpu_hw_events *cpuc)
  *  - this function is called from outside this module via the pmu struct
  *    returned from perf event initialisation.
  */
-static int alpha_pmu_enable(struct perf_event *event)
+static int alpha_pmu_add(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
+	struct hw_perf_event *hwc = &event->hw;
 	int n0;
 	int ret;
-	unsigned long flags;
+	unsigned long irq_flags;
 
 	/*
 	 * The Sparc code has the IRQ disable first followed by the perf
@@ -435,8 +435,8 @@ static int alpha_pmu_enable(struct perf_event *event)
 	 * nevertheless we disable the PMCs first to enable a potential
 	 * final PMI to occur before we disable interrupts.
 	 */
-	perf_disable();
-	local_irq_save(flags);
+	perf_pmu_disable(event->pmu);
+	local_irq_save(irq_flags);
 
 	/* Default to error to be returned */
 	ret = -EAGAIN;
@@ -455,8 +455,12 @@ static int alpha_pmu_enable(struct perf_event *event)
 		}
 	}
 
-	local_irq_restore(flags);
-	perf_enable();
+	hwc->state = PERF_HES_UPTODATE;
+	if (!(flags & PERF_EF_START))
+		hwc->state |= PERF_HES_STOPPED;
+
+	local_irq_restore(irq_flags);
+	perf_pmu_enable(event->pmu);
 
 	return ret;
 }
@@ -467,15 +471,15 @@ static int alpha_pmu_enable(struct perf_event *event)
  *  - this function is called from outside this module via the pmu struct
  *    returned from perf event initialisation.
  */
-static void alpha_pmu_disable(struct perf_event *event)
+static void alpha_pmu_del(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct hw_perf_event *hwc = &event->hw;
-	unsigned long flags;
+	unsigned long irq_flags;
 	int j;
 
-	perf_disable();
-	local_irq_save(flags);
+	perf_pmu_disable(event->pmu);
+	local_irq_save(irq_flags);
 
 	for (j = 0; j < cpuc->n_events; j++) {
 		if (event == cpuc->event[j]) {
@@ -501,8 +505,8 @@ static void alpha_pmu_disable(struct perf_event *event)
 		}
 	}
 
-	local_irq_restore(flags);
-	perf_enable();
+	local_irq_restore(irq_flags);
+	perf_pmu_enable(event->pmu);
 }
 
 
@@ -514,13 +518,44 @@ static void alpha_pmu_read(struct perf_event *event)
 }
 
 
-static void alpha_pmu_unthrottle(struct perf_event *event)
+static void alpha_pmu_stop(struct perf_event *event, int flags)
+{
+	struct hw_perf_event *hwc = &event->hw;
+	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
+
+	if (!(hwc->state & PERF_HES_STOPPED)) {
+		cpuc->idx_mask &= ~(1UL<<hwc->idx);
+		hwc->state |= PERF_HES_STOPPED;
+	}
+
+	if ((flags & PERF_EF_UPDATE) && !(hwc->state & PERF_HES_UPTODATE)) {
+		alpha_perf_event_update(event, hwc, hwc->idx, 0);
+		hwc->state |= PERF_HES_UPTODATE;
+	}
+
+	if (cpuc->enabled)
+		wrperfmon(PERFMON_CMD_DISABLE, (1UL<<hwc->idx));
+}
+
+
+static void alpha_pmu_start(struct perf_event *event, int flags)
 {
 	struct hw_perf_event *hwc = &event->hw;
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 
+	if (WARN_ON_ONCE(!(hwc->state & PERF_HES_STOPPED)))
+		return;
+
+	if (flags & PERF_EF_RELOAD) {
+		WARN_ON_ONCE(!(hwc->state & PERF_HES_UPTODATE));
+		alpha_perf_event_set_period(event, hwc, hwc->idx);
+	}
+
+	hwc->state = 0;
+
 	cpuc->idx_mask |= 1UL<<hwc->idx;
-	wrperfmon(PERFMON_CMD_ENABLE, (1UL<<hwc->idx));
+	if (cpuc->enabled)
+		wrperfmon(PERFMON_CMD_ENABLE, (1UL<<hwc->idx));
 }
 
 
@@ -642,39 +677,36 @@ static int __hw_perf_event_init(struct perf_event *event)
 	return 0;
 }
 
-static const struct pmu pmu = {
-	.enable		= alpha_pmu_enable,
-	.disable	= alpha_pmu_disable,
-	.read		= alpha_pmu_read,
-	.unthrottle	= alpha_pmu_unthrottle,
-};
-
-
 /*
  * Main entry point to initialise a HW performance event.
  */
-const struct pmu *hw_perf_event_init(struct perf_event *event)
+static int alpha_pmu_event_init(struct perf_event *event)
 {
 	int err;
 
+	switch (event->attr.type) {
+	case PERF_TYPE_RAW:
+	case PERF_TYPE_HARDWARE:
+	case PERF_TYPE_HW_CACHE:
+		break;
+
+	default:
+		return -ENOENT;
+	}
+
 	if (!alpha_pmu)
-		return ERR_PTR(-ENODEV);
+		return -ENODEV;
 
 	/* Do the real initialisation work. */
 	err = __hw_perf_event_init(event);
 
-	if (err)
-		return ERR_PTR(err);
-
-	return &pmu;
+	return err;
 }
 
-
-
 /*
  * Main entry point - enable HW performance counters.
  */
-void hw_perf_enable(void)
+static void alpha_pmu_enable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 
@@ -700,7 +732,7 @@ void hw_perf_enable(void)
  * Main entry point - disable HW performance counters.
  */
 
-void hw_perf_disable(void)
+static void alpha_pmu_disable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 
@@ -713,6 +745,17 @@ void hw_perf_disable(void)
 	wrperfmon(PERFMON_CMD_DISABLE, cpuc->idx_mask);
 }
 
+static struct pmu pmu = {
+	.pmu_enable	= alpha_pmu_enable,
+	.pmu_disable	= alpha_pmu_disable,
+	.event_init	= alpha_pmu_event_init,
+	.add		= alpha_pmu_add,
+	.del		= alpha_pmu_del,
+	.start		= alpha_pmu_start,
+	.stop		= alpha_pmu_stop,
+	.read		= alpha_pmu_read,
+};
+
 
 /*
  * Main entry point - don't know when this is called but it
@@ -766,7 +809,7 @@ static void alpha_perf_event_irq_handler(unsigned long la_ptr,
 	wrperfmon(PERFMON_CMD_DISABLE, cpuc->idx_mask);
 
 	/* la_ptr is the counter that overflowed. */
-	if (unlikely(la_ptr >= perf_max_events)) {
+	if (unlikely(la_ptr >= alpha_pmu->num_pmcs)) {
 		/* This should never occur! */
 		irq_err_count++;
 		pr_warning("PMI: silly index %ld\n", la_ptr);
@@ -807,7 +850,7 @@ static void alpha_perf_event_irq_handler(unsigned long la_ptr,
 			/* Interrupts coming too quickly; "throttle" the
 			 * counter, i.e., disable it for a little while.
 			 */
-			cpuc->idx_mask &= ~(1UL<<idx);
+			alpha_pmu_stop(event, 0);
 		}
 	}
 	wrperfmon(PERFMON_CMD_ENABLE, cpuc->idx_mask);
@@ -837,6 +880,7 @@ void __init init_hw_perf_events(void)
 
 	/* And set up PMU specification */
 	alpha_pmu = &ev67_pmu;
-	perf_max_events = alpha_pmu->num_pmcs;
+
+	perf_pmu_register(&pmu);
 }
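
Every architecture converted in this merge follows the pattern seen here: the old enable/disable/unthrottle callbacks become add/del plus start/stop, coordinated through a small set of flags. A reader's summary of that protocol (the authoritative definitions are in include/linux/perf_event.h, which this merge also reworks):

	/*
	 * Flags the core passes into the new callbacks:
	 *   pmu->add(event, flags)   -- bind the event to a counter;
	 *                               PERF_EF_START also starts it counting.
	 *   pmu->del(event, flags)   -- unbind the event (final stop + update).
	 *   pmu->start(event, flags) -- restart a stopped counter;
	 *                               PERF_EF_RELOAD re-programs the period first.
	 *   pmu->stop(event, flags)  -- stop the counter;
	 *                               PERF_EF_UPDATE folds the hardware count
	 *                               into the event before stopping.
	 *
	 * State bits the driver keeps in event->hw.state:
	 *   PERF_HES_STOPPED  -- the counter is not currently running.
	 *   PERF_HES_UPTODATE -- the event count already reflects the hardware.
	 */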
 

+ 15 - 15
arch/alpha/kernel/time.c

@@ -41,7 +41,7 @@
 #include <linux/init.h>
 #include <linux/bcd.h>
 #include <linux/profile.h>
-#include <linux/perf_event.h>
+#include <linux/irq_work.h>
 
 #include <asm/uaccess.h>
 #include <asm/io.h>
@@ -83,25 +83,25 @@ static struct {
 
 unsigned long est_cycle_freq;
 
-#ifdef CONFIG_PERF_EVENTS
+#ifdef CONFIG_IRQ_WORK
 
-DEFINE_PER_CPU(u8, perf_event_pending);
+DEFINE_PER_CPU(u8, irq_work_pending);
 
-#define set_perf_event_pending_flag()  __get_cpu_var(perf_event_pending) = 1
-#define test_perf_event_pending()      __get_cpu_var(perf_event_pending)
-#define clear_perf_event_pending()     __get_cpu_var(perf_event_pending) = 0
+#define set_irq_work_pending_flag()  __get_cpu_var(irq_work_pending) = 1
+#define test_irq_work_pending()      __get_cpu_var(irq_work_pending)
+#define clear_irq_work_pending()     __get_cpu_var(irq_work_pending) = 0
 
-void set_perf_event_pending(void)
+void set_irq_work_pending(void)
 {
-	set_perf_event_pending_flag();
+	set_irq_work_pending_flag();
 }
 
-#else  /* CONFIG_PERF_EVENTS */
+#else  /* CONFIG_IRQ_WORK */
 
-#define test_perf_event_pending()      0
-#define clear_perf_event_pending()
+#define test_irq_work_pending()      0
+#define clear_irq_work_pending()
 
-#endif /* CONFIG_PERF_EVENTS */
+#endif /* CONFIG_IRQ_WORK */
 
 
 static inline __u32 rpcc(void)
@@ -191,9 +191,9 @@ irqreturn_t timer_interrupt(int irq, void *dev)
 
 	write_sequnlock(&xtime_lock);
 
-	if (test_perf_event_pending()) {
-		clear_perf_event_pending();
-		perf_event_do_pending();
+	if (test_irq_work_pending()) {
+		clear_irq_work_pending();
+		irq_work_run();
 	}
 
 #ifndef CONFIG_SMP
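
The timer hook above is the architecture half of the new irq_work layer; the consumer half, added in include/linux/irq_work.h and kernel/irq_work.c, is what perf now uses instead of set_perf_event_pending(). A hedged sketch of typical usage, assuming the interface as introduced by this series:

	#include <linux/irq_work.h>

	static void my_wakeup(struct irq_work *work)
	{
		/* Runs in hard-irq context shortly after being queued. */
	}

	static struct irq_work my_work;

	static void from_nmi_or_pmi(void)
	{
		init_irq_work(&my_work, my_wakeup);	/* normally done once, at init time */
		irq_work_queue(&my_work);		/* NMI-safe: raises a self-interrupt,
							 * or is picked up by the next timer
							 * tick on architectures like alpha */
	}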

+ 1 - 0
arch/arm/Kconfig

@@ -23,6 +23,7 @@ config ARM
 	select HAVE_KERNEL_GZIP
 	select HAVE_KERNEL_LZO
 	select HAVE_KERNEL_LZMA
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 	select PERF_USE_VMALLOC
 	select HAVE_REGS_AND_STACK_ACCESS_API

+ 0 - 12
arch/arm/include/asm/perf_event.h

@@ -12,18 +12,6 @@
 #ifndef __ARM_PERF_EVENT_H__
 #define __ARM_PERF_EVENT_H__
 
-/*
- * NOP: on *most* (read: all supported) ARM platforms, the performance
- * counter interrupts are regular interrupts and not an NMI. This
- * means that when we receive the interrupt we can call
- * perf_event_do_pending() that handles all of the work with
- * interrupts disabled.
- */
-static inline void
-set_perf_event_pending(void)
-{
-}
-
 /* ARM performance counters start from 1 (in the cp15 accesses) so use the
  * same indexes here for consistency. */
 #define PERF_EVENT_INDEX_OFFSET 1

+ 102 - 110
arch/arm/kernel/perf_event.c

@@ -123,6 +123,12 @@ armpmu_get_max_events(void)
 }
 EXPORT_SYMBOL_GPL(armpmu_get_max_events);
 
+int perf_num_counters(void)
+{
+	return armpmu_get_max_events();
+}
+EXPORT_SYMBOL_GPL(perf_num_counters);
+
 #define HW_OP_UNSUPPORTED		0xFFFF
 
 #define C(_x) \
@@ -221,46 +227,56 @@ again:
 }
 
 static void
-armpmu_disable(struct perf_event *event)
+armpmu_read(struct perf_event *event)
 {
-	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct hw_perf_event *hwc = &event->hw;
-	int idx = hwc->idx;
-
-	WARN_ON(idx < 0);
-
-	clear_bit(idx, cpuc->active_mask);
-	armpmu->disable(hwc, idx);
-
-	barrier();
 
-	armpmu_event_update(event, hwc, idx);
-	cpuc->events[idx] = NULL;
-	clear_bit(idx, cpuc->used_mask);
+	/* Don't read disabled counters! */
+	if (hwc->idx < 0)
+		return;
 
-	perf_event_update_userpage(event);
+	armpmu_event_update(event, hwc, hwc->idx);
 }
 
 static void
-armpmu_read(struct perf_event *event)
+armpmu_stop(struct perf_event *event, int flags)
 {
 	struct hw_perf_event *hwc = &event->hw;
 
-	/* Don't read disabled counters! */
-	if (hwc->idx < 0)
+	if (!armpmu)
 		return;
 
-	armpmu_event_update(event, hwc, hwc->idx);
+	/*
+	 * ARM pmu always has to update the counter, so ignore
+	 * PERF_EF_UPDATE, see comments in armpmu_start().
+	 */
+	if (!(hwc->state & PERF_HES_STOPPED)) {
+		armpmu->disable(hwc, hwc->idx);
+		barrier(); /* why? */
+		armpmu_event_update(event, hwc, hwc->idx);
+		hwc->state |= PERF_HES_STOPPED | PERF_HES_UPTODATE;
+	}
 }
 
 static void
-armpmu_unthrottle(struct perf_event *event)
+armpmu_start(struct perf_event *event, int flags)
 {
 	struct hw_perf_event *hwc = &event->hw;
 
+	if (!armpmu)
+		return;
+
+	/*
+	 * ARM pmu always has to reprogram the period, so ignore
+	 * PERF_EF_RELOAD, see the comment below.
+	 */
+	if (flags & PERF_EF_RELOAD)
+		WARN_ON_ONCE(!(hwc->state & PERF_HES_UPTODATE));
+
+	hwc->state = 0;
 	/*
 	 * Set the period again. Some counters can't be stopped, so when we
-	 * were throttled we simply disabled the IRQ source and the counter
+	 * were stopped we simply disabled the IRQ source and the counter
 	 * may have been left counting. If we don't do this step then we may
 	 * get an interrupt too soon or *way* too late if the overflow has
 	 * happened since disabling.
@@ -269,14 +285,33 @@ armpmu_unthrottle(struct perf_event *event)
 	armpmu->enable(hwc, hwc->idx);
 }
 
+static void
+armpmu_del(struct perf_event *event, int flags)
+{
+	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
+	struct hw_perf_event *hwc = &event->hw;
+	int idx = hwc->idx;
+
+	WARN_ON(idx < 0);
+
+	clear_bit(idx, cpuc->active_mask);
+	armpmu_stop(event, PERF_EF_UPDATE);
+	cpuc->events[idx] = NULL;
+	clear_bit(idx, cpuc->used_mask);
+
+	perf_event_update_userpage(event);
+}
+
 static int
-armpmu_enable(struct perf_event *event)
+armpmu_add(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct hw_perf_event *hwc = &event->hw;
 	int idx;
 	int err = 0;
 
+	perf_pmu_disable(event->pmu);
+
 	/* If we don't have a space for the counter then finish early. */
 	idx = armpmu->get_event_idx(cpuc, hwc);
 	if (idx < 0) {
@@ -293,25 +328,19 @@ armpmu_enable(struct perf_event *event)
 	cpuc->events[idx] = event;
 	set_bit(idx, cpuc->active_mask);
 
-	/* Set the period for the event. */
-	armpmu_event_set_period(event, hwc, idx);
-
-	/* Enable the event. */
-	armpmu->enable(hwc, idx);
+	hwc->state = PERF_HES_STOPPED | PERF_HES_UPTODATE;
+	if (flags & PERF_EF_START)
+		armpmu_start(event, PERF_EF_RELOAD);
 
 	/* Propagate our changes to the userspace mapping. */
 	perf_event_update_userpage(event);
 
 out:
+	perf_pmu_enable(event->pmu);
 	return err;
 }
 
-static struct pmu pmu = {
-	.enable	    = armpmu_enable,
-	.disable    = armpmu_disable,
-	.unthrottle = armpmu_unthrottle,
-	.read	    = armpmu_read,
-};
+static struct pmu pmu;
 
 static int
 validate_event(struct cpu_hw_events *cpuc,
@@ -491,20 +520,29 @@ __hw_perf_event_init(struct perf_event *event)
 	return err;
 }
 
-const struct pmu *
-hw_perf_event_init(struct perf_event *event)
+static int armpmu_event_init(struct perf_event *event)
 {
 	int err = 0;
 
+	switch (event->attr.type) {
+	case PERF_TYPE_RAW:
+	case PERF_TYPE_HARDWARE:
+	case PERF_TYPE_HW_CACHE:
+		break;
+
+	default:
+		return -ENOENT;
+	}
+
 	if (!armpmu)
-		return ERR_PTR(-ENODEV);
+		return -ENODEV;
 
 	event->destroy = hw_perf_event_destroy;
 
 	if (!atomic_inc_not_zero(&active_events)) {
-		if (atomic_read(&active_events) > perf_max_events) {
+		if (atomic_read(&active_events) > armpmu->num_events) {
 			atomic_dec(&active_events);
-			return ERR_PTR(-ENOSPC);
+			return -ENOSPC;
 		}
 
 		mutex_lock(&pmu_reserve_mutex);
@@ -518,17 +556,16 @@ hw_perf_event_init(struct perf_event *event)
 	}
 
 	if (err)
-		return ERR_PTR(err);
+		return err;
 
 	err = __hw_perf_event_init(event);
 	if (err)
 		hw_perf_event_destroy(event);
 
-	return err ? ERR_PTR(err) : &pmu;
+	return err;
 }
 
-void
-hw_perf_enable(void)
+static void armpmu_enable(struct pmu *pmu)
 {
 	/* Enable all of the perf events on hardware. */
 	int idx;
@@ -549,13 +586,23 @@ hw_perf_enable(void)
 	armpmu->start();
 }
 
-void
-hw_perf_disable(void)
+static void armpmu_disable(struct pmu *pmu)
 {
 	if (armpmu)
 		armpmu->stop();
 }
 
+static struct pmu pmu = {
+	.pmu_enable	= armpmu_enable,
+	.pmu_disable	= armpmu_disable,
+	.event_init	= armpmu_event_init,
+	.add		= armpmu_add,
+	.del		= armpmu_del,
+	.start		= armpmu_start,
+	.stop		= armpmu_stop,
+	.read		= armpmu_read,
+};
+
 /*
  * ARMv6 Performance counter handling code.
  *
@@ -1045,7 +1092,7 @@ armv6pmu_handle_irq(int irq_num,
 	 * platforms that can have the PMU interrupts raised as an NMI, this
 	 * will not work.
 	 */
-	perf_event_do_pending();
+	irq_work_run();
 
 	return IRQ_HANDLED;
 }
@@ -2021,7 +2068,7 @@ static irqreturn_t armv7pmu_handle_irq(int irq_num, void *dev)
 	 * platforms that can have the PMU interrupts raised as an NMI, this
 	 * will not work.
 	 */
-	perf_event_do_pending();
+	irq_work_run();
 
 	return IRQ_HANDLED;
 }
@@ -2389,7 +2436,7 @@ xscale1pmu_handle_irq(int irq_num, void *dev)
 			armpmu->disable(hwc, idx);
 	}
 
-	perf_event_do_pending();
+	irq_work_run();
 
 	/*
 	 * Re-enable the PMU.
@@ -2716,7 +2763,7 @@ xscale2pmu_handle_irq(int irq_num, void *dev)
 			armpmu->disable(hwc, idx);
 	}
 
-	perf_event_do_pending();
+	irq_work_run();
 
 	/*
 	 * Re-enable the PMU.
@@ -2933,14 +2980,12 @@ init_hw_perf_events(void)
 			armpmu = &armv6pmu;
 			memcpy(armpmu_perf_cache_map, armv6_perf_cache_map,
 					sizeof(armv6_perf_cache_map));
-			perf_max_events	= armv6pmu.num_events;
 			break;
 		case 0xB020:	/* ARM11mpcore */
 			armpmu = &armv6mpcore_pmu;
 			memcpy(armpmu_perf_cache_map,
 			       armv6mpcore_perf_cache_map,
 			       sizeof(armv6mpcore_perf_cache_map));
-			perf_max_events = armv6mpcore_pmu.num_events;
 			break;
 		case 0xC080:	/* Cortex-A8 */
 			armv7pmu.id = ARM_PERF_PMU_ID_CA8;
@@ -2952,7 +2997,6 @@ init_hw_perf_events(void)
 			/* Reset PMNC and read the nb of CNTx counters
 			    supported */
 			armv7pmu.num_events = armv7_reset_read_pmnc();
-			perf_max_events = armv7pmu.num_events;
 			break;
 		case 0xC090:	/* Cortex-A9 */
 			armv7pmu.id = ARM_PERF_PMU_ID_CA9;
@@ -2964,7 +3008,6 @@ init_hw_perf_events(void)
 			/* Reset PMNC and read the nb of CNTx counters
 			    supported */
 			armv7pmu.num_events = armv7_reset_read_pmnc();
-			perf_max_events = armv7pmu.num_events;
 			break;
 		}
 	/* Intel CPUs [xscale]. */
@@ -2975,13 +3018,11 @@ init_hw_perf_events(void)
 			armpmu = &xscale1pmu;
 			memcpy(armpmu_perf_cache_map, xscale_perf_cache_map,
 					sizeof(xscale_perf_cache_map));
-			perf_max_events	= xscale1pmu.num_events;
 			break;
 		case 2:
 			armpmu = &xscale2pmu;
 			memcpy(armpmu_perf_cache_map, xscale_perf_cache_map,
 					sizeof(xscale_perf_cache_map));
-			perf_max_events	= xscale2pmu.num_events;
 			break;
 		}
 	}
@@ -2991,9 +3032,10 @@ init_hw_perf_events(void)
 				arm_pmu_names[armpmu->id], armpmu->num_events);
 	} else {
 		pr_info("no hardware support available\n");
-		perf_max_events = -1;
 	}
 
+	perf_pmu_register(&pmu);
+
 	return 0;
 }
 arch_initcall(init_hw_perf_events);
@@ -3001,13 +3043,6 @@ arch_initcall(init_hw_perf_events);
 /*
  * Callchain handling code.
  */
-static inline void
-callchain_store(struct perf_callchain_entry *entry,
-		u64 ip)
-{
-	if (entry->nr < PERF_MAX_STACK_DEPTH)
-		entry->ip[entry->nr++] = ip;
-}
 
 /*
  * The registers we're interested in are at the end of the variable
@@ -3039,7 +3074,7 @@ user_backtrace(struct frame_tail *tail,
 	if (__copy_from_user_inatomic(&buftail, tail, sizeof(buftail)))
 		return NULL;
 
-	callchain_store(entry, buftail.lr);
+	perf_callchain_store(entry, buftail.lr);
 
 	/*
 	 * Frame pointers should strictly progress back up the stack
@@ -3051,16 +3086,11 @@ user_backtrace(struct frame_tail *tail,
 	return buftail.fp - 1;
 }
 
-static void
-perf_callchain_user(struct pt_regs *regs,
-		    struct perf_callchain_entry *entry)
+void
+perf_callchain_user(struct perf_callchain_entry *entry, struct pt_regs *regs)
 {
 	struct frame_tail *tail;
 
-	callchain_store(entry, PERF_CONTEXT_USER);
-
-	if (!user_mode(regs))
-		regs = task_pt_regs(current);
 
 	tail = (struct frame_tail *)regs->ARM_fp - 1;
 
@@ -3078,56 +3108,18 @@ callchain_trace(struct stackframe *fr,
 		void *data)
 {
 	struct perf_callchain_entry *entry = data;
-	callchain_store(entry, fr->pc);
+	perf_callchain_store(entry, fr->pc);
 	return 0;
 }
 
-static void
-perf_callchain_kernel(struct pt_regs *regs,
-		      struct perf_callchain_entry *entry)
+void
+perf_callchain_kernel(struct perf_callchain_entry *entry, struct pt_regs *regs)
 {
 	struct stackframe fr;
 
-	callchain_store(entry, PERF_CONTEXT_KERNEL);
 	fr.fp = regs->ARM_fp;
 	fr.sp = regs->ARM_sp;
 	fr.lr = regs->ARM_lr;
 	fr.pc = regs->ARM_pc;
 	walk_stackframe(&fr, callchain_trace, entry);
 }
-
-static void
-perf_do_callchain(struct pt_regs *regs,
-		  struct perf_callchain_entry *entry)
-{
-	int is_user;
-
-	if (!regs)
-		return;
-
-	is_user = user_mode(regs);
-
-	if (!current || !current->pid)
-		return;
-
-	if (is_user && current->state != TASK_RUNNING)
-		return;
-
-	if (!is_user)
-		perf_callchain_kernel(regs, entry);
-
-	if (current->mm)
-		perf_callchain_user(regs, entry);
-}
-
-static DEFINE_PER_CPU(struct perf_callchain_entry, pmc_irq_entry);
-
-struct perf_callchain_entry *
-perf_callchain(struct pt_regs *regs)
-{
-	struct perf_callchain_entry *entry = &__get_cpu_var(pmc_irq_entry);
-
-	entry->nr = 0;
-	perf_do_callchain(regs, entry);
-	return entry;
-}

+ 4 - 0
arch/arm/oprofile/Makefile

@@ -6,4 +6,8 @@ DRIVER_OBJS = $(addprefix ../../../drivers/oprofile/, \
 		oprofilefs.o oprofile_stats.o \
 		timer_int.o )
 
+ifeq ($(CONFIG_HW_PERF_EVENTS),y)
+DRIVER_OBJS += $(addprefix ../../../drivers/oprofile/, oprofile_perf.o)
+endif
+
 oprofile-y				:= $(DRIVER_OBJS) common.o

+ 6 - 305
arch/arm/oprofile/common.c

@@ -25,139 +25,10 @@
 #include <asm/ptrace.h>
 
 #ifdef CONFIG_HW_PERF_EVENTS
-/*
- * Per performance monitor configuration as set via oprofilefs.
- */
-struct op_counter_config {
-	unsigned long count;
-	unsigned long enabled;
-	unsigned long event;
-	unsigned long unit_mask;
-	unsigned long kernel;
-	unsigned long user;
-	struct perf_event_attr attr;
-};
-
-static int op_arm_enabled;
-static DEFINE_MUTEX(op_arm_mutex);
-
-static struct op_counter_config *counter_config;
-static struct perf_event **perf_events[nr_cpumask_bits];
-static int perf_num_counters;
-
-/*
- * Overflow callback for oprofile.
- */
-static void op_overflow_handler(struct perf_event *event, int unused,
-			struct perf_sample_data *data, struct pt_regs *regs)
+char *op_name_from_perf_id(void)
 {
-	int id;
-	u32 cpu = smp_processor_id();
-
-	for (id = 0; id < perf_num_counters; ++id)
-		if (perf_events[cpu][id] == event)
-			break;
-
-	if (id != perf_num_counters)
-		oprofile_add_sample(regs, id);
-	else
-		pr_warning("oprofile: ignoring spurious overflow "
-				"on cpu %u\n", cpu);
-}
-
-/*
- * Called by op_arm_setup to create perf attributes to mirror the oprofile
- * settings in counter_config. Attributes are created as `pinned' events and
- * so are permanently scheduled on the PMU.
- */
-static void op_perf_setup(void)
-{
-	int i;
-	u32 size = sizeof(struct perf_event_attr);
-	struct perf_event_attr *attr;
-
-	for (i = 0; i < perf_num_counters; ++i) {
-		attr = &counter_config[i].attr;
-		memset(attr, 0, size);
-		attr->type		= PERF_TYPE_RAW;
-		attr->size		= size;
-		attr->config		= counter_config[i].event;
-		attr->sample_period	= counter_config[i].count;
-		attr->pinned		= 1;
-	}
-}
-
-static int op_create_counter(int cpu, int event)
-{
-	int ret = 0;
-	struct perf_event *pevent;
-
-	if (!counter_config[event].enabled || (perf_events[cpu][event] != NULL))
-		return ret;
-
-	pevent = perf_event_create_kernel_counter(&counter_config[event].attr,
-						  cpu, -1,
-						  op_overflow_handler);
-
-	if (IS_ERR(pevent)) {
-		ret = PTR_ERR(pevent);
-	} else if (pevent->state != PERF_EVENT_STATE_ACTIVE) {
-		perf_event_release_kernel(pevent);
-		pr_warning("oprofile: failed to enable event %d "
-				"on CPU %d\n", event, cpu);
-		ret = -EBUSY;
-	} else {
-		perf_events[cpu][event] = pevent;
-	}
-
-	return ret;
-}
+	enum arm_perf_pmu_ids id = armpmu_get_pmu_id();
 
-static void op_destroy_counter(int cpu, int event)
-{
-	struct perf_event *pevent = perf_events[cpu][event];
-
-	if (pevent) {
-		perf_event_release_kernel(pevent);
-		perf_events[cpu][event] = NULL;
-	}
-}
-
-/*
- * Called by op_arm_start to create active perf events based on the
- * perviously configured attributes.
- */
-static int op_perf_start(void)
-{
-	int cpu, event, ret = 0;
-
-	for_each_online_cpu(cpu) {
-		for (event = 0; event < perf_num_counters; ++event) {
-			ret = op_create_counter(cpu, event);
-			if (ret)
-				goto out;
-		}
-	}
-
-out:
-	return ret;
-}
-
-/*
- * Called by op_arm_stop at the end of a profiling run.
- */
-static void op_perf_stop(void)
-{
-	int cpu, event;
-
-	for_each_online_cpu(cpu)
-		for (event = 0; event < perf_num_counters; ++event)
-			op_destroy_counter(cpu, event);
-}
-
-
-static char *op_name_from_perf_id(enum arm_perf_pmu_ids id)
-{
 	switch (id) {
 	case ARM_PERF_PMU_ID_XSCALE1:
 		return "arm/xscale1";
@@ -176,116 +47,6 @@ static char *op_name_from_perf_id(enum arm_perf_pmu_ids id)
 	}
 }
 
-static int op_arm_create_files(struct super_block *sb, struct dentry *root)
-{
-	unsigned int i;
-
-	for (i = 0; i < perf_num_counters; i++) {
-		struct dentry *dir;
-		char buf[4];
-
-		snprintf(buf, sizeof buf, "%d", i);
-		dir = oprofilefs_mkdir(sb, root, buf);
-		oprofilefs_create_ulong(sb, dir, "enabled", &counter_config[i].enabled);
-		oprofilefs_create_ulong(sb, dir, "event", &counter_config[i].event);
-		oprofilefs_create_ulong(sb, dir, "count", &counter_config[i].count);
-		oprofilefs_create_ulong(sb, dir, "unit_mask", &counter_config[i].unit_mask);
-		oprofilefs_create_ulong(sb, dir, "kernel", &counter_config[i].kernel);
-		oprofilefs_create_ulong(sb, dir, "user", &counter_config[i].user);
-	}
-
-	return 0;
-}
-
-static int op_arm_setup(void)
-{
-	spin_lock(&oprofilefs_lock);
-	op_perf_setup();
-	spin_unlock(&oprofilefs_lock);
-	return 0;
-}
-
-static int op_arm_start(void)
-{
-	int ret = -EBUSY;
-
-	mutex_lock(&op_arm_mutex);
-	if (!op_arm_enabled) {
-		ret = 0;
-		op_perf_start();
-		op_arm_enabled = 1;
-	}
-	mutex_unlock(&op_arm_mutex);
-	return ret;
-}
-
-static void op_arm_stop(void)
-{
-	mutex_lock(&op_arm_mutex);
-	if (op_arm_enabled)
-		op_perf_stop();
-	op_arm_enabled = 0;
-	mutex_unlock(&op_arm_mutex);
-}
-
-#ifdef CONFIG_PM
-static int op_arm_suspend(struct platform_device *dev, pm_message_t state)
-{
-	mutex_lock(&op_arm_mutex);
-	if (op_arm_enabled)
-		op_perf_stop();
-	mutex_unlock(&op_arm_mutex);
-	return 0;
-}
-
-static int op_arm_resume(struct platform_device *dev)
-{
-	mutex_lock(&op_arm_mutex);
-	if (op_arm_enabled && op_perf_start())
-		op_arm_enabled = 0;
-	mutex_unlock(&op_arm_mutex);
-	return 0;
-}
-
-static struct platform_driver oprofile_driver = {
-	.driver		= {
-		.name		= "arm-oprofile",
-	},
-	.resume		= op_arm_resume,
-	.suspend	= op_arm_suspend,
-};
-
-static struct platform_device *oprofile_pdev;
-
-static int __init init_driverfs(void)
-{
-	int ret;
-
-	ret = platform_driver_register(&oprofile_driver);
-	if (ret)
-		goto out;
-
-	oprofile_pdev =	platform_device_register_simple(
-				oprofile_driver.driver.name, 0, NULL, 0);
-	if (IS_ERR(oprofile_pdev)) {
-		ret = PTR_ERR(oprofile_pdev);
-		platform_driver_unregister(&oprofile_driver);
-	}
-
-out:
-	return ret;
-}
-
-static void  exit_driverfs(void)
-{
-	platform_device_unregister(oprofile_pdev);
-	platform_driver_unregister(&oprofile_driver);
-}
-#else
-static int __init init_driverfs(void) { return 0; }
-#define exit_driverfs() do { } while (0)
-#endif /* CONFIG_PM */
-
 static int report_trace(struct stackframe *frame, void *d)
 {
 	unsigned int *depth = d;
@@ -350,74 +111,14 @@ static void arm_backtrace(struct pt_regs * const regs, unsigned int depth)
 
 int __init oprofile_arch_init(struct oprofile_operations *ops)
 {
-	int cpu, ret = 0;
-
-	perf_num_counters = armpmu_get_max_events();
-
-	counter_config = kcalloc(perf_num_counters,
-			sizeof(struct op_counter_config), GFP_KERNEL);
-
-	if (!counter_config) {
-		pr_info("oprofile: failed to allocate %d "
-				"counters\n", perf_num_counters);
-		return -ENOMEM;
-	}
-
-	ret = init_driverfs();
-	if (ret) {
-		kfree(counter_config);
-		counter_config = NULL;
-		return ret;
-	}
-
-	for_each_possible_cpu(cpu) {
-		perf_events[cpu] = kcalloc(perf_num_counters,
-				sizeof(struct perf_event *), GFP_KERNEL);
-		if (!perf_events[cpu]) {
-			pr_info("oprofile: failed to allocate %d perf events "
-					"for cpu %d\n", perf_num_counters, cpu);
-			while (--cpu >= 0)
-				kfree(perf_events[cpu]);
-			return -ENOMEM;
-		}
-	}
-
 	ops->backtrace		= arm_backtrace;
-	ops->create_files	= op_arm_create_files;
-	ops->setup		= op_arm_setup;
-	ops->start		= op_arm_start;
-	ops->stop		= op_arm_stop;
-	ops->shutdown		= op_arm_stop;
-	ops->cpu_type		= op_name_from_perf_id(armpmu_get_pmu_id());
-
-	if (!ops->cpu_type)
-		ret = -ENODEV;
-	else
-		pr_info("oprofile: using %s\n", ops->cpu_type);
 
-	return ret;
+	return oprofile_perf_init(ops);
 }
 
-void oprofile_arch_exit(void)
+void __exit oprofile_arch_exit(void)
 {
-	int cpu, id;
-	struct perf_event *event;
-
-	if (*perf_events) {
-		for_each_possible_cpu(cpu) {
-			for (id = 0; id < perf_num_counters; ++id) {
-				event = perf_events[cpu][id];
-				if (event != NULL)
-					perf_event_release_kernel(event);
-			}
-			kfree(perf_events[cpu]);
-		}
-	}
-
-	if (counter_config) {
-		kfree(counter_config);
-		exit_driverfs();
-	}
+	oprofile_perf_exit();
 }
 #else
 int __init oprofile_arch_init(struct oprofile_operations *ops)
@@ -425,5 +126,5 @@ int __init oprofile_arch_init(struct oprofile_operations *ops)
 	pr_info("oprofile: hardware counters not available\n");
 	return -ENODEV;
 }
-void oprofile_arch_exit(void) {}
+void __exit oprofile_arch_exit(void) {}
 #endif /* CONFIG_HW_PERF_EVENTS */
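
With the common driver moved to drivers/oprofile/oprofile_perf.c, the per-architecture glue shrinks to a few hooks. Roughly what an architecture now supplies (a sketch; exact prototypes are in include/linux/oprofile.h, and arch_backtrace stands in for the arch's own backtrace helper):

	/* From the arch's perf code (exported above for ARM): */
	int perf_num_counters(void);

	/* From the arch's oprofile glue: map the PMU id to a cpu_type string. */
	char *op_name_from_perf_id(void);

	int __init oprofile_arch_init(struct oprofile_operations *ops)
	{
		ops->backtrace = arch_backtrace;	/* optional, arch-specific */
		return oprofile_perf_init(ops);		/* shared perf-backed driver */
	}

	void __exit oprofile_arch_exit(void)
	{
		oprofile_perf_exit();
	}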

+ 1 - 0
arch/frv/Kconfig

@@ -7,6 +7,7 @@ config FRV
 	default y
 	select HAVE_IDE
 	select HAVE_ARCH_TRACEHOOK
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 
 config ZONE_DMA

+ 1 - 1
arch/frv/lib/Makefile

@@ -5,4 +5,4 @@
 lib-y := \
 	__ashldi3.o __lshrdi3.o __muldi3.o __ashrdi3.o __negdi2.o __ucmpdi2.o \
 	checksum.o memcpy.o memset.o atomic-ops.o atomic64-ops.o \
-	outsl_ns.o outsl_sw.o insl_ns.o insl_sw.o cache.o perf_event.o
+	outsl_ns.o outsl_sw.o insl_ns.o insl_sw.o cache.o

+ 0 - 19
arch/frv/lib/perf_event.c

@@ -1,19 +0,0 @@
-/* Performance event handling
- *
- * Copyright (C) 2009 Red Hat, Inc. All Rights Reserved.
- * Written by David Howells (dhowells@redhat.com)
- *
- * This program is free software; you can redistribute it and/or
- * modify it under the terms of the GNU General Public Licence
- * as published by the Free Software Foundation; either version
- * 2 of the Licence, or (at your option) any later version.
- */
-
-#include <linux/perf_event.h>
-
-/*
- * mark the performance event as pending
- */
-void set_perf_event_pending(void)
-{
-}

+ 5 - 6
arch/ia64/include/asm/hardirq.h

@@ -6,12 +6,6 @@
  *	David Mosberger-Tang <davidm@hpl.hp.com>
  */
 
-
-#include <linux/threads.h>
-#include <linux/irq.h>
-
-#include <asm/processor.h>
-
 /*
  * No irq_cpustat_t for IA-64.  The data is held in the per-CPU data structure.
  */
@@ -20,6 +14,11 @@
 
 #define local_softirq_pending()		(local_cpu_data->softirq_pending)
 
+#include <linux/threads.h>
+#include <linux/irq.h>
+
+#include <asm/processor.h>
+
 extern void __iomem *ipi_base_addr;
 
 void ack_bad_irq(unsigned int irq);

+ 1 - 0
arch/parisc/Kconfig

@@ -16,6 +16,7 @@ config PARISC
 	select RTC_DRV_GENERIC
 	select INIT_ALL_POSSIBLE
 	select BUG
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 	select GENERIC_ATOMIC64 if !64BIT
 	help

+ 1 - 2
arch/parisc/include/asm/perf_event.h

@@ -1,7 +1,6 @@
 #ifndef __ASM_PARISC_PERF_EVENT_H
 #define __ASM_PARISC_PERF_EVENT_H
 
-/* parisc only supports software events through this interface. */
-static inline void set_perf_event_pending(void) { }
+/* Empty, just to avoid compiling error */
 
 #endif /* __ASM_PARISC_PERF_EVENT_H */

+ 1 - 0
arch/powerpc/Kconfig

@@ -138,6 +138,7 @@ config PPC
 	select HAVE_OPROFILE
 	select HAVE_SYSCALL_WRAPPERS if PPC64
 	select GENERIC_ATOMIC64 if PPC32
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 	select HAVE_REGS_AND_STACK_ACCESS_API
 	select HAVE_HW_BREAKPOINT if PERF_EVENTS && PPC_BOOK3S_64

+ 1 - 1
arch/powerpc/include/asm/paca.h

@@ -129,7 +129,7 @@ struct paca_struct {
 	u8 soft_enabled;		/* irq soft-enable flag */
 	u8 hard_enabled;		/* set if irqs are enabled in MSR */
 	u8 io_sync;			/* writel() needs spin_unlock sync */
-	u8 perf_event_pending;		/* PM interrupt while soft-disabled */
+	u8 irq_work_pending;		/* IRQ_WORK interrupt while soft-disable */
 
 	/* Stuff for accurate time accounting */
 	u64 user_time;			/* accumulated usermode TB ticks */

+ 25 - 61
arch/powerpc/kernel/perf_callchain.c

@@ -23,18 +23,6 @@
 #include "ppc32.h"
 #endif
 
-/*
- * Store another value in a callchain_entry.
- */
-static inline void callchain_store(struct perf_callchain_entry *entry, u64 ip)
-{
-	unsigned int nr = entry->nr;
-
-	if (nr < PERF_MAX_STACK_DEPTH) {
-		entry->ip[nr] = ip;
-		entry->nr = nr + 1;
-	}
-}
 
 /*
  * Is sp valid as the address of the next kernel stack frame after prev_sp?
@@ -58,8 +46,8 @@ static int valid_next_sp(unsigned long sp, unsigned long prev_sp)
 	return 0;
 }
 
-static void perf_callchain_kernel(struct pt_regs *regs,
-				  struct perf_callchain_entry *entry)
+void
+perf_callchain_kernel(struct perf_callchain_entry *entry, struct pt_regs *regs)
 {
 	unsigned long sp, next_sp;
 	unsigned long next_ip;
@@ -69,8 +57,7 @@ static void perf_callchain_kernel(struct pt_regs *regs,
 
 	lr = regs->link;
 	sp = regs->gpr[1];
-	callchain_store(entry, PERF_CONTEXT_KERNEL);
-	callchain_store(entry, regs->nip);
+	perf_callchain_store(entry, regs->nip);
 
 	if (!validate_sp(sp, current, STACK_FRAME_OVERHEAD))
 		return;
@@ -89,7 +76,7 @@ static void perf_callchain_kernel(struct pt_regs *regs,
 			next_ip = regs->nip;
 			lr = regs->link;
 			level = 0;
-			callchain_store(entry, PERF_CONTEXT_KERNEL);
+			perf_callchain_store(entry, PERF_CONTEXT_KERNEL);
 
 		} else {
 			if (level == 0)
@@ -111,7 +98,7 @@ static void perf_callchain_kernel(struct pt_regs *regs,
 			++level;
 		}
 
-		callchain_store(entry, next_ip);
+		perf_callchain_store(entry, next_ip);
 		if (!valid_next_sp(next_sp, sp))
 			return;
 		sp = next_sp;
@@ -233,8 +220,8 @@ static int sane_signal_64_frame(unsigned long sp)
 		puc == (unsigned long) &sf->uc;
 }
 
-static void perf_callchain_user_64(struct pt_regs *regs,
-				   struct perf_callchain_entry *entry)
+static void perf_callchain_user_64(struct perf_callchain_entry *entry,
+				   struct pt_regs *regs)
 {
 	unsigned long sp, next_sp;
 	unsigned long next_ip;
@@ -246,8 +233,7 @@ static void perf_callchain_user_64(struct pt_regs *regs,
 	next_ip = regs->nip;
 	lr = regs->link;
 	sp = regs->gpr[1];
-	callchain_store(entry, PERF_CONTEXT_USER);
-	callchain_store(entry, next_ip);
+	perf_callchain_store(entry, next_ip);
 
 	for (;;) {
 		fp = (unsigned long __user *) sp;
@@ -276,14 +262,14 @@ static void perf_callchain_user_64(struct pt_regs *regs,
 			    read_user_stack_64(&uregs[PT_R1], &sp))
 				return;
 			level = 0;
-			callchain_store(entry, PERF_CONTEXT_USER);
-			callchain_store(entry, next_ip);
+			perf_callchain_store(entry, PERF_CONTEXT_USER);
+			perf_callchain_store(entry, next_ip);
 			continue;
 		}
 
 		if (level == 0)
 			next_ip = lr;
-		callchain_store(entry, next_ip);
+		perf_callchain_store(entry, next_ip);
 		++level;
 		sp = next_sp;
 	}
@@ -315,8 +301,8 @@ static int read_user_stack_32(unsigned int __user *ptr, unsigned int *ret)
 	return __get_user_inatomic(*ret, ptr);
 }
 
-static inline void perf_callchain_user_64(struct pt_regs *regs,
-					  struct perf_callchain_entry *entry)
+static inline void perf_callchain_user_64(struct perf_callchain_entry *entry,
+					  struct pt_regs *regs)
 {
 }
 
@@ -435,8 +421,8 @@ static unsigned int __user *signal_frame_32_regs(unsigned int sp,
 	return mctx->mc_gregs;
 }
 
-static void perf_callchain_user_32(struct pt_regs *regs,
-				   struct perf_callchain_entry *entry)
+static void perf_callchain_user_32(struct perf_callchain_entry *entry,
+				   struct pt_regs *regs)
 {
 	unsigned int sp, next_sp;
 	unsigned int next_ip;
@@ -447,8 +433,7 @@ static void perf_callchain_user_32(struct pt_regs *regs,
 	next_ip = regs->nip;
 	lr = regs->link;
 	sp = regs->gpr[1];
-	callchain_store(entry, PERF_CONTEXT_USER);
-	callchain_store(entry, next_ip);
+	perf_callchain_store(entry, next_ip);
 
 	while (entry->nr < PERF_MAX_STACK_DEPTH) {
 		fp = (unsigned int __user *) (unsigned long) sp;
@@ -470,45 +455,24 @@ static void perf_callchain_user_32(struct pt_regs *regs,
 			    read_user_stack_32(&uregs[PT_R1], &sp))
 				return;
 			level = 0;
-			callchain_store(entry, PERF_CONTEXT_USER);
-			callchain_store(entry, next_ip);
+			perf_callchain_store(entry, PERF_CONTEXT_USER);
+			perf_callchain_store(entry, next_ip);
 			continue;
 		}
 
 		if (level == 0)
 			next_ip = lr;
-		callchain_store(entry, next_ip);
+		perf_callchain_store(entry, next_ip);
 		++level;
 		sp = next_sp;
 	}
 }
 
-/*
- * Since we can't get PMU interrupts inside a PMU interrupt handler,
- * we don't need separate irq and nmi entries here.
- */
-static DEFINE_PER_CPU(struct perf_callchain_entry, cpu_perf_callchain);
-
-struct perf_callchain_entry *perf_callchain(struct pt_regs *regs)
+void
+perf_callchain_user(struct perf_callchain_entry *entry, struct pt_regs *regs)
 {
-	struct perf_callchain_entry *entry = &__get_cpu_var(cpu_perf_callchain);
-
-	entry->nr = 0;
-
-	if (!user_mode(regs)) {
-		perf_callchain_kernel(regs, entry);
-		if (current->mm)
-			regs = task_pt_regs(current);
-		else
-			regs = NULL;
-	}
-
-	if (regs) {
-		if (current_is_64bit())
-			perf_callchain_user_64(regs, entry);
-		else
-			perf_callchain_user_32(regs, entry);
-	}
-
-	return entry;
+	if (current_is_64bit())
+		perf_callchain_user_64(entry, regs);
+	else
+		perf_callchain_user_32(entry, regs);
 }
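
As on ARM earlier in this merge, the arch callchain code now only records addresses; the core allocates the entry buffers, caps the depth, and inserts the initial PERF_CONTEXT_KERNEL/USER markers itself. The per-arch callchain_store() helpers removed above are presumably replaced by a single generic helper along these lines in include/linux/perf_event.h (mirroring the code deleted here):

	static inline void
	perf_callchain_store(struct perf_callchain_entry *entry, u64 ip)
	{
		if (entry->nr < PERF_MAX_STACK_DEPTH)
			entry->ip[entry->nr++] = ip;
	}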

+ 102 - 64
arch/powerpc/kernel/perf_event.c

@@ -402,6 +402,9 @@ static void power_pmu_read(struct perf_event *event)
 {
 	s64 val, delta, prev;
 
+	if (event->hw.state & PERF_HES_STOPPED)
+		return;
+
 	if (!event->hw.idx)
 		return;
 	/*
@@ -517,7 +520,7 @@ static void write_mmcr0(struct cpu_hw_events *cpuhw, unsigned long mmcr0)
  * Disable all events to prevent PMU interrupts and to allow
  * events to be added or removed.
  */
-void hw_perf_disable(void)
+static void power_pmu_disable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuhw;
 	unsigned long flags;
@@ -565,7 +568,7 @@ void hw_perf_disable(void)
  * If we were previously disabled and events were added, then
  * put the new config on the PMU.
  */
-void hw_perf_enable(void)
+static void power_pmu_enable(struct pmu *pmu)
 {
 	struct perf_event *event;
 	struct cpu_hw_events *cpuhw;
@@ -672,6 +675,8 @@ void hw_perf_enable(void)
 		}
 		local64_set(&event->hw.prev_count, val);
 		event->hw.idx = idx;
+		if (event->hw.state & PERF_HES_STOPPED)
+			val = 0;
 		write_pmc(idx, val);
 		perf_event_update_userpage(event);
 	}
@@ -727,7 +732,7 @@ static int collect_events(struct perf_event *group, int max_count,
  * re-enable the PMU in order to get hw_perf_enable to do the
  * actual work of reconfiguring the PMU.
  */
-static int power_pmu_enable(struct perf_event *event)
+static int power_pmu_add(struct perf_event *event, int ef_flags)
 {
 	struct cpu_hw_events *cpuhw;
 	unsigned long flags;
@@ -735,7 +740,7 @@ static int power_pmu_enable(struct perf_event *event)
 	int ret = -EAGAIN;
 
 	local_irq_save(flags);
-	perf_disable();
+	perf_pmu_disable(event->pmu);
 
 	/*
 	 * Add the event to the list (if there is room)
@@ -749,6 +754,9 @@ static int power_pmu_enable(struct perf_event *event)
 	cpuhw->events[n0] = event->hw.config;
 	cpuhw->flags[n0] = event->hw.event_base;
 
+	if (!(ef_flags & PERF_EF_START))
+		event->hw.state = PERF_HES_STOPPED | PERF_HES_UPTODATE;
+
 	/*
 	 * If group events scheduling transaction was started,
 	 * skip the schedulability test here, it will be peformed
@@ -769,7 +777,7 @@ nocheck:
 
 	ret = 0;
  out:
-	perf_enable();
+	perf_pmu_enable(event->pmu);
 	local_irq_restore(flags);
 	return ret;
 }
@@ -777,14 +785,14 @@ nocheck:
 /*
  * Remove a event from the PMU.
  */
-static void power_pmu_disable(struct perf_event *event)
+static void power_pmu_del(struct perf_event *event, int ef_flags)
 {
 	struct cpu_hw_events *cpuhw;
 	long i;
 	unsigned long flags;
 
 	local_irq_save(flags);
-	perf_disable();
+	perf_pmu_disable(event->pmu);
 
 	power_pmu_read(event);
 
@@ -821,34 +829,60 @@ static void power_pmu_disable(struct perf_event *event)
 		cpuhw->mmcr[0] &= ~(MMCR0_PMXE | MMCR0_FCECE);
 	}
 
-	perf_enable();
+	perf_pmu_enable(event->pmu);
 	local_irq_restore(flags);
 }
 
 /*
- * Re-enable interrupts on a event after they were throttled
- * because they were coming too fast.
+ * POWER-PMU does not support disabling individual counters, hence
+ * program their cycle counter to their max value and ignore the interrupts.
  */
-static void power_pmu_unthrottle(struct perf_event *event)
+
+static void power_pmu_start(struct perf_event *event, int ef_flags)
+{
+	unsigned long flags;
+	s64 left;
+
+	if (!event->hw.idx || !event->hw.sample_period)
+		return;
+
+	if (!(event->hw.state & PERF_HES_STOPPED))
+		return;
+
+	if (ef_flags & PERF_EF_RELOAD)
+		WARN_ON_ONCE(!(event->hw.state & PERF_HES_UPTODATE));
+
+	local_irq_save(flags);
+	perf_pmu_disable(event->pmu);
+
+	event->hw.state = 0;
+	left = local64_read(&event->hw.period_left);
+	write_pmc(event->hw.idx, left);
+
+	perf_event_update_userpage(event);
+	perf_pmu_enable(event->pmu);
+	local_irq_restore(flags);
+}
+
+static void power_pmu_stop(struct perf_event *event, int ef_flags)
 {
-	s64 val, left;
 	unsigned long flags;
 
 	if (!event->hw.idx || !event->hw.sample_period)
 		return;
+
+	if (event->hw.state & PERF_HES_STOPPED)
+		return;
+
 	local_irq_save(flags);
-	perf_disable();
+	perf_pmu_disable(event->pmu);
+
 	power_pmu_read(event);
-	left = event->hw.sample_period;
-	event->hw.last_period = left;
-	val = 0;
-	if (left < 0x80000000L)
-		val = 0x80000000L - left;
-	write_pmc(event->hw.idx, val);
-	local64_set(&event->hw.prev_count, val);
-	local64_set(&event->hw.period_left, left);
+	event->hw.state |= PERF_HES_STOPPED | PERF_HES_UPTODATE;
+	write_pmc(event->hw.idx, 0);
+
 	perf_event_update_userpage(event);
-	perf_enable();
+	perf_pmu_enable(event->pmu);
 	local_irq_restore(flags);
 }
 
@@ -857,10 +891,11 @@ static void power_pmu_unthrottle(struct perf_event *event)
  * Set the flag to make pmu::enable() not perform the
  * schedulability test, it will be performed at commit time
  */
-void power_pmu_start_txn(const struct pmu *pmu)
+void power_pmu_start_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuhw = &__get_cpu_var(cpu_hw_events);
 
+	perf_pmu_disable(pmu);
 	cpuhw->group_flag |= PERF_EVENT_TXN;
 	cpuhw->n_txn_start = cpuhw->n_events;
 }
@@ -870,11 +905,12 @@ void power_pmu_start_txn(const struct pmu *pmu)
  * Clear the flag and pmu::enable() will perform the
  * schedulability test.
  */
-void power_pmu_cancel_txn(const struct pmu *pmu)
+void power_pmu_cancel_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuhw = &__get_cpu_var(cpu_hw_events);
 
 	cpuhw->group_flag &= ~PERF_EVENT_TXN;
+	perf_pmu_enable(pmu);
 }
 
 /*
@@ -882,7 +918,7 @@ void power_pmu_cancel_txn(const struct pmu *pmu)
  * Perform the group schedulability test as a whole
  * Return 0 if success
  */
-int power_pmu_commit_txn(const struct pmu *pmu)
+int power_pmu_commit_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuhw;
 	long i, n;
@@ -901,19 +937,10 @@ int power_pmu_commit_txn(const struct pmu *pmu)
 		cpuhw->event[i]->hw.config = cpuhw->events[i];
 
 	cpuhw->group_flag &= ~PERF_EVENT_TXN;
+	perf_pmu_enable(pmu);
 	return 0;
 }
 
-struct pmu power_pmu = {
-	.enable		= power_pmu_enable,
-	.disable	= power_pmu_disable,
-	.read		= power_pmu_read,
-	.unthrottle	= power_pmu_unthrottle,
-	.start_txn	= power_pmu_start_txn,
-	.cancel_txn	= power_pmu_cancel_txn,
-	.commit_txn	= power_pmu_commit_txn,
-};
-
 /*
  * Return 1 if we might be able to put event on a limited PMC,
  * or 0 if not.
@@ -1014,7 +1041,7 @@ static int hw_perf_cache_event(u64 config, u64 *eventp)
 	return 0;
 }
 
-const struct pmu *hw_perf_event_init(struct perf_event *event)
+static int power_pmu_event_init(struct perf_event *event)
 {
 	u64 ev;
 	unsigned long flags;
@@ -1026,25 +1053,27 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 	struct cpu_hw_events *cpuhw;
 
 	if (!ppmu)
-		return ERR_PTR(-ENXIO);
+		return -ENOENT;
+
 	switch (event->attr.type) {
 	case PERF_TYPE_HARDWARE:
 		ev = event->attr.config;
 		if (ev >= ppmu->n_generic || ppmu->generic_events[ev] == 0)
-			return ERR_PTR(-EOPNOTSUPP);
+			return -EOPNOTSUPP;
 		ev = ppmu->generic_events[ev];
 		break;
 	case PERF_TYPE_HW_CACHE:
 		err = hw_perf_cache_event(event->attr.config, &ev);
 		if (err)
-			return ERR_PTR(err);
+			return err;
 		break;
 	case PERF_TYPE_RAW:
 		ev = event->attr.config;
 		break;
 	default:
-		return ERR_PTR(-EINVAL);
+		return -ENOENT;
 	}
+
 	event->hw.config_base = ev;
 	event->hw.idx = 0;
 
@@ -1063,7 +1092,7 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 	 * XXX we should check if the task is an idle task.
 	 */
 	flags = 0;
-	if (event->ctx->task)
+	if (event->attach_state & PERF_ATTACH_TASK)
 		flags |= PPMU_ONLY_COUNT_RUN;
 
 	/*
@@ -1081,7 +1110,7 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 			 */
 			ev = normal_pmc_alternative(ev, flags);
 			if (!ev)
-				return ERR_PTR(-EINVAL);
+				return -EINVAL;
 		}
 	}
 
@@ -1095,19 +1124,19 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 		n = collect_events(event->group_leader, ppmu->n_counter - 1,
 				   ctrs, events, cflags);
 		if (n < 0)
-			return ERR_PTR(-EINVAL);
+			return -EINVAL;
 	}
 	events[n] = ev;
 	ctrs[n] = event;
 	cflags[n] = flags;
 	if (check_excludes(ctrs, cflags, n, 1))
-		return ERR_PTR(-EINVAL);
+		return -EINVAL;
 
 	cpuhw = &get_cpu_var(cpu_hw_events);
 	err = power_check_constraints(cpuhw, events, cflags, n + 1);
 	put_cpu_var(cpu_hw_events);
 	if (err)
-		return ERR_PTR(-EINVAL);
+		return -EINVAL;
 
 	event->hw.config = events[n];
 	event->hw.event_base = cflags[n];
@@ -1132,11 +1161,23 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 	}
 	event->destroy = hw_perf_event_destroy;
 
-	if (err)
-		return ERR_PTR(err);
-	return &power_pmu;
+	return err;
 }
 
+struct pmu power_pmu = {
+	.pmu_enable	= power_pmu_enable,
+	.pmu_disable	= power_pmu_disable,
+	.event_init	= power_pmu_event_init,
+	.add		= power_pmu_add,
+	.del		= power_pmu_del,
+	.start		= power_pmu_start,
+	.stop		= power_pmu_stop,
+	.read		= power_pmu_read,
+	.start_txn	= power_pmu_start_txn,
+	.cancel_txn	= power_pmu_cancel_txn,
+	.commit_txn	= power_pmu_commit_txn,
+};
+
 /*
  * A counter has overflowed; update its count and record
  * things if requested.  Note that interrupts are hard-disabled
@@ -1149,6 +1190,11 @@ static void record_and_restart(struct perf_event *event, unsigned long val,
 	s64 prev, delta, left;
 	int record = 0;
 
+	if (event->hw.state & PERF_HES_STOPPED) {
+		write_pmc(event->hw.idx, 0);
+		return;
+	}
+
 	/* we don't have to worry about interrupts here */
 	prev = local64_read(&event->hw.prev_count);
 	delta = (val - prev) & 0xfffffffful;
@@ -1171,6 +1217,11 @@ static void record_and_restart(struct perf_event *event, unsigned long val,
 			val = 0x80000000LL - left;
 	}
 
+	write_pmc(event->hw.idx, val);
+	local64_set(&event->hw.prev_count, val);
+	local64_set(&event->hw.period_left, left);
+	perf_event_update_userpage(event);
+
 	/*
 	 * Finally record data if requested.
 	 */
@@ -1183,23 +1234,9 @@ static void record_and_restart(struct perf_event *event, unsigned long val,
 		if (event->attr.sample_type & PERF_SAMPLE_ADDR)
 			perf_get_data_addr(regs, &data.addr);
 
-		if (perf_event_overflow(event, nmi, &data, regs)) {
-			/*
-			 * Interrupts are coming too fast - throttle them
-			 * by setting the event to 0, so it will be
-			 * at least 2^30 cycles until the next interrupt
-			 * (assuming each event counts at most 2 counts
-			 * per cycle).
-			 */
-			val = 0;
-			left = ~0ULL >> 1;
-		}
+		if (perf_event_overflow(event, nmi, &data, regs))
+			power_pmu_stop(event, 0);
 	}
-
-	write_pmc(event->hw.idx, val);
-	local64_set(&event->hw.prev_count, val);
-	local64_set(&event->hw.period_left, left);
-	perf_event_update_userpage(event);
 }
 
 /*
@@ -1342,6 +1379,7 @@ int register_power_pmu(struct power_pmu *pmu)
 		freeze_events_kernel = MMCR0_FCHV;
 #endif /* CONFIG_PPC64 */
 
+	perf_pmu_register(&power_pmu);
 	perf_cpu_notifier(power_pmu_notifier);
 
 	return 0;
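
The transaction callbacks above now also bracket the PMU disable/enable, so the core can batch the individual add() calls of a group and do one schedulability check at commit time. Roughly the calling sequence the core is expected to use (a sketch, not the core's actual group_sched_in(); unwinding of partially added siblings is elided):

	#include <linux/list.h>
	#include <linux/perf_event.h>

	static int schedule_group(struct pmu *pmu, struct perf_event *leader)
	{
		struct perf_event *sub;

		pmu->start_txn(pmu);			/* now also disables the PMU */

		if (pmu->add(leader, PERF_EF_START))
			goto fail;
		list_for_each_entry(sub, &leader->sibling_list, group_entry)
			if (pmu->add(sub, PERF_EF_START))
				goto fail;

		if (!pmu->commit_txn(pmu))		/* one constraint check for all */
			return 0;			/* commit re-enables the PMU */
	fail:
		/* A real caller would pmu->del() whatever was already added. */
		pmu->cancel_txn(pmu);			/* roll back and re-enable */
		return -EAGAIN;
	}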

+ 90 - 58
arch/powerpc/kernel/perf_event_fsl_emb.c

@@ -156,6 +156,9 @@ static void fsl_emb_pmu_read(struct perf_event *event)
 {
 	s64 val, delta, prev;
 
+	if (event->hw.state & PERF_HES_STOPPED)
+		return;
+
 	/*
 	 * Performance monitor interrupts come even when interrupts
 	 * are soft-disabled, as long as interrupts are hard-enabled.
@@ -177,7 +180,7 @@ static void fsl_emb_pmu_read(struct perf_event *event)
  * Disable all events to prevent PMU interrupts and to allow
  * events to be added or removed.
  */
-void hw_perf_disable(void)
+static void fsl_emb_pmu_disable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuhw;
 	unsigned long flags;
@@ -216,7 +219,7 @@ void hw_perf_disable(void)
  * If we were previously disabled and events were added, then
  * put the new config on the PMU.
  */
-void hw_perf_enable(void)
+static void fsl_emb_pmu_enable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuhw;
 	unsigned long flags;
@@ -262,8 +265,8 @@ static int collect_events(struct perf_event *group, int max_count,
 	return n;
 }
 
-/* perf must be disabled, context locked on entry */
-static int fsl_emb_pmu_enable(struct perf_event *event)
+/* context locked on entry */
+static int fsl_emb_pmu_add(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuhw;
 	int ret = -EAGAIN;
@@ -271,6 +274,7 @@ static int fsl_emb_pmu_enable(struct perf_event *event)
 	u64 val;
 	int i;
 
+	perf_pmu_disable(event->pmu);
 	cpuhw = &get_cpu_var(cpu_hw_events);
 
 	if (event->hw.config & FSL_EMB_EVENT_RESTRICTED)
@@ -301,6 +305,12 @@ static int fsl_emb_pmu_enable(struct perf_event *event)
 			val = 0x80000000L - left;
 	}
 	local64_set(&event->hw.prev_count, val);
+
+	if (!(flags & PERF_EF_START)) {
+		event->hw.state = PERF_HES_STOPPED | PERF_HES_UPTODATE;
+		val = 0;
+	}
+
 	write_pmc(i, val);
 	perf_event_update_userpage(event);
 
@@ -310,15 +320,17 @@ static int fsl_emb_pmu_enable(struct perf_event *event)
 	ret = 0;
  out:
 	put_cpu_var(cpu_hw_events);
+	perf_pmu_enable(event->pmu);
 	return ret;
 }
 
-/* perf must be disabled, context locked on entry */
-static void fsl_emb_pmu_disable(struct perf_event *event)
+/* context locked on entry */
+static void fsl_emb_pmu_del(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuhw;
 	int i = event->hw.idx;
 
+	perf_pmu_disable(event->pmu);
 	if (i < 0)
 		goto out;
 
@@ -346,44 +358,57 @@ static void fsl_emb_pmu_disable(struct perf_event *event)
 	cpuhw->n_events--;
 
  out:
+	perf_pmu_enable(event->pmu);
 	put_cpu_var(cpu_hw_events);
 }
 
-/*
- * Re-enable interrupts on a event after they were throttled
- * because they were coming too fast.
- *
- * Context is locked on entry, but perf is not disabled.
- */
-static void fsl_emb_pmu_unthrottle(struct perf_event *event)
+static void fsl_emb_pmu_start(struct perf_event *event, int ef_flags)
 {
-	s64 val, left;
 	unsigned long flags;
+	s64 left;
 
 	if (event->hw.idx < 0 || !event->hw.sample_period)
 		return;
+
+	if (!(event->hw.state & PERF_HES_STOPPED))
+		return;
+
+	if (ef_flags & PERF_EF_RELOAD)
+		WARN_ON_ONCE(!(event->hw.state & PERF_HES_UPTODATE));
+
 	local_irq_save(flags);
-	perf_disable();
-	fsl_emb_pmu_read(event);
-	left = event->hw.sample_period;
-	event->hw.last_period = left;
-	val = 0;
-	if (left < 0x80000000L)
-		val = 0x80000000L - left;
-	write_pmc(event->hw.idx, val);
-	local64_set(&event->hw.prev_count, val);
-	local64_set(&event->hw.period_left, left);
+	perf_pmu_disable(event->pmu);
+
+	event->hw.state = 0;
+	left = local64_read(&event->hw.period_left);
+	write_pmc(event->hw.idx, left);
+
 	perf_event_update_userpage(event);
-	perf_enable();
+	perf_pmu_enable(event->pmu);
 	local_irq_restore(flags);
 }
 
-static struct pmu fsl_emb_pmu = {
-	.enable		= fsl_emb_pmu_enable,
-	.disable	= fsl_emb_pmu_disable,
-	.read		= fsl_emb_pmu_read,
-	.unthrottle	= fsl_emb_pmu_unthrottle,
-};
+static void fsl_emb_pmu_stop(struct perf_event *event, int ef_flags)
+{
+	unsigned long flags;
+
+	if (event->hw.idx < 0 || !event->hw.sample_period)
+		return;
+
+	if (event->hw.state & PERF_HES_STOPPED)
+		return;
+
+	local_irq_save(flags);
+	perf_pmu_disable(event->pmu);
+
+	fsl_emb_pmu_read(event);
+	event->hw.state |= PERF_HES_STOPPED | PERF_HES_UPTODATE;
+	write_pmc(event->hw.idx, 0);
+
+	perf_event_update_userpage(event);
+	perf_pmu_enable(event->pmu);
+	local_irq_restore(flags);
+}
 
 /*
  * Release the PMU if this is the last perf_event.
@@ -428,7 +453,7 @@ static int hw_perf_cache_event(u64 config, u64 *eventp)
 	return 0;
 }
 
-const struct pmu *hw_perf_event_init(struct perf_event *event)
+static int fsl_emb_pmu_event_init(struct perf_event *event)
 {
 	u64 ev;
 	struct perf_event *events[MAX_HWEVENTS];
@@ -441,14 +466,14 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 	case PERF_TYPE_HARDWARE:
 		ev = event->attr.config;
 		if (ev >= ppmu->n_generic || ppmu->generic_events[ev] == 0)
-			return ERR_PTR(-EOPNOTSUPP);
+			return -EOPNOTSUPP;
 		ev = ppmu->generic_events[ev];
 		break;
 
 	case PERF_TYPE_HW_CACHE:
 		err = hw_perf_cache_event(event->attr.config, &ev);
 		if (err)
-			return ERR_PTR(err);
+			return err;
 		break;
 
 	case PERF_TYPE_RAW:
@@ -456,12 +481,12 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 		break;
 
 	default:
-		return ERR_PTR(-EINVAL);
+		return -ENOENT;
 	}
 
 	event->hw.config = ppmu->xlate_event(ev);
 	if (!(event->hw.config & FSL_EMB_EVENT_VALID))
-		return ERR_PTR(-EINVAL);
+		return -EINVAL;
 
 	/*
 	 * If this is in a group, check if it can go on with all the
@@ -473,7 +498,7 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 		n = collect_events(event->group_leader,
 		                   ppmu->n_counter - 1, events);
 		if (n < 0)
-			return ERR_PTR(-EINVAL);
+			return -EINVAL;
 	}
 
 	if (event->hw.config & FSL_EMB_EVENT_RESTRICTED) {
@@ -484,7 +509,7 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 		}
 
 		if (num_restricted >= ppmu->n_restricted)
-			return ERR_PTR(-EINVAL);
+			return -EINVAL;
 	}
 
 	event->hw.idx = -1;
@@ -497,7 +522,7 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 	if (event->attr.exclude_kernel)
 		event->hw.config_base |= PMLCA_FCS;
 	if (event->attr.exclude_idle)
-		return ERR_PTR(-ENOTSUPP);
+		return -ENOTSUPP;
 
 	event->hw.last_period = event->hw.sample_period;
 	local64_set(&event->hw.period_left, event->hw.last_period);
@@ -523,11 +548,20 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 	}
 	event->destroy = hw_perf_event_destroy;
 
-	if (err)
-		return ERR_PTR(err);
-	return &fsl_emb_pmu;
+	return err;
 }
 
+static struct pmu fsl_emb_pmu = {
+	.pmu_enable	= fsl_emb_pmu_enable,
+	.pmu_disable	= fsl_emb_pmu_disable,
+	.event_init	= fsl_emb_pmu_event_init,
+	.add		= fsl_emb_pmu_add,
+	.del		= fsl_emb_pmu_del,
+	.start		= fsl_emb_pmu_start,
+	.stop		= fsl_emb_pmu_stop,
+	.read		= fsl_emb_pmu_read,
+};
+
 /*
  * A counter has overflowed; update its count and record
  * things if requested.  Note that interrupts are hard-disabled
@@ -540,6 +574,11 @@ static void record_and_restart(struct perf_event *event, unsigned long val,
 	s64 prev, delta, left;
 	int record = 0;
 
+	if (event->hw.state & PERF_HES_STOPPED) {
+		write_pmc(event->hw.idx, 0);
+		return;
+	}
+
 	/* we don't have to worry about interrupts here */
 	prev = local64_read(&event->hw.prev_count);
 	delta = (val - prev) & 0xfffffffful;
@@ -562,6 +601,11 @@ static void record_and_restart(struct perf_event *event, unsigned long val,
 			val = 0x80000000LL - left;
 	}
 
+	write_pmc(event->hw.idx, val);
+	local64_set(&event->hw.prev_count, val);
+	local64_set(&event->hw.period_left, left);
+	perf_event_update_userpage(event);
+
 	/*
 	 * Finally record data if requested.
 	 */
@@ -571,23 +615,9 @@ static void record_and_restart(struct perf_event *event, unsigned long val,
 		perf_sample_data_init(&data, 0);
 		data.period = event->hw.last_period;
 
-		if (perf_event_overflow(event, nmi, &data, regs)) {
-			/*
-			 * Interrupts are coming too fast - throttle them
-			 * by setting the event to 0, so it will be
-			 * at least 2^30 cycles until the next interrupt
-			 * (assuming each event counts at most 2 counts
-			 * per cycle).
-			 */
-			val = 0;
-			left = ~0ULL >> 1;
-		}
+		if (perf_event_overflow(event, nmi, &data, regs))
+			fsl_emb_pmu_stop(event, 0);
 	}
-
-	write_pmc(event->hw.idx, val);
-	local64_set(&event->hw.prev_count, val);
-	local64_set(&event->hw.period_left, left);
-	perf_event_update_userpage(event);
 }
 
 static void perf_event_interrupt(struct pt_regs *regs)
@@ -651,5 +681,7 @@ int register_fsl_emb_pmu(struct fsl_emb_pmu *pmu)
 	pr_info("%s performance monitor hardware support registered\n",
 		pmu->name);
 
+	perf_pmu_register(&fsl_emb_pmu);
+
 	return 0;
 }
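
The PERF_HES_STOPPED / PERF_HES_UPTODATE bookkeeping above is the same in every converted driver: stop() masks the counter and, when asked via PERF_EF_UPDATE, folds the hardware count into the event exactly once, while start() may only reload a period after that fold has happened. A condensed sketch of the contract, where the demo_counter_*() helpers are hypothetical stand-ins for the real hardware accessors:

#include <linux/kernel.h>
#include <linux/perf_event.h>

extern void demo_counter_disable(int idx);			/* hypothetical */
extern void demo_counter_enable(int idx);			/* hypothetical */
extern void demo_counter_fold(struct perf_event *event);	/* hypothetical */

static void demo_pmu_stop(struct perf_event *event, int flags)
{
	if (!(event->hw.state & PERF_HES_STOPPED)) {
		demo_counter_disable(event->hw.idx);
		event->hw.state |= PERF_HES_STOPPED;
	}

	if ((flags & PERF_EF_UPDATE) && !(event->hw.state & PERF_HES_UPTODATE)) {
		demo_counter_fold(event);	/* drain hw count into event->count */
		event->hw.state |= PERF_HES_UPTODATE;
	}
}

static void demo_pmu_start(struct perf_event *event, int flags)
{
	/* reloading the period is only valid once the count is up to date */
	if (flags & PERF_EF_RELOAD)
		WARN_ON_ONCE(!(event->hw.state & PERF_HES_UPTODATE));

	event->hw.state = 0;
	demo_counter_enable(event->hw.idx);
}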

+ 21 - 21
arch/powerpc/kernel/time.c

@@ -53,7 +53,7 @@
 #include <linux/posix-timers.h>
 #include <linux/irq.h>
 #include <linux/delay.h>
-#include <linux/perf_event.h>
+#include <linux/irq_work.h>
 #include <asm/trace.h>
 
 #include <asm/io.h>
@@ -493,60 +493,60 @@ void __init iSeries_time_init_early(void)
 }
 #endif /* CONFIG_PPC_ISERIES */
 
-#ifdef CONFIG_PERF_EVENTS
+#ifdef CONFIG_IRQ_WORK
 
 /*
  * 64-bit uses a byte in the PACA, 32-bit uses a per-cpu variable...
  */
 #ifdef CONFIG_PPC64
-static inline unsigned long test_perf_event_pending(void)
+static inline unsigned long test_irq_work_pending(void)
 {
 	unsigned long x;
 
 	asm volatile("lbz %0,%1(13)"
 		: "=r" (x)
-		: "i" (offsetof(struct paca_struct, perf_event_pending)));
+		: "i" (offsetof(struct paca_struct, irq_work_pending)));
 	return x;
 }
 
-static inline void set_perf_event_pending_flag(void)
+static inline void set_irq_work_pending_flag(void)
 {
 	asm volatile("stb %0,%1(13)" : :
 		"r" (1),
-		"i" (offsetof(struct paca_struct, perf_event_pending)));
+		"i" (offsetof(struct paca_struct, irq_work_pending)));
 }
 
-static inline void clear_perf_event_pending(void)
+static inline void clear_irq_work_pending(void)
 {
 	asm volatile("stb %0,%1(13)" : :
 		"r" (0),
-		"i" (offsetof(struct paca_struct, perf_event_pending)));
+		"i" (offsetof(struct paca_struct, irq_work_pending)));
 }
 
 #else /* 32-bit */
 
-DEFINE_PER_CPU(u8, perf_event_pending);
+DEFINE_PER_CPU(u8, irq_work_pending);
 
-#define set_perf_event_pending_flag()	__get_cpu_var(perf_event_pending) = 1
-#define test_perf_event_pending()	__get_cpu_var(perf_event_pending)
-#define clear_perf_event_pending()	__get_cpu_var(perf_event_pending) = 0
+#define set_irq_work_pending_flag()	__get_cpu_var(irq_work_pending) = 1
+#define test_irq_work_pending()		__get_cpu_var(irq_work_pending)
+#define clear_irq_work_pending()	__get_cpu_var(irq_work_pending) = 0
 
 #endif /* 32 vs 64 bit */
 
-void set_perf_event_pending(void)
+void set_irq_work_pending(void)
 {
 	preempt_disable();
-	set_perf_event_pending_flag();
+	set_irq_work_pending_flag();
 	set_dec(1);
 	preempt_enable();
 }
 
-#else  /* CONFIG_PERF_EVENTS */
+#else  /* CONFIG_IRQ_WORK */
 
-#define test_perf_event_pending()	0
-#define clear_perf_event_pending()
+#define test_irq_work_pending()	0
+#define clear_irq_work_pending()
 
-#endif /* CONFIG_PERF_EVENTS */
+#endif /* CONFIG_IRQ_WORK */
 
 /*
  * For iSeries shared processors, we have to let the hypervisor
@@ -587,9 +587,9 @@ void timer_interrupt(struct pt_regs * regs)
 
 	calculate_steal_time();
 
-	if (test_perf_event_pending()) {
-		clear_perf_event_pending();
-		perf_event_do_pending();
+	if (test_irq_work_pending()) {
+		clear_irq_work_pending();
+		irq_work_run();
 	}
 
 #ifdef CONFIG_PPC_ISERIES

+ 1 - 0
arch/s390/Kconfig

@@ -95,6 +95,7 @@ config S390
 	select HAVE_KVM if 64BIT
 	select HAVE_ARCH_TRACEHOOK
 	select INIT_ALL_POSSIBLE
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 	select HAVE_KERNEL_GZIP
 	select HAVE_KERNEL_BZIP2

+ 0 - 4
arch/s390/include/asm/hardirq.h

@@ -12,10 +12,6 @@
 #ifndef __ASM_HARDIRQ_H
 #define __ASM_HARDIRQ_H
 
-#include <linux/threads.h>
-#include <linux/sched.h>
-#include <linux/cache.h>
-#include <linux/interrupt.h>
 #include <asm/lowcore.h>
 
 #define local_softirq_pending() (S390_lowcore.softirq_pending)

+ 1 - 2
arch/s390/include/asm/perf_event.h

@@ -4,7 +4,6 @@
  * Copyright 2009 Martin Schwidefsky, IBM Corporation.
  */
 
-static inline void set_perf_event_pending(void) {}
-static inline void clear_perf_event_pending(void) {}
+/* Empty, just to avoid compiling error */
 
 #define PERF_EVENT_INDEX_OFFSET 0

+ 14 - 0
arch/sh/Kconfig

@@ -16,6 +16,7 @@ config SUPERH
 	select HAVE_ARCH_TRACEHOOK
 	select HAVE_DMA_API_DEBUG
 	select HAVE_DMA_ATTRS
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 	select PERF_USE_VMALLOC
 	select HAVE_KERNEL_GZIP
@@ -249,6 +250,11 @@ config ARCH_SHMOBILE
 	select PM
 	select PM_RUNTIME
 
+config CPU_HAS_PMU
+       depends on CPU_SH4 || CPU_SH4A
+       default y
+       bool
+
 if SUPERH32
 
 choice
@@ -738,6 +744,14 @@ config GUSA_RB
 	  LLSC, this should be more efficient than the other alternative of
 	  disabling interrupts around the atomic sequence.
 
+config HW_PERF_EVENTS
+	bool "Enable hardware performance counter support for perf events"
+	depends on PERF_EVENTS && CPU_HAS_PMU
+	default y
+	help
+	  Enable hardware performance counter support for perf events. If
+	  disabled, perf events will use software events only.
+
 source "drivers/sh/Kconfig"
 
 endmenu

+ 0 - 7
arch/sh/include/asm/perf_event.h

@@ -26,11 +26,4 @@ extern int register_sh_pmu(struct sh_pmu *);
 extern int reserve_pmc_hardware(void);
 extern void release_pmc_hardware(void);
 
-static inline void set_perf_event_pending(void)
-{
-	/* Nothing to see here, move along. */
-}
-
-#define PERF_EVENT_INDEX_OFFSET	0
-
 #endif /* __ASM_SH_PERF_EVENT_H */

+ 4 - 46
arch/sh/kernel/perf_callchain.c

@@ -14,11 +14,6 @@
 #include <asm/unwinder.h>
 #include <asm/ptrace.h>
 
-static inline void callchain_store(struct perf_callchain_entry *entry, u64 ip)
-{
-	if (entry->nr < PERF_MAX_STACK_DEPTH)
-		entry->ip[entry->nr++] = ip;
-}
 
 static void callchain_warning(void *data, char *msg)
 {
@@ -39,7 +34,7 @@ static void callchain_address(void *data, unsigned long addr, int reliable)
 	struct perf_callchain_entry *entry = data;
 
 	if (reliable)
-		callchain_store(entry, addr);
+		perf_callchain_store(entry, addr);
 }
 
 static const struct stacktrace_ops callchain_ops = {
@@ -49,47 +44,10 @@ static const struct stacktrace_ops callchain_ops = {
 	.address	= callchain_address,
 };
 
-static void
-perf_callchain_kernel(struct pt_regs *regs, struct perf_callchain_entry *entry)
+void
+perf_callchain_kernel(struct perf_callchain_entry *entry, struct pt_regs *regs)
 {
-	callchain_store(entry, PERF_CONTEXT_KERNEL);
-	callchain_store(entry, regs->pc);
+	perf_callchain_store(entry, regs->pc);
 
 	unwind_stack(NULL, regs, NULL, &callchain_ops, entry);
 }
-
-static void
-perf_do_callchain(struct pt_regs *regs, struct perf_callchain_entry *entry)
-{
-	int is_user;
-
-	if (!regs)
-		return;
-
-	is_user = user_mode(regs);
-
-	if (is_user && current->state != TASK_RUNNING)
-		return;
-
-	/*
-	 * Only the kernel side is implemented for now.
-	 */
-	if (!is_user)
-		perf_callchain_kernel(regs, entry);
-}
-
-/*
- * No need for separate IRQ and NMI entries.
- */
-static DEFINE_PER_CPU(struct perf_callchain_entry, callchain);
-
-struct perf_callchain_entry *perf_callchain(struct pt_regs *regs)
-{
-	struct perf_callchain_entry *entry = &__get_cpu_var(callchain);
-
-	entry->nr = 0;
-
-	perf_do_callchain(regs, entry);
-
-	return entry;
-}

+ 112 - 47
arch/sh/kernel/perf_event.c

@@ -59,6 +59,24 @@ static inline int sh_pmu_initialized(void)
 	return !!sh_pmu;
 }
 
+const char *perf_pmu_name(void)
+{
+	if (!sh_pmu)
+		return NULL;
+
+	return sh_pmu->name;
+}
+EXPORT_SYMBOL_GPL(perf_pmu_name);
+
+int perf_num_counters(void)
+{
+	if (!sh_pmu)
+		return 0;
+
+	return sh_pmu->num_events;
+}
+EXPORT_SYMBOL_GPL(perf_num_counters);
+
 /*
  * Release the PMU if this is the last perf_event.
  */
@@ -206,50 +224,80 @@ again:
 	local64_add(delta, &event->count);
 }
 
-static void sh_pmu_disable(struct perf_event *event)
+static void sh_pmu_stop(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct hw_perf_event *hwc = &event->hw;
 	int idx = hwc->idx;
 
-	clear_bit(idx, cpuc->active_mask);
-	sh_pmu->disable(hwc, idx);
+	if (!(event->hw.state & PERF_HES_STOPPED)) {
+		sh_pmu->disable(hwc, idx);
+		cpuc->events[idx] = NULL;
+		event->hw.state |= PERF_HES_STOPPED;
+	}
+
+	if ((flags & PERF_EF_UPDATE) && !(event->hw.state & PERF_HES_UPTODATE)) {
+		sh_perf_event_update(event, &event->hw, idx);
+		event->hw.state |= PERF_HES_UPTODATE;
+	}
+}
+
+static void sh_pmu_start(struct perf_event *event, int flags)
+{
+	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
+	struct hw_perf_event *hwc = &event->hw;
+	int idx = hwc->idx;
+
+	if (WARN_ON_ONCE(idx == -1))
+		return;
+
+	if (flags & PERF_EF_RELOAD)
+		WARN_ON_ONCE(!(event->hw.state & PERF_HES_UPTODATE));
 
-	barrier();
+	cpuc->events[idx] = event;
+	event->hw.state = 0;
+	sh_pmu->enable(hwc, idx);
+}
 
-	sh_perf_event_update(event, &event->hw, idx);
+static void sh_pmu_del(struct perf_event *event, int flags)
+{
+	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 
-	cpuc->events[idx] = NULL;
-	clear_bit(idx, cpuc->used_mask);
+	sh_pmu_stop(event, PERF_EF_UPDATE);
+	__clear_bit(event->hw.idx, cpuc->used_mask);
 
 	perf_event_update_userpage(event);
 }
 
-static int sh_pmu_enable(struct perf_event *event)
+static int sh_pmu_add(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct hw_perf_event *hwc = &event->hw;
 	int idx = hwc->idx;
+	int ret = -EAGAIN;
+
+	perf_pmu_disable(event->pmu);
 
-	if (test_and_set_bit(idx, cpuc->used_mask)) {
+	if (__test_and_set_bit(idx, cpuc->used_mask)) {
 		idx = find_first_zero_bit(cpuc->used_mask, sh_pmu->num_events);
 		if (idx == sh_pmu->num_events)
-			return -EAGAIN;
+			goto out;
 
-		set_bit(idx, cpuc->used_mask);
+		__set_bit(idx, cpuc->used_mask);
 		hwc->idx = idx;
 	}
 
 	sh_pmu->disable(hwc, idx);
 
-	cpuc->events[idx] = event;
-	set_bit(idx, cpuc->active_mask);
-
-	sh_pmu->enable(hwc, idx);
+	event->hw.state = PERF_HES_UPTODATE | PERF_HES_STOPPED;
+	if (flags & PERF_EF_START)
+		sh_pmu_start(event, PERF_EF_RELOAD);
 
 	perf_event_update_userpage(event);
-
-	return 0;
+	ret = 0;
+out:
+	perf_pmu_enable(event->pmu);
+	return ret;
 }
 
 static void sh_pmu_read(struct perf_event *event)
@@ -257,24 +305,56 @@ static void sh_pmu_read(struct perf_event *event)
 	sh_perf_event_update(event, &event->hw, event->hw.idx);
 }
 
-static const struct pmu pmu = {
-	.enable		= sh_pmu_enable,
-	.disable	= sh_pmu_disable,
-	.read		= sh_pmu_read,
-};
-
-const struct pmu *hw_perf_event_init(struct perf_event *event)
+static int sh_pmu_event_init(struct perf_event *event)
 {
-	int err = __hw_perf_event_init(event);
+	int err;
+
+	switch (event->attr.type) {
+	case PERF_TYPE_RAW:
+	case PERF_TYPE_HW_CACHE:
+	case PERF_TYPE_HARDWARE:
+		err = __hw_perf_event_init(event);
+		break;
+
+	default:
+		return -ENOENT;
+	}
+
 	if (unlikely(err)) {
 		if (event->destroy)
 			event->destroy(event);
-		return ERR_PTR(err);
 	}
 
-	return &pmu;
+	return err;
+}
+
+static void sh_pmu_enable(struct pmu *pmu)
+{
+	if (!sh_pmu_initialized())
+		return;
+
+	sh_pmu->enable_all();
+}
+
+static void sh_pmu_disable(struct pmu *pmu)
+{
+	if (!sh_pmu_initialized())
+		return;
+
+	sh_pmu->disable_all();
 }
 
+static struct pmu pmu = {
+	.pmu_enable	= sh_pmu_enable,
+	.pmu_disable	= sh_pmu_disable,
+	.event_init	= sh_pmu_event_init,
+	.add		= sh_pmu_add,
+	.del		= sh_pmu_del,
+	.start		= sh_pmu_start,
+	.stop		= sh_pmu_stop,
+	.read		= sh_pmu_read,
+};
+
 static void sh_pmu_setup(int cpu)
 {
 	struct cpu_hw_events *cpuhw = &per_cpu(cpu_hw_events, cpu);
@@ -299,32 +379,17 @@ sh_pmu_notifier(struct notifier_block *self, unsigned long action, void *hcpu)
 	return NOTIFY_OK;
 }
 
-void hw_perf_enable(void)
-{
-	if (!sh_pmu_initialized())
-		return;
-
-	sh_pmu->enable_all();
-}
-
-void hw_perf_disable(void)
-{
-	if (!sh_pmu_initialized())
-		return;
-
-	sh_pmu->disable_all();
-}
-
-int __cpuinit register_sh_pmu(struct sh_pmu *pmu)
+int __cpuinit register_sh_pmu(struct sh_pmu *_pmu)
 {
 	if (sh_pmu)
 		return -EBUSY;
-	sh_pmu = pmu;
+	sh_pmu = _pmu;
 
-	pr_info("Performance Events: %s support registered\n", pmu->name);
+	pr_info("Performance Events: %s support registered\n", _pmu->name);
 
-	WARN_ON(pmu->num_events > MAX_HWEVENTS);
+	WARN_ON(_pmu->num_events > MAX_HWEVENTS);
 
+	perf_pmu_register(&pmu);
 	perf_cpu_notifier(sh_pmu_notifier);
 	return 0;
 }
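
perf_pmu_name() and perf_num_counters() are the new exported hooks that the shared oprofile_perf glue (used by the sh oprofile conversion below) keys off. A trivial, hypothetical consumer:

#include <linux/kernel.h>
#include <linux/perf_event.h>

void demo_report_pmu(void)
{
	const char *name = perf_pmu_name();

	pr_info("PMU: %s, %d counters\n",
		name ? name : "none", perf_num_counters());
}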

+ 4 - 0
arch/sh/oprofile/Makefile

@@ -6,4 +6,8 @@ DRIVER_OBJS = $(addprefix ../../../drivers/oprofile/, \
 		oprofilefs.o oprofile_stats.o \
 		timer_int.o )
 
+ifeq ($(CONFIG_HW_PERF_EVENTS),y)
+DRIVER_OBJS += $(addprefix ../../../drivers/oprofile/, oprofile_perf.o)
+endif
+
 oprofile-y	:= $(DRIVER_OBJS) common.o backtrace.o

+ 23 - 92
arch/sh/oprofile/common.c

@@ -17,114 +17,45 @@
 #include <linux/init.h>
 #include <linux/errno.h>
 #include <linux/smp.h>
+#include <linux/perf_event.h>
 #include <asm/processor.h>
-#include "op_impl.h"
-
-static struct op_sh_model *model;
-
-static struct op_counter_config ctr[20];
 
+#ifdef CONFIG_HW_PERF_EVENTS
 extern void sh_backtrace(struct pt_regs * const regs, unsigned int depth);
 
-static int op_sh_setup(void)
-{
-	/* Pre-compute the values to stuff in the hardware registers.  */
-	model->reg_setup(ctr);
-
-	/* Configure the registers on all cpus.  */
-	on_each_cpu(model->cpu_setup, NULL, 1);
-
-        return 0;
-}
-
-static int op_sh_create_files(struct super_block *sb, struct dentry *root)
+char *op_name_from_perf_id(void)
 {
-	int i, ret = 0;
+	const char *pmu;
+	char buf[20];
+	int size;
 
-	for (i = 0; i < model->num_counters; i++) {
-		struct dentry *dir;
-		char buf[4];
+	pmu = perf_pmu_name();
+	if (!pmu)
+		return NULL;
 
-		snprintf(buf, sizeof(buf), "%d", i);
-		dir = oprofilefs_mkdir(sb, root, buf);
+	size = snprintf(buf, sizeof(buf), "sh/%s", pmu);
+	if (size > -1 && size < sizeof(buf))
+		return buf;
 
-		ret |= oprofilefs_create_ulong(sb, dir, "enabled", &ctr[i].enabled);
-		ret |= oprofilefs_create_ulong(sb, dir, "event", &ctr[i].event);
-		ret |= oprofilefs_create_ulong(sb, dir, "kernel", &ctr[i].kernel);
-		ret |= oprofilefs_create_ulong(sb, dir, "user", &ctr[i].user);
-
-		if (model->create_files)
-			ret |= model->create_files(sb, dir);
-		else
-			ret |= oprofilefs_create_ulong(sb, dir, "count", &ctr[i].count);
-
-		/* Dummy entries */
-		ret |= oprofilefs_create_ulong(sb, dir, "unit_mask", &ctr[i].unit_mask);
-	}
-
-	return ret;
+	return NULL;
 }
 
-static int op_sh_start(void)
+int __init oprofile_arch_init(struct oprofile_operations *ops)
 {
-	/* Enable performance monitoring for all counters.  */
-	on_each_cpu(model->cpu_start, NULL, 1);
+	ops->backtrace = sh_backtrace;
 
-	return 0;
+	return oprofile_perf_init(ops);
 }
 
-static void op_sh_stop(void)
+void __exit oprofile_arch_exit(void)
 {
-	/* Disable performance monitoring for all counters.  */
-	on_each_cpu(model->cpu_stop, NULL, 1);
+	oprofile_perf_exit();
 }
-
+#else
 int __init oprofile_arch_init(struct oprofile_operations *ops)
 {
-	struct op_sh_model *lmodel = NULL;
-	int ret;
-
-	/*
-	 * Always assign the backtrace op. If the counter initialization
-	 * fails, we fall back to the timer which will still make use of
-	 * this.
-	 */
-	ops->backtrace = sh_backtrace;
-
-	/*
-	 * XXX
-	 *
-	 * All of the SH7750/SH-4A counters have been converted to perf,
-	 * this infrastructure hook is left for other users until they've
-	 * had a chance to convert over, at which point all of this
-	 * will be deleted.
-	 */
-
-	if (!lmodel)
-		return -ENODEV;
-	if (!(current_cpu_data.flags & CPU_HAS_PERF_COUNTER))
-		return -ENODEV;
-
-	ret = lmodel->init();
-	if (unlikely(ret != 0))
-		return ret;
-
-	model = lmodel;
-
-	ops->setup		= op_sh_setup;
-	ops->create_files	= op_sh_create_files;
-	ops->start		= op_sh_start;
-	ops->stop		= op_sh_stop;
-	ops->cpu_type		= lmodel->cpu_type;
-
-	printk(KERN_INFO "oprofile: using %s performance monitoring.\n",
-	       lmodel->cpu_type);
-
-	return 0;
-}
-
-void oprofile_arch_exit(void)
-{
-	if (model && model->exit)
-		model->exit();
+	pr_info("oprofile: hardware counters not available\n");
+	return -ENODEV;
 }
+void __exit oprofile_arch_exit(void) {}
+#endif /* CONFIG_HW_PERF_EVENTS */

+ 0 - 33
arch/sh/oprofile/op_impl.h

@@ -1,33 +0,0 @@
-#ifndef __OP_IMPL_H
-#define __OP_IMPL_H
-
-/* Per-counter configuration as set via oprofilefs.  */
-struct op_counter_config {
-	unsigned long enabled;
-	unsigned long event;
-
-	unsigned long count;
-
-	/* Dummy values for userspace tool compliance */
-	unsigned long kernel;
-	unsigned long user;
-	unsigned long unit_mask;
-};
-
-/* Per-architecture configury and hooks.  */
-struct op_sh_model {
-	void (*reg_setup)(struct op_counter_config *);
-	int (*create_files)(struct super_block *sb, struct dentry *dir);
-	void (*cpu_setup)(void *dummy);
-	int (*init)(void);
-	void (*exit)(void);
-	void (*cpu_start)(void *args);
-	void (*cpu_stop)(void *args);
-	char *cpu_type;
-	unsigned char num_counters;
-};
-
-/* arch/sh/oprofile/common.c */
-extern void sh_backtrace(struct pt_regs * const regs, unsigned int depth);
-
-#endif /* __OP_IMPL_H */

+ 3 - 0
arch/sparc/Kconfig

@@ -26,10 +26,12 @@ config SPARC
 	select ARCH_WANT_OPTIONAL_GPIOLIB
 	select RTC_CLASS
 	select RTC_DRV_M48T59
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 	select PERF_USE_VMALLOC
 	select HAVE_DMA_ATTRS
 	select HAVE_DMA_API_DEBUG
+	select HAVE_ARCH_JUMP_LABEL
 
 config SPARC32
 	def_bool !64BIT
@@ -53,6 +55,7 @@ config SPARC64
 	select RTC_DRV_BQ4802
 	select RTC_DRV_SUN4V
 	select RTC_DRV_STARFIRE
+	select HAVE_IRQ_WORK
 	select HAVE_PERF_EVENTS
 	select PERF_USE_VMALLOC
 

+ 32 - 0
arch/sparc/include/asm/jump_label.h

@@ -0,0 +1,32 @@
+#ifndef _ASM_SPARC_JUMP_LABEL_H
+#define _ASM_SPARC_JUMP_LABEL_H
+
+#ifdef __KERNEL__
+
+#include <linux/types.h>
+#include <asm/system.h>
+
+#define JUMP_LABEL_NOP_SIZE 4
+
+#define JUMP_LABEL(key, label)					\
+	do {							\
+		asm goto("1:\n\t"				\
+			 "nop\n\t"				\
+			 "nop\n\t"				\
+			 ".pushsection __jump_table,  \"a\"\n\t"\
+			 ".word 1b, %l[" #label "], %c0\n\t"	\
+			 ".popsection \n\t"			\
+			 : :  "i" (key) :  : label);\
+	} while (0)
+
+#endif /* __KERNEL__ */
+
+typedef u32 jump_label_t;
+
+struct jump_entry {
+	jump_label_t code;
+	jump_label_t target;
+	jump_label_t key;
+};
+
+#endif

+ 0 - 4
arch/sparc/include/asm/perf_event.h

@@ -1,10 +1,6 @@
 #ifndef __ASM_SPARC_PERF_EVENT_H
 #define __ASM_SPARC_PERF_EVENT_H
 
-extern void set_perf_event_pending(void);
-
-#define	PERF_EVENT_INDEX_OFFSET	0
-
 #ifdef CONFIG_PERF_EVENTS
 #include <asm/ptrace.h>
 

+ 2 - 0
arch/sparc/kernel/Makefile

@@ -119,3 +119,5 @@ obj-$(CONFIG_COMPAT)    += $(audit--y)
 
 pc--$(CONFIG_PERF_EVENTS) := perf_event.o
 obj-$(CONFIG_SPARC64)	+= $(pc--y)
+
+obj-$(CONFIG_SPARC64)	+= jump_label.o

+ 47 - 0
arch/sparc/kernel/jump_label.c

@@ -0,0 +1,47 @@
+#include <linux/kernel.h>
+#include <linux/types.h>
+#include <linux/mutex.h>
+#include <linux/cpu.h>
+
+#include <linux/jump_label.h>
+#include <linux/memory.h>
+
+#ifdef HAVE_JUMP_LABEL
+
+void arch_jump_label_transform(struct jump_entry *entry,
+			       enum jump_label_type type)
+{
+	u32 val;
+	u32 *insn = (u32 *) (unsigned long) entry->code;
+
+	if (type == JUMP_LABEL_ENABLE) {
+		s32 off = (s32)entry->target - (s32)entry->code;
+
+#ifdef CONFIG_SPARC64
+		/* ba,pt %xcc, . + (off << 2) */
+		val = 0x10680000 | ((u32) off >> 2);
+#else
+		/* ba . + (off << 2) */
+		val = 0x10800000 | ((u32) off >> 2);
+#endif
+	} else {
+		val = 0x01000000;
+	}
+
+	get_online_cpus();
+	mutex_lock(&text_mutex);
+	*insn = val;
+	flushi(insn);
+	mutex_unlock(&text_mutex);
+	put_online_cpus();
+}
+
+void arch_jump_label_text_poke_early(jump_label_t addr)
+{
+	u32 *insn_p = (u32 *) (unsigned long) addr;
+
+	*insn_p = 0x01000000;
+	flushi(insn_p);
+}
+
+#endif
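
What a consumer of these pieces looks like (the perf and tracepoint call sites live elsewhere in this merge): the key is the address of an integer, the straight-line path is the nop written by arch_jump_label_text_poke_early(), and enabling the key later turns that nop into a branch through arch_jump_label_transform() above. A hypothetical sketch; demo_key, demo_hook() and demo_trace() are made-up names:

#include <linux/jump_label.h>

static int demo_key;		/* sites are identified by this variable's address */

static void demo_trace(void)	/* hypothetical slow path */
{
}

void demo_hook(void)
{
	JUMP_LABEL(&demo_key, do_trace);	/* costs one nop while disabled */
	return;
do_trace:
	demo_trace();
}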

+ 6 - 0
arch/sparc/kernel/module.c

@@ -18,6 +18,9 @@
 #include <asm/spitfire.h>
 
 #ifdef CONFIG_SPARC64
+
+#include <linux/jump_label.h>
+
 static void *module_map(unsigned long size)
 {
 	struct vm_struct *area;
@@ -227,6 +230,9 @@ int module_finalize(const Elf_Ehdr *hdr,
 		    const Elf_Shdr *sechdrs,
 		    struct module *me)
 {
+	/* make jump label nops */
+	jump_label_apply_nops(me);
+
 	/* Cheetah's I-cache is fully coherent.  */
 	if (tlb_type == spitfire) {
 		unsigned long va;

+ 4 - 4
arch/sparc/kernel/pcr.c

@@ -7,7 +7,7 @@
 #include <linux/init.h>
 #include <linux/irq.h>
 
-#include <linux/perf_event.h>
+#include <linux/irq_work.h>
 #include <linux/ftrace.h>
 
 #include <asm/pil.h>
@@ -43,14 +43,14 @@ void __irq_entry deferred_pcr_work_irq(int irq, struct pt_regs *regs)
 
 	old_regs = set_irq_regs(regs);
 	irq_enter();
-#ifdef CONFIG_PERF_EVENTS
-	perf_event_do_pending();
+#ifdef CONFIG_IRQ_WORK
+	irq_work_run();
 #endif
 	irq_exit();
 	set_irq_regs(old_regs);
 }
 
-void set_perf_event_pending(void)
+void arch_irq_work_raise(void)
 {
 	set_softint(1 << PIL_DEFERRED_PCR_WORK);
 }
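
Together with the powerpc time.c hunk above, this completes the per-architecture contract for the new irq_work layer: arch_irq_work_raise() forces a self-interrupt, and the handler for that interrupt calls irq_work_run() to process callbacks queued with irq_work_queue(). An architecture-neutral sketch; the pending flag and trigger_self_interrupt() are hypothetical stand-ins for set_dec(1) / set_softint() style primitives (the powerpc version also brackets the raise with preempt_disable()/preempt_enable()):

#include <linux/types.h>
#include <linux/percpu.h>
#include <linux/irq_work.h>

extern void trigger_self_interrupt(void);	/* hypothetical */

static DEFINE_PER_CPU(u8, demo_irq_work_pending);

void arch_irq_work_raise(void)
{
	__get_cpu_var(demo_irq_work_pending) = 1;
	trigger_self_interrupt();
}

/* called from the architecture's interrupt handler */
void demo_handle_self_interrupt(void)
{
	if (__get_cpu_var(demo_irq_work_pending)) {
		__get_cpu_var(demo_irq_work_pending) = 0;
		irq_work_run();
	}
}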

+ 123 - 117
arch/sparc/kernel/perf_event.c

@@ -658,13 +658,16 @@ static u64 maybe_change_configuration(struct cpu_hw_events *cpuc, u64 pcr)
 
 		enc = perf_event_get_enc(cpuc->events[i]);
 		pcr &= ~mask_for_index(idx);
-		pcr |= event_encoding(enc, idx);
+		if (hwc->state & PERF_HES_STOPPED)
+			pcr |= nop_for_index(idx);
+		else
+			pcr |= event_encoding(enc, idx);
 	}
 out:
 	return pcr;
 }
 
-void hw_perf_enable(void)
+static void sparc_pmu_enable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	u64 pcr;
@@ -691,7 +694,7 @@ void hw_perf_enable(void)
 	pcr_ops->write(cpuc->pcr);
 }
 
-void hw_perf_disable(void)
+static void sparc_pmu_disable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	u64 val;
@@ -710,19 +713,65 @@ void hw_perf_disable(void)
 	pcr_ops->write(cpuc->pcr);
 }
 
-static void sparc_pmu_disable(struct perf_event *event)
+static int active_event_index(struct cpu_hw_events *cpuc,
+			      struct perf_event *event)
+{
+	int i;
+
+	for (i = 0; i < cpuc->n_events; i++) {
+		if (cpuc->event[i] == event)
+			break;
+	}
+	BUG_ON(i == cpuc->n_events);
+	return cpuc->current_idx[i];
+}
+
+static void sparc_pmu_start(struct perf_event *event, int flags)
+{
+	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
+	int idx = active_event_index(cpuc, event);
+
+	if (flags & PERF_EF_RELOAD) {
+		WARN_ON_ONCE(!(event->hw.state & PERF_HES_UPTODATE));
+		sparc_perf_event_set_period(event, &event->hw, idx);
+	}
+
+	event->hw.state = 0;
+
+	sparc_pmu_enable_event(cpuc, &event->hw, idx);
+}
+
+static void sparc_pmu_stop(struct perf_event *event, int flags)
+{
+	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
+	int idx = active_event_index(cpuc, event);
+
+	if (!(event->hw.state & PERF_HES_STOPPED)) {
+		sparc_pmu_disable_event(cpuc, &event->hw, idx);
+		event->hw.state |= PERF_HES_STOPPED;
+	}
+
+	if (!(event->hw.state & PERF_HES_UPTODATE) && (flags & PERF_EF_UPDATE)) {
+		sparc_perf_event_update(event, &event->hw, idx);
+		event->hw.state |= PERF_HES_UPTODATE;
+	}
+}
+
+static void sparc_pmu_del(struct perf_event *event, int _flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
-	struct hw_perf_event *hwc = &event->hw;
 	unsigned long flags;
 	int i;
 
 	local_irq_save(flags);
-	perf_disable();
+	perf_pmu_disable(event->pmu);
 
 	for (i = 0; i < cpuc->n_events; i++) {
 		if (event == cpuc->event[i]) {
-			int idx = cpuc->current_idx[i];
+			/* Absorb the final count and turn off the
+			 * event.
+			 */
+			sparc_pmu_stop(event, PERF_EF_UPDATE);
 
 			/* Shift remaining entries down into
 			 * the existing slot.
@@ -734,13 +783,6 @@ static void sparc_pmu_disable(struct perf_event *event)
 					cpuc->current_idx[i];
 			}
 
-			/* Absorb the final count and turn off the
-			 * event.
-			 */
-			sparc_pmu_disable_event(cpuc, hwc, idx);
-			barrier();
-			sparc_perf_event_update(event, hwc, idx);
-
 			perf_event_update_userpage(event);
 
 			cpuc->n_events--;
@@ -748,23 +790,10 @@ static void sparc_pmu_disable(struct perf_event *event)
 		}
 	}
 
-	perf_enable();
+	perf_pmu_enable(event->pmu);
 	local_irq_restore(flags);
 }
 
-static int active_event_index(struct cpu_hw_events *cpuc,
-			      struct perf_event *event)
-{
-	int i;
-
-	for (i = 0; i < cpuc->n_events; i++) {
-		if (cpuc->event[i] == event)
-			break;
-	}
-	BUG_ON(i == cpuc->n_events);
-	return cpuc->current_idx[i];
-}
-
 static void sparc_pmu_read(struct perf_event *event)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
@@ -774,15 +803,6 @@ static void sparc_pmu_read(struct perf_event *event)
 	sparc_perf_event_update(event, hwc, idx);
 }
 
-static void sparc_pmu_unthrottle(struct perf_event *event)
-{
-	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
-	int idx = active_event_index(cpuc, event);
-	struct hw_perf_event *hwc = &event->hw;
-
-	sparc_pmu_enable_event(cpuc, hwc, idx);
-}
-
 static atomic_t active_events = ATOMIC_INIT(0);
 static DEFINE_MUTEX(pmc_grab_mutex);
 
@@ -877,7 +897,7 @@ static int sparc_check_constraints(struct perf_event **evts,
 	if (!n_ev)
 		return 0;
 
-	if (n_ev > perf_max_events)
+	if (n_ev > MAX_HWEVENTS)
 		return -1;
 
 	msk0 = perf_event_get_msk(events[0]);
@@ -984,23 +1004,27 @@ static int collect_events(struct perf_event *group, int max_count,
 	return n;
 }
 
-static int sparc_pmu_enable(struct perf_event *event)
+static int sparc_pmu_add(struct perf_event *event, int ef_flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	int n0, ret = -EAGAIN;
 	unsigned long flags;
 
 	local_irq_save(flags);
-	perf_disable();
+	perf_pmu_disable(event->pmu);
 
 	n0 = cpuc->n_events;
-	if (n0 >= perf_max_events)
+	if (n0 >= MAX_HWEVENTS)
 		goto out;
 
 	cpuc->event[n0] = event;
 	cpuc->events[n0] = event->hw.event_base;
 	cpuc->current_idx[n0] = PIC_NO_INDEX;
 
+	event->hw.state = PERF_HES_UPTODATE;
+	if (!(ef_flags & PERF_EF_START))
+		event->hw.state |= PERF_HES_STOPPED;
+
 	/*
 	 * If group events scheduling transaction was started,
	 * skip the schedulability test here, it will be performed
@@ -1020,12 +1044,12 @@ nocheck:
 
 	ret = 0;
 out:
-	perf_enable();
+	perf_pmu_enable(event->pmu);
 	local_irq_restore(flags);
 	return ret;
 }
 
-static int __hw_perf_event_init(struct perf_event *event)
+static int sparc_pmu_event_init(struct perf_event *event)
 {
 	struct perf_event_attr *attr = &event->attr;
 	struct perf_event *evts[MAX_HWEVENTS];
@@ -1038,22 +1062,33 @@ static int __hw_perf_event_init(struct perf_event *event)
 	if (atomic_read(&nmi_active) < 0)
 		return -ENODEV;
 
-	pmap = NULL;
-	if (attr->type == PERF_TYPE_HARDWARE) {
+	switch (attr->type) {
+	case PERF_TYPE_HARDWARE:
 		if (attr->config >= sparc_pmu->max_events)
 			return -EINVAL;
 		pmap = sparc_pmu->event_map(attr->config);
-	} else if (attr->type == PERF_TYPE_HW_CACHE) {
+		break;
+
+	case PERF_TYPE_HW_CACHE:
 		pmap = sparc_map_cache_event(attr->config);
 		if (IS_ERR(pmap))
 			return PTR_ERR(pmap);
-	} else if (attr->type != PERF_TYPE_RAW)
-		return -EOPNOTSUPP;
+		break;
+
+	case PERF_TYPE_RAW:
+		pmap = NULL;
+		break;
+
+	default:
+		return -ENOENT;
+
+	}
 
 	if (pmap) {
 		hwc->event_base = perf_event_encode(pmap);
 	} else {
-		/* User gives us "(encoding << 16) | pic_mask" for
+		/*
+		 * User gives us "(encoding << 16) | pic_mask" for
 		 * PERF_TYPE_RAW events.
 		 */
 		hwc->event_base = attr->config;
@@ -1071,7 +1106,7 @@ static int __hw_perf_event_init(struct perf_event *event)
 	n = 0;
 	if (event->group_leader != event) {
 		n = collect_events(event->group_leader,
-				   perf_max_events - 1,
+				   MAX_HWEVENTS - 1,
 				   evts, events, current_idx_dmy);
 		if (n < 0)
 			return -EINVAL;
@@ -1107,10 +1142,11 @@ static int __hw_perf_event_init(struct perf_event *event)
  * Set the flag to make pmu::enable() not perform the
  * schedulability test, it will be performed at commit time
  */
-static void sparc_pmu_start_txn(const struct pmu *pmu)
+static void sparc_pmu_start_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuhw = &__get_cpu_var(cpu_hw_events);
 
+	perf_pmu_disable(pmu);
 	cpuhw->group_flag |= PERF_EVENT_TXN;
 }
 
@@ -1119,11 +1155,12 @@ static void sparc_pmu_start_txn(const struct pmu *pmu)
  * Clear the flag and pmu::enable() will perform the
  * schedulability test.
  */
-static void sparc_pmu_cancel_txn(const struct pmu *pmu)
+static void sparc_pmu_cancel_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuhw = &__get_cpu_var(cpu_hw_events);
 
 	cpuhw->group_flag &= ~PERF_EVENT_TXN;
+	perf_pmu_enable(pmu);
 }
 
 /*
@@ -1131,7 +1168,7 @@ static void sparc_pmu_cancel_txn(const struct pmu *pmu)
  * Perform the group schedulability test as a whole
  * Return 0 if success
  */
-static int sparc_pmu_commit_txn(const struct pmu *pmu)
+static int sparc_pmu_commit_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	int n;
@@ -1147,28 +1184,24 @@ static int sparc_pmu_commit_txn(const struct pmu *pmu)
 		return -EAGAIN;
 
 	cpuc->group_flag &= ~PERF_EVENT_TXN;
+	perf_pmu_enable(pmu);
 	return 0;
 }
 
-static const struct pmu pmu = {
-	.enable		= sparc_pmu_enable,
-	.disable	= sparc_pmu_disable,
+static struct pmu pmu = {
+	.pmu_enable	= sparc_pmu_enable,
+	.pmu_disable	= sparc_pmu_disable,
+	.event_init	= sparc_pmu_event_init,
+	.add		= sparc_pmu_add,
+	.del		= sparc_pmu_del,
+	.start		= sparc_pmu_start,
+	.stop		= sparc_pmu_stop,
 	.read		= sparc_pmu_read,
-	.unthrottle	= sparc_pmu_unthrottle,
 	.start_txn	= sparc_pmu_start_txn,
 	.cancel_txn	= sparc_pmu_cancel_txn,
 	.commit_txn	= sparc_pmu_commit_txn,
 };
 
-const struct pmu *hw_perf_event_init(struct perf_event *event)
-{
-	int err = __hw_perf_event_init(event);
-
-	if (err)
-		return ERR_PTR(err);
-	return &pmu;
-}
-
 void perf_event_print_debug(void)
 {
 	unsigned long flags;
@@ -1244,7 +1277,7 @@ static int __kprobes perf_event_nmi_handler(struct notifier_block *self,
 			continue;
 
 		if (perf_event_overflow(event, 1, &data, regs))
-			sparc_pmu_disable_event(cpuc, hwc, idx);
+			sparc_pmu_stop(event, 0);
 	}
 
 	return NOTIFY_STOP;
@@ -1285,28 +1318,21 @@ void __init init_hw_perf_events(void)
 
 	pr_cont("Supported PMU type is '%s'\n", sparc_pmu_type);
 
-	/* All sparc64 PMUs currently have 2 events.  */
-	perf_max_events = 2;
-
+	perf_pmu_register(&pmu);
 	register_die_notifier(&perf_event_nmi_notifier);
 }
 
-static inline void callchain_store(struct perf_callchain_entry *entry, u64 ip)
-{
-	if (entry->nr < PERF_MAX_STACK_DEPTH)
-		entry->ip[entry->nr++] = ip;
-}
-
-static void perf_callchain_kernel(struct pt_regs *regs,
-				  struct perf_callchain_entry *entry)
+void perf_callchain_kernel(struct perf_callchain_entry *entry,
+			   struct pt_regs *regs)
 {
 	unsigned long ksp, fp;
 #ifdef CONFIG_FUNCTION_GRAPH_TRACER
 	int graph = 0;
 #endif
 
-	callchain_store(entry, PERF_CONTEXT_KERNEL);
-	callchain_store(entry, regs->tpc);
+	stack_trace_flush();
+
+	perf_callchain_store(entry, regs->tpc);
 
 	ksp = regs->u_regs[UREG_I6];
 	fp = ksp + STACK_BIAS;
@@ -1330,13 +1356,13 @@ static void perf_callchain_kernel(struct pt_regs *regs,
 			pc = sf->callers_pc;
 			fp = (unsigned long)sf->fp + STACK_BIAS;
 		}
-		callchain_store(entry, pc);
+		perf_callchain_store(entry, pc);
 #ifdef CONFIG_FUNCTION_GRAPH_TRACER
 		if ((pc + 8UL) == (unsigned long) &return_to_handler) {
 			int index = current->curr_ret_stack;
 			if (current->ret_stack && index >= graph) {
 				pc = current->ret_stack[index - graph].ret;
-				callchain_store(entry, pc);
+				perf_callchain_store(entry, pc);
 				graph++;
 			}
 		}
@@ -1344,13 +1370,12 @@ static void perf_callchain_kernel(struct pt_regs *regs,
 	} while (entry->nr < PERF_MAX_STACK_DEPTH);
 }
 
-static void perf_callchain_user_64(struct pt_regs *regs,
-				   struct perf_callchain_entry *entry)
+static void perf_callchain_user_64(struct perf_callchain_entry *entry,
+				   struct pt_regs *regs)
 {
 	unsigned long ufp;
 
-	callchain_store(entry, PERF_CONTEXT_USER);
-	callchain_store(entry, regs->tpc);
+	perf_callchain_store(entry, regs->tpc);
 
 	ufp = regs->u_regs[UREG_I6] + STACK_BIAS;
 	do {
@@ -1363,17 +1388,16 @@ static void perf_callchain_user_64(struct pt_regs *regs,
 
 		pc = sf.callers_pc;
 		ufp = (unsigned long)sf.fp + STACK_BIAS;
-		callchain_store(entry, pc);
+		perf_callchain_store(entry, pc);
 	} while (entry->nr < PERF_MAX_STACK_DEPTH);
 }
 
-static void perf_callchain_user_32(struct pt_regs *regs,
-				   struct perf_callchain_entry *entry)
+static void perf_callchain_user_32(struct perf_callchain_entry *entry,
+				   struct pt_regs *regs)
 {
 	unsigned long ufp;
 
-	callchain_store(entry, PERF_CONTEXT_USER);
-	callchain_store(entry, regs->tpc);
+	perf_callchain_store(entry, regs->tpc);
 
 	ufp = regs->u_regs[UREG_I6] & 0xffffffffUL;
 	do {
@@ -1386,34 +1410,16 @@ static void perf_callchain_user_32(struct pt_regs *regs,
 
 		pc = sf.callers_pc;
 		ufp = (unsigned long)sf.fp;
-		callchain_store(entry, pc);
+		perf_callchain_store(entry, pc);
 	} while (entry->nr < PERF_MAX_STACK_DEPTH);
 }
 
-/* Like powerpc we can't get PMU interrupts within the PMU handler,
- * so no need for separate NMI and IRQ chains as on x86.
- */
-static DEFINE_PER_CPU(struct perf_callchain_entry, callchain);
-
-struct perf_callchain_entry *perf_callchain(struct pt_regs *regs)
+void
+perf_callchain_user(struct perf_callchain_entry *entry, struct pt_regs *regs)
 {
-	struct perf_callchain_entry *entry = &__get_cpu_var(callchain);
-
-	entry->nr = 0;
-	if (!user_mode(regs)) {
-		stack_trace_flush();
-		perf_callchain_kernel(regs, entry);
-		if (current->mm)
-			regs = task_pt_regs(current);
-		else
-			regs = NULL;
-	}
-	if (regs) {
-		flushw_user();
-		if (test_thread_flag(TIF_32BIT))
-			perf_callchain_user_32(regs, entry);
-		else
-			perf_callchain_user_64(regs, entry);
-	}
-	return entry;
+	flushw_user();
+	if (test_thread_flag(TIF_32BIT))
+		perf_callchain_user_32(entry, regs);
+	else
+		perf_callchain_user_64(entry, regs);
 }

+ 8 - 0
arch/x86/Kconfig

@@ -25,6 +25,7 @@ config X86
 	select HAVE_IDE
 	select HAVE_OPROFILE
 	select HAVE_PERF_EVENTS if (!M386 && !M486)
+	select HAVE_IRQ_WORK
 	select HAVE_IOREMAP_PROT
 	select HAVE_KPROBES
 	select ARCH_WANT_OPTIONAL_GPIOLIB
@@ -33,6 +34,7 @@ config X86
 	select HAVE_KRETPROBES
 	select HAVE_OPTPROBES
 	select HAVE_FTRACE_MCOUNT_RECORD
+	select HAVE_C_RECORDMCOUNT
 	select HAVE_DYNAMIC_FTRACE
 	select HAVE_FUNCTION_TRACER
 	select HAVE_FUNCTION_GRAPH_TRACER
@@ -59,6 +61,8 @@ config X86
 	select ANON_INODES
 	select HAVE_ARCH_KMEMCHECK
 	select HAVE_USER_RETURN_NOTIFIER
+	select HAVE_ARCH_JUMP_LABEL
+	select HAVE_TEXT_POKE_SMP
 
 config INSTRUCTION_DECODER
 	def_bool (KPROBES || PERF_EVENTS)
@@ -2125,6 +2129,10 @@ config HAVE_ATOMIC_IOMAP
 	def_bool y
 	depends on X86_32
 
+config HAVE_TEXT_POKE_SMP
+	bool
+	select STOP_MACHINE if SMP
+
 source "net/Kconfig"
 
 source "drivers/Kconfig"

+ 11 - 0
arch/x86/include/asm/alternative.h

@@ -4,6 +4,7 @@
 #include <linux/types.h>
 #include <linux/stddef.h>
 #include <linux/stringify.h>
+#include <linux/jump_label.h>
 #include <asm/asm.h>
 
 /*
@@ -160,6 +161,8 @@ static inline void apply_paravirt(struct paravirt_patch_site *start,
 #define __parainstructions_end	NULL
 #endif
 
+extern void *text_poke_early(void *addr, const void *opcode, size_t len);
+
 /*
  * Clear and restore the kernel write-protection flag on the local CPU.
  * Allows the kernel to edit read-only pages.
@@ -180,4 +183,12 @@ static inline void apply_paravirt(struct paravirt_patch_site *start,
 extern void *text_poke(void *addr, const void *opcode, size_t len);
 extern void *text_poke_smp(void *addr, const void *opcode, size_t len);
 
+#if defined(CONFIG_DYNAMIC_FTRACE) || defined(HAVE_JUMP_LABEL)
+#define IDEAL_NOP_SIZE_5 5
+extern unsigned char ideal_nop5[IDEAL_NOP_SIZE_5];
+extern void arch_init_ideal_nop5(void);
+#else
+static inline void arch_init_ideal_nop5(void) {}
+#endif
+
 #endif /* _ASM_X86_ALTERNATIVE_H */

+ 2 - 2
arch/x86/include/asm/entry_arch.h

@@ -49,8 +49,8 @@ BUILD_INTERRUPT(apic_timer_interrupt,LOCAL_TIMER_VECTOR)
 BUILD_INTERRUPT(error_interrupt,ERROR_APIC_VECTOR)
 BUILD_INTERRUPT(spurious_interrupt,SPURIOUS_APIC_VECTOR)
 
-#ifdef CONFIG_PERF_EVENTS
-BUILD_INTERRUPT(perf_pending_interrupt, LOCAL_PENDING_VECTOR)
+#ifdef CONFIG_IRQ_WORK
+BUILD_INTERRUPT(irq_work_interrupt, IRQ_WORK_VECTOR)
 #endif
 
 #ifdef CONFIG_X86_THERMAL_VECTOR

+ 1 - 1
arch/x86/include/asm/hardirq.h

@@ -14,7 +14,7 @@ typedef struct {
 #endif
 	unsigned int x86_platform_ipis;	/* arch dependent */
 	unsigned int apic_perf_irqs;
-	unsigned int apic_pending_irqs;
+	unsigned int apic_irq_work_irqs;
 #ifdef CONFIG_SMP
 	unsigned int irq_resched_count;
 	unsigned int irq_call_count;

+ 1 - 1
arch/x86/include/asm/hw_irq.h

@@ -29,7 +29,7 @@
 extern void apic_timer_interrupt(void);
 extern void x86_platform_ipi(void);
 extern void error_interrupt(void);
-extern void perf_pending_interrupt(void);
+extern void irq_work_interrupt(void);
 
 extern void spurious_interrupt(void);
 extern void thermal_interrupt(void);

+ 2 - 2
arch/x86/include/asm/irq_vectors.h

@@ -114,9 +114,9 @@
 #define X86_PLATFORM_IPI_VECTOR		0xed
 
 /*
- * Performance monitoring pending work vector:
+ * IRQ work vector:
  */
-#define LOCAL_PENDING_VECTOR		0xec
+#define IRQ_WORK_VECTOR			0xec
 
 #define UV_BAU_MESSAGE			0xea
 

+ 37 - 0
arch/x86/include/asm/jump_label.h

@@ -0,0 +1,37 @@
+#ifndef _ASM_X86_JUMP_LABEL_H
+#define _ASM_X86_JUMP_LABEL_H
+
+#ifdef __KERNEL__
+
+#include <linux/types.h>
+#include <asm/nops.h>
+
+#define JUMP_LABEL_NOP_SIZE 5
+
+# define JUMP_LABEL_INITIAL_NOP ".byte 0xe9 \n\t .long 0\n\t"
+
+# define JUMP_LABEL(key, label)					\
+	do {							\
+		asm goto("1:"					\
+			JUMP_LABEL_INITIAL_NOP			\
+			".pushsection __jump_table,  \"a\" \n\t"\
+			_ASM_PTR "1b, %l[" #label "], %c0 \n\t" \
+			".popsection \n\t"			\
+			: :  "i" (key) :  : label);		\
+	} while (0)
+
+#endif /* __KERNEL__ */
+
+#ifdef CONFIG_X86_64
+typedef u64 jump_label_t;
+#else
+typedef u32 jump_label_t;
+#endif
+
+struct jump_entry {
+	jump_label_t code;
+	jump_label_t target;
+	jump_label_t key;
+};
+
+#endif

+ 22 - 30
arch/x86/include/asm/perf_event_p4.h

@@ -36,19 +36,6 @@
 #define P4_ESCR_EMASK(v)	((v) << P4_ESCR_EVENTMASK_SHIFT)
 #define P4_ESCR_TAG(v)		((v) << P4_ESCR_TAG_SHIFT)
 
-/* Non HT mask */
-#define P4_ESCR_MASK			\
-	(P4_ESCR_EVENT_MASK	|	\
-	P4_ESCR_EVENTMASK_MASK	|	\
-	P4_ESCR_TAG_MASK	|	\
-	P4_ESCR_TAG_ENABLE	|	\
-	P4_ESCR_T0_OS		|	\
-	P4_ESCR_T0_USR)
-
-/* HT mask */
-#define P4_ESCR_MASK_HT			\
-	(P4_ESCR_MASK |	P4_ESCR_T1_OS | P4_ESCR_T1_USR)
-
 #define P4_CCCR_OVF			0x80000000U
 #define P4_CCCR_CASCADE			0x40000000U
 #define P4_CCCR_OVF_PMI_T0		0x04000000U
@@ -70,23 +57,6 @@
 #define P4_CCCR_THRESHOLD(v)		((v) << P4_CCCR_THRESHOLD_SHIFT)
 #define P4_CCCR_ESEL(v)			((v) << P4_CCCR_ESCR_SELECT_SHIFT)
 
-/* Non HT mask */
-#define P4_CCCR_MASK				\
-	(P4_CCCR_OVF			|	\
-	P4_CCCR_CASCADE			|	\
-	P4_CCCR_OVF_PMI_T0		|	\
-	P4_CCCR_FORCE_OVF		|	\
-	P4_CCCR_EDGE			|	\
-	P4_CCCR_THRESHOLD_MASK		|	\
-	P4_CCCR_COMPLEMENT		|	\
-	P4_CCCR_COMPARE			|	\
-	P4_CCCR_ESCR_SELECT_MASK	|	\
-	P4_CCCR_ENABLE)
-
-/* HT mask */
-#define P4_CCCR_MASK_HT				\
-	(P4_CCCR_MASK | P4_CCCR_OVF_PMI_T1 | P4_CCCR_THREAD_ANY)
-
 #define P4_GEN_ESCR_EMASK(class, name, bit)	\
 	class##__##name = ((1 << bit) << P4_ESCR_EVENTMASK_SHIFT)
 #define P4_ESCR_EMASK_BIT(class, name)		class##__##name
@@ -127,6 +97,28 @@
 #define P4_CONFIG_HT_SHIFT		63
 #define P4_CONFIG_HT			(1ULL << P4_CONFIG_HT_SHIFT)
 
+/*
+ * The bits we allow to pass for RAW events
+ */
+#define P4_CONFIG_MASK_ESCR		\
+	P4_ESCR_EVENT_MASK	|	\
+	P4_ESCR_EVENTMASK_MASK	|	\
+	P4_ESCR_TAG_MASK	|	\
+	P4_ESCR_TAG_ENABLE
+
+#define P4_CONFIG_MASK_CCCR		\
+	P4_CCCR_EDGE		|	\
+	P4_CCCR_THRESHOLD_MASK	|	\
+	P4_CCCR_COMPLEMENT	|	\
+	P4_CCCR_COMPARE		|	\
+	P4_CCCR_THREAD_ANY	|	\
+	P4_CCCR_RESERVED
+
+/* some dangerous bits are reserved for kernel internals */
+#define P4_CONFIG_MASK				  	  \
+	(p4_config_pack_escr(P4_CONFIG_MASK_ESCR))	| \
+	(p4_config_pack_cccr(P4_CONFIG_MASK_CCCR))
+
 static inline bool p4_is_event_cascaded(u64 config)
 {
 	u32 cccr = p4_config_unpack_cccr(config);

+ 2 - 1
arch/x86/kernel/Makefile

@@ -34,7 +34,8 @@ GCOV_PROFILE_paravirt.o		:= n
 obj-y			:= process_$(BITS).o signal.o entry_$(BITS).o
 obj-y			+= traps.o irq.o irq_$(BITS).o dumpstack_$(BITS).o
 obj-y			+= time.o ioport.o ldt.o dumpstack.o
-obj-y			+= setup.o x86_init.o i8259.o irqinit.o
+obj-y			+= setup.o x86_init.o i8259.o irqinit.o jump_label.o
+obj-$(CONFIG_IRQ_WORK)  += irq_work.o
 obj-$(CONFIG_X86_VISWS)	+= visws_quirks.o
 obj-$(CONFIG_X86_32)	+= probe_roms_32.o
 obj-$(CONFIG_X86_32)	+= sys_i386_32.o i386_ksyms_32.o

+ 68 - 3
arch/x86/kernel/alternative.c

@@ -195,7 +195,7 @@ static void __init_or_module add_nops(void *insns, unsigned int len)
 
 extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
 extern s32 __smp_locks[], __smp_locks_end[];
-static void *text_poke_early(void *addr, const void *opcode, size_t len);
+void *text_poke_early(void *addr, const void *opcode, size_t len);
 
 /* Replace instructions with better alternatives for this CPU type.
    This runs before SMP is initialized to avoid SMP problems with
@@ -522,7 +522,7 @@ void __init alternative_instructions(void)
 * instructions. And on the local CPU you need to be protected against NMI or MCE
  * handlers seeing an inconsistent instruction while you patch.
  */
-static void *__init_or_module text_poke_early(void *addr, const void *opcode,
+void *__init_or_module text_poke_early(void *addr, const void *opcode,
 					      size_t len)
 {
 	unsigned long flags;
@@ -637,7 +637,72 @@ void *__kprobes text_poke_smp(void *addr, const void *opcode, size_t len)
 	tpp.len = len;
 	atomic_set(&stop_machine_first, 1);
 	wrote_text = 0;
-	stop_machine(stop_machine_text_poke, (void *)&tpp, NULL);
+	/* Use __stop_machine() because the caller already got online_cpus. */
+	__stop_machine(stop_machine_text_poke, (void *)&tpp, NULL);
 	return addr;
 }
 
+#if defined(CONFIG_DYNAMIC_FTRACE) || defined(HAVE_JUMP_LABEL)
+
+unsigned char ideal_nop5[IDEAL_NOP_SIZE_5];
+
+void __init arch_init_ideal_nop5(void)
+{
+	extern const unsigned char ftrace_test_p6nop[];
+	extern const unsigned char ftrace_test_nop5[];
+	extern const unsigned char ftrace_test_jmp[];
+	int faulted = 0;
+
+	/*
+	 * There is no good nop for all x86 archs.
+	 * We will default to using the P6_NOP5, but first we
+	 * will test to make sure that the nop will actually
+	 * work on this CPU. If it faults, we will then
+	 * go to a lesser efficient 5 byte nop. If that fails
+	 * we then just use a jmp as our nop. This isn't the most
+	 * efficient nop, but we can not use a multi part nop
+	 * since we would then risk being preempted in the middle
+	 * of that nop, and if we enabled tracing then, it might
+	 * cause a system crash.
+	 *
+	 * TODO: check the cpuid to determine the best nop.
+	 */
+	asm volatile (
+		"ftrace_test_jmp:"
+		"jmp ftrace_test_p6nop\n"
+		"nop\n"
+		"nop\n"
+		"nop\n"  /* 2 byte jmp + 3 bytes */
+		"ftrace_test_p6nop:"
+		P6_NOP5
+		"jmp 1f\n"
+		"ftrace_test_nop5:"
+		".byte 0x66,0x66,0x66,0x66,0x90\n"
+		"1:"
+		".section .fixup, \"ax\"\n"
+		"2:	movl $1, %0\n"
+		"	jmp ftrace_test_nop5\n"
+		"3:	movl $2, %0\n"
+		"	jmp 1b\n"
+		".previous\n"
+		_ASM_EXTABLE(ftrace_test_p6nop, 2b)
+		_ASM_EXTABLE(ftrace_test_nop5, 3b)
+		: "=r"(faulted) : "0" (faulted));
+
+	switch (faulted) {
+	case 0:
+		pr_info("converting mcount calls to 0f 1f 44 00 00\n");
+		memcpy(ideal_nop5, ftrace_test_p6nop, IDEAL_NOP_SIZE_5);
+		break;
+	case 1:
+		pr_info("converting mcount calls to 66 66 66 66 90\n");
+		memcpy(ideal_nop5, ftrace_test_nop5, IDEAL_NOP_SIZE_5);
+		break;
+	case 2:
+		pr_info("converting mcount calls to jmp . + 5\n");
+		memcpy(ideal_nop5, ftrace_test_jmp, IDEAL_NOP_SIZE_5);
+		break;
+	}
+
+}
+#endif
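
ideal_nop5 and text_poke_smp() are the building blocks the x86 jump label patching (arch/x86/kernel/jump_label.c, not part of this excerpt) sits on: a site is flipped between the ideal 5-byte nop and a rel32 jmp while other CPUs are quiesced. A hedged sketch of that flip, not copied from the real file; demo_patch_site() is a made-up name:

#include <linux/types.h>
#include <linux/string.h>
#include <linux/jump_label.h>
#include <asm/alternative.h>

union demo_jump_code {
	char code[JUMP_LABEL_NOP_SIZE];
	struct {
		char jump;	/* 0xe9 = jmp rel32 */
		int offset;
	} __attribute__((packed));
};

void demo_patch_site(struct jump_entry *entry, bool enable)
{
	union demo_jump_code code;

	if (enable) {
		code.jump = 0xe9;
		code.offset = entry->target -
			      (entry->code + JUMP_LABEL_NOP_SIZE);
	} else {
		memcpy(code.code, ideal_nop5, JUMP_LABEL_NOP_SIZE);
	}

	text_poke_smp((void *)(unsigned long)entry->code, &code,
		      JUMP_LABEL_NOP_SIZE);
}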

+ 123 - 157
arch/x86/kernel/cpu/perf_event.c

@@ -531,7 +531,7 @@ static int x86_pmu_hw_config(struct perf_event *event)
 /*
  * Setup the hardware configuration for a given attr_type
  */
-static int __hw_perf_event_init(struct perf_event *event)
+static int __x86_pmu_event_init(struct perf_event *event)
 {
 	int err;
 
@@ -584,7 +584,7 @@ static void x86_pmu_disable_all(void)
 	}
 }
 
-void hw_perf_disable(void)
+static void x86_pmu_disable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 
@@ -619,7 +619,7 @@ static void x86_pmu_enable_all(int added)
 	}
 }
 
-static const struct pmu pmu;
+static struct pmu pmu;
 
 static inline int is_x86_event(struct perf_event *event)
 {
@@ -801,10 +801,10 @@ static inline int match_prev_assignment(struct hw_perf_event *hwc,
 		hwc->last_tag == cpuc->tags[i];
 }
 
-static int x86_pmu_start(struct perf_event *event);
-static void x86_pmu_stop(struct perf_event *event);
+static void x86_pmu_start(struct perf_event *event, int flags);
+static void x86_pmu_stop(struct perf_event *event, int flags);
 
-void hw_perf_enable(void)
+static void x86_pmu_enable(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct perf_event *event;
@@ -840,7 +840,14 @@ void hw_perf_enable(void)
 			    match_prev_assignment(hwc, cpuc, i))
 				continue;
 
-			x86_pmu_stop(event);
+			/*
+			 * Ensure we don't accidentally enable a stopped
+			 * counter simply because we rescheduled.
+			 */
+			if (hwc->state & PERF_HES_STOPPED)
+				hwc->state |= PERF_HES_ARCH;
+
+			x86_pmu_stop(event, PERF_EF_UPDATE);
 		}
 
 		for (i = 0; i < cpuc->n_events; i++) {
@@ -852,7 +859,10 @@ void hw_perf_enable(void)
 			else if (i < n_running)
 				continue;
 
-			x86_pmu_start(event);
+			if (hwc->state & PERF_HES_ARCH)
+				continue;
+
+			x86_pmu_start(event, PERF_EF_RELOAD);
 		}
 		cpuc->n_added = 0;
 		perf_events_lapic_init();
@@ -953,15 +963,12 @@ static void x86_pmu_enable_event(struct perf_event *event)
 }
 
 /*
- * activate a single event
+ * Add a single event to the PMU.
  *
  * The event is added to the group of enabled events
 * but only if it can be scheduled with existing events.
- *
- * Called with PMU disabled. If successful and return value 1,
- * then guaranteed to call perf_enable() and hw_perf_enable()
  */
-static int x86_pmu_enable(struct perf_event *event)
+static int x86_pmu_add(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct hw_perf_event *hwc;
@@ -970,58 +977,67 @@ static int x86_pmu_enable(struct perf_event *event)
 
 	hwc = &event->hw;
 
+	perf_pmu_disable(event->pmu);
 	n0 = cpuc->n_events;
-	n = collect_events(cpuc, event, false);
-	if (n < 0)
-		return n;
+	ret = n = collect_events(cpuc, event, false);
+	if (ret < 0)
+		goto out;
+
+	hwc->state = PERF_HES_UPTODATE | PERF_HES_STOPPED;
+	if (!(flags & PERF_EF_START))
+		hwc->state |= PERF_HES_ARCH;
 
 	/*
 	 * If group events scheduling transaction was started,
	 * skip the schedulability test here, it will be performed
-	 * at commit time(->commit_txn) as a whole
+	 * at commit time (->commit_txn) as a whole
 	 */
 	if (cpuc->group_flag & PERF_EVENT_TXN)
-		goto out;
+		goto done_collect;
 
 	ret = x86_pmu.schedule_events(cpuc, n, assign);
 	if (ret)
-		return ret;
+		goto out;
 	/*
 	 * copy new assignment, now we know it is possible
 	 * will be used by hw_perf_enable()
 	 */
 	memcpy(cpuc->assign, assign, n*sizeof(int));
 
-out:
+done_collect:
 	cpuc->n_events = n;
 	cpuc->n_added += n - n0;
 	cpuc->n_txn += n - n0;
 
-	return 0;
+	ret = 0;
+out:
+	perf_pmu_enable(event->pmu);
+	return ret;
 }
 
-static int x86_pmu_start(struct perf_event *event)
+static void x86_pmu_start(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	int idx = event->hw.idx;
 
-	if (idx == -1)
-		return -EAGAIN;
+	if (WARN_ON_ONCE(!(event->hw.state & PERF_HES_STOPPED)))
+		return;
+
+	if (WARN_ON_ONCE(idx == -1))
+		return;
+
+	if (flags & PERF_EF_RELOAD) {
+		WARN_ON_ONCE(!(event->hw.state & PERF_HES_UPTODATE));
+		x86_perf_event_set_period(event);
+	}
+
+	event->hw.state = 0;
 
-	x86_perf_event_set_period(event);
 	cpuc->events[idx] = event;
 	__set_bit(idx, cpuc->active_mask);
 	__set_bit(idx, cpuc->running);
 	x86_pmu.enable(event);
 	perf_event_update_userpage(event);
-
-	return 0;
-}
-
-static void x86_pmu_unthrottle(struct perf_event *event)
-{
-	int ret = x86_pmu_start(event);
-	WARN_ON_ONCE(ret);
 }
 
 void perf_event_print_debug(void)
@@ -1078,27 +1094,29 @@ void perf_event_print_debug(void)
 	local_irq_restore(flags);
 }
 
-static void x86_pmu_stop(struct perf_event *event)
+static void x86_pmu_stop(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct hw_perf_event *hwc = &event->hw;
-	int idx = hwc->idx;
 
-	if (!__test_and_clear_bit(idx, cpuc->active_mask))
-		return;
-
-	x86_pmu.disable(event);
-
-	/*
-	 * Drain the remaining delta count out of a event
-	 * that we are disabling:
-	 */
-	x86_perf_event_update(event);
+	if (__test_and_clear_bit(hwc->idx, cpuc->active_mask)) {
+		x86_pmu.disable(event);
+		cpuc->events[hwc->idx] = NULL;
+		WARN_ON_ONCE(hwc->state & PERF_HES_STOPPED);
+		hwc->state |= PERF_HES_STOPPED;
+	}
 
-	cpuc->events[idx] = NULL;
+	if ((flags & PERF_EF_UPDATE) && !(hwc->state & PERF_HES_UPTODATE)) {
+		/*
+		 * Drain the remaining delta count out of a event
+		 * that we are disabling:
+		 */
+		x86_perf_event_update(event);
+		hwc->state |= PERF_HES_UPTODATE;
+	}
 }
 
-static void x86_pmu_disable(struct perf_event *event)
+static void x86_pmu_del(struct perf_event *event, int flags)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	int i;
@@ -1111,7 +1129,7 @@ static void x86_pmu_disable(struct perf_event *event)
 	if (cpuc->group_flag & PERF_EVENT_TXN)
 		return;
 
-	x86_pmu_stop(event);
+	x86_pmu_stop(event, PERF_EF_UPDATE);
 
 	for (i = 0; i < cpuc->n_events; i++) {
 		if (event == cpuc->event_list[i]) {
@@ -1134,7 +1152,6 @@ static int x86_pmu_handle_irq(struct pt_regs *regs)
 	struct perf_sample_data data;
 	struct cpu_hw_events *cpuc;
 	struct perf_event *event;
-	struct hw_perf_event *hwc;
 	int idx, handled = 0;
 	u64 val;
 
@@ -1155,7 +1172,6 @@ static int x86_pmu_handle_irq(struct pt_regs *regs)
 		}
 
 		event = cpuc->events[idx];
-		hwc = &event->hw;
 
 		val = x86_perf_event_update(event);
 		if (val & (1ULL << (x86_pmu.cntval_bits - 1)))
@@ -1171,7 +1187,7 @@ static int x86_pmu_handle_irq(struct pt_regs *regs)
 			continue;
 
 		if (perf_event_overflow(event, 1, &data, regs))
-			x86_pmu_stop(event);
+			x86_pmu_stop(event, 0);
 	}
 
 	if (handled)
@@ -1180,25 +1196,6 @@ static int x86_pmu_handle_irq(struct pt_regs *regs)
 	return handled;
 }
 
-void smp_perf_pending_interrupt(struct pt_regs *regs)
-{
-	irq_enter();
-	ack_APIC_irq();
-	inc_irq_stat(apic_pending_irqs);
-	perf_event_do_pending();
-	irq_exit();
-}
-
-void set_perf_event_pending(void)
-{
-#ifdef CONFIG_X86_LOCAL_APIC
-	if (!x86_pmu.apic || !x86_pmu_initialized())
-		return;
-
-	apic->send_IPI_self(LOCAL_PENDING_VECTOR);
-#endif
-}
-
 void perf_events_lapic_init(void)
 {
 	if (!x86_pmu.apic || !x86_pmu_initialized())
@@ -1388,7 +1385,6 @@ void __init init_hw_perf_events(void)
 		x86_pmu.num_counters = X86_PMC_MAX_GENERIC;
 	}
 	x86_pmu.intel_ctrl = (1 << x86_pmu.num_counters) - 1;
-	perf_max_events = x86_pmu.num_counters;
 
 	if (x86_pmu.num_counters_fixed > X86_PMC_MAX_FIXED) {
 		WARN(1, KERN_ERR "hw perf events fixed %d > max(%d), clipping!",
@@ -1424,6 +1420,7 @@ void __init init_hw_perf_events(void)
 	pr_info("... fixed-purpose events:   %d\n",     x86_pmu.num_counters_fixed);
 	pr_info("... event mask:             %016Lx\n", x86_pmu.intel_ctrl);
 
+	perf_pmu_register(&pmu);
 	perf_cpu_notifier(x86_pmu_notifier);
 }
 
@@ -1437,10 +1434,11 @@ static inline void x86_pmu_read(struct perf_event *event)
  * Set the flag to make pmu::enable() not perform the
  * schedulability test, it will be performed at commit time
  */
-static void x86_pmu_start_txn(const struct pmu *pmu)
+static void x86_pmu_start_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 
+	perf_pmu_disable(pmu);
 	cpuc->group_flag |= PERF_EVENT_TXN;
 	cpuc->n_txn = 0;
 }
@@ -1450,7 +1448,7 @@ static void x86_pmu_start_txn(const struct pmu *pmu)
  * Clear the flag and pmu::enable() will perform the
  * schedulability test.
  */
-static void x86_pmu_cancel_txn(const struct pmu *pmu)
+static void x86_pmu_cancel_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 
@@ -1460,6 +1458,7 @@ static void x86_pmu_cancel_txn(const struct pmu *pmu)
 	 */
 	cpuc->n_added -= cpuc->n_txn;
 	cpuc->n_events -= cpuc->n_txn;
+	perf_pmu_enable(pmu);
 }
 
 /*
@@ -1467,7 +1466,7 @@ static void x86_pmu_cancel_txn(const struct pmu *pmu)
  * Perform the group schedulability test as a whole
  * Return 0 if success
  */
-static int x86_pmu_commit_txn(const struct pmu *pmu)
+static int x86_pmu_commit_txn(struct pmu *pmu)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	int assign[X86_PMC_IDX_MAX];
@@ -1489,22 +1488,10 @@ static int x86_pmu_commit_txn(const struct pmu *pmu)
 	memcpy(cpuc->assign, assign, n*sizeof(int));
 
 	cpuc->group_flag &= ~PERF_EVENT_TXN;
-
+	perf_pmu_enable(pmu);
 	return 0;
 }
 
-static const struct pmu pmu = {
-	.enable		= x86_pmu_enable,
-	.disable	= x86_pmu_disable,
-	.start		= x86_pmu_start,
-	.stop		= x86_pmu_stop,
-	.read		= x86_pmu_read,
-	.unthrottle	= x86_pmu_unthrottle,
-	.start_txn	= x86_pmu_start_txn,
-	.cancel_txn	= x86_pmu_cancel_txn,
-	.commit_txn	= x86_pmu_commit_txn,
-};
-
 /*
  * validate that we can schedule this event
  */
@@ -1579,12 +1566,22 @@ out:
 	return ret;
 }
 
-const struct pmu *hw_perf_event_init(struct perf_event *event)
+int x86_pmu_event_init(struct perf_event *event)
 {
-	const struct pmu *tmp;
+	struct pmu *tmp;
 	int err;
 
-	err = __hw_perf_event_init(event);
+	switch (event->attr.type) {
+	case PERF_TYPE_RAW:
+	case PERF_TYPE_HARDWARE:
+	case PERF_TYPE_HW_CACHE:
+		break;
+
+	default:
+		return -ENOENT;
+	}
+
+	err = __x86_pmu_event_init(event);
 	if (!err) {
 		/*
 		 * we temporarily connect event to its pmu
@@ -1604,26 +1601,31 @@ const struct pmu *hw_perf_event_init(struct perf_event *event)
 	if (err) {
 		if (event->destroy)
 			event->destroy(event);
-		return ERR_PTR(err);
 	}
 
-	return &pmu;
+	return err;
 }
 
-/*
- * callchain support
- */
+static struct pmu pmu = {
+	.pmu_enable	= x86_pmu_enable,
+	.pmu_disable	= x86_pmu_disable,
 
-static inline
-void callchain_store(struct perf_callchain_entry *entry, u64 ip)
-{
-	if (entry->nr < PERF_MAX_STACK_DEPTH)
-		entry->ip[entry->nr++] = ip;
-}
+	.event_init	= x86_pmu_event_init,
 
-static DEFINE_PER_CPU(struct perf_callchain_entry, pmc_irq_entry);
-static DEFINE_PER_CPU(struct perf_callchain_entry, pmc_nmi_entry);
+	.add		= x86_pmu_add,
+	.del		= x86_pmu_del,
+	.start		= x86_pmu_start,
+	.stop		= x86_pmu_stop,
+	.read		= x86_pmu_read,
 
+	.start_txn	= x86_pmu_start_txn,
+	.cancel_txn	= x86_pmu_cancel_txn,
+	.commit_txn	= x86_pmu_commit_txn,
+};
+
+/*
+ * callchain support
+ */
 
 static void
 backtrace_warning_symbol(void *data, char *msg, unsigned long symbol)
@@ -1645,7 +1647,7 @@ static void backtrace_address(void *data, unsigned long addr, int reliable)
 {
 	struct perf_callchain_entry *entry = data;
 
-	callchain_store(entry, addr);
+	perf_callchain_store(entry, addr);
 }
 
 static const struct stacktrace_ops backtrace_ops = {
@@ -1656,11 +1658,15 @@ static const struct stacktrace_ops backtrace_ops = {
 	.walk_stack		= print_context_stack_bp,
 };
 
-static void
-perf_callchain_kernel(struct pt_regs *regs, struct perf_callchain_entry *entry)
+void
+perf_callchain_kernel(struct perf_callchain_entry *entry, struct pt_regs *regs)
 {
-	callchain_store(entry, PERF_CONTEXT_KERNEL);
-	callchain_store(entry, regs->ip);
+	if (perf_guest_cbs && perf_guest_cbs->is_in_guest()) {
+		/* TODO: We don't support guest os callchain now */
+		return;
+	}
+
+	perf_callchain_store(entry, regs->ip);
 
 	dump_trace(NULL, regs, NULL, regs->bp, &backtrace_ops, entry);
 }
@@ -1689,7 +1695,7 @@ perf_callchain_user32(struct pt_regs *regs, struct perf_callchain_entry *entry)
 		if (fp < compat_ptr(regs->sp))
 			break;
 
-		callchain_store(entry, frame.return_address);
+		perf_callchain_store(entry, frame.return_address);
 		fp = compat_ptr(frame.next_frame);
 	}
 	return 1;
@@ -1702,19 +1708,20 @@ perf_callchain_user32(struct pt_regs *regs, struct perf_callchain_entry *entry)
 }
 #endif
 
-static void
-perf_callchain_user(struct pt_regs *regs, struct perf_callchain_entry *entry)
+void
+perf_callchain_user(struct perf_callchain_entry *entry, struct pt_regs *regs)
 {
 	struct stack_frame frame;
 	const void __user *fp;
 
-	if (!user_mode(regs))
-		regs = task_pt_regs(current);
+	if (perf_guest_cbs && perf_guest_cbs->is_in_guest()) {
+		/* TODO: We don't support guest os callchain now */
+		return;
+	}
 
 	fp = (void __user *)regs->bp;
 
-	callchain_store(entry, PERF_CONTEXT_USER);
-	callchain_store(entry, regs->ip);
+	perf_callchain_store(entry, regs->ip);
 
 	if (perf_callchain_user32(regs, entry))
 		return;
@@ -1731,52 +1738,11 @@ perf_callchain_user(struct pt_regs *regs, struct perf_callchain_entry *entry)
 		if ((unsigned long)fp < regs->sp)
 			break;
 
-		callchain_store(entry, frame.return_address);
+		perf_callchain_store(entry, frame.return_address);
 		fp = frame.next_frame;
 	}
 }
 
-static void
-perf_do_callchain(struct pt_regs *regs, struct perf_callchain_entry *entry)
-{
-	int is_user;
-
-	if (!regs)
-		return;
-
-	is_user = user_mode(regs);
-
-	if (is_user && current->state != TASK_RUNNING)
-		return;
-
-	if (!is_user)
-		perf_callchain_kernel(regs, entry);
-
-	if (current->mm)
-		perf_callchain_user(regs, entry);
-}
-
-struct perf_callchain_entry *perf_callchain(struct pt_regs *regs)
-{
-	struct perf_callchain_entry *entry;
-
-	if (perf_guest_cbs && perf_guest_cbs->is_in_guest()) {
-		/* TODO: We don't support guest os callchain now */
-		return NULL;
-	}
-
-	if (in_nmi())
-		entry = &__get_cpu_var(pmc_nmi_entry);
-	else
-		entry = &__get_cpu_var(pmc_irq_entry);
-
-	entry->nr = 0;
-
-	perf_do_callchain(regs, entry);
-
-	return entry;
-}
-
 unsigned long perf_instruction_pointer(struct pt_regs *regs)
 {
 	unsigned long ip;

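A quick orientation for the perf_event.c changes above: the old per-event ->enable()/->disable()/->unthrottle() hooks are gone. Each PMU now registers itself with perf_pmu_register() and exposes ->add()/->del() to put an event on or take it off the hardware, ->start()/->stop() to let it count or pause, and ->event_init(), which returns -ENOENT for event types it does not own so the core can try the next PMU. The sketch below shows the calling convention the new hooks expect; it is illustrative only (the helper name drive_event() is invented, and in reality the perf core, not driver code, makes these calls):

	/*
	 * Minimal sketch of the new pmu callback contract (not part of
	 * this commit; the perf core is the real caller).
	 */
	static void drive_event(struct perf_event *event)
	{
		struct pmu *pmu = event->pmu;

		/* Schedule the event onto the PMU, but leave it stopped. */
		if (pmu->add(event, 0))
			return;				/* no counter available */

		/* Program a fresh sample period and let it count. */
		pmu->start(event, PERF_EF_RELOAD);

		/* ... the event counts here ... */

		/* Stop it and fold the remaining delta into the event count. */
		pmu->stop(event, PERF_EF_UPDATE);

		/* Take it off the PMU again. */
		pmu->del(event, 0);
	}

Adding with PERF_EF_START instead of 0 combines the first two steps; the PERF_HES_STOPPED/PERF_HES_UPTODATE bits in event->hw.state are what let x86_pmu_start() and x86_pmu_stop() above stay idempotent.
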
+ 2 - 2
arch/x86/kernel/cpu/perf_event_amd.c

@@ -52,7 +52,7 @@ static __initconst const u64 amd_hw_cache_event_ids
  [ C(DTLB) ] = {
 	[ C(OP_READ) ] = {
 		[ C(RESULT_ACCESS) ] = 0x0040, /* Data Cache Accesses        */
-		[ C(RESULT_MISS)   ] = 0x0046, /* L1 DTLB and L2 DLTB Miss   */
+		[ C(RESULT_MISS)   ] = 0x0746, /* L1_DTLB_AND_L2_DLTB_MISS.ALL */
 	},
 	[ C(OP_WRITE) ] = {
 		[ C(RESULT_ACCESS) ] = 0,
@@ -66,7 +66,7 @@ static __initconst const u64 amd_hw_cache_event_ids
  [ C(ITLB) ] = {
 	[ C(OP_READ) ] = {
 		[ C(RESULT_ACCESS) ] = 0x0080, /* Instruction fetches        */
-		[ C(RESULT_MISS)   ] = 0x0085, /* Instr. fetch ITLB misses   */
+		[ C(RESULT_MISS)   ] = 0x0385, /* L1_ITLB_AND_L2_ITLB_MISS.ALL */
 	},
 	[ C(OP_WRITE) ] = {
 		[ C(RESULT_ACCESS) ] = -1,

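The corrected AMD DTLB/ITLB miss values above appear to be raw event encodings with the event select in the low byte and the unit mask in the next byte, so 0x0746 selects event 0x46 with unit mask 0x07 (all miss sub-events) and 0x0385 selects event 0x85 with unit mask 0x03. A tiny helper showing that packing, purely as an illustration (not part of the kernel):

	/* Pack an AMD event select and unit mask the way the table above expects. */
	static inline unsigned int amd_cache_config(unsigned int event, unsigned int umask)
	{
		return (umask << 8) | (event & 0xff);
	}

	/* amd_cache_config(0x46, 0x07) == 0x0746 */
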
+ 4 - 4
arch/x86/kernel/cpu/perf_event_intel.c

@@ -713,18 +713,18 @@ static int intel_pmu_handle_irq(struct pt_regs *regs)
 	struct cpu_hw_events *cpuc;
 	int bit, loops;
 	u64 status;
-	int handled = 0;
+	int handled;
 
 	perf_sample_data_init(&data, 0);
 
 	cpuc = &__get_cpu_var(cpu_hw_events);
 
 	intel_pmu_disable_all();
-	intel_pmu_drain_bts_buffer();
+	handled = intel_pmu_drain_bts_buffer();
 	status = intel_pmu_get_status();
 	if (!status) {
 		intel_pmu_enable_all(0);
-		return 0;
+		return handled;
 	}
 
 	loops = 0;
@@ -763,7 +763,7 @@ again:
 		data.period = event->hw.last_period;
 
 		if (perf_event_overflow(event, 1, &data, regs))
-			x86_pmu_stop(event);
+			x86_pmu_stop(event, 0);
 	}
 
 	/*

+ 7 - 6
arch/x86/kernel/cpu/perf_event_intel_ds.c

@@ -214,7 +214,7 @@ static void intel_pmu_disable_bts(void)
 	update_debugctlmsr(debugctlmsr);
 }
 
-static void intel_pmu_drain_bts_buffer(void)
+static int intel_pmu_drain_bts_buffer(void)
 {
 	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
 	struct debug_store *ds = cpuc->ds;
@@ -231,16 +231,16 @@ static void intel_pmu_drain_bts_buffer(void)
 	struct pt_regs regs;
 
 	if (!event)
-		return;
+		return 0;
 
 	if (!ds)
-		return;
+		return 0;
 
 	at  = (struct bts_record *)(unsigned long)ds->bts_buffer_base;
 	top = (struct bts_record *)(unsigned long)ds->bts_index;
 
 	if (top <= at)
-		return;
+		return 0;
 
 	ds->bts_index = ds->bts_buffer_base;
 
@@ -256,7 +256,7 @@ static void intel_pmu_drain_bts_buffer(void)
 	perf_prepare_sample(&header, &data, event, &regs);
 
 	if (perf_output_begin(&handle, event, header.size * (top - at), 1, 1))
-		return;
+		return 1;
 
 	for (; at < top; at++) {
 		data.ip		= at->from;
@@ -270,6 +270,7 @@ static void intel_pmu_drain_bts_buffer(void)
 	/* There's new data available. */
 	event->hw.interrupts++;
 	event->pending_kill = POLL_IN;
+	return 1;
 }
 
 /*
@@ -491,7 +492,7 @@ static void __intel_pmu_pebs_event(struct perf_event *event,
 		regs.flags &= ~PERF_EFLAGS_EXACT;
 
 	if (perf_event_overflow(event, 1, &data, &regs))
-		x86_pmu_stop(event);
+		x86_pmu_stop(event, 0);
 }
 
 static void intel_pmu_drain_pebs_core(struct pt_regs *iregs)

+ 268 - 24
arch/x86/kernel/cpu/perf_event_p4.c

@@ -18,6 +18,8 @@
 struct p4_event_bind {
 	unsigned int opcode;			/* Event code and ESCR selector */
 	unsigned int escr_msr[2];		/* ESCR MSR for this event */
+	unsigned int escr_emask;		/* valid ESCR EventMask bits */
+	unsigned int shared;			/* event is shared across threads */
 	char cntr[2][P4_CNTR_LIMIT];		/* counter index (offset), -1 on abscence */
 };
 
@@ -66,231 +68,435 @@ static struct p4_event_bind p4_event_bind_map[] = {
 	[P4_EVENT_TC_DELIVER_MODE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_TC_DELIVER_MODE),
 		.escr_msr	= { MSR_P4_TC_ESCR0, MSR_P4_TC_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, DD)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, DB)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, DI)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, BD)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, BB)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, BI)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, ID),
+		.shared		= 1,
 		.cntr		= { {4, 5, -1}, {6, 7, -1} },
 	},
 	[P4_EVENT_BPU_FETCH_REQUEST] = {
 		.opcode		= P4_OPCODE(P4_EVENT_BPU_FETCH_REQUEST),
 		.escr_msr	= { MSR_P4_BPU_ESCR0, MSR_P4_BPU_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_BPU_FETCH_REQUEST, TCMISS),
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_ITLB_REFERENCE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_ITLB_REFERENCE),
 		.escr_msr	= { MSR_P4_ITLB_ESCR0, MSR_P4_ITLB_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_ITLB_REFERENCE, HIT)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_ITLB_REFERENCE, MISS)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_ITLB_REFERENCE, HIT_UK),
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_MEMORY_CANCEL] = {
 		.opcode		= P4_OPCODE(P4_EVENT_MEMORY_CANCEL),
 		.escr_msr	= { MSR_P4_DAC_ESCR0, MSR_P4_DAC_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_MEMORY_CANCEL, ST_RB_FULL)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_MEMORY_CANCEL, 64K_CONF),
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_MEMORY_COMPLETE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_MEMORY_COMPLETE),
 		.escr_msr	= { MSR_P4_SAAT_ESCR0 , MSR_P4_SAAT_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_MEMORY_COMPLETE, LSC)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_MEMORY_COMPLETE, SSC),
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_LOAD_PORT_REPLAY] = {
 		.opcode		= P4_OPCODE(P4_EVENT_LOAD_PORT_REPLAY),
 		.escr_msr	= { MSR_P4_SAAT_ESCR0, MSR_P4_SAAT_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_LOAD_PORT_REPLAY, SPLIT_LD),
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_STORE_PORT_REPLAY] = {
 		.opcode		= P4_OPCODE(P4_EVENT_STORE_PORT_REPLAY),
 		.escr_msr	= { MSR_P4_SAAT_ESCR0 ,  MSR_P4_SAAT_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_STORE_PORT_REPLAY, SPLIT_ST),
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_MOB_LOAD_REPLAY] = {
 		.opcode		= P4_OPCODE(P4_EVENT_MOB_LOAD_REPLAY),
 		.escr_msr	= { MSR_P4_MOB_ESCR0, MSR_P4_MOB_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_MOB_LOAD_REPLAY, NO_STA)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_MOB_LOAD_REPLAY, NO_STD)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_MOB_LOAD_REPLAY, PARTIAL_DATA)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_MOB_LOAD_REPLAY, UNALGN_ADDR),
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_PAGE_WALK_TYPE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_PAGE_WALK_TYPE),
 		.escr_msr	= { MSR_P4_PMH_ESCR0, MSR_P4_PMH_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_PAGE_WALK_TYPE, DTMISS)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_PAGE_WALK_TYPE, ITMISS),
+		.shared		= 1,
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_BSQ_CACHE_REFERENCE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_BSQ_CACHE_REFERENCE),
 		.escr_msr	= { MSR_P4_BSU_ESCR0, MSR_P4_BSU_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITS)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITM)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITS)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITM)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_MISS)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_MISS)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, WR_2ndL_MISS),
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_IOQ_ALLOCATION] = {
 		.opcode		= P4_OPCODE(P4_EVENT_IOQ_ALLOCATION),
 		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, DEFAULT)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, ALL_READ)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, ALL_WRITE)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_UC)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_WC)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_WT)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_WP)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_WB)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, OWN)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, OTHER)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, PREFETCH),
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_IOQ_ACTIVE_ENTRIES] = {	/* shared ESCR */
 		.opcode		= P4_OPCODE(P4_EVENT_IOQ_ACTIVE_ENTRIES),
 		.escr_msr	= { MSR_P4_FSB_ESCR1,  MSR_P4_FSB_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, DEFAULT)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, ALL_READ)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, ALL_WRITE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_UC)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WC)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WT)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WP)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WB)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, OWN)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, OTHER)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, PREFETCH),
 		.cntr		= { {2, -1, -1}, {3, -1, -1} },
 	},
 	[P4_EVENT_FSB_DATA_ACTIVITY] = {
 		.opcode		= P4_OPCODE(P4_EVENT_FSB_DATA_ACTIVITY),
 		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_DRV)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_OWN)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_OTHER)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_DRV)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_OWN)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_OTHER),
+		.shared		= 1,
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_BSQ_ALLOCATION] = {		/* shared ESCR, broken CCCR1 */
 		.opcode		= P4_OPCODE(P4_EVENT_BSQ_ALLOCATION),
 		.escr_msr	= { MSR_P4_BSU_ESCR0, MSR_P4_BSU_ESCR0 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_TYPE0)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_TYPE1)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_LEN0)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_LEN1)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_IO_TYPE)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_LOCK_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_CACHE_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_SPLIT_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_DEM_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_ORD_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE0)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE1)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE2),
 		.cntr		= { {0, -1, -1}, {1, -1, -1} },
 	},
 	[P4_EVENT_BSQ_ACTIVE_ENTRIES] = {	/* shared ESCR */
 		.opcode		= P4_OPCODE(P4_EVENT_BSQ_ACTIVE_ENTRIES),
 		.escr_msr	= { MSR_P4_BSU_ESCR1 , MSR_P4_BSU_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_TYPE0)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_TYPE1)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LEN0)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LEN1)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_IO_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LOCK_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_CACHE_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_SPLIT_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_DEM_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_ORD_TYPE)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE0)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE1)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE2),
 		.cntr		= { {2, -1, -1}, {3, -1, -1} },
 	},
 	[P4_EVENT_SSE_INPUT_ASSIST] = {
 		.opcode		= P4_OPCODE(P4_EVENT_SSE_INPUT_ASSIST),
 		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_SSE_INPUT_ASSIST, ALL),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_PACKED_SP_UOP] = {
 		.opcode		= P4_OPCODE(P4_EVENT_PACKED_SP_UOP),
 		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_PACKED_SP_UOP, ALL),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_PACKED_DP_UOP] = {
 		.opcode		= P4_OPCODE(P4_EVENT_PACKED_DP_UOP),
 		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_PACKED_DP_UOP, ALL),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_SCALAR_SP_UOP] = {
 		.opcode		= P4_OPCODE(P4_EVENT_SCALAR_SP_UOP),
 		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_SCALAR_SP_UOP, ALL),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_SCALAR_DP_UOP] = {
 		.opcode		= P4_OPCODE(P4_EVENT_SCALAR_DP_UOP),
 		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_SCALAR_DP_UOP, ALL),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_64BIT_MMX_UOP] = {
 		.opcode		= P4_OPCODE(P4_EVENT_64BIT_MMX_UOP),
 		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_64BIT_MMX_UOP, ALL),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_128BIT_MMX_UOP] = {
 		.opcode		= P4_OPCODE(P4_EVENT_128BIT_MMX_UOP),
 		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_128BIT_MMX_UOP, ALL),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_X87_FP_UOP] = {
 		.opcode		= P4_OPCODE(P4_EVENT_X87_FP_UOP),
 		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_X87_FP_UOP, ALL),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_TC_MISC] = {
 		.opcode		= P4_OPCODE(P4_EVENT_TC_MISC),
 		.escr_msr	= { MSR_P4_TC_ESCR0, MSR_P4_TC_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_MISC, FLUSH),
 		.cntr		= { {4, 5, -1}, {6, 7, -1} },
 	},
 	[P4_EVENT_GLOBAL_POWER_EVENTS] = {
 		.opcode		= P4_OPCODE(P4_EVENT_GLOBAL_POWER_EVENTS),
 		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_GLOBAL_POWER_EVENTS, RUNNING),
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_TC_MS_XFER] = {
 		.opcode		= P4_OPCODE(P4_EVENT_TC_MS_XFER),
 		.escr_msr	= { MSR_P4_MS_ESCR0, MSR_P4_MS_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_TC_MS_XFER, CISC),
 		.cntr		= { {4, 5, -1}, {6, 7, -1} },
 	},
 	[P4_EVENT_UOP_QUEUE_WRITES] = {
 		.opcode		= P4_OPCODE(P4_EVENT_UOP_QUEUE_WRITES),
 		.escr_msr	= { MSR_P4_MS_ESCR0, MSR_P4_MS_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_QUEUE_WRITES, FROM_TC_BUILD)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_QUEUE_WRITES, FROM_TC_DELIVER)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_QUEUE_WRITES, FROM_ROM),
 		.cntr		= { {4, 5, -1}, {6, 7, -1} },
 	},
 	[P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE),
 		.escr_msr	= { MSR_P4_TBPU_ESCR0 , MSR_P4_TBPU_ESCR0 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, CONDITIONAL)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, CALL)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, RETURN)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, INDIRECT),
 		.cntr		= { {4, 5, -1}, {6, 7, -1} },
 	},
 	[P4_EVENT_RETIRED_BRANCH_TYPE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_RETIRED_BRANCH_TYPE),
 		.escr_msr	= { MSR_P4_TBPU_ESCR0 , MSR_P4_TBPU_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, CONDITIONAL)	|
+			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, CALL)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, RETURN)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, INDIRECT),
 		.cntr		= { {4, 5, -1}, {6, 7, -1} },
 	},
 	[P4_EVENT_RESOURCE_STALL] = {
 		.opcode		= P4_OPCODE(P4_EVENT_RESOURCE_STALL),
 		.escr_msr	= { MSR_P4_ALF_ESCR0, MSR_P4_ALF_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_RESOURCE_STALL, SBFULL),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_WC_BUFFER] = {
 		.opcode		= P4_OPCODE(P4_EVENT_WC_BUFFER),
 		.escr_msr	= { MSR_P4_DAC_ESCR0, MSR_P4_DAC_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_WC_BUFFER, WCB_EVICTS)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_WC_BUFFER, WCB_FULL_EVICTS),
+		.shared		= 1,
 		.cntr		= { {8, 9, -1}, {10, 11, -1} },
 	},
 	[P4_EVENT_B2B_CYCLES] = {
 		.opcode		= P4_OPCODE(P4_EVENT_B2B_CYCLES),
 		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
+		.escr_emask	= 0,
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_BNR] = {
 		.opcode		= P4_OPCODE(P4_EVENT_BNR),
 		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
+		.escr_emask	= 0,
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_SNOOP] = {
 		.opcode		= P4_OPCODE(P4_EVENT_SNOOP),
 		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
+		.escr_emask	= 0,
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_RESPONSE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_RESPONSE),
 		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
+		.escr_emask	= 0,
 		.cntr		= { {0, -1, -1}, {2, -1, -1} },
 	},
 	[P4_EVENT_FRONT_END_EVENT] = {
 		.opcode		= P4_OPCODE(P4_EVENT_FRONT_END_EVENT),
 		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_FRONT_END_EVENT, NBOGUS)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_FRONT_END_EVENT, BOGUS),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_EXECUTION_EVENT] = {
 		.opcode		= P4_OPCODE(P4_EVENT_EXECUTION_EVENT),
 		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS0)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS1)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS2)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS3)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS0)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS1)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS2)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS3),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_REPLAY_EVENT] = {
 		.opcode		= P4_OPCODE(P4_EVENT_REPLAY_EVENT),
 		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_REPLAY_EVENT, NBOGUS)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_REPLAY_EVENT, BOGUS),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_INSTR_RETIRED] = {
 		.opcode		= P4_OPCODE(P4_EVENT_INSTR_RETIRED),
 		.escr_msr	= { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, NBOGUSNTAG)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, NBOGUSTAG)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, BOGUSNTAG)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, BOGUSTAG),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_UOPS_RETIRED] = {
 		.opcode		= P4_OPCODE(P4_EVENT_UOPS_RETIRED),
 		.escr_msr	= { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_UOPS_RETIRED, NBOGUS)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_UOPS_RETIRED, BOGUS),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_UOP_TYPE] = {
 		.opcode		= P4_OPCODE(P4_EVENT_UOP_TYPE),
 		.escr_msr	= { MSR_P4_RAT_ESCR0, MSR_P4_RAT_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_TYPE, TAGLOADS)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_TYPE, TAGSTORES),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_BRANCH_RETIRED] = {
 		.opcode		= P4_OPCODE(P4_EVENT_BRANCH_RETIRED),
 		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_BRANCH_RETIRED, MMNP)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BRANCH_RETIRED, MMNM)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BRANCH_RETIRED, MMTP)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_BRANCH_RETIRED, MMTM),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_MISPRED_BRANCH_RETIRED] = {
 		.opcode		= P4_OPCODE(P4_EVENT_MISPRED_BRANCH_RETIRED),
 		.escr_msr	= { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 },
+		.escr_emask	=
+		P4_ESCR_EMASK_BIT(P4_EVENT_MISPRED_BRANCH_RETIRED, NBOGUS),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_X87_ASSIST] = {
 		.opcode		= P4_OPCODE(P4_EVENT_X87_ASSIST),
 		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, FPSU)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, FPSO)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, POAO)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, POAU)			|
+			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, PREA),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_MACHINE_CLEAR] = {
 		.opcode		= P4_OPCODE(P4_EVENT_MACHINE_CLEAR),
 		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_MACHINE_CLEAR, CLEAR)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_MACHINE_CLEAR, MOCLEAR)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_MACHINE_CLEAR, SMCLEAR),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 	[P4_EVENT_INSTR_COMPLETED] = {
 		.opcode		= P4_OPCODE(P4_EVENT_INSTR_COMPLETED),
 		.escr_msr	= { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 },
+		.escr_emask	=
+			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_COMPLETED, NBOGUS)		|
+			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_COMPLETED, BOGUS),
 		.cntr		= { {12, 13, 16}, {14, 15, 17} },
 	},
 };
@@ -428,29 +634,73 @@ static u64 p4_pmu_event_map(int hw_event)
 	return config;
 }
 
+/* check cpu model specifics */
+static bool p4_event_match_cpu_model(unsigned int event_idx)
+{
+	/* INSTR_COMPLETED event only exists for models 3, 4 and 6 (Prescott) */
+	if (event_idx == P4_EVENT_INSTR_COMPLETED) {
+		if (boot_cpu_data.x86_model != 3 &&
+			boot_cpu_data.x86_model != 4 &&
+			boot_cpu_data.x86_model != 6)
+			return false;
+	}
+
+	/*
+	 * For info
+	 * - IQ_ESCR0, IQ_ESCR1 only for models 1 and 2
+	 */
+
+	return true;
+}
+
 static int p4_validate_raw_event(struct perf_event *event)
 {
-	unsigned int v;
+	unsigned int v, emask;
 
-	/* user data may have out-of-bound event index */
+	/* User data may have out-of-bound event index */
 	v = p4_config_unpack_event(event->attr.config);
-	if (v >= ARRAY_SIZE(p4_event_bind_map)) {
-		pr_warning("P4 PMU: Unknown event code: %d\n", v);
+	if (v >= ARRAY_SIZE(p4_event_bind_map))
+		return -EINVAL;
+
+	/* It may be unsupported: */
+	if (!p4_event_match_cpu_model(v))
 		return -EINVAL;
+
+	/*
+	 * NOTE: P4_CCCR_THREAD_ANY does not have the same meaning as
+	 * in Architectural Performance Monitoring: it selects not
+	 * _which_ logical cpu to count on but rather _when_, i.e. it
+	 * depends on logical cpu state -- count the event if one cpu is
+	 * active, none, both or any -- so we simply allow the user to
+	 * pass any desired value.
+	 *
+	 * In turn we always set the Tx_OS/Tx_USR bits bound to the local
+	 * logical cpu, without propagating them to the other cpu.
+	 */
+
+	/*
+	 * If an event is shared across the logical threads,
+	 * the user needs special permissions to be able to use it.
+	 */
+	if (p4_event_bind_map[v].shared) {
+		if (perf_paranoid_cpu() && !capable(CAP_SYS_ADMIN))
+			return -EACCES;
 	}
 
+	/* ESCR EventMask bits may be invalid */
+	emask = p4_config_unpack_escr(event->attr.config) & P4_ESCR_EVENTMASK_MASK;
+	if (emask & ~p4_event_bind_map[v].escr_emask)
+		return -EINVAL;
+
 	/*
-	 * it may have some screwed PEBS bits
+	 * it may have some invalid PEBS bits
 	 */
-	if (p4_config_pebs_has(event->attr.config, P4_PEBS_CONFIG_ENABLE)) {
-		pr_warning("P4 PMU: PEBS are not supported yet\n");
+	if (p4_config_pebs_has(event->attr.config, P4_PEBS_CONFIG_ENABLE))
 		return -EINVAL;
-	}
+
 	v = p4_config_unpack_metric(event->attr.config);
-	if (v >= ARRAY_SIZE(p4_pebs_bind_map)) {
-		pr_warning("P4 PMU: Unknown metric code: %d\n", v);
+	if (v >= ARRAY_SIZE(p4_pebs_bind_map))
 		return -EINVAL;
-	}
 
 	return 0;
 }
@@ -478,27 +728,21 @@ static int p4_hw_config(struct perf_event *event)
 
 	if (event->attr.type == PERF_TYPE_RAW) {
 
+		/*
+		 * Clear bits we reserve to be managed by the kernel itself
+		 * and never allow them to be set from user space
+		 */
+		event->attr.config &= P4_CONFIG_MASK;
+
 		rc = p4_validate_raw_event(event);
 		if (rc)
 			goto out;
 
 		/*
-		 * We don't control raw events so it's up to the caller
-		 * to pass sane values (and we don't count the thread number
-		 * on HT machine but allow HT-compatible specifics to be
-		 * passed on)
-		 *
 		 * Note that for RAW events we allow user to use P4_CCCR_RESERVED
 		 * bits since we keep additional info here (for cache events and etc)
-		 *
-		 * XXX: HT wide things should check perf_paranoid_cpu() &&
-		 *      CAP_SYS_ADMIN
 		 */
-		event->hw.config |= event->attr.config &
-			(p4_config_pack_escr(P4_ESCR_MASK_HT) |
-			 p4_config_pack_cccr(P4_CCCR_MASK_HT | P4_CCCR_RESERVED));
-
-		event->hw.config &= ~P4_CCCR_FORCE_OVF;
+		event->hw.config |= event->attr.config;
 	}
 
 	rc = x86_setup_perfctr(event);

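The new escr_emask field drives the stricter validation above: a raw config whose ESCR EventMask sets bits the event does not define is now rejected with -EINVAL, and events marked .shared (their ESCR is visible to both hyperthreads) additionally require CAP_SYS_ADMIN under perf_paranoid_cpu(). The core of the mask check is plain set containment; a stand-alone illustration with invented names:

	/* Reject a requested EventMask if it sets bits outside the supported set. */
	static inline int emask_is_valid(unsigned int requested, unsigned int supported)
	{
		return (requested & ~supported) == 0;
	}
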
+ 3 - 3
arch/x86/kernel/entry_64.S

@@ -1023,9 +1023,9 @@ apicinterrupt ERROR_APIC_VECTOR \
 apicinterrupt SPURIOUS_APIC_VECTOR \
 	spurious_interrupt smp_spurious_interrupt
 
-#ifdef CONFIG_PERF_EVENTS
-apicinterrupt LOCAL_PENDING_VECTOR \
-	perf_pending_interrupt smp_perf_pending_interrupt
+#ifdef CONFIG_IRQ_WORK
+apicinterrupt IRQ_WORK_VECTOR \
+	irq_work_interrupt smp_irq_work_interrupt
 #endif
 
 /*

+ 1 - 62
arch/x86/kernel/ftrace.c

@@ -257,14 +257,9 @@ do_ftrace_mod_code(unsigned long ip, void *new_code)
 	return mod_code_status;
 }
 
-
-
-
-static unsigned char ftrace_nop[MCOUNT_INSN_SIZE];
-
 static unsigned char *ftrace_nop_replace(void)
 {
-	return ftrace_nop;
+	return ideal_nop5;
 }
 
 static int
@@ -338,62 +333,6 @@ int ftrace_update_ftrace_func(ftrace_func_t func)
 
 int __init ftrace_dyn_arch_init(void *data)
 {
-	extern const unsigned char ftrace_test_p6nop[];
-	extern const unsigned char ftrace_test_nop5[];
-	extern const unsigned char ftrace_test_jmp[];
-	int faulted = 0;
-
-	/*
-	 * There is no good nop for all x86 archs.
-	 * We will default to using the P6_NOP5, but first we
-	 * will test to make sure that the nop will actually
-	 * work on this CPU. If it faults, we will then
-	 * go to a lesser efficient 5 byte nop. If that fails
-	 * we then just use a jmp as our nop. This isn't the most
-	 * efficient nop, but we can not use a multi part nop
-	 * since we would then risk being preempted in the middle
-	 * of that nop, and if we enabled tracing then, it might
-	 * cause a system crash.
-	 *
-	 * TODO: check the cpuid to determine the best nop.
-	 */
-	asm volatile (
-		"ftrace_test_jmp:"
-		"jmp ftrace_test_p6nop\n"
-		"nop\n"
-		"nop\n"
-		"nop\n"  /* 2 byte jmp + 3 bytes */
-		"ftrace_test_p6nop:"
-		P6_NOP5
-		"jmp 1f\n"
-		"ftrace_test_nop5:"
-		".byte 0x66,0x66,0x66,0x66,0x90\n"
-		"1:"
-		".section .fixup, \"ax\"\n"
-		"2:	movl $1, %0\n"
-		"	jmp ftrace_test_nop5\n"
-		"3:	movl $2, %0\n"
-		"	jmp 1b\n"
-		".previous\n"
-		_ASM_EXTABLE(ftrace_test_p6nop, 2b)
-		_ASM_EXTABLE(ftrace_test_nop5, 3b)
-		: "=r"(faulted) : "0" (faulted));
-
-	switch (faulted) {
-	case 0:
-		pr_info("converting mcount calls to 0f 1f 44 00 00\n");
-		memcpy(ftrace_nop, ftrace_test_p6nop, MCOUNT_INSN_SIZE);
-		break;
-	case 1:
-		pr_info("converting mcount calls to 66 66 66 66 90\n");
-		memcpy(ftrace_nop, ftrace_test_nop5, MCOUNT_INSN_SIZE);
-		break;
-	case 2:
-		pr_info("converting mcount calls to jmp . + 5\n");
-		memcpy(ftrace_nop, ftrace_test_jmp, MCOUNT_INSN_SIZE);
-		break;
-	}
-
 	/* The return code is returned via data */
 	*(unsigned long *)data = 0;
 

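ftrace no longer probes for a working 5-byte NOP itself; it reuses ideal_nop5, which arch_init_ideal_nop5() selects once during setup_arch() (see the arch/x86/kernel/setup.c hunk further down) and which the new jump label code shares. For reference, two of the byte sequences the removed probe used to choose between, taken from its pr_info() strings, were:

	/* 5-byte NOP candidates the removed probe tested (the third fallback
	 * was a short jmp over three filler bytes). */
	static const unsigned char p6_nop5[] = { 0x0f, 0x1f, 0x44, 0x00, 0x00 };
	static const unsigned char k8_nop5[] = { 0x66, 0x66, 0x66, 0x66, 0x90 };
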
+ 4 - 4
arch/x86/kernel/irq.c

@@ -67,10 +67,10 @@ static int show_other_interrupts(struct seq_file *p, int prec)
 	for_each_online_cpu(j)
 		seq_printf(p, "%10u ", irq_stats(j)->apic_perf_irqs);
 	seq_printf(p, "  Performance monitoring interrupts\n");
-	seq_printf(p, "%*s: ", prec, "PND");
+	seq_printf(p, "%*s: ", prec, "IWI");
 	for_each_online_cpu(j)
-		seq_printf(p, "%10u ", irq_stats(j)->apic_pending_irqs);
-	seq_printf(p, "  Performance pending work\n");
+		seq_printf(p, "%10u ", irq_stats(j)->apic_irq_work_irqs);
+	seq_printf(p, "  IRQ work interrupts\n");
 #endif
 	if (x86_platform_ipi_callback) {
 		seq_printf(p, "%*s: ", prec, "PLT");
@@ -185,7 +185,7 @@ u64 arch_irq_stat_cpu(unsigned int cpu)
 	sum += irq_stats(cpu)->apic_timer_irqs;
 	sum += irq_stats(cpu)->irq_spurious_count;
 	sum += irq_stats(cpu)->apic_perf_irqs;
-	sum += irq_stats(cpu)->apic_pending_irqs;
+	sum += irq_stats(cpu)->apic_irq_work_irqs;
 #endif
 	if (x86_platform_ipi_callback)
 		sum += irq_stats(cpu)->x86_platform_ipis;

+ 30 - 0
arch/x86/kernel/irq_work.c

@@ -0,0 +1,30 @@
+/*
+ * x86 specific code for irq_work
+ *
+ * Copyright (C) 2010 Red Hat, Inc., Peter Zijlstra <pzijlstr@redhat.com>
+ */
+
+#include <linux/kernel.h>
+#include <linux/irq_work.h>
+#include <linux/hardirq.h>
+#include <asm/apic.h>
+
+void smp_irq_work_interrupt(struct pt_regs *regs)
+{
+	irq_enter();
+	ack_APIC_irq();
+	inc_irq_stat(apic_irq_work_irqs);
+	irq_work_run();
+	irq_exit();
+}
+
+void arch_irq_work_raise(void)
+{
+#ifdef CONFIG_X86_LOCAL_APIC
+	if (!cpu_has_apic)
+		return;
+
+	apic->send_IPI_self(IRQ_WORK_VECTOR);
+	apic_wait_icr_idle();
+#endif
+}
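
These two functions are the x86 backing for the new generic irq_work facility: code running in NMI or other unsafe contexts queues a callback, arch_irq_work_raise() sends a self-IPI on IRQ_WORK_VECTOR, and smp_irq_work_interrupt() runs the queued callbacks from ordinary hardirq context. A hedged usage sketch, assuming the generic <linux/irq_work.h> API introduced by this series provides init_irq_work() and irq_work_queue():

	#include <linux/irq_work.h>
	#include <linux/kernel.h>

	static void my_deferred_func(struct irq_work *work)
	{
		/* Runs later, in hardirq context, outside the NMI. */
		pr_info("deferred work ran\n");
	}

	static struct irq_work my_work;

	static void my_setup(void)
	{
		init_irq_work(&my_work, my_deferred_func);
	}

	static void called_from_nmi(void)
	{
		/* Safe from NMI: just queues the work and raises IRQ_WORK_VECTOR. */
		irq_work_queue(&my_work);
	}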

+ 3 - 3
arch/x86/kernel/irqinit.c

@@ -224,9 +224,9 @@ static void __init apic_intr_init(void)
 	alloc_intr_gate(SPURIOUS_APIC_VECTOR, spurious_interrupt);
 	alloc_intr_gate(ERROR_APIC_VECTOR, error_interrupt);
 
-	/* Performance monitoring interrupts: */
-# ifdef CONFIG_PERF_EVENTS
-	alloc_intr_gate(LOCAL_PENDING_VECTOR, perf_pending_interrupt);
+	/* IRQ work interrupts: */
+# ifdef CONFIG_IRQ_WORK
+	alloc_intr_gate(IRQ_WORK_VECTOR, irq_work_interrupt);
 # endif
 
 #endif

+ 50 - 0
arch/x86/kernel/jump_label.c

@@ -0,0 +1,50 @@
+/*
+ * jump label x86 support
+ *
+ * Copyright (C) 2009 Jason Baron <jbaron@redhat.com>
+ *
+ */
+#include <linux/jump_label.h>
+#include <linux/memory.h>
+#include <linux/uaccess.h>
+#include <linux/module.h>
+#include <linux/list.h>
+#include <linux/jhash.h>
+#include <linux/cpu.h>
+#include <asm/kprobes.h>
+#include <asm/alternative.h>
+
+#ifdef HAVE_JUMP_LABEL
+
+union jump_code_union {
+	char code[JUMP_LABEL_NOP_SIZE];
+	struct {
+		char jump;
+		int offset;
+	} __attribute__((packed));
+};
+
+void arch_jump_label_transform(struct jump_entry *entry,
+			       enum jump_label_type type)
+{
+	union jump_code_union code;
+
+	if (type == JUMP_LABEL_ENABLE) {
+		code.jump = 0xe9;
+		code.offset = entry->target -
+				(entry->code + JUMP_LABEL_NOP_SIZE);
+	} else
+		memcpy(&code, ideal_nop5, JUMP_LABEL_NOP_SIZE);
+	get_online_cpus();
+	mutex_lock(&text_mutex);
+	text_poke_smp((void *)entry->code, &code, JUMP_LABEL_NOP_SIZE);
+	mutex_unlock(&text_mutex);
+	put_online_cpus();
+}
+
+void arch_jump_label_text_poke_early(jump_label_t addr)
+{
+	text_poke_early((void *)addr, ideal_nop5, JUMP_LABEL_NOP_SIZE);
+}
+
+#endif
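
The enable path above overwrites the 5-byte ideal_nop5 at the jump site with a near jump whose 32-bit displacement is relative to the end of the instruction. The same arithmetic in isolation, as a user-space style illustration (names invented):

	#include <stdint.h>
	#include <string.h>

	/* Build the 5-byte "jmp rel32" that replaces the NOP when a jump
	 * label is enabled: opcode 0xe9 followed by target - (site + 5). */
	static void encode_jmp(uint8_t buf[5], uint64_t site, uint64_t target)
	{
		int32_t rel = (int32_t)(target - (site + 5));

		buf[0] = 0xe9;
		memcpy(&buf[1], &rel, sizeof(rel));
	}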

+ 5 - 9
arch/x86/kernel/kprobes.c

@@ -230,9 +230,6 @@ static int recover_probed_instruction(kprobe_opcode_t *buf, unsigned long addr)
 	return 0;
 }
 
-/* Dummy buffers for kallsyms_lookup */
-static char __dummy_buf[KSYM_NAME_LEN];
-
 /* Check if paddr is at an instruction boundary */
 static int __kprobes can_probe(unsigned long paddr)
 {
@@ -241,7 +238,7 @@ static int __kprobes can_probe(unsigned long paddr)
 	struct insn insn;
 	kprobe_opcode_t buf[MAX_INSN_SIZE];
 
-	if (!kallsyms_lookup(paddr, NULL, &offset, NULL, __dummy_buf))
+	if (!kallsyms_lookup_size_offset(paddr, NULL, &offset))
 		return 0;
 
 	/* Decode instructions */
@@ -1129,7 +1126,7 @@ static void __kprobes synthesize_set_arg1(kprobe_opcode_t *addr,
 	*(unsigned long *)addr = val;
 }
 
-void __kprobes kprobes_optinsn_template_holder(void)
+static void __used __kprobes kprobes_optinsn_template_holder(void)
 {
 	asm volatile (
 			".global optprobe_template_entry\n"
@@ -1221,7 +1218,8 @@ static int __kprobes copy_optimized_instructions(u8 *dest, u8 *src)
 	}
 	/* Check whether the address range is reserved */
 	if (ftrace_text_reserved(src, src + len - 1) ||
-	    alternatives_text_reserved(src, src + len - 1))
+	    alternatives_text_reserved(src, src + len - 1) ||
+	    jump_label_text_reserved(src, src + len - 1))
 		return -EBUSY;
 
 	return len;
@@ -1269,11 +1267,9 @@ static int __kprobes can_optimize(unsigned long paddr)
 	unsigned long addr, size = 0, offset = 0;
 	struct insn insn;
 	kprobe_opcode_t buf[MAX_INSN_SIZE];
-	/* Dummy buffers for lookup_symbol_attrs */
-	static char __dummy_buf[KSYM_NAME_LEN];
 
 	/* Lookup symbol including addr */
-	if (!kallsyms_lookup(paddr, &size, &offset, NULL, __dummy_buf))
+	if (!kallsyms_lookup_size_offset(paddr, &size, &offset))
 		return 0;
 
 	/* Check there is enough space for a relative jump. */

+ 3 - 0
arch/x86/kernel/module.c

@@ -239,6 +239,9 @@ int module_finalize(const Elf_Ehdr *hdr,
 		apply_paravirt(pseg, pseg + para->sh_size);
 	}
 
+	/* make jump label nops */
+	jump_label_apply_nops(me);
+
 	return 0;
 }
 

+ 6 - 0
arch/x86/kernel/setup.c

@@ -112,6 +112,7 @@
 #include <asm/numa_64.h>
 #endif
 #include <asm/mce.h>
+#include <asm/alternative.h>
 
 /*
  * end_pfn only includes RAM, while max_pfn_mapped includes all e820 entries.
@@ -726,6 +727,7 @@ void __init setup_arch(char **cmdline_p)
 {
 	int acpi = 0;
 	int k8 = 0;
+	unsigned long flags;
 
 #ifdef CONFIG_X86_32
 	memcpy(&boot_cpu_data, &new_cpu_data, sizeof(new_cpu_data));
@@ -1071,6 +1073,10 @@ void __init setup_arch(char **cmdline_p)
 	x86_init.oem.banner();
 
 	mcheck_init();
+
+	local_irq_save(flags);
+	arch_init_ideal_nop5();
+	local_irq_restore(flags);
 }
 
 #ifdef CONFIG_X86_32

+ 4 - 0
arch/x86/mm/fault.c

@@ -251,6 +251,8 @@ static noinline __kprobes int vmalloc_fault(unsigned long address)
 	if (!(address >= VMALLOC_START && address < VMALLOC_END))
 		return -1;
 
+	WARN_ON_ONCE(in_nmi());
+
 	/*
 	 * Synchronize this task's top level page-table
 	 * with the 'reference' page table.
@@ -369,6 +371,8 @@ static noinline __kprobes int vmalloc_fault(unsigned long address)
 	if (!(address >= VMALLOC_START && address < VMALLOC_END))
 		return -1;
 
+	WARN_ON_ONCE(in_nmi());
+
 	/*
 	 * Copy kernel mappings over when needed. This can also
 	 * happen within a race in page table update. In the later

+ 2 - 0
arch/x86/mm/kmemcheck/kmemcheck.c

@@ -631,6 +631,8 @@ bool kmemcheck_fault(struct pt_regs *regs, unsigned long address,
 	if (!pte)
 		return false;
 
+	WARN_ON_ONCE(in_nmi());
+
 	if (error_code & 2)
 		kmemcheck_access(regs, address, KMEMCHECK_WRITE);
 	else

+ 59 - 11
arch/x86/oprofile/backtrace.c

@@ -14,6 +14,7 @@
 #include <asm/ptrace.h>
 #include <asm/uaccess.h>
 #include <asm/stacktrace.h>
+#include <linux/compat.h>
 
 static void backtrace_warning_symbol(void *data, char *msg,
 				     unsigned long symbol)
@@ -48,14 +49,12 @@ static struct stacktrace_ops backtrace_ops = {
 	.walk_stack	= print_context_stack,
 };
 
-struct frame_head {
-	struct frame_head *bp;
-	unsigned long ret;
-} __attribute__((packed));
-
-static struct frame_head *dump_user_backtrace(struct frame_head *head)
+#ifdef CONFIG_COMPAT
+static struct stack_frame_ia32 *
+dump_user_backtrace_32(struct stack_frame_ia32 *head)
 {
-	struct frame_head bufhead[2];
+	struct stack_frame_ia32 bufhead[2];
+	struct stack_frame_ia32 *fp;
 
 	/* Also check accessibility of one struct stack_frame_ia32 beyond */
 	if (!access_ok(VERIFY_READ, head, sizeof(bufhead)))
@@ -63,20 +62,66 @@ static struct frame_head *dump_user_backtrace(struct frame_head *head)
 	if (__copy_from_user_inatomic(bufhead, head, sizeof(bufhead)))
 		return NULL;
 
-	oprofile_add_trace(bufhead[0].ret);
+	fp = (struct stack_frame_ia32 *) compat_ptr(bufhead[0].next_frame);
+
+	oprofile_add_trace(bufhead[0].return_address);
+
+	/* frame pointers should strictly progress back up the stack
+	 * (towards higher addresses) */
+	if (head >= fp)
+		return NULL;
+
+	return fp;
+}
+
+static inline int
+x86_backtrace_32(struct pt_regs * const regs, unsigned int depth)
+{
+	struct stack_frame_ia32 *head;
+
+	/* User process is 32-bit */
+	if (!current || !test_thread_flag(TIF_IA32))
+		return 0;
+
+	head = (struct stack_frame_ia32 *) regs->bp;
+	while (depth-- && head)
+		head = dump_user_backtrace_32(head);
+
+	return 1;
+}
+
+#else
+static inline int
+x86_backtrace_32(struct pt_regs * const regs, unsigned int depth)
+{
+	return 0;
+}
+#endif /* CONFIG_COMPAT */
+
+static struct stack_frame *dump_user_backtrace(struct stack_frame *head)
+{
+	struct stack_frame bufhead[2];
+
+	/* Also check accessibility of one struct stack_frame beyond */
+	if (!access_ok(VERIFY_READ, head, sizeof(bufhead)))
+		return NULL;
+	if (__copy_from_user_inatomic(bufhead, head, sizeof(bufhead)))
+		return NULL;
+
+	oprofile_add_trace(bufhead[0].return_address);
 
 	/* frame pointers should strictly progress back up the stack
 	 * (towards higher addresses) */
-	if (head >= bufhead[0].bp)
+	if (head >= bufhead[0].next_frame)
 		return NULL;
 
-	return bufhead[0].bp;
+	return bufhead[0].next_frame;
 }
 
 void
 x86_backtrace(struct pt_regs * const regs, unsigned int depth)
 {
-	struct frame_head *head = (struct frame_head *)frame_pointer(regs);
+	struct stack_frame *head = (struct stack_frame *)frame_pointer(regs);
 
 	if (!user_mode_vm(regs)) {
 		unsigned long stack = kernel_stack_pointer(regs);
@@ -86,6 +131,9 @@ x86_backtrace(struct pt_regs * const regs, unsigned int depth)
 		return;
 	}
 
+	if (x86_backtrace_32(regs, depth))
+		return;
+
 	while (depth-- && head)
 		head = dump_user_backtrace(head);
 }

+ 1 - 8
arch/x86/oprofile/nmi_int.c

@@ -695,9 +695,6 @@ static int __init ppro_init(char **cpu_type)
 	return 1;
 }
 
-/* in order to get sysfs right */
-static int using_nmi;
-
 int __init op_nmi_init(struct oprofile_operations *ops)
 {
 	__u8 vendor = boot_cpu_data.x86_vendor;
@@ -705,8 +702,6 @@ int __init op_nmi_init(struct oprofile_operations *ops)
 	char *cpu_type = NULL;
 	int ret = 0;
 
-	using_nmi = 0;
-
 	if (!cpu_has_apic)
 		return -ENODEV;
 
@@ -790,13 +785,11 @@ int __init op_nmi_init(struct oprofile_operations *ops)
 	if (ret)
 		return ret;
 
-	using_nmi = 1;
 	printk(KERN_INFO "oprofile: using NMI interrupt.\n");
 	return 0;
 }
 
 void op_nmi_exit(void)
 {
-	if (using_nmi)
-		exit_sysfs();
+	exit_sysfs();
 }

+ 8 - 24
drivers/oprofile/oprof.c

@@ -225,26 +225,17 @@ post_sync:
 	mutex_unlock(&start_mutex);
 }
 
-int oprofile_set_backtrace(unsigned long val)
+int oprofile_set_ulong(unsigned long *addr, unsigned long val)
 {
-	int err = 0;
+	int err = -EBUSY;
 
 	mutex_lock(&start_mutex);
-
-	if (oprofile_started) {
-		err = -EBUSY;
-		goto out;
-	}
-
-	if (!oprofile_ops.backtrace) {
-		err = -EINVAL;
-		goto out;
+	if (!oprofile_started) {
+		*addr = val;
+		err = 0;
 	}
-
-	oprofile_backtrace_depth = val;
-
-out:
 	mutex_unlock(&start_mutex);
+
 	return err;
 }
 
@@ -257,16 +248,9 @@ static int __init oprofile_init(void)
 		printk(KERN_INFO "oprofile: using timer interrupt.\n");
 		err = oprofile_timer_init(&oprofile_ops);
 		if (err)
-			goto out_arch;
+			return err;
 	}
-	err = oprofilefs_register();
-	if (err)
-		goto out_arch;
-	return 0;
-
-out_arch:
-	oprofile_arch_exit();
-	return err;
+	return oprofilefs_register();
 }
 
 

+ 1 - 1
drivers/oprofile/oprof.h

@@ -37,7 +37,7 @@ void oprofile_create_files(struct super_block *sb, struct dentry *root);
 int oprofile_timer_init(struct oprofile_operations *ops);
 void oprofile_timer_exit(void);
 
-int oprofile_set_backtrace(unsigned long depth);
+int oprofile_set_ulong(unsigned long *addr, unsigned long val);
 int oprofile_set_timeout(unsigned long time);
 
 #endif /* OPROF_H */

+ 5 - 2
drivers/oprofile/oprofile_files.c

@@ -79,14 +79,17 @@ static ssize_t depth_write(struct file *file, char const __user *buf, size_t cou
 	if (*offset)
 		return -EINVAL;
 
+	if (!oprofile_ops.backtrace)
+		return -EINVAL;
+
 	retval = oprofilefs_ulong_from_user(&val, buf, count);
 	if (retval)
 		return retval;
 
-	retval = oprofile_set_backtrace(val);
-
+	retval = oprofile_set_ulong(&oprofile_backtrace_depth, val);
 	if (retval)
 		return retval;
+
 	return count;
 }
 

+ 328 - 0
drivers/oprofile/oprofile_perf.c

@@ -0,0 +1,328 @@
+/*
+ * Copyright 2010 ARM Ltd.
+ *
+ * Perf-events backend for OProfile.
+ */
+#include <linux/perf_event.h>
+#include <linux/platform_device.h>
+#include <linux/oprofile.h>
+#include <linux/slab.h>
+
+/*
+ * Per performance monitor configuration as set via oprofilefs.
+ */
+struct op_counter_config {
+	unsigned long count;
+	unsigned long enabled;
+	unsigned long event;
+	unsigned long unit_mask;
+	unsigned long kernel;
+	unsigned long user;
+	struct perf_event_attr attr;
+};
+
+static int oprofile_perf_enabled;
+static DEFINE_MUTEX(oprofile_perf_mutex);
+
+static struct op_counter_config *counter_config;
+static struct perf_event **perf_events[nr_cpumask_bits];
+static int num_counters;
+
+/*
+ * Overflow callback for oprofile.
+ */
+static void op_overflow_handler(struct perf_event *event, int unused,
+			struct perf_sample_data *data, struct pt_regs *regs)
+{
+	int id;
+	u32 cpu = smp_processor_id();
+
+	for (id = 0; id < num_counters; ++id)
+		if (perf_events[cpu][id] == event)
+			break;
+
+	if (id != num_counters)
+		oprofile_add_sample(regs, id);
+	else
+		pr_warning("oprofile: ignoring spurious overflow "
+				"on cpu %u\n", cpu);
+}
+
+/*
+ * Called by oprofile_perf_setup to create perf attributes to mirror the oprofile
+ * settings in counter_config. Attributes are created as `pinned' events and
+ * so are permanently scheduled on the PMU.
+ */
+static void op_perf_setup(void)
+{
+	int i;
+	u32 size = sizeof(struct perf_event_attr);
+	struct perf_event_attr *attr;
+
+	for (i = 0; i < num_counters; ++i) {
+		attr = &counter_config[i].attr;
+		memset(attr, 0, size);
+		attr->type		= PERF_TYPE_RAW;
+		attr->size		= size;
+		attr->config		= counter_config[i].event;
+		attr->sample_period	= counter_config[i].count;
+		attr->pinned		= 1;
+	}
+}
+
+static int op_create_counter(int cpu, int event)
+{
+	struct perf_event *pevent;
+
+	if (!counter_config[event].enabled || perf_events[cpu][event])
+		return 0;
+
+	pevent = perf_event_create_kernel_counter(&counter_config[event].attr,
+						  cpu, NULL,
+						  op_overflow_handler);
+
+	if (IS_ERR(pevent))
+		return PTR_ERR(pevent);
+
+	if (pevent->state != PERF_EVENT_STATE_ACTIVE) {
+		perf_event_release_kernel(pevent);
+		pr_warning("oprofile: failed to enable event %d "
+				"on CPU %d\n", event, cpu);
+		return -EBUSY;
+	}
+
+	perf_events[cpu][event] = pevent;
+
+	return 0;
+}
+
+static void op_destroy_counter(int cpu, int event)
+{
+	struct perf_event *pevent = perf_events[cpu][event];
+
+	if (pevent) {
+		perf_event_release_kernel(pevent);
+		perf_events[cpu][event] = NULL;
+	}
+}
+
+/*
+ * Called by oprofile_perf_start to create active perf events based on the
+ * previously configured attributes.
+ */
+static int op_perf_start(void)
+{
+	int cpu, event, ret = 0;
+
+	for_each_online_cpu(cpu) {
+		for (event = 0; event < num_counters; ++event) {
+			ret = op_create_counter(cpu, event);
+			if (ret)
+				return ret;
+		}
+	}
+
+	return ret;
+}
+
+/*
+ * Called by oprofile_perf_stop at the end of a profiling run.
+ */
+static void op_perf_stop(void)
+{
+	int cpu, event;
+
+	for_each_online_cpu(cpu)
+		for (event = 0; event < num_counters; ++event)
+			op_destroy_counter(cpu, event);
+}
+
+static int oprofile_perf_create_files(struct super_block *sb, struct dentry *root)
+{
+	unsigned int i;
+
+	for (i = 0; i < num_counters; i++) {
+		struct dentry *dir;
+		char buf[4];
+
+		snprintf(buf, sizeof buf, "%d", i);
+		dir = oprofilefs_mkdir(sb, root, buf);
+		oprofilefs_create_ulong(sb, dir, "enabled", &counter_config[i].enabled);
+		oprofilefs_create_ulong(sb, dir, "event", &counter_config[i].event);
+		oprofilefs_create_ulong(sb, dir, "count", &counter_config[i].count);
+		oprofilefs_create_ulong(sb, dir, "unit_mask", &counter_config[i].unit_mask);
+		oprofilefs_create_ulong(sb, dir, "kernel", &counter_config[i].kernel);
+		oprofilefs_create_ulong(sb, dir, "user", &counter_config[i].user);
+	}
+
+	return 0;
+}
+
+static int oprofile_perf_setup(void)
+{
+	spin_lock(&oprofilefs_lock);
+	op_perf_setup();
+	spin_unlock(&oprofilefs_lock);
+	return 0;
+}
+
+static int oprofile_perf_start(void)
+{
+	int ret = -EBUSY;
+
+	mutex_lock(&oprofile_perf_mutex);
+	if (!oprofile_perf_enabled) {
+		ret = 0;
+		op_perf_start();
+		oprofile_perf_enabled = 1;
+	}
+	mutex_unlock(&oprofile_perf_mutex);
+	return ret;
+}
+
+static void oprofile_perf_stop(void)
+{
+	mutex_lock(&oprofile_perf_mutex);
+	if (oprofile_perf_enabled)
+		op_perf_stop();
+	oprofile_perf_enabled = 0;
+	mutex_unlock(&oprofile_perf_mutex);
+}
+
+#ifdef CONFIG_PM
+
+static int oprofile_perf_suspend(struct platform_device *dev, pm_message_t state)
+{
+	mutex_lock(&oprofile_perf_mutex);
+	if (oprofile_perf_enabled)
+		op_perf_stop();
+	mutex_unlock(&oprofile_perf_mutex);
+	return 0;
+}
+
+static int oprofile_perf_resume(struct platform_device *dev)
+{
+	mutex_lock(&oprofile_perf_mutex);
+	if (oprofile_perf_enabled && op_perf_start())
+		oprofile_perf_enabled = 0;
+	mutex_unlock(&oprofile_perf_mutex);
+	return 0;
+}
+
+static struct platform_driver oprofile_driver = {
+	.driver		= {
+		.name		= "oprofile-perf",
+	},
+	.resume		= oprofile_perf_resume,
+	.suspend	= oprofile_perf_suspend,
+};
+
+static struct platform_device *oprofile_pdev;
+
+static int __init init_driverfs(void)
+{
+	int ret;
+
+	ret = platform_driver_register(&oprofile_driver);
+	if (ret)
+		return ret;
+
+	oprofile_pdev =	platform_device_register_simple(
+				oprofile_driver.driver.name, 0, NULL, 0);
+	if (IS_ERR(oprofile_pdev)) {
+		ret = PTR_ERR(oprofile_pdev);
+		platform_driver_unregister(&oprofile_driver);
+	}
+
+	return ret;
+}
+
+static void exit_driverfs(void)
+{
+	platform_device_unregister(oprofile_pdev);
+	platform_driver_unregister(&oprofile_driver);
+}
+
+#else
+
+static inline int  init_driverfs(void) { return 0; }
+static inline void exit_driverfs(void) { }
+
+#endif /* CONFIG_PM */
+
+void oprofile_perf_exit(void)
+{
+	int cpu, id;
+	struct perf_event *event;
+
+	for_each_possible_cpu(cpu) {
+		for (id = 0; id < num_counters; ++id) {
+			event = perf_events[cpu][id];
+			if (event)
+				perf_event_release_kernel(event);
+		}
+
+		kfree(perf_events[cpu]);
+	}
+
+	kfree(counter_config);
+	exit_driverfs();
+}
+
+int __init oprofile_perf_init(struct oprofile_operations *ops)
+{
+	int cpu, ret = 0;
+
+	ret = init_driverfs();
+	if (ret)
+		return ret;
+
+	memset(&perf_events, 0, sizeof(perf_events));
+
+	num_counters = perf_num_counters();
+	if (num_counters <= 0) {
+		pr_info("oprofile: no performance counters\n");
+		ret = -ENODEV;
+		goto out;
+	}
+
+	counter_config = kcalloc(num_counters,
+			sizeof(struct op_counter_config), GFP_KERNEL);
+
+	if (!counter_config) {
+		pr_info("oprofile: failed to allocate %d "
+				"counters\n", num_counters);
+		ret = -ENOMEM;
+		num_counters = 0;
+		goto out;
+	}
+
+	for_each_possible_cpu(cpu) {
+		perf_events[cpu] = kcalloc(num_counters,
+				sizeof(struct perf_event *), GFP_KERNEL);
+		if (!perf_events[cpu]) {
+			pr_info("oprofile: failed to allocate %d perf events "
+					"for cpu %d\n", num_counters, cpu);
+			ret = -ENOMEM;
+			goto out;
+		}
+	}
+
+	ops->create_files	= oprofile_perf_create_files;
+	ops->setup		= oprofile_perf_setup;
+	ops->start		= oprofile_perf_start;
+	ops->stop		= oprofile_perf_stop;
+	ops->shutdown		= oprofile_perf_stop;
+	ops->cpu_type		= op_name_from_perf_id();
+
+	if (!ops->cpu_type)
+		ret = -ENODEV;
+	else
+		pr_info("oprofile: using %s\n", ops->cpu_type);
+
+out:
+	if (ret)
+		oprofile_perf_exit();
+
+	return ret;
+}

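The oprofile_perf_init()/oprofile_perf_exit() pair above is designed to be called from an architecture's existing oprofile hooks, with the port only having to supply op_name_from_perf_id(). A minimal sketch of that wiring, illustrative rather than copied from any one port in this series (the cpu_type string below is a placeholder):

	#include <linux/oprofile.h>
	#include <linux/init.h>

	/* Port-specific: map the perf PMU in use to an oprofile cpu_type string. */
	char *op_name_from_perf_id(void)
	{
		return "arch/perf-events";	/* placeholder name */
	}

	int __init oprofile_arch_init(struct oprofile_operations *ops)
	{
		/* Fills in ops->create_files/setup/start/stop/shutdown and cpu_type. */
		return oprofile_perf_init(ops);
	}

	void oprofile_arch_exit(void)
	{
		oprofile_perf_exit();
	}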
+ 20 - 34
drivers/oprofile/oprofilefs.c

@@ -91,16 +91,20 @@ static ssize_t ulong_read_file(struct file *file, char __user *buf, size_t count
 
 static ssize_t ulong_write_file(struct file *file, char const __user *buf, size_t count, loff_t *offset)
 {
-	unsigned long *value = file->private_data;
+	unsigned long value;
 	int retval;
 
 	if (*offset)
 		return -EINVAL;
 
-	retval = oprofilefs_ulong_from_user(value, buf, count);
+	retval = oprofilefs_ulong_from_user(&value, buf, count);
+	if (retval)
+		return retval;
 
+	retval = oprofile_set_ulong(file->private_data, value);
 	if (retval)
 		return retval;
+
 	return count;
 }
 
@@ -126,50 +130,41 @@ static const struct file_operations ulong_ro_fops = {
 };
 
 
-static struct dentry *__oprofilefs_create_file(struct super_block *sb,
+static int __oprofilefs_create_file(struct super_block *sb,
 	struct dentry *root, char const *name, const struct file_operations *fops,
-	int perm)
+	int perm, void *priv)
 {
 	struct dentry *dentry;
 	struct inode *inode;
 
 	dentry = d_alloc_name(root, name);
 	if (!dentry)
-		return NULL;
+		return -ENOMEM;
 	inode = oprofilefs_get_inode(sb, S_IFREG | perm);
 	if (!inode) {
 		dput(dentry);
-		return NULL;
+		return -ENOMEM;
 	}
 	inode->i_fop = fops;
 	d_add(dentry, inode);
-	return dentry;
+	dentry->d_inode->i_private = priv;
+	return 0;
 }
 
 
 int oprofilefs_create_ulong(struct super_block *sb, struct dentry *root,
 	char const *name, unsigned long *val)
 {
-	struct dentry *d = __oprofilefs_create_file(sb, root, name,
-						     &ulong_fops, 0644);
-	if (!d)
-		return -EFAULT;
-
-	d->d_inode->i_private = val;
-	return 0;
+	return __oprofilefs_create_file(sb, root, name,
+					&ulong_fops, 0644, val);
 }
 
 
 int oprofilefs_create_ro_ulong(struct super_block *sb, struct dentry *root,
 	char const *name, unsigned long *val)
 {
-	struct dentry *d = __oprofilefs_create_file(sb, root, name,
-						     &ulong_ro_fops, 0444);
-	if (!d)
-		return -EFAULT;
-
-	d->d_inode->i_private = val;
-	return 0;
+	return __oprofilefs_create_file(sb, root, name,
+					&ulong_ro_fops, 0444, val);
 }
 
 
@@ -189,31 +184,22 @@ static const struct file_operations atomic_ro_fops = {
 int oprofilefs_create_ro_atomic(struct super_block *sb, struct dentry *root,
 	char const *name, atomic_t *val)
 {
-	struct dentry *d = __oprofilefs_create_file(sb, root, name,
-						     &atomic_ro_fops, 0444);
-	if (!d)
-		return -EFAULT;
-
-	d->d_inode->i_private = val;
-	return 0;
+	return __oprofilefs_create_file(sb, root, name,
+					&atomic_ro_fops, 0444, val);
 }
 
 
 int oprofilefs_create_file(struct super_block *sb, struct dentry *root,
 	char const *name, const struct file_operations *fops)
 {
-	if (!__oprofilefs_create_file(sb, root, name, fops, 0644))
-		return -EFAULT;
-	return 0;
+	return __oprofilefs_create_file(sb, root, name, fops, 0644, NULL);
 }
 
 
 int oprofilefs_create_file_perm(struct super_block *sb, struct dentry *root,
 	char const *name, const struct file_operations *fops, int perm)
 {
-	if (!__oprofilefs_create_file(sb, root, name, fops, perm))
-		return -EFAULT;
-	return 0;
+	return __oprofilefs_create_file(sb, root, name, fops, perm, NULL);
 }
 
 

+ 1 - 1
include/asm-generic/hardirq.h

@@ -3,13 +3,13 @@
 
 #include <linux/cache.h>
 #include <linux/threads.h>
-#include <linux/irq.h>
 
 typedef struct {
 	unsigned int __softirq_pending;
 } ____cacheline_aligned irq_cpustat_t;
 
 #include <linux/irq_cpustat.h>	/* Standard mappings for irq_cpustat_t above */
+#include <linux/irq.h>
 
 #ifndef ack_bad_irq
 static inline void ack_bad_irq(unsigned int irq)

+ 10 - 0
include/asm-generic/vmlinux.lds.h

@@ -220,6 +220,8 @@
 									\
 	BUG_TABLE							\
 									\
+	JUMP_TABLE							\
+									\
 	/* PCI quirks */						\
 	.pci_fixup        : AT(ADDR(.pci_fixup) - LOAD_OFFSET) {	\
 		VMLINUX_SYMBOL(__start_pci_fixups_early) = .;		\
@@ -563,6 +565,14 @@
 #define BUG_TABLE
 #endif
 
+#define JUMP_TABLE							\
+	. = ALIGN(8);							\
+	__jump_table : AT(ADDR(__jump_table) - LOAD_OFFSET) {		\
+		VMLINUX_SYMBOL(__start___jump_table) = .;		\
+		*(__jump_table)						\
+		VMLINUX_SYMBOL(__stop___jump_table) = .;		\
+	}
+
 #ifdef CONFIG_PM_TRACE
 #define TRACEDATA							\
 	. = ALIGN(4);							\

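For reference, the records collected between __start___jump_table and __stop___jump_table are emitted once per JUMP_LABEL() call site. A sketch of their layout, modeled on the 64-bit x86 definition added elsewhere in this merge (the exact field width is architecture-specific):

	typedef u64 jump_label_t;		/* wide enough for a kernel address */

	struct jump_entry {
		jump_label_t	code;		/* address of the patchable nop */
		jump_label_t	target;		/* branch target once the key is enabled */
		jump_label_t	key;		/* address of the controlling key variable */
	};

The ALIGN(8) above keeps these records naturally aligned in the image so the patching code can walk them as a plain array.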
+ 21 - 18
include/linux/dynamic_debug.h

@@ -1,6 +1,8 @@
 #ifndef _DYNAMIC_DEBUG_H
 #define _DYNAMIC_DEBUG_H
 
+#include <linux/jump_label.h>
+
 /* dynamic_printk_enabled, and dynamic_printk_enabled2 are bitmasks in which
  * bit n is set to 1 if any modname hashes into the bucket n, 0 otherwise. They
  * use independent hash functions, to reduce the chance of false positives.
@@ -22,8 +24,6 @@ struct _ddebug {
 	const char *function;
 	const char *filename;
 	const char *format;
-	char primary_hash;
-	char secondary_hash;
 	unsigned int lineno:24;
 	/*
  	 * The flags field controls the behaviour at the callsite.
@@ -33,6 +33,7 @@ struct _ddebug {
 #define _DPRINTK_FLAGS_PRINT   (1<<0)  /* printk() a message using the format */
 #define _DPRINTK_FLAGS_DEFAULT 0
 	unsigned int flags:8;
+	char enabled;
 } __attribute__((aligned(8)));
 
 
@@ -42,33 +43,35 @@ int ddebug_add_module(struct _ddebug *tab, unsigned int n,
 #if defined(CONFIG_DYNAMIC_DEBUG)
 extern int ddebug_remove_module(const char *mod_name);
 
-#define __dynamic_dbg_enabled(dd)  ({	     \
-	int __ret = 0;							     \
-	if (unlikely((dynamic_debug_enabled & (1LL << DEBUG_HASH)) &&	     \
-			(dynamic_debug_enabled2 & (1LL << DEBUG_HASH2))))   \
-				if (unlikely(dd.flags))			     \
-					__ret = 1;			     \
-	__ret; })
-
 #define dynamic_pr_debug(fmt, ...) do {					\
+	__label__ do_printk;						\
+	__label__ out;							\
 	static struct _ddebug descriptor				\
 	__used								\
 	__attribute__((section("__verbose"), aligned(8))) =		\
-	{ KBUILD_MODNAME, __func__, __FILE__, fmt, DEBUG_HASH,	\
-		DEBUG_HASH2, __LINE__, _DPRINTK_FLAGS_DEFAULT };	\
-	if (__dynamic_dbg_enabled(descriptor))				\
-		printk(KERN_DEBUG pr_fmt(fmt),	##__VA_ARGS__);		\
+	{ KBUILD_MODNAME, __func__, __FILE__, fmt, __LINE__,		\
+		_DPRINTK_FLAGS_DEFAULT };				\
+	JUMP_LABEL(&descriptor.enabled, do_printk);			\
+	goto out;							\
+do_printk:								\
+	printk(KERN_DEBUG pr_fmt(fmt),	##__VA_ARGS__);			\
+out:	;								\
 	} while (0)
 
 
 #define dynamic_dev_dbg(dev, fmt, ...) do {				\
+	__label__ do_printk;						\
+	__label__ out;							\
 	static struct _ddebug descriptor				\
 	__used								\
 	__attribute__((section("__verbose"), aligned(8))) =		\
-	{ KBUILD_MODNAME, __func__, __FILE__, fmt, DEBUG_HASH,	\
-		DEBUG_HASH2, __LINE__, _DPRINTK_FLAGS_DEFAULT };	\
-	if (__dynamic_dbg_enabled(descriptor))				\
-		dev_printk(KERN_DEBUG, dev, fmt, ##__VA_ARGS__);	\
+	{ KBUILD_MODNAME, __func__, __FILE__, fmt, __LINE__,		\
+		_DPRINTK_FLAGS_DEFAULT };				\
+	JUMP_LABEL(&descriptor.enabled, do_printk);			\
+	goto out;							\
+do_printk:								\
+	dev_printk(KERN_DEBUG, dev, fmt, ##__VA_ARGS__);		\
+out:	;								\
 	} while (0)
 
 #else

+ 4 - 4
include/linux/ftrace_event.h

@@ -191,8 +191,8 @@ struct ftrace_event_call {
 	unsigned int		flags;
 
 #ifdef CONFIG_PERF_EVENTS
-	int			perf_refcount;
-	struct hlist_head	*perf_events;
+	int				perf_refcount;
+	struct hlist_head __percpu	*perf_events;
 #endif
 };
 
@@ -252,8 +252,8 @@ DECLARE_PER_CPU(struct pt_regs, perf_trace_regs);
 
 extern int  perf_trace_init(struct perf_event *event);
 extern void perf_trace_destroy(struct perf_event *event);
-extern int  perf_trace_enable(struct perf_event *event);
-extern void perf_trace_disable(struct perf_event *event);
+extern int  perf_trace_add(struct perf_event *event, int flags);
+extern void perf_trace_del(struct perf_event *event, int flags);
 extern int  ftrace_profile_set_filter(struct perf_event *event, int event_id,
 				     char *filter_str);
 extern void ftrace_profile_free_filter(struct perf_event *event);

+ 7 - 1
include/linux/interrupt.h

@@ -18,6 +18,7 @@
 #include <asm/atomic.h>
 #include <asm/ptrace.h>
 #include <asm/system.h>
+#include <trace/events/irq.h>
 
 /*
  * These correspond to the IORESOURCE_IRQ_* defines in
@@ -407,7 +408,12 @@ asmlinkage void do_softirq(void);
 asmlinkage void __do_softirq(void);
 extern void open_softirq(int nr, void (*action)(struct softirq_action *));
 extern void softirq_init(void);
-#define __raise_softirq_irqoff(nr) do { or_softirq_pending(1UL << (nr)); } while (0)
+static inline void __raise_softirq_irqoff(unsigned int nr)
+{
+	trace_softirq_raise((struct softirq_action *)(unsigned long)nr, NULL);
+	or_softirq_pending(1UL << nr);
+}
+
 extern void raise_softirq_irqoff(unsigned int nr);
 extern void raise_softirq(unsigned int nr);
 extern void wakeup_softirqd(void);

+ 20 - 0
include/linux/irq_work.h

@@ -0,0 +1,20 @@
+#ifndef _LINUX_IRQ_WORK_H
+#define _LINUX_IRQ_WORK_H
+
+struct irq_work {
+	struct irq_work *next;
+	void (*func)(struct irq_work *);
+};
+
+static inline
+void init_irq_work(struct irq_work *entry, void (*func)(struct irq_work *))
+{
+	entry->next = NULL;
+	entry->func = func;
+}
+
+bool irq_work_queue(struct irq_work *entry);
+void irq_work_run(void);
+void irq_work_sync(struct irq_work *entry);
+
+#endif /* _LINUX_IRQ_WORK_H */

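This small interface is what the perf changes in this merge build on: a callback can be queued from any context, including NMI, and is run from the next hardirq (or from the timer tick on architectures without a self-interrupt). A hedged usage sketch with made-up names:

	#include <linux/irq_work.h>

	static void my_deferred_fn(struct irq_work *work)
	{
		/* runs later, in hardirq context with interrupts disabled */
	}

	static struct irq_work my_work;

	static void my_setup(void)
	{
		init_irq_work(&my_work, my_deferred_fn);
	}

	/* enqueue is lock-free, so this is legal even from an NMI handler */
	static void my_nmi_path(void)
	{
		if (!irq_work_queue(&my_work)) {
			/* already pending; the callback will still run once */
		}
	}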
+ 74 - 0
include/linux/jump_label.h

@@ -0,0 +1,74 @@
+#ifndef _LINUX_JUMP_LABEL_H
+#define _LINUX_JUMP_LABEL_H
+
+#if defined(CC_HAVE_ASM_GOTO) && defined(CONFIG_HAVE_ARCH_JUMP_LABEL)
+# include <asm/jump_label.h>
+# define HAVE_JUMP_LABEL
+#endif
+
+enum jump_label_type {
+	JUMP_LABEL_ENABLE,
+	JUMP_LABEL_DISABLE
+};
+
+struct module;
+
+#ifdef HAVE_JUMP_LABEL
+
+extern struct jump_entry __start___jump_table[];
+extern struct jump_entry __stop___jump_table[];
+
+extern void arch_jump_label_transform(struct jump_entry *entry,
+				 enum jump_label_type type);
+extern void arch_jump_label_text_poke_early(jump_label_t addr);
+extern void jump_label_update(unsigned long key, enum jump_label_type type);
+extern void jump_label_apply_nops(struct module *mod);
+extern int jump_label_text_reserved(void *start, void *end);
+
+#define jump_label_enable(key) \
+	jump_label_update((unsigned long)key, JUMP_LABEL_ENABLE);
+
+#define jump_label_disable(key) \
+	jump_label_update((unsigned long)key, JUMP_LABEL_DISABLE);
+
+#else
+
+#define JUMP_LABEL(key, label)			\
+do {						\
+	if (unlikely(*key))			\
+		goto label;			\
+} while (0)
+
+#define jump_label_enable(cond_var)	\
+do {					\
+       *(cond_var) = 1;			\
+} while (0)
+
+#define jump_label_disable(cond_var)	\
+do {					\
+       *(cond_var) = 0;			\
+} while (0)
+
+static inline int jump_label_apply_nops(struct module *mod)
+{
+	return 0;
+}
+
+static inline int jump_label_text_reserved(void *start, void *end)
+{
+	return 0;
+}
+
+#endif
+
+#define COND_STMT(key, stmt)					\
+do {								\
+	__label__ jl_enabled;					\
+	JUMP_LABEL(key, jl_enabled);				\
+	if (0) {						\
+jl_enabled:							\
+		stmt;						\
+	}							\
+} while (0)
+
+#endif

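On compilers with asm goto, JUMP_LABEL() compiles to a single patchable nop on the fast path; otherwise it degrades to the unlikely() test in the #else branch above. A minimal, hypothetical call site using the raw key interface (dynamic_debug below uses exactly this pattern with a char key embedded in its descriptor):

	static char my_feature_key;		/* the key the branch is patched against */

	static void my_hot_path(void)
	{
		JUMP_LABEL(&my_feature_key, do_slow);
		return;				/* fast path: falls straight through */
	do_slow:
		printk(KERN_DEBUG "slow path taken\n");	/* rarely-executed work */
	}

	void my_feature_enable(void)		/* hypothetical control knob */
	{
		jump_label_enable(&my_feature_key);	/* patch the nop into a jump */
	}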
+ 44 - 0
include/linux/jump_label_ref.h

@@ -0,0 +1,44 @@
+#ifndef _LINUX_JUMP_LABEL_REF_H
+#define _LINUX_JUMP_LABEL_REF_H
+
+#include <linux/jump_label.h>
+#include <asm/atomic.h>
+
+#ifdef HAVE_JUMP_LABEL
+
+static inline void jump_label_inc(atomic_t *key)
+{
+	if (atomic_add_return(1, key) == 1)
+		jump_label_enable(key);
+}
+
+static inline void jump_label_dec(atomic_t *key)
+{
+	if (atomic_dec_and_test(key))
+		jump_label_disable(key);
+}
+
+#else /* !HAVE_JUMP_LABEL */
+
+static inline void jump_label_inc(atomic_t *key)
+{
+	atomic_inc(key);
+}
+
+static inline void jump_label_dec(atomic_t *key)
+{
+	atomic_dec(key);
+}
+
+#undef JUMP_LABEL
+#define JUMP_LABEL(key, label)						\
+do {									\
+	if (unlikely(__builtin_choose_expr(				\
+	      __builtin_types_compatible_p(typeof(key), atomic_t *),	\
+	      atomic_read((atomic_t *)(key)), *(key))))			\
+		goto label;						\
+} while (0)
+
+#endif /* HAVE_JUMP_LABEL */
+
+#endif /* _LINUX_JUMP_LABEL_REF_H */

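The atomic_t variant layers reference counting on top, so several independent users can keep the same branch enabled and the site is only patched back to a nop when the last one drops out. A small hypothetical sketch, mirroring how perf_swevent_enabled[] is used further down in this diff:

	static atomic_t my_key = ATOMIC_INIT(0);

	void my_user_register(void)
	{
		jump_label_inc(&my_key);	/* the 0 -> 1 transition enables the branch */
	}

	void my_user_unregister(void)
	{
		jump_label_dec(&my_key);	/* the last decrement disables it again */
	}

	static void my_hot_path(void)
	{
		JUMP_LABEL(&my_key, have_user);
		return;
	have_user:
		/* slow path: only reached while at least one user is registered */ ;
	}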
+ 4 - 1
include/linux/module.h

@@ -350,7 +350,10 @@ struct module
 	struct tracepoint *tracepoints;
 	unsigned int num_tracepoints;
 #endif
-
+#ifdef HAVE_JUMP_LABEL
+	struct jump_entry *jump_entries;
+	unsigned int num_jump_entries;
+#endif
 #ifdef CONFIG_TRACING
 	const char **trace_bprintk_fmt_start;
 	unsigned int num_trace_bprintk_fmt;

+ 7 - 0
include/linux/oprofile.h

@@ -15,6 +15,7 @@
 
 #include <linux/types.h>
 #include <linux/spinlock.h>
+#include <linux/init.h>
 #include <asm/atomic.h>
  
 /* Each escaped entry is prefixed by ESCAPE_CODE
@@ -185,4 +186,10 @@ int oprofile_add_data(struct op_entry *entry, unsigned long val);
 int oprofile_add_data64(struct op_entry *entry, u64 val);
 int oprofile_write_commit(struct op_entry *entry);
 
+#ifdef CONFIG_PERF_EVENTS
+int __init oprofile_perf_init(struct oprofile_operations *ops);
+void oprofile_perf_exit(void);
+char *op_name_from_perf_id(void);
+#endif /* CONFIG_PERF_EVENTS */
+
 #endif /* OPROFILE_H */

+ 9 - 0
include/linux/percpu.h

@@ -39,6 +39,15 @@
 	preempt_enable();				\
 } while (0)
 
+#define get_cpu_ptr(var) ({				\
+	preempt_disable();				\
+	this_cpu_ptr(var); })
+
+#define put_cpu_ptr(var) do {				\
+	(void)(var);					\
+	preempt_enable();				\
+} while (0)
+
 #ifdef CONFIG_SMP
 
 /* minimum unit size, also is the maximum supported allocation size */

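get_cpu_ptr()/put_cpu_ptr() are the pointer-based counterparts of get_cpu_var()/put_cpu_var(): they bracket this_cpu_ptr() with preemption disable/enable, which is how the new per-pmu per-cpu contexts are accessed later in this series. A hedged sketch with a hypothetical per-cpu counter:

	struct my_stats {
		u64	hits;
	};

	static struct my_stats __percpu *my_stats;	/* allocated with alloc_percpu() */

	static void my_count_hit(void)
	{
		struct my_stats *s;

		s = get_cpu_ptr(my_stats);	/* preempt_disable() + this CPU's instance */
		s->hits++;
		put_cpu_ptr(my_stats);		/* preempt_enable() */
	}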
+ 138 - 74
include/linux/perf_event.h

@@ -486,6 +486,8 @@ struct perf_guest_info_callbacks {
 #include <linux/workqueue.h>
 #include <linux/ftrace.h>
 #include <linux/cpu.h>
+#include <linux/irq_work.h>
+#include <linux/jump_label_ref.h>
 #include <asm/atomic.h>
 #include <asm/local.h>
 
@@ -529,16 +531,22 @@ struct hw_perf_event {
 			int		last_cpu;
 		};
 		struct { /* software */
-			s64		remaining;
 			struct hrtimer	hrtimer;
 		};
 #ifdef CONFIG_HAVE_HW_BREAKPOINT
 		struct { /* breakpoint */
 			struct arch_hw_breakpoint	info;
 			struct list_head		bp_list;
+			/*
+			 * Crufty hack to avoid the chicken and egg
+			 * problem hw_breakpoint has with context
+			 * creation and event initalization.
+			 * creation and event initialization.
+			struct task_struct		*bp_target;
 		};
 #endif
 	};
+	int				state;
 	local64_t			prev_count;
 	u64				sample_period;
 	u64				last_period;
@@ -550,6 +558,13 @@ struct hw_perf_event {
 #endif
 };
 
+/*
+ * hw_perf_event::state flags
+ */
+#define PERF_HES_STOPPED	0x01 /* the counter is stopped */
+#define PERF_HES_UPTODATE	0x02 /* event->count up-to-date */
+#define PERF_HES_ARCH		0x04
+
 struct perf_event;
 
 /*
@@ -561,36 +576,70 @@ struct perf_event;
  * struct pmu - generic performance monitoring unit
  */
 struct pmu {
-	int (*enable)			(struct perf_event *event);
-	void (*disable)			(struct perf_event *event);
-	int (*start)			(struct perf_event *event);
-	void (*stop)			(struct perf_event *event);
-	void (*read)			(struct perf_event *event);
-	void (*unthrottle)		(struct perf_event *event);
+	struct list_head		entry;
+
+	int * __percpu			pmu_disable_count;
+	struct perf_cpu_context * __percpu pmu_cpu_context;
+	int				task_ctx_nr;
+
+	/*
+	 * Fully disable/enable this PMU, can be used to protect from the PMI
+	 * as well as for lazy/batch writing of the MSRs.
+	 */
+	void (*pmu_enable)		(struct pmu *pmu); /* optional */
+	void (*pmu_disable)		(struct pmu *pmu); /* optional */
 
 	/*
-	 * Group events scheduling is treated as a transaction, add group
-	 * events as a whole and perform one schedulability test. If the test
-	 * fails, roll back the whole group
+	 * Try and initialize the event for this PMU.
+	 * Should return -ENOENT when the @event doesn't match this PMU.
 	 */
+	int (*event_init)		(struct perf_event *event);
+
+#define PERF_EF_START	0x01		/* start the counter when adding    */
+#define PERF_EF_RELOAD	0x02		/* reload the counter when starting */
+#define PERF_EF_UPDATE	0x04		/* update the counter when stopping */
 
 	/*
-	 * Start the transaction, after this ->enable() doesn't need
-	 * to do schedulability tests.
+	 * Adds/Removes a counter to/from the PMU, can be done inside
+	 * a transaction, see the ->*_txn() methods.
 	 */
-	void (*start_txn)	(const struct pmu *pmu);
+	int  (*add)			(struct perf_event *event, int flags);
+	void (*del)			(struct perf_event *event, int flags);
+
 	/*
-	 * If ->start_txn() disabled the ->enable() schedulability test
+	 * Starts/Stops a counter present on the PMU. The PMI handler
+	 * should stop the counter when perf_event_overflow() returns
+	 * !0. ->start() will be used to continue.
+	 */
+	void (*start)			(struct perf_event *event, int flags);
+	void (*stop)			(struct perf_event *event, int flags);
+
+	/*
+	 * Updates the counter value of the event.
+	 */
+	void (*read)			(struct perf_event *event);
+
+	/*
+	 * Group events scheduling is treated as a transaction, add
+	 * group events as a whole and perform one schedulability test.
+	 * If the test fails, roll back the whole group
+	 *
+	 * Start the transaction, after this ->add() doesn't need to
+	 * do schedulability tests.
+	 */
+	void (*start_txn)	(struct pmu *pmu); /* optional */
+	/*
+	 * If ->start_txn() disabled the ->add() schedulability test
 	 * then ->commit_txn() is required to perform one. On success
 	 * the transaction is closed. On error the transaction is kept
 	 * open until ->cancel_txn() is called.
 	 */
-	int  (*commit_txn)	(const struct pmu *pmu);
+	int  (*commit_txn)	(struct pmu *pmu); /* optional */
 	/*
-	 * Will cancel the transaction, assumes ->disable() is called for
-	 * each successfull ->enable() during the transaction.
+	 * Will cancel the transaction, assumes ->del() is called
+	 * for each successful ->add() during the transaction.
 	 */
-	void (*cancel_txn)	(const struct pmu *pmu);
+	void (*cancel_txn)	(struct pmu *pmu); /* optional */
 };
 
 /**
@@ -631,11 +680,6 @@ struct perf_buffer {
 	void				*data_pages[0];
 };
 
-struct perf_pending_entry {
-	struct perf_pending_entry *next;
-	void (*func)(struct perf_pending_entry *);
-};
-
 struct perf_sample_data;
 
 typedef void (*perf_overflow_handler_t)(struct perf_event *, int,
@@ -656,6 +700,7 @@ struct swevent_hlist {
 
 #define PERF_ATTACH_CONTEXT	0x01
 #define PERF_ATTACH_GROUP	0x02
+#define PERF_ATTACH_TASK	0x04
 
 /**
  * struct perf_event - performance event kernel representation:
@@ -669,7 +714,7 @@ struct perf_event {
 	int				nr_siblings;
 	int				group_flags;
 	struct perf_event		*group_leader;
-	const struct pmu		*pmu;
+	struct pmu			*pmu;
 
 	enum perf_event_active_state	state;
 	unsigned int			attach_state;
@@ -743,7 +788,7 @@ struct perf_event {
 	int				pending_wakeup;
 	int				pending_kill;
 	int				pending_disable;
-	struct perf_pending_entry	pending;
+	struct irq_work			pending;
 
 	atomic_t			event_limit;
 
@@ -763,12 +808,19 @@ struct perf_event {
 #endif /* CONFIG_PERF_EVENTS */
 };
 
+enum perf_event_context_type {
+	task_context,
+	cpu_context,
+};
+
 /**
  * struct perf_event_context - event context structure
  *
  * Used as a container for task events and CPU events as well:
  */
 struct perf_event_context {
+	enum perf_event_context_type	type;
+	struct pmu			*pmu;
 	/*
 	 * Protect the states of the events in the list,
 	 * nr_active, and the list:
@@ -808,6 +860,12 @@ struct perf_event_context {
 	struct rcu_head			rcu_head;
 };
 
+/*
+ * Number of contexts where an event can trigger:
+ * 	task, softirq, hardirq, nmi.
+ */
+#define PERF_NR_CONTEXTS	4
+
 /**
  * struct perf_event_cpu_context - per cpu event context structure
  */
@@ -815,18 +873,9 @@ struct perf_cpu_context {
 	struct perf_event_context	ctx;
 	struct perf_event_context	*task_ctx;
 	int				active_oncpu;
-	int				max_pertask;
 	int				exclusive;
-	struct swevent_hlist		*swevent_hlist;
-	struct mutex			hlist_mutex;
-	int				hlist_refcount;
-
-	/*
-	 * Recursion avoidance:
-	 *
-	 * task, softirq, irq, nmi context
-	 */
-	int				recursion[4];
+	struct list_head		rotation_list;
+	int				jiffies_interval;
 };
 
 struct perf_output_handle {
@@ -842,26 +891,34 @@ struct perf_output_handle {
 
 #ifdef CONFIG_PERF_EVENTS
 
-/*
- * Set by architecture code:
- */
-extern int perf_max_events;
+extern int perf_pmu_register(struct pmu *pmu);
+extern void perf_pmu_unregister(struct pmu *pmu);
+
+extern int perf_num_counters(void);
+extern const char *perf_pmu_name(void);
+extern void __perf_event_task_sched_in(struct task_struct *task);
+extern void __perf_event_task_sched_out(struct task_struct *task, struct task_struct *next);
 
-extern const struct pmu *hw_perf_event_init(struct perf_event *event);
+extern atomic_t perf_task_events;
+
+static inline void perf_event_task_sched_in(struct task_struct *task)
+{
+	COND_STMT(&perf_task_events, __perf_event_task_sched_in(task));
+}
+
+static inline
+void perf_event_task_sched_out(struct task_struct *task, struct task_struct *next)
+{
+	COND_STMT(&perf_task_events, __perf_event_task_sched_out(task, next));
+}
 
-extern void perf_event_task_sched_in(struct task_struct *task);
-extern void perf_event_task_sched_out(struct task_struct *task, struct task_struct *next);
-extern void perf_event_task_tick(struct task_struct *task);
 extern int perf_event_init_task(struct task_struct *child);
 extern void perf_event_exit_task(struct task_struct *child);
 extern void perf_event_free_task(struct task_struct *task);
-extern void set_perf_event_pending(void);
-extern void perf_event_do_pending(void);
+extern void perf_event_delayed_put(struct task_struct *task);
 extern void perf_event_print_debug(void);
-extern void __perf_disable(void);
-extern bool __perf_enable(void);
-extern void perf_disable(void);
-extern void perf_enable(void);
+extern void perf_pmu_disable(struct pmu *pmu);
+extern void perf_pmu_enable(struct pmu *pmu);
 extern int perf_event_task_disable(void);
 extern int perf_event_task_enable(void);
 extern void perf_event_update_userpage(struct perf_event *event);
@@ -869,7 +926,7 @@ extern int perf_event_release_kernel(struct perf_event *event);
 extern struct perf_event *
 perf_event_create_kernel_counter(struct perf_event_attr *attr,
 				int cpu,
-				pid_t pid,
+				struct task_struct *task,
 				perf_overflow_handler_t callback);
 extern u64 perf_event_read_value(struct perf_event *event,
 				 u64 *enabled, u64 *running);
@@ -920,14 +977,7 @@ extern int perf_event_overflow(struct perf_event *event, int nmi,
  */
 static inline int is_software_event(struct perf_event *event)
 {
-	switch (event->attr.type) {
-	case PERF_TYPE_SOFTWARE:
-	case PERF_TYPE_TRACEPOINT:
-	/* for now the breakpoint stuff also works as software event */
-	case PERF_TYPE_BREAKPOINT:
-		return 1;
-	}
-	return 0;
+	return event->pmu->task_ctx_nr == perf_sw_context;
 }
 
 extern atomic_t perf_swevent_enabled[PERF_COUNT_SW_MAX];
@@ -954,18 +1004,20 @@ static inline void perf_fetch_caller_regs(struct pt_regs *regs)
 	perf_arch_fetch_caller_regs(regs, CALLER_ADDR0);
 }
 
-static inline void
+static __always_inline void
 perf_sw_event(u32 event_id, u64 nr, int nmi, struct pt_regs *regs, u64 addr)
 {
-	if (atomic_read(&perf_swevent_enabled[event_id])) {
-		struct pt_regs hot_regs;
-
-		if (!regs) {
-			perf_fetch_caller_regs(&hot_regs);
-			regs = &hot_regs;
-		}
-		__perf_sw_event(event_id, nr, nmi, regs, addr);
+	struct pt_regs hot_regs;
+
+	JUMP_LABEL(&perf_swevent_enabled[event_id], have_event);
+	return;
+
+have_event:
+	if (!regs) {
+		perf_fetch_caller_regs(&hot_regs);
+		regs = &hot_regs;
 	}
+	__perf_sw_event(event_id, nr, nmi, regs, addr);
 }
 
 extern void perf_event_mmap(struct vm_area_struct *vma);
@@ -976,7 +1028,21 @@ extern int perf_unregister_guest_info_callbacks(struct perf_guest_info_callbacks
 extern void perf_event_comm(struct task_struct *tsk);
 extern void perf_event_fork(struct task_struct *tsk);
 
-extern struct perf_callchain_entry *perf_callchain(struct pt_regs *regs);
+/* Callchains */
+DECLARE_PER_CPU(struct perf_callchain_entry, perf_callchain_entry);
+
+extern void perf_callchain_user(struct perf_callchain_entry *entry,
+				struct pt_regs *regs);
+extern void perf_callchain_kernel(struct perf_callchain_entry *entry,
+				  struct pt_regs *regs);
+
+
+static inline void
+perf_callchain_store(struct perf_callchain_entry *entry, u64 ip)
+{
+	if (entry->nr < PERF_MAX_STACK_DEPTH)
+		entry->ip[entry->nr++] = ip;
+}
 
 extern int sysctl_perf_event_paranoid;
 extern int sysctl_perf_event_mlock;
@@ -1019,21 +1085,18 @@ extern int perf_swevent_get_recursion_context(void);
 extern void perf_swevent_put_recursion_context(int rctx);
 extern void perf_event_enable(struct perf_event *event);
 extern void perf_event_disable(struct perf_event *event);
+extern void perf_event_task_tick(void);
 #else
 static inline void
 perf_event_task_sched_in(struct task_struct *task)			{ }
 static inline void
 perf_event_task_sched_out(struct task_struct *task,
 			    struct task_struct *next)			{ }
-static inline void
-perf_event_task_tick(struct task_struct *task)				{ }
 static inline int perf_event_init_task(struct task_struct *child)	{ return 0; }
 static inline void perf_event_exit_task(struct task_struct *child)	{ }
 static inline void perf_event_free_task(struct task_struct *task)	{ }
-static inline void perf_event_do_pending(void)				{ }
+static inline void perf_event_delayed_put(struct task_struct *task)	{ }
 static inline void perf_event_print_debug(void)				{ }
-static inline void perf_disable(void)					{ }
-static inline void perf_enable(void)					{ }
 static inline int perf_event_task_disable(void)				{ return -EINVAL; }
 static inline int perf_event_task_enable(void)				{ return -EINVAL; }
 
@@ -1056,6 +1119,7 @@ static inline int  perf_swevent_get_recursion_context(void)		{ return -1; }
 static inline void perf_swevent_put_recursion_context(int rctx)		{ }
 static inline void perf_event_enable(struct perf_event *event)		{ }
 static inline void perf_event_disable(struct perf_event *event)		{ }
+static inline void perf_event_task_tick(void)				{ }
 #endif
 
 #define perf_output_put(handle, x) \

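To make the reworked callbacks concrete: event_init claims an event for the PMU (or returns -ENOENT so the core tries the next one), add/del attach and detach it while the context is scheduled, and start/stop toggle counting, with the PERF_EF_* flags and the hw.state PERF_HES_* bits describing the handover. A condensed, purely illustrative software-style PMU showing the expected pattern (not any in-tree driver):

	static int dummy_event_init(struct perf_event *event)
	{
		if (event->attr.type != PERF_TYPE_SOFTWARE)
			return -ENOENT;		/* not ours; let the next pmu have a look */
		return 0;
	}

	static void dummy_start(struct perf_event *event, int flags)
	{
		if (flags & PERF_EF_RELOAD) {
			/* re-program the counter from event->hw.prev_count */
		}
		event->hw.state = 0;		/* counting again */
	}

	static void dummy_stop(struct perf_event *event, int flags)
	{
		event->hw.state = PERF_HES_STOPPED;
		if (flags & PERF_EF_UPDATE) {
			/* fold the hardware count into event->count, then: */
			event->hw.state |= PERF_HES_UPTODATE;
		}
	}

	static int dummy_add(struct perf_event *event, int flags)
	{
		event->hw.state = PERF_HES_STOPPED | PERF_HES_UPTODATE;
		if (flags & PERF_EF_START)
			dummy_start(event, PERF_EF_RELOAD);
		return 0;
	}

	static void dummy_del(struct perf_event *event, int flags)
	{
		dummy_stop(event, PERF_EF_UPDATE);
	}

	static void dummy_read(struct perf_event *event)
	{
		/* update event->count from the hardware */
	}

	static struct pmu dummy_pmu = {
		.task_ctx_nr	= perf_sw_context,
		.event_init	= dummy_event_init,
		.add		= dummy_add,
		.del		= dummy_del,
		.start		= dummy_start,
		.stop		= dummy_stop,
		.read		= dummy_read,
	};

	/* registered once at boot: perf_pmu_register(&dummy_pmu); */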
+ 8 - 1
include/linux/sched.h

@@ -1160,6 +1160,13 @@ struct sched_rt_entity {
 
 struct rcu_node;
 
+enum perf_event_task_context {
+	perf_invalid_context = -1,
+	perf_hw_context = 0,
+	perf_sw_context,
+	perf_nr_task_contexts,
+};
+
 struct task_struct {
 	volatile long state;	/* -1 unrunnable, 0 runnable, >0 stopped */
 	void *stack;
@@ -1433,7 +1440,7 @@ struct task_struct {
 	struct futex_pi_state *pi_state_cache;
 #endif
 #ifdef CONFIG_PERF_EVENTS
-	struct perf_event_context *perf_event_ctxp;
+	struct perf_event_context *perf_event_ctxp[perf_nr_task_contexts];
 	struct mutex perf_event_mutex;
 	struct list_head perf_event_list;
 #endif

+ 8 - 2
include/linux/stop_machine.h

@@ -126,8 +126,8 @@ int __stop_machine(int (*fn)(void *), void *data, const struct cpumask *cpus);
 
 #else	 /* CONFIG_STOP_MACHINE && CONFIG_SMP */
 
-static inline int stop_machine(int (*fn)(void *), void *data,
-			       const struct cpumask *cpus)
+static inline int __stop_machine(int (*fn)(void *), void *data,
+				 const struct cpumask *cpus)
 {
 	int ret;
 	local_irq_disable();
@@ -136,5 +136,11 @@ static inline int stop_machine(int (*fn)(void *), void *data,
 	return ret;
 }
 
+static inline int stop_machine(int (*fn)(void *), void *data,
+			       const struct cpumask *cpus)
+{
+	return __stop_machine(fn, data, cpus);
+}
+
 #endif	/* CONFIG_STOP_MACHINE && CONFIG_SMP */
 #endif	/* _LINUX_STOP_MACHINE */

+ 4 - 1
include/linux/tracepoint.h

@@ -17,6 +17,7 @@
 #include <linux/errno.h>
 #include <linux/types.h>
 #include <linux/rcupdate.h>
+#include <linux/jump_label.h>
 
 struct module;
 struct tracepoint;
@@ -145,7 +146,9 @@ static inline void tracepoint_update_probe_range(struct tracepoint *begin,
 	extern struct tracepoint __tracepoint_##name;			\
 	static inline void trace_##name(proto)				\
 	{								\
-		if (unlikely(__tracepoint_##name.state))		\
+		JUMP_LABEL(&__tracepoint_##name.state, do_trace);	\
+		return;							\
+do_trace:								\
 			__DO_TRACE(&__tracepoint_##name,		\
 				TP_PROTO(data_proto),			\
 				TP_ARGS(data_args));			\

+ 24 - 2
include/trace/events/irq.h

@@ -5,7 +5,9 @@
 #define _TRACE_IRQ_H
 
 #include <linux/tracepoint.h>
-#include <linux/interrupt.h>
+
+struct irqaction;
+struct softirq_action;
 
 #define softirq_name(sirq) { sirq##_SOFTIRQ, #sirq }
 #define show_softirq_name(val)				\
@@ -93,7 +95,10 @@ DECLARE_EVENT_CLASS(softirq,
 	),
 
 	TP_fast_assign(
-		__entry->vec = (int)(h - vec);
+		if (vec)
+			__entry->vec = (int)(h - vec);
+		else
+			__entry->vec = (int)(long)h;
 	),
 
 	TP_printk("vec=%d [action=%s]", __entry->vec,
@@ -136,6 +141,23 @@ DEFINE_EVENT(softirq, softirq_exit,
 	TP_ARGS(h, vec)
 );
 
+/**
+ * softirq_raise - called immediately when a softirq is raised
+ * @h: pointer to struct softirq_action
+ * @vec: pointer to first struct softirq_action in softirq_vec array
+ *
+ * The @h parameter carries the softirq vector number being raised, cast to a
+ * pointer; @vec is NULL, which indicates that @h holds a vector number rather
+ * than a softirq_action pointer. Used in combination with the softirq_entry
+ * tracepoint, this lets us measure the softirq raise latency.
+ */
+DEFINE_EVENT(softirq, softirq_raise,
+
+	TP_PROTO(struct softirq_action *h, struct softirq_action *vec),
+
+	TP_ARGS(h, vec)
+);
+
 #endif /*  _TRACE_IRQ_H */
 
 /* This part must be outside protection */

+ 23 - 2
include/trace/events/napi.h

@@ -6,10 +6,31 @@
 
 #include <linux/netdevice.h>
 #include <linux/tracepoint.h>
+#include <linux/ftrace.h>
+
+#define NO_DEV "(no_device)"
+
+TRACE_EVENT(napi_poll,
 
-DECLARE_TRACE(napi_poll,
 	TP_PROTO(struct napi_struct *napi),
-	TP_ARGS(napi));
+
+	TP_ARGS(napi),
+
+	TP_STRUCT__entry(
+		__field(	struct napi_struct *,	napi)
+		__string(	dev_name, napi->dev ? napi->dev->name : NO_DEV)
+	),
+
+	TP_fast_assign(
+		__entry->napi = napi;
+		__assign_str(dev_name, napi->dev ? napi->dev->name : NO_DEV);
+	),
+
+	TP_printk("napi poll on napi struct %p for device %s",
+		__entry->napi, __get_str(dev_name))
+);
+
+#undef NO_DEV
 
 #endif /* _TRACE_NAPI_H_ */
 

+ 82 - 0
include/trace/events/net.h

@@ -0,0 +1,82 @@
+#undef TRACE_SYSTEM
+#define TRACE_SYSTEM net
+
+#if !defined(_TRACE_NET_H) || defined(TRACE_HEADER_MULTI_READ)
+#define _TRACE_NET_H
+
+#include <linux/skbuff.h>
+#include <linux/netdevice.h>
+#include <linux/ip.h>
+#include <linux/tracepoint.h>
+
+TRACE_EVENT(net_dev_xmit,
+
+	TP_PROTO(struct sk_buff *skb,
+		 int rc),
+
+	TP_ARGS(skb, rc),
+
+	TP_STRUCT__entry(
+		__field(	void *,		skbaddr		)
+		__field(	unsigned int,	len		)
+		__field(	int,		rc		)
+		__string(	name,		skb->dev->name	)
+	),
+
+	TP_fast_assign(
+		__entry->skbaddr = skb;
+		__entry->len = skb->len;
+		__entry->rc = rc;
+		__assign_str(name, skb->dev->name);
+	),
+
+	TP_printk("dev=%s skbaddr=%p len=%u rc=%d",
+		__get_str(name), __entry->skbaddr, __entry->len, __entry->rc)
+);
+
+DECLARE_EVENT_CLASS(net_dev_template,
+
+	TP_PROTO(struct sk_buff *skb),
+
+	TP_ARGS(skb),
+
+	TP_STRUCT__entry(
+		__field(	void *,		skbaddr		)
+		__field(	unsigned int,	len		)
+		__string(	name,		skb->dev->name	)
+	),
+
+	TP_fast_assign(
+		__entry->skbaddr = skb;
+		__entry->len = skb->len;
+		__assign_str(name, skb->dev->name);
+	),
+
+	TP_printk("dev=%s skbaddr=%p len=%u",
+		__get_str(name), __entry->skbaddr, __entry->len)
+)
+
+DEFINE_EVENT(net_dev_template, net_dev_queue,
+
+	TP_PROTO(struct sk_buff *skb),
+
+	TP_ARGS(skb)
+);
+
+DEFINE_EVENT(net_dev_template, netif_receive_skb,
+
+	TP_PROTO(struct sk_buff *skb),
+
+	TP_ARGS(skb)
+);
+
+DEFINE_EVENT(net_dev_template, netif_rx,
+
+	TP_PROTO(struct sk_buff *skb),
+
+	TP_ARGS(skb)
+);
+#endif /* _TRACE_NET_H */
+
+/* This part must be outside protection */
+#include <trace/define_trace.h>

+ 87 - 3
include/trace/events/power.h

@@ -10,12 +10,17 @@
 #ifndef _TRACE_POWER_ENUM_
 #define _TRACE_POWER_ENUM_
 enum {
-	POWER_NONE = 0,
-	POWER_CSTATE = 1,
-	POWER_PSTATE = 2,
+	POWER_NONE	= 0,
+	POWER_CSTATE	= 1,	/* C-State */
+	POWER_PSTATE	= 2,	/* Frequency change or DVFS */
+	POWER_SSTATE	= 3,	/* Suspend */
 };
 #endif
 
+/*
+ * The power events are used for cpuidle & suspend (power_start, power_end)
+ *  and for cpufreq (power_frequency)
+ */
 DECLARE_EVENT_CLASS(power,
 
 	TP_PROTO(unsigned int type, unsigned int state, unsigned int cpu_id),
@@ -70,6 +75,85 @@ TRACE_EVENT(power_end,
 
 );
 
+/*
+ * The clock events are used for clock enable/disable and for
+ *  clock rate change
+ */
+DECLARE_EVENT_CLASS(clock,
+
+	TP_PROTO(const char *name, unsigned int state, unsigned int cpu_id),
+
+	TP_ARGS(name, state, cpu_id),
+
+	TP_STRUCT__entry(
+		__string(       name,           name            )
+		__field(        u64,            state           )
+		__field(        u64,            cpu_id          )
+	),
+
+	TP_fast_assign(
+		__assign_str(name, name);
+		__entry->state = state;
+		__entry->cpu_id = cpu_id;
+	),
+
+	TP_printk("%s state=%lu cpu_id=%lu", __get_str(name),
+		(unsigned long)__entry->state, (unsigned long)__entry->cpu_id)
+);
+
+DEFINE_EVENT(clock, clock_enable,
+
+	TP_PROTO(const char *name, unsigned int state, unsigned int cpu_id),
+
+	TP_ARGS(name, state, cpu_id)
+);
+
+DEFINE_EVENT(clock, clock_disable,
+
+	TP_PROTO(const char *name, unsigned int state, unsigned int cpu_id),
+
+	TP_ARGS(name, state, cpu_id)
+);
+
+DEFINE_EVENT(clock, clock_set_rate,
+
+	TP_PROTO(const char *name, unsigned int state, unsigned int cpu_id),
+
+	TP_ARGS(name, state, cpu_id)
+);
+
+/*
+ * The power domain events are used for power domains transitions
+ */
+DECLARE_EVENT_CLASS(power_domain,
+
+	TP_PROTO(const char *name, unsigned int state, unsigned int cpu_id),
+
+	TP_ARGS(name, state, cpu_id),
+
+	TP_STRUCT__entry(
+		__string(       name,           name            )
+		__field(        u64,            state           )
+		__field(        u64,            cpu_id          )
+	),
+
+	TP_fast_assign(
+		__assign_str(name, name);
+		__entry->state = state;
+		__entry->cpu_id = cpu_id;
+),
+
+	TP_printk("%s state=%lu cpu_id=%lu", __get_str(name),
+		(unsigned long)__entry->state, (unsigned long)__entry->cpu_id)
+);
+
+DEFINE_EVENT(power_domain, power_domain_target,
+
+	TP_PROTO(const char *name, unsigned int state, unsigned int cpu_id),
+
+	TP_ARGS(name, state, cpu_id)
+);
+
 #endif /* _TRACE_POWER_H */
 
 /* This part must be outside protection */

+ 17 - 0
include/trace/events/skb.h

@@ -35,6 +35,23 @@ TRACE_EVENT(kfree_skb,
 		__entry->skbaddr, __entry->protocol, __entry->location)
 );
 
+TRACE_EVENT(consume_skb,
+
+	TP_PROTO(struct sk_buff *skb),
+
+	TP_ARGS(skb),
+
+	TP_STRUCT__entry(
+		__field(	void *,	skbaddr	)
+	),
+
+	TP_fast_assign(
+		__entry->skbaddr = skb;
+	),
+
+	TP_printk("skbaddr=%p", __entry->skbaddr)
+);
+
 TRACE_EVENT(skb_copy_datagram_iovec,
 
 	TP_PROTO(const struct sk_buff *skb, int len),

+ 8 - 0
init/Kconfig

@@ -21,6 +21,13 @@ config CONSTRUCTORS
 	depends on !UML
 	default y
 
+config HAVE_IRQ_WORK
+	bool
+
+config IRQ_WORK
+	bool
+	depends on HAVE_IRQ_WORK
+
 menu "General setup"
 
 config EXPERIMENTAL
@@ -1005,6 +1012,7 @@ config PERF_EVENTS
 	default y if (PROFILING || PERF_COUNTERS)
 	depends on HAVE_PERF_EVENTS
 	select ANON_INODES
+	select IRQ_WORK
 	help
 	  Enable kernel support for various performance events provided
 	  by software and hardware.

+ 3 - 1
kernel/Makefile

@@ -10,7 +10,7 @@ obj-y     = sched.o fork.o exec_domain.o panic.o printk.o \
 	    kthread.o wait.o kfifo.o sys_ni.o posix-cpu-timers.o mutex.o \
 	    hrtimer.o rwsem.o nsproxy.o srcu.o semaphore.o \
 	    notifier.o ksysfs.o pm_qos_params.o sched_clock.o cred.o \
-	    async.o range.o
+	    async.o range.o jump_label.o
 obj-$(CONFIG_HAVE_EARLY_RES) += early_res.o
 obj-y += groups.o
 
@@ -23,6 +23,7 @@ CFLAGS_REMOVE_rtmutex-debug.o = -pg
 CFLAGS_REMOVE_cgroup-debug.o = -pg
 CFLAGS_REMOVE_sched_clock.o = -pg
 CFLAGS_REMOVE_perf_event.o = -pg
+CFLAGS_REMOVE_irq_work.o = -pg
 endif
 
 obj-$(CONFIG_FREEZER) += freezer.o
@@ -101,6 +102,7 @@ obj-$(CONFIG_TRACING) += trace/
 obj-$(CONFIG_X86_DS) += trace/
 obj-$(CONFIG_RING_BUFFER) += trace/
 obj-$(CONFIG_SMP) += sched_cpupri.o
+obj-$(CONFIG_IRQ_WORK) += irq_work.o
 obj-$(CONFIG_PERF_EVENTS) += perf_event.o
 obj-$(CONFIG_HAVE_HW_BREAKPOINT) += hw_breakpoint.o
 obj-$(CONFIG_USER_RETURN_NOTIFIER) += user-return-notifier.o

+ 1 - 3
kernel/exit.c

@@ -149,9 +149,7 @@ static void delayed_put_task_struct(struct rcu_head *rhp)
 {
 	struct task_struct *tsk = container_of(rhp, struct task_struct, rcu);
 
-#ifdef CONFIG_PERF_EVENTS
-	WARN_ON_ONCE(tsk->perf_event_ctxp);
-#endif
+	perf_event_delayed_put(tsk);
 	trace_sched_process_free(tsk);
 	put_task_struct(tsk);
 }

+ 63 - 12
kernel/hw_breakpoint.c

@@ -113,12 +113,12 @@ static unsigned int max_task_bp_pinned(int cpu, enum bp_type_idx type)
  */
 static int task_bp_pinned(struct perf_event *bp, enum bp_type_idx type)
 {
-	struct perf_event_context *ctx = bp->ctx;
+	struct task_struct *tsk = bp->hw.bp_target;
 	struct perf_event *iter;
 	int count = 0;
 
 	list_for_each_entry(iter, &bp_task_head, hw.bp_list) {
-		if (iter->ctx == ctx && find_slot_idx(iter) == type)
+		if (iter->hw.bp_target == tsk && find_slot_idx(iter) == type)
 			count += hw_breakpoint_weight(iter);
 	}
 
@@ -134,7 +134,7 @@ fetch_bp_busy_slots(struct bp_busy_slots *slots, struct perf_event *bp,
 		    enum bp_type_idx type)
 {
 	int cpu = bp->cpu;
-	struct task_struct *tsk = bp->ctx->task;
+	struct task_struct *tsk = bp->hw.bp_target;
 
 	if (cpu >= 0) {
 		slots->pinned = per_cpu(nr_cpu_bp_pinned[type], cpu);
@@ -213,7 +213,7 @@ toggle_bp_slot(struct perf_event *bp, bool enable, enum bp_type_idx type,
 	       int weight)
 {
 	int cpu = bp->cpu;
-	struct task_struct *tsk = bp->ctx->task;
+	struct task_struct *tsk = bp->hw.bp_target;
 
 	/* Pinned counter cpu profiling */
 	if (!tsk) {
@@ -433,8 +433,7 @@ register_user_hw_breakpoint(struct perf_event_attr *attr,
 			    perf_overflow_handler_t triggered,
 			    struct task_struct *tsk)
 {
-	return perf_event_create_kernel_counter(attr, -1, task_pid_vnr(tsk),
-						triggered);
+	return perf_event_create_kernel_counter(attr, -1, tsk, triggered);
 }
 EXPORT_SYMBOL_GPL(register_user_hw_breakpoint);
 
@@ -516,7 +515,7 @@ register_wide_hw_breakpoint(struct perf_event_attr *attr,
 	get_online_cpus();
 	for_each_online_cpu(cpu) {
 		pevent = per_cpu_ptr(cpu_events, cpu);
-		bp = perf_event_create_kernel_counter(attr, cpu, -1, triggered);
+		bp = perf_event_create_kernel_counter(attr, cpu, NULL, triggered);
 
 		*pevent = bp;
 
@@ -566,6 +565,61 @@ static struct notifier_block hw_breakpoint_exceptions_nb = {
 	.priority = 0x7fffffff
 };
 
+static void bp_perf_event_destroy(struct perf_event *event)
+{
+	release_bp_slot(event);
+}
+
+static int hw_breakpoint_event_init(struct perf_event *bp)
+{
+	int err;
+
+	if (bp->attr.type != PERF_TYPE_BREAKPOINT)
+		return -ENOENT;
+
+	err = register_perf_hw_breakpoint(bp);
+	if (err)
+		return err;
+
+	bp->destroy = bp_perf_event_destroy;
+
+	return 0;
+}
+
+static int hw_breakpoint_add(struct perf_event *bp, int flags)
+{
+	if (!(flags & PERF_EF_START))
+		bp->hw.state = PERF_HES_STOPPED;
+
+	return arch_install_hw_breakpoint(bp);
+}
+
+static void hw_breakpoint_del(struct perf_event *bp, int flags)
+{
+	arch_uninstall_hw_breakpoint(bp);
+}
+
+static void hw_breakpoint_start(struct perf_event *bp, int flags)
+{
+	bp->hw.state = 0;
+}
+
+static void hw_breakpoint_stop(struct perf_event *bp, int flags)
+{
+	bp->hw.state = PERF_HES_STOPPED;
+}
+
+static struct pmu perf_breakpoint = {
+	.task_ctx_nr	= perf_sw_context, /* could eventually get its own */
+
+	.event_init	= hw_breakpoint_event_init,
+	.add		= hw_breakpoint_add,
+	.del		= hw_breakpoint_del,
+	.start		= hw_breakpoint_start,
+	.stop		= hw_breakpoint_stop,
+	.read		= hw_breakpoint_pmu_read,
+};
+
 static int __init init_hw_breakpoint(void)
 {
 	unsigned int **task_bp_pinned;
@@ -587,6 +641,8 @@ static int __init init_hw_breakpoint(void)
 
 	constraints_initialized = 1;
 
+	perf_pmu_register(&perf_breakpoint);
+
 	return register_die_notifier(&hw_breakpoint_exceptions_nb);
 
  err_alloc:
@@ -602,8 +658,3 @@ static int __init init_hw_breakpoint(void)
 core_initcall(init_hw_breakpoint);
 
 
-struct pmu perf_ops_bp = {
-	.enable		= arch_install_hw_breakpoint,
-	.disable	= arch_uninstall_hw_breakpoint,
-	.read		= hw_breakpoint_pmu_read,
-};

+ 164 - 0
kernel/irq_work.c

@@ -0,0 +1,164 @@
+/*
+ * Copyright (C) 2010 Red Hat, Inc., Peter Zijlstra <pzijlstr@redhat.com>
+ *
+ * Provides a framework for enqueueing and running callbacks from hardirq
+ * context. The enqueueing is NMI-safe.
+ */
+
+#include <linux/kernel.h>
+#include <linux/module.h>
+#include <linux/irq_work.h>
+#include <linux/hardirq.h>
+
+/*
+ * An entry can be in one of four states:
+ *
+ * free	     NULL, 0 -> {claimed}       : free to be used
+ * claimed   NULL, 3 -> {pending}       : claimed to be enqueued
+ * pending   next, 3 -> {busy}          : queued, pending callback
+ * busy      NULL, 2 -> {free, claimed} : callback in progress, can be claimed
+ *
+ * We use the lower two bits of the next pointer to keep PENDING and BUSY
+ * flags.
+ */
+
+#define IRQ_WORK_PENDING	1UL
+#define IRQ_WORK_BUSY		2UL
+#define IRQ_WORK_FLAGS		3UL
+
+static inline bool irq_work_is_set(struct irq_work *entry, int flags)
+{
+	return (unsigned long)entry->next & flags;
+}
+
+static inline struct irq_work *irq_work_next(struct irq_work *entry)
+{
+	unsigned long next = (unsigned long)entry->next;
+	next &= ~IRQ_WORK_FLAGS;
+	return (struct irq_work *)next;
+}
+
+static inline struct irq_work *next_flags(struct irq_work *entry, int flags)
+{
+	unsigned long next = (unsigned long)entry;
+	next |= flags;
+	return (struct irq_work *)next;
+}
+
+static DEFINE_PER_CPU(struct irq_work *, irq_work_list);
+
+/*
+ * Claim the entry so that no one else will poke at it.
+ */
+static bool irq_work_claim(struct irq_work *entry)
+{
+	struct irq_work *next, *nflags;
+
+	do {
+		next = entry->next;
+		if ((unsigned long)next & IRQ_WORK_PENDING)
+			return false;
+		nflags = next_flags(next, IRQ_WORK_FLAGS);
+	} while (cmpxchg(&entry->next, next, nflags) != next);
+
+	return true;
+}
+
+
+void __weak arch_irq_work_raise(void)
+{
+	/*
+	 * Lame architectures will get the timer tick callback
+	 */
+}
+
+/*
+ * Queue the entry and raise the IPI if needed.
+ */
+static void __irq_work_queue(struct irq_work *entry)
+{
+	struct irq_work **head, *next;
+
+	head = &get_cpu_var(irq_work_list);
+
+	do {
+		next = *head;
+		/* Can assign non-atomic because we keep the flags set. */
+		entry->next = next_flags(next, IRQ_WORK_FLAGS);
+	} while (cmpxchg(head, next, entry) != next);
+
+	/* The list was empty, raise self-interrupt to start processing. */
+	if (!irq_work_next(entry))
+		arch_irq_work_raise();
+
+	put_cpu_var(irq_work_list);
+}
+
+/*
+ * Enqueue the irq_work @entry, returns true on success, failure when the
+ * @entry was already enqueued by someone else.
+ *
+ * Can be re-enqueued while the callback is still in progress.
+ */
+bool irq_work_queue(struct irq_work *entry)
+{
+	if (!irq_work_claim(entry)) {
+		/*
+		 * Already enqueued, can't do!
+		 */
+		return false;
+	}
+
+	__irq_work_queue(entry);
+	return true;
+}
+EXPORT_SYMBOL_GPL(irq_work_queue);
+
+/*
+ * Run the irq_work entries on this cpu. Must be run from hardirq
+ * context with local IRQs disabled.
+ */
+void irq_work_run(void)
+{
+	struct irq_work *list, **head;
+
+	head = &__get_cpu_var(irq_work_list);
+	if (*head == NULL)
+		return;
+
+	BUG_ON(!in_irq());
+	BUG_ON(!irqs_disabled());
+
+	list = xchg(head, NULL);
+	while (list != NULL) {
+		struct irq_work *entry = list;
+
+		list = irq_work_next(list);
+
+		/*
+		 * Clear the PENDING bit, after this point the @entry
+		 * can be re-used.
+		 */
+		entry->next = next_flags(NULL, IRQ_WORK_BUSY);
+		entry->func(entry);
+		/*
+		 * Clear the BUSY bit and return to the free state if
+		 * no-one else claimed it meanwhile.
+		 */
+		cmpxchg(&entry->next, next_flags(NULL, IRQ_WORK_BUSY), NULL);
+	}
+}
+EXPORT_SYMBOL_GPL(irq_work_run);
+
+/*
+ * Synchronize against the irq_work @entry, ensures the entry is not
+ * currently in use.
+ */
+void irq_work_sync(struct irq_work *entry)
+{
+	WARN_ON_ONCE(irqs_disabled());
+
+	while (irq_work_is_set(entry, IRQ_WORK_BUSY))
+		cpu_relax();
+}
+EXPORT_SYMBOL_GPL(irq_work_sync);

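An architecture opts in by selecting HAVE_IRQ_WORK, overriding the weak arch_irq_work_raise() above (the default simply waits for the next timer tick) and calling irq_work_run() from the resulting interrupt; the x86 hookup elsewhere in this merge does this with an APIC self-IPI. A bare-bones, hypothetical sketch of that arch side:

	/* arch code: kick a self-interrupt whose handler will drain the queue */
	void arch_irq_work_raise(void)
	{
		/* platform specific, e.g. send a self-IPI on a dedicated vector */
	}

	/* handler for that interrupt, entered in hardirq context with IRQs off */
	void my_irq_work_vector_handler(void)
	{
		/* ack the interrupt controller, then: */
		irq_work_run();
	}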
Not all files are shown because too many files were changed in this diff