
Merge branch 'perf-core-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip

* 'perf-core-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip: (39 commits)
  perf tools: Fix compile error on x86_64 Ubuntu
  perf report: Fix --stdio output alignment when --showcpuutilization used
  perf annotate: Get rid of field_sep check
  perf annotate: Fix usage string
  perf kmem: Fix a memory leak
  perf kmem: Add missing closedir() calls
  perf top: Add error message for EMFILE
  perf test: Change type of '-v' option to INCR
  perf script: Add missing closedir() calls
  tracing: Fix compile error when static ftrace is enabled
  recordmcount: Fix handling of elf64 big-endian objects.
  perf tools: Add const.h to MANIFEST to make perf-tar-src-pkg work again
  perf tools: Add support for guest/host-only profiling
  perf kvm: Do guest-only counting by default
  perf top: Don't update total_period on process_sample
  perf hists: Stop using 'self' for struct hist_entry
  perf hists: Rename total_session to total_period
  x86: Add counter when debug stack is used with interrupts enabled
  x86: Allow NMIs to hit breakpoints in i386
  x86: Keep current stack in NMI breakpoints
  ...
Linus Torvalds 13 years ago
parent
commit
83c2f912b4

+ 8 - 0
Documentation/kernel-parameters.txt

@@ -2475,6 +2475,14 @@ bytes respectively. Such letter suffixes can also be entirely omitted.
 	stacktrace	[FTRACE]
 			Enables the stack tracer on boot up.
 
+	stacktrace_filter=[function-list]
+			[FTRACE] Limit the functions that the stack tracer
+			will trace at boot up. function-list is a comma-separated
+			list of functions. This list can be changed at run
+			time via the stack_trace_filter file in the debugfs
+			tracing directory. Note that this enables stack tracing
+			and the stacktrace parameter above is not needed.
+
 	sti=		[PARISC,HW]
 			Format: <num>
 			Set the STI (builtin display/keyboard on the HP-PARISC

+ 22 - 0
arch/x86/include/asm/debugreg.h

@@ -101,6 +101,28 @@ extern void aout_dump_debugregs(struct user *dump);
 
 extern void hw_breakpoint_restore(void);
 
+#ifdef CONFIG_X86_64
+DECLARE_PER_CPU(int, debug_stack_usage);
+static inline void debug_stack_usage_inc(void)
+{
+	__get_cpu_var(debug_stack_usage)++;
+}
+static inline void debug_stack_usage_dec(void)
+{
+	__get_cpu_var(debug_stack_usage)--;
+}
+int is_debug_stack(unsigned long addr);
+void debug_stack_set_zero(void);
+void debug_stack_reset(void);
+#else /* !X86_64 */
+static inline int is_debug_stack(unsigned long addr) { return 0; }
+static inline void debug_stack_set_zero(void) { }
+static inline void debug_stack_reset(void) { }
+static inline void debug_stack_usage_inc(void) { }
+static inline void debug_stack_usage_dec(void) { }
+#endif /* X86_64 */
+
+
 #endif	/* __KERNEL__ */
 
 #endif /* _ASM_X86_DEBUGREG_H */

+ 12 - 0
arch/x86/include/asm/desc.h

@@ -35,6 +35,8 @@ static inline void fill_ldt(struct desc_struct *desc, const struct user_desc *in
 
 extern struct desc_ptr idt_descr;
 extern gate_desc idt_table[];
+extern struct desc_ptr nmi_idt_descr;
+extern gate_desc nmi_idt_table[];
 
 struct gdt_page {
 	struct desc_struct gdt[GDT_ENTRIES];
@@ -307,6 +309,16 @@ static inline void set_desc_limit(struct desc_struct *desc, unsigned long limit)
 	desc->limit = (limit >> 16) & 0xf;
 }
 
+#ifdef CONFIG_X86_64
+static inline void set_nmi_gate(int gate, void *addr)
+{
+	gate_desc s;
+
+	pack_gate(&s, GATE_INTERRUPT, (unsigned long)addr, 0, 0, __KERNEL_CS);
+	write_idt_entry(nmi_idt_table, gate, &s);
+}
+#endif
+
 static inline void _set_gate(int gate, unsigned type, void *addr,
 			     unsigned dpl, unsigned ist, unsigned seg)
 {

+ 24 - 0
arch/x86/kernel/cpu/common.c

@@ -1021,6 +1021,8 @@ __setup("clearcpuid=", setup_disablecpuid);
 
 #ifdef CONFIG_X86_64
 struct desc_ptr idt_descr = { NR_VECTORS * 16 - 1, (unsigned long) idt_table };
+struct desc_ptr nmi_idt_descr = { NR_VECTORS * 16 - 1,
+				    (unsigned long) nmi_idt_table };
 
 DEFINE_PER_CPU_FIRST(union irq_stack_union,
 		     irq_stack_union) __aligned(PAGE_SIZE);
@@ -1085,6 +1087,26 @@ unsigned long kernel_eflags;
  */
 DEFINE_PER_CPU(struct orig_ist, orig_ist);
 
+static DEFINE_PER_CPU(unsigned long, debug_stack_addr);
+DEFINE_PER_CPU(int, debug_stack_usage);
+
+int is_debug_stack(unsigned long addr)
+{
+	return __get_cpu_var(debug_stack_usage) ||
+		(addr <= __get_cpu_var(debug_stack_addr) &&
+		 addr > (__get_cpu_var(debug_stack_addr) - DEBUG_STKSZ));
+}
+
+void debug_stack_set_zero(void)
+{
+	load_idt((const struct desc_ptr *)&nmi_idt_descr);
+}
+
+void debug_stack_reset(void)
+{
+	load_idt((const struct desc_ptr *)&idt_descr);
+}
+
 #else	/* CONFIG_X86_64 */
 
 DEFINE_PER_CPU(struct task_struct *, current_task) = &init_task;
@@ -1212,6 +1234,8 @@ void __cpuinit cpu_init(void)
 			estacks += exception_stack_sizes[v];
 			oist->ist[v] = t->x86_tss.ist[v] =
 					(unsigned long)estacks;
+			if (v == DEBUG_STACK-1)
+				per_cpu(debug_stack_addr, cpu) = (unsigned long)estacks;
 		}
 	}
 

+ 185 - 33
arch/x86/kernel/entry_64.S

@@ -1480,62 +1480,214 @@ ENTRY(error_exit)
 	CFI_ENDPROC
 END(error_exit)
 
+/*
+ * Test if a given stack is an NMI stack or not.
+ */
+	.macro test_in_nmi reg stack nmi_ret normal_ret
+	cmpq %\reg, \stack
+	ja \normal_ret
+	subq $EXCEPTION_STKSZ, %\reg
+	cmpq %\reg, \stack
+	jb \normal_ret
+	jmp \nmi_ret
+	.endm
 
 	/* runs on exception stack */
 ENTRY(nmi)
 	INTR_FRAME
 	PARAVIRT_ADJUST_EXCEPTION_FRAME
-	pushq_cfi $-1
+	/*
+	 * We allow breakpoints in NMIs. If a breakpoint occurs, then
+	 * the iretq it performs will take us out of NMI context.
+	 * This means that we can have nested NMIs where the next
+	 * NMI is using the top of the stack of the previous NMI. We
+	 * can't let it execute because the nested NMI will corrupt the
+	 * stack of the previous NMI. NMI handlers are not re-entrant
+	 * anyway.
+	 *
+	 * To handle this case we do the following:
+	 *  Check a special location on the stack that contains
+	 *  a variable that is set when NMIs are executing.
+	 *  The interrupted task's stack is also checked to see if it
+	 *  is an NMI stack.
+	 *  If the variable is not set and the stack is not the NMI
+	 *  stack then:
+	 *    o Set the special variable on the stack
+	 *    o Copy the interrupt frame into a "saved" location on the stack
+	 *    o Copy the interrupt frame into a "copy" location on the stack
+	 *    o Continue processing the NMI
+	 *  If the variable is set or the previous stack is the NMI stack:
+	 *    o Modify the "copy" location to jump to repeat_nmi
+	 *    o Return to the first NMI
+	 *
+	 * Now on exit of the first NMI, we first clear the stack variable.
+	 * The NMI stack will tell any nested NMIs at that point that it is
+	 * nested. Then we pop the stack normally with iret, and if there was
+	 * a nested NMI that updated the copy interrupt stack frame, a
+	 * jump will be made to the repeat_nmi code that will handle the second
+	 * NMI.
+	 */
+
+	/* Use %rdx as our temp variable throughout */
+	pushq_cfi %rdx
+
+	/*
+	 * Check the special variable on the stack to see if NMIs are
+	 * executing.
+	 */
+	cmp $1, -8(%rsp)
+	je nested_nmi
+
+	/*
+	 * Now test if the previous stack was an NMI stack.
+	 * We need the double check. We check the NMI stack to handle the
+	 * race where the first NMI clears the variable before returning.
+	 * We check the variable because the first NMI could be in a
+	 * breakpoint routine using a breakpoint stack.
+	 */
+	lea 6*8(%rsp), %rdx
+	test_in_nmi rdx, 4*8(%rsp), nested_nmi, first_nmi
+
+nested_nmi:
+	/*
+	 * Do nothing if we interrupted the fixup in repeat_nmi.
+	 * It's about to repeat the NMI handler, so we are fine
+	 * with ignoring this one.
+	 */
+	movq $repeat_nmi, %rdx
+	cmpq 8(%rsp), %rdx
+	ja 1f
+	movq $end_repeat_nmi, %rdx
+	cmpq 8(%rsp), %rdx
+	ja nested_nmi_out
+
+1:
+	/* Set up the interrupted NMI's stack to jump to repeat_nmi */
+	leaq -6*8(%rsp), %rdx
+	movq %rdx, %rsp
+	CFI_ADJUST_CFA_OFFSET 6*8
+	pushq_cfi $__KERNEL_DS
+	pushq_cfi %rdx
+	pushfq_cfi
+	pushq_cfi $__KERNEL_CS
+	pushq_cfi $repeat_nmi
+
+	/* Put stack back */
+	addq $(11*8), %rsp
+	CFI_ADJUST_CFA_OFFSET -11*8
+
+nested_nmi_out:
+	popq_cfi %rdx
+
+	/* No need to check faults here */
+	INTERRUPT_RETURN
+
+first_nmi:
+	/*
+	 * Because nested NMIs will use the pushed location that we
+	 * stored in rdx, we must keep that space available.
+	 * Here's what our stack frame will look like:
+	 * +-------------------------+
+	 * | original SS             |
+	 * | original Return RSP     |
+	 * | original RFLAGS         |
+	 * | original CS             |
+	 * | original RIP            |
+	 * +-------------------------+
+	 * | temp storage for rdx    |
+	 * +-------------------------+
+	 * | NMI executing variable  |
+	 * +-------------------------+
+	 * | Saved SS                |
+	 * | Saved Return RSP        |
+	 * | Saved RFLAGS            |
+	 * | Saved CS                |
+	 * | Saved RIP               |
+	 * +-------------------------+
+	 * | copied SS               |
+	 * | copied Return RSP       |
+	 * | copied RFLAGS           |
+	 * | copied CS               |
+	 * | copied RIP              |
+	 * +-------------------------+
+	 * | pt_regs                 |
+	 * +-------------------------+
+	 *
+	 * The saved RIP is used to fix up the copied RIP that a nested
+	 * NMI may zero out. The original stack frame and the temp storage
+	 * are also used by nested NMIs and cannot be trusted on exit.
+	 */
+	/* Set the NMI executing variable on the stack. */
+	pushq_cfi $1
+
+	/* Copy the stack frame to the Saved frame */
+	.rept 5
+	pushq_cfi 6*8(%rsp)
+	.endr
+
+	/* Make another copy, this one may be modified by nested NMIs */
+	.rept 5
+	pushq_cfi 4*8(%rsp)
+	.endr
+
+	/* Do not pop rdx, nested NMIs will corrupt it */
+	movq 11*8(%rsp), %rdx
+
+	/*
+	 * Everything below this point can be preempted by a nested
+	 * NMI if the first NMI took an exception. Repeated NMIs
+	 * caused by an exception and nested NMI will start here, and
+	 * can still be preempted by another NMI.
+	 */
+restart_nmi:
+	pushq_cfi $-1		/* ORIG_RAX: no syscall to restart */
 	subq $ORIG_RAX-R15, %rsp
 	CFI_ADJUST_CFA_OFFSET ORIG_RAX-R15
+	/*
+	 * Use save_paranoid to handle SWAPGS, but no need to use paranoid_exit
+	 * as we should not be calling schedule in NMI context, even
+	 * with normal interrupts enabled. An NMI should not be
+	 * setting NEED_RESCHED or anything else that normal interrupts
+	 * and exceptions might do.
+	 */
 	call save_paranoid
 	DEFAULT_FRAME 0
 	/* paranoidentry do_nmi, 0; without TRACE_IRQS_OFF */
 	movq %rsp,%rdi
 	movq $-1,%rsi
 	call do_nmi
-#ifdef CONFIG_TRACE_IRQFLAGS
-	/* paranoidexit; without TRACE_IRQS_OFF */
-	/* ebx:	no swapgs flag */
-	DISABLE_INTERRUPTS(CLBR_NONE)
 	testl %ebx,%ebx				/* swapgs needed? */
 	jnz nmi_restore
-	testl $3,CS(%rsp)
-	jnz nmi_userspace
 nmi_swapgs:
 	SWAPGS_UNSAFE_STACK
 nmi_restore:
 	RESTORE_ALL 8
+	/* Clear the NMI executing stack variable */
+	movq $0, 10*8(%rsp)
 	jmp irq_return
-nmi_userspace:
-	GET_THREAD_INFO(%rcx)
-	movl TI_flags(%rcx),%ebx
-	andl $_TIF_WORK_MASK,%ebx
-	jz nmi_swapgs
-	movq %rsp,%rdi			/* &pt_regs */
-	call sync_regs
-	movq %rax,%rsp			/* switch stack for scheduling */
-	testl $_TIF_NEED_RESCHED,%ebx
-	jnz nmi_schedule
-	movl %ebx,%edx			/* arg3: thread flags */
-	ENABLE_INTERRUPTS(CLBR_NONE)
-	xorl %esi,%esi 			/* arg2: oldset */
-	movq %rsp,%rdi 			/* arg1: &pt_regs */
-	call do_notify_resume
-	DISABLE_INTERRUPTS(CLBR_NONE)
-	jmp nmi_userspace
-nmi_schedule:
-	ENABLE_INTERRUPTS(CLBR_ANY)
-	call schedule
-	DISABLE_INTERRUPTS(CLBR_ANY)
-	jmp nmi_userspace
-	CFI_ENDPROC
-#else
-	jmp paranoid_exit
 	CFI_ENDPROC
-#endif
 END(nmi)
 
+	/*
+	 * If an NMI hit an iret because of an exception or breakpoint,
+	 * it can lose its NMI context, and a nested NMI may come in.
+	 * In that case, the nested NMI will change the preempted NMI's
+	 * stack to jump to here when it does the final iret.
+	 */
+repeat_nmi:
+	INTR_FRAME
+	/* Update the stack variable to say we are still in NMI */
+	movq $1, 5*8(%rsp)
+
+	/* copy the saved stack back to copy stack */
+	.rept 5
+	pushq_cfi 4*8(%rsp)
+	.endr
+
+	jmp restart_nmi
+	CFI_ENDPROC
+end_repeat_nmi:
+
 ENTRY(ignore_sysret)
 	CFI_STARTPROC
 	mov $-ENOSYS,%eax

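The nested-NMI logic above is dense in assembly, so here is a hedged, userspace-only C sketch of the "is this NMI nested?" decision made on entry. The constants, addresses, and helper names are illustrative rather than kernel symbols; the range check mirrors the test_in_nmi macro and the is_debug_stack() helper added in common.c above.

/*
 * Illustrative userspace sketch (not kernel code) of the nesting test
 * made at the top of ENTRY(nmi): an incoming NMI is treated as nested
 * if the on-stack "NMI executing" variable is set, or if the
 * interrupted stack pointer lies within the NMI stack.
 * EXCEPTION_STKSZ and all addresses here are made-up values.
 */
#include <stdbool.h>
#include <stdio.h>

#define EXCEPTION_STKSZ 4096UL

/* Is sp within [stack_top - EXCEPTION_STKSZ, stack_top]? */
static bool in_nmi_stack(unsigned long sp, unsigned long nmi_stack_top)
{
	return sp <= nmi_stack_top && sp >= nmi_stack_top - EXCEPTION_STKSZ;
}

static bool nmi_is_nested(int nmi_executing, unsigned long interrupted_sp,
			  unsigned long nmi_stack_top)
{
	/*
	 * Both checks are needed: the variable covers the case where the
	 * first NMI is off on a breakpoint stack, the stack check covers
	 * the window after the first NMI has cleared the variable.
	 */
	return nmi_executing || in_nmi_stack(interrupted_sp, nmi_stack_top);
}

int main(void)
{
	unsigned long top = 0x10000;

	printf("%d\n", nmi_is_nested(0, 0xf800, top));  /* 1: on the NMI stack */
	printf("%d\n", nmi_is_nested(1, 0x20000, top)); /* 1: variable set */
	printf("%d\n", nmi_is_nested(0, 0x20000, top)); /* 0: first NMI */
	return 0;
}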
+ 4 - 0
arch/x86/kernel/head_64.S

@@ -417,6 +417,10 @@ ENTRY(phys_base)
 ENTRY(idt_table)
 	.skip IDT_ENTRIES * 16
 
+	.align L1_CACHE_BYTES
+ENTRY(nmi_idt_table)
+	.skip IDT_ENTRIES * 16
+
 	__PAGE_ALIGNED_BSS
 	.align PAGE_SIZE
 ENTRY(empty_zero_page)

+ 102 - 0
arch/x86/kernel/nmi.c

@@ -405,9 +405,108 @@ static notrace __kprobes void default_do_nmi(struct pt_regs *regs)
 		unknown_nmi_error(reason, regs);
 }
 
+/*
+ * An NMI can hit a breakpoint, which will cause it to lose its
+ * NMI context with the CPU when the breakpoint does an iret.
+ */
+#ifdef CONFIG_X86_32
+/*
+ * For i386, NMIs use the same stack as the kernel, and we can
+ * add a workaround to the iret problem in C. Simply have 3 states
+ * the NMI can be in.
+ *
+ *  1) not running
+ *  2) executing
+ *  3) latched
+ *
+ * When no NMI is in progress, it is in the "not running" state.
+ * When an NMI comes in, it goes into the "executing" state.
+ * Normally, if another NMI is triggered, it does not interrupt
+ * the running NMI and the HW will simply latch it so that when
+ * the first NMI finishes, it will restart the second NMI.
+ * (Note, the latch is binary; any further NMIs that trigger while
+ *  one is running are ignored, and only one NMI is restarted.)
+ *
+ * If an NMI hits a breakpoint that executes an iret, another
+ * NMI can preempt it. We do not want to allow this new NMI
+ * to run, but we want to execute it when the first one finishes.
+ * We set the state to "latched", and the first NMI will perform
+ * a cmpxchg on the state, and if it doesn't successfully
+ * reset the state to "not running" it will restart the next
+ * NMI.
+ */
+enum nmi_states {
+	NMI_NOT_RUNNING,
+	NMI_EXECUTING,
+	NMI_LATCHED,
+};
+static DEFINE_PER_CPU(enum nmi_states, nmi_state);
+
+#define nmi_nesting_preprocess(regs)					\
+	do {								\
+		if (__get_cpu_var(nmi_state) != NMI_NOT_RUNNING) {	\
+			__get_cpu_var(nmi_state) = NMI_LATCHED;		\
+			return;						\
+		}							\
+	nmi_restart:							\
+		__get_cpu_var(nmi_state) = NMI_EXECUTING;		\
+	} while (0)
+
+#define nmi_nesting_postprocess()					\
+	do {								\
+		if (cmpxchg(&__get_cpu_var(nmi_state),			\
+		    NMI_EXECUTING, NMI_NOT_RUNNING) != NMI_EXECUTING)	\
+			goto nmi_restart;				\
+	} while (0)
+#else /* x86_64 */
+/*
+ * In x86_64 things are a bit more difficult. This has the same problem
+ * where an NMI hitting a breakpoint that calls iret will remove the
+ * NMI context, allowing a nested NMI to enter. What makes this more
+ * difficult is that both NMIs and breakpoints have their own stack.
+ * When a new NMI or breakpoint is executed, the stack is set to a fixed
+ * point. If an NMI is nested, it will have its stack set at that same
+ * fixed address that the first NMI had, and will start corrupting the
+ * stack. This is handled in entry_64.S, but the same problem exists with
+ * the breakpoint stack.
+ *
+ * If a breakpoint is being processed and the debug stack is in use,
+ * and an NMI comes in that also hits a breakpoint, the stack pointer
+ * will be set to the same fixed address as the breakpoint that was
+ * interrupted, corrupting that stack. To handle this case,
+ * check if the stack that was interrupted is the debug stack, and if
+ * so, change the IDT so that new breakpoints will use the current stack
+ * and not switch to the fixed address. On return of the NMI, switch back
+ * to the original IDT.
+ */
+static DEFINE_PER_CPU(int, update_debug_stack);
+
+static inline void nmi_nesting_preprocess(struct pt_regs *regs)
+{
+	/*
+	 * If we interrupted a breakpoint, it is possible that
+	 * the nmi handler will have breakpoints too. We need to
+	 * change the IDT such that breakpoints that happen here
+	 * continue to use the NMI stack.
+	 */
+	if (unlikely(is_debug_stack(regs->sp))) {
+		debug_stack_set_zero();
+		__get_cpu_var(update_debug_stack) = 1;
+	}
+}
+
+static inline void nmi_nesting_postprocess(void)
+{
+	if (unlikely(__get_cpu_var(update_debug_stack)))
+		debug_stack_reset();
+}
+#endif
+
 dotraplinkage notrace __kprobes void
 do_nmi(struct pt_regs *regs, long error_code)
 {
+	nmi_nesting_preprocess(regs);
+
 	nmi_enter();
 
 	inc_irq_stat(__nmi_count);
@@ -416,6 +515,9 @@ do_nmi(struct pt_regs *regs, long error_code)
 		default_do_nmi(regs);
 
 	nmi_exit();
+
+	/* On i386, may loop back to preprocess */
+	nmi_nesting_postprocess();
 }
 
 void stop_nmi(void)

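For the i386 path, the three-state latch described in the comment above is split across the nmi_nesting_preprocess()/nmi_nesting_postprocess() macros. A small, self-contained userspace sketch of the same state machine (using C11 atomics in place of the per-CPU variable and cmpxchg()) may make the control flow easier to follow; it is an illustration, not kernel code.

/*
 * Userspace sketch of the three-state NMI latch described above.
 * Illustration only: a plain atomic int stands in for the per-CPU
 * nmi_state, and the "NMIs" are just function calls.
 */
#include <stdatomic.h>
#include <stdio.h>

enum nmi_states { NMI_NOT_RUNNING, NMI_EXECUTING, NMI_LATCHED };

static _Atomic int nmi_state = NMI_NOT_RUNNING;

static void handle_one_nmi(void)
{
	printf("handling NMI\n");
}

static void do_nmi_sketch(void)
{
	int expected;

	/* nmi_nesting_preprocess(): latch and bail if one is already running */
	if (atomic_load(&nmi_state) != NMI_NOT_RUNNING) {
		atomic_store(&nmi_state, NMI_LATCHED);
		return;
	}

restart:
	atomic_store(&nmi_state, NMI_EXECUTING);

	handle_one_nmi();

	/*
	 * nmi_nesting_postprocess(): if another NMI latched itself while we
	 * ran, the cmpxchg fails and we loop back to service it.
	 */
	expected = NMI_EXECUTING;
	if (!atomic_compare_exchange_strong(&nmi_state, &expected,
					    NMI_NOT_RUNNING))
		goto restart;
}

int main(void)
{
	do_nmi_sketch();
	return 0;
}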
+ 20 - 0
arch/x86/kernel/traps.c

@@ -311,9 +311,15 @@ dotraplinkage void __kprobes do_int3(struct pt_regs *regs, long error_code)
 			== NOTIFY_STOP)
 		return;
 
+	/*
+	 * Let others (NMI) know that the debug stack is in use
+	 * as we may switch to the interrupt stack.
+	 */
+	debug_stack_usage_inc();
 	preempt_conditional_sti(regs);
 	do_trap(3, SIGTRAP, "int3", regs, error_code, NULL);
 	preempt_conditional_cli(regs);
+	debug_stack_usage_dec();
 }
 
 #ifdef CONFIG_X86_64
@@ -406,6 +412,12 @@ dotraplinkage void __kprobes do_debug(struct pt_regs *regs, long error_code)
 							SIGTRAP) == NOTIFY_STOP)
 		return;
 
+	/*
+	 * Let others (NMI) know that the debug stack is in use
+	 * as we may switch to the interrupt stack.
+	 */
+	debug_stack_usage_inc();
+
 	/* It's safe to allow irq's after DR6 has been saved */
 	preempt_conditional_sti(regs);
 
@@ -413,6 +425,7 @@ dotraplinkage void __kprobes do_debug(struct pt_regs *regs, long error_code)
 		handle_vm86_trap((struct kernel_vm86_regs *) regs,
 				error_code, 1);
 		preempt_conditional_cli(regs);
+		debug_stack_usage_dec();
 		return;
 	}
 
@@ -432,6 +445,7 @@ dotraplinkage void __kprobes do_debug(struct pt_regs *regs, long error_code)
 	if (tsk->thread.debugreg6 & (DR_STEP | DR_TRAP_BITS) || user_icebp)
 		send_sigtrap(tsk, regs, error_code, si_code);
 	preempt_conditional_cli(regs);
+	debug_stack_usage_dec();
 
 	return;
 }
@@ -718,4 +732,10 @@ void __init trap_init(void)
 	cpu_init();
 
 	x86_init.irqs.trap_init();
+
+#ifdef CONFIG_X86_64
+	memcpy(&nmi_idt_table, &idt_table, IDT_ENTRIES * 16);
+	set_nmi_gate(1, &debug);
+	set_nmi_gate(3, &int3);
+#endif
 }

+ 5 - 0
include/linux/compiler-gcc.h

@@ -50,6 +50,11 @@
 # define inline		inline		__attribute__((always_inline))
 # define __inline__	__inline__	__attribute__((always_inline))
 # define __inline	__inline	__attribute__((always_inline))
+#else
+/* A lot of inline functions can cause havoc with function tracing */
+# define inline		inline		notrace
+# define __inline__	__inline__	notrace
+# define __inline	__inline	notrace
 #endif
 
 #define __deprecated			__attribute__((deprecated))

+ 72 - 5
include/linux/ftrace.h

@@ -133,6 +133,8 @@ struct ftrace_func_command {
 int ftrace_arch_code_modify_prepare(void);
 int ftrace_arch_code_modify_post_process(void);
 
+void ftrace_bug(int err, unsigned long ip);
+
 struct seq_file;
 
 struct ftrace_probe_ops {
@@ -161,7 +163,6 @@ extern int ftrace_text_reserved(void *start, void *end);
 
 enum {
 	FTRACE_FL_ENABLED	= (1 << 30),
-	FTRACE_FL_FREE		= (1 << 31),
 };
 
 #define FTRACE_FL_MASK		(0x3UL << 30)
@@ -172,10 +173,7 @@ struct dyn_ftrace {
 		unsigned long		ip; /* address of mcount call-site */
 		struct dyn_ftrace	*freelist;
 	};
-	union {
-		unsigned long		flags;
-		struct dyn_ftrace	*newlist;
-	};
+	unsigned long		flags;
 	struct dyn_arch_ftrace		arch;
 };
 
@@ -190,6 +188,56 @@ void ftrace_set_global_notrace(unsigned char *buf, int len, int reset);
 int register_ftrace_command(struct ftrace_func_command *cmd);
 int unregister_ftrace_command(struct ftrace_func_command *cmd);
 
+enum {
+	FTRACE_UPDATE_CALLS		= (1 << 0),
+	FTRACE_DISABLE_CALLS		= (1 << 1),
+	FTRACE_UPDATE_TRACE_FUNC	= (1 << 2),
+	FTRACE_START_FUNC_RET		= (1 << 3),
+	FTRACE_STOP_FUNC_RET		= (1 << 4),
+};
+
+enum {
+	FTRACE_UPDATE_IGNORE,
+	FTRACE_UPDATE_MAKE_CALL,
+	FTRACE_UPDATE_MAKE_NOP,
+};
+
+enum {
+	FTRACE_ITER_FILTER	= (1 << 0),
+	FTRACE_ITER_NOTRACE	= (1 << 1),
+	FTRACE_ITER_PRINTALL	= (1 << 2),
+	FTRACE_ITER_DO_HASH	= (1 << 3),
+	FTRACE_ITER_HASH	= (1 << 4),
+	FTRACE_ITER_ENABLED	= (1 << 5),
+};
+
+void arch_ftrace_update_code(int command);
+
+struct ftrace_rec_iter;
+
+struct ftrace_rec_iter *ftrace_rec_iter_start(void);
+struct ftrace_rec_iter *ftrace_rec_iter_next(struct ftrace_rec_iter *iter);
+struct dyn_ftrace *ftrace_rec_iter_record(struct ftrace_rec_iter *iter);
+
+int ftrace_update_record(struct dyn_ftrace *rec, int enable);
+int ftrace_test_record(struct dyn_ftrace *rec, int enable);
+void ftrace_run_stop_machine(int command);
+int ftrace_location(unsigned long ip);
+
+extern ftrace_func_t ftrace_trace_function;
+
+int ftrace_regex_open(struct ftrace_ops *ops, int flag,
+		  struct inode *inode, struct file *file);
+ssize_t ftrace_filter_write(struct file *file, const char __user *ubuf,
+			    size_t cnt, loff_t *ppos);
+ssize_t ftrace_notrace_write(struct file *file, const char __user *ubuf,
+			     size_t cnt, loff_t *ppos);
+loff_t ftrace_regex_lseek(struct file *file, loff_t offset, int origin);
+int ftrace_regex_release(struct inode *inode, struct file *file);
+
+void __init
+ftrace_set_early_filter(struct ftrace_ops *ops, char *buf, int enable);
+
 /* defined in arch */
 extern int ftrace_ip_converted(unsigned long ip);
 extern int ftrace_dyn_arch_init(void *data);
@@ -284,6 +332,25 @@ static inline int ftrace_text_reserved(void *start, void *end)
 {
 	return 0;
 }
+
+/*
+ * Again users of functions that have ftrace_ops may not
+ * have them defined when ftrace is not enabled, but these
+ * functions may still be called. Use a macro instead of inline.
+ */
+#define ftrace_regex_open(ops, flag, inod, file) ({ -ENODEV; })
+#define ftrace_set_early_filter(ops, buf, enable) do { } while (0)
+
+static inline ssize_t ftrace_filter_write(struct file *file, const char __user *ubuf,
+			    size_t cnt, loff_t *ppos) { return -ENODEV; }
+static inline ssize_t ftrace_notrace_write(struct file *file, const char __user *ubuf,
+			     size_t cnt, loff_t *ppos) { return -ENODEV; }
+static inline loff_t ftrace_regex_lseek(struct file *file, loff_t offset, int origin)
+{
+	return -ENODEV;
+}
+static inline int
+ftrace_regex_release(struct inode *inode, struct file *file) { return -ENODEV; }
 #endif /* CONFIG_DYNAMIC_FTRACE */
 
 /* totally disable ftrace - can not re-enable after this */

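The new ftrace_rec_iter_start()/ftrace_rec_iter_next()/ftrace_rec_iter_record() declarations introduce a record-iterator API whose implementation lives in kernel/trace/ftrace.c (that diff is suppressed below). The following self-contained userspace mock uses stand-in bodies and only illustrates the calling pattern an arch_ftrace_update_code() implementation might use.

/*
 * Self-contained mock (not kernel code) of the dyn_ftrace record
 * iterator API declared above.  The real implementations are in
 * kernel/trace/ftrace.c; these stubs exist only to show the loop.
 */
#include <stddef.h>
#include <stdio.h>

struct dyn_ftrace {
	unsigned long ip;	/* address of mcount call-site */
	unsigned long flags;
};

struct ftrace_rec_iter {
	struct dyn_ftrace *rec;
	size_t index;
};

static struct dyn_ftrace mock_records[] = {
	{ .ip = 0x1000 }, { .ip = 0x2000 }, { .ip = 0x3000 },
};
static struct ftrace_rec_iter mock_iter;

static struct ftrace_rec_iter *ftrace_rec_iter_start(void)
{
	mock_iter.index = 0;
	mock_iter.rec = &mock_records[0];
	return &mock_iter;
}

static struct ftrace_rec_iter *ftrace_rec_iter_next(struct ftrace_rec_iter *iter)
{
	if (++iter->index >= sizeof(mock_records) / sizeof(mock_records[0]))
		return NULL;
	iter->rec = &mock_records[iter->index];
	return iter;
}

static struct dyn_ftrace *ftrace_rec_iter_record(struct ftrace_rec_iter *iter)
{
	return iter->rec;
}

int main(void)
{
	struct ftrace_rec_iter *iter;

	/* The calling pattern an arch_ftrace_update_code() might use. */
	for (iter = ftrace_rec_iter_start(); iter;
	     iter = ftrace_rec_iter_next(iter)) {
		struct dyn_ftrace *rec = ftrace_rec_iter_record(iter);

		printf("would update call-site at %#lx\n", rec->ip);
	}
	return 0;
}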
The diff content for this file is too large to display
+ 423 - 190
kernel/trace/ftrace.c


+ 142 - 141
kernel/trace/trace_events_filter.c

@@ -1738,11 +1738,121 @@ static int replace_system_preds(struct event_subsystem *system,
 	return -ENOMEM;
 }
 
+static int create_filter_start(char *filter_str, bool set_str,
+			       struct filter_parse_state **psp,
+			       struct event_filter **filterp)
+{
+	struct event_filter *filter;
+	struct filter_parse_state *ps = NULL;
+	int err = 0;
+
+	WARN_ON_ONCE(*psp || *filterp);
+
+	/* allocate everything, and if any fails, free all and fail */
+	filter = __alloc_filter();
+	if (filter && set_str)
+		err = replace_filter_string(filter, filter_str);
+
+	ps = kzalloc(sizeof(*ps), GFP_KERNEL);
+
+	if (!filter || !ps || err) {
+		kfree(ps);
+		__free_filter(filter);
+		return -ENOMEM;
+	}
+
+	/* we're committed to creating a new filter */
+	*filterp = filter;
+	*psp = ps;
+
+	parse_init(ps, filter_ops, filter_str);
+	err = filter_parse(ps);
+	if (err && set_str)
+		append_filter_err(ps, filter);
+	return err;
+}
+
+static void create_filter_finish(struct filter_parse_state *ps)
+{
+	if (ps) {
+		filter_opstack_clear(ps);
+		postfix_clear(ps);
+		kfree(ps);
+	}
+}
+
+/**
+ * create_filter - create a filter for a ftrace_event_call
+ * @call: ftrace_event_call to create a filter for
+ * @filter_str: filter string
+ * @set_str: remember @filter_str and enable detailed error in filter
+ * @filterp: out param for created filter (always updated on return)
+ *
+ * Creates a filter for @call with @filter_str.  If @set_str is %true,
+ * @filter_str is copied and recorded in the new filter.
+ *
+ * On success, returns 0 and *@filterp points to the new filter.  On
+ * failure, returns -errno and *@filterp may point to %NULL or to a new
+ * filter.  In the latter case, the returned filter contains error
+ * information if @set_str is %true and the caller is responsible for
+ * freeing it.
+ */
+static int create_filter(struct ftrace_event_call *call,
+			 char *filter_str, bool set_str,
+			 struct event_filter **filterp)
+{
+	struct event_filter *filter = NULL;
+	struct filter_parse_state *ps = NULL;
+	int err;
+
+	err = create_filter_start(filter_str, set_str, &ps, &filter);
+	if (!err) {
+		err = replace_preds(call, filter, ps, filter_str, false);
+		if (err && set_str)
+			append_filter_err(ps, filter);
+	}
+	create_filter_finish(ps);
+
+	*filterp = filter;
+	return err;
+}
+
+/**
+ * create_system_filter - create a filter for an event_subsystem
+ * @system: event_subsystem to create a filter for
+ * @filter_str: filter string
+ * @filterp: out param for created filter (always updated on return)
+ *
+ * Identical to create_filter() except that it creates a subsystem filter
+ * and always remembers @filter_str.
+ */
+static int create_system_filter(struct event_subsystem *system,
+				char *filter_str, struct event_filter **filterp)
+{
+	struct event_filter *filter = NULL;
+	struct filter_parse_state *ps = NULL;
+	int err;
+
+	err = create_filter_start(filter_str, true, &ps, &filter);
+	if (!err) {
+		err = replace_system_preds(system, ps, filter_str);
+		if (!err) {
+			/* System filters just show a default message */
+			kfree(filter->filter_string);
+			filter->filter_string = NULL;
+		} else {
+			append_filter_err(ps, filter);
+		}
+	}
+	create_filter_finish(ps);
+
+	*filterp = filter;
+	return err;
+}
+
 int apply_event_filter(struct ftrace_event_call *call, char *filter_string)
 {
-	struct filter_parse_state *ps;
 	struct event_filter *filter;
-	struct event_filter *tmp;
 	int err = 0;
 
 	mutex_lock(&event_mutex);
@@ -1759,49 +1869,30 @@ int apply_event_filter(struct ftrace_event_call *call, char *filter_string)
 		goto out_unlock;
 	}
 
-	err = -ENOMEM;
-	ps = kzalloc(sizeof(*ps), GFP_KERNEL);
-	if (!ps)
-		goto out_unlock;
-
-	filter = __alloc_filter();
-	if (!filter) {
-		kfree(ps);
-		goto out_unlock;
-	}
-
-	replace_filter_string(filter, filter_string);
-
-	parse_init(ps, filter_ops, filter_string);
-	err = filter_parse(ps);
-	if (err) {
-		append_filter_err(ps, filter);
-		goto out;
-	}
+	err = create_filter(call, filter_string, true, &filter);
 
-	err = replace_preds(call, filter, ps, filter_string, false);
-	if (err) {
-		filter_disable(call);
-		append_filter_err(ps, filter);
-	} else
-		call->flags |= TRACE_EVENT_FL_FILTERED;
-out:
 	/*
 	 * Always swap the call filter with the new filter
 	 * even if there was an error. If there was an error
 	 * in the filter, we disable the filter and show the error
 	 * string
 	 */
-	tmp = call->filter;
-	rcu_assign_pointer(call->filter, filter);
-	if (tmp) {
-		/* Make sure the call is done with the filter */
-		synchronize_sched();
-		__free_filter(tmp);
+	if (filter) {
+		struct event_filter *tmp = call->filter;
+
+		if (!err)
+			call->flags |= TRACE_EVENT_FL_FILTERED;
+		else
+			filter_disable(call);
+
+		rcu_assign_pointer(call->filter, filter);
+
+		if (tmp) {
+			/* Make sure the call is done with the filter */
+			synchronize_sched();
+			__free_filter(tmp);
+		}
 	}
-	filter_opstack_clear(ps);
-	postfix_clear(ps);
-	kfree(ps);
 out_unlock:
 	mutex_unlock(&event_mutex);
 
@@ -1811,7 +1902,6 @@ out_unlock:
 int apply_subsystem_event_filter(struct event_subsystem *system,
 				 char *filter_string)
 {
-	struct filter_parse_state *ps;
 	struct event_filter *filter;
 	int err = 0;
 
@@ -1835,48 +1925,19 @@ int apply_subsystem_event_filter(struct event_subsystem *system,
 		goto out_unlock;
 	}
 
-	err = -ENOMEM;
-	ps = kzalloc(sizeof(*ps), GFP_KERNEL);
-	if (!ps)
-		goto out_unlock;
-
-	filter = __alloc_filter();
-	if (!filter)
-		goto out;
-
-	/* System filters just show a default message */
-	kfree(filter->filter_string);
-	filter->filter_string = NULL;
-
-	/*
-	 * No event actually uses the system filter
-	 * we can free it without synchronize_sched().
-	 */
-	__free_filter(system->filter);
-	system->filter = filter;
-
-	parse_init(ps, filter_ops, filter_string);
-	err = filter_parse(ps);
-	if (err)
-		goto err_filter;
-
-	err = replace_system_preds(system, ps, filter_string);
-	if (err)
-		goto err_filter;
-
-out:
-	filter_opstack_clear(ps);
-	postfix_clear(ps);
-	kfree(ps);
+	err = create_system_filter(system, filter_string, &filter);
+	if (filter) {
+		/*
+		 * No event actually uses the system filter
+		 * we can free it without synchronize_sched().
+		 */
+		__free_filter(system->filter);
+		system->filter = filter;
+	}
 out_unlock:
 	mutex_unlock(&event_mutex);
 
 	return err;
-
-err_filter:
-	replace_filter_string(filter, filter_string);
-	append_filter_err(ps, system->filter);
-	goto out;
 }
 
 #ifdef CONFIG_PERF_EVENTS
@@ -1894,7 +1955,6 @@ int ftrace_profile_set_filter(struct perf_event *event, int event_id,
 {
 	int err;
 	struct event_filter *filter;
-	struct filter_parse_state *ps;
 	struct ftrace_event_call *call;
 
 	mutex_lock(&event_mutex);
@@ -1909,33 +1969,10 @@ int ftrace_profile_set_filter(struct perf_event *event, int event_id,
 	if (event->filter)
 		goto out_unlock;
 
-	filter = __alloc_filter();
-	if (!filter) {
-		err = PTR_ERR(filter);
-		goto out_unlock;
-	}
-
-	err = -ENOMEM;
-	ps = kzalloc(sizeof(*ps), GFP_KERNEL);
-	if (!ps)
-		goto free_filter;
-
-	parse_init(ps, filter_ops, filter_str);
-	err = filter_parse(ps);
-	if (err)
-		goto free_ps;
-
-	err = replace_preds(call, filter, ps, filter_str, false);
+	err = create_filter(call, filter_str, false, &filter);
 	if (!err)
 		event->filter = filter;
-
-free_ps:
-	filter_opstack_clear(ps);
-	postfix_clear(ps);
-	kfree(ps);
-
-free_filter:
-	if (err)
+	else
 		__free_filter(filter);
 
 out_unlock:
@@ -1954,43 +1991,6 @@ out_unlock:
 #define CREATE_TRACE_POINTS
 #include "trace_events_filter_test.h"
 
-static int test_get_filter(char *filter_str, struct ftrace_event_call *call,
-			   struct event_filter **pfilter)
-{
-	struct event_filter *filter;
-	struct filter_parse_state *ps;
-	int err = -ENOMEM;
-
-	filter = __alloc_filter();
-	if (!filter)
-		goto out;
-
-	ps = kzalloc(sizeof(*ps), GFP_KERNEL);
-	if (!ps)
-		goto free_filter;
-
-	parse_init(ps, filter_ops, filter_str);
-	err = filter_parse(ps);
-	if (err)
-		goto free_ps;
-
-	err = replace_preds(call, filter, ps, filter_str, false);
-	if (!err)
-		*pfilter = filter;
-
- free_ps:
-	filter_opstack_clear(ps);
-	postfix_clear(ps);
-	kfree(ps);
-
- free_filter:
-	if (err)
-		__free_filter(filter);
-
- out:
-	return err;
-}
-
 #define DATA_REC(m, va, vb, vc, vd, ve, vf, vg, vh, nvisit) \
 { \
 	.filter = FILTER, \
@@ -2109,12 +2109,13 @@ static __init int ftrace_test_event_filter(void)
 		struct test_filter_data_t *d = &test_filter_data[i];
 		int err;
 
-		err = test_get_filter(d->filter, &event_ftrace_test_filter,
-				      &filter);
+		err = create_filter(&event_ftrace_test_filter, d->filter,
+				    false, &filter);
 		if (err) {
 			printk(KERN_INFO
 			       "Failed to get filter for '%s', err %d\n",
 			       d->filter, err);
+			__free_filter(filter);
 			break;
 		}
 

+ 29 - 1
kernel/trace/trace_stack.c

@@ -13,6 +13,9 @@
 #include <linux/sysctl.h>
 #include <linux/init.h>
 #include <linux/fs.h>
+
+#include <asm/setup.h>
+
 #include "trace.h"
 
 #define STACK_TRACE_ENTRIES 500
@@ -133,7 +136,6 @@ stack_trace_call(unsigned long ip, unsigned long parent_ip)
 static struct ftrace_ops trace_ops __read_mostly =
 {
 	.func = stack_trace_call,
-	.flags = FTRACE_OPS_FL_GLOBAL,
 };
 
 static ssize_t
@@ -311,6 +313,21 @@ static const struct file_operations stack_trace_fops = {
 	.release	= seq_release,
 };
 
+static int
+stack_trace_filter_open(struct inode *inode, struct file *file)
+{
+	return ftrace_regex_open(&trace_ops, FTRACE_ITER_FILTER,
+				 inode, file);
+}
+
+static const struct file_operations stack_trace_filter_fops = {
+	.open = stack_trace_filter_open,
+	.read = seq_read,
+	.write = ftrace_filter_write,
+	.llseek = ftrace_regex_lseek,
+	.release = ftrace_regex_release,
+};
+
 int
 stack_trace_sysctl(struct ctl_table *table, int write,
 		   void __user *buffer, size_t *lenp,
@@ -338,8 +355,13 @@ stack_trace_sysctl(struct ctl_table *table, int write,
 	return ret;
 }
 
+static char stack_trace_filter_buf[COMMAND_LINE_SIZE+1] __initdata;
+
 static __init int enable_stacktrace(char *str)
 {
+	if (strncmp(str, "_filter=", 8) == 0)
+		strncpy(stack_trace_filter_buf, str+8, COMMAND_LINE_SIZE);
+
 	stack_tracer_enabled = 1;
 	last_stack_tracer_enabled = 1;
 	return 1;
@@ -358,6 +380,12 @@ static __init int stack_trace_init(void)
 	trace_create_file("stack_trace", 0444, d_tracer,
 			NULL, &stack_trace_fops);
 
+	trace_create_file("stack_trace_filter", 0444, d_tracer,
+			NULL, &stack_trace_filter_fops);
+
+	if (stack_trace_filter_buf[0])
+		ftrace_set_early_filter(&trace_ops, stack_trace_filter_buf, 1);
+
 	if (stack_tracer_enabled)
 		register_ftrace_function(&trace_ops);
 

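The strncmp(str, "_filter=", 8) check in enable_stacktrace() works because early-parameter matching is by prefix: assuming the file registers the handler with __setup("stacktrace", enable_stacktrace) (that line is outside this hunk), a boot option such as stacktrace_filter=foo reaches the handler with str pointing at "_filter=foo". A minimal userspace sketch of that dispatch, with a hypothetical dispatch_boot_param() standing in for the kernel's early-param walk:

/*
 * Userspace sketch only.  dispatch_boot_param() imitates the kernel's
 * prefix-based __setup matching; enable_stacktrace() mirrors the hunk
 * above.
 */
#include <stdio.h>
#include <string.h>

#define COMMAND_LINE_SIZE 2048

static char stack_trace_filter_buf[COMMAND_LINE_SIZE + 1];
static int stack_tracer_enabled;

static int enable_stacktrace(char *str)
{
	if (strncmp(str, "_filter=", 8) == 0)
		strncpy(stack_trace_filter_buf, str + 8, COMMAND_LINE_SIZE);

	stack_tracer_enabled = 1;
	return 1;
}

static void dispatch_boot_param(char *param)
{
	/* prefix match, as the kernel's early-param handling does */
	if (strncmp(param, "stacktrace", 10) == 0)
		enable_stacktrace(param + 10);
}

int main(void)
{
	char opt[] = "stacktrace_filter=sys_write,schedule";

	dispatch_boot_param(opt);
	printf("enabled=%d filter='%s'\n",
	       stack_tracer_enabled, stack_trace_filter_buf);
	return 0;
}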
+ 1 - 1
scripts/recordmcount.h

@@ -462,7 +462,7 @@ __has_rel_mcount(Elf_Shdr const *const relhdr,  /* is SHT_REL or SHT_RELA */
 		succeed_file();
 	}
 	if (w(txthdr->sh_type) != SHT_PROGBITS ||
-	    !(w(txthdr->sh_flags) & SHF_EXECINSTR))
+	    !(_w(txthdr->sh_flags) & SHF_EXECINSTR))
 		return NULL;
 	return txtname;
 }

+ 2 - 0
tools/perf/Documentation/perf-list.txt

@@ -21,6 +21,8 @@ EVENT MODIFIERS
 Events can optionally have a modifier by appending a colon and one or
 more modifiers.  Modifiers allow the user to restrict when events are
 counted with 'u' for user-space, 'k' for kernel, 'h' for hypervisor.
+Additional modifiers are 'G' for guest counting (in KVM guests) and 'H'
+for host counting (not in KVM guests).
 
 The 'p' modifier can be used for specifying how precise the instruction
 address should be. The 'p' modifier is currently only implemented for

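At the perf_event_attr level, the new 'G' and 'H' modifiers simply flip the exclude_host/exclude_guest bits, as the parse_event_modifier() change further down in this diff shows. The sketch below reproduces that logic with a local stand-in struct (not the real struct perf_event_attr) so it stays self-contained.

/*
 * Sketch only: what the 'G' and 'H' event modifiers boil down to,
 * following the parse_event_modifier() change below.  attr_sketch is
 * a stand-in for struct perf_event_attr.
 */
#include <stdio.h>
#include <string.h>

struct attr_sketch {
	unsigned int exclude_guest : 1;	/* 'H': count host only */
	unsigned int exclude_host  : 1;	/* 'G': count guest only */
};

static void apply_gh_modifier(struct attr_sketch *attr, const char *mods)
{
	int exclude_GH = 0, eG = 0, eH = 0;

	for (; *mods; mods++) {
		if (*mods == 'G') {
			if (!exclude_GH)
				exclude_GH = eG = eH = 1;
			eG = 0;			/* keep guest, drop host */
		} else if (*mods == 'H') {
			if (!exclude_GH)
				exclude_GH = eG = eH = 1;
			eH = 0;			/* keep host, drop guest */
		}
	}
	attr->exclude_host  = eH;
	attr->exclude_guest = eG;
}

int main(void)
{
	struct attr_sketch attr;

	memset(&attr, 0, sizeof(attr));
	apply_gh_modifier(&attr, "G");		/* e.g. -e cycles:G */
	printf("exclude_host=%u exclude_guest=%u\n",
	       attr.exclude_host, attr.exclude_guest);
	return 0;
}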
+ 1 - 0
tools/perf/MANIFEST

@@ -1,4 +1,5 @@
 tools/perf
+include/linux/const.h
 include/linux/perf_event.h
 include/linux/rbtree.h
 include/linux/list.h

+ 1 - 6
tools/perf/builtin-annotate.c

@@ -235,7 +235,7 @@ out_delete:
 }
 
 static const char * const annotate_usage[] = {
-	"perf annotate [<options>] <command>",
+	"perf annotate [<options>]",
 	NULL
 };
 
@@ -313,10 +313,5 @@ int cmd_annotate(int argc, const char **argv, const char *prefix __used)
 		annotate.sym_hist_filter = argv[0];
 	}
 
-	if (field_sep && *field_sep == '.') {
-		pr_err("'.' is the only non valid --field-separator argument\n");
-		return -1;
-	}
-
 	return __cmd_annotate(&annotate);
 }

+ 3 - 0
tools/perf/builtin-kmem.c

@@ -108,7 +108,9 @@ static void setup_cpunode_map(void)
 				continue;
 			cpunode_map[cpu] = mem;
 		}
+		closedir(dir2);
 	}
+	closedir(dir1);
 }
 
 static void insert_alloc_stat(unsigned long call_site, unsigned long ptr,
@@ -645,6 +647,7 @@ static int setup_sorting(struct list_head *sort_list, const char *arg)
 			break;
 		if (sort_dimension__add(tok, sort_list) < 0) {
 			error("Unknown --sort key: '%s'", tok);
+			free(str);
 			return -1;
 		}
 	}

+ 2 - 4
tools/perf/builtin-kvm.c

@@ -22,9 +22,6 @@
 static const char		*file_name;
 static char			name_buffer[256];
 
-bool				perf_host = 1;
-bool				perf_guest;
-
 static const char * const kvm_usage[] = {
 	"perf kvm [<options>] {top|record|report|diff|buildid-list}",
 	NULL
@@ -107,7 +104,8 @@ static int __cmd_buildid_list(int argc, const char **argv)
 
 int cmd_kvm(int argc, const char **argv, const char *prefix __used)
 {
-	perf_host = perf_guest = 0;
+	perf_host  = 0;
+	perf_guest = 1;
 
 	argc = parse_options(argc, argv, kvm_options, kvm_usage,
 			PARSE_OPT_STOP_AT_NON_OPTION);

+ 4 - 0
tools/perf/builtin-script.c

@@ -1018,13 +1018,17 @@ static char *get_script_path(const char *script_root, const char *suffix)
 			__script_root = get_script_root(&script_dirent, suffix);
 			if (__script_root && !strcmp(script_root, __script_root)) {
 				free(__script_root);
+				closedir(lang_dir);
+				closedir(scripts_dir);
 				snprintf(script_path, MAXPATHLEN, "%s/%s",
 					 lang_path, script_dirent.d_name);
 				return strdup(script_path);
 			}
 			free(__script_root);
 		}
+		closedir(lang_dir);
 	}
+	closedir(scripts_dir);
 
 	return NULL;
 }

+ 1 - 1
tools/perf/builtin-test.c

@@ -1396,7 +1396,7 @@ int cmd_test(int argc, const char **argv, const char *prefix __used)
 	NULL,
 	};
 	const struct option test_options[] = {
-	OPT_INTEGER('v', "verbose", &verbose,
+	OPT_INCR('v', "verbose", &verbose,
 		    "be more verbose (show symbol address, etc)"),
 	OPT_END()
 	};

+ 4 - 1
tools/perf/builtin-top.c

@@ -235,7 +235,6 @@ static struct hist_entry *perf_evsel__add_hist_entry(struct perf_evsel *evsel,
 	if (he == NULL)
 		return NULL;
 
-	evsel->hists.stats.total_period += sample->period;
 	hists__inc_nr_events(&evsel->hists, PERF_RECORD_SAMPLE);
 	return he;
 }
@@ -889,6 +888,10 @@ try_again:
 				ui__warning("The %s event is not supported.\n",
 					    event_name(counter));
 				goto out_err;
+			} else if (err == EMFILE) {
+				ui__warning("Too many events are opened.\n"
+					    "Try again after reducing the number of events\n");
+				goto out_err;
 			}
 
 			ui__warning("The sys_perf_event_open() syscall "

+ 4 - 1
tools/perf/util/evlist.c

@@ -111,8 +111,11 @@ int perf_evlist__add_default(struct perf_evlist *evlist)
 		.type = PERF_TYPE_HARDWARE,
 		.config = PERF_COUNT_HW_CPU_CYCLES,
 	};
-	struct perf_evsel *evsel = perf_evsel__new(&attr, 0);
+	struct perf_evsel *evsel;
+
+	event_attr_init(&attr);
 
+	evsel = perf_evsel__new(&attr, 0);
 	if (evsel == NULL)
 		goto error;
 

+ 68 - 63
tools/perf/util/hist.c

@@ -76,21 +76,21 @@ static void hists__calc_col_len(struct hists *hists, struct hist_entry *h)
 	}
 }
 
-static void hist_entry__add_cpumode_period(struct hist_entry *self,
+static void hist_entry__add_cpumode_period(struct hist_entry *he,
 					   unsigned int cpumode, u64 period)
 {
 	switch (cpumode) {
 	case PERF_RECORD_MISC_KERNEL:
-		self->period_sys += period;
+		he->period_sys += period;
 		break;
 	case PERF_RECORD_MISC_USER:
-		self->period_us += period;
+		he->period_us += period;
 		break;
 	case PERF_RECORD_MISC_GUEST_KERNEL:
-		self->period_guest_sys += period;
+		he->period_guest_sys += period;
 		break;
 	case PERF_RECORD_MISC_GUEST_USER:
-		self->period_guest_us += period;
+		he->period_guest_us += period;
 		break;
 	default:
 		break;
@@ -165,18 +165,18 @@ void hists__decay_entries_threaded(struct hists *hists,
 static struct hist_entry *hist_entry__new(struct hist_entry *template)
 {
 	size_t callchain_size = symbol_conf.use_callchain ? sizeof(struct callchain_root) : 0;
-	struct hist_entry *self = malloc(sizeof(*self) + callchain_size);
+	struct hist_entry *he = malloc(sizeof(*he) + callchain_size);
 
-	if (self != NULL) {
-		*self = *template;
-		self->nr_events = 1;
-		if (self->ms.map)
-			self->ms.map->referenced = true;
+	if (he != NULL) {
+		*he = *template;
+		he->nr_events = 1;
+		if (he->ms.map)
+			he->ms.map->referenced = true;
 		if (symbol_conf.use_callchain)
-			callchain_init(self->callchain);
+			callchain_init(he->callchain);
 	}
 
-	return self;
+	return he;
 }
 
 static void hists__inc_nr_entries(struct hists *hists, struct hist_entry *h)
@@ -677,15 +677,16 @@ static size_t callchain__fprintf_flat(FILE *fp, struct callchain_node *self,
 	return ret;
 }
 
-static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self,
-					    u64 total_samples, int left_margin)
+static size_t hist_entry_callchain__fprintf(struct hist_entry *he,
+					    u64 total_samples, int left_margin,
+					    FILE *fp)
 {
 	struct rb_node *rb_node;
 	struct callchain_node *chain;
 	size_t ret = 0;
 	u32 entries_printed = 0;
 
-	rb_node = rb_first(&self->sorted_chain);
+	rb_node = rb_first(&he->sorted_chain);
 	while (rb_node) {
 		double percent;
 
@@ -730,35 +731,35 @@ void hists__output_recalc_col_len(struct hists *hists, int max_rows)
 	}
 }
 
-static int hist_entry__pcnt_snprintf(struct hist_entry *self, char *s,
+static int hist_entry__pcnt_snprintf(struct hist_entry *he, char *s,
 				     size_t size, struct hists *pair_hists,
 				     bool show_displacement, long displacement,
-				     bool color, u64 session_total)
+				     bool color, u64 total_period)
 {
 	u64 period, total, period_sys, period_us, period_guest_sys, period_guest_us;
 	u64 nr_events;
 	const char *sep = symbol_conf.field_sep;
 	int ret;
 
-	if (symbol_conf.exclude_other && !self->parent)
+	if (symbol_conf.exclude_other && !he->parent)
 		return 0;
 
 	if (pair_hists) {
-		period = self->pair ? self->pair->period : 0;
-		nr_events = self->pair ? self->pair->nr_events : 0;
+		period = he->pair ? he->pair->period : 0;
+		nr_events = he->pair ? he->pair->nr_events : 0;
 		total = pair_hists->stats.total_period;
-		period_sys = self->pair ? self->pair->period_sys : 0;
-		period_us = self->pair ? self->pair->period_us : 0;
-		period_guest_sys = self->pair ? self->pair->period_guest_sys : 0;
-		period_guest_us = self->pair ? self->pair->period_guest_us : 0;
+		period_sys = he->pair ? he->pair->period_sys : 0;
+		period_us = he->pair ? he->pair->period_us : 0;
+		period_guest_sys = he->pair ? he->pair->period_guest_sys : 0;
+		period_guest_us = he->pair ? he->pair->period_guest_us : 0;
 	} else {
-		period = self->period;
-		nr_events = self->nr_events;
-		total = session_total;
-		period_sys = self->period_sys;
-		period_us = self->period_us;
-		period_guest_sys = self->period_guest_sys;
-		period_guest_us = self->period_guest_us;
+		period = he->period;
+		nr_events = he->nr_events;
+		total = total_period;
+		period_sys = he->period_sys;
+		period_us = he->period_us;
+		period_guest_sys = he->period_guest_sys;
+		period_guest_us = he->period_guest_us;
 	}
 
 	if (total) {
@@ -812,8 +813,8 @@ static int hist_entry__pcnt_snprintf(struct hist_entry *self, char *s,
 
 		if (total > 0)
 			old_percent = (period * 100.0) / total;
-		if (session_total > 0)
-			new_percent = (self->period * 100.0) / session_total;
+		if (total_period > 0)
+			new_percent = (he->period * 100.0) / total_period;
 
 		diff = new_percent - old_percent;
 
@@ -862,9 +863,10 @@ int hist_entry__snprintf(struct hist_entry *he, char *s, size_t size,
 	return ret;
 }
 
-int hist_entry__fprintf(struct hist_entry *he, size_t size, struct hists *hists,
-			struct hists *pair_hists, bool show_displacement,
-			long displacement, FILE *fp, u64 session_total)
+static int hist_entry__fprintf(struct hist_entry *he, size_t size,
+			       struct hists *hists, struct hists *pair_hists,
+			       bool show_displacement, long displacement,
+			       u64 total_period, FILE *fp)
 {
 	char bf[512];
 	int ret;
@@ -874,14 +876,14 @@ int hist_entry__fprintf(struct hist_entry *he, size_t size, struct hists *hists,
 
 	ret = hist_entry__pcnt_snprintf(he, bf, size, pair_hists,
 					show_displacement, displacement,
-					true, session_total);
+					true, total_period);
 	hist_entry__snprintf(he, bf + ret, size - ret, hists);
 	return fprintf(fp, "%s\n", bf);
 }
 
-static size_t hist_entry__fprintf_callchain(struct hist_entry *self,
-					    struct hists *hists, FILE *fp,
-					    u64 session_total)
+static size_t hist_entry__fprintf_callchain(struct hist_entry *he,
+					    struct hists *hists,
+					    u64 total_period, FILE *fp)
 {
 	int left_margin = 0;
 
@@ -889,11 +891,10 @@ static size_t hist_entry__fprintf_callchain(struct hist_entry *self,
 		struct sort_entry *se = list_first_entry(&hist_entry__sort_list,
 							 typeof(*se), list);
 		left_margin = hists__col_len(hists, se->se_width_idx);
-		left_margin -= thread__comm_len(self->thread);
+		left_margin -= thread__comm_len(he->thread);
 	}
 
-	return hist_entry_callchain__fprintf(fp, self, session_total,
-					     left_margin);
+	return hist_entry_callchain__fprintf(he, total_period, left_margin, fp);
 }
 
 size_t hists__fprintf(struct hists *hists, struct hists *pair,
@@ -903,6 +904,7 @@ size_t hists__fprintf(struct hists *hists, struct hists *pair,
 	struct sort_entry *se;
 	struct rb_node *nd;
 	size_t ret = 0;
+	u64 total_period;
 	unsigned long position = 1;
 	long displacement = 0;
 	unsigned int width;
@@ -917,20 +919,6 @@ size_t hists__fprintf(struct hists *hists, struct hists *pair,
 
 	fprintf(fp, "# %s", pair ? "Baseline" : "Overhead");
 
-	if (symbol_conf.show_nr_samples) {
-		if (sep)
-			fprintf(fp, "%cSamples", *sep);
-		else
-			fputs("  Samples  ", fp);
-	}
-
-	if (symbol_conf.show_total_period) {
-		if (sep)
-			ret += fprintf(fp, "%cPeriod", *sep);
-		else
-			ret += fprintf(fp, "   Period    ");
-	}
-
 	if (symbol_conf.show_cpu_utilization) {
 		if (sep) {
 			ret += fprintf(fp, "%csys", *sep);
@@ -940,8 +928,8 @@ size_t hists__fprintf(struct hists *hists, struct hists *pair,
 				ret += fprintf(fp, "%cguest us", *sep);
 			}
 		} else {
-			ret += fprintf(fp, "  sys  ");
-			ret += fprintf(fp, "  us  ");
+			ret += fprintf(fp, "     sys  ");
+			ret += fprintf(fp, "      us  ");
 			if (perf_guest) {
 				ret += fprintf(fp, "  guest sys  ");
 				ret += fprintf(fp, "  guest us  ");
@@ -949,6 +937,20 @@ size_t hists__fprintf(struct hists *hists, struct hists *pair,
 		}
 	}
 
+	if (symbol_conf.show_nr_samples) {
+		if (sep)
+			fprintf(fp, "%cSamples", *sep);
+		else
+			fputs("  Samples  ", fp);
+	}
+
+	if (symbol_conf.show_total_period) {
+		if (sep)
+			ret += fprintf(fp, "%cPeriod", *sep);
+		else
+			ret += fprintf(fp, "   Period    ");
+	}
+
 	if (pair) {
 		if (sep)
 			ret += fprintf(fp, "%cDelta", *sep);
@@ -993,6 +995,8 @@ size_t hists__fprintf(struct hists *hists, struct hists *pair,
 		goto print_entries;
 
 	fprintf(fp, "# ........");
+	if (symbol_conf.show_cpu_utilization)
+		fprintf(fp, "   .......   .......");
 	if (symbol_conf.show_nr_samples)
 		fprintf(fp, " ..........");
 	if (symbol_conf.show_total_period)
@@ -1025,6 +1029,8 @@ size_t hists__fprintf(struct hists *hists, struct hists *pair,
 		goto out;
 
 print_entries:
+	total_period = hists->stats.total_period;
+
 	for (nd = rb_first(&hists->entries); nd; nd = rb_next(nd)) {
 		struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
 
@@ -1040,11 +1046,10 @@ print_entries:
 			++position;
 		}
 		ret += hist_entry__fprintf(h, max_cols, hists, pair, show_displacement,
-					   displacement, fp, hists->stats.total_period);
+					   displacement, total_period, fp);
 
 		if (symbol_conf.use_callchain)
-			ret += hist_entry__fprintf_callchain(h, hists, fp,
-							     hists->stats.total_period);
+			ret += hist_entry__fprintf_callchain(h, hists, total_period, fp);
 		if (max_rows && ++nr_rows >= max_rows)
 			goto out;
 

+ 2 - 5
tools/perf/util/hist.h

@@ -66,11 +66,8 @@ struct hists {
 struct hist_entry *__hists__add_entry(struct hists *self,
 				      struct addr_location *al,
 				      struct symbol *parent, u64 period);
-extern int64_t hist_entry__cmp(struct hist_entry *, struct hist_entry *);
-extern int64_t hist_entry__collapse(struct hist_entry *, struct hist_entry *);
-int hist_entry__fprintf(struct hist_entry *he, size_t size, struct hists *hists,
-			struct hists *pair_hists, bool show_displacement,
-			long displacement, FILE *fp, u64 session_total);
+int64_t hist_entry__cmp(struct hist_entry *left, struct hist_entry *right);
+int64_t hist_entry__collapse(struct hist_entry *left, struct hist_entry *right);
 int hist_entry__snprintf(struct hist_entry *self, char *bf, size_t size,
 			 struct hists *hists);
 void hist_entry__free(struct hist_entry *);

+ 13 - 2
tools/perf/util/parse-events.c

@@ -735,8 +735,8 @@ static int
 parse_event_modifier(const char **strp, struct perf_event_attr *attr)
 {
 	const char *str = *strp;
-	int exclude = 0;
-	int eu = 0, ek = 0, eh = 0, precise = 0;
+	int exclude = 0, exclude_GH = 0;
+	int eu = 0, ek = 0, eh = 0, eH = 0, eG = 0, precise = 0;
 
 	if (!*str)
 		return 0;
@@ -760,6 +760,14 @@ parse_event_modifier(const char **strp, struct perf_event_attr *attr)
 			if (!exclude)
 				exclude = eu = ek = eh = 1;
 			eh = 0;
+		} else if (*str == 'G') {
+			if (!exclude_GH)
+				exclude_GH = eG = eH = 1;
+			eG = 0;
+		} else if (*str == 'H') {
+			if (!exclude_GH)
+				exclude_GH = eG = eH = 1;
+			eH = 0;
 		} else if (*str == 'p') {
 			precise++;
 		} else
@@ -776,6 +784,8 @@ parse_event_modifier(const char **strp, struct perf_event_attr *attr)
 	attr->exclude_kernel = ek;
 	attr->exclude_hv     = eh;
 	attr->precise_ip     = precise;
+	attr->exclude_host   = eH;
+	attr->exclude_guest  = eG;
 
 	return 0;
 }
@@ -838,6 +848,7 @@ int parse_events(struct perf_evlist *evlist , const char *str, int unset __used)
 	for (;;) {
 		ostr = str;
 		memset(&attr, 0, sizeof(attr));
+		event_attr_init(&attr);
 		ret = parse_event_symbols(evlist, &str, &attr);
 		if (ret == EVT_FAILED)
 			return -1;

+ 0 - 1
tools/perf/util/trace-event-info.c

@@ -18,7 +18,6 @@
  *
  * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  */
-#include <ctype.h>
 #include "util.h"
 #include <dirent.h>
 #include <mntent.h>

+ 15 - 0
tools/perf/util/util.c

@@ -1,6 +1,21 @@
+#include "../perf.h"
 #include "util.h"
 #include <sys/mman.h>
 
+/*
+ * XXX We need to find a better place for these things...
+ */
+bool perf_host  = true;
+bool perf_guest = true;
+
+void event_attr_init(struct perf_event_attr *attr)
+{
+	if (!perf_host)
+		attr->exclude_host  = 1;
+	if (!perf_guest)
+		attr->exclude_guest = 1;
+}
+
 int mkdir_p(char *path, mode_t mode)
 {
 	struct stat st;

+ 4 - 0
tools/perf/util/util.h

@@ -242,6 +242,10 @@ int strtailcmp(const char *s1, const char *s2);
 unsigned long convert_unit(unsigned long value, char *unit);
 int readn(int fd, void *buf, size_t size);
 
+struct perf_event_attr;
+
+void event_attr_init(struct perf_event_attr *attr);
+
 #define _STR(x) #x
 #define STR(x) _STR(x)
 

Some files were not shown because too many files changed in this diff