@@ -38,13 +38,96 @@
 #include <asm/irq_regs.h>
 
+struct remote_function_call {
+	struct task_struct *p;
+	int (*func)(void *info);
+	void *info;
+	int ret;
+};
+
+static void remote_function(void *data)
+{
+	struct remote_function_call *tfc = data;
+	struct task_struct *p = tfc->p;
+
+	if (p) {
+		tfc->ret = -EAGAIN;
+		if (task_cpu(p) != smp_processor_id() || !task_curr(p))
+			return;
+	}
+
+	tfc->ret = tfc->func(tfc->info);
+}
+
+/**
+ * task_function_call - call a function on the cpu on which a task runs
+ * @p: the task to evaluate
+ * @func: the function to be called
+ * @info: the function call argument
+ *
+ * Calls the function @func when the task is currently running. This might
+ * be on the current CPU, which just calls the function directly
+ *
+ * returns: @func return value, or
+ *	    -ESRCH  - when the process isn't running
+ *	    -EAGAIN - when the process moved away
+ */
+static int
+task_function_call(struct task_struct *p, int (*func) (void *info), void *info)
+{
+	struct remote_function_call data = {
+		.p = p,
+		.func = func,
+		.info = info,
+		.ret = -ESRCH, /* No such (running) process */
+	};
+
+	if (task_curr(p))
+		smp_call_function_single(task_cpu(p), remote_function, &data, 1);
+
+	return data.ret;
+}
+
+/**
+ * cpu_function_call - call a function on the cpu
+ * @func:	the function to be called
+ * @info:	the function call argument
+ *
+ * Calls the function @func on the remote cpu.
+ *
+ * returns: @func return value or -ENXIO when the cpu is offline
+ */
+static int cpu_function_call(int cpu, int (*func) (void *info), void *info)
+{
+	struct remote_function_call data = {
+		.p	= NULL,
+		.func = func,
+		.info = info,
+		.ret = -ENXIO, /* No such CPU */
+	};
+
+	smp_call_function_single(cpu, remote_function, &data, 1);
+
+	return data.ret;
+}
+
+#define PERF_FLAG_ALL (PERF_FLAG_FD_NO_GROUP |\
+		       PERF_FLAG_FD_OUTPUT  |\
+		       PERF_FLAG_PID_CGROUP)
+
 enum event_type_t {
 	EVENT_FLEXIBLE = 0x1,
 	EVENT_PINNED = 0x2,
 	EVENT_ALL = EVENT_FLEXIBLE | EVENT_PINNED,
 };
 
-atomic_t perf_task_events __read_mostly;
+/*
+ * perf_sched_events : >0 events exist
+ * perf_cgroup_events: >0 per-cpu cgroup events exist on this cpu
+ */
+atomic_t perf_sched_events __read_mostly;
+static DEFINE_PER_CPU(atomic_t, perf_cgroup_events);
+
 static atomic_t nr_mmap_events __read_mostly;
 static atomic_t nr_comm_events __read_mostly;
 static atomic_t nr_task_events __read_mostly;
@@ -67,7 +150,24 @@ int sysctl_perf_event_mlock __read_mostly = 512; /* 'free' kb per user */
 /*
  * max perf event sample rate
  */
-int sysctl_perf_event_sample_rate __read_mostly = 100000;
+#define DEFAULT_MAX_SAMPLE_RATE 100000
+int sysctl_perf_event_sample_rate __read_mostly = DEFAULT_MAX_SAMPLE_RATE;
+static int max_samples_per_tick __read_mostly =
+	DIV_ROUND_UP(DEFAULT_MAX_SAMPLE_RATE, HZ);
+
+int perf_proc_update_handler(struct ctl_table *table, int write,
+		void __user *buffer, size_t *lenp,
+		loff_t *ppos)
+{
+	int ret = proc_dointvec(table, write, buffer, lenp, ppos);
+
+	if (ret || !write)
+		return ret;
+
+	max_samples_per_tick = DIV_ROUND_UP(sysctl_perf_event_sample_rate, HZ);
+
+	return 0;
+}
 
 static atomic64_t perf_event_id;
 
@@ -75,7 +175,11 @@ static void cpu_ctx_sched_out(struct perf_cpu_context *cpuctx,
 			      enum event_type_t event_type);
 
 static void cpu_ctx_sched_in(struct perf_cpu_context *cpuctx,
-			     enum event_type_t event_type);
+			     enum event_type_t event_type,
+			     struct task_struct *task);
+
+static void update_context_time(struct perf_event_context *ctx);
+static u64 perf_event_time(struct perf_event *event);
 
 void __weak perf_event_print_debug(void) { }
 
@@ -89,6 +193,360 @@ static inline u64 perf_clock(void)
 	return local_clock();
 }
 
+static inline struct perf_cpu_context *
+__get_cpu_context(struct perf_event_context *ctx)
+{
+	return this_cpu_ptr(ctx->pmu->pmu_cpu_context);
+}
+
+#ifdef CONFIG_CGROUP_PERF
+
+/*
+ * Must ensure cgroup is pinned (css_get) before calling
+ * this function. In other words, we cannot call this function
+ * if there is no cgroup event for the current CPU context.
+ */
+static inline struct perf_cgroup *
+perf_cgroup_from_task(struct task_struct *task)
+{
+	return container_of(task_subsys_state(task, perf_subsys_id),
+			struct perf_cgroup, css);
+}
+
+static inline bool
+perf_cgroup_match(struct perf_event *event)
+{
+	struct perf_event_context *ctx = event->ctx;
+	struct perf_cpu_context *cpuctx = __get_cpu_context(ctx);
+
+	return !event->cgrp || event->cgrp == cpuctx->cgrp;
+}
+
+static inline void perf_get_cgroup(struct perf_event *event)
+{
+	css_get(&event->cgrp->css);
+}
+
+static inline void perf_put_cgroup(struct perf_event *event)
+{
+	css_put(&event->cgrp->css);
+}
+
+static inline void perf_detach_cgroup(struct perf_event *event)
+{
+	perf_put_cgroup(event);
+	event->cgrp = NULL;
+}
+
+static inline int is_cgroup_event(struct perf_event *event)
+{
+	return event->cgrp != NULL;
+}
+
+static inline u64 perf_cgroup_event_time(struct perf_event *event)
+{
+	struct perf_cgroup_info *t;
+
+	t = per_cpu_ptr(event->cgrp->info, event->cpu);
+	return t->time;
+}
+
+static inline void __update_cgrp_time(struct perf_cgroup *cgrp)
+{
+	struct perf_cgroup_info *info;
+	u64 now;
+
+	now = perf_clock();
+
+	info = this_cpu_ptr(cgrp->info);
+
+	info->time += now - info->timestamp;
+	info->timestamp = now;
+}
+
+static inline void update_cgrp_time_from_cpuctx(struct perf_cpu_context *cpuctx)
+{
+	struct perf_cgroup *cgrp_out = cpuctx->cgrp;
+	if (cgrp_out)
+		__update_cgrp_time(cgrp_out);
+}
+
+static inline void update_cgrp_time_from_event(struct perf_event *event)
+{
+	struct perf_cgroup *cgrp;
+
+	/*
+	 * ensure we access cgroup data only when needed and
+	 * when we know the cgroup is pinned (css_get)
+	 */
+	if (!is_cgroup_event(event))
+		return;
+
+	cgrp = perf_cgroup_from_task(current);
+	/*
+	 * Do not update time when cgroup is not active
+	 */
+	if (cgrp == event->cgrp)
+		__update_cgrp_time(event->cgrp);
+}
+
+static inline void
+perf_cgroup_set_timestamp(struct task_struct *task,
+			  struct perf_event_context *ctx)
+{
+	struct perf_cgroup *cgrp;
+	struct perf_cgroup_info *info;
+
+	/*
+	 * ctx->lock held by caller
+	 * ensure we do not access cgroup data
+	 * unless we have the cgroup pinned (css_get)
+	 */
+	if (!task || !ctx->nr_cgroups)
+		return;
+
+	cgrp = perf_cgroup_from_task(task);
+	info = this_cpu_ptr(cgrp->info);
+	info->timestamp = ctx->timestamp;
+}
+
+#define PERF_CGROUP_SWOUT	0x1 /* cgroup switch out every event */
+#define PERF_CGROUP_SWIN	0x2 /* cgroup switch in events based on task */
+
+/*
+ * reschedule events based on the cgroup constraint of task.
+ *
+ * mode SWOUT : schedule out everything
+ * mode SWIN : schedule in based on cgroup for next
+ */
+void perf_cgroup_switch(struct task_struct *task, int mode)
+{
+	struct perf_cpu_context *cpuctx;
+	struct pmu *pmu;
+	unsigned long flags;
+
+	/*
+	 * disable interrupts to avoid geting nr_cgroup
+	 * changes via __perf_event_disable(). Also
+	 * avoids preemption.
+	 */
+	local_irq_save(flags);
+
+	/*
+	 * we reschedule only in the presence of cgroup
+	 * constrained events.
+	 */
+	rcu_read_lock();
+
+	list_for_each_entry_rcu(pmu, &pmus, entry) {
+
+		cpuctx = this_cpu_ptr(pmu->pmu_cpu_context);
+
+		perf_pmu_disable(cpuctx->ctx.pmu);
+
+		/*
+		 * perf_cgroup_events says at least one
+		 * context on this CPU has cgroup events.
+		 *
+		 * ctx->nr_cgroups reports the number of cgroup
+		 * events for a context.
+		 */
+		if (cpuctx->ctx.nr_cgroups > 0) {
+
+			if (mode & PERF_CGROUP_SWOUT) {
+				cpu_ctx_sched_out(cpuctx, EVENT_ALL);
+				/*
+				 * must not be done before ctxswout due
+				 * to event_filter_match() in event_sched_out()
+				 */
+				cpuctx->cgrp = NULL;
+			}
+
+			if (mode & PERF_CGROUP_SWIN) {
+				/* set cgrp before ctxsw in to
+				 * allow event_filter_match() to not
+				 * have to pass task around
+				 */
+				cpuctx->cgrp = perf_cgroup_from_task(task);
+				cpu_ctx_sched_in(cpuctx, EVENT_ALL, task);
+			}
+		}
+
+		perf_pmu_enable(cpuctx->ctx.pmu);
+	}
+
+	rcu_read_unlock();
+
+	local_irq_restore(flags);
+}
+
+static inline void perf_cgroup_sched_out(struct task_struct *task)
+{
+	perf_cgroup_switch(task, PERF_CGROUP_SWOUT);
+}
+
+static inline void perf_cgroup_sched_in(struct task_struct *task)
+{
+	perf_cgroup_switch(task, PERF_CGROUP_SWIN);
+}
+
+static inline int perf_cgroup_connect(int fd, struct perf_event *event,
+				      struct perf_event_attr *attr,
+				      struct perf_event *group_leader)
+{
+	struct perf_cgroup *cgrp;
+	struct cgroup_subsys_state *css;
+	struct file *file;
+	int ret = 0, fput_needed;
+
+	file = fget_light(fd, &fput_needed);
+	if (!file)
+		return -EBADF;
+
+	css = cgroup_css_from_dir(file, perf_subsys_id);
+	if (IS_ERR(css)) {
+		ret = PTR_ERR(css);
+		goto out;
+	}
+
+	cgrp = container_of(css, struct perf_cgroup, css);
+	event->cgrp = cgrp;
+
+	/* must be done before we fput() the file */
+	perf_get_cgroup(event);
+
+	/*
+	 * all events in a group must monitor
+	 * the same cgroup because a task belongs
+	 * to only one perf cgroup at a time
+	 */
+	if (group_leader && group_leader->cgrp != cgrp) {
+		perf_detach_cgroup(event);
+		ret = -EINVAL;
+	}
+out:
+	fput_light(file, fput_needed);
+	return ret;
+}
+
+static inline void
+perf_cgroup_set_shadow_time(struct perf_event *event, u64 now)
+{
+	struct perf_cgroup_info *t;
+	t = per_cpu_ptr(event->cgrp->info, event->cpu);
+	event->shadow_ctx_time = now - t->timestamp;
+}
+
+static inline void
+perf_cgroup_defer_enabled(struct perf_event *event)
+{
+	/*
+	 * when the current task's perf cgroup does not match
+	 * the event's, we need to remember to call the
+	 * perf_mark_enable() function the first time a task with
+	 * a matching perf cgroup is scheduled in.
+	 */
+	if (is_cgroup_event(event) && !perf_cgroup_match(event))
+		event->cgrp_defer_enabled = 1;
+}
+
+static inline void
+perf_cgroup_mark_enabled(struct perf_event *event,
+			 struct perf_event_context *ctx)
+{
+	struct perf_event *sub;
+	u64 tstamp = perf_event_time(event);
+
+	if (!event->cgrp_defer_enabled)
+		return;
+
+	event->cgrp_defer_enabled = 0;
+
+	event->tstamp_enabled = tstamp - event->total_time_enabled;
+	list_for_each_entry(sub, &event->sibling_list, group_entry) {
+		if (sub->state >= PERF_EVENT_STATE_INACTIVE) {
+			sub->tstamp_enabled = tstamp - sub->total_time_enabled;
+			sub->cgrp_defer_enabled = 0;
+		}
+	}
+}
+#else /* !CONFIG_CGROUP_PERF */
+
+static inline bool
+perf_cgroup_match(struct perf_event *event)
+{
+	return true;
+}
+
+static inline void perf_detach_cgroup(struct perf_event *event)
+{}
+
+static inline int is_cgroup_event(struct perf_event *event)
+{
+	return 0;
+}
+
+static inline u64 perf_cgroup_event_cgrp_time(struct perf_event *event)
+{
+	return 0;
+}
+
+static inline void update_cgrp_time_from_event(struct perf_event *event)
+{
+}
+
+static inline void update_cgrp_time_from_cpuctx(struct perf_cpu_context *cpuctx)
+{
+}
+
+static inline void perf_cgroup_sched_out(struct task_struct *task)
+{
+}
+
+static inline void perf_cgroup_sched_in(struct task_struct *task)
+{
+}
+
+static inline int perf_cgroup_connect(pid_t pid, struct perf_event *event,
+				      struct perf_event_attr *attr,
+				      struct perf_event *group_leader)
+{
+	return -EINVAL;
+}
+
+static inline void
+perf_cgroup_set_timestamp(struct task_struct *task,
+			  struct perf_event_context *ctx)
+{
+}
+
+void
+perf_cgroup_switch(struct task_struct *task, struct task_struct *next)
+{
+}
+
+static inline void
+perf_cgroup_set_shadow_time(struct perf_event *event, u64 now)
+{
+}
+
+static inline u64 perf_cgroup_event_time(struct perf_event *event)
+{
+	return 0;
+}
+
+static inline void
+perf_cgroup_defer_enabled(struct perf_event *event)
+{
+}
+
+static inline void
+perf_cgroup_mark_enabled(struct perf_event *event,
+			 struct perf_event_context *ctx)
+{
+}
+#endif
+
 void perf_pmu_disable(struct pmu *pmu)
 {
 	int *count = this_cpu_ptr(pmu->pmu_disable_count);
@@ -254,7 +712,6 @@ static void perf_unpin_context(struct perf_event_context *ctx)
 	raw_spin_lock_irqsave(&ctx->lock, flags);
 	--ctx->pin_count;
 	raw_spin_unlock_irqrestore(&ctx->lock, flags);
-	put_ctx(ctx);
 }
 
 /*
@@ -271,6 +728,10 @@ static void update_context_time(struct perf_event_context *ctx)
 static u64 perf_event_time(struct perf_event *event)
 {
 	struct perf_event_context *ctx = event->ctx;
+
+	if (is_cgroup_event(event))
+		return perf_cgroup_event_time(event);
+
 	return ctx ? ctx->time : 0;
 }
 
@@ -285,9 +746,20 @@ static void update_event_times(struct perf_event *event)
 	if (event->state < PERF_EVENT_STATE_INACTIVE ||
 	    event->group_leader->state < PERF_EVENT_STATE_INACTIVE)
 		return;
-
-	if (ctx->is_active)
+	/*
+	 * in cgroup mode, time_enabled represents
+	 * the time the event was enabled AND active
+	 * tasks were in the monitored cgroup. This is
+	 * independent of the activity of the context as
+	 * there may be a mix of cgroup and non-cgroup events.
+	 *
+	 * That is why we treat cgroup events differently
+	 * here.
+	 */
+	if (is_cgroup_event(event))
 		run_end = perf_event_time(event);
+	else if (ctx->is_active)
+		run_end = ctx->time;
 	else
 		run_end = event->tstamp_stopped;
 
@@ -299,6 +771,7 @@ static void update_event_times(struct perf_event *event)
 		run_end = perf_event_time(event);
 
 	event->total_time_running = run_end - event->tstamp_running;
+
 }
 
 /*
@@ -347,6 +820,9 @@ list_add_event(struct perf_event *event, struct perf_event_context *ctx)
 		list_add_tail(&event->group_entry, list);
 	}
 
+	if (is_cgroup_event(event))
+		ctx->nr_cgroups++;
+
 	list_add_rcu(&event->event_entry, &ctx->event_list);
 	if (!ctx->nr_events)
 		perf_pmu_rotate_start(ctx->pmu);
@@ -473,6 +949,9 @@ list_del_event(struct perf_event *event, struct perf_event_context *ctx)
 
 	event->attach_state &= ~PERF_ATTACH_CONTEXT;
 
+	if (is_cgroup_event(event))
+		ctx->nr_cgroups--;
+
 	ctx->nr_events--;
 	if (event->attr.inherit_stat)
 		ctx->nr_stat--;
@@ -544,7 +1023,8 @@ out:
 static inline int
 event_filter_match(struct perf_event *event)
 {
-	return event->cpu == -1 || event->cpu == smp_processor_id();
+	return (event->cpu == -1 || event->cpu == smp_processor_id())
+	    && perf_cgroup_match(event);
 }
 
 static void
@@ -562,7 +1042,7 @@ event_sched_out(struct perf_event *event,
 	 */
 	if (event->state == PERF_EVENT_STATE_INACTIVE
 	    && !event_filter_match(event)) {
-		delta = ctx->time - event->tstamp_stopped;
+		delta = tstamp - event->tstamp_stopped;
 		event->tstamp_running += delta;
 		event->tstamp_stopped = tstamp;
 	}
@@ -606,47 +1086,30 @@ group_sched_out(struct perf_event *group_event,
 	cpuctx->exclusive = 0;
 }
 
-static inline struct perf_cpu_context *
-__get_cpu_context(struct perf_event_context *ctx)
-{
-	return this_cpu_ptr(ctx->pmu->pmu_cpu_context);
-}
-
 /*
  * Cross CPU call to remove a performance event
  *
  * We disable the event on the hardware level first. After that we
  * remove it from the context list.
  */
-static void __perf_event_remove_from_context(void *info)
+static int __perf_remove_from_context(void *info)
 {
 	struct perf_event *event = info;
 	struct perf_event_context *ctx = event->ctx;
 	struct perf_cpu_context *cpuctx = __get_cpu_context(ctx);
 
-	/*
-	 * If this is a task context, we need to check whether it is
-	 * the current task context of this cpu. If not it has been
-	 * scheduled out before the smp call arrived.
-	 */
-	if (ctx->task && cpuctx->task_ctx != ctx)
-		return;
-
 	raw_spin_lock(&ctx->lock);
-
 	event_sched_out(event, cpuctx, ctx);
-
 	list_del_event(event, ctx);
-
 	raw_spin_unlock(&ctx->lock);
+
+	return 0;
 }
 
 /*
  * Remove the event from a task's (or a CPU's) list of events.
  *
- * Must be called with ctx->mutex held.
- *
  * CPU events are removed with a smp call. For task events we only
 * call when the task is on a CPU.
 *
@@ -657,49 +1120,48 @@ static void __perf_event_remove_from_context(void *info)
 * When called from perf_event_exit_task, it's OK because the
 * context has been detached from its task.
 */
-static void perf_event_remove_from_context(struct perf_event *event)
+static void perf_remove_from_context(struct perf_event *event)
 {
 	struct perf_event_context *ctx = event->ctx;
 	struct task_struct *task = ctx->task;
 
+	lockdep_assert_held(&ctx->mutex);
+
 	if (!task) {
 		/*
 		 * Per cpu events are removed via an smp call and
 		 * the removal is always successful.
 		 */
-		smp_call_function_single(event->cpu,
-					 __perf_event_remove_from_context,
-					 event, 1);
+		cpu_function_call(event->cpu, __perf_remove_from_context, event);
 		return;
 	}
 
 retry:
-	task_oncpu_function_call(task, __perf_event_remove_from_context,
-				 event);
+	if (!task_function_call(task, __perf_remove_from_context, event))
+		return;
 
 	raw_spin_lock_irq(&ctx->lock);
 	/*
-	 * If the context is active we need to retry the smp call.
+	 * If we failed to find a running task, but find the context active now
+	 * that we've acquired the ctx->lock, retry.
 	 */
-	if (ctx->nr_active && !list_empty(&event->group_entry)) {
+	if (ctx->is_active) {
 		raw_spin_unlock_irq(&ctx->lock);
 		goto retry;
 	}
 
 	/*
-	 * The lock prevents that this context is scheduled in so we
-	 * can remove the event safely, if the call above did not
-	 * succeed.
+	 * Since the task isn't running, its safe to remove the event, us
+	 * holding the ctx->lock ensures the task won't get scheduled in.
 	 */
-	if (!list_empty(&event->group_entry))
-		list_del_event(event, ctx);
+	list_del_event(event, ctx);
 	raw_spin_unlock_irq(&ctx->lock);
 }
 
 /*
 * Cross CPU call to disable a performance event
 */
-static void __perf_event_disable(void *info)
+static int __perf_event_disable(void *info)
 {
 	struct perf_event *event = info;
 	struct perf_event_context *ctx = event->ctx;
@@ -708,9 +1170,12 @@ static void __perf_event_disable(void *info)
 	/*
 	 * If this is a per-task event, need to check whether this
 	 * event's task is the current task on this cpu.
+	 *
+	 * Can trigger due to concurrent perf_event_context_sched_out()
+	 * flipping contexts around.
 	 */
 	if (ctx->task && cpuctx->task_ctx != ctx)
-		return;
+		return -EINVAL;
 
 	raw_spin_lock(&ctx->lock);
 
@@ -720,6 +1185,7 @@ static void __perf_event_disable(void *info)
 	 */
 	if (event->state >= PERF_EVENT_STATE_INACTIVE) {
 		update_context_time(ctx);
+		update_cgrp_time_from_event(event);
 		update_group_times(event);
 		if (event == event->group_leader)
 			group_sched_out(event, cpuctx, ctx);
@@ -729,6 +1195,8 @@ static void __perf_event_disable(void *info)
 	}
 
 	raw_spin_unlock(&ctx->lock);
+
+	return 0;
 }
 
 /*
@@ -753,13 +1221,13 @@ void perf_event_disable(struct perf_event *event)
 		/*
 		 * Disable the event on the cpu that it's on
 		 */
-		smp_call_function_single(event->cpu, __perf_event_disable,
-					 event, 1);
+		cpu_function_call(event->cpu, __perf_event_disable, event);
 		return;
 	}
 
 retry:
-	task_oncpu_function_call(task, __perf_event_disable, event);
+	if (!task_function_call(task, __perf_event_disable, event))
+		return;
 
 	raw_spin_lock_irq(&ctx->lock);
 	/*
@@ -767,6 +1235,11 @@ retry:
 	 */
 	if (event->state == PERF_EVENT_STATE_ACTIVE) {
 		raw_spin_unlock_irq(&ctx->lock);
+		/*
+		 * Reload the task pointer, it might have been changed by
+		 * a concurrent perf_event_context_sched_out().
+		 */
+		task = ctx->task;
 		goto retry;
 	}
 
@@ -778,10 +1251,44 @@ retry:
 		update_group_times(event);
 		event->state = PERF_EVENT_STATE_OFF;
 	}
-
 	raw_spin_unlock_irq(&ctx->lock);
 }
 
+static void perf_set_shadow_time(struct perf_event *event,
+				 struct perf_event_context *ctx,
+				 u64 tstamp)
+{
+	/*
+	 * use the correct time source for the time snapshot
+	 *
+	 * We could get by without this by leveraging the
+	 * fact that to get to this function, the caller
+	 * has most likely already called update_context_time()
+	 * and update_cgrp_time_xx() and thus both timestamp
+	 * are identical (or very close). Given that tstamp is,
+	 * already adjusted for cgroup, we could say that:
+	 *    tstamp - ctx->timestamp
+	 * is equivalent to
+	 *    tstamp - cgrp->timestamp.
+	 *
+	 * Then, in perf_output_read(), the calculation would
+	 * work with no changes because:
+	 * - event is guaranteed scheduled in
+	 * - no scheduled out in between
+	 * - thus the timestamp would be the same
+	 *
+	 * But this is a bit hairy.
+	 *
+	 * So instead, we have an explicit cgroup call to remain
+	 * within the time time source all along. We believe it
+	 * is cleaner and simpler to understand.
+	 */
+	if (is_cgroup_event(event))
+		perf_cgroup_set_shadow_time(event, tstamp);
+	else
+		event->shadow_ctx_time = tstamp - ctx->timestamp;
+}
+
 #define MAX_INTERRUPTS (~0ULL)
 
 static void perf_log_throttle(struct perf_event *event, int enable);
@@ -822,7 +1329,7 @@ event_sched_in(struct perf_event *event,
 
 	event->tstamp_running += tstamp - event->tstamp_stopped;
 
-	event->shadow_ctx_time = tstamp - ctx->timestamp;
+	perf_set_shadow_time(event, ctx, tstamp);
 
 	if (!is_software_event(event))
 		cpuctx->active_oncpu++;
@@ -943,12 +1450,15 @@ static void add_event_to_ctx(struct perf_event *event,
 	event->tstamp_stopped = tstamp;
 }
 
+static void perf_event_context_sched_in(struct perf_event_context *ctx,
+					struct task_struct *tsk);
+
 /*
 * Cross CPU call to install and enable a performance event
 *
 * Must be called with ctx->mutex held
 */
-static void __perf_install_in_context(void *info)
+static int __perf_install_in_context(void *info)
 {
 	struct perf_event *event = info;
 	struct perf_event_context *ctx = event->ctx;
@@ -957,21 +1467,22 @@ static void __perf_install_in_context(void *info)
 	int err;
 
 	/*
-	 * If this is a task context, we need to check whether it is
-	 * the current task context of this cpu. If not it has been
-	 * scheduled out before the smp call arrived.
-	 * Or possibly this is the right context but it isn't
-	 * on this cpu because it had no events.
+	 * In case we're installing a new context to an already running task,
+	 * could also happen before perf_event_task_sched_in() on architectures
+	 * which do context switches with IRQs enabled.
 	 */
-	if (ctx->task && cpuctx->task_ctx != ctx) {
-		if (cpuctx->task_ctx || ctx->task != current)
-			return;
-		cpuctx->task_ctx = ctx;
-	}
+	if (ctx->task && !cpuctx->task_ctx)
+		perf_event_context_sched_in(ctx, ctx->task);
 
 	raw_spin_lock(&ctx->lock);
 	ctx->is_active = 1;
 	update_context_time(ctx);
+	/*
+	 * update cgrp time only if current cgrp
+	 * matches event->cgrp. Must be done before
+	 * calling add_event_to_ctx()
+	 */
+	update_cgrp_time_from_event(event);
 
 	add_event_to_ctx(event, ctx);
 
@@ -1012,6 +1523,8 @@ static void __perf_install_in_context(void *info)
 
 unlock:
 	raw_spin_unlock(&ctx->lock);
+
+	return 0;
 }
 
 /*
@@ -1023,8 +1536,6 @@ unlock:
 * If the event is attached to a task which is on a CPU we use a smp
 * call to enable it in the task context. The task might have been
 * scheduled away, but we check this in the smp call again.
- *
- * Must be called with ctx->mutex held.
 */
 static void
 perf_install_in_context(struct perf_event_context *ctx,
@@ -1033,6 +1544,8 @@ perf_install_in_context(struct perf_event_context *ctx,
 {
 	struct task_struct *task = ctx->task;
 
+	lockdep_assert_held(&ctx->mutex);
+
 	event->ctx = ctx;
 
 	if (!task) {
@@ -1040,31 +1553,29 @@ perf_install_in_context(struct perf_event_context *ctx,
 		 * Per cpu events are installed via an smp call and
 		 * the install is always successful.
 		 */
-		smp_call_function_single(cpu, __perf_install_in_context,
-					 event, 1);
+		cpu_function_call(cpu, __perf_install_in_context, event);
 		return;
 	}
 
 retry:
-	task_oncpu_function_call(task, __perf_install_in_context,
-				 event);
+	if (!task_function_call(task, __perf_install_in_context, event))
+		return;
 
 	raw_spin_lock_irq(&ctx->lock);
 	/*
-	 * we need to retry the smp call.
+	 * If we failed to find a running task, but find the context active now
+	 * that we've acquired the ctx->lock, retry.
 	 */
-	if (ctx->is_active && list_empty(&event->group_entry)) {
+	if (ctx->is_active) {
 		raw_spin_unlock_irq(&ctx->lock);
 		goto retry;
 	}
 
 	/*
-	 * The lock prevents that this context is scheduled in so we
-	 * can add the event safely, if it the call above did not
-	 * succeed.
+	 * Since the task isn't running, its safe to add the event, us holding
+	 * the ctx->lock ensures the task won't get scheduled in.
 	 */
-	if (list_empty(&event->group_entry))
-		add_event_to_ctx(event, ctx);
+	add_event_to_ctx(event, ctx);
 	raw_spin_unlock_irq(&ctx->lock);
 }
 
@@ -1093,7 +1604,7 @@ static void __perf_event_mark_enabled(struct perf_event *event,
 /*
 * Cross CPU call to enable a performance event
 */
-static void __perf_event_enable(void *info)
+static int __perf_event_enable(void *info)
 {
 	struct perf_event *event = info;
 	struct perf_event_context *ctx = event->ctx;
@@ -1101,26 +1612,27 @@ static void __perf_event_enable(void *info)
 	struct perf_cpu_context *cpuctx = __get_cpu_context(ctx);
 	int err;
 
-	/*
-	 * If this is a per-task event, need to check whether this
-	 * event's task is the current task on this cpu.
-	 */
-	if (ctx->task && cpuctx->task_ctx != ctx) {
-		if (cpuctx->task_ctx || ctx->task != current)
-			return;
-		cpuctx->task_ctx = ctx;
-	}
+	if (WARN_ON_ONCE(!ctx->is_active))
+		return -EINVAL;
 
 	raw_spin_lock(&ctx->lock);
-	ctx->is_active = 1;
 	update_context_time(ctx);
 
 	if (event->state >= PERF_EVENT_STATE_INACTIVE)
 		goto unlock;
+
+	/*
+	 * set current task's cgroup time reference point
+	 */
+	perf_cgroup_set_timestamp(current, ctx);
+
 	__perf_event_mark_enabled(event, ctx);
 
-	if (!event_filter_match(event))
+	if (!event_filter_match(event)) {
+		if (is_cgroup_event(event))
+			perf_cgroup_defer_enabled(event);
 		goto unlock;
+	}
 
 	/*
 	 * If the event is in a group and isn't the group leader,
@@ -1153,6 +1665,8 @@ static void __perf_event_enable(void *info)
 
 unlock:
 	raw_spin_unlock(&ctx->lock);
+
+	return 0;
 }
 
 /*
@@ -1173,8 +1687,7 @@ void perf_event_enable(struct perf_event *event)
 		/*
 		 * Enable the event on the cpu that it's on
 		 */
-		smp_call_function_single(event->cpu, __perf_event_enable,
-					 event, 1);
+		cpu_function_call(event->cpu, __perf_event_enable, event);
 		return;
 	}
 
@@ -1193,8 +1706,15 @@ void perf_event_enable(struct perf_event *event)
 		event->state = PERF_EVENT_STATE_OFF;
 
 retry:
+	if (!ctx->is_active) {
+		__perf_event_mark_enabled(event, ctx);
+		goto out;
+	}
+
 	raw_spin_unlock_irq(&ctx->lock);
-	task_oncpu_function_call(task, __perf_event_enable, event);
+
+	if (!task_function_call(task, __perf_event_enable, event))
+		return;
 
 	raw_spin_lock_irq(&ctx->lock);
 
@@ -1202,15 +1722,14 @@ retry:
 	 * If the context is active and the event is still off,
 	 * we need to retry the cross-call.
 	 */
-	if (ctx->is_active && event->state == PERF_EVENT_STATE_OFF)
+	if (ctx->is_active && event->state == PERF_EVENT_STATE_OFF) {
+		/*
+		 * task could have been flipped by a concurrent
+		 * perf_event_context_sched_out()
+		 */
+		task = ctx->task;
 		goto retry;
-
-	/*
-	 * Since we have the lock this context can't be scheduled
-	 * in, so we can change the state safely.
-	 */
-	if (event->state == PERF_EVENT_STATE_OFF)
-		__perf_event_mark_enabled(event, ctx);
+	}
 
 out:
 	raw_spin_unlock_irq(&ctx->lock);
@@ -1242,6 +1761,7 @@ static void ctx_sched_out(struct perf_event_context *ctx,
 	if (likely(!ctx->nr_events))
 		goto out;
 	update_context_time(ctx);
+	update_cgrp_time_from_cpuctx(cpuctx);
 
 	if (!ctx->nr_active)
 		goto out;
@@ -1354,8 +1874,8 @@ static void perf_event_sync_stat(struct perf_event_context *ctx,
 	}
 }
 
-void perf_event_context_sched_out(struct task_struct *task, int ctxn,
-				  struct task_struct *next)
+static void perf_event_context_sched_out(struct task_struct *task, int ctxn,
+					 struct task_struct *next)
 {
 	struct perf_event_context *ctx = task->perf_event_ctxp[ctxn];
 	struct perf_event_context *next_ctx;
@@ -1431,6 +1951,14 @@ void __perf_event_task_sched_out(struct task_struct *task,
 
 	for_each_task_context_nr(ctxn)
 		perf_event_context_sched_out(task, ctxn, next);
+
+	/*
+	 * if cgroup events exist on this CPU, then we need
+	 * to check if we have to switch out PMU state.
+	 * cgroup event are system-wide mode only
+	 */
+	if (atomic_read(&__get_cpu_var(perf_cgroup_events)))
+		perf_cgroup_sched_out(task);
 }
 
 static void task_ctx_sched_out(struct perf_event_context *ctx,
@@ -1469,6 +1997,10 @@ ctx_pinned_sched_in(struct perf_event_context *ctx,
 		if (!event_filter_match(event))
 			continue;
 
+		/* may need to reset tstamp_enabled */
+		if (is_cgroup_event(event))
+			perf_cgroup_mark_enabled(event, ctx);
+
 		if (group_can_go_on(event, cpuctx, 1))
 			group_sched_in(event, cpuctx, ctx);
 
@@ -1501,6 +2033,10 @@ ctx_flexible_sched_in(struct perf_event_context *ctx,
 		if (!event_filter_match(event))
 			continue;
 
+		/* may need to reset tstamp_enabled */
+		if (is_cgroup_event(event))
+			perf_cgroup_mark_enabled(event, ctx);
+
 		if (group_can_go_on(event, cpuctx, can_add_hw)) {
 			if (group_sched_in(event, cpuctx, ctx))
 				can_add_hw = 0;
@@ -1511,15 +2047,19 @@ ctx_flexible_sched_in(struct perf_event_context *ctx,
 static void
 ctx_sched_in(struct perf_event_context *ctx,
 	     struct perf_cpu_context *cpuctx,
-	     enum event_type_t event_type)
+	     enum event_type_t event_type,
+	     struct task_struct *task)
 {
+	u64 now;
+
 	raw_spin_lock(&ctx->lock);
 	ctx->is_active = 1;
 	if (likely(!ctx->nr_events))
 		goto out;
 
-	ctx->timestamp = perf_clock();
-
+	now = perf_clock();
+	ctx->timestamp = now;
+	perf_cgroup_set_timestamp(task, ctx);
 	/*
 	 * First go through the list and put on any pinned groups
 	 * in order to give them the best chance of going on.
@@ -1536,11 +2076,12 @@ out:
 }
 
 static void cpu_ctx_sched_in(struct perf_cpu_context *cpuctx,
-			     enum event_type_t event_type)
+			     enum event_type_t event_type,
+			     struct task_struct *task)
 {
 	struct perf_event_context *ctx = &cpuctx->ctx;
 
-	ctx_sched_in(ctx, cpuctx, event_type);
+	ctx_sched_in(ctx, cpuctx, event_type, task);
 }
 
 static void task_ctx_sched_in(struct perf_event_context *ctx,
@@ -1548,15 +2089,16 @@ static void task_ctx_sched_in(struct perf_event_context *ctx,
 {
 	struct perf_cpu_context *cpuctx;
 
-	cpuctx = __get_cpu_context(ctx);
+	cpuctx = __get_cpu_context(ctx);
 	if (cpuctx->task_ctx == ctx)
 		return;
 
-	ctx_sched_in(ctx, cpuctx, event_type);
+	ctx_sched_in(ctx, cpuctx, event_type, NULL);
 	cpuctx->task_ctx = ctx;
 }
 
-void perf_event_context_sched_in(struct perf_event_context *ctx)
+static void perf_event_context_sched_in(struct perf_event_context *ctx,
+					struct task_struct *task)
 {
 	struct perf_cpu_context *cpuctx;
 
@@ -1572,9 +2114,9 @@ void perf_event_context_sched_in(struct perf_event_context *ctx)
 	 */
 	cpu_ctx_sched_out(cpuctx, EVENT_FLEXIBLE);
 
-	ctx_sched_in(ctx, cpuctx, EVENT_PINNED);
-	cpu_ctx_sched_in(cpuctx, EVENT_FLEXIBLE);
-	ctx_sched_in(ctx, cpuctx, EVENT_FLEXIBLE);
+	ctx_sched_in(ctx, cpuctx, EVENT_PINNED, task);
+	cpu_ctx_sched_in(cpuctx, EVENT_FLEXIBLE, task);
+	ctx_sched_in(ctx, cpuctx, EVENT_FLEXIBLE, task);
 
 	cpuctx->task_ctx = ctx;
 
@@ -1607,8 +2149,15 @@ void __perf_event_task_sched_in(struct task_struct *task)
 		if (likely(!ctx))
 			continue;
 
-		perf_event_context_sched_in(ctx);
+		perf_event_context_sched_in(ctx, task);
 	}
+	/*
+	 * if cgroup events exist on this CPU, then we need
+	 * to check if we have to switch in PMU state.
+	 * cgroup event are system-wide mode only
+	 */
+	if (atomic_read(&__get_cpu_var(perf_cgroup_events)))
+		perf_cgroup_sched_in(task);
 }
 
 static u64 perf_calculate_period(struct perf_event *event, u64 nsec, u64 count)
@@ -1638,7 +2187,7 @@ static u64 perf_calculate_period(struct perf_event *event, u64 nsec, u64 count)
 * Reduce accuracy by one bit such that @a and @b converge
 * to a similar magnitude.
 */
-#define REDUCE_FLS(a, b) \
+#define REDUCE_FLS(a, b)		\
 do {					\
 	if (a##_fls > b##_fls) {	\
 		a >>= 1;		\
@@ -1808,7 +2357,7 @@ static void perf_rotate_context(struct perf_cpu_context *cpuctx)
 	if (ctx)
 		rotate_ctx(ctx);
 
-	cpu_ctx_sched_in(cpuctx, EVENT_FLEXIBLE);
+	cpu_ctx_sched_in(cpuctx, EVENT_FLEXIBLE, current);
 	if (ctx)
 		task_ctx_sched_in(ctx, EVENT_FLEXIBLE);
 
@@ -1887,7 +2436,7 @@ static void perf_event_enable_on_exec(struct perf_event_context *ctx)
 
 	raw_spin_unlock(&ctx->lock);
 
-	perf_event_context_sched_in(ctx);
+	perf_event_context_sched_in(ctx, ctx->task);
 out:
 	local_irq_restore(flags);
 }
@@ -1912,8 +2461,10 @@ static void __perf_event_read(void *info)
 		return;
 
 	raw_spin_lock(&ctx->lock);
-	if (ctx->is_active)
+	if (ctx->is_active) {
 		update_context_time(ctx);
+		update_cgrp_time_from_event(event);
+	}
 	update_event_times(event);
 	if (event->state == PERF_EVENT_STATE_ACTIVE)
 		event->pmu->read(event);
@@ -1944,8 +2495,10 @@ static u64 perf_event_read(struct perf_event *event)
 		 * (e.g., thread is blocked), in that case
 		 * we cannot update context time
 		 */
-		if (ctx->is_active)
+		if (ctx->is_active) {
 			update_context_time(ctx);
+			update_cgrp_time_from_event(event);
+		}
 		update_event_times(event);
 		raw_spin_unlock_irqrestore(&ctx->lock, flags);
 	}
@@ -2224,6 +2777,9 @@ errout:
 
 }
 
+/*
+ * Returns a matching context with refcount and pincount.
+ */
 static struct perf_event_context *
 find_get_context(struct pmu *pmu, struct task_struct *task, int cpu)
 {
@@ -2248,6 +2804,7 @@ find_get_context(struct pmu *pmu, struct task_struct *task, int cpu)
 		cpuctx = per_cpu_ptr(pmu->pmu_cpu_context, cpu);
 		ctx = &cpuctx->ctx;
 		get_ctx(ctx);
+		++ctx->pin_count;
 
 		return ctx;
 	}
@@ -2261,6 +2818,7 @@ retry:
 	ctx = perf_lock_task_context(task, ctxn, &flags);
 	if (ctx) {
 		unclone_ctx(ctx);
+		++ctx->pin_count;
 		raw_spin_unlock_irqrestore(&ctx->lock, flags);
 	}
 
@@ -2282,8 +2840,10 @@ retry:
 			err = -ESRCH;
 		else if (task->perf_event_ctxp[ctxn])
 			err = -EAGAIN;
-		else
+		else {
+			++ctx->pin_count;
 			rcu_assign_pointer(task->perf_event_ctxp[ctxn], ctx);
+		}
 		mutex_unlock(&task->perf_event_mutex);
 
 		if (unlikely(err)) {
@@ -2323,7 +2883,7 @@ static void free_event(struct perf_event *event)
 
 	if (!event->parent) {
 		if (event->attach_state & PERF_ATTACH_TASK)
-			jump_label_dec(&perf_task_events);
+			jump_label_dec(&perf_sched_events);
 		if (event->attr.mmap || event->attr.mmap_data)
 			atomic_dec(&nr_mmap_events);
 		if (event->attr.comm)
@@ -2332,6 +2892,10 @@ static void free_event(struct perf_event *event)
 			atomic_dec(&nr_task_events);
 		if (event->attr.sample_type & PERF_SAMPLE_CALLCHAIN)
 			put_callchain_buffers();
+		if (is_cgroup_event(event)) {
+			atomic_dec(&per_cpu(perf_cgroup_events, event->cpu));
+			jump_label_dec(&perf_sched_events);
+		}
 	}
 
 	if (event->buffer) {
@@ -2339,6 +2903,9 @@ static void free_event(struct perf_event *event)
 		event->buffer = NULL;
 	}
 
+	if (is_cgroup_event(event))
+		perf_detach_cgroup(event);
+
 	if (event->destroy)
 		event->destroy(event);
 
@@ -4406,26 +4973,14 @@ static int __perf_event_overflow(struct perf_event *event, int nmi,
 	if (unlikely(!is_sampling_event(event)))
 		return 0;
 
-	if (!throttle) {
-		hwc->interrupts++;
-	} else {
-		if (hwc->interrupts != MAX_INTERRUPTS) {
-			hwc->interrupts++;
-			if (HZ * hwc->interrupts >
-					(u64)sysctl_perf_event_sample_rate) {
-				hwc->interrupts = MAX_INTERRUPTS;
-				perf_log_throttle(event, 0);
-				ret = 1;
-			}
-		} else {
-			/*
-			 * Keep re-disabling events even though on the previous
-			 * pass we disabled it - just in case we raced with a
-			 * sched-in and the event got enabled again:
-			 */
+	if (unlikely(hwc->interrupts >= max_samples_per_tick)) {
+		if (throttle) {
+			hwc->interrupts = MAX_INTERRUPTS;
+			perf_log_throttle(event, 0);
 			ret = 1;
 		}
-	}
+	} else
+		hwc->interrupts++;
 
 	if (event->attr.freq) {
 		u64 now = perf_clock();
@@ -5062,6 +5617,10 @@ static enum hrtimer_restart perf_swevent_hrtimer(struct hrtimer *hrtimer)
 	u64 period;
 
 	event = container_of(hrtimer, struct perf_event, hw.hrtimer);
+
+	if (event->state != PERF_EVENT_STATE_ACTIVE)
+		return HRTIMER_NORESTART;
+
 	event->pmu->read(event);
 
 	perf_sample_data_init(&data, 0);
@@ -5088,9 +5647,6 @@ static void perf_swevent_start_hrtimer(struct perf_event *event)
 	if (!is_sampling_event(event))
 		return;
 
-	hrtimer_init(&hwc->hrtimer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
-	hwc->hrtimer.function = perf_swevent_hrtimer;
-
 	period = local64_read(&hwc->period_left);
 	if (period) {
 		if (period < 0)
@@ -5117,6 +5673,30 @@ static void perf_swevent_cancel_hrtimer(struct perf_event *event)
 	}
 }
 
+static void perf_swevent_init_hrtimer(struct perf_event *event)
+{
+	struct hw_perf_event *hwc = &event->hw;
+
+	if (!is_sampling_event(event))
+		return;
+
+	hrtimer_init(&hwc->hrtimer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
+	hwc->hrtimer.function = perf_swevent_hrtimer;
+
+	/*
+	 * Since hrtimers have a fixed rate, we can do a static freq->period
+	 * mapping and avoid the whole period adjust feedback stuff.
+	 */
+	if (event->attr.freq) {
+		long freq = event->attr.sample_freq;
+
+		event->attr.sample_period = NSEC_PER_SEC / freq;
+		hwc->sample_period = event->attr.sample_period;
+		local64_set(&hwc->period_left, hwc->sample_period);
+		event->attr.freq = 0;
+	}
+}
+
 /*
  * Software event: cpu wall time clock
  */
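
(Aside: perf_swevent_init_hrtimer() above maps a requested sampling frequency to a fixed hrtimer period once at init time, then clears attr.freq so the adaptive period-adjustment path is bypassed. A tiny userspace illustration of that mapping, with an assumed 4000 Hz sample_freq:)

/*
 * Userspace illustration of the static freq->period mapping used above;
 * the 4000 Hz sample_freq is an assumed example value.
 */
#include <stdio.h>
#include <stdint.h>

#define NSEC_PER_SEC 1000000000ULL

int main(void)
{
	uint64_t sample_freq = 4000;	/* requested samples per second */
	uint64_t sample_period = NSEC_PER_SEC / sample_freq;

	/*
	 * 4000 Hz -> a fixed 250000 ns hrtimer period; since the timer
	 * rate never drifts, no runtime period adjustment is needed.
	 */
	printf("hrtimer period: %llu ns\n", (unsigned long long)sample_period);
	return 0;
}
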
@@ -5169,6 +5749,8 @@ static int cpu_clock_event_init(struct perf_event *event)
 	if (event->attr.config != PERF_COUNT_SW_CPU_CLOCK)
 		return -ENOENT;
 
+	perf_swevent_init_hrtimer(event);
+
 	return 0;
 }
 
@@ -5224,16 +5806,9 @@ static void task_clock_event_del(struct perf_event *event, int flags)
 
 static void task_clock_event_read(struct perf_event *event)
 {
-	u64 time;
-
-	if (!in_nmi()) {
-		update_context_time(event->ctx);
-		time = event->ctx->time;
-	} else {
-		u64 now = perf_clock();
-		u64 delta = now - event->ctx->timestamp;
-		time = event->ctx->time + delta;
-	}
+	u64 now = perf_clock();
+	u64 delta = now - event->ctx->timestamp;
+	u64 time = event->ctx->time + delta;
 
 	task_clock_event_update(event, time);
 }
@@ -5246,6 +5821,8 @@ static int task_clock_event_init(struct perf_event *event)
 	if (event->attr.config != PERF_COUNT_SW_TASK_CLOCK)
 		return -ENOENT;
 
+	perf_swevent_init_hrtimer(event);
+
 	return 0;
 }
 
@@ -5517,17 +6094,22 @@ struct pmu *perf_init_event(struct perf_event *event)
 {
 	struct pmu *pmu = NULL;
 	int idx;
+	int ret;
 
 	idx = srcu_read_lock(&pmus_srcu);
 
 	rcu_read_lock();
 	pmu = idr_find(&pmu_idr, event->attr.type);
 	rcu_read_unlock();
-	if (pmu)
+	if (pmu) {
+		ret = pmu->event_init(event);
+		if (ret)
+			pmu = ERR_PTR(ret);
 		goto unlock;
+	}
 
 	list_for_each_entry_rcu(pmu, &pmus, entry) {
-		int ret = pmu->event_init(event);
+		ret = pmu->event_init(event);
 		if (!ret)
 			goto unlock;
 
@@ -5653,7 +6235,7 @@ done:
 
 	if (!event->parent) {
 		if (event->attach_state & PERF_ATTACH_TASK)
-			jump_label_inc(&perf_task_events);
+			jump_label_inc(&perf_sched_events);
 		if (event->attr.mmap || event->attr.mmap_data)
 			atomic_inc(&nr_mmap_events);
 		if (event->attr.comm)
@@ -5828,7 +6410,7 @@ SYSCALL_DEFINE5(perf_event_open,
 	int err;
 
 	/* for future expandability... */
-	if (flags & ~(PERF_FLAG_FD_NO_GROUP | PERF_FLAG_FD_OUTPUT))
+	if (flags & ~PERF_FLAG_ALL)
 		return -EINVAL;
 
 	err = perf_copy_attr(attr_uptr, &attr);
@@ -5845,6 +6427,15 @@ SYSCALL_DEFINE5(perf_event_open,
 			return -EINVAL;
 	}
 
+	/*
+	 * In cgroup mode, the pid argument is used to pass the fd
+	 * opened to the cgroup directory in cgroupfs. The cpu argument
+	 * designates the cpu on which to monitor threads from that
+	 * cgroup.
+	 */
+	if ((flags & PERF_FLAG_PID_CGROUP) && (pid == -1 || cpu == -1))
+		return -EINVAL;
+
 	event_fd = get_unused_fd_flags(O_RDWR);
 	if (event_fd < 0)
 		return event_fd;
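
(Aside: per the comment above, cgroup mode passes a cgroupfs directory fd in place of a pid and requires an explicit cpu. A hedged userspace sketch follows; the mount point /dev/cgroup/perf_event, the group name, and the presence of PERF_FLAG_PID_CGROUP in the installed headers are assumptions, hence the fallback define.)

/*
 * Hedged usage sketch (not from this patch): open a cgroup-scoped counter.
 */
#include <fcntl.h>
#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/syscall.h>
#include <linux/perf_event.h>

#ifndef PERF_FLAG_PID_CGROUP
#define PERF_FLAG_PID_CGROUP	(1U << 2)	/* value added by this series */
#endif

static long sys_perf_event_open(struct perf_event_attr *attr, pid_t pid,
				int cpu, int group_fd, unsigned long flags)
{
	return syscall(__NR_perf_event_open, attr, pid, cpu, group_fd, flags);
}

int main(void)
{
	struct perf_event_attr attr;
	int cgrp_fd, ev_fd;

	/* the fd of the cgroup directory stands in for the pid argument */
	cgrp_fd = open("/dev/cgroup/perf_event/my_group", O_RDONLY);
	if (cgrp_fd < 0) {
		perror("open cgroup directory");
		return 1;
	}

	memset(&attr, 0, sizeof(attr));
	attr.size = sizeof(attr);
	attr.type = PERF_TYPE_HARDWARE;
	attr.config = PERF_COUNT_HW_CPU_CYCLES;

	/* cpu must be >= 0: cgroup events are always per-cpu */
	ev_fd = sys_perf_event_open(&attr, cgrp_fd, 0, -1, PERF_FLAG_PID_CGROUP);
	if (ev_fd < 0) {
		perror("perf_event_open");
		close(cgrp_fd);
		return 1;
	}

	/* read()/mmap() the counter as with any other perf event ... */
	close(ev_fd);
	close(cgrp_fd);
	return 0;
}
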
@@ -5862,7 +6453,7 @@ SYSCALL_DEFINE5(perf_event_open,
 			group_leader = NULL;
 	}
 
-	if (pid != -1) {
+	if (pid != -1 && !(flags & PERF_FLAG_PID_CGROUP)) {
 		task = find_lively_task_by_vpid(pid);
 		if (IS_ERR(task)) {
 			err = PTR_ERR(task);
@@ -5876,6 +6467,19 @@ SYSCALL_DEFINE5(perf_event_open,
 		goto err_task;
 	}
 
+	if (flags & PERF_FLAG_PID_CGROUP) {
+		err = perf_cgroup_connect(pid, event, &attr, group_leader);
+		if (err)
+			goto err_alloc;
+		/*
+		 * one more event:
+		 * - that has cgroup constraint on event->cpu
+		 * - that may need work on context switch
+		 */
+		atomic_inc(&per_cpu(perf_cgroup_events, event->cpu));
+		jump_label_inc(&perf_sched_events);
+	}
+
 	/*
 	 * Special case software events and allow them to be part of
 	 * any hardware group.
@@ -5961,10 +6565,10 @@ SYSCALL_DEFINE5(perf_event_open,
 		struct perf_event_context *gctx = group_leader->ctx;
 
 		mutex_lock(&gctx->mutex);
-		perf_event_remove_from_context(group_leader);
+		perf_remove_from_context(group_leader);
 		list_for_each_entry(sibling, &group_leader->sibling_list,
 				    group_entry) {
-			perf_event_remove_from_context(sibling);
+			perf_remove_from_context(sibling);
 			put_ctx(gctx);
 		}
 		mutex_unlock(&gctx->mutex);
@@ -5987,6 +6591,7 @@ SYSCALL_DEFINE5(perf_event_open,
 
 	perf_install_in_context(ctx, event, cpu);
 	++ctx->generation;
+	perf_unpin_context(ctx);
 	mutex_unlock(&ctx->mutex);
 
 	event->owner = current;
@@ -6012,6 +6617,7 @@ SYSCALL_DEFINE5(perf_event_open,
 	return event_fd;
 
 err_context:
+	perf_unpin_context(ctx);
 	put_ctx(ctx);
 err_alloc:
 	free_event(event);
@@ -6062,6 +6668,7 @@ perf_event_create_kernel_counter(struct perf_event_attr *attr, int cpu,
 	mutex_lock(&ctx->mutex);
 	perf_install_in_context(ctx, event, cpu);
 	++ctx->generation;
+	perf_unpin_context(ctx);
 	mutex_unlock(&ctx->mutex);
 
 	return event;
@@ -6115,7 +6722,7 @@ __perf_event_exit_task(struct perf_event *child_event,
 {
 	struct perf_event *parent_event;
 
-	perf_event_remove_from_context(child_event);
+	perf_remove_from_context(child_event);
 
 	parent_event = child_event->parent;
 	/*
@@ -6422,7 +7029,7 @@ inherit_task_group(struct perf_event *event, struct task_struct *parent,
 		return 0;
 	}
 
-       child_ctx = child->perf_event_ctxp[ctxn];
+	child_ctx = child->perf_event_ctxp[ctxn];
 	if (!child_ctx) {
 		/*
 		 * This is executed from the parent task context, so
@@ -6537,6 +7144,7 @@ int perf_event_init_context(struct task_struct *child, int ctxn)
 	mutex_unlock(&parent_ctx->mutex);
 
 	perf_unpin_context(parent_ctx);
+	put_ctx(parent_ctx);
 
 	return ret;
 }
@@ -6606,9 +7214,9 @@ static void __perf_event_exit_context(void *__info)
 	perf_pmu_rotate_stop(ctx->pmu);
 
 	list_for_each_entry_safe(event, tmp, &ctx->pinned_groups, group_entry)
-		__perf_event_remove_from_context(event);
+		__perf_remove_from_context(event);
 	list_for_each_entry_safe(event, tmp, &ctx->flexible_groups, group_entry)
-		__perf_event_remove_from_context(event);
+		__perf_remove_from_context(event);
 }
 
 static void perf_event_exit_cpu_context(int cpu)
@@ -6732,3 +7340,83 @@ unlock:
 	return ret;
 }
 device_initcall(perf_event_sysfs_init);
+
+#ifdef CONFIG_CGROUP_PERF
+static struct cgroup_subsys_state *perf_cgroup_create(
+	struct cgroup_subsys *ss, struct cgroup *cont)
+{
+	struct perf_cgroup *jc;
+
+	jc = kzalloc(sizeof(*jc), GFP_KERNEL);
+	if (!jc)
+		return ERR_PTR(-ENOMEM);
+
+	jc->info = alloc_percpu(struct perf_cgroup_info);
+	if (!jc->info) {
+		kfree(jc);
+		return ERR_PTR(-ENOMEM);
+	}
+
+	return &jc->css;
+}
+
+static void perf_cgroup_destroy(struct cgroup_subsys *ss,
+				struct cgroup *cont)
+{
+	struct perf_cgroup *jc;
+	jc = container_of(cgroup_subsys_state(cont, perf_subsys_id),
+			  struct perf_cgroup, css);
+	free_percpu(jc->info);
+	kfree(jc);
+}
+
+static int __perf_cgroup_move(void *info)
+{
+	struct task_struct *task = info;
+	perf_cgroup_switch(task, PERF_CGROUP_SWOUT | PERF_CGROUP_SWIN);
+	return 0;
+}
+
+static void perf_cgroup_move(struct task_struct *task)
+{
+	task_function_call(task, __perf_cgroup_move, task);
+}
+
+static void perf_cgroup_attach(struct cgroup_subsys *ss, struct cgroup *cgrp,
+		struct cgroup *old_cgrp, struct task_struct *task,
+		bool threadgroup)
+{
+	perf_cgroup_move(task);
+	if (threadgroup) {
+		struct task_struct *c;
+		rcu_read_lock();
+		list_for_each_entry_rcu(c, &task->thread_group, thread_group) {
+			perf_cgroup_move(c);
+		}
+		rcu_read_unlock();
+	}
+}
+
+static void perf_cgroup_exit(struct cgroup_subsys *ss, struct cgroup *cgrp,
+		struct cgroup *old_cgrp, struct task_struct *task)
+{
+	/*
+	 * cgroup_exit() is called in the copy_process() failure path.
+	 * Ignore this case since the task hasn't ran yet, this avoids
+	 * trying to poke a half freed task state from generic code.
+	 */
+	if (!(task->flags & PF_EXITING))
+		return;
+
+	perf_cgroup_move(task);
+}
+
+struct cgroup_subsys perf_subsys = {
+	.name = "perf_event",
+	.subsys_id = perf_subsys_id,
+	.create = perf_cgroup_create,
+	.destroy = perf_cgroup_destroy,
+	.exit = perf_cgroup_exit,
+	.attach = perf_cgroup_attach,
+};
+#endif /* CONFIG_CGROUP_PERF */
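
(Aside: the perf_subsys registration above wires up the attach and exit callbacks, so moving a task into a perf_event cgroup re-evaluates its cgroup events via perf_cgroup_move(). A minimal userspace sketch of what triggers that path, assuming a cgroup-v1 style hierarchy mounted at /dev/cgroup/perf_event; the path and group name are assumptions.)

/*
 * Create a group under the perf_event hierarchy and write a pid into its
 * cgroup-v1 "tasks" file, which invokes the subsystem's ->attach() hook.
 */
#include <errno.h>
#include <stdio.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>

int main(void)
{
	const char *grp = "/dev/cgroup/perf_event/my_group";
	char tasks[128];
	FILE *f;

	if (mkdir(grp, 0755) && errno != EEXIST) {
		perror("mkdir");
		return 1;
	}

	snprintf(tasks, sizeof(tasks), "%s/tasks", grp);
	f = fopen(tasks, "w");
	if (!f) {
		perror("fopen tasks");
		return 1;
	}

	/* attaching the task is what fires perf_cgroup_attach() */
	fprintf(f, "%d\n", (int)getpid());
	fclose(f);
	return 0;
}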