perf_event.h

/* SPDX-License-Identifier: GPL-2.0 */
#ifndef _ASM_X86_PERF_EVENT_H
#define _ASM_X86_PERF_EVENT_H

/*
 * Performance event hw details:
 */

#define INTEL_PMC_MAX_GENERIC                       32
#define INTEL_PMC_MAX_FIXED                         3
#define INTEL_PMC_IDX_FIXED                         32

#define X86_PMC_IDX_MAX                             64

#define MSR_ARCH_PERFMON_PERFCTR0                   0xc1
#define MSR_ARCH_PERFMON_PERFCTR1                   0xc2

#define MSR_ARCH_PERFMON_EVENTSEL0                  0x186
#define MSR_ARCH_PERFMON_EVENTSEL1                  0x187

#define ARCH_PERFMON_EVENTSEL_EVENT                 0x000000FFULL
#define ARCH_PERFMON_EVENTSEL_UMASK                 0x0000FF00ULL
#define ARCH_PERFMON_EVENTSEL_USR                   (1ULL << 16)
#define ARCH_PERFMON_EVENTSEL_OS                    (1ULL << 17)
#define ARCH_PERFMON_EVENTSEL_EDGE                  (1ULL << 18)
#define ARCH_PERFMON_EVENTSEL_PIN_CONTROL           (1ULL << 19)
#define ARCH_PERFMON_EVENTSEL_INT                   (1ULL << 20)
#define ARCH_PERFMON_EVENTSEL_ANY                   (1ULL << 21)
#define ARCH_PERFMON_EVENTSEL_ENABLE                (1ULL << 22)
#define ARCH_PERFMON_EVENTSEL_INV                   (1ULL << 23)
#define ARCH_PERFMON_EVENTSEL_CMASK                 0xFF000000ULL

#define HSW_IN_TX                                   (1ULL << 32)
#define HSW_IN_TX_CHECKPOINTED                      (1ULL << 33)

#define AMD64_EVENTSEL_INT_CORE_ENABLE              (1ULL << 36)
#define AMD64_EVENTSEL_GUESTONLY                    (1ULL << 40)
#define AMD64_EVENTSEL_HOSTONLY                     (1ULL << 41)

#define AMD64_EVENTSEL_INT_CORE_SEL_SHIFT           37
#define AMD64_EVENTSEL_INT_CORE_SEL_MASK            \
        (0xFULL << AMD64_EVENTSEL_INT_CORE_SEL_SHIFT)

#define AMD64_EVENTSEL_EVENT        \
        (ARCH_PERFMON_EVENTSEL_EVENT | (0x0FULL << 32))
#define INTEL_ARCH_EVENT_MASK       \
        (ARCH_PERFMON_EVENTSEL_UMASK | ARCH_PERFMON_EVENTSEL_EVENT)

#define AMD64_L3_SLICE_SHIFT        48
#define AMD64_L3_SLICE_MASK         \
        ((0xFULL) << AMD64_L3_SLICE_SHIFT)
#define AMD64_L3_THREAD_SHIFT       56
#define AMD64_L3_THREAD_MASK        \
        ((0xFFULL) << AMD64_L3_THREAD_SHIFT)

#define X86_RAW_EVENT_MASK          \
        (ARCH_PERFMON_EVENTSEL_EVENT | \
         ARCH_PERFMON_EVENTSEL_UMASK | \
         ARCH_PERFMON_EVENTSEL_EDGE  | \
         ARCH_PERFMON_EVENTSEL_INV   | \
         ARCH_PERFMON_EVENTSEL_CMASK)
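
/*
 * Illustrative sketch, not part of the original header: composing a raw
 * event-select value from the fields above and programming it into the
 * first general-purpose counter.  The event/umask pair 0x3c/0x00
 * (unhalted core cycles), the helper name, and the use of wrmsrl() and
 * the u64 type (from <asm/msr.h> and <linux/types.h>) are assumptions
 * made for this example only.
 */
static inline void example_program_cycles_evtsel(void)
{
        u64 evtsel;

        evtsel  = 0x3cULL & ARCH_PERFMON_EVENTSEL_EVENT;        /* event code     */
        evtsel |= (0x00ULL << 8) & ARCH_PERFMON_EVENTSEL_UMASK; /* unit mask      */
        evtsel |= ARCH_PERFMON_EVENTSEL_USR;                    /* count ring 3   */
        evtsel |= ARCH_PERFMON_EVENTSEL_OS;                     /* count ring 0   */
        evtsel |= ARCH_PERFMON_EVENTSEL_ENABLE;                 /* start counting */

        wrmsrl(MSR_ARCH_PERFMON_EVENTSEL0, evtsel);
}
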
#define X86_ALL_EVENT_FLAGS         \
        (ARCH_PERFMON_EVENTSEL_EDGE |        \
         ARCH_PERFMON_EVENTSEL_INV |         \
         ARCH_PERFMON_EVENTSEL_CMASK |       \
         ARCH_PERFMON_EVENTSEL_ANY |         \
         ARCH_PERFMON_EVENTSEL_PIN_CONTROL | \
         HSW_IN_TX |                         \
         HSW_IN_TX_CHECKPOINTED)
#define AMD64_RAW_EVENT_MASK        \
        (X86_RAW_EVENT_MASK  |      \
         AMD64_EVENTSEL_EVENT)
#define AMD64_RAW_EVENT_MASK_NB     \
        (AMD64_EVENTSEL_EVENT |     \
         ARCH_PERFMON_EVENTSEL_UMASK)

#define AMD64_NUM_COUNTERS                          4
#define AMD64_NUM_COUNTERS_CORE                     6
#define AMD64_NUM_COUNTERS_NB                       4

#define ARCH_PERFMON_UNHALTED_CORE_CYCLES_SEL       0x3c
#define ARCH_PERFMON_UNHALTED_CORE_CYCLES_UMASK     (0x00 << 8)
#define ARCH_PERFMON_UNHALTED_CORE_CYCLES_INDEX     0
#define ARCH_PERFMON_UNHALTED_CORE_CYCLES_PRESENT \
        (1 << (ARCH_PERFMON_UNHALTED_CORE_CYCLES_INDEX))

#define ARCH_PERFMON_BRANCH_MISSES_RETIRED          6
#define ARCH_PERFMON_EVENTS_COUNT                   7

/*
 * Intel "Architectural Performance Monitoring" CPUID
 * detection/enumeration details:
 */
union cpuid10_eax {
        struct {
                unsigned int version_id:8;
                unsigned int num_counters:8;
                unsigned int bit_width:8;
                unsigned int mask_length:8;
        } split;
        unsigned int full;
};

union cpuid10_ebx {
        struct {
                unsigned int no_unhalted_core_cycles:1;
                unsigned int no_instructions_retired:1;
                unsigned int no_unhalted_reference_cycles:1;
                unsigned int no_llc_reference:1;
                unsigned int no_llc_misses:1;
                unsigned int no_branch_instruction_retired:1;
                unsigned int no_branch_misses_retired:1;
        } split;
        unsigned int full;
};

union cpuid10_edx {
        struct {
                unsigned int num_counters_fixed:5;
                unsigned int bit_width_fixed:8;
                unsigned int reserved:19;
        } split;
        unsigned int full;
};

struct x86_pmu_capability {
        int             version;
        int             num_counters_gp;
        int             num_counters_fixed;
        int             bit_width_gp;
        int             bit_width_fixed;
        unsigned int    events_mask;
        int             events_mask_len;
};
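
/*
 * Illustrative sketch, not part of the original header: filling the
 * capability structure from CPUID leaf 0xa via the unions above, mirroring
 * what the kernel's own perf_get_x86_pmu_capability() does.  The helper
 * name and the cpuid() call (from <asm/processor.h>) are assumptions for
 * this example.
 */
static inline void example_read_pmu_capability(struct x86_pmu_capability *cap)
{
        union cpuid10_eax eax;
        union cpuid10_ebx ebx;
        union cpuid10_edx edx;
        unsigned int unused;

        cpuid(0xa, &eax.full, &ebx.full, &unused, &edx.full);

        cap->version            = eax.split.version_id;
        cap->num_counters_gp    = eax.split.num_counters;
        cap->bit_width_gp       = eax.split.bit_width;
        cap->events_mask        = ~ebx.full;    /* EBX flags events as NOT available */
        cap->events_mask_len    = eax.split.mask_length;
        cap->num_counters_fixed = edx.split.num_counters_fixed;
        cap->bit_width_fixed    = edx.split.bit_width_fixed;
}
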
/*
 * Fixed-purpose performance events:
 */

/*
 * All 3 fixed-mode PMCs are configured via this single MSR:
 */
#define MSR_ARCH_PERFMON_FIXED_CTR_CTRL         0x38d

/*
 * The counts are available in three separate MSRs:
 */

/* Instr_Retired.Any: */
#define MSR_ARCH_PERFMON_FIXED_CTR0             0x309
#define INTEL_PMC_IDX_FIXED_INSTRUCTIONS        (INTEL_PMC_IDX_FIXED + 0)

/* CPU_CLK_Unhalted.Core: */
#define MSR_ARCH_PERFMON_FIXED_CTR1             0x30a
#define INTEL_PMC_IDX_FIXED_CPU_CYCLES          (INTEL_PMC_IDX_FIXED + 1)

/* CPU_CLK_Unhalted.Ref: */
#define MSR_ARCH_PERFMON_FIXED_CTR2             0x30b
#define INTEL_PMC_IDX_FIXED_REF_CYCLES          (INTEL_PMC_IDX_FIXED + 2)
#define INTEL_PMC_MSK_FIXED_REF_CYCLES          (1ULL << INTEL_PMC_IDX_FIXED_REF_CYCLES)
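
/*
 * Illustrative sketch, not part of the original header: enabling fixed
 * counter 0 (Instr_Retired.Any) for both kernel and user mode.  The 4-bit
 * per-counter layout of the control MSR (bit 0 = ring 0, bit 1 = ring 3),
 * the helper name, and rdmsrl()/wrmsrl() from <asm/msr.h> are assumptions
 * for this example.
 */
static inline void example_enable_fixed_instructions(void)
{
        u64 ctrl;

        rdmsrl(MSR_ARCH_PERFMON_FIXED_CTR_CTRL, ctrl);
        ctrl |= 0x3ULL << 0;    /* 4-bit field for FIXED_CTR0: count ring 0 + ring 3 */
        wrmsrl(MSR_ARCH_PERFMON_FIXED_CTR_CTRL, ctrl);
}
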
/*
 * We model BTS tracing as another fixed-mode PMC.
 *
 * We choose a value in the middle of the fixed event range, since lower
 * values are used by actual fixed events and higher values are used
 * to indicate other overflow conditions in the PERF_GLOBAL_STATUS msr.
 */
#define INTEL_PMC_IDX_FIXED_BTS                 (INTEL_PMC_IDX_FIXED + 16)

#define GLOBAL_STATUS_COND_CHG                  BIT_ULL(63)
#define GLOBAL_STATUS_BUFFER_OVF                BIT_ULL(62)
#define GLOBAL_STATUS_UNC_OVF                   BIT_ULL(61)
#define GLOBAL_STATUS_ASIF                      BIT_ULL(60)
#define GLOBAL_STATUS_COUNTERS_FROZEN           BIT_ULL(59)
#define GLOBAL_STATUS_LBRS_FROZEN               BIT_ULL(58)
#define GLOBAL_STATUS_TRACE_TOPAPMI             BIT_ULL(55)
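
/*
 * Illustrative sketch, not part of the original header: the GLOBAL_STATUS_*
 * bits above are tested against a value read from the PERF_GLOBAL_STATUS
 * MSR (whose number is defined elsewhere), e.g. in a PMI handler.  The
 * helper name and the particular bits tested are chosen for illustration
 * only.
 */
static inline bool example_status_has_side_overflow(u64 status)
{
        /* overflow conditions other than ordinary counter overflows */
        return !!(status & (GLOBAL_STATUS_BUFFER_OVF |
                            GLOBAL_STATUS_UNC_OVF |
                            GLOBAL_STATUS_TRACE_TOPAPMI));
}
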
/*
 * IBS cpuid feature detection
 */
#define IBS_CPUID_FEATURES              0x8000001b

/*
 * Same bit mask as for IBS cpuid feature flags (Fn8000_001B_EAX), but
 * bit 0 is used to indicate the existence of IBS.
 */
#define IBS_CAPS_AVAIL                  (1U<<0)
#define IBS_CAPS_FETCHSAM               (1U<<1)
#define IBS_CAPS_OPSAM                  (1U<<2)
#define IBS_CAPS_RDWROPCNT              (1U<<3)
#define IBS_CAPS_OPCNT                  (1U<<4)
#define IBS_CAPS_BRNTRGT                (1U<<5)
#define IBS_CAPS_OPCNTEXT               (1U<<6)
#define IBS_CAPS_RIPINVALIDCHK          (1U<<7)
#define IBS_CAPS_OPBRNFUSE              (1U<<8)
#define IBS_CAPS_FETCHCTLEXTD           (1U<<9)
#define IBS_CAPS_OPDATA4                (1U<<10)

#define IBS_CAPS_DEFAULT                (IBS_CAPS_AVAIL         \
                                         | IBS_CAPS_FETCHSAM    \
                                         | IBS_CAPS_OPSAM)

/*
 * IBS APIC setup
 */
#define IBSCTL                          0x1cc
#define IBSCTL_LVT_OFFSET_VALID         (1ULL<<8)
#define IBSCTL_LVT_OFFSET_MASK          0x0F

/* IBS fetch bits/masks */
#define IBS_FETCH_RAND_EN       (1ULL<<57)
#define IBS_FETCH_VAL           (1ULL<<49)
#define IBS_FETCH_ENABLE        (1ULL<<48)
#define IBS_FETCH_CNT           0xFFFF0000ULL
#define IBS_FETCH_MAX_CNT       0x0000FFFFULL

/*
 * IBS op bits/masks
 * The lower 7 bits of the current count are random bits
 * preloaded by hardware and ignored in software
 */
#define IBS_OP_CUR_CNT          (0xFFF80ULL<<32)
#define IBS_OP_CUR_CNT_RAND     (0x0007FULL<<32)
#define IBS_OP_CNT_CTL          (1ULL<<19)
#define IBS_OP_VAL              (1ULL<<18)
#define IBS_OP_ENABLE           (1ULL<<17)
#define IBS_OP_MAX_CNT          0x0000FFFFULL
#define IBS_OP_MAX_CNT_EXT      0x007FFFFFULL   /* not a register bit mask */
#define IBS_RIP_INVALID         (1ULL<<38)
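
/*
 * Illustrative sketch, not part of the original header: building an IBS op
 * control word and extracting the current count from it.  How the max-count
 * field maps to a desired sampling period is left out here; only the mask
 * usage is shown.  The helper names are assumptions for this example.
 */
static inline u64 example_ibs_op_ctl(u64 max_cnt_field)
{
        return (max_cnt_field & IBS_OP_MAX_CNT) | IBS_OP_CNT_CTL | IBS_OP_ENABLE;
}

static inline u64 example_ibs_op_cur_cnt(u64 op_ctl)
{
        /* IBS_OP_CUR_CNT deliberately excludes the 7 randomized low bits */
        return (op_ctl & IBS_OP_CUR_CNT) >> 32;
}
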
#ifdef CONFIG_X86_LOCAL_APIC
extern u32 get_ibs_caps(void);
#else
static inline u32 get_ibs_caps(void) { return 0; }
#endif
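
/*
 * Illustrative sketch, not part of the original header: checking the caps
 * word returned by get_ibs_caps() before relying on IBS op sampling.  The
 * helper name is an assumption for this example.
 */
static inline bool example_ibs_op_sampling_supported(void)
{
        u32 caps = get_ibs_caps();

        return (caps & IBS_CAPS_AVAIL) && (caps & IBS_CAPS_OPSAM);
}
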
#ifdef CONFIG_PERF_EVENTS
extern void perf_events_lapic_init(void);

/*
 * Abuse bits {3,5} of the cpu eflags register. These flags are otherwise
 * unused and ABI specified to be 0, so nobody should care what we do with
 * them.
 *
 * EXACT - the IP points to the exact instruction that triggered the
 *         event (HW bugs exempt).
 * VM    - original X86_VM_MASK; see set_linear_ip().
 */
#define PERF_EFLAGS_EXACT       (1UL << 3)
#define PERF_EFLAGS_VM          (1UL << 5)

struct pt_regs;
extern unsigned long perf_instruction_pointer(struct pt_regs *regs);
extern unsigned long perf_misc_flags(struct pt_regs *regs);
#define perf_misc_flags(regs)   perf_misc_flags(regs)

#include <asm/stacktrace.h>

/*
 * We abuse bit 3 from flags to pass exact information, see perf_misc_flags
 * and the comment with PERF_EFLAGS_EXACT.
 */
#define perf_arch_fetch_caller_regs(regs, __ip)         {       \
        (regs)->ip = (__ip);                                    \
        (regs)->bp = caller_frame_pointer();                    \
        (regs)->cs = __KERNEL_CS;                               \
        regs->flags = 0;                                        \
        asm volatile(                                           \
                _ASM_MOV "%%"_ASM_SP ", %0\n"                   \
                : "=m" ((regs)->sp)                             \
                :: "memory"                                     \
        );                                                      \
}

struct perf_guest_switch_msr {
        unsigned msr;
        u64 host, guest;
};

extern struct perf_guest_switch_msr *perf_guest_get_msrs(int *nr);
extern void perf_get_x86_pmu_capability(struct x86_pmu_capability *cap);
extern void perf_check_microcode(void);
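
/*
 * Illustrative sketch, not part of the original header: roughly how a
 * virtualization-side caller could consume the array returned by
 * perf_guest_get_msrs() when entering a guest.  KVM's real code feeds
 * these entries into its own MSR switching machinery; the loop, the
 * helper name, and wrmsrl() are assumptions for this example.
 */
static inline void example_load_guest_pmu_msrs(void)
{
        struct perf_guest_switch_msr *msrs;
        int i, nr;

        msrs = perf_guest_get_msrs(&nr);
        for (i = 0; i < nr; i++)
                wrmsrl(msrs[i].msr, msrs[i].guest);     /* ->host on the way back */
}
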
#else
static inline struct perf_guest_switch_msr *perf_guest_get_msrs(int *nr)
{
        *nr = 0;
        return NULL;
}

static inline void perf_get_x86_pmu_capability(struct x86_pmu_capability *cap)
{
        memset(cap, 0, sizeof(*cap));
}

static inline void perf_events_lapic_init(void) { }
static inline void perf_check_microcode(void) { }
#endif

#ifdef CONFIG_CPU_SUP_INTEL
extern void intel_pt_handle_vmx(int on);
#endif

#if defined(CONFIG_PERF_EVENTS) && defined(CONFIG_CPU_SUP_AMD)
extern void amd_pmu_enable_virt(void);
extern void amd_pmu_disable_virt(void);
#else
static inline void amd_pmu_enable_virt(void) { }
static inline void amd_pmu_disable_virt(void) { }
#endif

#define arch_perf_out_copy_user copy_from_user_nmi

#endif /* _ASM_X86_PERF_EVENT_H */