perf_event.h 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597
  1. /* SPDX-License-Identifier: GPL-2.0 */
  2. #ifndef _ASM_X86_PERF_EVENT_H
  3. #define _ASM_X86_PERF_EVENT_H
  4. #include <linux/static_call.h>
  5. /*
  6. * Performance event hw details:
  7. */
  8. #define INTEL_PMC_MAX_GENERIC 32
  9. #define INTEL_PMC_MAX_FIXED 16
  10. #define INTEL_PMC_IDX_FIXED 32
  11. #define X86_PMC_IDX_MAX 64
  12. #define MSR_ARCH_PERFMON_PERFCTR0 0xc1
  13. #define MSR_ARCH_PERFMON_PERFCTR1 0xc2
  14. #define MSR_ARCH_PERFMON_EVENTSEL0 0x186
  15. #define MSR_ARCH_PERFMON_EVENTSEL1 0x187
  16. #define ARCH_PERFMON_EVENTSEL_EVENT 0x000000FFULL
  17. #define ARCH_PERFMON_EVENTSEL_UMASK 0x0000FF00ULL
  18. #define ARCH_PERFMON_EVENTSEL_USR (1ULL << 16)
  19. #define ARCH_PERFMON_EVENTSEL_OS (1ULL << 17)
  20. #define ARCH_PERFMON_EVENTSEL_EDGE (1ULL << 18)
  21. #define ARCH_PERFMON_EVENTSEL_PIN_CONTROL (1ULL << 19)
  22. #define ARCH_PERFMON_EVENTSEL_INT (1ULL << 20)
  23. #define ARCH_PERFMON_EVENTSEL_ANY (1ULL << 21)
  24. #define ARCH_PERFMON_EVENTSEL_ENABLE (1ULL << 22)
  25. #define ARCH_PERFMON_EVENTSEL_INV (1ULL << 23)
  26. #define ARCH_PERFMON_EVENTSEL_CMASK 0xFF000000ULL
  27. #define HSW_IN_TX (1ULL << 32)
  28. #define HSW_IN_TX_CHECKPOINTED (1ULL << 33)
  29. #define ICL_EVENTSEL_ADAPTIVE (1ULL << 34)
  30. #define ICL_FIXED_0_ADAPTIVE (1ULL << 32)
  31. #define AMD64_EVENTSEL_INT_CORE_ENABLE (1ULL << 36)
  32. #define AMD64_EVENTSEL_GUESTONLY (1ULL << 40)
  33. #define AMD64_EVENTSEL_HOSTONLY (1ULL << 41)
  34. #define AMD64_EVENTSEL_INT_CORE_SEL_SHIFT 37
  35. #define AMD64_EVENTSEL_INT_CORE_SEL_MASK \
  36. (0xFULL << AMD64_EVENTSEL_INT_CORE_SEL_SHIFT)
  37. #define AMD64_EVENTSEL_EVENT \
  38. (ARCH_PERFMON_EVENTSEL_EVENT | (0x0FULL << 32))
  39. #define INTEL_ARCH_EVENT_MASK \
  40. (ARCH_PERFMON_EVENTSEL_UMASK | ARCH_PERFMON_EVENTSEL_EVENT)
  41. #define AMD64_L3_SLICE_SHIFT 48
  42. #define AMD64_L3_SLICE_MASK \
  43. (0xFULL << AMD64_L3_SLICE_SHIFT)
  44. #define AMD64_L3_SLICEID_MASK \
  45. (0x7ULL << AMD64_L3_SLICE_SHIFT)
  46. #define AMD64_L3_THREAD_SHIFT 56
  47. #define AMD64_L3_THREAD_MASK \
  48. (0xFFULL << AMD64_L3_THREAD_SHIFT)
  49. #define AMD64_L3_F19H_THREAD_MASK \
  50. (0x3ULL << AMD64_L3_THREAD_SHIFT)
  51. #define AMD64_L3_EN_ALL_CORES BIT_ULL(47)
  52. #define AMD64_L3_EN_ALL_SLICES BIT_ULL(46)
  53. #define AMD64_L3_COREID_SHIFT 42
  54. #define AMD64_L3_COREID_MASK \
  55. (0x7ULL << AMD64_L3_COREID_SHIFT)
  56. #define X86_RAW_EVENT_MASK \
  57. (ARCH_PERFMON_EVENTSEL_EVENT | \
  58. ARCH_PERFMON_EVENTSEL_UMASK | \
  59. ARCH_PERFMON_EVENTSEL_EDGE | \
  60. ARCH_PERFMON_EVENTSEL_INV | \
  61. ARCH_PERFMON_EVENTSEL_CMASK)
  62. #define X86_ALL_EVENT_FLAGS \
  63. (ARCH_PERFMON_EVENTSEL_EDGE | \
  64. ARCH_PERFMON_EVENTSEL_INV | \
  65. ARCH_PERFMON_EVENTSEL_CMASK | \
  66. ARCH_PERFMON_EVENTSEL_ANY | \
  67. ARCH_PERFMON_EVENTSEL_PIN_CONTROL | \
  68. HSW_IN_TX | \
  69. HSW_IN_TX_CHECKPOINTED)
  70. #define AMD64_RAW_EVENT_MASK \
  71. (X86_RAW_EVENT_MASK | \
  72. AMD64_EVENTSEL_EVENT)
  73. #define AMD64_RAW_EVENT_MASK_NB \
  74. (AMD64_EVENTSEL_EVENT | \
  75. ARCH_PERFMON_EVENTSEL_UMASK)
  76. #define AMD64_PERFMON_V2_EVENTSEL_EVENT_NB \
  77. (AMD64_EVENTSEL_EVENT | \
  78. GENMASK_ULL(37, 36))
  79. #define AMD64_PERFMON_V2_EVENTSEL_UMASK_NB \
  80. (ARCH_PERFMON_EVENTSEL_UMASK | \
  81. GENMASK_ULL(27, 24))
  82. #define AMD64_PERFMON_V2_RAW_EVENT_MASK_NB \
  83. (AMD64_PERFMON_V2_EVENTSEL_EVENT_NB | \
  84. AMD64_PERFMON_V2_EVENTSEL_UMASK_NB)
  85. #define AMD64_NUM_COUNTERS 4
  86. #define AMD64_NUM_COUNTERS_CORE 6
  87. #define AMD64_NUM_COUNTERS_NB 4
  88. #define ARCH_PERFMON_UNHALTED_CORE_CYCLES_SEL 0x3c
  89. #define ARCH_PERFMON_UNHALTED_CORE_CYCLES_UMASK (0x00 << 8)
  90. #define ARCH_PERFMON_UNHALTED_CORE_CYCLES_INDEX 0
  91. #define ARCH_PERFMON_UNHALTED_CORE_CYCLES_PRESENT \
  92. (1 << (ARCH_PERFMON_UNHALTED_CORE_CYCLES_INDEX))
  93. #define ARCH_PERFMON_BRANCH_MISSES_RETIRED 6
  94. #define ARCH_PERFMON_EVENTS_COUNT 7
  95. #define PEBS_DATACFG_MEMINFO BIT_ULL(0)
  96. #define PEBS_DATACFG_GP BIT_ULL(1)
  97. #define PEBS_DATACFG_XMMS BIT_ULL(2)
  98. #define PEBS_DATACFG_LBRS BIT_ULL(3)
  99. #define PEBS_DATACFG_LBR_SHIFT 24
  100. /*
  101. * Intel "Architectural Performance Monitoring" CPUID
  102. * detection/enumeration details:
  103. */
  104. union cpuid10_eax {
  105. struct {
  106. unsigned int version_id:8;
  107. unsigned int num_counters:8;
  108. unsigned int bit_width:8;
  109. unsigned int mask_length:8;
  110. } split;
  111. unsigned int full;
  112. };
  113. union cpuid10_ebx {
  114. struct {
  115. unsigned int no_unhalted_core_cycles:1;
  116. unsigned int no_instructions_retired:1;
  117. unsigned int no_unhalted_reference_cycles:1;
  118. unsigned int no_llc_reference:1;
  119. unsigned int no_llc_misses:1;
  120. unsigned int no_branch_instruction_retired:1;
  121. unsigned int no_branch_misses_retired:1;
  122. } split;
  123. unsigned int full;
  124. };
  125. union cpuid10_edx {
  126. struct {
  127. unsigned int num_counters_fixed:5;
  128. unsigned int bit_width_fixed:8;
  129. unsigned int reserved1:2;
  130. unsigned int anythread_deprecated:1;
  131. unsigned int reserved2:16;
  132. } split;
  133. unsigned int full;
  134. };
  135. /*
  136. * Intel Architectural LBR CPUID detection/enumeration details:
  137. */
  138. union cpuid28_eax {
  139. struct {
  140. /* Supported LBR depth values */
  141. unsigned int lbr_depth_mask:8;
  142. unsigned int reserved:22;
  143. /* Deep C-state Reset */
  144. unsigned int lbr_deep_c_reset:1;
  145. /* IP values contain LIP */
  146. unsigned int lbr_lip:1;
  147. } split;
  148. unsigned int full;
  149. };
  150. union cpuid28_ebx {
  151. struct {
  152. /* CPL Filtering Supported */
  153. unsigned int lbr_cpl:1;
  154. /* Branch Filtering Supported */
  155. unsigned int lbr_filter:1;
  156. /* Call-stack Mode Supported */
  157. unsigned int lbr_call_stack:1;
  158. } split;
  159. unsigned int full;
  160. };
  161. union cpuid28_ecx {
  162. struct {
  163. /* Mispredict Bit Supported */
  164. unsigned int lbr_mispred:1;
  165. /* Timed LBRs Supported */
  166. unsigned int lbr_timed_lbr:1;
  167. /* Branch Type Field Supported */
  168. unsigned int lbr_br_type:1;
  169. } split;
  170. unsigned int full;
  171. };
  172. /*
  173. * AMD "Extended Performance Monitoring and Debug" CPUID
  174. * detection/enumeration details:
  175. */
  176. union cpuid_0x80000022_ebx {
  177. struct {
  178. /* Number of Core Performance Counters */
  179. unsigned int num_core_pmc:4;
  180. /* Number of available LBR Stack Entries */
  181. unsigned int lbr_v2_stack_sz:6;
  182. /* Number of Data Fabric Counters */
  183. unsigned int num_df_pmc:6;
  184. } split;
  185. unsigned int full;
  186. };
  187. struct x86_pmu_capability {
  188. int version;
  189. int num_counters_gp;
  190. int num_counters_fixed;
  191. int bit_width_gp;
  192. int bit_width_fixed;
  193. unsigned int events_mask;
  194. int events_mask_len;
  195. unsigned int pebs_ept :1;
  196. };
  197. /*
  198. * Fixed-purpose performance events:
  199. */
  200. /* RDPMC offset for Fixed PMCs */
  201. #define INTEL_PMC_FIXED_RDPMC_BASE (1 << 30)
  202. #define INTEL_PMC_FIXED_RDPMC_METRICS (1 << 29)
  203. /*
  204. * All the fixed-mode PMCs are configured via this single MSR:
  205. */
  206. #define MSR_ARCH_PERFMON_FIXED_CTR_CTRL 0x38d
  207. /*
  208. * There is no event-code assigned to the fixed-mode PMCs.
  209. *
  210. * For a fixed-mode PMC, which has an equivalent event on a general-purpose
  211. * PMC, the event-code of the equivalent event is used for the fixed-mode PMC,
  212. * e.g., Instr_Retired.Any and CPU_CLK_Unhalted.Core.
  213. *
  214. * For a fixed-mode PMC, which doesn't have an equivalent event, a
  215. * pseudo-encoding is used, e.g., CPU_CLK_Unhalted.Ref and TOPDOWN.SLOTS.
  216. * The pseudo event-code for a fixed-mode PMC must be 0x00.
  217. * The pseudo umask-code is 0xX. The X equals the index of the fixed
  218. * counter + 1, e.g., the fixed counter 2 has the pseudo-encoding 0x0300.
  219. *
  220. * The counts are available in separate MSRs:
  221. */
  222. /* Instr_Retired.Any: */
  223. #define MSR_ARCH_PERFMON_FIXED_CTR0 0x309
  224. #define INTEL_PMC_IDX_FIXED_INSTRUCTIONS (INTEL_PMC_IDX_FIXED + 0)
  225. /* CPU_CLK_Unhalted.Core: */
  226. #define MSR_ARCH_PERFMON_FIXED_CTR1 0x30a
  227. #define INTEL_PMC_IDX_FIXED_CPU_CYCLES (INTEL_PMC_IDX_FIXED + 1)
  228. /* CPU_CLK_Unhalted.Ref: event=0x00,umask=0x3 (pseudo-encoding) */
  229. #define MSR_ARCH_PERFMON_FIXED_CTR2 0x30b
  230. #define INTEL_PMC_IDX_FIXED_REF_CYCLES (INTEL_PMC_IDX_FIXED + 2)
  231. #define INTEL_PMC_MSK_FIXED_REF_CYCLES (1ULL << INTEL_PMC_IDX_FIXED_REF_CYCLES)
  232. /* TOPDOWN.SLOTS: event=0x00,umask=0x4 (pseudo-encoding) */
  233. #define MSR_ARCH_PERFMON_FIXED_CTR3 0x30c
  234. #define INTEL_PMC_IDX_FIXED_SLOTS (INTEL_PMC_IDX_FIXED + 3)
  235. #define INTEL_PMC_MSK_FIXED_SLOTS (1ULL << INTEL_PMC_IDX_FIXED_SLOTS)
  236. static inline bool use_fixed_pseudo_encoding(u64 code)
  237. {
  238. return !(code & 0xff);
  239. }
  240. /*
  241. * We model BTS tracing as another fixed-mode PMC.
  242. *
  243. * We choose the value 47 for the fixed index of BTS, since lower
  244. * values are used by actual fixed events and higher values are used
  245. * to indicate other overflow conditions in the PERF_GLOBAL_STATUS msr.
  246. */
  247. #define INTEL_PMC_IDX_FIXED_BTS (INTEL_PMC_IDX_FIXED + 15)
  248. /*
  249. * The PERF_METRICS MSR is modeled as several magic fixed-mode PMCs, one for
  250. * each TopDown metric event.
  251. *
  252. * Internally the TopDown metric events are mapped to the FxCtr 3 (SLOTS).
  253. */
  254. #define INTEL_PMC_IDX_METRIC_BASE (INTEL_PMC_IDX_FIXED + 16)
  255. #define INTEL_PMC_IDX_TD_RETIRING (INTEL_PMC_IDX_METRIC_BASE + 0)
  256. #define INTEL_PMC_IDX_TD_BAD_SPEC (INTEL_PMC_IDX_METRIC_BASE + 1)
  257. #define INTEL_PMC_IDX_TD_FE_BOUND (INTEL_PMC_IDX_METRIC_BASE + 2)
  258. #define INTEL_PMC_IDX_TD_BE_BOUND (INTEL_PMC_IDX_METRIC_BASE + 3)
  259. #define INTEL_PMC_IDX_TD_HEAVY_OPS (INTEL_PMC_IDX_METRIC_BASE + 4)
  260. #define INTEL_PMC_IDX_TD_BR_MISPREDICT (INTEL_PMC_IDX_METRIC_BASE + 5)
  261. #define INTEL_PMC_IDX_TD_FETCH_LAT (INTEL_PMC_IDX_METRIC_BASE + 6)
  262. #define INTEL_PMC_IDX_TD_MEM_BOUND (INTEL_PMC_IDX_METRIC_BASE + 7)
  263. #define INTEL_PMC_IDX_METRIC_END INTEL_PMC_IDX_TD_MEM_BOUND
  264. #define INTEL_PMC_MSK_TOPDOWN ((0xffull << INTEL_PMC_IDX_METRIC_BASE) | \
  265. INTEL_PMC_MSK_FIXED_SLOTS)
  266. /*
  267. * There is no event-code assigned to the TopDown events.
  268. *
  269. * For the slots event, use the pseudo code of the fixed counter 3.
  270. *
  271. * For the metric events, the pseudo event-code is 0x00.
  272. * The pseudo umask-code starts from the middle of the pseudo event
  273. * space, 0x80.
  274. */
  275. #define INTEL_TD_SLOTS 0x0400 /* TOPDOWN.SLOTS */
  276. /* Level 1 metrics */
  277. #define INTEL_TD_METRIC_RETIRING 0x8000 /* Retiring metric */
  278. #define INTEL_TD_METRIC_BAD_SPEC 0x8100 /* Bad speculation metric */
  279. #define INTEL_TD_METRIC_FE_BOUND 0x8200 /* FE bound metric */
  280. #define INTEL_TD_METRIC_BE_BOUND 0x8300 /* BE bound metric */
  281. /* Level 2 metrics */
  282. #define INTEL_TD_METRIC_HEAVY_OPS 0x8400 /* Heavy Operations metric */
  283. #define INTEL_TD_METRIC_BR_MISPREDICT 0x8500 /* Branch Mispredict metric */
  284. #define INTEL_TD_METRIC_FETCH_LAT 0x8600 /* Fetch Latency metric */
  285. #define INTEL_TD_METRIC_MEM_BOUND 0x8700 /* Memory bound metric */
  286. #define INTEL_TD_METRIC_MAX INTEL_TD_METRIC_MEM_BOUND
  287. #define INTEL_TD_METRIC_NUM 8
  288. static inline bool is_metric_idx(int idx)
  289. {
  290. return (unsigned)(idx - INTEL_PMC_IDX_METRIC_BASE) < INTEL_TD_METRIC_NUM;
  291. }
  292. static inline bool is_topdown_idx(int idx)
  293. {
  294. return is_metric_idx(idx) || idx == INTEL_PMC_IDX_FIXED_SLOTS;
  295. }
  296. #define INTEL_PMC_OTHER_TOPDOWN_BITS(bit) \
  297. (~(0x1ull << bit) & INTEL_PMC_MSK_TOPDOWN)
  298. #define GLOBAL_STATUS_COND_CHG BIT_ULL(63)
  299. #define GLOBAL_STATUS_BUFFER_OVF_BIT 62
  300. #define GLOBAL_STATUS_BUFFER_OVF BIT_ULL(GLOBAL_STATUS_BUFFER_OVF_BIT)
  301. #define GLOBAL_STATUS_UNC_OVF BIT_ULL(61)
  302. #define GLOBAL_STATUS_ASIF BIT_ULL(60)
  303. #define GLOBAL_STATUS_COUNTERS_FROZEN BIT_ULL(59)
  304. #define GLOBAL_STATUS_LBRS_FROZEN_BIT 58
  305. #define GLOBAL_STATUS_LBRS_FROZEN BIT_ULL(GLOBAL_STATUS_LBRS_FROZEN_BIT)
  306. #define GLOBAL_STATUS_TRACE_TOPAPMI_BIT 55
  307. #define GLOBAL_STATUS_TRACE_TOPAPMI BIT_ULL(GLOBAL_STATUS_TRACE_TOPAPMI_BIT)
  308. #define GLOBAL_STATUS_PERF_METRICS_OVF_BIT 48
  309. #define GLOBAL_CTRL_EN_PERF_METRICS 48
  310. /*
  311. * We model guest LBR event tracing as another fixed-mode PMC like BTS.
  312. *
  313. * We choose bit 58 because it's used to indicate LBR stack frozen state
  314. * for architectural perfmon v4, also we unconditionally mask that bit in
  315. * the handle_pmi_common(), so it'll never be set in the overflow handling.
  316. *
  317. * With this fake counter assigned, the guest LBR event user (such as KVM),
  318. * can program the LBR registers on its own, and we don't actually do anything
  319. * with then in the host context.
  320. */
  321. #define INTEL_PMC_IDX_FIXED_VLBR (GLOBAL_STATUS_LBRS_FROZEN_BIT)
  322. /*
  323. * Pseudo-encoding the guest LBR event as event=0x00,umask=0x1b,
  324. * since it would claim bit 58 which is effectively Fixed26.
  325. */
  326. #define INTEL_FIXED_VLBR_EVENT 0x1b00
  327. /*
  328. * Adaptive PEBS v4
  329. */
  330. struct pebs_basic {
  331. u64 format_size;
  332. u64 ip;
  333. u64 applicable_counters;
  334. u64 tsc;
  335. };
  336. struct pebs_meminfo {
  337. u64 address;
  338. u64 aux;
  339. u64 latency;
  340. u64 tsx_tuning;
  341. };
  342. struct pebs_gprs {
  343. u64 flags, ip, ax, cx, dx, bx, sp, bp, si, di;
  344. u64 r8, r9, r10, r11, r12, r13, r14, r15;
  345. };
  346. struct pebs_xmm {
  347. u64 xmm[16*2]; /* two entries for each register */
  348. };
  349. /*
  350. * AMD Extended Performance Monitoring and Debug cpuid feature detection
  351. */
  352. #define EXT_PERFMON_DEBUG_FEATURES 0x80000022
  353. /*
  354. * IBS cpuid feature detection
  355. */
  356. #define IBS_CPUID_FEATURES 0x8000001b
  357. /*
  358. * Same bit mask as for IBS cpuid feature flags (Fn8000_001B_EAX), but
  359. * bit 0 is used to indicate the existence of IBS.
  360. */
  361. #define IBS_CAPS_AVAIL (1U<<0)
  362. #define IBS_CAPS_FETCHSAM (1U<<1)
  363. #define IBS_CAPS_OPSAM (1U<<2)
  364. #define IBS_CAPS_RDWROPCNT (1U<<3)
  365. #define IBS_CAPS_OPCNT (1U<<4)
  366. #define IBS_CAPS_BRNTRGT (1U<<5)
  367. #define IBS_CAPS_OPCNTEXT (1U<<6)
  368. #define IBS_CAPS_RIPINVALIDCHK (1U<<7)
  369. #define IBS_CAPS_OPBRNFUSE (1U<<8)
  370. #define IBS_CAPS_FETCHCTLEXTD (1U<<9)
  371. #define IBS_CAPS_OPDATA4 (1U<<10)
  372. #define IBS_CAPS_ZEN4 (1U<<11)
  373. #define IBS_CAPS_DEFAULT (IBS_CAPS_AVAIL \
  374. | IBS_CAPS_FETCHSAM \
  375. | IBS_CAPS_OPSAM)
  376. /*
  377. * IBS APIC setup
  378. */
  379. #define IBSCTL 0x1cc
  380. #define IBSCTL_LVT_OFFSET_VALID (1ULL<<8)
  381. #define IBSCTL_LVT_OFFSET_MASK 0x0F
  382. /* IBS fetch bits/masks */
  383. #define IBS_FETCH_L3MISSONLY (1ULL<<59)
  384. #define IBS_FETCH_RAND_EN (1ULL<<57)
  385. #define IBS_FETCH_VAL (1ULL<<49)
  386. #define IBS_FETCH_ENABLE (1ULL<<48)
  387. #define IBS_FETCH_CNT 0xFFFF0000ULL
  388. #define IBS_FETCH_MAX_CNT 0x0000FFFFULL
  389. /*
  390. * IBS op bits/masks
  391. * The lower 7 bits of the current count are random bits
  392. * preloaded by hardware and ignored in software
  393. */
  394. #define IBS_OP_CUR_CNT (0xFFF80ULL<<32)
  395. #define IBS_OP_CUR_CNT_RAND (0x0007FULL<<32)
  396. #define IBS_OP_CNT_CTL (1ULL<<19)
  397. #define IBS_OP_VAL (1ULL<<18)
  398. #define IBS_OP_ENABLE (1ULL<<17)
  399. #define IBS_OP_L3MISSONLY (1ULL<<16)
  400. #define IBS_OP_MAX_CNT 0x0000FFFFULL
  401. #define IBS_OP_MAX_CNT_EXT 0x007FFFFFULL /* not a register bit mask */
  402. #define IBS_OP_MAX_CNT_EXT_MASK (0x7FULL<<20) /* separate upper 7 bits */
  403. #define IBS_RIP_INVALID (1ULL<<38)
  404. #ifdef CONFIG_X86_LOCAL_APIC
  405. extern u32 get_ibs_caps(void);
  406. extern int forward_event_to_ibs(struct perf_event *event);
  407. #else
  408. static inline u32 get_ibs_caps(void) { return 0; }
  409. static inline int forward_event_to_ibs(struct perf_event *event) { return -ENOENT; }
  410. #endif
  411. #ifdef CONFIG_PERF_EVENTS
  412. extern void perf_events_lapic_init(void);
  413. /*
  414. * Abuse bits {3,5} of the cpu eflags register. These flags are otherwise
  415. * unused and ABI specified to be 0, so nobody should care what we do with
  416. * them.
  417. *
  418. * EXACT - the IP points to the exact instruction that triggered the
  419. * event (HW bugs exempt).
  420. * VM - original X86_VM_MASK; see set_linear_ip().
  421. */
  422. #define PERF_EFLAGS_EXACT (1UL << 3)
  423. #define PERF_EFLAGS_VM (1UL << 5)
  424. struct pt_regs;
  425. struct x86_perf_regs {
  426. struct pt_regs regs;
  427. u64 *xmm_regs;
  428. };
  429. extern unsigned long perf_instruction_pointer(struct pt_regs *regs);
  430. extern unsigned long perf_misc_flags(struct pt_regs *regs);
  431. #define perf_misc_flags(regs) perf_misc_flags(regs)
  432. #include <asm/stacktrace.h>
  433. /*
  434. * We abuse bit 3 from flags to pass exact information, see perf_misc_flags
  435. * and the comment with PERF_EFLAGS_EXACT.
  436. */
  437. #define perf_arch_fetch_caller_regs(regs, __ip) { \
  438. (regs)->ip = (__ip); \
  439. (regs)->sp = (unsigned long)__builtin_frame_address(0); \
  440. (regs)->cs = __KERNEL_CS; \
  441. regs->flags = 0; \
  442. }
  443. struct perf_guest_switch_msr {
  444. unsigned msr;
  445. u64 host, guest;
  446. };
  447. struct x86_pmu_lbr {
  448. unsigned int nr;
  449. unsigned int from;
  450. unsigned int to;
  451. unsigned int info;
  452. };
  453. extern void perf_get_x86_pmu_capability(struct x86_pmu_capability *cap);
  454. extern u64 perf_get_hw_event_config(int hw_event);
  455. extern void perf_check_microcode(void);
  456. extern void perf_clear_dirty_counters(void);
  457. extern int x86_perf_rdpmc_index(struct perf_event *event);
  458. #else
  459. static inline void perf_get_x86_pmu_capability(struct x86_pmu_capability *cap)
  460. {
  461. memset(cap, 0, sizeof(*cap));
  462. }
  463. static inline u64 perf_get_hw_event_config(int hw_event)
  464. {
  465. return 0;
  466. }
  467. static inline void perf_events_lapic_init(void) { }
  468. static inline void perf_check_microcode(void) { }
  469. #endif
  470. #if defined(CONFIG_PERF_EVENTS) && defined(CONFIG_CPU_SUP_INTEL)
  471. extern struct perf_guest_switch_msr *perf_guest_get_msrs(int *nr, void *data);
  472. extern void x86_perf_get_lbr(struct x86_pmu_lbr *lbr);
  473. #else
  474. struct perf_guest_switch_msr *perf_guest_get_msrs(int *nr, void *data);
  475. static inline void x86_perf_get_lbr(struct x86_pmu_lbr *lbr)
  476. {
  477. memset(lbr, 0, sizeof(*lbr));
  478. }
  479. #endif
  480. #ifdef CONFIG_CPU_SUP_INTEL
  481. extern void intel_pt_handle_vmx(int on);
  482. #else
  483. static inline void intel_pt_handle_vmx(int on)
  484. {
  485. }
  486. #endif
  487. #if defined(CONFIG_PERF_EVENTS) && defined(CONFIG_CPU_SUP_AMD)
  488. extern void amd_pmu_enable_virt(void);
  489. extern void amd_pmu_disable_virt(void);
  490. #if defined(CONFIG_PERF_EVENTS_AMD_BRS)
  491. #define PERF_NEEDS_LOPWR_CB 1
  492. /*
  493. * architectural low power callback impacts
  494. * drivers/acpi/processor_idle.c
  495. * drivers/acpi/acpi_pad.c
  496. */
  497. extern void perf_amd_brs_lopwr_cb(bool lopwr_in);
  498. DECLARE_STATIC_CALL(perf_lopwr_cb, perf_amd_brs_lopwr_cb);
  499. static inline void perf_lopwr_cb(bool lopwr_in)
  500. {
  501. static_call_mod(perf_lopwr_cb)(lopwr_in);
  502. }
  503. #endif /* PERF_NEEDS_LOPWR_CB */
  504. #else
  505. static inline void amd_pmu_enable_virt(void) { }
  506. static inline void amd_pmu_disable_virt(void) { }
  507. #endif
  508. #define arch_perf_out_copy_user copy_from_user_nmi
  509. #endif /* _ASM_X86_PERF_EVENT_H */