/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * Performance events x86 architecture header
 */

#include <linux/perf_event.h>

#include <asm/intel_ds.h>
#include <asm/cpu.h>

/*
 *          |   NHM/WSM    |      SNB     |
 * register -------------------------------
 *          |  HT  | no HT |  HT  | no HT |
 *-----------------------------------------
 * offcore  | core | core  | cpu  | core  |
 * lbr_sel  | core | core  | cpu  | core  |
 * ld_lat   | cpu  | core  | cpu  | core  |
 *-----------------------------------------
 *
 * Given that there is a small number of shared regs,
 * we can pre-allocate their slot in the per-cpu
 * per-core reg tables.
 */
enum extra_reg_type {
	EXTRA_REG_NONE		= -1, /* not used */

	EXTRA_REG_RSP_0		= 0,  /* offcore_response_0 */
	EXTRA_REG_RSP_1		= 1,  /* offcore_response_1 */
	EXTRA_REG_LBR		= 2,  /* lbr_select */
	EXTRA_REG_LDLAT		= 3,  /* ld_lat_threshold */
	EXTRA_REG_FE		= 4,  /* fe_* */

	EXTRA_REG_MAX		      /* number of entries needed */
};

struct event_constraint {
	union {
		unsigned long	idxmsk[BITS_TO_LONGS(X86_PMC_IDX_MAX)];
		u64		idxmsk64;
	};
	u64		code;
	u64		cmask;
	int		weight;
	int		overlap;
	int		flags;
	unsigned int	size;
};

static inline bool constraint_match(struct event_constraint *c, u64 ecode)
{
	return ((ecode & c->cmask) - c->code) <= (u64)c->size;
}
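
/*
 * A worked example (hypothetical event codes, not from a real constraint
 * table): a range constraint covering codes 0xc0-0xc4 stores code = 0xc0
 * and size = 4, so ecode 0xc2 matches because (0xc2 - 0xc0) = 2 <= 4,
 * while 0xc8 does not. Codes below 'code' are rejected too, because the
 * unsigned subtraction wraps them to a value far above 'size'.
 */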

/*
 * struct hw_perf_event.flags flags
 */
#define PERF_X86_EVENT_PEBS_LDLAT	0x0001 /* ld+ldlat data address sampling */
#define PERF_X86_EVENT_PEBS_ST		0x0002 /* st data address sampling */
#define PERF_X86_EVENT_PEBS_ST_HSW	0x0004 /* haswell style datala, store */
#define PERF_X86_EVENT_PEBS_LD_HSW	0x0008 /* haswell style datala, load */
#define PERF_X86_EVENT_PEBS_NA_HSW	0x0010 /* haswell style datala, unknown */
#define PERF_X86_EVENT_EXCL		0x0020 /* HT exclusivity on counter */
#define PERF_X86_EVENT_DYNAMIC		0x0040 /* dynamic alloc'd constraint */
#define PERF_X86_EVENT_RDPMC_ALLOWED	0x0080 /* grant rdpmc permission */
#define PERF_X86_EVENT_EXCL_ACCT	0x0100 /* accounted EXCL event */
#define PERF_X86_EVENT_AUTO_RELOAD	0x0200 /* use PEBS auto-reload */
#define PERF_X86_EVENT_LARGE_PEBS	0x0400 /* use large PEBS */
#define PERF_X86_EVENT_PEBS_VIA_PT	0x0800 /* use PT buffer for PEBS */
#define PERF_X86_EVENT_PAIR		0x1000 /* Large Increment per Cycle */
#define PERF_X86_EVENT_LBR_SELECT	0x2000 /* Save/Restore MSR_LBR_SELECT */
#define PERF_X86_EVENT_TOPDOWN		0x4000 /* Topdown slots/metrics events */
#define PERF_X86_EVENT_PEBS_STLAT	0x8000 /* st+stlat data address sampling */

static inline bool is_topdown_count(struct perf_event *event)
{
	return event->hw.flags & PERF_X86_EVENT_TOPDOWN;
}

static inline bool is_metric_event(struct perf_event *event)
{
	u64 config = event->attr.config;

	return ((config & ARCH_PERFMON_EVENTSEL_EVENT) == 0) &&
		((config & INTEL_ARCH_EVENT_MASK) >= INTEL_TD_METRIC_RETIRING)  &&
		((config & INTEL_ARCH_EVENT_MASK) <= INTEL_TD_METRIC_MAX);
}

static inline bool is_slots_event(struct perf_event *event)
{
	return (event->attr.config & INTEL_ARCH_EVENT_MASK) == INTEL_TD_SLOTS;
}

static inline bool is_topdown_event(struct perf_event *event)
{
	return is_metric_event(event) || is_slots_event(event);
}
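
/*
 * Classification sketch: both the SLOTS event and the metric pseudo
 * events use an event select of 0 and are distinguished by their umask
 * (INTEL_TD_METRIC_RETIRING and above for the metrics). Both count as
 * "topdown" events and are handled by the fixed counter 3 / PERF_METRICS
 * machinery rather than by a general purpose counter.
 */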

struct amd_nb {
	int nb_id;  /* NorthBridge id */
	int refcnt; /* reference count */
	struct perf_event *owners[X86_PMC_IDX_MAX];
	struct event_constraint event_constraints[X86_PMC_IDX_MAX];
};

#define PEBS_COUNTER_MASK	((1ULL << MAX_PEBS_EVENTS) - 1)
#define PEBS_PMI_AFTER_EACH_RECORD BIT_ULL(60)
#define PEBS_OUTPUT_OFFSET	61
#define PEBS_OUTPUT_MASK	(3ull << PEBS_OUTPUT_OFFSET)
#define PEBS_OUTPUT_PT		(1ull << PEBS_OUTPUT_OFFSET)
#define PEBS_VIA_PT_MASK	(PEBS_OUTPUT_PT | PEBS_PMI_AFTER_EACH_RECORD)

/*
 * Flags PEBS can handle without an PMI.
 *
 * TID can only be handled by flushing at context switch.
 * REGS_USER can be handled for events limited to ring 3.
 */
#define LARGE_PEBS_FLAGS \
	(PERF_SAMPLE_IP | PERF_SAMPLE_TID | PERF_SAMPLE_ADDR | \
	PERF_SAMPLE_ID | PERF_SAMPLE_CPU | PERF_SAMPLE_STREAM_ID | \
	PERF_SAMPLE_DATA_SRC | PERF_SAMPLE_IDENTIFIER | \
	PERF_SAMPLE_TRANSACTION | PERF_SAMPLE_PHYS_ADDR | \
	PERF_SAMPLE_REGS_INTR | PERF_SAMPLE_REGS_USER | \
	PERF_SAMPLE_PERIOD | PERF_SAMPLE_CODE_PAGE_SIZE)

#define PEBS_GP_REGS			\
	((1ULL << PERF_REG_X86_AX)    | \
	 (1ULL << PERF_REG_X86_BX)    | \
	 (1ULL << PERF_REG_X86_CX)    | \
	 (1ULL << PERF_REG_X86_DX)    | \
	 (1ULL << PERF_REG_X86_DI)    | \
	 (1ULL << PERF_REG_X86_SI)    | \
	 (1ULL << PERF_REG_X86_SP)    | \
	 (1ULL << PERF_REG_X86_BP)    | \
	 (1ULL << PERF_REG_X86_IP)    | \
	 (1ULL << PERF_REG_X86_FLAGS) | \
	 (1ULL << PERF_REG_X86_R8)    | \
	 (1ULL << PERF_REG_X86_R9)    | \
	 (1ULL << PERF_REG_X86_R10)   | \
	 (1ULL << PERF_REG_X86_R11)   | \
	 (1ULL << PERF_REG_X86_R12)   | \
	 (1ULL << PERF_REG_X86_R13)   | \
	 (1ULL << PERF_REG_X86_R14)   | \
	 (1ULL << PERF_REG_X86_R15))

/*
 * Per register state.
 */
struct er_account {
	raw_spinlock_t	lock;	/* per-core: protect structure */
	u64		config;	/* extra MSR config */
	u64		reg;	/* extra MSR number */
	atomic_t	ref;	/* reference count */
};

/*
 * Per core/cpu state
 *
 * Used to coordinate shared registers between HT threads or
 * among events on a single PMU.
 */
struct intel_shared_regs {
	struct er_account	regs[EXTRA_REG_MAX];
	int			refcnt;		/* per-core: #HT threads */
	unsigned		core_id;	/* per-core: core id */
};

enum intel_excl_state_type {
	INTEL_EXCL_UNUSED    = 0, /* counter is unused */
	INTEL_EXCL_SHARED    = 1, /* counter can be used by both threads */
	INTEL_EXCL_EXCLUSIVE = 2, /* counter can be used by one thread only */
};

struct intel_excl_states {
	enum intel_excl_state_type state[X86_PMC_IDX_MAX];
	bool sched_started; /* true if scheduling has started */
};

struct intel_excl_cntrs {
	raw_spinlock_t	lock;

	struct intel_excl_states states[2];

	union {
		u16	has_exclusive[2];
		u32	exclusive_present;
	};

	int		refcnt;		/* per-core: #HT threads */
	unsigned	core_id;	/* per-core: core id */
};

struct x86_perf_task_context;
#define MAX_LBR_ENTRIES		32

enum {
	LBR_FORMAT_32		= 0x00,
	LBR_FORMAT_LIP		= 0x01,
	LBR_FORMAT_EIP		= 0x02,
	LBR_FORMAT_EIP_FLAGS	= 0x03,
	LBR_FORMAT_EIP_FLAGS2	= 0x04,
	LBR_FORMAT_INFO		= 0x05,
	LBR_FORMAT_TIME		= 0x06,
	LBR_FORMAT_MAX_KNOWN	= LBR_FORMAT_TIME,
};

enum {
	X86_PERF_KFREE_SHARED = 0,
	X86_PERF_KFREE_EXCL   = 1,
	X86_PERF_KFREE_MAX
};

struct cpu_hw_events {
	/*
	 * Generic x86 PMC bits
	 */
	struct perf_event	*events[X86_PMC_IDX_MAX]; /* in counter order */
	unsigned long		active_mask[BITS_TO_LONGS(X86_PMC_IDX_MAX)];
	unsigned long		dirty[BITS_TO_LONGS(X86_PMC_IDX_MAX)];
	int			enabled;

	int			n_events; /* the # of events in the below arrays */
	int			n_added;  /* the # last add/del in the below arrays */
	int			n_txn;    /* the # in transaction in the below arrays */
	int			n_txn_pair;
	int			n_txn_metric;
	int			assign[X86_PMC_IDX_MAX]; /* event to counter assignment */
	u64			tags[X86_PMC_IDX_MAX];

	struct perf_event	*event_list[X86_PMC_IDX_MAX]; /* in enabled order */
	struct event_constraint	*event_constraint[X86_PMC_IDX_MAX];

	int			n_excl; /* the number of exclusive events */

	unsigned int		txn_flags;
	int			is_fake;

	/*
	 * Intel DebugStore bits
	 */
	struct debug_store	*ds;
	void			*ds_pebs_vaddr;
	void			*ds_bts_vaddr;
	u64			pebs_enabled;
	int			n_pebs;
	int			n_large_pebs;
	int			n_pebs_via_pt;
	int			pebs_output;

	/* Current super set of events hardware configuration */
	u64			pebs_data_cfg;
	u64			active_pebs_data_cfg;
	int			pebs_record_size;

	/*
	 * Intel LBR bits
	 */
	int				lbr_users;
	int				lbr_pebs_users;
	struct perf_branch_stack	lbr_stack;
	struct perf_branch_entry	lbr_entries[MAX_LBR_ENTRIES];
	union {
		struct er_account	*lbr_sel;
		struct er_account	*lbr_ctl;
	};
	u64				br_sel;
	void				*last_task_ctx;
	int				last_log_id;
	int				lbr_select;
	void				*lbr_xsave;

	/*
	 * Intel host/guest exclude bits
	 */
	u64				intel_ctrl_guest_mask;
	u64				intel_ctrl_host_mask;
	struct perf_guest_switch_msr	guest_switch_msrs[X86_PMC_IDX_MAX];

	/*
	 * Intel checkpoint mask
	 */
	u64				intel_cp_status;

	/*
	 * manage shared (per-core, per-cpu) registers
	 * used on Intel NHM/WSM/SNB
	 */
	struct intel_shared_regs	*shared_regs;
	/*
	 * manage exclusive counter access between hyperthreads
	 */
	struct event_constraint		*constraint_list; /* in enable order */
	struct intel_excl_cntrs		*excl_cntrs; /* per-core exclusive counters */
	int				excl_thread_id; /* 0 or 1 */

	/*
	 * SKL TSX_FORCE_ABORT shadow
	 */
	u64				tfa_shadow;

	/*
	 * Perf Metrics
	 */
	/* number of accepted metrics events */
	int				n_metric;

	/*
	 * AMD specific bits
	 */
	struct amd_nb			*amd_nb;
	/* Inverted mask of bits to clear in the perf_ctr ctrl registers */
	u64				perf_ctr_virt_mask;
	int				n_pair; /* Large increment events */

	void				*kfree_on_online[X86_PERF_KFREE_MAX];

	struct pmu			*pmu;
};

#define __EVENT_CONSTRAINT_RANGE(c, e, n, m, w, o, f) {	\
	{ .idxmsk64 = (n) },		\
	.code = (c),			\
	.size = (e) - (c),		\
	.cmask = (m),			\
	.weight = (w),			\
	.overlap = (o),			\
	.flags = f,			\
}

#define __EVENT_CONSTRAINT(c, n, m, w, o, f) \
	__EVENT_CONSTRAINT_RANGE(c, c, n, m, w, o, f)

#define EVENT_CONSTRAINT(c, n, m) \
	__EVENT_CONSTRAINT(c, n, m, HWEIGHT(n), 0, 0)

/*
 * The constraint_match() function only works for 'simple' event codes
 * and not for extended (AMD64_EVENTSEL_EVENT) events codes.
 */
#define EVENT_CONSTRAINT_RANGE(c, e, n, m) \
	__EVENT_CONSTRAINT_RANGE(c, e, n, m, HWEIGHT(n), 0, 0)
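
/*
 * Usage sketch (hypothetical event codes): EVENT_CONSTRAINT(0xc0, 0x3,
 * ARCH_PERFMON_EVENTSEL_EVENT) pins event code 0xc0 to counters 0-1
 * (idxmsk64 = 0x3, weight = 2), while EVENT_CONSTRAINT_RANGE(0xd0, 0xd3,
 * 0xf, ARCH_PERFMON_EVENTSEL_EVENT) covers the four codes 0xd0-0xd3 with
 * a single entry (code = 0xd0, size = 3) on counters 0-3.
 */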

#define INTEL_EXCLEVT_CONSTRAINT(c, n)	\
	__EVENT_CONSTRAINT(c, n, ARCH_PERFMON_EVENTSEL_EVENT, HWEIGHT(n),\
			   0, PERF_X86_EVENT_EXCL)

/*
 * The overlap flag marks event constraints with overlapping counter
 * masks. This is the case if the counter mask of such an event is not
 * a subset of any other counter mask of a constraint with an equal or
 * higher weight, e.g.:
 *
 *  c_overlaps = EVENT_CONSTRAINT_OVERLAP(0, 0x09, 0);
 *  c_another1 = EVENT_CONSTRAINT(0, 0x07, 0);
 *  c_another2 = EVENT_CONSTRAINT(0, 0x38, 0);
 *
 * The event scheduler may not select the correct counter in the first
 * cycle because it needs to know which subsequent events will be
 * scheduled. It may fail to schedule the events then. So we set the
 * overlap flag for such constraints to give the scheduler a hint which
 * events to select for counter rescheduling.
 *
 * Care must be taken as the rescheduling algorithm is O(n!) which
 * will increase scheduling cycles for an over-committed system
 * dramatically. The number of such EVENT_CONSTRAINT_OVERLAP() macros
 * and its counter masks must be kept at a minimum.
 */
#define EVENT_CONSTRAINT_OVERLAP(c, n, m)	\
	__EVENT_CONSTRAINT(c, n, m, HWEIGHT(n), 1, 0)

/*
 * Constraint on the Event code.
 */
#define INTEL_EVENT_CONSTRAINT(c, n)	\
	EVENT_CONSTRAINT(c, n, ARCH_PERFMON_EVENTSEL_EVENT)

/*
 * Constraint on a range of Event codes
 */
#define INTEL_EVENT_CONSTRAINT_RANGE(c, e, n)			\
	EVENT_CONSTRAINT_RANGE(c, e, n, ARCH_PERFMON_EVENTSEL_EVENT)

/*
 * Constraint on the Event code + UMask + fixed-mask
 *
 * filter mask to validate fixed counter events.
 * the following filters disqualify for fixed counters:
 *  - inv
 *  - edge
 *  - cnt-mask
 *  - in_tx
 *  - in_tx_checkpointed
 *  The other filters are supported by fixed counters.
 *  The any-thread option is supported starting with v3.
 */
#define FIXED_EVENT_FLAGS (X86_RAW_EVENT_MASK|HSW_IN_TX|HSW_IN_TX_CHECKPOINTED)
#define FIXED_EVENT_CONSTRAINT(c, n)	\
	EVENT_CONSTRAINT(c, (1ULL << (32+n)), FIXED_EVENT_FLAGS)
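
/*
 * Sketch: FIXED_EVENT_CONSTRAINT(0x00c0, 0) ties the architectural
 * INST_RETIRED.ANY encoding to fixed counter 0; the fixed counters
 * occupy index bits 32 and up, hence the (1ULL << (32+n)) index mask.
 */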

/*
 * The special metric counters do not actually exist. They are calculated from
 * the combination of the FxCtr3 + MSR_PERF_METRICS.
 *
 * The special metric counters are mapped to a dummy offset for the scheduler.
 * The sharing between multiple users of the same metric without multiplexing
 * is not allowed, even though the hardware supports that in principle.
 */
#define METRIC_EVENT_CONSTRAINT(c, n)					\
	EVENT_CONSTRAINT(c, (1ULL << (INTEL_PMC_IDX_METRIC_BASE + n)),	\
			 INTEL_ARCH_EVENT_MASK)

/*
 * Constraint on the Event code + UMask
 */
#define INTEL_UEVENT_CONSTRAINT(c, n)	\
	EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK)

/* Constraint on specific umask bit only + event */
#define INTEL_UBIT_EVENT_CONSTRAINT(c, n)	\
	EVENT_CONSTRAINT(c, n, ARCH_PERFMON_EVENTSEL_EVENT|(c))

/* Like UEVENT_CONSTRAINT, but match flags too */
#define INTEL_FLAGS_UEVENT_CONSTRAINT(c, n)	\
	EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS)

#define INTEL_EXCLUEVT_CONSTRAINT(c, n)	\
	__EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK, \
			   HWEIGHT(n), 0, PERF_X86_EVENT_EXCL)

#define INTEL_PLD_CONSTRAINT(c, n)	\
	__EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS, \
			   HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_LDLAT)

#define INTEL_PSD_CONSTRAINT(c, n)	\
	__EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS, \
			   HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_STLAT)

#define INTEL_PST_CONSTRAINT(c, n)	\
	__EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS, \
			   HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_ST)

/* Event constraint, but match on all event flags too. */
#define INTEL_FLAGS_EVENT_CONSTRAINT(c, n) \
	EVENT_CONSTRAINT(c, n, ARCH_PERFMON_EVENTSEL_EVENT|X86_ALL_EVENT_FLAGS)

#define INTEL_FLAGS_EVENT_CONSTRAINT_RANGE(c, e, n)			\
	EVENT_CONSTRAINT_RANGE(c, e, n, ARCH_PERFMON_EVENTSEL_EVENT|X86_ALL_EVENT_FLAGS)

/* Check only flags, but allow all event/umask */
#define INTEL_ALL_EVENT_CONSTRAINT(code, n)	\
	EVENT_CONSTRAINT(code, n, X86_ALL_EVENT_FLAGS)

/* Check flags and event code, and set the HSW store flag */
#define INTEL_FLAGS_EVENT_CONSTRAINT_DATALA_ST(code, n) \
	__EVENT_CONSTRAINT(code, n,			\
			  ARCH_PERFMON_EVENTSEL_EVENT|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_ST_HSW)

/* Check flags and event code, and set the HSW load flag */
#define INTEL_FLAGS_EVENT_CONSTRAINT_DATALA_LD(code, n) \
	__EVENT_CONSTRAINT(code, n,			\
			  ARCH_PERFMON_EVENTSEL_EVENT|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_LD_HSW)

#define INTEL_FLAGS_EVENT_CONSTRAINT_DATALA_LD_RANGE(code, end, n) \
	__EVENT_CONSTRAINT_RANGE(code, end, n,				\
			  ARCH_PERFMON_EVENTSEL_EVENT|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_LD_HSW)

#define INTEL_FLAGS_EVENT_CONSTRAINT_DATALA_XLD(code, n) \
	__EVENT_CONSTRAINT(code, n,			\
			  ARCH_PERFMON_EVENTSEL_EVENT|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, \
			  PERF_X86_EVENT_PEBS_LD_HSW|PERF_X86_EVENT_EXCL)

/* Check flags and event code/umask, and set the HSW store flag */
#define INTEL_FLAGS_UEVENT_CONSTRAINT_DATALA_ST(code, n) \
	__EVENT_CONSTRAINT(code, n,			\
			  INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_ST_HSW)

#define INTEL_FLAGS_UEVENT_CONSTRAINT_DATALA_XST(code, n) \
	__EVENT_CONSTRAINT(code, n,			\
			  INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, \
			  PERF_X86_EVENT_PEBS_ST_HSW|PERF_X86_EVENT_EXCL)

/* Check flags and event code/umask, and set the HSW load flag */
#define INTEL_FLAGS_UEVENT_CONSTRAINT_DATALA_LD(code, n) \
	__EVENT_CONSTRAINT(code, n,			\
			  INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_LD_HSW)

#define INTEL_FLAGS_UEVENT_CONSTRAINT_DATALA_XLD(code, n) \
	__EVENT_CONSTRAINT(code, n,			\
			  INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, \
			  PERF_X86_EVENT_PEBS_LD_HSW|PERF_X86_EVENT_EXCL)

/* Check flags and event code/umask, and set the HSW N/A flag */
#define INTEL_FLAGS_UEVENT_CONSTRAINT_DATALA_NA(code, n) \
	__EVENT_CONSTRAINT(code, n,			\
			  INTEL_ARCH_EVENT_MASK|X86_ALL_EVENT_FLAGS, \
			  HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_NA_HSW)

/*
 * We define the end marker as having a weight of -1
 * to enable blacklisting of events using a counter bitmask
 * of zero and thus a weight of zero.
 * The end marker has a weight that cannot possibly be
 * obtained from counting the bits in the bitmask.
 */
#define EVENT_CONSTRAINT_END { .weight = -1 }

/*
 * Check for end marker with weight == -1
 */
#define for_each_event_constraint(e, c)	\
	for ((e) = (c); (e)->weight != -1; (e)++)
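
/*
 * Walking a constraint table (sketch; 'sketch_constraints' is a
 * hypothetical, EVENT_CONSTRAINT_END terminated array):
 *
 *	struct event_constraint *c;
 *
 *	for_each_event_constraint(c, sketch_constraints) {
 *		if (constraint_match(c, event->hw.config))
 *			return c;
 *	}
 */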

/*
 * Extra registers for specific events.
 *
 * Some events need large masks and require external MSRs.
 * Those extra MSRs end up being shared for all events on
 * a PMU and sometimes between PMU of sibling HT threads.
 * In either case, the kernel needs to handle conflicting
 * accesses to those extra, shared, regs. The data structure
 * to manage those registers is stored in cpu_hw_events.
 */
struct extra_reg {
	unsigned int		event;
	unsigned int		msr;
	u64			config_mask;
	u64			valid_mask;
	int			idx;  /* per_xxx->regs[] reg index */
	bool			extra_msr_access;
};

#define EVENT_EXTRA_REG(e, ms, m, vm, i) {	\
	.event = (e),			\
	.msr = (ms),			\
	.config_mask = (m),		\
	.valid_mask = (vm),		\
	.idx = EXTRA_REG_##i,		\
	.extra_msr_access = true,	\
	}

#define INTEL_EVENT_EXTRA_REG(event, msr, vm, idx)	\
	EVENT_EXTRA_REG(event, msr, ARCH_PERFMON_EVENTSEL_EVENT, vm, idx)

#define INTEL_UEVENT_EXTRA_REG(event, msr, vm, idx) \
	EVENT_EXTRA_REG(event, msr, ARCH_PERFMON_EVENTSEL_EVENT | \
			ARCH_PERFMON_EVENTSEL_UMASK, vm, idx)

#define INTEL_UEVENT_PEBS_LDLAT_EXTRA_REG(c) \
	INTEL_UEVENT_EXTRA_REG(c, \
			       MSR_PEBS_LD_LAT_THRESHOLD, \
			       0xffff, \
			       LDLAT)

#define EVENT_EXTRA_END EVENT_EXTRA_REG(0, 0, 0, 0, RSP_0)
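
/*
 * Table sketch: pairing the offcore response event with its config MSR.
 * The event/MSR pairing is real on many Intel parts; the valid mask
 * below is illustrative only:
 *
 *	static struct extra_reg sketch_extra_regs[] = {
 *		INTEL_UEVENT_EXTRA_REG(0x01b7, MSR_OFFCORE_RSP_0,
 *				       0x3fffffffffull, RSP_0),
 *		EVENT_EXTRA_END
 *	};
 */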

union perf_capabilities {
	struct {
		u64	lbr_format:6;
		u64	pebs_trap:1;
		u64	pebs_arch_reg:1;
		u64	pebs_format:4;
		u64	smm_freeze:1;
		/*
		 * PMU supports separate counter range for writing
		 * values > 32bit.
		 */
		u64	full_width_write:1;
		u64	pebs_baseline:1;
		u64	perf_metrics:1;
		u64	pebs_output_pt_available:1;
		u64	anythread_deprecated:1;
	};
	u64	capabilities;
};

struct x86_pmu_quirk {
	struct x86_pmu_quirk *next;
	void (*func)(void);
};

union x86_pmu_config {
	struct {
		u64 event:8,
		    umask:8,
		    usr:1,
		    os:1,
		    edge:1,
		    pc:1,
		    interrupt:1,
		    __reserved1:1,
		    en:1,
		    inv:1,
		    cmask:8,
		    event2:4,
		    __reserved2:4,
		    go:1,
		    ho:1;
	} bits;
	u64 value;
};

#define X86_CONFIG(args...) ((union x86_pmu_config){.bits = {args}}).value
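
/*
 * X86_CONFIG() assembles a raw config value from named bitfields, e.g.
 * the architectural unhalted core cycles encoding (event 0x3c, umask 0):
 *
 *	u64 cfg = X86_CONFIG(.event = 0x3c, .umask = 0x00,
 *			     .inv = 0, .cmask = 0);
 */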

enum {
	x86_lbr_exclusive_lbr,
	x86_lbr_exclusive_bts,
	x86_lbr_exclusive_pt,
	x86_lbr_exclusive_max,
};

struct x86_hybrid_pmu {
	struct pmu			pmu;
	const char			*name;
	u8				cpu_type;
	cpumask_t			supported_cpus;
	union perf_capabilities		intel_cap;
	u64				intel_ctrl;
	int				max_pebs_events;
	int				num_counters;
	int				num_counters_fixed;
	struct event_constraint		unconstrained;

	u64				hw_cache_event_ids
					[PERF_COUNT_HW_CACHE_MAX]
					[PERF_COUNT_HW_CACHE_OP_MAX]
					[PERF_COUNT_HW_CACHE_RESULT_MAX];
	u64				hw_cache_extra_regs
					[PERF_COUNT_HW_CACHE_MAX]
					[PERF_COUNT_HW_CACHE_OP_MAX]
					[PERF_COUNT_HW_CACHE_RESULT_MAX];
	struct event_constraint		*event_constraints;
	struct event_constraint		*pebs_constraints;
	struct extra_reg		*extra_regs;

	unsigned int			late_ack	:1,
					mid_ack		:1,
					enabled_ack	:1;
};

static __always_inline struct x86_hybrid_pmu *hybrid_pmu(struct pmu *pmu)
{
	return container_of(pmu, struct x86_hybrid_pmu, pmu);
}

extern struct static_key_false perf_is_hybrid;
#define is_hybrid()		static_branch_unlikely(&perf_is_hybrid)

#define hybrid(_pmu, _field)				\
(*({							\
	typeof(&x86_pmu._field) __Fp = &x86_pmu._field;	\
							\
	if (is_hybrid() && (_pmu))			\
		__Fp = &hybrid_pmu(_pmu)->_field;	\
							\
	__Fp;						\
}))

#define hybrid_var(_pmu, _var)				\
(*({							\
	typeof(&_var) __Fp = &_var;			\
							\
	if (is_hybrid() && (_pmu))			\
		__Fp = &hybrid_pmu(_pmu)->_var;		\
							\
	__Fp;						\
}))

#define hybrid_bit(_pmu, _field)			\
({							\
	bool __Fp = x86_pmu._field;			\
							\
	if (is_hybrid() && (_pmu))			\
		__Fp = hybrid_pmu(_pmu)->_field;	\
							\
	__Fp;						\
})
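
/*
 * Accessor sketch: on a hybrid system the per-PMU copy of a field is
 * used, otherwise the global x86_pmu one; either way the result is an
 * lvalue:
 *
 *	int n = hybrid(event->pmu, num_counters);
 *	u64 ctrl = hybrid(event->pmu, intel_ctrl);
 */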

enum hybrid_pmu_type {
	hybrid_big		= 0x40,
	hybrid_small		= 0x20,

	hybrid_big_small	= hybrid_big | hybrid_small,
};

#define X86_HYBRID_PMU_ATOM_IDX		0
#define X86_HYBRID_PMU_CORE_IDX		1

#define X86_HYBRID_NUM_PMUS		2

/*
 * struct x86_pmu - generic x86 pmu
 */
struct x86_pmu {
	/*
	 * Generic x86 PMC bits
	 */
	const char	*name;
	int		version;
	int		(*handle_irq)(struct pt_regs *);
	void		(*disable_all)(void);
	void		(*enable_all)(int added);
	void		(*enable)(struct perf_event *);
	void		(*disable)(struct perf_event *);
	void		(*add)(struct perf_event *);
	void		(*del)(struct perf_event *);
	void		(*read)(struct perf_event *event);
	int		(*hw_config)(struct perf_event *event);
	int		(*schedule_events)(struct cpu_hw_events *cpuc, int n, int *assign);
	unsigned	eventsel;
	unsigned	perfctr;
	int		(*addr_offset)(int index, bool eventsel);
	int		(*rdpmc_index)(int index);
	u64		(*event_map)(int);
	int		max_events;
	int		num_counters;
	int		num_counters_fixed;
	int		cntval_bits;
	u64		cntval_mask;
	union {
			unsigned long events_maskl;
			unsigned long events_mask[BITS_TO_LONGS(ARCH_PERFMON_EVENTS_COUNT)];
	};
	int		events_mask_len;
	int		apic;
	u64		max_period;
	struct event_constraint *
			(*get_event_constraints)(struct cpu_hw_events *cpuc,
						 int idx,
						 struct perf_event *event);

	void		(*put_event_constraints)(struct cpu_hw_events *cpuc,
						 struct perf_event *event);

	void		(*start_scheduling)(struct cpu_hw_events *cpuc);

	void		(*commit_scheduling)(struct cpu_hw_events *cpuc, int idx, int cntr);

	void		(*stop_scheduling)(struct cpu_hw_events *cpuc);

	struct event_constraint *event_constraints;
	struct x86_pmu_quirk *quirks;
	int		perfctr_second_write;
	u64		(*limit_period)(struct perf_event *event, u64 l);

	/* PMI handler bits */
	unsigned int	late_ack		:1,
			mid_ack			:1,
			enabled_ack		:1;
	/*
	 * sysfs attrs
	 */
	int		attr_rdpmc_broken;
	int		attr_rdpmc;
	struct attribute **format_attrs;

	ssize_t		(*events_sysfs_show)(char *page, u64 config);
	const struct attribute_group **attr_update;

	unsigned long	attr_freeze_on_smi;

	/*
	 * CPU Hotplug hooks
	 */
	int		(*cpu_prepare)(int cpu);
	void		(*cpu_starting)(int cpu);
	void		(*cpu_dying)(int cpu);
	void		(*cpu_dead)(int cpu);

	void		(*check_microcode)(void);
	void		(*sched_task)(struct perf_event_context *ctx,
				      bool sched_in);

	/*
	 * Intel Arch Perfmon v2+
	 */
	u64			intel_ctrl;
	union perf_capabilities intel_cap;

	/*
	 * Intel DebugStore bits
	 */
	unsigned int	bts			:1,
			bts_active		:1,
			pebs			:1,
			pebs_active		:1,
			pebs_broken		:1,
			pebs_prec_dist		:1,
			pebs_no_tlb		:1,
			pebs_no_isolation	:1,
			pebs_block		:1;
	int		pebs_record_size;
	int		pebs_buffer_size;
	int		max_pebs_events;
	void		(*drain_pebs)(struct pt_regs *regs, struct perf_sample_data *data);
	struct event_constraint *pebs_constraints;
	void		(*pebs_aliases)(struct perf_event *event);
	unsigned long	large_pebs_flags;
	u64		rtm_abort_event;

	/*
	 * Intel LBR
	 */
	unsigned int	lbr_tos, lbr_from, lbr_to,
			lbr_info, lbr_nr;	   /* LBR base regs and size */
	union {
		u64	lbr_sel_mask;		   /* LBR_SELECT valid bits */
		u64	lbr_ctl_mask;		   /* LBR_CTL valid bits */
	};
	union {
		const int	*lbr_sel_map;	   /* lbr_select mappings */
		int		*lbr_ctl_map;	   /* LBR_CTL mappings */
	};
	bool		lbr_double_abort;	   /* duplicated lbr aborts */
	bool		lbr_pt_coexist;		   /* (LBR|BTS) may coexist with PT */

	/*
	 * Intel Architectural LBR CPUID Enumeration
	 */
	unsigned int	lbr_depth_mask:8;
	unsigned int	lbr_deep_c_reset:1;
	unsigned int	lbr_lip:1;
	unsigned int	lbr_cpl:1;
	unsigned int	lbr_filter:1;
	unsigned int	lbr_call_stack:1;
	unsigned int	lbr_mispred:1;
	unsigned int	lbr_timed_lbr:1;
	unsigned int	lbr_br_type:1;

	void		(*lbr_reset)(void);
	void		(*lbr_read)(struct cpu_hw_events *cpuc);
	void		(*lbr_save)(void *ctx);
	void		(*lbr_restore)(void *ctx);

	/*
	 * Intel PT/LBR/BTS are exclusive
	 */
	atomic_t	lbr_exclusive[x86_lbr_exclusive_max];

	/*
	 * Intel perf metrics
	 */
	int		num_topdown_events;
	u64		(*update_topdown_event)(struct perf_event *event);
	int		(*set_topdown_event_period)(struct perf_event *event);

	/*
	 * perf task context (i.e. struct perf_event_context::task_ctx_data)
	 * switch helper to bridge calls from perf/core to perf/x86.
	 * See struct x86_perf_task_context below.
	 */
	void		(*swap_task_ctx)(struct perf_event_context *prev,
					 struct perf_event_context *next);

	/*
	 * AMD bits
	 */
	unsigned int	amd_nb_constraints : 1;
	u64		perf_ctr_pair_en;

	/*
	 * Extra registers for events
	 */
	struct extra_reg *extra_regs;
	unsigned int flags;

	/*
	 * Intel host/guest support (KVM)
	 */
	struct perf_guest_switch_msr *(*guest_get_msrs)(int *nr);

	/*
	 * Check period value for PERF_EVENT_IOC_PERIOD ioctl.
	 */
	int (*check_period) (struct perf_event *event, u64 period);

	int (*aux_output_match) (struct perf_event *event);

	int (*filter_match)(struct perf_event *event);

	/*
	 * Hybrid support
	 *
	 * Most PMU capabilities are the same among different hybrid PMUs.
	 * The global x86_pmu saves the architecture capabilities, which
	 * are available for all PMUs. The hybrid_pmu only includes the
	 * unique capabilities.
	 */
	int				num_hybrid_pmus;
	struct x86_hybrid_pmu		*hybrid_pmu;
	u8 (*get_hybrid_cpu_type)	(void);
};

struct x86_perf_task_context_opt {
	int lbr_callstack_users;
	int lbr_stack_state;
	int log_id;
};

struct x86_perf_task_context {
	u64 lbr_sel;
	int tos;
	int valid_lbrs;
	struct x86_perf_task_context_opt opt;
	struct lbr_entry lbr[MAX_LBR_ENTRIES];
};

struct x86_perf_task_context_arch_lbr {
	struct x86_perf_task_context_opt opt;
	struct lbr_entry entries[];
};

/*
 * Add padding to guarantee the 64-byte alignment of the state buffer.
 *
 * The structure is dynamically allocated. The size of the LBR state may vary
 * based on the number of LBR registers.
 *
 * Do not put anything after the LBR state.
 */
struct x86_perf_task_context_arch_lbr_xsave {
	struct x86_perf_task_context_opt		opt;

	union {
		struct xregs_state			xsave;
		struct {
			struct fxregs_state		i387;
			struct xstate_header		header;
			struct arch_lbr_state		lbr;
		} __attribute__ ((packed, aligned (XSAVE_ALIGNMENT)));
	};
};

#define x86_add_quirk(func_)						\
do {									\
	static struct x86_pmu_quirk __quirk __initdata = {		\
		.func = func_,						\
	};								\
	__quirk.next = x86_pmu.quirks;					\
	x86_pmu.quirks = &__quirk;					\
} while (0)
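
/*
 * Registration sketch (hypothetical quirk function): quirks are pushed
 * onto a singly linked list at init time and run once from the PMU
 * init code.
 *
 *	static __init void sketch_quirk(void)
 *	{
 *		pr_info("applying PMU erratum workaround\n");
 *	}
 *	...
 *	x86_add_quirk(sketch_quirk);
 */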

/*
 * x86_pmu flags
 */
#define PMU_FL_NO_HT_SHARING	0x1 /* no hyper-threading resource sharing */
#define PMU_FL_HAS_RSP_1	0x2 /* has 2 equivalent offcore_rsp regs */
#define PMU_FL_EXCL_CNTRS	0x4 /* has exclusive counter requirements */
#define PMU_FL_EXCL_ENABLED	0x8 /* exclusive counter active */
#define PMU_FL_PEBS_ALL		0x10 /* all events are valid PEBS events */
#define PMU_FL_TFA		0x20 /* deal with TSX force abort */
#define PMU_FL_PAIR		0x40 /* merge counters for large incr. events */
#define PMU_FL_INSTR_LATENCY	0x80 /* Support Instruction Latency in PEBS Memory Info Record */
#define PMU_FL_MEM_LOADS_AUX	0x100 /* Require an auxiliary event for the complete memory info */

#define EVENT_VAR(_id)  event_attr_##_id
#define EVENT_PTR(_id) &event_attr_##_id.attr.attr

#define EVENT_ATTR(_name, _id)						\
static struct perf_pmu_events_attr EVENT_VAR(_id) = {			\
	.attr		= __ATTR(_name, 0444, events_sysfs_show, NULL),	\
	.id		= PERF_COUNT_HW_##_id,				\
	.event_str	= NULL,						\
};

#define EVENT_ATTR_STR(_name, v, str)					\
static struct perf_pmu_events_attr event_attr_##v = {			\
	.attr		= __ATTR(_name, 0444, events_sysfs_show, NULL),	\
	.id		= 0,						\
	.event_str	= str,						\
};

#define EVENT_ATTR_STR_HT(_name, v, noht, ht)				\
static struct perf_pmu_events_ht_attr event_attr_##v = {		\
	.attr		= __ATTR(_name, 0444, events_ht_sysfs_show, NULL),\
	.id		= 0,						\
	.event_str_noht	= noht,						\
	.event_str_ht	= ht,						\
}

#define EVENT_ATTR_STR_HYBRID(_name, v, str, _pmu)			\
static struct perf_pmu_events_hybrid_attr event_attr_##v = {		\
	.attr		= __ATTR(_name, 0444, events_hybrid_sysfs_show, NULL),\
	.id		= 0,						\
	.event_str	= str,						\
	.pmu_type	= _pmu,						\
}

#define FORMAT_HYBRID_PTR(_id) (&format_attr_hybrid_##_id.attr.attr)

#define FORMAT_ATTR_HYBRID(_name, _pmu)					\
static struct perf_pmu_format_hybrid_attr format_attr_hybrid_##_name = {\
	.attr		= __ATTR_RO(_name),				\
	.pmu_type	= _pmu,						\
}

struct pmu *x86_get_pmu(unsigned int cpu);
extern struct x86_pmu x86_pmu __read_mostly;

static __always_inline struct x86_perf_task_context_opt *task_context_opt(void *ctx)
{
	if (static_cpu_has(X86_FEATURE_ARCH_LBR))
		return &((struct x86_perf_task_context_arch_lbr *)ctx)->opt;

	return &((struct x86_perf_task_context *)ctx)->opt;
}

static inline bool x86_pmu_has_lbr_callstack(void)
{
	return  x86_pmu.lbr_sel_map &&
		x86_pmu.lbr_sel_map[PERF_SAMPLE_BRANCH_CALL_STACK_SHIFT] > 0;
}

DECLARE_PER_CPU(struct cpu_hw_events, cpu_hw_events);

int x86_perf_event_set_period(struct perf_event *event);

/*
 * Generalized hw caching related hw_event table, filled
 * in on a per model basis. A value of 0 means
 * 'not supported', -1 means 'hw_event makes no sense on
 * this CPU', any other value means the raw hw_event
 * ID.
 */
#define C(x) PERF_COUNT_HW_CACHE_##x

extern u64 __read_mostly hw_cache_event_ids
				[PERF_COUNT_HW_CACHE_MAX]
				[PERF_COUNT_HW_CACHE_OP_MAX]
				[PERF_COUNT_HW_CACHE_RESULT_MAX];
extern u64 __read_mostly hw_cache_extra_regs
				[PERF_COUNT_HW_CACHE_MAX]
				[PERF_COUNT_HW_CACHE_OP_MAX]
				[PERF_COUNT_HW_CACHE_RESULT_MAX];

u64 x86_perf_event_update(struct perf_event *event);

static inline unsigned int x86_pmu_config_addr(int index)
{
	return x86_pmu.eventsel + (x86_pmu.addr_offset ?
				   x86_pmu.addr_offset(index, true) : index);
}

static inline unsigned int x86_pmu_event_addr(int index)
{
	return x86_pmu.perfctr + (x86_pmu.addr_offset ?
				  x86_pmu.addr_offset(index, false) : index);
}

static inline int x86_pmu_rdpmc_index(int index)
{
	return x86_pmu.rdpmc_index ? x86_pmu.rdpmc_index(index) : index;
}
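
/*
 * Address sketch: without an addr_offset() method the control and
 * counter MSRs are laid out contiguously. With the Intel architectural
 * bases (eventsel = 0x186, perfctr = 0xc1), index 2 yields:
 *
 *	x86_pmu_config_addr(2) == 0x186 + 2 == 0x188
 *	x86_pmu_event_addr(2)  == 0xc1  + 2 == 0xc3
 */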

bool check_hw_exists(struct pmu *pmu, int num_counters,
		     int num_counters_fixed);

int x86_add_exclusive(unsigned int what);

void x86_del_exclusive(unsigned int what);

int x86_reserve_hardware(void);

void x86_release_hardware(void);

int x86_pmu_max_precise(void);

void hw_perf_lbr_event_destroy(struct perf_event *event);

int x86_setup_perfctr(struct perf_event *event);

int x86_pmu_hw_config(struct perf_event *event);

void x86_pmu_disable_all(void);

static inline bool is_counter_pair(struct hw_perf_event *hwc)
{
	return hwc->flags & PERF_X86_EVENT_PAIR;
}

static inline void __x86_pmu_enable_event(struct hw_perf_event *hwc,
					  u64 enable_mask)
{
	u64 disable_mask = __this_cpu_read(cpu_hw_events.perf_ctr_virt_mask);

	if (hwc->extra_reg.reg)
		wrmsrl(hwc->extra_reg.reg, hwc->extra_reg.config);

	/*
	 * Add enabled Merge event on next counter
	 * if large increment event being enabled on this counter
	 */
	if (is_counter_pair(hwc))
		wrmsrl(x86_pmu_config_addr(hwc->idx + 1), x86_pmu.perf_ctr_pair_en);

	wrmsrl(hwc->config_base, (hwc->config | enable_mask) & ~disable_mask);
}

void x86_pmu_enable_all(int added);

int perf_assign_events(struct event_constraint **constraints, int n,
			int wmin, int wmax, int gpmax, int *assign);
int x86_schedule_events(struct cpu_hw_events *cpuc, int n, int *assign);

void x86_pmu_stop(struct perf_event *event, int flags);

static inline void x86_pmu_disable_event(struct perf_event *event)
{
	u64 disable_mask = __this_cpu_read(cpu_hw_events.perf_ctr_virt_mask);
	struct hw_perf_event *hwc = &event->hw;

	wrmsrl(hwc->config_base, hwc->config & ~disable_mask);

	if (is_counter_pair(hwc))
		wrmsrl(x86_pmu_config_addr(hwc->idx + 1), 0);
}

void x86_pmu_enable_event(struct perf_event *event);

int x86_pmu_handle_irq(struct pt_regs *regs);

void x86_pmu_show_pmu_cap(int num_counters, int num_counters_fixed,
			  u64 intel_ctrl);

void x86_pmu_update_cpu_context(struct pmu *pmu, int cpu);

extern struct event_constraint emptyconstraint;

extern struct event_constraint unconstrained;

static inline bool kernel_ip(unsigned long ip)
{
#ifdef CONFIG_X86_32
	return ip > PAGE_OFFSET;
#else
	return (long)ip < 0;
#endif
}

/*
 * Not all PMUs provide the right context information to place the reported IP
 * into full context. Specifically segment registers are typically not
 * supplied.
 *
 * Assuming the address is a linear address (it is for IBS), we fake the CS and
 * vm86 mode using the known zero-based code segment and 'fix up' the registers
 * to reflect this.
 *
 * Intel PEBS/LBR appear to typically provide the effective address, nothing
 * much else but the segment base does not appear to be an issue (lots of
 * instructions will use %rip relative addressing anyway), so we can use the
 * linear address and get away with it.
 */
static inline void set_linear_ip(struct pt_regs *regs, unsigned long ip)
{
	regs->cs = kernel_ip(ip) ? __KERNEL_CS : __USER_CS;
	if (regs->flags & X86_VM_MASK)
		regs->flags ^= (PERF_EFLAGS_VM | X86_VM_MASK);
	regs->ip = ip;
}

ssize_t x86_event_sysfs_show(char *page, u64 config, u64 event);
ssize_t intel_event_sysfs_show(char *page, u64 config);

ssize_t events_sysfs_show(struct device *dev, struct device_attribute *attr,
			  char *page);
ssize_t events_ht_sysfs_show(struct device *dev, struct device_attribute *attr,
			  char *page);
ssize_t events_hybrid_sysfs_show(struct device *dev,
				 struct device_attribute *attr,
				 char *page);

static inline bool fixed_counter_disabled(int i, struct pmu *pmu)
{
	u64 intel_ctrl = hybrid(pmu, intel_ctrl);

	return !(intel_ctrl >> (i + INTEL_PMC_IDX_FIXED));
}

#ifdef CONFIG_CPU_SUP_AMD

int amd_pmu_init(void);

#else /* CONFIG_CPU_SUP_AMD */

static inline int amd_pmu_init(void)
{
	return 0;
}

#endif /* CONFIG_CPU_SUP_AMD */

static inline int is_pebs_pt(struct perf_event *event)
{
	return !!(event->hw.flags & PERF_X86_EVENT_PEBS_VIA_PT);
}

#ifdef CONFIG_CPU_SUP_INTEL

static inline bool intel_pmu_has_bts_period(struct perf_event *event, u64 period)
{
	struct hw_perf_event *hwc = &event->hw;
	unsigned int hw_event, bts_event;

	if (event->attr.freq)
		return false;

	hw_event = hwc->config & INTEL_ARCH_EVENT_MASK;
	bts_event = x86_pmu.event_map(PERF_COUNT_HW_BRANCH_INSTRUCTIONS);

	return hw_event == bts_event && period == 1;
}

static inline bool intel_pmu_has_bts(struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;

	return intel_pmu_has_bts_period(event, hwc->sample_period);
}

int intel_pmu_save_and_restart(struct perf_event *event);

struct event_constraint *
x86_get_event_constraints(struct cpu_hw_events *cpuc, int idx,
			  struct perf_event *event);

extern int intel_cpuc_prepare(struct cpu_hw_events *cpuc, int cpu);
extern void intel_cpuc_finish(struct cpu_hw_events *cpuc);

int intel_pmu_init(void);

void init_debug_store_on_cpu(int cpu);

void fini_debug_store_on_cpu(int cpu);

void release_ds_buffers(void);

void reserve_ds_buffers(void);

void release_lbr_buffers(void);

void reserve_lbr_buffers(void);

extern struct event_constraint bts_constraint;
extern struct event_constraint vlbr_constraint;

void intel_pmu_enable_bts(u64 config);

void intel_pmu_disable_bts(void);

int intel_pmu_drain_bts_buffer(void);

extern struct event_constraint intel_core2_pebs_event_constraints[];

extern struct event_constraint intel_atom_pebs_event_constraints[];

extern struct event_constraint intel_slm_pebs_event_constraints[];

extern struct event_constraint intel_glm_pebs_event_constraints[];

extern struct event_constraint intel_glp_pebs_event_constraints[];

extern struct event_constraint intel_grt_pebs_event_constraints[];

extern struct event_constraint intel_nehalem_pebs_event_constraints[];

extern struct event_constraint intel_westmere_pebs_event_constraints[];

extern struct event_constraint intel_snb_pebs_event_constraints[];

extern struct event_constraint intel_ivb_pebs_event_constraints[];

extern struct event_constraint intel_hsw_pebs_event_constraints[];

extern struct event_constraint intel_bdw_pebs_event_constraints[];

extern struct event_constraint intel_skl_pebs_event_constraints[];

extern struct event_constraint intel_icl_pebs_event_constraints[];

extern struct event_constraint intel_spr_pebs_event_constraints[];

struct event_constraint *intel_pebs_constraints(struct perf_event *event);

void intel_pmu_pebs_add(struct perf_event *event);

void intel_pmu_pebs_del(struct perf_event *event);

void intel_pmu_pebs_enable(struct perf_event *event);

void intel_pmu_pebs_disable(struct perf_event *event);

void intel_pmu_pebs_enable_all(void);

void intel_pmu_pebs_disable_all(void);

void intel_pmu_pebs_sched_task(struct perf_event_context *ctx, bool sched_in);

void intel_pmu_auto_reload_read(struct perf_event *event);

void intel_pmu_store_pebs_lbrs(struct lbr_entry *lbr);

void intel_ds_init(void);

void intel_pmu_lbr_swap_task_ctx(struct perf_event_context *prev,
				 struct perf_event_context *next);

void intel_pmu_lbr_sched_task(struct perf_event_context *ctx, bool sched_in);

u64 lbr_from_signext_quirk_wr(u64 val);

void intel_pmu_lbr_reset(void);

void intel_pmu_lbr_reset_32(void);

void intel_pmu_lbr_reset_64(void);

void intel_pmu_lbr_add(struct perf_event *event);

void intel_pmu_lbr_del(struct perf_event *event);

void intel_pmu_lbr_enable_all(bool pmi);

void intel_pmu_lbr_disable_all(void);

void intel_pmu_lbr_read(void);

void intel_pmu_lbr_read_32(struct cpu_hw_events *cpuc);

void intel_pmu_lbr_read_64(struct cpu_hw_events *cpuc);

void intel_pmu_lbr_save(void *ctx);

void intel_pmu_lbr_restore(void *ctx);

void intel_pmu_lbr_init_core(void);

void intel_pmu_lbr_init_nhm(void);

void intel_pmu_lbr_init_atom(void);

void intel_pmu_lbr_init_slm(void);

void intel_pmu_lbr_init_snb(void);

void intel_pmu_lbr_init_hsw(void);

void intel_pmu_lbr_init_skl(void);

void intel_pmu_lbr_init_knl(void);

void intel_pmu_arch_lbr_init(void);

void intel_pmu_pebs_data_source_nhm(void);

void intel_pmu_pebs_data_source_skl(bool pmem);

int intel_pmu_setup_lbr_filter(struct perf_event *event);

void intel_pt_interrupt(void);

int intel_bts_interrupt(void);

void intel_bts_enable_local(void);

void intel_bts_disable_local(void);

int p4_pmu_init(void);

int p6_pmu_init(void);

int knc_pmu_init(void);

static inline int is_ht_workaround_enabled(void)
{
	return !!(x86_pmu.flags & PMU_FL_EXCL_ENABLED);
}

#else /* CONFIG_CPU_SUP_INTEL */

static inline void reserve_ds_buffers(void)
{
}

static inline void release_ds_buffers(void)
{
}

static inline void release_lbr_buffers(void)
{
}

static inline void reserve_lbr_buffers(void)
{
}

static inline int intel_pmu_init(void)
{
	return 0;
}

static inline int intel_cpuc_prepare(struct cpu_hw_events *cpuc, int cpu)
{
	return 0;
}

static inline void intel_cpuc_finish(struct cpu_hw_events *cpuc)
{
}

static inline int is_ht_workaround_enabled(void)
{
	return 0;
}
#endif /* CONFIG_CPU_SUP_INTEL */

#if ((defined CONFIG_CPU_SUP_CENTAUR) || (defined CONFIG_CPU_SUP_ZHAOXIN))
int zhaoxin_pmu_init(void);
#else
static inline int zhaoxin_pmu_init(void)
{
	return 0;
}
#endif /* CONFIG_CPU_SUP_CENTAUR || CONFIG_CPU_SUP_ZHAOXIN */