linux/arch/x86/events/intel/p6.c
<<
>>
Prefs
   1// SPDX-License-Identifier: GPL-2.0
   2#include <linux/perf_event.h>
   3#include <linux/types.h>
   4
   5#include "../perf_event.h"
   6
   7/*
   8 * Not sure about some of these
   9 */
  10static const u64 p6_perfmon_event_map[] =
  11{
  12  [PERF_COUNT_HW_CPU_CYCLES]            = 0x0079,       /* CPU_CLK_UNHALTED */
  13  [PERF_COUNT_HW_INSTRUCTIONS]          = 0x00c0,       /* INST_RETIRED     */
  14  [PERF_COUNT_HW_CACHE_REFERENCES]      = 0x0f2e,       /* L2_RQSTS:M:E:S:I */
  15  [PERF_COUNT_HW_CACHE_MISSES]          = 0x012e,       /* L2_RQSTS:I       */
  16  [PERF_COUNT_HW_BRANCH_INSTRUCTIONS]   = 0x00c4,       /* BR_INST_RETIRED  */
  17  [PERF_COUNT_HW_BRANCH_MISSES]         = 0x00c5,       /* BR_MISS_PRED_RETIRED */
  18  [PERF_COUNT_HW_BUS_CYCLES]            = 0x0062,       /* BUS_DRDY_CLOCKS  */
  19  [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = 0x00a2,     /* RESOURCE_STALLS  */
  20
  21};
  22
  23static const u64 __initconst p6_hw_cache_event_ids
  24                                [PERF_COUNT_HW_CACHE_MAX]
  25                                [PERF_COUNT_HW_CACHE_OP_MAX]
  26                                [PERF_COUNT_HW_CACHE_RESULT_MAX] =
  27{
  28 [ C(L1D) ] = {
  29        [ C(OP_READ) ] = {
  30                [ C(RESULT_ACCESS) ] = 0x0043,  /* DATA_MEM_REFS       */
  31                [ C(RESULT_MISS)   ] = 0x0045,  /* DCU_LINES_IN        */
  32        },
  33        [ C(OP_WRITE) ] = {
  34                [ C(RESULT_ACCESS) ] = 0,
  35                [ C(RESULT_MISS)   ] = 0x0f29,  /* L2_LD:M:E:S:I       */
  36        },
  37        [ C(OP_PREFETCH) ] = {
  38                [ C(RESULT_ACCESS) ] = 0,
  39                [ C(RESULT_MISS)   ] = 0,
  40        },
  41 },
  42 [ C(L1I ) ] = {
  43        [ C(OP_READ) ] = {
  44                [ C(RESULT_ACCESS) ] = 0x0080,  /* IFU_IFETCH         */
  45                [ C(RESULT_MISS)   ] = 0x0f28,  /* L2_IFETCH:M:E:S:I  */
  46        },
  47        [ C(OP_WRITE) ] = {
  48                [ C(RESULT_ACCESS) ] = -1,
  49                [ C(RESULT_MISS)   ] = -1,
  50        },
  51        [ C(OP_PREFETCH) ] = {
  52                [ C(RESULT_ACCESS) ] = 0,
  53                [ C(RESULT_MISS)   ] = 0,
  54        },
  55 },
  56 [ C(LL  ) ] = {
  57        [ C(OP_READ) ] = {
  58                [ C(RESULT_ACCESS) ] = 0,
  59                [ C(RESULT_MISS)   ] = 0,
  60        },
  61        [ C(OP_WRITE) ] = {
  62                [ C(RESULT_ACCESS) ] = 0,
  63                [ C(RESULT_MISS)   ] = 0x0025,  /* L2_M_LINES_INM     */
  64        },
  65        [ C(OP_PREFETCH) ] = {
  66                [ C(RESULT_ACCESS) ] = 0,
  67                [ C(RESULT_MISS)   ] = 0,
  68        },
  69 },
  70 [ C(DTLB) ] = {
  71        [ C(OP_READ) ] = {
  72                [ C(RESULT_ACCESS) ] = 0x0043,  /* DATA_MEM_REFS      */
  73                [ C(RESULT_MISS)   ] = 0,
  74        },
  75        [ C(OP_WRITE) ] = {
  76                [ C(RESULT_ACCESS) ] = 0,
  77                [ C(RESULT_MISS)   ] = 0,
  78        },
  79        [ C(OP_PREFETCH) ] = {
  80                [ C(RESULT_ACCESS) ] = 0,
  81                [ C(RESULT_MISS)   ] = 0,
  82        },
  83 },
  84 [ C(ITLB) ] = {
  85        [ C(OP_READ) ] = {
  86                [ C(RESULT_ACCESS) ] = 0x0080,  /* IFU_IFETCH         */
  87                [ C(RESULT_MISS)   ] = 0x0085,  /* ITLB_MISS          */
  88        },
  89        [ C(OP_WRITE) ] = {
  90                [ C(RESULT_ACCESS) ] = -1,
  91                [ C(RESULT_MISS)   ] = -1,
  92        },
  93        [ C(OP_PREFETCH) ] = {
  94                [ C(RESULT_ACCESS) ] = -1,
  95                [ C(RESULT_MISS)   ] = -1,
  96        },
  97 },
  98 [ C(BPU ) ] = {
  99        [ C(OP_READ) ] = {
 100                [ C(RESULT_ACCESS) ] = 0x00c4,  /* BR_INST_RETIRED      */
 101                [ C(RESULT_MISS)   ] = 0x00c5,  /* BR_MISS_PRED_RETIRED */
 102        },
 103        [ C(OP_WRITE) ] = {
 104                [ C(RESULT_ACCESS) ] = -1,
 105                [ C(RESULT_MISS)   ] = -1,
 106        },
 107        [ C(OP_PREFETCH) ] = {
 108                [ C(RESULT_ACCESS) ] = -1,
 109                [ C(RESULT_MISS)   ] = -1,
 110        },
 111 },
 112};
 113
 114static u64 p6_pmu_event_map(int hw_event)
 115{
 116        return p6_perfmon_event_map[hw_event];
 117}
 118
 119/*
 120 * Event setting that is specified not to count anything.
 121 * We use this to effectively disable a counter.
 122 *
 123 * L2_RQSTS with 0 MESI unit mask.
 124 */
 125#define P6_NOP_EVENT                    0x0000002EULL
 126
 127static struct event_constraint p6_event_constraints[] =
 128{
 129        INTEL_EVENT_CONSTRAINT(0xc1, 0x1),      /* FLOPS */
 130        INTEL_EVENT_CONSTRAINT(0x10, 0x1),      /* FP_COMP_OPS_EXE */
 131        INTEL_EVENT_CONSTRAINT(0x11, 0x2),      /* FP_ASSIST */
 132        INTEL_EVENT_CONSTRAINT(0x12, 0x2),      /* MUL */
 133        INTEL_EVENT_CONSTRAINT(0x13, 0x2),      /* DIV */
 134        INTEL_EVENT_CONSTRAINT(0x14, 0x1),      /* CYCLES_DIV_BUSY */
 135        EVENT_CONSTRAINT_END
 136};
 137
 138static void p6_pmu_disable_all(void)
 139{
 140        u64 val;
 141
 142        /* p6 only has one enable register */
 143        rdmsrl(MSR_P6_EVNTSEL0, val);
 144        val &= ~ARCH_PERFMON_EVENTSEL_ENABLE;
 145        wrmsrl(MSR_P6_EVNTSEL0, val);
 146}
 147
 148static void p6_pmu_enable_all(int added)
 149{
 150        unsigned long val;
 151
 152        /* p6 only has one enable register */
 153        rdmsrl(MSR_P6_EVNTSEL0, val);
 154        val |= ARCH_PERFMON_EVENTSEL_ENABLE;
 155        wrmsrl(MSR_P6_EVNTSEL0, val);
 156}
 157
 158static inline void
 159p6_pmu_disable_event(struct perf_event *event)
 160{
 161        struct hw_perf_event *hwc = &event->hw;
 162        u64 val = P6_NOP_EVENT;
 163
 164        (void)wrmsrl_safe(hwc->config_base, val);
 165}
 166
 167static void p6_pmu_enable_event(struct perf_event *event)
 168{
 169        struct hw_perf_event *hwc = &event->hw;
 170        u64 val;
 171
 172        val = hwc->config;
 173
 174        /*
 175         * p6 only has a global event enable, set on PerfEvtSel0
 176         * We "disable" events by programming P6_NOP_EVENT
 177         * and we rely on p6_pmu_enable_all() being called
 178         * to actually enable the events.
 179         */
 180
 181        (void)wrmsrl_safe(hwc->config_base, val);
 182}
 183
 184PMU_FORMAT_ATTR(event,  "config:0-7"    );
 185PMU_FORMAT_ATTR(umask,  "config:8-15"   );
 186PMU_FORMAT_ATTR(edge,   "config:18"     );
 187PMU_FORMAT_ATTR(pc,     "config:19"     );
 188PMU_FORMAT_ATTR(inv,    "config:23"     );
 189PMU_FORMAT_ATTR(cmask,  "config:24-31"  );
 190
 191static struct attribute *intel_p6_formats_attr[] = {
 192        &format_attr_event.attr,
 193        &format_attr_umask.attr,
 194        &format_attr_edge.attr,
 195        &format_attr_pc.attr,
 196        &format_attr_inv.attr,
 197        &format_attr_cmask.attr,
 198        NULL,
 199};
 200
 201static __initconst const struct x86_pmu p6_pmu = {
 202        .name                   = "p6",
 203        .handle_irq             = x86_pmu_handle_irq,
 204        .disable_all            = p6_pmu_disable_all,
 205        .enable_all             = p6_pmu_enable_all,
 206        .enable                 = p6_pmu_enable_event,
 207        .disable                = p6_pmu_disable_event,
 208        .hw_config              = x86_pmu_hw_config,
 209        .schedule_events        = x86_schedule_events,
 210        .eventsel               = MSR_P6_EVNTSEL0,
 211        .perfctr                = MSR_P6_PERFCTR0,
 212        .event_map              = p6_pmu_event_map,
 213        .max_events             = ARRAY_SIZE(p6_perfmon_event_map),
 214        .apic                   = 1,
 215        .max_period             = (1ULL << 31) - 1,
 216        .version                = 0,
 217        .num_counters           = 2,
 218        /*
 219         * Events have 40 bits implemented. However they are designed such
 220         * that bits [32-39] are sign extensions of bit 31. As such the
 221         * effective width of a event for P6-like PMU is 32 bits only.
 222         *
 223         * See IA-32 Intel Architecture Software developer manual Vol 3B
 224         */
 225        .cntval_bits            = 32,
 226        .cntval_mask            = (1ULL << 32) - 1,
 227        .get_event_constraints  = x86_get_event_constraints,
 228        .event_constraints      = p6_event_constraints,
 229
 230        .format_attrs           = intel_p6_formats_attr,
 231        .events_sysfs_show      = intel_event_sysfs_show,
 232
 233};
 234
 235static __init void p6_pmu_rdpmc_quirk(void)
 236{
 237        if (boot_cpu_data.x86_mask < 9) {
 238                /*
 239                 * PPro erratum 26; fixed in stepping 9 and above.
 240                 */
 241                pr_warn("Userspace RDPMC support disabled due to a CPU erratum\n");
 242                x86_pmu.attr_rdpmc_broken = 1;
 243                x86_pmu.attr_rdpmc = 0;
 244        }
 245}
 246
 247__init int p6_pmu_init(void)
 248{
 249        x86_pmu = p6_pmu;
 250
 251        switch (boot_cpu_data.x86_model) {
 252        case  1: /* Pentium Pro */
 253                x86_add_quirk(p6_pmu_rdpmc_quirk);
 254                break;
 255
 256        case  3: /* Pentium II - Klamath */
 257        case  5: /* Pentium II - Deschutes */
 258        case  6: /* Pentium II - Mendocino */
 259                break;
 260
 261        case  7: /* Pentium III - Katmai */
 262        case  8: /* Pentium III - Coppermine */
 263        case 10: /* Pentium III Xeon */
 264        case 11: /* Pentium III - Tualatin */
 265                break;
 266
 267        case  9: /* Pentium M - Banias */
 268        case 13: /* Pentium M - Dothan */
 269                break;
 270
 271        default:
 272                pr_cont("unsupported p6 CPU model %d ", boot_cpu_data.x86_model);
 273                return -ENODEV;
 274        }
 275
 276        memcpy(hw_cache_event_ids, p6_hw_cache_event_ids,
 277                sizeof(hw_cache_event_ids));
 278
 279        return 0;
 280}
 281