cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

p6.c (7040B)


      1// SPDX-License-Identifier: GPL-2.0
      2#include <linux/perf_event.h>
      3#include <linux/types.h>
      4
      5#include "../perf_event.h"
      6
      7/*
      8 * Not sure about some of these
      9 */
     10static const u64 p6_perfmon_event_map[] =
     11{
     12  [PERF_COUNT_HW_CPU_CYCLES]		= 0x0079,	/* CPU_CLK_UNHALTED */
     13  [PERF_COUNT_HW_INSTRUCTIONS]		= 0x00c0,	/* INST_RETIRED     */
     14  [PERF_COUNT_HW_CACHE_REFERENCES]	= 0x0f2e,	/* L2_RQSTS:M:E:S:I */
     15  [PERF_COUNT_HW_CACHE_MISSES]		= 0x012e,	/* L2_RQSTS:I       */
     16  [PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= 0x00c4,	/* BR_INST_RETIRED  */
     17  [PERF_COUNT_HW_BRANCH_MISSES]		= 0x00c5,	/* BR_MISS_PRED_RETIRED */
     18  [PERF_COUNT_HW_BUS_CYCLES]		= 0x0062,	/* BUS_DRDY_CLOCKS  */
     19  [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = 0x00a2,	/* RESOURCE_STALLS  */
     20
     21};
     22
     23static const u64 __initconst p6_hw_cache_event_ids
     24				[PERF_COUNT_HW_CACHE_MAX]
     25				[PERF_COUNT_HW_CACHE_OP_MAX]
     26				[PERF_COUNT_HW_CACHE_RESULT_MAX] =
     27{
     28 [ C(L1D) ] = {
     29	[ C(OP_READ) ] = {
     30		[ C(RESULT_ACCESS) ] = 0x0043,	/* DATA_MEM_REFS       */
     31                [ C(RESULT_MISS)   ] = 0x0045,	/* DCU_LINES_IN        */
     32	},
     33	[ C(OP_WRITE) ] = {
     34		[ C(RESULT_ACCESS) ] = 0,
     35		[ C(RESULT_MISS)   ] = 0x0f29,	/* L2_LD:M:E:S:I       */
     36	},
     37        [ C(OP_PREFETCH) ] = {
     38		[ C(RESULT_ACCESS) ] = 0,
     39		[ C(RESULT_MISS)   ] = 0,
     40        },
     41 },
     42 [ C(L1I ) ] = {
     43	[ C(OP_READ) ] = {
     44		[ C(RESULT_ACCESS) ] = 0x0080,	/* IFU_IFETCH         */
     45		[ C(RESULT_MISS)   ] = 0x0f28,	/* L2_IFETCH:M:E:S:I  */
     46	},
     47	[ C(OP_WRITE) ] = {
     48		[ C(RESULT_ACCESS) ] = -1,
     49		[ C(RESULT_MISS)   ] = -1,
     50	},
     51	[ C(OP_PREFETCH) ] = {
     52		[ C(RESULT_ACCESS) ] = 0,
     53		[ C(RESULT_MISS)   ] = 0,
     54	},
     55 },
     56 [ C(LL  ) ] = {
     57	[ C(OP_READ) ] = {
     58		[ C(RESULT_ACCESS) ] = 0,
     59		[ C(RESULT_MISS)   ] = 0,
     60	},
     61	[ C(OP_WRITE) ] = {
     62		[ C(RESULT_ACCESS) ] = 0,
     63		[ C(RESULT_MISS)   ] = 0x0025,	/* L2_M_LINES_INM     */
     64	},
     65	[ C(OP_PREFETCH) ] = {
     66		[ C(RESULT_ACCESS) ] = 0,
     67		[ C(RESULT_MISS)   ] = 0,
     68	},
     69 },
     70 [ C(DTLB) ] = {
     71	[ C(OP_READ) ] = {
     72		[ C(RESULT_ACCESS) ] = 0x0043,	/* DATA_MEM_REFS      */
     73		[ C(RESULT_MISS)   ] = 0,
     74	},
     75	[ C(OP_WRITE) ] = {
     76		[ C(RESULT_ACCESS) ] = 0,
     77		[ C(RESULT_MISS)   ] = 0,
     78	},
     79	[ C(OP_PREFETCH) ] = {
     80		[ C(RESULT_ACCESS) ] = 0,
     81		[ C(RESULT_MISS)   ] = 0,
     82	},
     83 },
     84 [ C(ITLB) ] = {
     85	[ C(OP_READ) ] = {
     86		[ C(RESULT_ACCESS) ] = 0x0080,	/* IFU_IFETCH         */
     87		[ C(RESULT_MISS)   ] = 0x0085,	/* ITLB_MISS          */
     88	},
     89	[ C(OP_WRITE) ] = {
     90		[ C(RESULT_ACCESS) ] = -1,
     91		[ C(RESULT_MISS)   ] = -1,
     92	},
     93	[ C(OP_PREFETCH) ] = {
     94		[ C(RESULT_ACCESS) ] = -1,
     95		[ C(RESULT_MISS)   ] = -1,
     96	},
     97 },
     98 [ C(BPU ) ] = {
     99	[ C(OP_READ) ] = {
    100		[ C(RESULT_ACCESS) ] = 0x00c4,	/* BR_INST_RETIRED      */
    101		[ C(RESULT_MISS)   ] = 0x00c5,	/* BR_MISS_PRED_RETIRED */
    102        },
    103	[ C(OP_WRITE) ] = {
    104		[ C(RESULT_ACCESS) ] = -1,
    105		[ C(RESULT_MISS)   ] = -1,
    106	},
    107	[ C(OP_PREFETCH) ] = {
    108		[ C(RESULT_ACCESS) ] = -1,
    109		[ C(RESULT_MISS)   ] = -1,
    110	},
    111 },
    112};
    113
    114static u64 p6_pmu_event_map(int hw_event)
    115{
    116	return p6_perfmon_event_map[hw_event];
    117}
    118
    119/*
    120 * Event setting that is specified not to count anything.
    121 * We use this to effectively disable a counter.
    122 *
    123 * L2_RQSTS with 0 MESI unit mask.
    124 */
    125#define P6_NOP_EVENT			0x0000002EULL
    126
    127static struct event_constraint p6_event_constraints[] =
    128{
    129	INTEL_EVENT_CONSTRAINT(0xc1, 0x1),	/* FLOPS */
    130	INTEL_EVENT_CONSTRAINT(0x10, 0x1),	/* FP_COMP_OPS_EXE */
    131	INTEL_EVENT_CONSTRAINT(0x11, 0x2),	/* FP_ASSIST */
    132	INTEL_EVENT_CONSTRAINT(0x12, 0x2),	/* MUL */
    133	INTEL_EVENT_CONSTRAINT(0x13, 0x2),	/* DIV */
    134	INTEL_EVENT_CONSTRAINT(0x14, 0x1),	/* CYCLES_DIV_BUSY */
    135	EVENT_CONSTRAINT_END
    136};
    137
    138static void p6_pmu_disable_all(void)
    139{
    140	u64 val;
    141
    142	/* p6 only has one enable register */
    143	rdmsrl(MSR_P6_EVNTSEL0, val);
    144	val &= ~ARCH_PERFMON_EVENTSEL_ENABLE;
    145	wrmsrl(MSR_P6_EVNTSEL0, val);
    146}
    147
    148static void p6_pmu_enable_all(int added)
    149{
    150	unsigned long val;
    151
    152	/* p6 only has one enable register */
    153	rdmsrl(MSR_P6_EVNTSEL0, val);
    154	val |= ARCH_PERFMON_EVENTSEL_ENABLE;
    155	wrmsrl(MSR_P6_EVNTSEL0, val);
    156}
    157
    158static inline void
    159p6_pmu_disable_event(struct perf_event *event)
    160{
    161	struct hw_perf_event *hwc = &event->hw;
    162	u64 val = P6_NOP_EVENT;
    163
    164	(void)wrmsrl_safe(hwc->config_base, val);
    165}
    166
    167static void p6_pmu_enable_event(struct perf_event *event)
    168{
    169	struct hw_perf_event *hwc = &event->hw;
    170	u64 val;
    171
    172	val = hwc->config;
    173
    174	/*
    175	 * p6 only has a global event enable, set on PerfEvtSel0
    176	 * We "disable" events by programming P6_NOP_EVENT
    177	 * and we rely on p6_pmu_enable_all() being called
    178	 * to actually enable the events.
    179	 */
    180
    181	(void)wrmsrl_safe(hwc->config_base, val);
    182}
    183
    184PMU_FORMAT_ATTR(event,	"config:0-7"	);
    185PMU_FORMAT_ATTR(umask,	"config:8-15"	);
    186PMU_FORMAT_ATTR(edge,	"config:18"	);
    187PMU_FORMAT_ATTR(pc,	"config:19"	);
    188PMU_FORMAT_ATTR(inv,	"config:23"	);
    189PMU_FORMAT_ATTR(cmask,	"config:24-31"	);
    190
    191static struct attribute *intel_p6_formats_attr[] = {
    192	&format_attr_event.attr,
    193	&format_attr_umask.attr,
    194	&format_attr_edge.attr,
    195	&format_attr_pc.attr,
    196	&format_attr_inv.attr,
    197	&format_attr_cmask.attr,
    198	NULL,
    199};
    200
    201static __initconst const struct x86_pmu p6_pmu = {
    202	.name			= "p6",
    203	.handle_irq		= x86_pmu_handle_irq,
    204	.disable_all		= p6_pmu_disable_all,
    205	.enable_all		= p6_pmu_enable_all,
    206	.enable			= p6_pmu_enable_event,
    207	.disable		= p6_pmu_disable_event,
    208	.hw_config		= x86_pmu_hw_config,
    209	.schedule_events	= x86_schedule_events,
    210	.eventsel		= MSR_P6_EVNTSEL0,
    211	.perfctr		= MSR_P6_PERFCTR0,
    212	.event_map		= p6_pmu_event_map,
    213	.max_events		= ARRAY_SIZE(p6_perfmon_event_map),
    214	.apic			= 1,
    215	.max_period		= (1ULL << 31) - 1,
    216	.version		= 0,
    217	.num_counters		= 2,
    218	/*
    219	 * Events have 40 bits implemented. However they are designed such
    220	 * that bits [32-39] are sign extensions of bit 31. As such the
    221	 * effective width of a event for P6-like PMU is 32 bits only.
    222	 *
    223	 * See IA-32 Intel Architecture Software developer manual Vol 3B
    224	 */
    225	.cntval_bits		= 32,
    226	.cntval_mask		= (1ULL << 32) - 1,
    227	.get_event_constraints	= x86_get_event_constraints,
    228	.event_constraints	= p6_event_constraints,
    229
    230	.format_attrs		= intel_p6_formats_attr,
    231	.events_sysfs_show	= intel_event_sysfs_show,
    232
    233};
    234
    235static __init void p6_pmu_rdpmc_quirk(void)
    236{
    237	if (boot_cpu_data.x86_stepping < 9) {
    238		/*
    239		 * PPro erratum 26; fixed in stepping 9 and above.
    240		 */
    241		pr_warn("Userspace RDPMC support disabled due to a CPU erratum\n");
    242		x86_pmu.attr_rdpmc_broken = 1;
    243		x86_pmu.attr_rdpmc = 0;
    244	}
    245}
    246
    247__init int p6_pmu_init(void)
    248{
    249	x86_pmu = p6_pmu;
    250
    251	switch (boot_cpu_data.x86_model) {
    252	case  1: /* Pentium Pro */
    253		x86_add_quirk(p6_pmu_rdpmc_quirk);
    254		break;
    255
    256	case  3: /* Pentium II - Klamath */
    257	case  5: /* Pentium II - Deschutes */
    258	case  6: /* Pentium II - Mendocino */
    259		break;
    260
    261	case  7: /* Pentium III - Katmai */
    262	case  8: /* Pentium III - Coppermine */
    263	case 10: /* Pentium III Xeon */
    264	case 11: /* Pentium III - Tualatin */
    265		break;
    266
    267	case  9: /* Pentium M - Banias */
    268	case 13: /* Pentium M - Dothan */
    269		break;
    270
    271	default:
    272		pr_cont("unsupported p6 CPU model %d ", boot_cpu_data.x86_model);
    273		return -ENODEV;
    274	}
    275
    276	memcpy(hw_cache_event_ids, p6_hw_cache_event_ids,
    277		sizeof(hw_cache_event_ids));
    278
    279	return 0;
    280}