cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

amd_nb.c (14017B)


      1// SPDX-License-Identifier: GPL-2.0-only
      2/*
      3 * Shared support code for AMD K8 northbridges and derivatives.
      4 * Copyright 2006 Andi Kleen, SUSE Labs.
      5 */
      6
      7#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
      8
      9#include <linux/types.h>
     10#include <linux/slab.h>
     11#include <linux/init.h>
     12#include <linux/errno.h>
     13#include <linux/export.h>
     14#include <linux/spinlock.h>
     15#include <linux/pci_ids.h>
     16#include <asm/amd_nb.h>
     17
     18#define PCI_DEVICE_ID_AMD_17H_ROOT	0x1450
     19#define PCI_DEVICE_ID_AMD_17H_M10H_ROOT	0x15d0
     20#define PCI_DEVICE_ID_AMD_17H_M30H_ROOT	0x1480
     21#define PCI_DEVICE_ID_AMD_17H_M60H_ROOT	0x1630
     22#define PCI_DEVICE_ID_AMD_19H_M10H_ROOT	0x14a4
     23#define PCI_DEVICE_ID_AMD_17H_DF_F4	0x1464
     24#define PCI_DEVICE_ID_AMD_17H_M10H_DF_F4 0x15ec
     25#define PCI_DEVICE_ID_AMD_17H_M30H_DF_F4 0x1494
     26#define PCI_DEVICE_ID_AMD_17H_M60H_DF_F4 0x144c
     27#define PCI_DEVICE_ID_AMD_17H_M70H_DF_F4 0x1444
     28#define PCI_DEVICE_ID_AMD_19H_DF_F4	0x1654
     29#define PCI_DEVICE_ID_AMD_19H_M10H_DF_F4 0x14b1
     30#define PCI_DEVICE_ID_AMD_19H_M40H_ROOT	0x14b5
     31#define PCI_DEVICE_ID_AMD_19H_M40H_DF_F4 0x167d
     32#define PCI_DEVICE_ID_AMD_19H_M50H_DF_F4 0x166e
     33
     34/* Protect the PCI config register pairs used for SMN. */
     35static DEFINE_MUTEX(smn_mutex);
     36
     37static u32 *flush_words;
     38
     39static const struct pci_device_id amd_root_ids[] = {
     40	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_ROOT) },
     41	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M10H_ROOT) },
     42	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M30H_ROOT) },
     43	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M60H_ROOT) },
     44	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_M10H_ROOT) },
     45	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_M40H_ROOT) },
     46	{}
     47};
     48
     49#define PCI_DEVICE_ID_AMD_CNB17H_F4     0x1704
     50
     51static const struct pci_device_id amd_nb_misc_ids[] = {
     52	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_K8_NB_MISC) },
     53	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_10H_NB_MISC) },
     54	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_NB_F3) },
     55	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M10H_F3) },
     56	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M30H_NB_F3) },
     57	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M60H_NB_F3) },
     58	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_16H_NB_F3) },
     59	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_16H_M30H_NB_F3) },
     60	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_DF_F3) },
     61	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M10H_DF_F3) },
     62	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M30H_DF_F3) },
     63	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M60H_DF_F3) },
     64	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_CNB17H_F3) },
     65	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M70H_DF_F3) },
     66	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_DF_F3) },
     67	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_M10H_DF_F3) },
     68	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_M40H_DF_F3) },
     69	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_M50H_DF_F3) },
     70	{}
     71};
     72
     73static const struct pci_device_id amd_nb_link_ids[] = {
     74	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_NB_F4) },
     75	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M30H_NB_F4) },
     76	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M60H_NB_F4) },
     77	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_16H_NB_F4) },
     78	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_16H_M30H_NB_F4) },
     79	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_DF_F4) },
     80	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M10H_DF_F4) },
     81	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M30H_DF_F4) },
     82	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M60H_DF_F4) },
     83	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M70H_DF_F4) },
     84	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_DF_F4) },
     85	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_M10H_DF_F4) },
     86	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_M40H_DF_F4) },
     87	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_19H_M50H_DF_F4) },
     88	{ PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_CNB17H_F4) },
     89	{}
     90};
     91
     92static const struct pci_device_id hygon_root_ids[] = {
     93	{ PCI_DEVICE(PCI_VENDOR_ID_HYGON, PCI_DEVICE_ID_AMD_17H_ROOT) },
     94	{}
     95};
     96
     97static const struct pci_device_id hygon_nb_misc_ids[] = {
     98	{ PCI_DEVICE(PCI_VENDOR_ID_HYGON, PCI_DEVICE_ID_AMD_17H_DF_F3) },
     99	{}
    100};
    101
    102static const struct pci_device_id hygon_nb_link_ids[] = {
    103	{ PCI_DEVICE(PCI_VENDOR_ID_HYGON, PCI_DEVICE_ID_AMD_17H_DF_F4) },
    104	{}
    105};
    106
    107const struct amd_nb_bus_dev_range amd_nb_bus_dev_ranges[] __initconst = {
    108	{ 0x00, 0x18, 0x20 },
    109	{ 0xff, 0x00, 0x20 },
    110	{ 0xfe, 0x00, 0x20 },
    111	{ }
    112};
    113
    114static struct amd_northbridge_info amd_northbridges;
    115
    116u16 amd_nb_num(void)
    117{
    118	return amd_northbridges.num;
    119}
    120EXPORT_SYMBOL_GPL(amd_nb_num);
    121
    122bool amd_nb_has_feature(unsigned int feature)
    123{
    124	return ((amd_northbridges.flags & feature) == feature);
    125}
    126EXPORT_SYMBOL_GPL(amd_nb_has_feature);
    127
    128struct amd_northbridge *node_to_amd_nb(int node)
    129{
    130	return (node < amd_northbridges.num) ? &amd_northbridges.nb[node] : NULL;
    131}
    132EXPORT_SYMBOL_GPL(node_to_amd_nb);
    133
    134static struct pci_dev *next_northbridge(struct pci_dev *dev,
    135					const struct pci_device_id *ids)
    136{
    137	do {
    138		dev = pci_get_device(PCI_ANY_ID, PCI_ANY_ID, dev);
    139		if (!dev)
    140			break;
    141	} while (!pci_match_id(ids, dev));
    142	return dev;
    143}
    144
    145static int __amd_smn_rw(u16 node, u32 address, u32 *value, bool write)
    146{
    147	struct pci_dev *root;
    148	int err = -ENODEV;
    149
    150	if (node >= amd_northbridges.num)
    151		goto out;
    152
    153	root = node_to_amd_nb(node)->root;
    154	if (!root)
    155		goto out;
    156
    157	mutex_lock(&smn_mutex);
    158
    159	err = pci_write_config_dword(root, 0x60, address);
    160	if (err) {
    161		pr_warn("Error programming SMN address 0x%x.\n", address);
    162		goto out_unlock;
    163	}
    164
    165	err = (write ? pci_write_config_dword(root, 0x64, *value)
    166		     : pci_read_config_dword(root, 0x64, value));
    167	if (err)
    168		pr_warn("Error %s SMN address 0x%x.\n",
    169			(write ? "writing to" : "reading from"), address);
    170
    171out_unlock:
    172	mutex_unlock(&smn_mutex);
    173
    174out:
    175	return err;
    176}
    177
    178int amd_smn_read(u16 node, u32 address, u32 *value)
    179{
    180	return __amd_smn_rw(node, address, value, false);
    181}
    182EXPORT_SYMBOL_GPL(amd_smn_read);
    183
    184int amd_smn_write(u16 node, u32 address, u32 value)
    185{
    186	return __amd_smn_rw(node, address, &value, true);
    187}
    188EXPORT_SYMBOL_GPL(amd_smn_write);
    189
    190
    191static int amd_cache_northbridges(void)
    192{
    193	const struct pci_device_id *misc_ids = amd_nb_misc_ids;
    194	const struct pci_device_id *link_ids = amd_nb_link_ids;
    195	const struct pci_device_id *root_ids = amd_root_ids;
    196	struct pci_dev *root, *misc, *link;
    197	struct amd_northbridge *nb;
    198	u16 roots_per_misc = 0;
    199	u16 misc_count = 0;
    200	u16 root_count = 0;
    201	u16 i, j;
    202
    203	if (amd_northbridges.num)
    204		return 0;
    205
    206	if (boot_cpu_data.x86_vendor == X86_VENDOR_HYGON) {
    207		root_ids = hygon_root_ids;
    208		misc_ids = hygon_nb_misc_ids;
    209		link_ids = hygon_nb_link_ids;
    210	}
    211
    212	misc = NULL;
    213	while ((misc = next_northbridge(misc, misc_ids)))
    214		misc_count++;
    215
    216	if (!misc_count)
    217		return -ENODEV;
    218
    219	root = NULL;
    220	while ((root = next_northbridge(root, root_ids)))
    221		root_count++;
    222
    223	if (root_count) {
    224		roots_per_misc = root_count / misc_count;
    225
    226		/*
    227		 * There should be _exactly_ N roots for each DF/SMN
    228		 * interface.
    229		 */
    230		if (!roots_per_misc || (root_count % roots_per_misc)) {
    231			pr_info("Unsupported AMD DF/PCI configuration found\n");
    232			return -ENODEV;
    233		}
    234	}
    235
    236	nb = kcalloc(misc_count, sizeof(struct amd_northbridge), GFP_KERNEL);
    237	if (!nb)
    238		return -ENOMEM;
    239
    240	amd_northbridges.nb = nb;
    241	amd_northbridges.num = misc_count;
    242
    243	link = misc = root = NULL;
    244	for (i = 0; i < amd_northbridges.num; i++) {
    245		node_to_amd_nb(i)->root = root =
    246			next_northbridge(root, root_ids);
    247		node_to_amd_nb(i)->misc = misc =
    248			next_northbridge(misc, misc_ids);
    249		node_to_amd_nb(i)->link = link =
    250			next_northbridge(link, link_ids);
    251
    252		/*
    253		 * If there are more PCI root devices than data fabric/
    254		 * system management network interfaces, then the (N)
    255		 * PCI roots per DF/SMN interface are functionally the
    256		 * same (for DF/SMN access) and N-1 are redundant.  N-1
    257		 * PCI roots should be skipped per DF/SMN interface so
    258		 * the following DF/SMN interfaces get mapped to
    259		 * correct PCI roots.
    260		 */
    261		for (j = 1; j < roots_per_misc; j++)
    262			root = next_northbridge(root, root_ids);
    263	}
    264
    265	if (amd_gart_present())
    266		amd_northbridges.flags |= AMD_NB_GART;
    267
    268	/*
    269	 * Check for L3 cache presence.
    270	 */
    271	if (!cpuid_edx(0x80000006))
    272		return 0;
    273
    274	/*
    275	 * Some CPU families support L3 Cache Index Disable. There are some
    276	 * limitations because of E382 and E388 on family 0x10.
    277	 */
    278	if (boot_cpu_data.x86 == 0x10 &&
    279	    boot_cpu_data.x86_model >= 0x8 &&
    280	    (boot_cpu_data.x86_model > 0x9 ||
    281	     boot_cpu_data.x86_stepping >= 0x1))
    282		amd_northbridges.flags |= AMD_NB_L3_INDEX_DISABLE;
    283
    284	if (boot_cpu_data.x86 == 0x15)
    285		amd_northbridges.flags |= AMD_NB_L3_INDEX_DISABLE;
    286
    287	/* L3 cache partitioning is supported on family 0x15 */
    288	if (boot_cpu_data.x86 == 0x15)
    289		amd_northbridges.flags |= AMD_NB_L3_PARTITIONING;
    290
    291	return 0;
    292}
    293
    294/*
    295 * Ignores subdevice/subvendor but as far as I can figure out
    296 * they're useless anyways
    297 */
    298bool __init early_is_amd_nb(u32 device)
    299{
    300	const struct pci_device_id *misc_ids = amd_nb_misc_ids;
    301	const struct pci_device_id *id;
    302	u32 vendor = device & 0xffff;
    303
    304	if (boot_cpu_data.x86_vendor != X86_VENDOR_AMD &&
    305	    boot_cpu_data.x86_vendor != X86_VENDOR_HYGON)
    306		return false;
    307
    308	if (boot_cpu_data.x86_vendor == X86_VENDOR_HYGON)
    309		misc_ids = hygon_nb_misc_ids;
    310
    311	device >>= 16;
    312	for (id = misc_ids; id->vendor; id++)
    313		if (vendor == id->vendor && device == id->device)
    314			return true;
    315	return false;
    316}
    317
    318struct resource *amd_get_mmconfig_range(struct resource *res)
    319{
    320	u32 address;
    321	u64 base, msr;
    322	unsigned int segn_busn_bits;
    323
    324	if (boot_cpu_data.x86_vendor != X86_VENDOR_AMD &&
    325	    boot_cpu_data.x86_vendor != X86_VENDOR_HYGON)
    326		return NULL;
    327
    328	/* assume all cpus from fam10h have mmconfig */
    329	if (boot_cpu_data.x86 < 0x10)
    330		return NULL;
    331
    332	address = MSR_FAM10H_MMIO_CONF_BASE;
    333	rdmsrl(address, msr);
    334
    335	/* mmconfig is not enabled */
    336	if (!(msr & FAM10H_MMIO_CONF_ENABLE))
    337		return NULL;
    338
    339	base = msr & (FAM10H_MMIO_CONF_BASE_MASK<<FAM10H_MMIO_CONF_BASE_SHIFT);
    340
    341	segn_busn_bits = (msr >> FAM10H_MMIO_CONF_BUSRANGE_SHIFT) &
    342			 FAM10H_MMIO_CONF_BUSRANGE_MASK;
    343
    344	res->flags = IORESOURCE_MEM;
    345	res->start = base;
    346	res->end = base + (1ULL<<(segn_busn_bits + 20)) - 1;
    347	return res;
    348}
    349
    350int amd_get_subcaches(int cpu)
    351{
    352	struct pci_dev *link = node_to_amd_nb(topology_die_id(cpu))->link;
    353	unsigned int mask;
    354
    355	if (!amd_nb_has_feature(AMD_NB_L3_PARTITIONING))
    356		return 0;
    357
    358	pci_read_config_dword(link, 0x1d4, &mask);
    359
    360	return (mask >> (4 * cpu_data(cpu).cpu_core_id)) & 0xf;
    361}
    362
    363int amd_set_subcaches(int cpu, unsigned long mask)
    364{
    365	static unsigned int reset, ban;
    366	struct amd_northbridge *nb = node_to_amd_nb(topology_die_id(cpu));
    367	unsigned int reg;
    368	int cuid;
    369
    370	if (!amd_nb_has_feature(AMD_NB_L3_PARTITIONING) || mask > 0xf)
    371		return -EINVAL;
    372
    373	/* if necessary, collect reset state of L3 partitioning and BAN mode */
    374	if (reset == 0) {
    375		pci_read_config_dword(nb->link, 0x1d4, &reset);
    376		pci_read_config_dword(nb->misc, 0x1b8, &ban);
    377		ban &= 0x180000;
    378	}
    379
    380	/* deactivate BAN mode if any subcaches are to be disabled */
    381	if (mask != 0xf) {
    382		pci_read_config_dword(nb->misc, 0x1b8, &reg);
    383		pci_write_config_dword(nb->misc, 0x1b8, reg & ~0x180000);
    384	}
    385
    386	cuid = cpu_data(cpu).cpu_core_id;
    387	mask <<= 4 * cuid;
    388	mask |= (0xf ^ (1 << cuid)) << 26;
    389
    390	pci_write_config_dword(nb->link, 0x1d4, mask);
    391
    392	/* reset BAN mode if L3 partitioning returned to reset state */
    393	pci_read_config_dword(nb->link, 0x1d4, &reg);
    394	if (reg == reset) {
    395		pci_read_config_dword(nb->misc, 0x1b8, &reg);
    396		reg &= ~0x180000;
    397		pci_write_config_dword(nb->misc, 0x1b8, reg | ban);
    398	}
    399
    400	return 0;
    401}
    402
    403static void amd_cache_gart(void)
    404{
    405	u16 i;
    406
    407	if (!amd_nb_has_feature(AMD_NB_GART))
    408		return;
    409
    410	flush_words = kmalloc_array(amd_northbridges.num, sizeof(u32), GFP_KERNEL);
    411	if (!flush_words) {
    412		amd_northbridges.flags &= ~AMD_NB_GART;
    413		pr_notice("Cannot initialize GART flush words, GART support disabled\n");
    414		return;
    415	}
    416
    417	for (i = 0; i != amd_northbridges.num; i++)
    418		pci_read_config_dword(node_to_amd_nb(i)->misc, 0x9c, &flush_words[i]);
    419}
    420
    421void amd_flush_garts(void)
    422{
    423	int flushed, i;
    424	unsigned long flags;
    425	static DEFINE_SPINLOCK(gart_lock);
    426
    427	if (!amd_nb_has_feature(AMD_NB_GART))
    428		return;
    429
    430	/*
    431	 * Avoid races between AGP and IOMMU. In theory it's not needed
    432	 * but I'm not sure if the hardware won't lose flush requests
    433	 * when another is pending. This whole thing is so expensive anyways
    434	 * that it doesn't matter to serialize more. -AK
    435	 */
    436	spin_lock_irqsave(&gart_lock, flags);
    437	flushed = 0;
    438	for (i = 0; i < amd_northbridges.num; i++) {
    439		pci_write_config_dword(node_to_amd_nb(i)->misc, 0x9c,
    440				       flush_words[i] | 1);
    441		flushed++;
    442	}
    443	for (i = 0; i < amd_northbridges.num; i++) {
    444		u32 w;
    445		/* Make sure the hardware actually executed the flush*/
    446		for (;;) {
    447			pci_read_config_dword(node_to_amd_nb(i)->misc,
    448					      0x9c, &w);
    449			if (!(w & 1))
    450				break;
    451			cpu_relax();
    452		}
    453	}
    454	spin_unlock_irqrestore(&gart_lock, flags);
    455	if (!flushed)
    456		pr_notice("nothing to flush?\n");
    457}
    458EXPORT_SYMBOL_GPL(amd_flush_garts);
    459
    460static void __fix_erratum_688(void *info)
    461{
    462#define MSR_AMD64_IC_CFG 0xC0011021
    463
    464	msr_set_bit(MSR_AMD64_IC_CFG, 3);
    465	msr_set_bit(MSR_AMD64_IC_CFG, 14);
    466}
    467
    468/* Apply erratum 688 fix so machines without a BIOS fix work. */
    469static __init void fix_erratum_688(void)
    470{
    471	struct pci_dev *F4;
    472	u32 val;
    473
    474	if (boot_cpu_data.x86 != 0x14)
    475		return;
    476
    477	if (!amd_northbridges.num)
    478		return;
    479
    480	F4 = node_to_amd_nb(0)->link;
    481	if (!F4)
    482		return;
    483
    484	if (pci_read_config_dword(F4, 0x164, &val))
    485		return;
    486
    487	if (val & BIT(2))
    488		return;
    489
    490	on_each_cpu(__fix_erratum_688, NULL, 0);
    491
    492	pr_info("x86/cpu/AMD: CPU erratum 688 worked around\n");
    493}
    494
    495static __init int init_amd_nbs(void)
    496{
    497	amd_cache_northbridges();
    498	amd_cache_gart();
    499
    500	fix_erratum_688();
    501
    502	return 0;
    503}
    504
    505/* This has to go after the PCI subsystem */
    506fs_initcall(init_amd_nbs);