cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

pci.c (28427B)


      1// SPDX-License-Identifier: GPL-2.0
      2/*
      3 * Copyright IBM Corp. 2012
      4 *
      5 * Author(s):
      6 *   Jan Glauber <jang@linux.vnet.ibm.com>
      7 *
      8 * The System z PCI code is a rewrite from a prototype by
      9 * the following people (Kudoz!):
     10 *   Alexander Schmidt
     11 *   Christoph Raisch
     12 *   Hannes Hering
     13 *   Hoang-Nam Nguyen
     14 *   Jan-Bernd Themann
     15 *   Stefan Roscher
     16 *   Thomas Klein
     17 */
     18
     19#define KMSG_COMPONENT "zpci"
     20#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
     21
     22#include <linux/kernel.h>
     23#include <linux/slab.h>
     24#include <linux/err.h>
     25#include <linux/export.h>
     26#include <linux/delay.h>
     27#include <linux/seq_file.h>
     28#include <linux/jump_label.h>
     29#include <linux/pci.h>
     30#include <linux/printk.h>
     31
     32#include <asm/isc.h>
     33#include <asm/airq.h>
     34#include <asm/facility.h>
     35#include <asm/pci_insn.h>
     36#include <asm/pci_clp.h>
     37#include <asm/pci_dma.h>
     38
     39#include "pci_bus.h"
     40#include "pci_iov.h"
     41
     42/* list of all detected zpci devices */
     43static LIST_HEAD(zpci_list);
     44static DEFINE_SPINLOCK(zpci_list_lock);
     45
     46static DECLARE_BITMAP(zpci_domain, ZPCI_DOMAIN_BITMAP_SIZE);
     47static DEFINE_SPINLOCK(zpci_domain_lock);
     48
     49#define ZPCI_IOMAP_ENTRIES						\
     50	min(((unsigned long) ZPCI_NR_DEVICES * PCI_STD_NUM_BARS / 2),	\
     51	    ZPCI_IOMAP_MAX_ENTRIES)
     52
     53unsigned int s390_pci_no_rid;
     54
     55static DEFINE_SPINLOCK(zpci_iomap_lock);
     56static unsigned long *zpci_iomap_bitmap;
     57struct zpci_iomap_entry *zpci_iomap_start;
     58EXPORT_SYMBOL_GPL(zpci_iomap_start);
     59
     60DEFINE_STATIC_KEY_FALSE(have_mio);
     61
     62static struct kmem_cache *zdev_fmb_cache;
     63
     64struct zpci_dev *get_zdev_by_fid(u32 fid)
     65{
     66	struct zpci_dev *tmp, *zdev = NULL;
     67
     68	spin_lock(&zpci_list_lock);
     69	list_for_each_entry(tmp, &zpci_list, entry) {
     70		if (tmp->fid == fid) {
     71			zdev = tmp;
     72			zpci_zdev_get(zdev);
     73			break;
     74		}
     75	}
     76	spin_unlock(&zpci_list_lock);
     77	return zdev;
     78}
     79
     80void zpci_remove_reserved_devices(void)
     81{
     82	struct zpci_dev *tmp, *zdev;
     83	enum zpci_state state;
     84	LIST_HEAD(remove);
     85
     86	spin_lock(&zpci_list_lock);
     87	list_for_each_entry_safe(zdev, tmp, &zpci_list, entry) {
     88		if (zdev->state == ZPCI_FN_STATE_STANDBY &&
     89		    !clp_get_state(zdev->fid, &state) &&
     90		    state == ZPCI_FN_STATE_RESERVED)
     91			list_move_tail(&zdev->entry, &remove);
     92	}
     93	spin_unlock(&zpci_list_lock);
     94
     95	list_for_each_entry_safe(zdev, tmp, &remove, entry)
     96		zpci_device_reserved(zdev);
     97}
     98
     99int pci_domain_nr(struct pci_bus *bus)
    100{
    101	return ((struct zpci_bus *) bus->sysdata)->domain_nr;
    102}
    103EXPORT_SYMBOL_GPL(pci_domain_nr);
    104
    105int pci_proc_domain(struct pci_bus *bus)
    106{
    107	return pci_domain_nr(bus);
    108}
    109EXPORT_SYMBOL_GPL(pci_proc_domain);
    110
    111/* Modify PCI: Register I/O address translation parameters */
    112int zpci_register_ioat(struct zpci_dev *zdev, u8 dmaas,
    113		       u64 base, u64 limit, u64 iota)
    114{
    115	u64 req = ZPCI_CREATE_REQ(zdev->fh, dmaas, ZPCI_MOD_FC_REG_IOAT);
    116	struct zpci_fib fib = {0};
    117	u8 cc, status;
    118
    119	WARN_ON_ONCE(iota & 0x3fff);
    120	fib.pba = base;
    121	fib.pal = limit;
    122	fib.iota = iota | ZPCI_IOTA_RTTO_FLAG;
    123	cc = zpci_mod_fc(req, &fib, &status);
    124	if (cc)
    125		zpci_dbg(3, "reg ioat fid:%x, cc:%d, status:%d\n", zdev->fid, cc, status);
    126	return cc;
    127}
    128
    129/* Modify PCI: Unregister I/O address translation parameters */
    130int zpci_unregister_ioat(struct zpci_dev *zdev, u8 dmaas)
    131{
    132	u64 req = ZPCI_CREATE_REQ(zdev->fh, dmaas, ZPCI_MOD_FC_DEREG_IOAT);
    133	struct zpci_fib fib = {0};
    134	u8 cc, status;
    135
    136	cc = zpci_mod_fc(req, &fib, &status);
    137	if (cc)
    138		zpci_dbg(3, "unreg ioat fid:%x, cc:%d, status:%d\n", zdev->fid, cc, status);
    139	return cc;
    140}
    141
    142/* Modify PCI: Set PCI function measurement parameters */
    143int zpci_fmb_enable_device(struct zpci_dev *zdev)
    144{
    145	u64 req = ZPCI_CREATE_REQ(zdev->fh, 0, ZPCI_MOD_FC_SET_MEASURE);
    146	struct zpci_fib fib = {0};
    147	u8 cc, status;
    148
    149	if (zdev->fmb || sizeof(*zdev->fmb) < zdev->fmb_length)
    150		return -EINVAL;
    151
    152	zdev->fmb = kmem_cache_zalloc(zdev_fmb_cache, GFP_KERNEL);
    153	if (!zdev->fmb)
    154		return -ENOMEM;
    155	WARN_ON((u64) zdev->fmb & 0xf);
    156
    157	/* reset software counters */
    158	atomic64_set(&zdev->allocated_pages, 0);
    159	atomic64_set(&zdev->mapped_pages, 0);
    160	atomic64_set(&zdev->unmapped_pages, 0);
    161
    162	fib.fmb_addr = virt_to_phys(zdev->fmb);
    163	cc = zpci_mod_fc(req, &fib, &status);
    164	if (cc) {
    165		kmem_cache_free(zdev_fmb_cache, zdev->fmb);
    166		zdev->fmb = NULL;
    167	}
    168	return cc ? -EIO : 0;
    169}
    170
    171/* Modify PCI: Disable PCI function measurement */
    172int zpci_fmb_disable_device(struct zpci_dev *zdev)
    173{
    174	u64 req = ZPCI_CREATE_REQ(zdev->fh, 0, ZPCI_MOD_FC_SET_MEASURE);
    175	struct zpci_fib fib = {0};
    176	u8 cc, status;
    177
    178	if (!zdev->fmb)
    179		return -EINVAL;
    180
    181	/* Function measurement is disabled if fmb address is zero */
    182	cc = zpci_mod_fc(req, &fib, &status);
    183	if (cc == 3) /* Function already gone. */
    184		cc = 0;
    185
    186	if (!cc) {
    187		kmem_cache_free(zdev_fmb_cache, zdev->fmb);
    188		zdev->fmb = NULL;
    189	}
    190	return cc ? -EIO : 0;
    191}
    192
    193static int zpci_cfg_load(struct zpci_dev *zdev, int offset, u32 *val, u8 len)
    194{
    195	u64 req = ZPCI_CREATE_REQ(zdev->fh, ZPCI_PCIAS_CFGSPC, len);
    196	u64 data;
    197	int rc;
    198
    199	rc = __zpci_load(&data, req, offset);
    200	if (!rc) {
    201		data = le64_to_cpu((__force __le64) data);
    202		data >>= (8 - len) * 8;
    203		*val = (u32) data;
    204	} else
    205		*val = 0xffffffff;
    206	return rc;
    207}
    208
    209static int zpci_cfg_store(struct zpci_dev *zdev, int offset, u32 val, u8 len)
    210{
    211	u64 req = ZPCI_CREATE_REQ(zdev->fh, ZPCI_PCIAS_CFGSPC, len);
    212	u64 data = val;
    213	int rc;
    214
    215	data <<= (8 - len) * 8;
    216	data = (__force u64) cpu_to_le64(data);
    217	rc = __zpci_store(data, req, offset);
    218	return rc;
    219}
    220
    221resource_size_t pcibios_align_resource(void *data, const struct resource *res,
    222				       resource_size_t size,
    223				       resource_size_t align)
    224{
    225	return 0;
    226}
    227
    228/* combine single writes by using store-block insn */
    229void __iowrite64_copy(void __iomem *to, const void *from, size_t count)
    230{
    231       zpci_memcpy_toio(to, from, count);
    232}
    233
    234static void __iomem *__ioremap(phys_addr_t addr, size_t size, pgprot_t prot)
    235{
    236	unsigned long offset, vaddr;
    237	struct vm_struct *area;
    238	phys_addr_t last_addr;
    239
    240	last_addr = addr + size - 1;
    241	if (!size || last_addr < addr)
    242		return NULL;
    243
    244	if (!static_branch_unlikely(&have_mio))
    245		return (void __iomem *) addr;
    246
    247	offset = addr & ~PAGE_MASK;
    248	addr &= PAGE_MASK;
    249	size = PAGE_ALIGN(size + offset);
    250	area = get_vm_area(size, VM_IOREMAP);
    251	if (!area)
    252		return NULL;
    253
    254	vaddr = (unsigned long) area->addr;
    255	if (ioremap_page_range(vaddr, vaddr + size, addr, prot)) {
    256		free_vm_area(area);
    257		return NULL;
    258	}
    259	return (void __iomem *) ((unsigned long) area->addr + offset);
    260}
    261
    262void __iomem *ioremap_prot(phys_addr_t addr, size_t size, unsigned long prot)
    263{
    264	return __ioremap(addr, size, __pgprot(prot));
    265}
    266EXPORT_SYMBOL(ioremap_prot);
    267
    268void __iomem *ioremap(phys_addr_t addr, size_t size)
    269{
    270	return __ioremap(addr, size, PAGE_KERNEL);
    271}
    272EXPORT_SYMBOL(ioremap);
    273
    274void __iomem *ioremap_wc(phys_addr_t addr, size_t size)
    275{
    276	return __ioremap(addr, size, pgprot_writecombine(PAGE_KERNEL));
    277}
    278EXPORT_SYMBOL(ioremap_wc);
    279
    280void __iomem *ioremap_wt(phys_addr_t addr, size_t size)
    281{
    282	return __ioremap(addr, size, pgprot_writethrough(PAGE_KERNEL));
    283}
    284EXPORT_SYMBOL(ioremap_wt);
    285
    286void iounmap(volatile void __iomem *addr)
    287{
    288	if (static_branch_likely(&have_mio))
    289		vunmap((__force void *) ((unsigned long) addr & PAGE_MASK));
    290}
    291EXPORT_SYMBOL(iounmap);
    292
    293/* Create a virtual mapping cookie for a PCI BAR */
    294static void __iomem *pci_iomap_range_fh(struct pci_dev *pdev, int bar,
    295					unsigned long offset, unsigned long max)
    296{
    297	struct zpci_dev *zdev =	to_zpci(pdev);
    298	int idx;
    299
    300	idx = zdev->bars[bar].map_idx;
    301	spin_lock(&zpci_iomap_lock);
    302	/* Detect overrun */
    303	WARN_ON(!++zpci_iomap_start[idx].count);
    304	zpci_iomap_start[idx].fh = zdev->fh;
    305	zpci_iomap_start[idx].bar = bar;
    306	spin_unlock(&zpci_iomap_lock);
    307
    308	return (void __iomem *) ZPCI_ADDR(idx) + offset;
    309}
    310
    311static void __iomem *pci_iomap_range_mio(struct pci_dev *pdev, int bar,
    312					 unsigned long offset,
    313					 unsigned long max)
    314{
    315	unsigned long barsize = pci_resource_len(pdev, bar);
    316	struct zpci_dev *zdev = to_zpci(pdev);
    317	void __iomem *iova;
    318
    319	iova = ioremap((unsigned long) zdev->bars[bar].mio_wt, barsize);
    320	return iova ? iova + offset : iova;
    321}
    322
    323void __iomem *pci_iomap_range(struct pci_dev *pdev, int bar,
    324			      unsigned long offset, unsigned long max)
    325{
    326	if (bar >= PCI_STD_NUM_BARS || !pci_resource_len(pdev, bar))
    327		return NULL;
    328
    329	if (static_branch_likely(&have_mio))
    330		return pci_iomap_range_mio(pdev, bar, offset, max);
    331	else
    332		return pci_iomap_range_fh(pdev, bar, offset, max);
    333}
    334EXPORT_SYMBOL(pci_iomap_range);
    335
    336void __iomem *pci_iomap(struct pci_dev *dev, int bar, unsigned long maxlen)
    337{
    338	return pci_iomap_range(dev, bar, 0, maxlen);
    339}
    340EXPORT_SYMBOL(pci_iomap);
    341
    342static void __iomem *pci_iomap_wc_range_mio(struct pci_dev *pdev, int bar,
    343					    unsigned long offset, unsigned long max)
    344{
    345	unsigned long barsize = pci_resource_len(pdev, bar);
    346	struct zpci_dev *zdev = to_zpci(pdev);
    347	void __iomem *iova;
    348
    349	iova = ioremap((unsigned long) zdev->bars[bar].mio_wb, barsize);
    350	return iova ? iova + offset : iova;
    351}
    352
    353void __iomem *pci_iomap_wc_range(struct pci_dev *pdev, int bar,
    354				 unsigned long offset, unsigned long max)
    355{
    356	if (bar >= PCI_STD_NUM_BARS || !pci_resource_len(pdev, bar))
    357		return NULL;
    358
    359	if (static_branch_likely(&have_mio))
    360		return pci_iomap_wc_range_mio(pdev, bar, offset, max);
    361	else
    362		return pci_iomap_range_fh(pdev, bar, offset, max);
    363}
    364EXPORT_SYMBOL(pci_iomap_wc_range);
    365
    366void __iomem *pci_iomap_wc(struct pci_dev *dev, int bar, unsigned long maxlen)
    367{
    368	return pci_iomap_wc_range(dev, bar, 0, maxlen);
    369}
    370EXPORT_SYMBOL(pci_iomap_wc);
    371
    372static void pci_iounmap_fh(struct pci_dev *pdev, void __iomem *addr)
    373{
    374	unsigned int idx = ZPCI_IDX(addr);
    375
    376	spin_lock(&zpci_iomap_lock);
    377	/* Detect underrun */
    378	WARN_ON(!zpci_iomap_start[idx].count);
    379	if (!--zpci_iomap_start[idx].count) {
    380		zpci_iomap_start[idx].fh = 0;
    381		zpci_iomap_start[idx].bar = 0;
    382	}
    383	spin_unlock(&zpci_iomap_lock);
    384}
    385
    386static void pci_iounmap_mio(struct pci_dev *pdev, void __iomem *addr)
    387{
    388	iounmap(addr);
    389}
    390
    391void pci_iounmap(struct pci_dev *pdev, void __iomem *addr)
    392{
    393	if (static_branch_likely(&have_mio))
    394		pci_iounmap_mio(pdev, addr);
    395	else
    396		pci_iounmap_fh(pdev, addr);
    397}
    398EXPORT_SYMBOL(pci_iounmap);
    399
    400static int pci_read(struct pci_bus *bus, unsigned int devfn, int where,
    401		    int size, u32 *val)
    402{
    403	struct zpci_dev *zdev = zdev_from_bus(bus, devfn);
    404
    405	return (zdev) ? zpci_cfg_load(zdev, where, val, size) : -ENODEV;
    406}
    407
    408static int pci_write(struct pci_bus *bus, unsigned int devfn, int where,
    409		     int size, u32 val)
    410{
    411	struct zpci_dev *zdev = zdev_from_bus(bus, devfn);
    412
    413	return (zdev) ? zpci_cfg_store(zdev, where, val, size) : -ENODEV;
    414}
    415
    416static struct pci_ops pci_root_ops = {
    417	.read = pci_read,
    418	.write = pci_write,
    419};
    420
    421static void zpci_map_resources(struct pci_dev *pdev)
    422{
    423	struct zpci_dev *zdev = to_zpci(pdev);
    424	resource_size_t len;
    425	int i;
    426
    427	for (i = 0; i < PCI_STD_NUM_BARS; i++) {
    428		len = pci_resource_len(pdev, i);
    429		if (!len)
    430			continue;
    431
    432		if (zpci_use_mio(zdev))
    433			pdev->resource[i].start =
    434				(resource_size_t __force) zdev->bars[i].mio_wt;
    435		else
    436			pdev->resource[i].start = (resource_size_t __force)
    437				pci_iomap_range_fh(pdev, i, 0, 0);
    438		pdev->resource[i].end = pdev->resource[i].start + len - 1;
    439	}
    440
    441	zpci_iov_map_resources(pdev);
    442}
    443
    444static void zpci_unmap_resources(struct pci_dev *pdev)
    445{
    446	struct zpci_dev *zdev = to_zpci(pdev);
    447	resource_size_t len;
    448	int i;
    449
    450	if (zpci_use_mio(zdev))
    451		return;
    452
    453	for (i = 0; i < PCI_STD_NUM_BARS; i++) {
    454		len = pci_resource_len(pdev, i);
    455		if (!len)
    456			continue;
    457		pci_iounmap_fh(pdev, (void __iomem __force *)
    458			       pdev->resource[i].start);
    459	}
    460}
    461
    462static int zpci_alloc_iomap(struct zpci_dev *zdev)
    463{
    464	unsigned long entry;
    465
    466	spin_lock(&zpci_iomap_lock);
    467	entry = find_first_zero_bit(zpci_iomap_bitmap, ZPCI_IOMAP_ENTRIES);
    468	if (entry == ZPCI_IOMAP_ENTRIES) {
    469		spin_unlock(&zpci_iomap_lock);
    470		return -ENOSPC;
    471	}
    472	set_bit(entry, zpci_iomap_bitmap);
    473	spin_unlock(&zpci_iomap_lock);
    474	return entry;
    475}
    476
    477static void zpci_free_iomap(struct zpci_dev *zdev, int entry)
    478{
    479	spin_lock(&zpci_iomap_lock);
    480	memset(&zpci_iomap_start[entry], 0, sizeof(struct zpci_iomap_entry));
    481	clear_bit(entry, zpci_iomap_bitmap);
    482	spin_unlock(&zpci_iomap_lock);
    483}
    484
    485static void zpci_do_update_iomap_fh(struct zpci_dev *zdev, u32 fh)
    486{
    487	int bar, idx;
    488
    489	spin_lock(&zpci_iomap_lock);
    490	for (bar = 0; bar < PCI_STD_NUM_BARS; bar++) {
    491		if (!zdev->bars[bar].size)
    492			continue;
    493		idx = zdev->bars[bar].map_idx;
    494		if (!zpci_iomap_start[idx].count)
    495			continue;
    496		WRITE_ONCE(zpci_iomap_start[idx].fh, zdev->fh);
    497	}
    498	spin_unlock(&zpci_iomap_lock);
    499}
    500
    501void zpci_update_fh(struct zpci_dev *zdev, u32 fh)
    502{
    503	if (!fh || zdev->fh == fh)
    504		return;
    505
    506	zdev->fh = fh;
    507	if (zpci_use_mio(zdev))
    508		return;
    509	if (zdev->has_resources && zdev_enabled(zdev))
    510		zpci_do_update_iomap_fh(zdev, fh);
    511}
    512
    513static struct resource *__alloc_res(struct zpci_dev *zdev, unsigned long start,
    514				    unsigned long size, unsigned long flags)
    515{
    516	struct resource *r;
    517
    518	r = kzalloc(sizeof(*r), GFP_KERNEL);
    519	if (!r)
    520		return NULL;
    521
    522	r->start = start;
    523	r->end = r->start + size - 1;
    524	r->flags = flags;
    525	r->name = zdev->res_name;
    526
    527	if (request_resource(&iomem_resource, r)) {
    528		kfree(r);
    529		return NULL;
    530	}
    531	return r;
    532}
    533
    534int zpci_setup_bus_resources(struct zpci_dev *zdev,
    535			     struct list_head *resources)
    536{
    537	unsigned long addr, size, flags;
    538	struct resource *res;
    539	int i, entry;
    540
    541	snprintf(zdev->res_name, sizeof(zdev->res_name),
    542		 "PCI Bus %04x:%02x", zdev->uid, ZPCI_BUS_NR);
    543
    544	for (i = 0; i < PCI_STD_NUM_BARS; i++) {
    545		if (!zdev->bars[i].size)
    546			continue;
    547		entry = zpci_alloc_iomap(zdev);
    548		if (entry < 0)
    549			return entry;
    550		zdev->bars[i].map_idx = entry;
    551
    552		/* only MMIO is supported */
    553		flags = IORESOURCE_MEM;
    554		if (zdev->bars[i].val & 8)
    555			flags |= IORESOURCE_PREFETCH;
    556		if (zdev->bars[i].val & 4)
    557			flags |= IORESOURCE_MEM_64;
    558
    559		if (zpci_use_mio(zdev))
    560			addr = (unsigned long) zdev->bars[i].mio_wt;
    561		else
    562			addr = ZPCI_ADDR(entry);
    563		size = 1UL << zdev->bars[i].size;
    564
    565		res = __alloc_res(zdev, addr, size, flags);
    566		if (!res) {
    567			zpci_free_iomap(zdev, entry);
    568			return -ENOMEM;
    569		}
    570		zdev->bars[i].res = res;
    571		pci_add_resource(resources, res);
    572	}
    573	zdev->has_resources = 1;
    574
    575	return 0;
    576}
    577
    578static void zpci_cleanup_bus_resources(struct zpci_dev *zdev)
    579{
    580	int i;
    581
    582	for (i = 0; i < PCI_STD_NUM_BARS; i++) {
    583		if (!zdev->bars[i].size || !zdev->bars[i].res)
    584			continue;
    585
    586		zpci_free_iomap(zdev, zdev->bars[i].map_idx);
    587		release_resource(zdev->bars[i].res);
    588		kfree(zdev->bars[i].res);
    589	}
    590	zdev->has_resources = 0;
    591}
    592
    593int pcibios_device_add(struct pci_dev *pdev)
    594{
    595	struct zpci_dev *zdev = to_zpci(pdev);
    596	struct resource *res;
    597	int i;
    598
    599	/* The pdev has a reference to the zdev via its bus */
    600	zpci_zdev_get(zdev);
    601	if (pdev->is_physfn)
    602		pdev->no_vf_scan = 1;
    603
    604	pdev->dev.groups = zpci_attr_groups;
    605	pdev->dev.dma_ops = &s390_pci_dma_ops;
    606	zpci_map_resources(pdev);
    607
    608	for (i = 0; i < PCI_STD_NUM_BARS; i++) {
    609		res = &pdev->resource[i];
    610		if (res->parent || !res->flags)
    611			continue;
    612		pci_claim_resource(pdev, i);
    613	}
    614
    615	return 0;
    616}
    617
    618void pcibios_release_device(struct pci_dev *pdev)
    619{
    620	struct zpci_dev *zdev = to_zpci(pdev);
    621
    622	zpci_unmap_resources(pdev);
    623	zpci_zdev_put(zdev);
    624}
    625
    626int pcibios_enable_device(struct pci_dev *pdev, int mask)
    627{
    628	struct zpci_dev *zdev = to_zpci(pdev);
    629
    630	zpci_debug_init_device(zdev, dev_name(&pdev->dev));
    631	zpci_fmb_enable_device(zdev);
    632
    633	return pci_enable_resources(pdev, mask);
    634}
    635
    636void pcibios_disable_device(struct pci_dev *pdev)
    637{
    638	struct zpci_dev *zdev = to_zpci(pdev);
    639
    640	zpci_fmb_disable_device(zdev);
    641	zpci_debug_exit_device(zdev);
    642}
    643
    644static int __zpci_register_domain(int domain)
    645{
    646	spin_lock(&zpci_domain_lock);
    647	if (test_bit(domain, zpci_domain)) {
    648		spin_unlock(&zpci_domain_lock);
    649		pr_err("Domain %04x is already assigned\n", domain);
    650		return -EEXIST;
    651	}
    652	set_bit(domain, zpci_domain);
    653	spin_unlock(&zpci_domain_lock);
    654	return domain;
    655}
    656
    657static int __zpci_alloc_domain(void)
    658{
    659	int domain;
    660
    661	spin_lock(&zpci_domain_lock);
    662	/*
    663	 * We can always auto allocate domains below ZPCI_NR_DEVICES.
    664	 * There is either a free domain or we have reached the maximum in
    665	 * which case we would have bailed earlier.
    666	 */
    667	domain = find_first_zero_bit(zpci_domain, ZPCI_NR_DEVICES);
    668	set_bit(domain, zpci_domain);
    669	spin_unlock(&zpci_domain_lock);
    670	return domain;
    671}
    672
    673int zpci_alloc_domain(int domain)
    674{
    675	if (zpci_unique_uid) {
    676		if (domain)
    677			return __zpci_register_domain(domain);
    678		pr_warn("UID checking was active but no UID is provided: switching to automatic domain allocation\n");
    679		update_uid_checking(false);
    680	}
    681	return __zpci_alloc_domain();
    682}
    683
    684void zpci_free_domain(int domain)
    685{
    686	spin_lock(&zpci_domain_lock);
    687	clear_bit(domain, zpci_domain);
    688	spin_unlock(&zpci_domain_lock);
    689}
    690
    691
    692int zpci_enable_device(struct zpci_dev *zdev)
    693{
    694	u32 fh = zdev->fh;
    695	int rc = 0;
    696
    697	if (clp_enable_fh(zdev, &fh, ZPCI_NR_DMA_SPACES))
    698		rc = -EIO;
    699	else
    700		zpci_update_fh(zdev, fh);
    701	return rc;
    702}
    703
    704int zpci_disable_device(struct zpci_dev *zdev)
    705{
    706	u32 fh = zdev->fh;
    707	int cc, rc = 0;
    708
    709	cc = clp_disable_fh(zdev, &fh);
    710	if (!cc) {
    711		zpci_update_fh(zdev, fh);
    712	} else if (cc == CLP_RC_SETPCIFN_ALRDY) {
    713		pr_info("Disabling PCI function %08x had no effect as it was already disabled\n",
    714			zdev->fid);
    715		/* Function is already disabled - update handle */
    716		rc = clp_refresh_fh(zdev->fid, &fh);
    717		if (!rc) {
    718			zpci_update_fh(zdev, fh);
    719			rc = -EINVAL;
    720		}
    721	} else {
    722		rc = -EIO;
    723	}
    724	return rc;
    725}
    726
    727/**
    728 * zpci_hot_reset_device - perform a reset of the given zPCI function
    729 * @zdev: the slot which should be reset
    730 *
    731 * Performs a low level reset of the zPCI function. The reset is low level in
    732 * the sense that the zPCI function can be reset without detaching it from the
    733 * common PCI subsystem. The reset may be performed while under control of
    734 * either DMA or IOMMU APIs in which case the existing DMA/IOMMU translation
    735 * table is reinstated at the end of the reset.
    736 *
    737 * After the reset the functions internal state is reset to an initial state
    738 * equivalent to its state during boot when first probing a driver.
    739 * Consequently after reset the PCI function requires re-initialization via the
    740 * common PCI code including re-enabling IRQs via pci_alloc_irq_vectors()
    741 * and enabling the function via e.g.pci_enablde_device_flags().The caller
    742 * must guard against concurrent reset attempts.
    743 *
    744 * In most cases this function should not be called directly but through
    745 * pci_reset_function() or pci_reset_bus() which handle the save/restore and
    746 * locking.
    747 *
    748 * Return: 0 on success and an error value otherwise
    749 */
    750int zpci_hot_reset_device(struct zpci_dev *zdev)
    751{
    752	int rc;
    753
    754	zpci_dbg(3, "rst fid:%x, fh:%x\n", zdev->fid, zdev->fh);
    755	if (zdev_enabled(zdev)) {
    756		/* Disables device access, DMAs and IRQs (reset state) */
    757		rc = zpci_disable_device(zdev);
    758		/*
    759		 * Due to a z/VM vs LPAR inconsistency in the error state the
    760		 * FH may indicate an enabled device but disable says the
    761		 * device is already disabled don't treat it as an error here.
    762		 */
    763		if (rc == -EINVAL)
    764			rc = 0;
    765		if (rc)
    766			return rc;
    767	}
    768
    769	rc = zpci_enable_device(zdev);
    770	if (rc)
    771		return rc;
    772
    773	if (zdev->dma_table)
    774		rc = zpci_register_ioat(zdev, 0, zdev->start_dma, zdev->end_dma,
    775					virt_to_phys(zdev->dma_table));
    776	else
    777		rc = zpci_dma_init_device(zdev);
    778	if (rc) {
    779		zpci_disable_device(zdev);
    780		return rc;
    781	}
    782
    783	return 0;
    784}
    785
    786/**
    787 * zpci_create_device() - Create a new zpci_dev and add it to the zbus
    788 * @fid: Function ID of the device to be created
    789 * @fh: Current Function Handle of the device to be created
    790 * @state: Initial state after creation either Standby or Configured
    791 *
    792 * Creates a new zpci device and adds it to its, possibly newly created, zbus
    793 * as well as zpci_list.
    794 *
    795 * Returns: the zdev on success or an error pointer otherwise
    796 */
    797struct zpci_dev *zpci_create_device(u32 fid, u32 fh, enum zpci_state state)
    798{
    799	struct zpci_dev *zdev;
    800	int rc;
    801
    802	zpci_dbg(1, "add fid:%x, fh:%x, c:%d\n", fid, fh, state);
    803	zdev = kzalloc(sizeof(*zdev), GFP_KERNEL);
    804	if (!zdev)
    805		return ERR_PTR(-ENOMEM);
    806
    807	/* FID and Function Handle are the static/dynamic identifiers */
    808	zdev->fid = fid;
    809	zdev->fh = fh;
    810
    811	/* Query function properties and update zdev */
    812	rc = clp_query_pci_fn(zdev);
    813	if (rc)
    814		goto error;
    815	zdev->state =  state;
    816
    817	kref_init(&zdev->kref);
    818	mutex_init(&zdev->lock);
    819
    820	rc = zpci_init_iommu(zdev);
    821	if (rc)
    822		goto error;
    823
    824	rc = zpci_bus_device_register(zdev, &pci_root_ops);
    825	if (rc)
    826		goto error_destroy_iommu;
    827
    828	spin_lock(&zpci_list_lock);
    829	list_add_tail(&zdev->entry, &zpci_list);
    830	spin_unlock(&zpci_list_lock);
    831
    832	return zdev;
    833
    834error_destroy_iommu:
    835	zpci_destroy_iommu(zdev);
    836error:
    837	zpci_dbg(0, "add fid:%x, rc:%d\n", fid, rc);
    838	kfree(zdev);
    839	return ERR_PTR(rc);
    840}
    841
    842bool zpci_is_device_configured(struct zpci_dev *zdev)
    843{
    844	enum zpci_state state = zdev->state;
    845
    846	return state != ZPCI_FN_STATE_RESERVED &&
    847		state != ZPCI_FN_STATE_STANDBY;
    848}
    849
    850/**
    851 * zpci_scan_configured_device() - Scan a freshly configured zpci_dev
    852 * @zdev: The zpci_dev to be configured
    853 * @fh: The general function handle supplied by the platform
    854 *
    855 * Given a device in the configuration state Configured, enables, scans and
    856 * adds it to the common code PCI subsystem if possible. If the PCI device is
    857 * parked because we can not yet create a PCI bus because we have not seen
    858 * function 0, it is ignored but will be scanned once function 0 appears.
    859 * If any failure occurs, the zpci_dev is left disabled.
    860 *
    861 * Return: 0 on success, or an error code otherwise
    862 */
    863int zpci_scan_configured_device(struct zpci_dev *zdev, u32 fh)
    864{
    865	int rc;
    866
    867	zpci_update_fh(zdev, fh);
    868	/* the PCI function will be scanned once function 0 appears */
    869	if (!zdev->zbus->bus)
    870		return 0;
    871
    872	/* For function 0 on a multi-function bus scan whole bus as we might
    873	 * have to pick up existing functions waiting for it to allow creating
    874	 * the PCI bus
    875	 */
    876	if (zdev->devfn == 0 && zdev->zbus->multifunction)
    877		rc = zpci_bus_scan_bus(zdev->zbus);
    878	else
    879		rc = zpci_bus_scan_device(zdev);
    880
    881	return rc;
    882}
    883
    884/**
    885 * zpci_deconfigure_device() - Deconfigure a zpci_dev
    886 * @zdev: The zpci_dev to configure
    887 *
    888 * Deconfigure a zPCI function that is currently configured and possibly known
    889 * to the common code PCI subsystem.
    890 * If any failure occurs the device is left as is.
    891 *
    892 * Return: 0 on success, or an error code otherwise
    893 */
    894int zpci_deconfigure_device(struct zpci_dev *zdev)
    895{
    896	int rc;
    897
    898	if (zdev->zbus->bus)
    899		zpci_bus_remove_device(zdev, false);
    900
    901	if (zdev->dma_table) {
    902		rc = zpci_dma_exit_device(zdev);
    903		if (rc)
    904			return rc;
    905	}
    906	if (zdev_enabled(zdev)) {
    907		rc = zpci_disable_device(zdev);
    908		if (rc)
    909			return rc;
    910	}
    911
    912	rc = sclp_pci_deconfigure(zdev->fid);
    913	zpci_dbg(3, "deconf fid:%x, rc:%d\n", zdev->fid, rc);
    914	if (rc)
    915		return rc;
    916	zdev->state = ZPCI_FN_STATE_STANDBY;
    917
    918	return 0;
    919}
    920
    921/**
    922 * zpci_device_reserved() - Mark device as resverved
    923 * @zdev: the zpci_dev that was reserved
    924 *
    925 * Handle the case that a given zPCI function was reserved by another system.
    926 * After a call to this function the zpci_dev can not be found via
    927 * get_zdev_by_fid() anymore but may still be accessible via existing
    928 * references though it will not be functional anymore.
    929 */
    930void zpci_device_reserved(struct zpci_dev *zdev)
    931{
    932	if (zdev->has_hp_slot)
    933		zpci_exit_slot(zdev);
    934	/*
    935	 * Remove device from zpci_list as it is going away. This also
    936	 * makes sure we ignore subsequent zPCI events for this device.
    937	 */
    938	spin_lock(&zpci_list_lock);
    939	list_del(&zdev->entry);
    940	spin_unlock(&zpci_list_lock);
    941	zdev->state = ZPCI_FN_STATE_RESERVED;
    942	zpci_dbg(3, "rsv fid:%x\n", zdev->fid);
    943	zpci_zdev_put(zdev);
    944}
    945
    946void zpci_release_device(struct kref *kref)
    947{
    948	struct zpci_dev *zdev = container_of(kref, struct zpci_dev, kref);
    949	int ret;
    950
    951	if (zdev->zbus->bus)
    952		zpci_bus_remove_device(zdev, false);
    953
    954	if (zdev->dma_table)
    955		zpci_dma_exit_device(zdev);
    956	if (zdev_enabled(zdev))
    957		zpci_disable_device(zdev);
    958
    959	switch (zdev->state) {
    960	case ZPCI_FN_STATE_CONFIGURED:
    961		ret = sclp_pci_deconfigure(zdev->fid);
    962		zpci_dbg(3, "deconf fid:%x, rc:%d\n", zdev->fid, ret);
    963		fallthrough;
    964	case ZPCI_FN_STATE_STANDBY:
    965		if (zdev->has_hp_slot)
    966			zpci_exit_slot(zdev);
    967		spin_lock(&zpci_list_lock);
    968		list_del(&zdev->entry);
    969		spin_unlock(&zpci_list_lock);
    970		zpci_dbg(3, "rsv fid:%x\n", zdev->fid);
    971		fallthrough;
    972	case ZPCI_FN_STATE_RESERVED:
    973		if (zdev->has_resources)
    974			zpci_cleanup_bus_resources(zdev);
    975		zpci_bus_device_unregister(zdev);
    976		zpci_destroy_iommu(zdev);
    977		fallthrough;
    978	default:
    979		break;
    980	}
    981	zpci_dbg(3, "rem fid:%x\n", zdev->fid);
    982	kfree(zdev);
    983}
    984
    985int zpci_report_error(struct pci_dev *pdev,
    986		      struct zpci_report_error_header *report)
    987{
    988	struct zpci_dev *zdev = to_zpci(pdev);
    989
    990	return sclp_pci_report(report, zdev->fh, zdev->fid);
    991}
    992EXPORT_SYMBOL(zpci_report_error);
    993
    994/**
    995 * zpci_clear_error_state() - Clears the zPCI error state of the device
    996 * @zdev: The zdev for which the zPCI error state should be reset
    997 *
    998 * Clear the zPCI error state of the device. If clearing the zPCI error state
    999 * fails the device is left in the error state. In this case it may make sense
   1000 * to call zpci_io_perm_failure() on the associated pdev if it exists.
   1001 *
   1002 * Returns: 0 on success, -EIO otherwise
   1003 */
   1004int zpci_clear_error_state(struct zpci_dev *zdev)
   1005{
   1006	u64 req = ZPCI_CREATE_REQ(zdev->fh, 0, ZPCI_MOD_FC_RESET_ERROR);
   1007	struct zpci_fib fib = {0};
   1008	u8 status;
   1009	int cc;
   1010
   1011	cc = zpci_mod_fc(req, &fib, &status);
   1012	if (cc) {
   1013		zpci_dbg(3, "ces fid:%x, cc:%d, status:%x\n", zdev->fid, cc, status);
   1014		return -EIO;
   1015	}
   1016
   1017	return 0;
   1018}
   1019
   1020/**
   1021 * zpci_reset_load_store_blocked() - Re-enables L/S from error state
   1022 * @zdev: The zdev for which to unblock load/store access
   1023 *
   1024 * Re-enables load/store access for a PCI function in the error state while
   1025 * keeping DMA blocked. In this state drivers can poke MMIO space to determine
   1026 * if error recovery is possible while catching any rogue DMA access from the
   1027 * device.
   1028 *
   1029 * Returns: 0 on success, -EIO otherwise
   1030 */
   1031int zpci_reset_load_store_blocked(struct zpci_dev *zdev)
   1032{
   1033	u64 req = ZPCI_CREATE_REQ(zdev->fh, 0, ZPCI_MOD_FC_RESET_BLOCK);
   1034	struct zpci_fib fib = {0};
   1035	u8 status;
   1036	int cc;
   1037
   1038	cc = zpci_mod_fc(req, &fib, &status);
   1039	if (cc) {
   1040		zpci_dbg(3, "rls fid:%x, cc:%d, status:%x\n", zdev->fid, cc, status);
   1041		return -EIO;
   1042	}
   1043
   1044	return 0;
   1045}
   1046
   1047static int zpci_mem_init(void)
   1048{
   1049	BUILD_BUG_ON(!is_power_of_2(__alignof__(struct zpci_fmb)) ||
   1050		     __alignof__(struct zpci_fmb) < sizeof(struct zpci_fmb));
   1051
   1052	zdev_fmb_cache = kmem_cache_create("PCI_FMB_cache", sizeof(struct zpci_fmb),
   1053					   __alignof__(struct zpci_fmb), 0, NULL);
   1054	if (!zdev_fmb_cache)
   1055		goto error_fmb;
   1056
   1057	zpci_iomap_start = kcalloc(ZPCI_IOMAP_ENTRIES,
   1058				   sizeof(*zpci_iomap_start), GFP_KERNEL);
   1059	if (!zpci_iomap_start)
   1060		goto error_iomap;
   1061
   1062	zpci_iomap_bitmap = kcalloc(BITS_TO_LONGS(ZPCI_IOMAP_ENTRIES),
   1063				    sizeof(*zpci_iomap_bitmap), GFP_KERNEL);
   1064	if (!zpci_iomap_bitmap)
   1065		goto error_iomap_bitmap;
   1066
   1067	if (static_branch_likely(&have_mio))
   1068		clp_setup_writeback_mio();
   1069
   1070	return 0;
   1071error_iomap_bitmap:
   1072	kfree(zpci_iomap_start);
   1073error_iomap:
   1074	kmem_cache_destroy(zdev_fmb_cache);
   1075error_fmb:
   1076	return -ENOMEM;
   1077}
   1078
   1079static void zpci_mem_exit(void)
   1080{
   1081	kfree(zpci_iomap_bitmap);
   1082	kfree(zpci_iomap_start);
   1083	kmem_cache_destroy(zdev_fmb_cache);
   1084}
   1085
   1086static unsigned int s390_pci_probe __initdata = 1;
   1087unsigned int s390_pci_force_floating __initdata;
   1088static unsigned int s390_pci_initialized;
   1089
   1090char * __init pcibios_setup(char *str)
   1091{
   1092	if (!strcmp(str, "off")) {
   1093		s390_pci_probe = 0;
   1094		return NULL;
   1095	}
   1096	if (!strcmp(str, "nomio")) {
   1097		S390_lowcore.machine_flags &= ~MACHINE_FLAG_PCI_MIO;
   1098		return NULL;
   1099	}
   1100	if (!strcmp(str, "force_floating")) {
   1101		s390_pci_force_floating = 1;
   1102		return NULL;
   1103	}
   1104	if (!strcmp(str, "norid")) {
   1105		s390_pci_no_rid = 1;
   1106		return NULL;
   1107	}
   1108	return str;
   1109}
   1110
   1111bool zpci_is_enabled(void)
   1112{
   1113	return s390_pci_initialized;
   1114}
   1115
   1116static int __init pci_base_init(void)
   1117{
   1118	int rc;
   1119
   1120	if (!s390_pci_probe)
   1121		return 0;
   1122
   1123	if (!test_facility(69) || !test_facility(71)) {
   1124		pr_info("PCI is not supported because CPU facilities 69 or 71 are not available\n");
   1125		return 0;
   1126	}
   1127
   1128	if (MACHINE_HAS_PCI_MIO) {
   1129		static_branch_enable(&have_mio);
   1130		ctl_set_bit(2, 5);
   1131	}
   1132
   1133	rc = zpci_debug_init();
   1134	if (rc)
   1135		goto out;
   1136
   1137	rc = zpci_mem_init();
   1138	if (rc)
   1139		goto out_mem;
   1140
   1141	rc = zpci_irq_init();
   1142	if (rc)
   1143		goto out_irq;
   1144
   1145	rc = zpci_dma_init();
   1146	if (rc)
   1147		goto out_dma;
   1148
   1149	rc = clp_scan_pci_devices();
   1150	if (rc)
   1151		goto out_find;
   1152	zpci_bus_scan_busses();
   1153
   1154	s390_pci_initialized = 1;
   1155	return 0;
   1156
   1157out_find:
   1158	zpci_dma_exit();
   1159out_dma:
   1160	zpci_irq_exit();
   1161out_irq:
   1162	zpci_mem_exit();
   1163out_mem:
   1164	zpci_debug_exit();
   1165out:
   1166	return rc;
   1167}
   1168subsys_initcall_sync(pci_base_init);