cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

main.c (27719B)


      1/* QLogic qedr NIC Driver
      2 * Copyright (c) 2015-2016  QLogic Corporation
      3 *
      4 * This software is available to you under a choice of one of two
      5 * licenses.  You may choose to be licensed under the terms of the GNU
      6 * General Public License (GPL) Version 2, available from the file
      7 * COPYING in the main directory of this source tree, or the
      8 * OpenIB.org BSD license below:
      9 *
     10 *     Redistribution and use in source and binary forms, with or
     11 *     without modification, are permitted provided that the following
     12 *     conditions are met:
     13 *
     14 *      - Redistributions of source code must retain the above
     15 *        copyright notice, this list of conditions and the following
     16 *        disclaimer.
     17 *
     18 *      - Redistributions in binary form must reproduce the above
     19 *        copyright notice, this list of conditions and the following
     20 *        disclaimer in the documentation and /or other materials
     21 *        provided with the distribution.
     22 *
     23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
     24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
     25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
     26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
     27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
     28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
     29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
     30 * SOFTWARE.
     31 */
     32#include <linux/module.h>
     33#include <rdma/ib_verbs.h>
     34#include <rdma/ib_addr.h>
     35#include <rdma/ib_user_verbs.h>
     36#include <rdma/iw_cm.h>
     37#include <rdma/ib_mad.h>
     38#include <linux/netdevice.h>
     39#include <linux/iommu.h>
     40#include <linux/pci.h>
     41#include <net/addrconf.h>
     42
     43#include <linux/qed/qed_chain.h>
     44#include <linux/qed/qed_if.h>
     45#include "qedr.h"
     46#include "verbs.h"
     47#include <rdma/qedr-abi.h>
     48#include "qedr_iw_cm.h"
     49
     50MODULE_DESCRIPTION("QLogic 40G/100G ROCE Driver");
     51MODULE_AUTHOR("QLogic Corporation");
     52MODULE_LICENSE("Dual BSD/GPL");
     53
     54#define QEDR_WQ_MULTIPLIER_DFT	(3)
     55
     56static void qedr_ib_dispatch_event(struct qedr_dev *dev, u32 port_num,
     57				   enum ib_event_type type)
     58{
     59	struct ib_event ibev;
     60
     61	ibev.device = &dev->ibdev;
     62	ibev.element.port_num = port_num;
     63	ibev.event = type;
     64
     65	ib_dispatch_event(&ibev);
     66}
     67
     68static enum rdma_link_layer qedr_link_layer(struct ib_device *device,
     69					    u32 port_num)
     70{
     71	return IB_LINK_LAYER_ETHERNET;
     72}
     73
     74static void qedr_get_dev_fw_str(struct ib_device *ibdev, char *str)
     75{
     76	struct qedr_dev *qedr = get_qedr_dev(ibdev);
     77	u32 fw_ver = (u32)qedr->attr.fw_ver;
     78
     79	snprintf(str, IB_FW_VERSION_NAME_MAX, "%d.%d.%d.%d",
     80		 (fw_ver >> 24) & 0xFF, (fw_ver >> 16) & 0xFF,
     81		 (fw_ver >> 8) & 0xFF, fw_ver & 0xFF);
     82}
     83
     84static int qedr_roce_port_immutable(struct ib_device *ibdev, u32 port_num,
     85				    struct ib_port_immutable *immutable)
     86{
     87	struct ib_port_attr attr;
     88	int err;
     89
     90	err = qedr_query_port(ibdev, port_num, &attr);
     91	if (err)
     92		return err;
     93
     94	immutable->pkey_tbl_len = attr.pkey_tbl_len;
     95	immutable->gid_tbl_len = attr.gid_tbl_len;
     96	immutable->core_cap_flags = RDMA_CORE_PORT_IBA_ROCE |
     97	    RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP;
     98	immutable->max_mad_size = IB_MGMT_MAD_SIZE;
     99
    100	return 0;
    101}
    102
    103static int qedr_iw_port_immutable(struct ib_device *ibdev, u32 port_num,
    104				  struct ib_port_immutable *immutable)
    105{
    106	struct ib_port_attr attr;
    107	int err;
    108
    109	err = qedr_query_port(ibdev, port_num, &attr);
    110	if (err)
    111		return err;
    112
    113	immutable->gid_tbl_len = 1;
    114	immutable->core_cap_flags = RDMA_CORE_PORT_IWARP;
    115	immutable->max_mad_size = 0;
    116
    117	return 0;
    118}
    119
    120/* QEDR sysfs interface */
    121static ssize_t hw_rev_show(struct device *device, struct device_attribute *attr,
    122			   char *buf)
    123{
    124	struct qedr_dev *dev =
    125		rdma_device_to_drv_device(device, struct qedr_dev, ibdev);
    126
    127	return sysfs_emit(buf, "0x%x\n", dev->attr.hw_ver);
    128}
    129static DEVICE_ATTR_RO(hw_rev);
    130
    131static ssize_t hca_type_show(struct device *device,
    132			     struct device_attribute *attr, char *buf)
    133{
    134	struct qedr_dev *dev =
    135		rdma_device_to_drv_device(device, struct qedr_dev, ibdev);
    136
    137	return sysfs_emit(buf, "FastLinQ QL%x %s\n", dev->pdev->device,
    138			  rdma_protocol_iwarp(&dev->ibdev, 1) ? "iWARP" :
    139								"RoCE");
    140}
    141static DEVICE_ATTR_RO(hca_type);
    142
    143static struct attribute *qedr_attributes[] = {
    144	&dev_attr_hw_rev.attr,
    145	&dev_attr_hca_type.attr,
    146	NULL
    147};
    148
    149static const struct attribute_group qedr_attr_group = {
    150	.attrs = qedr_attributes,
    151};
    152
    153static const struct ib_device_ops qedr_iw_dev_ops = {
    154	.get_port_immutable = qedr_iw_port_immutable,
    155	.iw_accept = qedr_iw_accept,
    156	.iw_add_ref = qedr_iw_qp_add_ref,
    157	.iw_connect = qedr_iw_connect,
    158	.iw_create_listen = qedr_iw_create_listen,
    159	.iw_destroy_listen = qedr_iw_destroy_listen,
    160	.iw_get_qp = qedr_iw_get_qp,
    161	.iw_reject = qedr_iw_reject,
    162	.iw_rem_ref = qedr_iw_qp_rem_ref,
    163	.query_gid = qedr_iw_query_gid,
    164};
    165
    166static int qedr_iw_register_device(struct qedr_dev *dev)
    167{
    168	dev->ibdev.node_type = RDMA_NODE_RNIC;
    169
    170	ib_set_device_ops(&dev->ibdev, &qedr_iw_dev_ops);
    171
    172	memcpy(dev->ibdev.iw_ifname,
    173	       dev->ndev->name, sizeof(dev->ibdev.iw_ifname));
    174
    175	return 0;
    176}
    177
    178static const struct ib_device_ops qedr_roce_dev_ops = {
    179	.alloc_xrcd = qedr_alloc_xrcd,
    180	.dealloc_xrcd = qedr_dealloc_xrcd,
    181	.get_port_immutable = qedr_roce_port_immutable,
    182	.query_pkey = qedr_query_pkey,
    183};
    184
    185static void qedr_roce_register_device(struct qedr_dev *dev)
    186{
    187	dev->ibdev.node_type = RDMA_NODE_IB_CA;
    188
    189	ib_set_device_ops(&dev->ibdev, &qedr_roce_dev_ops);
    190}
    191
    192static const struct ib_device_ops qedr_dev_ops = {
    193	.owner = THIS_MODULE,
    194	.driver_id = RDMA_DRIVER_QEDR,
    195	.uverbs_abi_ver = QEDR_ABI_VERSION,
    196
    197	.alloc_mr = qedr_alloc_mr,
    198	.alloc_pd = qedr_alloc_pd,
    199	.alloc_ucontext = qedr_alloc_ucontext,
    200	.create_ah = qedr_create_ah,
    201	.create_cq = qedr_create_cq,
    202	.create_qp = qedr_create_qp,
    203	.create_srq = qedr_create_srq,
    204	.dealloc_pd = qedr_dealloc_pd,
    205	.dealloc_ucontext = qedr_dealloc_ucontext,
    206	.dereg_mr = qedr_dereg_mr,
    207	.destroy_ah = qedr_destroy_ah,
    208	.destroy_cq = qedr_destroy_cq,
    209	.destroy_qp = qedr_destroy_qp,
    210	.destroy_srq = qedr_destroy_srq,
    211	.device_group = &qedr_attr_group,
    212	.get_dev_fw_str = qedr_get_dev_fw_str,
    213	.get_dma_mr = qedr_get_dma_mr,
    214	.get_link_layer = qedr_link_layer,
    215	.map_mr_sg = qedr_map_mr_sg,
    216	.mmap = qedr_mmap,
    217	.mmap_free = qedr_mmap_free,
    218	.modify_qp = qedr_modify_qp,
    219	.modify_srq = qedr_modify_srq,
    220	.poll_cq = qedr_poll_cq,
    221	.post_recv = qedr_post_recv,
    222	.post_send = qedr_post_send,
    223	.post_srq_recv = qedr_post_srq_recv,
    224	.process_mad = qedr_process_mad,
    225	.query_device = qedr_query_device,
    226	.query_port = qedr_query_port,
    227	.query_qp = qedr_query_qp,
    228	.query_srq = qedr_query_srq,
    229	.reg_user_mr = qedr_reg_user_mr,
    230	.req_notify_cq = qedr_arm_cq,
    231
    232	INIT_RDMA_OBJ_SIZE(ib_ah, qedr_ah, ibah),
    233	INIT_RDMA_OBJ_SIZE(ib_cq, qedr_cq, ibcq),
    234	INIT_RDMA_OBJ_SIZE(ib_pd, qedr_pd, ibpd),
    235	INIT_RDMA_OBJ_SIZE(ib_qp, qedr_qp, ibqp),
    236	INIT_RDMA_OBJ_SIZE(ib_srq, qedr_srq, ibsrq),
    237	INIT_RDMA_OBJ_SIZE(ib_xrcd, qedr_xrcd, ibxrcd),
    238	INIT_RDMA_OBJ_SIZE(ib_ucontext, qedr_ucontext, ibucontext),
    239};
    240
    241static int qedr_register_device(struct qedr_dev *dev)
    242{
    243	int rc;
    244
    245	dev->ibdev.node_guid = dev->attr.node_guid;
    246	memcpy(dev->ibdev.node_desc, QEDR_NODE_DESC, sizeof(QEDR_NODE_DESC));
    247
    248	if (IS_IWARP(dev)) {
    249		rc = qedr_iw_register_device(dev);
    250		if (rc)
    251			return rc;
    252	} else {
    253		qedr_roce_register_device(dev);
    254	}
    255
    256	dev->ibdev.phys_port_cnt = 1;
    257	dev->ibdev.num_comp_vectors = dev->num_cnq;
    258	dev->ibdev.dev.parent = &dev->pdev->dev;
    259
    260	ib_set_device_ops(&dev->ibdev, &qedr_dev_ops);
    261
    262	rc = ib_device_set_netdev(&dev->ibdev, dev->ndev, 1);
    263	if (rc)
    264		return rc;
    265
    266	dma_set_max_seg_size(&dev->pdev->dev, UINT_MAX);
    267	return ib_register_device(&dev->ibdev, "qedr%d", &dev->pdev->dev);
    268}
    269
    270/* This function allocates fast-path status block memory */
    271static int qedr_alloc_mem_sb(struct qedr_dev *dev,
    272			     struct qed_sb_info *sb_info, u16 sb_id)
    273{
    274	struct status_block *sb_virt;
    275	dma_addr_t sb_phys;
    276	int rc;
    277
    278	sb_virt = dma_alloc_coherent(&dev->pdev->dev,
    279				     sizeof(*sb_virt), &sb_phys, GFP_KERNEL);
    280	if (!sb_virt)
    281		return -ENOMEM;
    282
    283	rc = dev->ops->common->sb_init(dev->cdev, sb_info,
    284				       sb_virt, sb_phys, sb_id,
    285				       QED_SB_TYPE_CNQ);
    286	if (rc) {
    287		pr_err("Status block initialization failed\n");
    288		dma_free_coherent(&dev->pdev->dev, sizeof(*sb_virt),
    289				  sb_virt, sb_phys);
    290		return rc;
    291	}
    292
    293	return 0;
    294}
    295
    296static void qedr_free_mem_sb(struct qedr_dev *dev,
    297			     struct qed_sb_info *sb_info, int sb_id)
    298{
    299	if (sb_info->sb_virt) {
    300		dev->ops->common->sb_release(dev->cdev, sb_info, sb_id,
    301					     QED_SB_TYPE_CNQ);
    302		dma_free_coherent(&dev->pdev->dev, sizeof(*sb_info->sb_virt),
    303				  (void *)sb_info->sb_virt, sb_info->sb_phys);
    304	}
    305}
    306
    307static void qedr_free_resources(struct qedr_dev *dev)
    308{
    309	int i;
    310
    311	if (IS_IWARP(dev))
    312		destroy_workqueue(dev->iwarp_wq);
    313
    314	for (i = 0; i < dev->num_cnq; i++) {
    315		qedr_free_mem_sb(dev, &dev->sb_array[i], dev->sb_start + i);
    316		dev->ops->common->chain_free(dev->cdev, &dev->cnq_array[i].pbl);
    317	}
    318
    319	kfree(dev->cnq_array);
    320	kfree(dev->sb_array);
    321	kfree(dev->sgid_tbl);
    322}
    323
    324static int qedr_alloc_resources(struct qedr_dev *dev)
    325{
    326	struct qed_chain_init_params params = {
    327		.mode		= QED_CHAIN_MODE_PBL,
    328		.intended_use	= QED_CHAIN_USE_TO_CONSUME,
    329		.cnt_type	= QED_CHAIN_CNT_TYPE_U16,
    330		.elem_size	= sizeof(struct regpair *),
    331	};
    332	struct qedr_cnq *cnq;
    333	__le16 *cons_pi;
    334	int i, rc;
    335
    336	dev->sgid_tbl = kcalloc(QEDR_MAX_SGID, sizeof(union ib_gid),
    337				GFP_KERNEL);
    338	if (!dev->sgid_tbl)
    339		return -ENOMEM;
    340
    341	spin_lock_init(&dev->sgid_lock);
    342	xa_init_flags(&dev->srqs, XA_FLAGS_LOCK_IRQ);
    343
    344	if (IS_IWARP(dev)) {
    345		xa_init(&dev->qps);
    346		dev->iwarp_wq = create_singlethread_workqueue("qedr_iwarpq");
    347	}
    348
    349	/* Allocate Status blocks for CNQ */
    350	dev->sb_array = kcalloc(dev->num_cnq, sizeof(*dev->sb_array),
    351				GFP_KERNEL);
    352	if (!dev->sb_array) {
    353		rc = -ENOMEM;
    354		goto err1;
    355	}
    356
    357	dev->cnq_array = kcalloc(dev->num_cnq,
    358				 sizeof(*dev->cnq_array), GFP_KERNEL);
    359	if (!dev->cnq_array) {
    360		rc = -ENOMEM;
    361		goto err2;
    362	}
    363
    364	dev->sb_start = dev->ops->rdma_get_start_sb(dev->cdev);
    365
    366	/* Allocate CNQ PBLs */
    367	params.num_elems = min_t(u32, QED_RDMA_MAX_CNQ_SIZE,
    368				 QEDR_ROCE_MAX_CNQ_SIZE);
    369
    370	for (i = 0; i < dev->num_cnq; i++) {
    371		cnq = &dev->cnq_array[i];
    372
    373		rc = qedr_alloc_mem_sb(dev, &dev->sb_array[i],
    374				       dev->sb_start + i);
    375		if (rc)
    376			goto err3;
    377
    378		rc = dev->ops->common->chain_alloc(dev->cdev, &cnq->pbl,
    379						   &params);
    380		if (rc)
    381			goto err4;
    382
    383		cnq->dev = dev;
    384		cnq->sb = &dev->sb_array[i];
    385		cons_pi = dev->sb_array[i].sb_virt->pi_array;
    386		cnq->hw_cons_ptr = &cons_pi[QED_ROCE_PROTOCOL_INDEX];
    387		cnq->index = i;
    388		sprintf(cnq->name, "qedr%d@pci:%s", i, pci_name(dev->pdev));
    389
    390		DP_DEBUG(dev, QEDR_MSG_INIT, "cnq[%d].cons=%d\n",
    391			 i, qed_chain_get_cons_idx(&cnq->pbl));
    392	}
    393
    394	return 0;
    395err4:
    396	qedr_free_mem_sb(dev, &dev->sb_array[i], dev->sb_start + i);
    397err3:
    398	for (--i; i >= 0; i--) {
    399		dev->ops->common->chain_free(dev->cdev, &dev->cnq_array[i].pbl);
    400		qedr_free_mem_sb(dev, &dev->sb_array[i], dev->sb_start + i);
    401	}
    402	kfree(dev->cnq_array);
    403err2:
    404	kfree(dev->sb_array);
    405err1:
    406	kfree(dev->sgid_tbl);
    407	return rc;
    408}
    409
    410static void qedr_pci_set_atomic(struct qedr_dev *dev, struct pci_dev *pdev)
    411{
    412	int rc = pci_enable_atomic_ops_to_root(pdev,
    413					       PCI_EXP_DEVCAP2_ATOMIC_COMP64);
    414
    415	if (rc) {
    416		dev->atomic_cap = IB_ATOMIC_NONE;
    417		DP_DEBUG(dev, QEDR_MSG_INIT, "Atomic capability disabled\n");
    418	} else {
    419		dev->atomic_cap = IB_ATOMIC_GLOB;
    420		DP_DEBUG(dev, QEDR_MSG_INIT, "Atomic capability enabled\n");
    421	}
    422}
    423
    424static const struct qed_rdma_ops *qed_ops;
    425
    426#define HILO_U64(hi, lo)		((((u64)(hi)) << 32) + (lo))
    427
    428static irqreturn_t qedr_irq_handler(int irq, void *handle)
    429{
    430	u16 hw_comp_cons, sw_comp_cons;
    431	struct qedr_cnq *cnq = handle;
    432	struct regpair *cq_handle;
    433	struct qedr_cq *cq;
    434
    435	qed_sb_ack(cnq->sb, IGU_INT_DISABLE, 0);
    436
    437	qed_sb_update_sb_idx(cnq->sb);
    438
    439	hw_comp_cons = le16_to_cpu(*cnq->hw_cons_ptr);
    440	sw_comp_cons = qed_chain_get_cons_idx(&cnq->pbl);
    441
    442	/* Align protocol-index and chain reads */
    443	rmb();
    444
    445	while (sw_comp_cons != hw_comp_cons) {
    446		cq_handle = (struct regpair *)qed_chain_consume(&cnq->pbl);
    447		cq = (struct qedr_cq *)(uintptr_t)HILO_U64(cq_handle->hi,
    448				cq_handle->lo);
    449
    450		if (cq == NULL) {
    451			DP_ERR(cnq->dev,
    452			       "Received NULL CQ cq_handle->hi=%d cq_handle->lo=%d sw_comp_cons=%d hw_comp_cons=%d\n",
    453			       cq_handle->hi, cq_handle->lo, sw_comp_cons,
    454			       hw_comp_cons);
    455
    456			break;
    457		}
    458
    459		if (cq->sig != QEDR_CQ_MAGIC_NUMBER) {
    460			DP_ERR(cnq->dev,
    461			       "Problem with cq signature, cq_handle->hi=%d ch_handle->lo=%d cq=%p\n",
    462			       cq_handle->hi, cq_handle->lo, cq);
    463			break;
    464		}
    465
    466		cq->arm_flags = 0;
    467
    468		if (!cq->destroyed && cq->ibcq.comp_handler)
    469			(*cq->ibcq.comp_handler)
    470				(&cq->ibcq, cq->ibcq.cq_context);
    471
    472		/* The CQ's CNQ notification counter is checked before
    473		 * destroying the CQ in a busy-wait loop that waits for all of
    474		 * the CQ's CNQ interrupts to be processed. It is increased
    475		 * here, only after the completion handler, to ensure that the
    476		 * the handler is not running when the CQ is destroyed.
    477		 */
    478		cq->cnq_notif++;
    479
    480		sw_comp_cons = qed_chain_get_cons_idx(&cnq->pbl);
    481
    482		cnq->n_comp++;
    483	}
    484
    485	qed_ops->rdma_cnq_prod_update(cnq->dev->rdma_ctx, cnq->index,
    486				      sw_comp_cons);
    487
    488	qed_sb_ack(cnq->sb, IGU_INT_ENABLE, 1);
    489
    490	return IRQ_HANDLED;
    491}
    492
    493static void qedr_sync_free_irqs(struct qedr_dev *dev)
    494{
    495	u32 vector;
    496	u16 idx;
    497	int i;
    498
    499	for (i = 0; i < dev->int_info.used_cnt; i++) {
    500		if (dev->int_info.msix_cnt) {
    501			idx = i * dev->num_hwfns + dev->affin_hwfn_idx;
    502			vector = dev->int_info.msix[idx].vector;
    503			free_irq(vector, &dev->cnq_array[i]);
    504		}
    505	}
    506
    507	dev->int_info.used_cnt = 0;
    508}
    509
    510static int qedr_req_msix_irqs(struct qedr_dev *dev)
    511{
    512	int i, rc = 0;
    513	u16 idx;
    514
    515	if (dev->num_cnq > dev->int_info.msix_cnt) {
    516		DP_ERR(dev,
    517		       "Interrupt mismatch: %d CNQ queues > %d MSI-x vectors\n",
    518		       dev->num_cnq, dev->int_info.msix_cnt);
    519		return -EINVAL;
    520	}
    521
    522	for (i = 0; i < dev->num_cnq; i++) {
    523		idx = i * dev->num_hwfns + dev->affin_hwfn_idx;
    524		rc = request_irq(dev->int_info.msix[idx].vector,
    525				 qedr_irq_handler, 0, dev->cnq_array[i].name,
    526				 &dev->cnq_array[i]);
    527		if (rc) {
    528			DP_ERR(dev, "Request cnq %d irq failed\n", i);
    529			qedr_sync_free_irqs(dev);
    530		} else {
    531			DP_DEBUG(dev, QEDR_MSG_INIT,
    532				 "Requested cnq irq for %s [entry %d]. Cookie is at %p\n",
    533				 dev->cnq_array[i].name, i,
    534				 &dev->cnq_array[i]);
    535			dev->int_info.used_cnt++;
    536		}
    537	}
    538
    539	return rc;
    540}
    541
    542static int qedr_setup_irqs(struct qedr_dev *dev)
    543{
    544	int rc;
    545
    546	DP_DEBUG(dev, QEDR_MSG_INIT, "qedr_setup_irqs\n");
    547
    548	/* Learn Interrupt configuration */
    549	rc = dev->ops->rdma_set_rdma_int(dev->cdev, dev->num_cnq);
    550	if (rc < 0)
    551		return rc;
    552
    553	rc = dev->ops->rdma_get_rdma_int(dev->cdev, &dev->int_info);
    554	if (rc) {
    555		DP_DEBUG(dev, QEDR_MSG_INIT, "get_rdma_int failed\n");
    556		return rc;
    557	}
    558
    559	if (dev->int_info.msix_cnt) {
    560		DP_DEBUG(dev, QEDR_MSG_INIT, "rdma msix_cnt = %d\n",
    561			 dev->int_info.msix_cnt);
    562		rc = qedr_req_msix_irqs(dev);
    563		if (rc)
    564			return rc;
    565	}
    566
    567	DP_DEBUG(dev, QEDR_MSG_INIT, "qedr_setup_irqs succeeded\n");
    568
    569	return 0;
    570}
    571
    572static int qedr_set_device_attr(struct qedr_dev *dev)
    573{
    574	struct qed_rdma_device *qed_attr;
    575	struct qedr_device_attr *attr;
    576	u32 page_size;
    577
    578	/* Part 1 - query core capabilities */
    579	qed_attr = dev->ops->rdma_query_device(dev->rdma_ctx);
    580
    581	/* Part 2 - check capabilities */
    582	page_size = ~qed_attr->page_size_caps + 1;
    583	if (page_size > PAGE_SIZE) {
    584		DP_ERR(dev,
    585		       "Kernel PAGE_SIZE is %ld which is smaller than minimum page size (%d) required by qedr\n",
    586		       PAGE_SIZE, page_size);
    587		return -ENODEV;
    588	}
    589
    590	/* Part 3 - copy and update capabilities */
    591	attr = &dev->attr;
    592	attr->vendor_id = qed_attr->vendor_id;
    593	attr->vendor_part_id = qed_attr->vendor_part_id;
    594	attr->hw_ver = qed_attr->hw_ver;
    595	attr->fw_ver = qed_attr->fw_ver;
    596	attr->node_guid = qed_attr->node_guid;
    597	attr->sys_image_guid = qed_attr->sys_image_guid;
    598	attr->max_cnq = qed_attr->max_cnq;
    599	attr->max_sge = qed_attr->max_sge;
    600	attr->max_inline = qed_attr->max_inline;
    601	attr->max_sqe = min_t(u32, qed_attr->max_wqe, QEDR_MAX_SQE);
    602	attr->max_rqe = min_t(u32, qed_attr->max_wqe, QEDR_MAX_RQE);
    603	attr->max_qp_resp_rd_atomic_resc = qed_attr->max_qp_resp_rd_atomic_resc;
    604	attr->max_qp_req_rd_atomic_resc = qed_attr->max_qp_req_rd_atomic_resc;
    605	attr->max_dev_resp_rd_atomic_resc =
    606	    qed_attr->max_dev_resp_rd_atomic_resc;
    607	attr->max_cq = qed_attr->max_cq;
    608	attr->max_qp = qed_attr->max_qp;
    609	attr->max_mr = qed_attr->max_mr;
    610	attr->max_mr_size = qed_attr->max_mr_size;
    611	attr->max_cqe = min_t(u64, qed_attr->max_cqe, QEDR_MAX_CQES);
    612	attr->max_mw = qed_attr->max_mw;
    613	attr->max_mr_mw_fmr_pbl = qed_attr->max_mr_mw_fmr_pbl;
    614	attr->max_mr_mw_fmr_size = qed_attr->max_mr_mw_fmr_size;
    615	attr->max_pd = qed_attr->max_pd;
    616	attr->max_ah = qed_attr->max_ah;
    617	attr->max_pkey = qed_attr->max_pkey;
    618	attr->max_srq = qed_attr->max_srq;
    619	attr->max_srq_wr = qed_attr->max_srq_wr;
    620	attr->dev_caps = qed_attr->dev_caps;
    621	attr->page_size_caps = qed_attr->page_size_caps;
    622	attr->dev_ack_delay = qed_attr->dev_ack_delay;
    623	attr->reserved_lkey = qed_attr->reserved_lkey;
    624	attr->bad_pkey_counter = qed_attr->bad_pkey_counter;
    625	attr->max_stats_queues = qed_attr->max_stats_queues;
    626
    627	return 0;
    628}
    629
    630static void qedr_unaffiliated_event(void *context, u8 event_code)
    631{
    632	pr_err("unaffiliated event not implemented yet\n");
    633}
    634
    635static void qedr_affiliated_event(void *context, u8 e_code, void *fw_handle)
    636{
    637#define EVENT_TYPE_NOT_DEFINED	0
    638#define EVENT_TYPE_CQ		1
    639#define EVENT_TYPE_QP		2
    640#define EVENT_TYPE_SRQ		3
    641	struct qedr_dev *dev = (struct qedr_dev *)context;
    642	struct regpair *async_handle = (struct regpair *)fw_handle;
    643	u64 roce_handle64 = ((u64) async_handle->hi << 32) + async_handle->lo;
    644	u8 event_type = EVENT_TYPE_NOT_DEFINED;
    645	struct ib_event event;
    646	struct ib_srq *ibsrq;
    647	struct qedr_srq *srq;
    648	unsigned long flags;
    649	struct ib_cq *ibcq;
    650	struct ib_qp *ibqp;
    651	struct qedr_cq *cq;
    652	struct qedr_qp *qp;
    653	u16 srq_id;
    654
    655	if (IS_ROCE(dev)) {
    656		switch (e_code) {
    657		case ROCE_ASYNC_EVENT_CQ_OVERFLOW_ERR:
    658			event.event = IB_EVENT_CQ_ERR;
    659			event_type = EVENT_TYPE_CQ;
    660			break;
    661		case ROCE_ASYNC_EVENT_SQ_DRAINED:
    662			event.event = IB_EVENT_SQ_DRAINED;
    663			event_type = EVENT_TYPE_QP;
    664			break;
    665		case ROCE_ASYNC_EVENT_QP_CATASTROPHIC_ERR:
    666			event.event = IB_EVENT_QP_FATAL;
    667			event_type = EVENT_TYPE_QP;
    668			break;
    669		case ROCE_ASYNC_EVENT_LOCAL_INVALID_REQUEST_ERR:
    670			event.event = IB_EVENT_QP_REQ_ERR;
    671			event_type = EVENT_TYPE_QP;
    672			break;
    673		case ROCE_ASYNC_EVENT_LOCAL_ACCESS_ERR:
    674			event.event = IB_EVENT_QP_ACCESS_ERR;
    675			event_type = EVENT_TYPE_QP;
    676			break;
    677		case ROCE_ASYNC_EVENT_SRQ_LIMIT:
    678			event.event = IB_EVENT_SRQ_LIMIT_REACHED;
    679			event_type = EVENT_TYPE_SRQ;
    680			break;
    681		case ROCE_ASYNC_EVENT_SRQ_EMPTY:
    682			event.event = IB_EVENT_SRQ_ERR;
    683			event_type = EVENT_TYPE_SRQ;
    684			break;
    685		case ROCE_ASYNC_EVENT_XRC_DOMAIN_ERR:
    686			event.event = IB_EVENT_QP_ACCESS_ERR;
    687			event_type = EVENT_TYPE_QP;
    688			break;
    689		case ROCE_ASYNC_EVENT_INVALID_XRCETH_ERR:
    690			event.event = IB_EVENT_QP_ACCESS_ERR;
    691			event_type = EVENT_TYPE_QP;
    692			break;
    693		case ROCE_ASYNC_EVENT_XRC_SRQ_CATASTROPHIC_ERR:
    694			event.event = IB_EVENT_CQ_ERR;
    695			event_type = EVENT_TYPE_CQ;
    696			break;
    697		default:
    698			DP_ERR(dev, "unsupported event %d on handle=%llx\n",
    699			       e_code, roce_handle64);
    700		}
    701	} else {
    702		switch (e_code) {
    703		case QED_IWARP_EVENT_SRQ_LIMIT:
    704			event.event = IB_EVENT_SRQ_LIMIT_REACHED;
    705			event_type = EVENT_TYPE_SRQ;
    706			break;
    707		case QED_IWARP_EVENT_SRQ_EMPTY:
    708			event.event = IB_EVENT_SRQ_ERR;
    709			event_type = EVENT_TYPE_SRQ;
    710			break;
    711		default:
    712		DP_ERR(dev, "unsupported event %d on handle=%llx\n", e_code,
    713		       roce_handle64);
    714		}
    715	}
    716	switch (event_type) {
    717	case EVENT_TYPE_CQ:
    718		cq = (struct qedr_cq *)(uintptr_t)roce_handle64;
    719		if (cq) {
    720			ibcq = &cq->ibcq;
    721			if (ibcq->event_handler) {
    722				event.device = ibcq->device;
    723				event.element.cq = ibcq;
    724				ibcq->event_handler(&event, ibcq->cq_context);
    725			}
    726		} else {
    727			WARN(1,
    728			     "Error: CQ event with NULL pointer ibcq. Handle=%llx\n",
    729			     roce_handle64);
    730		}
    731		DP_ERR(dev, "CQ event %d on handle %p\n", e_code, cq);
    732		break;
    733	case EVENT_TYPE_QP:
    734		qp = (struct qedr_qp *)(uintptr_t)roce_handle64;
    735		if (qp) {
    736			ibqp = &qp->ibqp;
    737			if (ibqp->event_handler) {
    738				event.device = ibqp->device;
    739				event.element.qp = ibqp;
    740				ibqp->event_handler(&event, ibqp->qp_context);
    741			}
    742		} else {
    743			WARN(1,
    744			     "Error: QP event with NULL pointer ibqp. Handle=%llx\n",
    745			     roce_handle64);
    746		}
    747		DP_ERR(dev, "QP event %d on handle %p\n", e_code, qp);
    748		break;
    749	case EVENT_TYPE_SRQ:
    750		srq_id = (u16)roce_handle64;
    751		xa_lock_irqsave(&dev->srqs, flags);
    752		srq = xa_load(&dev->srqs, srq_id);
    753		if (srq) {
    754			ibsrq = &srq->ibsrq;
    755			if (ibsrq->event_handler) {
    756				event.device = ibsrq->device;
    757				event.element.srq = ibsrq;
    758				ibsrq->event_handler(&event,
    759						     ibsrq->srq_context);
    760			}
    761		} else {
    762			DP_NOTICE(dev,
    763				  "SRQ event with NULL pointer ibsrq. Handle=%llx\n",
    764				  roce_handle64);
    765		}
    766		xa_unlock_irqrestore(&dev->srqs, flags);
    767		DP_NOTICE(dev, "SRQ event %d on handle %p\n", e_code, srq);
    768		break;
    769	default:
    770		break;
    771	}
    772}
    773
    774static int qedr_init_hw(struct qedr_dev *dev)
    775{
    776	struct qed_rdma_add_user_out_params out_params;
    777	struct qed_rdma_start_in_params *in_params;
    778	struct qed_rdma_cnq_params *cur_pbl;
    779	struct qed_rdma_events events;
    780	dma_addr_t p_phys_table;
    781	u32 page_cnt;
    782	int rc = 0;
    783	int i;
    784
    785	in_params =  kzalloc(sizeof(*in_params), GFP_KERNEL);
    786	if (!in_params) {
    787		rc = -ENOMEM;
    788		goto out;
    789	}
    790
    791	in_params->desired_cnq = dev->num_cnq;
    792	for (i = 0; i < dev->num_cnq; i++) {
    793		cur_pbl = &in_params->cnq_pbl_list[i];
    794
    795		page_cnt = qed_chain_get_page_cnt(&dev->cnq_array[i].pbl);
    796		cur_pbl->num_pbl_pages = page_cnt;
    797
    798		p_phys_table = qed_chain_get_pbl_phys(&dev->cnq_array[i].pbl);
    799		cur_pbl->pbl_ptr = (u64)p_phys_table;
    800	}
    801
    802	events.affiliated_event = qedr_affiliated_event;
    803	events.unaffiliated_event = qedr_unaffiliated_event;
    804	events.context = dev;
    805
    806	in_params->events = &events;
    807	in_params->cq_mode = QED_RDMA_CQ_MODE_32_BITS;
    808	in_params->max_mtu = dev->ndev->mtu;
    809	dev->iwarp_max_mtu = dev->ndev->mtu;
    810	ether_addr_copy(&in_params->mac_addr[0], dev->ndev->dev_addr);
    811
    812	rc = dev->ops->rdma_init(dev->cdev, in_params);
    813	if (rc)
    814		goto out;
    815
    816	rc = dev->ops->rdma_add_user(dev->rdma_ctx, &out_params);
    817	if (rc)
    818		goto out;
    819
    820	dev->db_addr = out_params.dpi_addr;
    821	dev->db_phys_addr = out_params.dpi_phys_addr;
    822	dev->db_size = out_params.dpi_size;
    823	dev->dpi = out_params.dpi;
    824
    825	rc = qedr_set_device_attr(dev);
    826out:
    827	kfree(in_params);
    828	if (rc)
    829		DP_ERR(dev, "Init HW Failed rc = %d\n", rc);
    830
    831	return rc;
    832}
    833
    834static void qedr_stop_hw(struct qedr_dev *dev)
    835{
    836	dev->ops->rdma_remove_user(dev->rdma_ctx, dev->dpi);
    837	dev->ops->rdma_stop(dev->rdma_ctx);
    838}
    839
    840static struct qedr_dev *qedr_add(struct qed_dev *cdev, struct pci_dev *pdev,
    841				 struct net_device *ndev)
    842{
    843	struct qed_dev_rdma_info dev_info;
    844	struct qedr_dev *dev;
    845	int rc = 0;
    846
    847	dev = ib_alloc_device(qedr_dev, ibdev);
    848	if (!dev) {
    849		pr_err("Unable to allocate ib device\n");
    850		return NULL;
    851	}
    852
    853	DP_DEBUG(dev, QEDR_MSG_INIT, "qedr add device called\n");
    854
    855	dev->pdev = pdev;
    856	dev->ndev = ndev;
    857	dev->cdev = cdev;
    858
    859	qed_ops = qed_get_rdma_ops();
    860	if (!qed_ops) {
    861		DP_ERR(dev, "Failed to get qed roce operations\n");
    862		goto init_err;
    863	}
    864
    865	dev->ops = qed_ops;
    866	rc = qed_ops->fill_dev_info(cdev, &dev_info);
    867	if (rc)
    868		goto init_err;
    869
    870	dev->user_dpm_enabled = dev_info.user_dpm_enabled;
    871	dev->rdma_type = dev_info.rdma_type;
    872	dev->num_hwfns = dev_info.common.num_hwfns;
    873
    874	if (IS_IWARP(dev) && QEDR_IS_CMT(dev)) {
    875		rc = dev->ops->iwarp_set_engine_affin(cdev, false);
    876		if (rc) {
    877			DP_ERR(dev, "iWARP is disabled over a 100g device Enabling it may impact L2 performance. To enable it run devlink dev param set <dev> name iwarp_cmt value true cmode runtime\n");
    878			goto init_err;
    879		}
    880	}
    881	dev->affin_hwfn_idx = dev->ops->common->get_affin_hwfn_idx(cdev);
    882
    883	dev->rdma_ctx = dev->ops->rdma_get_rdma_ctx(cdev);
    884
    885	dev->num_cnq = dev->ops->rdma_get_min_cnq_msix(cdev);
    886	if (!dev->num_cnq) {
    887		DP_ERR(dev, "Failed. At least one CNQ is required.\n");
    888		rc = -ENOMEM;
    889		goto init_err;
    890	}
    891
    892	dev->wq_multiplier = QEDR_WQ_MULTIPLIER_DFT;
    893
    894	qedr_pci_set_atomic(dev, pdev);
    895
    896	rc = qedr_alloc_resources(dev);
    897	if (rc)
    898		goto init_err;
    899
    900	rc = qedr_init_hw(dev);
    901	if (rc)
    902		goto alloc_err;
    903
    904	rc = qedr_setup_irqs(dev);
    905	if (rc)
    906		goto irq_err;
    907
    908	rc = qedr_register_device(dev);
    909	if (rc) {
    910		DP_ERR(dev, "Unable to allocate register device\n");
    911		goto reg_err;
    912	}
    913
    914	if (!test_and_set_bit(QEDR_ENET_STATE_BIT, &dev->enet_state))
    915		qedr_ib_dispatch_event(dev, QEDR_PORT, IB_EVENT_PORT_ACTIVE);
    916
    917	DP_DEBUG(dev, QEDR_MSG_INIT, "qedr driver loaded successfully\n");
    918	return dev;
    919
    920reg_err:
    921	qedr_sync_free_irqs(dev);
    922irq_err:
    923	qedr_stop_hw(dev);
    924alloc_err:
    925	qedr_free_resources(dev);
    926init_err:
    927	ib_dealloc_device(&dev->ibdev);
    928	DP_ERR(dev, "qedr driver load failed rc=%d\n", rc);
    929
    930	return NULL;
    931}
    932
    933static void qedr_remove(struct qedr_dev *dev)
    934{
    935	/* First unregister with stack to stop all the active traffic
    936	 * of the registered clients.
    937	 */
    938	ib_unregister_device(&dev->ibdev);
    939
    940	qedr_stop_hw(dev);
    941	qedr_sync_free_irqs(dev);
    942	qedr_free_resources(dev);
    943
    944	if (IS_IWARP(dev) && QEDR_IS_CMT(dev))
    945		dev->ops->iwarp_set_engine_affin(dev->cdev, true);
    946
    947	ib_dealloc_device(&dev->ibdev);
    948}
    949
    950static void qedr_close(struct qedr_dev *dev)
    951{
    952	if (test_and_clear_bit(QEDR_ENET_STATE_BIT, &dev->enet_state))
    953		qedr_ib_dispatch_event(dev, QEDR_PORT, IB_EVENT_PORT_ERR);
    954}
    955
    956static void qedr_shutdown(struct qedr_dev *dev)
    957{
    958	qedr_close(dev);
    959	qedr_remove(dev);
    960}
    961
    962static void qedr_open(struct qedr_dev *dev)
    963{
    964	if (!test_and_set_bit(QEDR_ENET_STATE_BIT, &dev->enet_state))
    965		qedr_ib_dispatch_event(dev, QEDR_PORT, IB_EVENT_PORT_ACTIVE);
    966}
    967
    968static void qedr_mac_address_change(struct qedr_dev *dev)
    969{
    970	union ib_gid *sgid = &dev->sgid_tbl[0];
    971	u8 guid[8], mac_addr[6];
    972	int rc;
    973
    974	/* Update SGID */
    975	ether_addr_copy(&mac_addr[0], dev->ndev->dev_addr);
    976	guid[0] = mac_addr[0] ^ 2;
    977	guid[1] = mac_addr[1];
    978	guid[2] = mac_addr[2];
    979	guid[3] = 0xff;
    980	guid[4] = 0xfe;
    981	guid[5] = mac_addr[3];
    982	guid[6] = mac_addr[4];
    983	guid[7] = mac_addr[5];
    984	sgid->global.subnet_prefix = cpu_to_be64(0xfe80000000000000LL);
    985	memcpy(&sgid->raw[8], guid, sizeof(guid));
    986
    987	/* Update LL2 */
    988	rc = dev->ops->ll2_set_mac_filter(dev->cdev,
    989					  dev->gsi_ll2_mac_address,
    990					  dev->ndev->dev_addr);
    991
    992	ether_addr_copy(dev->gsi_ll2_mac_address, dev->ndev->dev_addr);
    993
    994	qedr_ib_dispatch_event(dev, QEDR_PORT, IB_EVENT_GID_CHANGE);
    995
    996	if (rc)
    997		DP_ERR(dev, "Error updating mac filter\n");
    998}
    999
   1000/* event handling via NIC driver ensures that all the NIC specific
   1001 * initialization done before RoCE driver notifies
   1002 * event to stack.
   1003 */
   1004static void qedr_notify(struct qedr_dev *dev, enum qede_rdma_event event)
   1005{
   1006	switch (event) {
   1007	case QEDE_UP:
   1008		qedr_open(dev);
   1009		break;
   1010	case QEDE_DOWN:
   1011		qedr_close(dev);
   1012		break;
   1013	case QEDE_CLOSE:
   1014		qedr_shutdown(dev);
   1015		break;
   1016	case QEDE_CHANGE_ADDR:
   1017		qedr_mac_address_change(dev);
   1018		break;
   1019	case QEDE_CHANGE_MTU:
   1020		if (rdma_protocol_iwarp(&dev->ibdev, 1))
   1021			if (dev->ndev->mtu != dev->iwarp_max_mtu)
   1022				DP_NOTICE(dev,
   1023					  "Mtu was changed from %d to %d. This will not take affect for iWARP until qedr is reloaded\n",
   1024					  dev->iwarp_max_mtu, dev->ndev->mtu);
   1025		break;
   1026	default:
   1027		pr_err("Event not supported\n");
   1028	}
   1029}
   1030
   1031static struct qedr_driver qedr_drv = {
   1032	.name = "qedr_driver",
   1033	.add = qedr_add,
   1034	.remove = qedr_remove,
   1035	.notify = qedr_notify,
   1036};
   1037
   1038static int __init qedr_init_module(void)
   1039{
   1040	return qede_rdma_register_driver(&qedr_drv);
   1041}
   1042
   1043static void __exit qedr_exit_module(void)
   1044{
   1045	qede_rdma_unregister_driver(&qedr_drv);
   1046}
   1047
   1048module_init(qedr_init_module);
   1049module_exit(qedr_exit_module);