cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

dma.c (47096B)


      1// SPDX-License-Identifier: GPL-2.0-or-later
      2/*
      3
      4  Broadcom B43 wireless driver
      5
      6  DMA ringbuffer and descriptor allocation/management
      7
      8  Copyright (c) 2005, 2006 Michael Buesch <m@bues.ch>
      9
     10  Some code in this file is derived from the b44.c driver
     11  Copyright (C) 2002 David S. Miller
     12  Copyright (C) Pekka Pietikainen
     13
     14
     15*/
     16
     17#include "b43.h"
     18#include "dma.h"
     19#include "main.h"
     20#include "debugfs.h"
     21#include "xmit.h"
     22
     23#include <linux/dma-mapping.h>
     24#include <linux/pci.h>
     25#include <linux/delay.h>
     26#include <linux/skbuff.h>
     27#include <linux/etherdevice.h>
     28#include <linux/slab.h>
     29#include <asm/div64.h>
     30
     31
     32/* Required number of TX DMA slots per TX frame.
     33 * This currently is 2, because we put the header and the ieee80211 frame
     34 * into separate slots. */
     35#define TX_SLOTS_PER_FRAME	2
     36
     37static u32 b43_dma_address(struct b43_dma *dma, dma_addr_t dmaaddr,
     38			   enum b43_addrtype addrtype)
     39{
     40	u32 addr;
     41
     42	switch (addrtype) {
     43	case B43_DMA_ADDR_LOW:
     44		addr = lower_32_bits(dmaaddr);
     45		if (dma->translation_in_low) {
     46			addr &= ~SSB_DMA_TRANSLATION_MASK;
     47			addr |= dma->translation;
     48		}
     49		break;
     50	case B43_DMA_ADDR_HIGH:
     51		addr = upper_32_bits(dmaaddr);
     52		if (!dma->translation_in_low) {
     53			addr &= ~SSB_DMA_TRANSLATION_MASK;
     54			addr |= dma->translation;
     55		}
     56		break;
     57	case B43_DMA_ADDR_EXT:
     58		if (dma->translation_in_low)
     59			addr = lower_32_bits(dmaaddr);
     60		else
     61			addr = upper_32_bits(dmaaddr);
     62		addr &= SSB_DMA_TRANSLATION_MASK;
     63		addr >>= SSB_DMA_TRANSLATION_SHIFT;
     64		break;
     65	}
     66
     67	return addr;
     68}
     69
     70/* 32bit DMA ops. */
     71static
     72struct b43_dmadesc_generic *op32_idx2desc(struct b43_dmaring *ring,
     73					  int slot,
     74					  struct b43_dmadesc_meta **meta)
     75{
     76	struct b43_dmadesc32 *desc;
     77
     78	*meta = &(ring->meta[slot]);
     79	desc = ring->descbase;
     80	desc = &(desc[slot]);
     81
     82	return (struct b43_dmadesc_generic *)desc;
     83}
     84
     85static void op32_fill_descriptor(struct b43_dmaring *ring,
     86				 struct b43_dmadesc_generic *desc,
     87				 dma_addr_t dmaaddr, u16 bufsize,
     88				 int start, int end, int irq)
     89{
     90	struct b43_dmadesc32 *descbase = ring->descbase;
     91	int slot;
     92	u32 ctl;
     93	u32 addr;
     94	u32 addrext;
     95
     96	slot = (int)(&(desc->dma32) - descbase);
     97	B43_WARN_ON(!(slot >= 0 && slot < ring->nr_slots));
     98
     99	addr = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_LOW);
    100	addrext = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_EXT);
    101
    102	ctl = bufsize & B43_DMA32_DCTL_BYTECNT;
    103	if (slot == ring->nr_slots - 1)
    104		ctl |= B43_DMA32_DCTL_DTABLEEND;
    105	if (start)
    106		ctl |= B43_DMA32_DCTL_FRAMESTART;
    107	if (end)
    108		ctl |= B43_DMA32_DCTL_FRAMEEND;
    109	if (irq)
    110		ctl |= B43_DMA32_DCTL_IRQ;
    111	ctl |= (addrext << B43_DMA32_DCTL_ADDREXT_SHIFT)
    112	    & B43_DMA32_DCTL_ADDREXT_MASK;
    113
    114	desc->dma32.control = cpu_to_le32(ctl);
    115	desc->dma32.address = cpu_to_le32(addr);
    116}
    117
    118static void op32_poke_tx(struct b43_dmaring *ring, int slot)
    119{
    120	b43_dma_write(ring, B43_DMA32_TXINDEX,
    121		      (u32) (slot * sizeof(struct b43_dmadesc32)));
    122}
    123
    124static void op32_tx_suspend(struct b43_dmaring *ring)
    125{
    126	b43_dma_write(ring, B43_DMA32_TXCTL, b43_dma_read(ring, B43_DMA32_TXCTL)
    127		      | B43_DMA32_TXSUSPEND);
    128}
    129
    130static void op32_tx_resume(struct b43_dmaring *ring)
    131{
    132	b43_dma_write(ring, B43_DMA32_TXCTL, b43_dma_read(ring, B43_DMA32_TXCTL)
    133		      & ~B43_DMA32_TXSUSPEND);
    134}
    135
    136static int op32_get_current_rxslot(struct b43_dmaring *ring)
    137{
    138	u32 val;
    139
    140	val = b43_dma_read(ring, B43_DMA32_RXSTATUS);
    141	val &= B43_DMA32_RXDPTR;
    142
    143	return (val / sizeof(struct b43_dmadesc32));
    144}
    145
    146static void op32_set_current_rxslot(struct b43_dmaring *ring, int slot)
    147{
    148	b43_dma_write(ring, B43_DMA32_RXINDEX,
    149		      (u32) (slot * sizeof(struct b43_dmadesc32)));
    150}
    151
    152static const struct b43_dma_ops dma32_ops = {
    153	.idx2desc = op32_idx2desc,
    154	.fill_descriptor = op32_fill_descriptor,
    155	.poke_tx = op32_poke_tx,
    156	.tx_suspend = op32_tx_suspend,
    157	.tx_resume = op32_tx_resume,
    158	.get_current_rxslot = op32_get_current_rxslot,
    159	.set_current_rxslot = op32_set_current_rxslot,
    160};
    161
    162/* 64bit DMA ops. */
    163static
    164struct b43_dmadesc_generic *op64_idx2desc(struct b43_dmaring *ring,
    165					  int slot,
    166					  struct b43_dmadesc_meta **meta)
    167{
    168	struct b43_dmadesc64 *desc;
    169
    170	*meta = &(ring->meta[slot]);
    171	desc = ring->descbase;
    172	desc = &(desc[slot]);
    173
    174	return (struct b43_dmadesc_generic *)desc;
    175}
    176
    177static void op64_fill_descriptor(struct b43_dmaring *ring,
    178				 struct b43_dmadesc_generic *desc,
    179				 dma_addr_t dmaaddr, u16 bufsize,
    180				 int start, int end, int irq)
    181{
    182	struct b43_dmadesc64 *descbase = ring->descbase;
    183	int slot;
    184	u32 ctl0 = 0, ctl1 = 0;
    185	u32 addrlo, addrhi;
    186	u32 addrext;
    187
    188	slot = (int)(&(desc->dma64) - descbase);
    189	B43_WARN_ON(!(slot >= 0 && slot < ring->nr_slots));
    190
    191	addrlo = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_LOW);
    192	addrhi = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_HIGH);
    193	addrext = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_EXT);
    194
    195	if (slot == ring->nr_slots - 1)
    196		ctl0 |= B43_DMA64_DCTL0_DTABLEEND;
    197	if (start)
    198		ctl0 |= B43_DMA64_DCTL0_FRAMESTART;
    199	if (end)
    200		ctl0 |= B43_DMA64_DCTL0_FRAMEEND;
    201	if (irq)
    202		ctl0 |= B43_DMA64_DCTL0_IRQ;
    203	ctl1 |= bufsize & B43_DMA64_DCTL1_BYTECNT;
    204	ctl1 |= (addrext << B43_DMA64_DCTL1_ADDREXT_SHIFT)
    205	    & B43_DMA64_DCTL1_ADDREXT_MASK;
    206
    207	desc->dma64.control0 = cpu_to_le32(ctl0);
    208	desc->dma64.control1 = cpu_to_le32(ctl1);
    209	desc->dma64.address_low = cpu_to_le32(addrlo);
    210	desc->dma64.address_high = cpu_to_le32(addrhi);
    211}
    212
    213static void op64_poke_tx(struct b43_dmaring *ring, int slot)
    214{
    215	b43_dma_write(ring, B43_DMA64_TXINDEX,
    216		      (u32) (slot * sizeof(struct b43_dmadesc64)));
    217}
    218
    219static void op64_tx_suspend(struct b43_dmaring *ring)
    220{
    221	b43_dma_write(ring, B43_DMA64_TXCTL, b43_dma_read(ring, B43_DMA64_TXCTL)
    222		      | B43_DMA64_TXSUSPEND);
    223}
    224
    225static void op64_tx_resume(struct b43_dmaring *ring)
    226{
    227	b43_dma_write(ring, B43_DMA64_TXCTL, b43_dma_read(ring, B43_DMA64_TXCTL)
    228		      & ~B43_DMA64_TXSUSPEND);
    229}
    230
    231static int op64_get_current_rxslot(struct b43_dmaring *ring)
    232{
    233	u32 val;
    234
    235	val = b43_dma_read(ring, B43_DMA64_RXSTATUS);
    236	val &= B43_DMA64_RXSTATDPTR;
    237
    238	return (val / sizeof(struct b43_dmadesc64));
    239}
    240
    241static void op64_set_current_rxslot(struct b43_dmaring *ring, int slot)
    242{
    243	b43_dma_write(ring, B43_DMA64_RXINDEX,
    244		      (u32) (slot * sizeof(struct b43_dmadesc64)));
    245}
    246
    247static const struct b43_dma_ops dma64_ops = {
    248	.idx2desc = op64_idx2desc,
    249	.fill_descriptor = op64_fill_descriptor,
    250	.poke_tx = op64_poke_tx,
    251	.tx_suspend = op64_tx_suspend,
    252	.tx_resume = op64_tx_resume,
    253	.get_current_rxslot = op64_get_current_rxslot,
    254	.set_current_rxslot = op64_set_current_rxslot,
    255};
    256
    257static inline int free_slots(struct b43_dmaring *ring)
    258{
    259	return (ring->nr_slots - ring->used_slots);
    260}
    261
    262static inline int next_slot(struct b43_dmaring *ring, int slot)
    263{
    264	B43_WARN_ON(!(slot >= -1 && slot <= ring->nr_slots - 1));
    265	if (slot == ring->nr_slots - 1)
    266		return 0;
    267	return slot + 1;
    268}
    269
    270static inline int prev_slot(struct b43_dmaring *ring, int slot)
    271{
    272	B43_WARN_ON(!(slot >= 0 && slot <= ring->nr_slots - 1));
    273	if (slot == 0)
    274		return ring->nr_slots - 1;
    275	return slot - 1;
    276}
    277
    278#ifdef CONFIG_B43_DEBUG
    279static void update_max_used_slots(struct b43_dmaring *ring,
    280				  int current_used_slots)
    281{
    282	if (current_used_slots <= ring->max_used_slots)
    283		return;
    284	ring->max_used_slots = current_used_slots;
    285	if (b43_debug(ring->dev, B43_DBG_DMAVERBOSE)) {
    286		b43dbg(ring->dev->wl,
    287		       "max_used_slots increased to %d on %s ring %d\n",
    288		       ring->max_used_slots,
    289		       ring->tx ? "TX" : "RX", ring->index);
    290	}
    291}
    292#else
    293static inline
    294    void update_max_used_slots(struct b43_dmaring *ring, int current_used_slots)
    295{
    296}
    297#endif /* DEBUG */
    298
    299/* Request a slot for usage. */
    300static inline int request_slot(struct b43_dmaring *ring)
    301{
    302	int slot;
    303
    304	B43_WARN_ON(!ring->tx);
    305	B43_WARN_ON(ring->stopped);
    306	B43_WARN_ON(free_slots(ring) == 0);
    307
    308	slot = next_slot(ring, ring->current_slot);
    309	ring->current_slot = slot;
    310	ring->used_slots++;
    311
    312	update_max_used_slots(ring, ring->used_slots);
    313
    314	return slot;
    315}
    316
    317static u16 b43_dmacontroller_base(enum b43_dmatype type, int controller_idx)
    318{
    319	static const u16 map64[] = {
    320		B43_MMIO_DMA64_BASE0,
    321		B43_MMIO_DMA64_BASE1,
    322		B43_MMIO_DMA64_BASE2,
    323		B43_MMIO_DMA64_BASE3,
    324		B43_MMIO_DMA64_BASE4,
    325		B43_MMIO_DMA64_BASE5,
    326	};
    327	static const u16 map32[] = {
    328		B43_MMIO_DMA32_BASE0,
    329		B43_MMIO_DMA32_BASE1,
    330		B43_MMIO_DMA32_BASE2,
    331		B43_MMIO_DMA32_BASE3,
    332		B43_MMIO_DMA32_BASE4,
    333		B43_MMIO_DMA32_BASE5,
    334	};
    335
    336	if (type == B43_DMA_64BIT) {
    337		B43_WARN_ON(!(controller_idx >= 0 &&
    338			      controller_idx < ARRAY_SIZE(map64)));
    339		return map64[controller_idx];
    340	}
    341	B43_WARN_ON(!(controller_idx >= 0 &&
    342		      controller_idx < ARRAY_SIZE(map32)));
    343	return map32[controller_idx];
    344}
    345
    346static inline
    347    dma_addr_t map_descbuffer(struct b43_dmaring *ring,
    348			      unsigned char *buf, size_t len, int tx)
    349{
    350	dma_addr_t dmaaddr;
    351
    352	if (tx) {
    353		dmaaddr = dma_map_single(ring->dev->dev->dma_dev,
    354					 buf, len, DMA_TO_DEVICE);
    355	} else {
    356		dmaaddr = dma_map_single(ring->dev->dev->dma_dev,
    357					 buf, len, DMA_FROM_DEVICE);
    358	}
    359
    360	return dmaaddr;
    361}
    362
    363static inline
    364    void unmap_descbuffer(struct b43_dmaring *ring,
    365			  dma_addr_t addr, size_t len, int tx)
    366{
    367	if (tx) {
    368		dma_unmap_single(ring->dev->dev->dma_dev,
    369				 addr, len, DMA_TO_DEVICE);
    370	} else {
    371		dma_unmap_single(ring->dev->dev->dma_dev,
    372				 addr, len, DMA_FROM_DEVICE);
    373	}
    374}
    375
    376static inline
    377    void sync_descbuffer_for_cpu(struct b43_dmaring *ring,
    378				 dma_addr_t addr, size_t len)
    379{
    380	B43_WARN_ON(ring->tx);
    381	dma_sync_single_for_cpu(ring->dev->dev->dma_dev,
    382				    addr, len, DMA_FROM_DEVICE);
    383}
    384
    385static inline
    386    void sync_descbuffer_for_device(struct b43_dmaring *ring,
    387				    dma_addr_t addr, size_t len)
    388{
    389	B43_WARN_ON(ring->tx);
    390	dma_sync_single_for_device(ring->dev->dev->dma_dev,
    391				   addr, len, DMA_FROM_DEVICE);
    392}
    393
    394static inline
    395    void free_descriptor_buffer(struct b43_dmaring *ring,
    396				struct b43_dmadesc_meta *meta)
    397{
    398	if (meta->skb) {
    399		if (ring->tx)
    400			ieee80211_free_txskb(ring->dev->wl->hw, meta->skb);
    401		else
    402			dev_kfree_skb_any(meta->skb);
    403		meta->skb = NULL;
    404	}
    405}
    406
    407static int alloc_ringmemory(struct b43_dmaring *ring)
    408{
    409	/* The specs call for 4K buffers for 30- and 32-bit DMA with 4K
    410	 * alignment and 8K buffers for 64-bit DMA with 8K alignment.
    411	 * In practice we could use smaller buffers for the latter, but the
    412	 * alignment is really important because of the hardware bug. If bit
    413	 * 0x00001000 is used in DMA address, some hardware (like BCM4331)
    414	 * copies that bit into B43_DMA64_RXSTATUS and we get false values from
    415	 * B43_DMA64_RXSTATDPTR. Let's just use 8K buffers even if we don't use
    416	 * more than 256 slots for ring.
    417	 */
    418	u16 ring_mem_size = (ring->type == B43_DMA_64BIT) ?
    419				B43_DMA64_RINGMEMSIZE : B43_DMA32_RINGMEMSIZE;
    420
    421	ring->descbase = dma_alloc_coherent(ring->dev->dev->dma_dev,
    422					    ring_mem_size, &(ring->dmabase),
    423					    GFP_KERNEL);
    424	if (!ring->descbase)
    425		return -ENOMEM;
    426
    427	return 0;
    428}
    429
    430static void free_ringmemory(struct b43_dmaring *ring)
    431{
    432	u16 ring_mem_size = (ring->type == B43_DMA_64BIT) ?
    433				B43_DMA64_RINGMEMSIZE : B43_DMA32_RINGMEMSIZE;
    434	dma_free_coherent(ring->dev->dev->dma_dev, ring_mem_size,
    435			  ring->descbase, ring->dmabase);
    436}
    437
    438/* Reset the RX DMA channel */
    439static int b43_dmacontroller_rx_reset(struct b43_wldev *dev, u16 mmio_base,
    440				      enum b43_dmatype type)
    441{
    442	int i;
    443	u32 value;
    444	u16 offset;
    445
    446	might_sleep();
    447
    448	offset = (type == B43_DMA_64BIT) ? B43_DMA64_RXCTL : B43_DMA32_RXCTL;
    449	b43_write32(dev, mmio_base + offset, 0);
    450	for (i = 0; i < 10; i++) {
    451		offset = (type == B43_DMA_64BIT) ? B43_DMA64_RXSTATUS :
    452						   B43_DMA32_RXSTATUS;
    453		value = b43_read32(dev, mmio_base + offset);
    454		if (type == B43_DMA_64BIT) {
    455			value &= B43_DMA64_RXSTAT;
    456			if (value == B43_DMA64_RXSTAT_DISABLED) {
    457				i = -1;
    458				break;
    459			}
    460		} else {
    461			value &= B43_DMA32_RXSTATE;
    462			if (value == B43_DMA32_RXSTAT_DISABLED) {
    463				i = -1;
    464				break;
    465			}
    466		}
    467		msleep(1);
    468	}
    469	if (i != -1) {
    470		b43err(dev->wl, "DMA RX reset timed out\n");
    471		return -ENODEV;
    472	}
    473
    474	return 0;
    475}
    476
    477/* Reset the TX DMA channel */
    478static int b43_dmacontroller_tx_reset(struct b43_wldev *dev, u16 mmio_base,
    479				      enum b43_dmatype type)
    480{
    481	int i;
    482	u32 value;
    483	u16 offset;
    484
    485	might_sleep();
    486
    487	for (i = 0; i < 10; i++) {
    488		offset = (type == B43_DMA_64BIT) ? B43_DMA64_TXSTATUS :
    489						   B43_DMA32_TXSTATUS;
    490		value = b43_read32(dev, mmio_base + offset);
    491		if (type == B43_DMA_64BIT) {
    492			value &= B43_DMA64_TXSTAT;
    493			if (value == B43_DMA64_TXSTAT_DISABLED ||
    494			    value == B43_DMA64_TXSTAT_IDLEWAIT ||
    495			    value == B43_DMA64_TXSTAT_STOPPED)
    496				break;
    497		} else {
    498			value &= B43_DMA32_TXSTATE;
    499			if (value == B43_DMA32_TXSTAT_DISABLED ||
    500			    value == B43_DMA32_TXSTAT_IDLEWAIT ||
    501			    value == B43_DMA32_TXSTAT_STOPPED)
    502				break;
    503		}
    504		msleep(1);
    505	}
    506	offset = (type == B43_DMA_64BIT) ? B43_DMA64_TXCTL : B43_DMA32_TXCTL;
    507	b43_write32(dev, mmio_base + offset, 0);
    508	for (i = 0; i < 10; i++) {
    509		offset = (type == B43_DMA_64BIT) ? B43_DMA64_TXSTATUS :
    510						   B43_DMA32_TXSTATUS;
    511		value = b43_read32(dev, mmio_base + offset);
    512		if (type == B43_DMA_64BIT) {
    513			value &= B43_DMA64_TXSTAT;
    514			if (value == B43_DMA64_TXSTAT_DISABLED) {
    515				i = -1;
    516				break;
    517			}
    518		} else {
    519			value &= B43_DMA32_TXSTATE;
    520			if (value == B43_DMA32_TXSTAT_DISABLED) {
    521				i = -1;
    522				break;
    523			}
    524		}
    525		msleep(1);
    526	}
    527	if (i != -1) {
    528		b43err(dev->wl, "DMA TX reset timed out\n");
    529		return -ENODEV;
    530	}
    531	/* ensure the reset is completed. */
    532	msleep(1);
    533
    534	return 0;
    535}
    536
    537/* Check if a DMA mapping address is invalid. */
    538static bool b43_dma_mapping_error(struct b43_dmaring *ring,
    539				  dma_addr_t addr,
    540				  size_t buffersize, bool dma_to_device)
    541{
    542	if (unlikely(dma_mapping_error(ring->dev->dev->dma_dev, addr)))
    543		return true;
    544
    545	switch (ring->type) {
    546	case B43_DMA_30BIT:
    547		if ((u64)addr + buffersize > (1ULL << 30))
    548			goto address_error;
    549		break;
    550	case B43_DMA_32BIT:
    551		if ((u64)addr + buffersize > (1ULL << 32))
    552			goto address_error;
    553		break;
    554	case B43_DMA_64BIT:
    555		/* Currently we can't have addresses beyond
    556		 * 64bit in the kernel. */
    557		break;
    558	}
    559
    560	/* The address is OK. */
    561	return false;
    562
    563address_error:
    564	/* We can't support this address. Unmap it again. */
    565	unmap_descbuffer(ring, addr, buffersize, dma_to_device);
    566
    567	return true;
    568}
    569
    570static bool b43_rx_buffer_is_poisoned(struct b43_dmaring *ring, struct sk_buff *skb)
    571{
    572	unsigned char *f = skb->data + ring->frameoffset;
    573
    574	return ((f[0] & f[1] & f[2] & f[3] & f[4] & f[5] & f[6] & f[7]) == 0xFF);
    575}
    576
    577static void b43_poison_rx_buffer(struct b43_dmaring *ring, struct sk_buff *skb)
    578{
    579	struct b43_rxhdr_fw4 *rxhdr;
    580	unsigned char *frame;
    581
    582	/* This poisons the RX buffer to detect DMA failures. */
    583
    584	rxhdr = (struct b43_rxhdr_fw4 *)(skb->data);
    585	rxhdr->frame_len = 0;
    586
    587	B43_WARN_ON(ring->rx_buffersize < ring->frameoffset + sizeof(struct b43_plcp_hdr6) + 2);
    588	frame = skb->data + ring->frameoffset;
    589	memset(frame, 0xFF, sizeof(struct b43_plcp_hdr6) + 2 /* padding */);
    590}
    591
    592static int setup_rx_descbuffer(struct b43_dmaring *ring,
    593			       struct b43_dmadesc_generic *desc,
    594			       struct b43_dmadesc_meta *meta, gfp_t gfp_flags)
    595{
    596	dma_addr_t dmaaddr;
    597	struct sk_buff *skb;
    598
    599	B43_WARN_ON(ring->tx);
    600
    601	skb = __dev_alloc_skb(ring->rx_buffersize, gfp_flags);
    602	if (unlikely(!skb))
    603		return -ENOMEM;
    604	b43_poison_rx_buffer(ring, skb);
    605	dmaaddr = map_descbuffer(ring, skb->data, ring->rx_buffersize, 0);
    606	if (b43_dma_mapping_error(ring, dmaaddr, ring->rx_buffersize, 0)) {
    607		/* ugh. try to realloc in zone_dma */
    608		gfp_flags |= GFP_DMA;
    609
    610		dev_kfree_skb_any(skb);
    611
    612		skb = __dev_alloc_skb(ring->rx_buffersize, gfp_flags);
    613		if (unlikely(!skb))
    614			return -ENOMEM;
    615		b43_poison_rx_buffer(ring, skb);
    616		dmaaddr = map_descbuffer(ring, skb->data,
    617					 ring->rx_buffersize, 0);
    618		if (b43_dma_mapping_error(ring, dmaaddr, ring->rx_buffersize, 0)) {
    619			b43err(ring->dev->wl, "RX DMA buffer allocation failed\n");
    620			dev_kfree_skb_any(skb);
    621			return -EIO;
    622		}
    623	}
    624
    625	meta->skb = skb;
    626	meta->dmaaddr = dmaaddr;
    627	ring->ops->fill_descriptor(ring, desc, dmaaddr,
    628				   ring->rx_buffersize, 0, 0, 0);
    629
    630	return 0;
    631}
    632
    633/* Allocate the initial descbuffers.
    634 * This is used for an RX ring only.
    635 */
    636static int alloc_initial_descbuffers(struct b43_dmaring *ring)
    637{
    638	int i, err = -ENOMEM;
    639	struct b43_dmadesc_generic *desc;
    640	struct b43_dmadesc_meta *meta;
    641
    642	for (i = 0; i < ring->nr_slots; i++) {
    643		desc = ring->ops->idx2desc(ring, i, &meta);
    644
    645		err = setup_rx_descbuffer(ring, desc, meta, GFP_KERNEL);
    646		if (err) {
    647			b43err(ring->dev->wl,
    648			       "Failed to allocate initial descbuffers\n");
    649			goto err_unwind;
    650		}
    651	}
    652	mb();
    653	ring->used_slots = ring->nr_slots;
    654	err = 0;
    655      out:
    656	return err;
    657
    658      err_unwind:
    659	for (i--; i >= 0; i--) {
    660		desc = ring->ops->idx2desc(ring, i, &meta);
    661
    662		unmap_descbuffer(ring, meta->dmaaddr, ring->rx_buffersize, 0);
    663		dev_kfree_skb(meta->skb);
    664	}
    665	goto out;
    666}
    667
    668/* Do initial setup of the DMA controller.
    669 * Reset the controller, write the ring busaddress
    670 * and switch the "enable" bit on.
    671 */
    672static int dmacontroller_setup(struct b43_dmaring *ring)
    673{
    674	int err = 0;
    675	u32 value;
    676	u32 addrext;
    677	bool parity = ring->dev->dma.parity;
    678	u32 addrlo;
    679	u32 addrhi;
    680
    681	if (ring->tx) {
    682		if (ring->type == B43_DMA_64BIT) {
    683			u64 ringbase = (u64) (ring->dmabase);
    684			addrext = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_EXT);
    685			addrlo = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_LOW);
    686			addrhi = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_HIGH);
    687
    688			value = B43_DMA64_TXENABLE;
    689			value |= (addrext << B43_DMA64_TXADDREXT_SHIFT)
    690			    & B43_DMA64_TXADDREXT_MASK;
    691			if (!parity)
    692				value |= B43_DMA64_TXPARITYDISABLE;
    693			b43_dma_write(ring, B43_DMA64_TXCTL, value);
    694			b43_dma_write(ring, B43_DMA64_TXRINGLO, addrlo);
    695			b43_dma_write(ring, B43_DMA64_TXRINGHI, addrhi);
    696		} else {
    697			u32 ringbase = (u32) (ring->dmabase);
    698			addrext = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_EXT);
    699			addrlo = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_LOW);
    700
    701			value = B43_DMA32_TXENABLE;
    702			value |= (addrext << B43_DMA32_TXADDREXT_SHIFT)
    703			    & B43_DMA32_TXADDREXT_MASK;
    704			if (!parity)
    705				value |= B43_DMA32_TXPARITYDISABLE;
    706			b43_dma_write(ring, B43_DMA32_TXCTL, value);
    707			b43_dma_write(ring, B43_DMA32_TXRING, addrlo);
    708		}
    709	} else {
    710		err = alloc_initial_descbuffers(ring);
    711		if (err)
    712			goto out;
    713		if (ring->type == B43_DMA_64BIT) {
    714			u64 ringbase = (u64) (ring->dmabase);
    715			addrext = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_EXT);
    716			addrlo = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_LOW);
    717			addrhi = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_HIGH);
    718
    719			value = (ring->frameoffset << B43_DMA64_RXFROFF_SHIFT);
    720			value |= B43_DMA64_RXENABLE;
    721			value |= (addrext << B43_DMA64_RXADDREXT_SHIFT)
    722			    & B43_DMA64_RXADDREXT_MASK;
    723			if (!parity)
    724				value |= B43_DMA64_RXPARITYDISABLE;
    725			b43_dma_write(ring, B43_DMA64_RXCTL, value);
    726			b43_dma_write(ring, B43_DMA64_RXRINGLO, addrlo);
    727			b43_dma_write(ring, B43_DMA64_RXRINGHI, addrhi);
    728			b43_dma_write(ring, B43_DMA64_RXINDEX, ring->nr_slots *
    729				      sizeof(struct b43_dmadesc64));
    730		} else {
    731			u32 ringbase = (u32) (ring->dmabase);
    732			addrext = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_EXT);
    733			addrlo = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_LOW);
    734
    735			value = (ring->frameoffset << B43_DMA32_RXFROFF_SHIFT);
    736			value |= B43_DMA32_RXENABLE;
    737			value |= (addrext << B43_DMA32_RXADDREXT_SHIFT)
    738			    & B43_DMA32_RXADDREXT_MASK;
    739			if (!parity)
    740				value |= B43_DMA32_RXPARITYDISABLE;
    741			b43_dma_write(ring, B43_DMA32_RXCTL, value);
    742			b43_dma_write(ring, B43_DMA32_RXRING, addrlo);
    743			b43_dma_write(ring, B43_DMA32_RXINDEX, ring->nr_slots *
    744				      sizeof(struct b43_dmadesc32));
    745		}
    746	}
    747
    748out:
    749	return err;
    750}
    751
    752/* Shutdown the DMA controller. */
    753static void dmacontroller_cleanup(struct b43_dmaring *ring)
    754{
    755	if (ring->tx) {
    756		b43_dmacontroller_tx_reset(ring->dev, ring->mmio_base,
    757					   ring->type);
    758		if (ring->type == B43_DMA_64BIT) {
    759			b43_dma_write(ring, B43_DMA64_TXRINGLO, 0);
    760			b43_dma_write(ring, B43_DMA64_TXRINGHI, 0);
    761		} else
    762			b43_dma_write(ring, B43_DMA32_TXRING, 0);
    763	} else {
    764		b43_dmacontroller_rx_reset(ring->dev, ring->mmio_base,
    765					   ring->type);
    766		if (ring->type == B43_DMA_64BIT) {
    767			b43_dma_write(ring, B43_DMA64_RXRINGLO, 0);
    768			b43_dma_write(ring, B43_DMA64_RXRINGHI, 0);
    769		} else
    770			b43_dma_write(ring, B43_DMA32_RXRING, 0);
    771	}
    772}
    773
    774static void free_all_descbuffers(struct b43_dmaring *ring)
    775{
    776	struct b43_dmadesc_meta *meta;
    777	int i;
    778
    779	if (!ring->used_slots)
    780		return;
    781	for (i = 0; i < ring->nr_slots; i++) {
    782		/* get meta - ignore returned value */
    783		ring->ops->idx2desc(ring, i, &meta);
    784
    785		if (!meta->skb || b43_dma_ptr_is_poisoned(meta->skb)) {
    786			B43_WARN_ON(!ring->tx);
    787			continue;
    788		}
    789		if (ring->tx) {
    790			unmap_descbuffer(ring, meta->dmaaddr,
    791					 meta->skb->len, 1);
    792		} else {
    793			unmap_descbuffer(ring, meta->dmaaddr,
    794					 ring->rx_buffersize, 0);
    795		}
    796		free_descriptor_buffer(ring, meta);
    797	}
    798}
    799
    800static enum b43_dmatype b43_engine_type(struct b43_wldev *dev)
    801{
    802	u32 tmp;
    803	u16 mmio_base;
    804
    805	switch (dev->dev->bus_type) {
    806#ifdef CONFIG_B43_BCMA
    807	case B43_BUS_BCMA:
    808		tmp = bcma_aread32(dev->dev->bdev, BCMA_IOST);
    809		if (tmp & BCMA_IOST_DMA64)
    810			return B43_DMA_64BIT;
    811		break;
    812#endif
    813#ifdef CONFIG_B43_SSB
    814	case B43_BUS_SSB:
    815		tmp = ssb_read32(dev->dev->sdev, SSB_TMSHIGH);
    816		if (tmp & SSB_TMSHIGH_DMA64)
    817			return B43_DMA_64BIT;
    818		break;
    819#endif
    820	}
    821
    822	mmio_base = b43_dmacontroller_base(0, 0);
    823	b43_write32(dev, mmio_base + B43_DMA32_TXCTL, B43_DMA32_TXADDREXT_MASK);
    824	tmp = b43_read32(dev, mmio_base + B43_DMA32_TXCTL);
    825	if (tmp & B43_DMA32_TXADDREXT_MASK)
    826		return B43_DMA_32BIT;
    827	return B43_DMA_30BIT;
    828}
    829
    830/* Main initialization function. */
    831static
    832struct b43_dmaring *b43_setup_dmaring(struct b43_wldev *dev,
    833				      int controller_index,
    834				      int for_tx,
    835				      enum b43_dmatype type)
    836{
    837	struct b43_dmaring *ring;
    838	int i, err;
    839	dma_addr_t dma_test;
    840
    841	ring = kzalloc(sizeof(*ring), GFP_KERNEL);
    842	if (!ring)
    843		goto out;
    844
    845	ring->nr_slots = B43_RXRING_SLOTS;
    846	if (for_tx)
    847		ring->nr_slots = B43_TXRING_SLOTS;
    848
    849	ring->meta = kcalloc(ring->nr_slots, sizeof(struct b43_dmadesc_meta),
    850			     GFP_KERNEL);
    851	if (!ring->meta)
    852		goto err_kfree_ring;
    853	for (i = 0; i < ring->nr_slots; i++)
    854		ring->meta->skb = B43_DMA_PTR_POISON;
    855
    856	ring->type = type;
    857	ring->dev = dev;
    858	ring->mmio_base = b43_dmacontroller_base(type, controller_index);
    859	ring->index = controller_index;
    860	if (type == B43_DMA_64BIT)
    861		ring->ops = &dma64_ops;
    862	else
    863		ring->ops = &dma32_ops;
    864	if (for_tx) {
    865		ring->tx = true;
    866		ring->current_slot = -1;
    867	} else {
    868		if (ring->index == 0) {
    869			switch (dev->fw.hdr_format) {
    870			case B43_FW_HDR_598:
    871				ring->rx_buffersize = B43_DMA0_RX_FW598_BUFSIZE;
    872				ring->frameoffset = B43_DMA0_RX_FW598_FO;
    873				break;
    874			case B43_FW_HDR_410:
    875			case B43_FW_HDR_351:
    876				ring->rx_buffersize = B43_DMA0_RX_FW351_BUFSIZE;
    877				ring->frameoffset = B43_DMA0_RX_FW351_FO;
    878				break;
    879			}
    880		} else
    881			B43_WARN_ON(1);
    882	}
    883#ifdef CONFIG_B43_DEBUG
    884	ring->last_injected_overflow = jiffies;
    885#endif
    886
    887	if (for_tx) {
    888		/* Assumption: B43_TXRING_SLOTS can be divided by TX_SLOTS_PER_FRAME */
    889		BUILD_BUG_ON(B43_TXRING_SLOTS % TX_SLOTS_PER_FRAME != 0);
    890
    891		ring->txhdr_cache = kcalloc(ring->nr_slots / TX_SLOTS_PER_FRAME,
    892					    b43_txhdr_size(dev),
    893					    GFP_KERNEL);
    894		if (!ring->txhdr_cache)
    895			goto err_kfree_meta;
    896
    897		/* test for ability to dma to txhdr_cache */
    898		dma_test = dma_map_single(dev->dev->dma_dev,
    899					  ring->txhdr_cache,
    900					  b43_txhdr_size(dev),
    901					  DMA_TO_DEVICE);
    902
    903		if (b43_dma_mapping_error(ring, dma_test,
    904					  b43_txhdr_size(dev), 1)) {
    905			/* ugh realloc */
    906			kfree(ring->txhdr_cache);
    907			ring->txhdr_cache = kcalloc(ring->nr_slots / TX_SLOTS_PER_FRAME,
    908						    b43_txhdr_size(dev),
    909						    GFP_KERNEL | GFP_DMA);
    910			if (!ring->txhdr_cache)
    911				goto err_kfree_meta;
    912
    913			dma_test = dma_map_single(dev->dev->dma_dev,
    914						  ring->txhdr_cache,
    915						  b43_txhdr_size(dev),
    916						  DMA_TO_DEVICE);
    917
    918			if (b43_dma_mapping_error(ring, dma_test,
    919						  b43_txhdr_size(dev), 1)) {
    920
    921				b43err(dev->wl,
    922				       "TXHDR DMA allocation failed\n");
    923				goto err_kfree_txhdr_cache;
    924			}
    925		}
    926
    927		dma_unmap_single(dev->dev->dma_dev,
    928				 dma_test, b43_txhdr_size(dev),
    929				 DMA_TO_DEVICE);
    930	}
    931
    932	err = alloc_ringmemory(ring);
    933	if (err)
    934		goto err_kfree_txhdr_cache;
    935	err = dmacontroller_setup(ring);
    936	if (err)
    937		goto err_free_ringmemory;
    938
    939      out:
    940	return ring;
    941
    942      err_free_ringmemory:
    943	free_ringmemory(ring);
    944      err_kfree_txhdr_cache:
    945	kfree(ring->txhdr_cache);
    946      err_kfree_meta:
    947	kfree(ring->meta);
    948      err_kfree_ring:
    949	kfree(ring);
    950	ring = NULL;
    951	goto out;
    952}
    953
    954#define divide(a, b)	({	\
    955	typeof(a) __a = a;	\
    956	do_div(__a, b);		\
    957	__a;			\
    958  })
    959
    960#define modulo(a, b)	({	\
    961	typeof(a) __a = a;	\
    962	do_div(__a, b);		\
    963  })
    964
    965/* Main cleanup function. */
    966static void b43_destroy_dmaring(struct b43_dmaring *ring,
    967				const char *ringname)
    968{
    969	if (!ring)
    970		return;
    971
    972#ifdef CONFIG_B43_DEBUG
    973	{
    974		/* Print some statistics. */
    975		u64 failed_packets = ring->nr_failed_tx_packets;
    976		u64 succeed_packets = ring->nr_succeed_tx_packets;
    977		u64 nr_packets = failed_packets + succeed_packets;
    978		u64 permille_failed = 0, average_tries = 0;
    979
    980		if (nr_packets)
    981			permille_failed = divide(failed_packets * 1000, nr_packets);
    982		if (nr_packets)
    983			average_tries = divide(ring->nr_total_packet_tries * 100, nr_packets);
    984
    985		b43dbg(ring->dev->wl, "DMA-%u %s: "
    986		       "Used slots %d/%d, Failed frames %llu/%llu = %llu.%01llu%%, "
    987		       "Average tries %llu.%02llu\n",
    988		       (unsigned int)(ring->type), ringname,
    989		       ring->max_used_slots,
    990		       ring->nr_slots,
    991		       (unsigned long long)failed_packets,
    992		       (unsigned long long)nr_packets,
    993		       (unsigned long long)divide(permille_failed, 10),
    994		       (unsigned long long)modulo(permille_failed, 10),
    995		       (unsigned long long)divide(average_tries, 100),
    996		       (unsigned long long)modulo(average_tries, 100));
    997	}
    998#endif /* DEBUG */
    999
   1000	/* Device IRQs are disabled prior entering this function,
   1001	 * so no need to take care of concurrency with rx handler stuff.
   1002	 */
   1003	dmacontroller_cleanup(ring);
   1004	free_all_descbuffers(ring);
   1005	free_ringmemory(ring);
   1006
   1007	kfree(ring->txhdr_cache);
   1008	kfree(ring->meta);
   1009	kfree(ring);
   1010}
   1011
   1012#define destroy_ring(dma, ring) do {				\
   1013	b43_destroy_dmaring((dma)->ring, __stringify(ring));	\
   1014	(dma)->ring = NULL;					\
   1015    } while (0)
   1016
   1017void b43_dma_free(struct b43_wldev *dev)
   1018{
   1019	struct b43_dma *dma;
   1020
   1021	if (b43_using_pio_transfers(dev))
   1022		return;
   1023	dma = &dev->dma;
   1024
   1025	destroy_ring(dma, rx_ring);
   1026	destroy_ring(dma, tx_ring_AC_BK);
   1027	destroy_ring(dma, tx_ring_AC_BE);
   1028	destroy_ring(dma, tx_ring_AC_VI);
   1029	destroy_ring(dma, tx_ring_AC_VO);
   1030	destroy_ring(dma, tx_ring_mcast);
   1031}
   1032
   1033/* Some hardware with 64-bit DMA seems to be bugged and looks for translation
   1034 * bit in low address word instead of high one.
   1035 */
   1036static bool b43_dma_translation_in_low_word(struct b43_wldev *dev,
   1037					    enum b43_dmatype type)
   1038{
   1039	if (type != B43_DMA_64BIT)
   1040		return true;
   1041
   1042#ifdef CONFIG_B43_SSB
   1043	if (dev->dev->bus_type == B43_BUS_SSB &&
   1044	    dev->dev->sdev->bus->bustype == SSB_BUSTYPE_PCI &&
   1045	    !(pci_is_pcie(dev->dev->sdev->bus->host_pci) &&
   1046	      ssb_read32(dev->dev->sdev, SSB_TMSHIGH) & SSB_TMSHIGH_DMA64))
   1047			return true;
   1048#endif
   1049	return false;
   1050}
   1051
   1052int b43_dma_init(struct b43_wldev *dev)
   1053{
   1054	struct b43_dma *dma = &dev->dma;
   1055	enum b43_dmatype type = b43_engine_type(dev);
   1056	int err;
   1057
   1058	err = dma_set_mask_and_coherent(dev->dev->dma_dev, DMA_BIT_MASK(type));
   1059	if (err) {
   1060		b43err(dev->wl, "The machine/kernel does not support "
   1061		       "the required %u-bit DMA mask\n", type);
   1062		return err;
   1063	}
   1064
   1065	switch (dev->dev->bus_type) {
   1066#ifdef CONFIG_B43_BCMA
   1067	case B43_BUS_BCMA:
   1068		dma->translation = bcma_core_dma_translation(dev->dev->bdev);
   1069		break;
   1070#endif
   1071#ifdef CONFIG_B43_SSB
   1072	case B43_BUS_SSB:
   1073		dma->translation = ssb_dma_translation(dev->dev->sdev);
   1074		break;
   1075#endif
   1076	}
   1077	dma->translation_in_low = b43_dma_translation_in_low_word(dev, type);
   1078
   1079	dma->parity = true;
   1080#ifdef CONFIG_B43_BCMA
   1081	/* TODO: find out which SSB devices need disabling parity */
   1082	if (dev->dev->bus_type == B43_BUS_BCMA)
   1083		dma->parity = false;
   1084#endif
   1085
   1086	err = -ENOMEM;
   1087	/* setup TX DMA channels. */
   1088	dma->tx_ring_AC_BK = b43_setup_dmaring(dev, 0, 1, type);
   1089	if (!dma->tx_ring_AC_BK)
   1090		goto out;
   1091
   1092	dma->tx_ring_AC_BE = b43_setup_dmaring(dev, 1, 1, type);
   1093	if (!dma->tx_ring_AC_BE)
   1094		goto err_destroy_bk;
   1095
   1096	dma->tx_ring_AC_VI = b43_setup_dmaring(dev, 2, 1, type);
   1097	if (!dma->tx_ring_AC_VI)
   1098		goto err_destroy_be;
   1099
   1100	dma->tx_ring_AC_VO = b43_setup_dmaring(dev, 3, 1, type);
   1101	if (!dma->tx_ring_AC_VO)
   1102		goto err_destroy_vi;
   1103
   1104	dma->tx_ring_mcast = b43_setup_dmaring(dev, 4, 1, type);
   1105	if (!dma->tx_ring_mcast)
   1106		goto err_destroy_vo;
   1107
   1108	/* setup RX DMA channel. */
   1109	dma->rx_ring = b43_setup_dmaring(dev, 0, 0, type);
   1110	if (!dma->rx_ring)
   1111		goto err_destroy_mcast;
   1112
   1113	/* No support for the TX status DMA ring. */
   1114	B43_WARN_ON(dev->dev->core_rev < 5);
   1115
   1116	b43dbg(dev->wl, "%u-bit DMA initialized\n",
   1117	       (unsigned int)type);
   1118	err = 0;
   1119out:
   1120	return err;
   1121
   1122err_destroy_mcast:
   1123	destroy_ring(dma, tx_ring_mcast);
   1124err_destroy_vo:
   1125	destroy_ring(dma, tx_ring_AC_VO);
   1126err_destroy_vi:
   1127	destroy_ring(dma, tx_ring_AC_VI);
   1128err_destroy_be:
   1129	destroy_ring(dma, tx_ring_AC_BE);
   1130err_destroy_bk:
   1131	destroy_ring(dma, tx_ring_AC_BK);
   1132	return err;
   1133}
   1134
   1135/* Generate a cookie for the TX header. */
   1136static u16 generate_cookie(struct b43_dmaring *ring, int slot)
   1137{
   1138	u16 cookie;
   1139
   1140	/* Use the upper 4 bits of the cookie as
   1141	 * DMA controller ID and store the slot number
   1142	 * in the lower 12 bits.
   1143	 * Note that the cookie must never be 0, as this
   1144	 * is a special value used in RX path.
   1145	 * It can also not be 0xFFFF because that is special
   1146	 * for multicast frames.
   1147	 */
   1148	cookie = (((u16)ring->index + 1) << 12);
   1149	B43_WARN_ON(slot & ~0x0FFF);
   1150	cookie |= (u16)slot;
   1151
   1152	return cookie;
   1153}
   1154
   1155/* Inspect a cookie and find out to which controller/slot it belongs. */
   1156static
   1157struct b43_dmaring *parse_cookie(struct b43_wldev *dev, u16 cookie, int *slot)
   1158{
   1159	struct b43_dma *dma = &dev->dma;
   1160	struct b43_dmaring *ring = NULL;
   1161
   1162	switch (cookie & 0xF000) {
   1163	case 0x1000:
   1164		ring = dma->tx_ring_AC_BK;
   1165		break;
   1166	case 0x2000:
   1167		ring = dma->tx_ring_AC_BE;
   1168		break;
   1169	case 0x3000:
   1170		ring = dma->tx_ring_AC_VI;
   1171		break;
   1172	case 0x4000:
   1173		ring = dma->tx_ring_AC_VO;
   1174		break;
   1175	case 0x5000:
   1176		ring = dma->tx_ring_mcast;
   1177		break;
   1178	}
   1179	*slot = (cookie & 0x0FFF);
   1180	if (unlikely(!ring || *slot < 0 || *slot >= ring->nr_slots)) {
   1181		b43dbg(dev->wl, "TX-status contains "
   1182		       "invalid cookie: 0x%04X\n", cookie);
   1183		return NULL;
   1184	}
   1185
   1186	return ring;
   1187}
   1188
   1189static int dma_tx_fragment(struct b43_dmaring *ring,
   1190			   struct sk_buff *skb)
   1191{
   1192	const struct b43_dma_ops *ops = ring->ops;
   1193	struct ieee80211_tx_info *info = IEEE80211_SKB_CB(skb);
   1194	struct b43_private_tx_info *priv_info = b43_get_priv_tx_info(info);
   1195	u8 *header;
   1196	int slot, old_top_slot, old_used_slots;
   1197	int err;
   1198	struct b43_dmadesc_generic *desc;
   1199	struct b43_dmadesc_meta *meta;
   1200	struct b43_dmadesc_meta *meta_hdr;
   1201	u16 cookie;
   1202	size_t hdrsize = b43_txhdr_size(ring->dev);
   1203
   1204	/* Important note: If the number of used DMA slots per TX frame
   1205	 * is changed here, the TX_SLOTS_PER_FRAME definition at the top of
   1206	 * the file has to be updated, too!
   1207	 */
   1208
   1209	old_top_slot = ring->current_slot;
   1210	old_used_slots = ring->used_slots;
   1211
   1212	/* Get a slot for the header. */
   1213	slot = request_slot(ring);
   1214	desc = ops->idx2desc(ring, slot, &meta_hdr);
   1215	memset(meta_hdr, 0, sizeof(*meta_hdr));
   1216
   1217	header = &(ring->txhdr_cache[(slot / TX_SLOTS_PER_FRAME) * hdrsize]);
   1218	cookie = generate_cookie(ring, slot);
   1219	err = b43_generate_txhdr(ring->dev, header,
   1220				 skb, info, cookie);
   1221	if (unlikely(err)) {
   1222		ring->current_slot = old_top_slot;
   1223		ring->used_slots = old_used_slots;
   1224		return err;
   1225	}
   1226
   1227	meta_hdr->dmaaddr = map_descbuffer(ring, (unsigned char *)header,
   1228					   hdrsize, 1);
   1229	if (b43_dma_mapping_error(ring, meta_hdr->dmaaddr, hdrsize, 1)) {
   1230		ring->current_slot = old_top_slot;
   1231		ring->used_slots = old_used_slots;
   1232		return -EIO;
   1233	}
   1234	ops->fill_descriptor(ring, desc, meta_hdr->dmaaddr,
   1235			     hdrsize, 1, 0, 0);
   1236
   1237	/* Get a slot for the payload. */
   1238	slot = request_slot(ring);
   1239	desc = ops->idx2desc(ring, slot, &meta);
   1240	memset(meta, 0, sizeof(*meta));
   1241
   1242	meta->skb = skb;
   1243	meta->is_last_fragment = true;
   1244	priv_info->bouncebuffer = NULL;
   1245
   1246	meta->dmaaddr = map_descbuffer(ring, skb->data, skb->len, 1);
   1247	/* create a bounce buffer in zone_dma on mapping failure. */
   1248	if (b43_dma_mapping_error(ring, meta->dmaaddr, skb->len, 1)) {
   1249		priv_info->bouncebuffer = kmemdup(skb->data, skb->len,
   1250						  GFP_ATOMIC | GFP_DMA);
   1251		if (!priv_info->bouncebuffer) {
   1252			ring->current_slot = old_top_slot;
   1253			ring->used_slots = old_used_slots;
   1254			err = -ENOMEM;
   1255			goto out_unmap_hdr;
   1256		}
   1257
   1258		meta->dmaaddr = map_descbuffer(ring, priv_info->bouncebuffer, skb->len, 1);
   1259		if (b43_dma_mapping_error(ring, meta->dmaaddr, skb->len, 1)) {
   1260			kfree(priv_info->bouncebuffer);
   1261			priv_info->bouncebuffer = NULL;
   1262			ring->current_slot = old_top_slot;
   1263			ring->used_slots = old_used_slots;
   1264			err = -EIO;
   1265			goto out_unmap_hdr;
   1266		}
   1267	}
   1268
   1269	ops->fill_descriptor(ring, desc, meta->dmaaddr, skb->len, 0, 1, 1);
   1270
   1271	if (info->flags & IEEE80211_TX_CTL_SEND_AFTER_DTIM) {
   1272		/* Tell the firmware about the cookie of the last
   1273		 * mcast frame, so it can clear the more-data bit in it. */
   1274		b43_shm_write16(ring->dev, B43_SHM_SHARED,
   1275				B43_SHM_SH_MCASTCOOKIE, cookie);
   1276	}
   1277	/* Now transfer the whole frame. */
   1278	wmb();
   1279	ops->poke_tx(ring, next_slot(ring, slot));
   1280	return 0;
   1281
   1282out_unmap_hdr:
   1283	unmap_descbuffer(ring, meta_hdr->dmaaddr,
   1284			 hdrsize, 1);
   1285	return err;
   1286}
   1287
   1288static inline int should_inject_overflow(struct b43_dmaring *ring)
   1289{
   1290#ifdef CONFIG_B43_DEBUG
   1291	if (unlikely(b43_debug(ring->dev, B43_DBG_DMAOVERFLOW))) {
   1292		/* Check if we should inject another ringbuffer overflow
   1293		 * to test handling of this situation in the stack. */
   1294		unsigned long next_overflow;
   1295
   1296		next_overflow = ring->last_injected_overflow + HZ;
   1297		if (time_after(jiffies, next_overflow)) {
   1298			ring->last_injected_overflow = jiffies;
   1299			b43dbg(ring->dev->wl,
   1300			       "Injecting TX ring overflow on "
   1301			       "DMA controller %d\n", ring->index);
   1302			return 1;
   1303		}
   1304	}
   1305#endif /* CONFIG_B43_DEBUG */
   1306	return 0;
   1307}
   1308
   1309/* Static mapping of mac80211's queues (priorities) to b43 DMA rings. */
   1310static struct b43_dmaring *select_ring_by_priority(struct b43_wldev *dev,
   1311						   u8 queue_prio)
   1312{
   1313	struct b43_dmaring *ring;
   1314
   1315	if (dev->qos_enabled) {
   1316		/* 0 = highest priority */
   1317		switch (queue_prio) {
   1318		default:
   1319			B43_WARN_ON(1);
   1320			fallthrough;
   1321		case 0:
   1322			ring = dev->dma.tx_ring_AC_VO;
   1323			break;
   1324		case 1:
   1325			ring = dev->dma.tx_ring_AC_VI;
   1326			break;
   1327		case 2:
   1328			ring = dev->dma.tx_ring_AC_BE;
   1329			break;
   1330		case 3:
   1331			ring = dev->dma.tx_ring_AC_BK;
   1332			break;
   1333		}
   1334	} else
   1335		ring = dev->dma.tx_ring_AC_BE;
   1336
   1337	return ring;
   1338}
   1339
   1340int b43_dma_tx(struct b43_wldev *dev, struct sk_buff *skb)
   1341{
   1342	struct b43_dmaring *ring;
   1343	struct ieee80211_hdr *hdr;
   1344	int err = 0;
   1345	struct ieee80211_tx_info *info = IEEE80211_SKB_CB(skb);
   1346
   1347	hdr = (struct ieee80211_hdr *)skb->data;
   1348	if (info->flags & IEEE80211_TX_CTL_SEND_AFTER_DTIM) {
   1349		/* The multicast ring will be sent after the DTIM */
   1350		ring = dev->dma.tx_ring_mcast;
   1351		/* Set the more-data bit. Ucode will clear it on
   1352		 * the last frame for us. */
   1353		hdr->frame_control |= cpu_to_le16(IEEE80211_FCTL_MOREDATA);
   1354	} else {
   1355		/* Decide by priority where to put this frame. */
   1356		ring = select_ring_by_priority(
   1357			dev, skb_get_queue_mapping(skb));
   1358	}
   1359
   1360	B43_WARN_ON(!ring->tx);
   1361
   1362	if (unlikely(ring->stopped)) {
   1363		/* We get here only because of a bug in mac80211.
   1364		 * Because of a race, one packet may be queued after
   1365		 * the queue is stopped, thus we got called when we shouldn't.
   1366		 * For now, just refuse the transmit. */
   1367		if (b43_debug(dev, B43_DBG_DMAVERBOSE))
   1368			b43err(dev->wl, "Packet after queue stopped\n");
   1369		err = -ENOSPC;
   1370		goto out;
   1371	}
   1372
   1373	if (WARN_ON(free_slots(ring) < TX_SLOTS_PER_FRAME)) {
   1374		/* If we get here, we have a real error with the queue
   1375		 * full, but queues not stopped. */
   1376		b43err(dev->wl, "DMA queue overflow\n");
   1377		err = -ENOSPC;
   1378		goto out;
   1379	}
   1380
   1381	/* Assign the queue number to the ring (if not already done before)
   1382	 * so TX status handling can use it. The queue to ring mapping is
   1383	 * static, so we don't need to store it per frame. */
   1384	ring->queue_prio = skb_get_queue_mapping(skb);
   1385
   1386	err = dma_tx_fragment(ring, skb);
   1387	if (unlikely(err == -ENOKEY)) {
   1388		/* Drop this packet, as we don't have the encryption key
   1389		 * anymore and must not transmit it unencrypted. */
   1390		ieee80211_free_txskb(dev->wl->hw, skb);
   1391		err = 0;
   1392		goto out;
   1393	}
   1394	if (unlikely(err)) {
   1395		b43err(dev->wl, "DMA tx mapping failure\n");
   1396		goto out;
   1397	}
   1398	if ((free_slots(ring) < TX_SLOTS_PER_FRAME) ||
   1399	    should_inject_overflow(ring)) {
   1400		/* This TX ring is full. */
   1401		unsigned int skb_mapping = skb_get_queue_mapping(skb);
   1402		ieee80211_stop_queue(dev->wl->hw, skb_mapping);
   1403		dev->wl->tx_queue_stopped[skb_mapping] = true;
   1404		ring->stopped = true;
   1405		if (b43_debug(dev, B43_DBG_DMAVERBOSE)) {
   1406			b43dbg(dev->wl, "Stopped TX ring %d\n", ring->index);
   1407		}
   1408	}
   1409out:
   1410
   1411	return err;
   1412}
   1413
   1414void b43_dma_handle_txstatus(struct b43_wldev *dev,
   1415			     const struct b43_txstatus *status)
   1416{
   1417	const struct b43_dma_ops *ops;
   1418	struct b43_dmaring *ring;
   1419	struct b43_dmadesc_meta *meta;
   1420	static const struct b43_txstatus fake; /* filled with 0 */
   1421	const struct b43_txstatus *txstat;
   1422	int slot, firstused;
   1423	bool frame_succeed;
   1424	int skip;
   1425	static u8 err_out1;
   1426
   1427	ring = parse_cookie(dev, status->cookie, &slot);
   1428	if (unlikely(!ring))
   1429		return;
   1430	B43_WARN_ON(!ring->tx);
   1431
   1432	/* Sanity check: TX packets are processed in-order on one ring.
   1433	 * Check if the slot deduced from the cookie really is the first
   1434	 * used slot. */
   1435	firstused = ring->current_slot - ring->used_slots + 1;
   1436	if (firstused < 0)
   1437		firstused = ring->nr_slots + firstused;
   1438
   1439	skip = 0;
   1440	if (unlikely(slot != firstused)) {
   1441		/* This possibly is a firmware bug and will result in
   1442		 * malfunction, memory leaks and/or stall of DMA functionality.
   1443		 */
   1444		if (slot == next_slot(ring, next_slot(ring, firstused))) {
   1445			/* If a single header/data pair was missed, skip over
   1446			 * the first two slots in an attempt to recover.
   1447			 */
   1448			slot = firstused;
   1449			skip = 2;
   1450			if (!err_out1) {
   1451				/* Report the error once. */
   1452				b43dbg(dev->wl,
   1453				       "Skip on DMA ring %d slot %d.\n",
   1454				       ring->index, slot);
   1455				err_out1 = 1;
   1456			}
   1457		} else {
   1458			/* More than a single header/data pair were missed.
   1459			 * Report this error. If running with open-source
   1460			 * firmware, then reset the controller to
   1461			 * revive operation.
   1462			 */
   1463			b43dbg(dev->wl,
   1464			       "Out of order TX status report on DMA ring %d. Expected %d, but got %d\n",
   1465			       ring->index, firstused, slot);
   1466			if (dev->fw.opensource)
   1467				b43_controller_restart(dev, "Out of order TX");
   1468			return;
   1469		}
   1470	}
   1471
   1472	ops = ring->ops;
   1473	while (1) {
   1474		B43_WARN_ON(slot < 0 || slot >= ring->nr_slots);
   1475		/* get meta - ignore returned value */
   1476		ops->idx2desc(ring, slot, &meta);
   1477
   1478		if (b43_dma_ptr_is_poisoned(meta->skb)) {
   1479			b43dbg(dev->wl, "Poisoned TX slot %d (first=%d) "
   1480			       "on ring %d\n",
   1481			       slot, firstused, ring->index);
   1482			break;
   1483		}
   1484
   1485		if (meta->skb) {
   1486			struct b43_private_tx_info *priv_info =
   1487			     b43_get_priv_tx_info(IEEE80211_SKB_CB(meta->skb));
   1488
   1489			unmap_descbuffer(ring, meta->dmaaddr,
   1490					 meta->skb->len, 1);
   1491			kfree(priv_info->bouncebuffer);
   1492			priv_info->bouncebuffer = NULL;
   1493		} else {
   1494			unmap_descbuffer(ring, meta->dmaaddr,
   1495					 b43_txhdr_size(dev), 1);
   1496		}
   1497
   1498		if (meta->is_last_fragment) {
   1499			struct ieee80211_tx_info *info;
   1500
   1501			if (unlikely(!meta->skb)) {
   1502				/* This is a scatter-gather fragment of a frame,
   1503				 * so the skb pointer must not be NULL.
   1504				 */
   1505				b43dbg(dev->wl, "TX status unexpected NULL skb "
   1506				       "at slot %d (first=%d) on ring %d\n",
   1507				       slot, firstused, ring->index);
   1508				break;
   1509			}
   1510
   1511			info = IEEE80211_SKB_CB(meta->skb);
   1512
   1513			/*
   1514			 * Call back to inform the ieee80211 subsystem about
   1515			 * the status of the transmission. When skipping over
   1516			 * a missed TX status report, use a status structure
   1517			 * filled with zeros to indicate that the frame was not
   1518			 * sent (frame_count 0) and not acknowledged
   1519			 */
   1520			if (unlikely(skip))
   1521				txstat = &fake;
   1522			else
   1523				txstat = status;
   1524
   1525			frame_succeed = b43_fill_txstatus_report(dev, info,
   1526								 txstat);
   1527#ifdef CONFIG_B43_DEBUG
   1528			if (frame_succeed)
   1529				ring->nr_succeed_tx_packets++;
   1530			else
   1531				ring->nr_failed_tx_packets++;
   1532			ring->nr_total_packet_tries += status->frame_count;
   1533#endif /* DEBUG */
   1534			ieee80211_tx_status(dev->wl->hw, meta->skb);
   1535
   1536			/* skb will be freed by ieee80211_tx_status().
   1537			 * Poison our pointer. */
   1538			meta->skb = B43_DMA_PTR_POISON;
   1539		} else {
   1540			/* No need to call free_descriptor_buffer here, as
   1541			 * this is only the txhdr, which is not allocated.
   1542			 */
   1543			if (unlikely(meta->skb)) {
   1544				b43dbg(dev->wl, "TX status unexpected non-NULL skb "
   1545				       "at slot %d (first=%d) on ring %d\n",
   1546				       slot, firstused, ring->index);
   1547				break;
   1548			}
   1549		}
   1550
   1551		/* Everything unmapped and free'd. So it's not used anymore. */
   1552		ring->used_slots--;
   1553
   1554		if (meta->is_last_fragment && !skip) {
   1555			/* This is the last scatter-gather
   1556			 * fragment of the frame. We are done. */
   1557			break;
   1558		}
   1559		slot = next_slot(ring, slot);
   1560		if (skip > 0)
   1561			--skip;
   1562	}
   1563	if (ring->stopped) {
   1564		B43_WARN_ON(free_slots(ring) < TX_SLOTS_PER_FRAME);
   1565		ring->stopped = false;
   1566	}
   1567
   1568	if (dev->wl->tx_queue_stopped[ring->queue_prio]) {
   1569		dev->wl->tx_queue_stopped[ring->queue_prio] = false;
   1570	} else {
   1571		/* If the driver queue is running wake the corresponding
   1572		 * mac80211 queue. */
   1573		ieee80211_wake_queue(dev->wl->hw, ring->queue_prio);
   1574		if (b43_debug(dev, B43_DBG_DMAVERBOSE)) {
   1575			b43dbg(dev->wl, "Woke up TX ring %d\n", ring->index);
   1576		}
   1577	}
   1578	/* Add work to the queue. */
   1579	ieee80211_queue_work(dev->wl->hw, &dev->wl->tx_work);
   1580}
   1581
   1582static void dma_rx(struct b43_dmaring *ring, int *slot)
   1583{
   1584	const struct b43_dma_ops *ops = ring->ops;
   1585	struct b43_dmadesc_generic *desc;
   1586	struct b43_dmadesc_meta *meta;
   1587	struct b43_rxhdr_fw4 *rxhdr;
   1588	struct sk_buff *skb;
   1589	u16 len;
   1590	int err;
   1591	dma_addr_t dmaaddr;
   1592
   1593	desc = ops->idx2desc(ring, *slot, &meta);
   1594
   1595	sync_descbuffer_for_cpu(ring, meta->dmaaddr, ring->rx_buffersize);
   1596	skb = meta->skb;
   1597
   1598	rxhdr = (struct b43_rxhdr_fw4 *)skb->data;
   1599	len = le16_to_cpu(rxhdr->frame_len);
   1600	if (len == 0) {
   1601		int i = 0;
   1602
   1603		do {
   1604			udelay(2);
   1605			barrier();
   1606			len = le16_to_cpu(rxhdr->frame_len);
   1607		} while (len == 0 && i++ < 5);
   1608		if (unlikely(len == 0)) {
   1609			dmaaddr = meta->dmaaddr;
   1610			goto drop_recycle_buffer;
   1611		}
   1612	}
   1613	if (unlikely(b43_rx_buffer_is_poisoned(ring, skb))) {
   1614		/* Something went wrong with the DMA.
   1615		 * The device did not touch the buffer and did not overwrite the poison. */
   1616		b43dbg(ring->dev->wl, "DMA RX: Dropping poisoned buffer.\n");
   1617		dmaaddr = meta->dmaaddr;
   1618		goto drop_recycle_buffer;
   1619	}
   1620	if (unlikely(len + ring->frameoffset > ring->rx_buffersize)) {
   1621		/* The data did not fit into one descriptor buffer
   1622		 * and is split over multiple buffers.
   1623		 * This should never happen, as we try to allocate buffers
   1624		 * big enough. So simply ignore this packet.
   1625		 */
   1626		int cnt = 0;
   1627		s32 tmp = len;
   1628
   1629		while (1) {
   1630			desc = ops->idx2desc(ring, *slot, &meta);
   1631			/* recycle the descriptor buffer. */
   1632			b43_poison_rx_buffer(ring, meta->skb);
   1633			sync_descbuffer_for_device(ring, meta->dmaaddr,
   1634						   ring->rx_buffersize);
   1635			*slot = next_slot(ring, *slot);
   1636			cnt++;
   1637			tmp -= ring->rx_buffersize;
   1638			if (tmp <= 0)
   1639				break;
   1640		}
   1641		b43err(ring->dev->wl, "DMA RX buffer too small "
   1642		       "(len: %u, buffer: %u, nr-dropped: %d)\n",
   1643		       len, ring->rx_buffersize, cnt);
   1644		goto drop;
   1645	}
   1646
   1647	dmaaddr = meta->dmaaddr;
   1648	err = setup_rx_descbuffer(ring, desc, meta, GFP_ATOMIC);
   1649	if (unlikely(err)) {
   1650		b43dbg(ring->dev->wl, "DMA RX: setup_rx_descbuffer() failed\n");
   1651		goto drop_recycle_buffer;
   1652	}
   1653
   1654	unmap_descbuffer(ring, dmaaddr, ring->rx_buffersize, 0);
   1655	skb_put(skb, len + ring->frameoffset);
   1656	skb_pull(skb, ring->frameoffset);
   1657
   1658	b43_rx(ring->dev, skb, rxhdr);
   1659drop:
   1660	return;
   1661
   1662drop_recycle_buffer:
   1663	/* Poison and recycle the RX buffer. */
   1664	b43_poison_rx_buffer(ring, skb);
   1665	sync_descbuffer_for_device(ring, dmaaddr, ring->rx_buffersize);
   1666}
   1667
   1668void b43_dma_handle_rx_overflow(struct b43_dmaring *ring)
   1669{
   1670	int current_slot, previous_slot;
   1671
   1672	B43_WARN_ON(ring->tx);
   1673
   1674	/* Device has filled all buffers, drop all packets and let TCP
   1675	 * decrease speed.
   1676	 * Decrement RX index by one will let the device to see all slots
   1677	 * as free again
   1678	 */
   1679	/*
   1680	*TODO: How to increase rx_drop in mac80211?
   1681	*/
   1682	current_slot = ring->ops->get_current_rxslot(ring);
   1683	previous_slot = prev_slot(ring, current_slot);
   1684	ring->ops->set_current_rxslot(ring, previous_slot);
   1685}
   1686
   1687void b43_dma_rx(struct b43_dmaring *ring)
   1688{
   1689	const struct b43_dma_ops *ops = ring->ops;
   1690	int slot, current_slot;
   1691	int used_slots = 0;
   1692
   1693	B43_WARN_ON(ring->tx);
   1694	current_slot = ops->get_current_rxslot(ring);
   1695	B43_WARN_ON(!(current_slot >= 0 && current_slot < ring->nr_slots));
   1696
   1697	slot = ring->current_slot;
   1698	for (; slot != current_slot; slot = next_slot(ring, slot)) {
   1699		dma_rx(ring, &slot);
   1700		update_max_used_slots(ring, ++used_slots);
   1701	}
   1702	wmb();
   1703	ops->set_current_rxslot(ring, slot);
   1704	ring->current_slot = slot;
   1705}
   1706
   1707static void b43_dma_tx_suspend_ring(struct b43_dmaring *ring)
   1708{
   1709	B43_WARN_ON(!ring->tx);
   1710	ring->ops->tx_suspend(ring);
   1711}
   1712
   1713static void b43_dma_tx_resume_ring(struct b43_dmaring *ring)
   1714{
   1715	B43_WARN_ON(!ring->tx);
   1716	ring->ops->tx_resume(ring);
   1717}
   1718
   1719void b43_dma_tx_suspend(struct b43_wldev *dev)
   1720{
   1721	b43_power_saving_ctl_bits(dev, B43_PS_AWAKE);
   1722	b43_dma_tx_suspend_ring(dev->dma.tx_ring_AC_BK);
   1723	b43_dma_tx_suspend_ring(dev->dma.tx_ring_AC_BE);
   1724	b43_dma_tx_suspend_ring(dev->dma.tx_ring_AC_VI);
   1725	b43_dma_tx_suspend_ring(dev->dma.tx_ring_AC_VO);
   1726	b43_dma_tx_suspend_ring(dev->dma.tx_ring_mcast);
   1727}
   1728
   1729void b43_dma_tx_resume(struct b43_wldev *dev)
   1730{
   1731	b43_dma_tx_resume_ring(dev->dma.tx_ring_mcast);
   1732	b43_dma_tx_resume_ring(dev->dma.tx_ring_AC_VO);
   1733	b43_dma_tx_resume_ring(dev->dma.tx_ring_AC_VI);
   1734	b43_dma_tx_resume_ring(dev->dma.tx_ring_AC_BE);
   1735	b43_dma_tx_resume_ring(dev->dma.tx_ring_AC_BK);
   1736	b43_power_saving_ctl_bits(dev, 0);
   1737}
   1738
   1739static void direct_fifo_rx(struct b43_wldev *dev, enum b43_dmatype type,
   1740			   u16 mmio_base, bool enable)
   1741{
   1742	u32 ctl;
   1743
   1744	if (type == B43_DMA_64BIT) {
   1745		ctl = b43_read32(dev, mmio_base + B43_DMA64_RXCTL);
   1746		ctl &= ~B43_DMA64_RXDIRECTFIFO;
   1747		if (enable)
   1748			ctl |= B43_DMA64_RXDIRECTFIFO;
   1749		b43_write32(dev, mmio_base + B43_DMA64_RXCTL, ctl);
   1750	} else {
   1751		ctl = b43_read32(dev, mmio_base + B43_DMA32_RXCTL);
   1752		ctl &= ~B43_DMA32_RXDIRECTFIFO;
   1753		if (enable)
   1754			ctl |= B43_DMA32_RXDIRECTFIFO;
   1755		b43_write32(dev, mmio_base + B43_DMA32_RXCTL, ctl);
   1756	}
   1757}
   1758
   1759/* Enable/Disable Direct FIFO Receive Mode (PIO) on a RX engine.
   1760 * This is called from PIO code, so DMA structures are not available. */
   1761void b43_dma_direct_fifo_rx(struct b43_wldev *dev,
   1762			    unsigned int engine_index, bool enable)
   1763{
   1764	enum b43_dmatype type;
   1765	u16 mmio_base;
   1766
   1767	type = b43_engine_type(dev);
   1768
   1769	mmio_base = b43_dmacontroller_base(type, engine_index);
   1770	direct_fifo_rx(dev, type, mmio_base, enable);
   1771}