pio.h (11401B)
1/* SPDX-License-Identifier: GPL-2.0 or BSD-3-Clause */ 2/* 3 * Copyright(c) 2015-2017 Intel Corporation. 4 */ 5 6#ifndef _PIO_H 7#define _PIO_H 8/* send context types */ 9#define SC_KERNEL 0 10#define SC_VL15 1 11#define SC_ACK 2 12#define SC_USER 3 /* must be the last one: it may take all left */ 13#define SC_MAX 4 /* count of send context types */ 14 15/* invalid send context index */ 16#define INVALID_SCI 0xff 17 18/* PIO buffer release callback function */ 19typedef void (*pio_release_cb)(void *arg, int code); 20 21/* PIO release codes - in bits, as there could more than one that apply */ 22#define PRC_OK 0 /* no known error */ 23#define PRC_STATUS_ERR 0x01 /* credit return due to status error */ 24#define PRC_PBC 0x02 /* credit return due to PBC */ 25#define PRC_THRESHOLD 0x04 /* credit return due to threshold */ 26#define PRC_FILL_ERR 0x08 /* credit return due fill error */ 27#define PRC_FORCE 0x10 /* credit return due credit force */ 28#define PRC_SC_DISABLE 0x20 /* clean-up after a context disable */ 29 30/* byte helper */ 31union mix { 32 u64 val64; 33 u32 val32[2]; 34 u8 val8[8]; 35}; 36 37/* an allocated PIO buffer */ 38struct pio_buf { 39 struct send_context *sc;/* back pointer to owning send context */ 40 pio_release_cb cb; /* called when the buffer is released */ 41 void *arg; /* argument for cb */ 42 void __iomem *start; /* buffer start address */ 43 void __iomem *end; /* context end address */ 44 unsigned long sent_at; /* buffer is sent when <= free */ 45 union mix carry; /* pending unwritten bytes */ 46 u16 qw_written; /* QW written so far */ 47 u8 carry_bytes; /* number of valid bytes in carry */ 48}; 49 50/* cache line aligned pio buffer array */ 51union pio_shadow_ring { 52 struct pio_buf pbuf; 53} ____cacheline_aligned; 54 55/* per-NUMA send context */ 56struct send_context { 57 /* read-only after init */ 58 struct hfi1_devdata *dd; /* device */ 59 union pio_shadow_ring *sr; /* shadow ring */ 60 void __iomem *base_addr; /* start of PIO memory */ 61 u32 __percpu *buffers_allocated;/* count of buffers allocated */ 62 u32 size; /* context size, in bytes */ 63 64 int node; /* context home node */ 65 u32 sr_size; /* size of the shadow ring */ 66 u16 flags; /* flags */ 67 u8 type; /* context type */ 68 u8 sw_index; /* software index number */ 69 u8 hw_context; /* hardware context number */ 70 u8 group; /* credit return group */ 71 72 /* allocator fields */ 73 spinlock_t alloc_lock ____cacheline_aligned_in_smp; 74 u32 sr_head; /* shadow ring head */ 75 unsigned long fill; /* official alloc count */ 76 unsigned long alloc_free; /* copy of free (less cache thrash) */ 77 u32 fill_wrap; /* tracks fill within ring */ 78 u32 credits; /* number of blocks in context */ 79 /* adding a new field here would make it part of this cacheline */ 80 81 /* releaser fields */ 82 spinlock_t release_lock ____cacheline_aligned_in_smp; 83 u32 sr_tail; /* shadow ring tail */ 84 unsigned long free; /* official free count */ 85 volatile __le64 *hw_free; /* HW free counter */ 86 /* list for PIO waiters */ 87 struct list_head piowait ____cacheline_aligned_in_smp; 88 seqlock_t waitlock; 89 90 spinlock_t credit_ctrl_lock ____cacheline_aligned_in_smp; 91 u32 credit_intr_count; /* count of credit intr users */ 92 u64 credit_ctrl; /* cache for credit control */ 93 wait_queue_head_t halt_wait; /* wait until kernel sees interrupt */ 94 struct work_struct halt_work; /* halted context work queue entry */ 95}; 96 97/* send context flags */ 98#define SCF_ENABLED 0x01 99#define SCF_IN_FREE 0x02 100#define SCF_HALTED 0x04 101#define SCF_FROZEN 0x08 102#define SCF_LINK_DOWN 0x10 103 104struct send_context_info { 105 struct send_context *sc; /* allocated working context */ 106 u16 allocated; /* has this been allocated? */ 107 u16 type; /* context type */ 108 u16 base; /* base in PIO array */ 109 u16 credits; /* size in PIO array */ 110}; 111 112/* DMA credit return, index is always (context & 0x7) */ 113struct credit_return { 114 volatile __le64 cr[8]; 115}; 116 117/* NUMA indexed credit return array */ 118struct credit_return_base { 119 struct credit_return *va; 120 dma_addr_t dma; 121}; 122 123/* send context configuration sizes (one per type) */ 124struct sc_config_sizes { 125 short int size; 126 short int count; 127}; 128 129/* 130 * The diagram below details the relationship of the mapping structures 131 * 132 * Since the mapping now allows for non-uniform send contexts per vl, the 133 * number of send contexts for a vl is either the vl_scontexts[vl] or 134 * a computation based on num_kernel_send_contexts/num_vls: 135 * 136 * For example: 137 * nactual = vl_scontexts ? vl_scontexts[vl] : num_kernel_send_contexts/num_vls 138 * 139 * n = roundup to next highest power of 2 using nactual 140 * 141 * In the case where there are num_kernel_send_contexts/num_vls doesn't divide 142 * evenly, the extras are added from the last vl downward. 143 * 144 * For the case where n > nactual, the send contexts are assigned 145 * in a round robin fashion wrapping back to the first send context 146 * for a particular vl. 147 * 148 * dd->pio_map 149 * | pio_map_elem[0] 150 * | +--------------------+ 151 * v | mask | 152 * pio_vl_map |--------------------| 153 * +--------------------------+ | ksc[0] -> sc 1 | 154 * | list (RCU) | |--------------------| 155 * |--------------------------| ->| ksc[1] -> sc 2 | 156 * | mask | --/ |--------------------| 157 * |--------------------------| -/ | * | 158 * | actual_vls (max 8) | -/ |--------------------| 159 * |--------------------------| --/ | ksc[n-1] -> sc n | 160 * | vls (max 8) | -/ +--------------------+ 161 * |--------------------------| --/ 162 * | map[0] |-/ 163 * |--------------------------| +--------------------+ 164 * | map[1] |--- | mask | 165 * |--------------------------| \---- |--------------------| 166 * | * | \-- | ksc[0] -> sc 1+n | 167 * | * | \---- |--------------------| 168 * | * | \->| ksc[1] -> sc 2+n | 169 * |--------------------------| |--------------------| 170 * | map[vls - 1] |- | * | 171 * +--------------------------+ \- |--------------------| 172 * \- | ksc[m-1] -> sc m+n | 173 * \ +--------------------+ 174 * \- 175 * \ 176 * \- +----------------------+ 177 * \- | mask | 178 * \ |----------------------| 179 * \- | ksc[0] -> sc 1+m+n | 180 * \- |----------------------| 181 * >| ksc[1] -> sc 2+m+n | 182 * |----------------------| 183 * | * | 184 * |----------------------| 185 * | ksc[o-1] -> sc o+m+n | 186 * +----------------------+ 187 * 188 */ 189 190/* Initial number of send contexts per VL */ 191#define INIT_SC_PER_VL 2 192 193/* 194 * struct pio_map_elem - mapping for a vl 195 * @mask - selector mask 196 * @ksc - array of kernel send contexts for this vl 197 * 198 * The mask is used to "mod" the selector to 199 * produce index into the trailing array of 200 * kscs 201 */ 202struct pio_map_elem { 203 u32 mask; 204 struct send_context *ksc[]; 205}; 206 207/* 208 * struct pio_vl_map - mapping for a vl 209 * @list - rcu head for free callback 210 * @mask - vl mask to "mod" the vl to produce an index to map array 211 * @actual_vls - number of vls 212 * @vls - numbers of vls rounded to next power of 2 213 * @map - array of pio_map_elem entries 214 * 215 * This is the parent mapping structure. The trailing members of the 216 * struct point to pio_map_elem entries, which in turn point to an 217 * array of kscs for that vl. 218 */ 219struct pio_vl_map { 220 struct rcu_head list; 221 u32 mask; 222 u8 actual_vls; 223 u8 vls; 224 struct pio_map_elem *map[]; 225}; 226 227int pio_map_init(struct hfi1_devdata *dd, u8 port, u8 num_vls, 228 u8 *vl_scontexts); 229void free_pio_map(struct hfi1_devdata *dd); 230struct send_context *pio_select_send_context_vl(struct hfi1_devdata *dd, 231 u32 selector, u8 vl); 232struct send_context *pio_select_send_context_sc(struct hfi1_devdata *dd, 233 u32 selector, u8 sc5); 234 235/* send context functions */ 236int init_credit_return(struct hfi1_devdata *dd); 237void free_credit_return(struct hfi1_devdata *dd); 238int init_sc_pools_and_sizes(struct hfi1_devdata *dd); 239int init_send_contexts(struct hfi1_devdata *dd); 240int init_pervl_scs(struct hfi1_devdata *dd); 241struct send_context *sc_alloc(struct hfi1_devdata *dd, int type, 242 uint hdrqentsize, int numa); 243void sc_free(struct send_context *sc); 244int sc_enable(struct send_context *sc); 245void sc_disable(struct send_context *sc); 246int sc_restart(struct send_context *sc); 247void sc_return_credits(struct send_context *sc); 248void sc_flush(struct send_context *sc); 249void sc_drop(struct send_context *sc); 250void sc_stop(struct send_context *sc, int bit); 251struct pio_buf *sc_buffer_alloc(struct send_context *sc, u32 dw_len, 252 pio_release_cb cb, void *arg); 253void sc_release_update(struct send_context *sc); 254void sc_group_release_update(struct hfi1_devdata *dd, u32 hw_context); 255void sc_add_credit_return_intr(struct send_context *sc); 256void sc_del_credit_return_intr(struct send_context *sc); 257void sc_set_cr_threshold(struct send_context *sc, u32 new_threshold); 258u32 sc_percent_to_threshold(struct send_context *sc, u32 percent); 259u32 sc_mtu_to_threshold(struct send_context *sc, u32 mtu, u32 hdrqentsize); 260void hfi1_sc_wantpiobuf_intr(struct send_context *sc, u32 needint); 261void sc_wait(struct hfi1_devdata *dd); 262void set_pio_integrity(struct send_context *sc); 263 264/* support functions */ 265void pio_reset_all(struct hfi1_devdata *dd); 266void pio_freeze(struct hfi1_devdata *dd); 267void pio_kernel_unfreeze(struct hfi1_devdata *dd); 268void pio_kernel_linkup(struct hfi1_devdata *dd); 269 270/* global PIO send control operations */ 271#define PSC_GLOBAL_ENABLE 0 272#define PSC_GLOBAL_DISABLE 1 273#define PSC_GLOBAL_VLARB_ENABLE 2 274#define PSC_GLOBAL_VLARB_DISABLE 3 275#define PSC_CM_RESET 4 276#define PSC_DATA_VL_ENABLE 5 277#define PSC_DATA_VL_DISABLE 6 278 279void __cm_reset(struct hfi1_devdata *dd, u64 sendctrl); 280void pio_send_control(struct hfi1_devdata *dd, int op); 281 282/* PIO copy routines */ 283void pio_copy(struct hfi1_devdata *dd, struct pio_buf *pbuf, u64 pbc, 284 const void *from, size_t count); 285void seg_pio_copy_start(struct pio_buf *pbuf, u64 pbc, 286 const void *from, size_t nbytes); 287void seg_pio_copy_mid(struct pio_buf *pbuf, const void *from, size_t nbytes); 288void seg_pio_copy_end(struct pio_buf *pbuf); 289 290void seqfile_dump_sci(struct seq_file *s, u32 i, 291 struct send_context_info *sci); 292 293#endif /* _PIO_H */