cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

vas-window.c (41532B)


      1// SPDX-License-Identifier: GPL-2.0-or-later
      2/*
      3 * Copyright 2016-17 IBM Corp.
      4 */
      5
      6#define pr_fmt(fmt) "vas: " fmt
      7
      8#include <linux/types.h>
      9#include <linux/mutex.h>
     10#include <linux/slab.h>
     11#include <linux/io.h>
     12#include <linux/log2.h>
     13#include <linux/rcupdate.h>
     14#include <linux/cred.h>
     15#include <linux/sched/mm.h>
     16#include <linux/mmu_context.h>
     17#include <asm/switch_to.h>
     18#include <asm/ppc-opcode.h>
     19#include <asm/vas.h>
     20#include "vas.h"
     21#include "copy-paste.h"
     22
     23#define CREATE_TRACE_POINTS
     24#include "vas-trace.h"
     25
     26/*
     27 * Compute the paste address region for the window @window using the
     28 * ->paste_base_addr and ->paste_win_id_shift we got from device tree.
     29 */
     30void vas_win_paste_addr(struct pnv_vas_window *window, u64 *addr, int *len)
     31{
     32	int winid;
     33	u64 base, shift;
     34
     35	base = window->vinst->paste_base_addr;
     36	shift = window->vinst->paste_win_id_shift;
     37	winid = window->vas_win.winid;
     38
     39	*addr  = base + (winid << shift);
     40	if (len)
     41		*len = PAGE_SIZE;
     42
     43	pr_debug("Txwin #%d: Paste addr 0x%llx\n", winid, *addr);
     44}
     45
     46static inline void get_hvwc_mmio_bar(struct pnv_vas_window *window,
     47			u64 *start, int *len)
     48{
     49	u64 pbaddr;
     50
     51	pbaddr = window->vinst->hvwc_bar_start;
     52	*start = pbaddr + window->vas_win.winid * VAS_HVWC_SIZE;
     53	*len = VAS_HVWC_SIZE;
     54}
     55
     56static inline void get_uwc_mmio_bar(struct pnv_vas_window *window,
     57			u64 *start, int *len)
     58{
     59	u64 pbaddr;
     60
     61	pbaddr = window->vinst->uwc_bar_start;
     62	*start = pbaddr + window->vas_win.winid * VAS_UWC_SIZE;
     63	*len = VAS_UWC_SIZE;
     64}
     65
     66/*
     67 * Map the paste bus address of the given send window into kernel address
     68 * space. Unlike MMIO regions (map_mmio_region() below), paste region must
     69 * be mapped cache-able and is only applicable to send windows.
     70 */
     71static void *map_paste_region(struct pnv_vas_window *txwin)
     72{
     73	int len;
     74	void *map;
     75	char *name;
     76	u64 start;
     77
     78	name = kasprintf(GFP_KERNEL, "window-v%d-w%d", txwin->vinst->vas_id,
     79				txwin->vas_win.winid);
     80	if (!name)
     81		goto free_name;
     82
     83	txwin->paste_addr_name = name;
     84	vas_win_paste_addr(txwin, &start, &len);
     85
     86	if (!request_mem_region(start, len, name)) {
     87		pr_devel("%s(): request_mem_region(0x%llx, %d) failed\n",
     88				__func__, start, len);
     89		goto free_name;
     90	}
     91
     92	map = ioremap_cache(start, len);
     93	if (!map) {
     94		pr_devel("%s(): ioremap_cache(0x%llx, %d) failed\n", __func__,
     95				start, len);
     96		goto free_name;
     97	}
     98
     99	pr_devel("Mapped paste addr 0x%llx to kaddr 0x%p\n", start, map);
    100	return map;
    101
    102free_name:
    103	kfree(name);
    104	return ERR_PTR(-ENOMEM);
    105}
    106
    107static void *map_mmio_region(char *name, u64 start, int len)
    108{
    109	void *map;
    110
    111	if (!request_mem_region(start, len, name)) {
    112		pr_devel("%s(): request_mem_region(0x%llx, %d) failed\n",
    113				__func__, start, len);
    114		return NULL;
    115	}
    116
    117	map = ioremap(start, len);
    118	if (!map) {
    119		pr_devel("%s(): ioremap(0x%llx, %d) failed\n", __func__, start,
    120				len);
    121		return NULL;
    122	}
    123
    124	return map;
    125}
    126
    127static void unmap_region(void *addr, u64 start, int len)
    128{
    129	iounmap(addr);
    130	release_mem_region((phys_addr_t)start, len);
    131}
    132
    133/*
    134 * Unmap the paste address region for a window.
    135 */
    136static void unmap_paste_region(struct pnv_vas_window *window)
    137{
    138	int len;
    139	u64 busaddr_start;
    140
    141	if (window->paste_kaddr) {
    142		vas_win_paste_addr(window, &busaddr_start, &len);
    143		unmap_region(window->paste_kaddr, busaddr_start, len);
    144		window->paste_kaddr = NULL;
    145		kfree(window->paste_addr_name);
    146		window->paste_addr_name = NULL;
    147	}
    148}
    149
    150/*
    151 * Unmap the MMIO regions for a window. Hold the vas_mutex so we don't
    152 * unmap when the window's debugfs dir is in use. This serializes close
    153 * of a window even on another VAS instance but since its not a critical
    154 * path, just minimize the time we hold the mutex for now. We can add
    155 * a per-instance mutex later if necessary.
    156 */
    157static void unmap_winctx_mmio_bars(struct pnv_vas_window *window)
    158{
    159	int len;
    160	void *uwc_map;
    161	void *hvwc_map;
    162	u64 busaddr_start;
    163
    164	mutex_lock(&vas_mutex);
    165
    166	hvwc_map = window->hvwc_map;
    167	window->hvwc_map = NULL;
    168
    169	uwc_map = window->uwc_map;
    170	window->uwc_map = NULL;
    171
    172	mutex_unlock(&vas_mutex);
    173
    174	if (hvwc_map) {
    175		get_hvwc_mmio_bar(window, &busaddr_start, &len);
    176		unmap_region(hvwc_map, busaddr_start, len);
    177	}
    178
    179	if (uwc_map) {
    180		get_uwc_mmio_bar(window, &busaddr_start, &len);
    181		unmap_region(uwc_map, busaddr_start, len);
    182	}
    183}
    184
    185/*
    186 * Find the Hypervisor Window Context (HVWC) MMIO Base Address Region and the
    187 * OS/User Window Context (UWC) MMIO Base Address Region for the given window.
    188 * Map these bus addresses and save the mapped kernel addresses in @window.
    189 */
    190static int map_winctx_mmio_bars(struct pnv_vas_window *window)
    191{
    192	int len;
    193	u64 start;
    194
    195	get_hvwc_mmio_bar(window, &start, &len);
    196	window->hvwc_map = map_mmio_region("HVWCM_Window", start, len);
    197
    198	get_uwc_mmio_bar(window, &start, &len);
    199	window->uwc_map = map_mmio_region("UWCM_Window", start, len);
    200
    201	if (!window->hvwc_map || !window->uwc_map) {
    202		unmap_winctx_mmio_bars(window);
    203		return -1;
    204	}
    205
    206	return 0;
    207}
    208
    209/*
    210 * Reset all valid registers in the HV and OS/User Window Contexts for
    211 * the window identified by @window.
    212 *
    213 * NOTE: We cannot really use a for loop to reset window context. Not all
    214 *	 offsets in a window context are valid registers and the valid
    215 *	 registers are not sequential. And, we can only write to offsets
    216 *	 with valid registers.
    217 */
    218static void reset_window_regs(struct pnv_vas_window *window)
    219{
    220	write_hvwc_reg(window, VREG(LPID), 0ULL);
    221	write_hvwc_reg(window, VREG(PID), 0ULL);
    222	write_hvwc_reg(window, VREG(XLATE_MSR), 0ULL);
    223	write_hvwc_reg(window, VREG(XLATE_LPCR), 0ULL);
    224	write_hvwc_reg(window, VREG(XLATE_CTL), 0ULL);
    225	write_hvwc_reg(window, VREG(AMR), 0ULL);
    226	write_hvwc_reg(window, VREG(SEIDR), 0ULL);
    227	write_hvwc_reg(window, VREG(FAULT_TX_WIN), 0ULL);
    228	write_hvwc_reg(window, VREG(OSU_INTR_SRC_RA), 0ULL);
    229	write_hvwc_reg(window, VREG(HV_INTR_SRC_RA), 0ULL);
    230	write_hvwc_reg(window, VREG(PSWID), 0ULL);
    231	write_hvwc_reg(window, VREG(LFIFO_BAR), 0ULL);
    232	write_hvwc_reg(window, VREG(LDATA_STAMP_CTL), 0ULL);
    233	write_hvwc_reg(window, VREG(LDMA_CACHE_CTL), 0ULL);
    234	write_hvwc_reg(window, VREG(LRFIFO_PUSH), 0ULL);
    235	write_hvwc_reg(window, VREG(CURR_MSG_COUNT), 0ULL);
    236	write_hvwc_reg(window, VREG(LNOTIFY_AFTER_COUNT), 0ULL);
    237	write_hvwc_reg(window, VREG(LRX_WCRED), 0ULL);
    238	write_hvwc_reg(window, VREG(LRX_WCRED_ADDER), 0ULL);
    239	write_hvwc_reg(window, VREG(TX_WCRED), 0ULL);
    240	write_hvwc_reg(window, VREG(TX_WCRED_ADDER), 0ULL);
    241	write_hvwc_reg(window, VREG(LFIFO_SIZE), 0ULL);
    242	write_hvwc_reg(window, VREG(WINCTL), 0ULL);
    243	write_hvwc_reg(window, VREG(WIN_STATUS), 0ULL);
    244	write_hvwc_reg(window, VREG(WIN_CTX_CACHING_CTL), 0ULL);
    245	write_hvwc_reg(window, VREG(TX_RSVD_BUF_COUNT), 0ULL);
    246	write_hvwc_reg(window, VREG(LRFIFO_WIN_PTR), 0ULL);
    247	write_hvwc_reg(window, VREG(LNOTIFY_CTL), 0ULL);
    248	write_hvwc_reg(window, VREG(LNOTIFY_PID), 0ULL);
    249	write_hvwc_reg(window, VREG(LNOTIFY_LPID), 0ULL);
    250	write_hvwc_reg(window, VREG(LNOTIFY_TID), 0ULL);
    251	write_hvwc_reg(window, VREG(LNOTIFY_SCOPE), 0ULL);
    252	write_hvwc_reg(window, VREG(NX_UTIL_ADDER), 0ULL);
    253
    254	/* Skip read-only registers: NX_UTIL and NX_UTIL_SE */
    255
    256	/*
    257	 * The send and receive window credit adder registers are also
    258	 * accessible from HVWC and have been initialized above. We don't
    259	 * need to initialize from the OS/User Window Context, so skip
    260	 * following calls:
    261	 *
    262	 *	write_uwc_reg(window, VREG(TX_WCRED_ADDER), 0ULL);
    263	 *	write_uwc_reg(window, VREG(LRX_WCRED_ADDER), 0ULL);
    264	 */
    265}
    266
    267/*
    268 * Initialize window context registers related to Address Translation.
    269 * These registers are common to send/receive windows although they
    270 * differ for user/kernel windows. As we resolve the TODOs we may
    271 * want to add fields to vas_winctx and move the initialization to
    272 * init_vas_winctx_regs().
    273 */
    274static void init_xlate_regs(struct pnv_vas_window *window, bool user_win)
    275{
    276	u64 lpcr, val;
    277
    278	/*
    279	 * MSR_TA, MSR_US are false for both kernel and user.
    280	 * MSR_DR and MSR_PR are false for kernel.
    281	 */
    282	val = 0ULL;
    283	val = SET_FIELD(VAS_XLATE_MSR_HV, val, 1);
    284	val = SET_FIELD(VAS_XLATE_MSR_SF, val, 1);
    285	if (user_win) {
    286		val = SET_FIELD(VAS_XLATE_MSR_DR, val, 1);
    287		val = SET_FIELD(VAS_XLATE_MSR_PR, val, 1);
    288	}
    289	write_hvwc_reg(window, VREG(XLATE_MSR), val);
    290
    291	lpcr = mfspr(SPRN_LPCR);
    292	val = 0ULL;
    293	/*
    294	 * NOTE: From Section 5.7.8.1 Segment Lookaside Buffer of the
    295	 *	 Power ISA, v3.0B, Page size encoding is 0 = 4KB, 5 = 64KB.
    296	 *
    297	 * NOTE: From Section 1.3.1, Address Translation Context of the
    298	 *	 Nest MMU Workbook, LPCR_SC should be 0 for Power9.
    299	 */
    300	val = SET_FIELD(VAS_XLATE_LPCR_PAGE_SIZE, val, 5);
    301	val = SET_FIELD(VAS_XLATE_LPCR_ISL, val, lpcr & LPCR_ISL);
    302	val = SET_FIELD(VAS_XLATE_LPCR_TC, val, lpcr & LPCR_TC);
    303	val = SET_FIELD(VAS_XLATE_LPCR_SC, val, 0);
    304	write_hvwc_reg(window, VREG(XLATE_LPCR), val);
    305
    306	/*
    307	 * Section 1.3.1 (Address translation Context) of NMMU workbook.
    308	 *	0b00	Hashed Page Table mode
    309	 *	0b01	Reserved
    310	 *	0b10	Radix on HPT
    311	 *	0b11	Radix on Radix
    312	 */
    313	val = 0ULL;
    314	val = SET_FIELD(VAS_XLATE_MODE, val, radix_enabled() ? 3 : 2);
    315	write_hvwc_reg(window, VREG(XLATE_CTL), val);
    316
    317	/*
    318	 * TODO: Can we mfspr(AMR) even for user windows?
    319	 */
    320	val = 0ULL;
    321	val = SET_FIELD(VAS_AMR, val, mfspr(SPRN_AMR));
    322	write_hvwc_reg(window, VREG(AMR), val);
    323
    324	val = 0ULL;
    325	val = SET_FIELD(VAS_SEIDR, val, 0);
    326	write_hvwc_reg(window, VREG(SEIDR), val);
    327}
    328
    329/*
    330 * Initialize Reserved Send Buffer Count for the send window. It involves
    331 * writing to the register, reading it back to confirm that the hardware
    332 * has enough buffers to reserve. See section 1.3.1.2.1 of VAS workbook.
    333 *
    334 * Since we can only make a best-effort attempt to fulfill the request,
    335 * we don't return any errors if we cannot.
    336 *
    337 * TODO: Reserved (aka dedicated) send buffers are not supported yet.
    338 */
    339static void init_rsvd_tx_buf_count(struct pnv_vas_window *txwin,
    340				struct vas_winctx *winctx)
    341{
    342	write_hvwc_reg(txwin, VREG(TX_RSVD_BUF_COUNT), 0ULL);
    343}
    344
    345/*
    346 * init_winctx_regs()
    347 *	Initialize window context registers for a receive window.
    348 *	Except for caching control and marking window open, the registers
    349 *	are initialized in the order listed in Section 3.1.4 (Window Context
    350 *	Cache Register Details) of the VAS workbook although they don't need
    351 *	to be.
    352 *
    353 * Design note: For NX receive windows, NX allocates the FIFO buffer in OPAL
    354 *	(so that it can get a large contiguous area) and passes that buffer
    355 *	to kernel via device tree. We now write that buffer address to the
    356 *	FIFO BAR. Would it make sense to do this all in OPAL? i.e have OPAL
    357 *	write the per-chip RX FIFO addresses to the windows during boot-up
    358 *	as a one-time task? That could work for NX but what about other
    359 *	receivers?  Let the receivers tell us the rx-fifo buffers for now.
    360 */
    361static void init_winctx_regs(struct pnv_vas_window *window,
    362			     struct vas_winctx *winctx)
    363{
    364	u64 val;
    365	int fifo_size;
    366
    367	reset_window_regs(window);
    368
    369	val = 0ULL;
    370	val = SET_FIELD(VAS_LPID, val, winctx->lpid);
    371	write_hvwc_reg(window, VREG(LPID), val);
    372
    373	val = 0ULL;
    374	val = SET_FIELD(VAS_PID_ID, val, winctx->pidr);
    375	write_hvwc_reg(window, VREG(PID), val);
    376
    377	init_xlate_regs(window, winctx->user_win);
    378
    379	val = 0ULL;
    380	val = SET_FIELD(VAS_FAULT_TX_WIN, val, winctx->fault_win_id);
    381	write_hvwc_reg(window, VREG(FAULT_TX_WIN), val);
    382
    383	/* In PowerNV, interrupts go to HV. */
    384	write_hvwc_reg(window, VREG(OSU_INTR_SRC_RA), 0ULL);
    385
    386	val = 0ULL;
    387	val = SET_FIELD(VAS_HV_INTR_SRC_RA, val, winctx->irq_port);
    388	write_hvwc_reg(window, VREG(HV_INTR_SRC_RA), val);
    389
    390	val = 0ULL;
    391	val = SET_FIELD(VAS_PSWID_EA_HANDLE, val, winctx->pswid);
    392	write_hvwc_reg(window, VREG(PSWID), val);
    393
    394	write_hvwc_reg(window, VREG(SPARE1), 0ULL);
    395	write_hvwc_reg(window, VREG(SPARE2), 0ULL);
    396	write_hvwc_reg(window, VREG(SPARE3), 0ULL);
    397
    398	/*
    399	 * NOTE: VAS expects the FIFO address to be copied into the LFIFO_BAR
    400	 *	 register as is - do NOT shift the address into VAS_LFIFO_BAR
    401	 *	 bit fields! Ok to set the page migration select fields -
    402	 *	 VAS ignores the lower 10+ bits in the address anyway, because
    403	 *	 the minimum FIFO size is 1K?
    404	 *
    405	 * See also: Design note in function header.
    406	 */
    407	val = winctx->rx_fifo;
    408	val = SET_FIELD(VAS_PAGE_MIGRATION_SELECT, val, 0);
    409	write_hvwc_reg(window, VREG(LFIFO_BAR), val);
    410
    411	val = 0ULL;
    412	val = SET_FIELD(VAS_LDATA_STAMP, val, winctx->data_stamp);
    413	write_hvwc_reg(window, VREG(LDATA_STAMP_CTL), val);
    414
    415	val = 0ULL;
    416	val = SET_FIELD(VAS_LDMA_TYPE, val, winctx->dma_type);
    417	val = SET_FIELD(VAS_LDMA_FIFO_DISABLE, val, winctx->fifo_disable);
    418	write_hvwc_reg(window, VREG(LDMA_CACHE_CTL), val);
    419
    420	write_hvwc_reg(window, VREG(LRFIFO_PUSH), 0ULL);
    421	write_hvwc_reg(window, VREG(CURR_MSG_COUNT), 0ULL);
    422	write_hvwc_reg(window, VREG(LNOTIFY_AFTER_COUNT), 0ULL);
    423
    424	val = 0ULL;
    425	val = SET_FIELD(VAS_LRX_WCRED, val, winctx->wcreds_max);
    426	write_hvwc_reg(window, VREG(LRX_WCRED), val);
    427
    428	val = 0ULL;
    429	val = SET_FIELD(VAS_TX_WCRED, val, winctx->wcreds_max);
    430	write_hvwc_reg(window, VREG(TX_WCRED), val);
    431
    432	write_hvwc_reg(window, VREG(LRX_WCRED_ADDER), 0ULL);
    433	write_hvwc_reg(window, VREG(TX_WCRED_ADDER), 0ULL);
    434
    435	fifo_size = winctx->rx_fifo_size / 1024;
    436
    437	val = 0ULL;
    438	val = SET_FIELD(VAS_LFIFO_SIZE, val, ilog2(fifo_size));
    439	write_hvwc_reg(window, VREG(LFIFO_SIZE), val);
    440
    441	/* Update window control and caching control registers last so
    442	 * we mark the window open only after fully initializing it and
    443	 * pushing context to cache.
    444	 */
    445
    446	write_hvwc_reg(window, VREG(WIN_STATUS), 0ULL);
    447
    448	init_rsvd_tx_buf_count(window, winctx);
    449
    450	/* for a send window, point to the matching receive window */
    451	val = 0ULL;
    452	val = SET_FIELD(VAS_LRX_WIN_ID, val, winctx->rx_win_id);
    453	write_hvwc_reg(window, VREG(LRFIFO_WIN_PTR), val);
    454
    455	write_hvwc_reg(window, VREG(SPARE4), 0ULL);
    456
    457	val = 0ULL;
    458	val = SET_FIELD(VAS_NOTIFY_DISABLE, val, winctx->notify_disable);
    459	val = SET_FIELD(VAS_INTR_DISABLE, val, winctx->intr_disable);
    460	val = SET_FIELD(VAS_NOTIFY_EARLY, val, winctx->notify_early);
    461	val = SET_FIELD(VAS_NOTIFY_OSU_INTR, val, winctx->notify_os_intr_reg);
    462	write_hvwc_reg(window, VREG(LNOTIFY_CTL), val);
    463
    464	val = 0ULL;
    465	val = SET_FIELD(VAS_LNOTIFY_PID, val, winctx->lnotify_pid);
    466	write_hvwc_reg(window, VREG(LNOTIFY_PID), val);
    467
    468	val = 0ULL;
    469	val = SET_FIELD(VAS_LNOTIFY_LPID, val, winctx->lnotify_lpid);
    470	write_hvwc_reg(window, VREG(LNOTIFY_LPID), val);
    471
    472	val = 0ULL;
    473	val = SET_FIELD(VAS_LNOTIFY_TID, val, winctx->lnotify_tid);
    474	write_hvwc_reg(window, VREG(LNOTIFY_TID), val);
    475
    476	val = 0ULL;
    477	val = SET_FIELD(VAS_LNOTIFY_MIN_SCOPE, val, winctx->min_scope);
    478	val = SET_FIELD(VAS_LNOTIFY_MAX_SCOPE, val, winctx->max_scope);
    479	write_hvwc_reg(window, VREG(LNOTIFY_SCOPE), val);
    480
    481	/* Skip read-only registers NX_UTIL and NX_UTIL_SE */
    482
    483	write_hvwc_reg(window, VREG(SPARE5), 0ULL);
    484	write_hvwc_reg(window, VREG(NX_UTIL_ADDER), 0ULL);
    485	write_hvwc_reg(window, VREG(SPARE6), 0ULL);
    486
    487	/* Finally, push window context to memory and... */
    488	val = 0ULL;
    489	val = SET_FIELD(VAS_PUSH_TO_MEM, val, 1);
    490	write_hvwc_reg(window, VREG(WIN_CTX_CACHING_CTL), val);
    491
    492	/* ... mark the window open for business */
    493	val = 0ULL;
    494	val = SET_FIELD(VAS_WINCTL_REJ_NO_CREDIT, val, winctx->rej_no_credit);
    495	val = SET_FIELD(VAS_WINCTL_PIN, val, winctx->pin_win);
    496	val = SET_FIELD(VAS_WINCTL_TX_WCRED_MODE, val, winctx->tx_wcred_mode);
    497	val = SET_FIELD(VAS_WINCTL_RX_WCRED_MODE, val, winctx->rx_wcred_mode);
    498	val = SET_FIELD(VAS_WINCTL_TX_WORD_MODE, val, winctx->tx_word_mode);
    499	val = SET_FIELD(VAS_WINCTL_RX_WORD_MODE, val, winctx->rx_word_mode);
    500	val = SET_FIELD(VAS_WINCTL_FAULT_WIN, val, winctx->fault_win);
    501	val = SET_FIELD(VAS_WINCTL_NX_WIN, val, winctx->nx_win);
    502	val = SET_FIELD(VAS_WINCTL_OPEN, val, 1);
    503	write_hvwc_reg(window, VREG(WINCTL), val);
    504}
    505
    506static void vas_release_window_id(struct ida *ida, int winid)
    507{
    508	ida_free(ida, winid);
    509}
    510
    511static int vas_assign_window_id(struct ida *ida)
    512{
    513	int winid = ida_alloc_max(ida, VAS_WINDOWS_PER_CHIP - 1, GFP_KERNEL);
    514
    515	if (winid == -ENOSPC) {
    516		pr_err("Too many (%d) open windows\n", VAS_WINDOWS_PER_CHIP);
    517		return -EAGAIN;
    518	}
    519
    520	return winid;
    521}
    522
    523static void vas_window_free(struct pnv_vas_window *window)
    524{
    525	struct vas_instance *vinst = window->vinst;
    526	int winid = window->vas_win.winid;
    527
    528	unmap_winctx_mmio_bars(window);
    529
    530	vas_window_free_dbgdir(window);
    531
    532	kfree(window);
    533
    534	vas_release_window_id(&vinst->ida, winid);
    535}
    536
    537static struct pnv_vas_window *vas_window_alloc(struct vas_instance *vinst)
    538{
    539	int winid;
    540	struct pnv_vas_window *window;
    541
    542	winid = vas_assign_window_id(&vinst->ida);
    543	if (winid < 0)
    544		return ERR_PTR(winid);
    545
    546	window = kzalloc(sizeof(*window), GFP_KERNEL);
    547	if (!window)
    548		goto out_free;
    549
    550	window->vinst = vinst;
    551	window->vas_win.winid = winid;
    552
    553	if (map_winctx_mmio_bars(window))
    554		goto out_free;
    555
    556	vas_window_init_dbgdir(window);
    557
    558	return window;
    559
    560out_free:
    561	kfree(window);
    562	vas_release_window_id(&vinst->ida, winid);
    563	return ERR_PTR(-ENOMEM);
    564}
    565
    566static void put_rx_win(struct pnv_vas_window *rxwin)
    567{
    568	/* Better not be a send window! */
    569	WARN_ON_ONCE(rxwin->tx_win);
    570
    571	atomic_dec(&rxwin->num_txwins);
    572}
    573
    574/*
    575 * Find the user space receive window given the @pswid.
    576 *      - We must have a valid vasid and it must belong to this instance.
    577 *        (so both send and receive windows are on the same VAS instance)
    578 *      - The window must refer to an OPEN, FTW, RECEIVE window.
    579 *
    580 * NOTE: We access ->windows[] table and assume that vinst->mutex is held.
    581 */
    582static struct pnv_vas_window *get_user_rxwin(struct vas_instance *vinst,
    583					     u32 pswid)
    584{
    585	int vasid, winid;
    586	struct pnv_vas_window *rxwin;
    587
    588	decode_pswid(pswid, &vasid, &winid);
    589
    590	if (vinst->vas_id != vasid)
    591		return ERR_PTR(-EINVAL);
    592
    593	rxwin = vinst->windows[winid];
    594
    595	if (!rxwin || rxwin->tx_win || rxwin->vas_win.cop != VAS_COP_TYPE_FTW)
    596		return ERR_PTR(-EINVAL);
    597
    598	return rxwin;
    599}
    600
    601/*
    602 * Get the VAS receive window associated with NX engine identified
    603 * by @cop and if applicable, @pswid.
    604 *
    605 * See also function header of set_vinst_win().
    606 */
    607static struct pnv_vas_window *get_vinst_rxwin(struct vas_instance *vinst,
    608			enum vas_cop_type cop, u32 pswid)
    609{
    610	struct pnv_vas_window *rxwin;
    611
    612	mutex_lock(&vinst->mutex);
    613
    614	if (cop == VAS_COP_TYPE_FTW)
    615		rxwin = get_user_rxwin(vinst, pswid);
    616	else
    617		rxwin = vinst->rxwin[cop] ?: ERR_PTR(-EINVAL);
    618
    619	if (!IS_ERR(rxwin))
    620		atomic_inc(&rxwin->num_txwins);
    621
    622	mutex_unlock(&vinst->mutex);
    623
    624	return rxwin;
    625}
    626
    627/*
    628 * We have two tables of windows in a VAS instance. The first one,
    629 * ->windows[], contains all the windows in the instance and allows
    630 * looking up a window by its id. It is used to look up send windows
    631 * during fault handling and receive windows when pairing user space
    632 * send/receive windows.
    633 *
    634 * The second table, ->rxwin[], contains receive windows that are
    635 * associated with NX engines. This table has VAS_COP_TYPE_MAX
    636 * entries and is used to look up a receive window by its
    637 * coprocessor type.
    638 *
    639 * Here, we save @window in the ->windows[] table. If it is a receive
    640 * window, we also save the window in the ->rxwin[] table.
    641 */
    642static void set_vinst_win(struct vas_instance *vinst,
    643			struct pnv_vas_window *window)
    644{
    645	int id = window->vas_win.winid;
    646
    647	mutex_lock(&vinst->mutex);
    648
    649	/*
    650	 * There should only be one receive window for a coprocessor type
    651	 * unless its a user (FTW) window.
    652	 */
    653	if (!window->user_win && !window->tx_win) {
    654		WARN_ON_ONCE(vinst->rxwin[window->vas_win.cop]);
    655		vinst->rxwin[window->vas_win.cop] = window;
    656	}
    657
    658	WARN_ON_ONCE(vinst->windows[id] != NULL);
    659	vinst->windows[id] = window;
    660
    661	mutex_unlock(&vinst->mutex);
    662}
    663
    664/*
    665 * Clear this window from the table(s) of windows for this VAS instance.
    666 * See also function header of set_vinst_win().
    667 */
    668static void clear_vinst_win(struct pnv_vas_window *window)
    669{
    670	int id = window->vas_win.winid;
    671	struct vas_instance *vinst = window->vinst;
    672
    673	mutex_lock(&vinst->mutex);
    674
    675	if (!window->user_win && !window->tx_win) {
    676		WARN_ON_ONCE(!vinst->rxwin[window->vas_win.cop]);
    677		vinst->rxwin[window->vas_win.cop] = NULL;
    678	}
    679
    680	WARN_ON_ONCE(vinst->windows[id] != window);
    681	vinst->windows[id] = NULL;
    682
    683	mutex_unlock(&vinst->mutex);
    684}
    685
    686static void init_winctx_for_rxwin(struct pnv_vas_window *rxwin,
    687			struct vas_rx_win_attr *rxattr,
    688			struct vas_winctx *winctx)
    689{
    690	/*
    691	 * We first zero (memset()) all fields and only set non-zero fields.
    692	 * Following fields are 0/false but maybe deserve a comment:
    693	 *
    694	 *	->notify_os_intr_reg	In powerNV, send intrs to HV
    695	 *	->notify_disable	False for NX windows
    696	 *	->intr_disable		False for Fault Windows
    697	 *	->xtra_write		False for NX windows
    698	 *	->notify_early		NA for NX windows
    699	 *	->rsvd_txbuf_count	NA for Rx windows
    700	 *	->lpid, ->pid, ->tid	NA for Rx windows
    701	 */
    702
    703	memset(winctx, 0, sizeof(struct vas_winctx));
    704
    705	winctx->rx_fifo = rxattr->rx_fifo;
    706	winctx->rx_fifo_size = rxattr->rx_fifo_size;
    707	winctx->wcreds_max = rxwin->vas_win.wcreds_max;
    708	winctx->pin_win = rxattr->pin_win;
    709
    710	winctx->nx_win = rxattr->nx_win;
    711	winctx->fault_win = rxattr->fault_win;
    712	winctx->user_win = rxattr->user_win;
    713	winctx->rej_no_credit = rxattr->rej_no_credit;
    714	winctx->rx_word_mode = rxattr->rx_win_ord_mode;
    715	winctx->tx_word_mode = rxattr->tx_win_ord_mode;
    716	winctx->rx_wcred_mode = rxattr->rx_wcred_mode;
    717	winctx->tx_wcred_mode = rxattr->tx_wcred_mode;
    718	winctx->notify_early = rxattr->notify_early;
    719
    720	if (winctx->nx_win) {
    721		winctx->data_stamp = true;
    722		winctx->intr_disable = true;
    723		winctx->pin_win = true;
    724
    725		WARN_ON_ONCE(winctx->fault_win);
    726		WARN_ON_ONCE(!winctx->rx_word_mode);
    727		WARN_ON_ONCE(!winctx->tx_word_mode);
    728		WARN_ON_ONCE(winctx->notify_after_count);
    729	} else if (winctx->fault_win) {
    730		winctx->notify_disable = true;
    731	} else if (winctx->user_win) {
    732		/*
    733		 * Section 1.8.1 Low Latency Core-Core Wake up of
    734		 * the VAS workbook:
    735		 *
    736		 *      - disable credit checks ([tr]x_wcred_mode = false)
    737		 *      - disable FIFO writes
    738		 *      - enable ASB_Notify, disable interrupt
    739		 */
    740		winctx->fifo_disable = true;
    741		winctx->intr_disable = true;
    742		winctx->rx_fifo = 0;
    743	}
    744
    745	winctx->lnotify_lpid = rxattr->lnotify_lpid;
    746	winctx->lnotify_pid = rxattr->lnotify_pid;
    747	winctx->lnotify_tid = rxattr->lnotify_tid;
    748	winctx->pswid = rxattr->pswid;
    749	winctx->dma_type = VAS_DMA_TYPE_INJECT;
    750	winctx->tc_mode = rxattr->tc_mode;
    751
    752	winctx->min_scope = VAS_SCOPE_LOCAL;
    753	winctx->max_scope = VAS_SCOPE_VECTORED_GROUP;
    754	if (rxwin->vinst->virq)
    755		winctx->irq_port = rxwin->vinst->irq_port;
    756}
    757
    758static bool rx_win_args_valid(enum vas_cop_type cop,
    759			struct vas_rx_win_attr *attr)
    760{
    761	pr_debug("Rxattr: fault %d, notify %d, intr %d, early %d, fifo %d\n",
    762			attr->fault_win, attr->notify_disable,
    763			attr->intr_disable, attr->notify_early,
    764			attr->rx_fifo_size);
    765
    766	if (cop >= VAS_COP_TYPE_MAX)
    767		return false;
    768
    769	if (cop != VAS_COP_TYPE_FTW &&
    770				attr->rx_fifo_size < VAS_RX_FIFO_SIZE_MIN)
    771		return false;
    772
    773	if (attr->rx_fifo_size > VAS_RX_FIFO_SIZE_MAX)
    774		return false;
    775
    776	if (!attr->wcreds_max)
    777		return false;
    778
    779	if (attr->nx_win) {
    780		/* cannot be fault or user window if it is nx */
    781		if (attr->fault_win || attr->user_win)
    782			return false;
    783		/*
    784		 * Section 3.1.4.32: NX Windows must not disable notification,
    785		 *	and must not enable interrupts or early notification.
    786		 */
    787		if (attr->notify_disable || !attr->intr_disable ||
    788				attr->notify_early)
    789			return false;
    790	} else if (attr->fault_win) {
    791		/* cannot be both fault and user window */
    792		if (attr->user_win)
    793			return false;
    794
    795		/*
    796		 * Section 3.1.4.32: Fault windows must disable notification
    797		 *	but not interrupts.
    798		 */
    799		if (!attr->notify_disable || attr->intr_disable)
    800			return false;
    801
    802	} else if (attr->user_win) {
    803		/*
    804		 * User receive windows are only for fast-thread-wakeup
    805		 * (FTW). They don't need a FIFO and must disable interrupts
    806		 */
    807		if (attr->rx_fifo || attr->rx_fifo_size || !attr->intr_disable)
    808			return false;
    809	} else {
    810		/* Rx window must be one of NX or Fault or User window. */
    811		return false;
    812	}
    813
    814	return true;
    815}
    816
    817void vas_init_rx_win_attr(struct vas_rx_win_attr *rxattr, enum vas_cop_type cop)
    818{
    819	memset(rxattr, 0, sizeof(*rxattr));
    820
    821	if (cop == VAS_COP_TYPE_842 || cop == VAS_COP_TYPE_842_HIPRI ||
    822		cop == VAS_COP_TYPE_GZIP || cop == VAS_COP_TYPE_GZIP_HIPRI) {
    823		rxattr->pin_win = true;
    824		rxattr->nx_win = true;
    825		rxattr->fault_win = false;
    826		rxattr->intr_disable = true;
    827		rxattr->rx_wcred_mode = true;
    828		rxattr->tx_wcred_mode = true;
    829		rxattr->rx_win_ord_mode = true;
    830		rxattr->tx_win_ord_mode = true;
    831	} else if (cop == VAS_COP_TYPE_FAULT) {
    832		rxattr->pin_win = true;
    833		rxattr->fault_win = true;
    834		rxattr->notify_disable = true;
    835		rxattr->rx_wcred_mode = true;
    836		rxattr->rx_win_ord_mode = true;
    837		rxattr->rej_no_credit = true;
    838		rxattr->tc_mode = VAS_THRESH_DISABLED;
    839	} else if (cop == VAS_COP_TYPE_FTW) {
    840		rxattr->user_win = true;
    841		rxattr->intr_disable = true;
    842
    843		/*
    844		 * As noted in the VAS Workbook we disable credit checks.
    845		 * If we enable credit checks in the future, we must also
    846		 * implement a mechanism to return the user credits or new
    847		 * paste operations will fail.
    848		 */
    849	}
    850}
    851EXPORT_SYMBOL_GPL(vas_init_rx_win_attr);
    852
    853struct vas_window *vas_rx_win_open(int vasid, enum vas_cop_type cop,
    854			struct vas_rx_win_attr *rxattr)
    855{
    856	struct pnv_vas_window *rxwin;
    857	struct vas_winctx winctx;
    858	struct vas_instance *vinst;
    859
    860	trace_vas_rx_win_open(current, vasid, cop, rxattr);
    861
    862	if (!rx_win_args_valid(cop, rxattr))
    863		return ERR_PTR(-EINVAL);
    864
    865	vinst = find_vas_instance(vasid);
    866	if (!vinst) {
    867		pr_devel("vasid %d not found!\n", vasid);
    868		return ERR_PTR(-EINVAL);
    869	}
    870	pr_devel("Found instance %d\n", vasid);
    871
    872	rxwin = vas_window_alloc(vinst);
    873	if (IS_ERR(rxwin)) {
    874		pr_devel("Unable to allocate memory for Rx window\n");
    875		return (struct vas_window *)rxwin;
    876	}
    877
    878	rxwin->tx_win = false;
    879	rxwin->nx_win = rxattr->nx_win;
    880	rxwin->user_win = rxattr->user_win;
    881	rxwin->vas_win.cop = cop;
    882	rxwin->vas_win.wcreds_max = rxattr->wcreds_max;
    883
    884	init_winctx_for_rxwin(rxwin, rxattr, &winctx);
    885	init_winctx_regs(rxwin, &winctx);
    886
    887	set_vinst_win(vinst, rxwin);
    888
    889	return &rxwin->vas_win;
    890}
    891EXPORT_SYMBOL_GPL(vas_rx_win_open);
    892
    893void vas_init_tx_win_attr(struct vas_tx_win_attr *txattr, enum vas_cop_type cop)
    894{
    895	memset(txattr, 0, sizeof(*txattr));
    896
    897	if (cop == VAS_COP_TYPE_842 || cop == VAS_COP_TYPE_842_HIPRI ||
    898		cop == VAS_COP_TYPE_GZIP || cop == VAS_COP_TYPE_GZIP_HIPRI) {
    899		txattr->rej_no_credit = false;
    900		txattr->rx_wcred_mode = true;
    901		txattr->tx_wcred_mode = true;
    902		txattr->rx_win_ord_mode = true;
    903		txattr->tx_win_ord_mode = true;
    904	} else if (cop == VAS_COP_TYPE_FTW) {
    905		txattr->user_win = true;
    906	}
    907}
    908EXPORT_SYMBOL_GPL(vas_init_tx_win_attr);
    909
    910static void init_winctx_for_txwin(struct pnv_vas_window *txwin,
    911			struct vas_tx_win_attr *txattr,
    912			struct vas_winctx *winctx)
    913{
    914	/*
    915	 * We first zero all fields and only set non-zero ones. Following
    916	 * are some fields set to 0/false for the stated reason:
    917	 *
    918	 *	->notify_os_intr_reg	In powernv, send intrs to HV
    919	 *	->rsvd_txbuf_count	Not supported yet.
    920	 *	->notify_disable	False for NX windows
    921	 *	->xtra_write		False for NX windows
    922	 *	->notify_early		NA for NX windows
    923	 *	->lnotify_lpid		NA for Tx windows
    924	 *	->lnotify_pid		NA for Tx windows
    925	 *	->lnotify_tid		NA for Tx windows
    926	 *	->tx_win_cred_mode	Ignore for now for NX windows
    927	 *	->rx_win_cred_mode	Ignore for now for NX windows
    928	 */
    929	memset(winctx, 0, sizeof(struct vas_winctx));
    930
    931	winctx->wcreds_max = txwin->vas_win.wcreds_max;
    932
    933	winctx->user_win = txattr->user_win;
    934	winctx->nx_win = txwin->rxwin->nx_win;
    935	winctx->pin_win = txattr->pin_win;
    936	winctx->rej_no_credit = txattr->rej_no_credit;
    937	winctx->rsvd_txbuf_enable = txattr->rsvd_txbuf_enable;
    938
    939	winctx->rx_wcred_mode = txattr->rx_wcred_mode;
    940	winctx->tx_wcred_mode = txattr->tx_wcred_mode;
    941	winctx->rx_word_mode = txattr->rx_win_ord_mode;
    942	winctx->tx_word_mode = txattr->tx_win_ord_mode;
    943	winctx->rsvd_txbuf_count = txattr->rsvd_txbuf_count;
    944
    945	winctx->intr_disable = true;
    946	if (winctx->nx_win)
    947		winctx->data_stamp = true;
    948
    949	winctx->lpid = txattr->lpid;
    950	winctx->pidr = txattr->pidr;
    951	winctx->rx_win_id = txwin->rxwin->vas_win.winid;
    952	/*
    953	 * IRQ and fault window setup is successful. Set fault window
    954	 * for the send window so that ready to handle faults.
    955	 */
    956	if (txwin->vinst->virq)
    957		winctx->fault_win_id = txwin->vinst->fault_win->vas_win.winid;
    958
    959	winctx->dma_type = VAS_DMA_TYPE_INJECT;
    960	winctx->tc_mode = txattr->tc_mode;
    961	winctx->min_scope = VAS_SCOPE_LOCAL;
    962	winctx->max_scope = VAS_SCOPE_VECTORED_GROUP;
    963	if (txwin->vinst->virq)
    964		winctx->irq_port = txwin->vinst->irq_port;
    965
    966	winctx->pswid = txattr->pswid ? txattr->pswid :
    967			encode_pswid(txwin->vinst->vas_id,
    968			txwin->vas_win.winid);
    969}
    970
    971static bool tx_win_args_valid(enum vas_cop_type cop,
    972			struct vas_tx_win_attr *attr)
    973{
    974	if (attr->tc_mode != VAS_THRESH_DISABLED)
    975		return false;
    976
    977	if (cop > VAS_COP_TYPE_MAX)
    978		return false;
    979
    980	if (attr->wcreds_max > VAS_TX_WCREDS_MAX)
    981		return false;
    982
    983	if (attr->user_win) {
    984		if (attr->rsvd_txbuf_count)
    985			return false;
    986
    987		if (cop != VAS_COP_TYPE_FTW && cop != VAS_COP_TYPE_GZIP &&
    988			cop != VAS_COP_TYPE_GZIP_HIPRI)
    989			return false;
    990	}
    991
    992	return true;
    993}
    994
    995struct vas_window *vas_tx_win_open(int vasid, enum vas_cop_type cop,
    996			struct vas_tx_win_attr *attr)
    997{
    998	int rc;
    999	struct pnv_vas_window *txwin;
   1000	struct pnv_vas_window *rxwin;
   1001	struct vas_winctx winctx;
   1002	struct vas_instance *vinst;
   1003
   1004	trace_vas_tx_win_open(current, vasid, cop, attr);
   1005
   1006	if (!tx_win_args_valid(cop, attr))
   1007		return ERR_PTR(-EINVAL);
   1008
   1009	/*
   1010	 * If caller did not specify a vasid but specified the PSWID of a
   1011	 * receive window (applicable only to FTW windows), use the vasid
   1012	 * from that receive window.
   1013	 */
   1014	if (vasid == -1 && attr->pswid)
   1015		decode_pswid(attr->pswid, &vasid, NULL);
   1016
   1017	vinst = find_vas_instance(vasid);
   1018	if (!vinst) {
   1019		pr_devel("vasid %d not found!\n", vasid);
   1020		return ERR_PTR(-EINVAL);
   1021	}
   1022
   1023	rxwin = get_vinst_rxwin(vinst, cop, attr->pswid);
   1024	if (IS_ERR(rxwin)) {
   1025		pr_devel("No RxWin for vasid %d, cop %d\n", vasid, cop);
   1026		return (struct vas_window *)rxwin;
   1027	}
   1028
   1029	txwin = vas_window_alloc(vinst);
   1030	if (IS_ERR(txwin)) {
   1031		rc = PTR_ERR(txwin);
   1032		goto put_rxwin;
   1033	}
   1034
   1035	txwin->vas_win.cop = cop;
   1036	txwin->tx_win = 1;
   1037	txwin->rxwin = rxwin;
   1038	txwin->nx_win = txwin->rxwin->nx_win;
   1039	txwin->user_win = attr->user_win;
   1040	txwin->vas_win.wcreds_max = attr->wcreds_max ?: VAS_WCREDS_DEFAULT;
   1041
   1042	init_winctx_for_txwin(txwin, attr, &winctx);
   1043
   1044	init_winctx_regs(txwin, &winctx);
   1045
   1046	/*
   1047	 * If its a kernel send window, map the window address into the
   1048	 * kernel's address space. For user windows, user must issue an
   1049	 * mmap() to map the window into their address space.
   1050	 *
   1051	 * NOTE: If kernel ever resubmits a user CRB after handling a page
   1052	 *	 fault, we will need to map this into kernel as well.
   1053	 */
   1054	if (!txwin->user_win) {
   1055		txwin->paste_kaddr = map_paste_region(txwin);
   1056		if (IS_ERR(txwin->paste_kaddr)) {
   1057			rc = PTR_ERR(txwin->paste_kaddr);
   1058			goto free_window;
   1059		}
   1060	} else {
   1061		/*
   1062		 * Interrupt hanlder or fault window setup failed. Means
   1063		 * NX can not generate fault for page fault. So not
   1064		 * opening for user space tx window.
   1065		 */
   1066		if (!vinst->virq) {
   1067			rc = -ENODEV;
   1068			goto free_window;
   1069		}
   1070		rc = get_vas_user_win_ref(&txwin->vas_win.task_ref);
   1071		if (rc)
   1072			goto free_window;
   1073
   1074		vas_user_win_add_mm_context(&txwin->vas_win.task_ref);
   1075	}
   1076
   1077	set_vinst_win(vinst, txwin);
   1078
   1079	return &txwin->vas_win;
   1080
   1081free_window:
   1082	vas_window_free(txwin);
   1083
   1084put_rxwin:
   1085	put_rx_win(rxwin);
   1086	return ERR_PTR(rc);
   1087
   1088}
   1089EXPORT_SYMBOL_GPL(vas_tx_win_open);
   1090
   1091int vas_copy_crb(void *crb, int offset)
   1092{
   1093	return vas_copy(crb, offset);
   1094}
   1095EXPORT_SYMBOL_GPL(vas_copy_crb);
   1096
   1097#define RMA_LSMP_REPORT_ENABLE PPC_BIT(53)
   1098int vas_paste_crb(struct vas_window *vwin, int offset, bool re)
   1099{
   1100	struct pnv_vas_window *txwin;
   1101	int rc;
   1102	void *addr;
   1103	uint64_t val;
   1104
   1105	txwin = container_of(vwin, struct pnv_vas_window, vas_win);
   1106	trace_vas_paste_crb(current, txwin);
   1107
   1108	/*
   1109	 * Only NX windows are supported for now and hardware assumes
   1110	 * report-enable flag is set for NX windows. Ensure software
   1111	 * complies too.
   1112	 */
   1113	WARN_ON_ONCE(txwin->nx_win && !re);
   1114
   1115	addr = txwin->paste_kaddr;
   1116	if (re) {
   1117		/*
   1118		 * Set the REPORT_ENABLE bit (equivalent to writing
   1119		 * to 1K offset of the paste address)
   1120		 */
   1121		val = SET_FIELD(RMA_LSMP_REPORT_ENABLE, 0ULL, 1);
   1122		addr += val;
   1123	}
   1124
   1125	/*
   1126	 * Map the raw CR value from vas_paste() to an error code (there
   1127	 * is just pass or fail for now though).
   1128	 */
   1129	rc = vas_paste(addr, offset);
   1130	if (rc == 2)
   1131		rc = 0;
   1132	else
   1133		rc = -EINVAL;
   1134
   1135	pr_debug("Txwin #%d: Msg count %llu\n", txwin->vas_win.winid,
   1136			read_hvwc_reg(txwin, VREG(LRFIFO_PUSH)));
   1137
   1138	return rc;
   1139}
   1140EXPORT_SYMBOL_GPL(vas_paste_crb);
   1141
   1142/*
   1143 * If credit checking is enabled for this window, poll for the return
   1144 * of window credits (i.e for NX engines to process any outstanding CRBs).
   1145 * Since NX-842 waits for the CRBs to be processed before closing the
   1146 * window, we should not have to wait for too long.
   1147 *
   1148 * TODO: We retry in 10ms intervals now. We could/should probably peek at
   1149 *	the VAS_LRFIFO_PUSH_OFFSET register to get an estimate of pending
   1150 *	CRBs on the FIFO and compute the delay dynamically on each retry.
   1151 *	But that is not really needed until we support NX-GZIP access from
   1152 *	user space. (NX-842 driver waits for CSB and Fast thread-wakeup
   1153 *	doesn't use credit checking).
   1154 */
   1155static void poll_window_credits(struct pnv_vas_window *window)
   1156{
   1157	u64 val;
   1158	int creds, mode;
   1159	int count = 0;
   1160
   1161	val = read_hvwc_reg(window, VREG(WINCTL));
   1162	if (window->tx_win)
   1163		mode = GET_FIELD(VAS_WINCTL_TX_WCRED_MODE, val);
   1164	else
   1165		mode = GET_FIELD(VAS_WINCTL_RX_WCRED_MODE, val);
   1166
   1167	if (!mode)
   1168		return;
   1169retry:
   1170	if (window->tx_win) {
   1171		val = read_hvwc_reg(window, VREG(TX_WCRED));
   1172		creds = GET_FIELD(VAS_TX_WCRED, val);
   1173	} else {
   1174		val = read_hvwc_reg(window, VREG(LRX_WCRED));
   1175		creds = GET_FIELD(VAS_LRX_WCRED, val);
   1176	}
   1177
   1178	/*
   1179	 * Takes around few milliseconds to complete all pending requests
   1180	 * and return credits.
   1181	 * TODO: Scan fault FIFO and invalidate CRBs points to this window
   1182	 *       and issue CRB Kill to stop all pending requests. Need only
   1183	 *       if there is a bug in NX or fault handling in kernel.
   1184	 */
   1185	if (creds < window->vas_win.wcreds_max) {
   1186		val = 0;
   1187		set_current_state(TASK_UNINTERRUPTIBLE);
   1188		schedule_timeout(msecs_to_jiffies(10));
   1189		count++;
   1190		/*
   1191		 * Process can not close send window until all credits are
   1192		 * returned.
   1193		 */
   1194		if (!(count % 1000))
   1195			pr_warn_ratelimited("VAS: pid %d stuck. Waiting for credits returned for Window(%d). creds %d, Retries %d\n",
   1196				vas_window_pid(&window->vas_win),
   1197				window->vas_win.winid,
   1198				creds, count);
   1199
   1200		goto retry;
   1201	}
   1202}
   1203
   1204/*
   1205 * Wait for the window to go to "not-busy" state. It should only take a
   1206 * short time to queue a CRB, so window should not be busy for too long.
   1207 * Trying 5ms intervals.
   1208 */
   1209static void poll_window_busy_state(struct pnv_vas_window *window)
   1210{
   1211	int busy;
   1212	u64 val;
   1213	int count = 0;
   1214
   1215retry:
   1216	val = read_hvwc_reg(window, VREG(WIN_STATUS));
   1217	busy = GET_FIELD(VAS_WIN_BUSY, val);
   1218	if (busy) {
   1219		val = 0;
   1220		set_current_state(TASK_UNINTERRUPTIBLE);
   1221		schedule_timeout(msecs_to_jiffies(10));
   1222		count++;
   1223		/*
   1224		 * Takes around few milliseconds to process all pending
   1225		 * requests.
   1226		 */
   1227		if (!(count % 1000))
   1228			pr_warn_ratelimited("VAS: pid %d stuck. Window (ID=%d) is in busy state. Retries %d\n",
   1229				vas_window_pid(&window->vas_win),
   1230				window->vas_win.winid, count);
   1231
   1232		goto retry;
   1233	}
   1234}
   1235
   1236/*
   1237 * Have the hardware cast a window out of cache and wait for it to
   1238 * be completed.
   1239 *
   1240 * NOTE: It can take a relatively long time to cast the window context
   1241 *	out of the cache. It is not strictly necessary to cast out if:
   1242 *
   1243 *	- we clear the "Pin Window" bit (so hardware is free to evict)
   1244 *
   1245 *	- we re-initialize the window context when it is reassigned.
   1246 *
   1247 *	We do the former in vas_win_close() and latter in vas_win_open().
   1248 *	So, ignoring the cast-out for now. We can add it as needed. If
   1249 *	casting out becomes necessary we should consider offloading the
   1250 *	job to a worker thread, so the window close can proceed quickly.
   1251 */
   1252static void poll_window_castout(struct pnv_vas_window *window)
   1253{
   1254	/* stub for now */
   1255}
   1256
   1257/*
   1258 * Unpin and close a window so no new requests are accepted and the
   1259 * hardware can evict this window from cache if necessary.
   1260 */
   1261static void unpin_close_window(struct pnv_vas_window *window)
   1262{
   1263	u64 val;
   1264
   1265	val = read_hvwc_reg(window, VREG(WINCTL));
   1266	val = SET_FIELD(VAS_WINCTL_PIN, val, 0);
   1267	val = SET_FIELD(VAS_WINCTL_OPEN, val, 0);
   1268	write_hvwc_reg(window, VREG(WINCTL), val);
   1269}
   1270
   1271/*
   1272 * Close a window.
   1273 *
   1274 * See Section 1.12.1 of VAS workbook v1.05 for details on closing window:
   1275 *	- Disable new paste operations (unmap paste address)
   1276 *	- Poll for the "Window Busy" bit to be cleared
   1277 *	- Clear the Open/Enable bit for the Window.
   1278 *	- Poll for return of window Credits (implies FIFO empty for Rx win?)
   1279 *	- Unpin and cast window context out of cache
   1280 *
   1281 * Besides the hardware, kernel has some bookkeeping of course.
   1282 */
   1283int vas_win_close(struct vas_window *vwin)
   1284{
   1285	struct pnv_vas_window *window;
   1286
   1287	if (!vwin)
   1288		return 0;
   1289
   1290	window = container_of(vwin, struct pnv_vas_window, vas_win);
   1291
   1292	if (!window->tx_win && atomic_read(&window->num_txwins) != 0) {
   1293		pr_devel("Attempting to close an active Rx window!\n");
   1294		WARN_ON_ONCE(1);
   1295		return -EBUSY;
   1296	}
   1297
   1298	unmap_paste_region(window);
   1299
   1300	poll_window_busy_state(window);
   1301
   1302	unpin_close_window(window);
   1303
   1304	poll_window_credits(window);
   1305
   1306	clear_vinst_win(window);
   1307
   1308	poll_window_castout(window);
   1309
   1310	/* if send window, drop reference to matching receive window */
   1311	if (window->tx_win) {
   1312		if (window->user_win) {
   1313			put_vas_user_win_ref(&vwin->task_ref);
   1314			mm_context_remove_vas_window(vwin->task_ref.mm);
   1315		}
   1316		put_rx_win(window->rxwin);
   1317	}
   1318
   1319	vas_window_free(window);
   1320
   1321	return 0;
   1322}
   1323EXPORT_SYMBOL_GPL(vas_win_close);
   1324
   1325/*
   1326 * Return credit for the given window.
   1327 * Send windows and fault window uses credit mechanism as follows:
   1328 *
   1329 * Send windows:
   1330 * - The default number of credits available for each send window is
   1331 *   1024. It means 1024 requests can be issued asynchronously at the
   1332 *   same time. If the credit is not available, that request will be
   1333 *   returned with RMA_Busy.
   1334 * - One credit is taken when NX request is issued.
   1335 * - This credit is returned after NX processed that request.
   1336 * - If NX encounters translation error, kernel will return the
   1337 *   credit on the specific send window after processing the fault CRB.
   1338 *
   1339 * Fault window:
   1340 * - The total number credits available is FIFO_SIZE/CRB_SIZE.
   1341 *   Means 4MB/128 in the current implementation. If credit is not
   1342 *   available, RMA_Reject is returned.
   1343 * - A credit is taken when NX pastes CRB in fault FIFO.
   1344 * - The kernel with return credit on fault window after reading entry
   1345 *   from fault FIFO.
   1346 */
   1347void vas_return_credit(struct pnv_vas_window *window, bool tx)
   1348{
   1349	uint64_t val;
   1350
   1351	val = 0ULL;
   1352	if (tx) { /* send window */
   1353		val = SET_FIELD(VAS_TX_WCRED, val, 1);
   1354		write_hvwc_reg(window, VREG(TX_WCRED_ADDER), val);
   1355	} else {
   1356		val = SET_FIELD(VAS_LRX_WCRED, val, 1);
   1357		write_hvwc_reg(window, VREG(LRX_WCRED_ADDER), val);
   1358	}
   1359}
   1360
   1361struct pnv_vas_window *vas_pswid_to_window(struct vas_instance *vinst,
   1362		uint32_t pswid)
   1363{
   1364	struct pnv_vas_window *window;
   1365	int winid;
   1366
   1367	if (!pswid) {
   1368		pr_devel("%s: called for pswid 0!\n", __func__);
   1369		return ERR_PTR(-ESRCH);
   1370	}
   1371
   1372	decode_pswid(pswid, NULL, &winid);
   1373
   1374	if (winid >= VAS_WINDOWS_PER_CHIP)
   1375		return ERR_PTR(-ESRCH);
   1376
   1377	/*
   1378	 * If application closes the window before the hardware
   1379	 * returns the fault CRB, we should wait in vas_win_close()
   1380	 * for the pending requests. so the window must be active
   1381	 * and the process alive.
   1382	 *
   1383	 * If its a kernel process, we should not get any faults and
   1384	 * should not get here.
   1385	 */
   1386	window = vinst->windows[winid];
   1387
   1388	if (!window) {
   1389		pr_err("PSWID decode: Could not find window for winid %d pswid %d vinst 0x%p\n",
   1390			winid, pswid, vinst);
   1391		return NULL;
   1392	}
   1393
   1394	/*
   1395	 * Do some sanity checks on the decoded window.  Window should be
   1396	 * NX GZIP user send window. FTW windows should not incur faults
   1397	 * since their CRBs are ignored (not queued on FIFO or processed
   1398	 * by NX).
   1399	 */
   1400	if (!window->tx_win || !window->user_win || !window->nx_win ||
   1401			window->vas_win.cop == VAS_COP_TYPE_FAULT ||
   1402			window->vas_win.cop == VAS_COP_TYPE_FTW) {
   1403		pr_err("PSWID decode: id %d, tx %d, user %d, nx %d, cop %d\n",
   1404			winid, window->tx_win, window->user_win,
   1405			window->nx_win, window->vas_win.cop);
   1406		WARN_ON(1);
   1407	}
   1408
   1409	return window;
   1410}
   1411
   1412static struct vas_window *vas_user_win_open(int vas_id, u64 flags,
   1413				enum vas_cop_type cop_type)
   1414{
   1415	struct vas_tx_win_attr txattr = {};
   1416
   1417	vas_init_tx_win_attr(&txattr, cop_type);
   1418
   1419	txattr.lpid = mfspr(SPRN_LPID);
   1420	txattr.pidr = mfspr(SPRN_PID);
   1421	txattr.user_win = true;
   1422	txattr.rsvd_txbuf_count = false;
   1423	txattr.pswid = false;
   1424
   1425	pr_devel("Pid %d: Opening txwin, PIDR %ld\n", txattr.pidr,
   1426				mfspr(SPRN_PID));
   1427
   1428	return vas_tx_win_open(vas_id, cop_type, &txattr);
   1429}
   1430
   1431static u64 vas_user_win_paste_addr(struct vas_window *txwin)
   1432{
   1433	struct pnv_vas_window *win;
   1434	u64 paste_addr;
   1435
   1436	win = container_of(txwin, struct pnv_vas_window, vas_win);
   1437	vas_win_paste_addr(win, &paste_addr, NULL);
   1438
   1439	return paste_addr;
   1440}
   1441
   1442static int vas_user_win_close(struct vas_window *txwin)
   1443{
   1444	vas_win_close(txwin);
   1445
   1446	return 0;
   1447}
   1448
   1449static const struct vas_user_win_ops vops =  {
   1450	.open_win	=	vas_user_win_open,
   1451	.paste_addr	=	vas_user_win_paste_addr,
   1452	.close_win	=	vas_user_win_close,
   1453};
   1454
   1455/*
   1456 * Supporting only nx-gzip coprocessor type now, but this API code
   1457 * extended to other coprocessor types later.
   1458 */
   1459int vas_register_api_powernv(struct module *mod, enum vas_cop_type cop_type,
   1460			     const char *name)
   1461{
   1462
   1463	return vas_register_coproc_api(mod, cop_type, name, &vops);
   1464}
   1465EXPORT_SYMBOL_GPL(vas_register_api_powernv);
   1466
   1467void vas_unregister_api_powernv(void)
   1468{
   1469	vas_unregister_coproc_api();
   1470}
   1471EXPORT_SYMBOL_GPL(vas_unregister_api_powernv);