cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

gpfifogv100.c (7862B)


      1/*
      2 * Copyright 2018 Red Hat Inc.
      3 *
      4 * Permission is hereby granted, free of charge, to any person obtaining a
      5 * copy of this software and associated documentation files (the "Software"),
      6 * to deal in the Software without restriction, including without limitation
      7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
      8 * and/or sell copies of the Software, and to permit persons to whom the
      9 * Software is furnished to do so, subject to the following conditions:
     10 *
     11 * The above copyright notice and this permission notice shall be included in
     12 * all copies or substantial portions of the Software.
     13 *
     14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
     17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
     18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
     19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
     20 * OTHER DEALINGS IN THE SOFTWARE.
     21 */
     22#include "changk104.h"
     23#include "cgrp.h"
     24
     25#include <core/client.h>
     26#include <core/gpuobj.h>
     27
     28#include <nvif/clc36f.h>
     29#include <nvif/unpack.h>
     30
     31static u32
     32gv100_fifo_gpfifo_submit_token(struct nvkm_fifo_chan *chan)
     33{
     34	return chan->chid;
     35}
     36
     37static int
     38gv100_fifo_gpfifo_engine_valid(struct gk104_fifo_chan *chan, bool ce, bool valid)
     39{
     40	struct nvkm_subdev *subdev = &chan->base.fifo->engine.subdev;
     41	struct nvkm_device *device = subdev->device;
     42	const u32 mask = ce ? 0x00020000 : 0x00010000;
     43	const u32 data = valid ? mask : 0x00000000;
     44	int ret;
     45
     46	/* Block runlist to prevent the channel from being rescheduled. */
     47	mutex_lock(&chan->fifo->base.mutex);
     48	nvkm_mask(device, 0x002630, BIT(chan->runl), BIT(chan->runl));
     49
     50	/* Preempt the channel. */
     51	ret = gk104_fifo_gpfifo_kick_locked(chan);
     52	if (ret == 0) {
     53		/* Update engine context validity. */
     54		nvkm_kmap(chan->base.inst);
     55		nvkm_mo32(chan->base.inst, 0x0ac, mask, data);
     56		nvkm_done(chan->base.inst);
     57	}
     58
     59	/* Resume runlist. */
     60	nvkm_mask(device, 0x002630, BIT(chan->runl), 0);
     61	mutex_unlock(&chan->fifo->base.mutex);
     62	return ret;
     63}
     64
     65int
     66gv100_fifo_gpfifo_engine_fini(struct nvkm_fifo_chan *base,
     67			      struct nvkm_engine *engine, bool suspend)
     68{
     69	struct gk104_fifo_chan *chan = gk104_fifo_chan(base);
     70	struct nvkm_gpuobj *inst = chan->base.inst;
     71	int ret;
     72
     73	if (engine->subdev.type == NVKM_ENGINE_CE)
     74		return gk104_fifo_gpfifo_kick(chan);
     75
     76	ret = gv100_fifo_gpfifo_engine_valid(chan, false, false);
     77	if (ret && suspend)
     78		return ret;
     79
     80	nvkm_kmap(inst);
     81	nvkm_wo32(inst, 0x0210, 0x00000000);
     82	nvkm_wo32(inst, 0x0214, 0x00000000);
     83	nvkm_done(inst);
     84	return ret;
     85}
     86
     87int
     88gv100_fifo_gpfifo_engine_init(struct nvkm_fifo_chan *base,
     89			      struct nvkm_engine *engine)
     90{
     91	struct gk104_fifo_chan *chan = gk104_fifo_chan(base);
     92	struct gk104_fifo_engn *engn = gk104_fifo_gpfifo_engine(chan, engine);
     93	struct nvkm_gpuobj *inst = chan->base.inst;
     94
     95	if (engine->subdev.type == NVKM_ENGINE_CE)
     96		return 0;
     97
     98	nvkm_kmap(inst);
     99	nvkm_wo32(inst, 0x210, lower_32_bits(engn->vma->addr) | 0x00000004);
    100	nvkm_wo32(inst, 0x214, upper_32_bits(engn->vma->addr));
    101	nvkm_done(inst);
    102
    103	return gv100_fifo_gpfifo_engine_valid(chan, false, true);
    104}
    105
    106static const struct nvkm_fifo_chan_func
    107gv100_fifo_gpfifo = {
    108	.dtor = gk104_fifo_gpfifo_dtor,
    109	.init = gk104_fifo_gpfifo_init,
    110	.fini = gk104_fifo_gpfifo_fini,
    111	.ntfy = gf100_fifo_chan_ntfy,
    112	.engine_ctor = gk104_fifo_gpfifo_engine_ctor,
    113	.engine_dtor = gk104_fifo_gpfifo_engine_dtor,
    114	.engine_init = gv100_fifo_gpfifo_engine_init,
    115	.engine_fini = gv100_fifo_gpfifo_engine_fini,
    116	.submit_token = gv100_fifo_gpfifo_submit_token,
    117};
    118
    119int
    120gv100_fifo_gpfifo_new_(const struct nvkm_fifo_chan_func *func,
    121		       struct gk104_fifo *fifo, u64 *runlists, u16 *chid,
    122		       u64 vmm, u64 ioffset, u64 ilength, u64 *inst, bool priv,
    123		       u32 *token, const struct nvkm_oclass *oclass,
    124		       struct nvkm_object **pobject)
    125{
    126	struct nvkm_device *device = fifo->base.engine.subdev.device;
    127	struct gk104_fifo_chan *chan;
    128	int runlist = ffs(*runlists) -1, ret, i;
    129	u64 usermem, mthd;
    130	u32 size;
    131
    132	if (!vmm || runlist < 0 || runlist >= fifo->runlist_nr)
    133		return -EINVAL;
    134	*runlists = BIT_ULL(runlist);
    135
    136	/* Allocate the channel. */
    137	if (!(chan = kzalloc(sizeof(*chan), GFP_KERNEL)))
    138		return -ENOMEM;
    139	*pobject = &chan->base.object;
    140	chan->fifo = fifo;
    141	chan->runl = runlist;
    142	INIT_LIST_HEAD(&chan->head);
    143
    144	ret = nvkm_fifo_chan_ctor(func, &fifo->base, 0x1000, 0x1000, true, vmm,
    145				  0, fifo->runlist[runlist].engm, 1, fifo->user.bar->addr, 0x200,
    146				  oclass, &chan->base);
    147	if (ret)
    148		return ret;
    149
    150	*chid = chan->base.chid;
    151	*inst = chan->base.inst->addr;
    152	*token = chan->base.func->submit_token(&chan->base);
    153
    154	/* Hack to support GPUs where even individual channels should be
    155	 * part of a channel group.
    156	 */
    157	if (fifo->func->cgrp_force) {
    158		if (!(chan->cgrp = kmalloc(sizeof(*chan->cgrp), GFP_KERNEL)))
    159			return -ENOMEM;
    160		chan->cgrp->id = chan->base.chid;
    161		INIT_LIST_HEAD(&chan->cgrp->head);
    162		INIT_LIST_HEAD(&chan->cgrp->chan);
    163		chan->cgrp->chan_nr = 0;
    164	}
    165
    166	/* Clear channel control registers. */
    167	usermem = chan->base.chid * 0x200;
    168	ilength = order_base_2(ilength / 8);
    169
    170	nvkm_kmap(fifo->user.mem);
    171	for (i = 0; i < 0x200; i += 4)
    172		nvkm_wo32(fifo->user.mem, usermem + i, 0x00000000);
    173	nvkm_done(fifo->user.mem);
    174	usermem = nvkm_memory_addr(fifo->user.mem) + usermem;
    175
    176	/* Allocate fault method buffer (magics come from nvgpu). */
    177	size = nvkm_rd32(device, 0x104028); /* NV_PCE_PCE_MAP */
    178	size = 27 * 5 * (((9 + 1 + 3) * hweight32(size)) + 2);
    179	size = roundup(size, PAGE_SIZE);
    180
    181	ret = nvkm_memory_new(device, NVKM_MEM_TARGET_INST, size, 0x1000, true,
    182			      &chan->mthd);
    183	if (ret)
    184		return ret;
    185
    186	mthd = nvkm_memory_bar2(chan->mthd);
    187	if (mthd == ~0ULL)
    188		return -EFAULT;
    189
    190	/* RAMFC */
    191	nvkm_kmap(chan->base.inst);
    192	nvkm_wo32(chan->base.inst, 0x008, lower_32_bits(usermem));
    193	nvkm_wo32(chan->base.inst, 0x00c, upper_32_bits(usermem));
    194	nvkm_wo32(chan->base.inst, 0x010, 0x0000face);
    195	nvkm_wo32(chan->base.inst, 0x030, 0x7ffff902);
    196	nvkm_wo32(chan->base.inst, 0x048, lower_32_bits(ioffset));
    197	nvkm_wo32(chan->base.inst, 0x04c, upper_32_bits(ioffset) |
    198					  (ilength << 16));
    199	nvkm_wo32(chan->base.inst, 0x084, 0x20400000);
    200	nvkm_wo32(chan->base.inst, 0x094, 0x30000001);
    201	nvkm_wo32(chan->base.inst, 0x0e4, priv ? 0x00000020 : 0x00000000);
    202	nvkm_wo32(chan->base.inst, 0x0e8, chan->base.chid);
    203	nvkm_wo32(chan->base.inst, 0x0f4, 0x00001000);
    204	nvkm_wo32(chan->base.inst, 0x0f8, 0x10003080);
    205	nvkm_mo32(chan->base.inst, 0x218, 0x00000000, 0x00000000);
    206	nvkm_wo32(chan->base.inst, 0x220, lower_32_bits(mthd));
    207	nvkm_wo32(chan->base.inst, 0x224, upper_32_bits(mthd));
    208	nvkm_done(chan->base.inst);
    209	return gv100_fifo_gpfifo_engine_valid(chan, true, true);
    210}
    211
    212int
    213gv100_fifo_gpfifo_new(struct gk104_fifo *fifo, const struct nvkm_oclass *oclass,
    214		      void *data, u32 size, struct nvkm_object **pobject)
    215{
    216	struct nvkm_object *parent = oclass->parent;
    217	union {
    218		struct volta_channel_gpfifo_a_v0 v0;
    219	} *args = data;
    220	int ret = -ENOSYS;
    221
    222	nvif_ioctl(parent, "create channel gpfifo size %d\n", size);
    223	if (!(ret = nvif_unpack(ret, &data, &size, args->v0, 0, 0, false))) {
    224		nvif_ioctl(parent, "create channel gpfifo vers %d vmm %llx "
    225				   "ioffset %016llx ilength %08x "
    226				   "runlist %016llx priv %d\n",
    227			   args->v0.version, args->v0.vmm, args->v0.ioffset,
    228			   args->v0.ilength, args->v0.runlist, args->v0.priv);
    229		return gv100_fifo_gpfifo_new_(&gv100_fifo_gpfifo, fifo,
    230					      &args->v0.runlist,
    231					      &args->v0.chid,
    232					       args->v0.vmm,
    233					       args->v0.ioffset,
    234					       args->v0.ilength,
    235					      &args->v0.inst,
    236					       args->v0.priv,
    237					      &args->v0.token,
    238					      oclass, pobject);
    239	}
    240
    241	return ret;
    242}