/*
 * Copyright 2021 Red Hat Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
227f4f35eaSBen Skeggs #include "priv.h"
237f4f35eaSBen Skeggs #include "cgrp.h"
247f4f35eaSBen Skeggs #include "chan.h"
257f4f35eaSBen Skeggs #include "chid.h"
267f4f35eaSBen Skeggs #include "runl.h"
277f4f35eaSBen Skeggs #include "runq.h"
287f4f35eaSBen Skeggs 
297f4f35eaSBen Skeggs #include <core/gpuobj.h>
307f4f35eaSBen Skeggs #include <subdev/top.h>
317f4f35eaSBen Skeggs #include <subdev/vfn.h>
327f4f35eaSBen Skeggs 
337f4f35eaSBen Skeggs #include <nvif/class.h>
347f4f35eaSBen Skeggs 
357f4f35eaSBen Skeggs static u32
ga100_chan_doorbell_handle(struct nvkm_chan * chan)367f4f35eaSBen Skeggs ga100_chan_doorbell_handle(struct nvkm_chan *chan)
377f4f35eaSBen Skeggs {
387f4f35eaSBen Skeggs 	return (chan->cgrp->runl->doorbell << 16) | chan->id;
397f4f35eaSBen Skeggs }
407f4f35eaSBen Skeggs 
417f4f35eaSBen Skeggs static void
ga100_chan_stop(struct nvkm_chan * chan)427f4f35eaSBen Skeggs ga100_chan_stop(struct nvkm_chan *chan)
437f4f35eaSBen Skeggs {
447f4f35eaSBen Skeggs 	struct nvkm_runl *runl = chan->cgrp->runl;
457f4f35eaSBen Skeggs 
467f4f35eaSBen Skeggs 	nvkm_wr32(runl->fifo->engine.subdev.device, runl->chan + (chan->id * 4), 0x00000003);
477f4f35eaSBen Skeggs }
487f4f35eaSBen Skeggs 
497f4f35eaSBen Skeggs static void
ga100_chan_start(struct nvkm_chan * chan)507f4f35eaSBen Skeggs ga100_chan_start(struct nvkm_chan *chan)
517f4f35eaSBen Skeggs {
527f4f35eaSBen Skeggs 	struct nvkm_runl *runl = chan->cgrp->runl;
537f4f35eaSBen Skeggs 	struct nvkm_device *device = runl->fifo->engine.subdev.device;
547f4f35eaSBen Skeggs 	const int gfid = 0;
557f4f35eaSBen Skeggs 
567f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->chan + (chan->id * 4), 0x00000002);
577f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x0090, (gfid << 16) | chan->id); /* INTERNAL_DOORBELL. */
587f4f35eaSBen Skeggs }
597f4f35eaSBen Skeggs 
607f4f35eaSBen Skeggs static void
ga100_chan_unbind(struct nvkm_chan * chan)617f4f35eaSBen Skeggs ga100_chan_unbind(struct nvkm_chan *chan)
627f4f35eaSBen Skeggs {
637f4f35eaSBen Skeggs 	struct nvkm_runl *runl = chan->cgrp->runl;
647f4f35eaSBen Skeggs 
657f4f35eaSBen Skeggs 	nvkm_wr32(runl->fifo->engine.subdev.device, runl->chan + (chan->id * 4), 0xffffffff);
667f4f35eaSBen Skeggs }
677f4f35eaSBen Skeggs 
687f4f35eaSBen Skeggs static int
ga100_chan_ramfc_write(struct nvkm_chan * chan,u64 offset,u64 length,u32 devm,bool priv)697f4f35eaSBen Skeggs ga100_chan_ramfc_write(struct nvkm_chan *chan, u64 offset, u64 length, u32 devm, bool priv)
707f4f35eaSBen Skeggs {
717f4f35eaSBen Skeggs 	const u32 limit2 = ilog2(length / 8);
727f4f35eaSBen Skeggs 
737f4f35eaSBen Skeggs 	nvkm_kmap(chan->inst);
747f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x010, 0x0000face);
757f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x030, 0x7ffff902);
767f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x048, lower_32_bits(offset));
777f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x04c, upper_32_bits(offset) | (limit2 << 16));
787f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x084, 0x20400000);
797f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x094, 0x30000000 | devm);
807f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x0e4, priv ? 0x00000020 : 0x00000000);
817f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x0e8, chan->id);
827f4f35eaSBen Skeggs 	nvkm_wo32(chan->inst, 0x0f4, 0x00001000 | (priv ? 0x00000100 : 0x00000000));
83*55e1a599SBen Skeggs 	nvkm_wo32(chan->inst, 0x0f8, 0x80000000 | chan->cgrp->runl->nonstall.vector);
847f4f35eaSBen Skeggs 	nvkm_mo32(chan->inst, 0x218, 0x00000000, 0x00000000);
857f4f35eaSBen Skeggs 	nvkm_done(chan->inst);
867f4f35eaSBen Skeggs 	return 0;
877f4f35eaSBen Skeggs }
887f4f35eaSBen Skeggs 
897f4f35eaSBen Skeggs static const struct nvkm_chan_func_ramfc
907f4f35eaSBen Skeggs ga100_chan_ramfc = {
917f4f35eaSBen Skeggs 	.write = ga100_chan_ramfc_write,
927f4f35eaSBen Skeggs 	.devm = 0xfff,
937f4f35eaSBen Skeggs 	.priv = true,
947f4f35eaSBen Skeggs };
957f4f35eaSBen Skeggs 
967f4f35eaSBen Skeggs const struct nvkm_chan_func
977f4f35eaSBen Skeggs ga100_chan = {
987f4f35eaSBen Skeggs 	.inst = &gf100_chan_inst,
997f4f35eaSBen Skeggs 	.userd = &gv100_chan_userd,
1007f4f35eaSBen Skeggs 	.ramfc = &ga100_chan_ramfc,
1017f4f35eaSBen Skeggs 	.unbind = ga100_chan_unbind,
1027f4f35eaSBen Skeggs 	.start = ga100_chan_start,
1037f4f35eaSBen Skeggs 	.stop = ga100_chan_stop,
1047f4f35eaSBen Skeggs 	.preempt = gk110_chan_preempt,
1057f4f35eaSBen Skeggs 	.doorbell_handle = ga100_chan_doorbell_handle,
1067f4f35eaSBen Skeggs };
1077f4f35eaSBen Skeggs 
1087f4f35eaSBen Skeggs static void
ga100_cgrp_preempt(struct nvkm_cgrp * cgrp)1097f4f35eaSBen Skeggs ga100_cgrp_preempt(struct nvkm_cgrp *cgrp)
1107f4f35eaSBen Skeggs {
1117f4f35eaSBen Skeggs 	struct nvkm_runl *runl = cgrp->runl;
1127f4f35eaSBen Skeggs 
1137f4f35eaSBen Skeggs 	nvkm_wr32(runl->fifo->engine.subdev.device, runl->addr + 0x098, 0x01000000 | cgrp->id);
1147f4f35eaSBen Skeggs }
1157f4f35eaSBen Skeggs 
1167f4f35eaSBen Skeggs const struct nvkm_cgrp_func
1177f4f35eaSBen Skeggs ga100_cgrp = {
1187f4f35eaSBen Skeggs 	.preempt = ga100_cgrp_preempt,
1197f4f35eaSBen Skeggs };
1207f4f35eaSBen Skeggs 
1217f4f35eaSBen Skeggs static int
ga100_engn_cxid(struct nvkm_engn * engn,bool * cgid)1227f4f35eaSBen Skeggs ga100_engn_cxid(struct nvkm_engn *engn, bool *cgid)
1237f4f35eaSBen Skeggs {
1247f4f35eaSBen Skeggs 	struct nvkm_runl *runl = engn->runl;
1257f4f35eaSBen Skeggs 	struct nvkm_device *device = runl->fifo->engine.subdev.device;
1267f4f35eaSBen Skeggs 	u32 stat = nvkm_rd32(device, runl->addr + 0x200 + engn->id * 0x40);
1277f4f35eaSBen Skeggs 
1287f4f35eaSBen Skeggs 	ENGN_DEBUG(engn, "status %08x", stat);
1297f4f35eaSBen Skeggs 	*cgid = true;
1307f4f35eaSBen Skeggs 
1317f4f35eaSBen Skeggs 	switch ((stat & 0x0000e000) >> 13) {
1327f4f35eaSBen Skeggs 	case 0 /* INVALID */: return -ENODEV;
1337f4f35eaSBen Skeggs 	case 1 /*   VALID */:
1347f4f35eaSBen Skeggs 	case 5 /*    SAVE */: return (stat & 0x00000fff);
1357f4f35eaSBen Skeggs 	case 6 /*    LOAD */: return (stat & 0x0fff0000) >> 16;
1367f4f35eaSBen Skeggs 	case 7 /*  SWITCH */:
1377f4f35eaSBen Skeggs 		if (nvkm_engine_chsw_load(engn->engine))
1387f4f35eaSBen Skeggs 			return (stat & 0x0fff0000) >> 16;
1397f4f35eaSBen Skeggs 		return (stat & 0x00000fff);
1407f4f35eaSBen Skeggs 	default:
1417f4f35eaSBen Skeggs 		WARN_ON(1);
1427f4f35eaSBen Skeggs 		break;
1437f4f35eaSBen Skeggs 	}
1447f4f35eaSBen Skeggs 
1457f4f35eaSBen Skeggs 	return -ENODEV;
1467f4f35eaSBen Skeggs }
1477f4f35eaSBen Skeggs 
148*55e1a599SBen Skeggs static int
ga100_engn_nonstall(struct nvkm_engn * engn)149*55e1a599SBen Skeggs ga100_engn_nonstall(struct nvkm_engn *engn)
150*55e1a599SBen Skeggs {
151*55e1a599SBen Skeggs 	struct nvkm_engine *engine = engn->engine;
152*55e1a599SBen Skeggs 
153*55e1a599SBen Skeggs 	if (WARN_ON(!engine->func->nonstall))
154*55e1a599SBen Skeggs 		return -EINVAL;
155*55e1a599SBen Skeggs 
156*55e1a599SBen Skeggs 	return engine->func->nonstall(engine);
157*55e1a599SBen Skeggs }
158*55e1a599SBen Skeggs 
1597f4f35eaSBen Skeggs const struct nvkm_engn_func
1607f4f35eaSBen Skeggs ga100_engn = {
161*55e1a599SBen Skeggs 	.nonstall = ga100_engn_nonstall,
1627f4f35eaSBen Skeggs 	.cxid = ga100_engn_cxid,
1637f4f35eaSBen Skeggs 	.ctor = gk104_ectx_ctor,
1647f4f35eaSBen Skeggs 	.bind = gv100_ectx_bind,
1657f4f35eaSBen Skeggs };
1667f4f35eaSBen Skeggs 
1677f4f35eaSBen Skeggs const struct nvkm_engn_func
1687f4f35eaSBen Skeggs ga100_engn_ce = {
169*55e1a599SBen Skeggs 	.nonstall = ga100_engn_nonstall,
1707f4f35eaSBen Skeggs 	.cxid = ga100_engn_cxid,
1717f4f35eaSBen Skeggs 	.ctor = gv100_ectx_ce_ctor,
1727f4f35eaSBen Skeggs 	.bind = gv100_ectx_ce_bind,
1737f4f35eaSBen Skeggs };
1747f4f35eaSBen Skeggs 
1757f4f35eaSBen Skeggs static bool
ga100_runq_idle(struct nvkm_runq * runq)1767f4f35eaSBen Skeggs ga100_runq_idle(struct nvkm_runq *runq)
1777f4f35eaSBen Skeggs {
1787f4f35eaSBen Skeggs 	struct nvkm_device *device = runq->fifo->engine.subdev.device;
1797f4f35eaSBen Skeggs 
1807f4f35eaSBen Skeggs 	return !(nvkm_rd32(device, 0x04015c + (runq->id * 0x800)) & 0x0000e000);
1817f4f35eaSBen Skeggs }
1827f4f35eaSBen Skeggs 
1837f4f35eaSBen Skeggs static bool
ga100_runq_intr_1(struct nvkm_runq * runq,struct nvkm_runl * runl)1847f4f35eaSBen Skeggs ga100_runq_intr_1(struct nvkm_runq *runq, struct nvkm_runl *runl)
1857f4f35eaSBen Skeggs {
1867f4f35eaSBen Skeggs 	struct nvkm_device *device = runq->fifo->engine.subdev.device;
1877f4f35eaSBen Skeggs 	u32 inte = nvkm_rd32(device, 0x040180 + (runq->id * 0x800));
1887f4f35eaSBen Skeggs 	u32 intr = nvkm_rd32(device, 0x040148 + (runq->id * 0x800));
1897f4f35eaSBen Skeggs 	u32 stat = intr & inte;
1907f4f35eaSBen Skeggs 
1917f4f35eaSBen Skeggs 	if (!stat) {
1927f4f35eaSBen Skeggs 		RUNQ_DEBUG(runq, "inte1 %08x %08x", intr, inte);
1937f4f35eaSBen Skeggs 		return false;
1947f4f35eaSBen Skeggs 	}
1957f4f35eaSBen Skeggs 
1967f4f35eaSBen Skeggs 	if (stat & 0x80000000) {
1977f4f35eaSBen Skeggs 		u32 chid = nvkm_rd32(device, 0x040120 + (runq->id * 0x0800)) & runl->chid->mask;
1987f4f35eaSBen Skeggs 		struct nvkm_chan *chan;
1997f4f35eaSBen Skeggs 		unsigned long flags;
2007f4f35eaSBen Skeggs 
2017f4f35eaSBen Skeggs 		RUNQ_ERROR(runq, "CTXNOTVALID chid:%d", chid);
2027f4f35eaSBen Skeggs 		chan = nvkm_runl_chan_get_chid(runl, chid, &flags);
2037f4f35eaSBen Skeggs 		if (chan) {
2047f4f35eaSBen Skeggs 			nvkm_chan_error(chan, true);
2057f4f35eaSBen Skeggs 			nvkm_chan_put(&chan, flags);
2067f4f35eaSBen Skeggs 		}
2077f4f35eaSBen Skeggs 
2087f4f35eaSBen Skeggs 		nvkm_mask(device, 0x0400ac + (runq->id * 0x800), 0x00030000, 0x00030000);
2097f4f35eaSBen Skeggs 		stat &= ~0x80000000;
2107f4f35eaSBen Skeggs 	}
2117f4f35eaSBen Skeggs 
2127f4f35eaSBen Skeggs 	if (stat) {
2137f4f35eaSBen Skeggs 		RUNQ_ERROR(runq, "intr1 %08x", stat);
2147f4f35eaSBen Skeggs 		nvkm_wr32(device, 0x0401a0 + (runq->id * 0x800), stat);
2157f4f35eaSBen Skeggs 	}
2167f4f35eaSBen Skeggs 
2177f4f35eaSBen Skeggs 	nvkm_wr32(device, 0x040148 + (runq->id * 0x800), intr);
2187f4f35eaSBen Skeggs 	return true;
2197f4f35eaSBen Skeggs }
2207f4f35eaSBen Skeggs 
2217f4f35eaSBen Skeggs static bool
ga100_runq_intr_0(struct nvkm_runq * runq,struct nvkm_runl * runl)2227f4f35eaSBen Skeggs ga100_runq_intr_0(struct nvkm_runq *runq, struct nvkm_runl *runl)
2237f4f35eaSBen Skeggs {
2247f4f35eaSBen Skeggs 	struct nvkm_device *device = runq->fifo->engine.subdev.device;
2257f4f35eaSBen Skeggs 	u32 inte = nvkm_rd32(device, 0x040170 + (runq->id * 0x800));
2267f4f35eaSBen Skeggs 	u32 intr = nvkm_rd32(device, 0x040108 + (runq->id * 0x800));
2277f4f35eaSBen Skeggs 	u32 stat = intr & inte;
2287f4f35eaSBen Skeggs 
2297f4f35eaSBen Skeggs 	if (!stat) {
2307f4f35eaSBen Skeggs 		RUNQ_DEBUG(runq, "inte0 %08x %08x", intr, inte);
2317f4f35eaSBen Skeggs 		return false;
2327f4f35eaSBen Skeggs 	}
2337f4f35eaSBen Skeggs 
2347f4f35eaSBen Skeggs 	/*TODO: expand on this when fixing up gf100's version. */
2357f4f35eaSBen Skeggs 	if (stat & 0xc6afe000) {
2367f4f35eaSBen Skeggs 		u32 chid = nvkm_rd32(device, 0x040120 + (runq->id * 0x0800)) & runl->chid->mask;
2377f4f35eaSBen Skeggs 		struct nvkm_chan *chan;
2387f4f35eaSBen Skeggs 		unsigned long flags;
2397f4f35eaSBen Skeggs 
2407f4f35eaSBen Skeggs 		RUNQ_ERROR(runq, "intr0 %08x", stat);
2417f4f35eaSBen Skeggs 		chan = nvkm_runl_chan_get_chid(runl, chid, &flags);
2427f4f35eaSBen Skeggs 		if (chan) {
2437f4f35eaSBen Skeggs 			nvkm_chan_error(chan, true);
2447f4f35eaSBen Skeggs 			nvkm_chan_put(&chan, flags);
2457f4f35eaSBen Skeggs 		}
2467f4f35eaSBen Skeggs 
2477f4f35eaSBen Skeggs 		stat &= ~0xc6afe000;
2487f4f35eaSBen Skeggs 	}
2497f4f35eaSBen Skeggs 
2507f4f35eaSBen Skeggs 	if (stat) {
2517f4f35eaSBen Skeggs 		RUNQ_ERROR(runq, "intr0 %08x", stat);
2527f4f35eaSBen Skeggs 		nvkm_wr32(device, 0x040190 + (runq->id * 0x800), stat);
2537f4f35eaSBen Skeggs 	}
2547f4f35eaSBen Skeggs 
2557f4f35eaSBen Skeggs 	nvkm_wr32(device, 0x040108 + (runq->id * 0x800), intr);
2567f4f35eaSBen Skeggs 	return true;
2577f4f35eaSBen Skeggs }
2587f4f35eaSBen Skeggs 
2597f4f35eaSBen Skeggs static bool
ga100_runq_intr(struct nvkm_runq * runq,struct nvkm_runl * runl)2607f4f35eaSBen Skeggs ga100_runq_intr(struct nvkm_runq *runq, struct nvkm_runl *runl)
2617f4f35eaSBen Skeggs {
2627f4f35eaSBen Skeggs 	bool intr0 = ga100_runq_intr_0(runq, runl);
2637f4f35eaSBen Skeggs 	bool intr1 = ga100_runq_intr_1(runq, runl);
2647f4f35eaSBen Skeggs 
2657f4f35eaSBen Skeggs 	return intr0 || intr1;
2667f4f35eaSBen Skeggs }
2677f4f35eaSBen Skeggs 
2687f4f35eaSBen Skeggs static void
ga100_runq_init(struct nvkm_runq * runq)2697f4f35eaSBen Skeggs ga100_runq_init(struct nvkm_runq *runq)
2707f4f35eaSBen Skeggs {
2717f4f35eaSBen Skeggs 	struct nvkm_device *device = runq->fifo->engine.subdev.device;
2727f4f35eaSBen Skeggs 
2737f4f35eaSBen Skeggs 	nvkm_wr32(device, 0x040108 + (runq->id * 0x800), 0xffffffff); /* INTR_0 */
2747f4f35eaSBen Skeggs 	nvkm_wr32(device, 0x040148 + (runq->id * 0x800), 0xffffffff); /* INTR_1 */
2757f4f35eaSBen Skeggs 	nvkm_wr32(device, 0x040170 + (runq->id * 0x800), 0xffffffff); /* INTR_0_EN_SET_TREE */
2767f4f35eaSBen Skeggs 	nvkm_wr32(device, 0x040180 + (runq->id * 0x800), 0xffffffff); /* INTR_1_EN_SET_TREE */
2777f4f35eaSBen Skeggs }
2787f4f35eaSBen Skeggs 
2797f4f35eaSBen Skeggs const struct nvkm_runq_func
2807f4f35eaSBen Skeggs ga100_runq = {
2817f4f35eaSBen Skeggs 	.init = ga100_runq_init,
2827f4f35eaSBen Skeggs 	.intr = ga100_runq_intr,
2837f4f35eaSBen Skeggs 	.idle = ga100_runq_idle,
2847f4f35eaSBen Skeggs };
2857f4f35eaSBen Skeggs 
2867f4f35eaSBen Skeggs static bool
ga100_runl_preempt_pending(struct nvkm_runl * runl)2877f4f35eaSBen Skeggs ga100_runl_preempt_pending(struct nvkm_runl *runl)
2887f4f35eaSBen Skeggs {
2897f4f35eaSBen Skeggs 	return nvkm_rd32(runl->fifo->engine.subdev.device, runl->addr + 0x098) & 0x00100000;
2907f4f35eaSBen Skeggs }
2917f4f35eaSBen Skeggs 
2927f4f35eaSBen Skeggs static void
ga100_runl_preempt(struct nvkm_runl * runl)2937f4f35eaSBen Skeggs ga100_runl_preempt(struct nvkm_runl *runl)
2947f4f35eaSBen Skeggs {
2957f4f35eaSBen Skeggs 	nvkm_wr32(runl->fifo->engine.subdev.device, runl->addr + 0x098, 0x00000000);
2967f4f35eaSBen Skeggs }
2977f4f35eaSBen Skeggs 
2987f4f35eaSBen Skeggs static void
ga100_runl_allow(struct nvkm_runl * runl,u32 engm)2997f4f35eaSBen Skeggs ga100_runl_allow(struct nvkm_runl *runl, u32 engm)
3007f4f35eaSBen Skeggs {
3017f4f35eaSBen Skeggs 	nvkm_mask(runl->fifo->engine.subdev.device, runl->addr + 0x094, 0x00000001, 0x00000000);
3027f4f35eaSBen Skeggs }
3037f4f35eaSBen Skeggs 
3047f4f35eaSBen Skeggs static void
ga100_runl_block(struct nvkm_runl * runl,u32 engm)3057f4f35eaSBen Skeggs ga100_runl_block(struct nvkm_runl *runl, u32 engm)
3067f4f35eaSBen Skeggs {
3077f4f35eaSBen Skeggs 	nvkm_mask(runl->fifo->engine.subdev.device, runl->addr + 0x094, 0x00000001, 0x00000001);
3087f4f35eaSBen Skeggs }
3097f4f35eaSBen Skeggs 
3107f4f35eaSBen Skeggs static bool
ga100_runl_pending(struct nvkm_runl * runl)3117f4f35eaSBen Skeggs ga100_runl_pending(struct nvkm_runl *runl)
3127f4f35eaSBen Skeggs {
3137f4f35eaSBen Skeggs 	struct nvkm_device *device = runl->fifo->engine.subdev.device;
3147f4f35eaSBen Skeggs 
3157f4f35eaSBen Skeggs 	return nvkm_rd32(device, runl->addr + 0x08c) & 0x00008000;
3167f4f35eaSBen Skeggs }
3177f4f35eaSBen Skeggs 
3187f4f35eaSBen Skeggs static void
ga100_runl_commit(struct nvkm_runl * runl,struct nvkm_memory * memory,u32 start,int count)3197f4f35eaSBen Skeggs ga100_runl_commit(struct nvkm_runl *runl, struct nvkm_memory *memory, u32 start, int count)
3207f4f35eaSBen Skeggs {
3217f4f35eaSBen Skeggs 	struct nvkm_device *device = runl->fifo->engine.subdev.device;
3227f4f35eaSBen Skeggs 	u64 addr = nvkm_memory_addr(memory) + start;
3237f4f35eaSBen Skeggs 
3247f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x080, lower_32_bits(addr));
3257f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x084, upper_32_bits(addr));
3267f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x088, count);
3277f4f35eaSBen Skeggs }
3287f4f35eaSBen Skeggs 
3297f4f35eaSBen Skeggs static irqreturn_t
ga100_runl_intr(struct nvkm_inth * inth)3307f4f35eaSBen Skeggs ga100_runl_intr(struct nvkm_inth *inth)
3317f4f35eaSBen Skeggs {
3327f4f35eaSBen Skeggs 	struct nvkm_runl *runl = container_of(inth, typeof(*runl), inth);
3337f4f35eaSBen Skeggs 	struct nvkm_engn *engn;
3347f4f35eaSBen Skeggs 	struct nvkm_device *device = runl->fifo->engine.subdev.device;
3357f4f35eaSBen Skeggs 	u32 inte = nvkm_rd32(device, runl->addr + 0x120);
3367f4f35eaSBen Skeggs 	u32 intr = nvkm_rd32(device, runl->addr + 0x100);
3377f4f35eaSBen Skeggs 	u32 stat = intr & inte;
3387f4f35eaSBen Skeggs 	u32 info;
3397f4f35eaSBen Skeggs 
3407f4f35eaSBen Skeggs 	if (!stat) {
3417f4f35eaSBen Skeggs 		RUNL_DEBUG(runl, "inte %08x %08x", intr, inte);
3427f4f35eaSBen Skeggs 		return IRQ_NONE;
3437f4f35eaSBen Skeggs 	}
3447f4f35eaSBen Skeggs 
3457f4f35eaSBen Skeggs 	if (stat & 0x00000007) {
3467f4f35eaSBen Skeggs 		nvkm_runl_foreach_engn_cond(engn, runl, stat & BIT(engn->id)) {
3477f4f35eaSBen Skeggs 			info = nvkm_rd32(device, runl->addr + 0x224 + (engn->id * 0x40));
3487f4f35eaSBen Skeggs 
3497f4f35eaSBen Skeggs 			tu102_fifo_intr_ctxsw_timeout_info(engn, info);
3507f4f35eaSBen Skeggs 
3517f4f35eaSBen Skeggs 			nvkm_wr32(device, runl->addr + 0x100, BIT(engn->id));
3527f4f35eaSBen Skeggs 			stat &= ~BIT(engn->id);
3537f4f35eaSBen Skeggs 		}
3547f4f35eaSBen Skeggs 	}
3557f4f35eaSBen Skeggs 
3567f4f35eaSBen Skeggs 	if (stat & 0x00000300) {
3577f4f35eaSBen Skeggs 		nvkm_wr32(device, runl->addr + 0x100, stat & 0x00000300);
3587f4f35eaSBen Skeggs 		stat &= ~0x00000300;
3597f4f35eaSBen Skeggs 	}
3607f4f35eaSBen Skeggs 
3617f4f35eaSBen Skeggs 	if (stat & 0x00010000) {
3627f4f35eaSBen Skeggs 		if (runl->runq[0]) {
3637f4f35eaSBen Skeggs 			if (runl->runq[0]->func->intr(runl->runq[0], runl))
3647f4f35eaSBen Skeggs 				stat &= ~0x00010000;
3657f4f35eaSBen Skeggs 		}
3667f4f35eaSBen Skeggs 	}
3677f4f35eaSBen Skeggs 
3687f4f35eaSBen Skeggs 	if (stat & 0x00020000) {
3697f4f35eaSBen Skeggs 		if (runl->runq[1]) {
3707f4f35eaSBen Skeggs 			if (runl->runq[1]->func->intr(runl->runq[1], runl))
3717f4f35eaSBen Skeggs 				stat &= ~0x00020000;
3727f4f35eaSBen Skeggs 		}
3737f4f35eaSBen Skeggs 	}
3747f4f35eaSBen Skeggs 
3757f4f35eaSBen Skeggs 	if (stat) {
3767f4f35eaSBen Skeggs 		RUNL_ERROR(runl, "intr %08x", stat);
3777f4f35eaSBen Skeggs 		nvkm_wr32(device, runl->addr + 0x140, stat);
3787f4f35eaSBen Skeggs 	}
3797f4f35eaSBen Skeggs 
3807f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x180, 0x00000001);
3817f4f35eaSBen Skeggs 	return IRQ_HANDLED;
3827f4f35eaSBen Skeggs }
3837f4f35eaSBen Skeggs 
3847f4f35eaSBen Skeggs static void
ga100_runl_fini(struct nvkm_runl * runl)3857f4f35eaSBen Skeggs ga100_runl_fini(struct nvkm_runl *runl)
3867f4f35eaSBen Skeggs {
3877f4f35eaSBen Skeggs 	nvkm_mask(runl->fifo->engine.subdev.device, runl->addr + 0x300, 0x80000000, 0x00000000);
3887f4f35eaSBen Skeggs 	nvkm_inth_block(&runl->inth);
3897f4f35eaSBen Skeggs }
3907f4f35eaSBen Skeggs 
3917f4f35eaSBen Skeggs static void
ga100_runl_init(struct nvkm_runl * runl)3927f4f35eaSBen Skeggs ga100_runl_init(struct nvkm_runl *runl)
3937f4f35eaSBen Skeggs {
3947f4f35eaSBen Skeggs 	struct nvkm_fifo *fifo = runl->fifo;
3957f4f35eaSBen Skeggs 	struct nvkm_runq *runq;
3967f4f35eaSBen Skeggs 	struct nvkm_device *device = fifo->engine.subdev.device;
3977f4f35eaSBen Skeggs 	int i;
3987f4f35eaSBen Skeggs 
3997f4f35eaSBen Skeggs 	/* Submit NULL runlist and preempt. */
4007f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x088, 0x00000000);
4017f4f35eaSBen Skeggs 	runl->func->preempt(runl);
4027f4f35eaSBen Skeggs 
4037f4f35eaSBen Skeggs 	/* Enable doorbell. */
4047f4f35eaSBen Skeggs 	nvkm_mask(device, runl->addr + 0x300, 0x80000000, 0x80000000);
4057f4f35eaSBen Skeggs 
4067f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x100, 0xffffffff); /* INTR_0 */
4077f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x140, 0xffffffff); /* INTR_0_EN_CLEAR_TREE(0) */
4087f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x120, 0x000f1307); /* INTR_0_EN_SET_TREE(0) */
4097f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x148, 0xffffffff); /* INTR_0_EN_CLEAR_TREE(1) */
4107f4f35eaSBen Skeggs 	nvkm_wr32(device, runl->addr + 0x128, 0x00000000); /* INTR_0_EN_SET_TREE(1) */
4117f4f35eaSBen Skeggs 
4127f4f35eaSBen Skeggs 	/* Init PBDMA(s). */
4137f4f35eaSBen Skeggs 	for (i = 0; i < runl->runq_nr; i++) {
4147f4f35eaSBen Skeggs 		runq = runl->runq[i];
4157f4f35eaSBen Skeggs 		runq->func->init(runq);
4167f4f35eaSBen Skeggs 	}
4177f4f35eaSBen Skeggs 
4187f4f35eaSBen Skeggs 	nvkm_inth_allow(&runl->inth);
4197f4f35eaSBen Skeggs }
4207f4f35eaSBen Skeggs 
4217f4f35eaSBen Skeggs const struct nvkm_runl_func
4227f4f35eaSBen Skeggs ga100_runl = {
4237f4f35eaSBen Skeggs 	.init = ga100_runl_init,
4247f4f35eaSBen Skeggs 	.fini = ga100_runl_fini,
4257f4f35eaSBen Skeggs 	.size = 16,
4267f4f35eaSBen Skeggs 	.update = nv50_runl_update,
4277f4f35eaSBen Skeggs 	.insert_cgrp = gv100_runl_insert_cgrp,
4287f4f35eaSBen Skeggs 	.insert_chan = gv100_runl_insert_chan,
4297f4f35eaSBen Skeggs 	.commit = ga100_runl_commit,
4307f4f35eaSBen Skeggs 	.wait = nv50_runl_wait,
4317f4f35eaSBen Skeggs 	.pending = ga100_runl_pending,
4327f4f35eaSBen Skeggs 	.block = ga100_runl_block,
4337f4f35eaSBen Skeggs 	.allow = ga100_runl_allow,
4347f4f35eaSBen Skeggs 	.preempt = ga100_runl_preempt,
4357f4f35eaSBen Skeggs 	.preempt_pending = ga100_runl_preempt_pending,
4367f4f35eaSBen Skeggs };
4377f4f35eaSBen Skeggs 
4387f4f35eaSBen Skeggs static int
ga100_runl_new(struct nvkm_fifo * fifo,int id,u32 addr,struct nvkm_runl ** prunl)4397f4f35eaSBen Skeggs ga100_runl_new(struct nvkm_fifo *fifo, int id, u32 addr, struct nvkm_runl **prunl)
4407f4f35eaSBen Skeggs {
4417f4f35eaSBen Skeggs 	struct nvkm_device *device = fifo->engine.subdev.device;
44284ab065eSBen Skeggs 	struct nvkm_top_device *tdev;
4437f4f35eaSBen Skeggs 	struct nvkm_runl *runl;
44484ab065eSBen Skeggs 	struct nvkm_engn *engn;
4457f4f35eaSBen Skeggs 	u32 chcfg  = nvkm_rd32(device, addr + 0x004);
4467f4f35eaSBen Skeggs 	u32 chnum  = 1 << (chcfg & 0x0000000f);
4477f4f35eaSBen Skeggs 	u32 chaddr = (chcfg & 0xfffffff0);
4487f4f35eaSBen Skeggs 	u32 dbcfg  = nvkm_rd32(device, addr + 0x008);
4497f4f35eaSBen Skeggs 	u32 vector = nvkm_rd32(device, addr + 0x160);
4507f4f35eaSBen Skeggs 	int i, ret;
4517f4f35eaSBen Skeggs 
45284ab065eSBen Skeggs 	runl = nvkm_runl_new(fifo, id, addr, chnum);
4537f4f35eaSBen Skeggs 	if (IS_ERR(runl))
4547f4f35eaSBen Skeggs 		return PTR_ERR(runl);
4557f4f35eaSBen Skeggs 
45684ab065eSBen Skeggs 	*prunl = runl;
45784ab065eSBen Skeggs 
4587f4f35eaSBen Skeggs 	for (i = 0; i < 2; i++) {
4597f4f35eaSBen Skeggs 		u32 pbcfg = nvkm_rd32(device, addr + 0x010 + (i * 0x04));
4607f4f35eaSBen Skeggs 		if (pbcfg & 0x80000000) {
4617f4f35eaSBen Skeggs 			runl->runq[runl->runq_nr] =
4627f4f35eaSBen Skeggs 				nvkm_runq_new(fifo, ((pbcfg & 0x03fffc00) - 0x040000) / 0x800);
46384ab065eSBen Skeggs 			if (!runl->runq[runl->runq_nr]) {
46484ab065eSBen Skeggs 				RUNL_ERROR(runl, "runq %d", runl->runq_nr);
4657f4f35eaSBen Skeggs 				return -ENOMEM;
46684ab065eSBen Skeggs 			}
4677f4f35eaSBen Skeggs 
4687f4f35eaSBen Skeggs 			runl->runq_nr++;
4697f4f35eaSBen Skeggs 		}
4707f4f35eaSBen Skeggs 	}
4717f4f35eaSBen Skeggs 
47284ab065eSBen Skeggs 	nvkm_list_foreach(tdev, &device->top->device, head, tdev->runlist == runl->addr) {
47384ab065eSBen Skeggs 		if (tdev->engine < 0) {
47484ab065eSBen Skeggs 			RUNL_DEBUG(runl, "engn !top");
47584ab065eSBen Skeggs 			return -EINVAL;
47684ab065eSBen Skeggs 		}
47784ab065eSBen Skeggs 
47884ab065eSBen Skeggs 		engn = nvkm_runl_add(runl, tdev->engine, (tdev->type == NVKM_ENGINE_CE) ?
47984ab065eSBen Skeggs 				     fifo->func->engn_ce : fifo->func->engn,
48084ab065eSBen Skeggs 				     tdev->type, tdev->inst);
48184ab065eSBen Skeggs 		if (!engn)
48284ab065eSBen Skeggs 			return -EINVAL;
483*55e1a599SBen Skeggs 
484*55e1a599SBen Skeggs 		if (!engn->engine->func->nonstall) {
485*55e1a599SBen Skeggs 			RUNL_DEBUG(runl, "engn %s !nonstall", engn->engine->subdev.name);
486*55e1a599SBen Skeggs 			return -EINVAL;
487*55e1a599SBen Skeggs 		}
48884ab065eSBen Skeggs 	}
48984ab065eSBen Skeggs 
49084ab065eSBen Skeggs 	if (list_empty(&runl->engns)) {
49184ab065eSBen Skeggs 		RUNL_DEBUG(runl, "!engns");
49284ab065eSBen Skeggs 		return -EINVAL;
49384ab065eSBen Skeggs 	}
49484ab065eSBen Skeggs 
4957f4f35eaSBen Skeggs 	ret = nvkm_inth_add(&device->vfn->intr, vector & 0x00000fff, NVKM_INTR_PRIO_NORMAL,
4967f4f35eaSBen Skeggs 			    &fifo->engine.subdev, ga100_runl_intr, &runl->inth);
49784ab065eSBen Skeggs 	if (ret) {
49884ab065eSBen Skeggs 		RUNL_ERROR(runl, "inth %d", ret);
4997f4f35eaSBen Skeggs 		return ret;
50084ab065eSBen Skeggs 	}
5017f4f35eaSBen Skeggs 
5027f4f35eaSBen Skeggs 	runl->chan = chaddr;
5037f4f35eaSBen Skeggs 	runl->doorbell = dbcfg >> 16;
5047f4f35eaSBen Skeggs 	return 0;
5057f4f35eaSBen Skeggs }
5067f4f35eaSBen Skeggs 
5077f4f35eaSBen Skeggs static irqreturn_t
ga100_fifo_nonstall_intr(struct nvkm_inth * inth)5087f4f35eaSBen Skeggs ga100_fifo_nonstall_intr(struct nvkm_inth *inth)
5097f4f35eaSBen Skeggs {
510*55e1a599SBen Skeggs 	struct nvkm_runl *runl = container_of(inth, typeof(*runl), nonstall.inth);
5117f4f35eaSBen Skeggs 
512*55e1a599SBen Skeggs 	nvkm_event_ntfy(&runl->fifo->nonstall.event, runl->id, NVKM_FIFO_NONSTALL_EVENT);
5137f4f35eaSBen Skeggs 	return IRQ_HANDLED;
5147f4f35eaSBen Skeggs }
5157f4f35eaSBen Skeggs 
5167f4f35eaSBen Skeggs static void
ga100_fifo_nonstall_block(struct nvkm_event * event,int type,int index)5177f4f35eaSBen Skeggs ga100_fifo_nonstall_block(struct nvkm_event *event, int type, int index)
5187f4f35eaSBen Skeggs {
5197f4f35eaSBen Skeggs 	struct nvkm_fifo *fifo = container_of(event, typeof(*fifo), nonstall.event);
520*55e1a599SBen Skeggs 	struct nvkm_runl *runl = nvkm_runl_get(fifo, index, 0);
5217f4f35eaSBen Skeggs 
522*55e1a599SBen Skeggs 	nvkm_inth_block(&runl->nonstall.inth);
5237f4f35eaSBen Skeggs }
5247f4f35eaSBen Skeggs 
5257f4f35eaSBen Skeggs static void
ga100_fifo_nonstall_allow(struct nvkm_event * event,int type,int index)5267f4f35eaSBen Skeggs ga100_fifo_nonstall_allow(struct nvkm_event *event, int type, int index)
5277f4f35eaSBen Skeggs {
5287f4f35eaSBen Skeggs 	struct nvkm_fifo *fifo = container_of(event, typeof(*fifo), nonstall.event);
529*55e1a599SBen Skeggs 	struct nvkm_runl *runl = nvkm_runl_get(fifo, index, 0);
5307f4f35eaSBen Skeggs 
531*55e1a599SBen Skeggs 	nvkm_inth_allow(&runl->nonstall.inth);
5327f4f35eaSBen Skeggs }
5337f4f35eaSBen Skeggs 
5347f4f35eaSBen Skeggs const struct nvkm_event_func
5357f4f35eaSBen Skeggs ga100_fifo_nonstall = {
5367f4f35eaSBen Skeggs 	.init = ga100_fifo_nonstall_allow,
5377f4f35eaSBen Skeggs 	.fini = ga100_fifo_nonstall_block,
5387f4f35eaSBen Skeggs };
5397f4f35eaSBen Skeggs 
5407f4f35eaSBen Skeggs int
ga100_fifo_nonstall_ctor(struct nvkm_fifo * fifo)5417f4f35eaSBen Skeggs ga100_fifo_nonstall_ctor(struct nvkm_fifo *fifo)
5427f4f35eaSBen Skeggs {
543*55e1a599SBen Skeggs 	struct nvkm_subdev *subdev = &fifo->engine.subdev;
544*55e1a599SBen Skeggs 	struct nvkm_vfn *vfn = subdev->device->vfn;
545*55e1a599SBen Skeggs 	struct nvkm_runl *runl;
546*55e1a599SBen Skeggs 	int ret, nr = 0;
547*55e1a599SBen Skeggs 
548*55e1a599SBen Skeggs 	nvkm_runl_foreach(runl, fifo) {
549*55e1a599SBen Skeggs 		struct nvkm_engn *engn = list_first_entry(&runl->engns, typeof(*engn), head);
550*55e1a599SBen Skeggs 
551*55e1a599SBen Skeggs 		runl->nonstall.vector = engn->func->nonstall(engn);
552*55e1a599SBen Skeggs 		if (runl->nonstall.vector < 0) {
553*55e1a599SBen Skeggs 			RUNL_ERROR(runl, "nonstall %d", runl->nonstall.vector);
554*55e1a599SBen Skeggs 			return runl->nonstall.vector;
555*55e1a599SBen Skeggs 		}
556*55e1a599SBen Skeggs 
557*55e1a599SBen Skeggs 		ret = nvkm_inth_add(&vfn->intr, runl->nonstall.vector, NVKM_INTR_PRIO_NORMAL,
558*55e1a599SBen Skeggs 				    subdev, ga100_fifo_nonstall_intr, &runl->nonstall.inth);
559*55e1a599SBen Skeggs 		if (ret)
560*55e1a599SBen Skeggs 			return ret;
561*55e1a599SBen Skeggs 
562*55e1a599SBen Skeggs 		nr = max(nr, runl->id + 1);
563*55e1a599SBen Skeggs 	}
564*55e1a599SBen Skeggs 
565*55e1a599SBen Skeggs 	return nr;
5667f4f35eaSBen Skeggs }
5677f4f35eaSBen Skeggs 
5687f4f35eaSBen Skeggs int
ga100_fifo_runl_ctor(struct nvkm_fifo * fifo)5697f4f35eaSBen Skeggs ga100_fifo_runl_ctor(struct nvkm_fifo *fifo)
5707f4f35eaSBen Skeggs {
5717f4f35eaSBen Skeggs 	struct nvkm_device *device = fifo->engine.subdev.device;
5727f4f35eaSBen Skeggs 	struct nvkm_top_device *tdev;
5737f4f35eaSBen Skeggs 	struct nvkm_runl *runl;
5747f4f35eaSBen Skeggs 	int id = 0, ret;
5757f4f35eaSBen Skeggs 
5767f4f35eaSBen Skeggs 	nvkm_list_foreach(tdev, &device->top->device, head, tdev->runlist >= 0) {
5777f4f35eaSBen Skeggs 		runl = nvkm_runl_get(fifo, -1, tdev->runlist);
5787f4f35eaSBen Skeggs 		if (!runl) {
5797f4f35eaSBen Skeggs 			ret = ga100_runl_new(fifo, id++, tdev->runlist, &runl);
58084ab065eSBen Skeggs 			if (ret) {
58184ab065eSBen Skeggs 				if (runl)
58284ab065eSBen Skeggs 					nvkm_runl_del(runl);
5837f4f35eaSBen Skeggs 
5847f4f35eaSBen Skeggs 				continue;
58584ab065eSBen Skeggs 			}
58684ab065eSBen Skeggs 		}
5877f4f35eaSBen Skeggs 	}
5887f4f35eaSBen Skeggs 
5897f4f35eaSBen Skeggs 	return 0;
5907f4f35eaSBen Skeggs }
5917f4f35eaSBen Skeggs 
5927f4f35eaSBen Skeggs static const struct nvkm_fifo_func
5937f4f35eaSBen Skeggs ga100_fifo = {
5947f4f35eaSBen Skeggs 	.runl_ctor = ga100_fifo_runl_ctor,
5957f4f35eaSBen Skeggs 	.mmu_fault = &tu102_fifo_mmu_fault,
5967f4f35eaSBen Skeggs 	.nonstall_ctor = ga100_fifo_nonstall_ctor,
5977f4f35eaSBen Skeggs 	.nonstall = &ga100_fifo_nonstall,
5987f4f35eaSBen Skeggs 	.runl = &ga100_runl,
5997f4f35eaSBen Skeggs 	.runq = &ga100_runq,
6007f4f35eaSBen Skeggs 	.engn = &ga100_engn,
6017f4f35eaSBen Skeggs 	.engn_ce = &ga100_engn_ce,
6027f4f35eaSBen Skeggs 	.cgrp = {{ 0, 0, KEPLER_CHANNEL_GROUP_A  }, &ga100_cgrp, .force = true },
6037f4f35eaSBen Skeggs 	.chan = {{ 0, 0, AMPERE_CHANNEL_GPFIFO_A }, &ga100_chan },
6047f4f35eaSBen Skeggs };
6057f4f35eaSBen Skeggs 
6067f4f35eaSBen Skeggs int
ga100_fifo_new(struct nvkm_device * device,enum nvkm_subdev_type type,int inst,struct nvkm_fifo ** pfifo)6077f4f35eaSBen Skeggs ga100_fifo_new(struct nvkm_device *device, enum nvkm_subdev_type type, int inst,
6087f4f35eaSBen Skeggs 	       struct nvkm_fifo **pfifo)
6097f4f35eaSBen Skeggs {
6107f4f35eaSBen Skeggs 	return nvkm_fifo_new_(&ga100_fifo, device, type, inst, pfifo);
6117f4f35eaSBen Skeggs }
612