root/drivers/gpu/drm/nouveau/nvkm/engine/fifo/ga100.c
/*
 * Copyright 2021 Red Hat Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
#include "priv.h"
#include "cgrp.h"
#include "chan.h"
#include "chid.h"
#include "runl.h"
#include "runq.h"

#include <core/gpuobj.h>
#include <subdev/gsp.h>
#include <subdev/top.h>
#include <subdev/vfn.h>

#include <nvif/class.h>

static u32
ga100_chan_doorbell_handle(struct nvkm_chan *chan)
{
        return (chan->cgrp->runl->doorbell << 16) | chan->id;
}

static void
ga100_chan_stop(struct nvkm_chan *chan)
{
        struct nvkm_runl *runl = chan->cgrp->runl;

        nvkm_wr32(runl->fifo->engine.subdev.device, runl->chan + (chan->id * 4), 0x00000003);
}

static void
ga100_chan_start(struct nvkm_chan *chan)
{
        struct nvkm_runl *runl = chan->cgrp->runl;
        struct nvkm_device *device = runl->fifo->engine.subdev.device;
        const int gfid = 0;

        nvkm_wr32(device, runl->chan + (chan->id * 4), 0x00000002);
        nvkm_wr32(device, runl->addr + 0x0090, (gfid << 16) | chan->id); /* INTERNAL_DOORBELL. */
}

static void
ga100_chan_unbind(struct nvkm_chan *chan)
{
        struct nvkm_runl *runl = chan->cgrp->runl;

        nvkm_wr32(runl->fifo->engine.subdev.device, runl->chan + (chan->id * 4), 0xffffffff);
}

static int
ga100_chan_ramfc_write(struct nvkm_chan *chan, u64 offset, u64 length, u32 devm, bool priv)
{
        const u32 limit2 = ilog2(length / 8);

        nvkm_kmap(chan->inst);
        nvkm_wo32(chan->inst, 0x010, 0x0000face);
        nvkm_wo32(chan->inst, 0x030, 0x7ffff902);
        nvkm_wo32(chan->inst, 0x048, lower_32_bits(offset));
        nvkm_wo32(chan->inst, 0x04c, upper_32_bits(offset) | (limit2 << 16));
        nvkm_wo32(chan->inst, 0x084, 0x20400000);
        nvkm_wo32(chan->inst, 0x094, 0x30000000 | devm);
        nvkm_wo32(chan->inst, 0x0e4, priv ? 0x00000020 : 0x00000000);
        nvkm_wo32(chan->inst, 0x0e8, chan->id);
        nvkm_wo32(chan->inst, 0x0f4, 0x00001000 | (priv ? 0x00000100 : 0x00000000));
        nvkm_wo32(chan->inst, 0x0f8, 0x80000000 | chan->cgrp->runl->nonstall.vector);
        nvkm_mo32(chan->inst, 0x218, 0x00000000, 0x00000000);
        nvkm_done(chan->inst);
        return 0;
}

static const struct nvkm_chan_func_ramfc
ga100_chan_ramfc = {
        .write = ga100_chan_ramfc_write,
        .devm = 0xfff,
        .priv = true,
};

const struct nvkm_chan_func
ga100_chan = {
        .inst = &gf100_chan_inst,
        .userd = &gv100_chan_userd,
        .ramfc = &ga100_chan_ramfc,
        .unbind = ga100_chan_unbind,
        .start = ga100_chan_start,
        .stop = ga100_chan_stop,
        .preempt = gk110_chan_preempt,
        .doorbell_handle = ga100_chan_doorbell_handle,
};

static void
ga100_cgrp_preempt(struct nvkm_cgrp *cgrp)
{
        struct nvkm_runl *runl = cgrp->runl;

        nvkm_wr32(runl->fifo->engine.subdev.device, runl->addr + 0x098, 0x01000000 | cgrp->id);
}

const struct nvkm_cgrp_func
ga100_cgrp = {
        .preempt = ga100_cgrp_preempt,
};

static int
ga100_engn_cxid(struct nvkm_engn *engn, bool *cgid)
{
        struct nvkm_runl *runl = engn->runl;
        struct nvkm_device *device = runl->fifo->engine.subdev.device;
        u32 stat = nvkm_rd32(device, runl->addr + 0x200 + engn->id * 0x40);

        ENGN_DEBUG(engn, "status %08x", stat);
        *cgid = true;

        switch ((stat & 0x0000e000) >> 13) {
        case 0 /* INVALID */: return -ENODEV;
        case 1 /*   VALID */:
        case 5 /*    SAVE */: return (stat & 0x00000fff);
        case 6 /*    LOAD */: return (stat & 0x0fff0000) >> 16;
        case 7 /*  SWITCH */:
                if (nvkm_engine_chsw_load(engn->engine))
                        return (stat & 0x0fff0000) >> 16;
                return (stat & 0x00000fff);
        default:
                WARN_ON(1);
                break;
        }

        return -ENODEV;
}

static int
ga100_engn_nonstall(struct nvkm_engn *engn)
{
        struct nvkm_engine *engine = engn->engine;

        if (WARN_ON(!engine->func->nonstall))
                return -EINVAL;

        return engine->func->nonstall(engine);
}

const struct nvkm_engn_func
ga100_engn = {
        .nonstall = ga100_engn_nonstall,
        .cxid = ga100_engn_cxid,
        .ctor = gk104_ectx_ctor,
        .bind = gv100_ectx_bind,
};

const struct nvkm_engn_func
ga100_engn_ce = {
        .nonstall = ga100_engn_nonstall,
        .cxid = ga100_engn_cxid,
        .ctor = gv100_ectx_ce_ctor,
        .bind = gv100_ectx_ce_bind,
};

static bool
ga100_runq_idle(struct nvkm_runq *runq)
{
        struct nvkm_device *device = runq->fifo->engine.subdev.device;

        return !(nvkm_rd32(device, 0x04015c + (runq->id * 0x800)) & 0x0000e000);
}

static bool
ga100_runq_intr_1(struct nvkm_runq *runq, struct nvkm_runl *runl)
{
        struct nvkm_device *device = runq->fifo->engine.subdev.device;
        u32 inte = nvkm_rd32(device, 0x040180 + (runq->id * 0x800));
        u32 intr = nvkm_rd32(device, 0x040148 + (runq->id * 0x800));
        u32 stat = intr & inte;

        if (!stat) {
                RUNQ_DEBUG(runq, "inte1 %08x %08x", intr, inte);
                return false;
        }

        if (stat & 0x80000000) {
                u32 chid = nvkm_rd32(device, 0x040120 + (runq->id * 0x0800)) & runl->chid->mask;
                struct nvkm_chan *chan;
                unsigned long flags;

                RUNQ_ERROR(runq, "CTXNOTVALID chid:%d", chid);
                chan = nvkm_runl_chan_get_chid(runl, chid, &flags);
                if (chan) {
                        nvkm_chan_error(chan, true);
                        nvkm_chan_put(&chan, flags);
                }

                nvkm_mask(device, 0x0400ac + (runq->id * 0x800), 0x00030000, 0x00030000);
                stat &= ~0x80000000;
        }

        if (stat) {
                RUNQ_ERROR(runq, "intr1 %08x", stat);
                nvkm_wr32(device, 0x0401a0 + (runq->id * 0x800), stat);
        }

        nvkm_wr32(device, 0x040148 + (runq->id * 0x800), intr);
        return true;
}

static bool
ga100_runq_intr_0(struct nvkm_runq *runq, struct nvkm_runl *runl)
{
        struct nvkm_device *device = runq->fifo->engine.subdev.device;
        u32 inte = nvkm_rd32(device, 0x040170 + (runq->id * 0x800));
        u32 intr = nvkm_rd32(device, 0x040108 + (runq->id * 0x800));
        u32 stat = intr & inte;

        if (!stat) {
                RUNQ_DEBUG(runq, "inte0 %08x %08x", intr, inte);
                return false;
        }

        /*TODO: expand on this when fixing up gf100's version. */
        if (stat & 0xc6afe000) {
                u32 chid = nvkm_rd32(device, 0x040120 + (runq->id * 0x0800)) & runl->chid->mask;
                struct nvkm_chan *chan;
                unsigned long flags;

                RUNQ_ERROR(runq, "intr0 %08x", stat);
                chan = nvkm_runl_chan_get_chid(runl, chid, &flags);
                if (chan) {
                        nvkm_chan_error(chan, true);
                        nvkm_chan_put(&chan, flags);
                }

                stat &= ~0xc6afe000;
        }

        if (stat) {
                RUNQ_ERROR(runq, "intr0 %08x", stat);
                nvkm_wr32(device, 0x040190 + (runq->id * 0x800), stat);
        }

        nvkm_wr32(device, 0x040108 + (runq->id * 0x800), intr);
        return true;
}

static bool
ga100_runq_intr(struct nvkm_runq *runq, struct nvkm_runl *runl)
{
        bool intr0 = ga100_runq_intr_0(runq, runl);
        bool intr1 = ga100_runq_intr_1(runq, runl);

        return intr0 || intr1;
}

static void
ga100_runq_init(struct nvkm_runq *runq)
{
        struct nvkm_device *device = runq->fifo->engine.subdev.device;

        nvkm_wr32(device, 0x040108 + (runq->id * 0x800), 0xffffffff); /* INTR_0 */
        nvkm_wr32(device, 0x040148 + (runq->id * 0x800), 0xffffffff); /* INTR_1 */
        nvkm_wr32(device, 0x040170 + (runq->id * 0x800), 0xffffffff); /* INTR_0_EN_SET_TREE */
        nvkm_wr32(device, 0x040180 + (runq->id * 0x800), 0xffffffff); /* INTR_1_EN_SET_TREE */
}

const struct nvkm_runq_func
ga100_runq = {
        .init = ga100_runq_init,
        .intr = ga100_runq_intr,
        .idle = ga100_runq_idle,
};

static bool
ga100_runl_preempt_pending(struct nvkm_runl *runl)
{
        return nvkm_rd32(runl->fifo->engine.subdev.device, runl->addr + 0x098) & 0x00100000;
}

static void
ga100_runl_preempt(struct nvkm_runl *runl)
{
        nvkm_wr32(runl->fifo->engine.subdev.device, runl->addr + 0x098, 0x00000000);
}

static void
ga100_runl_allow(struct nvkm_runl *runl, u32 engm)
{
        nvkm_mask(runl->fifo->engine.subdev.device, runl->addr + 0x094, 0x00000001, 0x00000000);
}

static void
ga100_runl_block(struct nvkm_runl *runl, u32 engm)
{
        nvkm_mask(runl->fifo->engine.subdev.device, runl->addr + 0x094, 0x00000001, 0x00000001);
}

static bool
ga100_runl_pending(struct nvkm_runl *runl)
{
        struct nvkm_device *device = runl->fifo->engine.subdev.device;

        return nvkm_rd32(device, runl->addr + 0x08c) & 0x00008000;
}

static void
ga100_runl_commit(struct nvkm_runl *runl, struct nvkm_memory *memory, u32 start, int count)
{
        struct nvkm_device *device = runl->fifo->engine.subdev.device;
        u64 addr = nvkm_memory_addr(memory) + start;

        nvkm_wr32(device, runl->addr + 0x080, lower_32_bits(addr));
        nvkm_wr32(device, runl->addr + 0x084, upper_32_bits(addr));
        nvkm_wr32(device, runl->addr + 0x088, count);
}

static irqreturn_t
ga100_runl_intr(struct nvkm_inth *inth)
{
        struct nvkm_runl *runl = container_of(inth, typeof(*runl), inth);
        struct nvkm_engn *engn;
        struct nvkm_device *device = runl->fifo->engine.subdev.device;
        u32 inte = nvkm_rd32(device, runl->addr + 0x120);
        u32 intr = nvkm_rd32(device, runl->addr + 0x100);
        u32 stat = intr & inte;
        u32 info;

        if (!stat) {
                RUNL_DEBUG(runl, "inte %08x %08x", intr, inte);
                return IRQ_NONE;
        }

        if (stat & 0x00000007) {
                nvkm_runl_foreach_engn_cond(engn, runl, stat & BIT(engn->id)) {
                        info = nvkm_rd32(device, runl->addr + 0x224 + (engn->id * 0x40));

                        tu102_fifo_intr_ctxsw_timeout_info(engn, info);

                        nvkm_wr32(device, runl->addr + 0x100, BIT(engn->id));
                        stat &= ~BIT(engn->id);
                }
        }

        if (stat & 0x00000300) {
                nvkm_wr32(device, runl->addr + 0x100, stat & 0x00000300);
                stat &= ~0x00000300;
        }

        if (stat & 0x00010000) {
                if (runl->runq[0]) {
                        if (runl->runq[0]->func->intr(runl->runq[0], runl))
                                stat &= ~0x00010000;
                }
        }

        if (stat & 0x00020000) {
                if (runl->runq[1]) {
                        if (runl->runq[1]->func->intr(runl->runq[1], runl))
                                stat &= ~0x00020000;
                }
        }

        if (stat) {
                RUNL_ERROR(runl, "intr %08x", stat);
                nvkm_wr32(device, runl->addr + 0x140, stat);
        }

        nvkm_wr32(device, runl->addr + 0x180, 0x00000001);
        return IRQ_HANDLED;
}

static void
ga100_runl_fini(struct nvkm_runl *runl)
{
        nvkm_mask(runl->fifo->engine.subdev.device, runl->addr + 0x300, 0x80000000, 0x00000000);
        nvkm_inth_block(&runl->inth);
}

static void
ga100_runl_init(struct nvkm_runl *runl)
{
        struct nvkm_fifo *fifo = runl->fifo;
        struct nvkm_runq *runq;
        struct nvkm_device *device = fifo->engine.subdev.device;
        int i;

        /* Submit NULL runlist and preempt. */
        nvkm_wr32(device, runl->addr + 0x088, 0x00000000);
        runl->func->preempt(runl);

        /* Enable doorbell. */
        nvkm_mask(device, runl->addr + 0x300, 0x80000000, 0x80000000);

        nvkm_wr32(device, runl->addr + 0x100, 0xffffffff); /* INTR_0 */
        nvkm_wr32(device, runl->addr + 0x140, 0xffffffff); /* INTR_0_EN_CLEAR_TREE(0) */
        nvkm_wr32(device, runl->addr + 0x120, 0x000f1307); /* INTR_0_EN_SET_TREE(0) */
        nvkm_wr32(device, runl->addr + 0x148, 0xffffffff); /* INTR_0_EN_CLEAR_TREE(1) */
        nvkm_wr32(device, runl->addr + 0x128, 0x00000000); /* INTR_0_EN_SET_TREE(1) */

        /* Init PBDMA(s). */
        for (i = 0; i < runl->runq_nr; i++) {
                runq = runl->runq[i];
                runq->func->init(runq);
        }

        nvkm_inth_allow(&runl->inth);
}

const struct nvkm_runl_func
ga100_runl = {
        .init = ga100_runl_init,
        .fini = ga100_runl_fini,
        .size = 16,
        .update = nv50_runl_update,
        .insert_cgrp = gv100_runl_insert_cgrp,
        .insert_chan = gv100_runl_insert_chan,
        .commit = ga100_runl_commit,
        .wait = nv50_runl_wait,
        .pending = ga100_runl_pending,
        .block = ga100_runl_block,
        .allow = ga100_runl_allow,
        .preempt = ga100_runl_preempt,
        .preempt_pending = ga100_runl_preempt_pending,
};

static int
ga100_runl_new(struct nvkm_fifo *fifo, int id, u32 addr, struct nvkm_runl **prunl)
{
        struct nvkm_device *device = fifo->engine.subdev.device;
        struct nvkm_top_device *tdev;
        struct nvkm_runl *runl;
        struct nvkm_engn *engn;
        u32 chcfg  = nvkm_rd32(device, addr + 0x004);
        u32 chnum  = 1 << (chcfg & 0x0000000f);
        u32 chaddr = (chcfg & 0xfffffff0);
        u32 dbcfg  = nvkm_rd32(device, addr + 0x008);
        u32 vector = nvkm_rd32(device, addr + 0x160);
        int i, ret;

        runl = nvkm_runl_new(fifo, id, addr, chnum);
        if (IS_ERR(runl))
                return PTR_ERR(runl);

        *prunl = runl;

        for (i = 0; i < 2; i++) {
                u32 pbcfg = nvkm_rd32(device, addr + 0x010 + (i * 0x04));
                if (pbcfg & 0x80000000) {
                        runl->runq[runl->runq_nr] =
                                nvkm_runq_new(fifo, ((pbcfg & 0x03fffc00) - 0x040000) / 0x800);
                        if (!runl->runq[runl->runq_nr]) {
                                RUNL_ERROR(runl, "runq %d", runl->runq_nr);
                                return -ENOMEM;
                        }

                        runl->runq_nr++;
                }
        }

        nvkm_list_foreach(tdev, &device->top->device, head, tdev->runlist == runl->addr) {
                if (tdev->engine < 0) {
                        RUNL_DEBUG(runl, "engn !top");
                        return -EINVAL;
                }

                engn = nvkm_runl_add(runl, tdev->engine, (tdev->type == NVKM_ENGINE_CE) ?
                                     fifo->func->engn_ce : fifo->func->engn,
                                     tdev->type, tdev->inst);
                if (!engn)
                        return -EINVAL;

                if (!engn->engine->func->nonstall) {
                        RUNL_DEBUG(runl, "engn %s !nonstall", engn->engine->subdev.name);
                        return -EINVAL;
                }
        }

        if (list_empty(&runl->engns)) {
                RUNL_DEBUG(runl, "!engns");
                return -EINVAL;
        }

        ret = nvkm_inth_add(&device->vfn->intr, vector & 0x00000fff, NVKM_INTR_PRIO_NORMAL,
                            &fifo->engine.subdev, ga100_runl_intr, &runl->inth);
        if (ret) {
                RUNL_ERROR(runl, "inth %d", ret);
                return ret;
        }

        runl->chan = chaddr;
        runl->doorbell = dbcfg >> 16;
        return 0;
}

static irqreturn_t
ga100_fifo_nonstall_intr(struct nvkm_inth *inth)
{
        struct nvkm_runl *runl = container_of(inth, typeof(*runl), nonstall.inth);

        nvkm_event_ntfy(&runl->fifo->nonstall.event, runl->id, NVKM_FIFO_NONSTALL_EVENT);
        return IRQ_HANDLED;
}

static void
ga100_fifo_nonstall_block(struct nvkm_event *event, int type, int index)
{
}

static void
ga100_fifo_nonstall_allow(struct nvkm_event *event, int type, int index)
{
}

const struct nvkm_event_func
ga100_fifo_nonstall = {
        .init = ga100_fifo_nonstall_allow,
        .fini = ga100_fifo_nonstall_block,
};

int
ga100_fifo_nonstall_ctor(struct nvkm_fifo *fifo)
{
        struct nvkm_subdev *subdev = &fifo->engine.subdev;
        struct nvkm_vfn *vfn = subdev->device->vfn;
        struct nvkm_runl *runl;
        int ret, nr = 0;

        nvkm_runl_foreach(runl, fifo) {
                struct nvkm_engn *engn = list_first_entry(&runl->engns, typeof(*engn), head);

                runl->nonstall.vector = engn->func->nonstall(engn);

                /* if no nonstall vector just keep going */
                if (runl->nonstall.vector == -1)
                        continue;
                if (runl->nonstall.vector < 0) {
                        RUNL_ERROR(runl, "nonstall %d", runl->nonstall.vector);
                        return runl->nonstall.vector;
                }

                ret = nvkm_inth_add(&vfn->intr, runl->nonstall.vector, NVKM_INTR_PRIO_NORMAL,
                                    subdev, ga100_fifo_nonstall_intr, &runl->nonstall.inth);
                if (ret)
                        return ret;

                nvkm_inth_allow(&runl->nonstall.inth);

                nr = max(nr, runl->id + 1);
        }

        return nr;
}

void
ga100_fifo_nonstall_dtor(struct nvkm_fifo *fifo)
{
        struct nvkm_runl *runl;

        nvkm_runl_foreach(runl, fifo) {
                if (runl->nonstall.vector < 0)
                        continue;
                nvkm_inth_block(&runl->nonstall.inth);
        }
}

int
ga100_fifo_runl_ctor(struct nvkm_fifo *fifo)
{
        struct nvkm_device *device = fifo->engine.subdev.device;
        struct nvkm_top_device *tdev;
        struct nvkm_runl *runl;
        int id = 0, ret;

        nvkm_list_foreach(tdev, &device->top->device, head, tdev->runlist >= 0) {
                runl = nvkm_runl_get(fifo, -1, tdev->runlist);
                if (!runl) {
                        ret = ga100_runl_new(fifo, id++, tdev->runlist, &runl);
                        if (ret) {
                                if (runl)
                                        nvkm_runl_del(runl);

                                continue;
                        }
                }
        }

        return 0;
}

static const struct nvkm_fifo_func
ga100_fifo = {
        .runl_ctor = ga100_fifo_runl_ctor,
        .mmu_fault = &tu102_fifo_mmu_fault,
        .nonstall_ctor = ga100_fifo_nonstall_ctor,
        .nonstall_dtor = ga100_fifo_nonstall_dtor,
        .nonstall = &ga100_fifo_nonstall,
        .runl = &ga100_runl,
        .runq = &ga100_runq,
        .engn = &ga100_engn,
        .engn_ce = &ga100_engn_ce,
        .cgrp = {{ 0, 0, KEPLER_CHANNEL_GROUP_A  }, &ga100_cgrp, .force = true },
        .chan = {{ 0, 0, AMPERE_CHANNEL_GPFIFO_A }, &ga100_chan },
};

int
ga100_fifo_new(struct nvkm_device *device, enum nvkm_subdev_type type, int inst,
               struct nvkm_fifo **pfifo)
{
        if (nvkm_gsp_rm(device->gsp))
                return r535_fifo_new(&ga100_fifo, device, type, inst, pfifo);

        return nvkm_fifo_new_(&ga100_fifo, device, type, inst, pfifo);
}