root/drivers/gpu/host1x/hw/cdma_hw.c
// SPDX-License-Identifier: GPL-2.0-only
/*
 * Tegra host1x Command DMA
 *
 * Copyright (c) 2010-2013, NVIDIA Corporation.
 */

#include <linux/slab.h>
#include <linux/scatterlist.h>
#include <linux/dma-mapping.h>

#include "../cdma.h"
#include "../channel.h"
#include "../dev.h"
#include "../debug.h"

/*
 * Put the restart at the end of pushbuffer memory
 */
static void push_buffer_init(struct push_buffer *pb)
{
        *(u32 *)(pb->mapped + pb->size) = host1x_opcode_restart(0);
}

/*
 * Increment timedout buffer's syncpt via CPU.
 */
static void cdma_timeout_cpu_incr(struct host1x_cdma *cdma, u32 getptr,
                                u32 syncpt_incrs, u32 syncval, u32 nr_slots)
{
        unsigned int i;

        for (i = 0; i < syncpt_incrs; i++)
                host1x_syncpt_incr(cdma->timeout.syncpt);

        /* after CPU incr, ensure shadow is up to date */
        host1x_syncpt_load(cdma->timeout.syncpt);
}

/*
 * Start channel DMA
 */
static void cdma_start(struct host1x_cdma *cdma)
{
        struct host1x_channel *ch = cdma_to_channel(cdma);
        u64 start, end;

        if (cdma->running)
                return;

        cdma->last_pos = cdma->push_buffer.pos;
        start = cdma->push_buffer.dma;
        end = cdma->push_buffer.size + 4;

        host1x_ch_writel(ch, HOST1X_CHANNEL_DMACTRL_DMASTOP,
                         HOST1X_CHANNEL_DMACTRL);

        /* set base, put and end pointer */
        host1x_ch_writel(ch, lower_32_bits(start), HOST1X_CHANNEL_DMASTART);
#if HOST1X_HW >= 6
        host1x_ch_writel(ch, upper_32_bits(start), HOST1X_CHANNEL_DMASTART_HI);
#endif
        host1x_ch_writel(ch, cdma->push_buffer.pos, HOST1X_CHANNEL_DMAPUT);
#if HOST1X_HW >= 6
        host1x_ch_writel(ch, 0, HOST1X_CHANNEL_DMAPUT_HI);
#endif
        host1x_ch_writel(ch, lower_32_bits(end), HOST1X_CHANNEL_DMAEND);
#if HOST1X_HW >= 6
        host1x_ch_writel(ch, upper_32_bits(end), HOST1X_CHANNEL_DMAEND_HI);
#endif

        /* reset GET */
        host1x_ch_writel(ch, HOST1X_CHANNEL_DMACTRL_DMASTOP |
                         HOST1X_CHANNEL_DMACTRL_DMAGETRST |
                         HOST1X_CHANNEL_DMACTRL_DMAINITGET,
                         HOST1X_CHANNEL_DMACTRL);

        /* start the command DMA */
        host1x_ch_writel(ch, 0, HOST1X_CHANNEL_DMACTRL);

        cdma->running = true;
}

/*
 * Similar to cdma_start(), but rather than starting from an idle
 * state (where DMA GET is set to DMA PUT), on a timeout we restore
 * DMA GET from an explicit value (so DMA may again be pending).
 */
static void cdma_timeout_restart(struct host1x_cdma *cdma, u32 getptr)
{
        struct host1x *host1x = cdma_to_host1x(cdma);
        struct host1x_channel *ch = cdma_to_channel(cdma);
        u64 start, end;

        if (cdma->running)
                return;

        cdma->last_pos = cdma->push_buffer.pos;

        host1x_ch_writel(ch, HOST1X_CHANNEL_DMACTRL_DMASTOP,
                         HOST1X_CHANNEL_DMACTRL);

        start = cdma->push_buffer.dma;
        end = cdma->push_buffer.size + 4;

        /* set base, end pointer (all of memory) */
        host1x_ch_writel(ch, lower_32_bits(start), HOST1X_CHANNEL_DMASTART);
#if HOST1X_HW >= 6
        host1x_ch_writel(ch, upper_32_bits(start), HOST1X_CHANNEL_DMASTART_HI);
#endif
        host1x_ch_writel(ch, lower_32_bits(end), HOST1X_CHANNEL_DMAEND);
#if HOST1X_HW >= 6
        host1x_ch_writel(ch, upper_32_bits(end), HOST1X_CHANNEL_DMAEND_HI);
#endif

        /* set GET, by loading the value in PUT (then reset GET) */
        host1x_ch_writel(ch, getptr, HOST1X_CHANNEL_DMAPUT);
        host1x_ch_writel(ch, HOST1X_CHANNEL_DMACTRL_DMASTOP |
                         HOST1X_CHANNEL_DMACTRL_DMAGETRST |
                         HOST1X_CHANNEL_DMACTRL_DMAINITGET,
                         HOST1X_CHANNEL_DMACTRL);

        dev_dbg(host1x->dev,
                "%s: DMA GET 0x%x, PUT HW 0x%x / shadow 0x%x\n", __func__,
                host1x_ch_readl(ch, HOST1X_CHANNEL_DMAGET),
                host1x_ch_readl(ch, HOST1X_CHANNEL_DMAPUT),
                cdma->last_pos);

        /* deassert GET reset and set PUT */
        host1x_ch_writel(ch, HOST1X_CHANNEL_DMACTRL_DMASTOP,
                         HOST1X_CHANNEL_DMACTRL);
        host1x_ch_writel(ch, cdma->push_buffer.pos, HOST1X_CHANNEL_DMAPUT);

        /* start the command DMA */
        host1x_ch_writel(ch, 0, HOST1X_CHANNEL_DMACTRL);

        cdma->running = true;
}

/*
 * Kick channel DMA into action by writing its PUT offset (if it has changed)
 */
static void cdma_flush(struct host1x_cdma *cdma)
{
        struct host1x_channel *ch = cdma_to_channel(cdma);

        if (cdma->push_buffer.pos != cdma->last_pos) {
                host1x_ch_writel(ch, cdma->push_buffer.pos,
                                 HOST1X_CHANNEL_DMAPUT);
                cdma->last_pos = cdma->push_buffer.pos;
        }
}

static void cdma_stop(struct host1x_cdma *cdma)
{
        struct host1x_channel *ch = cdma_to_channel(cdma);

        mutex_lock(&cdma->lock);

        if (cdma->running) {
                host1x_cdma_wait_locked(cdma, CDMA_EVENT_SYNC_QUEUE_EMPTY);
                host1x_ch_writel(ch, HOST1X_CHANNEL_DMACTRL_DMASTOP,
                                 HOST1X_CHANNEL_DMACTRL);
                cdma->running = false;
        }

        mutex_unlock(&cdma->lock);
}

static void cdma_hw_cmdproc_stop(struct host1x *host, struct host1x_channel *ch,
                                 bool stop)
{
#if HOST1X_HW >= 6
        host1x_ch_writel(ch, stop ? 0x1 : 0x0, HOST1X_CHANNEL_CMDPROC_STOP);
#else
        u32 cmdproc_stop = host1x_sync_readl(host, HOST1X_SYNC_CMDPROC_STOP);
        if (stop)
                cmdproc_stop |= BIT(ch->id);
        else
                cmdproc_stop &= ~BIT(ch->id);
        host1x_sync_writel(host, cmdproc_stop, HOST1X_SYNC_CMDPROC_STOP);
#endif
}

static void cdma_hw_teardown(struct host1x *host, struct host1x_channel *ch)
{
#if HOST1X_HW >= 6
        host1x_ch_writel(ch, 0x1, HOST1X_CHANNEL_TEARDOWN);
#else
        host1x_sync_writel(host, BIT(ch->id), HOST1X_SYNC_CH_TEARDOWN);
#endif
}

/*
 * Stops both channel's command processor and CDMA immediately.
 * Also, tears down the channel and resets corresponding module.
 */
static void cdma_freeze(struct host1x_cdma *cdma)
{
        struct host1x *host = cdma_to_host1x(cdma);
        struct host1x_channel *ch = cdma_to_channel(cdma);

        if (cdma->torndown && !cdma->running) {
                dev_warn(host->dev, "Already torn down\n");
                return;
        }

        dev_dbg(host->dev, "freezing channel (id %d)\n", ch->id);

        cdma_hw_cmdproc_stop(host, ch, true);

        dev_dbg(host->dev, "%s: DMA GET 0x%x, PUT HW 0x%x / shadow 0x%x\n",
                __func__, host1x_ch_readl(ch, HOST1X_CHANNEL_DMAGET),
                host1x_ch_readl(ch, HOST1X_CHANNEL_DMAPUT),
                cdma->last_pos);

        host1x_ch_writel(ch, HOST1X_CHANNEL_DMACTRL_DMASTOP,
                         HOST1X_CHANNEL_DMACTRL);

        cdma_hw_teardown(host, ch);

        cdma->running = false;
        cdma->torndown = true;
}

static void cdma_resume(struct host1x_cdma *cdma, u32 getptr)
{
        struct host1x *host1x = cdma_to_host1x(cdma);
        struct host1x_channel *ch = cdma_to_channel(cdma);

        dev_dbg(host1x->dev,
                "resuming channel (id %u, DMAGET restart = 0x%x)\n",
                ch->id, getptr);

        cdma_hw_cmdproc_stop(host1x, ch, false);

        cdma->torndown = false;
        cdma_timeout_restart(cdma, getptr);
}

static void timeout_release_mlock(struct host1x_cdma *cdma)
{
#if HOST1X_HW >= 8
        /* Tegra186 and Tegra194 require a more complicated MLOCK release
         * sequence. Furthermore, those chips by default don't enforce MLOCKs,
         * so it turns out that if we don't /actually/ need MLOCKs, we can just
         * ignore them.
         *
         * As such, for now just implement this on Tegra234 where things are
         * stricter but also easy to implement.
         */
        struct host1x_channel *ch = cdma_to_channel(cdma);
        struct host1x *host1x = cdma_to_host1x(cdma);
        u32 offset;

        switch (ch->client->class) {
        case HOST1X_CLASS_NVJPG1:
                offset = HOST1X_COMMON_NVJPG1_MLOCK;
                break;
        case HOST1X_CLASS_NVENC:
                offset = HOST1X_COMMON_NVENC_MLOCK;
                break;
        case HOST1X_CLASS_VIC:
                offset = HOST1X_COMMON_VIC_MLOCK;
                break;
        case HOST1X_CLASS_NVJPG:
                offset = HOST1X_COMMON_NVJPG_MLOCK;
                break;
        case HOST1X_CLASS_NVDEC:
                offset = HOST1X_COMMON_NVDEC_MLOCK;
                break;
        case HOST1X_CLASS_OFA:
                offset = HOST1X_COMMON_OFA_MLOCK;
                break;
        default:
                WARN(1, "%s was not updated for class %u", __func__, ch->client->class);
                return;
        }

        host1x_common_writel(host1x, 0x0, offset);
#endif
}

/*
 * If this timeout fires, it indicates the current sync_queue entry has
 * exceeded its TTL and the userctx should be timed out and remaining
 * submits already issued cleaned up (future submits return an error).
 */
static void cdma_timeout_handler(struct work_struct *work)
{
        u32 syncpt_val;
        struct host1x_cdma *cdma;
        struct host1x *host1x;
        struct host1x_channel *ch;

        cdma = container_of(to_delayed_work(work), struct host1x_cdma,
                            timeout.wq);
        host1x = cdma_to_host1x(cdma);
        ch = cdma_to_channel(cdma);

        host1x_debug_dump(cdma_to_host1x(cdma));

        mutex_lock(&cdma->lock);

        if (!cdma->timeout.client) {
                dev_dbg(host1x->dev,
                        "cdma_timeout: expired, but has no clientid\n");
                mutex_unlock(&cdma->lock);
                return;
        }

        /* stop processing to get a clean snapshot */
        cdma_hw_cmdproc_stop(host1x, ch, true);

        syncpt_val = host1x_syncpt_load(cdma->timeout.syncpt);

        /* has buffer actually completed? */
        if ((s32)(syncpt_val - cdma->timeout.syncpt_val) >= 0) {
                dev_dbg(host1x->dev,
                        "cdma_timeout: expired, but buffer had completed\n");
                /* restore */
                cdma_hw_cmdproc_stop(host1x, ch, false);
                mutex_unlock(&cdma->lock);
                return;
        }

        dev_warn(host1x->dev, "%s: timeout: %u (%s), HW thresh %d, done %d\n",
                 __func__, cdma->timeout.syncpt->id, cdma->timeout.syncpt->name,
                 syncpt_val, cdma->timeout.syncpt_val);

        /* stop HW, resetting channel/module */
        host1x_hw_cdma_freeze(host1x, cdma);

        /* release any held MLOCK */
        timeout_release_mlock(cdma);

        host1x_cdma_update_sync_queue(cdma, ch->dev);
        mutex_unlock(&cdma->lock);
}

/*
 * Init timeout resources
 */
static int cdma_timeout_init(struct host1x_cdma *cdma)
{
        INIT_DELAYED_WORK(&cdma->timeout.wq, cdma_timeout_handler);
        cdma->timeout.initialized = true;

        return 0;
}

/*
 * Clean up timeout resources
 */
static void cdma_timeout_destroy(struct host1x_cdma *cdma)
{
        if (cdma->timeout.initialized)
                cancel_delayed_work(&cdma->timeout.wq);

        cdma->timeout.initialized = false;
}

static const struct host1x_cdma_ops host1x_cdma_ops = {
        .start = cdma_start,
        .stop = cdma_stop,
        .flush = cdma_flush,

        .timeout_init = cdma_timeout_init,
        .timeout_destroy = cdma_timeout_destroy,
        .freeze = cdma_freeze,
        .resume = cdma_resume,
        .timeout_cpu_incr = cdma_timeout_cpu_incr,
};

static const struct host1x_pushbuffer_ops host1x_pushbuffer_ops = {
        .init = push_buffer_init,
};