root/drivers/media/pci/intel/ipu6/ipu6-fw-com.c
// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2013--2024 Intel Corporation
 */

#include <linux/device.h>
#include <linux/dma-mapping.h>
#include <linux/io.h>
#include <linux/math.h>
#include <linux/overflow.h>
#include <linux/slab.h>
#include <linux/types.h>

#include "ipu6-bus.h"
#include "ipu6-dma.h"
#include "ipu6-fw-com.h"

/*
 * FWCOM layer is a shared resource between FW and driver. It consist
 * of token queues to both send and receive directions. Queue is simply
 * an array of structures with read and write indexes to the queue.
 * There are 1...n queues to both directions. Queues locates in
 * system RAM and are mapped to ISP MMU so that both CPU and ISP can
 * see the same buffer. Indexes are located in ISP DMEM so that FW code
 * can poll those with very low latency and cost. CPU access to indexes is
 * more costly but that happens only at message sending time and
 * interrupt triggered message handling. CPU doesn't need to poll indexes.
 * wr_reg / rd_reg are offsets to those dmem location. They are not
 * the indexes itself.
 */

/* Shared structure between driver and FW - do not modify */
struct ipu6_fw_sys_queue {
        u64 host_address;
        u32 vied_address;
        u32 size;
        u32 token_size;
        u32 wr_reg;     /* reg number in subsystem's regmem */
        u32 rd_reg;
        u32 _align;
} __packed;

struct ipu6_fw_sys_queue_res {
        u64 host_address;
        u32 vied_address;
        u32 reg;
} __packed;

enum syscom_state {
        /* Program load or explicit host setting should init to this */
        SYSCOM_STATE_UNINIT = 0x57a7e000,
        /* SP Syscom sets this when it is ready for use */
        SYSCOM_STATE_READY = 0x57a7e001,
        /* SP Syscom sets this when no more syscom accesses will happen */
        SYSCOM_STATE_INACTIVE = 0x57a7e002,
};

enum syscom_cmd {
        /* Program load or explicit host setting should init to this */
        SYSCOM_COMMAND_UNINIT = 0x57a7f000,
        /* Host Syscom requests syscom to become inactive */
        SYSCOM_COMMAND_INACTIVE = 0x57a7f001,
};

/* firmware config: data that sent from the host to SP via DDR */
/* Cell copies data into a context */

struct ipu6_fw_syscom_config {
        u32 firmware_address;

        u32 num_input_queues;
        u32 num_output_queues;

        /* ISP pointers to an array of ipu6_fw_sys_queue structures */
        u32 input_queue;
        u32 output_queue;

        /* ISYS / PSYS private data */
        u32 specific_addr;
        u32 specific_size;
};

struct ipu6_fw_com_context {
        struct ipu6_bus_device *adev;
        void __iomem *dmem_addr;
        int (*cell_ready)(struct ipu6_bus_device *adev);
        void (*cell_start)(struct ipu6_bus_device *adev);

        void *dma_buffer;
        dma_addr_t dma_addr;
        unsigned int dma_size;

        struct ipu6_fw_sys_queue *input_queue;  /* array of host to SP queues */
        struct ipu6_fw_sys_queue *output_queue; /* array of SP to host */

        u32 config_vied_addr;

        unsigned int buttress_boot_offset;
        void __iomem *base_addr;
};

#define FW_COM_WR_REG 0
#define FW_COM_RD_REG 4

#define REGMEM_OFFSET 0
#define TUNIT_MAGIC_PATTERN 0x5a5a5a5a

enum regmem_id {
        /* pass pkg_dir address to SPC in non-secure mode */
        PKG_DIR_ADDR_REG = 0,
        /* Tunit CFG blob for secure - provided by host.*/
        TUNIT_CFG_DWR_REG = 1,
        /* syscom commands - modified by the host */
        SYSCOM_COMMAND_REG = 2,
        /* Store interrupt status - updated by SP */
        SYSCOM_IRQ_REG = 3,
        /* first syscom queue pointer register */
        SYSCOM_QPR_BASE_REG = 4
};

#define BUTTRESS_FW_BOOT_PARAMS_0 0x4000
#define BUTTRESS_FW_BOOT_PARAM_REG(base, offset, id)                    \
        ((base) + BUTTRESS_FW_BOOT_PARAMS_0 + ((offset) + (id)) * 4)

enum buttress_syscom_id {
        /* pass syscom configuration to SPC */
        SYSCOM_CONFIG_ID                = 0,
        /* syscom state - modified by SP */
        SYSCOM_STATE_ID                 = 1,
        /* syscom vtl0 addr mask */
        SYSCOM_VTL0_ADDR_MASK_ID        = 2,
        SYSCOM_ID_MAX
};

static void ipu6_sys_queue_init(struct ipu6_fw_sys_queue *q, unsigned int size,
                                unsigned int token_size,
                                struct ipu6_fw_sys_queue_res *res)
{
        unsigned int buf_size = (size + 1) * token_size;

        q->size = size + 1;
        q->token_size = token_size;

        /* acquire the shared buffer space */
        q->host_address = res->host_address;
        res->host_address += buf_size;
        q->vied_address = res->vied_address;
        res->vied_address += buf_size;

        /* acquire the shared read and writer pointers */
        q->wr_reg = res->reg;
        res->reg++;
        q->rd_reg = res->reg;
        res->reg++;
}

void *ipu6_fw_com_prepare(struct ipu6_fw_com_cfg *cfg,
                          struct ipu6_bus_device *adev, void __iomem *base)
{
        size_t conf_size, inq_size, outq_size, specific_size;
        struct ipu6_fw_syscom_config *config_host_addr;
        unsigned int sizeinput = 0, sizeoutput = 0;
        struct ipu6_fw_sys_queue_res res;
        struct ipu6_fw_com_context *ctx;
        struct device *dev = &adev->auxdev.dev;
        size_t sizeall, offset;
        void *specific_host_addr;
        unsigned int i;

        if (!cfg || !cfg->cell_start || !cfg->cell_ready)
                return NULL;

        ctx = kzalloc_obj(*ctx);
        if (!ctx)
                return NULL;
        ctx->dmem_addr = base + cfg->dmem_addr + REGMEM_OFFSET;
        ctx->adev = adev;
        ctx->cell_start = cfg->cell_start;
        ctx->cell_ready = cfg->cell_ready;
        ctx->buttress_boot_offset = cfg->buttress_boot_offset;
        ctx->base_addr  = base;

        /*
         * Allocate DMA mapped memory. Allocate one big chunk.
         */
        /* Base cfg for FW */
        conf_size = roundup(sizeof(struct ipu6_fw_syscom_config), 8);
        /* Descriptions of the queues */
        inq_size = size_mul(cfg->num_input_queues,
                            sizeof(struct ipu6_fw_sys_queue));
        outq_size = size_mul(cfg->num_output_queues,
                             sizeof(struct ipu6_fw_sys_queue));
        /* FW specific information structure */
        specific_size = roundup(cfg->specific_size, 8);

        sizeall = conf_size + inq_size + outq_size + specific_size;

        for (i = 0; i < cfg->num_input_queues; i++)
                sizeinput += size_mul(cfg->input[i].queue_size + 1,
                                      cfg->input[i].token_size);

        for (i = 0; i < cfg->num_output_queues; i++)
                sizeoutput += size_mul(cfg->output[i].queue_size + 1,
                                       cfg->output[i].token_size);

        sizeall += sizeinput + sizeoutput;

        ctx->dma_buffer = ipu6_dma_alloc(adev, sizeall, &ctx->dma_addr,
                                         GFP_KERNEL, 0);
        if (!ctx->dma_buffer) {
                dev_err(dev, "failed to allocate dma memory\n");
                kfree(ctx);
                return NULL;
        }

        ctx->dma_size = sizeall;

        config_host_addr = ctx->dma_buffer;
        ctx->config_vied_addr = ctx->dma_addr;

        offset = conf_size;
        ctx->input_queue = ctx->dma_buffer + offset;
        config_host_addr->input_queue = ctx->dma_addr + offset;
        config_host_addr->num_input_queues = cfg->num_input_queues;

        offset += inq_size;
        ctx->output_queue = ctx->dma_buffer + offset;
        config_host_addr->output_queue = ctx->dma_addr + offset;
        config_host_addr->num_output_queues = cfg->num_output_queues;

        /* copy firmware specific data */
        offset += outq_size;
        specific_host_addr = ctx->dma_buffer + offset;
        config_host_addr->specific_addr = ctx->dma_addr + offset;
        config_host_addr->specific_size = cfg->specific_size;
        if (cfg->specific_addr && cfg->specific_size)
                memcpy(specific_host_addr, cfg->specific_addr,
                       cfg->specific_size);

        ipu6_dma_sync_single(adev, ctx->config_vied_addr, sizeall);

        /* initialize input queues */
        offset += specific_size;
        res.reg = SYSCOM_QPR_BASE_REG;
        res.host_address = (uintptr_t)(ctx->dma_buffer + offset);
        res.vied_address = ctx->dma_addr + offset;
        for (i = 0; i < cfg->num_input_queues; i++)
                ipu6_sys_queue_init(ctx->input_queue + i,
                                    cfg->input[i].queue_size,
                                    cfg->input[i].token_size, &res);

        /* initialize output queues */
        offset += sizeinput;
        res.host_address = (uintptr_t)(ctx->dma_buffer + offset);
        res.vied_address = ctx->dma_addr + offset;
        for (i = 0; i < cfg->num_output_queues; i++) {
                ipu6_sys_queue_init(ctx->output_queue + i,
                                    cfg->output[i].queue_size,
                                    cfg->output[i].token_size, &res);
        }

        return ctx;
}
EXPORT_SYMBOL_NS_GPL(ipu6_fw_com_prepare, "INTEL_IPU6");

int ipu6_fw_com_open(struct ipu6_fw_com_context *ctx)
{
        /* write magic pattern to disable the tunit trace */
        writel(TUNIT_MAGIC_PATTERN, ctx->dmem_addr + TUNIT_CFG_DWR_REG * 4);
        /* Check if SP is in valid state */
        if (!ctx->cell_ready(ctx->adev))
                return -EIO;

        /* store syscom uninitialized command */
        writel(SYSCOM_COMMAND_UNINIT, ctx->dmem_addr + SYSCOM_COMMAND_REG * 4);

        /* store syscom uninitialized state */
        writel(SYSCOM_STATE_UNINIT,
               BUTTRESS_FW_BOOT_PARAM_REG(ctx->base_addr,
                                          ctx->buttress_boot_offset,
                                          SYSCOM_STATE_ID));

        /* store firmware configuration address */
        writel(ctx->config_vied_addr,
               BUTTRESS_FW_BOOT_PARAM_REG(ctx->base_addr,
                                          ctx->buttress_boot_offset,
                                          SYSCOM_CONFIG_ID));
        ctx->cell_start(ctx->adev);

        return 0;
}
EXPORT_SYMBOL_NS_GPL(ipu6_fw_com_open, "INTEL_IPU6");

int ipu6_fw_com_close(struct ipu6_fw_com_context *ctx)
{
        int state;

        state = readl(BUTTRESS_FW_BOOT_PARAM_REG(ctx->base_addr,
                                                 ctx->buttress_boot_offset,
                                                 SYSCOM_STATE_ID));
        if (state != SYSCOM_STATE_READY)
                return -EBUSY;

        /* set close request flag */
        writel(SYSCOM_COMMAND_INACTIVE, ctx->dmem_addr +
               SYSCOM_COMMAND_REG * 4);

        return 0;
}
EXPORT_SYMBOL_NS_GPL(ipu6_fw_com_close, "INTEL_IPU6");

int ipu6_fw_com_release(struct ipu6_fw_com_context *ctx, unsigned int force)
{
        /* check if release is forced, an verify cell state if it is not */
        if (!force && !ctx->cell_ready(ctx->adev))
                return -EBUSY;

        ipu6_dma_free(ctx->adev, ctx->dma_size,
                      ctx->dma_buffer, ctx->dma_addr, 0);
        kfree(ctx);
        return 0;
}
EXPORT_SYMBOL_NS_GPL(ipu6_fw_com_release, "INTEL_IPU6");

bool ipu6_fw_com_ready(struct ipu6_fw_com_context *ctx)
{
        int state;

        state = readl(BUTTRESS_FW_BOOT_PARAM_REG(ctx->base_addr,
                                                 ctx->buttress_boot_offset,
                                                 SYSCOM_STATE_ID));

        return state == SYSCOM_STATE_READY;
}
EXPORT_SYMBOL_NS_GPL(ipu6_fw_com_ready, "INTEL_IPU6");

void *ipu6_send_get_token(struct ipu6_fw_com_context *ctx, int q_nbr)
{
        struct ipu6_fw_sys_queue *q = &ctx->input_queue[q_nbr];
        void __iomem *q_dmem = ctx->dmem_addr + q->wr_reg * 4;
        unsigned int wr, rd;
        unsigned int packets;
        unsigned int index;

        wr = readl(q_dmem + FW_COM_WR_REG);
        rd = readl(q_dmem + FW_COM_RD_REG);

        if (WARN_ON_ONCE(wr >= q->size || rd >= q->size))
                return NULL;

        if (wr < rd)
                packets = rd - wr - 1;
        else
                packets = q->size - (wr - rd + 1);

        if (!packets)
                return NULL;

        index = readl(q_dmem + FW_COM_WR_REG);

        return (void *)((uintptr_t)q->host_address + index * q->token_size);
}
EXPORT_SYMBOL_NS_GPL(ipu6_send_get_token, "INTEL_IPU6");

void ipu6_send_put_token(struct ipu6_fw_com_context *ctx, int q_nbr)
{
        struct ipu6_fw_sys_queue *q = &ctx->input_queue[q_nbr];
        void __iomem *q_dmem = ctx->dmem_addr + q->wr_reg * 4;
        unsigned int wr = readl(q_dmem + FW_COM_WR_REG) + 1;

        if (wr >= q->size)
                wr = 0;

        writel(wr, q_dmem + FW_COM_WR_REG);
}
EXPORT_SYMBOL_NS_GPL(ipu6_send_put_token, "INTEL_IPU6");

void *ipu6_recv_get_token(struct ipu6_fw_com_context *ctx, int q_nbr)
{
        struct ipu6_fw_sys_queue *q = &ctx->output_queue[q_nbr];
        void __iomem *q_dmem = ctx->dmem_addr + q->wr_reg * 4;
        unsigned int wr, rd;
        unsigned int packets;

        wr = readl(q_dmem + FW_COM_WR_REG);
        rd = readl(q_dmem + FW_COM_RD_REG);

        if (WARN_ON_ONCE(wr >= q->size || rd >= q->size))
                return NULL;

        if (wr < rd)
                wr += q->size;

        packets = wr - rd;
        if (!packets)
                return NULL;

        return (void *)((uintptr_t)q->host_address + rd * q->token_size);
}
EXPORT_SYMBOL_NS_GPL(ipu6_recv_get_token, "INTEL_IPU6");

void ipu6_recv_put_token(struct ipu6_fw_com_context *ctx, int q_nbr)
{
        struct ipu6_fw_sys_queue *q = &ctx->output_queue[q_nbr];
        void __iomem *q_dmem = ctx->dmem_addr + q->wr_reg * 4;
        unsigned int rd = readl(q_dmem + FW_COM_RD_REG) + 1;

        if (rd >= q->size)
                rd = 0;

        writel(rd, q_dmem + FW_COM_RD_REG);
}
EXPORT_SYMBOL_NS_GPL(ipu6_recv_put_token, "INTEL_IPU6");