arch/arm/mm/cache-uniphier.c
// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Copyright (C) 2015-2016 Socionext Inc.
 *   Author: Masahiro Yamada <yamada.masahiro@socionext.com>
 */

#define pr_fmt(fmt)             "uniphier: " fmt

#include <linux/bitops.h>
#include <linux/init.h>
#include <linux/io.h>
#include <linux/log2.h>
#include <linux/of_address.h>
#include <linux/slab.h>
#include <asm/hardware/cache-uniphier.h>
#include <asm/outercache.h>

/* control registers */
#define UNIPHIER_SSCC           0x0     /* Control Register */
#define    UNIPHIER_SSCC_BST                    BIT(20) /* UCWG burst read */
#define    UNIPHIER_SSCC_ACT                    BIT(19) /* Inst-Data separate */
#define    UNIPHIER_SSCC_WTG                    BIT(18) /* WT gathering on */
#define    UNIPHIER_SSCC_PRD                    BIT(17) /* enable pre-fetch */
#define    UNIPHIER_SSCC_ON                     BIT(0)  /* enable cache */
#define UNIPHIER_SSCLPDAWCR     0x30    /* Unified/Data Active Way Control */
#define UNIPHIER_SSCLPIAWCR     0x34    /* Instruction Active Way Control */

/* revision registers */
#define UNIPHIER_SSCID          0x0     /* ID Register */

/* operation registers */
#define UNIPHIER_SSCOPE         0x244   /* Cache Operation Primitive Entry */
#define    UNIPHIER_SSCOPE_CM_INV               0x0     /* invalidate */
#define    UNIPHIER_SSCOPE_CM_CLEAN             0x1     /* clean */
#define    UNIPHIER_SSCOPE_CM_FLUSH             0x2     /* flush */
#define    UNIPHIER_SSCOPE_CM_SYNC              0x8     /* sync (drain bufs) */
#define    UNIPHIER_SSCOPE_CM_FLUSH_PREFETCH    0x9     /* flush p-fetch buf */
#define UNIPHIER_SSCOQM         0x248   /* Cache Operation Queue Mode */
#define    UNIPHIER_SSCOQM_S_MASK               (0x3 << 17)
#define    UNIPHIER_SSCOQM_S_RANGE              (0x0 << 17)
#define    UNIPHIER_SSCOQM_S_ALL                (0x1 << 17)
#define    UNIPHIER_SSCOQM_CE                   BIT(15) /* notify completion */
#define    UNIPHIER_SSCOQM_CM_INV               0x0     /* invalidate */
#define    UNIPHIER_SSCOQM_CM_CLEAN             0x1     /* clean */
#define    UNIPHIER_SSCOQM_CM_FLUSH             0x2     /* flush */
#define UNIPHIER_SSCOQAD        0x24c   /* Cache Operation Queue Address */
#define UNIPHIER_SSCOQSZ        0x250   /* Cache Operation Queue Size */
#define UNIPHIER_SSCOPPQSEF     0x25c   /* Cache Operation Queue Set Complete */
#define    UNIPHIER_SSCOPPQSEF_FE               BIT(1)
#define    UNIPHIER_SSCOPPQSEF_OE               BIT(0)
#define UNIPHIER_SSCOLPQS       0x260   /* Cache Operation Queue Status */
#define    UNIPHIER_SSCOLPQS_EF                 BIT(2)
#define    UNIPHIER_SSCOLPQS_EST                BIT(1)
#define    UNIPHIER_SSCOLPQS_QST                BIT(0)

/* Is the operation region specified by address range? */
#define UNIPHIER_SSCOQM_S_IS_RANGE(op) \
                (((op) & UNIPHIER_SSCOQM_S_MASK) == UNIPHIER_SSCOQM_S_RANGE)

/**
 * struct uniphier_cache_data - UniPhier outer cache specific data
 *
 * @ctrl_base: virtual base address of control registers
 * @rev_base: virtual base address of revision registers
 * @op_base: virtual base address of operation registers
 * @way_ctrl_base: virtual address of the way control registers for this
 *      SoC revision
 * @way_mask: each bit specifies if the way is present
 * @nsets: number of associativity sets
 * @line_size: line size in bytes
 * @range_op_max_size: max size that can be handled by a single range operation
 * @list: list node to include this level in the whole cache hierarchy
 */
struct uniphier_cache_data {
        void __iomem *ctrl_base;
        void __iomem *rev_base;
        void __iomem *op_base;
        void __iomem *way_ctrl_base;
        u32 way_mask;
        u32 nsets;
        u32 line_size;
        u32 range_op_max_size;
        struct list_head list;
};

/*
 * List of the whole outer cache hierarchy.  This list is only modified during
 * the early boot stage, so no lock is needed to access it.
 */
static LIST_HEAD(uniphier_cache_list);

/**
 * __uniphier_cache_sync - perform a sync point for a particular cache level
 *
 * @data: cache controller specific data
 */
static void __uniphier_cache_sync(struct uniphier_cache_data *data)
{
        /* This sequence need not be atomic.  Do not disable IRQ. */
        writel_relaxed(UNIPHIER_SSCOPE_CM_SYNC,
                       data->op_base + UNIPHIER_SSCOPE);
        /* need a read back to confirm */
        readl_relaxed(data->op_base + UNIPHIER_SSCOPE);
}

/**
 * __uniphier_cache_maint_common - run a queue operation for a particular level
 *
 * @data: cache controller specific data
 * @start: start address of range operation (don't care for "all" operation)
 * @size: data size of range operation (don't care for "all" operation)
 * @operation: flags to specify the desired cache operation
 */
static void __uniphier_cache_maint_common(struct uniphier_cache_data *data,
                                          unsigned long start,
                                          unsigned long size,
                                          u32 operation)
{
        unsigned long flags;

        /*
         * No spin lock is necessary here because:
         *
         * [1] This outer cache controller is able to accept maintenance
         * operations from multiple CPUs at a time in an SMP system; if a
         * maintenance operation is under way and another operation is issued,
         * the new one is stored in the queue.  The controller performs one
         * operation after another.  If the queue is full, the status register,
         * UNIPHIER_SSCOPPQSEF, indicates that the queue registration has
         * failed.  The status registers, UNIPHIER_{SSCOPPQSEF, SSCOLPQS}, have
         * different instances for each CPU, i.e. each CPU can track the status
         * of the maintenance operations triggered by itself.
         *
         * [2] The cache command registers, UNIPHIER_{SSCOQM, SSCOQAD, SSCOQSZ,
         * SSCOQWN}, are shared between multiple CPUs, but the hardware still
         * guarantees the registration sequence is atomic; write accesses to
         * them are arbitrated by the hardware.  The first accessor to the
         * register, UNIPHIER_SSCOQM, holds the access right and it is released
         * by reading the status register, UNIPHIER_SSCOPPQSEF.  While one CPU
         * is holding the access right, other CPUs fail to register operations.
         * One CPU should not hold the access right for a long time, so local
         * IRQs are disabled for the duration of the following sequence.
         */
        local_irq_save(flags);

        /* clear the complete notification flag */
        writel_relaxed(UNIPHIER_SSCOLPQS_EF, data->op_base + UNIPHIER_SSCOLPQS);

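        /* retry until the hardware accepts the queue registration */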
        do {
                /* set cache operation */
                writel_relaxed(UNIPHIER_SSCOQM_CE | operation,
                               data->op_base + UNIPHIER_SSCOQM);

                /* set address range if needed */
                if (likely(UNIPHIER_SSCOQM_S_IS_RANGE(operation))) {
                        writel_relaxed(start, data->op_base + UNIPHIER_SSCOQAD);
                        writel_relaxed(size, data->op_base + UNIPHIER_SSCOQSZ);
                }
        } while (unlikely(readl_relaxed(data->op_base + UNIPHIER_SSCOPPQSEF) &
                          (UNIPHIER_SSCOPPQSEF_FE | UNIPHIER_SSCOPPQSEF_OE)));

        /* wait until the operation is completed */
        while (likely(readl_relaxed(data->op_base + UNIPHIER_SSCOLPQS) !=
                      UNIPHIER_SSCOLPQS_EF))
                cpu_relax();

        local_irq_restore(flags);
}

static void __uniphier_cache_maint_all(struct uniphier_cache_data *data,
                                       u32 operation)
{
        __uniphier_cache_maint_common(data, 0, 0,
                                      UNIPHIER_SSCOQM_S_ALL | operation);

        __uniphier_cache_sync(data);
}

static void __uniphier_cache_maint_range(struct uniphier_cache_data *data,
                                         unsigned long start, unsigned long end,
                                         u32 operation)
{
        unsigned long size;

        /*
         * Align the start address down to a cache-line boundary so that a
         * misaligned start still gets its first cache line operated on
         * (e.g. with a 128-byte line, start 0x1005 is rounded down to 0x1000).
         */
        start = start & ~(data->line_size - 1);

        size = end - start;

        if (unlikely(size >= (unsigned long)(-data->line_size))) {
                /*
                 * The requested size is so large that rounding it up to a
                 * cache-line boundary would overflow; operate on the whole
                 * cache instead.
                 */
                __uniphier_cache_maint_all(data, operation);
                return;
        }

        /*
         * Align the size up to a cache-line boundary so that a misaligned
         * end address still gets its last cache line operated on.
         */
        size = ALIGN(size, data->line_size);

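        /* split the range into chunks the queue can accept in one operation */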
        while (size) {
                unsigned long chunk_size = min_t(unsigned long, size,
                                                 data->range_op_max_size);

                __uniphier_cache_maint_common(data, start, chunk_size,
                                        UNIPHIER_SSCOQM_S_RANGE | operation);

                start += chunk_size;
                size -= chunk_size;
        }

        __uniphier_cache_sync(data);
}

static void __uniphier_cache_enable(struct uniphier_cache_data *data, bool on)
{
        u32 val = 0;

        if (on)
                val = UNIPHIER_SSCC_WTG | UNIPHIER_SSCC_PRD | UNIPHIER_SSCC_ON;

        writel_relaxed(val, data->ctrl_base + UNIPHIER_SSCC);
}

static void __init __uniphier_cache_set_active_ways(
                                        struct uniphier_cache_data *data)
{
        unsigned int cpu;

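        /* each CPU has its own way-enable register, at a 4-byte stride */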
        for_each_possible_cpu(cpu)
                writel_relaxed(data->way_mask, data->way_ctrl_base + 4 * cpu);
}

static void uniphier_cache_maint_range(unsigned long start, unsigned long end,
                                       u32 operation)
{
        struct uniphier_cache_data *data;

        list_for_each_entry(data, &uniphier_cache_list, list)
                __uniphier_cache_maint_range(data, start, end, operation);
}

static void uniphier_cache_maint_all(u32 operation)
{
        struct uniphier_cache_data *data;

        list_for_each_entry(data, &uniphier_cache_list, list)
                __uniphier_cache_maint_all(data, operation);
}

static void uniphier_cache_inv_range(unsigned long start, unsigned long end)
{
        uniphier_cache_maint_range(start, end, UNIPHIER_SSCOQM_CM_INV);
}

static void uniphier_cache_clean_range(unsigned long start, unsigned long end)
{
        uniphier_cache_maint_range(start, end, UNIPHIER_SSCOQM_CM_CLEAN);
}

static void uniphier_cache_flush_range(unsigned long start, unsigned long end)
{
        uniphier_cache_maint_range(start, end, UNIPHIER_SSCOQM_CM_FLUSH);
}

static void __init uniphier_cache_inv_all(void)
{
        uniphier_cache_maint_all(UNIPHIER_SSCOQM_CM_INV);
}

static void uniphier_cache_flush_all(void)
{
        uniphier_cache_maint_all(UNIPHIER_SSCOQM_CM_FLUSH);
}

static void uniphier_cache_disable(void)
{
        struct uniphier_cache_data *data;

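        /* disable all levels first so nothing new is allocated, then flush */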
        list_for_each_entry_reverse(data, &uniphier_cache_list, list)
                __uniphier_cache_enable(data, false);

        uniphier_cache_flush_all();
}

static void __init uniphier_cache_enable(void)
{
        struct uniphier_cache_data *data;

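        /* invalidate potentially stale contents before enabling any level */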
        uniphier_cache_inv_all();

        list_for_each_entry(data, &uniphier_cache_list, list) {
                __uniphier_cache_enable(data, true);
                __uniphier_cache_set_active_ways(data);
        }
}

static void uniphier_cache_sync(void)
{
        struct uniphier_cache_data *data;

        list_for_each_entry(data, &uniphier_cache_list, list)
                __uniphier_cache_sync(data);
}

static const struct of_device_id uniphier_cache_match[] __initconst = {
        { .compatible = "socionext,uniphier-system-cache" },
        { /* sentinel */ }
};
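
/*
 * A minimal sketch of the device-tree node this initializer parses.  The
 * property values below are illustrative only (loosely modeled on the
 * uniphier-system-cache binding), not taken from any specific board:
 *
 *      l2: cache-controller@500c0000 {
 *              compatible = "socionext,uniphier-system-cache";
 *              reg = <0x500c0000 0x2000>,      // control registers
 *                    <0x503c0100 0x4>,         // revision register
 *                    <0x506c0000 0x400>;       // operation registers
 *              cache-unified;
 *              cache-size = <0x80000>;
 *              cache-sets = <256>;
 *              cache-line-size = <128>;
 *              cache-level = <2>;
 *              next-level-cache = <&l3>;
 *      };
 *
 * The three "reg" regions are mapped to ctrl_base, rev_base, and op_base,
 * in that order, and "next-level-cache" is followed to probe L3 and beyond.
 */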

static int __init __uniphier_cache_init(struct device_node *np,
                                        unsigned int *cache_level)
{
        struct uniphier_cache_data *data;
        u32 level, cache_size;
        struct device_node *next_np;
        int ret = 0;

        if (!of_match_node(uniphier_cache_match, np)) {
                pr_err("L%d: not compatible with uniphier cache\n",
                       *cache_level);
                return -EINVAL;
        }

        if (of_property_read_u32(np, "cache-level", &level)) {
                pr_err("L%d: cache-level is not specified\n", *cache_level);
                return -EINVAL;
        }

        if (level != *cache_level) {
                pr_err("L%d: cache-level is unexpected value %d\n",
                       *cache_level, level);
                return -EINVAL;
        }

        if (!of_property_read_bool(np, "cache-unified")) {
                pr_err("L%d: cache-unified is not specified\n", *cache_level);
                return -EINVAL;
        }

        data = kzalloc(sizeof(*data), GFP_KERNEL);
        if (!data)
                return -ENOMEM;

        if (of_property_read_u32(np, "cache-line-size", &data->line_size) ||
            !is_power_of_2(data->line_size)) {
                pr_err("L%d: cache-line-size is unspecified or invalid\n",
                       *cache_level);
                ret = -EINVAL;
                goto err;
        }

        if (of_property_read_u32(np, "cache-sets", &data->nsets) ||
            !is_power_of_2(data->nsets)) {
                pr_err("L%d: cache-sets is unspecified or invalid\n",
                       *cache_level);
                ret = -EINVAL;
                goto err;
        }

        if (of_property_read_u32(np, "cache-size", &cache_size) ||
            cache_size == 0 || cache_size % (data->nsets * data->line_size)) {
                pr_err("L%d: cache-size is unspecified or invalid\n",
                       *cache_level);
                ret = -EINVAL;
                goto err;
        }

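        /* one bit per way: number of ways = cache-size / (sets * line-size) */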
        data->way_mask = GENMASK(cache_size / data->nsets / data->line_size - 1,
                                 0);

        data->ctrl_base = of_iomap(np, 0);
        if (!data->ctrl_base) {
                pr_err("L%d: failed to map control register\n", *cache_level);
                ret = -ENOMEM;
                goto err;
        }

        data->rev_base = of_iomap(np, 1);
        if (!data->rev_base) {
                pr_err("L%d: failed to map revision register\n", *cache_level);
                ret = -ENOMEM;
                goto err;
        }

        data->op_base = of_iomap(np, 2);
        if (!data->op_base) {
                pr_err("L%d: failed to map operation register\n", *cache_level);
                ret = -ENOMEM;
                goto err;
        }

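        /* default way control offset; overridden below for some L2 revisions */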
        data->way_ctrl_base = data->ctrl_base + 0xc00;

        if (*cache_level == 2) {
                u32 revision = readl(data->rev_base + UNIPHIER_SSCID);
                /*
                 * The size of range operation is limited to (1 << 22) or less
                 * for PH-sLD8 or older SoCs.
                 */
                if (revision <= 0x16)
                        data->range_op_max_size = (u32)1 << 22;

                /*
                 * Unfortunately, the offset address of active way control base
                 * varies from SoC to SoC.
                 */
                switch (revision) {
                case 0x11:      /* sLD3 */
                        data->way_ctrl_base = data->ctrl_base + 0x870;
                        break;
                case 0x12:      /* LD4 */
                case 0x16:      /* sLD8 */
                        data->way_ctrl_base = data->ctrl_base + 0x840;
                        break;
                default:
                        break;
                }
        }

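        /*
         * Note: when no explicit limit was set above, range_op_max_size is
         * still zero here, so this unsigned subtraction wraps around to a
         * large, line-aligned maximum.
         */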
        data->range_op_max_size -= data->line_size;

        INIT_LIST_HEAD(&data->list);
        list_add_tail(&data->list, &uniphier_cache_list); /* no mutex */

        /*
         * OK, this level has been successfully initialized.  Look for the next
         * level cache.  Do not roll back even if the initialization of the
         * next level cache fails because we want to continue with available
         * cache levels.
         */
        next_np = of_find_next_cache_node(np);
        if (next_np) {
                (*cache_level)++;
                ret = __uniphier_cache_init(next_np, cache_level);
        }
        of_node_put(next_np);

        return ret;
err:
        iounmap(data->op_base);
        iounmap(data->rev_base);
        iounmap(data->ctrl_base);
        kfree(data);

        return ret;
}

int __init uniphier_cache_init(void)
{
        struct device_node *np = NULL;
        unsigned int cache_level;
        int ret = 0;

        /* look for level 2 cache */
        while ((np = of_find_matching_node(np, uniphier_cache_match)))
                if (!of_property_read_u32(np, "cache-level", &cache_level) &&
                    cache_level == 2)
                        break;

        if (!np)
                return -ENODEV;

        ret = __uniphier_cache_init(np, &cache_level);
        of_node_put(np);

        if (ret) {
                /*
                 * Error out only if L2 initialization fails.  Continue with
                 * any error on L3 or outer levels because they are optional.
                 */
                if (cache_level == 2) {
                        pr_err("failed to initialize L2 cache\n");
                        return ret;
                }

                cache_level--;
                ret = 0;
        }

        outer_cache.inv_range = uniphier_cache_inv_range;
        outer_cache.clean_range = uniphier_cache_clean_range;
        outer_cache.flush_range = uniphier_cache_flush_range;
        outer_cache.flush_all = uniphier_cache_flush_all;
        outer_cache.disable = uniphier_cache_disable;
        outer_cache.sync = uniphier_cache_sync;

        uniphier_cache_enable();

        pr_info("enabled outer cache (cache level: %d)\n", cache_level);

        return ret;
}