root/sys/compat/linuxkpi/common/src/linux_radix.c
/*-
 * Copyright (c) 2010 Isilon Systems, Inc.
 * Copyright (c) 2010 iX Systems, Inc.
 * Copyright (c) 2010 Panasas, Inc.
 * Copyright (c) 2013-2020 Mellanox Technologies, Ltd.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice unmodified, this list of conditions, and the following
 *    disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/malloc.h>
#include <sys/kernel.h>
#include <sys/sysctl.h>

#include <linux/slab.h>
#include <linux/kernel.h>
#include <linux/radix-tree.h>
#include <linux/err.h>

static MALLOC_DEFINE(M_RADIX, "radix", "Linux radix compat");

static inline unsigned long
radix_max(const struct radix_tree_root *root)
{
        return ((1UL << (root->height * RADIX_TREE_MAP_SHIFT)) - 1UL);
}

static inline int
radix_pos(long id, int height)
{
        return (id >> (RADIX_TREE_MAP_SHIFT * height)) & RADIX_TREE_MAP_MASK;
}

static inline int
root_tag_get(const struct radix_tree_root *root, unsigned tag)
{
        return (test_bit(tag, root->tags));
}

static inline void
root_tag_set(struct radix_tree_root *root, unsigned tag)
{
        set_bit(tag, root->tags);
}

static inline void
root_tag_clear(struct radix_tree_root *root, unsigned tag)
{
        clear_bit(tag, root->tags);
}

static inline int
tag_get(const struct radix_tree_node *node, unsigned int tag, int pos)
{
        return (test_bit(pos, node->tags[tag]));
}

static inline void
tag_set(struct radix_tree_node *node, unsigned int tag, int pos)
{
        set_bit(pos, node->tags[tag]);
}

static inline void
tag_clear(struct radix_tree_node *node, unsigned int tag, int pos)
{
        clear_bit(pos, node->tags[tag]);
}

static inline bool
any_tag_set(const struct radix_tree_node *node, unsigned int tag)
{
        unsigned int pos;

        for (pos = 0; pos < RADIX_TREE_TAG_LONGS; pos++)
                if (node->tags[tag][pos])
                        return (true);

        return (false);
}

static void
node_tag_clear(struct radix_tree_root *root, struct radix_tree_node *stack[],
    unsigned long index, unsigned int tag)
{
        struct radix_tree_node *node;
        int height, pos;

        height = 1;
        node = stack[height];

        while (node && height <= root->height - 1) {
                pos = radix_pos(index, height);
                if (!tag_get(node, tag, pos))
                        return;

                tag_clear(node, tag, pos);
                if (any_tag_set(node, tag))
                        return;

                height++;
                node = stack[height];
        }

        if (root_tag_get(root, tag))
                root_tag_clear(root, tag);
}

static void
radix_tree_clean_root_node(struct radix_tree_root *root)
{
        /* Check if the root node should be freed */
        if (root->rnode->count == 0) {
                free(root->rnode, M_RADIX);
                root->rnode = NULL;
                root->height = 0;
        }
}

void *
radix_tree_lookup(const struct radix_tree_root *root, unsigned long index)
{
        struct radix_tree_node *node;
        void *item;
        int height;

        item = NULL;
        node = root->rnode;
        height = root->height - 1;
        if (index > radix_max(root))
                goto out;
        while (height && node)
                node = node->slots[radix_pos(index, height--)];
        if (node)
                item = node->slots[radix_pos(index, 0)];

out:
        return (item);
}

unsigned int
radix_tree_gang_lookup(const struct radix_tree_root *root, void **results,
    unsigned long first_index, unsigned int max_items)
{
        struct radix_tree_iter iter;
        void **slot;
        int count;

        count = 0;
        if (max_items == 0)
                return (count);

        radix_tree_for_each_slot(slot, root, &iter, first_index) {
                results[count] = *slot;
                if (results[count] == NULL)
                        continue;

                count++;
                if (count == max_items)
                        break;
        }

        return (count);
}

unsigned int
radix_tree_gang_lookup_tag(const struct radix_tree_root *root,
    void **results, unsigned long first_index, unsigned int max_items,
    unsigned int tag)
{
        struct radix_tree_iter iter;
        void **slot;
        int count;

        count = 0;
        if (max_items == 0)
                return (count);

        radix_tree_for_each_slot_tagged(slot, root, &iter, first_index, tag) {
                results[count] = *slot;
                if (results[count] == NULL)
                        continue;

                count++;
                if (count == max_items)
                        break;
        }

        return (count);
}

bool
radix_tree_iter_find(const struct radix_tree_root *root,
    struct radix_tree_iter *iter, void ***pppslot, int flags)
{
        struct radix_tree_node *node;
        unsigned long index = iter->index;
        unsigned int tag;
        int height;

        tag = flags & RADIX_TREE_ITER_TAG_MASK;
        if ((flags & RADIX_TREE_ITER_TAGGED) && !root_tag_get(root, tag))
                return (false);

restart:
        node = root->rnode;
        if (node == NULL)
                return (false);
        height = root->height - 1;
        if (height == -1 || index > radix_max(root))
                return (false);
        do {
                unsigned long mask = RADIX_TREE_MAP_MASK << (RADIX_TREE_MAP_SHIFT * height);
                unsigned long step = 1UL << (RADIX_TREE_MAP_SHIFT * height);
                int pos = radix_pos(index, height);
                struct radix_tree_node *next;

                /* track last slot */
                *pppslot = node->slots + pos;

                next = node->slots[pos];
                if (next == NULL ||
                    (flags & RADIX_TREE_ITER_TAGGED &&
                     !tag_get(next, tag, pos))) {
                        index += step;
                        index &= -step;
                        if ((index & mask) == 0)
                                goto restart;
                } else {
                        node = next;
                        height--;
                }
        } while (height != -1);
        iter->index = index;
        return (true);
}

void *
radix_tree_delete(struct radix_tree_root *root, unsigned long index)
{
        struct radix_tree_node *stack[RADIX_TREE_MAX_HEIGHT];
        struct radix_tree_node *node;
        void *item;
        int height;
        int idx;
        int tag;

        item = NULL;
        node = root->rnode;
        height = root->height - 1;
        if (index > radix_max(root))
                goto out;
        /*
         * Find the node and record the path in stack.
         */
        while (height && node) {
                stack[height] = node;
                node = node->slots[radix_pos(index, height--)];
        }

        if (node) {
                idx = radix_pos(index, 0);
                item = node->slots[idx];

                for (tag = 0; tag < RADIX_TREE_MAX_TAGS; tag++)
                        node_tag_clear(root, stack, index, tag);
        }

        /*
         * If we removed something reduce the height of the tree.
         */
        if (item)
                for (;;) {
                        node->slots[idx] = NULL;
                        node->count--;
                        if (node->count > 0)
                                break;
                        free(node, M_RADIX);
                        if (node == root->rnode) {
                                root->rnode = NULL;
                                root->height = 0;
                                break;
                        }
                        height++;
                        node = stack[height];
                        idx = radix_pos(index, height);
                }
out:
        return (item);
}

void
radix_tree_iter_delete(struct radix_tree_root *root,
    struct radix_tree_iter *iter, void **slot)
{
        radix_tree_delete(root, iter->index);
}

int
radix_tree_insert(struct radix_tree_root *root, unsigned long index, void *item)
{
        struct radix_tree_node *node;
        struct radix_tree_node *temp[RADIX_TREE_MAX_HEIGHT - 1];
        int height;
        int idx;

        /* bail out upon insertion of a NULL item */
        if (item == NULL)
                return (-EINVAL);

        /* get root node, if any */
        node = root->rnode;

        /* allocate root node, if any */
        if (node == NULL) {
                node = malloc(sizeof(*node), M_RADIX, root->gfp_mask | M_ZERO);
                if (node == NULL)
                        return (-ENOMEM);
                root->rnode = node;
                root->height++;
        }

        /* expand radix tree as needed */
        while (radix_max(root) < index) {
                /* check if the radix tree is getting too big */
                if (root->height == RADIX_TREE_MAX_HEIGHT) {
                        radix_tree_clean_root_node(root);
                        return (-E2BIG);
                }

                /*
                 * If the root radix level is not empty, we need to
                 * allocate a new radix level:
                 */
                if (node->count != 0) {
                        node = malloc(sizeof(*node), M_RADIX, root->gfp_mask | M_ZERO);
                        if (node == NULL) {
                                /*
                                 * Freeing the already allocated radix
                                 * levels, if any, will be handled by
                                 * the radix_tree_delete() function.
                                 * This code path can only happen when
                                 * the tree is not empty.
                                 */
                                return (-ENOMEM);
                        }
                        node->slots[0] = root->rnode;
                        node->count++;
                        root->rnode = node;
                }
                root->height++;
        }

        /* get radix tree height index */
        height = root->height - 1;

        /* walk down the tree until the first missing node, if any */
        for ( ; height != 0; height--) {
                idx = radix_pos(index, height);
                if (node->slots[idx] == NULL)
                        break;
                node = node->slots[idx];
        }

        /* allocate the missing radix levels, if any */
        for (idx = 0; idx != height; idx++) {
                temp[idx] = malloc(sizeof(*node), M_RADIX,
                    root->gfp_mask | M_ZERO);
                if (temp[idx] == NULL) {
                        while (idx--)
                                free(temp[idx], M_RADIX);
                        radix_tree_clean_root_node(root);
                        return (-ENOMEM);
                }
        }

        /* setup new radix levels, if any */
        for ( ; height != 0; height--) {
                idx = radix_pos(index, height);
                node->slots[idx] = temp[height - 1];
                node->count++;
                node = node->slots[idx];
        }

        /*
         * Insert and adjust count if the item does not already exist.
         */
        idx = radix_pos(index, 0);
        if (node->slots[idx])
                return (-EEXIST);
        node->slots[idx] = item;
        node->count++;

        return (0);
}

int
radix_tree_store(struct radix_tree_root *root, unsigned long index, void **ppitem)
{
        struct radix_tree_node *node;
        struct radix_tree_node *temp[RADIX_TREE_MAX_HEIGHT - 1];
        void *pitem;
        int height;
        int idx;

        /*
         * Inserting a NULL item means delete it. The old pointer is
         * stored at the location pointed to by "ppitem".
         */
        if (*ppitem == NULL) {
                *ppitem = radix_tree_delete(root, index);
                return (0);
        }

        /* get root node, if any */
        node = root->rnode;

        /* allocate root node, if any */
        if (node == NULL) {
                node = malloc(sizeof(*node), M_RADIX, root->gfp_mask | M_ZERO);
                if (node == NULL)
                        return (-ENOMEM);
                root->rnode = node;
                root->height++;
        }

        /* expand radix tree as needed */
        while (radix_max(root) < index) {
                /* check if the radix tree is getting too big */
                if (root->height == RADIX_TREE_MAX_HEIGHT) {
                        radix_tree_clean_root_node(root);
                        return (-E2BIG);
                }

                /*
                 * If the root radix level is not empty, we need to
                 * allocate a new radix level:
                 */
                if (node->count != 0) {
                        node = malloc(sizeof(*node), M_RADIX, root->gfp_mask | M_ZERO);
                        if (node == NULL) {
                                /*
                                 * Freeing the already allocated radix
                                 * levels, if any, will be handled by
                                 * the radix_tree_delete() function.
                                 * This code path can only happen when
                                 * the tree is not empty.
                                 */
                                return (-ENOMEM);
                        }
                        node->slots[0] = root->rnode;
                        node->count++;
                        root->rnode = node;
                }
                root->height++;
        }

        /* get radix tree height index */
        height = root->height - 1;

        /* walk down the tree until the first missing node, if any */
        for ( ; height != 0; height--) {
                idx = radix_pos(index, height);
                if (node->slots[idx] == NULL)
                        break;
                node = node->slots[idx];
        }

        /* allocate the missing radix levels, if any */
        for (idx = 0; idx != height; idx++) {
                temp[idx] = malloc(sizeof(*node), M_RADIX,
                    root->gfp_mask | M_ZERO);
                if (temp[idx] == NULL) {
                        while (idx--)
                                free(temp[idx], M_RADIX);
                        radix_tree_clean_root_node(root);
                        return (-ENOMEM);
                }
        }

        /* setup new radix levels, if any */
        for ( ; height != 0; height--) {
                idx = radix_pos(index, height);
                node->slots[idx] = temp[height - 1];
                node->count++;
                node = node->slots[idx];
        }

        /*
         * Insert and adjust count if the item does not already exist.
         */
        idx = radix_pos(index, 0);
        /* swap */
        pitem = node->slots[idx];
        node->slots[idx] = *ppitem;
        *ppitem = pitem;

        if (pitem == NULL)
                node->count++;
        return (0);
}

void *
radix_tree_tag_set(struct radix_tree_root *root, unsigned long index,
    unsigned int tag)
{
        struct radix_tree_node *node;
        void *item;
        int height, pos;

        item = NULL;
        node = root->rnode;
        height = root->height - 1;
        if (index > radix_max(root))
                goto out;

        while (height) {
                KASSERT(
                    node != NULL,
                    ("Node at index %lu does not exist in radix tree %p",
                    index, root));

                pos = radix_pos(index, height--);
                node = node->slots[pos];

                if (!tag_get(node, tag, pos))
                        tag_set(node, tag, pos);
        }

        item = node->slots[radix_pos(index, 0)];

        root_tag_set(root, tag);

out:
        return (item);
}

void *
radix_tree_tag_clear(struct radix_tree_root *root,
    unsigned long index, unsigned int tag)
{
        struct radix_tree_node *stack[RADIX_TREE_MAX_HEIGHT];
        struct radix_tree_node *node;
        void *item;
        int height;

        item = NULL;
        node = root->rnode;
        height = root->height - 1;
        if (index > radix_max(root))
                goto out;

        while (height && node) {
                stack[height] = node;
                node = node->slots[radix_pos(index, height--)];
        }

        if (node) {
                item = node->slots[radix_pos(index, 0)];

                node_tag_clear(root, stack, index, tag);
        }

out:
        return (item);
}

int
radix_tree_tagged(const struct radix_tree_root *root, unsigned int tag)
{
        return (root_tag_get(root, tag));
}