root/usr/src/psm/stand/boot/common/heap_kmem.c
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License, Version 1.0 only
 * (the "License").  You may not use this file except in compliance
 * with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2005 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

#if 1
#undef DEBUG
#endif

/*  #define     DEBUG ON */

/*
 * Conditions on use:
 * kmem_alloc and kmem_free must not be called from interrupt level,
 * except from software interrupt level.  This is because they are
 * not reentrant, and only block out software interrupts.  They take
 * too long to block any real devices.  There is a routine
 * kmem_free_intr that can be used to free blocks at interrupt level,
 * but only up to splimp, not higher.  This is because kmem_free_intr
 * only spl's to splimp.
 *
 * Also, these routines are not that fast, so they should not be used
 * in very frequent operations (e.g. operations that happen more often
 * than, say, once every few seconds).
 */

/*
 * description:
 *      Yet another memory allocator, this one based on a method
 *      described in C.J. Stephenson, "Fast Fits", IBM Sys. Journal
 *
 *      The basic data structure is a "Cartesian" binary tree, in which
 *      nodes are ordered by ascending addresses (thus minimizing free
 *      list insertion time) and block sizes decrease with depth in the
 *      tree (thus minimizing search time for a block of a given size).
 *
 *      In other words, for any node s, letting D(s) denote
 *      the set of descendents of s, we have:
 *
 *      a. addr(D(left(s))) <  addr(s) <  addr(D(right(s)))
 *      b. len(D(left(s)))  <= len(s)  >= len(D(right(s)))
 */

#include <sys/param.h>
#include <sys/sysmacros.h>
#include <sys/salib.h>
#include <sys/saio.h>
#include <sys/promif.h>

/*
 * The node header structure.
 *
 * To reduce storage consumption, a header block is associated with
 * free blocks only, not allocated blocks.
 * When a free block is allocated, its header block is put on
 * a free header block list.
 *
 * This creates a header space and a free block space.
 * The left pointer of a header blocks is used to chain free header
 * blocks together.
 */

typedef enum {false, true} bool;
typedef struct  freehdr *Freehdr;
typedef struct  dblk    *Dblk;

/*
 * Description of a header for a free block
 * Only free blocks have such headers.
 */
struct  freehdr {
        Freehdr left;                   /* Left tree pointer */
        Freehdr right;                  /* Right tree pointer */
        Dblk    block;                  /* Ptr to the data block */
        size_t  size;                   /* Size of the data block */
};

#define NIL             ((Freehdr) 0)
#define WORDSIZE        sizeof (int)
#define SMALLEST_BLK    1               /* Size of smallest block */

/*
 * Description of a data block.
 */
struct  dblk    {
        char    data[1];                /* Addr returned to the caller */
};

/*
 * weight(x) is the size of a block, in bytes; or 0 if and only if x
 *      is a null pointer. It is the responsibility of kmem_alloc() and
 *      kmem_free() to keep zero-length blocks out of the arena.
 */

#define weight(x)       ((x) == NIL? 0: (x->size))
#define nextblk(p, size) ((Dblk) ((char *)(p) + (size)))
#define max(a, b)       ((a) < (b)? (b): (a))

void            *kmem_alloc(size_t, int);
void            kmem_free(void *ptr, size_t nbytes);
Freehdr         getfreehdr(void);
static bool     morecore(size_t);
void            insert(Dblk p, size_t len, Freehdr *tree);
void            freehdr(Freehdr p);
void            delete(Freehdr *p);
static void     check_need_to_free(void);
extern caddr_t  resalloc(enum RESOURCES, size_t, caddr_t, int);
#ifdef  __sparc
extern void     resalloc_init(void);
#endif
extern int      splnet(void);
extern int      splimp(void);
extern void     splx(int);

/*
 * Structure containing various info about allocated memory.
 */
#define NEED_TO_FREE_SIZE       5
struct kmem_info {
        Freehdr free_root;
        Freehdr free_hdr_list;
        struct map *map;
        struct pte *pte;
        caddr_t vaddr;
        struct need_to_free {
                caddr_t addr;
                size_t  nbytes;
        } need_to_free_list, need_to_free[NEED_TO_FREE_SIZE];
} kmem_info;


struct map *kernelmap;

#ifdef DEBUG
static void prtree(Freehdr, char *);
#endif

/*
 * Initialize kernel memory allocator
 */

void
kmem_init(void)
{
        int i;
        struct need_to_free *ntf;

#ifdef DEBUG
printf("kmem_init entered\n");
#endif

#ifdef __sparc
        resalloc_init();
#endif

        kmem_info.free_root = NIL;
        kmem_info.free_hdr_list = NULL;
        kmem_info.map = kernelmap;
        kmem_info.need_to_free_list.addr = 0;
        ntf = kmem_info.need_to_free;
        for (i = 0; i < NEED_TO_FREE_SIZE; i++) {
                ntf[i].addr = 0;
        }
#ifdef DEBUG
printf("kmem_init returning\n");
prtree(kmem_info.free_root, "kmem_init");
#endif
}

/*
 * Insert a new node in a cartesian tree or subtree, placing it
 *      in the correct position with respect to the existing nodes.
 *
 * algorithm:
 *      Starting from the root, a binary search is made for the new
 *      node. If this search were allowed to continue, it would
 *      eventually fail (since there cannot already be a node at the
 *      given address); but in fact it stops when it reaches a node in
 *      the tree which has a length less than that of the new node (or
 *      when it reaches a null tree pointer).  The new node is then
 *      inserted at the root of the subtree for which the shorter node
 *      forms the old root (or in place of the null pointer).
 */


void
insert(Dblk p,          /* Ptr to the block to insert */
    size_t len,         /* Length of new node */
    Freehdr *tree)      /* Address of ptr to root */
{
        Freehdr x;
        Freehdr *left_hook;     /* Temp for insertion */
        Freehdr *right_hook;    /* Temp for insertion */
        Freehdr newhdr;

        x = *tree;
        /*
         * Search for the first node which has a weight less
         *      than that of the new node; this will be the
         *      point at which we insert the new node.
         */

        while (weight(x) >= len) {
                if (p < x->block)
                        tree = &x->left;
                else
                        tree = &x->right;
                x = *tree;
        }

        /*
         * Perform root insertion. The variable x traces a path through
         *      the tree, and with the help of left_hook and right_hook,
         *      rewrites all links that cross the territory occupied
         *      by p.  Note that this improves performance under
         *      paging.
         */

        newhdr = getfreehdr();
        *tree = newhdr;
        left_hook = &newhdr->left;
        right_hook = &newhdr->right;

        newhdr->left = NIL;
        newhdr->right = NIL;
        newhdr->block = p;
        newhdr->size = len;

        while (x != NIL) {
                /*
                 * Remark:
                 *      The name 'left_hook' is somewhat confusing, since
                 *      it is always set to the address of a .right link
                 *      field.  However, its value is always an address
                 *      below (i.e., to the left of) p. Similarly
                 *      for right_hook. The values of left_hook and
                 *      right_hook converge toward the value of p,
                 *      as in a classical binary search.
                 */
                if (x->block < p) {
                        /*
                         * rewrite link crossing from the left
                         */
                        *left_hook = x;
                        left_hook = &x->right;
                        x = x->right;
                } else {
                        /*
                         * rewrite link crossing from the right
                         */
                        *right_hook = x;
                        right_hook = &x->left;
                        x = x->left;
                } /* else */
        } /* while */

        *left_hook = *right_hook = NIL;         /* clear remaining hooks */

} /* insert */


/*
 * Delete a node from a cartesian tree. p is the address of
 *      a pointer to the node which is to be deleted.
 *
 * algorithm:
 *      The left and right sons of the node to be deleted define two
 *      subtrees which are to be merged and attached in place of the
 *      deleted node.  Each node on the inside edges of these two
 *      subtrees is examined and longer nodes are placed above the
 *      shorter ones.
 *
 * On entry:
 *      *p is assumed to be non-null.
 */

void
delete(Freehdr *p)
{
        Freehdr x;
        Freehdr left_branch;    /* left subtree of deleted node */
        Freehdr right_branch;   /* right subtree of deleted node */

        x = *p;
        left_branch = x->left;
        right_branch = x->right;

        while (left_branch != right_branch) {
                /*
                 * iterate until left branch and right branch are
                 * both NIL.
                 */
                if (weight(left_branch) >= weight(right_branch)) {
                        /*
                         * promote the left branch
                         */
                        *p = left_branch;
                        p = &left_branch->right;
                        left_branch = left_branch->right;
                } else {
                        /*
                         * promote the right branch
                         */
                        *p = right_branch;
                        p = &right_branch->left;
                        right_branch = right_branch->left;
                } /* else */
        } /* while */
        *p = NIL;
        freehdr(x);
} /* delete */


/*
 * Demote a node in a cartesian tree, if necessary, to establish
 *      the required vertical ordering.
 *
 * algorithm:
 *      The left and right subtrees of the node to be demoted are to
 *      be partially merged and attached in place of the demoted node.
 *      The nodes on the inside edges of these two subtrees are
 *      examined and the longer nodes are placed above the shorter
 *      ones, until a node is reached which has a length no greater
 *      than that of the node being demoted (or until a null pointer
 *      is reached).  The node is then attached at this point, and
 *      the remaining subtrees (if any) become its descendants.
 *
 * on entry:
 *   a. All the nodes in the tree, including the one to be demoted,
 *      must be correctly ordered horizontally;
 *   b. All the nodes except the one to be demoted must also be
 *      correctly positioned vertically.  The node to be demoted
 *      may be already correctly positioned vertically, or it may
 *      have a length which is less than that of one or both of
 *      its progeny.
 *   c. *p is non-null
 */


static void
demote(Freehdr *p)
{
        Freehdr x;              /* addr of node to be demoted */
        Freehdr left_branch;
        Freehdr right_branch;
        size_t    wx;

        x = *p;
        left_branch = x->left;
        right_branch = x->right;
        wx = weight(x);

        while (weight(left_branch) > wx || weight(right_branch) > wx) {
                /*
                 * select a descendant branch for promotion
                 */
                if (weight(left_branch) >= weight(right_branch)) {
                        /*
                         * promote the left branch
                         */
                        *p = left_branch;
                        p = &left_branch->right;
                        left_branch = *p;
                } else {
                        /*
                         * promote the right branch
                         */
                        *p = right_branch;
                        p = &right_branch->left;
                        right_branch = *p;
                } /* else */
        } /* while */

        *p = x;                         /* attach demoted node here */
        x->left = left_branch;
        x->right = right_branch;
} /* demote */

/*
 * Allocate a block of storage
 *
 * algorithm:
 *      The freelist is searched by descending the tree from the root
 *      so that at each decision point the "better fitting" child node
 *      is chosen (i.e., the shorter one, if it is long enough, or
 *      the longer one, otherwise).  The descent stops when both
 *      child nodes are too short.
 *
 * function result:
 *      kmem_alloc returns a pointer to the allocated block; a null
 *      pointer indicates storage could not be allocated.
 */
/*
 * We need to return blocks that are on word boundaries so that callers
 * that are putting int's into the area will work.  Since we allow
 * arbitrary free'ing, we need a weight function that considers
 * free blocks starting on an odd boundary special.  Allocation is
 * aligned to 8 byte boundaries (ALIGN).
 */
#define ALIGN           8               /* doubleword aligned .. */
#define ALIGNMASK       (ALIGN-1)
#define ALIGNMORE(addr) (ALIGN - ((uintptr_t)(addr) & ALIGNMASK))

/*
 * If it is empty then weight == 0
 * If it is aligned then weight == size
 * If it is unaligned
 *      if not enough room to align then weight == 0
 *      else weight == aligned size
 */
#define mweight(x) ((x) == NIL ? 0 : \
        ((((uintptr_t)(x)->block) & ALIGNMASK) == 0 ? (x)->size : \
                (((x)->size <= ALIGNMORE((x)->block)) ? 0 : \
                        (x)->size - ALIGNMORE((x)->block))))

/*ARGSUSED1*/
void *
kmem_alloc(size_t nbytes, int kmflag)
{
        Freehdr a;              /* ptr to node to be allocated */
        Freehdr *p;             /* address of ptr to node */
        size_t   left_weight;
        size_t   right_weight;
        Freehdr left_son;
        Freehdr right_son;
        char     *retblock;     /* Address returned to the user */
        int s;
#ifdef  DEBUG
        printf("kmem_alloc(nbytes 0x%lx)\n", nbytes);
#endif  /* DEBUG */

        if (nbytes == 0) {
                return (NULL);
        }
        s = splnet();

        if (nbytes < SMALLEST_BLK) {
                printf("illegal kmem_alloc call for %lx bytes\n", nbytes);
                prom_panic("kmem_alloc");
        }
        check_need_to_free();

        /*
         * ensure that at least one block is big enough to satisfy
         *      the request.
         */

        if (mweight(kmem_info.free_root) <= nbytes) {
                /*
                 * the largest block is not enough.
                 */
                if (!morecore(nbytes)) {
                        printf("kmem_alloc failed, nbytes %lx\n", nbytes);
                        prom_panic("kmem_alloc");
                }
        }

        /*
         * search down through the tree until a suitable block is
         *      found.  At each decision point, select the better
         *      fitting node.
         */

        p = (Freehdr *) &kmem_info.free_root;
        a = *p;
        left_son = a->left;
        right_son = a->right;
        left_weight = mweight(left_son);
        right_weight = mweight(right_son);

        while (left_weight >= nbytes || right_weight >= nbytes) {
                if (left_weight <= right_weight) {
                        if (left_weight >= nbytes) {
                                p = &a->left;
                                a = left_son;
                        } else {
                                p = &a->right;
                                a = right_son;
                        }
                } else {
                        if (right_weight >= nbytes) {
                                p = &a->right;
                                a = right_son;
                        } else {
                                p = &a->left;
                                a = left_son;
                        }
                }
                left_son = a->left;
                right_son = a->right;
                left_weight = mweight(left_son);
                right_weight = mweight(right_son);
        } /* while */

        /*
         * allocate storage from the selected node.
         */

        if (a->size - nbytes < SMALLEST_BLK) {
                /*
                 * not big enough to split; must leave at least
                 * a dblk's worth of space.
                 */
                retblock = a->block->data;
                delete(p);
        } else {

                /*
                 * split the node, allocating nbytes from the top.
                 *      Remember we've already accounted for the
                 *      allocated node's header space.
                 */
                Freehdr x;
                x = getfreehdr();
                if ((uintptr_t)a->block->data & ALIGNMASK) {
                        size_t size;
                        if (a->size <= ALIGNMORE(a->block->data))
                                prom_panic("kmem_alloc: short block allocated");
                        size = nbytes + ALIGNMORE(a->block->data);
                        x->block = a->block;
                        x->size = ALIGNMORE(a->block->data);
                        x->left = a->left;
                        x->right = a->right;
                        /*
                         * the node pointed to by *p has become smaller;
                         *      move it down to its appropriate place in
                         *      the tree.
                         */
                        *p = x;
                        demote(p);
                        retblock = a->block->data + ALIGNMORE(a->block->data);
                        if (a->size > size) {
                                kmem_free((caddr_t)nextblk(a->block, size),
                                    (size_t)(a->size - size));
                        }
                        freehdr(a);
                } else {
                        x->block = nextblk(a->block, nbytes);
                        x->size = a->size - nbytes;
                        x->left = a->left;
                        x->right = a->right;
                        /*
                         * the node pointed to by *p has become smaller;
                         *      move it down to its appropriate place in
                         *      the tree.
                         */
                        *p = x;
                        demote(p);
                        retblock = a->block->data;
                        freehdr(a);
                }
        }
#ifdef DEBUG
        prtree(kmem_info.free_root, "kmem_alloc");
#endif

        splx(s);
        bzero(retblock, nbytes);
#ifdef DEBUG
        printf("kmem_alloc  bzero complete - returning %p\n", retblock);
#endif
        return (retblock);

} /* kmem_alloc */

/*
 * Return a block to the free space tree.
 *
 * algorithm:
 *      Starting at the root, search for and coalesce free blocks
 *      adjacent to one given.  When the appropriate place in the
 *      tree is found, insert the given block.
 *
 * Do some sanity checks to avoid total confusion in the tree.
 * If the block has already been freed, prom_panic.
 * If the ptr is not from the arena, prom_panic.
 */
void
kmem_free(void *ptr, size_t nbytes)
{
        Freehdr *np;            /* For deletion from free list */
        Freehdr neighbor;       /* Node to be coalesced */
        char     *neigh_block;  /* Ptr to potential neighbor */
        size_t   neigh_size;    /* Size of potential neighbor */
        int s;

#ifdef DEBUG
printf("kmem_free (ptr %p nbytes %lx)\n", ptr, nbytes);
prtree(kmem_info.free_root, "kmem_free");
#endif

#ifdef  lint
        neigh_block = bkmem_zalloc(nbytes);
        neigh_block = neigh_block;
#endif
        if (nbytes == 0) {
                return;
        }

        if (ptr == 0) {
                prom_panic("kmem_free of 0");
        }
        s = splnet();

        /*
         * Search the tree for the correct insertion point for this
         *      node, coalescing adjacent free blocks along the way.
         */
        np = &kmem_info.free_root;
        neighbor = *np;
        while (neighbor != NIL) {
                neigh_block = (char *)neighbor->block;
                neigh_size = neighbor->size;
                if ((char *)ptr < neigh_block) {
                        if ((char *)ptr + nbytes == neigh_block) {
                                /*
                                 * Absorb and delete right neighbor
                                 */
                                nbytes += neigh_size;
                                delete(np);
                        } else if ((char *)ptr + nbytes > neigh_block) {
                                /*
                                 * The block being freed overlaps
                                 * another block in the tree.  This
                                 * is bad news.
                                 */
                                printf("kmem_free: free block overlap %p+%lx"
                                    " over %p\n", (void *)ptr, nbytes,
                                    (void *)neigh_block);
                                prom_panic("kmem_free: free block overlap");
                        } else {
                                /*
                                 * Search to the left
                                 */
                                np = &neighbor->left;
                        }
                } else if ((char *)ptr > neigh_block) {
                        if (neigh_block + neigh_size == ptr) {
                                /*
                                 * Absorb and delete left neighbor
                                 */
                                ptr = neigh_block;
                                nbytes += neigh_size;
                                delete(np);
                        } else if (neigh_block + neigh_size > (char *)ptr) {
                                /*
                                 * This block has already been freed
                                 */
                                prom_panic("kmem_free block already free");
                        } else {
                                /*
                                 * search to the right
                                 */
                                np = &neighbor->right;
                        }
                } else {
                        /*
                         * This block has already been freed
                         * as "ptr == neigh_block"
                         */
                        prom_panic("kmem_free: block already free as neighbor");
                } /* else */
                neighbor = *np;
        } /* while */

        /*
         * Insert the new node into the free space tree
         */
        insert((Dblk) ptr, nbytes, &kmem_info.free_root);
#ifdef DEBUG
printf("exiting kmem_free\n");
prtree(kmem_info.free_root, "kmem_free");
#endif
        splx(s);
} /* kmem_free */

/*
 *  Sigh.  We include a header file which the kernel
 *  uses to declare (one of its many) kmem_free prototypes.
 *  In order not to use the kernel's namespace, then, we must
 *  define another name here for use by boot.
 */
void *
bkmem_alloc(size_t size)
{
        return (kmem_alloc(size, 0));
}

/*
 * Boot's kmem_alloc is really kmem_zalloc().
 */
void *
bkmem_zalloc(size_t size)
{
        return (kmem_alloc(size, 0));
}

void
bkmem_free(void *p, size_t bytes)
{
        kmem_free(p, bytes);
}

static void
check_need_to_free(void)
{
        int i;
        struct need_to_free *ntf;
        caddr_t addr;
        size_t nbytes;
        int s;

again:
        s = splimp();
        ntf = &kmem_info.need_to_free_list;
        if (ntf->addr) {
                addr = ntf->addr;
                nbytes = ntf->nbytes;
                *ntf = *(struct need_to_free *)ntf->addr;
                splx(s);
                kmem_free(addr, nbytes);
                goto again;
        }
        ntf = kmem_info.need_to_free;
        for (i = 0; i < NEED_TO_FREE_SIZE; i++) {
                if (ntf[i].addr) {
                        addr = ntf[i].addr;
                        nbytes = ntf[i].nbytes;
                        ntf[i].addr = 0;
                        splx(s);
                        kmem_free(addr, nbytes);
                        goto again;
                }
        }
        splx(s);
}

/*
 * Add a block of at least nbytes to the free space tree.
 *
 * return value:
 *      true    if at least nbytes can be allocated
 *      false   otherwise
 *
 * remark:
 *      free space (delimited by the static variable ubound) is
 *      extended by an amount determined by rounding nbytes up to
 *      a multiple of the system page size.
 */

static bool
morecore(size_t nbytes)
{
#ifdef  __sparc
        enum RESOURCES type = RES_BOOTSCRATCH_NOFAIL;
#else
        enum RESOURCES type = RES_BOOTSCRATCH;
#endif
        Dblk p;
#ifdef  DEBUG
        printf("morecore(nbytes 0x%lx)\n", nbytes);
#endif  /* DEBUG */


        nbytes = roundup(nbytes, PAGESIZE);
        p = (Dblk) resalloc(type, nbytes, (caddr_t)0, 0);
        if (p == 0) {
                return (false);
        }
        kmem_free((caddr_t)p, nbytes);
#ifdef DEBUG
        printf("morecore() returing, p = %p\n", p);
#endif
        return (true);

} /* morecore */

/*
 * Get a free block header
 * There is a list of available free block headers.
 * When the list is empty, allocate another pagefull.
 */
Freehdr
getfreehdr(void)
{
        Freehdr r;
        int     n = 0;
#ifdef  DEBUG
        printf("getfreehdr()\n");
#endif  /* DEBUG */

        if (kmem_info.free_hdr_list != NIL) {
                r = kmem_info.free_hdr_list;
                kmem_info.free_hdr_list = kmem_info.free_hdr_list->left;
        } else {
                r = (Freehdr)resalloc(RES_BOOTSCRATCH, PAGESIZE, (caddr_t)0, 0);
                if (r == 0) {
                        prom_panic("getfreehdr");
                }
                for (n = 1; n < PAGESIZE / sizeof (*r); n++) {
                        freehdr(&r[n]);
                }
        }
#ifdef  DEBUG
        printf("getfreehdr: freed %x headers\n", n);
        printf("getfreehdr: returning %p\n", r);
#endif  /* DEBUG */
        return (r);
}

/*
 * Free a free block header
 * Add it to the list of available headers.
 */

void
freehdr(Freehdr p)
{
#ifdef  DEBUG
        printf("freehdr(%p)\n", p);
#endif  /* DEBUG */
        p->left = kmem_info.free_hdr_list;
        p->right = NIL;
        p->block = NULL;
        kmem_info.free_hdr_list = p;
}

#ifdef DEBUG
/*
 * Diagnostic routines
 */
static int depth = 0;

static void
prtree(Freehdr p, char *cp)
{
        int n;
        if (depth == 0) {
                printf("prtree(p %p cp %s)\n", p, cp);
        }
        if (p != NIL) {
                depth++;
                prtree(p->left, (char *)NULL);
                depth--;

                for (n = 0; n < depth; n++) {
                        printf("   ");
                }
                printf(
                    "(%p): (left = %p, right = %p, block = %p, size = %lx)\n",
                        p, p->left, p->right, p->block, p->size);

                depth++;
                prtree(p->right, (char *)NULL);
                depth--;
        }
}
#endif /* DEBUG */