root/sys/netinet6/in6.c
/*      $OpenBSD: in6.c,v 1.279 2026/03/22 23:14:00 bluhm Exp $ */
/*      $KAME: in6.c,v 1.372 2004/06/14 08:14:21 itojun Exp $   */

/*
 * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the project nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

/*
 * Copyright (c) 1982, 1986, 1991, 1993
 *      The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *      @(#)in.c        8.2 (Berkeley) 11/15/93
 */

#include "carp.h"

#include <sys/param.h>
#include <sys/ioctl.h>
#include <sys/errno.h>
#include <sys/malloc.h>
#include <sys/socket.h>
#include <sys/socketvar.h>
#include <sys/sockio.h>
#include <sys/mbuf.h>
#include <sys/systm.h>
#include <sys/time.h>
#include <sys/syslog.h>

#include <net/if.h>
#include <net/if_var.h>
#include <net/if_types.h>
#include <net/route.h>

#include <netinet/in.h>

#include <netinet6/in6_var.h>
#include <netinet/ip6.h>
#include <netinet6/ip6_var.h>
#include <netinet6/nd6.h>
#include <netinet6/mld6_var.h>
#ifdef MROUTING
#include <netinet6/ip6_mroute.h>
#endif
#include <netinet6/in6_ifattach.h>
#if NCARP > 0
#include <netinet/ip_carp.h>
#endif

/*
 * Definitions of some constant IP6 addresses.
 */
const struct in6_addr in6addr_any = IN6ADDR_ANY_INIT;
const struct in6_addr in6addr_loopback = IN6ADDR_LOOPBACK_INIT;
const struct in6_addr in6addr_intfacelocal_allnodes =
        IN6ADDR_INTFACELOCAL_ALLNODES_INIT;
const struct in6_addr in6addr_linklocal_allnodes =
        IN6ADDR_LINKLOCAL_ALLNODES_INIT;
const struct in6_addr in6addr_linklocal_allrouters =
        IN6ADDR_LINKLOCAL_ALLROUTERS_INIT;

const struct in6_addr in6mask0 = IN6MASK0;
const struct in6_addr in6mask32 = IN6MASK32;
const struct in6_addr in6mask64 = IN6MASK64;
const struct in6_addr in6mask96 = IN6MASK96;
const struct in6_addr in6mask128 = IN6MASK128;

int in6_ioctl(u_long, caddr_t, struct ifnet *, int);
int in6_ioctl_change_ifaddr(u_long, caddr_t, struct ifnet *);
int in6_ioctl_get(u_long, caddr_t, struct ifnet *);
int in6_check_embed_scope(struct sockaddr_in6 *, unsigned int);
int in6_clear_scope_id(struct sockaddr_in6 *, unsigned int);
int in6_ifinit(struct ifnet *, struct in6_ifaddr *, int);
void in6_unlink_ifa(struct in6_ifaddr *, struct ifnet *);

const struct sockaddr_in6 sa6_any = {
        sizeof(sa6_any), AF_INET6, 0, 0, IN6ADDR_ANY_INIT, 0
};

int
in6_mask2len(struct in6_addr *mask, u_char *lim0)
{
        int x = 0, y;
        u_char *lim = lim0, *p;

        /* ignore the scope_id part */
        if (lim0 == NULL || lim0 - (u_char *)mask > sizeof(*mask))
                lim = (u_char *)mask + sizeof(*mask);
        for (p = (u_char *)mask; p < lim; x++, p++) {
                if (*p != 0xff)
                        break;
        }
        y = 0;
        if (p < lim) {
                for (y = 0; y < 8; y++) {
                        if ((*p & (0x80 >> y)) == 0)
                                break;
                }
        }

        /*
         * when the limit pointer is given, do a stricter check on the
         * remaining bits.
         */
        if (p < lim) {
                if (y != 0 && (*p & (0x00ff >> y)) != 0)
                        return (-1);
                for (p = p + 1; p < lim; p++)
                        if (*p != 0)
                                return (-1);
        }

        return x * 8 + y;
}

int
in6_nam2sin6(const struct mbuf *nam, struct sockaddr_in6 **sin6)
{
        struct sockaddr *sa = mtod(nam, struct sockaddr *);

        if (nam->m_len < offsetof(struct sockaddr, sa_data))
                return EINVAL;
        if (sa->sa_family != AF_INET6)
                return EAFNOSUPPORT;
        if (sa->sa_len != nam->m_len)
                return EINVAL;
        if (sa->sa_len != sizeof(struct sockaddr_in6))
                return EINVAL;
        *sin6 = satosin6(sa);

        return 0;
}

int
in6_sa2sin6(struct sockaddr *sa, struct sockaddr_in6 **sin6)
{
        if (sa->sa_family != AF_INET6)
                return EAFNOSUPPORT;
        if (sa->sa_len != sizeof(struct sockaddr_in6))
                return EINVAL;
        *sin6 = satosin6(sa);

        return 0;
}

int
in6_control(struct socket *so, u_long cmd, caddr_t data, struct ifnet *ifp)
{
        int privileged;

        privileged = 0;
        if ((so->so_state & SS_PRIV) != 0)
                privileged++;

        switch (cmd) {
#ifdef MROUTING
        case SIOCGETSGCNT_IN6:
        case SIOCGETMIFCNT_IN6:
                return mrt6_ioctl(so, cmd, data);
#endif /* MROUTING */
        default:
                return in6_ioctl(cmd, data, ifp, privileged);
        }
}

int
in6_ioctl(u_long cmd, caddr_t data, struct ifnet *ifp, int privileged)
{
        if (ifp == NULL)
                return (ENXIO);

        switch (cmd) {
        case SIOCGIFINFO_IN6:
        case SIOCGNBRINFO_IN6:
                return (nd6_ioctl(cmd, data, ifp));
        case SIOCGIFDSTADDR_IN6:
        case SIOCGIFNETMASK_IN6:
        case SIOCGIFAFLAG_IN6:
        case SIOCGIFALIFETIME_IN6:
                return (in6_ioctl_get(cmd, data, ifp));
        case SIOCAIFADDR_IN6:
        case SIOCDIFADDR_IN6:
                if (!privileged)
                        return (EPERM);
                return (in6_ioctl_change_ifaddr(cmd, data, ifp));
        case SIOCSIFADDR:
        case SIOCSIFDSTADDR:
        case SIOCSIFBRDADDR:
        case SIOCSIFNETMASK:
                /*
                 * Do not pass those ioctl to driver handler since they are not
                 * properly set up. Instead just error out.
                 */
                return (EINVAL);
        default:
                return (EOPNOTSUPP);
        }
}

int
in6_ioctl_change_ifaddr(u_long cmd, caddr_t data, struct ifnet *ifp)
{
        struct  in6_ifaddr *ia6 = NULL;
        struct  in6_aliasreq *ifra = (struct in6_aliasreq *)data;
        struct  sockaddr *sa;
        struct  sockaddr_in6 *sa6 = NULL;
        int     error = 0, newifaddr = 0, plen;

        /*
         * Find address for this interface, if it exists.
         *
         * In netinet code, we have checked ifra_addr in SIOCSIF*ADDR operation
         * only, and used the first interface address as the target of other
         * operations (without checking ifra_addr).  This was because netinet
         * code/API assumed at most 1 interface address per interface.
         * Since IPv6 allows a node to assign multiple addresses
         * on a single interface, we almost always look and check the
         * presence of ifra_addr, and reject invalid ones here.
         * It also decreases duplicated code among SIOC*_IN6 operations.
         *
         * We always require users to specify a valid IPv6 address for
         * the corresponding operation.
         */
        switch (cmd) {
        case SIOCAIFADDR_IN6:
                sa = sin6tosa(&ifra->ifra_addr);
                break;
        case SIOCDIFADDR_IN6:
                sa = sin6tosa(&((struct in6_ifreq *)data)->ifr_addr);
                break;
        default:
                panic("%s: invalid ioctl %lu", __func__, cmd);
        }
        if (sa->sa_family == AF_INET6) {
                error = in6_sa2sin6(sa, &sa6);
                if (error)
                        return (error);
        }

        KERNEL_LOCK();
        NET_LOCK();

        if (sa6 != NULL) {
                error = in6_check_embed_scope(sa6, ifp->if_index);
                if (error)
                        goto err;
                error = in6_clear_scope_id(sa6, ifp->if_index);
                if (error)
                        goto err;
                ia6 = in6ifa_ifpwithaddr(ifp, &sa6->sin6_addr);
        }

        switch (cmd) {
        case SIOCDIFADDR_IN6:
                /*
                 * for IPv4, we look for existing in_ifaddr here to allow
                 * "ifconfig if0 delete" to remove the first IPv4 address on
                 * the interface.  For IPv6, as the spec allows multiple
                 * interface address from the day one, we consider "remove the
                 * first one" semantics to be not preferable.
                 */
                if (ia6 == NULL) {
                        error = EADDRNOTAVAIL;
                        break;
                }
                in6_purgeaddr(&ia6->ia_ifa);
                if_addrhooks_run(ifp);
                break;

        case SIOCAIFADDR_IN6:
                if (ifra->ifra_addr.sin6_family != AF_INET6 ||
                    ifra->ifra_addr.sin6_len != sizeof(struct sockaddr_in6)) {
                        error = EAFNOSUPPORT;
                        break;
                }

                /* reject read-only flags */
                if ((ifra->ifra_flags & IN6_IFF_DUPLICATED) != 0 ||
                    (ifra->ifra_flags & IN6_IFF_DETACHED) != 0 ||
                    (ifra->ifra_flags & IN6_IFF_DEPRECATED) != 0) {
                        error = EINVAL;
                        break;
                }

                if (ia6 == NULL)
                        newifaddr = 1;

                /*
                 * Make the address tentative before joining multicast
                 * addresses, so that corresponding MLD responses would
                 * not have a tentative source address.
                 */
                if (newifaddr && in6if_do_dad(ifp))
                        ifra->ifra_flags |= IN6_IFF_TENTATIVE;

                /*
                 * first, make or update the interface address structure,
                 * and link it to the list. try to enable inet6 if there
                 * is no link-local yet.
                 */
                error = in6_ifattach(ifp);
                if (error)
                        break;
                error = in6_update_ifa(ifp, ifra, ia6);
                if (error)
                        break;

                ia6 = NULL;
                if (sa6 != NULL)
                        ia6 = in6ifa_ifpwithaddr(ifp, &sa6->sin6_addr);
                if (ia6 == NULL) {
                        /*
                         * this can happen when the user specify the 0 valid
                         * lifetime.
                         */
                        break;
                }

                /* Perform DAD, if needed. */
                if (ia6->ia6_flags & IN6_IFF_TENTATIVE)
                        nd6_dad_start(&ia6->ia_ifa);

                if (!newifaddr) {
                        if_addrhooks_run(ifp);
                        break;
                }

                plen = in6_mask2len(&ia6->ia_prefixmask.sin6_addr, NULL);
                if ((ifp->if_flags & IFF_LOOPBACK) || plen == 128) {
                        if_addrhooks_run(ifp);
                        break;  /* No need to install a connected route. */
                }

                error = rt_ifa_add(&ia6->ia_ifa,
                    RTF_CLONING | RTF_CONNECTED | RTF_MPATH,
                    ia6->ia_ifa.ifa_addr, ifp->if_rdomain);
                if (error) {
                        in6_purgeaddr(&ia6->ia_ifa);
                        break;
                }
                if_addrhooks_run(ifp);
                break;
        }

err:
        NET_UNLOCK();
        KERNEL_UNLOCK();
        return (error);
}

int
in6_ioctl_get(u_long cmd, caddr_t data, struct ifnet *ifp)
{
        struct  in6_ifreq *ifr = (struct in6_ifreq *)data;
        struct  in6_ifaddr *ia6 = NULL;
        struct  sockaddr *sa;
        struct  sockaddr_in6 *sa6 = NULL;
        int     error = 0;

        sa = sin6tosa(&ifr->ifr_addr);
        if (sa->sa_family == AF_INET6) {
                sa->sa_len = sizeof(struct sockaddr_in6);
                error = in6_sa2sin6(sa, &sa6);
                if (error)
                        return (error);
        }

        NET_LOCK_SHARED();

        if (sa6 != NULL) {
                error = in6_check_embed_scope(sa6, ifp->if_index);
                if (error)
                        goto err;
                error = in6_clear_scope_id(sa6, ifp->if_index);
                if (error)
                        goto err;
                ia6 = in6ifa_ifpwithaddr(ifp, &sa6->sin6_addr);
        }

        /* must think again about its semantics */
        if (ia6 == NULL) {
                error = EADDRNOTAVAIL;
                goto err;
        }

        switch (cmd) {
        case SIOCGIFDSTADDR_IN6:
                if ((ifp->if_flags & IFF_POINTOPOINT) == 0) {
                        error = EINVAL;
                        break;
                }
                /*
                 * XXX: should we check if ifa_dstaddr is NULL and return
                 * an error?
                 */
                ifr->ifr_dstaddr = ia6->ia_dstaddr;
                break;

        case SIOCGIFNETMASK_IN6:
                ifr->ifr_addr = ia6->ia_prefixmask;
                break;

        case SIOCGIFAFLAG_IN6:
                ifr->ifr_ifru.ifru_flags6 = ia6->ia6_flags;
                break;

        case SIOCGIFALIFETIME_IN6:
                ifr->ifr_ifru.ifru_lifetime = ia6->ia6_lifetime;
                if (ia6->ia6_lifetime.ia6t_vltime != ND6_INFINITE_LIFETIME) {
                        time_t expire, maxexpire;
                        struct in6_addrlifetime *retlt =
                            &ifr->ifr_ifru.ifru_lifetime;

                        /*
                         * XXX: adjust expiration time assuming time_t is
                         * signed.
                         */
                        maxexpire =
                            (time_t)~(1ULL << ((sizeof(maxexpire) * 8) - 1));
                        if (ia6->ia6_lifetime.ia6t_vltime <
                            maxexpire - ia6->ia6_updatetime) {
                                expire = ia6->ia6_updatetime +
                                    ia6->ia6_lifetime.ia6t_vltime;
                                if (expire != 0) {
                                        expire -= getuptime();
                                        expire += gettime();
                                }
                                retlt->ia6t_expire = expire;
                        } else
                                retlt->ia6t_expire = maxexpire;
                }
                if (ia6->ia6_lifetime.ia6t_pltime != ND6_INFINITE_LIFETIME) {
                        time_t expire, maxexpire;
                        struct in6_addrlifetime *retlt =
                            &ifr->ifr_ifru.ifru_lifetime;

                        /*
                         * XXX: adjust expiration time assuming time_t is
                         * signed.
                         */
                        maxexpire =
                            (time_t)~(1ULL << ((sizeof(maxexpire) * 8) - 1));
                        if (ia6->ia6_lifetime.ia6t_pltime <
                            maxexpire - ia6->ia6_updatetime) {
                                expire = ia6->ia6_updatetime +
                                    ia6->ia6_lifetime.ia6t_pltime;
                                if (expire != 0) {
                                        expire -= getuptime();
                                        expire += gettime();
                                }
                                retlt->ia6t_preferred = expire;
                        } else
                                retlt->ia6t_preferred = maxexpire;
                }
                break;

        default:
                panic("%s: invalid ioctl %lu", __func__, cmd);
        }

err:
        NET_UNLOCK_SHARED();
        return (error);
}

int
in6_check_embed_scope(struct sockaddr_in6 *sa6, unsigned int ifidx)
{
        if (IN6_IS_ADDR_LINKLOCAL(&sa6->sin6_addr)) {
                if (sa6->sin6_addr.s6_addr16[1] == 0) {
                        /* link ID is not embedded by the user */
                        sa6->sin6_addr.s6_addr16[1] = htons(ifidx);
                } else if (sa6->sin6_addr.s6_addr16[1] != htons(ifidx))
                        return EINVAL;  /* link ID contradicts */
        }
        return 0;
}

int
in6_clear_scope_id(struct sockaddr_in6 *sa6, unsigned int ifidx)
{
        if (IN6_IS_ADDR_LINKLOCAL(&sa6->sin6_addr)) {
                if (sa6->sin6_scope_id) {
                        if (sa6->sin6_scope_id != (u_int32_t)ifidx)
                                return EINVAL;
                        sa6->sin6_scope_id = 0; /* XXX: good way? */
                }
        }
        return 0;
}

/*
 * Update parameters of an IPv6 interface address.
 * If necessary, a new entry is created and linked into address chains.
 * This function is separated from in6_control().
 */
int
in6_update_ifa(struct ifnet *ifp, struct in6_aliasreq *ifra,
    struct in6_ifaddr *ia6)
{
        int error = 0, hostIsNew = 0, plen = -1;
        struct sockaddr_in6 dst6, gw6;
        struct in6_addrlifetime *lt;
        struct in6_multi_mship *imm;
        struct rtentry *rt;

        NET_ASSERT_LOCKED();

        /* Validate parameters */
        if (ifp == NULL || ifra == NULL) /* this maybe redundant */
                return (EINVAL);

        /*
         * The destination address for a p2p link or the address of the
         * announcing router for an autoconf address must have a family of
         * AF_UNSPEC or AF_INET6.
         */
        if ((ifp->if_flags & IFF_POINTOPOINT) ||
            (ifp->if_flags & IFF_LOOPBACK) ||
            (ifra->ifra_flags & IN6_IFF_AUTOCONF)) {
                if (ifra->ifra_dstaddr.sin6_family != AF_INET6 &&
                    ifra->ifra_dstaddr.sin6_family != AF_UNSPEC)
                        return (EAFNOSUPPORT);

        } else if (ifra->ifra_dstaddr.sin6_family != AF_UNSPEC)
                        return (EINVAL);

        /*
         * validate ifra_prefixmask.  don't check sin6_family, netmask
         * does not carry fields other than sin6_len.
         */
        if (ifra->ifra_prefixmask.sin6_len > sizeof(struct sockaddr_in6))
                return (EINVAL);
        /*
         * Because the IPv6 address architecture is classless, we require
         * users to specify a (non 0) prefix length (mask) for a new address.
         * We also require the prefix (when specified) mask is valid, and thus
         * reject a non-consecutive mask.
         */
        if (ia6 == NULL && ifra->ifra_prefixmask.sin6_len == 0)
                return (EINVAL);
        if (ifra->ifra_prefixmask.sin6_len != 0) {
                plen = in6_mask2len(&ifra->ifra_prefixmask.sin6_addr,
                    (u_char *)&ifra->ifra_prefixmask +
                    ifra->ifra_prefixmask.sin6_len);
                if (plen <= 0)
                        return (EINVAL);
        } else {
                /*
                 * In this case, ia6 must not be NULL.  We just use its prefix
                 * length.
                 */
                plen = in6_mask2len(&ia6->ia_prefixmask.sin6_addr, NULL);
        }

        if (ifra->ifra_flags & IN6_IFF_AUTOCONF) {
                gw6 = ifra->ifra_dstaddr;
                memset(&dst6, 0, sizeof(dst6));
        } else {
                dst6 = ifra->ifra_dstaddr;
                memset(&gw6, 0, sizeof(gw6));
        }
        if (dst6.sin6_family == AF_INET6) {
                error = in6_check_embed_scope(&dst6, ifp->if_index);
                if (error)
                        return error;

                if (((ifp->if_flags & IFF_POINTOPOINT) ||
                    (ifp->if_flags & IFF_LOOPBACK)) && plen != 128)
                        return (EINVAL);
        }
        if (gw6.sin6_family == AF_INET6) {
                error = in6_check_embed_scope(&gw6, ifp->if_index);
                if (error)
                        return error;
        }
        /* lifetime consistency check */
        lt = &ifra->ifra_lifetime;
        if (lt->ia6t_pltime > lt->ia6t_vltime)
                return (EINVAL);
        if (lt->ia6t_vltime == 0 && ia6 == NULL)
                return (0); /* there's nothing to do */

        /*
         * If this is a new address, allocate a new ifaddr and link it
         * into chains.
         */
        if (ia6 == NULL) {
                hostIsNew = 1;
                ia6 = malloc(sizeof(*ia6), M_IFADDR, M_WAITOK | M_ZERO);
                refcnt_init_trace(&ia6->ia_ifa.ifa_refcnt,
                    DT_REFCNT_IDX_IFADDR);
                LIST_INIT(&ia6->ia6_memberships);
                /* Initialize the address and masks, and put time stamp */
                ia6->ia_ifa.ifa_addr = sin6tosa(&ia6->ia_addr);
                ia6->ia_addr.sin6_family = AF_INET6;
                ia6->ia_addr.sin6_len = sizeof(ia6->ia_addr);
                ia6->ia6_updatetime = getuptime();
                if ((ifp->if_flags & IFF_POINTOPOINT) ||
                    (ifp->if_flags & IFF_LOOPBACK)) {
                        /*
                         * XXX: some functions expect that ifa_dstaddr is not
                         * NULL for p2p interfaces.
                         */
                        ia6->ia_ifa.ifa_dstaddr = sin6tosa(&ia6->ia_dstaddr);
                } else {
                        ia6->ia_ifa.ifa_dstaddr = NULL;
                }
                ia6->ia_ifa.ifa_netmask = sin6tosa(&ia6->ia_prefixmask);

                ia6->ia_ifp = ifp;
                ia6->ia_addr = ifra->ifra_addr;
                ifa_add(ifp, &ia6->ia_ifa);
        }

        /* set prefix mask */
        if (ifra->ifra_prefixmask.sin6_len) {
                /*
                 * We prohibit changing the prefix length of an existing
                 * address, because
                 * + such an operation should be rare in IPv6, and
                 * + the operation would confuse prefix management.
                 */
                if (ia6->ia_prefixmask.sin6_len &&
                    in6_mask2len(&ia6->ia_prefixmask.sin6_addr, NULL) != plen) {
                        error = EINVAL;
                        goto unlink;
                }
                ia6->ia_prefixmask = ifra->ifra_prefixmask;
        }

        /*
         * If a new destination address is specified, scrub the old one and
         * install the new destination.
         */
        if (((ifp->if_flags & IFF_POINTOPOINT)  ||
            (ifp->if_flags & IFF_LOOPBACK)) && dst6.sin6_family == AF_INET6 &&
            !IN6_ARE_ADDR_EQUAL(&dst6.sin6_addr, &ia6->ia_dstaddr.sin6_addr)) {
                struct ifaddr *ifa = &ia6->ia_ifa;

                if ((ia6->ia_flags & IFA_ROUTE) != 0)
                        if (rt_ifa_del(ifa, RTF_HOST, ifa->ifa_dstaddr,
                            ifp->if_rdomain) == 0)
                                ia6->ia_flags &= ~IFA_ROUTE;
                ia6->ia_dstaddr = dst6;
        }

        if ((ifra->ifra_flags & IN6_IFF_AUTOCONF) &&
            gw6.sin6_family == AF_INET6 &&
            !IN6_ARE_ADDR_EQUAL(&dst6.sin6_addr, &ia6->ia_gwaddr.sin6_addr)) {
                /* Set or update announcing router */
                ia6->ia_gwaddr = gw6;
        }

        /*
         * Set lifetimes.  We do not refer to ia6t_expire and ia6t_preferred
         * to see if the address is deprecated or invalidated, but initialize
         * these members for applications.
         */
        ia6->ia6_updatetime = getuptime();
        ia6->ia6_lifetime = ifra->ifra_lifetime;
        if (ia6->ia6_lifetime.ia6t_vltime != ND6_INFINITE_LIFETIME) {
                ia6->ia6_lifetime.ia6t_expire =
                    getuptime() + ia6->ia6_lifetime.ia6t_vltime;
        } else
                ia6->ia6_lifetime.ia6t_expire = 0;
        if (ia6->ia6_lifetime.ia6t_pltime != ND6_INFINITE_LIFETIME) {
                ia6->ia6_lifetime.ia6t_preferred =
                    getuptime() + ia6->ia6_lifetime.ia6t_pltime;
        } else
                ia6->ia6_lifetime.ia6t_preferred = 0;

        /* reset the interface and routing table appropriately. */
        if ((error = in6_ifinit(ifp, ia6, hostIsNew)) != 0)
                goto unlink;

        /* re-run DAD */
        if (ia6->ia6_flags & (IN6_IFF_TENTATIVE|IN6_IFF_DUPLICATED))
                ifra->ifra_flags |= IN6_IFF_TENTATIVE;
        /*
         * configure address flags.
         */
        ia6->ia6_flags = ifra->ifra_flags;

        nd6_expire_timer_update(ia6);

        /*
         * We are done if we have simply modified an existing address.
         */
        if (!hostIsNew) {
                /* DAD sends RTM_CHGADDRATTR when done. */
                if (!(ia6->ia6_flags & IN6_IFF_TENTATIVE))
                        rtm_addr(RTM_CHGADDRATTR, &ia6->ia_ifa);
                return (error);
        }

        /*
         * Beyond this point, we should call in6_purgeaddr upon an error,
         * not just go to unlink.
         */

        /* join necessary multiast groups */
        if ((ifp->if_flags & IFF_MULTICAST) != 0) {
                struct sockaddr_in6 mltaddr, mltmask;

                /* join solicited multicast addr for new host id */
                struct sockaddr_in6 llsol;

                bzero(&llsol, sizeof(llsol));
                llsol.sin6_family = AF_INET6;
                llsol.sin6_len = sizeof(llsol);
                llsol.sin6_addr.s6_addr16[0] = htons(0xff02);
                llsol.sin6_addr.s6_addr16[1] = htons(ifp->if_index);
                llsol.sin6_addr.s6_addr32[1] = 0;
                llsol.sin6_addr.s6_addr32[2] = htonl(1);
                llsol.sin6_addr.s6_addr32[3] =
                    ifra->ifra_addr.sin6_addr.s6_addr32[3];
                llsol.sin6_addr.s6_addr8[12] = 0xff;
                imm = in6_joingroup(ifp, &llsol.sin6_addr, &error);
                if (!imm)
                        goto cleanup;
                LIST_INSERT_HEAD(&ia6->ia6_memberships, imm, i6mm_chain);

                bzero(&mltmask, sizeof(mltmask));
                mltmask.sin6_len = sizeof(struct sockaddr_in6);
                mltmask.sin6_family = AF_INET6;
                mltmask.sin6_addr = in6mask32;

                /*
                 * join link-local all-nodes address
                 */
                bzero(&mltaddr, sizeof(mltaddr));
                mltaddr.sin6_len = sizeof(struct sockaddr_in6);
                mltaddr.sin6_family = AF_INET6;
                mltaddr.sin6_addr = in6addr_linklocal_allnodes;
                mltaddr.sin6_addr.s6_addr16[1] = htons(ifp->if_index);
                mltaddr.sin6_scope_id = 0;

                /*
                 * XXX: do we really need this automatic routes?
                 * We should probably reconsider this stuff.  Most applications
                 * actually do not need the routes, since they usually specify
                 * the outgoing interface.
                 */
                rt = rtalloc(sin6tosa(&mltaddr), 0, ifp->if_rdomain);
                if (rt) {
                        /* 32bit came from "mltmask" */
                        if (memcmp(&mltaddr.sin6_addr,
                            &satosin6(rt_key(rt))->sin6_addr,
                            32 / 8)) {
                                rtfree(rt);
                                rt = NULL;
                        }
                }
                if (!rt) {
                        struct rt_addrinfo info;

                        bzero(&info, sizeof(info));
                        info.rti_ifa = &ia6->ia_ifa;
                        info.rti_info[RTAX_DST] = sin6tosa(&mltaddr);
                        info.rti_info[RTAX_GATEWAY] = sin6tosa(&ia6->ia_addr);
                        info.rti_info[RTAX_NETMASK] = sin6tosa(&mltmask);
                        info.rti_info[RTAX_IFA] = sin6tosa(&ia6->ia_addr);
                        info.rti_flags = RTF_MULTICAST;
                        error = rtrequest(RTM_ADD, &info, RTP_CONNECTED, NULL,
                            ifp->if_rdomain);
                        if (error)
                                goto cleanup;
                } else {
                        rtfree(rt);
                }
                imm = in6_joingroup(ifp, &mltaddr.sin6_addr, &error);
                if (!imm)
                        goto cleanup;
                LIST_INSERT_HEAD(&ia6->ia6_memberships, imm, i6mm_chain);

                /*
                 * join interface-local all-nodes address.
                 * (ff01::1%ifN, and ff01::%ifN/32)
                 */
                bzero(&mltaddr, sizeof(mltaddr));
                mltaddr.sin6_len = sizeof(struct sockaddr_in6);
                mltaddr.sin6_family = AF_INET6;
                mltaddr.sin6_addr = in6addr_intfacelocal_allnodes;
                mltaddr.sin6_addr.s6_addr16[1] = htons(ifp->if_index);
                mltaddr.sin6_scope_id = 0;

                /* XXX: again, do we really need the route? */
                rt = rtalloc(sin6tosa(&mltaddr), 0, ifp->if_rdomain);
                if (rt) {
                        /* 32bit came from "mltmask" */
                        if (memcmp(&mltaddr.sin6_addr,
                            &satosin6(rt_key(rt))->sin6_addr,
                            32 / 8)) {
                                rtfree(rt);
                                rt = NULL;
                        }
                }
                if (!rt) {
                        struct rt_addrinfo info;

                        bzero(&info, sizeof(info));
                        info.rti_ifa = &ia6->ia_ifa;
                        info.rti_info[RTAX_DST] = sin6tosa(&mltaddr);
                        info.rti_info[RTAX_GATEWAY] = sin6tosa(&ia6->ia_addr);
                        info.rti_info[RTAX_NETMASK] = sin6tosa(&mltmask);
                        info.rti_info[RTAX_IFA] = sin6tosa(&ia6->ia_addr);
                        info.rti_flags = RTF_MULTICAST;
                        error = rtrequest(RTM_ADD, &info, RTP_CONNECTED, NULL,
                            ifp->if_rdomain);
                        if (error)
                                goto cleanup;
                } else {
                        rtfree(rt);
                }
                imm = in6_joingroup(ifp, &mltaddr.sin6_addr, &error);
                if (!imm)
                        goto cleanup;
                LIST_INSERT_HEAD(&ia6->ia6_memberships, imm, i6mm_chain);
        }

        return (error);

  unlink:
        /*
         * XXX: if a change of an existing address failed, keep the entry
         * anyway.
         */
        if (hostIsNew)
                in6_unlink_ifa(ia6, ifp);
        return (error);

  cleanup:
        in6_purgeaddr(&ia6->ia_ifa);
        return error;
}

void
in6_purgeaddr(struct ifaddr *ifa)
{
        struct ifnet *ifp = ifa->ifa_ifp;
        struct in6_ifaddr *ia6 = ifatoia6(ifa);
        struct in6_multi_mship *imm;

        /* stop DAD processing */
        nd6_dad_stop(ifa);

        /*
         * delete route to the destination of the address being purged.
         * The interface must be p2p or loopback in this case.
         */
        if ((ifp->if_flags & IFF_POINTOPOINT) && (ia6->ia_flags & IFA_ROUTE) &&
            ia6->ia_dstaddr.sin6_len != 0) {
                if (rt_ifa_del(ifa, RTF_HOST, ifa->ifa_dstaddr,
                    ifp->if_rdomain) == 0)
                        ia6->ia_flags &= ~IFA_ROUTE;
        }

        /* Remove ownaddr's loopback rtentry, if it exists. */
        rt_ifa_dellocal(&(ia6->ia_ifa));

        /*
         * leave from multicast groups we have joined for the interface
         */
        while (!LIST_EMPTY(&ia6->ia6_memberships)) {
                imm = LIST_FIRST(&ia6->ia6_memberships);
                LIST_REMOVE(imm, i6mm_chain);
                in6_leavegroup(imm);
        }

        in6_unlink_ifa(ia6, ifp);
}

void
in6_unlink_ifa(struct in6_ifaddr *ia6, struct ifnet *ifp)
{
        struct ifaddr *ifa = &ia6->ia_ifa;
        int plen;

        NET_ASSERT_LOCKED();

        /* Release the reference to the base prefix. */
        plen = in6_mask2len(&ia6->ia_prefixmask.sin6_addr, NULL);
        if ((ifp->if_flags & IFF_LOOPBACK) == 0 && plen != 128) {
                rt_ifa_del(ifa, RTF_CLONING | RTF_CONNECTED,
                    ifa->ifa_addr, ifp->if_rdomain);
        }

        rt_ifa_purge(ifa);
        ifa_del(ifp, ifa);

        ia6->ia_ifp = NULL;
        ifafree(ifa);
}

/*
 * Initialize an interface's inet6 address
 * and routing table entry.
 */
int
in6_ifinit(struct ifnet *ifp, struct in6_ifaddr *ia6, int newhost)
{
        int     error = 0, plen, ifacount = 0;
        struct ifaddr *ifa;

        NET_ASSERT_LOCKED();

        /*
         * Give the interface a chance to initialize
         * if this is its first address (or it is a CARP interface)
         * and to validate the address if necessary.
         */
        TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list) {
                if (ifa->ifa_addr->sa_family != AF_INET6)
                        continue;
                ifacount++;
        }

        if ((ifacount <= 1 || ifp->if_type == IFT_CARP ||
            (ifp->if_flags & (IFF_LOOPBACK|IFF_POINTOPOINT))) &&
            (error = (*ifp->if_ioctl)(ifp, SIOCSIFADDR, (caddr_t)ia6))) {
                return (error);
        }

        ia6->ia_ifa.ifa_metric = ifp->if_metric;

        /* we could do in(6)_socktrim here, but just omit it at this moment. */

        /*
         * Special case:
         * If the destination address is specified for a point-to-point
         * interface, install a route to the destination as an interface
         * direct route.
         */
        plen = in6_mask2len(&ia6->ia_prefixmask.sin6_addr, NULL); /* XXX */
        if ((ifp->if_flags & IFF_POINTOPOINT) && plen == 128 &&
            ia6->ia_dstaddr.sin6_family == AF_INET6) {
                ifa = &ia6->ia_ifa;
                error = rt_ifa_add(ifa, RTF_HOST | RTF_MPATH,
                    ifa->ifa_dstaddr, ifp->if_rdomain);
                if (error != 0)
                        return (error);
                ia6->ia_flags |= IFA_ROUTE;
        }

        if (newhost)
                error = rt_ifa_addlocal(&(ia6->ia_ifa));

        return (error);
}

/*
 * Look up the in6_multi record for a given IP6 multicast address
 * on a given interface.  Return the matching record if found or NULL.
 */
struct in6_multi *
in6_lookupmulti(const struct in6_addr *addr, struct ifnet *ifp)
{
        struct in6_multi *in6m = NULL;
        struct ifmaddr *ifma;

        rw_assert_anylock(&ifp->if_maddrlock);

        TAILQ_FOREACH(ifma, &ifp->if_maddrlist, ifma_list) {
                if (ifma->ifma_addr->sa_family == AF_INET6 &&
                    IN6_ARE_ADDR_EQUAL(&ifmatoin6m(ifma)->in6m_addr, addr)) {
                        in6m = ifmatoin6m(ifma);
                        break;
                }
        }
        return (in6m);
}

/*
 * Add an address to the list of IP6 multicast addresses for a
 * given interface.
 */
struct in6_multi *
in6_addmulti(const struct in6_addr *addr, struct ifnet *ifp, int *errorp)
{
        struct  in6_multi *in6m, *new_in6m = NULL;
        struct  mld6_pktinfo pkt;
        struct  in6_ifreq ifr;

        *errorp = 0;
        /*
         * See if address already in list.
         */
        rw_enter_write(&ifp->if_maddrlock);
        in6m = in6_lookupmulti(addr, ifp);
        if (in6m != NULL)
                goto found;
        rw_exit_write(&ifp->if_maddrlock);

        /*
         * New address; allocate a new multicast record
         * and link it into the interface's multicast list.
         */
        new_in6m = malloc(sizeof(*in6m), M_IPMADDR, M_NOWAIT | M_ZERO);
        if (new_in6m == NULL) {
                *errorp = ENOBUFS;
                return (NULL);
        }

        /*
         * Ask the network driver to update its multicast reception
         * filter appropriately for the new address.
         */
        memset(&ifr, 0, sizeof(ifr));
        ifr.ifr_addr.sin6_len = sizeof(struct sockaddr_in6);
        ifr.ifr_addr.sin6_family = AF_INET6;
        ifr.ifr_addr.sin6_addr = *addr;
        KERNEL_LOCK();
        *errorp = (*ifp->if_ioctl)(ifp, SIOCADDMULTI, (caddr_t)&ifr);
        KERNEL_UNLOCK();
        if (*errorp)
                goto out;

        rw_enter_write(&ifp->if_maddrlock);
        /* check again after unlock and lock */
        in6m = in6_lookupmulti(addr, ifp);
        if (in6m != NULL)
                goto found;
        in6m = new_in6m;
        in6m->in6m_sin.sin6_len = sizeof(struct sockaddr_in6);
        in6m->in6m_sin.sin6_family = AF_INET6;
        in6m->in6m_sin.sin6_addr = *addr;
        refcnt_init_trace(&in6m->in6m_refcnt, DT_REFCNT_IDX_IFMADDR);
        in6m->in6m_ifidx = ifp->if_index;
        in6m->in6m_ifma.ifma_addr = sin6tosa(&in6m->in6m_sin);

        /*
         * Let MLD6 know that we have joined a new IP6 multicast group.
         */
        TAILQ_INSERT_HEAD(&ifp->if_maddrlist, &in6m->in6m_ifma, ifma_list);
        pkt.mpi_ifidx = 0;
        mld6_start_listening(in6m, ifp, &pkt);
        rw_exit_write(&ifp->if_maddrlock);

        if (pkt.mpi_ifidx)
                mld6_sendpkt(&pkt);

        return (in6m);

 found:
        refcnt_take(&in6m->in6m_refcnt);
        rw_exit_write(&ifp->if_maddrlock);
 out:
        free(new_in6m, M_IPMADDR, sizeof(*in6m));
        return (in6m);
}

/*
 * Delete a multicast address record.
 */
void
in6_delmulti(struct in6_multi *in6m)
{
        struct  mld6_pktinfo pkt;
        struct  in6_ifreq ifr;
        struct  ifnet *ifp;

        if (refcnt_rele(&in6m->in6m_refcnt) == 0)
                return;

        ifp = if_get(in6m->in6m_ifidx);
        if (ifp != NULL) {
                rw_enter_write(&ifp->if_maddrlock);
                /*
                 * No remaining claims to this record; let MLD6 know
                 * that we are leaving the multicast group.
                 */
                pkt.mpi_ifidx = 0;
                mld6_stop_listening(in6m, ifp, &pkt);
                TAILQ_REMOVE(&ifp->if_maddrlist, &in6m->in6m_ifma, ifma_list);
                rw_exit_write(&ifp->if_maddrlock);

                if (pkt.mpi_ifidx)
                        mld6_sendpkt(&pkt);

                /*
                 * Notify the network driver to update its multicast
                 * reception filter.
                 */
                memset(&ifr, 0, sizeof(ifr));
                ifr.ifr_addr.sin6_len = sizeof(struct sockaddr_in6);
                ifr.ifr_addr.sin6_family = AF_INET6;
                ifr.ifr_addr.sin6_addr = in6m->in6m_addr;
                KERNEL_LOCK();
                (*ifp->if_ioctl)(ifp, SIOCDELMULTI, (caddr_t)&ifr);
                KERNEL_UNLOCK();

                if_put(ifp);
        }

        free(in6m, M_IPMADDR, sizeof(*in6m));
}

/*
 * Return 1 if the multicast group represented by ``addr'' has been
 * joined by interface ``ifp'', 0 otherwise.
 */
int
in6_hasmulti(const struct in6_addr *addr, struct ifnet *ifp)
{
        struct in6_multi *in6m;
        int joined;

        rw_enter_read(&ifp->if_maddrlock);
        in6m = in6_lookupmulti(addr, ifp);
        joined = (in6m != NULL);
        rw_exit_read(&ifp->if_maddrlock);

        return (joined);
}

struct in6_multi_mship *
in6_joingroup(struct ifnet *ifp, const struct in6_addr *addr, int *errorp)
{
        struct in6_multi_mship *imm;

        imm = malloc(sizeof(*imm), M_IPMADDR, M_NOWAIT);
        if (!imm) {
                *errorp = ENOBUFS;
                return NULL;
        }
        imm->i6mm_maddr = in6_addmulti(addr, ifp, errorp);
        if (!imm->i6mm_maddr) {
                /* *errorp is already set */
                free(imm, M_IPMADDR, sizeof(*imm));
                return NULL;
        }
        return imm;
}

void
in6_leavegroup(struct in6_multi_mship *imm)
{

        if (imm->i6mm_maddr)
                in6_delmulti(imm->i6mm_maddr);
        free(imm,  M_IPMADDR, sizeof(*imm));
}

/*
 * Find an IPv6 interface link-local address specific to an interface.
 */
struct in6_ifaddr *
in6ifa_ifpforlinklocal(struct ifnet *ifp, int ignoreflags)
{
        struct ifaddr *ifa;

        TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list) {
                if (ifa->ifa_addr->sa_family != AF_INET6)
                        continue;
                if (IN6_IS_ADDR_LINKLOCAL(IFA_IN6(ifa))) {
                        if ((ifatoia6(ifa)->ia6_flags & ignoreflags) != 0)
                                continue;
                        break;
                }
        }

        return (ifatoia6(ifa));
}


/*
 * find the internet address corresponding to a given interface and address.
 */
struct in6_ifaddr *
in6ifa_ifpwithaddr(struct ifnet *ifp, struct in6_addr *addr)
{
        struct ifaddr *ifa;

        TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list) {
                if (ifa->ifa_addr->sa_family != AF_INET6)
                        continue;
                if (IN6_ARE_ADDR_EQUAL(addr, IFA_IN6(ifa)))
                        break;
        }

        return (ifatoia6(ifa));
}

/*
 * Get a scope of the address. Node-local, link-local, site-local or global.
 */
int
in6_addrscope(const struct in6_addr *addr)
{
        int scope;

        if (addr->s6_addr8[0] == 0xfe) {
                scope = addr->s6_addr8[1] & 0xc0;

                switch (scope) {
                case 0x80:
                        return __IPV6_ADDR_SCOPE_LINKLOCAL;
                        break;
                case 0xc0:
                        return __IPV6_ADDR_SCOPE_SITELOCAL;
                        break;
                default:
                        return __IPV6_ADDR_SCOPE_GLOBAL; /* just in case */
                        break;
                }
        }


        if (addr->s6_addr8[0] == 0xff) {
                scope = addr->s6_addr8[1] & 0x0f;

                /*
                 * due to other scope such as reserved,
                 * return scope doesn't work.
                 */
                switch (scope) {
                case __IPV6_ADDR_SCOPE_INTFACELOCAL:
                        return __IPV6_ADDR_SCOPE_INTFACELOCAL;
                        break;
                case __IPV6_ADDR_SCOPE_LINKLOCAL:
                        return __IPV6_ADDR_SCOPE_LINKLOCAL;
                        break;
                case __IPV6_ADDR_SCOPE_SITELOCAL:
                        return __IPV6_ADDR_SCOPE_SITELOCAL;
                        break;
                default:
                        return __IPV6_ADDR_SCOPE_GLOBAL;
                        break;
                }
        }

        if (bcmp(&in6addr_loopback, addr, sizeof(*addr) - 1) == 0) {
                if (addr->s6_addr8[15] == 1) /* loopback */
                        return __IPV6_ADDR_SCOPE_INTFACELOCAL;
                if (addr->s6_addr8[15] == 0) /* unspecified */
                        return __IPV6_ADDR_SCOPE_LINKLOCAL;
        }

        return __IPV6_ADDR_SCOPE_GLOBAL;
}

int
in6_addr2scopeid(unsigned int ifidx, const struct in6_addr *addr)
{
        int scope = in6_addrscope(addr);

        switch(scope) {
        case __IPV6_ADDR_SCOPE_INTFACELOCAL:
        case __IPV6_ADDR_SCOPE_LINKLOCAL:
                /* XXX: we do not distinguish between a link and an I/F. */
                return (ifidx);

        case __IPV6_ADDR_SCOPE_SITELOCAL:
                return (0);     /* XXX: invalid. */

        default:
                return (0);     /* XXX: treat as global. */
        }
}

/*
 * return length of part which dst and src are equal
 * hard coding...
 */
int
in6_matchlen(const struct in6_addr *src, const struct in6_addr *dst)
{
        int match = 0;
        u_char *s = (u_char *)src, *d = (u_char *)dst;
        u_char *lim = s + 16, r;

        while (s < lim)
                if ((r = (*d++ ^ *s++)) != 0) {
                        while (r < 128) {
                                match++;
                                r <<= 1;
                        }
                        break;
                } else
                        match += 8;
        return match;
}

void
in6_prefixlen2mask(struct in6_addr *maskp, int len)
{
        u_char maskarray[8] = {0x80, 0xc0, 0xe0, 0xf0, 0xf8, 0xfc, 0xfe, 0xff};
        int bytelen, bitlen, i;

        /* sanity check */
        if (0 > len || len > 128) {
                log(LOG_ERR, "in6_prefixlen2mask: invalid prefix length(%d)\n",
                    len);
                return;
        }

        bzero(maskp, sizeof(*maskp));
        bytelen = len / 8;
        bitlen = len % 8;
        for (i = 0; i < bytelen; i++)
                maskp->s6_addr[i] = 0xff;
        /* len == 128 is ok because bitlen == 0 then */
        if (bitlen)
                maskp->s6_addr[bytelen] = maskarray[bitlen - 1];
}

/*
 * return the best address out of the same scope
 */
struct in6_ifaddr *
in6_ifawithscope(struct ifnet *oifp, const struct in6_addr *dst, u_int rdomain,
    struct rtentry *rt)
{
        int dst_scope = in6_addrscope(dst), src_scope, best_scope = 0;
        int blen = -1;
        struct ifaddr *ifa;
        struct ifnet *ifp;
        struct in6_ifaddr *ia6_best = NULL;
        struct in6_addr *gw6 = NULL;

        if (rt) {
                if (rt->rt_gateway != NULL &&
                    rt->rt_gateway->sa_family == AF_INET6)
                        gw6 = &(satosin6(rt->rt_gateway)->sin6_addr);
        }

        if (oifp == NULL) {
                printf("%s: output interface is not specified\n", __func__);
                return (NULL);
        }

        NET_ASSERT_LOCKED();

        /* We search for all addresses on all interfaces from the beginning. */
        TAILQ_FOREACH(ifp, &ifnetlist, if_list) {
                if (ifp->if_rdomain != rdomain)
                        continue;
#if NCARP > 0
                /*
                 * Never use a carp address of an interface which is not
                 * the master.
                 */
                if (ifp->if_type == IFT_CARP && !carp_iamatch(ifp))
                        continue;
#endif

                /*
                 * We can never take an address that breaks the scope zone
                 * of the destination.
                 */
                if (in6_addr2scopeid(ifp->if_index, dst) !=
                    in6_addr2scopeid(oifp->if_index, dst))
                        continue;

                TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list) {
                        int tlen = -1;

                        if (ifa->ifa_addr->sa_family != AF_INET6)
                                continue;

                        src_scope = in6_addrscope(IFA_IN6(ifa));

                        /*
                         * Don't use an address before completing DAD
                         * nor a duplicated address.
                         */
                        if (ifatoia6(ifa)->ia6_flags &
                            (IN6_IFF_TENTATIVE|IN6_IFF_DUPLICATED))
                                continue;

                        /*
                         * RFC 6724 allows anycast addresses as source address
                         * because the restriction was removed in RFC 4291.
                         * However RFC 4443 states that ICMPv6 responses
                         * MUST use a unicast source address.
                         *
                         * XXX Skip anycast addresses for now since
                         * icmp6_reflect() uses this function for source
                         * address selection.
                         */
                        if (ifatoia6(ifa)->ia6_flags & IN6_IFF_ANYCAST)
                                continue;

                        if (ifatoia6(ifa)->ia6_flags & IN6_IFF_DETACHED)
                                continue;

                        /*
                         * If this is the first address we find,
                         * keep it anyway.
                         */
                        if (ia6_best == NULL)
                                goto replace;

                        /*
                         * ia6_best is never NULL beyond this line except
                         * within the block labeled "replace".
                         */

                        /*
                         * Rule 2: Prefer appropriate scope.
                         * Find the address with the smallest scope that is
                         * bigger (or equal) to the scope of the destination
                         * address.
                         * Accept an address with smaller scope than the
                         * destination if non exists with bigger scope.
                         */
                        if (best_scope < src_scope) {
                                if (best_scope < dst_scope)
                                        goto replace;
                                else
                                        continue;
                        } else if (src_scope < best_scope) {
                                if (src_scope < dst_scope)
                                        continue;
                                else
                                        goto replace;
                        }

                        /* Rule 3: Avoid deprecated addresses. */
                        if (ifatoia6(ifa)->ia6_flags & IN6_IFF_DEPRECATED) {
                                /*
                                 * If we have already found a non-deprecated
                                 * candidate, just ignore deprecated addresses.
                                 */
                                if ((ia6_best->ia6_flags & IN6_IFF_DEPRECATED)
                                    == 0)
                                        continue;
                        } else if ((ia6_best->ia6_flags & IN6_IFF_DEPRECATED))
                                goto replace;

                        /*
                         * Rule 4: Prefer home addresses.
                         * We do not support home addresses.
                         */

                        /* Rule 5: Prefer outgoing interface */
                        if (ia6_best->ia_ifp == oifp && ifp != oifp)
                                continue;
                        if (ia6_best->ia_ifp != oifp && ifp == oifp)
                                goto replace;

                        /*
                         * Rule 5.5: Prefer addresses in a prefix advertised
                         * by the next-hop.
                         */
                        if (gw6) {
                                struct in6_addr *in6_bestgw, *in6_newgw;

                                in6_bestgw = &ia6_best->ia_gwaddr.sin6_addr;
                                in6_newgw = &ifatoia6(ifa)->ia_gwaddr.sin6_addr;
                                if (!IN6_ARE_ADDR_EQUAL(in6_bestgw, gw6) &&
                                    IN6_ARE_ADDR_EQUAL(in6_newgw, gw6))
                                        goto replace;
                        }

                        /*
                         * Rule 6: Prefer matching label.
                         * We do not implement policy tables.
                         */

                        /* Rule 7: Prefer temporary addresses. */
                        if ((ia6_best->ia6_flags & IN6_IFF_TEMPORARY) &&
                            !(ifatoia6(ifa)->ia6_flags & IN6_IFF_TEMPORARY))
                                continue;
                        if (!(ia6_best->ia6_flags & IN6_IFF_TEMPORARY) &&
                            (ifatoia6(ifa)->ia6_flags & IN6_IFF_TEMPORARY))
                                goto replace;

                        /* Rule 8: Use longest matching prefix. */
                        tlen = in6_matchlen(IFA_IN6(ifa), dst);
                        if (tlen > blen) {
#if NCARP > 0
                                /*
                                 * Don't let carp interfaces win a tie against
                                 * the output interface based on matchlen.
                                 * We should only use a carp address if no
                                 * other interface has a usable address.
                                 * Otherwise, when communicating from a carp
                                 * master to a carp backup, the backup system
                                 * won't respond since the carp address is also
                                 * configured as a local address on the backup.
                                 * Note that carp interfaces in backup state
                                 * were already skipped above.
                                 */
                                if (ifp->if_type == IFT_CARP &&
                                    oifp->if_type != IFT_CARP)
                                        continue;
#endif
                                goto replace;
                        } else if (tlen < blen)
                                continue;

                        /*
                         * If the eight rules fail to choose a single address,
                         * the tiebreaker is implementation-specific.
                         */

                         /* Prefer address with highest pltime. */
                        if (ia6_best->ia6_updatetime +
                            ia6_best->ia6_lifetime.ia6t_pltime <
                            ifatoia6(ifa)->ia6_updatetime +
                            ifatoia6(ifa)->ia6_lifetime.ia6t_pltime)
                                goto replace;
                        else if (ia6_best->ia6_updatetime +
                            ia6_best->ia6_lifetime.ia6t_pltime >
                            ifatoia6(ifa)->ia6_updatetime +
                            ifatoia6(ifa)->ia6_lifetime.ia6t_pltime)
                                continue;

                        /* Prefer address with highest vltime. */
                        if (ia6_best->ia6_updatetime +
                            ia6_best->ia6_lifetime.ia6t_vltime <
                            ifatoia6(ifa)->ia6_updatetime +
                            ifatoia6(ifa)->ia6_lifetime.ia6t_vltime)
                                goto replace;
                        else if (ia6_best->ia6_updatetime +
                            ia6_best->ia6_lifetime.ia6t_vltime >
                            ifatoia6(ifa)->ia6_updatetime +
                            ifatoia6(ifa)->ia6_lifetime.ia6t_vltime)
                                continue;

                        continue;
                  replace:
                        ia6_best = ifatoia6(ifa);
                        blen = tlen >= 0 ? tlen :
                            in6_matchlen(IFA_IN6(ifa), dst);
                        best_scope =
                            in6_addrscope(&ia6_best->ia_addr.sin6_addr);
                }
        }

        /* count statistics for future improvements */
        if (ia6_best == NULL)
                ip6stat_inc(ip6s_sources_none);
        else {
                if (oifp == ia6_best->ia_ifp)
                        ip6stat_inc(ip6s_sources_sameif + best_scope);
                else
                        ip6stat_inc(ip6s_sources_otherif + best_scope);

                if (best_scope == dst_scope)
                        ip6stat_inc(ip6s_sources_samescope + best_scope);
                else
                        ip6stat_inc(ip6s_sources_otherscope + best_scope);

                if ((ia6_best->ia6_flags & IN6_IFF_DEPRECATED) != 0)
                        ip6stat_inc(ip6s_sources_deprecated + best_scope);
        }

        return (ia6_best);
}

int
in6if_do_dad(struct ifnet *ifp)
{
        if ((ifp->if_flags & IFF_LOOPBACK) != 0)
                return (0);

        switch (ifp->if_type) {
#if NCARP > 0
        case IFT_CARP:
                /*
                 * XXX: DAD does not work currently on carp(4)
                 * so disable it for now.
                 */
                return (0);
#endif
        default:
                /*
                 * Our DAD routine requires the interface up and running.
                 * However, some interfaces can be up before the RUNNING
                 * status.  Additionally, users may try to assign addresses
                 * before the interface becomes up (or running).
                 * We simply skip DAD in such a case as a work around.
                 * XXX: we should rather mark "tentative" on such addresses,
                 * and do DAD after the interface becomes ready.
                 */
                if ((ifp->if_flags & (IFF_UP|IFF_RUNNING)) !=
                    (IFF_UP|IFF_RUNNING))
                        return (0);

                return (1);
        }
}