#include <sys/types.h>
#include <sys/stream.h>
#include <sys/stropts.h>
#include <sys/ddi.h>
#include <sys/cmn_err.h>
#include <sys/systm.h>
#include <sys/param.h>
#include <sys/socket.h>
#include <net/if.h>
#include <net/route.h>
#include <netinet/in.h>
#include <net/if_dl.h>
#include <netinet/ip6.h>
#include <netinet/icmp6.h>
#include <inet/common.h>
#include <inet/mi.h>
#include <inet/ip.h>
#include <inet/ip6.h>
#include <inet/ip_ndp.h>
#include <inet/ip_if.h>
#include <inet/ip_ire.h>
#include <inet/ipclassifier.h>
#include <inet/nd.h>
#include <inet/tunables.h>
#include <sys/kmem.h>
#include <sys/zone.h>
#include <sys/tsol/label.h>
#include <sys/tsol/tnet.h>
#define IS_DEFAULT_ROUTE_V6(ire) \
(((ire)->ire_type & IRE_DEFAULT) || \
(((ire)->ire_type & IRE_INTERFACE) && \
(IN6_IS_ADDR_UNSPECIFIED(&(ire)->ire_addr_v6))))
static ire_t ire_null;
static ire_t *
ire_ftable_lookup_impl_v6(const in6_addr_t *addr, const in6_addr_t *mask,
const in6_addr_t *gateway, int type, const ill_t *ill,
zoneid_t zoneid, const ts_label_t *tsl, int flags,
ip_stack_t *ipst);
int
ire_init_v6(ire_t *ire, const in6_addr_t *v6addr, const in6_addr_t *v6mask,
const in6_addr_t *v6gateway, ushort_t type, ill_t *ill,
zoneid_t zoneid, uint_t flags, tsol_gc_t *gc, ip_stack_t *ipst)
{
int error;
if (gc != NULL && !is_system_labeled())
return (EINVAL);
BUMP_IRE_STATS(ipst->ips_ire_stats_v6, ire_stats_alloced);
if (v6addr != NULL)
ire->ire_addr_v6 = *v6addr;
if (v6gateway != NULL)
ire->ire_gateway_addr_v6 = *v6gateway;
switch (type) {
case IRE_LOOPBACK:
case IRE_HOST:
case IRE_LOCAL:
case IRE_IF_CLONE:
ire->ire_mask_v6 = ipv6_all_ones;
ire->ire_masklen = IPV6_ABITS;
break;
case IRE_PREFIX:
case IRE_DEFAULT:
case IRE_IF_RESOLVER:
case IRE_IF_NORESOLVER:
if (v6mask != NULL) {
ire->ire_mask_v6 = *v6mask;
ire->ire_masklen =
ip_mask_to_plen_v6(&ire->ire_mask_v6);
}
break;
case IRE_MULTICAST:
case IRE_NOROUTE:
ASSERT(v6mask == NULL);
break;
default:
ASSERT(0);
return (EINVAL);
}
error = ire_init_common(ire, type, ill, zoneid, flags, IPV6_VERSION,
gc, ipst);
if (error != 0)
return (error);
ire->ire_postfragfn = ip_xmit;
switch (ire->ire_type) {
case IRE_LOCAL:
ire->ire_sendfn = ire_send_local_v6;
ire->ire_recvfn = ire_recv_local_v6;
ASSERT(ire->ire_ill != NULL);
if (ire->ire_ill->ill_flags & ILLF_NOACCEPT)
ire->ire_recvfn = ire_recv_noaccept_v6;
break;
case IRE_LOOPBACK:
ire->ire_sendfn = ire_send_local_v6;
ire->ire_recvfn = ire_recv_loopback_v6;
break;
case IRE_MULTICAST:
ire->ire_postfragfn = ip_postfrag_loopcheck;
ire->ire_sendfn = ire_send_multicast_v6;
ire->ire_recvfn = ire_recv_multicast_v6;
break;
default:
ire->ire_sendfn = ire_send_wire_v6;
ire->ire_recvfn = ire_recv_forward_v6;
break;
}
if (ire->ire_flags & (RTF_REJECT|RTF_BLACKHOLE)) {
ire->ire_sendfn = ire_send_noroute_v6;
ire->ire_recvfn = ire_recv_noroute_v6;
} else if (ire->ire_flags & RTF_MULTIRT) {
ire->ire_postfragfn = ip_postfrag_multirt_v6;
ire->ire_sendfn = ire_send_multirt_v6;
ire->ire_recvfn = ire_recv_multirt_v6;
}
ire->ire_nce_capable = ire_determine_nce_capable(ire);
return (0);
}
ire_t *
ire_create_v6(const in6_addr_t *v6addr, const in6_addr_t *v6mask,
const in6_addr_t *v6gateway, ushort_t type, ill_t *ill, zoneid_t zoneid,
uint_t flags, tsol_gc_t *gc, ip_stack_t *ipst)
{
ire_t *ire;
int error;
ASSERT(!IN6_IS_ADDR_V4MAPPED(v6addr));
ire = kmem_cache_alloc(ire_cache, KM_NOSLEEP);
if (ire == NULL) {
DTRACE_PROBE(kmem__cache__alloc);
return (NULL);
}
*ire = ire_null;
error = ire_init_v6(ire, v6addr, v6mask, v6gateway,
type, ill, zoneid, flags, gc, ipst);
if (error != 0) {
DTRACE_PROBE2(ire__init__v6, ire_t *, ire, int, error);
kmem_cache_free(ire_cache, ire);
return (NULL);
}
return (ire);
}
ill_t *
ire_lookup_multi_ill_v6(const in6_addr_t *group, zoneid_t zoneid,
ip_stack_t *ipst, boolean_t *multirtp, in6_addr_t *setsrcp)
{
ire_t *ire;
ill_t *ill;
ire = ire_route_recursive_v6(group, 0, NULL, zoneid, NULL,
MATCH_IRE_DSTONLY, IRR_NONE, 0, ipst, setsrcp, NULL, NULL);
ASSERT(ire != NULL);
if (ire->ire_flags & (RTF_REJECT|RTF_BLACKHOLE)) {
ire_refrele(ire);
return (NULL);
}
if (multirtp != NULL)
*multirtp = (ire->ire_flags & RTF_MULTIRT) != 0;
ill = ire_nexthop_ill(ire);
ire_refrele(ire);
return (ill);
}
int
ip_mask_to_plen_v6(const in6_addr_t *v6mask)
{
int bits;
int plen = IPV6_ABITS;
int i;
for (i = 3; i >= 0; i--) {
if (v6mask->s6_addr32[i] == 0) {
plen -= 32;
continue;
}
bits = ffs(ntohl(v6mask->s6_addr32[i])) - 1;
if (bits == 0)
break;
plen -= bits;
}
return (plen);
}
in6_addr_t *
ip_plen_to_mask_v6(uint_t plen, in6_addr_t *bitmask)
{
uint32_t *ptr;
if (plen < 0 || plen > IPV6_ABITS)
return (NULL);
*bitmask = ipv6_all_zeros;
if (plen == 0)
return (bitmask);
ptr = (uint32_t *)bitmask;
while (plen > 32) {
*ptr++ = 0xffffffffU;
plen -= 32;
}
*ptr = htonl(0xffffffffU << (32 - plen));
return (bitmask);
}
ire_t *
ire_add_v6(ire_t *ire)
{
ire_t *ire1;
int mask_table_index;
irb_t *irb_ptr;
ire_t **irep;
int match_flags;
int error;
ip_stack_t *ipst = ire->ire_ipst;
ASSERT(ire->ire_ipversion == IPV6_VERSION);
V6_MASK_COPY(ire->ire_addr_v6, ire->ire_mask_v6, ire->ire_addr_v6);
mask_table_index = ip_mask_to_plen_v6(&ire->ire_mask_v6);
if ((ipst->ips_ip_forwarding_table_v6[mask_table_index]) == NULL) {
irb_t *ptr;
int i;
ptr = (irb_t *)mi_zalloc((ipst->ips_ip6_ftable_hash_size *
sizeof (irb_t)));
if (ptr == NULL) {
ire_delete(ire);
return (NULL);
}
for (i = 0; i < ipst->ips_ip6_ftable_hash_size; i++) {
rw_init(&ptr[i].irb_lock, NULL, RW_DEFAULT, NULL);
ptr[i].irb_ipst = ipst;
}
mutex_enter(&ipst->ips_ire_ft_init_lock);
if (ipst->ips_ip_forwarding_table_v6[mask_table_index] ==
NULL) {
ipst->ips_ip_forwarding_table_v6[mask_table_index] =
ptr;
mutex_exit(&ipst->ips_ire_ft_init_lock);
} else {
mutex_exit(&ipst->ips_ire_ft_init_lock);
for (i = 0; i < ipst->ips_ip6_ftable_hash_size; i++) {
rw_destroy(&ptr[i].irb_lock);
}
mi_free(ptr);
}
}
irb_ptr = &(ipst->ips_ip_forwarding_table_v6[mask_table_index][
IRE_ADDR_MASK_HASH_V6(ire->ire_addr_v6, ire->ire_mask_v6,
ipst->ips_ip6_ftable_hash_size)]);
match_flags = (MATCH_IRE_MASK | MATCH_IRE_TYPE | MATCH_IRE_GW);
if (ire->ire_ill != NULL)
match_flags |= MATCH_IRE_ILL;
error = ire_atomic_start(irb_ptr, ire);
if (error != 0) {
ire_delete(ire);
return (NULL);
}
if (ire->ire_testhidden)
match_flags |= MATCH_IRE_TESTHIDDEN;
for (ire1 = irb_ptr->irb_ire; ire1 != NULL; ire1 = ire1->ire_next) {
if (IRE_IS_CONDEMNED(ire1))
continue;
if (ire1->ire_zoneid != ire->ire_zoneid)
continue;
if (ire1->ire_type != ire->ire_type)
continue;
if (ire_match_args_v6(ire1, &ire->ire_addr_v6,
&ire->ire_mask_v6, &ire->ire_gateway_addr_v6,
ire->ire_type, ire->ire_ill, ire->ire_zoneid, NULL,
match_flags)) {
if (ire->ire_type != IRE_IF_CLONE) {
atomic_add_32(&ire1->ire_identical_ref, 1);
DTRACE_PROBE2(ire__add__exist, ire_t *, ire1,
ire_t *, ire);
}
ip1dbg(("found dup ire existing %p new %p",
(void *)ire1, (void *)ire));
ire_refhold(ire1);
ire_atomic_end(irb_ptr, ire);
ire_delete(ire);
return (ire1);
}
}
irep = (ire_t **)irb_ptr;
if (ire->ire_type & IRE_IF_CLONE) {
while ((ire1 = *irep) != NULL)
irep = &ire1->ire_next;
}
ire1 = *irep;
if (ire1 != NULL)
ire1->ire_ptpn = &ire->ire_next;
ire->ire_next = ire1;
ire->ire_ptpn = irep;
membar_producer();
*irep = ire;
ire->ire_bucket = irb_ptr;
ire_refhold_locked(ire);
BUMP_IRE_STATS(ipst->ips_ire_stats_v6, ire_stats_inserted);
irb_ptr->irb_ire_cnt++;
if (ire->ire_ill != NULL) {
DTRACE_PROBE3(ill__incr__cnt, (ill_t *), ire->ire_ill,
(char *), "ire", (void *), ire);
ire->ire_ill->ill_ire_cnt++;
ASSERT(ire->ire_ill->ill_ire_cnt != 0);
}
ire_atomic_end(irb_ptr, ire);
ire_flush_cache_v6(ire, IRE_FLUSH_ADD);
return (ire);
}
static void
ire_delete_host_redirects_v6(const in6_addr_t *gateway, ip_stack_t *ipst)
{
irb_t *irb_ptr;
irb_t *irb;
ire_t *ire;
in6_addr_t gw_addr_v6;
int i;
irb_ptr = ipst->ips_ip_forwarding_table_v6[(IP6_MASK_TABLE_SIZE - 1)];
if (irb_ptr == NULL)
return;
for (i = 0; (i < ipst->ips_ip6_ftable_hash_size); i++) {
irb = &irb_ptr[i];
irb_refhold(irb);
for (ire = irb->irb_ire; ire != NULL; ire = ire->ire_next) {
if (!(ire->ire_flags & RTF_DYNAMIC))
continue;
mutex_enter(&ire->ire_lock);
gw_addr_v6 = ire->ire_gateway_addr_v6;
mutex_exit(&ire->ire_lock);
if (IN6_ARE_ADDR_EQUAL(&gw_addr_v6, gateway))
ire_delete(ire);
}
irb_refrele(irb);
}
}
void
ire_delete_v6(ire_t *ire)
{
in6_addr_t gw_addr_v6;
ip_stack_t *ipst = ire->ire_ipst;
rw_enter(&ipst->ips_ip6_ire_head_lock, RW_WRITER);
rw_exit(&ipst->ips_ip6_ire_head_lock);
ASSERT(ire->ire_refcnt >= 1);
ASSERT(ire->ire_ipversion == IPV6_VERSION);
ire_flush_cache_v6(ire, IRE_FLUSH_DELETE);
if (ire->ire_type == IRE_DEFAULT) {
mutex_enter(&ire->ire_lock);
gw_addr_v6 = ire->ire_gateway_addr_v6;
mutex_exit(&ire->ire_lock);
ire_delete_host_redirects_v6(&gw_addr_v6, ipst);
}
if ((ire->ire_type & IRE_INTERFACE) && ire->ire_dep_children != 0)
ire_dep_delete_if_clone(ire);
rw_enter(&ipst->ips_ire_dep_lock, RW_WRITER);
if (ire->ire_dep_parent != NULL) {
ire_dep_remove(ire);
}
while (ire->ire_dep_children != NULL)
ire_dep_remove(ire->ire_dep_children);
rw_exit(&ipst->ips_ire_dep_lock);
}
void
ire_flush_cache_v6(ire_t *ire, int flag)
{
ip_stack_t *ipst = ire->ire_ipst;
if (ire->ire_type & IRE_IF_CLONE)
return;
rw_enter(&ipst->ips_ip6_ire_head_lock, RW_WRITER);
if (flag == IRE_FLUSH_ADD) {
ire_increment_generation(ipst->ips_ire_reject_v6);
ire_increment_generation(ipst->ips_ire_blackhole_v6);
}
if (ire->ire_type == IRE_DEFAULT && flag == IRE_FLUSH_ADD) {
rw_exit(&ipst->ips_ip6_ire_head_lock);
return;
}
switch (flag) {
case IRE_FLUSH_DELETE:
case IRE_FLUSH_GWCHANGE:
ire_dep_incr_generation(ire);
break;
case IRE_FLUSH_ADD: {
in6_addr_t addr;
in6_addr_t mask;
ip_stack_t *ipst = ire->ire_ipst;
uint_t masklen;
addr = ire->ire_addr_v6;
mask = ire->ire_mask_v6;
masklen = ip_mask_to_plen_v6(&mask);
ire = ire_ftable_lookup_impl_v6(&addr, &mask, NULL, 0, NULL,
ALL_ZONES, NULL, MATCH_IRE_SHORTERMASK, ipst);
while (ire != NULL) {
irb_increment_generation(ire->ire_bucket);
mask = ire->ire_mask_v6;
ASSERT(masklen > ip_mask_to_plen_v6(&mask));
masklen = ip_mask_to_plen_v6(&mask);
ire_refrele(ire);
ire = ire_ftable_lookup_impl_v6(&addr, &mask, NULL, 0,
NULL, ALL_ZONES, NULL, MATCH_IRE_SHORTERMASK, ipst);
}
}
break;
}
rw_exit(&ipst->ips_ip6_ire_head_lock);
}
boolean_t
ire_match_args_v6(ire_t *ire, const in6_addr_t *addr, const in6_addr_t *mask,
const in6_addr_t *gateway, int type, const ill_t *ill, zoneid_t zoneid,
const ts_label_t *tsl, int match_flags)
{
in6_addr_t gw_addr_v6 = { 0 };
ill_t *ire_ill = NULL, *dst_ill;
ip_stack_t *ipst = ire->ire_ipst;
ASSERT(ire->ire_ipversion == IPV6_VERSION);
ASSERT(addr != NULL);
ASSERT(mask != NULL);
ASSERT((!(match_flags & MATCH_IRE_GW)) || gateway != NULL);
ASSERT((!(match_flags & (MATCH_IRE_ILL|MATCH_IRE_SRC_ILL))) ||
(ill != NULL && ill->ill_isv6));
if (ire->ire_testhidden) {
if (!(match_flags & MATCH_IRE_TESTHIDDEN))
return (B_FALSE);
}
if (zoneid != ALL_ZONES && zoneid != ire->ire_zoneid &&
ire->ire_zoneid != ALL_ZONES) {
if (match_flags & MATCH_IRE_ZONEONLY)
return (B_FALSE);
if (ire->ire_type & IRE_LOOPBACK)
return (B_FALSE);
if (ire->ire_type & IRE_LOCAL)
goto matchit;
dst_ill = ire->ire_ill;
if (ire->ire_type & IRE_ONLINK) {
uint_t ifindex;
ifindex = dst_ill->ill_usesrc_ifindex;
if (ifindex == 0)
return (B_FALSE);
if (!ipif_zone_avail(ifindex, dst_ill->ill_isv6,
zoneid, ipst)) {
ip3dbg(("ire_match_args: no usrsrc for zone"
" dst_ill %p\n", (void *)dst_ill));
return (B_FALSE);
}
}
if (dst_ill != NULL && (ire->ire_type & IRE_OFFLINK)) {
ipif_t *tipif;
mutex_enter(&dst_ill->ill_lock);
for (tipif = dst_ill->ill_ipif;
tipif != NULL; tipif = tipif->ipif_next) {
if (!IPIF_IS_CONDEMNED(tipif) &&
(tipif->ipif_flags & IPIF_UP) &&
(tipif->ipif_zoneid == zoneid ||
tipif->ipif_zoneid == ALL_ZONES))
break;
}
mutex_exit(&dst_ill->ill_lock);
if (tipif == NULL)
return (B_FALSE);
}
}
matchit:
ire_ill = ire->ire_ill;
if (match_flags & MATCH_IRE_GW) {
mutex_enter(&ire->ire_lock);
gw_addr_v6 = ire->ire_gateway_addr_v6;
mutex_exit(&ire->ire_lock);
}
if (match_flags & MATCH_IRE_ILL) {
if ((match_flags & MATCH_IRE_TESTHIDDEN) &&
!(ire->ire_type & IRE_LOCAL)) {
if (ire->ire_ill != ill)
return (B_FALSE);
} else {
match_flags &= ~MATCH_IRE_TESTHIDDEN;
if (ire_ill == NULL || !IS_ON_SAME_LAN(ill, ire_ill))
return (B_FALSE);
}
}
if (match_flags & MATCH_IRE_SRC_ILL) {
if (ire_ill == NULL)
return (B_FALSE);
if (!IS_ON_SAME_LAN(ill, ire_ill)) {
if (ire_ill->ill_usesrc_ifindex == 0 ||
(ire_ill->ill_usesrc_ifindex !=
ill->ill_phyint->phyint_ifindex))
return (B_FALSE);
}
}
ASSERT(V6_MASK_EQ(ire->ire_addr_v6, ire->ire_mask_v6,
ire->ire_addr_v6));
if (V6_MASK_EQ(*addr, *mask, ire->ire_addr_v6) &&
((!(match_flags & MATCH_IRE_GW)) ||
((!(match_flags & MATCH_IRE_DIRECT)) ||
!(ire->ire_flags & RTF_INDIRECT)) &&
IN6_ARE_ADDR_EQUAL(&gw_addr_v6, gateway)) &&
((!(match_flags & MATCH_IRE_TYPE)) || (ire->ire_type & type)) &&
((!(match_flags & MATCH_IRE_TESTHIDDEN)) || ire->ire_testhidden) &&
((!(match_flags & MATCH_IRE_MASK)) ||
(IN6_ARE_ADDR_EQUAL(&ire->ire_mask_v6, mask))) &&
((!(match_flags & MATCH_IRE_SECATTR)) ||
(!is_system_labeled()) ||
(tsol_ire_match_gwattr(ire, tsl) == 0))) {
return (B_TRUE);
}
return (B_FALSE);
}
boolean_t
ire_gateway_ok_zone_v6(const in6_addr_t *gateway, zoneid_t zoneid, ill_t *ill,
const ts_label_t *tsl, ip_stack_t *ipst, boolean_t lock_held)
{
ire_t *ire;
uint_t match_flags;
if (lock_held)
ASSERT(RW_READ_HELD(&ipst->ips_ip6_ire_head_lock));
else
rw_enter(&ipst->ips_ip6_ire_head_lock, RW_READER);
match_flags = MATCH_IRE_TYPE | MATCH_IRE_SECATTR;
if (ill != NULL)
match_flags |= MATCH_IRE_ILL;
ire = ire_ftable_lookup_impl_v6(gateway, &ipv6_all_zeros,
&ipv6_all_zeros, IRE_INTERFACE, ill, zoneid, tsl, match_flags,
ipst);
if (!lock_held)
rw_exit(&ipst->ips_ip6_ire_head_lock);
if (ire != NULL) {
ire_refrele(ire);
return (B_TRUE);
} else {
return (B_FALSE);
}
}
ire_t *
ire_ftable_lookup_v6(const in6_addr_t *addr, const in6_addr_t *mask,
const in6_addr_t *gateway, int type, const ill_t *ill,
zoneid_t zoneid, const ts_label_t *tsl, int flags,
uint32_t xmit_hint, ip_stack_t *ipst, uint_t *generationp)
{
ire_t *ire = NULL;
ASSERT(addr != NULL);
ASSERT((!(flags & MATCH_IRE_MASK)) || mask != NULL);
ASSERT((!(flags & MATCH_IRE_GW)) || gateway != NULL);
ASSERT(ill == NULL || ill->ill_isv6);
ASSERT(!IN6_IS_ADDR_V4MAPPED(addr));
if ((flags & (MATCH_IRE_ILL|MATCH_IRE_SRC_ILL)) && (ill == NULL))
return (NULL);
rw_enter(&ipst->ips_ip6_ire_head_lock, RW_READER);
ire = ire_ftable_lookup_impl_v6(addr, mask, gateway, type, ill, zoneid,
tsl, flags, ipst);
if (ire == NULL) {
rw_exit(&ipst->ips_ip6_ire_head_lock);
return (NULL);
}
if (ire->ire_bucket->irb_ire_cnt > 1 && !(flags & MATCH_IRE_GW)) {
if (ipst->ips_ip_ecmp_behavior == 2 ||
(ipst->ips_ip_ecmp_behavior == 1 &&
IS_DEFAULT_ROUTE_V6(ire))) {
ire_t *next_ire;
ire_ftable_args_t margs;
bzero(&margs, sizeof (margs));
margs.ift_addr_v6 = *addr;
if (mask != NULL)
margs.ift_mask_v6 = *mask;
if (gateway != NULL)
margs.ift_gateway_v6 = *gateway;
margs.ift_type = type;
margs.ift_ill = ill;
margs.ift_zoneid = zoneid;
margs.ift_tsl = tsl;
margs.ift_flags = flags;
next_ire = ire_round_robin(ire->ire_bucket, &margs,
xmit_hint, ire, ipst);
if (next_ire == NULL) {
goto done;
}
ire_refrele(ire);
ire = next_ire;
}
}
done:
if (generationp != NULL)
*generationp = ire->ire_generation;
rw_exit(&ipst->ips_ip6_ire_head_lock);
if ((ire->ire_type & IRE_LOCAL) && zoneid != ALL_ZONES &&
ire->ire_zoneid != zoneid && ire->ire_zoneid != ALL_ZONES &&
ipst->ips_ip_restrict_interzone_loopback) {
ire = ire_alt_local(ire, zoneid, tsl, ill, generationp);
ASSERT(ire != NULL);
}
return (ire);
}
ire_t *
ire_ftable_lookup_impl_v6(const in6_addr_t *addr, const in6_addr_t *mask,
const in6_addr_t *gateway, int type, const ill_t *ill,
zoneid_t zoneid, const ts_label_t *tsl, int flags,
ip_stack_t *ipst)
{
irb_t *irb_ptr;
ire_t *ire = NULL;
int i;
ASSERT(RW_LOCK_HELD(&ipst->ips_ip6_ire_head_lock));
if (flags & MATCH_IRE_MASK) {
uint_t masklen;
masklen = ip_mask_to_plen_v6(mask);
if (ipst->ips_ip_forwarding_table_v6[masklen] == NULL) {
return (NULL);
}
irb_ptr = &(ipst->ips_ip_forwarding_table_v6[masklen][
IRE_ADDR_MASK_HASH_V6(*addr, *mask,
ipst->ips_ip6_ftable_hash_size)]);
rw_enter(&irb_ptr->irb_lock, RW_READER);
for (ire = irb_ptr->irb_ire; ire != NULL;
ire = ire->ire_next) {
if (IRE_IS_CONDEMNED(ire))
continue;
if (ire_match_args_v6(ire, addr, mask, gateway, type,
ill, zoneid, tsl, flags))
goto found_ire;
}
rw_exit(&irb_ptr->irb_lock);
} else {
uint_t masklen;
if (flags & MATCH_IRE_SHORTERMASK) {
masklen = ip_mask_to_plen_v6(mask);
if (masklen == 0) {
return (NULL);
}
masklen--;
} else {
masklen = IP6_MASK_TABLE_SIZE - 1;
}
for (i = masklen; i >= 0; i--) {
in6_addr_t tmpmask;
if ((ipst->ips_ip_forwarding_table_v6[i]) == NULL)
continue;
(void) ip_plen_to_mask_v6(i, &tmpmask);
irb_ptr = &ipst->ips_ip_forwarding_table_v6[i][
IRE_ADDR_MASK_HASH_V6(*addr, tmpmask,
ipst->ips_ip6_ftable_hash_size)];
rw_enter(&irb_ptr->irb_lock, RW_READER);
for (ire = irb_ptr->irb_ire; ire != NULL;
ire = ire->ire_next) {
if (IRE_IS_CONDEMNED(ire))
continue;
if (ire_match_args_v6(ire, addr,
&ire->ire_mask_v6, gateway, type, ill,
zoneid, tsl, flags))
goto found_ire;
}
rw_exit(&irb_ptr->irb_lock);
}
}
ASSERT(ire == NULL);
ip1dbg(("ire_ftable_lookup_v6: returning NULL ire"));
return (NULL);
found_ire:
ire_refhold(ire);
rw_exit(&irb_ptr->irb_lock);
return (ire);
}
ire_t *
ire_ftable_lookup_simple_v6(const in6_addr_t *addr, uint32_t xmit_hint,
ip_stack_t *ipst, uint_t *generationp)
{
ire_t *ire;
ire = ire_ftable_lookup_v6(addr, NULL, NULL, 0, NULL, ALL_ZONES, NULL,
MATCH_IRE_DSTONLY, xmit_hint, ipst, generationp);
if (ire == NULL) {
ire = ire_reject(ipst, B_TRUE);
if (generationp != NULL)
*generationp = IRE_GENERATION_VERIFY;
}
return (ire);
}
ire_t *
ip_select_route_v6(const in6_addr_t *dst, const in6_addr_t src,
ip_xmit_attr_t *ixa, uint_t *generationp, in6_addr_t *setsrcp,
int *errorp, boolean_t *multirtp)
{
ASSERT(!(ixa->ixa_flags & IXAF_IS_IPV4));
return (ip_select_route(dst, src, ixa, generationp, setsrcp, errorp,
multirtp));
}
ire_t *
ire_route_recursive_impl_v6(ire_t *ire,
const in6_addr_t *nexthop, uint_t ire_type, const ill_t *ill_arg,
zoneid_t zoneid, const ts_label_t *tsl, uint_t match_args,
uint_t irr_flags, uint32_t xmit_hint, ip_stack_t *ipst,
in6_addr_t *setsrcp, tsol_ire_gw_secattr_t **gwattrp, uint_t *generationp)
{
int i, j;
in6_addr_t v6nexthop = *nexthop;
ire_t *ires[MAX_IRE_RECURSION];
uint_t generation;
uint_t generations[MAX_IRE_RECURSION];
boolean_t need_refrele = B_FALSE;
boolean_t invalidate = B_FALSE;
ill_t *ill = NULL;
uint_t maskoff = (IRE_LOCAL|IRE_LOOPBACK);
if (setsrcp != NULL)
ASSERT(IN6_IS_ADDR_UNSPECIFIED(setsrcp));
if (gwattrp != NULL)
ASSERT(*gwattrp == NULL);
i = 0;
while (i < MAX_IRE_RECURSION - 1) {
if (ire == NULL) {
ire = ire_ftable_lookup_v6(&v6nexthop, 0, 0, ire_type,
(ill != NULL ? ill : ill_arg), zoneid, tsl,
match_args, xmit_hint, ipst, &generation);
} else {
ire_refhold(ire);
if (generationp != NULL)
generation = *generationp;
else
generation = IRE_GENERATION_VERIFY;
}
if (ire == NULL) {
if (i > 0 && (irr_flags & IRR_INCOMPLETE)) {
ire = ires[0];
ire_refhold(ire);
} else {
ire = ire_reject(ipst, B_TRUE);
}
goto error;
}
if (ire->ire_flags & (RTF_REJECT|RTF_BLACKHOLE))
goto error;
ASSERT(!(ire->ire_type & IRE_MULTICAST));
if ((ire->ire_type & IRE_IF_CLONE) && !ire_clone_verify(ire)) {
ire_refrele(ire);
ire = NULL;
continue;
}
match_args |= MATCH_IRE_DIRECT;
if ((ire->ire_type & IRE_OFFLINK) &&
!(ire->ire_flags & RTF_INDIRECT)) {
ire_type = IRE_IF_ALL;
} else {
if (!(match_args & MATCH_IRE_TYPE))
ire_type = (IRE_OFFLINK|IRE_ONLINK);
ire_type &= ~maskoff;
}
match_args |= MATCH_IRE_TYPE;
ires[i] = ire;
generations[i] = generation;
i++;
if ((ire->ire_flags & RTF_SETSRC) &&
setsrcp != NULL && IN6_IS_ADDR_UNSPECIFIED(setsrcp)) {
ASSERT(!IN6_IS_ADDR_UNSPECIFIED(
&ire->ire_setsrc_addr_v6));
*setsrcp = ire->ire_setsrc_addr_v6;
}
if (ire->ire_gw_secattr != NULL &&
gwattrp != NULL && *gwattrp == NULL)
*gwattrp = ire->ire_gw_secattr;
mutex_enter(&ire->ire_lock);
if (ire->ire_dep_parent != NULL &&
ire->ire_dep_parent->ire_generation ==
ire->ire_dep_parent_generation) {
mutex_exit(&ire->ire_lock);
ire = NULL;
goto done;
}
mutex_exit(&ire->ire_lock);
if (ire->ire_nce_capable) {
ire = NULL;
goto done;
}
ASSERT(!(ire->ire_type & IRE_IF_CLONE));
if (ire->ire_type & IRE_INTERFACE) {
ire_t *clone;
ASSERT(ire->ire_masklen != IPV6_ABITS);
if (!(irr_flags & IRR_ALLOCATE)) {
invalidate = B_TRUE;
ire = NULL;
goto done;
}
clone = ire_create_if_clone(ire, &v6nexthop,
&generation);
if (clone == NULL) {
invalidate = B_TRUE;
ire = ire_blackhole(ipst, B_TRUE);
goto error;
}
ASSERT(i >= 1);
ASSERT(i < MAX_IRE_RECURSION);
ires[i] = ires[i-1];
generations[i] = generations[i-1];
ires[i-1] = clone;
generations[i-1] = generation;
i++;
ire = NULL;
goto done;
}
match_args &= (MATCH_IRE_TYPE | MATCH_IRE_DIRECT);
v6nexthop = ire->ire_gateway_addr_v6;
if (ill == NULL && ire->ire_ill != NULL) {
ill = ire->ire_ill;
need_refrele = B_TRUE;
ill_refhold(ill);
match_args |= MATCH_IRE_ILL;
}
ire = NULL;
}
ASSERT(ire == NULL);
ire = ire_reject(ipst, B_TRUE);
error:
ASSERT(ire != NULL);
if (need_refrele)
ill_refrele(ill);
if (i > 0 && (ires[0]->ire_flags & RTF_MULTIRT))
(void) ire_no_good(ires[0]);
cleanup:
ire_dep_unbuild(ires, i);
for (j = 0; j < i; j++)
ire_refrele(ires[j]);
ASSERT((ire->ire_flags & (RTF_REJECT|RTF_BLACKHOLE)) ||
(irr_flags & IRR_INCOMPLETE));
if (generationp != NULL)
*generationp = IRE_GENERATION_VERIFY;
return (ire);
done:
ASSERT(ire == NULL);
if (need_refrele)
ill_refrele(ill);
if (i > 1 && !ire_dep_build(ires, generations, i)) {
ire = ire_blackhole(ipst, B_TRUE);
goto cleanup;
}
for (j = 1; j < i; j++)
ire_refrele(ires[j]);
if (invalidate) {
ire_dep_invalidate_generations(ires[0]);
generation = IRE_GENERATION_VERIFY;
} else {
if (ires[0]->ire_dep_parent == NULL)
generation = ires[0]->ire_generation;
else
generation = ire_dep_validate_generations(ires[0]);
if (generations[0] != ires[0]->ire_generation) {
generation = IRE_GENERATION_VERIFY;
}
}
if (generationp != NULL)
*generationp = generation;
return (ires[0]);
}
ire_t *
ire_route_recursive_v6(const in6_addr_t *nexthop, uint_t ire_type,
const ill_t *ill, zoneid_t zoneid, const ts_label_t *tsl, uint_t match_args,
uint_t irr_flags, uint32_t xmit_hint, ip_stack_t *ipst,
in6_addr_t *setsrcp, tsol_ire_gw_secattr_t **gwattrp, uint_t *generationp)
{
return (ire_route_recursive_impl_v6(NULL, nexthop, ire_type, ill,
zoneid, tsl, match_args, irr_flags, xmit_hint, ipst, setsrcp,
gwattrp, generationp));
}
ire_t *
ire_route_recursive_dstonly_v6(const in6_addr_t *nexthop, uint_t irr_flags,
uint32_t xmit_hint, ip_stack_t *ipst)
{
ire_t *ire;
ire_t *ire1;
uint_t generation;
ire = ire_ftable_lookup_simple_v6(nexthop, xmit_hint, ipst,
&generation);
ASSERT(ire != NULL);
mutex_enter(&ire->ire_lock);
if (ire->ire_dep_parent != NULL) {
if (ire->ire_dep_parent->ire_generation ==
ire->ire_dep_parent_generation) {
mutex_exit(&ire->ire_lock);
return (ire);
}
mutex_exit(&ire->ire_lock);
} else {
mutex_exit(&ire->ire_lock);
if (ire->ire_nce_capable)
return (ire);
}
ire1 = ire_route_recursive_impl_v6(ire, nexthop, 0, NULL, ALL_ZONES,
NULL, MATCH_IRE_DSTONLY, irr_flags, xmit_hint, ipst, NULL, NULL,
&generation);
ire_refrele(ire);
return (ire1);
}