#include <sys/param.h>
#include <sys/mbuf.h>
#include <sys/mutex.h>
#include <sys/systm.h>
#include <sys/socket.h>
#include <sys/protosw.h>
#include <sys/sysctl.h>
#include <net/if.h>
#include <net/if_var.h>
#include <netinet/in.h>
#include <netinet/in_var.h>
#include <netinet/ip.h>
#include <netinet/ip_var.h>
#include <netinet/igmp.h>
#include <netinet/igmp_var.h>
/*
 * Value igmp_sendpkt() hands to ip_output() as its fourth argument.
 * NOTE(review): presumably that is the "flags" parameter, i.e. no special
 * output flags are requested -- confirm against the ip_output() prototype.
 */
#define IP_MULTICASTOPTS 0
/*
 * Per-interface record of which IGMP version the querier on that interface
 * is assumed to speak.  Entries are linked on rti_head and looked up by
 * interface index (see rti_find()).
 */
struct router_info {
/* linkage on rti_head */
LIST_ENTRY(router_info) rti_list;
/* index of the interface this entry describes */
unsigned int rti_ifidx;
/* IGMP_v1_ROUTER or IGMP_v2_ROUTER */
int rti_type;
/*
 * Reset to 0 by rti_reset(); incremented by igmp_slowtimo() while the
 * type is IGMP_v1_ROUTER.
 */
int rti_age;
};
/*
 * Non-zero when some group membership timer may still be counting down;
 * igmp_fasttimo() returns immediately while it is zero.
 */
int igmp_timers_are_running;
/* Held around every walk or modification of rti_head in this file. */
struct mutex igmp_mtx = MUTEX_INITIALIZER(IPL_SOFTNET);
/* List of router_info entries, one per interface that has one. */
static LIST_HEAD(, router_info) rti_head;
/*
 * mbuf built once by igmp_init() and passed as the options argument of
 * ip_output() for every message igmp_sendpkt() transmits.
 */
static struct mbuf *router_alert;
/* IGMP statistics counters, allocated by counters_alloc() in igmp_init(). */
struct cpumem *igmpcounters;
/* Forward declarations for functions defined later in this file. */
int igmp_checktimer(struct ifnet *, struct igmp_pktlist *);
int rti_fill(struct in_multi *);
int rti_reset(struct ifnet *);
int igmp_input_if(struct ifnet *, struct mbuf **, int *, int, int,
struct netstack *);
int igmp_sysctl_igmpstat(void *, size_t *, void *);
/*
 * One-time IGMP set-up: empty the router list, clear the timer flag,
 * allocate the statistics counters and build the option mbuf that is
 * attached to every outgoing IGMP message.
 */
void
igmp_init(void)
{
	struct ipoption *opt;

	LIST_INIT(&rti_head);
	igmp_timers_are_running = 0;
	igmpcounters = counters_alloc(igps_ncounters);

	/*
	 * The option mbuf carries a zero first-hop address followed by a
	 * four byte IPOPT_RA option whose two value bytes are zero.
	 */
	router_alert = m_get(M_WAIT, MT_DATA);
	opt = mtod(router_alert, struct ipoption *);
	opt->ipopt_dst.s_addr = INADDR_ANY;
	opt->ipopt_list[0] = IPOPT_RA;	/* option type */
	opt->ipopt_list[1] = 0x04;	/* option length, used below */
	opt->ipopt_list[2] = 0x00;	/* value, first byte */
	opt->ipopt_list[3] = 0x00;	/* value, second byte */

	/* Valid data: the address plus as many bytes as the option claims. */
	router_alert->m_len = sizeof(opt->ipopt_dst) + opt->ipopt_list[1];
}
static struct router_info *
rti_find(unsigned int ifidx)
{
struct router_info *rti;
MUTEX_ASSERT_LOCKED(&igmp_mtx);
LIST_FOREACH(rti, &rti_head, rti_list) {
if (rti->rti_ifidx == ifidx)
return (rti);
}
return (NULL);
}
/*
 * Attach the router_info of inm's interface to inm->inm_rti, creating a
 * new IGMP_v2_ROUTER entry when the interface has none yet.
 *
 * Returns the report type matching the router version on record:
 * IGMP_v1_HOST_MEMBERSHIP_REPORT for an IGMP_v1_ROUTER entry, otherwise
 * IGMP_v2_HOST_MEMBERSHIP_REPORT.
 */
int
rti_fill(struct in_multi *inm)
{
	struct router_info *rti, *spare = NULL;
	int type;

	mtx_enter(&igmp_mtx);
	rti = rti_find(inm->inm_ifidx);
	if (rti == NULL) {
		/*
		 * The allocation uses M_WAITOK, so it is done with the
		 * mutex released.
		 */
		mtx_leave(&igmp_mtx);
		spare = malloc(sizeof(*rti), M_MRTABLE, M_WAITOK);
		mtx_enter(&igmp_mtx);

		/* The list may have changed while the mutex was released. */
		rti = rti_find(inm->inm_ifidx);
		if (rti == NULL) {
			spare->rti_ifidx = inm->inm_ifidx;
			spare->rti_type = IGMP_v2_ROUTER;
			LIST_INSERT_HEAD(&rti_head, spare, rti_list);
			inm->inm_rti = spare;
			mtx_leave(&igmp_mtx);

			return (IGMP_v2_HOST_MEMBERSHIP_REPORT);
		}
	}

	/* An entry already exists; use it and drop any unused allocation. */
	inm->inm_rti = rti;
	type = rti->rti_type;
	mtx_leave(&igmp_mtx);

	free(spare, M_MRTABLE, sizeof(*rti));

	if (type == IGMP_v1_ROUTER)
		return (IGMP_v1_HOST_MEMBERSHIP_REPORT);
	return (IGMP_v2_HOST_MEMBERSHIP_REPORT);
}
/*
 * Mark the querier on ifp as an IGMPv1 router and restart its age,
 * creating the router_info entry if the interface has none.
 *
 * Returns 0 on success or ENOBUFS when a new entry cannot be allocated.
 */
int
rti_reset(struct ifnet *ifp)
{
	struct router_info *entry;

	mtx_enter(&igmp_mtx);

	entry = rti_find(ifp->if_index);
	if (entry == NULL) {
		/* Allocated with the mutex held, hence M_NOWAIT. */
		entry = malloc(sizeof(*entry), M_MRTABLE, M_NOWAIT);
		if (entry == NULL) {
			mtx_leave(&igmp_mtx);
			return (ENOBUFS);
		}
		entry->rti_ifidx = ifp->if_index;
		LIST_INSERT_HEAD(&rti_head, entry, rti_list);
	}

	entry->rti_type = IGMP_v1_ROUTER;
	entry->rti_age = 0;

	mtx_leave(&igmp_mtx);

	return (0);
}
/*
 * Unlink and free the router_info entry of ifp, if it has one.
 */
void
rti_delete(struct ifnet *ifp)
{
	struct router_info *victim;

	mtx_enter(&igmp_mtx);
	victim = rti_find(ifp->if_index);
	if (victim != NULL) {
		LIST_REMOVE(victim, rti_list);
	}
	mtx_leave(&igmp_mtx);

	/* victim is NULL here when the interface had no entry. */
	free(victim, M_MRTABLE, sizeof(*victim));
}
/*
 * Protocol input entry point for IGMP.
 *
 * Counts the packet, resolves the receiving interface from the packet
 * header and runs igmp_input_if() under the kernel lock.  When the
 * interface no longer exists the packet is freed.
 *
 * Returns whatever igmp_input_if() returns, or IPPROTO_DONE when the
 * packet was dropped here.
 */
int
igmp_input(struct mbuf **mp, int *offp, int proto, int af, struct netstack *ns)
{
	struct ifnet *rcvif;
	int next;

	igmpstat_inc(igps_rcv_total);

	rcvif = if_get((*mp)->m_pkthdr.ph_ifidx);
	if (rcvif != NULL) {
		KERNEL_LOCK();
		next = igmp_input_if(rcvif, mp, offp, proto, af, ns);
		KERNEL_UNLOCK();
		if_put(rcvif);
	} else {
		m_freemp(mp);
		next = IPPROTO_DONE;
	}

	return next;
}
/*
 * Process one IGMP message received on ifp.
 *
 * *mp is the packet, starting at the IP header; *offp is the length of that
 * IP header.  The message length and checksum are validated first.  Queries
 * arm (or re-arm) the report timers of the interface's group memberships;
 * v1 and v2 membership reports from others cancel our own pending report
 * for the same group.  All membership state is changed with
 * ifp->if_maddrlock write-locked.
 *
 * Packets that fail validation are freed and IPPROTO_DONE is returned.
 * Every other packet, including message types not handled by the switch,
 * is handed to rip_input() and its return value is returned.
 */
int
igmp_input_if(struct ifnet *ifp, struct mbuf **mp, int *offp, int proto,
int af, struct netstack *ns)
{
struct mbuf *m = *mp;
int iphlen = *offp;
struct ip *ip = mtod(m, struct ip *);
struct igmp *igmp;
int igmplen;
int minlen;
struct ifmaddr *ifma;
struct in_multi *inm;
struct in_ifaddr *ia;
int error, timer, running = 0;
/* Length of the IGMP message: total IP length minus the IP header. */
igmplen = ntohs(ip->ip_len) - iphlen;
/* Validate lengths. */
if (igmplen < IGMP_MINLEN) {
igmpstat_inc(igps_rcv_tooshort);
m_freem(m);
return IPPROTO_DONE;
}
minlen = iphlen + IGMP_MINLEN;
/*
 * Make the IP header plus the minimal IGMP header contiguous in the first
 * mbuf.  On m_pullup() failure the chain is not freed here.
 * NOTE(review): presumably m_pullup() has already freed it -- confirm.
 */
if ((m->m_flags & M_EXT || m->m_len < minlen) &&
(m = *mp = m_pullup(m, minlen)) == NULL) {
igmpstat_inc(igps_rcv_tooshort);
return IPPROTO_DONE;
}
/*
 * Validate checksum: temporarily step over the IP header so that
 * in_cksum() covers the IGMP message only, then restore the mbuf.
 */
m->m_data += iphlen;
m->m_len -= iphlen;
igmp = mtod(m, struct igmp *);
if (in_cksum(m, igmplen)) {
igmpstat_inc(igps_rcv_badsum);
m_freem(m);
return IPPROTO_DONE;
}
m->m_data -= iphlen;
m->m_len += iphlen;
/* m may have been replaced by m_pullup(); reload the IP header pointer. */
ip = mtod(m, struct ip *);
switch (igmp->igmp_type) {
case IGMP_HOST_MEMBERSHIP_QUERY:
igmpstat_inc(igps_rcv_queries);
/* Queries arriving on a loopback interface are not acted upon. */
if (ifp->if_flags & IFF_LOOPBACK)
break;
if (igmp->igmp_code == 0) {
/*
 * A zero code field is handled as an IGMPv1 query: record a v1 router
 * on this interface (rti_reset() also restarts its age).
 */
error = rti_reset(ifp);
if (error) {
m_freem(m);
return IPPROTO_DONE;
}
/* Such a query is only accepted when sent to the all-hosts group. */
if (ip->ip_dst.s_addr != INADDR_ALLHOSTS_GROUP) {
igmpstat_inc(igps_rcv_badqueries);
m_freem(m);
return IPPROTO_DONE;
}
/*
 * Start a random report timer on every IPv4 membership of this
 * interface whose timer is not already running, except for groups
 * matched by IN_LOCAL_GROUP().
 */
rw_enter_write(&ifp->if_maddrlock);
TAILQ_FOREACH(ifma, &ifp->if_maddrlist, ifma_list) {
if (ifma->ifma_addr->sa_family != AF_INET)
continue;
inm = ifmatoinm(ifma);
if (inm->inm_timer == 0 &&
!IN_LOCAL_GROUP(inm->inm_addr.s_addr)) {
inm->inm_state = IGMP_DELAYING_MEMBER;
inm->inm_timer = IGMP_RANDOM_DELAY(
IGMP_MAX_HOST_REPORT_DELAY * PR_FASTHZ);
running = 1;
}
}
rw_exit_write(&ifp->if_maddrlock);
} else {
/* Non-zero code field: the destination must be a multicast address. */
if (!IN_MULTICAST(ip->ip_dst.s_addr)) {
igmpstat_inc(igps_rcv_badqueries);
m_freem(m);
return IPPROTO_DONE;
}
/*
 * Convert the code field into fast-timeout ticks, using at least one
 * tick so that the timer actually runs.
 */
timer = igmp->igmp_code * PR_FASTHZ / IGMP_TIMER_SCALE;
if (timer == 0)
timer = 1;
/*
 * Walk the IPv4 memberships the query applies to: every non-local group
 * for a query sent to the all-hosts group, otherwise only the group the
 * query was addressed to.
 */
rw_enter_write(&ifp->if_maddrlock);
TAILQ_FOREACH(ifma, &ifp->if_maddrlist, ifma_list) {
if (ifma->ifma_addr->sa_family != AF_INET)
continue;
inm = ifmatoinm(ifma);
if (!IN_LOCAL_GROUP(inm->inm_addr.s_addr) &&
(ip->ip_dst.s_addr == INADDR_ALLHOSTS_GROUP ||
ip->ip_dst.s_addr == inm->inm_addr.s_addr)) {
switch (inm->inm_state) {
case IGMP_DELAYING_MEMBER:
/*
 * A timer that already expires within the new maximum is left alone;
 * a longer one is restarted below.
 */
if (inm->inm_timer <= timer)
break;
/* FALLTHROUGH */
case IGMP_IDLE_MEMBER:
case IGMP_LAZY_MEMBER:
case IGMP_AWAKENING_MEMBER:
inm->inm_state =
IGMP_DELAYING_MEMBER;
inm->inm_timer =
IGMP_RANDOM_DELAY(timer);
running = 1;
break;
case IGMP_SLEEPING_MEMBER:
/* No timer is started for a sleeping member; it only changes state. */
inm->inm_state =
IGMP_AWAKENING_MEMBER;
break;
}
}
}
rw_exit_write(&ifp->if_maddrlock);
}
break;
case IGMP_v1_HOST_MEMBERSHIP_REPORT:
igmpstat_inc(igps_rcv_reports);
if (ifp->if_flags & IFF_LOOPBACK)
break;
/* The reported group must be multicast and equal the IP destination. */
if (!IN_MULTICAST(igmp->igmp_group.s_addr) ||
igmp->igmp_group.s_addr != ip->ip_dst.s_addr) {
igmpstat_inc(igps_rcv_badreports);
m_freem(m);
return IPPROTO_DONE;
}
/*
 * When the source address has an all-zero class A network part, it is
 * overwritten with the interface's ia_net before the packet is passed on.
 * NOTE(review): the consumer that needs this rewrite is not visible in
 * this file.
 */
if ((ip->ip_src.s_addr & IN_CLASSA_NET) == 0) {
ia = in_ifp2ia(ifp);
if (ia)
ip->ip_src.s_addr = ia->ia_net;
}
/*
 * If we are a member of the reported group on this interface, stop our
 * own timer for it and update the membership state.
 */
rw_enter_write(&ifp->if_maddrlock);
inm = in_lookupmulti(&igmp->igmp_group, ifp);
if (inm != NULL) {
inm->inm_timer = 0;
igmpstat_inc(igps_rcv_ourreports);
switch (inm->inm_state) {
case IGMP_IDLE_MEMBER:
case IGMP_LAZY_MEMBER:
case IGMP_AWAKENING_MEMBER:
case IGMP_SLEEPING_MEMBER:
inm->inm_state = IGMP_SLEEPING_MEMBER;
break;
case IGMP_DELAYING_MEMBER:
/* The resulting state depends on the router version on record. */
if (inm->inm_rti->rti_type == IGMP_v1_ROUTER)
inm->inm_state = IGMP_LAZY_MEMBER;
else
inm->inm_state = IGMP_SLEEPING_MEMBER;
break;
}
}
rw_exit_write(&ifp->if_maddrlock);
break;
case IGMP_v2_HOST_MEMBERSHIP_REPORT:
#ifdef MROUTING
/*
 * With MROUTING, a report whose source is this interface's own address
 * is skipped (not even counted) and goes straight to rip_input().
 */
ia = in_ifp2ia(ifp);
if (ia && ip->ip_src.s_addr == ia->ia_addr.sin_addr.s_addr)
break;
#endif
igmpstat_inc(igps_rcv_reports);
if (ifp->if_flags & IFF_LOOPBACK)
break;
/* The reported group must be multicast and equal the IP destination. */
if (!IN_MULTICAST(igmp->igmp_group.s_addr) ||
igmp->igmp_group.s_addr != ip->ip_dst.s_addr) {
igmpstat_inc(igps_rcv_badreports);
m_freem(m);
return IPPROTO_DONE;
}
/* Same source address rewrite as for v1 reports. */
if ((ip->ip_src.s_addr & IN_CLASSA_NET) == 0) {
#ifndef MROUTING
/* With MROUTING, ia was already looked up at the top of this case. */
ia = in_ifp2ia(ifp);
#endif
if (ia)
ip->ip_src.s_addr = ia->ia_net;
}
/*
 * If we are a member of the reported group on this interface, stop our
 * own timer for it and update the membership state.
 */
rw_enter_write(&ifp->if_maddrlock);
inm = in_lookupmulti(&igmp->igmp_group, ifp);
if (inm != NULL) {
inm->inm_timer = 0;
igmpstat_inc(igps_rcv_ourreports);
switch (inm->inm_state) {
case IGMP_DELAYING_MEMBER:
case IGMP_IDLE_MEMBER:
case IGMP_AWAKENING_MEMBER:
inm->inm_state = IGMP_LAZY_MEMBER;
break;
case IGMP_LAZY_MEMBER:
case IGMP_SLEEPING_MEMBER:
break;
}
}
rw_exit_write(&ifp->if_maddrlock);
break;
}
/* A timer was started above: let igmp_fasttimo() do its work again. */
if (running)
atomic_store_int(&igmp_timers_are_running, 1);
/* Hand every packet that was not dropped above to rip_input(). */
return rip_input(mp, offp, proto, af, ns);
}
/*
 * Initialise the IGMP state of a newly joined membership.
 *
 * Groups matched by IN_LOCAL_GROUP() and memberships on loopback
 * interfaces become idle with no timer, and pkt is left untouched.  For
 * every other membership a random report timer is started and pkt is
 * filled in with the membership report to send; the report type comes
 * from rti_fill(), which also sets inm->inm_rti.
 *
 * The caller must hold ifp->if_maddrlock write-locked.
 */
void
igmp_joingroup(struct in_multi *inm, struct ifnet *ifp,
    struct igmp_pktinfo *pkt)
{
	rw_assert_wrlock(&ifp->if_maddrlock);

	if (IN_LOCAL_GROUP(inm->inm_addr.s_addr) ||
	    (ifp->if_flags & IFF_LOOPBACK) != 0) {
		/* Nothing is ever reported for these memberships. */
		inm->inm_state = IGMP_IDLE_MEMBER;
		inm->inm_timer = 0;
		return;
	}

	inm->inm_state = IGMP_DELAYING_MEMBER;
	inm->inm_timer = IGMP_RANDOM_DELAY(
	    IGMP_MAX_HOST_REPORT_DELAY * PR_FASTHZ);

	pkt->ipi_addr = inm->inm_addr;
	pkt->ipi_rdomain = ifp->if_rdomain;
	pkt->ipi_ifidx = inm->inm_ifidx;
	pkt->ipi_type = rti_fill(inm);

	/* A timer is now pending; make igmp_fasttimo() look at it. */
	atomic_store_int(&igmp_timers_are_running, 1);
}
void
igmp_leavegroup(struct in_multi *inm, struct ifnet *ifp,
struct igmp_pktinfo *pkt)
{
rw_assert_anylock(&ifp->if_maddrlock);
switch (inm->inm_state) {
case IGMP_DELAYING_MEMBER:
case IGMP_IDLE_MEMBER:
if (!IN_LOCAL_GROUP(inm->inm_addr.s_addr) &&
(ifp->if_flags & IFF_LOOPBACK) == 0)
if (inm->inm_rti->rti_type != IGMP_v1_ROUTER) {
pkt->ipi_addr.s_addr = INADDR_ALLROUTERS_GROUP;
pkt->ipi_rdomain = ifp->if_rdomain;
pkt->ipi_ifidx = inm->inm_ifidx;
pkt->ipi_type = IGMP_HOST_LEAVE_MESSAGE;
}
break;
case IGMP_LAZY_MEMBER:
case IGMP_AWAKENING_MEMBER:
case IGMP_SLEEPING_MEMBER:
break;
}
}
void
igmp_fasttimo(void)
{
struct igmp_pktlist pktlist;
struct ifnet *ifp;
int running = 0;
if (!atomic_load_int(&igmp_timers_are_running))
return;
atomic_store_int(&igmp_timers_are_running, 0);
NET_LOCK_SHARED();
STAILQ_INIT(&pktlist);
TAILQ_FOREACH(ifp, &ifnetlist, if_list) {
if (igmp_checktimer(ifp, &pktlist))
running = 1;
}
while (!STAILQ_EMPTY(&pktlist)) {
struct igmp_pktinfo *pkt;
pkt = STAILQ_FIRST(&pktlist);
STAILQ_REMOVE_HEAD(&pktlist, ipi_list);
igmp_sendpkt(pkt);
free(pkt, M_MRTABLE, sizeof(*pkt));
}
NET_UNLOCK_SHARED();
if (running)
atomic_store_int(&igmp_timers_are_running, 1);
}
int
igmp_checktimer(struct ifnet *ifp, struct igmp_pktlist *pktlist)
{
struct in_multi *inm;
struct ifmaddr *ifma;
int running = 0;
rw_enter_write(&ifp->if_maddrlock);
TAILQ_FOREACH(ifma, &ifp->if_maddrlist, ifma_list) {
if (ifma->ifma_addr->sa_family != AF_INET)
continue;
inm = ifmatoinm(ifma);
if (inm->inm_timer == 0) {
} else if (--inm->inm_timer == 0) {
if (inm->inm_state == IGMP_DELAYING_MEMBER) {
struct igmp_pktinfo *pkt;
inm->inm_state = IGMP_IDLE_MEMBER;
pkt = malloc(sizeof(*pkt), M_MRTABLE, M_NOWAIT);
if (pkt == NULL)
continue;
pkt->ipi_addr = inm->inm_addr;
pkt->ipi_rdomain = ifp->if_rdomain;
pkt->ipi_ifidx = inm->inm_ifidx;
pkt->ipi_type =
inm->inm_rti->rti_type == IGMP_v1_ROUTER ?
IGMP_v1_HOST_MEMBERSHIP_REPORT :
IGMP_v2_HOST_MEMBERSHIP_REPORT;
STAILQ_INSERT_TAIL(pktlist, pkt, ipi_list);
}
} else {
running = 1;
}
}
rw_exit_write(&ifp->if_maddrlock);
return (running);
}
void
igmp_slowtimo(void)
{
struct router_info *rti;
if (LIST_EMPTY(&rti_head))
return;
mtx_enter(&igmp_mtx);
LIST_FOREACH(rti, &rti_head, rti_list) {
if (rti->rti_type == IGMP_v1_ROUTER &&
++rti->rti_age >= IGMP_AGE_THRESHOLD) {
rti->rti_type = IGMP_v2_ROUTER;
}
}
mtx_leave(&igmp_mtx);
}
void
igmp_sendpkt(struct igmp_pktinfo *pkt)
{
struct mbuf *m;
struct igmp *igmp;
struct ip *ip;
struct ip_moptions imo;
MGETHDR(m, M_DONTWAIT, MT_HEADER);
if (m == NULL)
return;
m->m_data += max_linkhdr;
m->m_len = sizeof(struct ip) + IGMP_MINLEN;
m->m_pkthdr.len = sizeof(struct ip) + IGMP_MINLEN;
ip = mtod(m, struct ip *);
ip->ip_tos = 0;
ip->ip_len = htons(sizeof(struct ip) + IGMP_MINLEN);
ip->ip_off = 0;
ip->ip_p = IPPROTO_IGMP;
ip->ip_src.s_addr = INADDR_ANY;
ip->ip_dst = pkt->ipi_addr;
m->m_data += sizeof(struct ip);
m->m_len -= sizeof(struct ip);
igmp = mtod(m, struct igmp *);
igmp->igmp_type = pkt->ipi_type;
igmp->igmp_code = 0;
igmp->igmp_group = pkt->ipi_addr;
igmp->igmp_cksum = 0;
igmp->igmp_cksum = in_cksum(m, IGMP_MINLEN);
m->m_data -= sizeof(struct ip);
m->m_len += sizeof(struct ip);
m->m_pkthdr.ph_rtableid = pkt->ipi_rdomain;
imo.imo_ifidx = pkt->ipi_ifidx;
imo.imo_ttl = 1;
#ifdef MROUTING
imo.imo_loop = (ip_mrouter[pkt->ipi_rdomain] != NULL);
#else
imo.imo_loop = 0;
#endif
ip_output(m, router_alert, NULL, IP_MULTICASTOPTS, &imo, NULL, 0);
igmpstat_inc(igps_snd_reports);
}
#ifndef SMALL_KERNEL
/*
 * sysctl handler for the IGMP subtree.
 *
 * Exactly one name component is accepted (ENOTDIR otherwise).  The only
 * supported node is IGMPCTL_STATS, served by igmp_sysctl_igmpstat(); any
 * other name yields EOPNOTSUPP.  newlen is not used.
 */
int
igmp_sysctl(int *name, u_int namelen, void *oldp, size_t *oldlenp,
    void *newp, size_t newlen)
{
	if (namelen != 1)
		return (ENOTDIR);

	if (name[0] == IGMPCTL_STATS)
		return (igmp_sysctl_igmpstat(oldp, oldlenp, newp));

	return (EOPNOTSUPP);
}
/*
 * Export the IGMP statistics through sysctl.
 *
 * The 64-bit counters are read with counters_read() and copied, one by
 * one, into a struct igmpstat that is accessed as an array of u_long;
 * the compile-time assertion guarantees that the structure holds exactly
 * one u_long per counter.  The result is returned to the caller via
 * sysctl_rdstruct(), whose return value is passed on.
 */
int
igmp_sysctl_igmpstat(void *oldp, size_t *oldlenp, void *newp)
{
	uint64_t counters[igps_ncounters];
	struct igmpstat stats;
	u_long *slot;
	int idx;

	CTASSERT(sizeof(stats) == (nitems(counters) * sizeof(u_long)));

	memset(&stats, 0, sizeof stats);
	counters_read(igmpcounters, counters, nitems(counters), NULL);

	slot = (u_long *)&stats;
	for (idx = 0; idx < nitems(counters); idx++)
		slot[idx] = (u_long)counters[idx];

	return (sysctl_rdstruct(oldp, oldlenp, newp, &stats, sizeof(stats)));
}
#endif