igmp.c revision 191264
1139823Simp/*- 2189592Sbms * Copyright (c) 2007-2009 Bruce Simpson. 31541Srgrimes * Copyright (c) 1988 Stephen Deering. 41541Srgrimes * Copyright (c) 1992, 1993 51541Srgrimes * The Regents of the University of California. All rights reserved. 61541Srgrimes * 71541Srgrimes * This code is derived from software contributed to Berkeley by 81541Srgrimes * Stephen Deering of Stanford University. 91541Srgrimes * 101541Srgrimes * Redistribution and use in source and binary forms, with or without 111541Srgrimes * modification, are permitted provided that the following conditions 121541Srgrimes * are met: 131541Srgrimes * 1. Redistributions of source code must retain the above copyright 141541Srgrimes * notice, this list of conditions and the following disclaimer. 151541Srgrimes * 2. Redistributions in binary form must reproduce the above copyright 161541Srgrimes * notice, this list of conditions and the following disclaimer in the 171541Srgrimes * documentation and/or other materials provided with the distribution. 181541Srgrimes * 4. Neither the name of the University nor the names of its contributors 191541Srgrimes * may be used to endorse or promote products derived from this software 201541Srgrimes * without specific prior written permission. 211541Srgrimes * 221541Srgrimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 231541Srgrimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 241541Srgrimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 251541Srgrimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 261541Srgrimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 271541Srgrimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 281541Srgrimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 291541Srgrimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 301541Srgrimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 311541Srgrimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 321541Srgrimes * SUCH DAMAGE. 331541Srgrimes * 341541Srgrimes * @(#)igmp.c 8.1 (Berkeley) 7/19/93 351541Srgrimes */ 361541Srgrimes 372531Swollman/* 382531Swollman * Internet Group Management Protocol (IGMP) routines. 39189592Sbms * [RFC1112, RFC2236, RFC3376] 402531Swollman * 412531Swollman * Written by Steve Deering, Stanford, May 1988. 422531Swollman * Modified by Rosen Sharma, Stanford, Aug 1994. 439209Swollman * Modified by Bill Fenner, Xerox PARC, Feb 1995. 4414622Sfenner * Modified to fully comply to IGMPv2 by Bill Fenner, Oct 1995. 45189592Sbms * Significantly rewritten for IGMPv3, VIMAGE, and SMP by Bruce Simpson. 462531Swollman * 4714622Sfenner * MULTICAST Revision: 3.5.1.4 482531Swollman */ 491541Srgrimes 50172467Ssilby#include <sys/cdefs.h> 51172467Ssilby__FBSDID("$FreeBSD: head/sys/netinet/igmp.c 191264 2009-04-19 08:14:21Z bms $"); 52172467Ssilby 53101091Srwatson#include "opt_mac.h" 54189106Sbz#include "opt_route.h" 55101091Srwatson 561541Srgrimes#include <sys/param.h> 571549Srgrimes#include <sys/systm.h> 58189592Sbms#include <sys/module.h> 5929024Sbde#include <sys/malloc.h> 601541Srgrimes#include <sys/mbuf.h> 611541Srgrimes#include <sys/socket.h> 621541Srgrimes#include <sys/protosw.h> 6312296Sphk#include <sys/kernel.h> 646472Swollman#include <sys/sysctl.h> 65181803Sbz#include <sys/vimage.h> 66189592Sbms#include <sys/ktr.h> 67189592Sbms#include <sys/condvar.h> 681541Srgrimes 691541Srgrimes#include <net/if.h> 70189592Sbms#include <net/netisr.h> 711541Srgrimes#include <net/route.h> 72185571Sbz#include <net/vnet.h> 731541Srgrimes 741541Srgrimes#include <netinet/in.h> 751541Srgrimes#include <netinet/in_var.h> 761541Srgrimes#include <netinet/in_systm.h> 771541Srgrimes#include <netinet/ip.h> 781541Srgrimes#include <netinet/ip_var.h> 79152592Sandre#include <netinet/ip_options.h> 801541Srgrimes#include <netinet/igmp.h> 811541Srgrimes#include <netinet/igmp_var.h> 82185571Sbz#include <netinet/vinet.h> 831541Srgrimes 8460105Sjlemon#include <machine/in_cksum.h> 8560105Sjlemon 86163606Srwatson#include <security/mac/mac_framework.h> 87163606Srwatson 88189592Sbms#ifndef KTR_IGMPV3 89189592Sbms#define KTR_IGMPV3 KTR_SUBSYS 90189592Sbms#endif 9130309Sphk 92189592Sbmsstatic struct igmp_ifinfo * 93189592Sbms igi_alloc_locked(struct ifnet *); 94189592Sbmsstatic void igi_delete_locked(const struct ifnet *); 95189592Sbmsstatic void igmp_dispatch_queue(struct ifqueue *, int, const int); 96189592Sbmsstatic void igmp_fasttimo_vnet(void); 97189592Sbmsstatic void igmp_final_leave(struct in_multi *, struct igmp_ifinfo *); 98189592Sbmsstatic int igmp_handle_state_change(struct in_multi *, 99189592Sbms struct igmp_ifinfo *); 100189592Sbmsstatic int igmp_initial_join(struct in_multi *, struct igmp_ifinfo *); 101189592Sbmsstatic int igmp_input_v1_query(struct ifnet *, const struct ip *); 102189592Sbmsstatic int igmp_input_v2_query(struct ifnet *, const struct ip *, 103189592Sbms const struct igmp *); 104189592Sbmsstatic int igmp_input_v3_query(struct ifnet *, const struct ip *, 105189592Sbms /*const*/ struct igmpv3 *); 106189592Sbmsstatic int igmp_input_v3_group_query(struct in_multi *, 107189592Sbms struct igmp_ifinfo *, int, /*const*/ struct igmpv3 *); 108189592Sbmsstatic int igmp_input_v1_report(struct ifnet *, /*const*/ struct ip *, 109189592Sbms /*const*/ struct igmp *); 110189592Sbmsstatic int igmp_input_v2_report(struct ifnet *, /*const*/ struct ip *, 111189592Sbms /*const*/ struct igmp *); 112189592Sbmsstatic void igmp_intr(struct mbuf *); 113189592Sbmsstatic int igmp_isgroupreported(const struct in_addr); 114189592Sbmsstatic struct mbuf * 115189592Sbms igmp_ra_alloc(void); 116189592Sbms#ifdef KTR 117189592Sbmsstatic char * igmp_rec_type_to_str(const int); 118185088Szec#endif 119189592Sbmsstatic void igmp_set_version(struct igmp_ifinfo *, const int); 120189592Sbmsstatic void igmp_slowtimo_vnet(void); 121189592Sbmsstatic void igmp_sysinit(void); 122189592Sbmsstatic int igmp_v1v2_queue_report(struct in_multi *, const int); 123189592Sbmsstatic void igmp_v1v2_process_group_timer(struct in_multi *, const int); 124189592Sbmsstatic void igmp_v1v2_process_querier_timers(struct igmp_ifinfo *); 125189592Sbmsstatic void igmp_v2_update_group(struct in_multi *, const int); 126189592Sbmsstatic void igmp_v3_cancel_link_timers(struct igmp_ifinfo *); 127189592Sbmsstatic void igmp_v3_dispatch_general_query(struct igmp_ifinfo *); 128189592Sbmsstatic struct mbuf * 129189592Sbms igmp_v3_encap_report(struct ifnet *, struct mbuf *); 130189592Sbmsstatic int igmp_v3_enqueue_group_record(struct ifqueue *, 131189592Sbms struct in_multi *, const int, const int, const int); 132189592Sbmsstatic int igmp_v3_enqueue_filter_change(struct ifqueue *, 133189592Sbms struct in_multi *); 134189592Sbmsstatic void igmp_v3_process_group_timers(struct igmp_ifinfo *, 135189592Sbms struct ifqueue *, struct ifqueue *, struct in_multi *, 136189592Sbms const int); 137189592Sbmsstatic int igmp_v3_merge_state_changes(struct in_multi *, 138189592Sbms struct ifqueue *); 139189592Sbmsstatic void igmp_v3_suppress_group_record(struct in_multi *); 140189592Sbmsstatic int sysctl_igmp_default_version(SYSCTL_HANDLER_ARGS); 141189592Sbmsstatic int sysctl_igmp_gsr(SYSCTL_HANDLER_ARGS); 142189592Sbmsstatic int sysctl_igmp_ifinfo(SYSCTL_HANDLER_ARGS); 1432531Swollman 144189592Sbms#ifdef VIMAGE 145189592Sbmsstatic vnet_attach_fn vnet_igmp_iattach; 146189592Sbmsstatic vnet_detach_fn vnet_igmp_idetach; 147189592Sbms#else 148189592Sbmsstatic int vnet_igmp_iattach(const void *); 149189592Sbmsstatic int vnet_igmp_idetach(const void *); 150189592Sbms#endif /* VIMAGE */ 15112296Sphk 152130333Srwatson/* 153189592Sbms * System-wide globals. 154189592Sbms * 155189592Sbms * Unlocked access to these is OK, except for the global IGMP output 156189592Sbms * queue. The IGMP subsystem lock ends up being system-wide for the moment, 157189592Sbms * because all VIMAGEs have to share a global output queue, as netisrs 158189592Sbms * themselves are not virtualized. 159189592Sbms * 160189592Sbms * Locking: 161189592Sbms * * The permitted lock order is: IN_MULTI_LOCK, IGMP_LOCK, IF_ADDR_LOCK. 162189592Sbms * Any may be taken independently; if any are held at the same 163189592Sbms * time, the above lock order must be followed. 164191264Sbms * * All output is delegated to the netisr. 165191264Sbms * Now that Giant has been eliminated, the netisr may be inlined. 166189592Sbms * * IN_MULTI_LOCK covers in_multi. 167189592Sbms * * IGMP_LOCK covers igmp_ifinfo and any global variables in this file, 168189592Sbms * including the output queue. 169189592Sbms * * IF_ADDR_LOCK covers if_multiaddrs, which is used for a variety of 170189592Sbms * per-link state iterators. 171189592Sbms * * igmp_ifinfo is valid as long as PF_INET is attached to the interface, 172189592Sbms * therefore it is not refcounted. 173189592Sbms * We allow unlocked reads of igmp_ifinfo when accessed via in_multi. 174189592Sbms * 175189592Sbms * Reference counting 176189592Sbms * * IGMP acquires its own reference every time an in_multi is passed to 177189592Sbms * it and the group is being joined for the first time. 178189592Sbms * * IGMP releases its reference(s) on in_multi in a deferred way, 179189592Sbms * because the operations which process the release run as part of 180189592Sbms * a loop whose control variables are directly affected by the release 181189592Sbms * (that, and not recursing on the IF_ADDR_LOCK). 182189592Sbms * 183189592Sbms * VIMAGE: Each in_multi corresponds to an ifp, and each ifp corresponds 184189592Sbms * to a vnet in ifp->if_vnet. 185189592Sbms * 186189931Sbms * SMPng: XXX We may potentially race operations on ifma_protospec. 187189931Sbms * The problem is that we currently lack a clean way of taking the 188189931Sbms * IF_ADDR_LOCK() between the ifnet and in layers w/o recursing, 189189931Sbms * as anything which modifies ifma needs to be covered by that lock. 190189931Sbms * So check for ifma_protospec being NULL before proceeding. 191130333Srwatson */ 192189592Sbmsstruct mtx igmp_mtx; 193189592Sbms 194189592Sbmsstruct mbuf *m_raopt; /* Router Alert option */ 195189592SbmsMALLOC_DEFINE(M_IGMP, "igmp", "igmp state"); 196189592Sbms 197189592Sbms/* 198189592Sbms * Global netisr output queue. 199189592Sbms */ 200189592Sbmsstruct ifqueue igmpoq; 201189592Sbms 202189592Sbms/* 203189592Sbms * VIMAGE-wide globals. 204189592Sbms * 205189592Sbms * The IGMPv3 timers themselves need to run per-image, however, 206189592Sbms * protosw timers run globally (see tcp). 207189592Sbms * An ifnet can only be in one vimage at a time, and the loopback 208189592Sbms * ifnet, loif, is itself virtualized. 209189592Sbms * It would otherwise be possible to seriously hose IGMP state, 210189592Sbms * and create inconsistencies in upstream multicast routing, if you have 211189592Sbms * multiple VIMAGEs running on the same link joining different multicast 212189592Sbms * groups, UNLESS the "primary IP address" is different. This is because 213189592Sbms * IGMP for IPv4 does not force link-local addresses to be used for each 214189592Sbms * node, unlike MLD for IPv6. 215189592Sbms * Obviously the IGMPv3 per-interface state has per-vimage granularity 216189592Sbms * also as a result. 217189592Sbms * 218189592Sbms * FUTURE: Stop using IFP_TO_IA/INADDR_ANY, and use source address selection 219189592Sbms * policy to control the address used by IGMP on the link. 220189592Sbms */ 221185088Szec#ifdef VIMAGE_GLOBALS 222189592Sbmsint interface_timers_running; /* IGMPv3 general query response */ 223189592Sbmsint state_change_timers_running; /* IGMPv3 state-change retransmit */ 224189592Sbmsint current_state_timers_running; /* IGMPv1/v2 host report; 225189592Sbms * IGMPv3 g/sg query response */ 226130333Srwatson 227189592SbmsLIST_HEAD(, igmp_ifinfo) igi_head; 228189592Sbmsstruct igmpstat igmpstat; 229189592Sbmsstruct timeval igmp_gsrdelay; 230189592Sbms 231189592Sbmsint igmp_recvifkludge; 232189592Sbmsint igmp_sendra; 233189592Sbmsint igmp_sendlocal; 234189592Sbmsint igmp_v1enable; 235189592Sbmsint igmp_v2enable; 236189592Sbmsint igmp_legacysupp; 237189592Sbmsint igmp_default_version; 238189592Sbms#endif /* VIMAGE_GLOBALS */ 239189592Sbms 240130333Srwatson/* 241189592Sbms * Virtualized sysctls. 242130333Srwatson */ 243189592SbmsSYSCTL_V_STRUCT(V_NET, vnet_inet, _net_inet_igmp, IGMPCTL_STATS, stats, 244189592Sbms CTLFLAG_RW, igmpstat, igmpstat, ""); 245189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, recvifkludge, 246189592Sbms CTLFLAG_RW, igmp_recvifkludge, 0, 247189592Sbms "Rewrite IGMPv1/v2 reports from 0.0.0.0 to contain subnet address"); 248189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, sendra, 249189592Sbms CTLFLAG_RW, igmp_sendra, 0, 250189592Sbms "Send IP Router Alert option in IGMPv2/v3 messages"); 251189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, sendlocal, 252189592Sbms CTLFLAG_RW, igmp_sendlocal, 0, 253189592Sbms "Send IGMP membership reports for 224.0.0.0/24 groups"); 254189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, v1enable, 255189592Sbms CTLFLAG_RW, igmp_v1enable, 0, 256189592Sbms "Enable backwards compatibility with IGMPv1"); 257189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, v2enable, 258189592Sbms CTLFLAG_RW, igmp_v2enable, 0, 259189592Sbms "Enable backwards compatibility with IGMPv2"); 260189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, legacysupp, 261189592Sbms CTLFLAG_RW, igmp_legacysupp, 0, 262189592Sbms "Allow v1/v2 reports to suppress v3 group responses"); 263189592SbmsSYSCTL_V_PROC(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, default_version, 264189592Sbms CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, igmp_default_version, 0, 265189592Sbms sysctl_igmp_default_version, "I", 266189592Sbms "Default version of IGMP to run on each interface"); 267189592SbmsSYSCTL_V_PROC(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, gsrdelay, 268189592Sbms CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, igmp_gsrdelay.tv_sec, 0, 269189592Sbms sysctl_igmp_gsr, "I", 270189592Sbms "Rate limit for IGMPv3 Group-and-Source queries in seconds"); 271130333Srwatson 272189592Sbms/* 273189592Sbms * Non-virtualized sysctls. 274189592Sbms */ 275189592SbmsSYSCTL_NODE(_net_inet_igmp, OID_AUTO, ifinfo, CTLFLAG_RD | CTLFLAG_MPSAFE, 276189592Sbms sysctl_igmp_ifinfo, "Per-interface IGMPv3 state"); 2771541Srgrimes 278189592Sbmsstatic __inline void 279189592Sbmsigmp_save_context(struct mbuf *m, struct ifnet *ifp) 280189592Sbms{ 281189592Sbms 282189592Sbms#ifdef VIMAGE 283189592Sbms m->m_pkthdr.header = ifp->if_vnet; 284189592Sbms#endif /* VIMAGE */ 285189592Sbms m->m_pkthdr.flowid = ifp->if_index; 286189592Sbms} 287189592Sbms 288189592Sbmsstatic __inline void 289189592Sbmsigmp_scrub_context(struct mbuf *m) 290189592Sbms{ 291189592Sbms 292189592Sbms m->m_pkthdr.header = NULL; 293189592Sbms m->m_pkthdr.flowid = 0; 294189592Sbms} 295189592Sbms 296189592Sbms#ifdef KTR 297189592Sbmsstatic __inline char * 298189592Sbmsinet_ntoa_haddr(in_addr_t haddr) 299189592Sbms{ 300189592Sbms struct in_addr ia; 301189592Sbms 302189592Sbms ia.s_addr = htonl(haddr); 303189592Sbms return (inet_ntoa(ia)); 304189592Sbms} 305119180Srwatson#endif 306119180Srwatson 307189592Sbms/* 308189592Sbms * Restore context from a queued IGMP output chain. 309189592Sbms * Return saved ifindex. 310189592Sbms * 311189592Sbms * VIMAGE: The assertion is there to make sure that we 312189592Sbms * actually called CURVNET_SET() with what's in the mbuf chain. 313189592Sbms */ 314189592Sbmsstatic __inline uint32_t 315189592Sbmsigmp_restore_context(struct mbuf *m) 3161541Srgrimes{ 31714622Sfenner 318189592Sbms#ifdef notyet 319189592Sbms#if defined(VIMAGE) && defined(INVARIANTS) 320189592Sbms KASSERT(curvnet == (m->m_pkthdr.header), 321189592Sbms ("%s: called when curvnet was not restored", __func__)); 322189592Sbms#endif 323189592Sbms#endif 324189592Sbms return (m->m_pkthdr.flowid); 325189592Sbms} 326189592Sbms 327189592Sbms/* 328189592Sbms * Retrieve or set default IGMP version. 329189592Sbms * 330189592Sbms * VIMAGE: Assume curvnet set by caller. 331189592Sbms * SMPng: NOTE: Serialized by IGMP lock. 332189592Sbms */ 333189592Sbmsstatic int 334189592Sbmssysctl_igmp_default_version(SYSCTL_HANDLER_ARGS) 335189592Sbms{ 336189592Sbms int error; 337189592Sbms int new; 338189592Sbms 339189592Sbms error = sysctl_wire_old_buffer(req, sizeof(int)); 340189592Sbms if (error) 341189592Sbms return (error); 342189592Sbms 343189592Sbms IGMP_LOCK(); 344189592Sbms 345189592Sbms new = V_igmp_default_version; 346189592Sbms 347189592Sbms error = sysctl_handle_int(oidp, &new, 0, req); 348189592Sbms if (error || !req->newptr) 349189592Sbms goto out_locked; 350189592Sbms 351189592Sbms if (new < IGMP_VERSION_1 || new > IGMP_VERSION_3) { 352189592Sbms error = EINVAL; 353189592Sbms goto out_locked; 354189592Sbms } 355189592Sbms 356189592Sbms CTR2(KTR_IGMPV3, "change igmp_default_version from %d to %d", 357189592Sbms V_igmp_default_version, new); 358189592Sbms 359189592Sbms V_igmp_default_version = new; 360189592Sbms 361189592Sbmsout_locked: 362189592Sbms IGMP_UNLOCK(); 363189592Sbms return (error); 364189592Sbms} 365189592Sbms 366189592Sbms/* 367189592Sbms * Retrieve or set threshold between group-source queries in seconds. 368189592Sbms * 369189592Sbms * VIMAGE: Assume curvnet set by caller. 370189592Sbms * SMPng: NOTE: Serialized by IGMP lock. 371189592Sbms */ 372189592Sbmsstatic int 373189592Sbmssysctl_igmp_gsr(SYSCTL_HANDLER_ARGS) 374189592Sbms{ 375189592Sbms int error; 376189592Sbms int i; 377189592Sbms 378189592Sbms error = sysctl_wire_old_buffer(req, sizeof(int)); 379189592Sbms if (error) 380189592Sbms return (error); 381189592Sbms 382189592Sbms IGMP_LOCK(); 383189592Sbms 384189592Sbms i = V_igmp_gsrdelay.tv_sec; 385189592Sbms 386189592Sbms error = sysctl_handle_int(oidp, &i, 0, req); 387189592Sbms if (error || !req->newptr) 388189592Sbms goto out_locked; 389189592Sbms 390189592Sbms if (i < -1 || i >= 60) { 391189592Sbms error = EINVAL; 392189592Sbms goto out_locked; 393189592Sbms } 394189592Sbms 395189592Sbms CTR2(KTR_IGMPV3, "change igmp_gsrdelay from %d to %d", 396189592Sbms V_igmp_gsrdelay.tv_sec, i); 397189592Sbms V_igmp_gsrdelay.tv_sec = i; 398189592Sbms 399189592Sbmsout_locked: 400189592Sbms IGMP_UNLOCK(); 401189592Sbms return (error); 402189592Sbms} 403189592Sbms 404189592Sbms/* 405189592Sbms * Expose struct igmp_ifinfo to userland, keyed by ifindex. 406189592Sbms * For use by ifmcstat(8). 407189592Sbms * 408189592Sbms * SMPng: NOTE: Does an unlocked ifindex space read. 409189592Sbms * VIMAGE: Assume curvnet set by caller. The node handler itself 410189592Sbms * is not directly virtualized. 411189592Sbms */ 412189592Sbmsstatic int 413189592Sbmssysctl_igmp_ifinfo(SYSCTL_HANDLER_ARGS) 414189592Sbms{ 415189592Sbms INIT_VNET_NET(curvnet); 416189592Sbms int *name; 417189592Sbms int error; 418189592Sbms u_int namelen; 419189592Sbms struct ifnet *ifp; 420189592Sbms struct igmp_ifinfo *igi; 421189592Sbms 422189592Sbms name = (int *)arg1; 423189592Sbms namelen = arg2; 424189592Sbms 425189592Sbms if (req->newptr != NULL) 426189592Sbms return (EPERM); 427189592Sbms 428189592Sbms if (namelen != 1) 429189592Sbms return (EINVAL); 430189592Sbms 431189592Sbms error = sysctl_wire_old_buffer(req, sizeof(struct igmp_ifinfo)); 432189592Sbms if (error) 433189592Sbms return (error); 434189592Sbms 435189592Sbms IN_MULTI_LOCK(); 436189592Sbms IGMP_LOCK(); 437189592Sbms 438189592Sbms if (name[0] <= 0 || name[0] > V_if_index) { 439189592Sbms error = ENOENT; 440189592Sbms goto out_locked; 441189592Sbms } 442189592Sbms 443189592Sbms error = ENOENT; 444189592Sbms 445189592Sbms ifp = ifnet_byindex(name[0]); 446189592Sbms if (ifp == NULL) 447189592Sbms goto out_locked; 448189592Sbms 449189592Sbms LIST_FOREACH(igi, &V_igi_head, igi_link) { 450189592Sbms if (ifp == igi->igi_ifp) { 451189592Sbms error = SYSCTL_OUT(req, igi, 452189592Sbms sizeof(struct igmp_ifinfo)); 453189592Sbms break; 454189592Sbms } 455189592Sbms } 456189592Sbms 457189592Sbmsout_locked: 458189592Sbms IGMP_UNLOCK(); 459189592Sbms IN_MULTI_UNLOCK(); 460189592Sbms return (error); 461189592Sbms} 462189592Sbms 463189592Sbms/* 464189592Sbms * Dispatch an entire queue of pending packet chains 465189592Sbms * using the netisr. 466189592Sbms * VIMAGE: Assumes the vnet pointer has been set. 467189592Sbms */ 468189592Sbmsstatic void 469189592Sbmsigmp_dispatch_queue(struct ifqueue *ifq, int limit, const int loop) 470189592Sbms{ 471189592Sbms struct mbuf *m; 472189592Sbms 473189592Sbms for (;;) { 474189592Sbms _IF_DEQUEUE(ifq, m); 475189592Sbms if (m == NULL) 476189592Sbms break; 477189592Sbms CTR3(KTR_IGMPV3, "%s: dispatch %p from %p", __func__, ifq, m); 478189592Sbms if (loop) 479189592Sbms m->m_flags |= M_IGMP_LOOP; 480189592Sbms netisr_dispatch(NETISR_IGMP, m); 481189592Sbms if (--limit == 0) 482189592Sbms break; 483189592Sbms } 484189592Sbms} 485189592Sbms 486189592Sbms/* 487189592Sbms * Filter outgoing IGMP report state by group. 488189592Sbms * 489189592Sbms * Reports are ALWAYS suppressed for ALL-HOSTS (224.0.0.1). 490189592Sbms * If the net.inet.igmp.sendlocal sysctl is 0, then IGMP reports are 491189592Sbms * disabled for all groups in the 224.0.0.0/24 link-local scope. However, 492189592Sbms * this may break certain IGMP snooping switches which rely on the old 493189592Sbms * report behaviour. 494189592Sbms * 495189592Sbms * Return zero if the given group is one for which IGMP reports 496189592Sbms * should be suppressed, or non-zero if reports should be issued. 497189592Sbms */ 498189592Sbmsstatic __inline int 499189592Sbmsigmp_isgroupreported(const struct in_addr addr) 500189592Sbms{ 501189592Sbms 502189592Sbms if (in_allhosts(addr) || 503189592Sbms ((!V_igmp_sendlocal && IN_LOCAL_GROUP(ntohl(addr.s_addr))))) 504189592Sbms return (0); 505189592Sbms 506189592Sbms return (1); 507189592Sbms} 508189592Sbms 509189592Sbms/* 510189592Sbms * Construct a Router Alert option to use in outgoing packets. 511189592Sbms */ 512189592Sbmsstatic struct mbuf * 513189592Sbmsigmp_ra_alloc(void) 514189592Sbms{ 515189592Sbms struct mbuf *m; 516189592Sbms struct ipoption *p; 517189592Sbms 518189592Sbms MGET(m, M_DONTWAIT, MT_DATA); 519189592Sbms p = mtod(m, struct ipoption *); 520189592Sbms p->ipopt_dst.s_addr = INADDR_ANY; 521189592Sbms p->ipopt_list[0] = IPOPT_RA; /* Router Alert Option */ 522189592Sbms p->ipopt_list[1] = 0x04; /* 4 bytes long */ 523189592Sbms p->ipopt_list[2] = IPOPT_EOL; /* End of IP option list */ 524189592Sbms p->ipopt_list[3] = 0x00; /* pad byte */ 525189592Sbms m->m_len = sizeof(p->ipopt_dst) + p->ipopt_list[1]; 526189592Sbms 527189592Sbms return (m); 528189592Sbms} 529189592Sbms 530189592Sbms/* 531189592Sbms * Attach IGMP when PF_INET is attached to an interface. 532189592Sbms * 533189592Sbms * VIMAGE: Currently we set the vnet pointer, although it is 534189592Sbms * likely that it was already set by our caller. 535189592Sbms */ 536189592Sbmsstruct igmp_ifinfo * 537189592Sbmsigmp_domifattach(struct ifnet *ifp) 538189592Sbms{ 539189592Sbms struct igmp_ifinfo *igi; 540189592Sbms 541189592Sbms CTR3(KTR_IGMPV3, "%s: called for ifp %p(%s)", 542189592Sbms __func__, ifp, ifp->if_xname); 543189592Sbms 544189592Sbms CURVNET_SET(ifp->if_vnet); 545189592Sbms IGMP_LOCK(); 546189592Sbms 547189592Sbms igi = igi_alloc_locked(ifp); 548189592Sbms if (!(ifp->if_flags & IFF_MULTICAST)) 549189592Sbms igi->igi_flags |= IGIF_SILENT; 550189592Sbms 551189592Sbms IGMP_UNLOCK(); 552189592Sbms CURVNET_RESTORE(); 553189592Sbms 554189592Sbms return (igi); 555189592Sbms} 556189592Sbms 557189592Sbms/* 558189592Sbms * VIMAGE: assume curvnet set by caller. 559189592Sbms */ 560189592Sbmsstatic struct igmp_ifinfo * 561189592Sbmsigi_alloc_locked(/*const*/ struct ifnet *ifp) 562189592Sbms{ 563189592Sbms struct igmp_ifinfo *igi; 564189592Sbms 565189592Sbms IGMP_LOCK_ASSERT(); 566189592Sbms 567189592Sbms igi = malloc(sizeof(struct igmp_ifinfo), M_IGMP, M_NOWAIT|M_ZERO); 568189592Sbms if (igi == NULL) 569189592Sbms goto out; 570189592Sbms 571189592Sbms igi->igi_ifp = ifp; 572189592Sbms igi->igi_version = V_igmp_default_version; 573189592Sbms igi->igi_flags = 0; 574189592Sbms igi->igi_rv = IGMP_RV_INIT; 575189592Sbms igi->igi_qi = IGMP_QI_INIT; 576189592Sbms igi->igi_qri = IGMP_QRI_INIT; 577189592Sbms igi->igi_uri = IGMP_URI_INIT; 578189592Sbms 579189592Sbms SLIST_INIT(&igi->igi_relinmhead); 580189592Sbms 5811541Srgrimes /* 582189592Sbms * Responses to general queries are subject to bounds. 5831541Srgrimes */ 584189592Sbms IFQ_SET_MAXLEN(&igi->igi_gq, IGMP_MAX_RESPONSE_PACKETS); 5859209Swollman 586189592Sbms LIST_INSERT_HEAD(&V_igi_head, igi, igi_link); 5879209Swollman 588189592Sbms CTR2(KTR_IGMPV3, "allocate igmp_ifinfo for ifp %p(%s)", 589189592Sbms ifp, ifp->if_xname); 590189592Sbms 591189592Sbmsout: 592189592Sbms return (igi); 593189592Sbms} 594189592Sbms 595189592Sbms/* 596189592Sbms * Hook for ifdetach. 597189592Sbms * 598189592Sbms * NOTE: Some finalization tasks need to run before the protocol domain 599189592Sbms * is detached, but also before the link layer does its cleanup. 600189592Sbms * 601189592Sbms * SMPNG: igmp_ifdetach() needs to take IF_ADDR_LOCK(). 602189931Sbms * XXX This is also bitten by unlocked ifma_protospec access. 603189592Sbms * 604189592Sbms * VIMAGE: curvnet should have been set by caller, but let's not assume 605189592Sbms * that for now. 606189592Sbms */ 607189592Sbmsvoid 608189592Sbmsigmp_ifdetach(struct ifnet *ifp) 609189592Sbms{ 610189592Sbms struct igmp_ifinfo *igi; 611189592Sbms struct ifmultiaddr *ifma; 612189592Sbms struct in_multi *inm, *tinm; 613189592Sbms 614189592Sbms CTR3(KTR_IGMPV3, "%s: called for ifp %p(%s)", __func__, ifp, 615189592Sbms ifp->if_xname); 616189592Sbms 617189592Sbms CURVNET_SET(ifp->if_vnet); 618189592Sbms 619189592Sbms IGMP_LOCK(); 620189592Sbms 621189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 622189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 623189592Sbms IF_ADDR_LOCK(ifp); 624189592Sbms TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 625189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 626189931Sbms ifma->ifma_protospec == NULL) 627189592Sbms continue; 628189931Sbms#if 0 629189931Sbms KASSERT(ifma->ifma_protospec != NULL, 630189931Sbms ("%s: ifma_protospec is NULL", __func__)); 631189931Sbms#endif 632189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 633189592Sbms if (inm->inm_state == IGMP_LEAVING_MEMBER) { 634189592Sbms SLIST_INSERT_HEAD(&igi->igi_relinmhead, 635189592Sbms inm, inm_nrele); 636189592Sbms } 637189592Sbms inm_clear_recorded(inm); 638189592Sbms } 639189592Sbms IF_ADDR_UNLOCK(ifp); 640189592Sbms /* 641189592Sbms * Free the in_multi reference(s) for this IGMP lifecycle. 642189592Sbms */ 643189592Sbms SLIST_FOREACH_SAFE(inm, &igi->igi_relinmhead, inm_nrele, 644189592Sbms tinm) { 645189592Sbms SLIST_REMOVE_HEAD(&igi->igi_relinmhead, inm_nrele); 646189592Sbms inm_release_locked(inm); 647189592Sbms } 648189592Sbms } 649189592Sbms 650189592Sbms IGMP_UNLOCK(); 651189592Sbms 652189592Sbms CURVNET_RESTORE(); 6531541Srgrimes} 6541541Srgrimes 655189592Sbms/* 656189592Sbms * Hook for domifdetach. 657189592Sbms * 658189592Sbms * VIMAGE: curvnet should have been set by caller, but let's not assume 659189592Sbms * that for now. 660189592Sbms */ 661189592Sbmsvoid 662189592Sbmsigmp_domifdetach(struct ifnet *ifp) 6632531Swollman{ 664189592Sbms struct igmp_ifinfo *igi; 665189592Sbms 666189592Sbms CTR3(KTR_IGMPV3, "%s: called for ifp %p(%s)", 667189592Sbms __func__, ifp, ifp->if_xname); 668189592Sbms 669189592Sbms CURVNET_SET(ifp->if_vnet); 670189592Sbms IGMP_LOCK(); 671189592Sbms 672189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 673189592Sbms igi_delete_locked(ifp); 674189592Sbms 675189592Sbms IGMP_UNLOCK(); 676189592Sbms CURVNET_RESTORE(); 677189592Sbms} 678189592Sbms 679189592Sbmsstatic void 680189592Sbmsigi_delete_locked(const struct ifnet *ifp) 681189592Sbms{ 682189592Sbms struct igmp_ifinfo *igi, *tigi; 683189592Sbms 684189592Sbms CTR3(KTR_IGMPV3, "%s: freeing igmp_ifinfo for ifp %p(%s)", 685189592Sbms __func__, ifp, ifp->if_xname); 686189592Sbms 687189592Sbms IGMP_LOCK_ASSERT(); 688189592Sbms 689189592Sbms LIST_FOREACH_SAFE(igi, &V_igi_head, igi_link, tigi) { 690189592Sbms if (igi->igi_ifp == ifp) { 691189592Sbms /* 692189592Sbms * Free deferred General Query responses. 693189592Sbms */ 694189592Sbms _IF_DRAIN(&igi->igi_gq); 695189592Sbms 696189592Sbms LIST_REMOVE(igi, igi_link); 697189592Sbms 698189592Sbms KASSERT(SLIST_EMPTY(&igi->igi_relinmhead), 699189592Sbms ("%s: there are dangling in_multi references", 700189592Sbms __func__)); 701189592Sbms 702189592Sbms free(igi, M_IGMP); 703189592Sbms return; 704189592Sbms } 705189592Sbms } 706189592Sbms 707189592Sbms#ifdef INVARIANTS 708189592Sbms panic("%s: igmp_ifinfo not found for ifp %p\n", __func__, ifp); 709189592Sbms#endif 710189592Sbms} 711189592Sbms 712189592Sbms/* 713189592Sbms * Process a received IGMPv1 query. 714189592Sbms * Return non-zero if the message should be dropped. 715189592Sbms * 716189592Sbms * VIMAGE: The curvnet pointer is derived from the input ifp. 717189592Sbms */ 718189592Sbmsstatic int 719189592Sbmsigmp_input_v1_query(struct ifnet *ifp, const struct ip *ip) 720189592Sbms{ 721183550Szec INIT_VNET_INET(ifp->if_vnet); 722189592Sbms struct ifmultiaddr *ifma; 723189592Sbms struct igmp_ifinfo *igi; 724189592Sbms struct in_multi *inm; 7252531Swollman 726189592Sbms /* 727189592Sbms * IGMPv1 General Queries SHOULD always addressed to 224.0.0.1. 728189592Sbms * igmp_group is always ignored. Do not drop it as a userland 729189592Sbms * daemon may wish to see it. 730189592Sbms */ 731189592Sbms if (!in_allhosts(ip->ip_dst)) { 732190965Srwatson IGMPSTAT_INC(igps_rcv_badqueries); 733189592Sbms return (0); 734189592Sbms } 735189592Sbms 736190965Srwatson IGMPSTAT_INC(igps_rcv_gen_queries); 737189592Sbms 738189592Sbms /* 739189592Sbms * Switch to IGMPv1 host compatibility mode. 740189592Sbms */ 741189592Sbms IN_MULTI_LOCK(); 742189592Sbms IGMP_LOCK(); 743189592Sbms 744189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 745189592Sbms KASSERT(igi != NULL, ("%s: no igmp_ifinfo for ifp %p", __func__, ifp)); 746189592Sbms 747189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 748189592Sbms CTR2(KTR_IGMPV3, "ignore v1 query on IGIF_LOOPBACK ifp %p(%s)", 749189592Sbms ifp, ifp->if_xname); 750189592Sbms goto out_locked; 751189592Sbms } 752189592Sbms 753189592Sbms igmp_set_version(igi, IGMP_VERSION_1); 754189592Sbms 755189592Sbms CTR2(KTR_IGMPV3, "process v1 query on ifp %p(%s)", ifp, ifp->if_xname); 756189592Sbms 757189592Sbms /* 758189592Sbms * Start the timers in all of our group records 759189592Sbms * for the interface on which the query arrived, 760189592Sbms * except those which are already running. 761189592Sbms */ 762189592Sbms IF_ADDR_LOCK(ifp); 763189592Sbms TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 764189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 765189931Sbms ifma->ifma_protospec == NULL) 766189592Sbms continue; 767189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 768189592Sbms if (inm->inm_timer != 0) 769189592Sbms continue; 770189592Sbms switch (inm->inm_state) { 771189592Sbms case IGMP_NOT_MEMBER: 772189592Sbms case IGMP_SILENT_MEMBER: 773189592Sbms break; 774189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 775189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 776189592Sbms case IGMP_REPORTING_MEMBER: 777189592Sbms case IGMP_IDLE_MEMBER: 778189592Sbms case IGMP_LAZY_MEMBER: 779189592Sbms case IGMP_SLEEPING_MEMBER: 780189592Sbms case IGMP_AWAKENING_MEMBER: 781189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 782189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY( 783189592Sbms IGMP_V1V2_MAX_RI * PR_FASTHZ); 784189592Sbms V_current_state_timers_running = 1; 785189592Sbms break; 786189592Sbms case IGMP_LEAVING_MEMBER: 787189592Sbms break; 788119181Srwatson } 789119181Srwatson } 790189592Sbms IF_ADDR_UNLOCK(ifp); 791189592Sbms 792189592Sbmsout_locked: 793189592Sbms IGMP_UNLOCK(); 794189592Sbms IN_MULTI_UNLOCK(); 795189592Sbms 796189592Sbms return (0); 797189592Sbms} 798189592Sbms 799189592Sbms/* 800189592Sbms * Process a received IGMPv2 general or group-specific query. 801189592Sbms */ 802189592Sbmsstatic int 803189592Sbmsigmp_input_v2_query(struct ifnet *ifp, const struct ip *ip, 804189592Sbms const struct igmp *igmp) 805189592Sbms{ 806189592Sbms struct ifmultiaddr *ifma; 807189592Sbms struct igmp_ifinfo *igi; 808189592Sbms struct in_multi *inm; 809189592Sbms uint16_t timer; 810189592Sbms 811189592Sbms /* 812189592Sbms * Perform lazy allocation of IGMP link info if required, 813189592Sbms * and switch to IGMPv2 host compatibility mode. 814189592Sbms */ 815189592Sbms IN_MULTI_LOCK(); 816189592Sbms IGMP_LOCK(); 817189592Sbms 818189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 819189592Sbms KASSERT(igi != NULL, ("%s: no igmp_ifinfo for ifp %p", __func__, ifp)); 820189592Sbms 821189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 822189592Sbms CTR2(KTR_IGMPV3, "ignore v2 query on IGIF_LOOPBACK ifp %p(%s)", 823189592Sbms ifp, ifp->if_xname); 824189592Sbms goto out_locked; 825144163Ssam } 826189592Sbms 827189592Sbms igmp_set_version(igi, IGMP_VERSION_2); 828189592Sbms 829189592Sbms timer = igmp->igmp_code * PR_FASTHZ / IGMP_TIMER_SCALE; 830189592Sbms if (timer == 0) 831189592Sbms timer = 1; 832189592Sbms 833189592Sbms if (!in_nullhost(igmp->igmp_group)) { 834189592Sbms /* 835189592Sbms * IGMPv2 Group-Specific Query. 836189592Sbms * If this is a group-specific IGMPv2 query, we need only 837189592Sbms * look up the single group to process it. 838189592Sbms */ 839189592Sbms inm = inm_lookup(ifp, igmp->igmp_group); 840189592Sbms if (inm != NULL) { 841189592Sbms CTR3(KTR_IGMPV3, "process v2 query %s on ifp %p(%s)", 842189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 843189592Sbms igmp_v2_update_group(inm, timer); 844189592Sbms } 845190965Srwatson IGMPSTAT_INC(igps_rcv_group_queries); 846189592Sbms } else { 847189592Sbms /* 848189592Sbms * IGMPv2 General Query. 849189592Sbms * If this was not sent to the all-hosts group, ignore it. 850189592Sbms */ 851189592Sbms if (in_allhosts(ip->ip_dst)) { 852189592Sbms /* 853189592Sbms * For each reporting group joined on this 854189592Sbms * interface, kick the report timer. 855189592Sbms */ 856189592Sbms CTR2(KTR_IGMPV3, 857189592Sbms "process v2 general query on ifp %p(%s)", 858189592Sbms ifp, ifp->if_xname); 859189592Sbms 860189592Sbms IF_ADDR_LOCK(ifp); 861189592Sbms TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 862189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 863189931Sbms ifma->ifma_protospec == NULL) 864189592Sbms continue; 865189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 866189592Sbms igmp_v2_update_group(inm, timer); 867189592Sbms } 868189592Sbms IF_ADDR_UNLOCK(ifp); 869189592Sbms } 870190965Srwatson IGMPSTAT_INC(igps_rcv_gen_queries); 871189592Sbms } 872189592Sbms 873189592Sbmsout_locked: 874189592Sbms IGMP_UNLOCK(); 875189592Sbms IN_MULTI_UNLOCK(); 876189592Sbms 877189592Sbms return (0); 8782531Swollman} 8792531Swollman 880189592Sbms/* 881189592Sbms * Update the report timer on a group in response to an IGMPv2 query. 882189592Sbms * 883189592Sbms * If we are becoming the reporting member for this group, start the timer. 884189592Sbms * If we already are the reporting member for this group, and timer is 885189592Sbms * below the threshold, reset it. 886189592Sbms * 887189592Sbms * We may be updating the group for the first time since we switched 888189592Sbms * to IGMPv3. If we are, then we must clear any recorded source lists, 889189592Sbms * and transition to REPORTING state; the group timer is overloaded 890189592Sbms * for group and group-source query responses. 891189592Sbms * 892189592Sbms * Unlike IGMPv3, the delay per group should be jittered 893189592Sbms * to avoid bursts of IGMPv2 reports. 894189592Sbms */ 895189592Sbmsstatic void 896189592Sbmsigmp_v2_update_group(struct in_multi *inm, const int timer) 897189592Sbms{ 898189592Sbms 899189592Sbms CTR4(KTR_IGMPV3, "%s: %s/%s timer=%d", __func__, 900189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname, timer); 901189592Sbms 902189592Sbms IN_MULTI_LOCK_ASSERT(); 903189592Sbms 904189592Sbms switch (inm->inm_state) { 905189592Sbms case IGMP_NOT_MEMBER: 906189592Sbms case IGMP_SILENT_MEMBER: 907189592Sbms break; 908189592Sbms case IGMP_REPORTING_MEMBER: 909189592Sbms if (inm->inm_timer != 0 && 910189592Sbms inm->inm_timer <= timer) { 911189592Sbms CTR1(KTR_IGMPV3, "%s: REPORTING and timer running, " 912189592Sbms "skipping.", __func__); 913189592Sbms break; 914189592Sbms } 915189592Sbms /* FALLTHROUGH */ 916189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 917189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 918189592Sbms case IGMP_IDLE_MEMBER: 919189592Sbms case IGMP_LAZY_MEMBER: 920189592Sbms case IGMP_AWAKENING_MEMBER: 921189592Sbms CTR1(KTR_IGMPV3, "%s: ->REPORTING", __func__); 922189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 923189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY(timer); 924189592Sbms V_current_state_timers_running = 1; 925189592Sbms break; 926189592Sbms case IGMP_SLEEPING_MEMBER: 927189592Sbms CTR1(KTR_IGMPV3, "%s: ->AWAKENING", __func__); 928189592Sbms inm->inm_state = IGMP_AWAKENING_MEMBER; 929189592Sbms break; 930189592Sbms case IGMP_LEAVING_MEMBER: 931189592Sbms break; 932189592Sbms } 933189592Sbms} 934189592Sbms 935189592Sbms/* 936189592Sbms * Process a received IGMPv3 general, group-specific or 937189592Sbms * group-and-source-specific query. 938189592Sbms * Assumes m has already been pulled up to the full IGMP message length. 939189592Sbms * Return 0 if successful, otherwise an appropriate error code is returned. 940189592Sbms */ 941189592Sbmsstatic int 942189592Sbmsigmp_input_v3_query(struct ifnet *ifp, const struct ip *ip, 943189592Sbms /*const*/ struct igmpv3 *igmpv3) 944189592Sbms{ 945189592Sbms struct igmp_ifinfo *igi; 946189592Sbms struct in_multi *inm; 947189592Sbms uint32_t maxresp, nsrc, qqi; 948189592Sbms uint16_t timer; 949189592Sbms uint8_t qrv; 950189592Sbms 951189592Sbms CTR2(KTR_IGMPV3, "process v3 query on ifp %p(%s)", ifp, ifp->if_xname); 952189592Sbms 953189592Sbms maxresp = igmpv3->igmp_code; /* in 1/10ths of a second */ 954189592Sbms if (maxresp >= 128) { 955189592Sbms maxresp = IGMP_MANT(igmpv3->igmp_code) << 956189592Sbms (IGMP_EXP(igmpv3->igmp_code) + 3); 957189592Sbms } 958189592Sbms 959189592Sbms /* 960189592Sbms * Robustness must never be less than 2 for on-wire IGMPv3. 961189592Sbms * FIXME: Check if ifp has IGIF_LOOPBACK set, as we make 962189592Sbms * an exception for interfaces whose IGMPv3 state changes 963189592Sbms * are redirected to loopback (e.g. MANET). 964189592Sbms */ 965189592Sbms qrv = IGMP_QRV(igmpv3->igmp_misc); 966189592Sbms if (qrv < 2) { 967189592Sbms CTR3(KTR_IGMPV3, "%s: clamping qrv %d to %d", __func__, 968189592Sbms qrv, IGMP_RV_INIT); 969189592Sbms qrv = IGMP_RV_INIT; 970189592Sbms } 971189592Sbms 972189592Sbms qqi = igmpv3->igmp_qqi; 973189592Sbms if (qqi >= 128) { 974190691Sbms qqi = IGMP_MANT(igmpv3->igmp_qqi) << 975190691Sbms (IGMP_EXP(igmpv3->igmp_qqi) + 3); 976189592Sbms } 977189592Sbms 978189592Sbms timer = maxresp * PR_FASTHZ / IGMP_TIMER_SCALE; 979189592Sbms if (timer == 0) 980189592Sbms timer = 1; 981189592Sbms 982189592Sbms nsrc = ntohs(igmpv3->igmp_numsrc); 983189592Sbms 984189592Sbms IN_MULTI_LOCK(); 985189592Sbms IGMP_LOCK(); 986189592Sbms 987189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 988189592Sbms KASSERT(igi != NULL, ("%s: no igmp_ifinfo for ifp %p", __func__, ifp)); 989189592Sbms 990189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 991189592Sbms CTR2(KTR_IGMPV3, "ignore v3 query on IGIF_LOOPBACK ifp %p(%s)", 992189592Sbms ifp, ifp->if_xname); 993189592Sbms goto out_locked; 994189592Sbms } 995189592Sbms 996189592Sbms igmp_set_version(igi, IGMP_VERSION_3); 997189592Sbms 998189592Sbms igi->igi_rv = qrv; 999189592Sbms igi->igi_qi = qqi; 1000189592Sbms igi->igi_qri = maxresp; 1001189592Sbms 1002189592Sbms CTR4(KTR_IGMPV3, "%s: qrv %d qi %d qri %d", __func__, qrv, qqi, 1003189592Sbms maxresp); 1004189592Sbms 1005189592Sbms if (in_nullhost(igmpv3->igmp_group)) { 1006189592Sbms /* 1007189592Sbms * IGMPv3 General Query. 1008189592Sbms * Schedule a current-state report on this ifp for 1009189592Sbms * all groups, possibly containing source lists. 1010189592Sbms */ 1011190965Srwatson IGMPSTAT_INC(igps_rcv_gen_queries); 1012189592Sbms 1013189592Sbms if (!in_allhosts(ip->ip_dst) || nsrc > 0) { 1014189592Sbms /* 1015189592Sbms * General Queries SHOULD be directed to 224.0.0.1. 1016189592Sbms * A general query with a source list has undefined 1017189592Sbms * behaviour; discard it. 1018189592Sbms */ 1019190965Srwatson IGMPSTAT_INC(igps_rcv_badqueries); 1020189592Sbms goto out_locked; 1021189592Sbms } 1022189592Sbms 1023189592Sbms CTR2(KTR_IGMPV3, "process v3 general query on ifp %p(%s)", 1024189592Sbms ifp, ifp->if_xname); 1025189592Sbms 1026189592Sbms /* 1027189592Sbms * If there is a pending General Query response 1028189592Sbms * scheduled earlier than the selected delay, do 1029189592Sbms * not schedule any other reports. 1030189592Sbms * Otherwise, reset the interface timer. 1031189592Sbms */ 1032189592Sbms if (igi->igi_v3_timer == 0 || igi->igi_v3_timer >= timer) { 1033189592Sbms igi->igi_v3_timer = IGMP_RANDOM_DELAY(timer); 1034189592Sbms V_interface_timers_running = 1; 1035189592Sbms } 1036189592Sbms } else { 1037189592Sbms /* 1038189592Sbms * IGMPv3 Group-specific or Group-and-source-specific Query. 1039189592Sbms * 1040189592Sbms * Group-source-specific queries are throttled on 1041189592Sbms * a per-group basis to defeat denial-of-service attempts. 1042189592Sbms * Queries for groups we are not a member of on this 1043189592Sbms * link are simply ignored. 1044189592Sbms */ 1045189592Sbms inm = inm_lookup(ifp, igmpv3->igmp_group); 1046189592Sbms if (inm == NULL) 1047189592Sbms goto out_locked; 1048189592Sbms if (nsrc > 0) { 1049190965Srwatson IGMPSTAT_INC(igps_rcv_gsr_queries); 1050189592Sbms if (!ratecheck(&inm->inm_lastgsrtv, 1051189592Sbms &V_igmp_gsrdelay)) { 1052189592Sbms CTR1(KTR_IGMPV3, "%s: GS query throttled.", 1053189592Sbms __func__); 1054190965Srwatson IGMPSTAT_INC(igps_drop_gsr_queries); 1055189592Sbms goto out_locked; 1056189592Sbms } 1057189592Sbms } else { 1058190965Srwatson IGMPSTAT_INC(igps_rcv_group_queries); 1059189592Sbms } 1060189592Sbms CTR3(KTR_IGMPV3, "process v3 %s query on ifp %p(%s)", 1061189592Sbms inet_ntoa(igmpv3->igmp_group), ifp, ifp->if_xname); 1062189592Sbms /* 1063189592Sbms * If there is a pending General Query response 1064189592Sbms * scheduled sooner than the selected delay, no 1065189592Sbms * further report need be scheduled. 1066189592Sbms * Otherwise, prepare to respond to the 1067189592Sbms * group-specific or group-and-source query. 1068189592Sbms */ 1069189592Sbms if (igi->igi_v3_timer == 0 || igi->igi_v3_timer >= timer) 1070189592Sbms igmp_input_v3_group_query(inm, igi, timer, igmpv3); 1071189592Sbms } 1072189592Sbms 1073189592Sbmsout_locked: 1074189592Sbms IGMP_UNLOCK(); 1075189592Sbms IN_MULTI_UNLOCK(); 1076189592Sbms 1077189592Sbms return (0); 1078189592Sbms} 1079189592Sbms 1080189592Sbms/* 1081189592Sbms * Process a recieved IGMPv3 group-specific or group-and-source-specific 1082189592Sbms * query. 1083189592Sbms * Return <0 if any error occured. Currently this is ignored. 1084189592Sbms */ 1085189592Sbmsstatic int 1086189592Sbmsigmp_input_v3_group_query(struct in_multi *inm, struct igmp_ifinfo *igi, 1087189592Sbms int timer, /*const*/ struct igmpv3 *igmpv3) 1088189592Sbms{ 1089189592Sbms int retval; 1090189592Sbms uint16_t nsrc; 1091189592Sbms 1092189592Sbms IN_MULTI_LOCK_ASSERT(); 1093189592Sbms IGMP_LOCK_ASSERT(); 1094189592Sbms 1095189592Sbms retval = 0; 1096189592Sbms 1097189592Sbms switch (inm->inm_state) { 1098189592Sbms case IGMP_NOT_MEMBER: 1099189592Sbms case IGMP_SILENT_MEMBER: 1100189592Sbms case IGMP_SLEEPING_MEMBER: 1101189592Sbms case IGMP_LAZY_MEMBER: 1102189592Sbms case IGMP_AWAKENING_MEMBER: 1103189592Sbms case IGMP_IDLE_MEMBER: 1104189592Sbms case IGMP_LEAVING_MEMBER: 1105189592Sbms return (retval); 1106189592Sbms break; 1107189592Sbms case IGMP_REPORTING_MEMBER: 1108189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1109189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1110189592Sbms break; 1111189592Sbms } 1112189592Sbms 1113189592Sbms nsrc = ntohs(igmpv3->igmp_numsrc); 1114189592Sbms 1115189592Sbms /* 1116189592Sbms * Deal with group-specific queries upfront. 1117189592Sbms * If any group query is already pending, purge any recorded 1118189592Sbms * source-list state if it exists, and schedule a query response 1119189592Sbms * for this group-specific query. 1120189592Sbms */ 1121189592Sbms if (nsrc == 0) { 1122189592Sbms if (inm->inm_state == IGMP_G_QUERY_PENDING_MEMBER || 1123189592Sbms inm->inm_state == IGMP_SG_QUERY_PENDING_MEMBER) { 1124189592Sbms inm_clear_recorded(inm); 1125189592Sbms timer = min(inm->inm_timer, timer); 1126189592Sbms } 1127189592Sbms inm->inm_state = IGMP_G_QUERY_PENDING_MEMBER; 1128189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY(timer); 1129189592Sbms V_current_state_timers_running = 1; 1130189592Sbms return (retval); 1131189592Sbms } 1132189592Sbms 1133189592Sbms /* 1134189592Sbms * Deal with the case where a group-and-source-specific query has 1135189592Sbms * been received but a group-specific query is already pending. 1136189592Sbms */ 1137189592Sbms if (inm->inm_state == IGMP_G_QUERY_PENDING_MEMBER) { 1138189592Sbms timer = min(inm->inm_timer, timer); 1139189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY(timer); 1140189592Sbms V_current_state_timers_running = 1; 1141189592Sbms return (retval); 1142189592Sbms } 1143189592Sbms 1144189592Sbms /* 1145189592Sbms * Finally, deal with the case where a group-and-source-specific 1146189592Sbms * query has been received, where a response to a previous g-s-r 1147189592Sbms * query exists, or none exists. 1148189592Sbms * In this case, we need to parse the source-list which the Querier 1149189592Sbms * has provided us with and check if we have any source list filter 1150189592Sbms * entries at T1 for these sources. If we do not, there is no need 1151189592Sbms * schedule a report and the query may be dropped. 1152189592Sbms * If we do, we must record them and schedule a current-state 1153189592Sbms * report for those sources. 1154189592Sbms * FIXME: Handling source lists larger than 1 mbuf requires that 1155189592Sbms * we pass the mbuf chain pointer down to this function, and use 1156189592Sbms * m_getptr() to walk the chain. 1157189592Sbms */ 1158189592Sbms if (inm->inm_nsrc > 0) { 1159189592Sbms const struct in_addr *ap; 1160189592Sbms int i, nrecorded; 1161189592Sbms 1162189592Sbms ap = (const struct in_addr *)(igmpv3 + 1); 1163189592Sbms nrecorded = 0; 1164189592Sbms for (i = 0; i < nsrc; i++, ap++) { 1165189592Sbms retval = inm_record_source(inm, ap->s_addr); 1166189592Sbms if (retval < 0) 1167189592Sbms break; 1168189592Sbms nrecorded += retval; 1169189592Sbms } 1170189592Sbms if (nrecorded > 0) { 1171189592Sbms CTR1(KTR_IGMPV3, 1172189592Sbms "%s: schedule response to SG query", __func__); 1173189592Sbms inm->inm_state = IGMP_SG_QUERY_PENDING_MEMBER; 1174189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY(timer); 1175189592Sbms V_current_state_timers_running = 1; 1176189592Sbms } 1177189592Sbms } 1178189592Sbms 1179189592Sbms return (retval); 1180189592Sbms} 1181189592Sbms 1182189592Sbms/* 1183189592Sbms * Process a received IGMPv1 host membership report. 1184189592Sbms * 1185189592Sbms * NOTE: 0.0.0.0 workaround breaks const correctness. 1186189592Sbms */ 1187189592Sbmsstatic int 1188189592Sbmsigmp_input_v1_report(struct ifnet *ifp, /*const*/ struct ip *ip, 1189189592Sbms /*const*/ struct igmp *igmp) 1190189592Sbms{ 1191189592Sbms struct in_ifaddr *ia; 1192189592Sbms struct in_multi *inm; 1193189592Sbms 1194190965Srwatson IGMPSTAT_INC(igps_rcv_reports); 1195189592Sbms 1196189592Sbms if (ifp->if_flags & IFF_LOOPBACK) 1197189592Sbms return (0); 1198189592Sbms 1199189592Sbms if (!IN_MULTICAST(ntohl(igmp->igmp_group.s_addr) || 1200189592Sbms !in_hosteq(igmp->igmp_group, ip->ip_dst))) { 1201190965Srwatson IGMPSTAT_INC(igps_rcv_badreports); 1202189592Sbms return (EINVAL); 1203189592Sbms } 1204189592Sbms 1205189592Sbms /* 1206189592Sbms * RFC 3376, Section 4.2.13, 9.2, 9.3: 1207189592Sbms * Booting clients may use the source address 0.0.0.0. Some 1208189592Sbms * IGMP daemons may not know how to use IP_RECVIF to determine 1209189592Sbms * the interface upon which this message was received. 1210189592Sbms * Replace 0.0.0.0 with the subnet address if told to do so. 1211189592Sbms */ 1212189592Sbms if (V_igmp_recvifkludge && in_nullhost(ip->ip_src)) { 1213189592Sbms IFP_TO_IA(ifp, ia); 1214189592Sbms if (ia != NULL) 1215189592Sbms ip->ip_src.s_addr = htonl(ia->ia_subnet); 1216189592Sbms } 1217189592Sbms 1218189592Sbms CTR3(KTR_IGMPV3, "process v1 report %s on ifp %p(%s)", 1219189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1220189592Sbms 1221189592Sbms /* 1222189592Sbms * IGMPv1 report suppression. 1223189592Sbms * If we are a member of this group, and our membership should be 1224189592Sbms * reported, stop our group timer and transition to the 'lazy' state. 1225189592Sbms */ 1226189592Sbms IN_MULTI_LOCK(); 1227189592Sbms inm = inm_lookup(ifp, igmp->igmp_group); 1228189592Sbms if (inm != NULL) { 1229189592Sbms struct igmp_ifinfo *igi; 1230189592Sbms 1231189592Sbms igi = inm->inm_igi; 1232189592Sbms if (igi == NULL) { 1233189592Sbms KASSERT(igi != NULL, 1234189592Sbms ("%s: no igi for ifp %p", __func__, ifp)); 1235189592Sbms goto out_locked; 1236189592Sbms } 1237189592Sbms 1238190965Srwatson IGMPSTAT_INC(igps_rcv_ourreports); 1239189592Sbms 1240189592Sbms /* 1241189592Sbms * If we are in IGMPv3 host mode, do not allow the 1242189592Sbms * other host's IGMPv1 report to suppress our reports 1243189592Sbms * unless explicitly configured to do so. 1244189592Sbms */ 1245189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 1246189592Sbms if (V_igmp_legacysupp) 1247189592Sbms igmp_v3_suppress_group_record(inm); 1248189592Sbms goto out_locked; 1249189592Sbms } 1250189592Sbms 1251189592Sbms inm->inm_timer = 0; 1252189592Sbms 1253189592Sbms switch (inm->inm_state) { 1254189592Sbms case IGMP_NOT_MEMBER: 1255189592Sbms case IGMP_SILENT_MEMBER: 1256189592Sbms break; 1257189592Sbms case IGMP_IDLE_MEMBER: 1258189592Sbms case IGMP_LAZY_MEMBER: 1259189592Sbms case IGMP_AWAKENING_MEMBER: 1260189592Sbms CTR3(KTR_IGMPV3, 1261189592Sbms "report suppressed for %s on ifp %p(%s)", 1262189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1263189592Sbms case IGMP_SLEEPING_MEMBER: 1264189592Sbms inm->inm_state = IGMP_SLEEPING_MEMBER; 1265189592Sbms break; 1266189592Sbms case IGMP_REPORTING_MEMBER: 1267189592Sbms CTR3(KTR_IGMPV3, 1268189592Sbms "report suppressed for %s on ifp %p(%s)", 1269189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1270189592Sbms if (igi->igi_version == IGMP_VERSION_1) 1271189592Sbms inm->inm_state = IGMP_LAZY_MEMBER; 1272189592Sbms else if (igi->igi_version == IGMP_VERSION_2) 1273189592Sbms inm->inm_state = IGMP_SLEEPING_MEMBER; 1274189592Sbms break; 1275189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1276189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1277189592Sbms case IGMP_LEAVING_MEMBER: 1278189592Sbms break; 1279189592Sbms } 1280189592Sbms } 1281189592Sbms 1282189592Sbmsout_locked: 1283189592Sbms IN_MULTI_UNLOCK(); 1284189592Sbms 1285189592Sbms return (0); 1286189592Sbms} 1287189592Sbms 1288189592Sbms/* 1289189592Sbms * Process a received IGMPv2 host membership report. 1290189592Sbms * 1291189592Sbms * NOTE: 0.0.0.0 workaround breaks const correctness. 1292189592Sbms */ 1293189592Sbmsstatic int 1294189592Sbmsigmp_input_v2_report(struct ifnet *ifp, /*const*/ struct ip *ip, 1295189592Sbms /*const*/ struct igmp *igmp) 1296189592Sbms{ 1297189592Sbms struct in_ifaddr *ia; 1298189592Sbms struct in_multi *inm; 1299189592Sbms 1300189592Sbms /* 1301189592Sbms * Make sure we don't hear our own membership report. Fast 1302189592Sbms * leave requires knowing that we are the only member of a 1303189592Sbms * group. 1304189592Sbms */ 1305189592Sbms IFP_TO_IA(ifp, ia); 1306189592Sbms if (ia != NULL && in_hosteq(ip->ip_src, IA_SIN(ia)->sin_addr)) 1307189592Sbms return (0); 1308189592Sbms 1309190965Srwatson IGMPSTAT_INC(igps_rcv_reports); 1310189592Sbms 1311189592Sbms if (ifp->if_flags & IFF_LOOPBACK) 1312189592Sbms return (0); 1313189592Sbms 1314189592Sbms if (!IN_MULTICAST(ntohl(igmp->igmp_group.s_addr)) || 1315189592Sbms !in_hosteq(igmp->igmp_group, ip->ip_dst)) { 1316190965Srwatson IGMPSTAT_INC(igps_rcv_badreports); 1317189592Sbms return (EINVAL); 1318189592Sbms } 1319189592Sbms 1320189592Sbms /* 1321189592Sbms * RFC 3376, Section 4.2.13, 9.2, 9.3: 1322189592Sbms * Booting clients may use the source address 0.0.0.0. Some 1323189592Sbms * IGMP daemons may not know how to use IP_RECVIF to determine 1324189592Sbms * the interface upon which this message was received. 1325189592Sbms * Replace 0.0.0.0 with the subnet address if told to do so. 1326189592Sbms */ 1327189592Sbms if (V_igmp_recvifkludge && in_nullhost(ip->ip_src)) { 1328189592Sbms if (ia != NULL) 1329189592Sbms ip->ip_src.s_addr = htonl(ia->ia_subnet); 1330189592Sbms } 1331189592Sbms 1332189592Sbms CTR3(KTR_IGMPV3, "process v2 report %s on ifp %p(%s)", 1333189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1334189592Sbms 1335189592Sbms /* 1336189592Sbms * IGMPv2 report suppression. 1337189592Sbms * If we are a member of this group, and our membership should be 1338189592Sbms * reported, and our group timer is pending or about to be reset, 1339189592Sbms * stop our group timer by transitioning to the 'lazy' state. 1340189592Sbms */ 1341189592Sbms IN_MULTI_LOCK(); 1342189592Sbms inm = inm_lookup(ifp, igmp->igmp_group); 1343189592Sbms if (inm != NULL) { 1344189592Sbms struct igmp_ifinfo *igi; 1345189592Sbms 1346189592Sbms igi = inm->inm_igi; 1347189592Sbms KASSERT(igi != NULL, ("%s: no igi for ifp %p", __func__, ifp)); 1348189592Sbms 1349190965Srwatson IGMPSTAT_INC(igps_rcv_ourreports); 1350189592Sbms 1351189592Sbms /* 1352189592Sbms * If we are in IGMPv3 host mode, do not allow the 1353189592Sbms * other host's IGMPv1 report to suppress our reports 1354189592Sbms * unless explicitly configured to do so. 1355189592Sbms */ 1356189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 1357189592Sbms if (V_igmp_legacysupp) 1358189592Sbms igmp_v3_suppress_group_record(inm); 1359189592Sbms goto out_locked; 1360189592Sbms } 1361189592Sbms 1362189592Sbms inm->inm_timer = 0; 1363189592Sbms 1364189592Sbms switch (inm->inm_state) { 1365189592Sbms case IGMP_NOT_MEMBER: 1366189592Sbms case IGMP_SILENT_MEMBER: 1367189592Sbms case IGMP_SLEEPING_MEMBER: 1368189592Sbms break; 1369189592Sbms case IGMP_REPORTING_MEMBER: 1370189592Sbms case IGMP_IDLE_MEMBER: 1371189592Sbms case IGMP_AWAKENING_MEMBER: 1372189592Sbms CTR3(KTR_IGMPV3, 1373189592Sbms "report suppressed for %s on ifp %p(%s)", 1374189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1375189592Sbms case IGMP_LAZY_MEMBER: 1376189592Sbms inm->inm_state = IGMP_LAZY_MEMBER; 1377189592Sbms break; 1378189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1379189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1380189592Sbms case IGMP_LEAVING_MEMBER: 1381189592Sbms break; 1382189592Sbms } 1383189592Sbms } 1384189592Sbms 1385189592Sbmsout_locked: 1386189592Sbms IN_MULTI_UNLOCK(); 1387189592Sbms 1388189592Sbms return (0); 1389189592Sbms} 1390189592Sbms 13911541Srgrimesvoid 1392189592Sbmsigmp_input(struct mbuf *m, int off) 13931541Srgrimes{ 1394189592Sbms int iphlen; 1395189592Sbms struct ifnet *ifp; 1396189592Sbms struct igmp *igmp; 1397189592Sbms struct ip *ip; 1398189592Sbms int igmplen; 1399189592Sbms int minlen; 1400189592Sbms int queryver; 1401189592Sbms 1402189592Sbms CTR3(KTR_IGMPV3, "%s: called w/mbuf (%p,%d)", __func__, m, off); 1403189592Sbms 1404189592Sbms ifp = m->m_pkthdr.rcvif; 1405183550Szec INIT_VNET_INET(ifp->if_vnet); 14061541Srgrimes 1407190965Srwatson IGMPSTAT_INC(igps_rcv_total); 14081541Srgrimes 14091541Srgrimes ip = mtod(m, struct ip *); 1410189592Sbms iphlen = off; 14111541Srgrimes igmplen = ip->ip_len; 14121541Srgrimes 14131541Srgrimes /* 1414164863Srwatson * Validate lengths. 14151541Srgrimes */ 14161541Srgrimes if (igmplen < IGMP_MINLEN) { 1417190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 14181541Srgrimes m_freem(m); 14191541Srgrimes return; 14201541Srgrimes } 1421189592Sbms 1422189592Sbms /* 1423189592Sbms * Always pullup to the minimum size for v1/v2 or v3 1424189592Sbms * to amortize calls to m_pullup(). 1425189592Sbms */ 1426189592Sbms minlen = iphlen; 1427189592Sbms if (igmplen >= IGMP_V3_QUERY_MINLEN) 1428189592Sbms minlen += IGMP_V3_QUERY_MINLEN; 1429189592Sbms else 1430189592Sbms minlen += IGMP_MINLEN; 14311541Srgrimes if ((m->m_flags & M_EXT || m->m_len < minlen) && 14321541Srgrimes (m = m_pullup(m, minlen)) == 0) { 1433190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 14341541Srgrimes return; 14351541Srgrimes } 1436189592Sbms ip = mtod(m, struct ip *); 14371541Srgrimes 1438189592Sbms if (ip->ip_ttl != 1) { 1439190965Srwatson IGMPSTAT_INC(igps_rcv_badttl); 1440189592Sbms m_freem(m); 1441189592Sbms return; 1442189592Sbms } 1443189592Sbms 14441541Srgrimes /* 1445164863Srwatson * Validate checksum. 14461541Srgrimes */ 14471541Srgrimes m->m_data += iphlen; 14481541Srgrimes m->m_len -= iphlen; 14491541Srgrimes igmp = mtod(m, struct igmp *); 14501541Srgrimes if (in_cksum(m, igmplen)) { 1451190965Srwatson IGMPSTAT_INC(igps_rcv_badsum); 14521541Srgrimes m_freem(m); 14531541Srgrimes return; 14541541Srgrimes } 14551541Srgrimes m->m_data -= iphlen; 14561541Srgrimes m->m_len += iphlen; 14572531Swollman 14581541Srgrimes switch (igmp->igmp_type) { 1459189592Sbms case IGMP_HOST_MEMBERSHIP_QUERY: 1460189592Sbms if (igmplen == IGMP_MINLEN) { 1461189592Sbms if (igmp->igmp_code == 0) 1462189592Sbms queryver = IGMP_VERSION_1; 1463189592Sbms else 1464189592Sbms queryver = IGMP_VERSION_2; 1465189592Sbms } else if (igmplen >= IGMP_V3_QUERY_MINLEN) { 1466189592Sbms queryver = IGMP_VERSION_3; 1467189592Sbms } else { 1468190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 1469189592Sbms m_freem(m); 1470189592Sbms return; 1471189592Sbms } 14721541Srgrimes 1473189592Sbms switch (queryver) { 1474189592Sbms case IGMP_VERSION_1: 1475190965Srwatson IGMPSTAT_INC(igps_rcv_v1v2_queries); 1476189592Sbms if (!V_igmp_v1enable) 1477189592Sbms break; 1478189592Sbms if (igmp_input_v1_query(ifp, ip) != 0) { 1479144163Ssam m_freem(m); 1480144163Ssam return; 1481144163Ssam } 1482189592Sbms break; 14834028Spst 1484189592Sbms case IGMP_VERSION_2: 1485190965Srwatson IGMPSTAT_INC(igps_rcv_v1v2_queries); 1486189592Sbms if (!V_igmp_v2enable) 1487189592Sbms break; 1488189592Sbms if (igmp_input_v2_query(ifp, ip, igmp) != 0) { 14892531Swollman m_freem(m); 14902531Swollman return; 14912531Swollman } 1492189592Sbms break; 14932531Swollman 1494189592Sbms case IGMP_VERSION_3: { 1495189592Sbms struct igmpv3 *igmpv3; 1496189592Sbms uint16_t igmpv3len; 1497189592Sbms uint16_t srclen; 1498189592Sbms int nsrc; 1499189592Sbms 1500190965Srwatson IGMPSTAT_INC(igps_rcv_v3_queries); 1501189592Sbms igmpv3 = (struct igmpv3 *)igmp; 1502189592Sbms /* 1503189592Sbms * Validate length based on source count. 1504189592Sbms */ 1505189592Sbms nsrc = ntohs(igmpv3->igmp_numsrc); 1506189592Sbms srclen = sizeof(struct in_addr) * nsrc; 1507189592Sbms if (nsrc * sizeof(in_addr_t) > srclen) { 1508190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 1509189592Sbms return; 15102531Swollman } 1511189592Sbms /* 1512189592Sbms * m_pullup() may modify m, so pullup in 1513189592Sbms * this scope. 1514189592Sbms */ 1515189592Sbms igmpv3len = iphlen + IGMP_V3_QUERY_MINLEN + 1516189592Sbms srclen; 1517189592Sbms if ((m->m_flags & M_EXT || 1518189592Sbms m->m_len < igmpv3len) && 1519189592Sbms (m = m_pullup(m, igmpv3len)) == NULL) { 1520190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 1521189592Sbms return; 1522189592Sbms } 1523189592Sbms igmpv3 = (struct igmpv3 *)(mtod(m, uint8_t *) 1524189592Sbms + iphlen); 1525189592Sbms if (igmp_input_v3_query(ifp, ip, igmpv3) != 0) { 1526189592Sbms m_freem(m); 1527189592Sbms return; 1528189592Sbms } 15291541Srgrimes } 1530189592Sbms break; 15311541Srgrimes } 15321541Srgrimes break; 15331541Srgrimes 1534189592Sbms case IGMP_v1_HOST_MEMBERSHIP_REPORT: 1535189592Sbms if (!V_igmp_v1enable) 153614622Sfenner break; 1537189592Sbms if (igmp_input_v1_report(ifp, ip, igmp) != 0) { 1538189592Sbms m_freem(m); 1539189592Sbms return; 1540189592Sbms } 1541189592Sbms break; 154214622Sfenner 1543189592Sbms case IGMP_v2_HOST_MEMBERSHIP_REPORT: 1544189592Sbms if (!V_igmp_v2enable) 15451541Srgrimes break; 1546189592Sbms if (!ip_checkrouteralert(m)) 1547190965Srwatson IGMPSTAT_INC(igps_rcv_nora); 1548189592Sbms if (igmp_input_v2_report(ifp, ip, igmp) != 0) { 15491541Srgrimes m_freem(m); 15501541Srgrimes return; 15511541Srgrimes } 1552189592Sbms break; 15531541Srgrimes 1554189592Sbms case IGMP_v3_HOST_MEMBERSHIP_REPORT: 15551541Srgrimes /* 1556189592Sbms * Hosts do not need to process IGMPv3 membership reports, 1557189592Sbms * as report suppression is no longer required. 15581541Srgrimes */ 1559189592Sbms if (!ip_checkrouteralert(m)) 1560190965Srwatson IGMPSTAT_INC(igps_rcv_nora); 1561189592Sbms break; 15621541Srgrimes 1563189592Sbms default: 15641541Srgrimes break; 15651541Srgrimes } 15661541Srgrimes 15671541Srgrimes /* 1568164863Srwatson * Pass all valid IGMP packets up to any process(es) listening on a 1569164863Srwatson * raw IGMP socket. 15701541Srgrimes */ 157182890Sjulian rip_input(m, off); 15721541Srgrimes} 15731541Srgrimes 1574189592Sbms 1575189592Sbms/* 1576189592Sbms * Fast timeout handler (global). 1577189592Sbms * VIMAGE: Timeout handlers are expected to service all vimages. 1578189592Sbms */ 15791541Srgrimesvoid 1580189592Sbmsigmp_fasttimo(void) 15811541Srgrimes{ 1582189592Sbms#ifdef VIMAGE 1583189592Sbms VNET_ITERATOR_DECL(vnet_iter); 15841541Srgrimes 1585189592Sbms VNET_LIST_RLOCK(); 1586189592Sbms VNET_FOREACH(vnet_iter) { 1587189592Sbms CURVNET_SET(vnet_iter); 1588189592Sbms INIT_VNET_INET(vnet_iter); 1589189592Sbms igmp_fasttimo_vnet(); 1590189592Sbms CURVNET_RESTORE(); 1591189592Sbms } 1592189592Sbms VNET_LIST_RUNLOCK(); 1593189592Sbms#else /* !VIMAGE */ 1594189592Sbms 1595189592Sbms igmp_fasttimo_vnet(); 1596189592Sbms#endif /* VIMAGE */ 1597189592Sbms} 1598189592Sbms 1599189592Sbms/* 1600189592Sbms * Fast timeout handler (per-vnet). 1601189592Sbms * Sends are shuffled off to a netisr to deal with Giant. 1602189592Sbms * 1603189592Sbms * VIMAGE: Assume caller has set up our curvnet. 1604189592Sbms */ 1605189592Sbmsstatic void 1606189592Sbmsigmp_fasttimo_vnet(void) 1607189592Sbms{ 1608189592Sbms struct ifqueue scq; /* State-change packets */ 1609189592Sbms struct ifqueue qrq; /* Query response packets */ 1610189592Sbms struct ifnet *ifp; 1611189592Sbms struct igmp_ifinfo *igi; 1612189592Sbms struct ifmultiaddr *ifma, *tifma; 1613189592Sbms struct in_multi *inm; 1614189592Sbms int loop, uri_fasthz; 1615189592Sbms 1616189592Sbms loop = 0; 1617189592Sbms uri_fasthz = 0; 1618189592Sbms 1619189592Sbms /* 1620189592Sbms * Quick check to see if any work needs to be done, in order to 1621189592Sbms * minimize the overhead of fasttimo processing. 1622189592Sbms * SMPng: XXX Unlocked reads. 1623189592Sbms */ 1624189592Sbms if (!V_current_state_timers_running && 1625189592Sbms !V_interface_timers_running && 1626189592Sbms !V_state_change_timers_running) 1627189592Sbms return; 1628189592Sbms 1629189592Sbms IN_MULTI_LOCK(); 1630189592Sbms IGMP_LOCK(); 1631189592Sbms 1632189592Sbms /* 1633189592Sbms * IGMPv3 General Query response timer processing. 1634189592Sbms */ 1635189592Sbms if (V_interface_timers_running) { 1636189592Sbms CTR1(KTR_IGMPV3, "%s: interface timers running", __func__); 1637189592Sbms 1638189592Sbms V_interface_timers_running = 0; 1639189592Sbms LIST_FOREACH(igi, &V_igi_head, igi_link) { 1640189592Sbms if (igi->igi_v3_timer == 0) { 1641189592Sbms /* Do nothing. */ 1642189592Sbms } else if (--igi->igi_v3_timer == 0) { 1643189592Sbms igmp_v3_dispatch_general_query(igi); 1644189592Sbms } else { 1645189592Sbms V_interface_timers_running = 1; 1646189592Sbms } 1647189592Sbms } 1648189592Sbms } 1649189592Sbms 1650189592Sbms if (!V_current_state_timers_running && 1651189592Sbms !V_state_change_timers_running) 1652189592Sbms goto out_locked; 1653189592Sbms 1654189592Sbms V_current_state_timers_running = 0; 1655189592Sbms V_state_change_timers_running = 0; 1656189592Sbms 1657189592Sbms CTR1(KTR_IGMPV3, "%s: state change timers running", __func__); 1658189592Sbms 1659189592Sbms /* 1660189592Sbms * IGMPv1/v2/v3 host report and state-change timer processing. 1661189592Sbms * Note: Processing a v3 group timer may remove a node. 1662189592Sbms */ 1663189592Sbms LIST_FOREACH(igi, &V_igi_head, igi_link) { 1664189592Sbms ifp = igi->igi_ifp; 1665189592Sbms 1666189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 1667189592Sbms loop = (igi->igi_flags & IGIF_LOOPBACK) ? 1 : 0; 1668189592Sbms uri_fasthz = IGMP_RANDOM_DELAY(igi->igi_uri * 1669189592Sbms PR_FASTHZ); 1670189592Sbms 1671189592Sbms memset(&qrq, 0, sizeof(struct ifqueue)); 1672189592Sbms IFQ_SET_MAXLEN(&qrq, IGMP_MAX_G_GS_PACKETS); 1673189592Sbms 1674189592Sbms memset(&scq, 0, sizeof(struct ifqueue)); 1675189592Sbms IFQ_SET_MAXLEN(&scq, IGMP_MAX_STATE_CHANGE_PACKETS); 1676189592Sbms } 1677189592Sbms 1678189592Sbms IF_ADDR_LOCK(ifp); 1679189592Sbms TAILQ_FOREACH_SAFE(ifma, &ifp->if_multiaddrs, ifma_link, 1680189592Sbms tifma) { 1681189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 1682189931Sbms ifma->ifma_protospec == NULL) 1683189592Sbms continue; 1684189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 1685189592Sbms switch (igi->igi_version) { 1686189592Sbms case IGMP_VERSION_1: 1687189592Sbms case IGMP_VERSION_2: 1688189592Sbms igmp_v1v2_process_group_timer(inm, 1689189592Sbms igi->igi_version); 1690189592Sbms break; 1691189592Sbms case IGMP_VERSION_3: 1692189592Sbms igmp_v3_process_group_timers(igi, &qrq, 1693189592Sbms &scq, inm, uri_fasthz); 1694189592Sbms break; 1695189592Sbms } 1696189592Sbms } 1697189592Sbms IF_ADDR_UNLOCK(ifp); 1698189592Sbms 1699189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 1700189592Sbms struct in_multi *tinm; 1701189592Sbms 1702189592Sbms igmp_dispatch_queue(&qrq, 0, loop); 1703189592Sbms igmp_dispatch_queue(&scq, 0, loop); 1704189592Sbms 1705189592Sbms /* 1706189592Sbms * Free the in_multi reference(s) for this 1707189592Sbms * IGMP lifecycle. 1708189592Sbms */ 1709189592Sbms SLIST_FOREACH_SAFE(inm, &igi->igi_relinmhead, 1710189592Sbms inm_nrele, tinm) { 1711189592Sbms SLIST_REMOVE_HEAD(&igi->igi_relinmhead, 1712189592Sbms inm_nrele); 1713189592Sbms inm_release_locked(inm); 1714189592Sbms } 1715189592Sbms } 1716189592Sbms } 1717189592Sbms 1718189592Sbmsout_locked: 1719189592Sbms IGMP_UNLOCK(); 1720189592Sbms IN_MULTI_UNLOCK(); 1721189592Sbms} 1722189592Sbms 1723189592Sbms/* 1724189592Sbms * Update host report group timer for IGMPv1/v2. 1725189592Sbms * Will update the global pending timer flags. 1726189592Sbms */ 1727189592Sbmsstatic void 1728189592Sbmsigmp_v1v2_process_group_timer(struct in_multi *inm, const int version) 1729189592Sbms{ 1730189592Sbms int report_timer_expired; 1731189592Sbms 1732148682Srwatson IN_MULTI_LOCK_ASSERT(); 1733189592Sbms IGMP_LOCK_ASSERT(); 1734148682Srwatson 1735189592Sbms if (inm->inm_timer == 0) { 1736189592Sbms report_timer_expired = 0; 1737189592Sbms } else if (--inm->inm_timer == 0) { 1738189592Sbms report_timer_expired = 1; 173914622Sfenner } else { 1740189592Sbms V_current_state_timers_running = 1; 1741189592Sbms return; 1742189592Sbms } 1743189592Sbms 1744189592Sbms switch (inm->inm_state) { 1745189592Sbms case IGMP_NOT_MEMBER: 1746189592Sbms case IGMP_SILENT_MEMBER: 1747189592Sbms case IGMP_IDLE_MEMBER: 1748189592Sbms case IGMP_LAZY_MEMBER: 1749189592Sbms case IGMP_SLEEPING_MEMBER: 1750189592Sbms case IGMP_AWAKENING_MEMBER: 1751189592Sbms break; 1752189592Sbms case IGMP_REPORTING_MEMBER: 1753189592Sbms if (report_timer_expired) { 1754189592Sbms inm->inm_state = IGMP_IDLE_MEMBER; 1755189592Sbms (void)igmp_v1v2_queue_report(inm, 1756189592Sbms (version == IGMP_VERSION_2) ? 1757189592Sbms IGMP_v2_HOST_MEMBERSHIP_REPORT : 1758189592Sbms IGMP_v1_HOST_MEMBERSHIP_REPORT); 1759144163Ssam } 1760189592Sbms break; 1761189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1762189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1763189592Sbms case IGMP_LEAVING_MEMBER: 1764189592Sbms break; 17651541Srgrimes } 17661541Srgrimes} 17671541Srgrimes 1768189592Sbms/* 1769189592Sbms * Update a group's timers for IGMPv3. 1770189592Sbms * Will update the global pending timer flags. 1771189592Sbms * Note: Unlocked read from igi. 1772189592Sbms */ 1773189592Sbmsstatic void 1774189592Sbmsigmp_v3_process_group_timers(struct igmp_ifinfo *igi, 1775189592Sbms struct ifqueue *qrq, struct ifqueue *scq, 1776189592Sbms struct in_multi *inm, const int uri_fasthz) 17771541Srgrimes{ 1778189592Sbms int query_response_timer_expired; 1779189592Sbms int state_change_retransmit_timer_expired; 1780119181Srwatson 1781148682Srwatson IN_MULTI_LOCK_ASSERT(); 1782189592Sbms IGMP_LOCK_ASSERT(); 1783148682Srwatson 1784189592Sbms query_response_timer_expired = 0; 1785189592Sbms state_change_retransmit_timer_expired = 0; 1786189592Sbms 1787189592Sbms /* 1788189592Sbms * During a transition from v1/v2 compatibility mode back to v3, 1789189592Sbms * a group record in REPORTING state may still have its group 1790189592Sbms * timer active. This is a no-op in this function; it is easier 1791189592Sbms * to deal with it here than to complicate the slow-timeout path. 1792189592Sbms */ 1793189592Sbms if (inm->inm_timer == 0) { 1794189592Sbms query_response_timer_expired = 0; 1795189592Sbms } else if (--inm->inm_timer == 0) { 1796189592Sbms query_response_timer_expired = 1; 1797189592Sbms } else { 1798189592Sbms V_current_state_timers_running = 1; 1799189592Sbms } 1800189592Sbms 1801189592Sbms if (inm->inm_sctimer == 0) { 1802189592Sbms state_change_retransmit_timer_expired = 0; 1803189592Sbms } else if (--inm->inm_sctimer == 0) { 1804189592Sbms state_change_retransmit_timer_expired = 1; 1805189592Sbms } else { 1806189592Sbms V_state_change_timers_running = 1; 1807189592Sbms } 1808189592Sbms 1809189592Sbms /* We are in fasttimo, so be quick about it. */ 1810189592Sbms if (!state_change_retransmit_timer_expired && 1811189592Sbms !query_response_timer_expired) 1812189592Sbms return; 1813189592Sbms 1814189592Sbms switch (inm->inm_state) { 1815189592Sbms case IGMP_NOT_MEMBER: 1816189592Sbms case IGMP_SILENT_MEMBER: 1817189592Sbms case IGMP_SLEEPING_MEMBER: 1818189592Sbms case IGMP_LAZY_MEMBER: 1819189592Sbms case IGMP_AWAKENING_MEMBER: 1820189592Sbms case IGMP_IDLE_MEMBER: 1821189592Sbms break; 1822189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1823189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1824189592Sbms /* 1825189592Sbms * Respond to a previously pending Group-Specific 1826189592Sbms * or Group-and-Source-Specific query by enqueueing 1827189592Sbms * the appropriate Current-State report for 1828189592Sbms * immediate transmission. 1829189592Sbms */ 1830189592Sbms if (query_response_timer_expired) { 1831189592Sbms int retval; 1832189592Sbms 1833189592Sbms retval = igmp_v3_enqueue_group_record(qrq, inm, 0, 1, 1834189592Sbms (inm->inm_state == IGMP_SG_QUERY_PENDING_MEMBER)); 1835189592Sbms CTR2(KTR_IGMPV3, "%s: enqueue record = %d", 1836189592Sbms __func__, retval); 1837189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 1838189592Sbms /* XXX Clear recorded sources for next time. */ 1839189592Sbms inm_clear_recorded(inm); 1840189592Sbms } 1841189592Sbms /* FALLTHROUGH */ 1842189592Sbms case IGMP_REPORTING_MEMBER: 1843189592Sbms case IGMP_LEAVING_MEMBER: 1844189592Sbms if (state_change_retransmit_timer_expired) { 1845189592Sbms /* 1846189592Sbms * State-change retransmission timer fired. 1847189592Sbms * If there are any further pending retransmissions, 1848189592Sbms * set the global pending state-change flag, and 1849189592Sbms * reset the timer. 1850189592Sbms */ 1851189592Sbms if (--inm->inm_scrv > 0) { 1852189592Sbms inm->inm_sctimer = uri_fasthz; 1853189592Sbms V_state_change_timers_running = 1; 1854189592Sbms } 1855189592Sbms /* 1856189592Sbms * Retransmit the previously computed state-change 1857189592Sbms * report. If there are no further pending 1858189592Sbms * retransmissions, the mbuf queue will be consumed. 1859189592Sbms * Update T0 state to T1 as we have now sent 1860189592Sbms * a state-change. 1861189592Sbms */ 1862189592Sbms (void)igmp_v3_merge_state_changes(inm, scq); 1863189592Sbms 1864189592Sbms inm_commit(inm); 1865189592Sbms CTR3(KTR_IGMPV3, "%s: T1 -> T0 for %s/%s", __func__, 1866189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 1867189592Sbms 1868189592Sbms /* 1869189592Sbms * If we are leaving the group for good, make sure 1870189592Sbms * we release IGMP's reference to it. 1871189592Sbms * This release must be deferred using a SLIST, 1872189592Sbms * as we are called from a loop which traverses 1873189592Sbms * the in_ifmultiaddr TAILQ. 1874189592Sbms */ 1875189592Sbms if (inm->inm_state == IGMP_LEAVING_MEMBER && 1876189592Sbms inm->inm_scrv == 0) { 1877189592Sbms inm->inm_state = IGMP_NOT_MEMBER; 1878189592Sbms SLIST_INSERT_HEAD(&igi->igi_relinmhead, 1879189592Sbms inm, inm_nrele); 1880189592Sbms } 1881189592Sbms } 1882189592Sbms break; 1883189592Sbms } 18841541Srgrimes} 18851541Srgrimes 1886189592Sbms 1887189592Sbms/* 1888189592Sbms * Suppress a group's pending response to a group or source/group query. 1889189592Sbms * 1890189592Sbms * Do NOT suppress state changes. This leads to IGMPv3 inconsistency. 1891189592Sbms * Do NOT update ST1/ST0 as this operation merely suppresses 1892189592Sbms * the currently pending group record. 1893189592Sbms * Do NOT suppress the response to a general query. It is possible but 1894189592Sbms * it would require adding another state or flag. 1895189592Sbms */ 1896189592Sbmsstatic void 1897189592Sbmsigmp_v3_suppress_group_record(struct in_multi *inm) 18981541Srgrimes{ 18991541Srgrimes 1900189592Sbms IN_MULTI_LOCK_ASSERT(); 1901189592Sbms 1902189592Sbms KASSERT(inm->inm_igi->igi_version == IGMP_VERSION_3, 1903189592Sbms ("%s: not IGMPv3 mode on link", __func__)); 1904189592Sbms 1905189592Sbms if (inm->inm_state != IGMP_G_QUERY_PENDING_MEMBER || 1906189592Sbms inm->inm_state != IGMP_SG_QUERY_PENDING_MEMBER) 1907189592Sbms return; 1908189592Sbms 1909189592Sbms if (inm->inm_state == IGMP_SG_QUERY_PENDING_MEMBER) 1910189592Sbms inm_clear_recorded(inm); 1911189592Sbms 1912189592Sbms inm->inm_timer = 0; 1913189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 1914189592Sbms} 1915189592Sbms 1916189592Sbms/* 1917189592Sbms * Switch to a different IGMP version on the given interface, 1918189592Sbms * as per Section 7.2.1. 1919189592Sbms */ 1920189592Sbmsstatic void 1921189592Sbmsigmp_set_version(struct igmp_ifinfo *igi, const int version) 1922189592Sbms{ 1923189592Sbms 1924189592Sbms IGMP_LOCK_ASSERT(); 1925189592Sbms 1926189592Sbms CTR4(KTR_IGMPV3, "%s: switching to v%d on ifp %p(%s)", __func__, 1927189592Sbms version, igi->igi_ifp, igi->igi_ifp->if_xname); 1928189592Sbms 1929189592Sbms if (version == IGMP_VERSION_1 || version == IGMP_VERSION_2) { 1930189592Sbms int old_version_timer; 1931189592Sbms /* 1932189592Sbms * Compute the "Older Version Querier Present" timer as per 1933189592Sbms * Section 8.12. 1934189592Sbms */ 1935189592Sbms old_version_timer = igi->igi_rv * igi->igi_qi + igi->igi_qri; 1936189592Sbms old_version_timer *= PR_SLOWHZ; 1937189592Sbms 1938189592Sbms if (version == IGMP_VERSION_1) { 1939189592Sbms igi->igi_v1_timer = old_version_timer; 1940189592Sbms igi->igi_v2_timer = 0; 1941189592Sbms } else if (version == IGMP_VERSION_2) { 1942189592Sbms igi->igi_v1_timer = 0; 1943189592Sbms igi->igi_v2_timer = old_version_timer; 1944189592Sbms } 1945189592Sbms } 1946189592Sbms 1947189592Sbms if (igi->igi_v1_timer == 0 && igi->igi_v2_timer > 0) { 1948189592Sbms if (igi->igi_version != IGMP_VERSION_2) { 1949189592Sbms igi->igi_version = IGMP_VERSION_2; 1950189592Sbms igmp_v3_cancel_link_timers(igi); 1951189592Sbms } 1952189592Sbms } else if (igi->igi_v1_timer > 0) { 1953189592Sbms if (igi->igi_version != IGMP_VERSION_1) { 1954189592Sbms igi->igi_version = IGMP_VERSION_1; 1955189592Sbms igmp_v3_cancel_link_timers(igi); 1956189592Sbms } 1957189592Sbms } 1958189592Sbms} 1959189592Sbms 1960189592Sbms/* 1961189592Sbms * Cancel pending IGMPv3 timers for the given link and all groups 1962189592Sbms * joined on it; state-change, general-query, and group-query timers. 1963189592Sbms */ 1964189592Sbmsstatic void 1965189592Sbmsigmp_v3_cancel_link_timers(struct igmp_ifinfo *igi) 1966189592Sbms{ 1967189592Sbms struct ifmultiaddr *ifma; 1968189592Sbms struct ifnet *ifp; 1969189592Sbms struct in_multi *inm; 1970189592Sbms 1971189592Sbms CTR3(KTR_IGMPV3, "%s: cancel v3 timers on ifp %p(%s)", __func__, 1972189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 1973189592Sbms 1974189592Sbms IN_MULTI_LOCK_ASSERT(); 1975189592Sbms IGMP_LOCK_ASSERT(); 1976189592Sbms 19771541Srgrimes /* 1978189592Sbms * Fast-track this potentially expensive operation 1979189592Sbms * by checking all the global 'timer pending' flags. 19801541Srgrimes */ 1981189592Sbms if (!V_interface_timers_running && 1982189592Sbms !V_state_change_timers_running && 1983189592Sbms !V_current_state_timers_running) 19841541Srgrimes return; 19851541Srgrimes 1986189592Sbms igi->igi_v3_timer = 0; 1987189592Sbms 1988189592Sbms ifp = igi->igi_ifp; 1989189592Sbms 1990189592Sbms IF_ADDR_LOCK(ifp); 1991189592Sbms TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 1992189592Sbms if (ifma->ifma_addr->sa_family != AF_INET) 1993189592Sbms continue; 1994189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 1995189592Sbms switch (inm->inm_state) { 1996189592Sbms case IGMP_NOT_MEMBER: 1997189592Sbms case IGMP_SILENT_MEMBER: 1998189592Sbms case IGMP_IDLE_MEMBER: 1999189592Sbms case IGMP_LAZY_MEMBER: 2000189592Sbms case IGMP_SLEEPING_MEMBER: 2001189592Sbms case IGMP_AWAKENING_MEMBER: 2002189592Sbms break; 2003189592Sbms case IGMP_LEAVING_MEMBER: 2004189592Sbms /* 2005189592Sbms * If we are leaving the group and switching 2006189592Sbms * IGMP version, we need to release the final 2007189592Sbms * reference held for issuing the INCLUDE {}. 2008189592Sbms * 2009189592Sbms * SMPNG: Must drop and re-acquire IF_ADDR_LOCK 2010189592Sbms * around inm_release_locked(), as it is not 2011189592Sbms * a recursive mutex. 2012189592Sbms */ 2013189592Sbms IF_ADDR_UNLOCK(ifp); 2014189592Sbms inm_release_locked(inm); 2015189592Sbms IF_ADDR_LOCK(ifp); 2016189592Sbms /* FALLTHROUGH */ 2017189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 2018189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 2019189592Sbms inm_clear_recorded(inm); 2020189592Sbms /* FALLTHROUGH */ 2021189592Sbms case IGMP_REPORTING_MEMBER: 2022189592Sbms inm->inm_sctimer = 0; 2023189592Sbms inm->inm_timer = 0; 2024189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 2025189592Sbms /* 2026189592Sbms * Free any pending IGMPv3 state-change records. 2027189592Sbms */ 2028189592Sbms _IF_DRAIN(&inm->inm_scq); 2029189592Sbms break; 2030189592Sbms } 2031189592Sbms } 2032189592Sbms IF_ADDR_UNLOCK(ifp); 2033189592Sbms} 2034189592Sbms 2035189592Sbms/* 2036189592Sbms * Update the Older Version Querier Present timers for a link. 2037189592Sbms * See Section 7.2.1 of RFC 3376. 2038189592Sbms */ 2039189592Sbmsstatic void 2040189592Sbmsigmp_v1v2_process_querier_timers(struct igmp_ifinfo *igi) 2041189592Sbms{ 2042189592Sbms 2043189592Sbms IGMP_LOCK_ASSERT(); 2044189592Sbms 2045189592Sbms if (igi->igi_v1_timer == 0 && igi->igi_v2_timer == 0) { 2046189592Sbms /* 2047189592Sbms * IGMPv1 and IGMPv2 Querier Present timers expired. 2048189592Sbms * 2049189592Sbms * Revert to IGMPv3. 2050189592Sbms */ 2051189592Sbms if (igi->igi_version != IGMP_VERSION_3) { 2052189592Sbms CTR5(KTR_IGMPV3, 2053189592Sbms "%s: transition from v%d -> v%d on %p(%s)", 2054189592Sbms __func__, igi->igi_version, IGMP_VERSION_3, 2055189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 2056189592Sbms igi->igi_version = IGMP_VERSION_3; 2057189592Sbms } 2058189592Sbms } else if (igi->igi_v1_timer == 0 && igi->igi_v2_timer > 0) { 2059189592Sbms /* 2060189592Sbms * IGMPv1 Querier Present timer expired, 2061189592Sbms * IGMPv2 Querier Present timer running. 2062189592Sbms * If IGMPv2 was disabled since last timeout, 2063189592Sbms * revert to IGMPv3. 2064189592Sbms * If IGMPv2 is enabled, revert to IGMPv2. 2065189592Sbms */ 2066189592Sbms if (!V_igmp_v2enable) { 2067189592Sbms CTR5(KTR_IGMPV3, 2068189592Sbms "%s: transition from v%d -> v%d on %p(%s)", 2069189592Sbms __func__, igi->igi_version, IGMP_VERSION_3, 2070189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 2071189592Sbms igi->igi_v2_timer = 0; 2072189592Sbms igi->igi_version = IGMP_VERSION_3; 2073189592Sbms } else { 2074189592Sbms --igi->igi_v2_timer; 2075189592Sbms if (igi->igi_version != IGMP_VERSION_2) { 2076189592Sbms CTR5(KTR_IGMPV3, 2077189592Sbms "%s: transition from v%d -> v%d on %p(%s)", 2078189592Sbms __func__, igi->igi_version, IGMP_VERSION_2, 2079189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 2080189592Sbms igi->igi_version = IGMP_VERSION_2; 2081183550Szec } 20821541Srgrimes } 2083189592Sbms } else if (igi->igi_v1_timer > 0) { 2084189592Sbms /* 2085189592Sbms * IGMPv1 Querier Present timer running. 2086189592Sbms * Stop IGMPv2 timer if running. 2087189592Sbms * 2088189592Sbms * If IGMPv1 was disabled since last timeout, 2089189592Sbms * revert to IGMPv3. 2090189592Sbms * If IGMPv1 is enabled, reset IGMPv2 timer if running. 2091189592Sbms */ 2092189592Sbms if (!V_igmp_v1enable) { 2093189592Sbms CTR5(KTR_IGMPV3, 2094189592Sbms "%s: transition from v%d -> v%d on %p(%s)", 2095189592Sbms __func__, igi->igi_version, IGMP_VERSION_3, 2096189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 2097189592Sbms igi->igi_v1_timer = 0; 2098189592Sbms igi->igi_version = IGMP_VERSION_3; 2099189592Sbms } else { 2100189592Sbms --igi->igi_v1_timer; 2101189592Sbms } 2102189592Sbms if (igi->igi_v2_timer > 0) { 2103189592Sbms CTR3(KTR_IGMPV3, 2104189592Sbms "%s: cancel v2 timer on %p(%s)", 2105189592Sbms __func__, igi->igi_ifp, igi->igi_ifp->if_xname); 2106189592Sbms igi->igi_v2_timer = 0; 2107189592Sbms } 21081541Srgrimes } 21091541Srgrimes} 21101541Srgrimes 2111189592Sbms/* 2112189592Sbms * Global slowtimo handler. 2113189592Sbms * VIMAGE: Timeout handlers are expected to service all vimages. 2114189592Sbms */ 21152531Swollmanvoid 2116119181Srwatsonigmp_slowtimo(void) 21172531Swollman{ 2118189592Sbms#ifdef VIMAGE 2119183550Szec VNET_ITERATOR_DECL(vnet_iter); 21202531Swollman 2121183550Szec VNET_LIST_RLOCK(); 2122183550Szec VNET_FOREACH(vnet_iter) { 2123183550Szec CURVNET_SET(vnet_iter); 2124183550Szec INIT_VNET_INET(vnet_iter); 2125189592Sbms igmp_slowtimo_vnet(); 2126183550Szec CURVNET_RESTORE(); 21272531Swollman } 2128183550Szec VNET_LIST_RUNLOCK(); 2129189592Sbms#else /* !VIMAGE */ 2130189592Sbms igmp_slowtimo_vnet(); 2131189592Sbms#endif /* VIMAGE */ 21322531Swollman} 21332531Swollman 2134189592Sbms/* 2135189592Sbms * Per-vnet slowtimo handler. 2136189592Sbms */ 21371541Srgrimesstatic void 2138189592Sbmsigmp_slowtimo_vnet(void) 21391541Srgrimes{ 2140189592Sbms struct igmp_ifinfo *igi; 21411541Srgrimes 2142189592Sbms IGMP_LOCK(); 2143189592Sbms 2144189592Sbms LIST_FOREACH(igi, &V_igi_head, igi_link) { 2145189592Sbms igmp_v1v2_process_querier_timers(igi); 2146189592Sbms } 2147189592Sbms 2148189592Sbms IGMP_UNLOCK(); 2149189592Sbms} 2150189592Sbms 2151189592Sbms/* 2152189592Sbms * Dispatch an IGMPv1/v2 host report or leave message. 2153189592Sbms * These are always small enough to fit inside a single mbuf. 2154189592Sbms */ 2155189592Sbmsstatic int 2156189592Sbmsigmp_v1v2_queue_report(struct in_multi *inm, const int type) 2157189592Sbms{ 2158189592Sbms struct ifnet *ifp; 2159189592Sbms struct igmp *igmp; 2160189592Sbms struct ip *ip; 2161189592Sbms struct mbuf *m; 2162189592Sbms 2163148682Srwatson IN_MULTI_LOCK_ASSERT(); 2164189592Sbms IGMP_LOCK_ASSERT(); 2165148682Srwatson 2166189592Sbms ifp = inm->inm_ifp; 2167189592Sbms /* XXX are these needed ? */ 2168189592Sbms INIT_VNET_NET(ifp->if_vnet); 2169189592Sbms INIT_VNET_INET(ifp->if_vnet); 2170189592Sbms 2171151967Sandre MGETHDR(m, M_DONTWAIT, MT_DATA); 2172119181Srwatson if (m == NULL) 2173189592Sbms return (ENOMEM); 2174189592Sbms MH_ALIGN(m, sizeof(struct ip) + sizeof(struct igmp)); 21752531Swollman 2176189592Sbms m->m_pkthdr.len = sizeof(struct ip) + sizeof(struct igmp); 2177189592Sbms 21782531Swollman m->m_data += sizeof(struct ip); 2179189592Sbms m->m_len = sizeof(struct igmp); 2180189592Sbms 2181119181Srwatson igmp = mtod(m, struct igmp *); 2182119181Srwatson igmp->igmp_type = type; 2183119181Srwatson igmp->igmp_code = 0; 2184119181Srwatson igmp->igmp_group = inm->inm_addr; 2185119181Srwatson igmp->igmp_cksum = 0; 2186189592Sbms igmp->igmp_cksum = in_cksum(m, sizeof(struct igmp)); 21871541Srgrimes 2188119181Srwatson m->m_data -= sizeof(struct ip); 2189119181Srwatson m->m_len += sizeof(struct ip); 2190189592Sbms 2191119181Srwatson ip = mtod(m, struct ip *); 2192119181Srwatson ip->ip_tos = 0; 2193189592Sbms ip->ip_len = sizeof(struct ip) + sizeof(struct igmp); 2194119181Srwatson ip->ip_off = 0; 2195119181Srwatson ip->ip_p = IPPROTO_IGMP; 2196119181Srwatson ip->ip_src.s_addr = INADDR_ANY; 21971541Srgrimes 2198189592Sbms if (type == IGMP_HOST_LEAVE_MESSAGE) 2199189592Sbms ip->ip_dst.s_addr = htonl(INADDR_ALLRTRS_GROUP); 2200189592Sbms else 2201189592Sbms ip->ip_dst = inm->inm_addr; 2202189592Sbms 2203189592Sbms igmp_save_context(m, ifp); 2204189592Sbms 2205189592Sbms m->m_flags |= M_IGMPV2; 2206189592Sbms if (inm->inm_igi->igi_flags & IGIF_LOOPBACK) 2207189592Sbms m->m_flags |= M_IGMP_LOOP; 2208189592Sbms 2209189592Sbms CTR2(KTR_IGMPV3, "%s: netisr_dispatch(NETISR_IGMP, %p)", __func__, m); 2210189592Sbms netisr_dispatch(NETISR_IGMP, m); 2211189592Sbms 2212189592Sbms return (0); 2213189592Sbms} 2214189592Sbms 2215189592Sbms/* 2216189592Sbms * Process a state change from the upper layer for the given IPv4 group. 2217189592Sbms * 2218189592Sbms * Each socket holds a reference on the in_multi in its own ip_moptions. 2219189592Sbms * The socket layer will have made the necessary updates to.the group 2220189592Sbms * state, it is now up to IGMP to issue a state change report if there 2221189592Sbms * has been any change between T0 (when the last state-change was issued) 2222189592Sbms * and T1 (now). 2223189592Sbms * 2224189592Sbms * We use the IGMPv3 state machine at group level. The IGMP module 2225189592Sbms * however makes the decision as to which IGMP protocol version to speak. 2226189592Sbms * A state change *from* INCLUDE {} always means an initial join. 2227189592Sbms * A state change *to* INCLUDE {} always means a final leave. 2228189592Sbms * 2229189592Sbms * FUTURE: If IGIF_V3LITE is enabled for this interface, then we can 2230189592Sbms * save ourselves a bunch of work; any exclusive mode groups need not 2231189592Sbms * compute source filter lists. 2232189592Sbms * 2233189592Sbms * VIMAGE: curvnet should have been set by caller, as this routine 2234189592Sbms * is called from the socket option handlers. 2235189592Sbms */ 2236189592Sbmsint 2237189592Sbmsigmp_change_state(struct in_multi *inm) 2238189592Sbms{ 2239189592Sbms struct igmp_ifinfo *igi; 2240189592Sbms struct ifnet *ifp; 2241189592Sbms int error; 2242189592Sbms 2243189592Sbms IN_MULTI_LOCK_ASSERT(); 2244189592Sbms 2245189592Sbms error = 0; 2246189592Sbms 2247189592Sbms /* 2248189592Sbms * Try to detect if the upper layer just asked us to change state 2249189592Sbms * for an interface which has now gone away. 2250189592Sbms */ 2251189592Sbms KASSERT(inm->inm_ifma != NULL, ("%s: no ifma", __func__)); 2252189592Sbms ifp = inm->inm_ifma->ifma_ifp; 2253189592Sbms if (ifp != NULL) { 2254189592Sbms /* 2255189592Sbms * Sanity check that netinet's notion of ifp is the 2256189592Sbms * same as net's. 2257189592Sbms */ 2258189592Sbms KASSERT(inm->inm_ifp == ifp, ("%s: bad ifp", __func__)); 2259189592Sbms } 2260189592Sbms 2261189592Sbms IGMP_LOCK(); 2262189592Sbms 2263189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 2264189592Sbms KASSERT(igi != NULL, ("%s: no igmp_ifinfo for ifp %p", __func__, ifp)); 2265189592Sbms 2266189592Sbms /* 2267189592Sbms * If we detect a state transition to or from MCAST_UNDEFINED 2268189592Sbms * for this group, then we are starting or finishing an IGMP 2269189592Sbms * life cycle for this group. 2270189592Sbms */ 2271189592Sbms if (inm->inm_st[1].iss_fmode != inm->inm_st[0].iss_fmode) { 2272189592Sbms CTR3(KTR_IGMPV3, "%s: inm transition %d -> %d", __func__, 2273189592Sbms inm->inm_st[0].iss_fmode, inm->inm_st[1].iss_fmode); 2274189592Sbms if (inm->inm_st[0].iss_fmode == MCAST_UNDEFINED) { 2275189592Sbms CTR1(KTR_IGMPV3, "%s: initial join", __func__); 2276189592Sbms error = igmp_initial_join(inm, igi); 2277189592Sbms goto out_locked; 2278189592Sbms } else if (inm->inm_st[1].iss_fmode == MCAST_UNDEFINED) { 2279189592Sbms CTR1(KTR_IGMPV3, "%s: final leave", __func__); 2280189592Sbms igmp_final_leave(inm, igi); 2281189592Sbms goto out_locked; 2282189592Sbms } 2283189592Sbms } else { 2284189592Sbms CTR1(KTR_IGMPV3, "%s: filter set change", __func__); 2285189592Sbms } 2286189592Sbms 2287189592Sbms error = igmp_handle_state_change(inm, igi); 2288189592Sbms 2289189592Sbmsout_locked: 2290189592Sbms IGMP_UNLOCK(); 2291189592Sbms return (error); 2292189592Sbms} 2293189592Sbms 2294189592Sbms/* 2295189592Sbms * Perform the initial join for an IGMP group. 2296189592Sbms * 2297189592Sbms * When joining a group: 2298189592Sbms * If the group should have its IGMP traffic suppressed, do nothing. 2299189592Sbms * IGMPv1 starts sending IGMPv1 host membership reports. 2300189592Sbms * IGMPv2 starts sending IGMPv2 host membership reports. 2301189592Sbms * IGMPv3 will schedule an IGMPv3 state-change report containing the 2302189592Sbms * initial state of the membership. 2303189592Sbms */ 2304189592Sbmsstatic int 2305189592Sbmsigmp_initial_join(struct in_multi *inm, struct igmp_ifinfo *igi) 2306189592Sbms{ 2307189592Sbms struct ifnet *ifp; 2308189592Sbms struct ifqueue *ifq; 2309189592Sbms int error, retval, syncstates; 2310189592Sbms 2311189592Sbms CTR4(KTR_IGMPV3, "%s: initial join %s on ifp %p(%s)", 2312189592Sbms __func__, inet_ntoa(inm->inm_addr), inm->inm_ifp, 2313189592Sbms inm->inm_ifp->if_xname); 2314189592Sbms 2315189592Sbms error = 0; 2316189592Sbms syncstates = 1; 2317189592Sbms 2318189592Sbms ifp = inm->inm_ifp; 2319189592Sbms 2320189592Sbms IN_MULTI_LOCK_ASSERT(); 2321189592Sbms IGMP_LOCK_ASSERT(); 2322189592Sbms 2323189592Sbms KASSERT(igi && igi->igi_ifp == ifp, ("%s: inconsistent ifp", __func__)); 2324189592Sbms 2325189592Sbms /* 2326189592Sbms * Groups joined on loopback or marked as 'not reported', 2327189592Sbms * e.g. 224.0.0.1, enter the IGMP_SILENT_MEMBER state and 2328189592Sbms * are never reported in any IGMP protocol exchanges. 2329189592Sbms * All other groups enter the appropriate IGMP state machine 2330189592Sbms * for the version in use on this link. 2331189592Sbms * A link marked as IGIF_SILENT causes IGMP to be completely 2332189592Sbms * disabled for the link. 2333189592Sbms */ 2334189592Sbms if ((ifp->if_flags & IFF_LOOPBACK) || 2335189592Sbms (igi->igi_flags & IGIF_SILENT) || 2336189592Sbms !igmp_isgroupreported(inm->inm_addr)) { 2337189592Sbms CTR1(KTR_IGMPV3, 2338189592Sbms"%s: not kicking state machine for silent group", __func__); 2339189592Sbms inm->inm_state = IGMP_SILENT_MEMBER; 2340189592Sbms inm->inm_timer = 0; 2341189592Sbms } else { 2342189592Sbms /* 2343189592Sbms * Deal with overlapping in_multi lifecycle. 2344189592Sbms * If this group was LEAVING, then make sure 2345189592Sbms * we drop the reference we picked up to keep the 2346189592Sbms * group around for the final INCLUDE {} enqueue. 2347189592Sbms */ 2348189592Sbms if (igi->igi_version == IGMP_VERSION_3 && 2349189592Sbms inm->inm_state == IGMP_LEAVING_MEMBER) 2350189592Sbms inm_release_locked(inm); 2351189592Sbms 2352189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 2353189592Sbms 2354189592Sbms switch (igi->igi_version) { 2355189592Sbms case IGMP_VERSION_1: 2356189592Sbms case IGMP_VERSION_2: 2357189592Sbms inm->inm_state = IGMP_IDLE_MEMBER; 2358189592Sbms error = igmp_v1v2_queue_report(inm, 2359189592Sbms (igi->igi_version == IGMP_VERSION_2) ? 2360189592Sbms IGMP_v2_HOST_MEMBERSHIP_REPORT : 2361189592Sbms IGMP_v1_HOST_MEMBERSHIP_REPORT); 2362189592Sbms if (error == 0) { 2363189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY( 2364189592Sbms IGMP_V1V2_MAX_RI * PR_FASTHZ); 2365189592Sbms V_current_state_timers_running = 1; 2366189592Sbms } 2367189592Sbms break; 2368189592Sbms 2369189592Sbms case IGMP_VERSION_3: 2370189592Sbms /* 2371189592Sbms * Defer update of T0 to T1, until the first copy 2372189592Sbms * of the state change has been transmitted. 2373189592Sbms */ 2374189592Sbms syncstates = 0; 2375189592Sbms 2376189592Sbms /* 2377189592Sbms * Immediately enqueue a State-Change Report for 2378189592Sbms * this interface, freeing any previous reports. 2379189592Sbms * Don't kick the timers if there is nothing to do, 2380189592Sbms * or if an error occurred. 2381189592Sbms */ 2382189592Sbms ifq = &inm->inm_scq; 2383189592Sbms _IF_DRAIN(ifq); 2384189592Sbms retval = igmp_v3_enqueue_group_record(ifq, inm, 1, 2385189592Sbms 0, 0); 2386189592Sbms CTR2(KTR_IGMPV3, "%s: enqueue record = %d", 2387189592Sbms __func__, retval); 2388189592Sbms if (retval <= 0) { 2389189592Sbms error = retval * -1; 2390189592Sbms break; 2391189592Sbms } 2392189592Sbms 2393189592Sbms /* 2394189592Sbms * Schedule transmission of pending state-change 2395189592Sbms * report up to RV times for this link. The timer 2396189592Sbms * will fire at the next igmp_fasttimo (~200ms), 2397189592Sbms * giving us an opportunity to merge the reports. 2398189592Sbms */ 2399189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 2400189592Sbms inm->inm_scrv = 1; 2401189592Sbms } else { 2402189592Sbms KASSERT(igi->igi_rv > 1, 2403189592Sbms ("%s: invalid robustness %d", __func__, 2404189592Sbms igi->igi_rv)); 2405189592Sbms inm->inm_scrv = igi->igi_rv; 2406189592Sbms } 2407189592Sbms inm->inm_sctimer = 1; 2408189592Sbms V_state_change_timers_running = 1; 2409189592Sbms 2410189592Sbms error = 0; 2411189592Sbms break; 2412189592Sbms } 2413189592Sbms } 2414189592Sbms 2415189592Sbms /* 2416189592Sbms * Only update the T0 state if state change is atomic, 2417189592Sbms * i.e. we don't need to wait for a timer to fire before we 2418189592Sbms * can consider the state change to have been communicated. 2419189592Sbms */ 2420189592Sbms if (syncstates) { 2421189592Sbms inm_commit(inm); 2422189592Sbms CTR3(KTR_IGMPV3, "%s: T1 -> T0 for %s/%s", __func__, 2423189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 2424189592Sbms } 2425189592Sbms 2426189592Sbms return (error); 2427189592Sbms} 2428189592Sbms 2429189592Sbms/* 2430189592Sbms * Issue an intermediate state change during the IGMP life-cycle. 2431189592Sbms */ 2432189592Sbmsstatic int 2433189592Sbmsigmp_handle_state_change(struct in_multi *inm, struct igmp_ifinfo *igi) 2434189592Sbms{ 2435189592Sbms struct ifnet *ifp; 2436189592Sbms int retval; 2437189592Sbms 2438189592Sbms CTR4(KTR_IGMPV3, "%s: state change for %s on ifp %p(%s)", 2439189592Sbms __func__, inet_ntoa(inm->inm_addr), inm->inm_ifp, 2440189592Sbms inm->inm_ifp->if_xname); 2441189592Sbms 2442189592Sbms ifp = inm->inm_ifp; 2443189592Sbms 2444189592Sbms IN_MULTI_LOCK_ASSERT(); 2445189592Sbms IGMP_LOCK_ASSERT(); 2446189592Sbms 2447189592Sbms KASSERT(igi && igi->igi_ifp == ifp, ("%s: inconsistent ifp", __func__)); 2448189592Sbms 2449189592Sbms if ((ifp->if_flags & IFF_LOOPBACK) || 2450189592Sbms (igi->igi_flags & IGIF_SILENT) || 2451189592Sbms !igmp_isgroupreported(inm->inm_addr) || 2452189592Sbms (igi->igi_version != IGMP_VERSION_3)) { 2453189592Sbms if (!igmp_isgroupreported(inm->inm_addr)) { 2454189592Sbms CTR1(KTR_IGMPV3, 2455189592Sbms"%s: not kicking state machine for silent group", __func__); 2456189592Sbms } 2457189592Sbms CTR1(KTR_IGMPV3, "%s: nothing to do", __func__); 2458189592Sbms inm_commit(inm); 2459189592Sbms CTR3(KTR_IGMPV3, "%s: T1 -> T0 for %s/%s", __func__, 2460189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 2461189592Sbms return (0); 2462189592Sbms } 2463189592Sbms 2464189592Sbms _IF_DRAIN(&inm->inm_scq); 2465189592Sbms 2466189592Sbms retval = igmp_v3_enqueue_group_record(&inm->inm_scq, inm, 1, 0, 0); 2467189592Sbms CTR2(KTR_IGMPV3, "%s: enqueue record = %d", __func__, retval); 2468189592Sbms if (retval <= 0) 2469189592Sbms return (-retval); 2470189592Sbms 2471189592Sbms /* 2472189592Sbms * If record(s) were enqueued, start the state-change 2473189592Sbms * report timer for this group. 2474189592Sbms */ 2475189592Sbms inm->inm_scrv = ((igi->igi_flags & IGIF_LOOPBACK) ? 1 : igi->igi_rv); 2476189592Sbms inm->inm_sctimer = 1; 2477189592Sbms V_state_change_timers_running = 1; 2478189592Sbms 2479189592Sbms return (0); 2480189592Sbms} 2481189592Sbms 2482189592Sbms/* 2483189592Sbms * Perform the final leave for an IGMP group. 2484189592Sbms * 2485189592Sbms * When leaving a group: 2486189592Sbms * IGMPv1 does nothing. 2487189592Sbms * IGMPv2 sends a host leave message, if and only if we are the reporter. 2488189592Sbms * IGMPv3 enqueues a state-change report containing a transition 2489189592Sbms * to INCLUDE {} for immediate transmission. 2490189592Sbms */ 2491189592Sbmsstatic void 2492189592Sbmsigmp_final_leave(struct in_multi *inm, struct igmp_ifinfo *igi) 2493189592Sbms{ 2494189592Sbms int syncstates; 2495189592Sbms 2496189592Sbms syncstates = 1; 2497189592Sbms 2498189592Sbms CTR4(KTR_IGMPV3, "%s: final leave %s on ifp %p(%s)", 2499189592Sbms __func__, inet_ntoa(inm->inm_addr), inm->inm_ifp, 2500189592Sbms inm->inm_ifp->if_xname); 2501189592Sbms 2502189592Sbms IN_MULTI_LOCK_ASSERT(); 2503189592Sbms IGMP_LOCK_ASSERT(); 2504189592Sbms 2505189592Sbms switch (inm->inm_state) { 2506189592Sbms case IGMP_NOT_MEMBER: 2507189592Sbms case IGMP_SILENT_MEMBER: 2508189592Sbms case IGMP_LEAVING_MEMBER: 2509189592Sbms /* Already leaving or left; do nothing. */ 2510189592Sbms CTR1(KTR_IGMPV3, 2511189592Sbms"%s: not kicking state machine for silent group", __func__); 2512189592Sbms break; 2513189592Sbms case IGMP_REPORTING_MEMBER: 2514189592Sbms case IGMP_IDLE_MEMBER: 2515189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 2516189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 2517189592Sbms if (igi->igi_version == IGMP_VERSION_2) { 2518189592Sbms#ifdef INVARIANTS 2519189592Sbms if (inm->inm_state == IGMP_G_QUERY_PENDING_MEMBER || 2520189592Sbms inm->inm_state == IGMP_SG_QUERY_PENDING_MEMBER) 2521189592Sbms panic("%s: IGMPv3 state reached, not IGMPv3 mode", 2522189592Sbms __func__); 2523189592Sbms#endif 2524189592Sbms igmp_v1v2_queue_report(inm, IGMP_HOST_LEAVE_MESSAGE); 2525189592Sbms inm->inm_state = IGMP_NOT_MEMBER; 2526189592Sbms } else if (igi->igi_version == IGMP_VERSION_3) { 2527189592Sbms /* 2528189592Sbms * Stop group timer and all pending reports. 2529189592Sbms * Immediately enqueue a state-change report 2530189592Sbms * TO_IN {} to be sent on the next fast timeout, 2531189592Sbms * giving us an opportunity to merge reports. 2532189592Sbms */ 2533189592Sbms _IF_DRAIN(&inm->inm_scq); 2534189592Sbms inm->inm_timer = 0; 2535189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 2536189592Sbms inm->inm_scrv = 1; 2537189592Sbms } else { 2538189592Sbms inm->inm_scrv = igi->igi_rv; 2539189592Sbms } 2540189592Sbms CTR4(KTR_IGMPV3, "%s: Leaving %s/%s with %d " 2541189592Sbms "pending retransmissions.", __func__, 2542189592Sbms inet_ntoa(inm->inm_addr), 2543189592Sbms inm->inm_ifp->if_xname, inm->inm_scrv); 2544189592Sbms if (inm->inm_scrv == 0) { 2545189592Sbms inm->inm_state = IGMP_NOT_MEMBER; 2546189592Sbms inm->inm_sctimer = 0; 2547189592Sbms } else { 2548189592Sbms int retval; 2549189592Sbms 2550189592Sbms inm_acquire_locked(inm); 2551189592Sbms 2552189592Sbms retval = igmp_v3_enqueue_group_record( 2553189592Sbms &inm->inm_scq, inm, 1, 0, 0); 2554189592Sbms KASSERT(retval != 0, 2555189592Sbms ("%s: enqueue record = %d", __func__, 2556189592Sbms retval)); 2557189592Sbms 2558189592Sbms inm->inm_state = IGMP_LEAVING_MEMBER; 2559189592Sbms inm->inm_sctimer = 1; 2560189592Sbms V_state_change_timers_running = 1; 2561189592Sbms syncstates = 0; 2562189592Sbms } 2563189592Sbms break; 2564189592Sbms } 2565189592Sbms break; 2566189592Sbms case IGMP_LAZY_MEMBER: 2567189592Sbms case IGMP_SLEEPING_MEMBER: 2568189592Sbms case IGMP_AWAKENING_MEMBER: 2569189592Sbms /* Our reports are suppressed; do nothing. */ 2570189592Sbms break; 2571189592Sbms } 2572189592Sbms 2573189592Sbms if (syncstates) { 2574189592Sbms inm_commit(inm); 2575189592Sbms CTR3(KTR_IGMPV3, "%s: T1 -> T0 for %s/%s", __func__, 2576189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 2577189592Sbms inm->inm_st[1].iss_fmode = MCAST_UNDEFINED; 2578189592Sbms CTR3(KTR_IGMPV3, "%s: T1 now MCAST_UNDEFINED for %s/%s", 2579189592Sbms __func__, inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 2580189592Sbms } 2581189592Sbms} 2582189592Sbms 2583189592Sbms/* 2584189592Sbms * Enqueue an IGMPv3 group record to the given output queue. 2585189592Sbms * 2586189592Sbms * XXX This function could do with having the allocation code 2587189592Sbms * split out, and the multiple-tree-walks coalesced into a single 2588189592Sbms * routine as has been done in igmp_v3_enqueue_filter_change(). 2589189592Sbms * 2590189592Sbms * If is_state_change is zero, a current-state record is appended. 2591189592Sbms * If is_state_change is non-zero, a state-change report is appended. 2592189592Sbms * 2593189592Sbms * If is_group_query is non-zero, an mbuf packet chain is allocated. 2594189592Sbms * If is_group_query is zero, and if there is a packet with free space 2595189592Sbms * at the tail of the queue, it will be appended to providing there 2596189592Sbms * is enough free space. 2597189592Sbms * Otherwise a new mbuf packet chain is allocated. 2598189592Sbms * 2599189592Sbms * If is_source_query is non-zero, each source is checked to see if 2600189592Sbms * it was recorded for a Group-Source query, and will be omitted if 2601189592Sbms * it is not both in-mode and recorded. 2602189592Sbms * 2603189592Sbms * The function will attempt to allocate leading space in the packet 2604189592Sbms * for the IP/IGMP header to be prepended without fragmenting the chain. 2605189592Sbms * 2606189592Sbms * If successful the size of all data appended to the queue is returned, 2607189592Sbms * otherwise an error code less than zero is returned, or zero if 2608189592Sbms * no record(s) were appended. 2609189592Sbms */ 2610189592Sbmsstatic int 2611189592Sbmsigmp_v3_enqueue_group_record(struct ifqueue *ifq, struct in_multi *inm, 2612189592Sbms const int is_state_change, const int is_group_query, 2613189592Sbms const int is_source_query) 2614189592Sbms{ 2615189592Sbms struct igmp_grouprec ig; 2616189592Sbms struct igmp_grouprec *pig; 2617189592Sbms struct ifnet *ifp; 2618189592Sbms struct ip_msource *ims, *nims; 2619189592Sbms struct mbuf *m0, *m, *md; 2620189592Sbms int error, is_filter_list_change; 2621189592Sbms int minrec0len, m0srcs, msrcs, nbytes, off; 2622189592Sbms int record_has_sources; 2623189592Sbms int now; 2624189592Sbms int type; 2625189592Sbms in_addr_t naddr; 2626189592Sbms uint8_t mode; 2627189592Sbms 2628189592Sbms IN_MULTI_LOCK_ASSERT(); 2629189592Sbms 2630189592Sbms error = 0; 2631189592Sbms ifp = inm->inm_ifp; 2632189592Sbms is_filter_list_change = 0; 2633189592Sbms m = NULL; 2634189592Sbms m0 = NULL; 2635189592Sbms m0srcs = 0; 2636189592Sbms msrcs = 0; 2637189592Sbms nbytes = 0; 2638189592Sbms nims = NULL; 2639189592Sbms record_has_sources = 1; 2640189592Sbms pig = NULL; 2641189592Sbms type = IGMP_DO_NOTHING; 2642189592Sbms mode = inm->inm_st[1].iss_fmode; 2643189592Sbms 2644189592Sbms /* 2645189592Sbms * If we did not transition out of ASM mode during t0->t1, 2646189592Sbms * and there are no source nodes to process, we can skip 2647189592Sbms * the generation of source records. 2648189592Sbms */ 2649189592Sbms if (inm->inm_st[0].iss_asm > 0 && inm->inm_st[1].iss_asm > 0 && 2650189592Sbms inm->inm_nsrc == 0) 2651189592Sbms record_has_sources = 0; 2652189592Sbms 2653189592Sbms if (is_state_change) { 2654189592Sbms /* 2655189592Sbms * Queue a state change record. 2656189592Sbms * If the mode did not change, and there are non-ASM 2657189592Sbms * listeners or source filters present, 2658189592Sbms * we potentially need to issue two records for the group. 2659189592Sbms * If we are transitioning to MCAST_UNDEFINED, we need 2660189592Sbms * not send any sources. 2661189592Sbms * If there are ASM listeners, and there was no filter 2662189592Sbms * mode transition of any kind, do nothing. 2663189592Sbms */ 2664189592Sbms if (mode != inm->inm_st[0].iss_fmode) { 2665189592Sbms if (mode == MCAST_EXCLUDE) { 2666189592Sbms CTR1(KTR_IGMPV3, "%s: change to EXCLUDE", 2667189592Sbms __func__); 2668189592Sbms type = IGMP_CHANGE_TO_EXCLUDE_MODE; 2669189592Sbms } else { 2670189592Sbms CTR1(KTR_IGMPV3, "%s: change to INCLUDE", 2671189592Sbms __func__); 2672189592Sbms type = IGMP_CHANGE_TO_INCLUDE_MODE; 2673189592Sbms if (mode == MCAST_UNDEFINED) 2674189592Sbms record_has_sources = 0; 2675189592Sbms } 2676189592Sbms } else { 2677189592Sbms if (record_has_sources) { 2678189592Sbms is_filter_list_change = 1; 2679189592Sbms } else { 2680189592Sbms type = IGMP_DO_NOTHING; 2681189592Sbms } 2682189592Sbms } 2683189592Sbms } else { 2684189592Sbms /* 2685189592Sbms * Queue a current state record. 2686189592Sbms */ 2687189592Sbms if (mode == MCAST_EXCLUDE) { 2688189592Sbms type = IGMP_MODE_IS_EXCLUDE; 2689189592Sbms } else if (mode == MCAST_INCLUDE) { 2690189592Sbms type = IGMP_MODE_IS_INCLUDE; 2691189592Sbms KASSERT(inm->inm_st[1].iss_asm == 0, 2692189592Sbms ("%s: inm %p is INCLUDE but ASM count is %d", 2693189592Sbms __func__, inm, inm->inm_st[1].iss_asm)); 2694189592Sbms } 2695189592Sbms } 2696189592Sbms 2697189592Sbms /* 2698189592Sbms * Generate the filter list changes using a separate function. 2699189592Sbms */ 2700189592Sbms if (is_filter_list_change) 2701189592Sbms return (igmp_v3_enqueue_filter_change(ifq, inm)); 2702189592Sbms 2703189592Sbms if (type == IGMP_DO_NOTHING) { 2704189592Sbms CTR3(KTR_IGMPV3, "%s: nothing to do for %s/%s", 2705189592Sbms __func__, inet_ntoa(inm->inm_addr), 2706189592Sbms inm->inm_ifp->if_xname); 2707189592Sbms return (0); 2708189592Sbms } 2709189592Sbms 2710189592Sbms /* 2711189592Sbms * If any sources are present, we must be able to fit at least 2712189592Sbms * one in the trailing space of the tail packet's mbuf, 2713189592Sbms * ideally more. 2714189592Sbms */ 2715189592Sbms minrec0len = sizeof(struct igmp_grouprec); 2716189592Sbms if (record_has_sources) 2717189592Sbms minrec0len += sizeof(in_addr_t); 2718189592Sbms 2719189592Sbms CTR4(KTR_IGMPV3, "%s: queueing %s for %s/%s", __func__, 2720189592Sbms igmp_rec_type_to_str(type), inet_ntoa(inm->inm_addr), 2721189592Sbms inm->inm_ifp->if_xname); 2722189592Sbms 2723189592Sbms /* 2724189592Sbms * Check if we have a packet in the tail of the queue for this 2725189592Sbms * group into which the first group record for this group will fit. 2726189592Sbms * Otherwise allocate a new packet. 2727189592Sbms * Always allocate leading space for IP+RA_OPT+IGMP+REPORT. 2728189592Sbms * Note: Group records for G/GSR query responses MUST be sent 2729189592Sbms * in their own packet. 2730189592Sbms */ 2731189592Sbms m0 = ifq->ifq_tail; 2732189592Sbms if (!is_group_query && 2733189592Sbms m0 != NULL && 2734189592Sbms (m0->m_pkthdr.PH_vt.vt_nrecs + 1 <= IGMP_V3_REPORT_MAXRECS) && 2735189592Sbms (m0->m_pkthdr.len + minrec0len) < 2736189592Sbms (ifp->if_mtu - IGMP_LEADINGSPACE)) { 2737189592Sbms m0srcs = (ifp->if_mtu - m0->m_pkthdr.len - 2738189592Sbms sizeof(struct igmp_grouprec)) / sizeof(in_addr_t); 2739189592Sbms m = m0; 2740189592Sbms CTR1(KTR_IGMPV3, "%s: use existing packet", __func__); 2741189592Sbms } else { 2742189592Sbms if (_IF_QFULL(ifq)) { 2743189592Sbms CTR1(KTR_IGMPV3, "%s: outbound queue full", __func__); 2744189592Sbms return (-ENOMEM); 2745189592Sbms } 2746189592Sbms m = NULL; 2747189592Sbms m0srcs = (ifp->if_mtu - IGMP_LEADINGSPACE - 2748189592Sbms sizeof(struct igmp_grouprec)) / sizeof(in_addr_t); 2749190692Sbms if (!is_state_change && !is_group_query) { 2750189592Sbms m = m_getcl(M_DONTWAIT, MT_DATA, M_PKTHDR); 2751190692Sbms if (m) 2752190692Sbms m->m_data += IGMP_LEADINGSPACE; 2753190692Sbms } 2754189592Sbms if (m == NULL) { 2755189592Sbms m = m_gethdr(M_DONTWAIT, MT_DATA); 2756189592Sbms if (m) 2757189592Sbms MH_ALIGN(m, IGMP_LEADINGSPACE); 2758189592Sbms } 2759189592Sbms if (m == NULL) 2760189592Sbms return (-ENOMEM); 2761189592Sbms 2762189592Sbms igmp_save_context(m, ifp); 2763189592Sbms 2764189592Sbms CTR1(KTR_IGMPV3, "%s: allocated first packet", __func__); 2765189592Sbms } 2766189592Sbms 2767189592Sbms /* 2768189592Sbms * Append group record. 2769189592Sbms * If we have sources, we don't know how many yet. 2770189592Sbms */ 2771189592Sbms ig.ig_type = type; 2772189592Sbms ig.ig_datalen = 0; 2773189592Sbms ig.ig_numsrc = 0; 2774189592Sbms ig.ig_group = inm->inm_addr; 2775189592Sbms if (!m_append(m, sizeof(struct igmp_grouprec), (void *)&ig)) { 2776189592Sbms if (m != m0) 2777189592Sbms m_freem(m); 2778189592Sbms CTR1(KTR_IGMPV3, "%s: m_append() failed.", __func__); 2779189592Sbms return (-ENOMEM); 2780189592Sbms } 2781189592Sbms nbytes += sizeof(struct igmp_grouprec); 2782189592Sbms 2783189592Sbms /* 2784189592Sbms * Append as many sources as will fit in the first packet. 2785189592Sbms * If we are appending to a new packet, the chain allocation 2786189592Sbms * may potentially use clusters; use m_getptr() in this case. 2787189592Sbms * If we are appending to an existing packet, we need to obtain 2788189592Sbms * a pointer to the group record after m_append(), in case a new 2789189592Sbms * mbuf was allocated. 2790189592Sbms * Only append sources which are in-mode at t1. If we are 2791189592Sbms * transitioning to MCAST_UNDEFINED state on the group, do not 2792189592Sbms * include source entries. 2793189592Sbms * Only report recorded sources in our filter set when responding 2794189592Sbms * to a group-source query. 2795189592Sbms */ 2796189592Sbms if (record_has_sources) { 2797189592Sbms if (m == m0) { 2798189592Sbms md = m_last(m); 2799189592Sbms pig = (struct igmp_grouprec *)(mtod(md, uint8_t *) + 2800189592Sbms md->m_len - nbytes); 2801189592Sbms } else { 2802189592Sbms md = m_getptr(m, 0, &off); 2803189592Sbms pig = (struct igmp_grouprec *)(mtod(md, uint8_t *) + 2804189592Sbms off); 2805189592Sbms } 2806189592Sbms msrcs = 0; 2807189592Sbms RB_FOREACH_SAFE(ims, ip_msource_tree, &inm->inm_srcs, nims) { 2808189592Sbms CTR2(KTR_IGMPV3, "%s: visit node %s", __func__, 2809189592Sbms inet_ntoa_haddr(ims->ims_haddr)); 2810189592Sbms now = ims_get_mode(inm, ims, 1); 2811189592Sbms CTR2(KTR_IGMPV3, "%s: node is %d", __func__, now); 2812189592Sbms if ((now != mode) || 2813189592Sbms (now == mode && mode == MCAST_UNDEFINED)) { 2814189592Sbms CTR1(KTR_IGMPV3, "%s: skip node", __func__); 2815189592Sbms continue; 2816189592Sbms } 2817189592Sbms if (is_source_query && ims->ims_stp == 0) { 2818189592Sbms CTR1(KTR_IGMPV3, "%s: skip unrecorded node", 2819189592Sbms __func__); 2820189592Sbms continue; 2821189592Sbms } 2822189592Sbms CTR1(KTR_IGMPV3, "%s: append node", __func__); 2823189592Sbms naddr = htonl(ims->ims_haddr); 2824189592Sbms if (!m_append(m, sizeof(in_addr_t), (void *)&naddr)) { 2825189592Sbms if (m != m0) 2826189592Sbms m_freem(m); 2827189592Sbms CTR1(KTR_IGMPV3, "%s: m_append() failed.", 2828189592Sbms __func__); 2829189592Sbms return (-ENOMEM); 2830189592Sbms } 2831189592Sbms nbytes += sizeof(in_addr_t); 2832189592Sbms ++msrcs; 2833189592Sbms if (msrcs == m0srcs) 2834189592Sbms break; 2835189592Sbms } 2836189592Sbms CTR2(KTR_IGMPV3, "%s: msrcs is %d this packet", __func__, 2837189592Sbms msrcs); 2838189592Sbms pig->ig_numsrc = htons(msrcs); 2839189592Sbms nbytes += (msrcs * sizeof(in_addr_t)); 2840189592Sbms } 2841189592Sbms 2842189592Sbms if (is_source_query && msrcs == 0) { 2843189592Sbms CTR1(KTR_IGMPV3, "%s: no recorded sources to report", __func__); 2844189592Sbms if (m != m0) 2845189592Sbms m_freem(m); 2846189592Sbms return (0); 2847189592Sbms } 2848189592Sbms 2849189592Sbms /* 2850189592Sbms * We are good to go with first packet. 2851189592Sbms */ 2852189592Sbms if (m != m0) { 2853189592Sbms CTR1(KTR_IGMPV3, "%s: enqueueing first packet", __func__); 2854189592Sbms m->m_pkthdr.PH_vt.vt_nrecs = 1; 2855189592Sbms _IF_ENQUEUE(ifq, m); 2856189592Sbms } else 2857189592Sbms m->m_pkthdr.PH_vt.vt_nrecs++; 2858189592Sbms 2859189592Sbms /* 2860189592Sbms * No further work needed if no source list in packet(s). 2861189592Sbms */ 2862189592Sbms if (!record_has_sources) 2863189592Sbms return (nbytes); 2864189592Sbms 2865189592Sbms /* 2866189592Sbms * Whilst sources remain to be announced, we need to allocate 2867189592Sbms * a new packet and fill out as many sources as will fit. 2868189592Sbms * Always try for a cluster first. 2869189592Sbms */ 2870189592Sbms while (nims != NULL) { 2871189592Sbms if (_IF_QFULL(ifq)) { 2872189592Sbms CTR1(KTR_IGMPV3, "%s: outbound queue full", __func__); 2873189592Sbms return (-ENOMEM); 2874189592Sbms } 2875189592Sbms m = m_getcl(M_DONTWAIT, MT_DATA, M_PKTHDR); 2876190692Sbms if (m) 2877190692Sbms m->m_data += IGMP_LEADINGSPACE; 2878189592Sbms if (m == NULL) { 2879189592Sbms m = m_gethdr(M_DONTWAIT, MT_DATA); 2880189592Sbms if (m) 2881189592Sbms MH_ALIGN(m, IGMP_LEADINGSPACE); 2882189592Sbms } 2883189592Sbms if (m == NULL) 2884189592Sbms return (-ENOMEM); 2885189592Sbms igmp_save_context(m, ifp); 2886189592Sbms md = m_getptr(m, 0, &off); 2887189592Sbms pig = (struct igmp_grouprec *)(mtod(md, uint8_t *) + off); 2888189592Sbms CTR1(KTR_IGMPV3, "%s: allocated next packet", __func__); 2889189592Sbms 2890189592Sbms if (!m_append(m, sizeof(struct igmp_grouprec), (void *)&ig)) { 2891189592Sbms if (m != m0) 2892189592Sbms m_freem(m); 2893189592Sbms CTR1(KTR_IGMPV3, "%s: m_append() failed.", __func__); 2894189592Sbms return (-ENOMEM); 2895189592Sbms } 2896189592Sbms m->m_pkthdr.PH_vt.vt_nrecs = 1; 2897189592Sbms nbytes += sizeof(struct igmp_grouprec); 2898189592Sbms 2899189592Sbms m0srcs = (ifp->if_mtu - IGMP_LEADINGSPACE - 2900189592Sbms sizeof(struct igmp_grouprec)) / sizeof(in_addr_t); 2901189592Sbms 2902189592Sbms msrcs = 0; 2903189592Sbms RB_FOREACH_FROM(ims, ip_msource_tree, nims) { 2904189592Sbms CTR2(KTR_IGMPV3, "%s: visit node %s", __func__, 2905189592Sbms inet_ntoa_haddr(ims->ims_haddr)); 2906189592Sbms now = ims_get_mode(inm, ims, 1); 2907189592Sbms if ((now != mode) || 2908189592Sbms (now == mode && mode == MCAST_UNDEFINED)) { 2909189592Sbms CTR1(KTR_IGMPV3, "%s: skip node", __func__); 2910189592Sbms continue; 2911189592Sbms } 2912189592Sbms if (is_source_query && ims->ims_stp == 0) { 2913189592Sbms CTR1(KTR_IGMPV3, "%s: skip unrecorded node", 2914189592Sbms __func__); 2915189592Sbms continue; 2916189592Sbms } 2917189592Sbms CTR1(KTR_IGMPV3, "%s: append node", __func__); 2918189592Sbms naddr = htonl(ims->ims_haddr); 2919189592Sbms if (!m_append(m, sizeof(in_addr_t), (void *)&naddr)) { 2920189592Sbms if (m != m0) 2921189592Sbms m_freem(m); 2922189592Sbms CTR1(KTR_IGMPV3, "%s: m_append() failed.", 2923189592Sbms __func__); 2924189592Sbms return (-ENOMEM); 2925189592Sbms } 2926189592Sbms ++msrcs; 2927189592Sbms if (msrcs == m0srcs) 2928189592Sbms break; 2929189592Sbms } 2930189592Sbms pig->ig_numsrc = htons(msrcs); 2931189592Sbms nbytes += (msrcs * sizeof(in_addr_t)); 2932189592Sbms 2933189592Sbms CTR1(KTR_IGMPV3, "%s: enqueueing next packet", __func__); 2934189592Sbms _IF_ENQUEUE(ifq, m); 2935189592Sbms } 2936189592Sbms 2937189592Sbms return (nbytes); 2938189592Sbms} 2939189592Sbms 2940189592Sbms/* 2941189592Sbms * Type used to mark record pass completion. 2942189592Sbms * We exploit the fact we can cast to this easily from the 2943189592Sbms * current filter modes on each ip_msource node. 2944189592Sbms */ 2945189592Sbmstypedef enum { 2946189592Sbms REC_NONE = 0x00, /* MCAST_UNDEFINED */ 2947189592Sbms REC_ALLOW = 0x01, /* MCAST_INCLUDE */ 2948189592Sbms REC_BLOCK = 0x02, /* MCAST_EXCLUDE */ 2949189592Sbms REC_FULL = REC_ALLOW | REC_BLOCK 2950189592Sbms} rectype_t; 2951189592Sbms 2952189592Sbms/* 2953189592Sbms * Enqueue an IGMPv3 filter list change to the given output queue. 2954189592Sbms * 2955189592Sbms * Source list filter state is held in an RB-tree. When the filter list 2956189592Sbms * for a group is changed without changing its mode, we need to compute 2957189592Sbms * the deltas between T0 and T1 for each source in the filter set, 2958189592Sbms * and enqueue the appropriate ALLOW_NEW/BLOCK_OLD records. 2959189592Sbms * 2960189592Sbms * As we may potentially queue two record types, and the entire R-B tree 2961189592Sbms * needs to be walked at once, we break this out into its own function 2962189592Sbms * so we can generate a tightly packed queue of packets. 2963189592Sbms * 2964189592Sbms * XXX This could be written to only use one tree walk, although that makes 2965189592Sbms * serializing into the mbuf chains a bit harder. For now we do two walks 2966189592Sbms * which makes things easier on us, and it may or may not be harder on 2967189592Sbms * the L2 cache. 2968189592Sbms * 2969189592Sbms * If successful the size of all data appended to the queue is returned, 2970189592Sbms * otherwise an error code less than zero is returned, or zero if 2971189592Sbms * no record(s) were appended. 2972189592Sbms */ 2973189592Sbmsstatic int 2974189592Sbmsigmp_v3_enqueue_filter_change(struct ifqueue *ifq, struct in_multi *inm) 2975189592Sbms{ 2976189592Sbms static const int MINRECLEN = 2977189592Sbms sizeof(struct igmp_grouprec) + sizeof(in_addr_t); 2978189592Sbms struct ifnet *ifp; 2979189592Sbms struct igmp_grouprec ig; 2980189592Sbms struct igmp_grouprec *pig; 2981189592Sbms struct ip_msource *ims, *nims; 2982189592Sbms struct mbuf *m, *m0, *md; 2983189592Sbms in_addr_t naddr; 2984189592Sbms int m0srcs, nbytes, off, rsrcs, schanged; 2985189592Sbms int nallow, nblock; 2986189592Sbms uint8_t mode, now, then; 2987189592Sbms rectype_t crt, drt, nrt; 2988189592Sbms 2989189592Sbms IN_MULTI_LOCK_ASSERT(); 2990189592Sbms 2991189592Sbms if (inm->inm_nsrc == 0 || 2992189592Sbms (inm->inm_st[0].iss_asm > 0 && inm->inm_st[1].iss_asm > 0)) 2993189592Sbms return (0); 2994189592Sbms 2995189592Sbms ifp = inm->inm_ifp; /* interface */ 2996189592Sbms mode = inm->inm_st[1].iss_fmode; /* filter mode at t1 */ 2997189592Sbms crt = REC_NONE; /* current group record type */ 2998189592Sbms drt = REC_NONE; /* mask of completed group record types */ 2999189592Sbms nrt = REC_NONE; /* record type for current node */ 3000189592Sbms m0srcs = 0; /* # source which will fit in current mbuf chain */ 3001189592Sbms nbytes = 0; /* # of bytes appended to group's state-change queue */ 3002189592Sbms rsrcs = 0; /* # sources encoded in current record */ 3003189592Sbms schanged = 0; /* # nodes encoded in overall filter change */ 3004189592Sbms nallow = 0; /* # of source entries in ALLOW_NEW */ 3005189592Sbms nblock = 0; /* # of source entries in BLOCK_OLD */ 3006189592Sbms nims = NULL; /* next tree node pointer */ 3007189592Sbms 3008189592Sbms /* 3009189592Sbms * For each possible filter record mode. 3010189592Sbms * The first kind of source we encounter tells us which 3011189592Sbms * is the first kind of record we start appending. 3012189592Sbms * If a node transitioned to UNDEFINED at t1, its mode is treated 3013189592Sbms * as the inverse of the group's filter mode. 3014189592Sbms */ 3015189592Sbms while (drt != REC_FULL) { 3016189592Sbms do { 3017189592Sbms m0 = ifq->ifq_tail; 3018189592Sbms if (m0 != NULL && 3019189592Sbms (m0->m_pkthdr.PH_vt.vt_nrecs + 1 <= 3020189592Sbms IGMP_V3_REPORT_MAXRECS) && 3021189592Sbms (m0->m_pkthdr.len + MINRECLEN) < 3022189592Sbms (ifp->if_mtu - IGMP_LEADINGSPACE)) { 3023189592Sbms m = m0; 3024189592Sbms m0srcs = (ifp->if_mtu - m0->m_pkthdr.len - 3025189592Sbms sizeof(struct igmp_grouprec)) / 3026189592Sbms sizeof(in_addr_t); 3027189592Sbms CTR1(KTR_IGMPV3, 3028189592Sbms "%s: use previous packet", __func__); 3029189592Sbms } else { 3030189592Sbms m = m_getcl(M_DONTWAIT, MT_DATA, M_PKTHDR); 3031190692Sbms if (m) 3032190692Sbms m->m_data += IGMP_LEADINGSPACE; 3033189592Sbms if (m == NULL) { 3034189592Sbms m = m_gethdr(M_DONTWAIT, MT_DATA); 3035189592Sbms if (m) 3036189592Sbms MH_ALIGN(m, IGMP_LEADINGSPACE); 3037189592Sbms } 3038189592Sbms if (m == NULL) { 3039189592Sbms CTR1(KTR_IGMPV3, 3040189592Sbms "%s: m_get*() failed", __func__); 3041189592Sbms return (-ENOMEM); 3042189592Sbms } 3043189592Sbms m->m_pkthdr.PH_vt.vt_nrecs = 0; 3044189592Sbms igmp_save_context(m, ifp); 3045189592Sbms m0srcs = (ifp->if_mtu - IGMP_LEADINGSPACE - 3046189592Sbms sizeof(struct igmp_grouprec)) / 3047189592Sbms sizeof(in_addr_t); 3048189592Sbms CTR1(KTR_IGMPV3, 3049189592Sbms "%s: allocated new packet", __func__); 3050189592Sbms } 3051189592Sbms /* 3052189592Sbms * Append the IGMP group record header to the 3053189592Sbms * current packet's data area. 3054189592Sbms * Recalculate pointer to free space for next 3055189592Sbms * group record, in case m_append() allocated 3056189592Sbms * a new mbuf or cluster. 3057189592Sbms */ 3058189592Sbms memset(&ig, 0, sizeof(ig)); 3059189592Sbms ig.ig_group = inm->inm_addr; 3060189592Sbms if (!m_append(m, sizeof(ig), (void *)&ig)) { 3061189592Sbms if (m != m0) 3062189592Sbms m_freem(m); 3063189592Sbms CTR1(KTR_IGMPV3, 3064189592Sbms "%s: m_append() failed", __func__); 3065189592Sbms return (-ENOMEM); 3066189592Sbms } 3067189592Sbms nbytes += sizeof(struct igmp_grouprec); 3068189592Sbms if (m == m0) { 3069189592Sbms md = m_last(m); 3070189592Sbms pig = (struct igmp_grouprec *)(mtod(md, 3071189592Sbms uint8_t *) + md->m_len - nbytes); 3072189592Sbms } else { 3073189592Sbms md = m_getptr(m, 0, &off); 3074189592Sbms pig = (struct igmp_grouprec *)(mtod(md, 3075189592Sbms uint8_t *) + off); 3076189592Sbms } 3077189592Sbms /* 3078189592Sbms * Begin walking the tree for this record type 3079189592Sbms * pass, or continue from where we left off 3080189592Sbms * previously if we had to allocate a new packet. 3081189592Sbms * Only report deltas in-mode at t1. 3082189592Sbms * We need not report included sources as allowed 3083189592Sbms * if we are in inclusive mode on the group, 3084189592Sbms * however the converse is not true. 3085189592Sbms */ 3086189592Sbms rsrcs = 0; 3087189592Sbms if (nims == NULL) 3088189592Sbms nims = RB_MIN(ip_msource_tree, &inm->inm_srcs); 3089189592Sbms RB_FOREACH_FROM(ims, ip_msource_tree, nims) { 3090189592Sbms CTR2(KTR_IGMPV3, "%s: visit node %s", 3091189592Sbms __func__, inet_ntoa_haddr(ims->ims_haddr)); 3092189592Sbms now = ims_get_mode(inm, ims, 1); 3093189592Sbms then = ims_get_mode(inm, ims, 0); 3094189592Sbms CTR3(KTR_IGMPV3, "%s: mode: t0 %d, t1 %d", 3095189592Sbms __func__, then, now); 3096189592Sbms if (now == then) { 3097189592Sbms CTR1(KTR_IGMPV3, 3098189592Sbms "%s: skip unchanged", __func__); 3099189592Sbms continue; 3100189592Sbms } 3101189592Sbms if (mode == MCAST_EXCLUDE && 3102189592Sbms now == MCAST_INCLUDE) { 3103189592Sbms CTR1(KTR_IGMPV3, 3104189592Sbms "%s: skip IN src on EX group", 3105189592Sbms __func__); 3106189592Sbms continue; 3107189592Sbms } 3108189592Sbms nrt = (rectype_t)now; 3109189592Sbms if (nrt == REC_NONE) 3110189592Sbms nrt = (rectype_t)(~mode & REC_FULL); 3111189592Sbms if (schanged++ == 0) { 3112189592Sbms crt = nrt; 3113189592Sbms } else if (crt != nrt) 3114189592Sbms continue; 3115189592Sbms naddr = htonl(ims->ims_haddr); 3116189592Sbms if (!m_append(m, sizeof(in_addr_t), 3117189592Sbms (void *)&naddr)) { 3118189592Sbms if (m != m0) 3119189592Sbms m_freem(m); 3120189592Sbms CTR1(KTR_IGMPV3, 3121189592Sbms "%s: m_append() failed", __func__); 3122189592Sbms return (-ENOMEM); 3123189592Sbms } 3124189592Sbms nallow += !!(crt == REC_ALLOW); 3125189592Sbms nblock += !!(crt == REC_BLOCK); 3126189592Sbms if (++rsrcs == m0srcs) 3127189592Sbms break; 3128189592Sbms } 3129189592Sbms /* 3130189592Sbms * If we did not append any tree nodes on this 3131189592Sbms * pass, back out of allocations. 3132189592Sbms */ 3133189592Sbms if (rsrcs == 0) { 3134189592Sbms nbytes -= sizeof(struct igmp_grouprec); 3135189592Sbms if (m != m0) { 3136189592Sbms CTR1(KTR_IGMPV3, 3137189592Sbms "%s: m_free(m)", __func__); 3138189592Sbms m_freem(m); 3139189592Sbms } else { 3140189592Sbms CTR1(KTR_IGMPV3, 3141189592Sbms "%s: m_adj(m, -ig)", __func__); 3142189592Sbms m_adj(m, -((int)sizeof( 3143189592Sbms struct igmp_grouprec))); 3144189592Sbms } 3145189592Sbms continue; 3146189592Sbms } 3147189592Sbms nbytes += (rsrcs * sizeof(in_addr_t)); 3148189592Sbms if (crt == REC_ALLOW) 3149189592Sbms pig->ig_type = IGMP_ALLOW_NEW_SOURCES; 3150189592Sbms else if (crt == REC_BLOCK) 3151189592Sbms pig->ig_type = IGMP_BLOCK_OLD_SOURCES; 3152189592Sbms pig->ig_numsrc = htons(rsrcs); 3153189592Sbms /* 3154189592Sbms * Count the new group record, and enqueue this 3155189592Sbms * packet if it wasn't already queued. 3156189592Sbms */ 3157189592Sbms m->m_pkthdr.PH_vt.vt_nrecs++; 3158189592Sbms if (m != m0) 3159189592Sbms _IF_ENQUEUE(ifq, m); 3160189592Sbms } while (nims != NULL); 3161189592Sbms drt |= crt; 3162189592Sbms crt = (~crt & REC_FULL); 3163189592Sbms } 3164189592Sbms 3165189592Sbms CTR3(KTR_IGMPV3, "%s: queued %d ALLOW_NEW, %d BLOCK_OLD", __func__, 3166189592Sbms nallow, nblock); 3167189592Sbms 3168189592Sbms return (nbytes); 3169189592Sbms} 3170189592Sbms 3171189592Sbmsstatic int 3172189592Sbmsigmp_v3_merge_state_changes(struct in_multi *inm, struct ifqueue *ifscq) 3173189592Sbms{ 3174189592Sbms struct ifqueue *gq; 3175189592Sbms struct mbuf *m; /* pending state-change */ 3176189592Sbms struct mbuf *m0; /* copy of pending state-change */ 3177189592Sbms struct mbuf *mt; /* last state-change in packet */ 3178189592Sbms int docopy, domerge; 3179189592Sbms u_int recslen; 3180189592Sbms 3181189592Sbms docopy = 0; 3182189592Sbms domerge = 0; 3183189592Sbms recslen = 0; 3184189592Sbms 3185189592Sbms IN_MULTI_LOCK_ASSERT(); 3186189592Sbms IGMP_LOCK_ASSERT(); 3187189592Sbms 3188189592Sbms /* 3189189592Sbms * If there are further pending retransmissions, make a writable 3190189592Sbms * copy of each queued state-change message before merging. 3191189592Sbms */ 3192189592Sbms if (inm->inm_scrv > 0) 3193189592Sbms docopy = 1; 3194189592Sbms 3195189592Sbms gq = &inm->inm_scq; 3196189592Sbms#ifdef KTR 3197189592Sbms if (gq->ifq_head == NULL) { 3198189592Sbms CTR2(KTR_IGMPV3, "%s: WARNING: queue for inm %p is empty", 3199189592Sbms __func__, inm); 3200189592Sbms } 3201189592Sbms#endif 3202189592Sbms 3203189592Sbms m = gq->ifq_head; 3204189592Sbms while (m != NULL) { 3205189592Sbms /* 3206189592Sbms * Only merge the report into the current packet if 3207189592Sbms * there is sufficient space to do so; an IGMPv3 report 3208189592Sbms * packet may only contain 65,535 group records. 3209189592Sbms * Always use a simple mbuf chain concatentation to do this, 3210189592Sbms * as large state changes for single groups may have 3211189592Sbms * allocated clusters. 3212189592Sbms */ 3213189592Sbms domerge = 0; 3214189592Sbms mt = ifscq->ifq_tail; 3215189592Sbms if (mt != NULL) { 3216189592Sbms recslen = m_length(m, NULL); 3217189592Sbms 3218189592Sbms if ((mt->m_pkthdr.PH_vt.vt_nrecs + 3219189592Sbms m->m_pkthdr.PH_vt.vt_nrecs <= 3220189592Sbms IGMP_V3_REPORT_MAXRECS) && 3221189592Sbms (mt->m_pkthdr.len + recslen <= 3222189592Sbms (inm->inm_ifp->if_mtu - IGMP_LEADINGSPACE))) 3223189592Sbms domerge = 1; 3224189592Sbms } 3225189592Sbms 3226189592Sbms if (!domerge && _IF_QFULL(gq)) { 3227189592Sbms CTR2(KTR_IGMPV3, 3228189592Sbms "%s: outbound queue full, skipping whole packet %p", 3229189592Sbms __func__, m); 3230189592Sbms mt = m->m_nextpkt; 3231189592Sbms if (!docopy) 3232189592Sbms m_freem(m); 3233189592Sbms m = mt; 3234189592Sbms continue; 3235189592Sbms } 3236189592Sbms 3237189592Sbms if (!docopy) { 3238189592Sbms CTR2(KTR_IGMPV3, "%s: dequeueing %p", __func__, m); 3239189592Sbms _IF_DEQUEUE(gq, m0); 3240189592Sbms m = m0->m_nextpkt; 3241189592Sbms } else { 3242189592Sbms CTR2(KTR_IGMPV3, "%s: copying %p", __func__, m); 3243189592Sbms m0 = m_dup(m, M_NOWAIT); 3244189592Sbms if (m0 == NULL) 3245189592Sbms return (ENOMEM); 3246189592Sbms m0->m_nextpkt = NULL; 3247189592Sbms m = m->m_nextpkt; 3248189592Sbms } 3249189592Sbms 3250189592Sbms if (!domerge) { 3251189592Sbms CTR3(KTR_IGMPV3, "%s: queueing %p to ifscq %p)", 3252189592Sbms __func__, m0, ifscq); 3253189592Sbms _IF_ENQUEUE(ifscq, m0); 3254189592Sbms } else { 3255189592Sbms struct mbuf *mtl; /* last mbuf of packet mt */ 3256189592Sbms 3257189592Sbms CTR3(KTR_IGMPV3, "%s: merging %p with ifscq tail %p)", 3258189592Sbms __func__, m0, mt); 3259189592Sbms 3260189592Sbms mtl = m_last(mt); 3261189592Sbms m0->m_flags &= ~M_PKTHDR; 3262189592Sbms mt->m_pkthdr.len += recslen; 3263189592Sbms mt->m_pkthdr.PH_vt.vt_nrecs += 3264189592Sbms m0->m_pkthdr.PH_vt.vt_nrecs; 3265189592Sbms 3266189592Sbms mtl->m_next = m0; 3267189592Sbms } 3268189592Sbms } 3269189592Sbms 3270189592Sbms return (0); 3271189592Sbms} 3272189592Sbms 3273189592Sbms/* 3274189592Sbms * Respond to a pending IGMPv3 General Query. 3275189592Sbms */ 3276189592Sbmsstatic void 3277189592Sbmsigmp_v3_dispatch_general_query(struct igmp_ifinfo *igi) 3278189592Sbms{ 3279189592Sbms struct ifmultiaddr *ifma, *tifma; 3280189592Sbms struct ifnet *ifp; 3281189592Sbms struct in_multi *inm; 3282189592Sbms int retval, loop; 3283189592Sbms 3284189592Sbms IN_MULTI_LOCK_ASSERT(); 3285189592Sbms IGMP_LOCK_ASSERT(); 3286189592Sbms 3287189592Sbms KASSERT(igi->igi_version == IGMP_VERSION_3, 3288189592Sbms ("%s: called when version %d", __func__, igi->igi_version)); 3289189592Sbms 3290189592Sbms ifp = igi->igi_ifp; 3291189592Sbms 3292189592Sbms IF_ADDR_LOCK(ifp); 3293189592Sbms TAILQ_FOREACH_SAFE(ifma, &ifp->if_multiaddrs, ifma_link, tifma) { 3294189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 3295189931Sbms ifma->ifma_protospec == NULL) 3296189592Sbms continue; 3297189592Sbms 3298189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 3299189592Sbms KASSERT(ifp == inm->inm_ifp, 3300189592Sbms ("%s: inconsistent ifp", __func__)); 3301189592Sbms 3302189592Sbms switch (inm->inm_state) { 3303189592Sbms case IGMP_NOT_MEMBER: 3304189592Sbms case IGMP_SILENT_MEMBER: 3305189592Sbms break; 3306189592Sbms case IGMP_REPORTING_MEMBER: 3307189592Sbms case IGMP_IDLE_MEMBER: 3308189592Sbms case IGMP_LAZY_MEMBER: 3309189592Sbms case IGMP_SLEEPING_MEMBER: 3310189592Sbms case IGMP_AWAKENING_MEMBER: 3311189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 3312189592Sbms retval = igmp_v3_enqueue_group_record(&igi->igi_gq, 3313189592Sbms inm, 0, 0, 0); 3314189592Sbms CTR2(KTR_IGMPV3, "%s: enqueue record = %d", 3315189592Sbms __func__, retval); 3316189592Sbms break; 3317189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 3318189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 3319189592Sbms case IGMP_LEAVING_MEMBER: 3320189592Sbms break; 3321189592Sbms } 3322189592Sbms } 3323189592Sbms IF_ADDR_UNLOCK(ifp); 3324189592Sbms 3325189592Sbms loop = (igi->igi_flags & IGIF_LOOPBACK) ? 1 : 0; 3326189592Sbms igmp_dispatch_queue(&igi->igi_gq, IGMP_MAX_RESPONSE_BURST, loop); 3327189592Sbms 3328189592Sbms /* 3329189592Sbms * Slew transmission of bursts over 500ms intervals. 3330189592Sbms */ 3331189592Sbms if (igi->igi_gq.ifq_head != NULL) { 3332189592Sbms igi->igi_v3_timer = 1 + IGMP_RANDOM_DELAY( 3333189592Sbms IGMP_RESPONSE_BURST_INTERVAL); 3334189592Sbms V_interface_timers_running = 1; 3335189592Sbms } 3336189592Sbms} 3337189592Sbms 3338189592Sbms/* 3339189592Sbms * Transmit the next pending IGMP message in the output queue. 3340189592Sbms * 3341189592Sbms * We get called from netisr_processqueue(). A mutex private to igmpoq 3342189592Sbms * will be acquired and released around this routine. 3343189592Sbms * 3344189592Sbms * VIMAGE: Needs to store/restore vnet pointer on a per-mbuf-chain basis. 3345189592Sbms * MRT: Nothing needs to be done, as IGMP traffic is always local to 3346189592Sbms * a link and uses a link-scope multicast address. 3347189592Sbms */ 3348189592Sbmsstatic void 3349189592Sbmsigmp_intr(struct mbuf *m) 3350189592Sbms{ 3351189592Sbms struct ip_moptions imo; 3352189592Sbms struct ifnet *ifp; 3353189592Sbms struct mbuf *ipopts, *m0; 3354189592Sbms int error; 3355189592Sbms uint32_t ifindex; 3356189592Sbms 3357189592Sbms CTR2(KTR_IGMPV3, "%s: transmit %p", __func__, m); 3358189592Sbms 3359189592Sbms /* 3360189592Sbms * Restore VNET image pointer from enqueued mbuf chain 3361189592Sbms * before doing anything else. Whilst we use interface 3362189592Sbms * indexes to guard against interface detach, they are 3363189592Sbms * unique to each VIMAGE and must be retrieved. 3364189592Sbms */ 3365189592Sbms CURVNET_SET(m->m_pkthdr.header); 3366189592Sbms ifindex = igmp_restore_context(m); 3367189592Sbms 3368189592Sbms /* 3369189592Sbms * Check if the ifnet still exists. This limits the scope of 3370189592Sbms * any race in the absence of a global ifp lock for low cost 3371189592Sbms * (an array lookup). 3372189592Sbms */ 3373189592Sbms ifp = ifnet_byindex(ifindex); 3374189592Sbms if (ifp == NULL) { 3375189592Sbms CTR3(KTR_IGMPV3, "%s: dropped %p as ifindex %u went away.", 3376189592Sbms __func__, m, ifindex); 3377189592Sbms m_freem(m); 3378190951Srwatson IPSTAT_INC(ips_noroute); 3379189592Sbms goto out; 3380189592Sbms } 3381189592Sbms 3382189592Sbms ipopts = V_igmp_sendra ? m_raopt : NULL; 3383189592Sbms 3384119181Srwatson imo.imo_multicast_ttl = 1; 338515292Swollman imo.imo_multicast_vif = -1; 3386181803Sbz imo.imo_multicast_loop = (V_ip_mrouter != NULL); 33871541Srgrimes 338815292Swollman /* 3389189592Sbms * If the user requested that IGMP traffic be explicitly 3390189592Sbms * redirected to the loopback interface (e.g. they are running a 3391189592Sbms * MANET interface and the routing protocol needs to see the 3392189592Sbms * updates), handle this now. 339315292Swollman */ 3394189592Sbms if (m->m_flags & M_IGMP_LOOP) 3395189592Sbms imo.imo_multicast_ifp = V_loif; 3396189592Sbms else 3397189592Sbms imo.imo_multicast_ifp = ifp; 33982531Swollman 3399189592Sbms if (m->m_flags & M_IGMPV2) { 3400189592Sbms m0 = m; 3401189592Sbms } else { 3402189592Sbms m0 = igmp_v3_encap_report(ifp, m); 3403189592Sbms if (m0 == NULL) { 3404189592Sbms CTR2(KTR_IGMPV3, "%s: dropped %p", __func__, m); 3405189592Sbms m_freem(m); 3406190951Srwatson IPSTAT_INC(ips_odropped); 3407189592Sbms goto out; 3408189592Sbms } 3409189592Sbms } 3410189592Sbms 3411189592Sbms igmp_scrub_context(m0); 3412189592Sbms m->m_flags &= ~(M_PROTOFLAGS); 3413189592Sbms m0->m_pkthdr.rcvif = V_loif; 3414189592Sbms#ifdef MAC 3415189592Sbms mac_netinet_igmp_send(ifp, m0); 3416189592Sbms#endif 3417189592Sbms error = ip_output(m0, ipopts, NULL, 0, &imo, NULL); 3418189592Sbms if (error) { 3419189592Sbms CTR3(KTR_IGMPV3, "%s: ip_output(%p) = %d", __func__, m0, error); 3420189592Sbms goto out; 3421189592Sbms } 3422189592Sbms 3423190965Srwatson IGMPSTAT_INC(igps_snd_reports); 3424189592Sbms 3425189592Sbmsout: 3426189592Sbms /* 3427189592Sbms * We must restore the existing vnet pointer before 3428189592Sbms * continuing as we are run from netisr context. 3429189592Sbms */ 3430189592Sbms CURVNET_RESTORE(); 34311541Srgrimes} 3432189592Sbms 3433189592Sbms/* 3434189592Sbms * Encapsulate an IGMPv3 report. 3435189592Sbms * 3436189592Sbms * The internal mbuf flag M_IGMPV3_HDR is used to indicate that the mbuf 3437189592Sbms * chain has already had its IP/IGMPv3 header prepended. In this case 3438189592Sbms * the function will not attempt to prepend; the lengths and checksums 3439189592Sbms * will however be re-computed. 3440189592Sbms * 3441189592Sbms * Returns a pointer to the new mbuf chain head, or NULL if the 3442189592Sbms * allocation failed. 3443189592Sbms */ 3444189592Sbmsstatic struct mbuf * 3445189592Sbmsigmp_v3_encap_report(struct ifnet *ifp, struct mbuf *m) 3446189592Sbms{ 3447189592Sbms INIT_VNET_NET(curvnet); 3448189592Sbms INIT_VNET_INET(curvnet); 3449189592Sbms struct igmp_report *igmp; 3450189592Sbms struct ip *ip; 3451189592Sbms int hdrlen, igmpreclen; 3452189592Sbms 3453189592Sbms KASSERT((m->m_flags & M_PKTHDR), 3454189592Sbms ("%s: mbuf chain %p is !M_PKTHDR", __func__, m)); 3455189592Sbms 3456189592Sbms igmpreclen = m_length(m, NULL); 3457189592Sbms hdrlen = sizeof(struct ip) + sizeof(struct igmp_report); 3458189592Sbms 3459189592Sbms if (m->m_flags & M_IGMPV3_HDR) { 3460189592Sbms igmpreclen -= hdrlen; 3461189592Sbms } else { 3462189592Sbms M_PREPEND(m, hdrlen, M_DONTWAIT); 3463189592Sbms if (m == NULL) 3464189592Sbms return (NULL); 3465189592Sbms m->m_flags |= M_IGMPV3_HDR; 3466189592Sbms } 3467189592Sbms 3468189592Sbms CTR2(KTR_IGMPV3, "%s: igmpreclen is %d", __func__, igmpreclen); 3469189592Sbms 3470189592Sbms m->m_data += sizeof(struct ip); 3471189592Sbms m->m_len -= sizeof(struct ip); 3472189592Sbms 3473189592Sbms igmp = mtod(m, struct igmp_report *); 3474189592Sbms igmp->ir_type = IGMP_v3_HOST_MEMBERSHIP_REPORT; 3475189592Sbms igmp->ir_rsv1 = 0; 3476189592Sbms igmp->ir_rsv2 = 0; 3477189592Sbms igmp->ir_numgrps = htons(m->m_pkthdr.PH_vt.vt_nrecs); 3478189592Sbms igmp->ir_cksum = 0; 3479189592Sbms igmp->ir_cksum = in_cksum(m, sizeof(struct igmp_report) + igmpreclen); 3480189592Sbms m->m_pkthdr.PH_vt.vt_nrecs = 0; 3481189592Sbms 3482189592Sbms m->m_data -= sizeof(struct ip); 3483189592Sbms m->m_len += sizeof(struct ip); 3484189592Sbms 3485189592Sbms ip = mtod(m, struct ip *); 3486189592Sbms ip->ip_tos = IPTOS_PREC_INTERNETCONTROL; 3487189592Sbms ip->ip_len = hdrlen + igmpreclen; 3488189592Sbms ip->ip_off = IP_DF; 3489189592Sbms ip->ip_p = IPPROTO_IGMP; 3490189592Sbms ip->ip_sum = 0; 3491189592Sbms 3492189592Sbms ip->ip_src.s_addr = INADDR_ANY; 3493189592Sbms 3494189592Sbms if (m->m_flags & M_IGMP_LOOP) { 3495189592Sbms struct in_ifaddr *ia; 3496189592Sbms 3497189592Sbms IFP_TO_IA(ifp, ia); 3498189592Sbms if (ia != NULL) 3499189592Sbms ip->ip_src = ia->ia_addr.sin_addr; 3500189592Sbms } 3501189592Sbms 3502189592Sbms ip->ip_dst.s_addr = htonl(INADDR_ALLRPTS_GROUP); 3503189592Sbms 3504189592Sbms return (m); 3505189592Sbms} 3506189592Sbms 3507189592Sbms#ifdef KTR 3508189592Sbmsstatic char * 3509189592Sbmsigmp_rec_type_to_str(const int type) 3510189592Sbms{ 3511189592Sbms 3512189592Sbms switch (type) { 3513189592Sbms case IGMP_CHANGE_TO_EXCLUDE_MODE: 3514189592Sbms return "TO_EX"; 3515189592Sbms break; 3516189592Sbms case IGMP_CHANGE_TO_INCLUDE_MODE: 3517189592Sbms return "TO_IN"; 3518189592Sbms break; 3519189592Sbms case IGMP_MODE_IS_EXCLUDE: 3520189592Sbms return "MODE_EX"; 3521189592Sbms break; 3522189592Sbms case IGMP_MODE_IS_INCLUDE: 3523189592Sbms return "MODE_IN"; 3524189592Sbms break; 3525189592Sbms case IGMP_ALLOW_NEW_SOURCES: 3526189592Sbms return "ALLOW_NEW"; 3527189592Sbms break; 3528189592Sbms case IGMP_BLOCK_OLD_SOURCES: 3529189592Sbms return "BLOCK_OLD"; 3530189592Sbms break; 3531189592Sbms default: 3532189592Sbms break; 3533189592Sbms } 3534189592Sbms return "unknown"; 3535189592Sbms} 3536189592Sbms#endif 3537189592Sbms 3538189592Sbmsstatic void 3539189592Sbmsigmp_sysinit(void) 3540189592Sbms{ 3541189592Sbms 3542189592Sbms CTR1(KTR_IGMPV3, "%s: initializing", __func__); 3543189592Sbms 3544189592Sbms IGMP_LOCK_INIT(); 3545189592Sbms 3546189592Sbms mtx_init(&igmpoq.ifq_mtx, "igmpoq_mtx", NULL, MTX_DEF); 3547189592Sbms IFQ_SET_MAXLEN(&igmpoq, IFQ_MAXLEN); 3548189592Sbms 3549189592Sbms m_raopt = igmp_ra_alloc(); 3550189592Sbms 3551191264Sbms netisr_register(NETISR_IGMP, igmp_intr, &igmpoq, 0); 3552189592Sbms} 3553189592Sbms 3554189592Sbmsstatic void 3555189592Sbmsigmp_sysuninit(void) 3556189592Sbms{ 3557189592Sbms 3558189592Sbms CTR1(KTR_IGMPV3, "%s: tearing down", __func__); 3559189592Sbms 3560189592Sbms netisr_unregister(NETISR_IGMP); 3561189592Sbms mtx_destroy(&igmpoq.ifq_mtx); 3562189592Sbms 3563189592Sbms m_free(m_raopt); 3564189592Sbms m_raopt = NULL; 3565189592Sbms 3566189592Sbms IGMP_LOCK_DESTROY(); 3567189592Sbms} 3568189592Sbms 3569189592Sbms/* 3570189592Sbms * Initialize an IGMPv3 instance. 3571189592Sbms * VIMAGE: Assumes curvnet set by caller and called per vimage. 3572189592Sbms */ 3573189592Sbmsstatic int 3574189592Sbmsvnet_igmp_iattach(const void *unused __unused) 3575189592Sbms{ 3576189592Sbms INIT_VNET_INET(curvnet); 3577189592Sbms 3578189592Sbms CTR1(KTR_IGMPV3, "%s: initializing", __func__); 3579189592Sbms 3580189592Sbms LIST_INIT(&V_igi_head); 3581189592Sbms 3582189592Sbms V_current_state_timers_running = 0; 3583189592Sbms V_state_change_timers_running = 0; 3584189592Sbms V_interface_timers_running = 0; 3585189592Sbms 3586189592Sbms /* 3587189592Sbms * Initialize sysctls to default values. 3588189592Sbms */ 3589189592Sbms V_igmp_recvifkludge = 1; 3590189592Sbms V_igmp_sendra = 1; 3591189592Sbms V_igmp_sendlocal = 1; 3592189592Sbms V_igmp_v1enable = 1; 3593189592Sbms V_igmp_v2enable = 1; 3594189592Sbms V_igmp_legacysupp = 0; 3595189592Sbms V_igmp_default_version = IGMP_VERSION_3; 3596189592Sbms V_igmp_gsrdelay.tv_sec = 10; 3597189592Sbms V_igmp_gsrdelay.tv_usec = 0; 3598189592Sbms 3599189592Sbms memset(&V_igmpstat, 0, sizeof(struct igmpstat)); 3600189592Sbms V_igmpstat.igps_version = IGPS_VERSION_3; 3601189592Sbms V_igmpstat.igps_len = sizeof(struct igmpstat); 3602189592Sbms 3603189592Sbms return (0); 3604189592Sbms} 3605189592Sbms 3606189592Sbmsstatic int 3607189592Sbmsvnet_igmp_idetach(const void *unused __unused) 3608189592Sbms{ 3609189592Sbms INIT_VNET_INET(curvnet); 3610189592Sbms 3611189592Sbms CTR1(KTR_IGMPV3, "%s: tearing down", __func__); 3612189592Sbms 3613189592Sbms KASSERT(LIST_EMPTY(&V_igi_head), 3614189592Sbms ("%s: igi list not empty; ifnets not detached?", __func__)); 3615189592Sbms 3616189592Sbms return (0); 3617189592Sbms} 3618189592Sbms 3619189592Sbms#ifdef VIMAGE 3620189592Sbmsstatic struct vnet_symmap vnet_igmp_symmap[] = { 3621189592Sbms VNET_SYMMAP(igmp, igi_head), 3622189592Sbms VNET_SYMMAP(igmp, igmpstat), 3623189592Sbms VNET_SYMMAP_END 3624189592Sbms}; 3625189592SbmsVNET_MOD_DECLARE(IGMP, igmp, vnet_igmp_iattach, vnet_igmp_idetach, 3626189592Sbms vnet_igmp_symmap); 3627189592Sbms#endif /* VIMAGE */ 3628189592Sbms 3629189592Sbmsstatic int 3630189592Sbmsigmp_modevent(module_t mod, int type, void *unused __unused) 3631189592Sbms{ 3632189592Sbms 3633189592Sbms switch (type) { 3634189592Sbms case MOD_LOAD: 3635189592Sbms igmp_sysinit(); 3636189592Sbms#ifdef VIMAGE 3637189592Sbms vnet_mod_register(&vnet_igmp_modinfo); 3638189592Sbms#else 3639189592Sbms (void)vnet_igmp_iattach(NULL); 3640189592Sbms#endif /* VIMAGE */ 3641189592Sbms break; 3642189592Sbms case MOD_UNLOAD: 3643189592Sbms#ifdef VIMAGE 3644189592Sbms /* 3645189592Sbms * TODO: Allow module unload if any VIMAGE instances 3646189592Sbms * are using this module. 3647189592Sbms */ 3648189592Sbms return (EBUSY); 3649189592Sbms#else 3650189592Sbms (void)vnet_igmp_idetach(NULL); 3651189592Sbms#endif /* VIMAGE */ 3652189592Sbms igmp_sysuninit(); 3653189592Sbms break; 3654189592Sbms default: 3655189592Sbms return (EOPNOTSUPP); 3656189592Sbms } 3657189592Sbms return (0); 3658189592Sbms} 3659189592Sbms 3660189592Sbmsstatic moduledata_t igmp_mod = { 3661189592Sbms "igmp", 3662189592Sbms igmp_modevent, 3663189592Sbms 0 3664189592Sbms}; 3665189592SbmsDECLARE_MODULE(igmp, igmp_mod, SI_SUB_PSEUDO, SI_ORDER_ANY); 3666