igmp.c revision 191816
1139823Simp/*- 2189592Sbms * Copyright (c) 2007-2009 Bruce Simpson. 31541Srgrimes * Copyright (c) 1988 Stephen Deering. 41541Srgrimes * Copyright (c) 1992, 1993 51541Srgrimes * The Regents of the University of California. All rights reserved. 61541Srgrimes * 71541Srgrimes * This code is derived from software contributed to Berkeley by 81541Srgrimes * Stephen Deering of Stanford University. 91541Srgrimes * 101541Srgrimes * Redistribution and use in source and binary forms, with or without 111541Srgrimes * modification, are permitted provided that the following conditions 121541Srgrimes * are met: 131541Srgrimes * 1. Redistributions of source code must retain the above copyright 141541Srgrimes * notice, this list of conditions and the following disclaimer. 151541Srgrimes * 2. Redistributions in binary form must reproduce the above copyright 161541Srgrimes * notice, this list of conditions and the following disclaimer in the 171541Srgrimes * documentation and/or other materials provided with the distribution. 181541Srgrimes * 4. Neither the name of the University nor the names of its contributors 191541Srgrimes * may be used to endorse or promote products derived from this software 201541Srgrimes * without specific prior written permission. 211541Srgrimes * 221541Srgrimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 231541Srgrimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 241541Srgrimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 251541Srgrimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 261541Srgrimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 271541Srgrimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 281541Srgrimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 291541Srgrimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 301541Srgrimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 311541Srgrimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 321541Srgrimes * SUCH DAMAGE. 331541Srgrimes * 341541Srgrimes * @(#)igmp.c 8.1 (Berkeley) 7/19/93 351541Srgrimes */ 361541Srgrimes 372531Swollman/* 382531Swollman * Internet Group Management Protocol (IGMP) routines. 39189592Sbms * [RFC1112, RFC2236, RFC3376] 402531Swollman * 412531Swollman * Written by Steve Deering, Stanford, May 1988. 422531Swollman * Modified by Rosen Sharma, Stanford, Aug 1994. 439209Swollman * Modified by Bill Fenner, Xerox PARC, Feb 1995. 4414622Sfenner * Modified to fully comply to IGMPv2 by Bill Fenner, Oct 1995. 45189592Sbms * Significantly rewritten for IGMPv3, VIMAGE, and SMP by Bruce Simpson. 462531Swollman * 4714622Sfenner * MULTICAST Revision: 3.5.1.4 482531Swollman */ 491541Srgrimes 50172467Ssilby#include <sys/cdefs.h> 51172467Ssilby__FBSDID("$FreeBSD: head/sys/netinet/igmp.c 191816 2009-05-05 10:56:12Z zec $"); 52172467Ssilby 53101091Srwatson#include "opt_mac.h" 54189106Sbz#include "opt_route.h" 55101091Srwatson 561541Srgrimes#include <sys/param.h> 571549Srgrimes#include <sys/systm.h> 58189592Sbms#include <sys/module.h> 5929024Sbde#include <sys/malloc.h> 601541Srgrimes#include <sys/mbuf.h> 611541Srgrimes#include <sys/socket.h> 621541Srgrimes#include <sys/protosw.h> 6312296Sphk#include <sys/kernel.h> 646472Swollman#include <sys/sysctl.h> 65181803Sbz#include <sys/vimage.h> 66189592Sbms#include <sys/ktr.h> 67189592Sbms#include <sys/condvar.h> 681541Srgrimes 691541Srgrimes#include <net/if.h> 70189592Sbms#include <net/netisr.h> 711541Srgrimes#include <net/route.h> 72185571Sbz#include <net/vnet.h> 731541Srgrimes 741541Srgrimes#include <netinet/in.h> 751541Srgrimes#include <netinet/in_var.h> 761541Srgrimes#include <netinet/in_systm.h> 771541Srgrimes#include <netinet/ip.h> 781541Srgrimes#include <netinet/ip_var.h> 79152592Sandre#include <netinet/ip_options.h> 801541Srgrimes#include <netinet/igmp.h> 811541Srgrimes#include <netinet/igmp_var.h> 82185571Sbz#include <netinet/vinet.h> 831541Srgrimes 8460105Sjlemon#include <machine/in_cksum.h> 8560105Sjlemon 86163606Srwatson#include <security/mac/mac_framework.h> 87163606Srwatson 88189592Sbms#ifndef KTR_IGMPV3 89191657Sbms#define KTR_IGMPV3 KTR_INET 90189592Sbms#endif 9130309Sphk 92189592Sbmsstatic struct igmp_ifinfo * 93189592Sbms igi_alloc_locked(struct ifnet *); 94189592Sbmsstatic void igi_delete_locked(const struct ifnet *); 95189592Sbmsstatic void igmp_dispatch_queue(struct ifqueue *, int, const int); 96189592Sbmsstatic void igmp_fasttimo_vnet(void); 97189592Sbmsstatic void igmp_final_leave(struct in_multi *, struct igmp_ifinfo *); 98189592Sbmsstatic int igmp_handle_state_change(struct in_multi *, 99189592Sbms struct igmp_ifinfo *); 100189592Sbmsstatic int igmp_initial_join(struct in_multi *, struct igmp_ifinfo *); 101189592Sbmsstatic int igmp_input_v1_query(struct ifnet *, const struct ip *); 102189592Sbmsstatic int igmp_input_v2_query(struct ifnet *, const struct ip *, 103189592Sbms const struct igmp *); 104189592Sbmsstatic int igmp_input_v3_query(struct ifnet *, const struct ip *, 105189592Sbms /*const*/ struct igmpv3 *); 106189592Sbmsstatic int igmp_input_v3_group_query(struct in_multi *, 107189592Sbms struct igmp_ifinfo *, int, /*const*/ struct igmpv3 *); 108189592Sbmsstatic int igmp_input_v1_report(struct ifnet *, /*const*/ struct ip *, 109189592Sbms /*const*/ struct igmp *); 110189592Sbmsstatic int igmp_input_v2_report(struct ifnet *, /*const*/ struct ip *, 111189592Sbms /*const*/ struct igmp *); 112189592Sbmsstatic void igmp_intr(struct mbuf *); 113189592Sbmsstatic int igmp_isgroupreported(const struct in_addr); 114189592Sbmsstatic struct mbuf * 115189592Sbms igmp_ra_alloc(void); 116189592Sbms#ifdef KTR 117189592Sbmsstatic char * igmp_rec_type_to_str(const int); 118185088Szec#endif 119189592Sbmsstatic void igmp_set_version(struct igmp_ifinfo *, const int); 120189592Sbmsstatic void igmp_slowtimo_vnet(void); 121189592Sbmsstatic void igmp_sysinit(void); 122189592Sbmsstatic int igmp_v1v2_queue_report(struct in_multi *, const int); 123189592Sbmsstatic void igmp_v1v2_process_group_timer(struct in_multi *, const int); 124189592Sbmsstatic void igmp_v1v2_process_querier_timers(struct igmp_ifinfo *); 125189592Sbmsstatic void igmp_v2_update_group(struct in_multi *, const int); 126189592Sbmsstatic void igmp_v3_cancel_link_timers(struct igmp_ifinfo *); 127189592Sbmsstatic void igmp_v3_dispatch_general_query(struct igmp_ifinfo *); 128189592Sbmsstatic struct mbuf * 129189592Sbms igmp_v3_encap_report(struct ifnet *, struct mbuf *); 130189592Sbmsstatic int igmp_v3_enqueue_group_record(struct ifqueue *, 131189592Sbms struct in_multi *, const int, const int, const int); 132189592Sbmsstatic int igmp_v3_enqueue_filter_change(struct ifqueue *, 133189592Sbms struct in_multi *); 134189592Sbmsstatic void igmp_v3_process_group_timers(struct igmp_ifinfo *, 135189592Sbms struct ifqueue *, struct ifqueue *, struct in_multi *, 136189592Sbms const int); 137189592Sbmsstatic int igmp_v3_merge_state_changes(struct in_multi *, 138189592Sbms struct ifqueue *); 139189592Sbmsstatic void igmp_v3_suppress_group_record(struct in_multi *); 140189592Sbmsstatic int sysctl_igmp_default_version(SYSCTL_HANDLER_ARGS); 141189592Sbmsstatic int sysctl_igmp_gsr(SYSCTL_HANDLER_ARGS); 142189592Sbmsstatic int sysctl_igmp_ifinfo(SYSCTL_HANDLER_ARGS); 1432531Swollman 144189592Sbmsstatic vnet_attach_fn vnet_igmp_iattach; 145189592Sbmsstatic vnet_detach_fn vnet_igmp_idetach; 14612296Sphk 147130333Srwatson/* 148189592Sbms * System-wide globals. 149189592Sbms * 150189592Sbms * Unlocked access to these is OK, except for the global IGMP output 151189592Sbms * queue. The IGMP subsystem lock ends up being system-wide for the moment, 152189592Sbms * because all VIMAGEs have to share a global output queue, as netisrs 153189592Sbms * themselves are not virtualized. 154189592Sbms * 155189592Sbms * Locking: 156189592Sbms * * The permitted lock order is: IN_MULTI_LOCK, IGMP_LOCK, IF_ADDR_LOCK. 157189592Sbms * Any may be taken independently; if any are held at the same 158189592Sbms * time, the above lock order must be followed. 159191264Sbms * * All output is delegated to the netisr. 160191264Sbms * Now that Giant has been eliminated, the netisr may be inlined. 161189592Sbms * * IN_MULTI_LOCK covers in_multi. 162189592Sbms * * IGMP_LOCK covers igmp_ifinfo and any global variables in this file, 163189592Sbms * including the output queue. 164189592Sbms * * IF_ADDR_LOCK covers if_multiaddrs, which is used for a variety of 165189592Sbms * per-link state iterators. 166189592Sbms * * igmp_ifinfo is valid as long as PF_INET is attached to the interface, 167189592Sbms * therefore it is not refcounted. 168189592Sbms * We allow unlocked reads of igmp_ifinfo when accessed via in_multi. 169189592Sbms * 170189592Sbms * Reference counting 171189592Sbms * * IGMP acquires its own reference every time an in_multi is passed to 172189592Sbms * it and the group is being joined for the first time. 173189592Sbms * * IGMP releases its reference(s) on in_multi in a deferred way, 174189592Sbms * because the operations which process the release run as part of 175189592Sbms * a loop whose control variables are directly affected by the release 176189592Sbms * (that, and not recursing on the IF_ADDR_LOCK). 177189592Sbms * 178189592Sbms * VIMAGE: Each in_multi corresponds to an ifp, and each ifp corresponds 179189592Sbms * to a vnet in ifp->if_vnet. 180189592Sbms * 181189931Sbms * SMPng: XXX We may potentially race operations on ifma_protospec. 182189931Sbms * The problem is that we currently lack a clean way of taking the 183189931Sbms * IF_ADDR_LOCK() between the ifnet and in layers w/o recursing, 184189931Sbms * as anything which modifies ifma needs to be covered by that lock. 185189931Sbms * So check for ifma_protospec being NULL before proceeding. 186130333Srwatson */ 187189592Sbmsstruct mtx igmp_mtx; 188189592Sbms 189189592Sbmsstruct mbuf *m_raopt; /* Router Alert option */ 190189592SbmsMALLOC_DEFINE(M_IGMP, "igmp", "igmp state"); 191189592Sbms 192189592Sbms/* 193189592Sbms * Global netisr output queue. 194189592Sbms */ 195189592Sbmsstruct ifqueue igmpoq; 196189592Sbms 197189592Sbms/* 198189592Sbms * VIMAGE-wide globals. 199189592Sbms * 200189592Sbms * The IGMPv3 timers themselves need to run per-image, however, 201189592Sbms * protosw timers run globally (see tcp). 202189592Sbms * An ifnet can only be in one vimage at a time, and the loopback 203189592Sbms * ifnet, loif, is itself virtualized. 204189592Sbms * It would otherwise be possible to seriously hose IGMP state, 205189592Sbms * and create inconsistencies in upstream multicast routing, if you have 206189592Sbms * multiple VIMAGEs running on the same link joining different multicast 207189592Sbms * groups, UNLESS the "primary IP address" is different. This is because 208189592Sbms * IGMP for IPv4 does not force link-local addresses to be used for each 209189592Sbms * node, unlike MLD for IPv6. 210189592Sbms * Obviously the IGMPv3 per-interface state has per-vimage granularity 211189592Sbms * also as a result. 212189592Sbms * 213189592Sbms * FUTURE: Stop using IFP_TO_IA/INADDR_ANY, and use source address selection 214189592Sbms * policy to control the address used by IGMP on the link. 215189592Sbms */ 216185088Szec#ifdef VIMAGE_GLOBALS 217189592Sbmsint interface_timers_running; /* IGMPv3 general query response */ 218189592Sbmsint state_change_timers_running; /* IGMPv3 state-change retransmit */ 219189592Sbmsint current_state_timers_running; /* IGMPv1/v2 host report; 220189592Sbms * IGMPv3 g/sg query response */ 221130333Srwatson 222189592SbmsLIST_HEAD(, igmp_ifinfo) igi_head; 223189592Sbmsstruct igmpstat igmpstat; 224189592Sbmsstruct timeval igmp_gsrdelay; 225189592Sbms 226189592Sbmsint igmp_recvifkludge; 227189592Sbmsint igmp_sendra; 228189592Sbmsint igmp_sendlocal; 229189592Sbmsint igmp_v1enable; 230189592Sbmsint igmp_v2enable; 231189592Sbmsint igmp_legacysupp; 232189592Sbmsint igmp_default_version; 233189592Sbms#endif /* VIMAGE_GLOBALS */ 234189592Sbms 235130333Srwatson/* 236189592Sbms * Virtualized sysctls. 237130333Srwatson */ 238189592SbmsSYSCTL_V_STRUCT(V_NET, vnet_inet, _net_inet_igmp, IGMPCTL_STATS, stats, 239189592Sbms CTLFLAG_RW, igmpstat, igmpstat, ""); 240189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, recvifkludge, 241189592Sbms CTLFLAG_RW, igmp_recvifkludge, 0, 242189592Sbms "Rewrite IGMPv1/v2 reports from 0.0.0.0 to contain subnet address"); 243189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, sendra, 244189592Sbms CTLFLAG_RW, igmp_sendra, 0, 245189592Sbms "Send IP Router Alert option in IGMPv2/v3 messages"); 246189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, sendlocal, 247189592Sbms CTLFLAG_RW, igmp_sendlocal, 0, 248189592Sbms "Send IGMP membership reports for 224.0.0.0/24 groups"); 249189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, v1enable, 250189592Sbms CTLFLAG_RW, igmp_v1enable, 0, 251189592Sbms "Enable backwards compatibility with IGMPv1"); 252189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, v2enable, 253189592Sbms CTLFLAG_RW, igmp_v2enable, 0, 254189592Sbms "Enable backwards compatibility with IGMPv2"); 255189592SbmsSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, legacysupp, 256189592Sbms CTLFLAG_RW, igmp_legacysupp, 0, 257189592Sbms "Allow v1/v2 reports to suppress v3 group responses"); 258189592SbmsSYSCTL_V_PROC(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, default_version, 259189592Sbms CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, igmp_default_version, 0, 260189592Sbms sysctl_igmp_default_version, "I", 261189592Sbms "Default version of IGMP to run on each interface"); 262189592SbmsSYSCTL_V_PROC(V_NET, vnet_inet, _net_inet_igmp, OID_AUTO, gsrdelay, 263189592Sbms CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, igmp_gsrdelay.tv_sec, 0, 264189592Sbms sysctl_igmp_gsr, "I", 265189592Sbms "Rate limit for IGMPv3 Group-and-Source queries in seconds"); 266130333Srwatson 267189592Sbms/* 268189592Sbms * Non-virtualized sysctls. 269189592Sbms */ 270189592SbmsSYSCTL_NODE(_net_inet_igmp, OID_AUTO, ifinfo, CTLFLAG_RD | CTLFLAG_MPSAFE, 271189592Sbms sysctl_igmp_ifinfo, "Per-interface IGMPv3 state"); 2721541Srgrimes 273189592Sbmsstatic __inline void 274189592Sbmsigmp_save_context(struct mbuf *m, struct ifnet *ifp) 275189592Sbms{ 276189592Sbms 277189592Sbms#ifdef VIMAGE 278189592Sbms m->m_pkthdr.header = ifp->if_vnet; 279189592Sbms#endif /* VIMAGE */ 280189592Sbms m->m_pkthdr.flowid = ifp->if_index; 281189592Sbms} 282189592Sbms 283189592Sbmsstatic __inline void 284189592Sbmsigmp_scrub_context(struct mbuf *m) 285189592Sbms{ 286189592Sbms 287189592Sbms m->m_pkthdr.header = NULL; 288189592Sbms m->m_pkthdr.flowid = 0; 289189592Sbms} 290189592Sbms 291189592Sbms#ifdef KTR 292189592Sbmsstatic __inline char * 293189592Sbmsinet_ntoa_haddr(in_addr_t haddr) 294189592Sbms{ 295189592Sbms struct in_addr ia; 296189592Sbms 297189592Sbms ia.s_addr = htonl(haddr); 298189592Sbms return (inet_ntoa(ia)); 299189592Sbms} 300119180Srwatson#endif 301119180Srwatson 302189592Sbms/* 303189592Sbms * Restore context from a queued IGMP output chain. 304189592Sbms * Return saved ifindex. 305189592Sbms * 306189592Sbms * VIMAGE: The assertion is there to make sure that we 307189592Sbms * actually called CURVNET_SET() with what's in the mbuf chain. 308189592Sbms */ 309189592Sbmsstatic __inline uint32_t 310189592Sbmsigmp_restore_context(struct mbuf *m) 3111541Srgrimes{ 31214622Sfenner 313189592Sbms#ifdef notyet 314189592Sbms#if defined(VIMAGE) && defined(INVARIANTS) 315189592Sbms KASSERT(curvnet == (m->m_pkthdr.header), 316189592Sbms ("%s: called when curvnet was not restored", __func__)); 317189592Sbms#endif 318189592Sbms#endif 319189592Sbms return (m->m_pkthdr.flowid); 320189592Sbms} 321189592Sbms 322189592Sbms/* 323189592Sbms * Retrieve or set default IGMP version. 324189592Sbms * 325189592Sbms * VIMAGE: Assume curvnet set by caller. 326189592Sbms * SMPng: NOTE: Serialized by IGMP lock. 327189592Sbms */ 328189592Sbmsstatic int 329189592Sbmssysctl_igmp_default_version(SYSCTL_HANDLER_ARGS) 330189592Sbms{ 331191548Szec INIT_VNET_INET(curvnet); 332189592Sbms int error; 333189592Sbms int new; 334189592Sbms 335189592Sbms error = sysctl_wire_old_buffer(req, sizeof(int)); 336189592Sbms if (error) 337189592Sbms return (error); 338189592Sbms 339189592Sbms IGMP_LOCK(); 340189592Sbms 341189592Sbms new = V_igmp_default_version; 342189592Sbms 343189592Sbms error = sysctl_handle_int(oidp, &new, 0, req); 344189592Sbms if (error || !req->newptr) 345189592Sbms goto out_locked; 346189592Sbms 347189592Sbms if (new < IGMP_VERSION_1 || new > IGMP_VERSION_3) { 348189592Sbms error = EINVAL; 349189592Sbms goto out_locked; 350189592Sbms } 351189592Sbms 352189592Sbms CTR2(KTR_IGMPV3, "change igmp_default_version from %d to %d", 353189592Sbms V_igmp_default_version, new); 354189592Sbms 355189592Sbms V_igmp_default_version = new; 356189592Sbms 357189592Sbmsout_locked: 358189592Sbms IGMP_UNLOCK(); 359189592Sbms return (error); 360189592Sbms} 361189592Sbms 362189592Sbms/* 363189592Sbms * Retrieve or set threshold between group-source queries in seconds. 364189592Sbms * 365189592Sbms * VIMAGE: Assume curvnet set by caller. 366189592Sbms * SMPng: NOTE: Serialized by IGMP lock. 367189592Sbms */ 368189592Sbmsstatic int 369189592Sbmssysctl_igmp_gsr(SYSCTL_HANDLER_ARGS) 370189592Sbms{ 371191548Szec INIT_VNET_INET(curvnet); 372189592Sbms int error; 373189592Sbms int i; 374189592Sbms 375189592Sbms error = sysctl_wire_old_buffer(req, sizeof(int)); 376189592Sbms if (error) 377189592Sbms return (error); 378189592Sbms 379189592Sbms IGMP_LOCK(); 380189592Sbms 381189592Sbms i = V_igmp_gsrdelay.tv_sec; 382189592Sbms 383189592Sbms error = sysctl_handle_int(oidp, &i, 0, req); 384189592Sbms if (error || !req->newptr) 385189592Sbms goto out_locked; 386189592Sbms 387189592Sbms if (i < -1 || i >= 60) { 388189592Sbms error = EINVAL; 389189592Sbms goto out_locked; 390189592Sbms } 391189592Sbms 392189592Sbms CTR2(KTR_IGMPV3, "change igmp_gsrdelay from %d to %d", 393189592Sbms V_igmp_gsrdelay.tv_sec, i); 394189592Sbms V_igmp_gsrdelay.tv_sec = i; 395189592Sbms 396189592Sbmsout_locked: 397189592Sbms IGMP_UNLOCK(); 398189592Sbms return (error); 399189592Sbms} 400189592Sbms 401189592Sbms/* 402189592Sbms * Expose struct igmp_ifinfo to userland, keyed by ifindex. 403189592Sbms * For use by ifmcstat(8). 404189592Sbms * 405189592Sbms * SMPng: NOTE: Does an unlocked ifindex space read. 406189592Sbms * VIMAGE: Assume curvnet set by caller. The node handler itself 407189592Sbms * is not directly virtualized. 408189592Sbms */ 409189592Sbmsstatic int 410189592Sbmssysctl_igmp_ifinfo(SYSCTL_HANDLER_ARGS) 411189592Sbms{ 412189592Sbms INIT_VNET_NET(curvnet); 413191548Szec INIT_VNET_INET(curvnet); 414189592Sbms int *name; 415189592Sbms int error; 416189592Sbms u_int namelen; 417189592Sbms struct ifnet *ifp; 418189592Sbms struct igmp_ifinfo *igi; 419189592Sbms 420189592Sbms name = (int *)arg1; 421189592Sbms namelen = arg2; 422189592Sbms 423189592Sbms if (req->newptr != NULL) 424189592Sbms return (EPERM); 425189592Sbms 426189592Sbms if (namelen != 1) 427189592Sbms return (EINVAL); 428189592Sbms 429189592Sbms error = sysctl_wire_old_buffer(req, sizeof(struct igmp_ifinfo)); 430189592Sbms if (error) 431189592Sbms return (error); 432189592Sbms 433189592Sbms IN_MULTI_LOCK(); 434189592Sbms IGMP_LOCK(); 435189592Sbms 436189592Sbms if (name[0] <= 0 || name[0] > V_if_index) { 437189592Sbms error = ENOENT; 438189592Sbms goto out_locked; 439189592Sbms } 440189592Sbms 441189592Sbms error = ENOENT; 442189592Sbms 443189592Sbms ifp = ifnet_byindex(name[0]); 444189592Sbms if (ifp == NULL) 445189592Sbms goto out_locked; 446189592Sbms 447189592Sbms LIST_FOREACH(igi, &V_igi_head, igi_link) { 448189592Sbms if (ifp == igi->igi_ifp) { 449189592Sbms error = SYSCTL_OUT(req, igi, 450189592Sbms sizeof(struct igmp_ifinfo)); 451189592Sbms break; 452189592Sbms } 453189592Sbms } 454189592Sbms 455189592Sbmsout_locked: 456189592Sbms IGMP_UNLOCK(); 457189592Sbms IN_MULTI_UNLOCK(); 458189592Sbms return (error); 459189592Sbms} 460189592Sbms 461189592Sbms/* 462189592Sbms * Dispatch an entire queue of pending packet chains 463189592Sbms * using the netisr. 464189592Sbms * VIMAGE: Assumes the vnet pointer has been set. 465189592Sbms */ 466189592Sbmsstatic void 467189592Sbmsigmp_dispatch_queue(struct ifqueue *ifq, int limit, const int loop) 468189592Sbms{ 469189592Sbms struct mbuf *m; 470189592Sbms 471189592Sbms for (;;) { 472189592Sbms _IF_DEQUEUE(ifq, m); 473189592Sbms if (m == NULL) 474189592Sbms break; 475189592Sbms CTR3(KTR_IGMPV3, "%s: dispatch %p from %p", __func__, ifq, m); 476189592Sbms if (loop) 477189592Sbms m->m_flags |= M_IGMP_LOOP; 478189592Sbms netisr_dispatch(NETISR_IGMP, m); 479189592Sbms if (--limit == 0) 480189592Sbms break; 481189592Sbms } 482189592Sbms} 483189592Sbms 484189592Sbms/* 485189592Sbms * Filter outgoing IGMP report state by group. 486189592Sbms * 487189592Sbms * Reports are ALWAYS suppressed for ALL-HOSTS (224.0.0.1). 488189592Sbms * If the net.inet.igmp.sendlocal sysctl is 0, then IGMP reports are 489189592Sbms * disabled for all groups in the 224.0.0.0/24 link-local scope. However, 490189592Sbms * this may break certain IGMP snooping switches which rely on the old 491189592Sbms * report behaviour. 492189592Sbms * 493189592Sbms * Return zero if the given group is one for which IGMP reports 494189592Sbms * should be suppressed, or non-zero if reports should be issued. 495189592Sbms */ 496189592Sbmsstatic __inline int 497189592Sbmsigmp_isgroupreported(const struct in_addr addr) 498189592Sbms{ 499191548Szec INIT_VNET_INET(curvnet); 500189592Sbms 501189592Sbms if (in_allhosts(addr) || 502189592Sbms ((!V_igmp_sendlocal && IN_LOCAL_GROUP(ntohl(addr.s_addr))))) 503189592Sbms return (0); 504189592Sbms 505189592Sbms return (1); 506189592Sbms} 507189592Sbms 508189592Sbms/* 509189592Sbms * Construct a Router Alert option to use in outgoing packets. 510189592Sbms */ 511189592Sbmsstatic struct mbuf * 512189592Sbmsigmp_ra_alloc(void) 513189592Sbms{ 514189592Sbms struct mbuf *m; 515189592Sbms struct ipoption *p; 516189592Sbms 517189592Sbms MGET(m, M_DONTWAIT, MT_DATA); 518189592Sbms p = mtod(m, struct ipoption *); 519189592Sbms p->ipopt_dst.s_addr = INADDR_ANY; 520189592Sbms p->ipopt_list[0] = IPOPT_RA; /* Router Alert Option */ 521189592Sbms p->ipopt_list[1] = 0x04; /* 4 bytes long */ 522189592Sbms p->ipopt_list[2] = IPOPT_EOL; /* End of IP option list */ 523189592Sbms p->ipopt_list[3] = 0x00; /* pad byte */ 524189592Sbms m->m_len = sizeof(p->ipopt_dst) + p->ipopt_list[1]; 525189592Sbms 526189592Sbms return (m); 527189592Sbms} 528189592Sbms 529189592Sbms/* 530189592Sbms * Attach IGMP when PF_INET is attached to an interface. 531189592Sbms * 532189592Sbms * VIMAGE: Currently we set the vnet pointer, although it is 533189592Sbms * likely that it was already set by our caller. 534189592Sbms */ 535189592Sbmsstruct igmp_ifinfo * 536189592Sbmsigmp_domifattach(struct ifnet *ifp) 537189592Sbms{ 538189592Sbms struct igmp_ifinfo *igi; 539189592Sbms 540189592Sbms CTR3(KTR_IGMPV3, "%s: called for ifp %p(%s)", 541189592Sbms __func__, ifp, ifp->if_xname); 542189592Sbms 543189592Sbms CURVNET_SET(ifp->if_vnet); 544189592Sbms IGMP_LOCK(); 545189592Sbms 546189592Sbms igi = igi_alloc_locked(ifp); 547189592Sbms if (!(ifp->if_flags & IFF_MULTICAST)) 548189592Sbms igi->igi_flags |= IGIF_SILENT; 549189592Sbms 550189592Sbms IGMP_UNLOCK(); 551189592Sbms CURVNET_RESTORE(); 552189592Sbms 553189592Sbms return (igi); 554189592Sbms} 555189592Sbms 556189592Sbms/* 557189592Sbms * VIMAGE: assume curvnet set by caller. 558189592Sbms */ 559189592Sbmsstatic struct igmp_ifinfo * 560189592Sbmsigi_alloc_locked(/*const*/ struct ifnet *ifp) 561189592Sbms{ 562191548Szec INIT_VNET_INET(ifp->if_vnet); 563189592Sbms struct igmp_ifinfo *igi; 564189592Sbms 565189592Sbms IGMP_LOCK_ASSERT(); 566189592Sbms 567189592Sbms igi = malloc(sizeof(struct igmp_ifinfo), M_IGMP, M_NOWAIT|M_ZERO); 568189592Sbms if (igi == NULL) 569189592Sbms goto out; 570189592Sbms 571189592Sbms igi->igi_ifp = ifp; 572189592Sbms igi->igi_version = V_igmp_default_version; 573189592Sbms igi->igi_flags = 0; 574189592Sbms igi->igi_rv = IGMP_RV_INIT; 575189592Sbms igi->igi_qi = IGMP_QI_INIT; 576189592Sbms igi->igi_qri = IGMP_QRI_INIT; 577189592Sbms igi->igi_uri = IGMP_URI_INIT; 578189592Sbms 579189592Sbms SLIST_INIT(&igi->igi_relinmhead); 580189592Sbms 5811541Srgrimes /* 582189592Sbms * Responses to general queries are subject to bounds. 5831541Srgrimes */ 584189592Sbms IFQ_SET_MAXLEN(&igi->igi_gq, IGMP_MAX_RESPONSE_PACKETS); 5859209Swollman 586189592Sbms LIST_INSERT_HEAD(&V_igi_head, igi, igi_link); 5879209Swollman 588189592Sbms CTR2(KTR_IGMPV3, "allocate igmp_ifinfo for ifp %p(%s)", 589189592Sbms ifp, ifp->if_xname); 590189592Sbms 591189592Sbmsout: 592189592Sbms return (igi); 593189592Sbms} 594189592Sbms 595189592Sbms/* 596189592Sbms * Hook for ifdetach. 597189592Sbms * 598189592Sbms * NOTE: Some finalization tasks need to run before the protocol domain 599189592Sbms * is detached, but also before the link layer does its cleanup. 600189592Sbms * 601189592Sbms * SMPNG: igmp_ifdetach() needs to take IF_ADDR_LOCK(). 602189931Sbms * XXX This is also bitten by unlocked ifma_protospec access. 603189592Sbms * 604189592Sbms * VIMAGE: curvnet should have been set by caller, but let's not assume 605189592Sbms * that for now. 606189592Sbms */ 607189592Sbmsvoid 608189592Sbmsigmp_ifdetach(struct ifnet *ifp) 609189592Sbms{ 610189592Sbms struct igmp_ifinfo *igi; 611189592Sbms struct ifmultiaddr *ifma; 612189592Sbms struct in_multi *inm, *tinm; 613189592Sbms 614189592Sbms CTR3(KTR_IGMPV3, "%s: called for ifp %p(%s)", __func__, ifp, 615189592Sbms ifp->if_xname); 616189592Sbms 617189592Sbms CURVNET_SET(ifp->if_vnet); 618189592Sbms 619189592Sbms IGMP_LOCK(); 620189592Sbms 621189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 622189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 623189592Sbms IF_ADDR_LOCK(ifp); 624189592Sbms TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 625189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 626189931Sbms ifma->ifma_protospec == NULL) 627189592Sbms continue; 628189931Sbms#if 0 629189931Sbms KASSERT(ifma->ifma_protospec != NULL, 630189931Sbms ("%s: ifma_protospec is NULL", __func__)); 631189931Sbms#endif 632189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 633189592Sbms if (inm->inm_state == IGMP_LEAVING_MEMBER) { 634189592Sbms SLIST_INSERT_HEAD(&igi->igi_relinmhead, 635189592Sbms inm, inm_nrele); 636189592Sbms } 637189592Sbms inm_clear_recorded(inm); 638189592Sbms } 639189592Sbms IF_ADDR_UNLOCK(ifp); 640189592Sbms /* 641189592Sbms * Free the in_multi reference(s) for this IGMP lifecycle. 642189592Sbms */ 643189592Sbms SLIST_FOREACH_SAFE(inm, &igi->igi_relinmhead, inm_nrele, 644189592Sbms tinm) { 645189592Sbms SLIST_REMOVE_HEAD(&igi->igi_relinmhead, inm_nrele); 646189592Sbms inm_release_locked(inm); 647189592Sbms } 648189592Sbms } 649189592Sbms 650189592Sbms IGMP_UNLOCK(); 651189592Sbms 652189592Sbms CURVNET_RESTORE(); 6531541Srgrimes} 6541541Srgrimes 655189592Sbms/* 656189592Sbms * Hook for domifdetach. 657189592Sbms * 658189592Sbms * VIMAGE: curvnet should have been set by caller, but let's not assume 659189592Sbms * that for now. 660189592Sbms */ 661189592Sbmsvoid 662189592Sbmsigmp_domifdetach(struct ifnet *ifp) 6632531Swollman{ 664189592Sbms struct igmp_ifinfo *igi; 665189592Sbms 666189592Sbms CTR3(KTR_IGMPV3, "%s: called for ifp %p(%s)", 667189592Sbms __func__, ifp, ifp->if_xname); 668189592Sbms 669189592Sbms CURVNET_SET(ifp->if_vnet); 670189592Sbms IGMP_LOCK(); 671189592Sbms 672189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 673189592Sbms igi_delete_locked(ifp); 674189592Sbms 675189592Sbms IGMP_UNLOCK(); 676189592Sbms CURVNET_RESTORE(); 677189592Sbms} 678189592Sbms 679189592Sbmsstatic void 680189592Sbmsigi_delete_locked(const struct ifnet *ifp) 681189592Sbms{ 682191548Szec INIT_VNET_INET(ifp->if_vnet); 683189592Sbms struct igmp_ifinfo *igi, *tigi; 684189592Sbms 685189592Sbms CTR3(KTR_IGMPV3, "%s: freeing igmp_ifinfo for ifp %p(%s)", 686189592Sbms __func__, ifp, ifp->if_xname); 687189592Sbms 688189592Sbms IGMP_LOCK_ASSERT(); 689189592Sbms 690189592Sbms LIST_FOREACH_SAFE(igi, &V_igi_head, igi_link, tigi) { 691189592Sbms if (igi->igi_ifp == ifp) { 692189592Sbms /* 693189592Sbms * Free deferred General Query responses. 694189592Sbms */ 695189592Sbms _IF_DRAIN(&igi->igi_gq); 696189592Sbms 697189592Sbms LIST_REMOVE(igi, igi_link); 698189592Sbms 699189592Sbms KASSERT(SLIST_EMPTY(&igi->igi_relinmhead), 700189592Sbms ("%s: there are dangling in_multi references", 701189592Sbms __func__)); 702189592Sbms 703189592Sbms free(igi, M_IGMP); 704189592Sbms return; 705189592Sbms } 706189592Sbms } 707189592Sbms 708189592Sbms#ifdef INVARIANTS 709189592Sbms panic("%s: igmp_ifinfo not found for ifp %p\n", __func__, ifp); 710189592Sbms#endif 711189592Sbms} 712189592Sbms 713189592Sbms/* 714189592Sbms * Process a received IGMPv1 query. 715189592Sbms * Return non-zero if the message should be dropped. 716189592Sbms * 717189592Sbms * VIMAGE: The curvnet pointer is derived from the input ifp. 718189592Sbms */ 719189592Sbmsstatic int 720189592Sbmsigmp_input_v1_query(struct ifnet *ifp, const struct ip *ip) 721189592Sbms{ 722183550Szec INIT_VNET_INET(ifp->if_vnet); 723189592Sbms struct ifmultiaddr *ifma; 724189592Sbms struct igmp_ifinfo *igi; 725189592Sbms struct in_multi *inm; 7262531Swollman 727189592Sbms /* 728189592Sbms * IGMPv1 General Queries SHOULD always addressed to 224.0.0.1. 729189592Sbms * igmp_group is always ignored. Do not drop it as a userland 730189592Sbms * daemon may wish to see it. 731189592Sbms */ 732189592Sbms if (!in_allhosts(ip->ip_dst)) { 733190965Srwatson IGMPSTAT_INC(igps_rcv_badqueries); 734189592Sbms return (0); 735189592Sbms } 736189592Sbms 737190965Srwatson IGMPSTAT_INC(igps_rcv_gen_queries); 738189592Sbms 739189592Sbms /* 740189592Sbms * Switch to IGMPv1 host compatibility mode. 741189592Sbms */ 742189592Sbms IN_MULTI_LOCK(); 743189592Sbms IGMP_LOCK(); 744189592Sbms 745189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 746189592Sbms KASSERT(igi != NULL, ("%s: no igmp_ifinfo for ifp %p", __func__, ifp)); 747189592Sbms 748189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 749189592Sbms CTR2(KTR_IGMPV3, "ignore v1 query on IGIF_LOOPBACK ifp %p(%s)", 750189592Sbms ifp, ifp->if_xname); 751189592Sbms goto out_locked; 752189592Sbms } 753189592Sbms 754189592Sbms igmp_set_version(igi, IGMP_VERSION_1); 755189592Sbms 756189592Sbms CTR2(KTR_IGMPV3, "process v1 query on ifp %p(%s)", ifp, ifp->if_xname); 757189592Sbms 758189592Sbms /* 759189592Sbms * Start the timers in all of our group records 760189592Sbms * for the interface on which the query arrived, 761189592Sbms * except those which are already running. 762189592Sbms */ 763189592Sbms IF_ADDR_LOCK(ifp); 764189592Sbms TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 765189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 766189931Sbms ifma->ifma_protospec == NULL) 767189592Sbms continue; 768189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 769189592Sbms if (inm->inm_timer != 0) 770189592Sbms continue; 771189592Sbms switch (inm->inm_state) { 772189592Sbms case IGMP_NOT_MEMBER: 773189592Sbms case IGMP_SILENT_MEMBER: 774189592Sbms break; 775189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 776189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 777189592Sbms case IGMP_REPORTING_MEMBER: 778189592Sbms case IGMP_IDLE_MEMBER: 779189592Sbms case IGMP_LAZY_MEMBER: 780189592Sbms case IGMP_SLEEPING_MEMBER: 781189592Sbms case IGMP_AWAKENING_MEMBER: 782189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 783189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY( 784189592Sbms IGMP_V1V2_MAX_RI * PR_FASTHZ); 785189592Sbms V_current_state_timers_running = 1; 786189592Sbms break; 787189592Sbms case IGMP_LEAVING_MEMBER: 788189592Sbms break; 789119181Srwatson } 790119181Srwatson } 791189592Sbms IF_ADDR_UNLOCK(ifp); 792189592Sbms 793189592Sbmsout_locked: 794189592Sbms IGMP_UNLOCK(); 795189592Sbms IN_MULTI_UNLOCK(); 796189592Sbms 797189592Sbms return (0); 798189592Sbms} 799189592Sbms 800189592Sbms/* 801189592Sbms * Process a received IGMPv2 general or group-specific query. 802189592Sbms */ 803189592Sbmsstatic int 804189592Sbmsigmp_input_v2_query(struct ifnet *ifp, const struct ip *ip, 805189592Sbms const struct igmp *igmp) 806189592Sbms{ 807191548Szec INIT_VNET_INET(ifp->if_vnet); 808189592Sbms struct ifmultiaddr *ifma; 809189592Sbms struct igmp_ifinfo *igi; 810189592Sbms struct in_multi *inm; 811189592Sbms uint16_t timer; 812189592Sbms 813189592Sbms /* 814189592Sbms * Perform lazy allocation of IGMP link info if required, 815189592Sbms * and switch to IGMPv2 host compatibility mode. 816189592Sbms */ 817189592Sbms IN_MULTI_LOCK(); 818189592Sbms IGMP_LOCK(); 819189592Sbms 820189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 821189592Sbms KASSERT(igi != NULL, ("%s: no igmp_ifinfo for ifp %p", __func__, ifp)); 822189592Sbms 823189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 824189592Sbms CTR2(KTR_IGMPV3, "ignore v2 query on IGIF_LOOPBACK ifp %p(%s)", 825189592Sbms ifp, ifp->if_xname); 826189592Sbms goto out_locked; 827144163Ssam } 828189592Sbms 829189592Sbms igmp_set_version(igi, IGMP_VERSION_2); 830189592Sbms 831189592Sbms timer = igmp->igmp_code * PR_FASTHZ / IGMP_TIMER_SCALE; 832189592Sbms if (timer == 0) 833189592Sbms timer = 1; 834189592Sbms 835189592Sbms if (!in_nullhost(igmp->igmp_group)) { 836189592Sbms /* 837189592Sbms * IGMPv2 Group-Specific Query. 838189592Sbms * If this is a group-specific IGMPv2 query, we need only 839189592Sbms * look up the single group to process it. 840189592Sbms */ 841189592Sbms inm = inm_lookup(ifp, igmp->igmp_group); 842189592Sbms if (inm != NULL) { 843189592Sbms CTR3(KTR_IGMPV3, "process v2 query %s on ifp %p(%s)", 844189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 845189592Sbms igmp_v2_update_group(inm, timer); 846189592Sbms } 847190965Srwatson IGMPSTAT_INC(igps_rcv_group_queries); 848189592Sbms } else { 849189592Sbms /* 850189592Sbms * IGMPv2 General Query. 851189592Sbms * If this was not sent to the all-hosts group, ignore it. 852189592Sbms */ 853189592Sbms if (in_allhosts(ip->ip_dst)) { 854189592Sbms /* 855189592Sbms * For each reporting group joined on this 856189592Sbms * interface, kick the report timer. 857189592Sbms */ 858189592Sbms CTR2(KTR_IGMPV3, 859189592Sbms "process v2 general query on ifp %p(%s)", 860189592Sbms ifp, ifp->if_xname); 861189592Sbms 862189592Sbms IF_ADDR_LOCK(ifp); 863189592Sbms TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 864189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 865189931Sbms ifma->ifma_protospec == NULL) 866189592Sbms continue; 867189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 868189592Sbms igmp_v2_update_group(inm, timer); 869189592Sbms } 870189592Sbms IF_ADDR_UNLOCK(ifp); 871189592Sbms } 872190965Srwatson IGMPSTAT_INC(igps_rcv_gen_queries); 873189592Sbms } 874189592Sbms 875189592Sbmsout_locked: 876189592Sbms IGMP_UNLOCK(); 877189592Sbms IN_MULTI_UNLOCK(); 878189592Sbms 879189592Sbms return (0); 8802531Swollman} 8812531Swollman 882189592Sbms/* 883189592Sbms * Update the report timer on a group in response to an IGMPv2 query. 884189592Sbms * 885189592Sbms * If we are becoming the reporting member for this group, start the timer. 886189592Sbms * If we already are the reporting member for this group, and timer is 887189592Sbms * below the threshold, reset it. 888189592Sbms * 889189592Sbms * We may be updating the group for the first time since we switched 890189592Sbms * to IGMPv3. If we are, then we must clear any recorded source lists, 891189592Sbms * and transition to REPORTING state; the group timer is overloaded 892189592Sbms * for group and group-source query responses. 893189592Sbms * 894189592Sbms * Unlike IGMPv3, the delay per group should be jittered 895189592Sbms * to avoid bursts of IGMPv2 reports. 896189592Sbms */ 897189592Sbmsstatic void 898189592Sbmsigmp_v2_update_group(struct in_multi *inm, const int timer) 899189592Sbms{ 900191548Szec INIT_VNET_INET(curvnet); 901189592Sbms 902189592Sbms CTR4(KTR_IGMPV3, "%s: %s/%s timer=%d", __func__, 903189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname, timer); 904189592Sbms 905189592Sbms IN_MULTI_LOCK_ASSERT(); 906189592Sbms 907189592Sbms switch (inm->inm_state) { 908189592Sbms case IGMP_NOT_MEMBER: 909189592Sbms case IGMP_SILENT_MEMBER: 910189592Sbms break; 911189592Sbms case IGMP_REPORTING_MEMBER: 912189592Sbms if (inm->inm_timer != 0 && 913189592Sbms inm->inm_timer <= timer) { 914189592Sbms CTR1(KTR_IGMPV3, "%s: REPORTING and timer running, " 915189592Sbms "skipping.", __func__); 916189592Sbms break; 917189592Sbms } 918189592Sbms /* FALLTHROUGH */ 919189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 920189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 921189592Sbms case IGMP_IDLE_MEMBER: 922189592Sbms case IGMP_LAZY_MEMBER: 923189592Sbms case IGMP_AWAKENING_MEMBER: 924189592Sbms CTR1(KTR_IGMPV3, "%s: ->REPORTING", __func__); 925189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 926189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY(timer); 927189592Sbms V_current_state_timers_running = 1; 928189592Sbms break; 929189592Sbms case IGMP_SLEEPING_MEMBER: 930189592Sbms CTR1(KTR_IGMPV3, "%s: ->AWAKENING", __func__); 931189592Sbms inm->inm_state = IGMP_AWAKENING_MEMBER; 932189592Sbms break; 933189592Sbms case IGMP_LEAVING_MEMBER: 934189592Sbms break; 935189592Sbms } 936189592Sbms} 937189592Sbms 938189592Sbms/* 939189592Sbms * Process a received IGMPv3 general, group-specific or 940189592Sbms * group-and-source-specific query. 941189592Sbms * Assumes m has already been pulled up to the full IGMP message length. 942189592Sbms * Return 0 if successful, otherwise an appropriate error code is returned. 943189592Sbms */ 944189592Sbmsstatic int 945189592Sbmsigmp_input_v3_query(struct ifnet *ifp, const struct ip *ip, 946189592Sbms /*const*/ struct igmpv3 *igmpv3) 947189592Sbms{ 948191548Szec INIT_VNET_INET(ifp->if_vnet); 949189592Sbms struct igmp_ifinfo *igi; 950189592Sbms struct in_multi *inm; 951189592Sbms uint32_t maxresp, nsrc, qqi; 952189592Sbms uint16_t timer; 953189592Sbms uint8_t qrv; 954189592Sbms 955189592Sbms CTR2(KTR_IGMPV3, "process v3 query on ifp %p(%s)", ifp, ifp->if_xname); 956189592Sbms 957189592Sbms maxresp = igmpv3->igmp_code; /* in 1/10ths of a second */ 958189592Sbms if (maxresp >= 128) { 959189592Sbms maxresp = IGMP_MANT(igmpv3->igmp_code) << 960189592Sbms (IGMP_EXP(igmpv3->igmp_code) + 3); 961189592Sbms } 962189592Sbms 963189592Sbms /* 964189592Sbms * Robustness must never be less than 2 for on-wire IGMPv3. 965189592Sbms * FIXME: Check if ifp has IGIF_LOOPBACK set, as we make 966189592Sbms * an exception for interfaces whose IGMPv3 state changes 967189592Sbms * are redirected to loopback (e.g. MANET). 968189592Sbms */ 969189592Sbms qrv = IGMP_QRV(igmpv3->igmp_misc); 970189592Sbms if (qrv < 2) { 971189592Sbms CTR3(KTR_IGMPV3, "%s: clamping qrv %d to %d", __func__, 972189592Sbms qrv, IGMP_RV_INIT); 973189592Sbms qrv = IGMP_RV_INIT; 974189592Sbms } 975189592Sbms 976189592Sbms qqi = igmpv3->igmp_qqi; 977189592Sbms if (qqi >= 128) { 978190691Sbms qqi = IGMP_MANT(igmpv3->igmp_qqi) << 979190691Sbms (IGMP_EXP(igmpv3->igmp_qqi) + 3); 980189592Sbms } 981189592Sbms 982189592Sbms timer = maxresp * PR_FASTHZ / IGMP_TIMER_SCALE; 983189592Sbms if (timer == 0) 984189592Sbms timer = 1; 985189592Sbms 986189592Sbms nsrc = ntohs(igmpv3->igmp_numsrc); 987189592Sbms 988189592Sbms IN_MULTI_LOCK(); 989189592Sbms IGMP_LOCK(); 990189592Sbms 991189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 992189592Sbms KASSERT(igi != NULL, ("%s: no igmp_ifinfo for ifp %p", __func__, ifp)); 993189592Sbms 994189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 995189592Sbms CTR2(KTR_IGMPV3, "ignore v3 query on IGIF_LOOPBACK ifp %p(%s)", 996189592Sbms ifp, ifp->if_xname); 997189592Sbms goto out_locked; 998189592Sbms } 999189592Sbms 1000189592Sbms igmp_set_version(igi, IGMP_VERSION_3); 1001189592Sbms 1002189592Sbms igi->igi_rv = qrv; 1003189592Sbms igi->igi_qi = qqi; 1004189592Sbms igi->igi_qri = maxresp; 1005189592Sbms 1006189592Sbms CTR4(KTR_IGMPV3, "%s: qrv %d qi %d qri %d", __func__, qrv, qqi, 1007189592Sbms maxresp); 1008189592Sbms 1009189592Sbms if (in_nullhost(igmpv3->igmp_group)) { 1010189592Sbms /* 1011189592Sbms * IGMPv3 General Query. 1012189592Sbms * Schedule a current-state report on this ifp for 1013189592Sbms * all groups, possibly containing source lists. 1014189592Sbms */ 1015190965Srwatson IGMPSTAT_INC(igps_rcv_gen_queries); 1016189592Sbms 1017189592Sbms if (!in_allhosts(ip->ip_dst) || nsrc > 0) { 1018189592Sbms /* 1019189592Sbms * General Queries SHOULD be directed to 224.0.0.1. 1020189592Sbms * A general query with a source list has undefined 1021189592Sbms * behaviour; discard it. 1022189592Sbms */ 1023190965Srwatson IGMPSTAT_INC(igps_rcv_badqueries); 1024189592Sbms goto out_locked; 1025189592Sbms } 1026189592Sbms 1027189592Sbms CTR2(KTR_IGMPV3, "process v3 general query on ifp %p(%s)", 1028189592Sbms ifp, ifp->if_xname); 1029189592Sbms 1030189592Sbms /* 1031189592Sbms * If there is a pending General Query response 1032189592Sbms * scheduled earlier than the selected delay, do 1033189592Sbms * not schedule any other reports. 1034189592Sbms * Otherwise, reset the interface timer. 1035189592Sbms */ 1036189592Sbms if (igi->igi_v3_timer == 0 || igi->igi_v3_timer >= timer) { 1037189592Sbms igi->igi_v3_timer = IGMP_RANDOM_DELAY(timer); 1038189592Sbms V_interface_timers_running = 1; 1039189592Sbms } 1040189592Sbms } else { 1041189592Sbms /* 1042189592Sbms * IGMPv3 Group-specific or Group-and-source-specific Query. 1043189592Sbms * 1044189592Sbms * Group-source-specific queries are throttled on 1045189592Sbms * a per-group basis to defeat denial-of-service attempts. 1046189592Sbms * Queries for groups we are not a member of on this 1047189592Sbms * link are simply ignored. 1048189592Sbms */ 1049189592Sbms inm = inm_lookup(ifp, igmpv3->igmp_group); 1050189592Sbms if (inm == NULL) 1051189592Sbms goto out_locked; 1052189592Sbms if (nsrc > 0) { 1053190965Srwatson IGMPSTAT_INC(igps_rcv_gsr_queries); 1054189592Sbms if (!ratecheck(&inm->inm_lastgsrtv, 1055189592Sbms &V_igmp_gsrdelay)) { 1056189592Sbms CTR1(KTR_IGMPV3, "%s: GS query throttled.", 1057189592Sbms __func__); 1058190965Srwatson IGMPSTAT_INC(igps_drop_gsr_queries); 1059189592Sbms goto out_locked; 1060189592Sbms } 1061189592Sbms } else { 1062190965Srwatson IGMPSTAT_INC(igps_rcv_group_queries); 1063189592Sbms } 1064189592Sbms CTR3(KTR_IGMPV3, "process v3 %s query on ifp %p(%s)", 1065189592Sbms inet_ntoa(igmpv3->igmp_group), ifp, ifp->if_xname); 1066189592Sbms /* 1067189592Sbms * If there is a pending General Query response 1068189592Sbms * scheduled sooner than the selected delay, no 1069189592Sbms * further report need be scheduled. 1070189592Sbms * Otherwise, prepare to respond to the 1071189592Sbms * group-specific or group-and-source query. 1072189592Sbms */ 1073189592Sbms if (igi->igi_v3_timer == 0 || igi->igi_v3_timer >= timer) 1074189592Sbms igmp_input_v3_group_query(inm, igi, timer, igmpv3); 1075189592Sbms } 1076189592Sbms 1077189592Sbmsout_locked: 1078189592Sbms IGMP_UNLOCK(); 1079189592Sbms IN_MULTI_UNLOCK(); 1080189592Sbms 1081189592Sbms return (0); 1082189592Sbms} 1083189592Sbms 1084189592Sbms/* 1085189592Sbms * Process a recieved IGMPv3 group-specific or group-and-source-specific 1086189592Sbms * query. 1087189592Sbms * Return <0 if any error occured. Currently this is ignored. 1088189592Sbms */ 1089189592Sbmsstatic int 1090189592Sbmsigmp_input_v3_group_query(struct in_multi *inm, struct igmp_ifinfo *igi, 1091189592Sbms int timer, /*const*/ struct igmpv3 *igmpv3) 1092189592Sbms{ 1093191548Szec INIT_VNET_INET(curvnet); 1094189592Sbms int retval; 1095189592Sbms uint16_t nsrc; 1096189592Sbms 1097189592Sbms IN_MULTI_LOCK_ASSERT(); 1098189592Sbms IGMP_LOCK_ASSERT(); 1099189592Sbms 1100189592Sbms retval = 0; 1101189592Sbms 1102189592Sbms switch (inm->inm_state) { 1103189592Sbms case IGMP_NOT_MEMBER: 1104189592Sbms case IGMP_SILENT_MEMBER: 1105189592Sbms case IGMP_SLEEPING_MEMBER: 1106189592Sbms case IGMP_LAZY_MEMBER: 1107189592Sbms case IGMP_AWAKENING_MEMBER: 1108189592Sbms case IGMP_IDLE_MEMBER: 1109189592Sbms case IGMP_LEAVING_MEMBER: 1110189592Sbms return (retval); 1111189592Sbms break; 1112189592Sbms case IGMP_REPORTING_MEMBER: 1113189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1114189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1115189592Sbms break; 1116189592Sbms } 1117189592Sbms 1118189592Sbms nsrc = ntohs(igmpv3->igmp_numsrc); 1119189592Sbms 1120191816Szec if (!IS_DEFAULT_VNET(curvnet)) 1121191816Szec return (retval); 1122191816Szec 1123189592Sbms /* 1124189592Sbms * Deal with group-specific queries upfront. 1125189592Sbms * If any group query is already pending, purge any recorded 1126189592Sbms * source-list state if it exists, and schedule a query response 1127189592Sbms * for this group-specific query. 1128189592Sbms */ 1129189592Sbms if (nsrc == 0) { 1130189592Sbms if (inm->inm_state == IGMP_G_QUERY_PENDING_MEMBER || 1131189592Sbms inm->inm_state == IGMP_SG_QUERY_PENDING_MEMBER) { 1132189592Sbms inm_clear_recorded(inm); 1133189592Sbms timer = min(inm->inm_timer, timer); 1134189592Sbms } 1135189592Sbms inm->inm_state = IGMP_G_QUERY_PENDING_MEMBER; 1136189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY(timer); 1137189592Sbms V_current_state_timers_running = 1; 1138189592Sbms return (retval); 1139189592Sbms } 1140189592Sbms 1141189592Sbms /* 1142189592Sbms * Deal with the case where a group-and-source-specific query has 1143189592Sbms * been received but a group-specific query is already pending. 1144189592Sbms */ 1145189592Sbms if (inm->inm_state == IGMP_G_QUERY_PENDING_MEMBER) { 1146189592Sbms timer = min(inm->inm_timer, timer); 1147189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY(timer); 1148189592Sbms V_current_state_timers_running = 1; 1149189592Sbms return (retval); 1150189592Sbms } 1151189592Sbms 1152189592Sbms /* 1153189592Sbms * Finally, deal with the case where a group-and-source-specific 1154189592Sbms * query has been received, where a response to a previous g-s-r 1155189592Sbms * query exists, or none exists. 1156189592Sbms * In this case, we need to parse the source-list which the Querier 1157189592Sbms * has provided us with and check if we have any source list filter 1158189592Sbms * entries at T1 for these sources. If we do not, there is no need 1159189592Sbms * schedule a report and the query may be dropped. 1160189592Sbms * If we do, we must record them and schedule a current-state 1161189592Sbms * report for those sources. 1162189592Sbms * FIXME: Handling source lists larger than 1 mbuf requires that 1163189592Sbms * we pass the mbuf chain pointer down to this function, and use 1164189592Sbms * m_getptr() to walk the chain. 1165189592Sbms */ 1166189592Sbms if (inm->inm_nsrc > 0) { 1167189592Sbms const struct in_addr *ap; 1168189592Sbms int i, nrecorded; 1169189592Sbms 1170189592Sbms ap = (const struct in_addr *)(igmpv3 + 1); 1171189592Sbms nrecorded = 0; 1172189592Sbms for (i = 0; i < nsrc; i++, ap++) { 1173189592Sbms retval = inm_record_source(inm, ap->s_addr); 1174189592Sbms if (retval < 0) 1175189592Sbms break; 1176189592Sbms nrecorded += retval; 1177189592Sbms } 1178189592Sbms if (nrecorded > 0) { 1179189592Sbms CTR1(KTR_IGMPV3, 1180189592Sbms "%s: schedule response to SG query", __func__); 1181189592Sbms inm->inm_state = IGMP_SG_QUERY_PENDING_MEMBER; 1182189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY(timer); 1183189592Sbms V_current_state_timers_running = 1; 1184189592Sbms } 1185189592Sbms } 1186189592Sbms 1187189592Sbms return (retval); 1188189592Sbms} 1189189592Sbms 1190189592Sbms/* 1191189592Sbms * Process a received IGMPv1 host membership report. 1192189592Sbms * 1193189592Sbms * NOTE: 0.0.0.0 workaround breaks const correctness. 1194189592Sbms */ 1195189592Sbmsstatic int 1196189592Sbmsigmp_input_v1_report(struct ifnet *ifp, /*const*/ struct ip *ip, 1197189592Sbms /*const*/ struct igmp *igmp) 1198189592Sbms{ 1199191548Szec INIT_VNET_INET(ifp->if_vnet); 1200189592Sbms struct in_ifaddr *ia; 1201189592Sbms struct in_multi *inm; 1202189592Sbms 1203190965Srwatson IGMPSTAT_INC(igps_rcv_reports); 1204189592Sbms 1205189592Sbms if (ifp->if_flags & IFF_LOOPBACK) 1206189592Sbms return (0); 1207189592Sbms 1208189592Sbms if (!IN_MULTICAST(ntohl(igmp->igmp_group.s_addr) || 1209189592Sbms !in_hosteq(igmp->igmp_group, ip->ip_dst))) { 1210190965Srwatson IGMPSTAT_INC(igps_rcv_badreports); 1211189592Sbms return (EINVAL); 1212189592Sbms } 1213189592Sbms 1214189592Sbms /* 1215189592Sbms * RFC 3376, Section 4.2.13, 9.2, 9.3: 1216189592Sbms * Booting clients may use the source address 0.0.0.0. Some 1217189592Sbms * IGMP daemons may not know how to use IP_RECVIF to determine 1218189592Sbms * the interface upon which this message was received. 1219189592Sbms * Replace 0.0.0.0 with the subnet address if told to do so. 1220189592Sbms */ 1221189592Sbms if (V_igmp_recvifkludge && in_nullhost(ip->ip_src)) { 1222189592Sbms IFP_TO_IA(ifp, ia); 1223189592Sbms if (ia != NULL) 1224189592Sbms ip->ip_src.s_addr = htonl(ia->ia_subnet); 1225189592Sbms } 1226189592Sbms 1227189592Sbms CTR3(KTR_IGMPV3, "process v1 report %s on ifp %p(%s)", 1228189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1229189592Sbms 1230189592Sbms /* 1231189592Sbms * IGMPv1 report suppression. 1232189592Sbms * If we are a member of this group, and our membership should be 1233189592Sbms * reported, stop our group timer and transition to the 'lazy' state. 1234189592Sbms */ 1235189592Sbms IN_MULTI_LOCK(); 1236189592Sbms inm = inm_lookup(ifp, igmp->igmp_group); 1237189592Sbms if (inm != NULL) { 1238189592Sbms struct igmp_ifinfo *igi; 1239189592Sbms 1240189592Sbms igi = inm->inm_igi; 1241189592Sbms if (igi == NULL) { 1242189592Sbms KASSERT(igi != NULL, 1243189592Sbms ("%s: no igi for ifp %p", __func__, ifp)); 1244189592Sbms goto out_locked; 1245189592Sbms } 1246189592Sbms 1247190965Srwatson IGMPSTAT_INC(igps_rcv_ourreports); 1248189592Sbms 1249189592Sbms /* 1250189592Sbms * If we are in IGMPv3 host mode, do not allow the 1251189592Sbms * other host's IGMPv1 report to suppress our reports 1252189592Sbms * unless explicitly configured to do so. 1253189592Sbms */ 1254189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 1255189592Sbms if (V_igmp_legacysupp) 1256189592Sbms igmp_v3_suppress_group_record(inm); 1257189592Sbms goto out_locked; 1258189592Sbms } 1259189592Sbms 1260189592Sbms inm->inm_timer = 0; 1261189592Sbms 1262189592Sbms switch (inm->inm_state) { 1263189592Sbms case IGMP_NOT_MEMBER: 1264189592Sbms case IGMP_SILENT_MEMBER: 1265189592Sbms break; 1266189592Sbms case IGMP_IDLE_MEMBER: 1267189592Sbms case IGMP_LAZY_MEMBER: 1268189592Sbms case IGMP_AWAKENING_MEMBER: 1269189592Sbms CTR3(KTR_IGMPV3, 1270189592Sbms "report suppressed for %s on ifp %p(%s)", 1271189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1272189592Sbms case IGMP_SLEEPING_MEMBER: 1273189592Sbms inm->inm_state = IGMP_SLEEPING_MEMBER; 1274189592Sbms break; 1275189592Sbms case IGMP_REPORTING_MEMBER: 1276189592Sbms CTR3(KTR_IGMPV3, 1277189592Sbms "report suppressed for %s on ifp %p(%s)", 1278189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1279189592Sbms if (igi->igi_version == IGMP_VERSION_1) 1280189592Sbms inm->inm_state = IGMP_LAZY_MEMBER; 1281189592Sbms else if (igi->igi_version == IGMP_VERSION_2) 1282189592Sbms inm->inm_state = IGMP_SLEEPING_MEMBER; 1283189592Sbms break; 1284189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1285189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1286189592Sbms case IGMP_LEAVING_MEMBER: 1287189592Sbms break; 1288189592Sbms } 1289189592Sbms } 1290189592Sbms 1291189592Sbmsout_locked: 1292189592Sbms IN_MULTI_UNLOCK(); 1293189592Sbms 1294189592Sbms return (0); 1295189592Sbms} 1296189592Sbms 1297189592Sbms/* 1298189592Sbms * Process a received IGMPv2 host membership report. 1299189592Sbms * 1300189592Sbms * NOTE: 0.0.0.0 workaround breaks const correctness. 1301189592Sbms */ 1302189592Sbmsstatic int 1303189592Sbmsigmp_input_v2_report(struct ifnet *ifp, /*const*/ struct ip *ip, 1304189592Sbms /*const*/ struct igmp *igmp) 1305189592Sbms{ 1306191548Szec INIT_VNET_INET(ifp->if_vnet); 1307189592Sbms struct in_ifaddr *ia; 1308189592Sbms struct in_multi *inm; 1309189592Sbms 1310189592Sbms /* 1311189592Sbms * Make sure we don't hear our own membership report. Fast 1312189592Sbms * leave requires knowing that we are the only member of a 1313189592Sbms * group. 1314189592Sbms */ 1315189592Sbms IFP_TO_IA(ifp, ia); 1316189592Sbms if (ia != NULL && in_hosteq(ip->ip_src, IA_SIN(ia)->sin_addr)) 1317189592Sbms return (0); 1318189592Sbms 1319190965Srwatson IGMPSTAT_INC(igps_rcv_reports); 1320189592Sbms 1321189592Sbms if (ifp->if_flags & IFF_LOOPBACK) 1322189592Sbms return (0); 1323189592Sbms 1324189592Sbms if (!IN_MULTICAST(ntohl(igmp->igmp_group.s_addr)) || 1325189592Sbms !in_hosteq(igmp->igmp_group, ip->ip_dst)) { 1326190965Srwatson IGMPSTAT_INC(igps_rcv_badreports); 1327189592Sbms return (EINVAL); 1328189592Sbms } 1329189592Sbms 1330189592Sbms /* 1331189592Sbms * RFC 3376, Section 4.2.13, 9.2, 9.3: 1332189592Sbms * Booting clients may use the source address 0.0.0.0. Some 1333189592Sbms * IGMP daemons may not know how to use IP_RECVIF to determine 1334189592Sbms * the interface upon which this message was received. 1335189592Sbms * Replace 0.0.0.0 with the subnet address if told to do so. 1336189592Sbms */ 1337189592Sbms if (V_igmp_recvifkludge && in_nullhost(ip->ip_src)) { 1338189592Sbms if (ia != NULL) 1339189592Sbms ip->ip_src.s_addr = htonl(ia->ia_subnet); 1340189592Sbms } 1341189592Sbms 1342189592Sbms CTR3(KTR_IGMPV3, "process v2 report %s on ifp %p(%s)", 1343189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1344189592Sbms 1345189592Sbms /* 1346189592Sbms * IGMPv2 report suppression. 1347189592Sbms * If we are a member of this group, and our membership should be 1348189592Sbms * reported, and our group timer is pending or about to be reset, 1349189592Sbms * stop our group timer by transitioning to the 'lazy' state. 1350189592Sbms */ 1351189592Sbms IN_MULTI_LOCK(); 1352189592Sbms inm = inm_lookup(ifp, igmp->igmp_group); 1353189592Sbms if (inm != NULL) { 1354189592Sbms struct igmp_ifinfo *igi; 1355189592Sbms 1356189592Sbms igi = inm->inm_igi; 1357189592Sbms KASSERT(igi != NULL, ("%s: no igi for ifp %p", __func__, ifp)); 1358189592Sbms 1359190965Srwatson IGMPSTAT_INC(igps_rcv_ourreports); 1360189592Sbms 1361189592Sbms /* 1362189592Sbms * If we are in IGMPv3 host mode, do not allow the 1363189592Sbms * other host's IGMPv1 report to suppress our reports 1364189592Sbms * unless explicitly configured to do so. 1365189592Sbms */ 1366189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 1367189592Sbms if (V_igmp_legacysupp) 1368189592Sbms igmp_v3_suppress_group_record(inm); 1369189592Sbms goto out_locked; 1370189592Sbms } 1371189592Sbms 1372189592Sbms inm->inm_timer = 0; 1373189592Sbms 1374189592Sbms switch (inm->inm_state) { 1375189592Sbms case IGMP_NOT_MEMBER: 1376189592Sbms case IGMP_SILENT_MEMBER: 1377189592Sbms case IGMP_SLEEPING_MEMBER: 1378189592Sbms break; 1379189592Sbms case IGMP_REPORTING_MEMBER: 1380189592Sbms case IGMP_IDLE_MEMBER: 1381189592Sbms case IGMP_AWAKENING_MEMBER: 1382189592Sbms CTR3(KTR_IGMPV3, 1383189592Sbms "report suppressed for %s on ifp %p(%s)", 1384189592Sbms inet_ntoa(igmp->igmp_group), ifp, ifp->if_xname); 1385189592Sbms case IGMP_LAZY_MEMBER: 1386189592Sbms inm->inm_state = IGMP_LAZY_MEMBER; 1387189592Sbms break; 1388189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1389189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1390189592Sbms case IGMP_LEAVING_MEMBER: 1391189592Sbms break; 1392189592Sbms } 1393189592Sbms } 1394189592Sbms 1395189592Sbmsout_locked: 1396189592Sbms IN_MULTI_UNLOCK(); 1397189592Sbms 1398189592Sbms return (0); 1399189592Sbms} 1400189592Sbms 14011541Srgrimesvoid 1402189592Sbmsigmp_input(struct mbuf *m, int off) 14031541Srgrimes{ 1404189592Sbms int iphlen; 1405189592Sbms struct ifnet *ifp; 1406189592Sbms struct igmp *igmp; 1407189592Sbms struct ip *ip; 1408189592Sbms int igmplen; 1409189592Sbms int minlen; 1410189592Sbms int queryver; 1411189592Sbms 1412189592Sbms CTR3(KTR_IGMPV3, "%s: called w/mbuf (%p,%d)", __func__, m, off); 1413189592Sbms 1414189592Sbms ifp = m->m_pkthdr.rcvif; 1415183550Szec INIT_VNET_INET(ifp->if_vnet); 14161541Srgrimes 1417190965Srwatson IGMPSTAT_INC(igps_rcv_total); 14181541Srgrimes 14191541Srgrimes ip = mtod(m, struct ip *); 1420189592Sbms iphlen = off; 14211541Srgrimes igmplen = ip->ip_len; 14221541Srgrimes 14231541Srgrimes /* 1424164863Srwatson * Validate lengths. 14251541Srgrimes */ 14261541Srgrimes if (igmplen < IGMP_MINLEN) { 1427190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 14281541Srgrimes m_freem(m); 14291541Srgrimes return; 14301541Srgrimes } 1431189592Sbms 1432189592Sbms /* 1433189592Sbms * Always pullup to the minimum size for v1/v2 or v3 1434189592Sbms * to amortize calls to m_pullup(). 1435189592Sbms */ 1436189592Sbms minlen = iphlen; 1437189592Sbms if (igmplen >= IGMP_V3_QUERY_MINLEN) 1438189592Sbms minlen += IGMP_V3_QUERY_MINLEN; 1439189592Sbms else 1440189592Sbms minlen += IGMP_MINLEN; 14411541Srgrimes if ((m->m_flags & M_EXT || m->m_len < minlen) && 14421541Srgrimes (m = m_pullup(m, minlen)) == 0) { 1443190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 14441541Srgrimes return; 14451541Srgrimes } 1446189592Sbms ip = mtod(m, struct ip *); 14471541Srgrimes 1448189592Sbms if (ip->ip_ttl != 1) { 1449190965Srwatson IGMPSTAT_INC(igps_rcv_badttl); 1450189592Sbms m_freem(m); 1451189592Sbms return; 1452189592Sbms } 1453189592Sbms 14541541Srgrimes /* 1455164863Srwatson * Validate checksum. 14561541Srgrimes */ 14571541Srgrimes m->m_data += iphlen; 14581541Srgrimes m->m_len -= iphlen; 14591541Srgrimes igmp = mtod(m, struct igmp *); 14601541Srgrimes if (in_cksum(m, igmplen)) { 1461190965Srwatson IGMPSTAT_INC(igps_rcv_badsum); 14621541Srgrimes m_freem(m); 14631541Srgrimes return; 14641541Srgrimes } 14651541Srgrimes m->m_data -= iphlen; 14661541Srgrimes m->m_len += iphlen; 14672531Swollman 14681541Srgrimes switch (igmp->igmp_type) { 1469189592Sbms case IGMP_HOST_MEMBERSHIP_QUERY: 1470189592Sbms if (igmplen == IGMP_MINLEN) { 1471189592Sbms if (igmp->igmp_code == 0) 1472189592Sbms queryver = IGMP_VERSION_1; 1473189592Sbms else 1474189592Sbms queryver = IGMP_VERSION_2; 1475189592Sbms } else if (igmplen >= IGMP_V3_QUERY_MINLEN) { 1476189592Sbms queryver = IGMP_VERSION_3; 1477189592Sbms } else { 1478190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 1479189592Sbms m_freem(m); 1480189592Sbms return; 1481189592Sbms } 14821541Srgrimes 1483189592Sbms switch (queryver) { 1484189592Sbms case IGMP_VERSION_1: 1485190965Srwatson IGMPSTAT_INC(igps_rcv_v1v2_queries); 1486189592Sbms if (!V_igmp_v1enable) 1487189592Sbms break; 1488189592Sbms if (igmp_input_v1_query(ifp, ip) != 0) { 1489144163Ssam m_freem(m); 1490144163Ssam return; 1491144163Ssam } 1492189592Sbms break; 14934028Spst 1494189592Sbms case IGMP_VERSION_2: 1495190965Srwatson IGMPSTAT_INC(igps_rcv_v1v2_queries); 1496189592Sbms if (!V_igmp_v2enable) 1497189592Sbms break; 1498189592Sbms if (igmp_input_v2_query(ifp, ip, igmp) != 0) { 14992531Swollman m_freem(m); 15002531Swollman return; 15012531Swollman } 1502189592Sbms break; 15032531Swollman 1504189592Sbms case IGMP_VERSION_3: { 1505189592Sbms struct igmpv3 *igmpv3; 1506189592Sbms uint16_t igmpv3len; 1507189592Sbms uint16_t srclen; 1508189592Sbms int nsrc; 1509189592Sbms 1510190965Srwatson IGMPSTAT_INC(igps_rcv_v3_queries); 1511189592Sbms igmpv3 = (struct igmpv3 *)igmp; 1512189592Sbms /* 1513189592Sbms * Validate length based on source count. 1514189592Sbms */ 1515189592Sbms nsrc = ntohs(igmpv3->igmp_numsrc); 1516189592Sbms srclen = sizeof(struct in_addr) * nsrc; 1517189592Sbms if (nsrc * sizeof(in_addr_t) > srclen) { 1518190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 1519189592Sbms return; 15202531Swollman } 1521189592Sbms /* 1522189592Sbms * m_pullup() may modify m, so pullup in 1523189592Sbms * this scope. 1524189592Sbms */ 1525189592Sbms igmpv3len = iphlen + IGMP_V3_QUERY_MINLEN + 1526189592Sbms srclen; 1527189592Sbms if ((m->m_flags & M_EXT || 1528189592Sbms m->m_len < igmpv3len) && 1529189592Sbms (m = m_pullup(m, igmpv3len)) == NULL) { 1530190965Srwatson IGMPSTAT_INC(igps_rcv_tooshort); 1531189592Sbms return; 1532189592Sbms } 1533189592Sbms igmpv3 = (struct igmpv3 *)(mtod(m, uint8_t *) 1534189592Sbms + iphlen); 1535189592Sbms if (igmp_input_v3_query(ifp, ip, igmpv3) != 0) { 1536189592Sbms m_freem(m); 1537189592Sbms return; 1538189592Sbms } 15391541Srgrimes } 1540189592Sbms break; 15411541Srgrimes } 15421541Srgrimes break; 15431541Srgrimes 1544189592Sbms case IGMP_v1_HOST_MEMBERSHIP_REPORT: 1545189592Sbms if (!V_igmp_v1enable) 154614622Sfenner break; 1547189592Sbms if (igmp_input_v1_report(ifp, ip, igmp) != 0) { 1548189592Sbms m_freem(m); 1549189592Sbms return; 1550189592Sbms } 1551189592Sbms break; 155214622Sfenner 1553189592Sbms case IGMP_v2_HOST_MEMBERSHIP_REPORT: 1554189592Sbms if (!V_igmp_v2enable) 15551541Srgrimes break; 1556189592Sbms if (!ip_checkrouteralert(m)) 1557190965Srwatson IGMPSTAT_INC(igps_rcv_nora); 1558189592Sbms if (igmp_input_v2_report(ifp, ip, igmp) != 0) { 15591541Srgrimes m_freem(m); 15601541Srgrimes return; 15611541Srgrimes } 1562189592Sbms break; 15631541Srgrimes 1564189592Sbms case IGMP_v3_HOST_MEMBERSHIP_REPORT: 15651541Srgrimes /* 1566189592Sbms * Hosts do not need to process IGMPv3 membership reports, 1567189592Sbms * as report suppression is no longer required. 15681541Srgrimes */ 1569189592Sbms if (!ip_checkrouteralert(m)) 1570190965Srwatson IGMPSTAT_INC(igps_rcv_nora); 1571189592Sbms break; 15721541Srgrimes 1573189592Sbms default: 15741541Srgrimes break; 15751541Srgrimes } 15761541Srgrimes 15771541Srgrimes /* 1578164863Srwatson * Pass all valid IGMP packets up to any process(es) listening on a 1579164863Srwatson * raw IGMP socket. 15801541Srgrimes */ 158182890Sjulian rip_input(m, off); 15821541Srgrimes} 15831541Srgrimes 1584189592Sbms 1585189592Sbms/* 1586189592Sbms * Fast timeout handler (global). 1587189592Sbms * VIMAGE: Timeout handlers are expected to service all vimages. 1588189592Sbms */ 15891541Srgrimesvoid 1590189592Sbmsigmp_fasttimo(void) 15911541Srgrimes{ 1592189592Sbms VNET_ITERATOR_DECL(vnet_iter); 15931541Srgrimes 1594189592Sbms VNET_LIST_RLOCK(); 1595189592Sbms VNET_FOREACH(vnet_iter) { 1596189592Sbms CURVNET_SET(vnet_iter); 1597189592Sbms igmp_fasttimo_vnet(); 1598189592Sbms CURVNET_RESTORE(); 1599189592Sbms } 1600189592Sbms VNET_LIST_RUNLOCK(); 1601189592Sbms} 1602189592Sbms 1603189592Sbms/* 1604189592Sbms * Fast timeout handler (per-vnet). 1605189592Sbms * Sends are shuffled off to a netisr to deal with Giant. 1606189592Sbms * 1607189592Sbms * VIMAGE: Assume caller has set up our curvnet. 1608189592Sbms */ 1609189592Sbmsstatic void 1610189592Sbmsigmp_fasttimo_vnet(void) 1611189592Sbms{ 1612191548Szec INIT_VNET_INET(curvnet); 1613189592Sbms struct ifqueue scq; /* State-change packets */ 1614189592Sbms struct ifqueue qrq; /* Query response packets */ 1615189592Sbms struct ifnet *ifp; 1616189592Sbms struct igmp_ifinfo *igi; 1617189592Sbms struct ifmultiaddr *ifma, *tifma; 1618189592Sbms struct in_multi *inm; 1619189592Sbms int loop, uri_fasthz; 1620189592Sbms 1621189592Sbms loop = 0; 1622189592Sbms uri_fasthz = 0; 1623189592Sbms 1624189592Sbms /* 1625189592Sbms * Quick check to see if any work needs to be done, in order to 1626189592Sbms * minimize the overhead of fasttimo processing. 1627189592Sbms * SMPng: XXX Unlocked reads. 1628189592Sbms */ 1629189592Sbms if (!V_current_state_timers_running && 1630189592Sbms !V_interface_timers_running && 1631189592Sbms !V_state_change_timers_running) 1632189592Sbms return; 1633189592Sbms 1634189592Sbms IN_MULTI_LOCK(); 1635189592Sbms IGMP_LOCK(); 1636189592Sbms 1637189592Sbms /* 1638189592Sbms * IGMPv3 General Query response timer processing. 1639189592Sbms */ 1640189592Sbms if (V_interface_timers_running) { 1641189592Sbms CTR1(KTR_IGMPV3, "%s: interface timers running", __func__); 1642189592Sbms 1643189592Sbms V_interface_timers_running = 0; 1644189592Sbms LIST_FOREACH(igi, &V_igi_head, igi_link) { 1645189592Sbms if (igi->igi_v3_timer == 0) { 1646189592Sbms /* Do nothing. */ 1647189592Sbms } else if (--igi->igi_v3_timer == 0) { 1648189592Sbms igmp_v3_dispatch_general_query(igi); 1649189592Sbms } else { 1650189592Sbms V_interface_timers_running = 1; 1651189592Sbms } 1652189592Sbms } 1653189592Sbms } 1654189592Sbms 1655189592Sbms if (!V_current_state_timers_running && 1656189592Sbms !V_state_change_timers_running) 1657189592Sbms goto out_locked; 1658189592Sbms 1659189592Sbms V_current_state_timers_running = 0; 1660189592Sbms V_state_change_timers_running = 0; 1661189592Sbms 1662189592Sbms CTR1(KTR_IGMPV3, "%s: state change timers running", __func__); 1663189592Sbms 1664189592Sbms /* 1665189592Sbms * IGMPv1/v2/v3 host report and state-change timer processing. 1666189592Sbms * Note: Processing a v3 group timer may remove a node. 1667189592Sbms */ 1668189592Sbms LIST_FOREACH(igi, &V_igi_head, igi_link) { 1669189592Sbms ifp = igi->igi_ifp; 1670189592Sbms 1671189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 1672189592Sbms loop = (igi->igi_flags & IGIF_LOOPBACK) ? 1 : 0; 1673189592Sbms uri_fasthz = IGMP_RANDOM_DELAY(igi->igi_uri * 1674189592Sbms PR_FASTHZ); 1675189592Sbms 1676189592Sbms memset(&qrq, 0, sizeof(struct ifqueue)); 1677189592Sbms IFQ_SET_MAXLEN(&qrq, IGMP_MAX_G_GS_PACKETS); 1678189592Sbms 1679189592Sbms memset(&scq, 0, sizeof(struct ifqueue)); 1680189592Sbms IFQ_SET_MAXLEN(&scq, IGMP_MAX_STATE_CHANGE_PACKETS); 1681189592Sbms } 1682189592Sbms 1683189592Sbms IF_ADDR_LOCK(ifp); 1684189592Sbms TAILQ_FOREACH_SAFE(ifma, &ifp->if_multiaddrs, ifma_link, 1685189592Sbms tifma) { 1686189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 1687189931Sbms ifma->ifma_protospec == NULL) 1688189592Sbms continue; 1689189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 1690189592Sbms switch (igi->igi_version) { 1691189592Sbms case IGMP_VERSION_1: 1692189592Sbms case IGMP_VERSION_2: 1693189592Sbms igmp_v1v2_process_group_timer(inm, 1694189592Sbms igi->igi_version); 1695189592Sbms break; 1696189592Sbms case IGMP_VERSION_3: 1697189592Sbms igmp_v3_process_group_timers(igi, &qrq, 1698189592Sbms &scq, inm, uri_fasthz); 1699189592Sbms break; 1700189592Sbms } 1701189592Sbms } 1702189592Sbms IF_ADDR_UNLOCK(ifp); 1703189592Sbms 1704189592Sbms if (igi->igi_version == IGMP_VERSION_3) { 1705189592Sbms struct in_multi *tinm; 1706189592Sbms 1707189592Sbms igmp_dispatch_queue(&qrq, 0, loop); 1708189592Sbms igmp_dispatch_queue(&scq, 0, loop); 1709189592Sbms 1710189592Sbms /* 1711189592Sbms * Free the in_multi reference(s) for this 1712189592Sbms * IGMP lifecycle. 1713189592Sbms */ 1714189592Sbms SLIST_FOREACH_SAFE(inm, &igi->igi_relinmhead, 1715189592Sbms inm_nrele, tinm) { 1716189592Sbms SLIST_REMOVE_HEAD(&igi->igi_relinmhead, 1717189592Sbms inm_nrele); 1718189592Sbms inm_release_locked(inm); 1719189592Sbms } 1720189592Sbms } 1721189592Sbms } 1722189592Sbms 1723189592Sbmsout_locked: 1724189592Sbms IGMP_UNLOCK(); 1725189592Sbms IN_MULTI_UNLOCK(); 1726189592Sbms} 1727189592Sbms 1728189592Sbms/* 1729189592Sbms * Update host report group timer for IGMPv1/v2. 1730189592Sbms * Will update the global pending timer flags. 1731189592Sbms */ 1732189592Sbmsstatic void 1733189592Sbmsigmp_v1v2_process_group_timer(struct in_multi *inm, const int version) 1734189592Sbms{ 1735191548Szec INIT_VNET_INET(curvnet); 1736189592Sbms int report_timer_expired; 1737189592Sbms 1738148682Srwatson IN_MULTI_LOCK_ASSERT(); 1739189592Sbms IGMP_LOCK_ASSERT(); 1740148682Srwatson 1741189592Sbms if (inm->inm_timer == 0) { 1742189592Sbms report_timer_expired = 0; 1743189592Sbms } else if (--inm->inm_timer == 0) { 1744189592Sbms report_timer_expired = 1; 174514622Sfenner } else { 1746189592Sbms V_current_state_timers_running = 1; 1747189592Sbms return; 1748189592Sbms } 1749189592Sbms 1750189592Sbms switch (inm->inm_state) { 1751189592Sbms case IGMP_NOT_MEMBER: 1752189592Sbms case IGMP_SILENT_MEMBER: 1753189592Sbms case IGMP_IDLE_MEMBER: 1754189592Sbms case IGMP_LAZY_MEMBER: 1755189592Sbms case IGMP_SLEEPING_MEMBER: 1756189592Sbms case IGMP_AWAKENING_MEMBER: 1757189592Sbms break; 1758189592Sbms case IGMP_REPORTING_MEMBER: 1759189592Sbms if (report_timer_expired) { 1760189592Sbms inm->inm_state = IGMP_IDLE_MEMBER; 1761189592Sbms (void)igmp_v1v2_queue_report(inm, 1762189592Sbms (version == IGMP_VERSION_2) ? 1763189592Sbms IGMP_v2_HOST_MEMBERSHIP_REPORT : 1764189592Sbms IGMP_v1_HOST_MEMBERSHIP_REPORT); 1765144163Ssam } 1766189592Sbms break; 1767189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1768189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1769189592Sbms case IGMP_LEAVING_MEMBER: 1770189592Sbms break; 17711541Srgrimes } 17721541Srgrimes} 17731541Srgrimes 1774189592Sbms/* 1775189592Sbms * Update a group's timers for IGMPv3. 1776189592Sbms * Will update the global pending timer flags. 1777189592Sbms * Note: Unlocked read from igi. 1778189592Sbms */ 1779189592Sbmsstatic void 1780189592Sbmsigmp_v3_process_group_timers(struct igmp_ifinfo *igi, 1781189592Sbms struct ifqueue *qrq, struct ifqueue *scq, 1782189592Sbms struct in_multi *inm, const int uri_fasthz) 17831541Srgrimes{ 1784191548Szec INIT_VNET_INET(curvnet); 1785189592Sbms int query_response_timer_expired; 1786189592Sbms int state_change_retransmit_timer_expired; 1787119181Srwatson 1788148682Srwatson IN_MULTI_LOCK_ASSERT(); 1789189592Sbms IGMP_LOCK_ASSERT(); 1790148682Srwatson 1791189592Sbms query_response_timer_expired = 0; 1792189592Sbms state_change_retransmit_timer_expired = 0; 1793189592Sbms 1794189592Sbms /* 1795189592Sbms * During a transition from v1/v2 compatibility mode back to v3, 1796189592Sbms * a group record in REPORTING state may still have its group 1797189592Sbms * timer active. This is a no-op in this function; it is easier 1798189592Sbms * to deal with it here than to complicate the slow-timeout path. 1799189592Sbms */ 1800189592Sbms if (inm->inm_timer == 0) { 1801189592Sbms query_response_timer_expired = 0; 1802189592Sbms } else if (--inm->inm_timer == 0) { 1803189592Sbms query_response_timer_expired = 1; 1804189592Sbms } else { 1805189592Sbms V_current_state_timers_running = 1; 1806189592Sbms } 1807189592Sbms 1808189592Sbms if (inm->inm_sctimer == 0) { 1809189592Sbms state_change_retransmit_timer_expired = 0; 1810189592Sbms } else if (--inm->inm_sctimer == 0) { 1811189592Sbms state_change_retransmit_timer_expired = 1; 1812189592Sbms } else { 1813189592Sbms V_state_change_timers_running = 1; 1814189592Sbms } 1815189592Sbms 1816189592Sbms /* We are in fasttimo, so be quick about it. */ 1817189592Sbms if (!state_change_retransmit_timer_expired && 1818189592Sbms !query_response_timer_expired) 1819189592Sbms return; 1820189592Sbms 1821189592Sbms switch (inm->inm_state) { 1822189592Sbms case IGMP_NOT_MEMBER: 1823189592Sbms case IGMP_SILENT_MEMBER: 1824189592Sbms case IGMP_SLEEPING_MEMBER: 1825189592Sbms case IGMP_LAZY_MEMBER: 1826189592Sbms case IGMP_AWAKENING_MEMBER: 1827189592Sbms case IGMP_IDLE_MEMBER: 1828189592Sbms break; 1829189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 1830189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 1831189592Sbms /* 1832189592Sbms * Respond to a previously pending Group-Specific 1833189592Sbms * or Group-and-Source-Specific query by enqueueing 1834189592Sbms * the appropriate Current-State report for 1835189592Sbms * immediate transmission. 1836189592Sbms */ 1837189592Sbms if (query_response_timer_expired) { 1838189592Sbms int retval; 1839189592Sbms 1840189592Sbms retval = igmp_v3_enqueue_group_record(qrq, inm, 0, 1, 1841189592Sbms (inm->inm_state == IGMP_SG_QUERY_PENDING_MEMBER)); 1842189592Sbms CTR2(KTR_IGMPV3, "%s: enqueue record = %d", 1843189592Sbms __func__, retval); 1844189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 1845189592Sbms /* XXX Clear recorded sources for next time. */ 1846189592Sbms inm_clear_recorded(inm); 1847189592Sbms } 1848189592Sbms /* FALLTHROUGH */ 1849189592Sbms case IGMP_REPORTING_MEMBER: 1850189592Sbms case IGMP_LEAVING_MEMBER: 1851189592Sbms if (state_change_retransmit_timer_expired) { 1852189592Sbms /* 1853189592Sbms * State-change retransmission timer fired. 1854189592Sbms * If there are any further pending retransmissions, 1855189592Sbms * set the global pending state-change flag, and 1856189592Sbms * reset the timer. 1857189592Sbms */ 1858189592Sbms if (--inm->inm_scrv > 0) { 1859189592Sbms inm->inm_sctimer = uri_fasthz; 1860189592Sbms V_state_change_timers_running = 1; 1861189592Sbms } 1862189592Sbms /* 1863189592Sbms * Retransmit the previously computed state-change 1864189592Sbms * report. If there are no further pending 1865189592Sbms * retransmissions, the mbuf queue will be consumed. 1866189592Sbms * Update T0 state to T1 as we have now sent 1867189592Sbms * a state-change. 1868189592Sbms */ 1869189592Sbms (void)igmp_v3_merge_state_changes(inm, scq); 1870189592Sbms 1871189592Sbms inm_commit(inm); 1872189592Sbms CTR3(KTR_IGMPV3, "%s: T1 -> T0 for %s/%s", __func__, 1873189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 1874189592Sbms 1875189592Sbms /* 1876189592Sbms * If we are leaving the group for good, make sure 1877189592Sbms * we release IGMP's reference to it. 1878189592Sbms * This release must be deferred using a SLIST, 1879189592Sbms * as we are called from a loop which traverses 1880189592Sbms * the in_ifmultiaddr TAILQ. 1881189592Sbms */ 1882189592Sbms if (inm->inm_state == IGMP_LEAVING_MEMBER && 1883189592Sbms inm->inm_scrv == 0) { 1884189592Sbms inm->inm_state = IGMP_NOT_MEMBER; 1885189592Sbms SLIST_INSERT_HEAD(&igi->igi_relinmhead, 1886189592Sbms inm, inm_nrele); 1887189592Sbms } 1888189592Sbms } 1889189592Sbms break; 1890189592Sbms } 18911541Srgrimes} 18921541Srgrimes 1893189592Sbms 1894189592Sbms/* 1895189592Sbms * Suppress a group's pending response to a group or source/group query. 1896189592Sbms * 1897189592Sbms * Do NOT suppress state changes. This leads to IGMPv3 inconsistency. 1898189592Sbms * Do NOT update ST1/ST0 as this operation merely suppresses 1899189592Sbms * the currently pending group record. 1900189592Sbms * Do NOT suppress the response to a general query. It is possible but 1901189592Sbms * it would require adding another state or flag. 1902189592Sbms */ 1903189592Sbmsstatic void 1904189592Sbmsigmp_v3_suppress_group_record(struct in_multi *inm) 19051541Srgrimes{ 19061541Srgrimes 1907189592Sbms IN_MULTI_LOCK_ASSERT(); 1908189592Sbms 1909189592Sbms KASSERT(inm->inm_igi->igi_version == IGMP_VERSION_3, 1910189592Sbms ("%s: not IGMPv3 mode on link", __func__)); 1911189592Sbms 1912189592Sbms if (inm->inm_state != IGMP_G_QUERY_PENDING_MEMBER || 1913189592Sbms inm->inm_state != IGMP_SG_QUERY_PENDING_MEMBER) 1914189592Sbms return; 1915189592Sbms 1916189592Sbms if (inm->inm_state == IGMP_SG_QUERY_PENDING_MEMBER) 1917189592Sbms inm_clear_recorded(inm); 1918189592Sbms 1919189592Sbms inm->inm_timer = 0; 1920189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 1921189592Sbms} 1922189592Sbms 1923189592Sbms/* 1924189592Sbms * Switch to a different IGMP version on the given interface, 1925189592Sbms * as per Section 7.2.1. 1926189592Sbms */ 1927189592Sbmsstatic void 1928189592Sbmsigmp_set_version(struct igmp_ifinfo *igi, const int version) 1929189592Sbms{ 1930189592Sbms 1931189592Sbms IGMP_LOCK_ASSERT(); 1932189592Sbms 1933189592Sbms CTR4(KTR_IGMPV3, "%s: switching to v%d on ifp %p(%s)", __func__, 1934189592Sbms version, igi->igi_ifp, igi->igi_ifp->if_xname); 1935189592Sbms 1936189592Sbms if (version == IGMP_VERSION_1 || version == IGMP_VERSION_2) { 1937189592Sbms int old_version_timer; 1938189592Sbms /* 1939189592Sbms * Compute the "Older Version Querier Present" timer as per 1940189592Sbms * Section 8.12. 1941189592Sbms */ 1942189592Sbms old_version_timer = igi->igi_rv * igi->igi_qi + igi->igi_qri; 1943189592Sbms old_version_timer *= PR_SLOWHZ; 1944189592Sbms 1945189592Sbms if (version == IGMP_VERSION_1) { 1946189592Sbms igi->igi_v1_timer = old_version_timer; 1947189592Sbms igi->igi_v2_timer = 0; 1948189592Sbms } else if (version == IGMP_VERSION_2) { 1949189592Sbms igi->igi_v1_timer = 0; 1950189592Sbms igi->igi_v2_timer = old_version_timer; 1951189592Sbms } 1952189592Sbms } 1953189592Sbms 1954189592Sbms if (igi->igi_v1_timer == 0 && igi->igi_v2_timer > 0) { 1955189592Sbms if (igi->igi_version != IGMP_VERSION_2) { 1956189592Sbms igi->igi_version = IGMP_VERSION_2; 1957189592Sbms igmp_v3_cancel_link_timers(igi); 1958189592Sbms } 1959189592Sbms } else if (igi->igi_v1_timer > 0) { 1960189592Sbms if (igi->igi_version != IGMP_VERSION_1) { 1961189592Sbms igi->igi_version = IGMP_VERSION_1; 1962189592Sbms igmp_v3_cancel_link_timers(igi); 1963189592Sbms } 1964189592Sbms } 1965189592Sbms} 1966189592Sbms 1967189592Sbms/* 1968189592Sbms * Cancel pending IGMPv3 timers for the given link and all groups 1969189592Sbms * joined on it; state-change, general-query, and group-query timers. 1970189592Sbms */ 1971189592Sbmsstatic void 1972189592Sbmsigmp_v3_cancel_link_timers(struct igmp_ifinfo *igi) 1973189592Sbms{ 1974191548Szec INIT_VNET_INET(curvnet); 1975189592Sbms struct ifmultiaddr *ifma; 1976189592Sbms struct ifnet *ifp; 1977189592Sbms struct in_multi *inm; 1978189592Sbms 1979189592Sbms CTR3(KTR_IGMPV3, "%s: cancel v3 timers on ifp %p(%s)", __func__, 1980189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 1981189592Sbms 1982189592Sbms IN_MULTI_LOCK_ASSERT(); 1983189592Sbms IGMP_LOCK_ASSERT(); 1984189592Sbms 19851541Srgrimes /* 1986189592Sbms * Fast-track this potentially expensive operation 1987189592Sbms * by checking all the global 'timer pending' flags. 19881541Srgrimes */ 1989189592Sbms if (!V_interface_timers_running && 1990189592Sbms !V_state_change_timers_running && 1991189592Sbms !V_current_state_timers_running) 19921541Srgrimes return; 19931541Srgrimes 1994189592Sbms igi->igi_v3_timer = 0; 1995189592Sbms 1996189592Sbms ifp = igi->igi_ifp; 1997189592Sbms 1998189592Sbms IF_ADDR_LOCK(ifp); 1999189592Sbms TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 2000189592Sbms if (ifma->ifma_addr->sa_family != AF_INET) 2001189592Sbms continue; 2002189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 2003189592Sbms switch (inm->inm_state) { 2004189592Sbms case IGMP_NOT_MEMBER: 2005189592Sbms case IGMP_SILENT_MEMBER: 2006189592Sbms case IGMP_IDLE_MEMBER: 2007189592Sbms case IGMP_LAZY_MEMBER: 2008189592Sbms case IGMP_SLEEPING_MEMBER: 2009189592Sbms case IGMP_AWAKENING_MEMBER: 2010189592Sbms break; 2011189592Sbms case IGMP_LEAVING_MEMBER: 2012189592Sbms /* 2013189592Sbms * If we are leaving the group and switching 2014189592Sbms * IGMP version, we need to release the final 2015189592Sbms * reference held for issuing the INCLUDE {}. 2016189592Sbms * 2017189592Sbms * SMPNG: Must drop and re-acquire IF_ADDR_LOCK 2018189592Sbms * around inm_release_locked(), as it is not 2019189592Sbms * a recursive mutex. 2020189592Sbms */ 2021189592Sbms IF_ADDR_UNLOCK(ifp); 2022189592Sbms inm_release_locked(inm); 2023189592Sbms IF_ADDR_LOCK(ifp); 2024189592Sbms /* FALLTHROUGH */ 2025189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 2026189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 2027189592Sbms inm_clear_recorded(inm); 2028189592Sbms /* FALLTHROUGH */ 2029189592Sbms case IGMP_REPORTING_MEMBER: 2030189592Sbms inm->inm_sctimer = 0; 2031189592Sbms inm->inm_timer = 0; 2032189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 2033189592Sbms /* 2034189592Sbms * Free any pending IGMPv3 state-change records. 2035189592Sbms */ 2036189592Sbms _IF_DRAIN(&inm->inm_scq); 2037189592Sbms break; 2038189592Sbms } 2039189592Sbms } 2040189592Sbms IF_ADDR_UNLOCK(ifp); 2041189592Sbms} 2042189592Sbms 2043189592Sbms/* 2044189592Sbms * Update the Older Version Querier Present timers for a link. 2045189592Sbms * See Section 7.2.1 of RFC 3376. 2046189592Sbms */ 2047189592Sbmsstatic void 2048189592Sbmsigmp_v1v2_process_querier_timers(struct igmp_ifinfo *igi) 2049189592Sbms{ 2050191548Szec INIT_VNET_INET(curvnet); 2051189592Sbms 2052189592Sbms IGMP_LOCK_ASSERT(); 2053189592Sbms 2054189592Sbms if (igi->igi_v1_timer == 0 && igi->igi_v2_timer == 0) { 2055189592Sbms /* 2056189592Sbms * IGMPv1 and IGMPv2 Querier Present timers expired. 2057189592Sbms * 2058189592Sbms * Revert to IGMPv3. 2059189592Sbms */ 2060189592Sbms if (igi->igi_version != IGMP_VERSION_3) { 2061189592Sbms CTR5(KTR_IGMPV3, 2062189592Sbms "%s: transition from v%d -> v%d on %p(%s)", 2063189592Sbms __func__, igi->igi_version, IGMP_VERSION_3, 2064189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 2065189592Sbms igi->igi_version = IGMP_VERSION_3; 2066189592Sbms } 2067189592Sbms } else if (igi->igi_v1_timer == 0 && igi->igi_v2_timer > 0) { 2068189592Sbms /* 2069189592Sbms * IGMPv1 Querier Present timer expired, 2070189592Sbms * IGMPv2 Querier Present timer running. 2071189592Sbms * If IGMPv2 was disabled since last timeout, 2072189592Sbms * revert to IGMPv3. 2073189592Sbms * If IGMPv2 is enabled, revert to IGMPv2. 2074189592Sbms */ 2075189592Sbms if (!V_igmp_v2enable) { 2076189592Sbms CTR5(KTR_IGMPV3, 2077189592Sbms "%s: transition from v%d -> v%d on %p(%s)", 2078189592Sbms __func__, igi->igi_version, IGMP_VERSION_3, 2079189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 2080189592Sbms igi->igi_v2_timer = 0; 2081189592Sbms igi->igi_version = IGMP_VERSION_3; 2082189592Sbms } else { 2083189592Sbms --igi->igi_v2_timer; 2084189592Sbms if (igi->igi_version != IGMP_VERSION_2) { 2085189592Sbms CTR5(KTR_IGMPV3, 2086189592Sbms "%s: transition from v%d -> v%d on %p(%s)", 2087189592Sbms __func__, igi->igi_version, IGMP_VERSION_2, 2088189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 2089189592Sbms igi->igi_version = IGMP_VERSION_2; 2090183550Szec } 20911541Srgrimes } 2092189592Sbms } else if (igi->igi_v1_timer > 0) { 2093189592Sbms /* 2094189592Sbms * IGMPv1 Querier Present timer running. 2095189592Sbms * Stop IGMPv2 timer if running. 2096189592Sbms * 2097189592Sbms * If IGMPv1 was disabled since last timeout, 2098189592Sbms * revert to IGMPv3. 2099189592Sbms * If IGMPv1 is enabled, reset IGMPv2 timer if running. 2100189592Sbms */ 2101189592Sbms if (!V_igmp_v1enable) { 2102189592Sbms CTR5(KTR_IGMPV3, 2103189592Sbms "%s: transition from v%d -> v%d on %p(%s)", 2104189592Sbms __func__, igi->igi_version, IGMP_VERSION_3, 2105189592Sbms igi->igi_ifp, igi->igi_ifp->if_xname); 2106189592Sbms igi->igi_v1_timer = 0; 2107189592Sbms igi->igi_version = IGMP_VERSION_3; 2108189592Sbms } else { 2109189592Sbms --igi->igi_v1_timer; 2110189592Sbms } 2111189592Sbms if (igi->igi_v2_timer > 0) { 2112189592Sbms CTR3(KTR_IGMPV3, 2113189592Sbms "%s: cancel v2 timer on %p(%s)", 2114189592Sbms __func__, igi->igi_ifp, igi->igi_ifp->if_xname); 2115189592Sbms igi->igi_v2_timer = 0; 2116189592Sbms } 21171541Srgrimes } 21181541Srgrimes} 21191541Srgrimes 2120189592Sbms/* 2121189592Sbms * Global slowtimo handler. 2122189592Sbms * VIMAGE: Timeout handlers are expected to service all vimages. 2123189592Sbms */ 21242531Swollmanvoid 2125119181Srwatsonigmp_slowtimo(void) 21262531Swollman{ 2127183550Szec VNET_ITERATOR_DECL(vnet_iter); 21282531Swollman 2129183550Szec VNET_LIST_RLOCK(); 2130183550Szec VNET_FOREACH(vnet_iter) { 2131183550Szec CURVNET_SET(vnet_iter); 2132189592Sbms igmp_slowtimo_vnet(); 2133183550Szec CURVNET_RESTORE(); 21342531Swollman } 2135183550Szec VNET_LIST_RUNLOCK(); 21362531Swollman} 21372531Swollman 2138189592Sbms/* 2139189592Sbms * Per-vnet slowtimo handler. 2140189592Sbms */ 21411541Srgrimesstatic void 2142189592Sbmsigmp_slowtimo_vnet(void) 21431541Srgrimes{ 2144191548Szec INIT_VNET_INET(curvnet); 2145189592Sbms struct igmp_ifinfo *igi; 21461541Srgrimes 2147189592Sbms IGMP_LOCK(); 2148189592Sbms 2149189592Sbms LIST_FOREACH(igi, &V_igi_head, igi_link) { 2150189592Sbms igmp_v1v2_process_querier_timers(igi); 2151189592Sbms } 2152189592Sbms 2153189592Sbms IGMP_UNLOCK(); 2154189592Sbms} 2155189592Sbms 2156189592Sbms/* 2157189592Sbms * Dispatch an IGMPv1/v2 host report or leave message. 2158189592Sbms * These are always small enough to fit inside a single mbuf. 2159189592Sbms */ 2160189592Sbmsstatic int 2161189592Sbmsigmp_v1v2_queue_report(struct in_multi *inm, const int type) 2162189592Sbms{ 2163189592Sbms struct ifnet *ifp; 2164189592Sbms struct igmp *igmp; 2165189592Sbms struct ip *ip; 2166189592Sbms struct mbuf *m; 2167189592Sbms 2168148682Srwatson IN_MULTI_LOCK_ASSERT(); 2169189592Sbms IGMP_LOCK_ASSERT(); 2170148682Srwatson 2171189592Sbms ifp = inm->inm_ifp; 2172189592Sbms 2173151967Sandre MGETHDR(m, M_DONTWAIT, MT_DATA); 2174119181Srwatson if (m == NULL) 2175189592Sbms return (ENOMEM); 2176189592Sbms MH_ALIGN(m, sizeof(struct ip) + sizeof(struct igmp)); 21772531Swollman 2178189592Sbms m->m_pkthdr.len = sizeof(struct ip) + sizeof(struct igmp); 2179189592Sbms 21802531Swollman m->m_data += sizeof(struct ip); 2181189592Sbms m->m_len = sizeof(struct igmp); 2182189592Sbms 2183119181Srwatson igmp = mtod(m, struct igmp *); 2184119181Srwatson igmp->igmp_type = type; 2185119181Srwatson igmp->igmp_code = 0; 2186119181Srwatson igmp->igmp_group = inm->inm_addr; 2187119181Srwatson igmp->igmp_cksum = 0; 2188189592Sbms igmp->igmp_cksum = in_cksum(m, sizeof(struct igmp)); 21891541Srgrimes 2190119181Srwatson m->m_data -= sizeof(struct ip); 2191119181Srwatson m->m_len += sizeof(struct ip); 2192189592Sbms 2193119181Srwatson ip = mtod(m, struct ip *); 2194119181Srwatson ip->ip_tos = 0; 2195189592Sbms ip->ip_len = sizeof(struct ip) + sizeof(struct igmp); 2196119181Srwatson ip->ip_off = 0; 2197119181Srwatson ip->ip_p = IPPROTO_IGMP; 2198119181Srwatson ip->ip_src.s_addr = INADDR_ANY; 21991541Srgrimes 2200189592Sbms if (type == IGMP_HOST_LEAVE_MESSAGE) 2201189592Sbms ip->ip_dst.s_addr = htonl(INADDR_ALLRTRS_GROUP); 2202189592Sbms else 2203189592Sbms ip->ip_dst = inm->inm_addr; 2204189592Sbms 2205189592Sbms igmp_save_context(m, ifp); 2206189592Sbms 2207189592Sbms m->m_flags |= M_IGMPV2; 2208189592Sbms if (inm->inm_igi->igi_flags & IGIF_LOOPBACK) 2209189592Sbms m->m_flags |= M_IGMP_LOOP; 2210189592Sbms 2211189592Sbms CTR2(KTR_IGMPV3, "%s: netisr_dispatch(NETISR_IGMP, %p)", __func__, m); 2212189592Sbms netisr_dispatch(NETISR_IGMP, m); 2213189592Sbms 2214189592Sbms return (0); 2215189592Sbms} 2216189592Sbms 2217189592Sbms/* 2218189592Sbms * Process a state change from the upper layer for the given IPv4 group. 2219189592Sbms * 2220189592Sbms * Each socket holds a reference on the in_multi in its own ip_moptions. 2221189592Sbms * The socket layer will have made the necessary updates to.the group 2222189592Sbms * state, it is now up to IGMP to issue a state change report if there 2223189592Sbms * has been any change between T0 (when the last state-change was issued) 2224189592Sbms * and T1 (now). 2225189592Sbms * 2226189592Sbms * We use the IGMPv3 state machine at group level. The IGMP module 2227189592Sbms * however makes the decision as to which IGMP protocol version to speak. 2228189592Sbms * A state change *from* INCLUDE {} always means an initial join. 2229189592Sbms * A state change *to* INCLUDE {} always means a final leave. 2230189592Sbms * 2231189592Sbms * FUTURE: If IGIF_V3LITE is enabled for this interface, then we can 2232189592Sbms * save ourselves a bunch of work; any exclusive mode groups need not 2233189592Sbms * compute source filter lists. 2234189592Sbms * 2235189592Sbms * VIMAGE: curvnet should have been set by caller, as this routine 2236189592Sbms * is called from the socket option handlers. 2237189592Sbms */ 2238189592Sbmsint 2239189592Sbmsigmp_change_state(struct in_multi *inm) 2240189592Sbms{ 2241189592Sbms struct igmp_ifinfo *igi; 2242189592Sbms struct ifnet *ifp; 2243189592Sbms int error; 2244189592Sbms 2245189592Sbms IN_MULTI_LOCK_ASSERT(); 2246189592Sbms 2247189592Sbms error = 0; 2248189592Sbms 2249189592Sbms /* 2250189592Sbms * Try to detect if the upper layer just asked us to change state 2251189592Sbms * for an interface which has now gone away. 2252189592Sbms */ 2253189592Sbms KASSERT(inm->inm_ifma != NULL, ("%s: no ifma", __func__)); 2254189592Sbms ifp = inm->inm_ifma->ifma_ifp; 2255189592Sbms if (ifp != NULL) { 2256189592Sbms /* 2257189592Sbms * Sanity check that netinet's notion of ifp is the 2258189592Sbms * same as net's. 2259189592Sbms */ 2260189592Sbms KASSERT(inm->inm_ifp == ifp, ("%s: bad ifp", __func__)); 2261189592Sbms } 2262189592Sbms 2263189592Sbms IGMP_LOCK(); 2264189592Sbms 2265189592Sbms igi = ((struct in_ifinfo *)ifp->if_afdata[AF_INET])->ii_igmp; 2266189592Sbms KASSERT(igi != NULL, ("%s: no igmp_ifinfo for ifp %p", __func__, ifp)); 2267189592Sbms 2268189592Sbms /* 2269189592Sbms * If we detect a state transition to or from MCAST_UNDEFINED 2270189592Sbms * for this group, then we are starting or finishing an IGMP 2271189592Sbms * life cycle for this group. 2272189592Sbms */ 2273189592Sbms if (inm->inm_st[1].iss_fmode != inm->inm_st[0].iss_fmode) { 2274189592Sbms CTR3(KTR_IGMPV3, "%s: inm transition %d -> %d", __func__, 2275189592Sbms inm->inm_st[0].iss_fmode, inm->inm_st[1].iss_fmode); 2276189592Sbms if (inm->inm_st[0].iss_fmode == MCAST_UNDEFINED) { 2277189592Sbms CTR1(KTR_IGMPV3, "%s: initial join", __func__); 2278189592Sbms error = igmp_initial_join(inm, igi); 2279189592Sbms goto out_locked; 2280189592Sbms } else if (inm->inm_st[1].iss_fmode == MCAST_UNDEFINED) { 2281189592Sbms CTR1(KTR_IGMPV3, "%s: final leave", __func__); 2282189592Sbms igmp_final_leave(inm, igi); 2283189592Sbms goto out_locked; 2284189592Sbms } 2285189592Sbms } else { 2286189592Sbms CTR1(KTR_IGMPV3, "%s: filter set change", __func__); 2287189592Sbms } 2288189592Sbms 2289189592Sbms error = igmp_handle_state_change(inm, igi); 2290189592Sbms 2291189592Sbmsout_locked: 2292189592Sbms IGMP_UNLOCK(); 2293189592Sbms return (error); 2294189592Sbms} 2295189592Sbms 2296189592Sbms/* 2297189592Sbms * Perform the initial join for an IGMP group. 2298189592Sbms * 2299189592Sbms * When joining a group: 2300189592Sbms * If the group should have its IGMP traffic suppressed, do nothing. 2301189592Sbms * IGMPv1 starts sending IGMPv1 host membership reports. 2302189592Sbms * IGMPv2 starts sending IGMPv2 host membership reports. 2303189592Sbms * IGMPv3 will schedule an IGMPv3 state-change report containing the 2304189592Sbms * initial state of the membership. 2305189592Sbms */ 2306189592Sbmsstatic int 2307189592Sbmsigmp_initial_join(struct in_multi *inm, struct igmp_ifinfo *igi) 2308189592Sbms{ 2309191548Szec INIT_VNET_INET(curvnet); 2310189592Sbms struct ifnet *ifp; 2311189592Sbms struct ifqueue *ifq; 2312189592Sbms int error, retval, syncstates; 2313189592Sbms 2314189592Sbms CTR4(KTR_IGMPV3, "%s: initial join %s on ifp %p(%s)", 2315189592Sbms __func__, inet_ntoa(inm->inm_addr), inm->inm_ifp, 2316189592Sbms inm->inm_ifp->if_xname); 2317189592Sbms 2318189592Sbms error = 0; 2319189592Sbms syncstates = 1; 2320189592Sbms 2321189592Sbms ifp = inm->inm_ifp; 2322189592Sbms 2323189592Sbms IN_MULTI_LOCK_ASSERT(); 2324189592Sbms IGMP_LOCK_ASSERT(); 2325189592Sbms 2326189592Sbms KASSERT(igi && igi->igi_ifp == ifp, ("%s: inconsistent ifp", __func__)); 2327189592Sbms 2328189592Sbms /* 2329189592Sbms * Groups joined on loopback or marked as 'not reported', 2330189592Sbms * e.g. 224.0.0.1, enter the IGMP_SILENT_MEMBER state and 2331189592Sbms * are never reported in any IGMP protocol exchanges. 2332189592Sbms * All other groups enter the appropriate IGMP state machine 2333189592Sbms * for the version in use on this link. 2334189592Sbms * A link marked as IGIF_SILENT causes IGMP to be completely 2335189592Sbms * disabled for the link. 2336189592Sbms */ 2337189592Sbms if ((ifp->if_flags & IFF_LOOPBACK) || 2338189592Sbms (igi->igi_flags & IGIF_SILENT) || 2339189592Sbms !igmp_isgroupreported(inm->inm_addr)) { 2340189592Sbms CTR1(KTR_IGMPV3, 2341189592Sbms"%s: not kicking state machine for silent group", __func__); 2342189592Sbms inm->inm_state = IGMP_SILENT_MEMBER; 2343189592Sbms inm->inm_timer = 0; 2344189592Sbms } else { 2345189592Sbms /* 2346189592Sbms * Deal with overlapping in_multi lifecycle. 2347189592Sbms * If this group was LEAVING, then make sure 2348189592Sbms * we drop the reference we picked up to keep the 2349189592Sbms * group around for the final INCLUDE {} enqueue. 2350189592Sbms */ 2351189592Sbms if (igi->igi_version == IGMP_VERSION_3 && 2352189592Sbms inm->inm_state == IGMP_LEAVING_MEMBER) 2353189592Sbms inm_release_locked(inm); 2354189592Sbms 2355189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 2356189592Sbms 2357189592Sbms switch (igi->igi_version) { 2358189592Sbms case IGMP_VERSION_1: 2359189592Sbms case IGMP_VERSION_2: 2360189592Sbms inm->inm_state = IGMP_IDLE_MEMBER; 2361189592Sbms error = igmp_v1v2_queue_report(inm, 2362189592Sbms (igi->igi_version == IGMP_VERSION_2) ? 2363189592Sbms IGMP_v2_HOST_MEMBERSHIP_REPORT : 2364189592Sbms IGMP_v1_HOST_MEMBERSHIP_REPORT); 2365189592Sbms if (error == 0) { 2366189592Sbms inm->inm_timer = IGMP_RANDOM_DELAY( 2367189592Sbms IGMP_V1V2_MAX_RI * PR_FASTHZ); 2368189592Sbms V_current_state_timers_running = 1; 2369189592Sbms } 2370189592Sbms break; 2371189592Sbms 2372189592Sbms case IGMP_VERSION_3: 2373189592Sbms /* 2374189592Sbms * Defer update of T0 to T1, until the first copy 2375189592Sbms * of the state change has been transmitted. 2376189592Sbms */ 2377189592Sbms syncstates = 0; 2378189592Sbms 2379189592Sbms /* 2380189592Sbms * Immediately enqueue a State-Change Report for 2381189592Sbms * this interface, freeing any previous reports. 2382189592Sbms * Don't kick the timers if there is nothing to do, 2383189592Sbms * or if an error occurred. 2384189592Sbms */ 2385189592Sbms ifq = &inm->inm_scq; 2386189592Sbms _IF_DRAIN(ifq); 2387189592Sbms retval = igmp_v3_enqueue_group_record(ifq, inm, 1, 2388189592Sbms 0, 0); 2389189592Sbms CTR2(KTR_IGMPV3, "%s: enqueue record = %d", 2390189592Sbms __func__, retval); 2391189592Sbms if (retval <= 0) { 2392189592Sbms error = retval * -1; 2393189592Sbms break; 2394189592Sbms } 2395189592Sbms 2396189592Sbms /* 2397189592Sbms * Schedule transmission of pending state-change 2398189592Sbms * report up to RV times for this link. The timer 2399189592Sbms * will fire at the next igmp_fasttimo (~200ms), 2400189592Sbms * giving us an opportunity to merge the reports. 2401189592Sbms */ 2402189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 2403189592Sbms inm->inm_scrv = 1; 2404189592Sbms } else { 2405189592Sbms KASSERT(igi->igi_rv > 1, 2406189592Sbms ("%s: invalid robustness %d", __func__, 2407189592Sbms igi->igi_rv)); 2408189592Sbms inm->inm_scrv = igi->igi_rv; 2409189592Sbms } 2410189592Sbms inm->inm_sctimer = 1; 2411189592Sbms V_state_change_timers_running = 1; 2412189592Sbms 2413189592Sbms error = 0; 2414189592Sbms break; 2415189592Sbms } 2416189592Sbms } 2417189592Sbms 2418189592Sbms /* 2419189592Sbms * Only update the T0 state if state change is atomic, 2420189592Sbms * i.e. we don't need to wait for a timer to fire before we 2421189592Sbms * can consider the state change to have been communicated. 2422189592Sbms */ 2423189592Sbms if (syncstates) { 2424189592Sbms inm_commit(inm); 2425189592Sbms CTR3(KTR_IGMPV3, "%s: T1 -> T0 for %s/%s", __func__, 2426189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 2427189592Sbms } 2428189592Sbms 2429189592Sbms return (error); 2430189592Sbms} 2431189592Sbms 2432189592Sbms/* 2433189592Sbms * Issue an intermediate state change during the IGMP life-cycle. 2434189592Sbms */ 2435189592Sbmsstatic int 2436189592Sbmsigmp_handle_state_change(struct in_multi *inm, struct igmp_ifinfo *igi) 2437189592Sbms{ 2438191548Szec INIT_VNET_INET(curvnet); 2439189592Sbms struct ifnet *ifp; 2440189592Sbms int retval; 2441189592Sbms 2442189592Sbms CTR4(KTR_IGMPV3, "%s: state change for %s on ifp %p(%s)", 2443189592Sbms __func__, inet_ntoa(inm->inm_addr), inm->inm_ifp, 2444189592Sbms inm->inm_ifp->if_xname); 2445189592Sbms 2446189592Sbms ifp = inm->inm_ifp; 2447189592Sbms 2448189592Sbms IN_MULTI_LOCK_ASSERT(); 2449189592Sbms IGMP_LOCK_ASSERT(); 2450189592Sbms 2451189592Sbms KASSERT(igi && igi->igi_ifp == ifp, ("%s: inconsistent ifp", __func__)); 2452189592Sbms 2453189592Sbms if ((ifp->if_flags & IFF_LOOPBACK) || 2454189592Sbms (igi->igi_flags & IGIF_SILENT) || 2455189592Sbms !igmp_isgroupreported(inm->inm_addr) || 2456189592Sbms (igi->igi_version != IGMP_VERSION_3)) { 2457189592Sbms if (!igmp_isgroupreported(inm->inm_addr)) { 2458189592Sbms CTR1(KTR_IGMPV3, 2459189592Sbms"%s: not kicking state machine for silent group", __func__); 2460189592Sbms } 2461189592Sbms CTR1(KTR_IGMPV3, "%s: nothing to do", __func__); 2462189592Sbms inm_commit(inm); 2463189592Sbms CTR3(KTR_IGMPV3, "%s: T1 -> T0 for %s/%s", __func__, 2464189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 2465189592Sbms return (0); 2466189592Sbms } 2467189592Sbms 2468189592Sbms _IF_DRAIN(&inm->inm_scq); 2469189592Sbms 2470189592Sbms retval = igmp_v3_enqueue_group_record(&inm->inm_scq, inm, 1, 0, 0); 2471189592Sbms CTR2(KTR_IGMPV3, "%s: enqueue record = %d", __func__, retval); 2472189592Sbms if (retval <= 0) 2473189592Sbms return (-retval); 2474189592Sbms 2475189592Sbms /* 2476189592Sbms * If record(s) were enqueued, start the state-change 2477189592Sbms * report timer for this group. 2478189592Sbms */ 2479189592Sbms inm->inm_scrv = ((igi->igi_flags & IGIF_LOOPBACK) ? 1 : igi->igi_rv); 2480189592Sbms inm->inm_sctimer = 1; 2481189592Sbms V_state_change_timers_running = 1; 2482189592Sbms 2483189592Sbms return (0); 2484189592Sbms} 2485189592Sbms 2486189592Sbms/* 2487189592Sbms * Perform the final leave for an IGMP group. 2488189592Sbms * 2489189592Sbms * When leaving a group: 2490189592Sbms * IGMPv1 does nothing. 2491189592Sbms * IGMPv2 sends a host leave message, if and only if we are the reporter. 2492189592Sbms * IGMPv3 enqueues a state-change report containing a transition 2493189592Sbms * to INCLUDE {} for immediate transmission. 2494189592Sbms */ 2495189592Sbmsstatic void 2496189592Sbmsigmp_final_leave(struct in_multi *inm, struct igmp_ifinfo *igi) 2497189592Sbms{ 2498191548Szec INIT_VNET_INET(curvnet); 2499189592Sbms int syncstates; 2500189592Sbms 2501189592Sbms syncstates = 1; 2502189592Sbms 2503189592Sbms CTR4(KTR_IGMPV3, "%s: final leave %s on ifp %p(%s)", 2504189592Sbms __func__, inet_ntoa(inm->inm_addr), inm->inm_ifp, 2505189592Sbms inm->inm_ifp->if_xname); 2506189592Sbms 2507189592Sbms IN_MULTI_LOCK_ASSERT(); 2508189592Sbms IGMP_LOCK_ASSERT(); 2509189592Sbms 2510189592Sbms switch (inm->inm_state) { 2511189592Sbms case IGMP_NOT_MEMBER: 2512189592Sbms case IGMP_SILENT_MEMBER: 2513189592Sbms case IGMP_LEAVING_MEMBER: 2514189592Sbms /* Already leaving or left; do nothing. */ 2515189592Sbms CTR1(KTR_IGMPV3, 2516189592Sbms"%s: not kicking state machine for silent group", __func__); 2517189592Sbms break; 2518189592Sbms case IGMP_REPORTING_MEMBER: 2519189592Sbms case IGMP_IDLE_MEMBER: 2520189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 2521189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 2522189592Sbms if (igi->igi_version == IGMP_VERSION_2) { 2523189592Sbms#ifdef INVARIANTS 2524189592Sbms if (inm->inm_state == IGMP_G_QUERY_PENDING_MEMBER || 2525189592Sbms inm->inm_state == IGMP_SG_QUERY_PENDING_MEMBER) 2526189592Sbms panic("%s: IGMPv3 state reached, not IGMPv3 mode", 2527189592Sbms __func__); 2528189592Sbms#endif 2529189592Sbms igmp_v1v2_queue_report(inm, IGMP_HOST_LEAVE_MESSAGE); 2530189592Sbms inm->inm_state = IGMP_NOT_MEMBER; 2531189592Sbms } else if (igi->igi_version == IGMP_VERSION_3) { 2532189592Sbms /* 2533189592Sbms * Stop group timer and all pending reports. 2534189592Sbms * Immediately enqueue a state-change report 2535189592Sbms * TO_IN {} to be sent on the next fast timeout, 2536189592Sbms * giving us an opportunity to merge reports. 2537189592Sbms */ 2538189592Sbms _IF_DRAIN(&inm->inm_scq); 2539189592Sbms inm->inm_timer = 0; 2540189592Sbms if (igi->igi_flags & IGIF_LOOPBACK) { 2541189592Sbms inm->inm_scrv = 1; 2542189592Sbms } else { 2543189592Sbms inm->inm_scrv = igi->igi_rv; 2544189592Sbms } 2545189592Sbms CTR4(KTR_IGMPV3, "%s: Leaving %s/%s with %d " 2546189592Sbms "pending retransmissions.", __func__, 2547189592Sbms inet_ntoa(inm->inm_addr), 2548189592Sbms inm->inm_ifp->if_xname, inm->inm_scrv); 2549189592Sbms if (inm->inm_scrv == 0) { 2550189592Sbms inm->inm_state = IGMP_NOT_MEMBER; 2551189592Sbms inm->inm_sctimer = 0; 2552189592Sbms } else { 2553189592Sbms int retval; 2554189592Sbms 2555189592Sbms inm_acquire_locked(inm); 2556189592Sbms 2557189592Sbms retval = igmp_v3_enqueue_group_record( 2558189592Sbms &inm->inm_scq, inm, 1, 0, 0); 2559189592Sbms KASSERT(retval != 0, 2560189592Sbms ("%s: enqueue record = %d", __func__, 2561189592Sbms retval)); 2562189592Sbms 2563189592Sbms inm->inm_state = IGMP_LEAVING_MEMBER; 2564189592Sbms inm->inm_sctimer = 1; 2565189592Sbms V_state_change_timers_running = 1; 2566189592Sbms syncstates = 0; 2567189592Sbms } 2568189592Sbms break; 2569189592Sbms } 2570189592Sbms break; 2571189592Sbms case IGMP_LAZY_MEMBER: 2572189592Sbms case IGMP_SLEEPING_MEMBER: 2573189592Sbms case IGMP_AWAKENING_MEMBER: 2574189592Sbms /* Our reports are suppressed; do nothing. */ 2575189592Sbms break; 2576189592Sbms } 2577189592Sbms 2578189592Sbms if (syncstates) { 2579189592Sbms inm_commit(inm); 2580189592Sbms CTR3(KTR_IGMPV3, "%s: T1 -> T0 for %s/%s", __func__, 2581189592Sbms inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 2582189592Sbms inm->inm_st[1].iss_fmode = MCAST_UNDEFINED; 2583189592Sbms CTR3(KTR_IGMPV3, "%s: T1 now MCAST_UNDEFINED for %s/%s", 2584189592Sbms __func__, inet_ntoa(inm->inm_addr), inm->inm_ifp->if_xname); 2585189592Sbms } 2586189592Sbms} 2587189592Sbms 2588189592Sbms/* 2589189592Sbms * Enqueue an IGMPv3 group record to the given output queue. 2590189592Sbms * 2591189592Sbms * XXX This function could do with having the allocation code 2592189592Sbms * split out, and the multiple-tree-walks coalesced into a single 2593189592Sbms * routine as has been done in igmp_v3_enqueue_filter_change(). 2594189592Sbms * 2595189592Sbms * If is_state_change is zero, a current-state record is appended. 2596189592Sbms * If is_state_change is non-zero, a state-change report is appended. 2597189592Sbms * 2598189592Sbms * If is_group_query is non-zero, an mbuf packet chain is allocated. 2599189592Sbms * If is_group_query is zero, and if there is a packet with free space 2600189592Sbms * at the tail of the queue, it will be appended to providing there 2601189592Sbms * is enough free space. 2602189592Sbms * Otherwise a new mbuf packet chain is allocated. 2603189592Sbms * 2604189592Sbms * If is_source_query is non-zero, each source is checked to see if 2605189592Sbms * it was recorded for a Group-Source query, and will be omitted if 2606189592Sbms * it is not both in-mode and recorded. 2607189592Sbms * 2608189592Sbms * The function will attempt to allocate leading space in the packet 2609189592Sbms * for the IP/IGMP header to be prepended without fragmenting the chain. 2610189592Sbms * 2611189592Sbms * If successful the size of all data appended to the queue is returned, 2612189592Sbms * otherwise an error code less than zero is returned, or zero if 2613189592Sbms * no record(s) were appended. 2614189592Sbms */ 2615189592Sbmsstatic int 2616189592Sbmsigmp_v3_enqueue_group_record(struct ifqueue *ifq, struct in_multi *inm, 2617189592Sbms const int is_state_change, const int is_group_query, 2618189592Sbms const int is_source_query) 2619189592Sbms{ 2620189592Sbms struct igmp_grouprec ig; 2621189592Sbms struct igmp_grouprec *pig; 2622189592Sbms struct ifnet *ifp; 2623189592Sbms struct ip_msource *ims, *nims; 2624189592Sbms struct mbuf *m0, *m, *md; 2625189592Sbms int error, is_filter_list_change; 2626189592Sbms int minrec0len, m0srcs, msrcs, nbytes, off; 2627189592Sbms int record_has_sources; 2628189592Sbms int now; 2629189592Sbms int type; 2630189592Sbms in_addr_t naddr; 2631189592Sbms uint8_t mode; 2632189592Sbms 2633189592Sbms IN_MULTI_LOCK_ASSERT(); 2634189592Sbms 2635189592Sbms error = 0; 2636189592Sbms ifp = inm->inm_ifp; 2637189592Sbms is_filter_list_change = 0; 2638189592Sbms m = NULL; 2639189592Sbms m0 = NULL; 2640189592Sbms m0srcs = 0; 2641189592Sbms msrcs = 0; 2642189592Sbms nbytes = 0; 2643189592Sbms nims = NULL; 2644189592Sbms record_has_sources = 1; 2645189592Sbms pig = NULL; 2646189592Sbms type = IGMP_DO_NOTHING; 2647189592Sbms mode = inm->inm_st[1].iss_fmode; 2648189592Sbms 2649189592Sbms /* 2650189592Sbms * If we did not transition out of ASM mode during t0->t1, 2651189592Sbms * and there are no source nodes to process, we can skip 2652189592Sbms * the generation of source records. 2653189592Sbms */ 2654189592Sbms if (inm->inm_st[0].iss_asm > 0 && inm->inm_st[1].iss_asm > 0 && 2655189592Sbms inm->inm_nsrc == 0) 2656189592Sbms record_has_sources = 0; 2657189592Sbms 2658189592Sbms if (is_state_change) { 2659189592Sbms /* 2660189592Sbms * Queue a state change record. 2661189592Sbms * If the mode did not change, and there are non-ASM 2662189592Sbms * listeners or source filters present, 2663189592Sbms * we potentially need to issue two records for the group. 2664189592Sbms * If we are transitioning to MCAST_UNDEFINED, we need 2665189592Sbms * not send any sources. 2666189592Sbms * If there are ASM listeners, and there was no filter 2667189592Sbms * mode transition of any kind, do nothing. 2668189592Sbms */ 2669189592Sbms if (mode != inm->inm_st[0].iss_fmode) { 2670189592Sbms if (mode == MCAST_EXCLUDE) { 2671189592Sbms CTR1(KTR_IGMPV3, "%s: change to EXCLUDE", 2672189592Sbms __func__); 2673189592Sbms type = IGMP_CHANGE_TO_EXCLUDE_MODE; 2674189592Sbms } else { 2675189592Sbms CTR1(KTR_IGMPV3, "%s: change to INCLUDE", 2676189592Sbms __func__); 2677189592Sbms type = IGMP_CHANGE_TO_INCLUDE_MODE; 2678189592Sbms if (mode == MCAST_UNDEFINED) 2679189592Sbms record_has_sources = 0; 2680189592Sbms } 2681189592Sbms } else { 2682189592Sbms if (record_has_sources) { 2683189592Sbms is_filter_list_change = 1; 2684189592Sbms } else { 2685189592Sbms type = IGMP_DO_NOTHING; 2686189592Sbms } 2687189592Sbms } 2688189592Sbms } else { 2689189592Sbms /* 2690189592Sbms * Queue a current state record. 2691189592Sbms */ 2692189592Sbms if (mode == MCAST_EXCLUDE) { 2693189592Sbms type = IGMP_MODE_IS_EXCLUDE; 2694189592Sbms } else if (mode == MCAST_INCLUDE) { 2695189592Sbms type = IGMP_MODE_IS_INCLUDE; 2696189592Sbms KASSERT(inm->inm_st[1].iss_asm == 0, 2697189592Sbms ("%s: inm %p is INCLUDE but ASM count is %d", 2698189592Sbms __func__, inm, inm->inm_st[1].iss_asm)); 2699189592Sbms } 2700189592Sbms } 2701189592Sbms 2702189592Sbms /* 2703189592Sbms * Generate the filter list changes using a separate function. 2704189592Sbms */ 2705189592Sbms if (is_filter_list_change) 2706189592Sbms return (igmp_v3_enqueue_filter_change(ifq, inm)); 2707189592Sbms 2708189592Sbms if (type == IGMP_DO_NOTHING) { 2709189592Sbms CTR3(KTR_IGMPV3, "%s: nothing to do for %s/%s", 2710189592Sbms __func__, inet_ntoa(inm->inm_addr), 2711189592Sbms inm->inm_ifp->if_xname); 2712189592Sbms return (0); 2713189592Sbms } 2714189592Sbms 2715189592Sbms /* 2716189592Sbms * If any sources are present, we must be able to fit at least 2717189592Sbms * one in the trailing space of the tail packet's mbuf, 2718189592Sbms * ideally more. 2719189592Sbms */ 2720189592Sbms minrec0len = sizeof(struct igmp_grouprec); 2721189592Sbms if (record_has_sources) 2722189592Sbms minrec0len += sizeof(in_addr_t); 2723189592Sbms 2724189592Sbms CTR4(KTR_IGMPV3, "%s: queueing %s for %s/%s", __func__, 2725189592Sbms igmp_rec_type_to_str(type), inet_ntoa(inm->inm_addr), 2726189592Sbms inm->inm_ifp->if_xname); 2727189592Sbms 2728189592Sbms /* 2729189592Sbms * Check if we have a packet in the tail of the queue for this 2730189592Sbms * group into which the first group record for this group will fit. 2731189592Sbms * Otherwise allocate a new packet. 2732189592Sbms * Always allocate leading space for IP+RA_OPT+IGMP+REPORT. 2733189592Sbms * Note: Group records for G/GSR query responses MUST be sent 2734189592Sbms * in their own packet. 2735189592Sbms */ 2736189592Sbms m0 = ifq->ifq_tail; 2737189592Sbms if (!is_group_query && 2738189592Sbms m0 != NULL && 2739189592Sbms (m0->m_pkthdr.PH_vt.vt_nrecs + 1 <= IGMP_V3_REPORT_MAXRECS) && 2740189592Sbms (m0->m_pkthdr.len + minrec0len) < 2741189592Sbms (ifp->if_mtu - IGMP_LEADINGSPACE)) { 2742189592Sbms m0srcs = (ifp->if_mtu - m0->m_pkthdr.len - 2743189592Sbms sizeof(struct igmp_grouprec)) / sizeof(in_addr_t); 2744189592Sbms m = m0; 2745189592Sbms CTR1(KTR_IGMPV3, "%s: use existing packet", __func__); 2746189592Sbms } else { 2747189592Sbms if (_IF_QFULL(ifq)) { 2748189592Sbms CTR1(KTR_IGMPV3, "%s: outbound queue full", __func__); 2749189592Sbms return (-ENOMEM); 2750189592Sbms } 2751189592Sbms m = NULL; 2752189592Sbms m0srcs = (ifp->if_mtu - IGMP_LEADINGSPACE - 2753189592Sbms sizeof(struct igmp_grouprec)) / sizeof(in_addr_t); 2754190692Sbms if (!is_state_change && !is_group_query) { 2755189592Sbms m = m_getcl(M_DONTWAIT, MT_DATA, M_PKTHDR); 2756190692Sbms if (m) 2757190692Sbms m->m_data += IGMP_LEADINGSPACE; 2758190692Sbms } 2759189592Sbms if (m == NULL) { 2760189592Sbms m = m_gethdr(M_DONTWAIT, MT_DATA); 2761189592Sbms if (m) 2762189592Sbms MH_ALIGN(m, IGMP_LEADINGSPACE); 2763189592Sbms } 2764189592Sbms if (m == NULL) 2765189592Sbms return (-ENOMEM); 2766189592Sbms 2767189592Sbms igmp_save_context(m, ifp); 2768189592Sbms 2769189592Sbms CTR1(KTR_IGMPV3, "%s: allocated first packet", __func__); 2770189592Sbms } 2771189592Sbms 2772189592Sbms /* 2773189592Sbms * Append group record. 2774189592Sbms * If we have sources, we don't know how many yet. 2775189592Sbms */ 2776189592Sbms ig.ig_type = type; 2777189592Sbms ig.ig_datalen = 0; 2778189592Sbms ig.ig_numsrc = 0; 2779189592Sbms ig.ig_group = inm->inm_addr; 2780189592Sbms if (!m_append(m, sizeof(struct igmp_grouprec), (void *)&ig)) { 2781189592Sbms if (m != m0) 2782189592Sbms m_freem(m); 2783189592Sbms CTR1(KTR_IGMPV3, "%s: m_append() failed.", __func__); 2784189592Sbms return (-ENOMEM); 2785189592Sbms } 2786189592Sbms nbytes += sizeof(struct igmp_grouprec); 2787189592Sbms 2788189592Sbms /* 2789189592Sbms * Append as many sources as will fit in the first packet. 2790189592Sbms * If we are appending to a new packet, the chain allocation 2791189592Sbms * may potentially use clusters; use m_getptr() in this case. 2792189592Sbms * If we are appending to an existing packet, we need to obtain 2793189592Sbms * a pointer to the group record after m_append(), in case a new 2794189592Sbms * mbuf was allocated. 2795189592Sbms * Only append sources which are in-mode at t1. If we are 2796189592Sbms * transitioning to MCAST_UNDEFINED state on the group, do not 2797189592Sbms * include source entries. 2798189592Sbms * Only report recorded sources in our filter set when responding 2799189592Sbms * to a group-source query. 2800189592Sbms */ 2801189592Sbms if (record_has_sources) { 2802189592Sbms if (m == m0) { 2803189592Sbms md = m_last(m); 2804189592Sbms pig = (struct igmp_grouprec *)(mtod(md, uint8_t *) + 2805189592Sbms md->m_len - nbytes); 2806189592Sbms } else { 2807189592Sbms md = m_getptr(m, 0, &off); 2808189592Sbms pig = (struct igmp_grouprec *)(mtod(md, uint8_t *) + 2809189592Sbms off); 2810189592Sbms } 2811189592Sbms msrcs = 0; 2812189592Sbms RB_FOREACH_SAFE(ims, ip_msource_tree, &inm->inm_srcs, nims) { 2813189592Sbms CTR2(KTR_IGMPV3, "%s: visit node %s", __func__, 2814189592Sbms inet_ntoa_haddr(ims->ims_haddr)); 2815189592Sbms now = ims_get_mode(inm, ims, 1); 2816189592Sbms CTR2(KTR_IGMPV3, "%s: node is %d", __func__, now); 2817189592Sbms if ((now != mode) || 2818189592Sbms (now == mode && mode == MCAST_UNDEFINED)) { 2819189592Sbms CTR1(KTR_IGMPV3, "%s: skip node", __func__); 2820189592Sbms continue; 2821189592Sbms } 2822189592Sbms if (is_source_query && ims->ims_stp == 0) { 2823189592Sbms CTR1(KTR_IGMPV3, "%s: skip unrecorded node", 2824189592Sbms __func__); 2825189592Sbms continue; 2826189592Sbms } 2827189592Sbms CTR1(KTR_IGMPV3, "%s: append node", __func__); 2828189592Sbms naddr = htonl(ims->ims_haddr); 2829189592Sbms if (!m_append(m, sizeof(in_addr_t), (void *)&naddr)) { 2830189592Sbms if (m != m0) 2831189592Sbms m_freem(m); 2832189592Sbms CTR1(KTR_IGMPV3, "%s: m_append() failed.", 2833189592Sbms __func__); 2834189592Sbms return (-ENOMEM); 2835189592Sbms } 2836189592Sbms nbytes += sizeof(in_addr_t); 2837189592Sbms ++msrcs; 2838189592Sbms if (msrcs == m0srcs) 2839189592Sbms break; 2840189592Sbms } 2841189592Sbms CTR2(KTR_IGMPV3, "%s: msrcs is %d this packet", __func__, 2842189592Sbms msrcs); 2843189592Sbms pig->ig_numsrc = htons(msrcs); 2844189592Sbms nbytes += (msrcs * sizeof(in_addr_t)); 2845189592Sbms } 2846189592Sbms 2847189592Sbms if (is_source_query && msrcs == 0) { 2848189592Sbms CTR1(KTR_IGMPV3, "%s: no recorded sources to report", __func__); 2849189592Sbms if (m != m0) 2850189592Sbms m_freem(m); 2851189592Sbms return (0); 2852189592Sbms } 2853189592Sbms 2854189592Sbms /* 2855189592Sbms * We are good to go with first packet. 2856189592Sbms */ 2857189592Sbms if (m != m0) { 2858189592Sbms CTR1(KTR_IGMPV3, "%s: enqueueing first packet", __func__); 2859189592Sbms m->m_pkthdr.PH_vt.vt_nrecs = 1; 2860189592Sbms _IF_ENQUEUE(ifq, m); 2861189592Sbms } else 2862189592Sbms m->m_pkthdr.PH_vt.vt_nrecs++; 2863189592Sbms 2864189592Sbms /* 2865189592Sbms * No further work needed if no source list in packet(s). 2866189592Sbms */ 2867189592Sbms if (!record_has_sources) 2868189592Sbms return (nbytes); 2869189592Sbms 2870189592Sbms /* 2871189592Sbms * Whilst sources remain to be announced, we need to allocate 2872189592Sbms * a new packet and fill out as many sources as will fit. 2873189592Sbms * Always try for a cluster first. 2874189592Sbms */ 2875189592Sbms while (nims != NULL) { 2876189592Sbms if (_IF_QFULL(ifq)) { 2877189592Sbms CTR1(KTR_IGMPV3, "%s: outbound queue full", __func__); 2878189592Sbms return (-ENOMEM); 2879189592Sbms } 2880189592Sbms m = m_getcl(M_DONTWAIT, MT_DATA, M_PKTHDR); 2881190692Sbms if (m) 2882190692Sbms m->m_data += IGMP_LEADINGSPACE; 2883189592Sbms if (m == NULL) { 2884189592Sbms m = m_gethdr(M_DONTWAIT, MT_DATA); 2885189592Sbms if (m) 2886189592Sbms MH_ALIGN(m, IGMP_LEADINGSPACE); 2887189592Sbms } 2888189592Sbms if (m == NULL) 2889189592Sbms return (-ENOMEM); 2890189592Sbms igmp_save_context(m, ifp); 2891189592Sbms md = m_getptr(m, 0, &off); 2892189592Sbms pig = (struct igmp_grouprec *)(mtod(md, uint8_t *) + off); 2893189592Sbms CTR1(KTR_IGMPV3, "%s: allocated next packet", __func__); 2894189592Sbms 2895189592Sbms if (!m_append(m, sizeof(struct igmp_grouprec), (void *)&ig)) { 2896189592Sbms if (m != m0) 2897189592Sbms m_freem(m); 2898189592Sbms CTR1(KTR_IGMPV3, "%s: m_append() failed.", __func__); 2899189592Sbms return (-ENOMEM); 2900189592Sbms } 2901189592Sbms m->m_pkthdr.PH_vt.vt_nrecs = 1; 2902189592Sbms nbytes += sizeof(struct igmp_grouprec); 2903189592Sbms 2904189592Sbms m0srcs = (ifp->if_mtu - IGMP_LEADINGSPACE - 2905189592Sbms sizeof(struct igmp_grouprec)) / sizeof(in_addr_t); 2906189592Sbms 2907189592Sbms msrcs = 0; 2908189592Sbms RB_FOREACH_FROM(ims, ip_msource_tree, nims) { 2909189592Sbms CTR2(KTR_IGMPV3, "%s: visit node %s", __func__, 2910189592Sbms inet_ntoa_haddr(ims->ims_haddr)); 2911189592Sbms now = ims_get_mode(inm, ims, 1); 2912189592Sbms if ((now != mode) || 2913189592Sbms (now == mode && mode == MCAST_UNDEFINED)) { 2914189592Sbms CTR1(KTR_IGMPV3, "%s: skip node", __func__); 2915189592Sbms continue; 2916189592Sbms } 2917189592Sbms if (is_source_query && ims->ims_stp == 0) { 2918189592Sbms CTR1(KTR_IGMPV3, "%s: skip unrecorded node", 2919189592Sbms __func__); 2920189592Sbms continue; 2921189592Sbms } 2922189592Sbms CTR1(KTR_IGMPV3, "%s: append node", __func__); 2923189592Sbms naddr = htonl(ims->ims_haddr); 2924189592Sbms if (!m_append(m, sizeof(in_addr_t), (void *)&naddr)) { 2925189592Sbms if (m != m0) 2926189592Sbms m_freem(m); 2927189592Sbms CTR1(KTR_IGMPV3, "%s: m_append() failed.", 2928189592Sbms __func__); 2929189592Sbms return (-ENOMEM); 2930189592Sbms } 2931189592Sbms ++msrcs; 2932189592Sbms if (msrcs == m0srcs) 2933189592Sbms break; 2934189592Sbms } 2935189592Sbms pig->ig_numsrc = htons(msrcs); 2936189592Sbms nbytes += (msrcs * sizeof(in_addr_t)); 2937189592Sbms 2938189592Sbms CTR1(KTR_IGMPV3, "%s: enqueueing next packet", __func__); 2939189592Sbms _IF_ENQUEUE(ifq, m); 2940189592Sbms } 2941189592Sbms 2942189592Sbms return (nbytes); 2943189592Sbms} 2944189592Sbms 2945189592Sbms/* 2946189592Sbms * Type used to mark record pass completion. 2947189592Sbms * We exploit the fact we can cast to this easily from the 2948189592Sbms * current filter modes on each ip_msource node. 2949189592Sbms */ 2950189592Sbmstypedef enum { 2951189592Sbms REC_NONE = 0x00, /* MCAST_UNDEFINED */ 2952189592Sbms REC_ALLOW = 0x01, /* MCAST_INCLUDE */ 2953189592Sbms REC_BLOCK = 0x02, /* MCAST_EXCLUDE */ 2954189592Sbms REC_FULL = REC_ALLOW | REC_BLOCK 2955189592Sbms} rectype_t; 2956189592Sbms 2957189592Sbms/* 2958189592Sbms * Enqueue an IGMPv3 filter list change to the given output queue. 2959189592Sbms * 2960189592Sbms * Source list filter state is held in an RB-tree. When the filter list 2961189592Sbms * for a group is changed without changing its mode, we need to compute 2962189592Sbms * the deltas between T0 and T1 for each source in the filter set, 2963189592Sbms * and enqueue the appropriate ALLOW_NEW/BLOCK_OLD records. 2964189592Sbms * 2965189592Sbms * As we may potentially queue two record types, and the entire R-B tree 2966189592Sbms * needs to be walked at once, we break this out into its own function 2967189592Sbms * so we can generate a tightly packed queue of packets. 2968189592Sbms * 2969189592Sbms * XXX This could be written to only use one tree walk, although that makes 2970189592Sbms * serializing into the mbuf chains a bit harder. For now we do two walks 2971189592Sbms * which makes things easier on us, and it may or may not be harder on 2972189592Sbms * the L2 cache. 2973189592Sbms * 2974189592Sbms * If successful the size of all data appended to the queue is returned, 2975189592Sbms * otherwise an error code less than zero is returned, or zero if 2976189592Sbms * no record(s) were appended. 2977189592Sbms */ 2978189592Sbmsstatic int 2979189592Sbmsigmp_v3_enqueue_filter_change(struct ifqueue *ifq, struct in_multi *inm) 2980189592Sbms{ 2981189592Sbms static const int MINRECLEN = 2982189592Sbms sizeof(struct igmp_grouprec) + sizeof(in_addr_t); 2983189592Sbms struct ifnet *ifp; 2984189592Sbms struct igmp_grouprec ig; 2985189592Sbms struct igmp_grouprec *pig; 2986189592Sbms struct ip_msource *ims, *nims; 2987189592Sbms struct mbuf *m, *m0, *md; 2988189592Sbms in_addr_t naddr; 2989191657Sbms int m0srcs, nbytes, npbytes, off, rsrcs, schanged; 2990189592Sbms int nallow, nblock; 2991189592Sbms uint8_t mode, now, then; 2992189592Sbms rectype_t crt, drt, nrt; 2993189592Sbms 2994189592Sbms IN_MULTI_LOCK_ASSERT(); 2995189592Sbms 2996189592Sbms if (inm->inm_nsrc == 0 || 2997189592Sbms (inm->inm_st[0].iss_asm > 0 && inm->inm_st[1].iss_asm > 0)) 2998189592Sbms return (0); 2999189592Sbms 3000189592Sbms ifp = inm->inm_ifp; /* interface */ 3001189592Sbms mode = inm->inm_st[1].iss_fmode; /* filter mode at t1 */ 3002189592Sbms crt = REC_NONE; /* current group record type */ 3003189592Sbms drt = REC_NONE; /* mask of completed group record types */ 3004189592Sbms nrt = REC_NONE; /* record type for current node */ 3005189592Sbms m0srcs = 0; /* # source which will fit in current mbuf chain */ 3006189592Sbms nbytes = 0; /* # of bytes appended to group's state-change queue */ 3007191657Sbms npbytes = 0; /* # of bytes appended this packet */ 3008189592Sbms rsrcs = 0; /* # sources encoded in current record */ 3009189592Sbms schanged = 0; /* # nodes encoded in overall filter change */ 3010189592Sbms nallow = 0; /* # of source entries in ALLOW_NEW */ 3011189592Sbms nblock = 0; /* # of source entries in BLOCK_OLD */ 3012189592Sbms nims = NULL; /* next tree node pointer */ 3013189592Sbms 3014189592Sbms /* 3015189592Sbms * For each possible filter record mode. 3016189592Sbms * The first kind of source we encounter tells us which 3017189592Sbms * is the first kind of record we start appending. 3018189592Sbms * If a node transitioned to UNDEFINED at t1, its mode is treated 3019189592Sbms * as the inverse of the group's filter mode. 3020189592Sbms */ 3021189592Sbms while (drt != REC_FULL) { 3022189592Sbms do { 3023189592Sbms m0 = ifq->ifq_tail; 3024189592Sbms if (m0 != NULL && 3025189592Sbms (m0->m_pkthdr.PH_vt.vt_nrecs + 1 <= 3026189592Sbms IGMP_V3_REPORT_MAXRECS) && 3027189592Sbms (m0->m_pkthdr.len + MINRECLEN) < 3028189592Sbms (ifp->if_mtu - IGMP_LEADINGSPACE)) { 3029189592Sbms m = m0; 3030189592Sbms m0srcs = (ifp->if_mtu - m0->m_pkthdr.len - 3031189592Sbms sizeof(struct igmp_grouprec)) / 3032189592Sbms sizeof(in_addr_t); 3033189592Sbms CTR1(KTR_IGMPV3, 3034189592Sbms "%s: use previous packet", __func__); 3035189592Sbms } else { 3036189592Sbms m = m_getcl(M_DONTWAIT, MT_DATA, M_PKTHDR); 3037190692Sbms if (m) 3038190692Sbms m->m_data += IGMP_LEADINGSPACE; 3039189592Sbms if (m == NULL) { 3040189592Sbms m = m_gethdr(M_DONTWAIT, MT_DATA); 3041189592Sbms if (m) 3042189592Sbms MH_ALIGN(m, IGMP_LEADINGSPACE); 3043189592Sbms } 3044189592Sbms if (m == NULL) { 3045189592Sbms CTR1(KTR_IGMPV3, 3046189592Sbms "%s: m_get*() failed", __func__); 3047189592Sbms return (-ENOMEM); 3048189592Sbms } 3049189592Sbms m->m_pkthdr.PH_vt.vt_nrecs = 0; 3050189592Sbms igmp_save_context(m, ifp); 3051189592Sbms m0srcs = (ifp->if_mtu - IGMP_LEADINGSPACE - 3052189592Sbms sizeof(struct igmp_grouprec)) / 3053189592Sbms sizeof(in_addr_t); 3054191657Sbms npbytes = 0; 3055189592Sbms CTR1(KTR_IGMPV3, 3056189592Sbms "%s: allocated new packet", __func__); 3057189592Sbms } 3058189592Sbms /* 3059189592Sbms * Append the IGMP group record header to the 3060189592Sbms * current packet's data area. 3061189592Sbms * Recalculate pointer to free space for next 3062189592Sbms * group record, in case m_append() allocated 3063189592Sbms * a new mbuf or cluster. 3064189592Sbms */ 3065189592Sbms memset(&ig, 0, sizeof(ig)); 3066189592Sbms ig.ig_group = inm->inm_addr; 3067189592Sbms if (!m_append(m, sizeof(ig), (void *)&ig)) { 3068189592Sbms if (m != m0) 3069189592Sbms m_freem(m); 3070189592Sbms CTR1(KTR_IGMPV3, 3071189592Sbms "%s: m_append() failed", __func__); 3072189592Sbms return (-ENOMEM); 3073189592Sbms } 3074191657Sbms npbytes += sizeof(struct igmp_grouprec); 3075191657Sbms if (m != m0) { 3076191657Sbms /* new packet; offset in c hain */ 3077191657Sbms md = m_getptr(m, npbytes - 3078191657Sbms sizeof(struct igmp_grouprec), &off); 3079189592Sbms pig = (struct igmp_grouprec *)(mtod(md, 3080191657Sbms uint8_t *) + off); 3081189592Sbms } else { 3082191657Sbms /* current packet; offset from last append */ 3083191657Sbms md = m_last(m); 3084189592Sbms pig = (struct igmp_grouprec *)(mtod(md, 3085191657Sbms uint8_t *) + md->m_len - 3086191657Sbms sizeof(struct igmp_grouprec)); 3087189592Sbms } 3088189592Sbms /* 3089189592Sbms * Begin walking the tree for this record type 3090189592Sbms * pass, or continue from where we left off 3091189592Sbms * previously if we had to allocate a new packet. 3092189592Sbms * Only report deltas in-mode at t1. 3093189592Sbms * We need not report included sources as allowed 3094189592Sbms * if we are in inclusive mode on the group, 3095189592Sbms * however the converse is not true. 3096189592Sbms */ 3097189592Sbms rsrcs = 0; 3098189592Sbms if (nims == NULL) 3099189592Sbms nims = RB_MIN(ip_msource_tree, &inm->inm_srcs); 3100189592Sbms RB_FOREACH_FROM(ims, ip_msource_tree, nims) { 3101189592Sbms CTR2(KTR_IGMPV3, "%s: visit node %s", 3102189592Sbms __func__, inet_ntoa_haddr(ims->ims_haddr)); 3103189592Sbms now = ims_get_mode(inm, ims, 1); 3104189592Sbms then = ims_get_mode(inm, ims, 0); 3105189592Sbms CTR3(KTR_IGMPV3, "%s: mode: t0 %d, t1 %d", 3106189592Sbms __func__, then, now); 3107189592Sbms if (now == then) { 3108189592Sbms CTR1(KTR_IGMPV3, 3109189592Sbms "%s: skip unchanged", __func__); 3110189592Sbms continue; 3111189592Sbms } 3112189592Sbms if (mode == MCAST_EXCLUDE && 3113189592Sbms now == MCAST_INCLUDE) { 3114189592Sbms CTR1(KTR_IGMPV3, 3115189592Sbms "%s: skip IN src on EX group", 3116189592Sbms __func__); 3117189592Sbms continue; 3118189592Sbms } 3119189592Sbms nrt = (rectype_t)now; 3120189592Sbms if (nrt == REC_NONE) 3121189592Sbms nrt = (rectype_t)(~mode & REC_FULL); 3122189592Sbms if (schanged++ == 0) { 3123189592Sbms crt = nrt; 3124189592Sbms } else if (crt != nrt) 3125189592Sbms continue; 3126189592Sbms naddr = htonl(ims->ims_haddr); 3127189592Sbms if (!m_append(m, sizeof(in_addr_t), 3128189592Sbms (void *)&naddr)) { 3129189592Sbms if (m != m0) 3130189592Sbms m_freem(m); 3131189592Sbms CTR1(KTR_IGMPV3, 3132189592Sbms "%s: m_append() failed", __func__); 3133189592Sbms return (-ENOMEM); 3134189592Sbms } 3135189592Sbms nallow += !!(crt == REC_ALLOW); 3136189592Sbms nblock += !!(crt == REC_BLOCK); 3137189592Sbms if (++rsrcs == m0srcs) 3138189592Sbms break; 3139189592Sbms } 3140189592Sbms /* 3141189592Sbms * If we did not append any tree nodes on this 3142189592Sbms * pass, back out of allocations. 3143189592Sbms */ 3144189592Sbms if (rsrcs == 0) { 3145191657Sbms npbytes -= sizeof(struct igmp_grouprec); 3146189592Sbms if (m != m0) { 3147189592Sbms CTR1(KTR_IGMPV3, 3148189592Sbms "%s: m_free(m)", __func__); 3149189592Sbms m_freem(m); 3150189592Sbms } else { 3151189592Sbms CTR1(KTR_IGMPV3, 3152189592Sbms "%s: m_adj(m, -ig)", __func__); 3153189592Sbms m_adj(m, -((int)sizeof( 3154189592Sbms struct igmp_grouprec))); 3155189592Sbms } 3156189592Sbms continue; 3157189592Sbms } 3158191657Sbms npbytes += (rsrcs * sizeof(in_addr_t)); 3159189592Sbms if (crt == REC_ALLOW) 3160189592Sbms pig->ig_type = IGMP_ALLOW_NEW_SOURCES; 3161189592Sbms else if (crt == REC_BLOCK) 3162189592Sbms pig->ig_type = IGMP_BLOCK_OLD_SOURCES; 3163189592Sbms pig->ig_numsrc = htons(rsrcs); 3164189592Sbms /* 3165189592Sbms * Count the new group record, and enqueue this 3166189592Sbms * packet if it wasn't already queued. 3167189592Sbms */ 3168189592Sbms m->m_pkthdr.PH_vt.vt_nrecs++; 3169189592Sbms if (m != m0) 3170189592Sbms _IF_ENQUEUE(ifq, m); 3171191657Sbms nbytes += npbytes; 3172189592Sbms } while (nims != NULL); 3173189592Sbms drt |= crt; 3174189592Sbms crt = (~crt & REC_FULL); 3175189592Sbms } 3176189592Sbms 3177189592Sbms CTR3(KTR_IGMPV3, "%s: queued %d ALLOW_NEW, %d BLOCK_OLD", __func__, 3178189592Sbms nallow, nblock); 3179189592Sbms 3180189592Sbms return (nbytes); 3181189592Sbms} 3182189592Sbms 3183189592Sbmsstatic int 3184189592Sbmsigmp_v3_merge_state_changes(struct in_multi *inm, struct ifqueue *ifscq) 3185189592Sbms{ 3186189592Sbms struct ifqueue *gq; 3187189592Sbms struct mbuf *m; /* pending state-change */ 3188189592Sbms struct mbuf *m0; /* copy of pending state-change */ 3189189592Sbms struct mbuf *mt; /* last state-change in packet */ 3190189592Sbms int docopy, domerge; 3191189592Sbms u_int recslen; 3192189592Sbms 3193189592Sbms docopy = 0; 3194189592Sbms domerge = 0; 3195189592Sbms recslen = 0; 3196189592Sbms 3197189592Sbms IN_MULTI_LOCK_ASSERT(); 3198189592Sbms IGMP_LOCK_ASSERT(); 3199189592Sbms 3200189592Sbms /* 3201189592Sbms * If there are further pending retransmissions, make a writable 3202189592Sbms * copy of each queued state-change message before merging. 3203189592Sbms */ 3204189592Sbms if (inm->inm_scrv > 0) 3205189592Sbms docopy = 1; 3206189592Sbms 3207189592Sbms gq = &inm->inm_scq; 3208189592Sbms#ifdef KTR 3209189592Sbms if (gq->ifq_head == NULL) { 3210189592Sbms CTR2(KTR_IGMPV3, "%s: WARNING: queue for inm %p is empty", 3211189592Sbms __func__, inm); 3212189592Sbms } 3213189592Sbms#endif 3214189592Sbms 3215189592Sbms m = gq->ifq_head; 3216189592Sbms while (m != NULL) { 3217189592Sbms /* 3218189592Sbms * Only merge the report into the current packet if 3219189592Sbms * there is sufficient space to do so; an IGMPv3 report 3220189592Sbms * packet may only contain 65,535 group records. 3221189592Sbms * Always use a simple mbuf chain concatentation to do this, 3222189592Sbms * as large state changes for single groups may have 3223189592Sbms * allocated clusters. 3224189592Sbms */ 3225189592Sbms domerge = 0; 3226189592Sbms mt = ifscq->ifq_tail; 3227189592Sbms if (mt != NULL) { 3228189592Sbms recslen = m_length(m, NULL); 3229189592Sbms 3230189592Sbms if ((mt->m_pkthdr.PH_vt.vt_nrecs + 3231189592Sbms m->m_pkthdr.PH_vt.vt_nrecs <= 3232189592Sbms IGMP_V3_REPORT_MAXRECS) && 3233189592Sbms (mt->m_pkthdr.len + recslen <= 3234189592Sbms (inm->inm_ifp->if_mtu - IGMP_LEADINGSPACE))) 3235189592Sbms domerge = 1; 3236189592Sbms } 3237189592Sbms 3238189592Sbms if (!domerge && _IF_QFULL(gq)) { 3239189592Sbms CTR2(KTR_IGMPV3, 3240189592Sbms "%s: outbound queue full, skipping whole packet %p", 3241189592Sbms __func__, m); 3242189592Sbms mt = m->m_nextpkt; 3243189592Sbms if (!docopy) 3244189592Sbms m_freem(m); 3245189592Sbms m = mt; 3246189592Sbms continue; 3247189592Sbms } 3248189592Sbms 3249189592Sbms if (!docopy) { 3250189592Sbms CTR2(KTR_IGMPV3, "%s: dequeueing %p", __func__, m); 3251189592Sbms _IF_DEQUEUE(gq, m0); 3252189592Sbms m = m0->m_nextpkt; 3253189592Sbms } else { 3254189592Sbms CTR2(KTR_IGMPV3, "%s: copying %p", __func__, m); 3255189592Sbms m0 = m_dup(m, M_NOWAIT); 3256189592Sbms if (m0 == NULL) 3257189592Sbms return (ENOMEM); 3258189592Sbms m0->m_nextpkt = NULL; 3259189592Sbms m = m->m_nextpkt; 3260189592Sbms } 3261189592Sbms 3262189592Sbms if (!domerge) { 3263189592Sbms CTR3(KTR_IGMPV3, "%s: queueing %p to ifscq %p)", 3264189592Sbms __func__, m0, ifscq); 3265189592Sbms _IF_ENQUEUE(ifscq, m0); 3266189592Sbms } else { 3267189592Sbms struct mbuf *mtl; /* last mbuf of packet mt */ 3268189592Sbms 3269189592Sbms CTR3(KTR_IGMPV3, "%s: merging %p with ifscq tail %p)", 3270189592Sbms __func__, m0, mt); 3271189592Sbms 3272189592Sbms mtl = m_last(mt); 3273189592Sbms m0->m_flags &= ~M_PKTHDR; 3274189592Sbms mt->m_pkthdr.len += recslen; 3275189592Sbms mt->m_pkthdr.PH_vt.vt_nrecs += 3276189592Sbms m0->m_pkthdr.PH_vt.vt_nrecs; 3277189592Sbms 3278189592Sbms mtl->m_next = m0; 3279189592Sbms } 3280189592Sbms } 3281189592Sbms 3282189592Sbms return (0); 3283189592Sbms} 3284189592Sbms 3285189592Sbms/* 3286189592Sbms * Respond to a pending IGMPv3 General Query. 3287189592Sbms */ 3288189592Sbmsstatic void 3289189592Sbmsigmp_v3_dispatch_general_query(struct igmp_ifinfo *igi) 3290189592Sbms{ 3291191548Szec INIT_VNET_INET(curvnet); 3292189592Sbms struct ifmultiaddr *ifma, *tifma; 3293189592Sbms struct ifnet *ifp; 3294189592Sbms struct in_multi *inm; 3295189592Sbms int retval, loop; 3296189592Sbms 3297189592Sbms IN_MULTI_LOCK_ASSERT(); 3298189592Sbms IGMP_LOCK_ASSERT(); 3299189592Sbms 3300189592Sbms KASSERT(igi->igi_version == IGMP_VERSION_3, 3301189592Sbms ("%s: called when version %d", __func__, igi->igi_version)); 3302189592Sbms 3303189592Sbms ifp = igi->igi_ifp; 3304189592Sbms 3305189592Sbms IF_ADDR_LOCK(ifp); 3306189592Sbms TAILQ_FOREACH_SAFE(ifma, &ifp->if_multiaddrs, ifma_link, tifma) { 3307189931Sbms if (ifma->ifma_addr->sa_family != AF_INET || 3308189931Sbms ifma->ifma_protospec == NULL) 3309189592Sbms continue; 3310189592Sbms 3311189592Sbms inm = (struct in_multi *)ifma->ifma_protospec; 3312189592Sbms KASSERT(ifp == inm->inm_ifp, 3313189592Sbms ("%s: inconsistent ifp", __func__)); 3314189592Sbms 3315189592Sbms switch (inm->inm_state) { 3316189592Sbms case IGMP_NOT_MEMBER: 3317189592Sbms case IGMP_SILENT_MEMBER: 3318189592Sbms break; 3319189592Sbms case IGMP_REPORTING_MEMBER: 3320189592Sbms case IGMP_IDLE_MEMBER: 3321189592Sbms case IGMP_LAZY_MEMBER: 3322189592Sbms case IGMP_SLEEPING_MEMBER: 3323189592Sbms case IGMP_AWAKENING_MEMBER: 3324189592Sbms inm->inm_state = IGMP_REPORTING_MEMBER; 3325189592Sbms retval = igmp_v3_enqueue_group_record(&igi->igi_gq, 3326189592Sbms inm, 0, 0, 0); 3327189592Sbms CTR2(KTR_IGMPV3, "%s: enqueue record = %d", 3328189592Sbms __func__, retval); 3329189592Sbms break; 3330189592Sbms case IGMP_G_QUERY_PENDING_MEMBER: 3331189592Sbms case IGMP_SG_QUERY_PENDING_MEMBER: 3332189592Sbms case IGMP_LEAVING_MEMBER: 3333189592Sbms break; 3334189592Sbms } 3335189592Sbms } 3336189592Sbms IF_ADDR_UNLOCK(ifp); 3337189592Sbms 3338189592Sbms loop = (igi->igi_flags & IGIF_LOOPBACK) ? 1 : 0; 3339189592Sbms igmp_dispatch_queue(&igi->igi_gq, IGMP_MAX_RESPONSE_BURST, loop); 3340189592Sbms 3341189592Sbms /* 3342189592Sbms * Slew transmission of bursts over 500ms intervals. 3343189592Sbms */ 3344189592Sbms if (igi->igi_gq.ifq_head != NULL) { 3345189592Sbms igi->igi_v3_timer = 1 + IGMP_RANDOM_DELAY( 3346189592Sbms IGMP_RESPONSE_BURST_INTERVAL); 3347189592Sbms V_interface_timers_running = 1; 3348189592Sbms } 3349189592Sbms} 3350189592Sbms 3351189592Sbms/* 3352189592Sbms * Transmit the next pending IGMP message in the output queue. 3353189592Sbms * 3354189592Sbms * We get called from netisr_processqueue(). A mutex private to igmpoq 3355189592Sbms * will be acquired and released around this routine. 3356189592Sbms * 3357189592Sbms * VIMAGE: Needs to store/restore vnet pointer on a per-mbuf-chain basis. 3358189592Sbms * MRT: Nothing needs to be done, as IGMP traffic is always local to 3359189592Sbms * a link and uses a link-scope multicast address. 3360189592Sbms */ 3361189592Sbmsstatic void 3362189592Sbmsigmp_intr(struct mbuf *m) 3363189592Sbms{ 3364189592Sbms struct ip_moptions imo; 3365189592Sbms struct ifnet *ifp; 3366189592Sbms struct mbuf *ipopts, *m0; 3367189592Sbms int error; 3368189592Sbms uint32_t ifindex; 3369189592Sbms 3370189592Sbms CTR2(KTR_IGMPV3, "%s: transmit %p", __func__, m); 3371189592Sbms 3372189592Sbms /* 3373191548Szec * Set VNET image pointer from enqueued mbuf chain 3374189592Sbms * before doing anything else. Whilst we use interface 3375189592Sbms * indexes to guard against interface detach, they are 3376189592Sbms * unique to each VIMAGE and must be retrieved. 3377189592Sbms */ 3378191816Szec CURVNET_SET((struct vnet *)(m->m_pkthdr.header)); 3379191548Szec INIT_VNET_NET(curvnet); 3380191548Szec INIT_VNET_INET(curvnet); 3381189592Sbms ifindex = igmp_restore_context(m); 3382189592Sbms 3383189592Sbms /* 3384189592Sbms * Check if the ifnet still exists. This limits the scope of 3385189592Sbms * any race in the absence of a global ifp lock for low cost 3386189592Sbms * (an array lookup). 3387189592Sbms */ 3388189592Sbms ifp = ifnet_byindex(ifindex); 3389189592Sbms if (ifp == NULL) { 3390189592Sbms CTR3(KTR_IGMPV3, "%s: dropped %p as ifindex %u went away.", 3391189592Sbms __func__, m, ifindex); 3392189592Sbms m_freem(m); 3393190951Srwatson IPSTAT_INC(ips_noroute); 3394189592Sbms goto out; 3395189592Sbms } 3396189592Sbms 3397189592Sbms ipopts = V_igmp_sendra ? m_raopt : NULL; 3398189592Sbms 3399119181Srwatson imo.imo_multicast_ttl = 1; 340015292Swollman imo.imo_multicast_vif = -1; 3401181803Sbz imo.imo_multicast_loop = (V_ip_mrouter != NULL); 34021541Srgrimes 340315292Swollman /* 3404189592Sbms * If the user requested that IGMP traffic be explicitly 3405189592Sbms * redirected to the loopback interface (e.g. they are running a 3406189592Sbms * MANET interface and the routing protocol needs to see the 3407189592Sbms * updates), handle this now. 340815292Swollman */ 3409189592Sbms if (m->m_flags & M_IGMP_LOOP) 3410189592Sbms imo.imo_multicast_ifp = V_loif; 3411189592Sbms else 3412189592Sbms imo.imo_multicast_ifp = ifp; 34132531Swollman 3414189592Sbms if (m->m_flags & M_IGMPV2) { 3415189592Sbms m0 = m; 3416189592Sbms } else { 3417189592Sbms m0 = igmp_v3_encap_report(ifp, m); 3418189592Sbms if (m0 == NULL) { 3419189592Sbms CTR2(KTR_IGMPV3, "%s: dropped %p", __func__, m); 3420189592Sbms m_freem(m); 3421190951Srwatson IPSTAT_INC(ips_odropped); 3422189592Sbms goto out; 3423189592Sbms } 3424189592Sbms } 3425189592Sbms 3426189592Sbms igmp_scrub_context(m0); 3427189592Sbms m->m_flags &= ~(M_PROTOFLAGS); 3428189592Sbms m0->m_pkthdr.rcvif = V_loif; 3429189592Sbms#ifdef MAC 3430189592Sbms mac_netinet_igmp_send(ifp, m0); 3431189592Sbms#endif 3432189592Sbms error = ip_output(m0, ipopts, NULL, 0, &imo, NULL); 3433189592Sbms if (error) { 3434189592Sbms CTR3(KTR_IGMPV3, "%s: ip_output(%p) = %d", __func__, m0, error); 3435189592Sbms goto out; 3436189592Sbms } 3437189592Sbms 3438190965Srwatson IGMPSTAT_INC(igps_snd_reports); 3439189592Sbms 3440189592Sbmsout: 3441189592Sbms /* 3442189592Sbms * We must restore the existing vnet pointer before 3443189592Sbms * continuing as we are run from netisr context. 3444189592Sbms */ 3445189592Sbms CURVNET_RESTORE(); 34461541Srgrimes} 3447189592Sbms 3448189592Sbms/* 3449189592Sbms * Encapsulate an IGMPv3 report. 3450189592Sbms * 3451189592Sbms * The internal mbuf flag M_IGMPV3_HDR is used to indicate that the mbuf 3452189592Sbms * chain has already had its IP/IGMPv3 header prepended. In this case 3453189592Sbms * the function will not attempt to prepend; the lengths and checksums 3454189592Sbms * will however be re-computed. 3455189592Sbms * 3456189592Sbms * Returns a pointer to the new mbuf chain head, or NULL if the 3457189592Sbms * allocation failed. 3458189592Sbms */ 3459189592Sbmsstatic struct mbuf * 3460189592Sbmsigmp_v3_encap_report(struct ifnet *ifp, struct mbuf *m) 3461189592Sbms{ 3462189592Sbms INIT_VNET_INET(curvnet); 3463189592Sbms struct igmp_report *igmp; 3464189592Sbms struct ip *ip; 3465189592Sbms int hdrlen, igmpreclen; 3466189592Sbms 3467189592Sbms KASSERT((m->m_flags & M_PKTHDR), 3468189592Sbms ("%s: mbuf chain %p is !M_PKTHDR", __func__, m)); 3469189592Sbms 3470189592Sbms igmpreclen = m_length(m, NULL); 3471189592Sbms hdrlen = sizeof(struct ip) + sizeof(struct igmp_report); 3472189592Sbms 3473189592Sbms if (m->m_flags & M_IGMPV3_HDR) { 3474189592Sbms igmpreclen -= hdrlen; 3475189592Sbms } else { 3476189592Sbms M_PREPEND(m, hdrlen, M_DONTWAIT); 3477189592Sbms if (m == NULL) 3478189592Sbms return (NULL); 3479189592Sbms m->m_flags |= M_IGMPV3_HDR; 3480189592Sbms } 3481189592Sbms 3482189592Sbms CTR2(KTR_IGMPV3, "%s: igmpreclen is %d", __func__, igmpreclen); 3483189592Sbms 3484189592Sbms m->m_data += sizeof(struct ip); 3485189592Sbms m->m_len -= sizeof(struct ip); 3486189592Sbms 3487189592Sbms igmp = mtod(m, struct igmp_report *); 3488189592Sbms igmp->ir_type = IGMP_v3_HOST_MEMBERSHIP_REPORT; 3489189592Sbms igmp->ir_rsv1 = 0; 3490189592Sbms igmp->ir_rsv2 = 0; 3491189592Sbms igmp->ir_numgrps = htons(m->m_pkthdr.PH_vt.vt_nrecs); 3492189592Sbms igmp->ir_cksum = 0; 3493189592Sbms igmp->ir_cksum = in_cksum(m, sizeof(struct igmp_report) + igmpreclen); 3494189592Sbms m->m_pkthdr.PH_vt.vt_nrecs = 0; 3495189592Sbms 3496189592Sbms m->m_data -= sizeof(struct ip); 3497189592Sbms m->m_len += sizeof(struct ip); 3498189592Sbms 3499189592Sbms ip = mtod(m, struct ip *); 3500189592Sbms ip->ip_tos = IPTOS_PREC_INTERNETCONTROL; 3501189592Sbms ip->ip_len = hdrlen + igmpreclen; 3502189592Sbms ip->ip_off = IP_DF; 3503189592Sbms ip->ip_p = IPPROTO_IGMP; 3504189592Sbms ip->ip_sum = 0; 3505189592Sbms 3506189592Sbms ip->ip_src.s_addr = INADDR_ANY; 3507189592Sbms 3508189592Sbms if (m->m_flags & M_IGMP_LOOP) { 3509189592Sbms struct in_ifaddr *ia; 3510189592Sbms 3511189592Sbms IFP_TO_IA(ifp, ia); 3512189592Sbms if (ia != NULL) 3513189592Sbms ip->ip_src = ia->ia_addr.sin_addr; 3514189592Sbms } 3515189592Sbms 3516189592Sbms ip->ip_dst.s_addr = htonl(INADDR_ALLRPTS_GROUP); 3517189592Sbms 3518189592Sbms return (m); 3519189592Sbms} 3520189592Sbms 3521189592Sbms#ifdef KTR 3522189592Sbmsstatic char * 3523189592Sbmsigmp_rec_type_to_str(const int type) 3524189592Sbms{ 3525189592Sbms 3526189592Sbms switch (type) { 3527189592Sbms case IGMP_CHANGE_TO_EXCLUDE_MODE: 3528189592Sbms return "TO_EX"; 3529189592Sbms break; 3530189592Sbms case IGMP_CHANGE_TO_INCLUDE_MODE: 3531189592Sbms return "TO_IN"; 3532189592Sbms break; 3533189592Sbms case IGMP_MODE_IS_EXCLUDE: 3534189592Sbms return "MODE_EX"; 3535189592Sbms break; 3536189592Sbms case IGMP_MODE_IS_INCLUDE: 3537189592Sbms return "MODE_IN"; 3538189592Sbms break; 3539189592Sbms case IGMP_ALLOW_NEW_SOURCES: 3540189592Sbms return "ALLOW_NEW"; 3541189592Sbms break; 3542189592Sbms case IGMP_BLOCK_OLD_SOURCES: 3543189592Sbms return "BLOCK_OLD"; 3544189592Sbms break; 3545189592Sbms default: 3546189592Sbms break; 3547189592Sbms } 3548189592Sbms return "unknown"; 3549189592Sbms} 3550189592Sbms#endif 3551189592Sbms 3552189592Sbmsstatic void 3553189592Sbmsigmp_sysinit(void) 3554189592Sbms{ 3555189592Sbms 3556189592Sbms CTR1(KTR_IGMPV3, "%s: initializing", __func__); 3557189592Sbms 3558189592Sbms IGMP_LOCK_INIT(); 3559189592Sbms 3560189592Sbms mtx_init(&igmpoq.ifq_mtx, "igmpoq_mtx", NULL, MTX_DEF); 3561189592Sbms IFQ_SET_MAXLEN(&igmpoq, IFQ_MAXLEN); 3562189592Sbms 3563189592Sbms m_raopt = igmp_ra_alloc(); 3564189592Sbms 3565191264Sbms netisr_register(NETISR_IGMP, igmp_intr, &igmpoq, 0); 3566189592Sbms} 3567189592Sbms 3568189592Sbmsstatic void 3569189592Sbmsigmp_sysuninit(void) 3570189592Sbms{ 3571189592Sbms 3572189592Sbms CTR1(KTR_IGMPV3, "%s: tearing down", __func__); 3573189592Sbms 3574189592Sbms netisr_unregister(NETISR_IGMP); 3575189592Sbms mtx_destroy(&igmpoq.ifq_mtx); 3576189592Sbms 3577189592Sbms m_free(m_raopt); 3578189592Sbms m_raopt = NULL; 3579189592Sbms 3580189592Sbms IGMP_LOCK_DESTROY(); 3581189592Sbms} 3582189592Sbms 3583189592Sbms/* 3584189592Sbms * Initialize an IGMPv3 instance. 3585189592Sbms * VIMAGE: Assumes curvnet set by caller and called per vimage. 3586189592Sbms */ 3587189592Sbmsstatic int 3588189592Sbmsvnet_igmp_iattach(const void *unused __unused) 3589189592Sbms{ 3590189592Sbms INIT_VNET_INET(curvnet); 3591189592Sbms 3592189592Sbms CTR1(KTR_IGMPV3, "%s: initializing", __func__); 3593189592Sbms 3594189592Sbms LIST_INIT(&V_igi_head); 3595189592Sbms 3596189592Sbms V_current_state_timers_running = 0; 3597189592Sbms V_state_change_timers_running = 0; 3598189592Sbms V_interface_timers_running = 0; 3599189592Sbms 3600189592Sbms /* 3601189592Sbms * Initialize sysctls to default values. 3602189592Sbms */ 3603189592Sbms V_igmp_recvifkludge = 1; 3604189592Sbms V_igmp_sendra = 1; 3605189592Sbms V_igmp_sendlocal = 1; 3606189592Sbms V_igmp_v1enable = 1; 3607189592Sbms V_igmp_v2enable = 1; 3608189592Sbms V_igmp_legacysupp = 0; 3609189592Sbms V_igmp_default_version = IGMP_VERSION_3; 3610189592Sbms V_igmp_gsrdelay.tv_sec = 10; 3611189592Sbms V_igmp_gsrdelay.tv_usec = 0; 3612189592Sbms 3613189592Sbms memset(&V_igmpstat, 0, sizeof(struct igmpstat)); 3614189592Sbms V_igmpstat.igps_version = IGPS_VERSION_3; 3615189592Sbms V_igmpstat.igps_len = sizeof(struct igmpstat); 3616189592Sbms 3617189592Sbms return (0); 3618189592Sbms} 3619189592Sbms 3620189592Sbmsstatic int 3621189592Sbmsvnet_igmp_idetach(const void *unused __unused) 3622189592Sbms{ 3623191734Szec#ifdef INVARIANTS 3624189592Sbms INIT_VNET_INET(curvnet); 3625191734Szec#endif 3626189592Sbms 3627189592Sbms CTR1(KTR_IGMPV3, "%s: tearing down", __func__); 3628189592Sbms 3629189592Sbms KASSERT(LIST_EMPTY(&V_igi_head), 3630189592Sbms ("%s: igi list not empty; ifnets not detached?", __func__)); 3631189592Sbms 3632189592Sbms return (0); 3633189592Sbms} 3634189592Sbms 3635191548Szec#ifndef VIMAGE_GLOBALS 3636191548Szecstatic vnet_modinfo_t vnet_igmp_modinfo = { 3637191548Szec .vmi_id = VNET_MOD_IGMP, 3638191548Szec .vmi_name = "igmp", 3639191548Szec .vmi_dependson = VNET_MOD_INET, 3640191548Szec .vmi_iattach = vnet_igmp_iattach, 3641191548Szec .vmi_idetach = vnet_igmp_idetach 3642189592Sbms}; 3643191548Szec#endif 3644189592Sbms 3645189592Sbmsstatic int 3646189592Sbmsigmp_modevent(module_t mod, int type, void *unused __unused) 3647189592Sbms{ 3648189592Sbms 3649189592Sbms switch (type) { 3650189592Sbms case MOD_LOAD: 3651189592Sbms igmp_sysinit(); 3652191548Szec#ifndef VIMAGE_GLOBALS 3653189592Sbms vnet_mod_register(&vnet_igmp_modinfo); 3654189592Sbms#else 3655191548Szec vnet_igmp_iattach(NULL); 3656191548Szec#endif 3657189592Sbms break; 3658189592Sbms case MOD_UNLOAD: 3659191548Szec#ifndef VIMAGE_GLOBALS 3660191548Szec vnet_mod_deregister(&vnet_igmp_modinfo); 3661189592Sbms#else 3662191548Szec vnet_igmp_idetach(NULL); 3663191548Szec#endif 3664189592Sbms igmp_sysuninit(); 3665189592Sbms break; 3666189592Sbms default: 3667189592Sbms return (EOPNOTSUPP); 3668189592Sbms } 3669189592Sbms return (0); 3670189592Sbms} 3671189592Sbms 3672189592Sbmsstatic moduledata_t igmp_mod = { 3673189592Sbms "igmp", 3674189592Sbms igmp_modevent, 3675189592Sbms 0 3676189592Sbms}; 3677189592SbmsDECLARE_MODULE(igmp, igmp_mod, SI_SUB_PSEUDO, SI_ORDER_ANY); 3678