/* in_var.h revision 194951 */
/*-
 * Copyright (c) 1985, 1986, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	@(#)in_var.h	8.2 (Berkeley) 1/9/95
 * $FreeBSD: head/sys/netinet/in_var.h 194951 2009-06-25 11:52:33Z rwatson $
 */

330SN/A#ifndef _NETINET_IN_VAR_H_
340SN/A#define _NETINET_IN_VAR_H_
350SN/A
360SN/A#include <sys/queue.h>
370SN/A#include <sys/fnv_hash.h>
380SN/A#include <sys/tree.h>
390SN/A
400SN/Astruct igmp_ifinfo;
410SN/Astruct in_multi;
420SN/Astruct lltable;
430SN/A
/*
 * IPv4 per-interface state: pointers to the interface's ARP table,
 * its IGMP state and its all-hosts (224.0.0.1) group membership.
 */
struct in_ifinfo {
	struct lltable		*ii_llt;	/* ARP state */
	struct igmp_ifinfo	*ii_igmp;	/* IGMP state */
	struct in_multi		*ii_allhosts;	/* 224.0.0.1 membership */
};

53/*
54 * Interface address, Internet version.  One of these structures
55 * is allocated for each Internet address on an interface.
56 * The ifaddr structure contains the protocol-independent part
57 * of the structure and is assumed to be first.
58 */
59struct in_ifaddr {
60	struct	ifaddr ia_ifa;		/* protocol-independent info */
61#define	ia_ifp		ia_ifa.ifa_ifp
62#define ia_flags	ia_ifa.ifa_flags
63					/* ia_{,sub}net{,mask} in host order */
64	u_long	ia_net;			/* network number of interface */
65	u_long	ia_netmask;		/* mask of net part */
66	u_long	ia_subnet;		/* subnet number, including net */
67	u_long	ia_subnetmask;		/* mask of subnet part */
68	struct	in_addr ia_netbroadcast; /* to recognize net broadcasts */
69	LIST_ENTRY(in_ifaddr) ia_hash;	/* entry in bucket of inet addresses */
70	TAILQ_ENTRY(in_ifaddr) ia_link;	/* list of internet addresses */
71	struct	sockaddr_in ia_addr;	/* reserve space for interface name */
72	struct	sockaddr_in ia_dstaddr; /* reserve space for broadcast addr */
73#define	ia_broadaddr	ia_dstaddr
74	struct	sockaddr_in ia_sockmask; /* reserve space for general netmask */
75};
76
77struct	in_aliasreq {
78	char	ifra_name[IFNAMSIZ];		/* if name, e.g. "en0" */
79	struct	sockaddr_in ifra_addr;
80	struct	sockaddr_in ifra_broadaddr;
81#define ifra_dstaddr ifra_broadaddr
82	struct	sockaddr_in ifra_mask;
83};
/*
 * Given a pointer to an in_ifaddr (ifaddr),
 * return a pointer to the addr as a sockaddr_in.
 * IA_DSTSIN() does the same for the destination address.
 * The argument is cast to struct in_ifaddr * before the member access,
 * so any pointer type naming the start of an in_ifaddr is accepted.
 */
#define	IA_SIN(ia)	(&(((struct in_ifaddr *)(ia))->ia_addr))
#define	IA_DSTSIN(ia)	(&(((struct in_ifaddr *)(ia))->ia_dstaddr))

/*
 * Local (host) part of an address: `in' converted to host byte order
 * with the subnet-mask bits of the interface address `ifa' cleared.
 *
 *	in	struct in_addr, network byte order
 *	ifa	pointer to the in_ifaddr (or its leading ifaddr)
 *
 * The cast is applied to `ifa' itself before ia_subnetmask is read,
 * and the expansion is fully parenthesized.
 */
#define	IN_LNAOF(in, ifa) \
	((ntohl((in).s_addr) & ~((struct in_ifaddr *)(ifa))->ia_subnetmask))


95#ifdef	_KERNEL
96extern	u_char	inetctlerrmap[];
97
/*
 * Link-layer table of an interface: treats the AF_INET slot of
 * ifp->if_afdata as a struct in_ifinfo and yields its ii_llt member.
 * The slot is dereferenced without a NULL check.
 */
#define	LLTABLE(ifp)	\
	(((struct in_ifinfo *)(ifp)->if_afdata[AF_INET])->ii_llt)
/*
 * Hash table for IP addresses.
 *
 * in_ifaddrhead is the tail-queue head type for the list of all
 * addresses (linked by ia_link); in_ifaddrhashhead is the list head
 * type of one hash bucket (linked by ia_hash).  The globals themselves
 * are only declared here when VIMAGE_GLOBALS is defined.
 */
TAILQ_HEAD(in_ifaddrhead, in_ifaddr);
LIST_HEAD(in_ifaddrhashhead, in_ifaddr);
#ifdef VIMAGE_GLOBALS
extern	struct in_ifaddrhashhead *in_ifaddrhashtbl;
extern	struct in_ifaddrhead in_ifaddrhead;
extern	u_long in_ifaddrhmask;			/* mask for hash table */
#endif

/*
 * INADDR_NHASH is 2^INADDR_NHASH_LOG2 (512).
 * INADDR_HASHVAL(x) runs fnv_32_buf() seeded with FNV1_32_INIT over the
 * bytes of x; it takes &(x), so x must be an lvalue.
 * INADDR_HASH(x) masks that value with V_in_ifaddrhmask and returns a
 * pointer to the selected bucket of V_in_ifaddrhashtbl.
 */
#define	INADDR_NHASH_LOG2	9
#define	INADDR_NHASH		(1 << INADDR_NHASH_LOG2)
#define	INADDR_HASHVAL(x)	fnv_32_buf((&(x)), sizeof(x), FNV1_32_INIT)
#define	INADDR_HASH(x) \
	(&V_in_ifaddrhashtbl[INADDR_HASHVAL(x) & V_in_ifaddrhmask])

/*
 * Reader/writer lock in_ifaddr_lock and its wrappers: initialisation,
 * read and write acquire/release, and assertions that the lock is held
 * (in any mode, read mode, or write mode respectively).
 * NOTE(review): presumably guards the in_ifaddr list and hash table
 * declared above -- confirm against the users of these macros.
 */
extern	struct rwlock in_ifaddr_lock;

#define	IN_IFADDR_LOCK_INIT()	rw_init(&in_ifaddr_lock, "in_ifaddr_lock")
#define	IN_IFADDR_LOCK_ASSERT()	rw_assert(&in_ifaddr_lock, RA_LOCKED)
#define	IN_IFADDR_RLOCK()	rw_rlock(&in_ifaddr_lock)
#define	IN_IFADDR_RLOCK_ASSERT()	rw_assert(&in_ifaddr_lock, RA_RLOCKED)
#define	IN_IFADDR_RUNLOCK()	rw_runlock(&in_ifaddr_lock)
#define	IN_IFADDR_WLOCK()	rw_wlock(&in_ifaddr_lock)
#define	IN_IFADDR_WLOCK_ASSERT()	rw_assert(&in_ifaddr_lock, RA_WLOCKED)
#define	IN_IFADDR_WUNLOCK()	rw_wunlock(&in_ifaddr_lock)

/*
 * Macro for finding the internet address structure (in_ifaddr)
 * corresponding to one of our IP addresses (in_addr).
 *
 * Walks the hash bucket selected by addr.s_addr and stops at the first
 * entry whose address matches.  `ia' is left NULL when the bucket holds
 * no match.  `addr' must be an lvalue (INADDR_HASH takes its address)
 * and is evaluated more than once.  No reference is taken on the result.
 */
#define INADDR_TO_IFADDR(addr, ia) \
	/* struct in_addr addr; */ \
	/* struct in_ifaddr *ia; */ \
do { \
\
	LIST_FOREACH(ia, INADDR_HASH((addr).s_addr), ia_hash) { \
		if (IA_SIN(ia)->sin_addr.s_addr == (addr).s_addr) \
			break; \
	} \
} while (0)

/*
 * Macro for finding the interface (ifnet structure) corresponding to one
 * of our IP addresses.
 *
 * Looks the address up with INADDR_TO_IFADDR() and stores the owning
 * interface in `ifp', or NULL when the address is not one of ours.
 * The scratch pointer is named `_ia' so that it cannot capture an `ia'
 * mentioned in the caller's `addr' or `ifp' expressions.
 *
 * The expansion is a bare compound statement, so write the call as a
 * statement of its own; `if (c) INADDR_TO_IFP(a, p); else ...' will not
 * parse.
 */
#define INADDR_TO_IFP(addr, ifp) \
	/* struct in_addr addr; */ \
	/* struct ifnet *ifp; */ \
{ \
	struct in_ifaddr *_ia; \
\
	INADDR_TO_IFADDR(addr, _ia); \
	(ifp) = (_ia == NULL) ? NULL : _ia->ia_ifp; \
}

/*
 * Macro for finding the internet address structure (in_ifaddr) corresponding
 * to a given interface (ifnet structure).
 *
 * Scans V_in_ifaddrhead from the front and leaves `ia' pointing at the
 * first entry whose ia_ifp equals `ifp', or NULL if there is none.
 * When an entry is found, ifa_ref() is called on its embedded ifaddr,
 * so the caller receives a reference along with the pointer.
 *
 * The expansion is a bare compound statement; use it as a statement of
 * its own rather than as the body of an unbraced if/else.
 */
#define IFP_TO_IA(ifp, ia)						\
	/* struct ifnet *ifp; */					\
	/* struct in_ifaddr *ia; */					\
{									\
	for ((ia) = TAILQ_FIRST(&V_in_ifaddrhead);			\
	    (ia) != NULL && (ia)->ia_ifp != (ifp);			\
	    (ia) = TAILQ_NEXT((ia), ia_link))				\
		continue;						\
	if ((ia) != NULL)						\
		ifa_ref(&(ia)->ia_ifa);					\
}
171#endif
172
/*
 * IP datagram reassembly.
 *
 * IPREASS_NHASH is 2^IPREASS_NHASH_LOG2 (64) and IPREASS_HMASK the
 * matching bit mask.  IPREASS_HASH(x, y) builds a byte from the low
 * nibble of x and the low nibble of x's second byte, XORs it with y and
 * masks the result into the range [0, IPREASS_NHASH).
 */
#define	IPREASS_NHASH_LOG2	6
#define	IPREASS_NHASH		(1 << IPREASS_NHASH_LOG2)
#define	IPREASS_HMASK		(IPREASS_NHASH - 1)
#define	IPREASS_HASH(x,y) \
	(((((x) & 0xF) | ((((x) >> 8) & 0xF) << 4)) ^ (y)) & IPREASS_HMASK)

/*
 * Legacy IPv4 IGMP per-link structure.
 * Instances are chained on a singly-linked list through rti_list.
 */
struct router_info {
	struct ifnet *rti_ifp;
	int    rti_type; /* type of router which is querier on this interface */
	int    rti_time; /* # of slow timeouts since last old query */
	SLIST_ENTRY(router_info) rti_list;
};

192/*
193 * Per-interface IGMP router version information.
194 */
195struct igmp_ifinfo {
196	LIST_ENTRY(igmp_ifinfo) igi_link;
197	struct ifnet *igi_ifp;	/* interface this instance belongs to */
198	uint32_t igi_version;	/* IGMPv3 Host Compatibility Mode */
199	uint32_t igi_v1_timer;	/* IGMPv1 Querier Present timer (s) */
200	uint32_t igi_v2_timer;	/* IGMPv2 Querier Present timer (s) */
201	uint32_t igi_v3_timer;	/* IGMPv3 General Query (interface) timer (s)*/
202	uint32_t igi_flags;	/* IGMP per-interface flags */
203	uint32_t igi_rv;	/* IGMPv3 Robustness Variable */
204	uint32_t igi_qi;	/* IGMPv3 Query Interval (s) */
205	uint32_t igi_qri;	/* IGMPv3 Query Response Interval (s) */
206	uint32_t igi_uri;	/* IGMPv3 Unsolicited Report Interval (s) */
207	SLIST_HEAD(,in_multi)	igi_relinmhead; /* released groups */
208	struct ifqueue	 igi_gq;	/* queue of general query responses */
209};
210
/* Bits for igmp_ifinfo.igi_flags. */
#define IGIF_SILENT	0x00000001	/* Do not use IGMP on this ifp */
#define IGIF_LOOPBACK	0x00000002	/* Send IGMP reports to loopback */

214/*
215 * IPv4 multicast IGMP-layer source entry.
216 */
217struct ip_msource {
218	RB_ENTRY(ip_msource)	ims_link;	/* RB tree links */
219	in_addr_t		ims_haddr;	/* host byte order */
220	struct ims_st {
221		uint16_t	ex;		/* # of exclusive members */
222		uint16_t	in;		/* # of inclusive members */
223	}			ims_st[2];	/* state at t0, t1 */
224	uint8_t			ims_stp;	/* pending query */
225};
226
227/*
228 * IPv4 multicast PCB-layer source entry.
229 */
230struct in_msource {
231	RB_ENTRY(ip_msource)	ims_link;	/* RB tree links */
232	in_addr_t		ims_haddr;	/* host byte order */
233	uint8_t			imsl_st[2];	/* state before/at commit */
234};
235
236RB_HEAD(ip_msource_tree, ip_msource);	/* define struct ip_msource_tree */
237
238static __inline int
239ip_msource_cmp(const struct ip_msource *a, const struct ip_msource *b)
240{
241
242	if (a->ims_haddr < b->ims_haddr)
243		return (-1);
244	if (a->ims_haddr == b->ims_haddr)
245		return (0);
246	return (1);
247}
248RB_PROTOTYPE(ip_msource_tree, ip_msource, ims_link, ip_msource_cmp);
249
250/*
251 * IPv4 multicast PCB-layer group filter descriptor.
252 */
253struct in_mfilter {
254	struct ip_msource_tree	imf_sources; /* source list for (S,G) */
255	u_long			imf_nsrc;    /* # of source entries */
256	uint8_t			imf_st[2];   /* state before/at commit */
257};
258
259/*
260 * IPv4 group descriptor.
261 *
262 * For every entry on an ifnet's if_multiaddrs list which represents
263 * an IP multicast group, there is one of these structures.
264 *
265 * If any source filters are present, then a node will exist in the RB-tree
266 * to permit fast lookup by source whenever an operation takes place.
267 * This permits pre-order traversal when we issue reports.
268 * Source filter trees are kept separately from the socket layer to
269 * greatly simplify locking.
270 *
271 * When IGMPv3 is active, inm_timer is the response to group query timer.
272 * The state-change timer inm_sctimer is separate; whenever state changes
273 * for the group the state change record is generated and transmitted,
274 * and kept if retransmissions are necessary.
275 *
276 * FUTURE: inm_link is now only used when groups are being purged
277 * on a detaching ifnet. It could be demoted to a SLIST_ENTRY, but
278 * because it is at the very start of the struct, we can't do this
279 * w/o breaking the ABI for ifmcstat.
280 */
281struct in_multi {
282	LIST_ENTRY(in_multi) inm_link;	/* to-be-released by in_ifdetach */
283	struct	in_addr inm_addr;	/* IP multicast address, convenience */
284	struct	ifnet *inm_ifp;		/* back pointer to ifnet */
285	struct	ifmultiaddr *inm_ifma;	/* back pointer to ifmultiaddr */
286	u_int	inm_timer;		/* IGMPv1/v2 group / v3 query timer */
287	u_int	inm_state;		/* state of the membership */
288	void	*inm_rti;		/* unused, legacy field */
289	u_int	inm_refcount;		/* reference count */
290
291	/* New fields for IGMPv3 follow. */
292	struct igmp_ifinfo	*inm_igi;	/* IGMP info */
293	SLIST_ENTRY(in_multi)	 inm_nrele;	/* to-be-released by IGMP */
294	struct ip_msource_tree	 inm_srcs;	/* tree of sources */
295	u_long			 inm_nsrc;	/* # of tree entries */
296
297	struct ifqueue		 inm_scq;	/* queue of pending
298						 * state-change packets */
299	struct timeval		 inm_lastgsrtv;	/* Time of last G-S-R query */
300	uint16_t		 inm_sctimer;	/* state-change timer */
301	uint16_t		 inm_scrv;	/* state-change rexmit count */
302
303	/*
304	 * SSM state counters which track state at T0 (the time the last
305	 * state-change report's RV timer went to zero) and T1
306	 * (time of pending report, i.e. now).
307	 * Used for computing IGMPv3 state-change reports. Several refcounts
308	 * are maintained here to optimize for common use-cases.
309	 */
310	struct inm_st {
311		uint16_t	iss_fmode;	/* IGMP filter mode */
312		uint16_t	iss_asm;	/* # of ASM listeners */
313		uint16_t	iss_ex;		/* # of exclusive members */
314		uint16_t	iss_in;		/* # of inclusive members */
315		uint16_t	iss_rec;	/* # of recorded sources */
316	}			inm_st[2];	/* state at t0, t1 */
317};
318
319/*
320 * Helper function to derive the filter mode on a source entry
321 * from its internal counters. Predicates are:
322 *  A source is only excluded if all listeners exclude it.
323 *  A source is only included if no listeners exclude it,
324 *  and at least one listener includes it.
325 * May be used by ifmcstat(8).
326 */
327static __inline uint8_t
328ims_get_mode(const struct in_multi *inm, const struct ip_msource *ims,
329    uint8_t t)
330{
331
332	t = !!t;
333	if (inm->inm_st[t].iss_ex > 0 &&
334	    inm->inm_st[t].iss_ex == ims->ims_st[t].ex)
335		return (MCAST_EXCLUDE);
336	else if (ims->ims_st[t].in > 0 && ims->ims_st[t].ex == 0)
337		return (MCAST_INCLUDE);
338	return (MCAST_UNDEFINED);
339}
340
341#ifdef _KERNEL
342
343#ifdef SYSCTL_DECL
344SYSCTL_DECL(_net_inet);
345SYSCTL_DECL(_net_inet_ip);
346SYSCTL_DECL(_net_inet_raw);
347#endif
348
349LIST_HEAD(in_multihead, in_multi);	/* XXX unused */
350#ifdef VIMAGE_GLOBALS
351extern struct in_multihead in_multihead;
352#endif
353
/*
 * Lock macros for IPv4 layer multicast address lists.  IPv4 lock goes
 * before link layer multicast locks in the lock order.  In most cases,
 * consumers of IN_*_MULTI() macros should acquire the locks before
 * calling them; users of the in_{add,del}multi() functions should not.
 *
 * The two assertion macros check that the calling thread does
 * (IN_MULTI_LOCK_ASSERT) or does not (IN_MULTI_UNLOCK_ASSERT) own
 * in_multi_mtx.
 */
extern struct mtx in_multi_mtx;
#define	IN_MULTI_LOCK()		mtx_lock(&in_multi_mtx)
#define	IN_MULTI_UNLOCK()	mtx_unlock(&in_multi_mtx)
#define	IN_MULTI_LOCK_ASSERT()	mtx_assert(&in_multi_mtx, MA_OWNED)
#define	IN_MULTI_UNLOCK_ASSERT() mtx_assert(&in_multi_mtx, MA_NOTOWNED)

366/*
367 * Function for looking up an in_multi record for an IPv4 multicast address
368 * on a given interface. ifp must be valid. If no record found, return NULL.
369 * The IN_MULTI_LOCK and IF_ADDR_LOCK on ifp must be held.
370 */
371static __inline struct in_multi *
372inm_lookup_locked(struct ifnet *ifp, const struct in_addr ina)
373{
374	struct ifmultiaddr *ifma;
375	struct in_multi *inm;
376
377	IN_MULTI_LOCK_ASSERT();
378	IF_ADDR_LOCK_ASSERT(ifp);
379
380	inm = NULL;
381	TAILQ_FOREACH(ifma, &((ifp)->if_multiaddrs), ifma_link) {
382		if (ifma->ifma_addr->sa_family == AF_INET) {
383			inm = (struct in_multi *)ifma->ifma_protospec;
384			if (inm->inm_addr.s_addr == ina.s_addr)
385				break;
386			inm = NULL;
387		}
388	}
389	return (inm);
390}
391
/*
 * Wrapper for inm_lookup_locked().
 * The IF_ADDR_LOCK will be taken on ifp and released on return.
 * The caller must already hold the IN_MULTI_LOCK, which is asserted.
 * Returns the matching in_multi record, or NULL if there is none.
 */
static __inline struct in_multi *
inm_lookup(struct ifnet *ifp, const struct in_addr ina)
{
	struct in_multi *inm;

	IN_MULTI_LOCK_ASSERT();
	IF_ADDR_LOCK(ifp);
	inm = inm_lookup_locked(ifp, ina);
	IF_ADDR_UNLOCK(ifp);

	return (inm);
}

409/* Acquire an in_multi record. */
410static __inline void
411inm_acquire_locked(struct in_multi *inm)
412{
413
414	IN_MULTI_LOCK_ASSERT();
415	++inm->inm_refcount;
416}
417
/*
 * Return values for imo_multi_filter().
 */
#define MCAST_PASS		0	/* Pass */
#define MCAST_NOTGMEMBER	1	/* This host not a member of group */
#define MCAST_NOTSMEMBER	2	/* This host excluded source */
#define MCAST_MUTED		3	/* [deprecated] */

426struct	rtentry;
427struct	route;
428struct	ip_moptions;
429
430int	imo_multi_filter(const struct ip_moptions *, const struct ifnet *,
431	    const struct sockaddr *, const struct sockaddr *);
432void	inm_commit(struct in_multi *);
433void	inm_clear_recorded(struct in_multi *);
434void	inm_print(const struct in_multi *);
435int	inm_record_source(struct in_multi *inm, const in_addr_t);
436void	inm_release(struct in_multi *);
437void	inm_release_locked(struct in_multi *);
438struct	in_multi *
439	in_addmulti(struct in_addr *, struct ifnet *);
440void	in_delmulti(struct in_multi *);
441int	in_joingroup(struct ifnet *, const struct in_addr *,
442	    /*const*/ struct in_mfilter *, struct in_multi **);
443int	in_joingroup_locked(struct ifnet *, const struct in_addr *,
444	    /*const*/ struct in_mfilter *, struct in_multi **);
445int	in_leavegroup(struct in_multi *, /*const*/ struct in_mfilter *);
446int	in_leavegroup_locked(struct in_multi *,
447	    /*const*/ struct in_mfilter *);
448int	in_control(struct socket *, u_long, caddr_t, struct ifnet *,
449	    struct thread *);
450void	in_rtqdrain(void);
451void	ip_input(struct mbuf *);
452int	in_ifadown(struct ifaddr *ifa, int);
453void	in_ifscrub(struct ifnet *, struct in_ifaddr *);
454struct	mbuf	*ip_fastforward(struct mbuf *);
455void	*in_domifattach(struct ifnet *);
456void	in_domifdetach(struct ifnet *, void *);
457
458
459/* XXX */
460void	 in_rtalloc_ign(struct route *ro, u_long ignflags, u_int fibnum);
461void	 in_rtalloc(struct route *ro, u_int fibnum);
462struct rtentry *in_rtalloc1(struct sockaddr *, int, u_long, u_int);
463void	 in_rtredirect(struct sockaddr *, struct sockaddr *,
464	    struct sockaddr *, int, struct sockaddr *, u_int);
465int	 in_rtrequest(int, struct sockaddr *,
466	    struct sockaddr *, struct sockaddr *, int, struct rtentry **, u_int);
467
468#if 0
469int	 in_rt_getifa(struct rt_addrinfo *, u_int fibnum);
470int	 in_rtioctl(u_long, caddr_t, u_int);
471int	 in_rtrequest1(int, struct rt_addrinfo *, struct rtentry **, u_int);
472#endif
473#endif /* _KERNEL */
474
475/* INET6 stuff */
476#include <netinet6/in6_var.h>
477
478#endif /* _NETINET_IN_VAR_H_ */
479