in_proto.c revision 223963
1/*-
2 * Copyright (c) 1982, 1986, 1993
3 *	The Regents of the University of California.  All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in the
12 *    documentation and/or other materials provided with the distribution.
13 * 4. Neither the name of the University nor the names of its contributors
14 *    may be used to endorse or promote products derived from this software
15 *    without specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
28 *
29 *	@(#)in_proto.c	8.2 (Berkeley) 2/9/95
30 */
31
32#include <sys/cdefs.h>
33__FBSDID("$FreeBSD: head/sys/netinet/in_proto.c 223963 2011-07-12 19:29:29Z tuexen $");
34
35#include "opt_ipx.h"
36#include "opt_mrouting.h"
37#include "opt_ipsec.h"
38#include "opt_inet.h"
39#include "opt_inet6.h"
40#include "opt_pf.h"
41#include "opt_sctp.h"
42#include "opt_mpath.h"
43
44#include <sys/param.h>
45#include <sys/systm.h>
46#include <sys/kernel.h>
47#include <sys/socket.h>
48#include <sys/domain.h>
49#include <sys/proc.h>
50#include <sys/protosw.h>
51#include <sys/queue.h>
52#include <sys/sysctl.h>
53
54/*
55 * While this file provides the domain and protocol switch tables for IPv4, it
56 * also provides the sysctl node declarations for net.inet.* often shared with
57 * IPv6 for common features or by upper layer protocols.  In case of no IPv4
58 * support compile out everything but these sysctl nodes.
59 */
60#ifdef INET
61#include <net/if.h>
62#include <net/route.h>
63#ifdef RADIX_MPATH
64#include <net/radix_mpath.h>
65#endif
66#include <net/vnet.h>
67#endif /* INET */
68
69#if defined(INET) || defined(INET6)
70#include <netinet/in.h>
71#endif
72
73#ifdef INET
74#include <netinet/in_systm.h>
75#include <netinet/in_var.h>
76#include <netinet/ip.h>
77#include <netinet/ip_var.h>
78#include <netinet/ip_icmp.h>
79#include <netinet/igmp_var.h>
80#include <netinet/tcp.h>
81#include <netinet/tcp_timer.h>
82#include <netinet/tcp_var.h>
83#include <netinet/udp.h>
84#include <netinet/udp_var.h>
85#include <netinet/ip_encap.h>
86
87/*
88 * TCP/IP protocol family: IP, ICMP, UDP, TCP.
89 */
90
/*
 * User-request switch with no members set in this file (it has no
 * initializer).  It is what the inetsw[] entries and the IPPROTOSPACER macro
 * point .pr_usrreqs at when they do not name a protocol-specific usrreqs
 * table (udp_usrreqs, tcp_usrreqs, sctp_usrreqs, rip_usrreqs).
 * NOTE(review): how the socket layer treats the unset members is decided
 * outside this file -- confirm before relying on any particular behaviour.
 */
91static struct pr_usrreqs nousrreqs;
92
93#ifdef IPSEC
94#include <netipsec/ipsec.h>
95#endif /* IPSEC */
96
97#ifdef SCTP
98#include <netinet/in_pcb.h>
99#include <netinet/sctp_pcb.h>
100#include <netinet/sctp.h>
101#include <netinet/sctp_var.h>
102#endif /* SCTP */
103
104#ifdef DEV_PFSYNC
105#include <net/pfvar.h>
106#include <net/if_pfsync.h>
107#endif
108
/*
 * FEATURE() entry named "inet" with the description string below.  It lives
 * inside the #ifdef INET region, so it only exists when IPv4 is compiled in.
 */
109FEATURE(inet, "Internet Protocol version 4");
110
/*
 * Forward declaration: inetdomain is defined after inetsw[] in this file,
 * but every inetsw[] entry (and IPPROTOSPACER) takes its address for
 * .pr_domain.
 */
111extern	struct domain inetdomain;
112
113/*
 * Spacer for loadable protocols.
 *
 * Expands to a brace-enclosed initializer for one inetsw[] element that sets
 * only the domain (inetdomain), the protocol number (PROTO_SPACER) and the
 * usrreqs pointer (nousrreqs); all members not named here are left
 * zero-initialized.  inetsw[] uses it for its placeholder elements.
 * How such a slot is later claimed by a loadable protocol is not visible in
 * this file.
 */
114#define IPPROTOSPACER   			\
115{						\
116	.pr_domain =		&inetdomain,	\
117	.pr_protocol =		PROTO_SPACER,	\
118	.pr_usrreqs =		&nousrreqs	\
119}
120
/*
 * IPv4 protocol switch table.
 *
 * Each element describes one (socket type, protocol) pair of inetdomain using
 * designated initializers; members that are not named are zero.  The table is
 * published through inetdomain.dom_protosw, with dom_protoswNPROTOSW pointing
 * one past its last element.
 *
 * Layout, in order: the IPPROTO_IP entry (pr_type 0), UDP, TCP, optional
 * SCTP, the raw protocols (RAW, ICMP, IGMP, RSVP, optional IPsec AH/ESP/
 * IPCOMP, the encap4_input-based tunnel protocols, optional pfsync), eight
 * IPPROTOSPACER placeholders, and finally the raw wildcard entry.
 * NOTE(review): consumers of this table may depend on the ordering (in
 * particular on the wildcard entry being last); do not reorder entries
 * without checking them.
 */
121struct protosw inetsw[] = {
/* IP itself: pr_type 0 and nousrreqs; only init, slow-timer and drain hooks. */
122{
123	.pr_type =		0,
124	.pr_domain =		&inetdomain,
125	.pr_protocol =		IPPROTO_IP,
126	.pr_init =		ip_init,
127#ifdef VIMAGE
128	.pr_destroy =		ip_destroy,
129#endif
130	.pr_slowtimo =		ip_slowtimo,
131	.pr_drain =		ip_drain,
132	.pr_usrreqs =		&nousrreqs
133},
/* UDP datagram sockets. */
134{
135	.pr_type =		SOCK_DGRAM,
136	.pr_domain =		&inetdomain,
137	.pr_protocol =		IPPROTO_UDP,
138	.pr_flags =		PR_ATOMIC|PR_ADDR,
139	.pr_input =		udp_input,
140	.pr_ctlinput =		udp_ctlinput,
141	.pr_ctloutput =		udp_ctloutput,
142	.pr_init =		udp_init,
143#ifdef VIMAGE
144	.pr_destroy =		udp_destroy,
145#endif
146	.pr_usrreqs =		&udp_usrreqs
147},
/* TCP stream sockets. */
148{
149	.pr_type =		SOCK_STREAM,
150	.pr_domain =		&inetdomain,
151	.pr_protocol =		IPPROTO_TCP,
152	.pr_flags =		PR_CONNREQUIRED|PR_IMPLOPCL|PR_WANTRCVD,
153	.pr_input =		tcp_input,
154	.pr_ctlinput =		tcp_ctlinput,
155	.pr_ctloutput =		tcp_ctloutput,
156	.pr_init =		tcp_init,
157#ifdef VIMAGE
158	.pr_destroy =		tcp_destroy,
159#endif
160	.pr_slowtimo =		tcp_slowtimo,
161	.pr_drain =		tcp_drain,
162	.pr_usrreqs =		&tcp_usrreqs
163},
164#ifdef SCTP
/*
 * SCTP over SOCK_SEQPACKET.  This is the SCTP entry that names sctp_init
 * (and sctp_finish under VIMAGE); the SOCK_STREAM entry below names neither.
 */
165{
166	.pr_type =		SOCK_SEQPACKET,
167	.pr_domain =		&inetdomain,
168	.pr_protocol =		IPPROTO_SCTP,
169	.pr_flags =		PR_WANTRCVD,
170	.pr_input =		sctp_input,
171	.pr_ctlinput =		sctp_ctlinput,
172	.pr_ctloutput =		sctp_ctloutput,
173	.pr_init =		sctp_init,
174#ifdef VIMAGE
175	.pr_destroy =		sctp_finish,
176#endif
177	.pr_drain =		sctp_drain,
178	.pr_usrreqs =		&sctp_usrreqs
179},
/*
 * SCTP over SOCK_STREAM (one-to-one style).  PR_CONNREQUIRED is set, as on
 * the TCP SOCK_STREAM entry above, so that the generic socket layer treats
 * these sockets as connection-oriented -- e.g. connect() on an already
 * connected socket is expected to fail with EISCONN rather than take the
 * disconnect-and-reconnect path used for connectionless protocols.
 */
180{
181	.pr_type =		SOCK_STREAM,
182	.pr_domain =		&inetdomain,
183	.pr_protocol =		IPPROTO_SCTP,
184	.pr_flags =		PR_CONNREQUIRED|PR_WANTRCVD,
185	.pr_input =		sctp_input,
186	.pr_ctlinput =		sctp_ctlinput,
187	.pr_ctloutput =		sctp_ctloutput,
188	.pr_drain =		sctp_drain,
189	.pr_usrreqs =		&sctp_usrreqs
190},
191#endif /* SCTP */
/* Raw IP sockets for IPPROTO_RAW. */
192{
193	.pr_type =		SOCK_RAW,
194	.pr_domain =		&inetdomain,
195	.pr_protocol =		IPPROTO_RAW,
196	.pr_flags =		PR_ATOMIC|PR_ADDR,
197	.pr_input =		rip_input,
198	.pr_ctlinput =		rip_ctlinput,
199	.pr_ctloutput =		rip_ctloutput,
200	.pr_usrreqs =		&rip_usrreqs
201},
/* ICMP: own input routine; socket side shares rip_ctloutput/rip_usrreqs. */
202{
203	.pr_type =		SOCK_RAW,
204	.pr_domain =		&inetdomain,
205	.pr_protocol =		IPPROTO_ICMP,
206	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
207	.pr_input =		icmp_input,
208	.pr_ctloutput =		rip_ctloutput,
209	.pr_usrreqs =		&rip_usrreqs
210},
/* IGMP: own input routine plus fast and slow timers; raw socket side. */
211{
212	.pr_type =		SOCK_RAW,
213	.pr_domain =		&inetdomain,
214	.pr_protocol =		IPPROTO_IGMP,
215	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
216	.pr_input =		igmp_input,
217	.pr_ctloutput =		rip_ctloutput,
218	.pr_fasttimo =		igmp_fasttimo,
219	.pr_slowtimo =		igmp_slowtimo,
220	.pr_usrreqs =		&rip_usrreqs
221},
/* RSVP: own input routine; raw socket side. */
222{
223	.pr_type =		SOCK_RAW,
224	.pr_domain =		&inetdomain,
225	.pr_protocol =		IPPROTO_RSVP,
226	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
227	.pr_input =		rsvp_input,
228	.pr_ctloutput =		rip_ctloutput,
229	.pr_usrreqs =		&rip_usrreqs
230},
230#ifdef IPSEC
/*
 * IPsec AH, ESP and IPCOMP.  All three use nousrreqs and name no ctloutput;
 * AH and ESP also name a ctlinput routine, IPCOMP does not.
 */
232{
233	.pr_type =		SOCK_RAW,
234	.pr_domain =		&inetdomain,
235	.pr_protocol =		IPPROTO_AH,
236	.pr_flags =		PR_ATOMIC|PR_ADDR,
237	.pr_input =		ah4_input,
238	.pr_ctlinput =		ah4_ctlinput,
239	.pr_usrreqs =		&nousrreqs
240},
241{
242	.pr_type =		SOCK_RAW,
243	.pr_domain =		&inetdomain,
244	.pr_protocol =		IPPROTO_ESP,
245	.pr_flags =		PR_ATOMIC|PR_ADDR,
246	.pr_input =		esp4_input,
247	.pr_ctlinput =		esp4_ctlinput,
248	.pr_usrreqs =		&nousrreqs
249},
250{
251	.pr_type =		SOCK_RAW,
252	.pr_domain =		&inetdomain,
253	.pr_protocol =		IPPROTO_IPCOMP,
254	.pr_flags =		PR_ATOMIC|PR_ADDR,
255	.pr_input =		ipcomp4_input,
256	.pr_usrreqs =		&nousrreqs
257},
258#endif /* IPSEC */
/*
 * Encapsulation protocols (IPV4, MOBILE, ETHERIP, GRE and, with INET6,
 * IPV6): input goes through encap4_input and each entry names encap_init as
 * its pr_init; the socket side is the raw-IP one.
 */
259{
260	.pr_type =		SOCK_RAW,
261	.pr_domain =		&inetdomain,
262	.pr_protocol =		IPPROTO_IPV4,
263	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
264	.pr_input =		encap4_input,
265	.pr_ctloutput =		rip_ctloutput,
266	.pr_init =		encap_init,
267	.pr_usrreqs =		&rip_usrreqs
268},
269{
270	.pr_type =		SOCK_RAW,
271	.pr_domain =		&inetdomain,
272	.pr_protocol =		IPPROTO_MOBILE,
273	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
274	.pr_input =		encap4_input,
275	.pr_ctloutput =		rip_ctloutput,
276	.pr_init =		encap_init,
277	.pr_usrreqs =		&rip_usrreqs
278},
279{
280	.pr_type =		SOCK_RAW,
281	.pr_domain =		&inetdomain,
282	.pr_protocol =		IPPROTO_ETHERIP,
283	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
284	.pr_input =		encap4_input,
285	.pr_ctloutput =		rip_ctloutput,
286	.pr_init =		encap_init,
287	.pr_usrreqs =		&rip_usrreqs
288},
289{
290	.pr_type =		SOCK_RAW,
291	.pr_domain =		&inetdomain,
292	.pr_protocol =		IPPROTO_GRE,
293	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
294	.pr_input =		encap4_input,
295	.pr_ctloutput =		rip_ctloutput,
296	.pr_init =		encap_init,
297	.pr_usrreqs =		&rip_usrreqs
298},
299# ifdef INET6
300{
301	.pr_type =		SOCK_RAW,
302	.pr_domain =		&inetdomain,
303	.pr_protocol =		IPPROTO_IPV6,
304	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
305	.pr_input =		encap4_input,
306	.pr_ctloutput =		rip_ctloutput,
307	.pr_init =		encap_init,
308	.pr_usrreqs =		&rip_usrreqs
309},
310#endif
/* PIM also goes through encap4_input but, unlike the above, names no pr_init. */
311{
312	.pr_type =		SOCK_RAW,
313	.pr_domain =		&inetdomain,
314	.pr_protocol =		IPPROTO_PIM,
315	.pr_flags =		PR_ATOMIC|PR_ADDR|PR_LASTHDR,
316	.pr_input =		encap4_input,
317	.pr_ctloutput =		rip_ctloutput,
318	.pr_usrreqs =		&rip_usrreqs
319},
320#ifdef DEV_PFSYNC
/* pfsync: own input routine; raw socket side. */
321{
322	.pr_type =		SOCK_RAW,
323	.pr_domain =		&inetdomain,
324	.pr_protocol =		IPPROTO_PFSYNC,
325	.pr_flags =		PR_ATOMIC|PR_ADDR,
326	.pr_input =		pfsync_input,
327	.pr_ctloutput =		rip_ctloutput,
328	.pr_usrreqs =		&rip_usrreqs
329},
330#endif	/* DEV_PFSYNC */
331/* Eight spacer slots (see IPPROTOSPACER) reserved for loadable protocols. */
332IPPROTOSPACER,
333IPPROTOSPACER,
334IPPROTOSPACER,
335IPPROTOSPACER,
336IPPROTOSPACER,
337IPPROTOSPACER,
338IPPROTOSPACER,
339IPPROTOSPACER,
340/*
 * Raw wildcard: .pr_protocol is not named, so it is 0.  This is the entry
 * that carries the raw-IP init hook (rip_init, plus rip_destroy under
 * VIMAGE).
 */
341{
342	.pr_type =		SOCK_RAW,
343	.pr_domain =		&inetdomain,
344	.pr_flags =		PR_ATOMIC|PR_ADDR,
345	.pr_input =		rip_input,
346	.pr_ctloutput =		rip_ctloutput,
347	.pr_init =		rip_init,
348#ifdef VIMAGE
349	.pr_destroy =		rip_destroy,
350#endif
351	.pr_usrreqs =		&rip_usrreqs
352},
353};
354
/*
 * Prototypes for the routing-table hooks that inetdomain names below:
 * in_inithead as .dom_rtattach (when RADIX_MPATH is not defined) and
 * in_detachhead as .dom_rtdetach (under VIMAGE).  They are declared here
 * directly rather than through one of the headers included above.
 */
355extern int in_inithead(void **, int);
356extern int in_detachhead(void **, int);
357
/*
 * Domain descriptor for AF_INET ("internet").  It ties the inetsw[] protocol
 * switch table to the address family and names the routing-table and
 * per-interface attach/detach hooks for IPv4.
 */
358struct domain inetdomain = {
359	.dom_family =		AF_INET,
360	.dom_name =		"internet",
361	.dom_protosw =		inetsw,
	/* One past the last element of inetsw[] (element count via sizeof). */
362	.dom_protoswNPROTOSW =	&inetsw[sizeof(inetsw)/sizeof(inetsw[0])],
	/* With RADIX_MPATH the multipath-aware init routine is used instead. */
363#ifdef RADIX_MPATH
364	.dom_rtattach =		rn4_mpath_inithead,
365#else
366	.dom_rtattach =		in_inithead,
367#endif
368#ifdef VIMAGE
369	.dom_rtdetach =		in_detachhead,
370#endif
	/*
	 * NOTE(review): 32 is presumably the bit offset of the address within
	 * the routing key (struct sockaddr_in) -- confirm against the routing
	 * code; the value is not explained in this file.
	 */
371	.dom_rtoffset =		32,
372	.dom_maxrtkey =		sizeof(struct sockaddr_in),
373	.dom_ifattach =		in_domifattach,
374	.dom_ifdetach =		in_domifdetach
375};
376
/*
 * NOTE(review): presumably registers inetdomain (name formed from "inet")
 * with the domain framework; the macro's definition is not in this file.
 */
377VNET_DOMAIN_SET(inet);
378#endif /* INET */
379
/*
 * sysctl node declarations for net.inet and its per-protocol children.
 *
 * These sit after the "#endif (INET)" above on purpose: as the comment near
 * the top of the file says, the nodes are shared with IPv6 and upper layer
 * protocols and must exist even when IPv4 itself is compiled out.
 *
 * The first declaration creates "inet" under _net, numbered PF_INET; the
 * rest create children of _net_inet, each numbered with its IPPROTO_*
 * constant (except ipsec, see below).  All are CTLFLAG_RW with a 0 handler
 * argument.  The sctp, IPsec-related and pfsync nodes exist only when the
 * corresponding option (SCTP, IPSEC, DEV_PFSYNC) is defined.
 */
380SYSCTL_NODE(_net,      PF_INET,		inet,	CTLFLAG_RW, 0,
381	"Internet Family");
382
383SYSCTL_NODE(_net_inet, IPPROTO_IP,	ip,	CTLFLAG_RW, 0,	"IP");
384SYSCTL_NODE(_net_inet, IPPROTO_ICMP,	icmp,	CTLFLAG_RW, 0,	"ICMP");
385SYSCTL_NODE(_net_inet, IPPROTO_UDP,	udp,	CTLFLAG_RW, 0,	"UDP");
386SYSCTL_NODE(_net_inet, IPPROTO_TCP,	tcp,	CTLFLAG_RW, 0,	"TCP");
387#ifdef SCTP
388SYSCTL_NODE(_net_inet, IPPROTO_SCTP,	sctp,	CTLFLAG_RW, 0,	"SCTP");
389#endif
390SYSCTL_NODE(_net_inet, IPPROTO_IGMP,	igmp,	CTLFLAG_RW, 0,	"IGMP");
391#ifdef IPSEC
392/*
 * XXX no protocol # to use, pick something "reserved".
 * The ipsec node is therefore numbered with the literal 253 rather than an
 * IPPROTO_* constant.
 */
393SYSCTL_NODE(_net_inet, 253,		ipsec,	CTLFLAG_RW, 0,	"IPSEC");
394SYSCTL_NODE(_net_inet, IPPROTO_AH,	ah,	CTLFLAG_RW, 0,	"AH");
395SYSCTL_NODE(_net_inet, IPPROTO_ESP,	esp,	CTLFLAG_RW, 0,	"ESP");
396SYSCTL_NODE(_net_inet, IPPROTO_IPCOMP,	ipcomp,	CTLFLAG_RW, 0,	"IPCOMP");
397SYSCTL_NODE(_net_inet, IPPROTO_IPIP,	ipip,	CTLFLAG_RW, 0,	"IPIP");
398#endif /* IPSEC */
399SYSCTL_NODE(_net_inet, IPPROTO_RAW,	raw,	CTLFLAG_RW, 0,	"RAW");
400#ifdef DEV_PFSYNC
401SYSCTL_NODE(_net_inet, IPPROTO_PFSYNC,	pfsync,	CTLFLAG_RW, 0,	"PFSYNC");
402#endif
402#endif
403