udp6_usrreq.c revision 182537
1/*-
2 * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in the
12 *    documentation and/or other materials provided with the distribution.
13 * 3. Neither the name of the project nor the names of its contributors
14 *    may be used to endorse or promote products derived from this software
15 *    without specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
28 *
29 *	$KAME: udp6_usrreq.c,v 1.27 2001/05/21 05:45:10 jinmei Exp $
30 *	$KAME: udp6_output.c,v 1.31 2001/05/21 16:39:15 jinmei Exp $
31 */
32
33/*-
34 * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995
35 *	The Regents of the University of California.
36 * All rights reserved.
37 *
38 * Redistribution and use in source and binary forms, with or without
39 * modification, are permitted provided that the following conditions
40 * are met:
41 * 1. Redistributions of source code must retain the above copyright
42 *    notice, this list of conditions and the following disclaimer.
43 * 2. Redistributions in binary form must reproduce the above copyright
44 *    notice, this list of conditions and the following disclaimer in the
45 *    documentation and/or other materials provided with the distribution.
46 * 4. Neither the name of the University nor the names of its contributors
47 *    may be used to endorse or promote products derived from this software
48 *    without specific prior written permission.
49 *
50 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
51 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
52 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
53 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
54 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
55 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
56 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
57 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
58 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
59 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
60 * SUCH DAMAGE.
61 *
62 *	@(#)udp_usrreq.c	8.6 (Berkeley) 5/23/95
63 */
64
65#include <sys/cdefs.h>
66__FBSDID("$FreeBSD: head/sys/netinet6/udp6_usrreq.c 182537 2008-08-31 13:16:45Z rwatson $");
67
68#include "opt_inet.h"
69#include "opt_inet6.h"
70#include "opt_ipsec.h"
71#include "opt_mac.h"
72
73#include <sys/param.h>
74#include <sys/kernel.h>
75#include <sys/lock.h>
76#include <sys/mbuf.h>
77#include <sys/priv.h>
78#include <sys/proc.h>
79#include <sys/protosw.h>
80#include <sys/signalvar.h>
81#include <sys/socket.h>
82#include <sys/socketvar.h>
83#include <sys/sx.h>
84#include <sys/sysctl.h>
85#include <sys/syslog.h>
86#include <sys/systm.h>
87#include <sys/vimage.h>
88
89#include <net/if.h>
90#include <net/if_types.h>
91#include <net/route.h>
92
93#include <netinet/in.h>
94#include <netinet/in_pcb.h>
95#include <netinet/in_systm.h>
96#include <netinet/in_var.h>
97#include <netinet/ip.h>
98#include <netinet/ip_icmp.h>
99#include <netinet/ip6.h>
100#include <netinet/icmp_var.h>
101#include <netinet/icmp6.h>
102#include <netinet/ip_var.h>
103#include <netinet/udp.h>
104#include <netinet/udp_var.h>
105#include <netinet6/ip6protosw.h>
106#include <netinet6/ip6_var.h>
107#include <netinet6/in6_pcb.h>
108#include <netinet6/udp6_var.h>
109#include <netinet6/scope6_var.h>
110
111#ifdef IPSEC
112#include <netipsec/ipsec.h>
113#include <netipsec/ipsec6.h>
114#endif /* IPSEC */
115
116#include <security/mac/mac_framework.h>
117
118/*
119 * UDP protocol implementation.
120 * Per RFC 768, August, 1980.
121 */
122
123extern struct protosw	inetsw[];
124static void		udp6_detach(struct socket *so);
125
126static void
127udp6_append(struct inpcb *inp, struct mbuf *n, int off,
128    struct sockaddr_in6 *fromsa)
129{
130	struct socket *so;
131	struct mbuf *opts;
132
133	INP_LOCK_ASSERT(inp);
134
135#ifdef IPSEC
136	/* Check AH/ESP integrity. */
137	if (ipsec6_in_reject(n, inp)) {
138		m_freem(n);
139		V_ipsec6stat.in_polvio++;
140		return;
141	}
142#endif /* IPSEC */
143#ifdef MAC
144	if (mac_inpcb_check_deliver(inp, n) != 0) {
145		m_freem(n);
146		return;
147	}
148#endif
149	opts = NULL;
150	if (inp->in6p_flags & IN6P_CONTROLOPTS ||
151	    inp->inp_socket->so_options & SO_TIMESTAMP)
152		ip6_savecontrol(inp, n, &opts);
153	m_adj(n, off + sizeof(struct udphdr));
154
155	so = inp->inp_socket;
156	SOCKBUF_LOCK(&so->so_rcv);
157	if (sbappendaddr_locked(&so->so_rcv, (struct sockaddr *)fromsa, n,
158	    opts) == 0) {
159		SOCKBUF_UNLOCK(&so->so_rcv);
160		m_freem(n);
161		if (opts)
162			m_freem(opts);
163		V_udpstat.udps_fullsock++;
164	} else
165		sorwakeup_locked(so);
166}
167
168int
169udp6_input(struct mbuf **mp, int *offp, int proto)
170{
171	struct mbuf *m = *mp;
172	struct ip6_hdr *ip6;
173	struct udphdr *uh;
174	struct inpcb *inp;
175	int off = *offp;
176	int plen, ulen;
177	struct sockaddr_in6 fromsa;
178
179	ip6 = mtod(m, struct ip6_hdr *);
180
181	if (faithprefix_p != NULL && (*faithprefix_p)(&ip6->ip6_dst)) {
182		/* XXX send icmp6 host/port unreach? */
183		m_freem(m);
184		return (IPPROTO_DONE);
185	}
186
187#ifndef PULLDOWN_TEST
188	IP6_EXTHDR_CHECK(m, off, sizeof(struct udphdr), IPPROTO_DONE);
189	ip6 = mtod(m, struct ip6_hdr *);
190	uh = (struct udphdr *)((caddr_t)ip6 + off);
191#else
192	IP6_EXTHDR_GET(uh, struct udphdr *, m, off, sizeof(*uh));
193	if (!uh)
194		return (IPPROTO_DONE);
195#endif
196
197	V_udpstat.udps_ipackets++;
198
199	/*
200	 * Destination port of 0 is illegal, based on RFC768.
201	 */
202	if (uh->uh_dport == 0)
203		goto badunlocked;
204
205	plen = ntohs(ip6->ip6_plen) - off + sizeof(*ip6);
206	ulen = ntohs((u_short)uh->uh_ulen);
207
208	if (plen != ulen) {
209		V_udpstat.udps_badlen++;
210		goto badunlocked;
211	}
212
213	/*
214	 * Checksum extended UDP header and data.
215	 */
216	if (uh->uh_sum == 0) {
217		V_udpstat.udps_nosum++;
218		goto badunlocked;
219	}
220	if (in6_cksum(m, IPPROTO_UDP, off, ulen) != 0) {
221		V_udpstat.udps_badsum++;
222		goto badunlocked;
223	}
224
225	/*
226	 * Construct sockaddr format source address.
227	 */
228	init_sin6(&fromsa, m);
229	fromsa.sin6_port = uh->uh_sport;
230
231	INP_INFO_RLOCK(&V_udbinfo);
232	if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst)) {
233		struct inpcb *last;
234
235		/*
236		 * In the event that laddr should be set to the link-local
237		 * address (this happens in RIPng), the multicast address
238		 * specified in the received packet will not match laddr.  To
239		 * handle this situation, matching is relaxed if the
240		 * receiving interface is the same as one specified in the
241		 * socket and if the destination multicast address matches
242		 * one of the multicast groups specified in the socket.
243		 */
244
245		/*
246		 * KAME note: traditionally we dropped udpiphdr from mbuf
247		 * here.  We need udphdr for IPsec processing so we do that
248		 * later.
249		 */
250		last = NULL;
251		LIST_FOREACH(inp, &V_udb, inp_list) {
252			if ((inp->inp_vflag & INP_IPV6) == 0)
253				continue;
254			if (inp->in6p_lport != uh->uh_dport)
255				continue;
256			/*
257			 * XXX: Do not check source port of incoming datagram
258			 * unless inp_connect() has been called to bind the
259			 * fport part of the 4-tuple; the source could be
260			 * trying to talk to us with an ephemeral port.
261			 */
262			if (inp->inp_fport != 0 &&
263			    inp->inp_fport != uh->uh_sport)
264				continue;
265			if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) {
266				if (!IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr,
267							&ip6->ip6_dst))
268					continue;
269			}
270			if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) {
271				if (!IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr,
272							&ip6->ip6_src) ||
273				    inp->in6p_fport != uh->uh_sport)
274					continue;
275			}
276
277			if (last != NULL) {
278				struct mbuf *n;
279
280				if ((n = m_copy(m, 0, M_COPYALL)) != NULL) {
281					INP_RLOCK(last);
282					udp6_append(last, n, off, &fromsa);
283					INP_RUNLOCK(last);
284				}
285			}
286			last = inp;
287			/*
288			 * Don't look for additional matches if this one does
289			 * not have either the SO_REUSEPORT or SO_REUSEADDR
290			 * socket options set.  This heuristic avoids
291			 * searching through all pcbs in the common case of a
292			 * non-shared port.  It assumes that an application
293			 * will never clear these options after setting them.
294			 */
295			if ((last->inp_socket->so_options &
296			     (SO_REUSEPORT|SO_REUSEADDR)) == 0)
297				break;
298		}
299
300		if (last == NULL) {
301			/*
302			 * No matching pcb found; discard datagram.  (No need
303			 * to send an ICMP Port Unreachable for a broadcast
304			 * or multicast datgram.)
305			 */
306			V_udpstat.udps_noport++;
307			V_udpstat.udps_noportmcast++;
308			goto badheadlocked;
309		}
310		INP_RLOCK(last);
311		INP_INFO_RUNLOCK(&V_udbinfo);
312		udp6_append(last, m, off, &fromsa);
313		INP_RUNLOCK(last);
314		return (IPPROTO_DONE);
315	}
316	/*
317	 * Locate pcb for datagram.
318	 */
319	inp = in6_pcblookup_hash(&V_udbinfo, &ip6->ip6_src, uh->uh_sport,
320	    &ip6->ip6_dst, uh->uh_dport, 1, m->m_pkthdr.rcvif);
321	if (inp == NULL) {
322		if (udp_log_in_vain) {
323			char ip6bufs[INET6_ADDRSTRLEN];
324			char ip6bufd[INET6_ADDRSTRLEN];
325
326			log(LOG_INFO,
327			    "Connection attempt to UDP [%s]:%d from [%s]:%d\n",
328			    ip6_sprintf(ip6bufd, &ip6->ip6_dst),
329			    ntohs(uh->uh_dport),
330			    ip6_sprintf(ip6bufs, &ip6->ip6_src),
331			    ntohs(uh->uh_sport));
332		}
333		V_udpstat.udps_noport++;
334		if (m->m_flags & M_MCAST) {
335			printf("UDP6: M_MCAST is set in a unicast packet.\n");
336			V_udpstat.udps_noportmcast++;
337			goto badheadlocked;
338		}
339		INP_INFO_RUNLOCK(&V_udbinfo);
340		if (V_udp_blackhole)
341			goto badunlocked;
342		if (badport_bandlim(BANDLIM_ICMP6_UNREACH) < 0)
343			goto badunlocked;
344		icmp6_error(m, ICMP6_DST_UNREACH, ICMP6_DST_UNREACH_NOPORT, 0);
345		return (IPPROTO_DONE);
346	}
347	INP_RLOCK(inp);
348	INP_INFO_RUNLOCK(&V_udbinfo);
349	udp6_append(inp, m, off, &fromsa);
350	INP_RUNLOCK(inp);
351	return (IPPROTO_DONE);
352
353badheadlocked:
354	INP_INFO_RUNLOCK(&V_udbinfo);
355badunlocked:
356	if (m)
357		m_freem(m);
358	return (IPPROTO_DONE);
359}
360
361void
362udp6_ctlinput(int cmd, struct sockaddr *sa, void *d)
363{
364	struct udphdr uh;
365	struct ip6_hdr *ip6;
366	struct mbuf *m;
367	int off = 0;
368	struct ip6ctlparam *ip6cp = NULL;
369	const struct sockaddr_in6 *sa6_src = NULL;
370	void *cmdarg;
371	struct inpcb *(*notify)(struct inpcb *, int) = udp_notify;
372	struct udp_portonly {
373		u_int16_t uh_sport;
374		u_int16_t uh_dport;
375	} *uhp;
376
377	if (sa->sa_family != AF_INET6 ||
378	    sa->sa_len != sizeof(struct sockaddr_in6))
379		return;
380
381	if ((unsigned)cmd >= PRC_NCMDS)
382		return;
383	if (PRC_IS_REDIRECT(cmd))
384		notify = in6_rtchange, d = NULL;
385	else if (cmd == PRC_HOSTDEAD)
386		d = NULL;
387	else if (inet6ctlerrmap[cmd] == 0)
388		return;
389
390	/* if the parameter is from icmp6, decode it. */
391	if (d != NULL) {
392		ip6cp = (struct ip6ctlparam *)d;
393		m = ip6cp->ip6c_m;
394		ip6 = ip6cp->ip6c_ip6;
395		off = ip6cp->ip6c_off;
396		cmdarg = ip6cp->ip6c_cmdarg;
397		sa6_src = ip6cp->ip6c_src;
398	} else {
399		m = NULL;
400		ip6 = NULL;
401		cmdarg = NULL;
402		sa6_src = &sa6_any;
403	}
404
405	if (ip6) {
406		/*
407		 * XXX: We assume that when IPV6 is non NULL,
408		 * M and OFF are valid.
409		 */
410
411		/* Check if we can safely examine src and dst ports. */
412		if (m->m_pkthdr.len < off + sizeof(*uhp))
413			return;
414
415		bzero(&uh, sizeof(uh));
416		m_copydata(m, off, sizeof(*uhp), (caddr_t)&uh);
417
418		(void) in6_pcbnotify(&V_udbinfo, sa, uh.uh_dport,
419		    (struct sockaddr *)ip6cp->ip6c_src, uh.uh_sport, cmd,
420		    cmdarg, notify);
421	} else
422		(void) in6_pcbnotify(&V_udbinfo, sa, 0,
423		    (const struct sockaddr *)sa6_src, 0, cmd, cmdarg, notify);
424}
425
426static int
427udp6_getcred(SYSCTL_HANDLER_ARGS)
428{
429	struct xucred xuc;
430	struct sockaddr_in6 addrs[2];
431	struct inpcb *inp;
432	int error;
433
434	error = priv_check(req->td, PRIV_NETINET_GETCRED);
435	if (error)
436		return (error);
437
438	if (req->newlen != sizeof(addrs))
439		return (EINVAL);
440	if (req->oldlen != sizeof(struct xucred))
441		return (EINVAL);
442	error = SYSCTL_IN(req, addrs, sizeof(addrs));
443	if (error)
444		return (error);
445	if ((error = sa6_embedscope(&addrs[0], V_ip6_use_defzone)) != 0 ||
446	    (error = sa6_embedscope(&addrs[1], V_ip6_use_defzone)) != 0) {
447		return (error);
448	}
449	INP_INFO_RLOCK(&V_udbinfo);
450	inp = in6_pcblookup_hash(&V_udbinfo, &addrs[1].sin6_addr,
451	    addrs[1].sin6_port, &addrs[0].sin6_addr, addrs[0].sin6_port, 1,
452	    NULL);
453	if (inp != NULL) {
454		INP_RLOCK(inp);
455		INP_INFO_RUNLOCK(&V_udbinfo);
456		if (inp->inp_socket == NULL)
457			error = ENOENT;
458		if (error == 0)
459			error = cr_canseesocket(req->td->td_ucred,
460			    inp->inp_socket);
461		if (error == 0)
462			cru2x(inp->inp_socket->so_cred, &xuc);
463		INP_RUNLOCK(inp);
464	} else {
465		INP_INFO_RUNLOCK(&V_udbinfo);
466		error = ENOENT;
467	}
468	if (error == 0)
469		error = SYSCTL_OUT(req, &xuc, sizeof(struct xucred));
470	return (error);
471}
472
473SYSCTL_PROC(_net_inet6_udp6, OID_AUTO, getcred, CTLTYPE_OPAQUE|CTLFLAG_RW, 0,
474    0, udp6_getcred, "S,xucred", "Get the xucred of a UDP6 connection");
475
476static int
477udp6_output(struct inpcb *inp, struct mbuf *m, struct sockaddr *addr6,
478    struct mbuf *control, struct thread *td)
479{
480	u_int32_t ulen = m->m_pkthdr.len;
481	u_int32_t plen = sizeof(struct udphdr) + ulen;
482	struct ip6_hdr *ip6;
483	struct udphdr *udp6;
484	struct in6_addr *laddr, *faddr;
485	struct sockaddr_in6 *sin6 = NULL;
486	struct ifnet *oifp = NULL;
487	int scope_ambiguous = 0;
488	u_short fport;
489	int error = 0;
490	struct ip6_pktopts *optp, opt;
491	int af = AF_INET6, hlen = sizeof(struct ip6_hdr);
492	int flags;
493	struct sockaddr_in6 tmp;
494
495	INP_WLOCK_ASSERT(inp);
496
497	if (addr6) {
498		/* addr6 has been validated in udp6_send(). */
499		sin6 = (struct sockaddr_in6 *)addr6;
500
501		/* protect *sin6 from overwrites */
502		tmp = *sin6;
503		sin6 = &tmp;
504
505		/*
506		 * Application should provide a proper zone ID or the use of
507		 * default zone IDs should be enabled.  Unfortunately, some
508		 * applications do not behave as it should, so we need a
509		 * workaround.  Even if an appropriate ID is not determined,
510		 * we'll see if we can determine the outgoing interface.  If we
511		 * can, determine the zone ID based on the interface below.
512		 */
513		if (sin6->sin6_scope_id == 0 && !V_ip6_use_defzone)
514			scope_ambiguous = 1;
515		if ((error = sa6_embedscope(sin6, V_ip6_use_defzone)) != 0)
516			return (error);
517	}
518
519	if (control) {
520		if ((error = ip6_setpktopts(control, &opt,
521		    inp->in6p_outputopts, td->td_ucred, IPPROTO_UDP)) != 0)
522			goto release;
523		optp = &opt;
524	} else
525		optp = inp->in6p_outputopts;
526
527	if (sin6) {
528		faddr = &sin6->sin6_addr;
529
530		/*
531		 * IPv4 version of udp_output calls in_pcbconnect in this case,
532		 * which needs splnet and affects performance.
533		 * Since we saw no essential reason for calling in_pcbconnect,
534		 * we get rid of such kind of logic, and call in6_selectsrc
535		 * and in6_pcbsetport in order to fill in the local address
536		 * and the local port.
537		 */
538		if (sin6->sin6_port == 0) {
539			error = EADDRNOTAVAIL;
540			goto release;
541		}
542
543		if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) {
544			/* how about ::ffff:0.0.0.0 case? */
545			error = EISCONN;
546			goto release;
547		}
548
549		fport = sin6->sin6_port; /* allow 0 port */
550
551		if (IN6_IS_ADDR_V4MAPPED(faddr)) {
552			if ((inp->in6p_flags & IN6P_IPV6_V6ONLY)) {
553				/*
554				 * I believe we should explicitly discard the
555				 * packet when mapped addresses are disabled,
556				 * rather than send the packet as an IPv6 one.
557				 * If we chose the latter approach, the packet
558				 * might be sent out on the wire based on the
559				 * default route, the situation which we'd
560				 * probably want to avoid.
561				 * (20010421 jinmei@kame.net)
562				 */
563				error = EINVAL;
564				goto release;
565			}
566			if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr) &&
567			    !IN6_IS_ADDR_V4MAPPED(&inp->in6p_laddr)) {
568				/*
569				 * when remote addr is an IPv4-mapped address,
570				 * local addr should not be an IPv6 address,
571				 * since you cannot determine how to map IPv6
572				 * source address to IPv4.
573				 */
574				error = EINVAL;
575				goto release;
576			}
577
578			af = AF_INET;
579		}
580
581		if (!IN6_IS_ADDR_V4MAPPED(faddr)) {
582			laddr = in6_selectsrc(sin6, optp, inp, NULL,
583			    td->td_ucred, &oifp, &error);
584			if (oifp && scope_ambiguous &&
585			    (error = in6_setscope(&sin6->sin6_addr,
586			    oifp, NULL))) {
587				goto release;
588			}
589		} else
590			laddr = &inp->in6p_laddr;	/* XXX */
591		if (laddr == NULL) {
592			if (error == 0)
593				error = EADDRNOTAVAIL;
594			goto release;
595		}
596		if (inp->in6p_lport == 0 &&
597		    (error = in6_pcbsetport(laddr, inp, td->td_ucred)) != 0)
598			goto release;
599	} else {
600		if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) {
601			error = ENOTCONN;
602			goto release;
603		}
604		if (IN6_IS_ADDR_V4MAPPED(&inp->in6p_faddr)) {
605			if ((inp->in6p_flags & IN6P_IPV6_V6ONLY)) {
606				/*
607				 * XXX: this case would happen when the
608				 * application sets the V6ONLY flag after
609				 * connecting the foreign address.
610				 * Such applications should be fixed,
611				 * so we bark here.
612				 */
613				log(LOG_INFO, "udp6_output: IPV6_V6ONLY "
614				    "option was set for a connected socket\n");
615				error = EINVAL;
616				goto release;
617			} else
618				af = AF_INET;
619		}
620		laddr = &inp->in6p_laddr;
621		faddr = &inp->in6p_faddr;
622		fport = inp->in6p_fport;
623	}
624
625	if (af == AF_INET)
626		hlen = sizeof(struct ip);
627
628	/*
629	 * Calculate data length and get a mbuf
630	 * for UDP and IP6 headers.
631	 */
632	M_PREPEND(m, hlen + sizeof(struct udphdr), M_DONTWAIT);
633	if (m == 0) {
634		error = ENOBUFS;
635		goto release;
636	}
637
638	/*
639	 * Stuff checksum and output datagram.
640	 */
641	udp6 = (struct udphdr *)(mtod(m, caddr_t) + hlen);
642	udp6->uh_sport = inp->in6p_lport; /* lport is always set in the PCB */
643	udp6->uh_dport = fport;
644	if (plen <= 0xffff)
645		udp6->uh_ulen = htons((u_short)plen);
646	else
647		udp6->uh_ulen = 0;
648	udp6->uh_sum = 0;
649
650	switch (af) {
651	case AF_INET6:
652		ip6 = mtod(m, struct ip6_hdr *);
653		ip6->ip6_flow	= inp->in6p_flowinfo & IPV6_FLOWINFO_MASK;
654		ip6->ip6_vfc	&= ~IPV6_VERSION_MASK;
655		ip6->ip6_vfc	|= IPV6_VERSION;
656#if 0				/* ip6_plen will be filled in ip6_output. */
657		ip6->ip6_plen	= htons((u_short)plen);
658#endif
659		ip6->ip6_nxt	= IPPROTO_UDP;
660		ip6->ip6_hlim	= in6_selecthlim(inp, NULL);
661		ip6->ip6_src	= *laddr;
662		ip6->ip6_dst	= *faddr;
663
664		if ((udp6->uh_sum = in6_cksum(m, IPPROTO_UDP,
665				sizeof(struct ip6_hdr), plen)) == 0) {
666			udp6->uh_sum = 0xffff;
667		}
668
669		flags = 0;
670
671		V_udpstat.udps_opackets++;
672		error = ip6_output(m, optp, NULL, flags, inp->in6p_moptions,
673		    NULL, inp);
674		break;
675	case AF_INET:
676		error = EAFNOSUPPORT;
677		goto release;
678	}
679	goto releaseopt;
680
681release:
682	m_freem(m);
683
684releaseopt:
685	if (control) {
686		ip6_clearpktopts(&opt, -1);
687		m_freem(control);
688	}
689	return (error);
690}
691
692static void
693udp6_abort(struct socket *so)
694{
695	struct inpcb *inp;
696
697	inp = sotoinpcb(so);
698	KASSERT(inp != NULL, ("udp6_abort: inp == NULL"));
699
700#ifdef INET
701	if (inp->inp_vflag & INP_IPV4) {
702		struct pr_usrreqs *pru;
703
704		pru = inetsw[ip_protox[IPPROTO_UDP]].pr_usrreqs;
705		(*pru->pru_abort)(so);
706		return;
707	}
708#endif
709
710	INP_INFO_WLOCK(&V_udbinfo);
711	INP_WLOCK(inp);
712	if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) {
713		in6_pcbdisconnect(inp);
714		inp->in6p_laddr = in6addr_any;
715		soisdisconnected(so);
716	}
717	INP_WUNLOCK(inp);
718	INP_INFO_WUNLOCK(&V_udbinfo);
719}
720
721static int
722udp6_attach(struct socket *so, int proto, struct thread *td)
723{
724	struct inpcb *inp;
725	int error;
726
727	inp = sotoinpcb(so);
728	KASSERT(inp == NULL, ("udp6_attach: inp != NULL"));
729
730	if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) {
731		error = soreserve(so, udp_sendspace, udp_recvspace);
732		if (error)
733			return (error);
734	}
735	INP_INFO_WLOCK(&V_udbinfo);
736	error = in_pcballoc(so, &V_udbinfo);
737	if (error) {
738		INP_INFO_WUNLOCK(&V_udbinfo);
739		return (error);
740	}
741	inp = (struct inpcb *)so->so_pcb;
742	INP_INFO_WUNLOCK(&V_udbinfo);
743	inp->inp_vflag |= INP_IPV6;
744	if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0)
745		inp->inp_vflag |= INP_IPV4;
746	inp->in6p_hops = -1;	/* use kernel default */
747	inp->in6p_cksum = -1;	/* just to be sure */
748	/*
749	 * XXX: ugly!!
750	 * IPv4 TTL initialization is necessary for an IPv6 socket as well,
751	 * because the socket may be bound to an IPv6 wildcard address,
752	 * which may match an IPv4-mapped IPv6 address.
753	 */
754	inp->inp_ip_ttl = V_ip_defttl;
755	INP_WUNLOCK(inp);
756	return (0);
757}
758
759static int
760udp6_bind(struct socket *so, struct sockaddr *nam, struct thread *td)
761{
762	struct inpcb *inp;
763	int error;
764
765	inp = sotoinpcb(so);
766	KASSERT(inp != NULL, ("udp6_bind: inp == NULL"));
767
768	INP_INFO_WLOCK(&V_udbinfo);
769	INP_WLOCK(inp);
770	inp->inp_vflag &= ~INP_IPV4;
771	inp->inp_vflag |= INP_IPV6;
772	if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0) {
773		struct sockaddr_in6 *sin6_p;
774
775		sin6_p = (struct sockaddr_in6 *)nam;
776
777		if (IN6_IS_ADDR_UNSPECIFIED(&sin6_p->sin6_addr))
778			inp->inp_vflag |= INP_IPV4;
779		else if (IN6_IS_ADDR_V4MAPPED(&sin6_p->sin6_addr)) {
780			struct sockaddr_in sin;
781
782			in6_sin6_2_sin(&sin, sin6_p);
783			inp->inp_vflag |= INP_IPV4;
784			inp->inp_vflag &= ~INP_IPV6;
785			error = in_pcbbind(inp, (struct sockaddr *)&sin,
786			    td->td_ucred);
787			goto out;
788		}
789	}
790
791	error = in6_pcbbind(inp, nam, td->td_ucred);
792out:
793	INP_WUNLOCK(inp);
794	INP_INFO_WUNLOCK(&V_udbinfo);
795	return (error);
796}
797
798static void
799udp6_close(struct socket *so)
800{
801	struct inpcb *inp;
802
803	inp = sotoinpcb(so);
804	KASSERT(inp != NULL, ("udp6_close: inp == NULL"));
805
806#ifdef INET
807	if (inp->inp_vflag & INP_IPV4) {
808		struct pr_usrreqs *pru;
809
810		pru = inetsw[ip_protox[IPPROTO_UDP]].pr_usrreqs;
811		(*pru->pru_disconnect)(so);
812		return;
813	}
814#endif
815	INP_INFO_WLOCK(&V_udbinfo);
816	INP_WLOCK(inp);
817	if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) {
818		in6_pcbdisconnect(inp);
819		inp->in6p_laddr = in6addr_any;
820		soisdisconnected(so);
821	}
822	INP_WUNLOCK(inp);
823	INP_INFO_WUNLOCK(&V_udbinfo);
824}
825
826static int
827udp6_connect(struct socket *so, struct sockaddr *nam, struct thread *td)
828{
829	struct inpcb *inp;
830	int error;
831
832	inp = sotoinpcb(so);
833	KASSERT(inp != NULL, ("udp6_connect: inp == NULL"));
834
835	INP_INFO_WLOCK(&V_udbinfo);
836	INP_WLOCK(inp);
837	if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0) {
838		struct sockaddr_in6 *sin6_p;
839
840		sin6_p = (struct sockaddr_in6 *)nam;
841		if (IN6_IS_ADDR_V4MAPPED(&sin6_p->sin6_addr)) {
842			struct sockaddr_in sin;
843
844			if (inp->inp_faddr.s_addr != INADDR_ANY) {
845				error = EISCONN;
846				goto out;
847			}
848			in6_sin6_2_sin(&sin, sin6_p);
849			error = in_pcbconnect(inp, (struct sockaddr *)&sin,
850			    td->td_ucred);
851			if (error == 0) {
852				inp->inp_vflag |= INP_IPV4;
853				inp->inp_vflag &= ~INP_IPV6;
854				soisconnected(so);
855			}
856			goto out;
857		}
858	}
859	if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) {
860		error = EISCONN;
861		goto out;
862	}
863	error = in6_pcbconnect(inp, nam, td->td_ucred);
864	if (error == 0) {
865		if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0) {
866			/* should be non mapped addr */
867			inp->inp_vflag &= ~INP_IPV4;
868			inp->inp_vflag |= INP_IPV6;
869		}
870		soisconnected(so);
871	}
872out:
873	INP_WUNLOCK(inp);
874	INP_INFO_WUNLOCK(&V_udbinfo);
875	return (error);
876}
877
878static void
879udp6_detach(struct socket *so)
880{
881	struct inpcb *inp;
882
883	inp = sotoinpcb(so);
884	KASSERT(inp != NULL, ("udp6_detach: inp == NULL"));
885
886	INP_INFO_WLOCK(&V_udbinfo);
887	INP_WLOCK(inp);
888	in6_pcbdetach(inp);
889	in6_pcbfree(inp);
890	INP_INFO_WUNLOCK(&V_udbinfo);
891}
892
893static int
894udp6_disconnect(struct socket *so)
895{
896	struct inpcb *inp;
897	int error;
898
899	inp = sotoinpcb(so);
900	KASSERT(inp != NULL, ("udp6_disconnect: inp == NULL"));
901
902	INP_INFO_WLOCK(&V_udbinfo);
903	INP_WLOCK(inp);
904
905#ifdef INET
906	if (inp->inp_vflag & INP_IPV4) {
907		struct pr_usrreqs *pru;
908
909		pru = inetsw[ip_protox[IPPROTO_UDP]].pr_usrreqs;
910		error = (*pru->pru_disconnect)(so);
911		goto out;
912	}
913#endif
914
915	if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) {
916		error = ENOTCONN;
917		goto out;
918	}
919
920	in6_pcbdisconnect(inp);
921	inp->in6p_laddr = in6addr_any;
922	/* XXXRW: so_state locking? */
923	so->so_state &= ~SS_ISCONNECTED;		/* XXX */
924out:
925	INP_WUNLOCK(inp);
926	INP_INFO_WUNLOCK(&V_udbinfo);
927	return (0);
928}
929
930static int
931udp6_send(struct socket *so, int flags, struct mbuf *m,
932    struct sockaddr *addr, struct mbuf *control, struct thread *td)
933{
934	struct inpcb *inp;
935	int error = 0;
936
937	inp = sotoinpcb(so);
938	KASSERT(inp != NULL, ("udp6_send: inp == NULL"));
939
940	INP_INFO_WLOCK(&V_udbinfo);
941	INP_WLOCK(inp);
942	if (addr) {
943		if (addr->sa_len != sizeof(struct sockaddr_in6)) {
944			error = EINVAL;
945			goto bad;
946		}
947		if (addr->sa_family != AF_INET6) {
948			error = EAFNOSUPPORT;
949			goto bad;
950		}
951	}
952
953#ifdef INET
954	if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0) {
955		int hasv4addr;
956		struct sockaddr_in6 *sin6 = 0;
957
958		if (addr == 0)
959			hasv4addr = (inp->inp_vflag & INP_IPV4);
960		else {
961			sin6 = (struct sockaddr_in6 *)addr;
962			hasv4addr = IN6_IS_ADDR_V4MAPPED(&sin6->sin6_addr)
963			    ? 1 : 0;
964		}
965		if (hasv4addr) {
966			struct pr_usrreqs *pru;
967
968			if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr) &&
969			    !IN6_IS_ADDR_V4MAPPED(&inp->in6p_laddr)) {
970				/*
971				 * When remote addr is IPv4-mapped address,
972				 * local addr should not be an IPv6 address;
973				 * since you cannot determine how to map IPv6
974				 * source address to IPv4.
975				 */
976				error = EINVAL;
977				goto out;
978			}
979			if (sin6)
980				in6_sin6_2_sin_in_sock(addr);
981			pru = inetsw[ip_protox[IPPROTO_UDP]].pr_usrreqs;
982			error = ((*pru->pru_send)(so, flags, m, addr, control,
983			    td));
984			/* addr will just be freed in sendit(). */
985			goto out;
986		}
987	}
988#endif
989#ifdef MAC
990	mac_inpcb_create_mbuf(inp, m);
991#endif
992	error = udp6_output(inp, m, addr, control, td);
993out:
994	INP_WUNLOCK(inp);
995	INP_INFO_WUNLOCK(&V_udbinfo);
996	return (error);
997
998bad:
999	INP_WUNLOCK(inp);
1000	INP_INFO_WUNLOCK(&V_udbinfo);
1001	m_freem(m);
1002	return (error);
1003}
1004
1005struct pr_usrreqs udp6_usrreqs = {
1006	.pru_abort =		udp6_abort,
1007	.pru_attach =		udp6_attach,
1008	.pru_bind =		udp6_bind,
1009	.pru_connect =		udp6_connect,
1010	.pru_control =		in6_control,
1011	.pru_detach =		udp6_detach,
1012	.pru_disconnect =	udp6_disconnect,
1013	.pru_peeraddr =		in6_mapped_peeraddr,
1014	.pru_send =		udp6_send,
1015	.pru_shutdown =		udp_shutdown,
1016	.pru_sockaddr =		in6_mapped_sockaddr,
1017	.pru_soreceive =	soreceive_dgram,
1018	.pru_sosend =		sosend_dgram,
1019	.pru_sosetlabel =	in_pcbsosetlabel,
1020	.pru_close =		udp6_close
1021};
1022