/* in6_pcb.c revision 157978 */
1/* $FreeBSD: head/sys/netinet6/in6_pcb.c 157978 2006-04-23 15:06:16Z rwatson $ */ 2/* $KAME: in6_pcb.c,v 1.31 2001/05/21 05:45:10 jinmei Exp $ */ 3 4/*- 5 * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project. 6 * All rights reserved. 7 * 8 * Redistribution and use in source and binary forms, with or without 9 * modification, are permitted provided that the following conditions 10 * are met: 11 * 1. Redistributions of source code must retain the above copyright 12 * notice, this list of conditions and the following disclaimer. 13 * 2. Redistributions in binary form must reproduce the above copyright 14 * notice, this list of conditions and the following disclaimer in the 15 * documentation and/or other materials provided with the distribution. 16 * 3. Neither the name of the project nor the names of its contributors 17 * may be used to endorse or promote products derived from this software 18 * without specific prior written permission. 19 * 20 * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND 21 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 22 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 23 * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE 24 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 25 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 26 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 28 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 29 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 30 * SUCH DAMAGE. 31 * 32 */ 33 34/*- 35 * Copyright (c) 1982, 1986, 1991, 1993 36 * The Regents of the University of California. All rights reserved. 
37 * 38 * Redistribution and use in source and binary forms, with or without 39 * modification, are permitted provided that the following conditions 40 * are met: 41 * 1. Redistributions of source code must retain the above copyright 42 * notice, this list of conditions and the following disclaimer. 43 * 2. Redistributions in binary form must reproduce the above copyright 44 * notice, this list of conditions and the following disclaimer in the 45 * documentation and/or other materials provided with the distribution. 46 * 4. Neither the name of the University nor the names of its contributors 47 * may be used to endorse or promote products derived from this software 48 * without specific prior written permission. 49 * 50 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 51 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 52 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 53 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 54 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 55 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 56 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 57 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 58 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 59 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 60 * SUCH DAMAGE. 
61 * 62 * @(#)in_pcb.c 8.2 (Berkeley) 1/4/94 63 */ 64 65#include "opt_inet.h" 66#include "opt_inet6.h" 67#include "opt_ipsec.h" 68 69#include <sys/param.h> 70#include <sys/systm.h> 71#include <sys/malloc.h> 72#include <sys/mbuf.h> 73#include <sys/domain.h> 74#include <sys/protosw.h> 75#include <sys/socket.h> 76#include <sys/socketvar.h> 77#include <sys/sockio.h> 78#include <sys/errno.h> 79#include <sys/time.h> 80#include <sys/proc.h> 81#include <sys/jail.h> 82 83#include <vm/uma.h> 84 85#include <net/if.h> 86#include <net/if_types.h> 87#include <net/route.h> 88 89#include <netinet/in.h> 90#include <netinet/in_var.h> 91#include <netinet/in_systm.h> 92#include <netinet/tcp_var.h> 93#include <netinet/ip6.h> 94#include <netinet/ip_var.h> 95#include <netinet6/ip6_var.h> 96#include <netinet6/nd6.h> 97#include <netinet/in_pcb.h> 98#include <netinet6/in6_pcb.h> 99#include <netinet6/scope6_var.h> 100 101#ifdef IPSEC 102#include <netinet6/ipsec.h> 103#ifdef INET6 104#include <netinet6/ipsec6.h> 105#endif 106#include <netinet6/ah.h> 107#ifdef INET6 108#include <netinet6/ah6.h> 109#endif 110#include <netkey/key.h> 111#endif /* IPSEC */ 112 113#ifdef FAST_IPSEC 114#include <netipsec/ipsec.h> 115#include <netipsec/ipsec6.h> 116#include <netipsec/key.h> 117#endif /* FAST_IPSEC */ 118 119struct in6_addr zeroin6_addr; 120 121int 122in6_pcbbind(inp, nam, cred) 123 register struct inpcb *inp; 124 struct sockaddr *nam; 125 struct ucred *cred; 126{ 127 struct socket *so = inp->inp_socket; 128 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)NULL; 129 struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 130 u_short lport = 0; 131 int wild = 0, reuseport = (so->so_options & SO_REUSEPORT); 132 133 INP_INFO_WLOCK_ASSERT(pcbinfo); 134 INP_LOCK_ASSERT(inp); 135 136 if (!in6_ifaddr) /* XXX broken! 
*/ 137 return (EADDRNOTAVAIL); 138 if (inp->inp_lport || !IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) 139 return (EINVAL); 140 if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT)) == 0) 141 wild = 1; 142 if (nam) { 143 int error; 144 145 sin6 = (struct sockaddr_in6 *)nam; 146 if (nam->sa_len != sizeof(*sin6)) 147 return (EINVAL); 148 /* 149 * family check. 150 */ 151 if (nam->sa_family != AF_INET6) 152 return (EAFNOSUPPORT); 153 154 if ((error = sa6_embedscope(sin6, ip6_use_defzone)) != 0) 155 return(error); 156 157 lport = sin6->sin6_port; 158 if (IN6_IS_ADDR_MULTICAST(&sin6->sin6_addr)) { 159 /* 160 * Treat SO_REUSEADDR as SO_REUSEPORT for multicast; 161 * allow compepte duplication of binding if 162 * SO_REUSEPORT is set, or if SO_REUSEADDR is set 163 * and a multicast address is bound on both 164 * new and duplicated sockets. 165 */ 166 if (so->so_options & SO_REUSEADDR) 167 reuseport = SO_REUSEADDR|SO_REUSEPORT; 168 } else if (!IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) { 169 struct ifaddr *ia = NULL; 170 171 sin6->sin6_port = 0; /* yech... */ 172 if ((ia = ifa_ifwithaddr((struct sockaddr *)sin6)) == 0) 173 return (EADDRNOTAVAIL); 174 175 /* 176 * XXX: bind to an anycast address might accidentally 177 * cause sending a packet with anycast source address. 178 * We should allow to bind to a deprecated address, since 179 * the application dares to use it. 
180 */ 181 if (ia && 182 ((struct in6_ifaddr *)ia)->ia6_flags & 183 (IN6_IFF_ANYCAST|IN6_IFF_NOTREADY|IN6_IFF_DETACHED)) { 184 return (EADDRNOTAVAIL); 185 } 186 } 187 if (lport) { 188 struct inpcb *t; 189 190 /* GROSS */ 191 if (ntohs(lport) <= ipport_reservedhigh && 192 ntohs(lport) >= ipport_reservedlow && 193 suser_cred(cred, SUSER_ALLOWJAIL)) 194 return (EACCES); 195 if (so->so_cred->cr_uid != 0 && 196 !IN6_IS_ADDR_MULTICAST(&sin6->sin6_addr)) { 197 t = in6_pcblookup_local(pcbinfo, 198 &sin6->sin6_addr, lport, 199 INPLOOKUP_WILDCARD); 200 if (t && 201 ((t->inp_vflag & INP_TIMEWAIT) == 0) && 202 (so->so_type != SOCK_STREAM || 203 IN6_IS_ADDR_UNSPECIFIED(&t->in6p_faddr)) && 204 (!IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr) || 205 !IN6_IS_ADDR_UNSPECIFIED(&t->in6p_laddr) || 206 (t->inp_socket->so_options & SO_REUSEPORT) 207 == 0) && (so->so_cred->cr_uid != 208 t->inp_socket->so_cred->cr_uid)) 209 return (EADDRINUSE); 210 if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0 && 211 IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) { 212 struct sockaddr_in sin; 213 214 in6_sin6_2_sin(&sin, sin6); 215 t = in_pcblookup_local(pcbinfo, 216 sin.sin_addr, lport, 217 INPLOOKUP_WILDCARD); 218 if (t && 219 ((t->inp_vflag & 220 INP_TIMEWAIT) == 0) && 221 (so->so_type != SOCK_STREAM || 222 ntohl(t->inp_faddr.s_addr) == 223 INADDR_ANY) && 224 (so->so_cred->cr_uid != 225 t->inp_socket->so_cred->cr_uid)) 226 return (EADDRINUSE); 227 } 228 } 229 t = in6_pcblookup_local(pcbinfo, &sin6->sin6_addr, 230 lport, wild); 231 if (t && (reuseport & ((t->inp_vflag & INP_TIMEWAIT) ? 
232 intotw(t)->tw_so_options : 233 t->inp_socket->so_options)) == 0) 234 return (EADDRINUSE); 235 if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0 && 236 IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) { 237 struct sockaddr_in sin; 238 239 in6_sin6_2_sin(&sin, sin6); 240 t = in_pcblookup_local(pcbinfo, sin.sin_addr, 241 lport, wild); 242 if (t && t->inp_vflag & INP_TIMEWAIT) { 243 if ((reuseport & 244 intotw(t)->tw_so_options) == 0 && 245 (ntohl(t->inp_laddr.s_addr) != 246 INADDR_ANY || ((inp->inp_vflag & 247 INP_IPV6PROTO) == 248 (t->inp_vflag & INP_IPV6PROTO)))) 249 return (EADDRINUSE); 250 } 251 else if (t && 252 (reuseport & t->inp_socket->so_options) 253 == 0 && (ntohl(t->inp_laddr.s_addr) != 254 INADDR_ANY || INP_SOCKAF(so) == 255 INP_SOCKAF(t->inp_socket))) 256 return (EADDRINUSE); 257 } 258 } 259 inp->in6p_laddr = sin6->sin6_addr; 260 } 261 if (lport == 0) { 262 int e; 263 if ((e = in6_pcbsetport(&inp->in6p_laddr, inp, cred)) != 0) 264 return (e); 265 } 266 else { 267 inp->inp_lport = lport; 268 if (in_pcbinshash(inp) != 0) { 269 inp->in6p_laddr = in6addr_any; 270 inp->inp_lport = 0; 271 return (EAGAIN); 272 } 273 } 274 return (0); 275} 276 277/* 278 * Transform old in6_pcbconnect() into an inner subroutine for new 279 * in6_pcbconnect(): Do some validity-checking on the remote 280 * address (in mbuf 'nam') and then determine local host address 281 * (i.e., which interface) to use to access that remote host. 282 * 283 * This preserves definition of in6_pcbconnect(), while supporting a 284 * slightly different version for T/TCP. (This is more than 285 * a bit of a kludge, but cleaning up the internal interfaces would 286 * have forced minor changes in every protocol). 
287 */ 288 289int 290in6_pcbladdr(inp, nam, plocal_addr6) 291 register struct inpcb *inp; 292 struct sockaddr *nam; 293 struct in6_addr **plocal_addr6; 294{ 295 register struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)nam; 296 int error = 0; 297 struct ifnet *ifp = NULL; 298 int scope_ambiguous = 0; 299 300 if (nam->sa_len != sizeof (*sin6)) 301 return (EINVAL); 302 if (sin6->sin6_family != AF_INET6) 303 return (EAFNOSUPPORT); 304 if (sin6->sin6_port == 0) 305 return (EADDRNOTAVAIL); 306 307 if (sin6->sin6_scope_id == 0 && !ip6_use_defzone) 308 scope_ambiguous = 1; 309 if ((error = sa6_embedscope(sin6, ip6_use_defzone)) != 0) 310 return(error); 311 312 INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 313 INP_LOCK_ASSERT(inp); 314 315 if (in6_ifaddr) { 316 /* 317 * If the destination address is UNSPECIFIED addr, 318 * use the loopback addr, e.g ::1. 319 */ 320 if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) 321 sin6->sin6_addr = in6addr_loopback; 322 } 323 324 /* 325 * XXX: in6_selectsrc might replace the bound local address 326 * with the address specified by setsockopt(IPV6_PKTINFO). 327 * Is it the intended behavior? 328 */ 329 *plocal_addr6 = in6_selectsrc(sin6, inp->in6p_outputopts, 330 inp->in6p_moptions, NULL, 331 &inp->in6p_laddr, &ifp, &error); 332 if (ifp && scope_ambiguous && 333 (error = in6_setscope(&sin6->sin6_addr, ifp, NULL)) != 0) { 334 return(error); 335 } 336 337 if (*plocal_addr6 == 0) { 338 if (error == 0) 339 error = EADDRNOTAVAIL; 340 return (error); 341 } 342 /* 343 * Don't do pcblookup call here; return interface in 344 * plocal_addr6 345 * and exit to caller, that will do the lookup. 346 */ 347 348 return (0); 349} 350 351/* 352 * Outer subroutine: 353 * Connect from a socket to a specified address. 354 * Both address and port must be specified in argument sin. 355 * If don't have a local address for this socket yet, 356 * then pick one. 
357 */ 358int 359in6_pcbconnect(inp, nam, cred) 360 register struct inpcb *inp; 361 struct sockaddr *nam; 362 struct ucred *cred; 363{ 364 struct in6_addr *addr6; 365 register struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)nam; 366 int error; 367 368 INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 369 INP_LOCK_ASSERT(inp); 370 371 /* 372 * Call inner routine, to assign local interface address. 373 * in6_pcbladdr() may automatically fill in sin6_scope_id. 374 */ 375 if ((error = in6_pcbladdr(inp, nam, &addr6)) != 0) 376 return (error); 377 378 if (in6_pcblookup_hash(inp->inp_pcbinfo, &sin6->sin6_addr, 379 sin6->sin6_port, 380 IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr) 381 ? addr6 : &inp->in6p_laddr, 382 inp->inp_lport, 0, NULL) != NULL) { 383 return (EADDRINUSE); 384 } 385 if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) { 386 if (inp->inp_lport == 0) { 387 error = in6_pcbbind(inp, (struct sockaddr *)0, cred); 388 if (error) 389 return (error); 390 } 391 inp->in6p_laddr = *addr6; 392 } 393 inp->in6p_faddr = sin6->sin6_addr; 394 inp->inp_fport = sin6->sin6_port; 395 /* update flowinfo - draft-itojun-ipv6-flowlabel-api-00 */ 396 inp->in6p_flowinfo &= ~IPV6_FLOWLABEL_MASK; 397 if (inp->in6p_flags & IN6P_AUTOFLOWLABEL) 398 inp->in6p_flowinfo |= 399 (htonl(ip6_randomflowlabel()) & IPV6_FLOWLABEL_MASK); 400 401 in_pcbrehash(inp); 402#ifdef IPSEC 403 if (inp->inp_socket->so_type == SOCK_STREAM) 404 ipsec_pcbconn(inp->inp_sp); 405#endif 406 return (0); 407} 408 409void 410in6_pcbdisconnect(inp) 411 struct inpcb *inp; 412{ 413 414 INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 415 INP_LOCK_ASSERT(inp); 416 417 bzero((caddr_t)&inp->in6p_faddr, sizeof(inp->in6p_faddr)); 418 inp->inp_fport = 0; 419 /* clear flowinfo - draft-itojun-ipv6-flowlabel-api-00 */ 420 inp->in6p_flowinfo &= ~IPV6_FLOWLABEL_MASK; 421 in_pcbrehash(inp); 422#ifdef IPSEC 423 ipsec_pcbdisconn(inp->inp_sp); 424#endif 425} 426 427void 428in6_pcbdetach(struct inpcb *inp) 429{ 430 431 KASSERT(inp->inp_socket != NULL, 
("in6_pcbdetach: inp_socket == NULL")); 432 inp->inp_socket->so_pcb = NULL; 433 inp->inp_socket = NULL; 434} 435 436void 437in6_pcbfree(struct inpcb *inp) 438{ 439 struct inpcbinfo *ipi = inp->inp_pcbinfo; 440 441 KASSERT(inp->inp_socket == NULL, ("in6_pcbfree: inp_socket != NULL")); 442 INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 443 INP_LOCK_ASSERT(inp); 444 445#if defined(IPSEC) || defined(FAST_IPSEC) 446 if (inp->in6p_sp != NULL) 447 ipsec6_delete_pcbpolicy(inp); 448#endif /* IPSEC */ 449 inp->inp_gencnt = ++ipi->ipi_gencnt; 450 in_pcbremlists(inp); 451 ip6_freepcbopts(inp->in6p_outputopts); 452 ip6_freemoptions(inp->in6p_moptions); 453 /* Check and free IPv4 related resources in case of mapped addr */ 454 if (inp->inp_options) 455 (void)m_free(inp->inp_options); 456 ip_freemoptions(inp->inp_moptions); 457 inp->inp_vflag = 0; 458 INP_LOCK_DESTROY(inp); 459 uma_zfree(ipi->ipi_zone, inp); 460} 461 462struct sockaddr * 463in6_sockaddr(port, addr_p) 464 in_port_t port; 465 struct in6_addr *addr_p; 466{ 467 struct sockaddr_in6 *sin6; 468 469 MALLOC(sin6, struct sockaddr_in6 *, sizeof *sin6, M_SONAME, M_WAITOK); 470 bzero(sin6, sizeof *sin6); 471 sin6->sin6_family = AF_INET6; 472 sin6->sin6_len = sizeof(*sin6); 473 sin6->sin6_port = port; 474 sin6->sin6_addr = *addr_p; 475 (void)sa6_recoverscope(sin6); /* XXX: should catch errors */ 476 477 return (struct sockaddr *)sin6; 478} 479 480struct sockaddr * 481in6_v4mapsin6_sockaddr(port, addr_p) 482 in_port_t port; 483 struct in_addr *addr_p; 484{ 485 struct sockaddr_in sin; 486 struct sockaddr_in6 *sin6_p; 487 488 bzero(&sin, sizeof sin); 489 sin.sin_family = AF_INET; 490 sin.sin_len = sizeof(sin); 491 sin.sin_port = port; 492 sin.sin_addr = *addr_p; 493 494 MALLOC(sin6_p, struct sockaddr_in6 *, sizeof *sin6_p, M_SONAME, 495 M_WAITOK); 496 in6_sin_2_v4mapsin6(&sin, sin6_p); 497 498 return (struct sockaddr *)sin6_p; 499} 500 501/* 502 * The calling convention of in6_setsockaddr() and in6_setpeeraddr() was 503 * modified to 
match the pru_sockaddr() and pru_peeraddr() entry points 504 * in struct pr_usrreqs, so that protocols can just reference then directly 505 * without the need for a wrapper function. The socket must have a valid 506 * (i.e., non-nil) PCB, but it should be impossible to get an invalid one 507 * except through a kernel programming error, so it is acceptable to panic 508 * (or in this case trap) if the PCB is invalid. (Actually, we don't trap 509 * because there actually /is/ a programming error somewhere... XXX) 510 */ 511int 512in6_setsockaddr(so, nam) 513 struct socket *so; 514 struct sockaddr **nam; 515{ 516 register struct inpcb *inp; 517 struct in6_addr addr; 518 in_port_t port; 519 520 inp = sotoinpcb(so); 521 KASSERT(inp != NULL, ("in6_setsockaddr: inp == NULL")); 522 523 INP_LOCK(inp); 524 port = inp->inp_lport; 525 addr = inp->in6p_laddr; 526 INP_UNLOCK(inp); 527 528 *nam = in6_sockaddr(port, &addr); 529 return 0; 530} 531 532int 533in6_setpeeraddr(so, nam) 534 struct socket *so; 535 struct sockaddr **nam; 536{ 537 struct inpcb *inp; 538 struct in6_addr addr; 539 in_port_t port; 540 541 inp = sotoinpcb(so); 542 KASSERT(inp != NULL, ("in6_setpeeraddr: inp == NULL")); 543 544 INP_LOCK(inp); 545 port = inp->inp_fport; 546 addr = inp->in6p_faddr; 547 INP_UNLOCK(inp); 548 549 *nam = in6_sockaddr(port, &addr); 550 return 0; 551} 552 553int 554in6_mapped_sockaddr(struct socket *so, struct sockaddr **nam) 555{ 556 struct inpcb *inp; 557 int error; 558 559 inp = sotoinpcb(so); 560 KASSERT(inp != NULL, ("in6_mapped_sockaddr: inp == NULL")); 561 562 if ((inp->inp_vflag & (INP_IPV4 | INP_IPV6)) == INP_IPV4) { 563 error = in_setsockaddr(so, nam, &tcbinfo); 564 if (error == 0) 565 in6_sin_2_v4mapsin6_in_sock(nam); 566 } else { 567 /* scope issues will be handled in in6_setsockaddr(). 
*/ 568 error = in6_setsockaddr(so, nam); 569 } 570 571 return error; 572} 573 574int 575in6_mapped_peeraddr(struct socket *so, struct sockaddr **nam) 576{ 577 struct inpcb *inp; 578 int error; 579 580 inp = sotoinpcb(so); 581 KASSERT(inp != NULL, ("in6_mapped_peeraddr: inp == NULL")); 582 583 if ((inp->inp_vflag & (INP_IPV4 | INP_IPV6)) == INP_IPV4) { 584 error = in_setpeeraddr(so, nam, &tcbinfo); 585 if (error == 0) 586 in6_sin_2_v4mapsin6_in_sock(nam); 587 } else 588 /* scope issues will be handled in in6_setpeeraddr(). */ 589 error = in6_setpeeraddr(so, nam); 590 591 return error; 592} 593 594/* 595 * Pass some notification to all connections of a protocol 596 * associated with address dst. The local address and/or port numbers 597 * may be specified to limit the search. The "usual action" will be 598 * taken, depending on the ctlinput cmd. The caller must filter any 599 * cmds that are uninteresting (e.g., no error in the map). 600 * Call the protocol specific routine (if any) to report 601 * any errors for each matching socket. 602 */ 603void 604in6_pcbnotify(pcbinfo, dst, fport_arg, src, lport_arg, cmd, cmdarg, notify) 605 struct inpcbinfo *pcbinfo; 606 struct sockaddr *dst; 607 const struct sockaddr *src; 608 u_int fport_arg, lport_arg; 609 int cmd; 610 void *cmdarg; 611 struct inpcb *(*notify) __P((struct inpcb *, int)); 612{ 613 struct inpcbhead *head; 614 struct inpcb *inp, *ninp; 615 struct sockaddr_in6 sa6_src, *sa6_dst; 616 u_short fport = fport_arg, lport = lport_arg; 617 u_int32_t flowinfo; 618 int errno; 619 620 if ((unsigned)cmd >= PRC_NCMDS || dst->sa_family != AF_INET6) 621 return; 622 623 sa6_dst = (struct sockaddr_in6 *)dst; 624 if (IN6_IS_ADDR_UNSPECIFIED(&sa6_dst->sin6_addr)) 625 return; 626 627 /* 628 * note that src can be NULL when we get notify by local fragmentation. 629 */ 630 sa6_src = (src == NULL) ? 
sa6_any : *(const struct sockaddr_in6 *)src; 631 flowinfo = sa6_src.sin6_flowinfo; 632 633 /* 634 * Redirects go to all references to the destination, 635 * and use in6_rtchange to invalidate the route cache. 636 * Dead host indications: also use in6_rtchange to invalidate 637 * the cache, and deliver the error to all the sockets. 638 * Otherwise, if we have knowledge of the local port and address, 639 * deliver only to that socket. 640 */ 641 if (PRC_IS_REDIRECT(cmd) || cmd == PRC_HOSTDEAD) { 642 fport = 0; 643 lport = 0; 644 bzero((caddr_t)&sa6_src.sin6_addr, sizeof(sa6_src.sin6_addr)); 645 646 if (cmd != PRC_HOSTDEAD) 647 notify = in6_rtchange; 648 } 649 errno = inet6ctlerrmap[cmd]; 650 head = pcbinfo->listhead; 651 INP_INFO_WLOCK(pcbinfo); 652 for (inp = LIST_FIRST(head); inp != NULL; inp = ninp) { 653 INP_LOCK(inp); 654 ninp = LIST_NEXT(inp, inp_list); 655 656 if ((inp->inp_vflag & INP_IPV6) == 0) { 657 INP_UNLOCK(inp); 658 continue; 659 } 660 661 /* 662 * If the error designates a new path MTU for a destination 663 * and the application (associated with this socket) wanted to 664 * know the value, notify. Note that we notify for all 665 * disconnected sockets if the corresponding application 666 * wanted. This is because some UDP applications keep sending 667 * sockets disconnected. 668 * XXX: should we avoid to notify the value to TCP sockets? 669 */ 670 if (cmd == PRC_MSGSIZE && (inp->inp_flags & IN6P_MTU) != 0 && 671 (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) || 672 IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, &sa6_dst->sin6_addr))) { 673 ip6_notify_pmtu(inp, (struct sockaddr_in6 *)dst, 674 (u_int32_t *)cmdarg); 675 } 676 677 /* 678 * Detect if we should notify the error. If no source and 679 * destination ports are specifed, but non-zero flowinfo and 680 * local address match, notify the error. This is the case 681 * when the error is delivered with an encrypted buffer 682 * by ESP. Otherwise, just compare addresses and ports 683 * as usual. 
684 */ 685 if (lport == 0 && fport == 0 && flowinfo && 686 inp->inp_socket != NULL && 687 flowinfo == (inp->in6p_flowinfo & IPV6_FLOWLABEL_MASK) && 688 IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, &sa6_src.sin6_addr)) 689 goto do_notify; 690 else if (!IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, 691 &sa6_dst->sin6_addr) || 692 inp->inp_socket == 0 || 693 (lport && inp->inp_lport != lport) || 694 (!IN6_IS_ADDR_UNSPECIFIED(&sa6_src.sin6_addr) && 695 !IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, 696 &sa6_src.sin6_addr)) || 697 (fport && inp->inp_fport != fport)) { 698 INP_UNLOCK(inp); 699 continue; 700 } 701 702 do_notify: 703 if (notify) { 704 if ((*notify)(inp, errno)) 705 INP_UNLOCK(inp); 706 } else 707 INP_UNLOCK(inp); 708 } 709 INP_INFO_WUNLOCK(pcbinfo); 710} 711 712/* 713 * Lookup a PCB based on the local address and port. 714 */ 715struct inpcb * 716in6_pcblookup_local(pcbinfo, laddr, lport_arg, wild_okay) 717 struct inpcbinfo *pcbinfo; 718 struct in6_addr *laddr; 719 u_int lport_arg; 720 int wild_okay; 721{ 722 register struct inpcb *inp; 723 int matchwild = 3, wildcard; 724 u_short lport = lport_arg; 725 726 if (!wild_okay) { 727 struct inpcbhead *head; 728 /* 729 * Look for an unconnected (wildcard foreign addr) PCB that 730 * matches the local address and port we're looking for. 731 */ 732 head = &pcbinfo->hashbase[INP_PCBHASH(INADDR_ANY, lport, 0, 733 pcbinfo->hashmask)]; 734 LIST_FOREACH(inp, head, inp_hash) { 735 if ((inp->inp_vflag & INP_IPV6) == 0) 736 continue; 737 if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) && 738 IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr) && 739 inp->inp_lport == lport) { 740 /* 741 * Found. 742 */ 743 return (inp); 744 } 745 } 746 /* 747 * Not found. 748 */ 749 return (NULL); 750 } else { 751 struct inpcbporthead *porthash; 752 struct inpcbport *phd; 753 struct inpcb *match = NULL; 754 /* 755 * Best fit PCB lookup. 756 * 757 * First see if this local port is in use by looking on the 758 * port hash list. 
759 */ 760 porthash = &pcbinfo->porthashbase[INP_PCBPORTHASH(lport, 761 pcbinfo->porthashmask)]; 762 LIST_FOREACH(phd, porthash, phd_hash) { 763 if (phd->phd_port == lport) 764 break; 765 } 766 if (phd != NULL) { 767 /* 768 * Port is in use by one or more PCBs. Look for best 769 * fit. 770 */ 771 LIST_FOREACH(inp, &phd->phd_pcblist, inp_portlist) { 772 wildcard = 0; 773 if ((inp->inp_vflag & INP_IPV6) == 0) 774 continue; 775 if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) 776 wildcard++; 777 if (!IN6_IS_ADDR_UNSPECIFIED( 778 &inp->in6p_laddr)) { 779 if (IN6_IS_ADDR_UNSPECIFIED(laddr)) 780 wildcard++; 781 else if (!IN6_ARE_ADDR_EQUAL( 782 &inp->in6p_laddr, laddr)) 783 continue; 784 } else { 785 if (!IN6_IS_ADDR_UNSPECIFIED(laddr)) 786 wildcard++; 787 } 788 if (wildcard < matchwild) { 789 match = inp; 790 matchwild = wildcard; 791 if (matchwild == 0) { 792 break; 793 } 794 } 795 } 796 } 797 return (match); 798 } 799} 800 801void 802in6_pcbpurgeif0(pcbinfo, ifp) 803 struct inpcbinfo *pcbinfo; 804 struct ifnet *ifp; 805{ 806 struct in6pcb *in6p; 807 struct ip6_moptions *im6o; 808 struct in6_multi_mship *imm, *nimm; 809 810 INP_INFO_RLOCK(pcbinfo); 811 LIST_FOREACH(in6p, pcbinfo->listhead, inp_list) { 812 INP_LOCK(in6p); 813 im6o = in6p->in6p_moptions; 814 if ((in6p->inp_vflag & INP_IPV6) && 815 im6o) { 816 /* 817 * Unselect the outgoing interface if it is being 818 * detached. 819 */ 820 if (im6o->im6o_multicast_ifp == ifp) 821 im6o->im6o_multicast_ifp = NULL; 822 823 /* 824 * Drop multicast group membership if we joined 825 * through the interface being detached. 826 * XXX controversial - is it really legal for kernel 827 * to force this? 
828 */ 829 for (imm = im6o->im6o_memberships.lh_first; 830 imm != NULL; imm = nimm) { 831 nimm = imm->i6mm_chain.le_next; 832 if (imm->i6mm_maddr->in6m_ifp == ifp) { 833 LIST_REMOVE(imm, i6mm_chain); 834 in6_delmulti(imm->i6mm_maddr); 835 free(imm, M_IP6MADDR); 836 } 837 } 838 } 839 INP_UNLOCK(in6p); 840 } 841 INP_INFO_RUNLOCK(pcbinfo); 842} 843 844/* 845 * Check for alternatives when higher level complains 846 * about service problems. For now, invalidate cached 847 * routing information. If the route was created dynamically 848 * (by a redirect), time to try a default gateway again. 849 */ 850void 851in6_losing(in6p) 852 struct inpcb *in6p; 853{ 854 /* 855 * We don't store route pointers in the routing table anymore 856 */ 857 return; 858} 859 860/* 861 * After a routing change, flush old routing 862 * and allocate a (hopefully) better one. 863 */ 864struct inpcb * 865in6_rtchange(inp, errno) 866 struct inpcb *inp; 867 int errno; 868{ 869 /* 870 * We don't store route pointers in the routing table anymore 871 */ 872 return inp; 873} 874 875/* 876 * Lookup PCB in hash list. 877 */ 878struct inpcb * 879in6_pcblookup_hash(pcbinfo, faddr, fport_arg, laddr, lport_arg, wildcard, ifp) 880 struct inpcbinfo *pcbinfo; 881 struct in6_addr *faddr, *laddr; 882 u_int fport_arg, lport_arg; 883 int wildcard; 884 struct ifnet *ifp; 885{ 886 struct inpcbhead *head; 887 register struct inpcb *inp; 888 u_short fport = fport_arg, lport = lport_arg; 889 int faith; 890 891 if (faithprefix_p != NULL) 892 faith = (*faithprefix_p)(laddr); 893 else 894 faith = 0; 895 896 /* 897 * First look for an exact match. 
898 */ 899 head = &pcbinfo->hashbase[INP_PCBHASH(faddr->s6_addr32[3] /* XXX */, 900 lport, fport, 901 pcbinfo->hashmask)]; 902 LIST_FOREACH(inp, head, inp_hash) { 903 if ((inp->inp_vflag & INP_IPV6) == 0) 904 continue; 905 if (IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, faddr) && 906 IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr) && 907 inp->inp_fport == fport && 908 inp->inp_lport == lport) { 909 /* 910 * Found. 911 */ 912 return (inp); 913 } 914 } 915 if (wildcard) { 916 struct inpcb *local_wild = NULL; 917 918 head = &pcbinfo->hashbase[INP_PCBHASH(INADDR_ANY, lport, 0, 919 pcbinfo->hashmask)]; 920 LIST_FOREACH(inp, head, inp_hash) { 921 if ((inp->inp_vflag & INP_IPV6) == 0) 922 continue; 923 if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) && 924 inp->inp_lport == lport) { 925 if (faith && (inp->inp_flags & INP_FAITH) == 0) 926 continue; 927 if (IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, 928 laddr)) 929 return (inp); 930 else if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) 931 local_wild = inp; 932 } 933 } 934 return (local_wild); 935 } 936 937 /* 938 * Not found. 939 */ 940 return (NULL); 941} 942 943void 944init_sin6(struct sockaddr_in6 *sin6, struct mbuf *m) 945{ 946 struct ip6_hdr *ip; 947 948 ip = mtod(m, struct ip6_hdr *); 949 bzero(sin6, sizeof(*sin6)); 950 sin6->sin6_len = sizeof(*sin6); 951 sin6->sin6_family = AF_INET6; 952 sin6->sin6_addr = ip->ip6_src; 953 954 (void)sa6_recoverscope(sin6); /* XXX: should catch errors... */ 955 956 return; 957} 958