in6_src.c revision 1.61
1/* $OpenBSD: in6_src.c,v 1.61 2015/09/11 20:16:03 claudio Exp $ */ 2/* $KAME: in6_src.c,v 1.36 2001/02/06 04:08:17 itojun Exp $ */ 3 4/* 5 * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project. 6 * All rights reserved. 7 * 8 * Redistribution and use in source and binary forms, with or without 9 * modification, are permitted provided that the following conditions 10 * are met: 11 * 1. Redistributions of source code must retain the above copyright 12 * notice, this list of conditions and the following disclaimer. 13 * 2. Redistributions in binary form must reproduce the above copyright 14 * notice, this list of conditions and the following disclaimer in the 15 * documentation and/or other materials provided with the distribution. 16 * 3. Neither the name of the project nor the names of its contributors 17 * may be used to endorse or promote products derived from this software 18 * without specific prior written permission. 19 * 20 * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND 21 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 22 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 23 * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE 24 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 25 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 26 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 28 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 29 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 30 * SUCH DAMAGE. 31 */ 32 33/* 34 * Copyright (c) 1982, 1986, 1991, 1993 35 * The Regents of the University of California. All rights reserved. 36 * 37 * Redistribution and use in source and binary forms, with or without 38 * modification, are permitted provided that the following conditions 39 * are met: 40 * 1. Redistributions of source code must retain the above copyright 41 * notice, this list of conditions and the following disclaimer. 42 * 2. Redistributions in binary form must reproduce the above copyright 43 * notice, this list of conditions and the following disclaimer in the 44 * documentation and/or other materials provided with the distribution. 45 * 3. Neither the name of the University nor the names of its contributors 46 * may be used to endorse or promote products derived from this software 47 * without specific prior written permission. 48 * 49 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 50 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 51 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 52 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 53 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 54 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 55 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 56 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 57 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 58 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 59 * SUCH DAMAGE. 60 * 61 * @(#)in_pcb.c 8.2 (Berkeley) 1/4/94 62 */ 63 64#include <sys/param.h> 65#include <sys/systm.h> 66#include <sys/mbuf.h> 67#include <sys/protosw.h> 68#include <sys/socket.h> 69#include <sys/socketvar.h> 70#include <sys/ioctl.h> 71#include <sys/errno.h> 72#include <sys/time.h> 73 74#include <net/if.h> 75#include <net/if_var.h> 76#include <net/route.h> 77 78#include <netinet/in.h> 79#include <netinet/ip.h> 80#include <netinet/in_pcb.h> 81#include <netinet6/in6_var.h> 82#include <netinet/ip6.h> 83#include <netinet6/ip6_var.h> 84#include <netinet6/nd6.h> 85 86int in6_selectif(struct sockaddr_in6 *, struct ip6_pktopts *, 87 struct ip6_moptions *, struct route_in6 *, struct ifnet **, u_int); 88 89/* 90 * Return an IPv6 address, which is the most appropriate for a given 91 * destination and user specified options. 92 * If necessary, this function lookups the routing table and returns 93 * an entry to the caller for later use. 94 */ 95int 96in6_selectsrc(struct in6_addr **in6src, struct sockaddr_in6 *dstsock, 97 struct ip6_pktopts *opts, struct ip6_moptions *mopts, 98 struct route_in6 *ro, struct in6_addr *laddr, u_int rtableid) 99{ 100 struct ifnet *ifp = NULL; 101 struct in6_addr *dst; 102 struct in6_ifaddr *ia6 = NULL; 103 struct in6_pktinfo *pi = NULL; 104 int error; 105 106 dst = &dstsock->sin6_addr; 107 108 /* 109 * If the source address is explicitly specified by the caller, 110 * check if the requested source address is indeed a unicast address 111 * assigned to the node, and can be used as the packet's source 112 * address. If everything is okay, use the address as source. 113 */ 114 if (opts && (pi = opts->ip6po_pktinfo) && 115 !IN6_IS_ADDR_UNSPECIFIED(&pi->ipi6_addr)) { 116 struct sockaddr_in6 sa6; 117 118 /* get the outgoing interface */ 119 error = in6_selectif(dstsock, opts, mopts, ro, &ifp, rtableid); 120 if (error) 121 return (error); 122 123 bzero(&sa6, sizeof(sa6)); 124 sa6.sin6_family = AF_INET6; 125 sa6.sin6_len = sizeof(sa6); 126 sa6.sin6_addr = pi->ipi6_addr; 127 128 if (ifp && IN6_IS_SCOPE_EMBED(&sa6.sin6_addr)) 129 sa6.sin6_addr.s6_addr16[1] = htons(ifp->if_index); 130 if_put(ifp); /* put reference from in6_selectif */ 131 132 ia6 = ifatoia6(ifa_ifwithaddr(sin6tosa(&sa6), rtableid)); 133 if (ia6 == NULL || 134 (ia6->ia6_flags & (IN6_IFF_ANYCAST | IN6_IFF_NOTREADY))) 135 return (EADDRNOTAVAIL); 136 137 pi->ipi6_addr = sa6.sin6_addr; /* XXX: this overrides pi */ 138 139 *in6src = &pi->ipi6_addr; 140 return (0); 141 } 142 143 /* 144 * If the source address is not specified but the socket(if any) 145 * is already bound, use the bound address. 146 */ 147 if (laddr && !IN6_IS_ADDR_UNSPECIFIED(laddr)) { 148 *in6src = laddr; 149 return (0); 150 } 151 152 /* 153 * If the caller doesn't specify the source address but 154 * the outgoing interface, use an address associated with 155 * the interface. 156 */ 157 if (pi && pi->ipi6_ifindex) { 158 ifp = if_get(pi->ipi6_ifindex); 159 if (ifp == NULL) 160 return (ENXIO); /* XXX: better error? */ 161 162 ia6 = in6_ifawithscope(ifp, dst, rtableid); 163 if_put(ifp); 164 165 if (ia6 == NULL) 166 return (EADDRNOTAVAIL); 167 168 *in6src = &ia6->ia_addr.sin6_addr; 169 return (0); 170 } 171 172 /* 173 * If the destination address is a link-local unicast address or 174 * a link/interface-local multicast address, and if the outgoing 175 * interface is specified by the sin6_scope_id filed, use an address 176 * associated with the interface. 177 * XXX: We're now trying to define more specific semantics of 178 * sin6_scope_id field, so this part will be rewritten in 179 * the near future. 180 */ 181 if ((IN6_IS_ADDR_LINKLOCAL(dst) || IN6_IS_ADDR_MC_LINKLOCAL(dst) || 182 IN6_IS_ADDR_MC_INTFACELOCAL(dst)) && dstsock->sin6_scope_id) { 183 ifp = if_get(dstsock->sin6_scope_id); 184 if (ifp == NULL) 185 return (ENXIO); /* XXX: better error? */ 186 187 ia6 = in6_ifawithscope(ifp, dst, rtableid); 188 if_put(ifp); 189 190 if (ia6 == NULL) 191 return (EADDRNOTAVAIL); 192 193 *in6src = &ia6->ia_addr.sin6_addr; 194 return (0); 195 } 196 197 /* 198 * If the destination address is a multicast address and 199 * the outgoing interface for the address is specified 200 * by the caller, use an address associated with the interface. 201 * Even if the outgoing interface is not specified, we also 202 * choose a loopback interface as the outgoing interface. 203 */ 204 if (IN6_IS_ADDR_MULTICAST(dst)) { 205 ifp = mopts ? if_get(mopts->im6o_ifidx) : NULL; 206 207 if (!ifp && dstsock->sin6_scope_id) 208 ifp = if_get(htons(dstsock->sin6_scope_id)); 209 210 if (ifp) { 211 ia6 = in6_ifawithscope(ifp, dst, rtableid); 212 if_put(ifp); 213 214 if (ia6 == NULL) 215 return (EADDRNOTAVAIL); 216 217 *in6src = &ia6->ia_addr.sin6_addr; 218 return (0); 219 } 220 } 221 222 /* 223 * If the next hop address for the packet is specified 224 * by caller, use an address associated with the route 225 * to the next hop. 226 */ 227 { 228 struct sockaddr_in6 *sin6_next; 229 struct rtentry *rt; 230 231 if (opts && opts->ip6po_nexthop) { 232 sin6_next = satosin6(opts->ip6po_nexthop); 233 rt = nd6_lookup(&sin6_next->sin6_addr, 1, NULL, 234 rtableid); 235 if (rt) { 236 ia6 = in6_ifawithscope(rt->rt_ifp, dst, 237 rtableid); 238 if (ia6 == NULL) 239 ia6 = ifatoia6(rt->rt_ifa); 240 } 241 if (ia6 == NULL) 242 return (EADDRNOTAVAIL); 243 244 *in6src = &ia6->ia_addr.sin6_addr; 245 return (0); 246 } 247 } 248 249 /* 250 * If route is known or can be allocated now, 251 * our src addr is taken from the i/f, else punt. 252 */ 253 if (ro) { 254 if (ro->ro_rt && ((ro->ro_rt->rt_flags & RTF_UP) == 0 || 255 !IN6_ARE_ADDR_EQUAL(&ro->ro_dst.sin6_addr, dst))) { 256 rtfree(ro->ro_rt); 257 ro->ro_rt = NULL; 258 } 259 if (ro->ro_rt == (struct rtentry *)0 || 260 ro->ro_rt->rt_ifp == (struct ifnet *)0) { 261 struct sockaddr_in6 *sa6; 262 263 /* No route yet, so try to acquire one */ 264 bzero(&ro->ro_dst, sizeof(struct sockaddr_in6)); 265 ro->ro_tableid = rtableid; 266 sa6 = &ro->ro_dst; 267 sa6->sin6_family = AF_INET6; 268 sa6->sin6_len = sizeof(struct sockaddr_in6); 269 sa6->sin6_addr = *dst; 270 sa6->sin6_scope_id = dstsock->sin6_scope_id; 271 if (IN6_IS_ADDR_MULTICAST(dst)) { 272 ro->ro_rt = rtalloc(sin6tosa(&ro->ro_dst), 273 RT_REPORT|RT_RESOLVE, ro->ro_tableid); 274 } else { 275 ro->ro_rt = rtalloc_mpath(sin6tosa(&ro->ro_dst), 276 NULL, ro->ro_tableid); 277 } 278 } 279 280 /* 281 * in_pcbconnect() checks out IFF_LOOPBACK to skip using 282 * the address. But we don't know why it does so. 283 * It is necessary to ensure the scope even for lo0 284 * so doesn't check out IFF_LOOPBACK. 285 */ 286 287 if (ro->ro_rt) { 288 ia6 = in6_ifawithscope(ro->ro_rt->rt_ifa->ifa_ifp, dst, 289 rtableid); 290 if (ia6 == NULL) /* xxx scope error ?*/ 291 ia6 = ifatoia6(ro->ro_rt->rt_ifa); 292 } 293 if (ia6 == NULL) 294 return (EHOSTUNREACH); /* no route */ 295 296 *in6src = &ia6->ia_addr.sin6_addr; 297 return (0); 298 } 299 300 return (EADDRNOTAVAIL); 301} 302 303struct rtentry * 304in6_selectroute(struct sockaddr_in6 *dstsock, struct ip6_pktopts *opts, 305 struct route_in6 *ro, unsigned int rtableid) 306{ 307 struct sockaddr_in6 *sin6_next; 308 struct in6_addr *dst; 309 310 dst = &dstsock->sin6_addr; 311 312 /* 313 * If the next hop address for the packet is specified by the caller, 314 * use it as the gateway. 315 */ 316 if (opts && opts->ip6po_nexthop) { 317 struct route_in6 *ron; 318 319 sin6_next = satosin6(opts->ip6po_nexthop); 320 321 /* We only support AF_INET6 next hops */ 322 if (sin6_next->sin6_family != AF_INET6) 323 return (NULL); 324 325 /* 326 * If the next hop is an IPv6 address, then the node identified 327 * by that address must be a neighbor of the sending host. 328 */ 329 ron = &opts->ip6po_nextroute; 330 if ((ron->ro_rt && 331 (ron->ro_rt->rt_flags & (RTF_UP | RTF_GATEWAY)) != 332 RTF_UP) || 333 !IN6_ARE_ADDR_EQUAL(&ron->ro_dst.sin6_addr, 334 &sin6_next->sin6_addr)) { 335 if (ron->ro_rt) { 336 rtfree(ron->ro_rt); 337 ron->ro_rt = NULL; 338 } 339 ron->ro_dst = *sin6_next; 340 ron->ro_tableid = rtableid; 341 } 342 if (ron->ro_rt == NULL) { 343 /* multi path case? */ 344 ron->ro_rt = rtalloc(sin6tosa(&ron->ro_dst), 345 RT_REPORT|RT_RESOLVE, ron->ro_tableid); 346 if (ron->ro_rt == NULL || 347 (ron->ro_rt->rt_flags & RTF_GATEWAY)) { 348 if (ron->ro_rt) { 349 rtfree(ron->ro_rt); 350 ron->ro_rt = NULL; 351 } 352 return (NULL); 353 } 354 } 355 if (!nd6_is_addr_neighbor(sin6_next, ron->ro_rt->rt_ifp)) { 356 rtfree(ron->ro_rt); 357 ron->ro_rt = NULL; 358 return (NULL); 359 } 360 361 return (ron->ro_rt); 362 } 363 364 /* 365 * Use a cached route if it exists and is valid, else try to allocate 366 * a new one. Note that we should check the address family of the 367 * cached destination, in case of sharing the cache with IPv4. 368 */ 369 if (ro) { 370 if (ro->ro_rt && 371 (!(ro->ro_rt->rt_flags & RTF_UP) || 372 sin6tosa(&ro->ro_dst)->sa_family != AF_INET6 || 373 !IN6_ARE_ADDR_EQUAL(&ro->ro_dst.sin6_addr, dst))) { 374 rtfree(ro->ro_rt); 375 ro->ro_rt = NULL; 376 } 377 if (ro->ro_rt == NULL) { 378 struct sockaddr_in6 *sa6; 379 380 /* No route yet, so try to acquire one */ 381 bzero(&ro->ro_dst, sizeof(struct sockaddr_in6)); 382 ro->ro_tableid = rtableid; 383 sa6 = &ro->ro_dst; 384 *sa6 = *dstsock; 385 sa6->sin6_scope_id = 0; 386 ro->ro_tableid = rtableid; 387 ro->ro_rt = rtalloc_mpath(sin6tosa(&ro->ro_dst), 388 NULL, ro->ro_tableid); 389 } 390 391 /* 392 * Check if the outgoing interface conflicts with 393 * the interface specified by ipi6_ifindex (if specified). 394 * Note that loopback interface is always okay. 395 * (this may happen when we are sending a packet to one of 396 * our own addresses.) 397 */ 398 if (opts && opts->ip6po_pktinfo && 399 opts->ip6po_pktinfo->ipi6_ifindex) { 400 if (ro->ro_rt != NULL && 401 (ro->ro_rt->rt_ifp->if_flags & IFF_LOOPBACK) == 0 && 402 ro->ro_rt->rt_ifp->if_index != 403 opts->ip6po_pktinfo->ipi6_ifindex) { 404 return (NULL); 405 } 406 } 407 408 return (ro->ro_rt); 409 } 410 411 return (NULL); 412} 413 414int 415in6_selectif(struct sockaddr_in6 *dstsock, struct ip6_pktopts *opts, 416 struct ip6_moptions *mopts, struct route_in6 *ro, struct ifnet **retifp, 417 u_int rtableid) 418{ 419 struct rtentry *rt = NULL; 420 struct in6_pktinfo *pi = NULL; 421 422 /* If the caller specify the outgoing interface explicitly, use it. */ 423 if (opts && (pi = opts->ip6po_pktinfo) != NULL && pi->ipi6_ifindex) { 424 *retifp = if_get(pi->ipi6_ifindex); 425 if (*retifp != NULL) 426 return (0); 427 } 428 429 /* 430 * If the destination address is a multicast address and the outgoing 431 * interface for the address is specified by the caller, use it. 432 */ 433 if (IN6_IS_ADDR_MULTICAST(&dstsock->sin6_addr) && 434 mopts != NULL && (*retifp = if_get(mopts->im6o_ifidx)) != NULL) 435 return (0); 436 437 rt = in6_selectroute(dstsock, opts, ro, rtableid); 438 if (rt == NULL) 439 return (EHOSTUNREACH); 440 441 /* 442 * do not use a rejected or black hole route. 443 * XXX: this check should be done in the L2 output routine. 444 * However, if we skipped this check here, we'd see the following 445 * scenario: 446 * - install a rejected route for a scoped address prefix 447 * (like fe80::/10) 448 * - send a packet to a destination that matches the scoped prefix, 449 * with ambiguity about the scope zone. 450 * - pick the outgoing interface from the route, and disambiguate the 451 * scope zone with the interface. 452 * - ip6_output() would try to get another route with the "new" 453 * destination, which may be valid. 454 * - we'd see no error on output. 455 * Although this may not be very harmful, it should still be confusing. 456 * We thus reject the case here. 457 */ 458 if (rt && (rt->rt_flags & (RTF_REJECT | RTF_BLACKHOLE))) 459 return (rt->rt_flags & RTF_HOST ? EHOSTUNREACH : ENETUNREACH); 460 461 /* 462 * Adjust the "outgoing" interface. If we're going to loop the packet 463 * back to ourselves, the ifp would be the loopback interface. 464 * However, we'd rather know the interface associated to the 465 * destination address (which should probably be one of our own 466 * addresses.) 467 */ 468 if (rt && rt->rt_ifa && rt->rt_ifa->ifa_ifp) 469 *retifp = if_ref(rt->rt_ifa->ifa_ifp); 470 471 return (0); 472} 473 474/* 475 * Default hop limit selection. The precedence is as follows: 476 * 1. Hoplimit value specified via ioctl. 477 * 2. (If the outgoing interface is detected) the current 478 * hop limit of the interface specified by router advertisement. 479 * 3. The system default hoplimit. 480*/ 481int 482in6_selecthlim(struct inpcb *in6p, struct ifnet *ifp) 483{ 484 if (in6p && in6p->inp_hops >= 0) 485 return (in6p->inp_hops); 486 else if (ifp) 487 return (ND_IFINFO(ifp)->chlim); 488 else 489 return (ip6_defhlim); 490} 491 492/* 493 * generate kernel-internal form (scopeid embedded into s6_addr16[1]). 494 * If the address scope of is link-local, embed the interface index in the 495 * address. The routine determines our precedence 496 * between advanced API scope/interface specification and basic API 497 * specification. 498 * 499 * this function should be nuked in the future, when we get rid of 500 * embedded scopeid thing. 501 * 502 * XXX actually, it is over-specification to return ifp against sin6_scope_id. 503 * there can be multiple interfaces that belong to a particular scope zone 504 * (in specification, we have 1:N mapping between a scope zone and interfaces). 505 * we may want to change the function to return something other than ifp. 506 */ 507int 508in6_embedscope(struct in6_addr *in6, const struct sockaddr_in6 *sin6, 509 struct inpcb *in6p) 510{ 511 struct ifnet *ifp = NULL; 512 u_int32_t scopeid; 513 514 *in6 = sin6->sin6_addr; 515 scopeid = sin6->sin6_scope_id; 516 517 /* 518 * don't try to read sin6->sin6_addr beyond here, since the caller may 519 * ask us to overwrite existing sockaddr_in6 520 */ 521 522 if (IN6_IS_SCOPE_EMBED(in6)) { 523 struct in6_pktinfo *pi; 524 525 /* 526 * KAME assumption: link id == interface id 527 */ 528 529 if (in6p && in6p->inp_outputopts6 && 530 (pi = in6p->inp_outputopts6->ip6po_pktinfo) && 531 pi->ipi6_ifindex) { 532 ifp = if_get(pi->ipi6_ifindex); 533 if (ifp == NULL) 534 return ENXIO; /* XXX EINVAL? */ 535 in6->s6_addr16[1] = htons(pi->ipi6_ifindex); 536 } else if (in6p && IN6_IS_ADDR_MULTICAST(in6) && 537 in6p->inp_moptions6 && 538 (ifp = if_get(in6p->inp_moptions6->im6o_ifidx))) { 539 in6->s6_addr16[1] = htons(ifp->if_index); 540 } else if (scopeid) { 541 ifp = if_get(scopeid); 542 if (ifp == NULL) 543 return ENXIO; /* XXX EINVAL? */ 544 /*XXX assignment to 16bit from 32bit variable */ 545 in6->s6_addr16[1] = htons(scopeid & 0xffff); 546 } 547 if_put(ifp); 548 } 549 550 return 0; 551} 552 553/* 554 * generate standard sockaddr_in6 from embedded form. 555 * touches sin6_addr and sin6_scope_id only. 556 * 557 * this function should be nuked in the future, when we get rid of 558 * embedded scopeid thing. 559 */ 560void 561in6_recoverscope(struct sockaddr_in6 *sin6, const struct in6_addr *in6) 562{ 563 u_int32_t scopeid; 564 565 sin6->sin6_addr = *in6; 566 567 /* 568 * don't try to read *in6 beyond here, since the caller may 569 * ask us to overwrite existing sockaddr_in6 570 */ 571 572 sin6->sin6_scope_id = 0; 573 if (IN6_IS_SCOPE_EMBED(in6)) { 574 /* 575 * KAME assumption: link id == interface id 576 */ 577 scopeid = ntohs(sin6->sin6_addr.s6_addr16[1]); 578 if (scopeid) { 579 sin6->sin6_addr.s6_addr16[1] = 0; 580 sin6->sin6_scope_id = scopeid; 581 } 582 } 583} 584 585/* 586 * just clear the embedded scope identifer. 587 */ 588void 589in6_clearscope(struct in6_addr *addr) 590{ 591 if (IN6_IS_SCOPE_EMBED(addr)) 592 addr->s6_addr16[1] = 0; 593} 594