if_vlan.c revision 241610
1/*- 2 * Copyright 1998 Massachusetts Institute of Technology 3 * 4 * Permission to use, copy, modify, and distribute this software and 5 * its documentation for any purpose and without fee is hereby 6 * granted, provided that both the above copyright notice and this 7 * permission notice appear in all copies, that both the above 8 * copyright notice and this permission notice appear in all 9 * supporting documentation, and that the name of M.I.T. not be used 10 * in advertising or publicity pertaining to distribution of the 11 * software without specific, written prior permission. M.I.T. makes 12 * no representations about the suitability of this software for any 13 * purpose. It is provided "as is" without express or implied 14 * warranty. 15 * 16 * THIS SOFTWARE IS PROVIDED BY M.I.T. ``AS IS''. M.I.T. DISCLAIMS 17 * ALL EXPRESS OR IMPLIED WARRANTIES WITH REGARD TO THIS SOFTWARE, 18 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF 19 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. IN NO EVENT 20 * SHALL M.I.T. BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 21 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 22 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF 23 * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND 24 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, 25 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT 26 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27 * SUCH DAMAGE. 28 */ 29 30/* 31 * if_vlan.c - pseudo-device driver for IEEE 802.1Q virtual LANs. 32 * Might be extended some day to also handle IEEE 802.1p priority 33 * tagging. This is sort of sneaky in the implementation, since 34 * we need to pretend to be enough of an Ethernet implementation 35 * to make arp work. The way we do this is by telling everyone 36 * that we are an Ethernet, and then catch the packets that 37 * ether_output() sends to us via if_transmit(), rewrite them for 38 * use by the real outgoing interface, and ask it to send them. 39 */ 40 41#include <sys/cdefs.h> 42__FBSDID("$FreeBSD: head/sys/net/if_vlan.c 241610 2012-10-16 13:37:54Z glebius $"); 43 44#include "opt_vlan.h" 45 46#include <sys/param.h> 47#include <sys/kernel.h> 48#include <sys/lock.h> 49#include <sys/malloc.h> 50#include <sys/mbuf.h> 51#include <sys/module.h> 52#include <sys/rwlock.h> 53#include <sys/queue.h> 54#include <sys/socket.h> 55#include <sys/sockio.h> 56#include <sys/sysctl.h> 57#include <sys/systm.h> 58#include <sys/sx.h> 59 60#include <net/bpf.h> 61#include <net/ethernet.h> 62#include <net/if.h> 63#include <net/if_clone.h> 64#include <net/if_dl.h> 65#include <net/if_types.h> 66#include <net/if_vlan_var.h> 67#include <net/vnet.h> 68 69#define VLAN_DEF_HWIDTH 4 70#define VLAN_IFFLAGS (IFF_BROADCAST | IFF_MULTICAST) 71 72#define UP_AND_RUNNING(ifp) \ 73 ((ifp)->if_flags & IFF_UP && (ifp)->if_drv_flags & IFF_DRV_RUNNING) 74 75LIST_HEAD(ifvlanhead, ifvlan); 76 77struct ifvlantrunk { 78 struct ifnet *parent; /* parent interface of this trunk */ 79 struct rwlock rw; 80#ifdef VLAN_ARRAY 81#define VLAN_ARRAY_SIZE (EVL_VLID_MASK + 1) 82 struct ifvlan *vlans[VLAN_ARRAY_SIZE]; /* static table */ 83#else 84 struct ifvlanhead *hash; /* dynamic hash-list table */ 85 uint16_t hmask; 86 uint16_t hwidth; 87#endif 88 int refcnt; 89}; 90 91struct vlan_mc_entry { 92 struct sockaddr_dl mc_addr; 93 SLIST_ENTRY(vlan_mc_entry) mc_entries; 94}; 95 96struct ifvlan { 97 struct ifvlantrunk *ifv_trunk; 98 struct ifnet *ifv_ifp; 99 void *ifv_cookie; 100#define TRUNK(ifv) ((ifv)->ifv_trunk) 101#define PARENT(ifv) ((ifv)->ifv_trunk->parent) 102 int ifv_pflags; /* special flags we have set on parent */ 103 struct ifv_linkmib { 104 int ifvm_encaplen; /* encapsulation length */ 105 int ifvm_mtufudge; /* MTU fudged by this much */ 106 int ifvm_mintu; /* min transmission unit */ 107 uint16_t ifvm_proto; /* encapsulation ethertype */ 108 uint16_t ifvm_tag; /* tag to apply on packets leaving if */ 109 } ifv_mib; 110 SLIST_HEAD(, vlan_mc_entry) vlan_mc_listhead; 111#ifndef VLAN_ARRAY 112 LIST_ENTRY(ifvlan) ifv_list; 113#endif 114}; 115#define ifv_proto ifv_mib.ifvm_proto 116#define ifv_vid ifv_mib.ifvm_tag 117#define ifv_encaplen ifv_mib.ifvm_encaplen 118#define ifv_mtufudge ifv_mib.ifvm_mtufudge 119#define ifv_mintu ifv_mib.ifvm_mintu 120 121/* Special flags we should propagate to parent. */ 122static struct { 123 int flag; 124 int (*func)(struct ifnet *, int); 125} vlan_pflags[] = { 126 {IFF_PROMISC, ifpromisc}, 127 {IFF_ALLMULTI, if_allmulti}, 128 {0, NULL} 129}; 130 131SYSCTL_DECL(_net_link); 132static SYSCTL_NODE(_net_link, IFT_L2VLAN, vlan, CTLFLAG_RW, 0, 133 "IEEE 802.1Q VLAN"); 134static SYSCTL_NODE(_net_link_vlan, PF_LINK, link, CTLFLAG_RW, 0, 135 "for consistency"); 136 137static int soft_pad = 0; 138SYSCTL_INT(_net_link_vlan, OID_AUTO, soft_pad, CTLFLAG_RW, &soft_pad, 0, 139 "pad short frames before tagging"); 140 141static const char vlanname[] = "vlan"; 142static MALLOC_DEFINE(M_VLAN, vlanname, "802.1Q Virtual LAN Interface"); 143 144static eventhandler_tag ifdetach_tag; 145static eventhandler_tag iflladdr_tag; 146 147/* 148 * We have a global mutex, that is used to serialize configuration 149 * changes and isn't used in normal packet delivery. 150 * 151 * We also have a per-trunk rwlock, that is locked shared on packet 152 * processing and exclusive when configuration is changed. 153 * 154 * The VLAN_ARRAY substitutes the dynamic hash with a static array 155 * with 4096 entries. In theory this can give a boost in processing, 156 * however on practice it does not. Probably this is because array 157 * is too big to fit into CPU cache. 158 */ 159static struct sx ifv_lock; 160#define VLAN_LOCK_INIT() sx_init(&ifv_lock, "vlan_global") 161#define VLAN_LOCK_DESTROY() sx_destroy(&ifv_lock) 162#define VLAN_LOCK_ASSERT() sx_assert(&ifv_lock, SA_LOCKED) 163#define VLAN_LOCK() sx_xlock(&ifv_lock) 164#define VLAN_UNLOCK() sx_xunlock(&ifv_lock) 165#define TRUNK_LOCK_INIT(trunk) rw_init(&(trunk)->rw, vlanname) 166#define TRUNK_LOCK_DESTROY(trunk) rw_destroy(&(trunk)->rw) 167#define TRUNK_LOCK(trunk) rw_wlock(&(trunk)->rw) 168#define TRUNK_UNLOCK(trunk) rw_wunlock(&(trunk)->rw) 169#define TRUNK_LOCK_ASSERT(trunk) rw_assert(&(trunk)->rw, RA_WLOCKED) 170#define TRUNK_RLOCK(trunk) rw_rlock(&(trunk)->rw) 171#define TRUNK_RUNLOCK(trunk) rw_runlock(&(trunk)->rw) 172#define TRUNK_LOCK_RASSERT(trunk) rw_assert(&(trunk)->rw, RA_RLOCKED) 173 174#ifndef VLAN_ARRAY 175static void vlan_inithash(struct ifvlantrunk *trunk); 176static void vlan_freehash(struct ifvlantrunk *trunk); 177static int vlan_inshash(struct ifvlantrunk *trunk, struct ifvlan *ifv); 178static int vlan_remhash(struct ifvlantrunk *trunk, struct ifvlan *ifv); 179static void vlan_growhash(struct ifvlantrunk *trunk, int howmuch); 180static __inline struct ifvlan * vlan_gethash(struct ifvlantrunk *trunk, 181 uint16_t vid); 182#endif 183static void trunk_destroy(struct ifvlantrunk *trunk); 184 185static void vlan_init(void *foo); 186static void vlan_input(struct ifnet *ifp, struct mbuf *m); 187static int vlan_ioctl(struct ifnet *ifp, u_long cmd, caddr_t addr); 188static void vlan_qflush(struct ifnet *ifp); 189static int vlan_setflag(struct ifnet *ifp, int flag, int status, 190 int (*func)(struct ifnet *, int)); 191static int vlan_setflags(struct ifnet *ifp, int status); 192static int vlan_setmulti(struct ifnet *ifp); 193static int vlan_transmit(struct ifnet *ifp, struct mbuf *m); 194static void vlan_unconfig(struct ifnet *ifp); 195static void vlan_unconfig_locked(struct ifnet *ifp, int departing); 196static int vlan_config(struct ifvlan *ifv, struct ifnet *p, uint16_t tag); 197static void vlan_link_state(struct ifnet *ifp); 198static void vlan_capabilities(struct ifvlan *ifv); 199static void vlan_trunk_capabilities(struct ifnet *ifp); 200 201static struct ifnet *vlan_clone_match_ethervid(struct if_clone *, 202 const char *, int *); 203static int vlan_clone_match(struct if_clone *, const char *); 204static int vlan_clone_create(struct if_clone *, char *, size_t, caddr_t); 205static int vlan_clone_destroy(struct if_clone *, struct ifnet *); 206 207static void vlan_ifdetach(void *arg, struct ifnet *ifp); 208static void vlan_iflladdr(void *arg, struct ifnet *ifp); 209 210static struct if_clone *vlan_cloner; 211 212#ifdef VIMAGE 213static VNET_DEFINE(struct if_clone *, vlan_cloner); 214#define V_vlan_cloner VNET(vlan_cloner) 215#endif 216 217#ifndef VLAN_ARRAY 218#define HASH(n, m) ((((n) >> 8) ^ ((n) >> 4) ^ (n)) & (m)) 219 220static void 221vlan_inithash(struct ifvlantrunk *trunk) 222{ 223 int i, n; 224 225 /* 226 * The trunk must not be locked here since we call malloc(M_WAITOK). 227 * It is OK in case this function is called before the trunk struct 228 * gets hooked up and becomes visible from other threads. 229 */ 230 231 KASSERT(trunk->hwidth == 0 && trunk->hash == NULL, 232 ("%s: hash already initialized", __func__)); 233 234 trunk->hwidth = VLAN_DEF_HWIDTH; 235 n = 1 << trunk->hwidth; 236 trunk->hmask = n - 1; 237 trunk->hash = malloc(sizeof(struct ifvlanhead) * n, M_VLAN, M_WAITOK); 238 for (i = 0; i < n; i++) 239 LIST_INIT(&trunk->hash[i]); 240} 241 242static void 243vlan_freehash(struct ifvlantrunk *trunk) 244{ 245#ifdef INVARIANTS 246 int i; 247 248 KASSERT(trunk->hwidth > 0, ("%s: hwidth not positive", __func__)); 249 for (i = 0; i < (1 << trunk->hwidth); i++) 250 KASSERT(LIST_EMPTY(&trunk->hash[i]), 251 ("%s: hash table not empty", __func__)); 252#endif 253 free(trunk->hash, M_VLAN); 254 trunk->hash = NULL; 255 trunk->hwidth = trunk->hmask = 0; 256} 257 258static int 259vlan_inshash(struct ifvlantrunk *trunk, struct ifvlan *ifv) 260{ 261 int i, b; 262 struct ifvlan *ifv2; 263 264 TRUNK_LOCK_ASSERT(trunk); 265 KASSERT(trunk->hwidth > 0, ("%s: hwidth not positive", __func__)); 266 267 b = 1 << trunk->hwidth; 268 i = HASH(ifv->ifv_vid, trunk->hmask); 269 LIST_FOREACH(ifv2, &trunk->hash[i], ifv_list) 270 if (ifv->ifv_vid == ifv2->ifv_vid) 271 return (EEXIST); 272 273 /* 274 * Grow the hash when the number of vlans exceeds half of the number of 275 * hash buckets squared. This will make the average linked-list length 276 * buckets/2. 277 */ 278 if (trunk->refcnt > (b * b) / 2) { 279 vlan_growhash(trunk, 1); 280 i = HASH(ifv->ifv_vid, trunk->hmask); 281 } 282 LIST_INSERT_HEAD(&trunk->hash[i], ifv, ifv_list); 283 trunk->refcnt++; 284 285 return (0); 286} 287 288static int 289vlan_remhash(struct ifvlantrunk *trunk, struct ifvlan *ifv) 290{ 291 int i, b; 292 struct ifvlan *ifv2; 293 294 TRUNK_LOCK_ASSERT(trunk); 295 KASSERT(trunk->hwidth > 0, ("%s: hwidth not positive", __func__)); 296 297 b = 1 << trunk->hwidth; 298 i = HASH(ifv->ifv_vid, trunk->hmask); 299 LIST_FOREACH(ifv2, &trunk->hash[i], ifv_list) 300 if (ifv2 == ifv) { 301 trunk->refcnt--; 302 LIST_REMOVE(ifv2, ifv_list); 303 if (trunk->refcnt < (b * b) / 2) 304 vlan_growhash(trunk, -1); 305 return (0); 306 } 307 308 panic("%s: vlan not found\n", __func__); 309 return (ENOENT); /*NOTREACHED*/ 310} 311 312/* 313 * Grow the hash larger or smaller if memory permits. 314 */ 315static void 316vlan_growhash(struct ifvlantrunk *trunk, int howmuch) 317{ 318 struct ifvlan *ifv; 319 struct ifvlanhead *hash2; 320 int hwidth2, i, j, n, n2; 321 322 TRUNK_LOCK_ASSERT(trunk); 323 KASSERT(trunk->hwidth > 0, ("%s: hwidth not positive", __func__)); 324 325 if (howmuch == 0) { 326 /* Harmless yet obvious coding error */ 327 printf("%s: howmuch is 0\n", __func__); 328 return; 329 } 330 331 hwidth2 = trunk->hwidth + howmuch; 332 n = 1 << trunk->hwidth; 333 n2 = 1 << hwidth2; 334 /* Do not shrink the table below the default */ 335 if (hwidth2 < VLAN_DEF_HWIDTH) 336 return; 337 338 /* M_NOWAIT because we're called with trunk mutex held */ 339 hash2 = malloc(sizeof(struct ifvlanhead) * n2, M_VLAN, M_NOWAIT); 340 if (hash2 == NULL) { 341 printf("%s: out of memory -- hash size not changed\n", 342 __func__); 343 return; /* We can live with the old hash table */ 344 } 345 for (j = 0; j < n2; j++) 346 LIST_INIT(&hash2[j]); 347 for (i = 0; i < n; i++) 348 while ((ifv = LIST_FIRST(&trunk->hash[i])) != NULL) { 349 LIST_REMOVE(ifv, ifv_list); 350 j = HASH(ifv->ifv_vid, n2 - 1); 351 LIST_INSERT_HEAD(&hash2[j], ifv, ifv_list); 352 } 353 free(trunk->hash, M_VLAN); 354 trunk->hash = hash2; 355 trunk->hwidth = hwidth2; 356 trunk->hmask = n2 - 1; 357 358 if (bootverbose) 359 if_printf(trunk->parent, 360 "VLAN hash table resized from %d to %d buckets\n", n, n2); 361} 362 363static __inline struct ifvlan * 364vlan_gethash(struct ifvlantrunk *trunk, uint16_t vid) 365{ 366 struct ifvlan *ifv; 367 368 TRUNK_LOCK_RASSERT(trunk); 369 370 LIST_FOREACH(ifv, &trunk->hash[HASH(vid, trunk->hmask)], ifv_list) 371 if (ifv->ifv_vid == vid) 372 return (ifv); 373 return (NULL); 374} 375 376#if 0 377/* Debugging code to view the hashtables. */ 378static void 379vlan_dumphash(struct ifvlantrunk *trunk) 380{ 381 int i; 382 struct ifvlan *ifv; 383 384 for (i = 0; i < (1 << trunk->hwidth); i++) { 385 printf("%d: ", i); 386 LIST_FOREACH(ifv, &trunk->hash[i], ifv_list) 387 printf("%s ", ifv->ifv_ifp->if_xname); 388 printf("\n"); 389 } 390} 391#endif /* 0 */ 392#else 393 394static __inline struct ifvlan * 395vlan_gethash(struct ifvlantrunk *trunk, uint16_t vid) 396{ 397 398 return trunk->vlans[vid]; 399} 400 401static __inline int 402vlan_inshash(struct ifvlantrunk *trunk, struct ifvlan *ifv) 403{ 404 405 if (trunk->vlans[ifv->ifv_vid] != NULL) 406 return EEXIST; 407 trunk->vlans[ifv->ifv_vid] = ifv; 408 trunk->refcnt++; 409 410 return (0); 411} 412 413static __inline int 414vlan_remhash(struct ifvlantrunk *trunk, struct ifvlan *ifv) 415{ 416 417 trunk->vlans[ifv->ifv_vid] = NULL; 418 trunk->refcnt--; 419 420 return (0); 421} 422 423static __inline void 424vlan_freehash(struct ifvlantrunk *trunk) 425{ 426} 427 428static __inline void 429vlan_inithash(struct ifvlantrunk *trunk) 430{ 431} 432 433#endif /* !VLAN_ARRAY */ 434 435static void 436trunk_destroy(struct ifvlantrunk *trunk) 437{ 438 VLAN_LOCK_ASSERT(); 439 440 TRUNK_LOCK(trunk); 441 vlan_freehash(trunk); 442 trunk->parent->if_vlantrunk = NULL; 443 TRUNK_UNLOCK(trunk); 444 TRUNK_LOCK_DESTROY(trunk); 445 free(trunk, M_VLAN); 446} 447 448/* 449 * Program our multicast filter. What we're actually doing is 450 * programming the multicast filter of the parent. This has the 451 * side effect of causing the parent interface to receive multicast 452 * traffic that it doesn't really want, which ends up being discarded 453 * later by the upper protocol layers. Unfortunately, there's no way 454 * to avoid this: there really is only one physical interface. 455 * 456 * XXX: There is a possible race here if more than one thread is 457 * modifying the multicast state of the vlan interface at the same time. 458 */ 459static int 460vlan_setmulti(struct ifnet *ifp) 461{ 462 struct ifnet *ifp_p; 463 struct ifmultiaddr *ifma, *rifma = NULL; 464 struct ifvlan *sc; 465 struct vlan_mc_entry *mc; 466 int error; 467 468 /*VLAN_LOCK_ASSERT();*/ 469 470 /* Find the parent. */ 471 sc = ifp->if_softc; 472 ifp_p = PARENT(sc); 473 474 CURVNET_SET_QUIET(ifp_p->if_vnet); 475 476 /* First, remove any existing filter entries. */ 477 while ((mc = SLIST_FIRST(&sc->vlan_mc_listhead)) != NULL) { 478 error = if_delmulti(ifp_p, (struct sockaddr *)&mc->mc_addr); 479 if (error) 480 return (error); 481 SLIST_REMOVE_HEAD(&sc->vlan_mc_listhead, mc_entries); 482 free(mc, M_VLAN); 483 } 484 485 /* Now program new ones. */ 486 TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 487 if (ifma->ifma_addr->sa_family != AF_LINK) 488 continue; 489 mc = malloc(sizeof(struct vlan_mc_entry), M_VLAN, M_NOWAIT); 490 if (mc == NULL) 491 return (ENOMEM); 492 bcopy(ifma->ifma_addr, &mc->mc_addr, ifma->ifma_addr->sa_len); 493 mc->mc_addr.sdl_index = ifp_p->if_index; 494 SLIST_INSERT_HEAD(&sc->vlan_mc_listhead, mc, mc_entries); 495 error = if_addmulti(ifp_p, (struct sockaddr *)&mc->mc_addr, 496 &rifma); 497 if (error) 498 return (error); 499 } 500 501 CURVNET_RESTORE(); 502 return (0); 503} 504 505/* 506 * A handler for parent interface link layer address changes. 507 * If the parent interface link layer address is changed we 508 * should also change it on all children vlans. 509 */ 510static void 511vlan_iflladdr(void *arg __unused, struct ifnet *ifp) 512{ 513 struct ifvlan *ifv; 514#ifndef VLAN_ARRAY 515 struct ifvlan *next; 516#endif 517 int i; 518 519 /* 520 * Check if it's a trunk interface first of all 521 * to avoid needless locking. 522 */ 523 if (ifp->if_vlantrunk == NULL) 524 return; 525 526 VLAN_LOCK(); 527 /* 528 * OK, it's a trunk. Loop over and change all vlan's lladdrs on it. 529 */ 530#ifdef VLAN_ARRAY 531 for (i = 0; i < VLAN_ARRAY_SIZE; i++) 532 if ((ifv = ifp->if_vlantrunk->vlans[i])) { 533#else /* VLAN_ARRAY */ 534 for (i = 0; i < (1 << ifp->if_vlantrunk->hwidth); i++) 535 LIST_FOREACH_SAFE(ifv, &ifp->if_vlantrunk->hash[i], ifv_list, next) { 536#endif /* VLAN_ARRAY */ 537 VLAN_UNLOCK(); 538 if_setlladdr(ifv->ifv_ifp, IF_LLADDR(ifp), 539 ifp->if_addrlen); 540 VLAN_LOCK(); 541 } 542 VLAN_UNLOCK(); 543 544} 545 546/* 547 * A handler for network interface departure events. 548 * Track departure of trunks here so that we don't access invalid 549 * pointers or whatever if a trunk is ripped from under us, e.g., 550 * by ejecting its hot-plug card. However, if an ifnet is simply 551 * being renamed, then there's no need to tear down the state. 552 */ 553static void 554vlan_ifdetach(void *arg __unused, struct ifnet *ifp) 555{ 556 struct ifvlan *ifv; 557 int i; 558 559 /* 560 * Check if it's a trunk interface first of all 561 * to avoid needless locking. 562 */ 563 if (ifp->if_vlantrunk == NULL) 564 return; 565 566 /* If the ifnet is just being renamed, don't do anything. */ 567 if (ifp->if_flags & IFF_RENAMING) 568 return; 569 570 VLAN_LOCK(); 571 /* 572 * OK, it's a trunk. Loop over and detach all vlan's on it. 573 * Check trunk pointer after each vlan_unconfig() as it will 574 * free it and set to NULL after the last vlan was detached. 575 */ 576#ifdef VLAN_ARRAY 577 for (i = 0; i < VLAN_ARRAY_SIZE; i++) 578 if ((ifv = ifp->if_vlantrunk->vlans[i])) { 579 vlan_unconfig_locked(ifv->ifv_ifp, 1); 580 if (ifp->if_vlantrunk == NULL) 581 break; 582 } 583#else /* VLAN_ARRAY */ 584restart: 585 for (i = 0; i < (1 << ifp->if_vlantrunk->hwidth); i++) 586 if ((ifv = LIST_FIRST(&ifp->if_vlantrunk->hash[i]))) { 587 vlan_unconfig_locked(ifv->ifv_ifp, 1); 588 if (ifp->if_vlantrunk) 589 goto restart; /* trunk->hwidth can change */ 590 else 591 break; 592 } 593#endif /* VLAN_ARRAY */ 594 /* Trunk should have been destroyed in vlan_unconfig(). */ 595 KASSERT(ifp->if_vlantrunk == NULL, ("%s: purge failed", __func__)); 596 VLAN_UNLOCK(); 597} 598 599/* 600 * Return the trunk device for a virtual interface. 601 */ 602static struct ifnet * 603vlan_trunkdev(struct ifnet *ifp) 604{ 605 struct ifvlan *ifv; 606 607 if (ifp->if_type != IFT_L2VLAN) 608 return (NULL); 609 ifv = ifp->if_softc; 610 ifp = NULL; 611 VLAN_LOCK(); 612 if (ifv->ifv_trunk) 613 ifp = PARENT(ifv); 614 VLAN_UNLOCK(); 615 return (ifp); 616} 617 618/* 619 * Return the 12-bit VLAN VID for this interface, for use by external 620 * components such as Infiniband. 621 * 622 * XXXRW: Note that the function name here is historical; it should be named 623 * vlan_vid(). 624 */ 625static int 626vlan_tag(struct ifnet *ifp, uint16_t *vidp) 627{ 628 struct ifvlan *ifv; 629 630 if (ifp->if_type != IFT_L2VLAN) 631 return (EINVAL); 632 ifv = ifp->if_softc; 633 *vidp = ifv->ifv_vid; 634 return (0); 635} 636 637/* 638 * Return a driver specific cookie for this interface. Synchronization 639 * with setcookie must be provided by the driver. 640 */ 641static void * 642vlan_cookie(struct ifnet *ifp) 643{ 644 struct ifvlan *ifv; 645 646 if (ifp->if_type != IFT_L2VLAN) 647 return (NULL); 648 ifv = ifp->if_softc; 649 return (ifv->ifv_cookie); 650} 651 652/* 653 * Store a cookie in our softc that drivers can use to store driver 654 * private per-instance data in. 655 */ 656static int 657vlan_setcookie(struct ifnet *ifp, void *cookie) 658{ 659 struct ifvlan *ifv; 660 661 if (ifp->if_type != IFT_L2VLAN) 662 return (EINVAL); 663 ifv = ifp->if_softc; 664 ifv->ifv_cookie = cookie; 665 return (0); 666} 667 668/* 669 * Return the vlan device present at the specific VID. 670 */ 671static struct ifnet * 672vlan_devat(struct ifnet *ifp, uint16_t vid) 673{ 674 struct ifvlantrunk *trunk; 675 struct ifvlan *ifv; 676 677 trunk = ifp->if_vlantrunk; 678 if (trunk == NULL) 679 return (NULL); 680 ifp = NULL; 681 TRUNK_RLOCK(trunk); 682 ifv = vlan_gethash(trunk, vid); 683 if (ifv) 684 ifp = ifv->ifv_ifp; 685 TRUNK_RUNLOCK(trunk); 686 return (ifp); 687} 688 689/* 690 * VLAN support can be loaded as a module. The only place in the 691 * system that's intimately aware of this is ether_input. We hook 692 * into this code through vlan_input_p which is defined there and 693 * set here. Noone else in the system should be aware of this so 694 * we use an explicit reference here. 695 */ 696extern void (*vlan_input_p)(struct ifnet *, struct mbuf *); 697 698/* For if_link_state_change() eyes only... */ 699extern void (*vlan_link_state_p)(struct ifnet *); 700 701static int 702vlan_modevent(module_t mod, int type, void *data) 703{ 704 705 switch (type) { 706 case MOD_LOAD: 707 ifdetach_tag = EVENTHANDLER_REGISTER(ifnet_departure_event, 708 vlan_ifdetach, NULL, EVENTHANDLER_PRI_ANY); 709 if (ifdetach_tag == NULL) 710 return (ENOMEM); 711 iflladdr_tag = EVENTHANDLER_REGISTER(iflladdr_event, 712 vlan_iflladdr, NULL, EVENTHANDLER_PRI_ANY); 713 if (iflladdr_tag == NULL) 714 return (ENOMEM); 715 VLAN_LOCK_INIT(); 716 vlan_input_p = vlan_input; 717 vlan_link_state_p = vlan_link_state; 718 vlan_trunk_cap_p = vlan_trunk_capabilities; 719 vlan_trunkdev_p = vlan_trunkdev; 720 vlan_cookie_p = vlan_cookie; 721 vlan_setcookie_p = vlan_setcookie; 722 vlan_tag_p = vlan_tag; 723 vlan_devat_p = vlan_devat; 724#ifndef VIMAGE 725 vlan_cloner = if_clone_advanced(vlanname, 0, vlan_clone_match, 726 vlan_clone_create, vlan_clone_destroy); 727#endif 728 if (bootverbose) 729 printf("vlan: initialized, using " 730#ifdef VLAN_ARRAY 731 "full-size arrays" 732#else 733 "hash tables with chaining" 734#endif 735 736 "\n"); 737 break; 738 case MOD_UNLOAD: 739#ifndef VIMAGE 740 if_clone_detach(vlan_cloner); 741#endif 742 EVENTHANDLER_DEREGISTER(ifnet_departure_event, ifdetach_tag); 743 EVENTHANDLER_DEREGISTER(iflladdr_event, iflladdr_tag); 744 vlan_input_p = NULL; 745 vlan_link_state_p = NULL; 746 vlan_trunk_cap_p = NULL; 747 vlan_trunkdev_p = NULL; 748 vlan_tag_p = NULL; 749 vlan_cookie_p = NULL; 750 vlan_setcookie_p = NULL; 751 vlan_devat_p = NULL; 752 VLAN_LOCK_DESTROY(); 753 if (bootverbose) 754 printf("vlan: unloaded\n"); 755 break; 756 default: 757 return (EOPNOTSUPP); 758 } 759 return (0); 760} 761 762static moduledata_t vlan_mod = { 763 "if_vlan", 764 vlan_modevent, 765 0 766}; 767 768DECLARE_MODULE(if_vlan, vlan_mod, SI_SUB_PSEUDO, SI_ORDER_ANY); 769MODULE_VERSION(if_vlan, 3); 770 771#ifdef VIMAGE 772static void 773vnet_vlan_init(const void *unused __unused) 774{ 775 776 vlan_cloner = if_clone_advanced(vlanname, 0, vlan_clone_match, 777 vlan_clone_create, vlan_clone_destroy); 778 V_vlan_cloner = vlan_cloner; 779} 780VNET_SYSINIT(vnet_vlan_init, SI_SUB_PROTO_IFATTACHDOMAIN, SI_ORDER_ANY, 781 vnet_vlan_init, NULL); 782 783static void 784vnet_vlan_uninit(const void *unused __unused) 785{ 786 787 if_clone_detach(V_vlan_cloner); 788} 789VNET_SYSUNINIT(vnet_vlan_uninit, SI_SUB_PROTO_IFATTACHDOMAIN, SI_ORDER_FIRST, 790 vnet_vlan_uninit, NULL); 791#endif 792 793static struct ifnet * 794vlan_clone_match_ethervid(struct if_clone *ifc, const char *name, int *vidp) 795{ 796 const char *cp; 797 struct ifnet *ifp; 798 int vid; 799 800 /* Check for <etherif>.<vlan> style interface names. */ 801 IFNET_RLOCK_NOSLEEP(); 802 TAILQ_FOREACH(ifp, &V_ifnet, if_link) { 803 /* 804 * We can handle non-ethernet hardware types as long as 805 * they handle the tagging and headers themselves. 806 */ 807 if (ifp->if_type != IFT_ETHER && 808 (ifp->if_capenable & IFCAP_VLAN_HWTAGGING) == 0) 809 continue; 810 if (strncmp(ifp->if_xname, name, strlen(ifp->if_xname)) != 0) 811 continue; 812 cp = name + strlen(ifp->if_xname); 813 if (*cp++ != '.') 814 continue; 815 if (*cp == '\0') 816 continue; 817 vid = 0; 818 for(; *cp >= '0' && *cp <= '9'; cp++) 819 vid = (vid * 10) + (*cp - '0'); 820 if (*cp != '\0') 821 continue; 822 if (vidp != NULL) 823 *vidp = vid; 824 break; 825 } 826 IFNET_RUNLOCK_NOSLEEP(); 827 828 return (ifp); 829} 830 831static int 832vlan_clone_match(struct if_clone *ifc, const char *name) 833{ 834 const char *cp; 835 836 if (vlan_clone_match_ethervid(ifc, name, NULL) != NULL) 837 return (1); 838 839 if (strncmp(vlanname, name, strlen(vlanname)) != 0) 840 return (0); 841 for (cp = name + 4; *cp != '\0'; cp++) { 842 if (*cp < '0' || *cp > '9') 843 return (0); 844 } 845 846 return (1); 847} 848 849static int 850vlan_clone_create(struct if_clone *ifc, char *name, size_t len, caddr_t params) 851{ 852 char *dp; 853 int wildcard; 854 int unit; 855 int error; 856 int vid; 857 int ethertag; 858 struct ifvlan *ifv; 859 struct ifnet *ifp; 860 struct ifnet *p; 861 struct ifaddr *ifa; 862 struct sockaddr_dl *sdl; 863 struct vlanreq vlr; 864 static const u_char eaddr[ETHER_ADDR_LEN]; /* 00:00:00:00:00:00 */ 865 866 /* 867 * There are 3 (ugh) ways to specify the cloned device: 868 * o pass a parameter block with the clone request. 869 * o specify parameters in the text of the clone device name 870 * o specify no parameters and get an unattached device that 871 * must be configured separately. 872 * The first technique is preferred; the latter two are 873 * supported for backwards compatibilty. 874 * 875 * XXXRW: Note historic use of the word "tag" here. New ioctls may be 876 * called for. 877 */ 878 if (params) { 879 error = copyin(params, &vlr, sizeof(vlr)); 880 if (error) 881 return error; 882 p = ifunit(vlr.vlr_parent); 883 if (p == NULL) 884 return ENXIO; 885 /* 886 * Don't let the caller set up a VLAN VID with 887 * anything except VLID bits. 888 */ 889 if (vlr.vlr_tag & ~EVL_VLID_MASK) 890 return (EINVAL); 891 error = ifc_name2unit(name, &unit); 892 if (error != 0) 893 return (error); 894 895 ethertag = 1; 896 vid = vlr.vlr_tag; 897 wildcard = (unit < 0); 898 } else if ((p = vlan_clone_match_ethervid(ifc, name, &vid)) != NULL) { 899 ethertag = 1; 900 unit = -1; 901 wildcard = 0; 902 903 /* 904 * Don't let the caller set up a VLAN VID with 905 * anything except VLID bits. 906 */ 907 if (vid & ~EVL_VLID_MASK) 908 return (EINVAL); 909 } else { 910 ethertag = 0; 911 912 error = ifc_name2unit(name, &unit); 913 if (error != 0) 914 return (error); 915 916 wildcard = (unit < 0); 917 } 918 919 error = ifc_alloc_unit(ifc, &unit); 920 if (error != 0) 921 return (error); 922 923 /* In the wildcard case, we need to update the name. */ 924 if (wildcard) { 925 for (dp = name; *dp != '\0'; dp++); 926 if (snprintf(dp, len - (dp-name), "%d", unit) > 927 len - (dp-name) - 1) { 928 panic("%s: interface name too long", __func__); 929 } 930 } 931 932 ifv = malloc(sizeof(struct ifvlan), M_VLAN, M_WAITOK | M_ZERO); 933 ifp = ifv->ifv_ifp = if_alloc(IFT_ETHER); 934 if (ifp == NULL) { 935 ifc_free_unit(ifc, unit); 936 free(ifv, M_VLAN); 937 return (ENOSPC); 938 } 939 SLIST_INIT(&ifv->vlan_mc_listhead); 940 941 ifp->if_softc = ifv; 942 /* 943 * Set the name manually rather than using if_initname because 944 * we don't conform to the default naming convention for interfaces. 945 */ 946 strlcpy(ifp->if_xname, name, IFNAMSIZ); 947 ifp->if_dname = vlanname; 948 ifp->if_dunit = unit; 949 /* NB: flags are not set here */ 950 ifp->if_linkmib = &ifv->ifv_mib; 951 ifp->if_linkmiblen = sizeof(ifv->ifv_mib); 952 /* NB: mtu is not set here */ 953 954 ifp->if_init = vlan_init; 955 ifp->if_transmit = vlan_transmit; 956 ifp->if_qflush = vlan_qflush; 957 ifp->if_ioctl = vlan_ioctl; 958 ifp->if_flags = VLAN_IFFLAGS; 959 ether_ifattach(ifp, eaddr); 960 /* Now undo some of the damage... */ 961 ifp->if_baudrate = 0; 962 ifp->if_type = IFT_L2VLAN; 963 ifp->if_hdrlen = ETHER_VLAN_ENCAP_LEN; 964 ifa = ifp->if_addr; 965 sdl = (struct sockaddr_dl *)ifa->ifa_addr; 966 sdl->sdl_type = IFT_L2VLAN; 967 968 if (ethertag) { 969 error = vlan_config(ifv, p, vid); 970 if (error != 0) { 971 /* 972 * Since we've partially failed, we need to back 973 * out all the way, otherwise userland could get 974 * confused. Thus, we destroy the interface. 975 */ 976 ether_ifdetach(ifp); 977 vlan_unconfig(ifp); 978 if_free(ifp); 979 ifc_free_unit(ifc, unit); 980 free(ifv, M_VLAN); 981 982 return (error); 983 } 984 985 /* Update flags on the parent, if necessary. */ 986 vlan_setflags(ifp, 1); 987 } 988 989 return (0); 990} 991 992static int 993vlan_clone_destroy(struct if_clone *ifc, struct ifnet *ifp) 994{ 995 struct ifvlan *ifv = ifp->if_softc; 996 int unit = ifp->if_dunit; 997 998 ether_ifdetach(ifp); /* first, remove it from system-wide lists */ 999 vlan_unconfig(ifp); /* now it can be unconfigured and freed */ 1000 if_free(ifp); 1001 free(ifv, M_VLAN); 1002 ifc_free_unit(ifc, unit); 1003 1004 return (0); 1005} 1006 1007/* 1008 * The ifp->if_init entry point for vlan(4) is a no-op. 1009 */ 1010static void 1011vlan_init(void *foo __unused) 1012{ 1013} 1014 1015/* 1016 * The if_transmit method for vlan(4) interface. 1017 */ 1018static int 1019vlan_transmit(struct ifnet *ifp, struct mbuf *m) 1020{ 1021 struct ifvlan *ifv; 1022 struct ifnet *p; 1023 int error, len, mcast; 1024 1025 ifv = ifp->if_softc; 1026 p = PARENT(ifv); 1027 len = m->m_pkthdr.len; 1028 mcast = (m->m_flags & (M_MCAST | M_BCAST)) ? 1 : 0; 1029 1030 BPF_MTAP(ifp, m); 1031 1032 /* 1033 * Do not run parent's if_transmit() if the parent is not up, 1034 * or parent's driver will cause a system crash. 1035 */ 1036 if (!UP_AND_RUNNING(p)) { 1037 m_freem(m); 1038 ifp->if_oerrors++; 1039 return (0); 1040 } 1041 1042 /* 1043 * Pad the frame to the minimum size allowed if told to. 1044 * This option is in accord with IEEE Std 802.1Q, 2003 Ed., 1045 * paragraph C.4.4.3.b. It can help to work around buggy 1046 * bridges that violate paragraph C.4.4.3.a from the same 1047 * document, i.e., fail to pad short frames after untagging. 1048 * E.g., a tagged frame 66 bytes long (incl. FCS) is OK, but 1049 * untagging it will produce a 62-byte frame, which is a runt 1050 * and requires padding. There are VLAN-enabled network 1051 * devices that just discard such runts instead or mishandle 1052 * them somehow. 1053 */ 1054 if (soft_pad && p->if_type == IFT_ETHER) { 1055 static char pad[8]; /* just zeros */ 1056 int n; 1057 1058 for (n = ETHERMIN + ETHER_HDR_LEN - m->m_pkthdr.len; 1059 n > 0; n -= sizeof(pad)) 1060 if (!m_append(m, min(n, sizeof(pad)), pad)) 1061 break; 1062 1063 if (n > 0) { 1064 if_printf(ifp, "cannot pad short frame\n"); 1065 ifp->if_oerrors++; 1066 m_freem(m); 1067 return (0); 1068 } 1069 } 1070 1071 /* 1072 * If underlying interface can do VLAN tag insertion itself, 1073 * just pass the packet along. However, we need some way to 1074 * tell the interface where the packet came from so that it 1075 * knows how to find the VLAN tag to use, so we attach a 1076 * packet tag that holds it. 1077 */ 1078 if (p->if_capenable & IFCAP_VLAN_HWTAGGING) { 1079 m->m_pkthdr.ether_vtag = ifv->ifv_vid; 1080 m->m_flags |= M_VLANTAG; 1081 } else { 1082 m = ether_vlanencap(m, ifv->ifv_vid); 1083 if (m == NULL) { 1084 if_printf(ifp, "unable to prepend VLAN header\n"); 1085 ifp->if_oerrors++; 1086 return (0); 1087 } 1088 } 1089 1090 /* 1091 * Send it, precisely as ether_output() would have. 1092 */ 1093 error = (p->if_transmit)(p, m); 1094 if (!error) { 1095 ifp->if_opackets++; 1096 ifp->if_omcasts += mcast; 1097 ifp->if_obytes += len; 1098 } else 1099 ifp->if_oerrors++; 1100 return (error); 1101} 1102 1103/* 1104 * The ifp->if_qflush entry point for vlan(4) is a no-op. 1105 */ 1106static void 1107vlan_qflush(struct ifnet *ifp __unused) 1108{ 1109} 1110 1111static void 1112vlan_input(struct ifnet *ifp, struct mbuf *m) 1113{ 1114 struct ifvlantrunk *trunk = ifp->if_vlantrunk; 1115 struct ifvlan *ifv; 1116 uint16_t vid; 1117 1118 KASSERT(trunk != NULL, ("%s: no trunk", __func__)); 1119 1120 if (m->m_flags & M_VLANTAG) { 1121 /* 1122 * Packet is tagged, but m contains a normal 1123 * Ethernet frame; the tag is stored out-of-band. 1124 */ 1125 vid = EVL_VLANOFTAG(m->m_pkthdr.ether_vtag); 1126 m->m_flags &= ~M_VLANTAG; 1127 } else { 1128 struct ether_vlan_header *evl; 1129 1130 /* 1131 * Packet is tagged in-band as specified by 802.1q. 1132 */ 1133 switch (ifp->if_type) { 1134 case IFT_ETHER: 1135 if (m->m_len < sizeof(*evl) && 1136 (m = m_pullup(m, sizeof(*evl))) == NULL) { 1137 if_printf(ifp, "cannot pullup VLAN header\n"); 1138 return; 1139 } 1140 evl = mtod(m, struct ether_vlan_header *); 1141 vid = EVL_VLANOFTAG(ntohs(evl->evl_tag)); 1142 1143 /* 1144 * Remove the 802.1q header by copying the Ethernet 1145 * addresses over it and adjusting the beginning of 1146 * the data in the mbuf. The encapsulated Ethernet 1147 * type field is already in place. 1148 */ 1149 bcopy((char *)evl, (char *)evl + ETHER_VLAN_ENCAP_LEN, 1150 ETHER_HDR_LEN - ETHER_TYPE_LEN); 1151 m_adj(m, ETHER_VLAN_ENCAP_LEN); 1152 break; 1153 1154 default: 1155#ifdef INVARIANTS 1156 panic("%s: %s has unsupported if_type %u", 1157 __func__, ifp->if_xname, ifp->if_type); 1158#endif 1159 m_freem(m); 1160 ifp->if_noproto++; 1161 return; 1162 } 1163 } 1164 1165 TRUNK_RLOCK(trunk); 1166 ifv = vlan_gethash(trunk, vid); 1167 if (ifv == NULL || !UP_AND_RUNNING(ifv->ifv_ifp)) { 1168 TRUNK_RUNLOCK(trunk); 1169 m_freem(m); 1170 ifp->if_noproto++; 1171 return; 1172 } 1173 TRUNK_RUNLOCK(trunk); 1174 1175 m->m_pkthdr.rcvif = ifv->ifv_ifp; 1176 ifv->ifv_ifp->if_ipackets++; 1177 1178 /* Pass it back through the parent's input routine. */ 1179 (*ifp->if_input)(ifv->ifv_ifp, m); 1180} 1181 1182static int 1183vlan_config(struct ifvlan *ifv, struct ifnet *p, uint16_t vid) 1184{ 1185 struct ifvlantrunk *trunk; 1186 struct ifnet *ifp; 1187 int error = 0; 1188 1189 /* VID numbers 0x0 and 0xFFF are reserved */ 1190 if (vid == 0 || vid == 0xFFF) 1191 return (EINVAL); 1192 if (p->if_type != IFT_ETHER && 1193 (p->if_capenable & IFCAP_VLAN_HWTAGGING) == 0) 1194 return (EPROTONOSUPPORT); 1195 if ((p->if_flags & VLAN_IFFLAGS) != VLAN_IFFLAGS) 1196 return (EPROTONOSUPPORT); 1197 if (ifv->ifv_trunk) 1198 return (EBUSY); 1199 1200 if (p->if_vlantrunk == NULL) { 1201 trunk = malloc(sizeof(struct ifvlantrunk), 1202 M_VLAN, M_WAITOK | M_ZERO); 1203 vlan_inithash(trunk); 1204 VLAN_LOCK(); 1205 if (p->if_vlantrunk != NULL) { 1206 /* A race that that is very unlikely to be hit. */ 1207 vlan_freehash(trunk); 1208 free(trunk, M_VLAN); 1209 goto exists; 1210 } 1211 TRUNK_LOCK_INIT(trunk); 1212 TRUNK_LOCK(trunk); 1213 p->if_vlantrunk = trunk; 1214 trunk->parent = p; 1215 } else { 1216 VLAN_LOCK(); 1217exists: 1218 trunk = p->if_vlantrunk; 1219 TRUNK_LOCK(trunk); 1220 } 1221 1222 ifv->ifv_vid = vid; /* must set this before vlan_inshash() */ 1223 error = vlan_inshash(trunk, ifv); 1224 if (error) 1225 goto done; 1226 ifv->ifv_proto = ETHERTYPE_VLAN; 1227 ifv->ifv_encaplen = ETHER_VLAN_ENCAP_LEN; 1228 ifv->ifv_mintu = ETHERMIN; 1229 ifv->ifv_pflags = 0; 1230 1231 /* 1232 * If the parent supports the VLAN_MTU capability, 1233 * i.e. can Tx/Rx larger than ETHER_MAX_LEN frames, 1234 * use it. 1235 */ 1236 if (p->if_capenable & IFCAP_VLAN_MTU) { 1237 /* 1238 * No need to fudge the MTU since the parent can 1239 * handle extended frames. 1240 */ 1241 ifv->ifv_mtufudge = 0; 1242 } else { 1243 /* 1244 * Fudge the MTU by the encapsulation size. This 1245 * makes us incompatible with strictly compliant 1246 * 802.1Q implementations, but allows us to use 1247 * the feature with other NetBSD implementations, 1248 * which might still be useful. 1249 */ 1250 ifv->ifv_mtufudge = ifv->ifv_encaplen; 1251 } 1252 1253 ifv->ifv_trunk = trunk; 1254 ifp = ifv->ifv_ifp; 1255 /* 1256 * Initialize fields from our parent. This duplicates some 1257 * work with ether_ifattach() but allows for non-ethernet 1258 * interfaces to also work. 1259 */ 1260 ifp->if_mtu = p->if_mtu - ifv->ifv_mtufudge; 1261 ifp->if_baudrate = p->if_baudrate; 1262 ifp->if_output = p->if_output; 1263 ifp->if_input = p->if_input; 1264 ifp->if_resolvemulti = p->if_resolvemulti; 1265 ifp->if_addrlen = p->if_addrlen; 1266 ifp->if_broadcastaddr = p->if_broadcastaddr; 1267 1268 /* 1269 * Copy only a selected subset of flags from the parent. 1270 * Other flags are none of our business. 1271 */ 1272#define VLAN_COPY_FLAGS (IFF_SIMPLEX) 1273 ifp->if_flags &= ~VLAN_COPY_FLAGS; 1274 ifp->if_flags |= p->if_flags & VLAN_COPY_FLAGS; 1275#undef VLAN_COPY_FLAGS 1276 1277 ifp->if_link_state = p->if_link_state; 1278 1279 vlan_capabilities(ifv); 1280 1281 /* 1282 * Set up our interface address to reflect the underlying 1283 * physical interface's. 1284 */ 1285 bcopy(IF_LLADDR(p), IF_LLADDR(ifp), p->if_addrlen); 1286 ((struct sockaddr_dl *)ifp->if_addr->ifa_addr)->sdl_alen = 1287 p->if_addrlen; 1288 1289 /* 1290 * Configure multicast addresses that may already be 1291 * joined on the vlan device. 1292 */ 1293 (void)vlan_setmulti(ifp); /* XXX: VLAN lock held */ 1294 1295 /* We are ready for operation now. */ 1296 ifp->if_drv_flags |= IFF_DRV_RUNNING; 1297done: 1298 TRUNK_UNLOCK(trunk); 1299 if (error == 0) 1300 EVENTHANDLER_INVOKE(vlan_config, p, ifv->ifv_vid); 1301 VLAN_UNLOCK(); 1302 1303 return (error); 1304} 1305 1306static void 1307vlan_unconfig(struct ifnet *ifp) 1308{ 1309 1310 VLAN_LOCK(); 1311 vlan_unconfig_locked(ifp, 0); 1312 VLAN_UNLOCK(); 1313} 1314 1315static void 1316vlan_unconfig_locked(struct ifnet *ifp, int departing) 1317{ 1318 struct ifvlantrunk *trunk; 1319 struct vlan_mc_entry *mc; 1320 struct ifvlan *ifv; 1321 struct ifnet *parent; 1322 int error; 1323 1324 VLAN_LOCK_ASSERT(); 1325 1326 ifv = ifp->if_softc; 1327 trunk = ifv->ifv_trunk; 1328 parent = NULL; 1329 1330 if (trunk != NULL) { 1331 1332 TRUNK_LOCK(trunk); 1333 parent = trunk->parent; 1334 1335 /* 1336 * Since the interface is being unconfigured, we need to 1337 * empty the list of multicast groups that we may have joined 1338 * while we were alive from the parent's list. 1339 */ 1340 while ((mc = SLIST_FIRST(&ifv->vlan_mc_listhead)) != NULL) { 1341 /* 1342 * If the parent interface is being detached, 1343 * all its multicast addresses have already 1344 * been removed. Warn about errors if 1345 * if_delmulti() does fail, but don't abort as 1346 * all callers expect vlan destruction to 1347 * succeed. 1348 */ 1349 if (!departing) { 1350 error = if_delmulti(parent, 1351 (struct sockaddr *)&mc->mc_addr); 1352 if (error) 1353 if_printf(ifp, 1354 "Failed to delete multicast address from parent: %d\n", 1355 error); 1356 } 1357 SLIST_REMOVE_HEAD(&ifv->vlan_mc_listhead, mc_entries); 1358 free(mc, M_VLAN); 1359 } 1360 1361 vlan_setflags(ifp, 0); /* clear special flags on parent */ 1362 vlan_remhash(trunk, ifv); 1363 ifv->ifv_trunk = NULL; 1364 1365 /* 1366 * Check if we were the last. 1367 */ 1368 if (trunk->refcnt == 0) { 1369 trunk->parent->if_vlantrunk = NULL; 1370 /* 1371 * XXXGL: If some ithread has already entered 1372 * vlan_input() and is now blocked on the trunk 1373 * lock, then it should preempt us right after 1374 * unlock and finish its work. Then we will acquire 1375 * lock again in trunk_destroy(). 1376 */ 1377 TRUNK_UNLOCK(trunk); 1378 trunk_destroy(trunk); 1379 } else 1380 TRUNK_UNLOCK(trunk); 1381 } 1382 1383 /* Disconnect from parent. */ 1384 if (ifv->ifv_pflags) 1385 if_printf(ifp, "%s: ifv_pflags unclean\n", __func__); 1386 ifp->if_mtu = ETHERMTU; 1387 ifp->if_link_state = LINK_STATE_UNKNOWN; 1388 ifp->if_drv_flags &= ~IFF_DRV_RUNNING; 1389 1390 /* 1391 * Only dispatch an event if vlan was 1392 * attached, otherwise there is nothing 1393 * to cleanup anyway. 1394 */ 1395 if (parent != NULL) 1396 EVENTHANDLER_INVOKE(vlan_unconfig, parent, ifv->ifv_vid); 1397} 1398 1399/* Handle a reference counted flag that should be set on the parent as well */ 1400static int 1401vlan_setflag(struct ifnet *ifp, int flag, int status, 1402 int (*func)(struct ifnet *, int)) 1403{ 1404 struct ifvlan *ifv; 1405 int error; 1406 1407 /* XXX VLAN_LOCK_ASSERT(); */ 1408 1409 ifv = ifp->if_softc; 1410 status = status ? (ifp->if_flags & flag) : 0; 1411 /* Now "status" contains the flag value or 0 */ 1412 1413 /* 1414 * See if recorded parent's status is different from what 1415 * we want it to be. If it is, flip it. We record parent's 1416 * status in ifv_pflags so that we won't clear parent's flag 1417 * we haven't set. In fact, we don't clear or set parent's 1418 * flags directly, but get or release references to them. 1419 * That's why we can be sure that recorded flags still are 1420 * in accord with actual parent's flags. 1421 */ 1422 if (status != (ifv->ifv_pflags & flag)) { 1423 error = (*func)(PARENT(ifv), status); 1424 if (error) 1425 return (error); 1426 ifv->ifv_pflags &= ~flag; 1427 ifv->ifv_pflags |= status; 1428 } 1429 return (0); 1430} 1431 1432/* 1433 * Handle IFF_* flags that require certain changes on the parent: 1434 * if "status" is true, update parent's flags respective to our if_flags; 1435 * if "status" is false, forcedly clear the flags set on parent. 1436 */ 1437static int 1438vlan_setflags(struct ifnet *ifp, int status) 1439{ 1440 int error, i; 1441 1442 for (i = 0; vlan_pflags[i].flag; i++) { 1443 error = vlan_setflag(ifp, vlan_pflags[i].flag, 1444 status, vlan_pflags[i].func); 1445 if (error) 1446 return (error); 1447 } 1448 return (0); 1449} 1450 1451/* Inform all vlans that their parent has changed link state */ 1452static void 1453vlan_link_state(struct ifnet *ifp) 1454{ 1455 struct ifvlantrunk *trunk = ifp->if_vlantrunk; 1456 struct ifvlan *ifv; 1457 int i; 1458 1459 TRUNK_LOCK(trunk); 1460#ifdef VLAN_ARRAY 1461 for (i = 0; i < VLAN_ARRAY_SIZE; i++) 1462 if (trunk->vlans[i] != NULL) { 1463 ifv = trunk->vlans[i]; 1464#else 1465 for (i = 0; i < (1 << trunk->hwidth); i++) 1466 LIST_FOREACH(ifv, &trunk->hash[i], ifv_list) { 1467#endif 1468 ifv->ifv_ifp->if_baudrate = trunk->parent->if_baudrate; 1469 if_link_state_change(ifv->ifv_ifp, 1470 trunk->parent->if_link_state); 1471 } 1472 TRUNK_UNLOCK(trunk); 1473} 1474 1475static void 1476vlan_capabilities(struct ifvlan *ifv) 1477{ 1478 struct ifnet *p = PARENT(ifv); 1479 struct ifnet *ifp = ifv->ifv_ifp; 1480 1481 TRUNK_LOCK_ASSERT(TRUNK(ifv)); 1482 1483 /* 1484 * If the parent interface can do checksum offloading 1485 * on VLANs, then propagate its hardware-assisted 1486 * checksumming flags. Also assert that checksum 1487 * offloading requires hardware VLAN tagging. 1488 */ 1489 if (p->if_capabilities & IFCAP_VLAN_HWCSUM) 1490 ifp->if_capabilities = p->if_capabilities & IFCAP_HWCSUM; 1491 1492 if (p->if_capenable & IFCAP_VLAN_HWCSUM && 1493 p->if_capenable & IFCAP_VLAN_HWTAGGING) { 1494 ifp->if_capenable = p->if_capenable & IFCAP_HWCSUM; 1495 ifp->if_hwassist = p->if_hwassist & (CSUM_IP | CSUM_TCP | 1496 CSUM_UDP | CSUM_SCTP | CSUM_IP_FRAGS | CSUM_FRAGMENT); 1497 } else { 1498 ifp->if_capenable = 0; 1499 ifp->if_hwassist = 0; 1500 } 1501 /* 1502 * If the parent interface can do TSO on VLANs then 1503 * propagate the hardware-assisted flag. TSO on VLANs 1504 * does not necessarily require hardware VLAN tagging. 1505 */ 1506 if (p->if_capabilities & IFCAP_VLAN_HWTSO) 1507 ifp->if_capabilities |= p->if_capabilities & IFCAP_TSO; 1508 if (p->if_capenable & IFCAP_VLAN_HWTSO) { 1509 ifp->if_capenable |= p->if_capenable & IFCAP_TSO; 1510 ifp->if_hwassist |= p->if_hwassist & CSUM_TSO; 1511 } else { 1512 ifp->if_capenable &= ~(p->if_capenable & IFCAP_TSO); 1513 ifp->if_hwassist &= ~(p->if_hwassist & CSUM_TSO); 1514 } 1515 1516 /* 1517 * If the parent interface can offload TCP connections over VLANs then 1518 * propagate its TOE capability to the VLAN interface. 1519 * 1520 * All TOE drivers in the tree today can deal with VLANs. If this 1521 * changes then IFCAP_VLAN_TOE should be promoted to a full capability 1522 * with its own bit. 1523 */ 1524#define IFCAP_VLAN_TOE IFCAP_TOE 1525 if (p->if_capabilities & IFCAP_VLAN_TOE) 1526 ifp->if_capabilities |= p->if_capabilities & IFCAP_TOE; 1527 if (p->if_capenable & IFCAP_VLAN_TOE) { 1528 TOEDEV(ifp) = TOEDEV(p); 1529 ifp->if_capenable |= p->if_capenable & IFCAP_TOE; 1530 } 1531} 1532 1533static void 1534vlan_trunk_capabilities(struct ifnet *ifp) 1535{ 1536 struct ifvlantrunk *trunk = ifp->if_vlantrunk; 1537 struct ifvlan *ifv; 1538 int i; 1539 1540 TRUNK_LOCK(trunk); 1541#ifdef VLAN_ARRAY 1542 for (i = 0; i < VLAN_ARRAY_SIZE; i++) 1543 if (trunk->vlans[i] != NULL) { 1544 ifv = trunk->vlans[i]; 1545#else 1546 for (i = 0; i < (1 << trunk->hwidth); i++) { 1547 LIST_FOREACH(ifv, &trunk->hash[i], ifv_list) 1548#endif 1549 vlan_capabilities(ifv); 1550 } 1551 TRUNK_UNLOCK(trunk); 1552} 1553 1554static int 1555vlan_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data) 1556{ 1557 struct ifnet *p; 1558 struct ifreq *ifr; 1559 struct ifaddr *ifa; 1560 struct ifvlan *ifv; 1561 struct vlanreq vlr; 1562 int error = 0; 1563 1564 ifr = (struct ifreq *)data; 1565 ifa = (struct ifaddr *) data; 1566 ifv = ifp->if_softc; 1567 1568 switch (cmd) { 1569 case SIOCSIFADDR: 1570 ifp->if_flags |= IFF_UP; 1571#ifdef INET 1572 if (ifa->ifa_addr->sa_family == AF_INET) 1573 arp_ifinit(ifp, ifa); 1574#endif 1575 break; 1576 case SIOCGIFADDR: 1577 { 1578 struct sockaddr *sa; 1579 1580 sa = (struct sockaddr *)&ifr->ifr_data; 1581 bcopy(IF_LLADDR(ifp), sa->sa_data, ifp->if_addrlen); 1582 } 1583 break; 1584 case SIOCGIFMEDIA: 1585 VLAN_LOCK(); 1586 if (TRUNK(ifv) != NULL) { 1587 p = PARENT(ifv); 1588 VLAN_UNLOCK(); 1589 error = (*p->if_ioctl)(p, SIOCGIFMEDIA, data); 1590 /* Limit the result to the parent's current config. */ 1591 if (error == 0) { 1592 struct ifmediareq *ifmr; 1593 1594 ifmr = (struct ifmediareq *)data; 1595 if (ifmr->ifm_count >= 1 && ifmr->ifm_ulist) { 1596 ifmr->ifm_count = 1; 1597 error = copyout(&ifmr->ifm_current, 1598 ifmr->ifm_ulist, 1599 sizeof(int)); 1600 } 1601 } 1602 } else { 1603 VLAN_UNLOCK(); 1604 error = EINVAL; 1605 } 1606 break; 1607 1608 case SIOCSIFMEDIA: 1609 error = EINVAL; 1610 break; 1611 1612 case SIOCSIFMTU: 1613 /* 1614 * Set the interface MTU. 1615 */ 1616 VLAN_LOCK(); 1617 if (TRUNK(ifv) != NULL) { 1618 if (ifr->ifr_mtu > 1619 (PARENT(ifv)->if_mtu - ifv->ifv_mtufudge) || 1620 ifr->ifr_mtu < 1621 (ifv->ifv_mintu - ifv->ifv_mtufudge)) 1622 error = EINVAL; 1623 else 1624 ifp->if_mtu = ifr->ifr_mtu; 1625 } else 1626 error = EINVAL; 1627 VLAN_UNLOCK(); 1628 break; 1629 1630 case SIOCSETVLAN: 1631#ifdef VIMAGE 1632 /* 1633 * XXXRW/XXXBZ: The goal in these checks is to allow a VLAN 1634 * interface to be delegated to a jail without allowing the 1635 * jail to change what underlying interface/VID it is 1636 * associated with. We are not entirely convinced that this 1637 * is the right way to accomplish that policy goal. 1638 */ 1639 if (ifp->if_vnet != ifp->if_home_vnet) { 1640 error = EPERM; 1641 break; 1642 } 1643#endif 1644 error = copyin(ifr->ifr_data, &vlr, sizeof(vlr)); 1645 if (error) 1646 break; 1647 if (vlr.vlr_parent[0] == '\0') { 1648 vlan_unconfig(ifp); 1649 break; 1650 } 1651 p = ifunit(vlr.vlr_parent); 1652 if (p == NULL) { 1653 error = ENOENT; 1654 break; 1655 } 1656 /* 1657 * Don't let the caller set up a VLAN VID with 1658 * anything except VLID bits. 1659 */ 1660 if (vlr.vlr_tag & ~EVL_VLID_MASK) { 1661 error = EINVAL; 1662 break; 1663 } 1664 error = vlan_config(ifv, p, vlr.vlr_tag); 1665 if (error) 1666 break; 1667 1668 /* Update flags on the parent, if necessary. */ 1669 vlan_setflags(ifp, 1); 1670 break; 1671 1672 case SIOCGETVLAN: 1673#ifdef VIMAGE 1674 if (ifp->if_vnet != ifp->if_home_vnet) { 1675 error = EPERM; 1676 break; 1677 } 1678#endif 1679 bzero(&vlr, sizeof(vlr)); 1680 VLAN_LOCK(); 1681 if (TRUNK(ifv) != NULL) { 1682 strlcpy(vlr.vlr_parent, PARENT(ifv)->if_xname, 1683 sizeof(vlr.vlr_parent)); 1684 vlr.vlr_tag = ifv->ifv_vid; 1685 } 1686 VLAN_UNLOCK(); 1687 error = copyout(&vlr, ifr->ifr_data, sizeof(vlr)); 1688 break; 1689 1690 case SIOCSIFFLAGS: 1691 /* 1692 * We should propagate selected flags to the parent, 1693 * e.g., promiscuous mode. 1694 */ 1695 if (TRUNK(ifv) != NULL) 1696 error = vlan_setflags(ifp, 1); 1697 break; 1698 1699 case SIOCADDMULTI: 1700 case SIOCDELMULTI: 1701 /* 1702 * If we don't have a parent, just remember the membership for 1703 * when we do. 1704 */ 1705 if (TRUNK(ifv) != NULL) 1706 error = vlan_setmulti(ifp); 1707 break; 1708 1709 default: 1710 error = EINVAL; 1711 break; 1712 } 1713 1714 return (error); 1715} 1716