if_gre.c revision 180639
1123992Ssobomax/* $NetBSD: if_gre.c,v 1.49 2003/12/11 00:22:29 itojun Exp $ */ 2103026Ssobomax/* $FreeBSD: head/sys/net/if_gre.c 180639 2008-07-20 21:45:15Z julian $ */ 3103026Ssobomax 4139823Simp/*- 5103026Ssobomax * Copyright (c) 1998 The NetBSD Foundation, Inc. 6103026Ssobomax * All rights reserved. 7103026Ssobomax * 8103026Ssobomax * This code is derived from software contributed to The NetBSD Foundation 9103026Ssobomax * by Heiko W.Rupp <hwr@pilhuhn.de> 10103026Ssobomax * 11148613Sbz * IPv6-over-GRE contributed by Gert Doering <gert@greenie.muc.de> 12148613Sbz * 13103026Ssobomax * Redistribution and use in source and binary forms, with or without 14103026Ssobomax * modification, are permitted provided that the following conditions 15103026Ssobomax * are met: 16103026Ssobomax * 1. Redistributions of source code must retain the above copyright 17103026Ssobomax * notice, this list of conditions and the following disclaimer. 18103026Ssobomax * 2. Redistributions in binary form must reproduce the above copyright 19103026Ssobomax * notice, this list of conditions and the following disclaimer in the 20103026Ssobomax * documentation and/or other materials provided with the distribution. 21103026Ssobomax * 3. All advertising materials mentioning features or use of this software 22103026Ssobomax * must display the following acknowledgement: 23103026Ssobomax * This product includes software developed by the NetBSD 24103026Ssobomax * Foundation, Inc. and its contributors. 25103026Ssobomax * 4. Neither the name of The NetBSD Foundation nor the names of its 26103026Ssobomax * contributors may be used to endorse or promote products derived 27103026Ssobomax * from this software without specific prior written permission. 28103026Ssobomax * 29103026Ssobomax * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 30103026Ssobomax * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 31103026Ssobomax * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 32103026Ssobomax * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 33103026Ssobomax * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 34103026Ssobomax * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 35103026Ssobomax * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 36103026Ssobomax * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 37103026Ssobomax * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 38103026Ssobomax * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 39103026Ssobomax * POSSIBILITY OF SUCH DAMAGE. 40103026Ssobomax */ 41103026Ssobomax 42103026Ssobomax/* 43103026Ssobomax * Encapsulate L3 protocols into IP 44148613Sbz * See RFC 2784 (successor of RFC 1701 and 1702) for more details. 45103026Ssobomax * If_gre is compatible with Cisco GRE tunnels, so you can 46103026Ssobomax * have a NetBSD box as the other end of a tunnel interface of a Cisco 47103026Ssobomax * router. See gre(4) for more details. 48103026Ssobomax * Also supported: IP in IP encaps (proto 55) as of RFC 2004 49103026Ssobomax */ 50103026Ssobomax 51103394Sbde#include "opt_atalk.h" 52103026Ssobomax#include "opt_inet.h" 53122699Sbms#include "opt_inet6.h" 54103026Ssobomax 55103026Ssobomax#include <sys/param.h> 56103026Ssobomax#include <sys/kernel.h> 57103026Ssobomax#include <sys/malloc.h> 58129880Sphk#include <sys/module.h> 59103026Ssobomax#include <sys/mbuf.h> 60164033Srwatson#include <sys/priv.h> 61178888Sjulian#include <sys/proc.h> 62103026Ssobomax#include <sys/protosw.h> 63103026Ssobomax#include <sys/socket.h> 64103026Ssobomax#include <sys/sockio.h> 65103026Ssobomax#include <sys/sysctl.h> 66103344Sbde#include <sys/systm.h> 67103026Ssobomax 68103026Ssobomax#include <net/ethernet.h> 69103026Ssobomax#include <net/if.h> 70130933Sbrooks#include <net/if_clone.h> 71103026Ssobomax#include <net/if_types.h> 72103026Ssobomax#include <net/route.h> 73103026Ssobomax 74103026Ssobomax#ifdef INET 75103026Ssobomax#include <netinet/in.h> 76103026Ssobomax#include <netinet/in_systm.h> 77103026Ssobomax#include <netinet/in_var.h> 78103026Ssobomax#include <netinet/ip.h> 79103026Ssobomax#include <netinet/ip_gre.h> 80103026Ssobomax#include <netinet/ip_var.h> 81103026Ssobomax#include <netinet/ip_encap.h> 82103026Ssobomax#else 83103026Ssobomax#error "Huh? if_gre without inet?" 84103026Ssobomax#endif 85103026Ssobomax 86103026Ssobomax#include <net/bpf.h> 87103026Ssobomax 88103026Ssobomax#include <net/if_gre.h> 89103026Ssobomax 90103026Ssobomax/* 91103026Ssobomax * It is not easy to calculate the right value for a GRE MTU. 92103026Ssobomax * We leave this task to the admin and use the same default that 93103026Ssobomax * other vendors use. 94103026Ssobomax */ 95103026Ssobomax#define GREMTU 1476 96103026Ssobomax 97103026Ssobomax#define GRENAME "gre" 98103026Ssobomax 99127307Srwatson/* 100127307Srwatson * gre_mtx protects all global variables in if_gre.c. 101127307Srwatson * XXX: gre_softc data not protected yet. 102127307Srwatson */ 103127307Srwatsonstruct mtx gre_mtx; 104103026Ssobomaxstatic MALLOC_DEFINE(M_GRE, GRENAME, "Generic Routing Encapsulation"); 105103026Ssobomax 106103026Ssobomaxstruct gre_softc_head gre_softc_list; 107103026Ssobomax 108160195Ssamstatic int gre_clone_create(struct if_clone *, int, caddr_t); 109105300Salfredstatic void gre_clone_destroy(struct ifnet *); 110103032Ssobomaxstatic int gre_ioctl(struct ifnet *, u_long, caddr_t); 111103032Ssobomaxstatic int gre_output(struct ifnet *, struct mbuf *, struct sockaddr *, 112103032Ssobomax struct rtentry *rt); 113103026Ssobomax 114130933SbrooksIFC_SIMPLE_DECLARE(gre, 0); 115103026Ssobomax 116103032Ssobomaxstatic int gre_compute_route(struct gre_softc *sc); 117103026Ssobomax 118105300Salfredstatic void greattach(void); 119103026Ssobomax 120103026Ssobomax#ifdef INET 121103026Ssobomaxextern struct domain inetdomain; 122152242Srustatic const struct protosw in_gre_protosw = { 123152242Sru .pr_type = SOCK_RAW, 124152242Sru .pr_domain = &inetdomain, 125152242Sru .pr_protocol = IPPROTO_GRE, 126152242Sru .pr_flags = PR_ATOMIC|PR_ADDR, 127154625Sbz .pr_input = gre_input, 128152242Sru .pr_output = (pr_output_t *)rip_output, 129152242Sru .pr_ctlinput = rip_ctlinput, 130152242Sru .pr_ctloutput = rip_ctloutput, 131152242Sru .pr_usrreqs = &rip_usrreqs 132103026Ssobomax}; 133152242Srustatic const struct protosw in_mobile_protosw = { 134152242Sru .pr_type = SOCK_RAW, 135152242Sru .pr_domain = &inetdomain, 136152242Sru .pr_protocol = IPPROTO_MOBILE, 137152242Sru .pr_flags = PR_ATOMIC|PR_ADDR, 138154625Sbz .pr_input = gre_mobile_input, 139152242Sru .pr_output = (pr_output_t *)rip_output, 140152242Sru .pr_ctlinput = rip_ctlinput, 141152242Sru .pr_ctloutput = rip_ctloutput, 142152242Sru .pr_usrreqs = &rip_usrreqs 143103026Ssobomax}; 144103026Ssobomax#endif 145103026Ssobomax 146103026SsobomaxSYSCTL_DECL(_net_link); 147123338SbmsSYSCTL_NODE(_net_link, IFT_TUNNEL, gre, CTLFLAG_RW, 0, 148103026Ssobomax "Generic Routing Encapsulation"); 149103026Ssobomax#ifndef MAX_GRE_NEST 150103026Ssobomax/* 151103026Ssobomax * This macro controls the default upper limitation on nesting of gre tunnels. 152103026Ssobomax * Since, setting a large value to this macro with a careless configuration 153103026Ssobomax * may introduce system crash, we don't allow any nestings by default. 154103026Ssobomax * If you need to configure nested gre tunnels, you can define this macro 155103026Ssobomax * in your kernel configuration file. However, if you do so, please be 156103026Ssobomax * careful to configure the tunnels so that it won't make a loop. 157103026Ssobomax */ 158103026Ssobomax#define MAX_GRE_NEST 1 159103026Ssobomax#endif 160103026Ssobomaxstatic int max_gre_nesting = MAX_GRE_NEST; 161103026SsobomaxSYSCTL_INT(_net_link_gre, OID_AUTO, max_nesting, CTLFLAG_RW, 162103026Ssobomax &max_gre_nesting, 0, "Max nested tunnels"); 163103026Ssobomax 164103026Ssobomax/* ARGSUSED */ 165103032Ssobomaxstatic void 166103026Ssobomaxgreattach(void) 167103026Ssobomax{ 168103026Ssobomax 169127307Srwatson mtx_init(&gre_mtx, "gre_mtx", NULL, MTX_DEF); 170103026Ssobomax LIST_INIT(&gre_softc_list); 171103026Ssobomax if_clone_attach(&gre_cloner); 172103026Ssobomax} 173103026Ssobomax 174103032Ssobomaxstatic int 175160195Ssamgre_clone_create(ifc, unit, params) 176103026Ssobomax struct if_clone *ifc; 177103026Ssobomax int unit; 178160195Ssam caddr_t params; 179103026Ssobomax{ 180103026Ssobomax struct gre_softc *sc; 181103026Ssobomax 182131673Sbms sc = malloc(sizeof(struct gre_softc), M_GRE, M_WAITOK | M_ZERO); 183103026Ssobomax 184147643Sbz GRE2IFP(sc) = if_alloc(IFT_TUNNEL); 185147643Sbz if (GRE2IFP(sc) == NULL) { 186147643Sbz free(sc, M_GRE); 187147643Sbz return (ENOSPC); 188147643Sbz } 189147643Sbz 190147643Sbz GRE2IFP(sc)->if_softc = sc; 191147256Sbrooks if_initname(GRE2IFP(sc), ifc->ifc_name, unit); 192147643Sbz 193147256Sbrooks GRE2IFP(sc)->if_snd.ifq_maxlen = IFQ_MAXLEN; 194147256Sbrooks GRE2IFP(sc)->if_addrlen = 0; 195147256Sbrooks GRE2IFP(sc)->if_hdrlen = 24; /* IP + GRE */ 196147256Sbrooks GRE2IFP(sc)->if_mtu = GREMTU; 197147256Sbrooks GRE2IFP(sc)->if_flags = IFF_POINTOPOINT|IFF_MULTICAST; 198147256Sbrooks GRE2IFP(sc)->if_output = gre_output; 199147256Sbrooks GRE2IFP(sc)->if_ioctl = gre_ioctl; 200103026Ssobomax sc->g_dst.s_addr = sc->g_src.s_addr = INADDR_ANY; 201103026Ssobomax sc->g_proto = IPPROTO_GRE; 202147256Sbrooks GRE2IFP(sc)->if_flags |= IFF_LINK0; 203103026Ssobomax sc->encap = NULL; 204103026Ssobomax sc->called = 0; 205178888Sjulian sc->gre_fibnum = curthread->td_proc->p_fibnum; 206125024Ssobomax sc->wccp_ver = WCCP_V1; 207179894Sthompsa sc->key = 0; 208147256Sbrooks if_attach(GRE2IFP(sc)); 209147256Sbrooks bpfattach(GRE2IFP(sc), DLT_NULL, sizeof(u_int32_t)); 210127307Srwatson mtx_lock(&gre_mtx); 211103026Ssobomax LIST_INSERT_HEAD(&gre_softc_list, sc, sc_list); 212127307Srwatson mtx_unlock(&gre_mtx); 213103026Ssobomax return (0); 214103026Ssobomax} 215103026Ssobomax 216103032Ssobomaxstatic void 217127307Srwatsongre_clone_destroy(ifp) 218127307Srwatson struct ifnet *ifp; 219127307Srwatson{ 220127307Srwatson struct gre_softc *sc = ifp->if_softc; 221127307Srwatson 222127307Srwatson mtx_lock(&gre_mtx); 223127307Srwatson LIST_REMOVE(sc, sc_list); 224127307Srwatson mtx_unlock(&gre_mtx); 225151266Sthompsa 226151266Sthompsa#ifdef INET 227151266Sthompsa if (sc->encap != NULL) 228151266Sthompsa encap_detach(sc->encap); 229151266Sthompsa#endif 230151266Sthompsa bpfdetach(ifp); 231151266Sthompsa if_detach(ifp); 232151266Sthompsa if_free(ifp); 233151266Sthompsa free(sc, M_GRE); 234127307Srwatson} 235127307Srwatson 236103026Ssobomax/* 237103026Ssobomax * The output routine. Takes a packet and encapsulates it in the protocol 238103026Ssobomax * given by sc->g_proto. See also RFC 1701 and RFC 2004 239103026Ssobomax */ 240103032Ssobomaxstatic int 241103026Ssobomaxgre_output(struct ifnet *ifp, struct mbuf *m, struct sockaddr *dst, 242103026Ssobomax struct rtentry *rt) 243103026Ssobomax{ 244103026Ssobomax int error = 0; 245103026Ssobomax struct gre_softc *sc = ifp->if_softc; 246103026Ssobomax struct greip *gh; 247103026Ssobomax struct ip *ip; 248180041Sjulian u_short gre_ip_id = 0; 249180041Sjulian uint8_t gre_ip_tos = 0; 250123992Ssobomax u_int16_t etype = 0; 251103026Ssobomax struct mobile_h mob_h; 252147611Sdwmalone u_int32_t af; 253180639Sjulian int extra = 0; 254103026Ssobomax 255103026Ssobomax /* 256103026Ssobomax * gre may cause infinite recursion calls when misconfigured. 257103026Ssobomax * We'll prevent this by introducing upper limit. 258103026Ssobomax */ 259103026Ssobomax if (++(sc->called) > max_gre_nesting) { 260103026Ssobomax printf("%s: gre_output: recursively called too many " 261147256Sbrooks "times(%d)\n", if_name(GRE2IFP(sc)), sc->called); 262103026Ssobomax m_freem(m); 263103026Ssobomax error = EIO; /* is there better errno? */ 264103026Ssobomax goto end; 265103026Ssobomax } 266103026Ssobomax 267148887Srwatson if (!((ifp->if_flags & IFF_UP) && 268148887Srwatson (ifp->if_drv_flags & IFF_DRV_RUNNING)) || 269103026Ssobomax sc->g_src.s_addr == INADDR_ANY || sc->g_dst.s_addr == INADDR_ANY) { 270103026Ssobomax m_freem(m); 271103026Ssobomax error = ENETDOWN; 272103026Ssobomax goto end; 273103026Ssobomax } 274103026Ssobomax 275103026Ssobomax gh = NULL; 276103026Ssobomax ip = NULL; 277103026Ssobomax 278147611Sdwmalone /* BPF writes need to be handled specially. */ 279147611Sdwmalone if (dst->sa_family == AF_UNSPEC) { 280147611Sdwmalone bcopy(dst->sa_data, &af, sizeof(af)); 281147611Sdwmalone dst->sa_family = af; 282147611Sdwmalone } 283147611Sdwmalone 284159180Scsjp if (bpf_peers_present(ifp->if_bpf)) { 285147611Sdwmalone af = dst->sa_family; 286123922Ssam bpf_mtap2(ifp->if_bpf, &af, sizeof(af), m); 287103026Ssobomax } 288103026Ssobomax 289103026Ssobomax m->m_flags &= ~(M_BCAST|M_MCAST); 290103026Ssobomax 291103026Ssobomax if (sc->g_proto == IPPROTO_MOBILE) { 292103026Ssobomax if (dst->sa_family == AF_INET) { 293103026Ssobomax struct mbuf *m0; 294103026Ssobomax int msiz; 295103026Ssobomax 296103026Ssobomax ip = mtod(m, struct ip *); 297103026Ssobomax 298103026Ssobomax /* 299103026Ssobomax * RFC2004 specifies that fragmented diagrams shouldn't 300103026Ssobomax * be encapsulated. 301103026Ssobomax */ 302158416Shsu if (ip->ip_off & (IP_MF | IP_OFFMASK)) { 303103026Ssobomax _IF_DROP(&ifp->if_snd); 304103026Ssobomax m_freem(m); 305103026Ssobomax error = EINVAL; /* is there better errno? */ 306103026Ssobomax goto end; 307103026Ssobomax } 308103026Ssobomax memset(&mob_h, 0, MOB_H_SIZ_L); 309103026Ssobomax mob_h.proto = (ip->ip_p) << 8; 310103026Ssobomax mob_h.odst = ip->ip_dst.s_addr; 311103026Ssobomax ip->ip_dst.s_addr = sc->g_dst.s_addr; 312103026Ssobomax 313103026Ssobomax /* 314103026Ssobomax * If the packet comes from our host, we only change 315103026Ssobomax * the destination address in the IP header. 316103026Ssobomax * Else we also need to save and change the source 317103026Ssobomax */ 318103026Ssobomax if (in_hosteq(ip->ip_src, sc->g_src)) { 319103026Ssobomax msiz = MOB_H_SIZ_S; 320103026Ssobomax } else { 321103026Ssobomax mob_h.proto |= MOB_H_SBIT; 322103026Ssobomax mob_h.osrc = ip->ip_src.s_addr; 323103026Ssobomax ip->ip_src.s_addr = sc->g_src.s_addr; 324103026Ssobomax msiz = MOB_H_SIZ_L; 325103026Ssobomax } 326103026Ssobomax mob_h.proto = htons(mob_h.proto); 327123992Ssobomax mob_h.hcrc = gre_in_cksum((u_int16_t *)&mob_h, msiz); 328103026Ssobomax 329103026Ssobomax if ((m->m_data - msiz) < m->m_pktdat) { 330103026Ssobomax /* need new mbuf */ 331151967Sandre MGETHDR(m0, M_DONTWAIT, MT_DATA); 332103026Ssobomax if (m0 == NULL) { 333103026Ssobomax _IF_DROP(&ifp->if_snd); 334103026Ssobomax m_freem(m); 335103026Ssobomax error = ENOBUFS; 336103026Ssobomax goto end; 337103026Ssobomax } 338103026Ssobomax m0->m_next = m; 339103026Ssobomax m->m_data += sizeof(struct ip); 340103026Ssobomax m->m_len -= sizeof(struct ip); 341103026Ssobomax m0->m_pkthdr.len = m->m_pkthdr.len + msiz; 342103026Ssobomax m0->m_len = msiz + sizeof(struct ip); 343103026Ssobomax m0->m_data += max_linkhdr; 344103026Ssobomax memcpy(mtod(m0, caddr_t), (caddr_t)ip, 345103026Ssobomax sizeof(struct ip)); 346103026Ssobomax m = m0; 347103026Ssobomax } else { /* we have some space left in the old one */ 348103026Ssobomax m->m_data -= msiz; 349103026Ssobomax m->m_len += msiz; 350103026Ssobomax m->m_pkthdr.len += msiz; 351103026Ssobomax bcopy(ip, mtod(m, caddr_t), 352103026Ssobomax sizeof(struct ip)); 353103026Ssobomax } 354103026Ssobomax ip = mtod(m, struct ip *); 355103026Ssobomax memcpy((caddr_t)(ip + 1), &mob_h, (unsigned)msiz); 356103026Ssobomax ip->ip_len = ntohs(ip->ip_len) + msiz; 357103026Ssobomax } else { /* AF_INET */ 358103026Ssobomax _IF_DROP(&ifp->if_snd); 359103026Ssobomax m_freem(m); 360103026Ssobomax error = EINVAL; 361103026Ssobomax goto end; 362103026Ssobomax } 363103026Ssobomax } else if (sc->g_proto == IPPROTO_GRE) { 364103026Ssobomax switch (dst->sa_family) { 365103026Ssobomax case AF_INET: 366103026Ssobomax ip = mtod(m, struct ip *); 367180041Sjulian gre_ip_tos = ip->ip_tos; 368180041Sjulian gre_ip_id = ip->ip_id; 369180639Sjulian if (sc->wccp_ver == WCCP_V2) { 370180639Sjulian extra = sizeof(uint32_t); 371180639Sjulian etype = WCCP_PROTOCOL_TYPE; 372180639Sjulian } else { 373180639Sjulian etype = ETHERTYPE_IP; 374180639Sjulian } 375103026Ssobomax break; 376148613Sbz#ifdef INET6 377148613Sbz case AF_INET6: 378180041Sjulian gre_ip_id = ip_newid(); 379148613Sbz etype = ETHERTYPE_IPV6; 380148613Sbz break; 381148613Sbz#endif 382103026Ssobomax#ifdef NETATALK 383103026Ssobomax case AF_APPLETALK: 384103026Ssobomax etype = ETHERTYPE_ATALK; 385103026Ssobomax break; 386103026Ssobomax#endif 387103026Ssobomax default: 388103026Ssobomax _IF_DROP(&ifp->if_snd); 389103026Ssobomax m_freem(m); 390103026Ssobomax error = EAFNOSUPPORT; 391103026Ssobomax goto end; 392103026Ssobomax } 393179894Sthompsa 394179894Sthompsa /* Reserve space for GRE header + optional GRE key */ 395180639Sjulian int hdrlen = sizeof(struct greip) + extra; 396179894Sthompsa if (sc->key) 397179894Sthompsa hdrlen += sizeof(uint32_t); 398179894Sthompsa M_PREPEND(m, hdrlen, M_DONTWAIT); 399103026Ssobomax } else { 400103026Ssobomax _IF_DROP(&ifp->if_snd); 401103026Ssobomax m_freem(m); 402103026Ssobomax error = EINVAL; 403103026Ssobomax goto end; 404103026Ssobomax } 405103026Ssobomax 406128580Sandre if (m == NULL) { /* mbuf allocation failed */ 407103026Ssobomax _IF_DROP(&ifp->if_snd); 408103026Ssobomax error = ENOBUFS; 409103026Ssobomax goto end; 410103026Ssobomax } 411103026Ssobomax 412178888Sjulian M_SETFIB(m, sc->gre_fibnum); /* The envelope may use a different FIB */ 413178888Sjulian 414103026Ssobomax gh = mtod(m, struct greip *); 415103026Ssobomax if (sc->g_proto == IPPROTO_GRE) { 416179894Sthompsa uint32_t *options = gh->gi_options; 417179894Sthompsa 418180639Sjulian memset((void *)gh, 0, sizeof(struct greip) + extra); 419103026Ssobomax gh->gi_ptype = htons(etype); 420179894Sthompsa gh->gi_flags = 0; 421179894Sthompsa 422179894Sthompsa /* Add key option */ 423179894Sthompsa if (sc->key) 424179894Sthompsa { 425179894Sthompsa gh->gi_flags |= htons(GRE_KP); 426179894Sthompsa *(options++) = htonl(sc->key); 427179894Sthompsa } 428103026Ssobomax } 429103026Ssobomax 430103026Ssobomax gh->gi_pr = sc->g_proto; 431103026Ssobomax if (sc->g_proto != IPPROTO_MOBILE) { 432103026Ssobomax gh->gi_src = sc->g_src; 433103026Ssobomax gh->gi_dst = sc->g_dst; 434133163Ssobomax ((struct ip*)gh)->ip_v = IPPROTO_IPV4; 435103026Ssobomax ((struct ip*)gh)->ip_hl = (sizeof(struct ip)) >> 2; 436103032Ssobomax ((struct ip*)gh)->ip_ttl = GRE_TTL; 437180041Sjulian ((struct ip*)gh)->ip_tos = gre_ip_tos; 438180041Sjulian ((struct ip*)gh)->ip_id = gre_ip_id; 439125226Ssobomax gh->gi_len = m->m_pkthdr.len; 440103026Ssobomax } 441103026Ssobomax 442103026Ssobomax ifp->if_opackets++; 443103026Ssobomax ifp->if_obytes += m->m_pkthdr.len; 444128583Sandre /* 445128583Sandre * Send it off and with IP_FORWARD flag to prevent it from 446128583Sandre * overwriting the ip_id again. ip_id is already set to the 447128583Sandre * ip_id of the encapsulated packet. 448128583Sandre */ 449128580Sandre error = ip_output(m, NULL, &sc->route, IP_FORWARDING, 450123992Ssobomax (struct ip_moptions *)NULL, (struct inpcb *)NULL); 451103026Ssobomax end: 452103026Ssobomax sc->called = 0; 453103026Ssobomax if (error) 454103026Ssobomax ifp->if_oerrors++; 455103026Ssobomax return (error); 456103026Ssobomax} 457103026Ssobomax 458103032Ssobomaxstatic int 459103026Ssobomaxgre_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data) 460103026Ssobomax{ 461103026Ssobomax struct ifreq *ifr = (struct ifreq *)data; 462103026Ssobomax struct if_laddrreq *lifr = (struct if_laddrreq *)data; 463103026Ssobomax struct in_aliasreq *aifr = (struct in_aliasreq *)data; 464103026Ssobomax struct gre_softc *sc = ifp->if_softc; 465103026Ssobomax int s; 466103026Ssobomax struct sockaddr_in si; 467103026Ssobomax struct sockaddr *sa = NULL; 468179894Sthompsa int error, adj; 469103026Ssobomax struct sockaddr_in sp, sm, dp, dm; 470179894Sthompsa uint32_t key; 471103026Ssobomax 472103026Ssobomax error = 0; 473179894Sthompsa adj = 0; 474103026Ssobomax 475103026Ssobomax s = splnet(); 476103026Ssobomax switch (cmd) { 477103026Ssobomax case SIOCSIFADDR: 478103026Ssobomax ifp->if_flags |= IFF_UP; 479103026Ssobomax break; 480125020Ssobomax case SIOCSIFDSTADDR: 481103026Ssobomax break; 482103026Ssobomax case SIOCSIFFLAGS: 483164033Srwatson /* 484171056Srwatson * XXXRW: Isn't this priv_check() redundant to the ifnet 485171056Srwatson * layer check? 486164033Srwatson */ 487164033Srwatson if ((error = priv_check(curthread, PRIV_NET_SETIFFLAGS)) != 0) 488103026Ssobomax break; 489103026Ssobomax if ((ifr->ifr_flags & IFF_LINK0) != 0) 490103026Ssobomax sc->g_proto = IPPROTO_GRE; 491103026Ssobomax else 492103026Ssobomax sc->g_proto = IPPROTO_MOBILE; 493125024Ssobomax if ((ifr->ifr_flags & IFF_LINK2) != 0) 494125024Ssobomax sc->wccp_ver = WCCP_V2; 495125024Ssobomax else 496125024Ssobomax sc->wccp_ver = WCCP_V1; 497103026Ssobomax goto recompute; 498103026Ssobomax case SIOCSIFMTU: 499164033Srwatson /* 500171056Srwatson * XXXRW: Isn't this priv_check() redundant to the ifnet 501171056Srwatson * layer check? 502164033Srwatson */ 503164033Srwatson if ((error = priv_check(curthread, PRIV_NET_SETIFMTU)) != 0) 504103026Ssobomax break; 505103026Ssobomax if (ifr->ifr_mtu < 576) { 506103026Ssobomax error = EINVAL; 507103026Ssobomax break; 508103026Ssobomax } 509103026Ssobomax ifp->if_mtu = ifr->ifr_mtu; 510103026Ssobomax break; 511103026Ssobomax case SIOCGIFMTU: 512147256Sbrooks ifr->ifr_mtu = GRE2IFP(sc)->if_mtu; 513103026Ssobomax break; 514103026Ssobomax case SIOCADDMULTI: 515164033Srwatson /* 516171056Srwatson * XXXRW: Isn't this priv_checkr() redundant to the ifnet 517171056Srwatson * layer check? 518164033Srwatson */ 519164033Srwatson if ((error = priv_check(curthread, PRIV_NET_ADDMULTI)) != 0) 520164033Srwatson break; 521164033Srwatson if (ifr == 0) { 522164033Srwatson error = EAFNOSUPPORT; 523164033Srwatson break; 524164033Srwatson } 525164033Srwatson switch (ifr->ifr_addr.sa_family) { 526164033Srwatson#ifdef INET 527164033Srwatson case AF_INET: 528164033Srwatson break; 529164033Srwatson#endif 530164033Srwatson#ifdef INET6 531164033Srwatson case AF_INET6: 532164033Srwatson break; 533164033Srwatson#endif 534164033Srwatson default: 535164033Srwatson error = EAFNOSUPPORT; 536164033Srwatson break; 537164033Srwatson } 538164033Srwatson break; 539103026Ssobomax case SIOCDELMULTI: 540164033Srwatson /* 541171056Srwatson * XXXRW: Isn't this priv_check() redundant to the ifnet 542171056Srwatson * layer check? 543164033Srwatson */ 544164033Srwatson if ((error = priv_check(curthread, PRIV_NET_DELIFGROUP)) != 0) 545103026Ssobomax break; 546103026Ssobomax if (ifr == 0) { 547103026Ssobomax error = EAFNOSUPPORT; 548103026Ssobomax break; 549103026Ssobomax } 550103026Ssobomax switch (ifr->ifr_addr.sa_family) { 551103026Ssobomax#ifdef INET 552103026Ssobomax case AF_INET: 553103026Ssobomax break; 554103026Ssobomax#endif 555148613Sbz#ifdef INET6 556148613Sbz case AF_INET6: 557148613Sbz break; 558148613Sbz#endif 559103026Ssobomax default: 560103026Ssobomax error = EAFNOSUPPORT; 561103026Ssobomax break; 562103026Ssobomax } 563103026Ssobomax break; 564103026Ssobomax case GRESPROTO: 565164033Srwatson /* 566171056Srwatson * XXXRW: Isn't this priv_check() redundant to the ifnet 567171056Srwatson * layer check? 568164033Srwatson */ 569164033Srwatson if ((error = priv_check(curthread, PRIV_NET_GRE)) != 0) 570103026Ssobomax break; 571103026Ssobomax sc->g_proto = ifr->ifr_flags; 572103026Ssobomax switch (sc->g_proto) { 573103026Ssobomax case IPPROTO_GRE: 574103026Ssobomax ifp->if_flags |= IFF_LINK0; 575103026Ssobomax break; 576103026Ssobomax case IPPROTO_MOBILE: 577103026Ssobomax ifp->if_flags &= ~IFF_LINK0; 578103026Ssobomax break; 579103026Ssobomax default: 580103026Ssobomax error = EPROTONOSUPPORT; 581103026Ssobomax break; 582103026Ssobomax } 583103026Ssobomax goto recompute; 584103026Ssobomax case GREGPROTO: 585103026Ssobomax ifr->ifr_flags = sc->g_proto; 586103026Ssobomax break; 587103026Ssobomax case GRESADDRS: 588103026Ssobomax case GRESADDRD: 589164033Srwatson error = priv_check(curthread, PRIV_NET_GRE); 590164033Srwatson if (error) 591164033Srwatson return (error); 592103026Ssobomax /* 593103026Ssobomax * set tunnel endpoints, compute a less specific route 594103026Ssobomax * to the remote end and mark if as up 595103026Ssobomax */ 596103026Ssobomax sa = &ifr->ifr_addr; 597103026Ssobomax if (cmd == GRESADDRS) 598103026Ssobomax sc->g_src = (satosin(sa))->sin_addr; 599103026Ssobomax if (cmd == GRESADDRD) 600103026Ssobomax sc->g_dst = (satosin(sa))->sin_addr; 601103026Ssobomax recompute: 602103026Ssobomax#ifdef INET 603103026Ssobomax if (sc->encap != NULL) { 604103026Ssobomax encap_detach(sc->encap); 605103026Ssobomax sc->encap = NULL; 606103026Ssobomax } 607103026Ssobomax#endif 608103026Ssobomax if ((sc->g_src.s_addr != INADDR_ANY) && 609103026Ssobomax (sc->g_dst.s_addr != INADDR_ANY)) { 610103026Ssobomax bzero(&sp, sizeof(sp)); 611103026Ssobomax bzero(&sm, sizeof(sm)); 612103026Ssobomax bzero(&dp, sizeof(dp)); 613103026Ssobomax bzero(&dm, sizeof(dm)); 614103026Ssobomax sp.sin_len = sm.sin_len = dp.sin_len = dm.sin_len = 615103026Ssobomax sizeof(struct sockaddr_in); 616103026Ssobomax sp.sin_family = sm.sin_family = dp.sin_family = 617103026Ssobomax dm.sin_family = AF_INET; 618103026Ssobomax sp.sin_addr = sc->g_src; 619103026Ssobomax dp.sin_addr = sc->g_dst; 620125020Ssobomax sm.sin_addr.s_addr = dm.sin_addr.s_addr = 621103026Ssobomax INADDR_BROADCAST; 622103026Ssobomax#ifdef INET 623103026Ssobomax sc->encap = encap_attach(AF_INET, sc->g_proto, 624103026Ssobomax sintosa(&sp), sintosa(&sm), sintosa(&dp), 625103026Ssobomax sintosa(&dm), (sc->g_proto == IPPROTO_GRE) ? 626103026Ssobomax &in_gre_protosw : &in_mobile_protosw, sc); 627103026Ssobomax if (sc->encap == NULL) 628103026Ssobomax printf("%s: unable to attach encap\n", 629147256Sbrooks if_name(GRE2IFP(sc))); 630103026Ssobomax#endif 631103026Ssobomax if (sc->route.ro_rt != 0) /* free old route */ 632103026Ssobomax RTFREE(sc->route.ro_rt); 633103026Ssobomax if (gre_compute_route(sc) == 0) 634148887Srwatson ifp->if_drv_flags |= IFF_DRV_RUNNING; 635103026Ssobomax else 636148887Srwatson ifp->if_drv_flags &= ~IFF_DRV_RUNNING; 637103026Ssobomax } 638103026Ssobomax break; 639103026Ssobomax case GREGADDRS: 640103026Ssobomax memset(&si, 0, sizeof(si)); 641103026Ssobomax si.sin_family = AF_INET; 642103026Ssobomax si.sin_len = sizeof(struct sockaddr_in); 643103026Ssobomax si.sin_addr.s_addr = sc->g_src.s_addr; 644103026Ssobomax sa = sintosa(&si); 645103026Ssobomax ifr->ifr_addr = *sa; 646103026Ssobomax break; 647103026Ssobomax case GREGADDRD: 648103026Ssobomax memset(&si, 0, sizeof(si)); 649103026Ssobomax si.sin_family = AF_INET; 650103026Ssobomax si.sin_len = sizeof(struct sockaddr_in); 651103026Ssobomax si.sin_addr.s_addr = sc->g_dst.s_addr; 652103026Ssobomax sa = sintosa(&si); 653103026Ssobomax ifr->ifr_addr = *sa; 654103026Ssobomax break; 655103026Ssobomax case SIOCSIFPHYADDR: 656164033Srwatson /* 657171056Srwatson * XXXRW: Isn't this priv_check() redundant to the ifnet 658171056Srwatson * layer check? 659164033Srwatson */ 660164033Srwatson if ((error = priv_check(curthread, PRIV_NET_SETIFPHYS)) != 0) 661103026Ssobomax break; 662103026Ssobomax if (aifr->ifra_addr.sin_family != AF_INET || 663103026Ssobomax aifr->ifra_dstaddr.sin_family != AF_INET) { 664103026Ssobomax error = EAFNOSUPPORT; 665103026Ssobomax break; 666103026Ssobomax } 667103026Ssobomax if (aifr->ifra_addr.sin_len != sizeof(si) || 668103026Ssobomax aifr->ifra_dstaddr.sin_len != sizeof(si)) { 669103026Ssobomax error = EINVAL; 670103026Ssobomax break; 671103026Ssobomax } 672103026Ssobomax sc->g_src = aifr->ifra_addr.sin_addr; 673103026Ssobomax sc->g_dst = aifr->ifra_dstaddr.sin_addr; 674103026Ssobomax goto recompute; 675103026Ssobomax case SIOCSLIFPHYADDR: 676164033Srwatson /* 677171056Srwatson * XXXRW: Isn't this priv_check() redundant to the ifnet 678171056Srwatson * layer check? 679164033Srwatson */ 680164033Srwatson if ((error = priv_check(curthread, PRIV_NET_SETIFPHYS)) != 0) 681103026Ssobomax break; 682103026Ssobomax if (lifr->addr.ss_family != AF_INET || 683103026Ssobomax lifr->dstaddr.ss_family != AF_INET) { 684103026Ssobomax error = EAFNOSUPPORT; 685103026Ssobomax break; 686103026Ssobomax } 687103026Ssobomax if (lifr->addr.ss_len != sizeof(si) || 688103026Ssobomax lifr->dstaddr.ss_len != sizeof(si)) { 689103026Ssobomax error = EINVAL; 690103026Ssobomax break; 691103026Ssobomax } 692155440Sqingli sc->g_src = (satosin(&lifr->addr))->sin_addr; 693103026Ssobomax sc->g_dst = 694155440Sqingli (satosin(&lifr->dstaddr))->sin_addr; 695103026Ssobomax goto recompute; 696103026Ssobomax case SIOCDIFPHYADDR: 697164033Srwatson /* 698171056Srwatson * XXXRW: Isn't this priv_check() redundant to the ifnet 699171056Srwatson * layer check? 700164033Srwatson */ 701164033Srwatson if ((error = priv_check(curthread, PRIV_NET_SETIFPHYS)) != 0) 702103026Ssobomax break; 703103026Ssobomax sc->g_src.s_addr = INADDR_ANY; 704103026Ssobomax sc->g_dst.s_addr = INADDR_ANY; 705103026Ssobomax goto recompute; 706103026Ssobomax case SIOCGLIFPHYADDR: 707103026Ssobomax if (sc->g_src.s_addr == INADDR_ANY || 708103026Ssobomax sc->g_dst.s_addr == INADDR_ANY) { 709103026Ssobomax error = EADDRNOTAVAIL; 710103026Ssobomax break; 711103026Ssobomax } 712103026Ssobomax memset(&si, 0, sizeof(si)); 713103026Ssobomax si.sin_family = AF_INET; 714103026Ssobomax si.sin_len = sizeof(struct sockaddr_in); 715103026Ssobomax si.sin_addr.s_addr = sc->g_src.s_addr; 716103026Ssobomax memcpy(&lifr->addr, &si, sizeof(si)); 717103026Ssobomax si.sin_addr.s_addr = sc->g_dst.s_addr; 718103026Ssobomax memcpy(&lifr->dstaddr, &si, sizeof(si)); 719103026Ssobomax break; 720103026Ssobomax case SIOCGIFPSRCADDR: 721122699Sbms#ifdef INET6 722122699Sbms case SIOCGIFPSRCADDR_IN6: 723122699Sbms#endif 724103026Ssobomax if (sc->g_src.s_addr == INADDR_ANY) { 725103026Ssobomax error = EADDRNOTAVAIL; 726103026Ssobomax break; 727103026Ssobomax } 728103026Ssobomax memset(&si, 0, sizeof(si)); 729103026Ssobomax si.sin_family = AF_INET; 730103026Ssobomax si.sin_len = sizeof(struct sockaddr_in); 731103026Ssobomax si.sin_addr.s_addr = sc->g_src.s_addr; 732103026Ssobomax bcopy(&si, &ifr->ifr_addr, sizeof(ifr->ifr_addr)); 733103026Ssobomax break; 734103026Ssobomax case SIOCGIFPDSTADDR: 735122699Sbms#ifdef INET6 736122699Sbms case SIOCGIFPDSTADDR_IN6: 737122699Sbms#endif 738103026Ssobomax if (sc->g_dst.s_addr == INADDR_ANY) { 739103026Ssobomax error = EADDRNOTAVAIL; 740103026Ssobomax break; 741103026Ssobomax } 742103026Ssobomax memset(&si, 0, sizeof(si)); 743103026Ssobomax si.sin_family = AF_INET; 744103026Ssobomax si.sin_len = sizeof(struct sockaddr_in); 745103026Ssobomax si.sin_addr.s_addr = sc->g_dst.s_addr; 746103026Ssobomax bcopy(&si, &ifr->ifr_addr, sizeof(ifr->ifr_addr)); 747103026Ssobomax break; 748179894Sthompsa case GRESKEY: 749179894Sthompsa error = priv_check(curthread, PRIV_NET_GRE); 750179894Sthompsa if (error) 751179894Sthompsa break; 752179894Sthompsa error = copyin(ifr->ifr_data, &key, sizeof(key)); 753179894Sthompsa if (error) 754179894Sthompsa break; 755179894Sthompsa /* adjust MTU for option header */ 756179894Sthompsa if (key == 0 && sc->key != 0) /* clear */ 757179894Sthompsa adj += sizeof(key); 758179894Sthompsa else if (key != 0 && sc->key == 0) /* set */ 759179894Sthompsa adj -= sizeof(key); 760179894Sthompsa 761179894Sthompsa if (ifp->if_mtu + adj < 576) { 762179894Sthompsa error = EINVAL; 763179894Sthompsa break; 764179894Sthompsa } 765179894Sthompsa ifp->if_mtu += adj; 766179894Sthompsa sc->key = key; 767179894Sthompsa break; 768179894Sthompsa case GREGKEY: 769179894Sthompsa error = copyout(&sc->key, ifr->ifr_data, sizeof(sc->key)); 770179894Sthompsa break; 771179894Sthompsa 772103026Ssobomax default: 773103026Ssobomax error = EINVAL; 774103026Ssobomax break; 775103026Ssobomax } 776103026Ssobomax 777103026Ssobomax splx(s); 778103026Ssobomax return (error); 779103026Ssobomax} 780103026Ssobomax 781103026Ssobomax/* 782103026Ssobomax * computes a route to our destination that is not the one 783103026Ssobomax * which would be taken by ip_output(), as this one will loop back to 784103026Ssobomax * us. If the interface is p2p as a--->b, then a routing entry exists 785103026Ssobomax * If we now send a packet to b (e.g. ping b), this will come down here 786123992Ssobomax * gets src=a, dst=b tacked on and would from ip_output() sent back to 787103026Ssobomax * if_gre. 788103026Ssobomax * Goal here is to compute a route to b that is less specific than 789103026Ssobomax * a-->b. We know that this one exists as in normal operation we have 790103026Ssobomax * at least a default route which matches. 791103026Ssobomax */ 792103032Ssobomaxstatic int 793103026Ssobomaxgre_compute_route(struct gre_softc *sc) 794103026Ssobomax{ 795103026Ssobomax struct route *ro; 796103026Ssobomax 797103026Ssobomax ro = &sc->route; 798103026Ssobomax 799103026Ssobomax memset(ro, 0, sizeof(struct route)); 800103026Ssobomax ((struct sockaddr_in *)&ro->ro_dst)->sin_addr = sc->g_dst; 801103026Ssobomax ro->ro_dst.sa_family = AF_INET; 802103026Ssobomax ro->ro_dst.sa_len = sizeof(ro->ro_dst); 803103026Ssobomax 804103026Ssobomax /* 805103026Ssobomax * toggle last bit, so our interface is not found, but a less 806103026Ssobomax * specific route. I'd rather like to specify a shorter mask, 807103026Ssobomax * but this is not possible. Should work though. XXX 808178888Sjulian * XXX MRT Use a different FIB for the tunnel to solve this problem. 809103026Ssobomax */ 810147256Sbrooks if ((GRE2IFP(sc)->if_flags & IFF_LINK1) == 0) { 811177416Sjulian ((struct sockaddr_in *)&ro->ro_dst)->sin_addr.s_addr ^= 812177416Sjulian htonl(0x01); 813103026Ssobomax } 814103026Ssobomax 815103026Ssobomax#ifdef DIAGNOSTIC 816147256Sbrooks printf("%s: searching for a route to %s", if_name(GRE2IFP(sc)), 817103026Ssobomax inet_ntoa(((struct sockaddr_in *)&ro->ro_dst)->sin_addr)); 818103026Ssobomax#endif 819103026Ssobomax 820178888Sjulian rtalloc_fib(ro, sc->gre_fibnum); 821103026Ssobomax 822103026Ssobomax /* 823103026Ssobomax * check if this returned a route at all and this route is no 824103026Ssobomax * recursion to ourself 825103026Ssobomax */ 826103026Ssobomax if (ro->ro_rt == NULL || ro->ro_rt->rt_ifp->if_softc == sc) { 827103026Ssobomax#ifdef DIAGNOSTIC 828103026Ssobomax if (ro->ro_rt == NULL) 829103026Ssobomax printf(" - no route found!\n"); 830103026Ssobomax else 831103026Ssobomax printf(" - route loops back to ourself!\n"); 832103026Ssobomax#endif 833103026Ssobomax return EADDRNOTAVAIL; 834103026Ssobomax } 835103026Ssobomax 836103026Ssobomax /* 837103026Ssobomax * now change it back - else ip_output will just drop 838103026Ssobomax * the route and search one to this interface ... 839103026Ssobomax */ 840147256Sbrooks if ((GRE2IFP(sc)->if_flags & IFF_LINK1) == 0) 841103026Ssobomax ((struct sockaddr_in *)&ro->ro_dst)->sin_addr = sc->g_dst; 842103026Ssobomax 843103026Ssobomax#ifdef DIAGNOSTIC 844103026Ssobomax printf(", choosing %s with gateway %s", if_name(ro->ro_rt->rt_ifp), 845103026Ssobomax inet_ntoa(((struct sockaddr_in *)(ro->ro_rt->rt_gateway))->sin_addr)); 846103026Ssobomax printf("\n"); 847103026Ssobomax#endif 848103026Ssobomax 849103026Ssobomax return 0; 850103026Ssobomax} 851103026Ssobomax 852103026Ssobomax/* 853103026Ssobomax * do a checksum of a buffer - much like in_cksum, which operates on 854103026Ssobomax * mbufs. 855103026Ssobomax */ 856123992Ssobomaxu_int16_t 857123992Ssobomaxgre_in_cksum(u_int16_t *p, u_int len) 858103026Ssobomax{ 859123992Ssobomax u_int32_t sum = 0; 860103026Ssobomax int nwords = len >> 1; 861103026Ssobomax 862103026Ssobomax while (nwords-- != 0) 863103026Ssobomax sum += *p++; 864103026Ssobomax 865103026Ssobomax if (len & 1) { 866103026Ssobomax union { 867103026Ssobomax u_short w; 868103026Ssobomax u_char c[2]; 869103026Ssobomax } u; 870103026Ssobomax u.c[0] = *(u_char *)p; 871103026Ssobomax u.c[1] = 0; 872103026Ssobomax sum += u.w; 873103026Ssobomax } 874103026Ssobomax 875103026Ssobomax /* end-around-carry */ 876103026Ssobomax sum = (sum >> 16) + (sum & 0xffff); 877103026Ssobomax sum += (sum >> 16); 878103026Ssobomax return (~sum); 879103026Ssobomax} 880103026Ssobomax 881103026Ssobomaxstatic int 882103026Ssobomaxgremodevent(module_t mod, int type, void *data) 883103026Ssobomax{ 884103026Ssobomax 885103026Ssobomax switch (type) { 886103026Ssobomax case MOD_LOAD: 887103026Ssobomax greattach(); 888103026Ssobomax break; 889103026Ssobomax case MOD_UNLOAD: 890103026Ssobomax if_clone_detach(&gre_cloner); 891127307Srwatson mtx_destroy(&gre_mtx); 892103026Ssobomax break; 893132199Sphk default: 894132199Sphk return EOPNOTSUPP; 895103026Ssobomax } 896103026Ssobomax return 0; 897103026Ssobomax} 898103026Ssobomax 899103026Ssobomaxstatic moduledata_t gre_mod = { 900103026Ssobomax "if_gre", 901103026Ssobomax gremodevent, 902103026Ssobomax 0 903103026Ssobomax}; 904103026Ssobomax 905103026SsobomaxDECLARE_MODULE(if_gre, gre_mod, SI_SUB_PSEUDO, SI_ORDER_ANY); 906103026SsobomaxMODULE_VERSION(if_gre, 1); 907