2 * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * 3. Neither the name of the project nor the names of its contributors
14 * may be used to endorse or promote products derived from this software
15 * without specific prior written permission.
17 * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * $FreeBSD: src/sys/net/if_gif.c,v 1.4.2.15 2002/11/08 16:57:13 ume Exp $
30 * $DragonFly: src/sys/net/gif/if_gif.c,v 1.21 2008/05/14 11:59:23 sephe Exp $
31 * $KAME: if_gif.c,v 1.87 2001/10/19 08:50:27 itojun Exp $
35 #include "opt_inet6.h"
37 #include <sys/param.h>
38 #include <sys/systm.h>
39 #include <sys/kernel.h>
41 #include <sys/malloc.h>
43 #include <sys/socket.h>
44 #include <sys/sockio.h>
45 #include <sys/errno.h>
47 #include <sys/sysctl.h>
48 #include <sys/syslog.h>
49 #include <sys/protosw.h>
51 #include <sys/thread2.h>
53 #include <machine/cpu.h>
56 #include <net/if_types.h>
57 #include <net/netisr.h>
58 #include <net/route.h>
60 #include <net/if_clone.h>
62 #include <netinet/in.h>
63 #include <netinet/in_systm.h>
64 #include <netinet/ip.h>
66 #include <netinet/in_var.h>
67 #include <netinet/in_gif.h>
68 #include <netinet/ip_var.h>
73 #include <netinet/in.h>
75 #include <netinet6/in6_var.h>
76 #include <netinet/ip6.h>
77 #include <netinet6/ip6_var.h>
78 #include <netinet6/in6_gif.h>
79 #include <netinet6/ip6protosw.h>
82 #include <netinet/ip_encap.h>
85 #include <net/net_osdep.h>
/*
 * M_GIF is the malloc type handed to kmalloc() when a gif softc is
 * allocated in gif_clone_create(); gif_softc_list links every softc that
 * gif_clone_create() inserts and gif_clone_destroy() removes.
 */
89 static MALLOC_DEFINE(M_GIF, "gif", "Generic Tunnel Interface");
90 LIST_HEAD(, gif_softc) gif_softc_list;
/*
 * Clone create/destroy handlers and the cloner object that registers
 * them under the interface name gif.
 * NOTE(review): the trailing 0 / IF_MAXUNIT arguments look like the unit
 * range accepted by the cloner -- confirm against IF_CLONE_INITIALIZER.
 */
92 int gif_clone_create (struct if_clone *, int, caddr_t);
93 void gif_clone_destroy (struct ifnet *);
95 struct if_clone gif_cloner = IF_CLONE_INITIALIZER("gif", gif_clone_create,
96 gif_clone_destroy, 0, IF_MAXUNIT);
/* File-local helpers: the module event handler and the route cache flush. */
98 static int gifmodevent (module_t, int, void *);
99 static void gif_clear_cache(struct gif_softc *sc);
/*
 * Declare the _net_link sysctl parent and create the read-write gif node
 * beneath it, using IFT_GIF as the node number.  The max_nesting and
 * parallel_tunnels knobs in this file hang off this node.
 */
101 SYSCTL_DECL(_net_link);
102 SYSCTL_NODE(_net_link, IFT_GIF, gif, CTLFLAG_RW, 0,
103 "Generic Tunnel Interface");
/*
 * Nesting limit for gif output.  max_gif_nesting starts at MAX_GIF_NEST
 * and is exported read-write as the max_nesting sysctl; it is the bound
 * that gif_output_serialized() compares its recursion counter against.
 * NOTE(review): the original comment says MAX_GIF_NEST can be overridden
 * from the kernel configuration; any guard around the #define is not
 * visible in this listing.
 */
106 * This macro controls the default upper limitation on nesting of gif tunnels.
107 * Since, setting a large value to this macro with a careless configuration
108 * may introduce system crash, we don't allow any nestings by default.
109 * If you need to configure nested gif tunnels, you can define this macro
110 * in your kernel configuration file. However, if you do so, please be
111 * careful to configure the tunnels so that it won't make a loop.
113 #define MAX_GIF_NEST 1
115 static int max_gif_nesting = MAX_GIF_NEST;
116 SYSCTL_INT(_net_link_gif, OID_AUTO, max_nesting, CTLFLAG_RW,
117 &max_gif_nesting, 0, "Max nested tunnels");
/*
 * Flag consulted by gif_set_tunnel(): when it is zero, a tunnel whose
 * outer source and destination both match an existing gif is rejected.
 * NOTE(review): two definitions with different initial values appear
 * below.  Presumably they sat in alternative branches of a preprocessor
 * conditional whose directive lines (listing lines 124, 126 and 128) are
 * absent here -- confirm against the complete file.
 */
120 * By default, we disallow creation of multiple tunnels between the same
121 * pair of addresses. Some applications require this functionality so
122 * we allow control over this check here.
125 static int parallel_tunnels = 1;
127 static int parallel_tunnels = 0;
/*
 * Export the parallel_tunnels flag as a read-write integer sysctl under
 * the _net_link_gif node.  The variable is passed by address, in the same
 * form as the max_nesting entry above (&max_gif_nesting).
 */
129 SYSCTL_INT(_net_link_gif, OID_AUTO, parallel_tunnels, CTLFLAG_RW,
130 &parallel_tunnels, 0, "Allow parallel tunnels?");
/*
 * Cloner create handler: build a new gif interface for the given unit.
 *
 * Allocates a zero-filled softc (M_WAITOK | M_ZERO) from M_GIF, points the
 * embedded ifnet back at the softc, names the interface GIFNAME<unit> and
 * links the softc at the head of gif_softc_list.
 * NOTE(review): the statements between if_initname() and the list insert,
 * and the return statement, are not visible in this listing; ifc and
 * params are not referenced by any visible line.
 */
133 gif_clone_create(struct if_clone *ifc, int unit, caddr_t params)
135 struct gif_softc *sc;
137 sc = kmalloc (sizeof(struct gif_softc), M_GIF, M_WAITOK | M_ZERO);
/* if_softc back pointer: gif_clone_destroy() recovers sc through it. */
139 sc->gif_if.if_softc = sc;
140 if_initname(&(sc->gif_if), GIFNAME, unit);
144 LIST_INSERT_HEAD(&gif_softc_list, sc, gif_list);
/*
 * Initialise the ifnet embedded in sc and attach it to the system.
 *
 * Clears both encap cookies, sets a zero-length link address, the default
 * MTU (GIF_MTU) and the point-to-point/multicast flags, installs the
 * ioctl and output handlers, then calls if_attach() and bpfattach().
 */
149 gifattach0(struct gif_softc *sc)
/* No encapsulation handlers are registered until a tunnel is configured. */
152 sc->encap_cookie4 = sc->encap_cookie6 = NULL;
154 sc->gif_if.if_addrlen = 0;
155 sc->gif_if.if_mtu = GIF_MTU;
156 sc->gif_if.if_flags = IFF_POINTOPOINT | IFF_MULTICAST;
/*
 * NOTE(review): whether the IFF_LINK2 assignment below is compiled
 * unconditionally cannot be told from this listing (lines 157 and 160
 * are absent).
 */
158 /* turn off ingress filter */
159 sc->gif_if.if_flags |= IFF_LINK2;
161 sc->gif_if.if_ioctl = gif_ioctl;
162 sc->gif_if.if_output = gif_output;
163 sc->gif_if.if_type = IFT_GIF;
164 sc->gif_if.if_snd.ifq_maxlen = IFQ_MAXLEN;
165 if_attach(&sc->gif_if, NULL);
/*
 * BPF sees DLT_NULL frames with a sizeof(u_int) header; the tap calls in
 * gif_output_serialized() and gif_input() prepend an address family value.
 */
166 bpfattach(&sc->gif_if, DLT_NULL, sizeof(u_int));
/*
 * Cloner destroy handler: tear down the gif interface behind ifp.
 *
 * Deletes the configured tunnel, unlinks the softc from gif_softc_list and
 * detaches whichever encap cookies are still registered, asserting that
 * each detach succeeds.
 * NOTE(review): the declaration of err and everything after the cookie
 * handling (interface detach, freeing the softc) is not visible in this
 * listing.
 */
170 gif_clone_destroy(struct ifnet *ifp)
172 struct gif_softc *sc = ifp->if_softc;
175 gif_delete_tunnel(&sc->gif_if);
176 LIST_REMOVE(sc, gif_list);
/* IPv6 encapsulation handler, if one is registered. */
178 if (sc->encap_cookie6 != NULL) {
179 err = encap_detach(sc->encap_cookie6);
180 KASSERT(err == 0, ("Unexpected error detaching encap_cookie6"));
/* IPv4 encapsulation handler, if one is registered. */
184 if (sc->encap_cookie4 != NULL) {
185 err = encap_detach(sc->encap_cookie4);
186 KASSERT(err == 0, ("Unexpected error detaching encap_cookie4"));
/*
 * Drop every cached route held by sc.
 *
 * Walks the gif_ro[] and gif_ro6[] arrays for indices 0 .. ncpus-1; each
 * non-NULL ro_rt is released with RTFREE() and the pointer is reset to
 * NULL so the slot is not released twice.
 * NOTE(review): the declaration of n and any conditional compilation
 * around the two halves of the loop body are not visible in this listing.
 */
198 gif_clear_cache(struct gif_softc *sc)
202 for (n = 0; n < ncpus; ++n) {
203 if (sc->gif_ro[n].ro_rt) {
204 RTFREE(sc->gif_ro[n].ro_rt);
205 sc->gif_ro[n].ro_rt = NULL;
207 if (sc->gif_ro6[n].ro_rt) {
208 RTFREE(sc->gif_ro6[n].ro_rt);
209 sc->gif_ro6[n].ro_rt = NULL;
/*
 * Module event handler registered through gif_mod.
 *
 * NOTE(review): the switch on type and its case labels are not visible in
 * this listing.  The first group of statements looks like the load path
 * and the second like the unload path -- confirm against the full file.
 */
215 gifmodevent(module_t mod, int type, void *data)
/* Start with an empty softc list, then make the gif cloner available. */
220 LIST_INIT(&gif_softc_list);
221 if_clone_attach(&gif_cloner);
224 ip6_gif_hlim = GIF_HLIM;
/* Stop new clones first, then destroy every interface still on the list. */
229 if_clone_detach(&gif_cloner);
231 while (!LIST_EMPTY(&gif_softc_list))
232 gif_clone_destroy(&LIST_FIRST(&gif_softc_list)->gif_if);
/*
 * Module descriptor and its registration as if_gif at SI_SUB_PSEUDO with
 * SI_ORDER_ANY.
 * NOTE(review): the initializer fields of gif_mod are not visible in this
 * listing; presumably they name the module and point at gifmodevent().
 */
242 static moduledata_t gif_mod = {
248 DECLARE_MODULE(if_gif, gif_mod, SI_SUB_PSEUDO, SI_ORDER_ANY);
/*
 * Decide whether packet m belongs to the gif interface passed in arg.
 *
 * arg is the gif softc.  The visible checks require the interface to be
 * up and both outer endpoints to be configured, then hand over to
 * gif_encapcheck4() or gif_encapcheck6() after confirming that the packet
 * is long enough and that both configured endpoints use the matching
 * address family.
 * NOTE(review): the value returned on each rejection, the test on proto
 * and the switch that selects the IPv4 or IPv6 branch are not visible in
 * this listing.
 */
251 gif_encapcheck(const struct mbuf *m, int off, int proto, void *arg)
254 struct gif_softc *sc;
256 sc = (struct gif_softc *)arg;
260 if ((sc->gif_if.if_flags & IFF_UP) == 0)
263 /* no physical address */
264 if (!sc->gif_psrc || !sc->gif_pdst)
280 /* Bail on short packets */
281 if (m->m_pkthdr.len < sizeof(ip))
/* Copy the leading header bytes out of the mbuf chain into the local ip. */
284 m_copydata(m, 0, sizeof(ip), (caddr_t)&ip);
/* IPv4 outer header: both configured endpoints must be AF_INET. */
289 if (sc->gif_psrc->sa_family != AF_INET ||
290 sc->gif_pdst->sa_family != AF_INET)
292 return gif_encapcheck4(m, off, proto, arg);
/* IPv6 outer header: needs a full ip6_hdr and AF_INET6 endpoints. */
296 if (m->m_pkthdr.len < sizeof(struct ip6_hdr))
298 if (sc->gif_psrc->sa_family != AF_INET6 ||
299 sc->gif_pdst->sa_family != AF_INET6)
301 return gif_encapcheck6(m, off, proto, arg);
/*
 * Encapsulate and transmit m on gif interface ifp; gif_output() calls
 * this between ifnet_serialize_tx() and ifnet_deserialize_tx().
 *
 * Visible steps: bump the recursion counter and fail with EIO once it
 * exceeds max_gif_nesting; clear the broadcast/multicast mbuf flags;
 * check that the interface is up and both outer endpoints are set; tap
 * the packet to BPF with the inner address family prepended; account the
 * bytes in if_obytes; dispatch to in_gif_output() or in6_gif_output()
 * according to the outer source family; reset the counter to 0 on the
 * way out.
 * NOTE(review): the fourth parameter, the declaration of error, the
 * failure paths and the return statement are not visible in this listing.
 */
313 gif_output_serialized(struct ifnet *ifp, struct mbuf *m, struct sockaddr *dst,
/* NOTE(review): the cast presumes the ifnet is the first member of the softc. */
316 struct gif_softc *sc = (struct gif_softc*)ifp;
/* Shared by every gif interface and every caller; no locking is visible. */
318 static int called = 0; /* XXX: MUTEX */
321 * gif may cause infinite recursion calls when misconfigured.
322 * We'll prevent this by introducing upper limit.
323 * XXX: this mechanism may introduce another problem about
324 * mutual exclusion of the variable CALLED, especially if we
327 if (++called > max_gif_nesting) {
329 "gif_output: recursively called too many times(%d)\n",
332 error = EIO; /* is there better errno? */
336 m->m_flags &= ~(M_BCAST|M_MCAST);
337 if (!(ifp->if_flags & IFF_UP) ||
338 sc->gif_psrc == NULL || sc->gif_pdst == NULL) {
346 * We need to prepend the address family as
349 uint32_t af = dst->sa_family;
351 bpf_ptap(ifp->if_bpf, m, &af, sizeof(af));
354 ifp->if_obytes += m->m_pkthdr.len;
356 /* inner AF-specific encapsulation */
358 /* XXX should we check if our outer source is legal? */
360 /* dispatch to output logic based on outer AF */
361 switch (sc->gif_psrc->sa_family) {
364 error = in_gif_output(ifp, dst->sa_family, m);
369 error = in6_gif_output(ifp, dst->sa_family, m);
379 called = 0; /* reset recursion counter */
/*
 * if_output handler installed by gifattach0().
 *
 * Takes the interface transmit serializer, runs gif_output_serialized()
 * with the same arguments and releases the serializer again.
 * NOTE(review): the fourth parameter (used as rt below), the declaration
 * of error and the return statement are not visible in this listing.
 */
386 gif_output(struct ifnet *ifp, struct mbuf *m, struct sockaddr *dst,
391 ifnet_serialize_tx(ifp);
392 error = gif_output_serialized(ifp, m, dst, rt);
393 ifnet_deserialize_tx(ifp);
/*
 * Deliver a decapsulated packet m of address family af as input on ifp.
 *
 * Visible steps: record ifp as the receive interface, tap the packet to
 * BPF with an address family value prepended, add the packet length to
 * if_ibytes, clear M_HASH and queue the mbuf on network ISR isr.
 * NOTE(review): the declarations of isr and af1 and the code that maps af
 * to isr are not visible in this listing.
 */
398 gif_input(struct mbuf *m, int af, struct ifnet *ifp)
408 m->m_pkthdr.rcvif = ifp;
412 * We need to prepend the address family as
417 bpf_ptap(ifp->if_bpf, m, &af1, sizeof(af1));
421 * Put the packet to the network layer input queue according to the
422 * specified address family.
423 * Note: older versions of gif_input directly called network layer
424 * input functions, e.g. ip6_input, here. We changed the policy to
425 * prevent too many recursive calls of such input functions, which
426 * might cause kernel panic. But the change may introduce another
427 * problem; if the input queue is full, packets are discarded.
428 * The kernel stack overflow really happened, and we believed
429 * queue-full rarely occurs, so we changed the policy.
448 ifp->if_ibytes += m->m_pkthdr.len;
/* Clear M_HASH before the packet is queued again. */
449 m->m_flags &= ~M_HASH;
450 netisr_queue(isr, m);
/*
 * if_ioctl handler installed by gifattach0().
 *
 * The visible request groups are: an MTU range check against GIF_MTU_MIN
 * and GIF_MTU_MAX; setting the outer tunnel endpoints (SIOCSIFPHYADDR_IN6,
 * SIOCSLIFPHYADDR and a further request whose label is not visible, read
 * from a struct in_aliasreq); deleting the tunnel; and reading the outer
 * source address, the outer destination address, or both back into the
 * request structure.
 * NOTE(review): most case labels, break statements, the declarations of
 * error, size and mtu, and the values assigned on failed checks are not
 * visible in this listing.
 */
455 /* XXX how should we handle IPv6 scope on SIOC[GS]IFPHYADDR? */
457 gif_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data, struct ucred *cr)
459 struct gif_softc *sc = (struct gif_softc*)ifp;
460 struct ifreq *ifr = (struct ifreq*)data;
462 struct sockaddr *dst, *src;
463 #ifdef SIOCSIFMTU /* xxx */
/* NOTE(review): the case label guarding this assignment is not visible. */
469 ifp->if_flags |= IFF_UP;
479 #ifdef SIOCSIFMTU /* xxx */
485 if (mtu < GIF_MTU_MIN || mtu > GIF_MTU_MAX)
489 #endif /* SIOCSIFMTU */
/*
 * Set the outer endpoints.  First pick src and dst out of the request
 * structure that matches the command, then validate them.
 */
495 case SIOCSIFPHYADDR_IN6:
497 case SIOCSLIFPHYADDR:
/* Request laid out as struct in_aliasreq. */
501 src = (struct sockaddr *)
502 &(((struct in_aliasreq *)data)->ifra_addr);
503 dst = (struct sockaddr *)
504 &(((struct in_aliasreq *)data)->ifra_dstaddr);
/* Request laid out as struct in6_aliasreq. */
508 case SIOCSIFPHYADDR_IN6:
509 src = (struct sockaddr *)
510 &(((struct in6_aliasreq *)data)->ifra_addr);
511 dst = (struct sockaddr *)
512 &(((struct in6_aliasreq *)data)->ifra_dstaddr);
/* Request laid out as struct if_laddrreq. */
515 case SIOCSLIFPHYADDR:
516 src = (struct sockaddr *)
517 &(((struct if_laddrreq *)data)->addr);
518 dst = (struct sockaddr *)
519 &(((struct if_laddrreq *)data)->dstaddr);
525 /* sa_family must be equal */
526 if (src->sa_family != dst->sa_family)
529 /* validate sa_len */
530 switch (src->sa_family) {
533 if (src->sa_len != sizeof(struct sockaddr_in))
539 if (src->sa_len != sizeof(struct sockaddr_in6))
/* The same length validation, applied to the destination address. */
546 switch (dst->sa_family) {
549 if (dst->sa_len != sizeof(struct sockaddr_in))
555 if (dst->sa_len != sizeof(struct sockaddr_in6))
563 /* check sa_family looks sane for the cmd */
566 if (src->sa_family == AF_INET)
570 case SIOCSIFPHYADDR_IN6:
571 if (src->sa_family == AF_INET6)
575 case SIOCSLIFPHYADDR:
576 /* checks done in the above */
/* Hand the endpoints to gif_set_tunnel(), which installs them. */
580 error = gif_set_tunnel(&sc->gif_if, src, dst);
583 #ifdef SIOCDIFPHYADDR
585 gif_delete_tunnel(&sc->gif_if);
/*
 * Read back the outer source address.  The sa_len > size test guards the
 * bcopy into the request field; the action taken when it fails is not
 * visible in this listing.
 */
589 case SIOCGIFPSRCADDR:
591 case SIOCGIFPSRCADDR_IN6:
593 if (sc->gif_psrc == NULL) {
594 error = EADDRNOTAVAIL;
600 case SIOCGIFPSRCADDR:
601 dst = &ifr->ifr_addr;
602 size = sizeof(ifr->ifr_addr);
606 case SIOCGIFPSRCADDR_IN6:
607 dst = (struct sockaddr *)
608 &(((struct in6_ifreq *)data)->ifr_addr);
609 size = sizeof(((struct in6_ifreq *)data)->ifr_addr);
613 error = EADDRNOTAVAIL;
616 if (src->sa_len > size)
618 bcopy((caddr_t)src, (caddr_t)dst, src->sa_len);
/* Read back the outer destination address; same shape as the source case. */
621 case SIOCGIFPDSTADDR:
623 case SIOCGIFPDSTADDR_IN6:
625 if (sc->gif_pdst == NULL) {
626 error = EADDRNOTAVAIL;
632 case SIOCGIFPDSTADDR:
633 dst = &ifr->ifr_addr;
634 size = sizeof(ifr->ifr_addr);
638 case SIOCGIFPDSTADDR_IN6:
639 dst = (struct sockaddr *)
640 &(((struct in6_ifreq *)data)->ifr_addr);
641 size = sizeof(((struct in6_ifreq *)data)->ifr_addr);
645 error = EADDRNOTAVAIL;
648 if (src->sa_len > size)
650 bcopy((caddr_t)src, (caddr_t)dst, src->sa_len);
/*
 * Read back both endpoints into a struct if_laddrreq; both must be
 * configured.  The first copy fills addr and the second fills dstaddr.
 */
653 case SIOCGLIFPHYADDR:
654 if (sc->gif_psrc == NULL || sc->gif_pdst == NULL) {
655 error = EADDRNOTAVAIL;
661 dst = (struct sockaddr *)
662 &(((struct if_laddrreq *)data)->addr);
663 size = sizeof(((struct if_laddrreq *)data)->addr);
664 if (src->sa_len > size)
666 bcopy((caddr_t)src, (caddr_t)dst, src->sa_len);
670 dst = (struct sockaddr *)
671 &(((struct if_laddrreq *)data)->dstaddr);
672 size = sizeof(((struct if_laddrreq *)data)->dstaddr);
673 if (src->sa_len > size)
675 bcopy((caddr_t)src, (caddr_t)dst, src->sa_len);
679 /* if_ioctl() takes care of it */
/*
 * Install src and dst as the outer (physical) endpoints of gif ifp.
 *
 * Visible steps: scan gif_softc_list for another configured tunnel with
 * the same endpoint pair and fail with EADDRNOTAVAIL when one exists and
 * parallel_tunnels is zero; store kmalloc copies of src and dst
 * (M_IFADDR, M_WAITOK); attach the encapsulation handler that matches the
 * outer address family; free the new copies when the attach fails and the
 * previous addresses otherwise; finally set IFF_RUNNING only when both
 * endpoints are present.
 * NOTE(review): the declaration of error, the assignments to osrc, odst,
 * sc->gif_psrc and sc->gif_pdst, the case labels, the jump labels and the
 * return statements are not visible in this listing.
 */
691 gif_set_tunnel(struct ifnet *ifp, struct sockaddr *src, struct sockaddr *dst)
693 struct gif_softc *sc = (struct gif_softc *)ifp;
694 struct gif_softc *sc2;
695 struct sockaddr *osrc, *odst, *sa;
700 LIST_FOREACH(sc2, &gif_softc_list, gif_list) {
/* Entries lacking an endpoint cannot conflict. */
703 if (!sc2->gif_pdst || !sc2->gif_psrc)
/* Neither can entries whose family or length differs from the request. */
705 if (sc2->gif_pdst->sa_family != dst->sa_family ||
706 sc2->gif_pdst->sa_len != dst->sa_len ||
707 sc2->gif_psrc->sa_family != src->sa_family ||
708 sc2->gif_psrc->sa_len != src->sa_len)
712 * Disallow parallel tunnels unless instructed
715 if (!parallel_tunnels &&
716 bcmp(sc2->gif_pdst, dst, dst->sa_len) == 0 &&
717 bcmp(sc2->gif_psrc, src, src->sa_len) == 0) {
718 error = EADDRNOTAVAIL;
722 /* XXX both end must be valid? (I mean, not 0.0.0.0) */
725 /* XXX we can detach from both, but be polite just in case */
727 switch (sc->gif_psrc->sa_family) {
/* Private copies of the caller addresses; M_WAITOK allocations may sleep. */
743 sa = (struct sockaddr *)kmalloc(src->sa_len, M_IFADDR, M_WAITOK);
744 bcopy((caddr_t)src, (caddr_t)sa, src->sa_len);
748 sa = (struct sockaddr *)kmalloc(dst->sa_len, M_IFADDR, M_WAITOK);
749 bcopy((caddr_t)dst, (caddr_t)sa, dst->sa_len);
/* Register the encapsulation handler for the new outer family. */
752 switch (sc->gif_psrc->sa_family) {
755 error = in_gif_attach(sc);
760 error = in6_gif_attach(sc);
/* Attach failed: release the copies that were just made. */
766 kfree((caddr_t)sc->gif_psrc, M_IFADDR);
767 kfree((caddr_t)sc->gif_pdst, M_IFADDR);
/* Attach succeeded: the previous addresses are no longer needed. */
774 kfree((caddr_t)osrc, M_IFADDR);
776 kfree((caddr_t)odst, M_IFADDR);
/*
 * The IFF_RUNNING update appears twice below.
 * NOTE(review): presumably once on the success path and once on the
 * failure path -- the labels separating them are not visible.
 */
778 if (sc->gif_psrc && sc->gif_pdst)
779 ifp->if_flags |= IFF_RUNNING;
781 ifp->if_flags &= ~IFF_RUNNING;
787 if (sc->gif_psrc && sc->gif_pdst)
788 ifp->if_flags |= IFF_RUNNING;
790 ifp->if_flags &= ~IFF_RUNNING;
/*
 * Remove the outer (physical) endpoints from gif ifp.
 *
 * Frees the stored source and destination addresses (M_IFADDR) and then
 * recomputes IFF_RUNNING from whether both endpoints are still set.
 * NOTE(review): the NULL guards around the kfree calls, the statements
 * that clear the pointers and the encap detach calls announced by the
 * comment below are not visible in this listing.
 */
797 gif_delete_tunnel(struct ifnet *ifp)
799 struct gif_softc *sc = (struct gif_softc *)ifp;
804 kfree((caddr_t)sc->gif_psrc, M_IFADDR);
808 kfree((caddr_t)sc->gif_pdst, M_IFADDR);
811 /* it is safe to detach from both */
820 if (sc->gif_psrc && sc->gif_pdst)
821 ifp->if_flags |= IFF_RUNNING;
823 ifp->if_flags &= ~IFF_RUNNING;