/* $OpenBSD: if_mpe.c,v 1.22 2010/08/25 13:57:07 claudio Exp $ */

/*
 * Copyright (c) 2008 Pierre-Yves Ritschard
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */

#include "mpe.h"

/*
 * NOTE(review): the <...> header names were missing from the copy of this
 * file that was reviewed (only bare "#include" directives remained).  They
 * have been restored to cover the symbols used below; the number and
 * grouping of directives is unchanged.  Confirm against the repository.
 */
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/mbuf.h>
#include <sys/proc.h>
#include <sys/socket.h>
#include <sys/sockio.h>
#include <sys/ioctl.h>

#include <net/if.h>
#include <net/if_types.h>
#include <net/netisr.h>
#include <net/route.h>

#ifdef INET
#include <netinet/in.h>
#include <netinet/in_var.h>
#include <netinet/in_systm.h>
#include <netinet/ip.h>
#endif

#ifdef INET6
#include <netinet/ip6.h>
#ifndef INET
#include <netinet/in.h>
#endif
#endif /* INET6 */

#include "bpfilter.h"
#if NBPFILTER > 0
#include <net/bpf.h>
#endif

#include <netmpls/mpls.h>

#ifdef MPLS_DEBUG
#define DPRINTF(x)	do { if (mpedebug) printf x ; } while (0)
#else
#define DPRINTF(x)
#endif

void	mpeattach(int);
int	mpeoutput(struct ifnet *, struct mbuf *, struct sockaddr *,
	    struct rtentry *);
int	mpeioctl(struct ifnet *, u_long, caddr_t);
void	mpestart(struct ifnet *);
int	mpe_clone_create(struct if_clone *, int);
int	mpe_clone_destroy(struct ifnet *);
int	mpe_newlabel(struct ifnet *, int, struct shim_hdr *);

/* All existing mpe interfaces; used to detect duplicate labels. */
LIST_HEAD(, mpe_softc)	mpeif_list;
struct if_clone	mpe_cloner =
    IF_CLONE_INITIALIZER("mpe", mpe_clone_create, mpe_clone_destroy);

extern int	mpls_mapttl_ip;
extern int	mpls_mapttl_ip6;

/*
 * Pseudo-device attach hook: initialise the interface list and register
 * the "mpe" cloner.  The nmpe argument is not used.
 */
void
mpeattach(int nmpe)
{
	LIST_INIT(&mpeif_list);
	if_clone_attach(&mpe_cloner);
}

/*
 * Create interface "mpe<unit>".
 *
 * Allocates a zeroed softc without sleeping, fills in the ifnet, attaches
 * it (and bpf when configured) and links the softc onto mpeif_list.
 * Returns 0 on success or ENOMEM if the softc cannot be allocated.
 */
int
mpe_clone_create(struct if_clone *ifc, int unit)
{
	struct ifnet		*ifp;
	struct mpe_softc	*mpeif;
	int			 s;

	if ((mpeif = malloc(sizeof(*mpeif), M_DEVBUF,
	    M_NOWAIT|M_ZERO)) == NULL)
		return (ENOMEM);

	/* label 0 means "no label configured yet" (see mpeioctl) */
	mpeif->sc_shim.shim_label = 0;
	mpeif->sc_unit = unit;
	ifp = &mpeif->sc_if;
	snprintf(ifp->if_xname, sizeof ifp->if_xname, "mpe%d", unit);
	ifp->if_flags = IFF_POINTOPOINT;
	ifp->if_softc = mpeif;
	ifp->if_mtu = MPE_MTU;
	ifp->if_ioctl = mpeioctl;
	ifp->if_output = mpeoutput;
	ifp->if_start = mpestart;
	ifp->if_type = IFT_MPLS;
	ifp->if_hdrlen = MPE_HDRLEN;
	IFQ_SET_MAXLEN(&ifp->if_snd, ifqmaxlen);
	IFQ_SET_READY(&ifp->if_snd);
	if_attach(ifp);
	if_alloc_sadl(ifp);
#if NBPFILTER > 0
	bpfattach(&ifp->if_bpf, ifp, DLT_NULL, sizeof(u_int32_t));
#endif

	s = splnet();
	LIST_INSERT_HEAD(&mpeif_list, mpeif, sc_list);
	splx(s);

	return (0);
}

/*
 * Destroy an mpe interface: unlink the softc from mpeif_list, detach the
 * ifnet and release the softc.  Always returns 0.
 */
int
mpe_clone_destroy(struct ifnet *ifp)
{
	struct mpe_softc	*mpeif = ifp->if_softc;
	int			 s;

	s = splnet();
	LIST_REMOVE(mpeif, sc_list);
	splx(s);

	if_detach(ifp);
	free(mpeif, M_DEVBUF);
	return (0);
}

/* Scratch destination address used by mpestart() for the route lookup. */
struct sockaddr_storage	 mpedst;

/*
 * Start output on the mpe interface.
 *
 * Drains the send queue.  Every queued packet was laid out by mpeoutput()
 * as: sa_family_t, destination address, MPLS shim, payload.  The family
 * and address are stripped and used for a route lookup; the packet (now
 * starting with the shim) is then handed to mpls_output() on the route's
 * interface.  Packets with an unsupported family or without a route are
 * dropped.
 */
void
mpestart(struct ifnet *ifp)
{
	struct mbuf		*m;
	struct sockaddr		*sa = (struct sockaddr *)&mpedst;
	int			 s;
	sa_family_t		 af;
	struct rtentry		*rt;

	for (;;) {
		s = splnet();
		IFQ_DEQUEUE(&ifp->if_snd, m);
		splx(s);

		if (m == NULL)
			return;

		/* pull off the address family written by mpeoutput() */
		af = *mtod(m, sa_family_t *);
		m_adj(m, sizeof(af));
		switch (af) {
		case AF_INET:
			bzero(sa, sizeof(struct sockaddr_in));
			satosin(sa)->sin_family = af;
			satosin(sa)->sin_len = sizeof(struct sockaddr_in);
			bcopy(mtod(m, caddr_t), &satosin(sa)->sin_addr,
			    sizeof(in_addr_t));
			m_adj(m, sizeof(in_addr_t));
			break;
		default:
			m_freem(m);
			continue;
		}

		rt = rtalloc1(sa, RT_REPORT, 0);
		if (rt == NULL) {
			/* no route give up */
			m_freem(m);
			continue;
		}

#if NBPFILTER > 0
		if (ifp->if_bpf) {
			/* remove MPLS label before passing packet to bpf */
			m->m_data += sizeof(struct shim_hdr);
			m->m_len -= sizeof(struct shim_hdr);
			m->m_pkthdr.len -= sizeof(struct shim_hdr);
			bpf_mtap_af(ifp->if_bpf, af, m, BPF_DIRECTION_OUT);
			/* put the label back for mpls_output() */
			m->m_data -= sizeof(struct shim_hdr);
			m->m_len += sizeof(struct shim_hdr);
			m->m_pkthdr.len += sizeof(struct shim_hdr);
		}
#endif
		/* XXX lie, but mpls_output will only look at sa_family */
		sa->sa_family = AF_MPLS;

		mpls_output(rt->rt_ifp, m, sa, rt);
		RTFREE(rt);
	}
}

/*
 * Output routine: label a packet and queue it for mpestart().
 *
 * Only AF_INET destinations whose route carries an MPLS push operation are
 * accepted.  The shim is built from the route's label with the
 * bottom-of-stack bit set and a TTL taken either from the IP header
 * (mpls_mapttl_ip) or from mpls_defttl.  The mbuf is then prefixed with
 * the address family, the destination address and the shim, and enqueued.
 *
 * Returns 0 on success, ENETUNREACH when the route has no push operation,
 * ENOBUFS when the header cannot be prepended, ENETDOWN for unsupported
 * address families, or the error reported by IFQ_ENQUEUE.  The mbuf is
 * consumed in every case.
 */
int
mpeoutput(struct ifnet *ifp, struct mbuf *m, struct sockaddr *dst,
    struct rtentry *rt)
{
	struct shim_hdr	shim;
	int		s;
	int		error;
	int		off;
	u_int8_t	op = 0;

#ifdef DIAGNOSTIC
	if (ifp->if_rdomain != rtable_l2(m->m_pkthdr.rdomain)) {
		printf("%s: trying to send packet on wrong domain. "
		    "if %d vs. mbuf %d\n", ifp->if_xname, ifp->if_rdomain,
		    rtable_l2(m->m_pkthdr.rdomain));
	}
#endif
	m->m_pkthdr.rcvif = ifp;
	/* XXX assumes MPLS is always in rdomain 0 */
	m->m_pkthdr.rdomain = 0;

	error = 0;
	switch (dst->sa_family) {
#ifdef INET
	case AF_INET:
		if (rt && rt->rt_flags & RTF_MPLS) {
			shim.shim_label =
			    ((struct rt_mpls *)rt->rt_llinfo)->mpls_label;
			shim.shim_label |= MPLS_BOS_MASK;
			op = ((struct rt_mpls *)rt->rt_llinfo)->mpls_operation;
		}
		/* op stays 0 without an MPLS route, so shim is never used */
		if (op != MPLS_OP_PUSH) {
			m_freem(m);
			error = ENETUNREACH;
			goto out;
		}
		if (mpls_mapttl_ip) {
			struct ip	*ip;

			ip = mtod(m, struct ip *);
			shim.shim_label |= htonl(ip->ip_ttl) & MPLS_TTL_MASK;
		} else
			shim.shim_label |= htonl(mpls_defttl) & MPLS_TTL_MASK;
		off = sizeof(sa_family_t) + sizeof(in_addr_t);
		M_PREPEND(m, sizeof(shim) + off, M_DONTWAIT);
		if (m == NULL) {
			/* m is NULL here, so there is nothing left to free */
			error = ENOBUFS;
			goto out;
		}
		*mtod(m, sa_family_t *) = AF_INET;
		m_copyback(m, sizeof(sa_family_t), sizeof(in_addr_t),
		    (caddr_t)&((satosin(dst)->sin_addr)), M_NOWAIT);
		break;
#endif
	default:
		m_freem(m);
		error = ENETDOWN;
		goto out;
	}

	/* the shim goes right after the family/address prefix */
	m_copyback(m, off, sizeof(shim), (caddr_t)&shim, M_NOWAIT);

	s = splnet();
	IFQ_ENQUEUE(&ifp->if_snd, m, NULL, error);
	if (error) {
		/* mbuf is already freed */
		splx(s);
		return (error);
	}
	if_start(ifp);
	splx(s);

out:
	if (error)
		ifp->if_oerrors++;
	return (error);
}

/*
 * Interface ioctl handler.
 *
 *  SIOCSIFADDR    bring the interface up if it is not already
 *  SIOCSIFFLAGS   make IFF_RUNNING follow IFF_UP
 *  SIOCSIFMTU     accept an MTU within [MPE_MTU_MIN, MPE_MTU_MAX]
 *  SIOCGETLABEL   copy the configured label out in host byte order
 *  SIOCSETLABEL   validate a new label, refuse one already used by another
 *                 mpe interface (EEXIST), and swap the MPLS route
 *  SIOCSIFRDOMAIN re-add the MPLS route, then return ENOTTY
 *
 * Returns 0 or an errno; ENOTTY for commands not handled here.
 */
/* ARGSUSED */
int
mpeioctl(struct ifnet *ifp, u_long cmd, caddr_t data)
{
	int			 error;
	struct mpe_softc	*ifm;
	struct ifreq		*ifr;
	struct shim_hdr		 shim;

	ifr = (struct ifreq *)data;
	error = 0;
	switch (cmd) {
	case SIOCSIFADDR:
		if (!ISSET(ifp->if_flags, IFF_UP))
			if_up(ifp);
		break;
	case SIOCSIFFLAGS:
		if (ifp->if_flags & IFF_UP)
			ifp->if_flags |= IFF_RUNNING;
		else
			ifp->if_flags &= ~IFF_RUNNING;
		break;
	case SIOCSIFMTU:
		if (ifr->ifr_mtu < MPE_MTU_MIN ||
		    ifr->ifr_mtu > MPE_MTU_MAX)
			error = EINVAL;
		else
			ifp->if_mtu = ifr->ifr_mtu;
		break;
	case SIOCGETLABEL:
		ifm = ifp->if_softc;
		/* stored shim is in network order; report the bare label */
		shim.shim_label =
		    ((ntohl(ifm->sc_shim.shim_label & MPLS_LABEL_MASK)) >>
		    MPLS_LABEL_OFFSET);
		error = copyout(&shim, ifr->ifr_data, sizeof(shim));
		break;
	case SIOCSETLABEL:
		ifm = ifp->if_softc;
		if ((error = copyin(ifr->ifr_data, &shim, sizeof(shim))))
			break;
		if (shim.shim_label > MPLS_LABEL_MAX ||
		    shim.shim_label <= MPLS_LABEL_RESERVED_MAX) {
			error = EINVAL;
			break;
		}
		/* convert to the on-wire shim representation */
		shim.shim_label = htonl(shim.shim_label << MPLS_LABEL_OFFSET);
		/* unchanged label: nothing to do */
		if (ifm->sc_shim.shim_label == shim.shim_label)
			break;
		/* ifm is reused as the list cursor here */
		LIST_FOREACH(ifm, &mpeif_list, sc_list) {
			if (ifm != ifp->if_softc &&
			    ifm->sc_shim.shim_label == shim.shim_label) {
				error = EEXIST;
				break;
			}
		}
		if (error)
			break;
		ifm = ifp->if_softc;
		if (ifm->sc_shim.shim_label) {
			/* remove old MPLS route */
			mpe_newlabel(ifp, RTM_DELETE, &ifm->sc_shim);
		}
		/* add new MPLS route */
		error = mpe_newlabel(ifp, RTM_ADD, &shim);
		if (error)
			break;
		ifm->sc_shim.shim_label = shim.shim_label;
		break;
	case SIOCSIFRDOMAIN:
		/* must readd the MPLS "route" for our label */
		ifm = ifp->if_softc;
		if (ifr->ifr_rdomainid != ifp->if_rdomain) {
			if (ifm->sc_shim.shim_label) {
				shim.shim_label = ifm->sc_shim.shim_label;
				/* result is discarded: ENOTTY is returned */
				error = mpe_newlabel(ifp, RTM_ADD, &shim);
			}
		}
		/* return with ENOTTY so that the parent handler finishes */
		return (ENOTTY);
	default:
		return (ENOTTY);
	}

	return (error);
}

/*
 * Deliver a de-labelled IPv4 packet received for this interface.
 *
 * When mpls_mapttl_ip is set, the IP header is pulled up and its checksum
 * verified, the IP TTL is replaced by the MPLS ttl, and the header
 * checksum is recomputed.  The packet is then tagged with ifp and its
 * rdomain, tapped to bpf and queued on ipintrq.  The smpls argument is not
 * used.  The mbuf is consumed.
 */
void
mpe_input(struct mbuf *m, struct ifnet *ifp, struct sockaddr_mpls *smpls,
    u_int8_t ttl)
{
	struct ip	*ip;
	int		 s, hlen;

	/* label -> AF lookup */

	if (mpls_mapttl_ip) {
		if (m->m_len < sizeof (struct ip) &&
		    (m = m_pullup(m, sizeof(struct ip))) == NULL)
			return;
		ip = mtod(m, struct ip *);
		hlen = ip->ip_hl << 2;
		if (m->m_len < hlen) {
			if ((m = m_pullup(m, hlen)) == NULL)
				return;
			ip = mtod(m, struct ip *);
		}

		if (in_cksum(m, hlen) != 0) {
			/* drop the whole chain, not just the first mbuf */
			m_freem(m);
			return;
		}

		/* set IP ttl from MPLS ttl */
		ip->ip_ttl = ttl;

		/* recalculate checksum */
		ip->ip_sum = 0;
		ip->ip_sum = in_cksum(m, hlen);
	}

	/* new receive if and move into correct rdomain */
	m->m_pkthdr.rcvif = ifp;
	m->m_pkthdr.rdomain = ifp->if_rdomain;

#if NBPFILTER > 0
	/* NOTE(review): ifp was already dereferenced just above */
	if (ifp && ifp->if_bpf)
		bpf_mtap_af(ifp->if_bpf, AF_INET, m, BPF_DIRECTION_IN);
#endif
	s = splnet();
	IF_INPUT_ENQUEUE(&ipintrq, m);
	schednetisr(NETISR_IP);
	splx(s);
}

/*
 * Deliver a de-labelled IPv6 packet received for this interface.
 *
 * When mpls_mapttl_ip6 is set, the IPv6 header is pulled up and its hop
 * limit replaced by the MPLS ttl.  The packet is then tagged with ifp and
 * its rdomain, tapped to bpf and queued on ip6intrq.  The smpls argument
 * is not used.  The mbuf is consumed.
 */
void
mpe_input6(struct mbuf *m, struct ifnet *ifp, struct sockaddr_mpls *smpls,
    u_int8_t ttl)
{
	struct ip6_hdr	*ip6hdr;
	int		 s;

	/* label -> AF lookup */

	if (mpls_mapttl_ip6) {
		if (m->m_len < sizeof (struct ip6_hdr) &&
		    (m = m_pullup(m, sizeof(struct ip6_hdr))) == NULL)
			return;

		ip6hdr = mtod(m, struct ip6_hdr *);

		/* set IPv6 ttl from MPLS ttl */
		ip6hdr->ip6_hlim = ttl;
	}

	/* new receive if and move into correct rdomain */
	m->m_pkthdr.rcvif = ifp;
	m->m_pkthdr.rdomain = ifp->if_rdomain;

#if NBPFILTER > 0
	/* NOTE(review): ifp was already dereferenced just above */
	if (ifp && ifp->if_bpf)
		bpf_mtap_af(ifp->if_bpf, AF_INET6, m, BPF_DIRECTION_IN);
#endif
	s = splnet();
	IF_INPUT_ENQUEUE(&ip6intrq, m);
	schednetisr(NETISR_IPV6);
	splx(s);
}

/*
 * Add or delete (cmd is RTM_ADD or RTM_DELETE) the MPLS route that maps
 * the label in shim to this interface with a pop operation, and announce
 * the change with rt_missmsg().
 *
 * Returns the error reported by rtrequest1(), 0 on success.
 */
int
mpe_newlabel(struct ifnet *ifp, int cmd, struct shim_hdr *shim)
{
	struct rtentry		*nrt = NULL;
	struct sockaddr_mpls	 dst;
	struct rt_addrinfo	 info;
	int			 error;

	bzero(&dst, sizeof(dst));
	dst.smpls_len = sizeof(dst);
	dst.smpls_family = AF_MPLS;
	dst.smpls_label = shim->shim_label;

	bzero(&info, sizeof(info));
	info.rti_flags = RTF_UP | RTF_MPLS;
	info.rti_mpls = MPLS_OP_POP;
	info.rti_info[RTAX_DST] = smplstosa(&dst);
	/* the interface's link-level address stands in as the gateway */
	info.rti_info[RTAX_GATEWAY] = (struct sockaddr *)ifp->if_sadl;

	error = rtrequest1(cmd, &info, RTP_CONNECTED, &nrt, 0);
	/* only look at the entry when one was actually returned */
	rt_missmsg(cmd, &info, (error || nrt == NULL) ? 0 : nrt->rt_flags,
	    ifp, error, 0);
	if (cmd == RTM_DELETE) {
		if (error == 0 && nrt != NULL) {
			/* release the deleted entry if nobody else holds it */
			if (nrt->rt_refcnt <= 0) {
				nrt->rt_refcnt++;
				rtfree(nrt);
			}
		}
	}
	if (cmd == RTM_ADD && error == 0 && nrt != NULL) {
		/* drop the reference taken on our behalf by rtrequest1() */
		nrt->rt_refcnt--;
	}
	return (error);
}