/* $OpenBSD: radix_mpath.c,v 1.33 2015/09/28 08:36:24 mpi Exp $ */ /* $KAME: radix_mpath.c,v 1.13 2002/10/28 21:05:59 itojun Exp $ */ /* * Copyright (C) 2001 WIDE Project. * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * 3. Neither the name of the project nor the names of its contributors * may be used to endorse or promote products derived from this software * without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF * SUCH DAMAGE. * THE AUTHORS DO NOT GUARANTEE THAT THIS SOFTWARE DOES NOT INFRINGE * ANY OTHERS' INTELLECTUAL PROPERTIES. IN NO EVENT SHALL THE AUTHORS * BE LIABLE FOR ANY INFRINGEMENT OF ANY OTHERS' INTELLECTUAL * PROPERTIES. 
*/ #include #include #include #include #include #include #include #include #include #include #include #ifdef INET6 #include #include #endif int rn_mpath_capable(struct radix_node_head *rnh) { return rnh->rnh_multipath; } struct radix_node * rn_mpath_next(struct radix_node *rn, int mode) { struct radix_node *next; struct rtentry *nt, *rt = (struct rtentry *)rn; if (!rn->rn_dupedkey) return NULL; next = rn->rn_dupedkey; if (rn->rn_mask != next->rn_mask) return NULL; switch (mode) { case RMP_MODE_BYPRIO: /* scan all of the list until we find a match */ while (next) { if (rn->rn_mask != next->rn_mask) return NULL; nt = (struct rtentry *)next; if ((rt->rt_priority & RTP_MASK) == (nt->rt_priority & RTP_MASK)) return next; rn = next; next = next->rn_dupedkey; } return NULL; case RMP_MODE_ACTIVE: nt = (struct rtentry *)next; if (rt->rt_priority != nt->rt_priority) return NULL; break; case RMP_MODE_ALL: break; } return next; } struct rtentry * rt_mpath_next(struct rtentry *rt) { struct radix_node *rn = (struct radix_node *)rt; return ((struct rtentry *)rn_mpath_next(rn, RMP_MODE_ACTIVE)); } /* * return first route matching prio or the node just before. */ struct radix_node * rn_mpath_prio(struct radix_node *rn, u_int8_t prio) { struct radix_node *hit = rn; struct rtentry *rt; if (prio == RTP_ANY) return (hit); do { rt = (struct rtentry *)rn; if (rt->rt_priority == prio) /* perfect match */ return (rn); /* list is sorted remember last more prefered (smaller) entry */ if (rt->rt_priority < prio) hit = rn; } while ((rn = rn_mpath_next(rn, RMP_MODE_ALL)) != NULL); return (hit); } /* * Adjust the RTF_MPATH flag for the part of the rn_dupedkey chain * that matches the prio. 
*/
/*
 * rn_mpath_adj_mpflag() details:
 *
 * rn is the entry from which the search starts; a NULL rn is ignored.
 * prio is masked with RTP_MASK before use.  The first entry with that
 * priority is located through rt_mpath_matchgate() with a NULL gateway.
 * If a further entry of the same masked priority follows it
 * (RMP_MODE_BYPRIO), RTF_MPATH is set on each entry of that group;
 * otherwise RTF_MPATH is cleared on the single entry that was found.
 */
void
rn_mpath_adj_mpflag(struct radix_node *rn, u_int8_t prio)
{
	struct rtentry	*rt = (struct rtentry *)rn;

	if (!rn)
		return;

	prio &= RTP_MASK;
	/* find the first entry carrying the requested priority */
	rt = rt_mpath_matchgate(rt, NULL, prio);
	rn = (struct radix_node *)rt;
	if (!rn)
		return;

	if (rn_mpath_next(rn, RMP_MODE_BYPRIO)) {
		/* more than one entry with this priority: flag all of them */
		while (rn != NULL) {
			((struct rtentry *)rn)->rt_flags |= RTF_MPATH;
			rn = rn_mpath_next(rn, RMP_MODE_BYPRIO);
		}
	} else
		/* rt still points at the only entry with this priority */
		rt->rt_flags &= ~RTF_MPATH;
}

/*
 * Count rn plus every entry reachable from it by repeated
 * rn_mpath_next(..., RMP_MODE_ACTIVE) calls.  The result is always at
 * least 1 because rn itself is counted.
 */
int
rn_mpath_active_count(struct radix_node *rn)
{
	int	i;

	i = 1;
	while ((rn = rn_mpath_next(rn, RMP_MODE_ACTIVE)) != NULL)
		i++;

	return i;
}

/*
 * return best matching route based on gateway and prio. If both are
 * specified it acts as a lookup function to get the actual rt.
 * If gate is NULL the first node matching the prio will be returned.
 *
 * Priorities are compared after masking both sides with RTP_MASK;
 * prio == RTP_ANY disables the priority filter.  Entries are visited
 * with rn_mpath_next(..., RMP_MODE_ALL).  NULL is returned when the
 * walk ends without a match.
 *
 * NOTE(review): rt->rt_gateway is dereferenced without a NULL check
 * when gate is given -- presumably every entry on the chain has a
 * gateway; confirm against the callers.
 */
struct rtentry *
rt_mpath_matchgate(struct rtentry *rt, struct sockaddr *gate, u_int8_t prio)
{
	struct radix_node	*rn = (struct radix_node *)rt;

	do {
		rt = (struct rtentry *)rn;

		/*
		 * first find routes with correct priority; "continue" jumps
		 * to the loop condition, which advances rn to the next entry
		 */
		if (prio != RTP_ANY &&
		    (rt->rt_priority & RTP_MASK) != (prio & RTP_MASK))
			continue;
		/* if no gate is set we found a match */
		if (!gate)
			return rt;
		/* same length and same bytes: this is the entry looked for */
		if (rt->rt_gateway->sa_len == gate->sa_len &&
		    !memcmp(rt->rt_gateway, gate, gate->sa_len))
			break;
	} while ((rn = rn_mpath_next(rn, RMP_MODE_ALL)) != NULL);

	/* rn is the matching node after "break", NULL when the walk ended */
	return (struct rtentry *)rn;
}

/*
 * check if we have the same key/mask/gateway on the table already.
 *
 * rnh      radix tree head; its rnh_lookup method performs the lookup
 * dst      key of the route to be checked
 * netmask  mask of the route to be checked, may be NULL
 * gate     gateway handed to rt_mpath_matchgate()
 * prio     priority handed to rt_mpath_matchgate()
 * mpathok  when zero, an existing entry with the same key, mask and
 *          rt_priority is already a conflict, whatever its gateway
 *
 * Returns EEXIST on conflict and 0 otherwise.
 */
int
rt_mpath_conflict(struct radix_node_head *rnh, struct sockaddr *dst,
    struct sockaddr *netmask, struct sockaddr *gate, u_int8_t prio,
    int mpathok)
{
	struct radix_node	*rn1;
	struct rtentry		*rt1;
	char			*p, *q, *eq;
	int			 same, l, skip;

	rn1 = rnh->rnh_lookup(dst, netmask, rnh);
	if (!rn1)
		return 0;

	/*
	 * unlike other functions we have in this file, we have to check
	 * all key/mask/gateway as rnh_lookup can match less specific entry.
	 */
	rt1 = (struct rtentry *)rn1;

	/* compare key. */
	if (rt_key(rt1)->sa_len != dst->sa_len ||
	    bcmp(rt_key(rt1), dst, rt_key(rt1)->sa_len))
		goto different;

	/* key was the same.  compare netmask.  hairy... */
	if (rt_mask(rt1) && netmask) {
		/* bytes in front of this offset are never compared below */
		skip = rnh->rnh_treetop->rn_off;
		if (rt_mask(rt1)->sa_len > netmask->sa_len) {
			/*
			 * as rt_mask(rt1) is made optimal by radix.c,
			 * there must be some 1-bits on rt_mask(rt1)
			 * after netmask->sa_len.  therefore, in
			 * this case, the entries are different.
			 */
			if (rt_mask(rt1)->sa_len > skip)
				goto different;
			else {
				/* no bits to compare, i.e. same */
				goto maskmatched;
			}
		}

		/* from here on rt_mask(rt1)->sa_len <= netmask->sa_len */
		l = rt_mask(rt1)->sa_len;
		if (skip > l) {
			/* no bits to compare, i.e. same */
			goto maskmatched;
		}
		p = (char *)rt_mask(rt1);
		q = (char *)netmask;
		/* compare the bytes [skip, l) that both masks have */
		if (bcmp(p + skip, q + skip, l - skip))
			goto different;
		/*
		 * need to go through all the bit, as netmask is not
		 * optimal and can contain trailing 0s
		 */
		eq = (char *)netmask + netmask->sa_len;
		q += l;
		same = 1;
		/* any non-zero byte in netmask past offset l is a difference */
		while (eq > q)
			if (*q++) {
				same = 0;
				break;
			}
		if (!same)
			goto different;
	} else if (!rt_mask(rt1) && !netmask)
		; /* no mask to compare, i.e. same */
	else {
		/* one has mask and the other does not, different */
		goto different;
	}

 maskmatched:
	/*
	 * NOTE(review): rt_priority is compared here without applying
	 * RTP_MASK, whereas rt_mpath_matchgate() masks both sides --
	 * confirm that this difference is intended.
	 */
	if (!mpathok && rt1->rt_priority == prio)
		return EEXIST;

	/* key/mask were the same.  compare gateway for all multipaths */
	if (rt_mpath_matchgate(rt1, gate, prio))
		/* all key/mask/gateway are the same.  conflicting entry. */
		return EEXIST;

 different:
	return 0;
}

/*
 * Give the route rn the priority newprio and move it to the matching
 * position on its rn_dupedkey chain.
 *
 * rt_priority is overwritten first; the function then returns early if
 * the priority did not change or if the node does not have to move.
 * Otherwise rn is unlinked, the insertion point is searched with
 * rn_mpath_prio(), rn is linked back in with rn_link_dupedkey() and the
 * rm_leaf pointer of rn->rn_mklist is corrected when necessary.
 *
 * The function panics with "next == NULL" if rn is not linked from its
 * predecessor through rn_dupedkey and has no successor.
 *
 * NOTE(review): newprio is an int but is handed to rn_mpath_prio(),
 * whose prio parameter is u_int8_t -- presumably callers only pass
 * values that fit; confirm.
 */
void
rn_mpath_reprio(struct radix_node *rn, int newprio)
{
	struct radix_node	*prev = rn->rn_p;
	struct radix_node	*next = rn->rn_dupedkey;
	struct radix_node	*t, *tt, *saved_tt, *head;
	struct rtentry		*rt = (struct rtentry *)rn;
	int			 mid, oldprio, prioinv = 0;

	oldprio = rt->rt_priority;
	rt->rt_priority = newprio;

	/* same prio, no change needed */
	if (oldprio == newprio)
		return;
	if (rn_mpath_next(rn, RMP_MODE_ALL) == NULL) {
		/* no need to move node, route is alone */
		if (prev->rn_mask != rn->rn_mask)
			return;
		/* ... or route is last and prio gets bigger */
		if (oldprio < newprio)
			return;
	}

	/* remove node from dupedkey list and reinsert at correct place */
	if (prev->rn_dupedkey == rn) {
		/* rn hangs off prev's rn_dupedkey link: bypass it */
		prev->rn_dupedkey = next;
		if (next)
			next->rn_p = prev;
		else
			/* rn was last; the rewind below then starts at prev */
			next = prev;
	} else {
		/*
		 * prev does not reach rn through rn_dupedkey, so rn is
		 * linked from prev's rn_l or rn_r; next takes its place.
		 */
		if (next == NULL)
			panic("next == NULL");
		next->rn_p = prev;
		if (prev->rn_l == rn)
			prev->rn_l = next;
		else
			prev->rn_r = next;
	}

	/* re-insert rn at the right spot, so first rewind to the head */
	for (tt = next; tt->rn_p->rn_dupedkey == tt; tt = tt->rn_p)
		;
	/* NOTE(review): saved_tt is assigned here but not read afterwards */
	saved_tt = tt;

	/*
	 * Stolen from radix.c rn_addroute().
	 * This is nasty code with a certain amount of magic and dragons.
	 * t is the element where the re-priorized rn is inserted -- before
	 * or after depending on prioinv. saved_tt points to the head of the
	 * dupedkey chain and tt is a bit of a helper
	 *
	 * First we skip with tt to the start of the mpath group then we
	 * search the right spot to enter our node.
	 */
	for (; tt; tt = tt->rn_dupedkey)
		if (rn->rn_mask == tt->rn_mask)
			break;
	head = tt; /* store current head entry for rn_mklist check */

	tt = rn_mpath_prio(tt, newprio);
	if (((struct rtentry *)tt)->rt_priority != newprio) {
		/*
		 * no entry with newprio exists; insert before tt when tt
		 * has a larger priority value (prioinv), after it otherwise
		 */
		if (((struct rtentry *)tt)->rt_priority > newprio)
			prioinv = 1;
		t = tt;
	} else {
		/*
		 * entries with newprio exist: step forward from the first
		 * one, bounded by half of the active count, and use the
		 * entry reached as insertion point t
		 */
		mid = rn_mpath_active_count(tt) / 2;
		do {
			t = tt;
			tt = rn_mpath_next(tt, RMP_MODE_ACTIVE);
		} while (tt && --mid > 0);
	}

	/* insert rn before or after t depending on prioinv */
	rn_link_dupedkey(rn, t, prioinv);

	/* the rn_mklist needs to be fixed if the best route changed */
	if (rn->rn_mklist && rn->rn_flags & RNF_NORMAL) {
		if (rn->rn_mklist->rm_leaf != rn) {
			if (rn->rn_mklist->rm_leaf->rn_p == rn)
				/* changed route is now best */
				rn->rn_mklist->rm_leaf = rn;
		} else if (rn->rn_dupedkey != head) {
			/* rn moved behind head, so head is new head */
			rn->rn_mklist->rm_leaf = head;
		}
	}
}