ref: b638c7753d8498eaec90f06a7c140ffe0ed76cdb
parent: d72a4043993d02b56873dfe40767cef9336685fc
author: cinap_lenrek <[email protected]>
date: Sun Nov 10 14:50:46 EST 2019
devip: use the routing table for local source ip address selection when making outgoing connections, the source ip was selected by just iterating from the first to the last interface and trying each local address until a route was found. the result was kind of hard to predict as it depends on the interface order. this change replaces the algorithm with the route lookup algorithm that we already have which takes more specific desination and source prefixes into account. so the order of interfaces does not matter anymore.
--- a/sys/src/9/ip/arp.c
+++ b/sys/src/9/ip/arp.c
@@ -401,7 +401,7 @@
if((ifc = findipifc(fs, ia, ia, Runi)) == nil)
error("no interface");
rlock(ifc);
- if(!ipv6local(ifc, ia, ip) || arpenter(fs, V6, ip, mac, n, ia, ifc, 0) < 0){
+ if(!ipv6local(ifc, ia, 0, ip) || arpenter(fs, V6, ip, mac, n, ia, ifc, 0) < 0){
runlock(ifc);
error("destination unreachable");
}
@@ -450,7 +450,7 @@
qlock(arp);
state = arpstate[a->state];
ipmove(ip, a->ip);
- if(ifc->m == nil || a->ifcid != ifc->ifcid || !ipv6local(ifc, ia, ip)){
+ if(ifc->m == nil || a->ifcid != ifc->ifcid || !ipv6local(ifc, ia, 0, ip)){
qunlock(arp);
runlock(ifc);
continue;
@@ -507,7 +507,7 @@
} else {
arprelease(f->arp, a);
}
- if(!ipv6local(ifc, src, targ))
+ if(!ipv6local(ifc, src, 0, targ))
return;
send:
if(!waserror()){
--- a/sys/src/9/ip/ethermedium.c
+++ b/sys/src/9/ip/ethermedium.c
@@ -462,7 +462,7 @@
memmove(targ, a->ip+IPv4off, IPv4addrlen);
arprelease(er->f->arp, a);
- if(!ipv4local(ifc, src, targ))
+ if(!ipv4local(ifc, src, 0, targ))
return;
n = sizeof(Etherarp);
--- a/sys/src/9/ip/icmp.c
+++ b/sys/src/9/ip/icmp.c
@@ -218,7 +218,7 @@
uchar ia[IPv4addrlen];
p = (Icmp *)bp->rp;
- if(!ip4reply(f, p->src) || !ipv4local(ifc, ia, p->src))
+ if(!ip4reply(f, p->src) || !ipv4local(ifc, ia, 0, p->src))
return;
netlog(f, Logicmp, "sending icmpttlexceeded %V -> src %V dst %V\n",
--- a/sys/src/9/ip/icmp6.c
+++ b/sys/src/9/ip/icmp6.c
@@ -332,7 +332,7 @@
ipmove(addr, p->src);
if(!isv6mcast(p->dst))
ipmove(p->src, p->dst);
- else if (!ipv6local(ifc, p->src, addr))
+ else if (!ipv6local(ifc, p->src, 0, addr))
return nil;
ipmove(p->dst, addr);
p->type = EchoReplyV6;
@@ -434,7 +434,7 @@
uchar ia[IPaddrlen];
p = (Ip6hdr *)bp->rp;
- if(isv6mcast(p->dst) || isv6mcast(p->src) || !ipv6local(ifc, ia, p->src))
+ if(isv6mcast(p->dst) || isv6mcast(p->src) || !ipv6local(ifc, ia, 0, p->src))
return;
netlog(f, Logicmp, "send icmphostunr %I -> src %I dst %I\n",
@@ -471,7 +471,7 @@
uchar ia[IPaddrlen];
p = (Ip6hdr *)bp->rp;
- if(isv6mcast(p->dst) || isv6mcast(p->src) || !ipv6local(ifc, ia, p->src))
+ if(isv6mcast(p->dst) || isv6mcast(p->src) || !ipv6local(ifc, ia, 0, p->src))
return;
netlog(f, Logicmp, "send icmpttlexceeded6 %I -> src %I dst %I\n",
@@ -504,7 +504,7 @@
uchar ia[IPaddrlen];
p = (Ip6hdr *)bp->rp;
- if(isv6mcast(p->dst) || isv6mcast(p->src) || !ipv6local(ifc, ia, p->src))
+ if(isv6mcast(p->dst) || isv6mcast(p->src) || !ipv6local(ifc, ia, 0, p->src))
return;
netlog(f, Logicmp, "send icmppkttoobig6 %I -> src %I dst %I\n",
@@ -769,7 +769,7 @@
/* fall through */
case Tuniproxy:
- if(ipv6local(ifc, ia, np->src)) {
+ if(ipv6local(ifc, ia, 0, np->src)) {
if(arpenter(icmp->f, V6, np->src, np->lnaddr, 8*np->olen-2, ia, ifc, 0) < 0)
break;
pktflags |= Sflag;
@@ -801,7 +801,7 @@
lifc = iplocalonifc(ifc, np->target);
if(lifc != nil && lifc->tentative)
arpenter(icmp->f, V6, np->target, np->lnaddr, 8*np->olen-2, np->target, ifc, 0);
- else if(ipv6local(ifc, ia, np->target))
+ else if(ipv6local(ifc, ia, 0, np->target))
arpenter(icmp->f, V6, np->target, np->lnaddr, 8*np->olen-2, ia, ifc, 1);
freeblist(bp);
break;
--- a/sys/src/9/ip/ip.h
+++ b/sys/src/9/ip/ip.h
@@ -567,6 +567,8 @@
extern void remroute(Fs *f, uchar *a, uchar *mask, uchar *s, uchar *smask, uchar *gate, int type, Ipifc *ifc, char *tag);
extern Route* v4lookup(Fs *f, uchar *a, uchar *s, Routehint *h);
extern Route* v6lookup(Fs *f, uchar *a, uchar *s, Routehint *h);
+extern Route* v4source(Fs *f, uchar *a, uchar *s);
+extern Route* v6source(Fs *f, uchar *a, uchar *s);
extern long routeread(Fs *f, char*, ulong, int);
extern long routewrite(Fs *f, Chan*, char*, int);
extern void routetype(int type, char p[8]);
@@ -664,8 +666,8 @@
extern Ipifc* findipifc(Fs*, uchar *local, uchar *remote, int type);
extern Ipifc* findipifcstr(Fs *f, char *s);
extern void findlocalip(Fs*, uchar *local, uchar *remote);
-extern int ipv4local(Ipifc *ifc, uchar *local, uchar *remote);
-extern int ipv6local(Ipifc *ifc, uchar *local, uchar *remote);
+extern int ipv4local(Ipifc *ifc, uchar *local, int prefixlen, uchar *remote);
+extern int ipv6local(Ipifc *ifc, uchar *local, int prefixlen, uchar *remote);
extern Iplifc* iplocalonifc(Ipifc *ifc, uchar *ip);
extern Iplifc* ipremoteonifc(Ipifc *ifc, uchar *ip);
extern int ipproxyifc(Fs *f, Ipifc *ifc, uchar *ip);
--- a/sys/src/9/ip/ipifc.c
+++ b/sys/src/9/ip/ipifc.c
@@ -1263,10 +1263,17 @@
}
/*
- * return v4 address associated with an interface close to remote
+ * ipv4local, ipv6local:
+ * return a local address associated with an interface close to remote.
+ * prefixlen is the number of leading bits in the local address that
+ * have to match an interface address to be considered. this is used
+ * by source specific routes to filter on the source address.
+ * return non-zero on success or zero when no address was found.
+ *
+ * for ipv4local, all addresses are 4 byte format.
*/
int
-ipv4local(Ipifc *ifc, uchar *local, uchar *remote)
+ipv4local(Ipifc *ifc, uchar *local, int prefixlen, uchar *remote)
{
Iplifc *lifc;
int a, b;
@@ -1275,6 +1282,10 @@
for(lifc = ifc->lifc; lifc != nil; lifc = lifc->next){
if((lifc->type & Rv4) == 0 || ipcmp(lifc->local, IPnoaddr) == 0)
continue;
+
+ if(prefixlen && comprefixlen(lifc->local+IPv4off, local, IPv4addrlen) < prefixlen)
+ continue;
+
a = comprefixlen(lifc->local+IPv4off, remote, IPv4addrlen);
if(a > b){
b = a;
@@ -1284,11 +1295,8 @@
return b >= 0;
}
-/*
- * return v6 address associated with an interface close to remote
- */
int
-ipv6local(Ipifc *ifc, uchar *local, uchar *remote)
+ipv6local(Ipifc *ifc, uchar *local, int prefixlen, uchar *remote)
{
struct {
int atype;
@@ -1300,12 +1308,13 @@
Iplifc *lifc;
if(isv4(remote)){
- ipmove(local, v4prefix);
- return ipv4local(ifc, local+IPv4off, remote+IPv4off);
+ memmove(local, v4prefix, IPv4off);
+ if((prefixlen -= IPv4off*8) < 0)
+ prefixlen = 0;
+ return ipv4local(ifc, local+IPv4off, prefixlen, remote+IPv4off);
}
atype = v6addrtype(remote);
- ipmove(local, v6Unspecified);
b.atype = unknownv6;
b.deprecated = 1;
b.comprefixlen = 0;
@@ -1315,6 +1324,9 @@
if(lifc->tentative)
continue;
+ if(prefixlen && comprefixlen(lifc->local, local, IPaddrlen) < prefixlen)
+ continue;
+
a.atype = v6addrtype(lifc->local);
a.deprecated = lifc->preflt != ~0UL && lifc->preflt < now-lifc->origint;
a.comprefixlen = comprefixlen(lifc->local, remote, IPaddrlen);
@@ -1347,53 +1359,21 @@
return b.atype >= atype;
}
+/*
+ * find the local address for a remote destination
+ */
void
findlocalip(Fs *f, uchar *local, uchar *remote)
{
- Route *r;
- Iplifc *lifc;
- Ipifc *ifc, *nifc;
- Conv **cp;
-
- for(cp = f->ipifc->conv; *cp != nil; cp++){
- ifc = (Ipifc*)(*cp)->ptcl;
- rlock(ifc);
- for(lifc = ifc->lifc; lifc != nil; lifc = lifc->next){
- if(lifc->tentative)
- continue;
-
- r = v6lookup(f, remote, lifc->local, nil);
- if(r == nil || (nifc = r->ifc) == nil)
- continue;
- if(r->type & Runi){
- ipmove(local, remote);
- runlock(ifc);
- return;
- }
- if(nifc != ifc) rlock(nifc);
- if((r->type & (Rifc|Rbcast|Rmulti|Rv4)) == Rv4){
- ipmove(local, v4prefix);
- if(ipv4local(nifc, local+IPv4off, r->v4.gate)){
- if(nifc != ifc) runlock(nifc);
- runlock(ifc);
- return;
- }
- }
- if(ipv6local(nifc, local, remote)){
- if(nifc != ifc) runlock(nifc);
- runlock(ifc);
- return;
- }
- if(nifc != ifc) runlock(nifc);
- }
- runlock(ifc);
+ if(isv4(remote)) {
+ memmove(local, v4prefix, IPv4off);
+ if(v4source(f, remote+IPv4off, local+IPv4off) == nil)
+ findprimaryipv4(f, local);
+ } else {
+ if(v6source(f, remote, local) == nil)
+ findprimaryipv6(f, local);
}
- if(isv4(remote))
- findprimaryipv4(f, local);
- else
- findprimaryipv6(f, local);
}
-
/*
* see if this address is bound to the interface
--- a/sys/src/9/ip/iproute.c
+++ b/sys/src/9/ip/iproute.c
@@ -535,10 +535,64 @@
wunlock(&routelock);
}
+/* get the outgoing interface for route r */
+static Ipifc*
+routefindipifc(Route *r, Fs *f)
+{
+ uchar local[IPaddrlen], gate[IPaddrlen];
+ Ipifc *ifc;
+ int i;
+
+ ifc = r->ifc;
+ if(ifc != nil && ifc->ifcid == r->ifcid)
+ return ifc;
+
+ if(r->type & Rsrc) {
+ if(r->type & Rv4) {
+ hnputl(local+IPv4off, r->v4.source);
+ memmove(local, v4prefix, IPv4off);
+ } else {
+ for(i = 0; i < IPllen; i++)
+ hnputl(local+4*i, r->v6.source[i]);
+ }
+ } else {
+ ipmove(local, IPnoaddr);
+ }
+
+ if(r->type & Rifc) {
+ if(r->type & Rv4) {
+ hnputl(gate+IPv4off, r->v4.address);
+ memmove(gate, v4prefix, IPv4off);
+ } else {
+ for(i = 0; i < IPllen; i++)
+ hnputl(gate+4*i, r->v6.address[i]);
+ }
+ } else {
+ if(r->type & Rv4)
+ v4tov6(gate, r->v4.gate);
+ else
+ ipmove(gate, r->v6.gate);
+ }
+
+ if((ifc = findipifc(f, local, gate, r->type)) == nil)
+ return nil;
+
+ r->ifc = ifc;
+ r->ifcid = ifc->ifcid;
+ return ifc;
+}
+
+/*
+ * v4lookup, v6lookup:
+ * lookup a route to destination address a from source address s
+ * and return the route. returns nil if no route was found.
+ * an optional Routehint can be passed in rh to cache the lookup.
+ *
+ * for v4lookup, addresses are in 4 byte format.
+ */
Route*
v4lookup(Fs *f, uchar *a, uchar *s, Routehint *rh)
{
- uchar local[IPaddrlen], gate[IPaddrlen];
ulong la, ls;
Route *p, *q;
Ipifc *ifc;
@@ -577,23 +631,9 @@
p = p->mid;
}
- if(q == nil || q->ref == 0)
+ if(q == nil || q->ref == 0 || routefindipifc(q, f) == nil)
return nil;
- if(q->ifc == nil || q->ifcid != q->ifc->ifcid){
- if(q->type & Rifc) {
- hnputl(gate+IPv4off, q->v4.address);
- memmove(gate, v4prefix, IPv4off);
- } else
- v4tov6(gate, q->v4.gate);
- v4tov6(local, s);
- ifc = findipifc(f, local, gate, q->type);
- if(ifc == nil)
- return nil;
- q->ifc = ifc;
- q->ifcid = ifc->ifcid;
- }
-
if(rh != nil){
rh->r = q;
rh->rgen = v4routegeneration;
@@ -605,7 +645,6 @@
Route*
v6lookup(Fs *f, uchar *a, uchar *s, Routehint *rh)
{
- uchar gate[IPaddrlen];
ulong la[IPllen], ls[IPllen];
ulong x, y;
Route *p, *q;
@@ -684,27 +723,127 @@
next: ;
}
- if(q == nil || q->ref == 0)
+ if(q == nil || q->ref == 0 || routefindipifc(q, f) == nil)
return nil;
- if(q->ifc == nil || q->ifcid != q->ifc->ifcid){
- if(q->type & Rifc) {
- for(h = 0; h < IPllen; h++)
- hnputl(gate+4*h, q->v6.address[h]);
- ifc = findipifc(f, s, gate, q->type);
- } else
- ifc = findipifc(f, s, q->v6.gate, q->type);
- if(ifc == nil)
- return nil;
- q->ifc = ifc;
- q->ifcid = ifc->ifcid;
- }
-
if(rh != nil){
rh->r = q;
rh->rgen = v6routegeneration;
}
+ return q;
+}
+
+/*
+ * v4source, v6source:
+ * lookup a route to destination address a and also find
+ * a suitable source address s on the outgoing interface.
+ * return the route on success or nil when no route
+ * was found.
+ *
+ * for v4source, addresses are in 4 byte format.
+ */
+Route*
+v4source(Fs *f, uchar *a, uchar *s)
+{
+ uchar src[IPv4addrlen];
+ int splen;
+ ulong x, la;
+ Route *p, *q;
+ Ipifc *ifc;
+
+ q = nil;
+ la = nhgetl(a);
+ rlock(&routelock);
+ for(p = f->v4root[V4H(la)]; p != nil;){
+ if(la < p->v4.address){
+ p = p->left;
+ continue;
+ }
+ if(la > p->v4.endaddress){
+ p = p->right;
+ continue;
+ }
+ splen = 0;
+ if(p->type & Rsrc){
+ /* calculate local prefix length for source specific routes */
+ for(x = ~(p->v4.endsource ^ p->v4.source); x & 0x80000000UL; x <<= 1)
+ splen++;
+ hnputl(src, p->v4.source);
+ }
+ if((ifc = routefindipifc(p, f)) == nil
+ || !ipv4local(ifc, src, splen, (p->type & (Rifc|Rbcast|Rmulti|Rv4))==Rv4? p->v4.gate: a)){
+ p = p->mid;
+ continue;
+ }
+ memmove(s, src, IPv4addrlen);
+ q = p;
+ p = p->mid;
+ }
+ runlock(&routelock);
+ return q;
+}
+
+Route*
+v6source(Fs *f, uchar *a, uchar *s)
+{
+ uchar src[IPaddrlen];
+ int splen, h;
+ ulong x, y, la[IPllen];
+ Route *p, *q;
+ Ipifc *ifc;
+
+ q = nil;
+ for(h = 0; h < IPllen; h++)
+ la[h] = nhgetl(a+4*h);
+ rlock(&routelock);
+ for(p = f->v6root[V6H(la)]; p != nil;){
+ for(h = 0; h < IPllen; h++){
+ x = la[h];
+ y = p->v6.address[h];
+ if(x == y)
+ continue;
+ if(x < y){
+ p = p->left;
+ goto next;
+ }
+ break;
+ }
+ for(h = 0; h < IPllen; h++){
+ x = la[h];
+ y = p->v6.endaddress[h];
+ if(x == y)
+ continue;
+ if(x > y){
+ p = p->right;
+ goto next;
+ }
+ break;
+ }
+ splen = 0;
+ if(p->type & Rsrc){
+ /* calculate local prefix length for source specific routes */
+ for(h = 0; h < IPllen; h++){
+ hnputl(src+4*h, p->v6.source[h]);
+ if((x = ~(p->v6.endsource[h] ^ p->v6.source[h])) != ~0UL){
+ for(; x & 0x80000000UL; x <<= 1)
+ splen++;
+ break;
+ }
+ splen += 32;
+ }
+ }
+ if((ifc = routefindipifc(p, f)) == nil
+ || !ipv6local(ifc, src, splen, a)){
+ p = p->mid;
+ continue;
+ }
+ ipmove(s, src);
+ q = p;
+ p = p->mid;
+next: ;
+ }
+ runlock(&routelock);
return q;
}
--- a/sys/src/9/ip/rudp.c
+++ b/sys/src/9/ip/rudp.c
@@ -559,15 +559,12 @@
default:
/* connection oriented rudp */
if(ipcmp(c->raddr, IPnoaddr) == 0){
- /* save the src address in the conversation */
- ipmove(c->raddr, raddr);
- c->rport = rport;
-
/* reply with the same ip address (if not broadcast) */
if(ipforme(f, laddr) != Runi)
- ipv6local(ifc, c->laddr, c->raddr);
- else
- ipmove(c->laddr, laddr);
+ ipv6local(ifc, laddr, 0, raddr);
+ ipmove(c->laddr, laddr);
+ ipmove(c->raddr, raddr);
+ c->rport = rport;
}
break;
}
--- a/sys/src/9/ip/udp.c
+++ b/sys/src/9/ip/udp.c
@@ -423,7 +423,7 @@
if(ucb->headers == 0){
/* create a new conversation */
if(ipforme(f, laddr) != Runi)
- ipv6local(ifc, laddr, raddr);
+ ipv6local(ifc, laddr, 0, raddr);
c = Fsnewcall(c, raddr, rport, laddr, lport, version);
if(c == nil){
qunlock(udp);