X net/ipv6: Catching unreachable routes in cache ...

So far this could be reproduced with helloweb under load from several places via wrk, e.g. [ 2223.320576] +cU 2001067c1254000e0010000000000001 80 00000000000000000000000000000000 00 00000000000000000000000000000000 00000000 00000001 00000000 01200200 lo [ 2223.320601] . U 2001067c125400000000000000000000 30 00000000000000000000000000000000 00 00000000000000000000000000000000 00000400 00000001 00000000 00200200 lo This means that the cached unreachable route 2001:67c:1254:e:10::1/128 was cloned from the unreachable route 2001:67c:1254::/48 at a time when 2001:67c:1254:e:10::/80 was absent. However, that unreachable cached route was removed fairly quickly once the route for 2001:67c:1254:e:10::/80 appeared again. Still watching...

X net/ipv6: Catching unreachable routes in cache ...
So far this could be reproduced with helloweb under load from several places via wrk, e.g. [ 2223.320576] +cU 2001067c1254000e0010000000000001 80 00000000000000000000000000000000 00 00000000000000000000000000000000 00000000 00000001 00000000 01200200 lo [ 2223.320601] . U 2001067c125400000000000000000000 30 00000000000000000000000000000000 00 00000000000000000000000000000000 00000400 00000001 00000000 00200200 lo This means that the cached unreachable route 2001:67c:1254:e:10::1/128 was cloned from the unreachable route 2001:67c:1254::/48 at a time when 2001:67c:1254:e:10::/80 was absent. However, that unreachable cached route was removed fairly quickly once the route for 2001:67c:1254:e:10::/80 appeared again. Still watching...
a023f92b · Kirill Smelkov · a11efd7b · a023f92b · a023f92b · a023f92b
Commit a023f92b authored Jun 08, 2016 by Kirill Smelkov
Showing with 87 additions and 5 deletions

include/net/ip6_fib.h include/net/ip6_fib.h +2 -2

net/ipv6/fib6_rules.c net/ipv6/fib6_rules.c +1 -0

net/ipv6/ip6_fib.c net/ipv6/ip6_fib.c +4 -1

net/ipv6/route.c net/ipv6/route.c +80 -2

No files found.
--- a/include/net/ip6_fib.h
+++ b/include/net/ip6_fib.h
@@ -188,9 +188,9 @@ static inline void rt6_set_from(struct rt6_info *rt, struct rt6_info *from)
 {
 	struct dst_entry *new = (struct dst_entry *) from;

-	rt->rt6i_flags &= ~RTF_EXPIRES;
+	rt->rt6i_flags &= ~RTF_EXPIRES; // XXX cache always not expires ?
 	dst_hold(new);
-	rt->dst.from = new;
+	rt->dst.from = new; // XXX try to track rt->dst.from in monitor dump - to know from which route this was cloned
 }

 static inline void ip6_rt_put(struct rt6_info *rt)

--- a/net/ipv6/fib6_rules.c
+++ b/net/ipv6/fib6_rules.c
@@ -86,6 +86,7 @@ static int fib6_rule_action(struct fib_rule *rule, struct flowi *flp,
 		struct fib6_rule *r = (struct fib6_rule *)rule;

 		/*
+                 * XXX is it relevant?
 		 * If we need to find a source address for this traffic,
 		 * we check the result if it meets requirement of the rule.
 		 */

--- a/net/ipv6/ip6_fib.c
+++ b/net/ipv6/ip6_fib.c
@@ -81,7 +81,7 @@ static int fib6_walk_continue(struct fib6_walker_t *w);
 *	A routing update causes an increase of the serial number on the
 *	affected subtree. This allows for cached routes to be asynchronously
 *	tested when modifications are made to the destination cache as a
- *	result of redirects, path MTU changes, etc.
+ *	result of redirects, path MTU changes, etc. XXX NOTE!
 */

 static __u32 rt_sernum;
@@ -460,6 +460,9 @@ static struct fib6_node *fib6_add_1(struct fib6_node *root,
 		 *	Exact match ?
 		 */

+                // NOTE relookup entry, when entry is already "same" _daddr_
+                // (i.e. it could be unreachable in fib, but trying to add as reachable -> BUG)
+                // XXX ^^^ wrong - here we only locate fib6_node place - content is set by caller
 		if (plen == fn->fn_bit) {
 			/* clean up an intermediate node */
 			if (!(fn->fn_flags & RTN_RTINFO)) {

--- a/net/ipv6/route.c
+++ b/net/ipv6/route.c
@@ -903,6 +903,7 @@ static struct rt6_info *rt6_alloc_cow(struct rt6_info *ort,
 	return rt;
 }

+// NOTE here
 static struct rt6_info *rt6_alloc_clone(struct rt6_info *ort,
 					const struct in6_addr *daddr)
 {
@@ -946,7 +947,7 @@ static struct rt6_info *ip6_pol_route(struct net *net, struct fib6_table *table,
 	if (!(rt->rt6i_flags & (RTF_NONEXTHOP | RTF_GATEWAY)))
 		nrt = rt6_alloc_cow(rt, &fl6->daddr, &fl6->saddr);
 	else if (!(rt->dst.flags & DST_HOST))
-		nrt = rt6_alloc_clone(rt, &fl6->daddr);
+		nrt = rt6_alloc_clone(rt, &fl6->daddr);     // <-- NOTE here
 	else
 		goto out2;

@@ -955,7 +956,7 @@ static struct rt6_info *ip6_pol_route(struct net *net, struct fib6_table *table,

 	dst_hold(&rt->dst);
 	if (nrt) {
-		err = ip6_ins_rt(nrt);
+		err = ip6_ins_rt(nrt);  // <-- NOTE here cloned route inserted back
 		if (!err)
 			goto out2;
 	}
@@ -1160,6 +1161,7 @@ static void ip6_rt_update_pmtu(struct dst_entry *dst, struct sock *sk,
 	}
 }

+// NOTE
 void ip6_update_pmtu(struct sk_buff *skb, struct net *net, __be32 mtu,
 		     int oif, u32 mark)
 {
@@ -2781,6 +2783,55 @@ static int inet6_rtm_getroute(struct sk_buff *in_skb, struct nlmsghdr* nlh)
 	return err;
 }

+static void rt6_print(const struct rt6_info *rt)
+{
+        // Debug helper: dumps one route with a single printk that has no log level and no trailing newline. TODO? also print:
+        // dst  CHECK
+        // table    (rt6i_table->tb6_id)
+        // prefsrc  rt->rt6i_prefsrc
+        // protocol rt->rt6i_protocol
+        static const struct in6_addr in6_zero = {};  // all-zero address, printed as gateway when RTF_GATEWAY is not set
+
+        char rttype, rtcached;
+
+        rtcached = rt->rt6i_flags & RTF_CACHE ? 'c' : ' ';  // 'c' marks a route with RTF_CACHE set
+
+        // route type letter; the trailing comments name the rtm_type each letter stands for - see rt6_fill_node()
+        rttype = '?';  // placeholder: every branch below overwrites it
+        if (rt->rt6i_flags & RTF_REJECT) {
+            switch(rt->dst.error) {  // reject routes are told apart by their dst.error value
+		case -EINVAL:
+			rttype = 'B';   // rtm->rtm_type = RTN_BLACKHOLE;
+			break;
+		case -EACCES:
+			rttype = 'P';   // rtm->rtm_type = RTN_PROHIBIT;
+			break;
+		case -EAGAIN:
+			rttype = 'T';   // rtm->rtm_type = RTN_THROW;
+			break;
+		default:
+			rttype = 'U';   // rtm->rtm_type = RTN_UNREACHABLE;
+			break;
+            }
+        }
+        else if (rt->rt6i_flags & RTF_LOCAL)
+                rttype = 'l';   // rtm->rtm_type = RTN_LOCAL;
+	else if (rt->dst.dev && (rt->dst.dev->flags & IFF_LOOPBACK))
+		rttype = 'l';   // rtm->rtm_type = RTN_LOCAL; (device is a loopback interface)
+	else
+		rttype = ' ';   // rtm->rtm_type = RTN_UNICAST;
+
+        printk("%c%c %pi6 %02x %pi6 %02x %pi6 %08x %08x %08x %08x %8s",  // columns: cached+type chars, dst addr, dst plen, src addr, src plen, gateway, metric, refcnt, use, flags, dev name (numbers in hex)
+                rtcached, rttype,
+                &rt->rt6i_dst.addr, rt->rt6i_dst.plen,
+                &rt->rt6i_src.addr, rt->rt6i_src.plen,
+                (rt->rt6i_flags & RTF_GATEWAY ? &rt->rt6i_gateway : &in6_zero),
+                rt->rt6i_metric, atomic_read(&rt->dst.__refcnt),
+                rt->dst.__use, rt->rt6i_flags,
+                rt->dst.dev ? rt->dst.dev->name : ""  // empty name when the route has no device
+        );
+}
+
 void inet6_rt_notify(int event, struct rt6_info *rt, struct nl_info *info)
 {
 	struct sk_buff *skb;
@@ -2788,6 +2839,33 @@ void inet6_rt_notify(int event, struct rt6_info *rt, struct nl_info *info)
 	u32 seq;
 	int err;

+        if (event == RTM_NEWROUTE || event == RTM_DELROUTE) {
+            struct rt6_info *rt_from;
+            char adddel = (event == RTM_NEWROUTE ? '+' : '-');
+
+            if (!(rt->rt6i_flags & RTF_CACHE))  goto rtnotrace; // only cached
+            if (!(rt->rt6i_flags & RTF_REJECT)) goto rtnotrace; // only unreachable
+
+            // show route
+            printk(KERN_ERR "%c", adddel);
+            rt6_print(rt);
+            printk("\n");
+
+            // show route this route is cached from
+            rt_from = rt;
+            while (rt_from && rt_from->rt6i_flags & RTF_CACHE) {
+                rt_from = (struct rt6_info *)rt_from->dst.from;
+                printk(KERN_ERR " .");
+                if (rt_from)
+                    rt6_print(rt_from);
+                else
+                    printk("nil");
+                printk("\n");
+            }
+
+        }
+rtnotrace:
+
 	err = -ENOBUFS;
 	seq = info->nlh ? info->nlh->nlmsg_seq : 0;