2 * DECnet An implementation of the DECnet protocol suite for the LINUX
3 * operating system. DECnet is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
6 * DECnet Routing Forwarding Information Base (Glue/Info List)
8 * Author: Steve Whitehouse <SteveW@ACM.org>
12 * Alexey Kuznetsov : SMP locking changes
13 * Steve Whitehouse : Rewrote it... Well to be more correct, I
14 * copied most of it from the ipv4 fib code.
15 * Steve Whitehouse : Updated it in style and fixed a few bugs
16 * which were fixed in the ipv4 code since
17 * this code was copied from it.
20 #include <linux/string.h>
21 #include <linux/net.h>
22 #include <linux/socket.h>
23 #include <linux/slab.h>
24 #include <linux/sockios.h>
25 #include <linux/init.h>
26 #include <linux/skbuff.h>
27 #include <linux/netlink.h>
28 #include <linux/rtnetlink.h>
29 #include <linux/proc_fs.h>
30 #include <linux/netdevice.h>
31 #include <linux/timer.h>
32 #include <linux/spinlock.h>
33 #include <linux/atomic.h>
34 #include <asm/uaccess.h>
35 #include <net/neighbour.h>
38 #include <net/fib_rules.h>
40 #include <net/dn_route.h>
41 #include <net/dn_fib.h>
42 #include <net/dn_neigh.h>
43 #include <net/dn_dev.h>
/* Table number fib_magic() passes to dn_fib_get_table() for RTN_UNICAST routes. */
45 #define RT_MIN_TABLE 1
/*
 * for_fib_info() opens a brace scope, declares `fi` and starts a for loop
 * over dn_fib_info_list following fib_next; endfor_fib_info() closes the scope.
 */
47 #define for_fib_info() { struct dn_fib_info *fi;\
48 for(fi = dn_fib_info_list; fi; fi = fi->fib_next)
49 #define endfor_fib_info() }
/*
 * for_nexthops(fi) opens a brace scope and iterates over the fib_nhs entries
 * of (fi)->fib_nh, exposing `nhsel` (index) and a const `nh` pointer to the
 * loop body.
 */
51 #define for_nexthops(fi) { int nhsel; const struct dn_fib_nh *nh;\
52 for(nhsel = 0, nh = (fi)->fib_nh; nhsel < (fi)->fib_nhs; nh++, nhsel++)
/* Same iteration as for_nexthops(), but `nh` is non-const so the body may modify it. */
54 #define change_nexthops(fi) { int nhsel; struct dn_fib_nh *nh;\
55 for(nhsel = 0, nh = (struct dn_fib_nh *)((fi)->fib_nh); nhsel < (fi)->fib_nhs; nh++, nhsel++)
/* Closes the brace scope opened by for_nexthops()/change_nexthops(). */
57 #define endfor_nexthops(fi) }
/*
 * Taken with spin_lock_bh() around the nh_power/fib_power bookkeeping in
 * dn_fib_select_multipath() and around the RTNH_F_DEAD nexthop flag updates
 * in dn_fib_sync_down()/dn_fib_sync_up().
 */
59 static DEFINE_SPINLOCK(dn_fib_multipath_lock);
/* Head of the list of dn_fib_info entries, linked through fib_next/fib_prev. */
60 static struct dn_fib_info *dn_fib_info_list;
/* Held while entries are linked into or unlinked from dn_fib_info_list. */
61 static DEFINE_SPINLOCK(dn_fib_info_lock);
/*
 * Per-route-type properties, indexed by RTN_* type.
 *   .error - value dn_fib_semantic_match() starts from for that type, and the
 *            flag dn_fib_create_info() tests to detect error-type routes.
 *   .scope - value dn_fib_create_info() compares against the requested
 *            rtm_scope.
 */
67 } dn_fib_props[RTN_MAX+1] = {
68 [RTN_UNSPEC] = { .error = 0, .scope = RT_SCOPE_NOWHERE },
69 [RTN_UNICAST] = { .error = 0, .scope = RT_SCOPE_UNIVERSE },
70 [RTN_LOCAL] = { .error = 0, .scope = RT_SCOPE_HOST },
71 [RTN_BROADCAST] = { .error = -EINVAL, .scope = RT_SCOPE_NOWHERE },
72 [RTN_ANYCAST] = { .error = -EINVAL, .scope = RT_SCOPE_NOWHERE },
73 [RTN_MULTICAST] = { .error = -EINVAL, .scope = RT_SCOPE_NOWHERE },
74 [RTN_BLACKHOLE] = { .error = -EINVAL, .scope = RT_SCOPE_UNIVERSE },
75 [RTN_UNREACHABLE] = { .error = -EHOSTUNREACH, .scope = RT_SCOPE_UNIVERSE },
76 [RTN_PROHIBIT] = { .error = -EACCES, .scope = RT_SCOPE_UNIVERSE },
77 [RTN_THROW] = { .error = -EAGAIN, .scope = RT_SCOPE_UNIVERSE },
78 [RTN_NAT] = { .error = 0, .scope = RT_SCOPE_NOWHERE },
79 [RTN_XRESOLVE] = { .error = -EINVAL, .scope = RT_SCOPE_NOWHERE },
/*
 * Forward declarations: both functions are defined further down in this file
 * but are called earlier by the interface-address handlers.
 */
82 static int dn_fib_sync_down(__le16 local, struct net_device *dev, int force);
83 static int dn_fib_sync_up(struct net_device *dev);
/*
 * Tear-down path for a dn_fib_info.
 *
 * An entry whose fib_dead is still zero is treated as a bug and reported with
 * a KERN_DEBUG message. The remainder walks the entry's nexthops with
 * change_nexthops()/endfor_nexthops().
 * NOTE(review): the per-nexthop cleanup and the final release of fi are not
 * visible here - confirm against the full source.
 */
85 void dn_fib_free_info(struct dn_fib_info *fi)
87 if (fi->fib_dead == 0) {
88 printk(KERN_DEBUG "DECnet: BUG! Attempt to free alive dn_fib_info\n");
96 } endfor_nexthops(fi);
/*
 * Drop one tree reference on a dn_fib_info.
 *
 * dn_fib_info_lock is held for the whole operation and a NULL fi is
 * tolerated. When fib_treeref reaches zero the entry is unlinked from the
 * doubly linked dn_fib_info_list: the neighbours' fib_prev/fib_next are
 * re-pointed and the list head is advanced if fi was the first entry.
 */
100 void dn_fib_release_info(struct dn_fib_info *fi)
102 spin_lock(&dn_fib_info_lock);
103 if (fi && --fi->fib_treeref == 0) {
105 fi->fib_next->fib_prev = fi->fib_prev;
107 fi->fib_prev->fib_next = fi->fib_next;
108 if (fi == dn_fib_info_list)
109 dn_fib_info_list = fi->fib_next;
113 spin_unlock(&dn_fib_info_lock);
/*
 * Compare the nexthops of two dn_fib_info entries.
 *
 * Each nexthop of fi is checked against the corresponding nexthop of ofi
 * (starting at ofi->fib_nh) for differences in output interface, gateway,
 * scope, weight, or flags with RTNH_F_DEAD masked out of the comparison.
 * dn_fib_find_info() treats a return value of 0 as "nexthops match".
 */
116 static inline int dn_fib_nh_comp(const struct dn_fib_info *fi, const struct dn_fib_info *ofi)
118 const struct dn_fib_nh *onh = ofi->fib_nh;
121 if (nh->nh_oif != onh->nh_oif ||
122 nh->nh_gw != onh->nh_gw ||
123 nh->nh_scope != onh->nh_scope ||
124 nh->nh_weight != onh->nh_weight ||
125 ((nh->nh_flags^onh->nh_flags)&~RTNH_F_DEAD))
128 } endfor_nexthops(fi);
/*
 * Look for an already-known dn_fib_info equivalent to nfi.
 *
 * A candidate `fi` is checked for the same nexthop count, protocol,
 * preferred source, priority, metrics (bytewise) and flags (ignoring
 * RTNH_F_DEAD), and - when there are nexthops - for dn_fib_nh_comp()
 * returning 0. dn_fib_create_info() treats a non-NULL result as "found".
 * NOTE(review): `fi` is presumably supplied by for_fib_info(); the loop
 * header is not visible here - confirm.
 */
132 static inline struct dn_fib_info *dn_fib_find_info(const struct dn_fib_info *nfi)
135 if (fi->fib_nhs != nfi->fib_nhs)
137 if (nfi->fib_protocol == fi->fib_protocol &&
138 nfi->fib_prefsrc == fi->fib_prefsrc &&
139 nfi->fib_priority == fi->fib_priority &&
140 memcmp(nfi->fib_metrics, fi->fib_metrics, sizeof(fi->fib_metrics)) == 0 &&
141 ((nfi->fib_flags^fi->fib_flags)&~RTNH_F_DEAD) == 0 &&
142 (nfi->fib_nhs == 0 || dn_fib_nh_comp(fi, nfi) == 0))
/*
 * Walk a chain of rtattr records (attrlen bytes in total) and return the
 * payload of the first one whose rta_type equals `type`, read as a __le16.
 * NOTE(review): the value returned when no attribute matches is not visible
 * here - confirm.
 */
148 __le16 dn_fib_get_attr16(struct rtattr *attr, int attrlen, int type)
150 while(RTA_OK(attr,attrlen)) {
151 if (attr->rta_type == type)
152 return *(__le16*)RTA_DATA(attr);
153 attr = RTA_NEXT(attr, attrlen);
/*
 * Count the rtnexthop records carried in the payload of rta.
 *
 * The walk continues while at least sizeof(struct rtnexthop) bytes remain;
 * each step subtracts the record's own rtnh_len from the remaining length
 * and moves on with RTNH_NEXT().
 * NOTE(review): the visible check only rejects a negative remainder. A
 * record whose rtnh_len is smaller than the header (for example 0) does not
 * appear to be rejected - confirm there is a guard, otherwise the loop may
 * not make progress.
 */
159 static int dn_fib_count_nhs(struct rtattr *rta)
162 struct rtnexthop *nhp = RTA_DATA(rta);
163 int nhlen = RTA_PAYLOAD(rta);
165 while(nhlen >= (int)sizeof(struct rtnexthop)) {
166 if ((nhlen -= nhp->rtnh_len) < 0)
169 nhp = RTNH_NEXT(nhp);
/*
 * Fill the nexthop array of fi from the rtnexthop records in rta.
 *
 * For each nexthop slot of fi one record is consumed:
 *   - nh_flags  = route flags above the low 8 bits, OR'ed with rtnh_flags
 *   - nh_oif    = rtnh_ifindex
 *   - nh_weight = rtnh_hops + 1
 *   - nh_gw     = RTA_GATEWAY attribute nested after the record header,
 *                 fetched with dn_fib_get_attr16()
 * dn_fib_create_info() treats a non-zero return as failure.
 */
175 static int dn_fib_get_nhs(struct dn_fib_info *fi, const struct rtattr *rta, const struct rtmsg *r)
177 struct rtnexthop *nhp = RTA_DATA(rta);
178 int nhlen = RTA_PAYLOAD(rta);
180 change_nexthops(fi) {
/* Bytes left for nested attributes once the rtnexthop header is accounted for. */
181 int attrlen = nhlen - sizeof(struct rtnexthop);
182 if (attrlen < 0 || (nhlen -= nhp->rtnh_len) < 0)
185 nh->nh_flags = (r->rtm_flags&~0xFF) | nhp->rtnh_flags;
186 nh->nh_oif = nhp->rtnh_ifindex;
187 nh->nh_weight = nhp->rtnh_hops + 1;
190 nh->nh_gw = dn_fib_get_attr16(RTNH_DATA(nhp), attrlen, RTA_GATEWAY);
192 nhp = RTNH_NEXT(nhp);
193 } endfor_nexthops(fi);
/*
 * Validate one nexthop of a route being created and fill in its scope (and,
 * on the lookup path, its output interface and device).
 * dn_fib_create_info() treats a non-zero return as failure.
 * NOTE(review): the branch structure joining the three sections below and
 * their error returns are not visible here - confirm against the full source.
 */
199 static int dn_fib_check_nh(const struct rtmsg *r, struct dn_fib_info *fi, struct dn_fib_nh *nh)
205 struct dn_fib_res res;
/*
 * RTNH_F_ONLINK nexthop: checks the route scope against RT_SCOPE_LINK, that
 * the gateway is a unicast address, and that nh_oif names an existing device
 * in init_net which is up. The nexthop scope becomes RT_SCOPE_LINK.
 */
207 if (nh->nh_flags&RTNH_F_ONLINK) {
208 struct net_device *dev;
210 if (r->rtm_scope >= RT_SCOPE_LINK)
212 if (dnet_addr_type(nh->nh_gw) != RTN_UNICAST)
214 if ((dev = __dev_get_by_index(&init_net, nh->nh_oif)) == NULL)
216 if (!(dev->flags&IFF_UP))
220 nh->nh_scope = RT_SCOPE_LINK;
/*
 * Gateway resolved through the FIB: look up nh_gw via nh_oif with a flow
 * scope of rtm_scope + 1, raised to RT_SCOPE_LINK if it would be lower.
 */
224 memset(&fld, 0, sizeof(fld));
225 fld.daddr = nh->nh_gw;
226 fld.flowidn_oif = nh->nh_oif;
227 fld.flowidn_scope = r->rtm_scope + 1;
229 if (fld.flowidn_scope < RT_SCOPE_LINK)
230 fld.flowidn_scope = RT_SCOPE_LINK;
232 if ((err = dn_fib_lookup(&fld, &res)) != 0)
/* The lookup result is checked for being a unicast or local route. */
236 if (res.type != RTN_UNICAST && res.type != RTN_LOCAL)
238 nh->nh_scope = res.scope;
239 nh->nh_oif = DN_FIB_RES_OIF(res);
240 nh->nh_dev = DN_FIB_RES_DEV(res);
241 if (nh->nh_dev == NULL)
/* Take a device reference for the nexthop before checking that it is up. */
243 dev_hold(nh->nh_dev);
245 if (!(nh->nh_dev->flags & IFF_UP))
/* Release the lookup result. */
249 dn_fib_res_put(&res);
/*
 * Device-only nexthop: checks the RTNH_F_PERVASIVE/RTNH_F_ONLINK flags and
 * that nh_oif names a device in init_net which has DECnet state (dn_ptr) and
 * is up. A device reference is taken and the nexthop scope becomes
 * RT_SCOPE_HOST.
 */
252 struct net_device *dev;
254 if (nh->nh_flags&(RTNH_F_PERVASIVE|RTNH_F_ONLINK))
257 dev = __dev_get_by_index(&init_net, nh->nh_oif);
258 if (dev == NULL || dev->dn_ptr == NULL)
260 if (!(dev->flags&IFF_UP))
263 dev_hold(nh->nh_dev);
264 nh->nh_scope = RT_SCOPE_HOST;
/*
 * Build a dn_fib_info from a route request, or find an existing equivalent.
 *
 * r    - route message header (type, scope, protocol, flags)
 * rta  - parsed attribute pointers (priority, metrics, prefsrc, oif, gateway,
 *        multipath, dst)
 * nlh  - the originating netlink header
 * errp - NOTE(review): presumably receives the error code on failure; the
 *        assignment is not visible here - confirm.
 *
 * NOTE(review): error exits (goto/return) and several branch headers are not
 * visible here; the section comments below describe only the visible
 * statements.
 */
271 struct dn_fib_info *dn_fib_create_info(const struct rtmsg *r, struct dn_kern_rta *rta, const struct nlmsghdr *nlh, int *errp)
274 struct dn_fib_info *fi = NULL;
275 struct dn_fib_info *ofi;
/* Check the route type against RTN_MAX before it indexes dn_fib_props. */
278 if (r->rtm_type > RTN_MAX)
/* Compare the scope associated with the route type against the requested scope. */
281 if (dn_fib_props[r->rtm_type].scope > r->rtm_scope)
/* Number of nexthops carried in the multipath attribute. */
285 nhs = dn_fib_count_nhs(rta->rta_mp);
/* Zeroed allocation: the info header followed by room for nhs nexthops. */
290 fi = kzalloc(sizeof(*fi)+nhs*sizeof(struct dn_fib_nh), GFP_KERNEL);
295 fi->fib_protocol = r->rtm_protocol;
297 fi->fib_flags = r->rtm_flags;
298 if (rta->rta_priority)
299 fi->fib_priority = *rta->rta_priority;
/*
 * Metrics: each nested attribute's rta_type selects the metric, stored at
 * index type - 1 after the check against RTAX_MAX.
 */
301 int attrlen = RTA_PAYLOAD(rta->rta_mx);
302 struct rtattr *attr = RTA_DATA(rta->rta_mx);
304 while(RTA_OK(attr, attrlen)) {
305 unsigned int flavour = attr->rta_type;
308 if (flavour > RTAX_MAX)
310 fi->fib_metrics[flavour-1] = *(unsigned int *)RTA_DATA(attr);
312 attr = RTA_NEXT(attr, attrlen);
/* Preferred source address: 2 bytes are copied. */
315 if (rta->rta_prefsrc)
316 memcpy(&fi->fib_prefsrc, rta->rta_prefsrc, 2);
/*
 * Multipath request: parse the nexthop records, then cross-check the first
 * nexthop against a separately supplied oif / gateway.
 */
319 if ((err = dn_fib_get_nhs(fi, rta->rta_mp, r)) != 0)
321 if (rta->rta_oif && fi->fib_nh->nh_oif != *rta->rta_oif)
323 if (rta->rta_gw && memcmp(&fi->fib_nh->nh_gw, rta->rta_gw, 2))
/* Single nexthop taken directly from the oif / gateway attributes. */
326 struct dn_fib_nh *nh = fi->fib_nh;
328 nh->nh_oif = *rta->rta_oif;
330 memcpy(&nh->nh_gw, rta->rta_gw, 2);
331 nh->nh_flags = r->rtm_flags;
/* RTN_NAT: checked for a gateway, exactly one nexthop and no oif. */
335 if (r->rtm_type == RTN_NAT) {
336 if (rta->rta_gw == NULL || nhs != 1 || rta->rta_oif)
338 memcpy(&fi->fib_nh->nh_gw, rta->rta_gw, 2);
/* Route types with an associated error are checked for gateway/oif/multipath. */
342 if (dn_fib_props[r->rtm_type].error) {
343 if (rta->rta_gw || rta->rta_oif || rta->rta_mp)
348 if (r->rtm_scope > RT_SCOPE_HOST)
/* Host-scope route: one nexthop, no gateway; the device is looked up by oif. */
351 if (r->rtm_scope == RT_SCOPE_HOST) {
352 struct dn_fib_nh *nh = fi->fib_nh;
354 /* Local address is added */
355 if (nhs != 1 || nh->nh_gw)
357 nh->nh_scope = RT_SCOPE_NOWHERE;
358 nh->nh_dev = dev_get_by_index(&init_net, fi->fib_nh->nh_oif);
360 if (nh->nh_dev == NULL)
/* Other scopes: every nexthop is validated with dn_fib_check_nh(). */
363 change_nexthops(fi) {
364 if ((err = dn_fib_check_nh(r, fi, nh)) != 0)
366 } endfor_nexthops(fi)
/*
 * A preferred source that is not simply the destination of an RTN_LOCAL
 * route is checked for being a local address.
 */
369 if (fi->fib_prefsrc) {
370 if (r->rtm_type != RTN_LOCAL || rta->rta_dst == NULL ||
371 memcmp(&fi->fib_prefsrc, rta->rta_dst, 2))
372 if (dnet_addr_type(fi->fib_prefsrc) != RTN_LOCAL)
/* An equivalent entry already exists: the freshly built one is freed. */
377 if ((ofi = dn_fib_find_info(fi)) != NULL) {
379 dn_fib_free_info(fi);
/* New entry: take a client reference and link it at the head of the list. */
385 atomic_inc(&fi->fib_clntref);
386 spin_lock(&dn_fib_info_lock);
387 fi->fib_next = dn_fib_info_list;
389 if (dn_fib_info_list)
390 dn_fib_info_list->fib_prev = fi;
391 dn_fib_info_list = fi;
392 spin_unlock(&dn_fib_info_lock);
/* NOTE(review): presumably the failure path freeing a partially built entry - confirm. */
402 dn_fib_free_info(fi);
/*
 * Decide whether a dn_fib_info can serve the flow fld and fill in res.
 *
 * Starts from the error associated with the route type in dn_fib_props and
 * tests the entry's RTNH_F_DEAD flag. On the visible paths res is reset,
 * a client reference is taken on fi, and live nexthops are matched against
 * the flow's output interface (any interface matches when the flow has
 * none). An unexpected type is reported through net_err_ratelimited().
 * NOTE(review): the switch/branch structure and the return values are not
 * visible here - confirm.
 */
408 int dn_fib_semantic_match(int type, struct dn_fib_info *fi, const struct flowidn *fld, struct dn_fib_res *res)
410 int err = dn_fib_props[type].error;
413 if (fi->fib_flags & RTNH_F_DEAD)
420 DN_FIB_RES_RESET(*res);
421 atomic_inc(&fi->fib_clntref);
/* Dead nexthops are tested for; a nexthop matches if the flow names no oif or the same oif. */
426 if (nh->nh_flags & RTNH_F_DEAD)
428 if (!fld->flowidn_oif ||
429 fld->flowidn_oif == nh->nh_oif)
/* nhsel below fib_nhs means the scan stopped on a nexthop rather than running off the end. */
432 if (nhsel < fi->fib_nhs) {
434 atomic_inc(&fi->fib_clntref);
441 net_err_ratelimited("DECnet: impossible routing event : dn_fib_semantic_match type=%d\n",
/*
 * Pick one nexthop of res->fi for a multipath route.
 *
 * All bookkeeping is done under dn_fib_multipath_lock (bottom halves
 * disabled). When fib_power is exhausted (<= 0) every live nexthop gets its
 * nh_power reset to nh_weight and fib_power becomes the sum of those
 * weights. A value w = jiffies % fib_power is then reduced by each live
 * nexthop's nh_power in turn; the nexthop that brings w to zero or below is
 * the one selected.
 * NOTE(review): how the selection is stored in res and the handling of an
 * all-dead entry are not visible here - confirm.
 */
450 void dn_fib_select_multipath(const struct flowidn *fld, struct dn_fib_res *res)
452 struct dn_fib_info *fi = res->fi;
455 spin_lock_bh(&dn_fib_multipath_lock);
456 if (fi->fib_power <= 0) {
458 change_nexthops(fi) {
459 if (!(nh->nh_flags&RTNH_F_DEAD)) {
460 power += nh->nh_weight;
461 nh->nh_power = nh->nh_weight;
463 } endfor_nexthops(fi);
464 fi->fib_power = power;
466 spin_unlock_bh(&dn_fib_multipath_lock);
472 w = jiffies % fi->fib_power;
474 change_nexthops(fi) {
475 if (!(nh->nh_flags&RTNH_F_DEAD) && nh->nh_power) {
476 if ((w -= nh->nh_power) <= 0) {
480 spin_unlock_bh(&dn_fib_multipath_lock);
484 } endfor_nexthops(fi);
486 spin_unlock_bh(&dn_fib_multipath_lock);
/*
 * Sanity-check the parsed route attributes and convert them in place.
 *
 * The array is scanned for attribute numbers 1..RTA_MAX (slot i-1 holds
 * attribute i). Payloads shorter than 4 bytes are checked for being exactly
 * 2 bytes long. For attributes other than RTA_MULTIPATH and RTA_METRICS
 * (among the visible conditions) the slot is overwritten with a pointer to
 * the attribute's payload rather than its header.
 * The netlink handlers treat a non-zero return as failure.
 */
490 static int dn_fib_check_attr(struct rtmsg *r, struct rtattr **rta)
494 for(i = 1; i <= RTA_MAX; i++) {
495 struct rtattr *attr = rta[i-1];
497 if (RTA_PAYLOAD(attr) < 4 && RTA_PAYLOAD(attr) != 2)
499 if (i != RTA_MULTIPATH && i != RTA_METRICS &&
501 rta[i-1] = (struct rtattr *)RTA_DATA(attr);
/*
 * Choose the routing table id for a request: when an RTA_TABLE attribute is
 * present its u32 value replaces the `table` argument (the callers pass
 * rtm_table from the message header).
 * NOTE(review): `table` is declared u8, so the value read with
 * nla_get_u32() is narrowed on assignment even though the function returns
 * u32 - confirm whether table ids above 255 are meant to be supported.
 */
508 static inline u32 rtm_get_table(struct rtattr **rta, u8 table)
510 if (rta[RTA_TABLE - 1])
511 table = nla_get_u32((struct nlattr *) rta[RTA_TABLE - 1]);
/*
 * rtnetlink handler registered for RTM_DELROUTE on PF_DECnet.
 *
 * The request's namespace is compared with init_net, the attributes are
 * validated with dn_fib_check_attr(), the table is looked up with
 * dn_fib_get_table(..., 0) and the request is handed to the table's
 * delete() operation, whose result is returned.
 * NOTE(review): the error codes for the failed checks and any NULL-table
 * handling are not visible here - confirm.
 */
516 static int dn_fib_rtm_delroute(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
518 struct net *net = sock_net(skb->sk);
519 struct dn_fib_table *tb;
520 struct rtattr **rta = arg;
521 struct rtmsg *r = NLMSG_DATA(nlh);
523 if (!net_eq(net, &init_net))
526 if (dn_fib_check_attr(r, rta))
529 tb = dn_fib_get_table(rtm_get_table(rta, r->rtm_table), 0);
531 return tb->delete(tb, r, (struct dn_kern_rta *)rta, nlh, &NETLINK_CB(skb));
/*
 * rtnetlink handler registered for RTM_NEWROUTE on PF_DECnet.
 *
 * Mirrors dn_fib_rtm_delroute(): namespace comparison with init_net,
 * attribute validation, then a table lookup - here with
 * dn_fib_get_table(..., 1) - and a call to the table's insert() operation,
 * whose result is returned.
 * NOTE(review): the second argument of dn_fib_get_table() presumably means
 * "create if missing"; the error codes and any NULL-table handling are not
 * visible here - confirm.
 */
536 static int dn_fib_rtm_newroute(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
538 struct net *net = sock_net(skb->sk);
539 struct dn_fib_table *tb;
540 struct rtattr **rta = arg;
541 struct rtmsg *r = NLMSG_DATA(nlh);
543 if (!net_eq(net, &init_net))
546 if (dn_fib_check_attr(r, rta))
549 tb = dn_fib_get_table(rtm_get_table(rta, r->rtm_table), 1);
551 return tb->insert(tb, r, (struct dn_kern_rta *)rta, nlh, &NETLINK_CB(skb));
/*
 * Insert or delete a kernel-generated route for an interface address.
 *
 * cmd     - RTM_NEWROUTE inserts; the other visible branch deletes
 * type    - route type; RTN_UNICAST uses table RT_MIN_TABLE, the other
 *           visible branch uses RT_TABLE_LOCAL
 * dst     - destination address
 * dst_len - destination prefix length, stored in rtm_dst_len
 * ifa     - interface address supplying the preferred source and the
 *           output interface index
 *
 * A synthetic netlink request (header plus rtmsg) is built on the stack and
 * passed straight to the table's insert()/delete() operation with a NULL
 * last argument.
 * NOTE(review): the declaration of `req`, the use of `dst`, and any check of
 * the table pointer are not visible here - confirm.
 */
556 static void fib_magic(int cmd, int type, __le16 dst, int dst_len, struct dn_ifaddr *ifa)
558 struct dn_fib_table *tb;
563 struct dn_kern_rta rta;
565 memset(&req.rtm, 0, sizeof(req.rtm));
566 memset(&rta, 0, sizeof(rta));
568 if (type == RTN_UNICAST)
569 tb = dn_fib_get_table(RT_MIN_TABLE, 1);
571 tb = dn_fib_get_table(RT_TABLE_LOCAL, 1);
576 req.nlh.nlmsg_len = sizeof(req);
577 req.nlh.nlmsg_type = cmd;
578 req.nlh.nlmsg_flags = NLM_F_REQUEST|NLM_F_CREATE|NLM_F_APPEND;
579 req.nlh.nlmsg_pid = 0;
580 req.nlh.nlmsg_seq = 0;
582 req.rtm.rtm_dst_len = dst_len;
583 req.rtm.rtm_table = tb->n;
584 req.rtm.rtm_protocol = RTPROT_KERNEL;
/* Local routes get host scope; every other type gets link scope. */
585 req.rtm.rtm_scope = (type != RTN_LOCAL ? RT_SCOPE_LINK : RT_SCOPE_HOST);
586 req.rtm.rtm_type = type;
589 rta.rta_prefsrc = &ifa->ifa_local;
590 rta.rta_oif = &ifa->ifa_dev->dev->ifindex;
592 if (cmd == RTM_NEWROUTE)
593 tb->insert(tb, &req.rtm, &rta, &req.nlh, NULL);
595 tb->delete(tb, &req.rtm, &rta, &req.nlh, NULL);
/*
 * Called when an interface address is added: installs an RTN_LOCAL route
 * for the address with a 16-bit prefix length via fib_magic(), then tests
 * whether the device is up.
 * NOTE(review): the declaration of `dev` and what follows the IFF_UP test
 * are not visible here - confirm.
 */
598 static void dn_fib_add_ifaddr(struct dn_ifaddr *ifa)
601 fib_magic(RTM_NEWROUTE, RTN_LOCAL, ifa->ifa_local, 16, ifa);
604 if (!(dev->flags&IFF_UP))
606 /* In the future, we will want to add default routes here */
/*
 * Called when an interface address is removed.
 *
 * Every device in init_net is scanned with the RCU list iterators, and each
 * device's address list is searched for an entry with the same local address
 * as ifa. The RTN_LOCAL route for the address is deleted through
 * fib_magic(); if the address is then no longer classified as RTN_LOCAL,
 * dn_fib_sync_down() is run for it.
 * NOTE(review): the RCU read-side locking, the handling of a found duplicate
 * and the condition guarding the route deletion are not visible here -
 * confirm.
 */
611 static void dn_fib_del_ifaddr(struct dn_ifaddr *ifa)
614 struct net_device *dev;
615 struct dn_dev *dn_db;
616 struct dn_ifaddr *ifa2;
620 /* Scan device list */
622 for_each_netdev_rcu(&init_net, dev) {
623 dn_db = rcu_dereference(dev->dn_ptr);
626 for (ifa2 = rcu_dereference(dn_db->ifa_list);
628 ifa2 = rcu_dereference(ifa2->ifa_next)) {
629 if (ifa2->ifa_local == ifa->ifa_local) {
638 fib_magic(RTM_DELROUTE, RTN_LOCAL, ifa->ifa_local, 16, ifa);
640 if (dnet_addr_type(ifa->ifa_local) != RTN_LOCAL) {
641 if (dn_fib_sync_down(ifa->ifa_local, NULL, 0))
/*
 * Take a device out of routing: runs dn_fib_sync_down() for the device
 * (passing `force` through), flushes the route cache with
 * dn_rt_cache_flush(0) and calls neigh_ifdown() for the device on the
 * DECnet neighbour table.
 * NOTE(review): the statement controlled by the dn_fib_sync_down() test is
 * not visible here - confirm.
 */
647 static void dn_fib_disable_addr(struct net_device *dev, int force)
649 if (dn_fib_sync_down(0, dev, force))
651 dn_rt_cache_flush(0);
652 neigh_ifdown(&dn_neigh_table, dev);
/*
 * Notifier callback for DECnet interface-address events; `ptr` is the
 * dn_ifaddr concerned.
 *
 * One visible path adds the address's local route, revives nexthops on the
 * device with dn_fib_sync_up() and flushes the route cache. The other
 * removes the local route and, when the device has no addresses left,
 * disables the device with force = 1; it also contains a
 * dn_rt_cache_flush(-1) call.
 * NOTE(review): the event constants selecting each path, the branch
 * structure around the second flush and the return value are not visible
 * here - confirm.
 */
655 static int dn_fib_dnaddr_event(struct notifier_block *this, unsigned long event, void *ptr)
657 struct dn_ifaddr *ifa = (struct dn_ifaddr *)ptr;
661 dn_fib_add_ifaddr(ifa);
662 dn_fib_sync_up(ifa->ifa_dev->dev);
663 dn_rt_cache_flush(-1);
666 dn_fib_del_ifaddr(ifa);
667 if (ifa->ifa_dev && ifa->ifa_dev->ifa_list == NULL) {
668 dn_fib_disable_addr(ifa->ifa_dev->dev, 1);
670 dn_rt_cache_flush(-1);
/*
 * Mark routing information dead after an address or device goes away.
 *
 * local - when non-zero, entries whose preferred source equals it are
 *         flagged RTNH_F_DEAD
 * dev   - when set, live nexthops on this device whose scope differs from
 *         `scope` are flagged RTNH_F_DEAD under dn_fib_multipath_lock and
 *         their nh_power is subtracted from the entry's fib_power; an entry
 *         whose dead count equals its nexthop count is flagged dead itself
 * force - NOTE(review): its effect (presumably on `scope`) is not visible
 *         here - confirm.
 *
 * Callers test the return value for non-zero; how it is computed is not
 * visible here.
 */
677 static int dn_fib_sync_down(__le16 local, struct net_device *dev, int force)
680 int scope = RT_SCOPE_NOWHERE;
687 * This makes no sense for DECnet.... we will almost
688 * certainly have more than one local address the same
689 * over all our interfaces. It needs thinking about
692 if (local && fi->fib_prefsrc == local) {
693 fi->fib_flags |= RTNH_F_DEAD;
695 } else if (dev && fi->fib_nhs) {
698 change_nexthops(fi) {
699 if (nh->nh_flags&RTNH_F_DEAD)
701 else if (nh->nh_dev == dev &&
702 nh->nh_scope != scope) {
/* The flag change and the power adjustment happen together under the multipath lock. */
703 spin_lock_bh(&dn_fib_multipath_lock);
704 nh->nh_flags |= RTNH_F_DEAD;
705 fi->fib_power -= nh->nh_power;
707 spin_unlock_bh(&dn_fib_multipath_lock);
710 } endfor_nexthops(fi)
711 if (dead == fi->fib_nhs) {
712 fi->fib_flags |= RTNH_F_DEAD;
/*
 * Revive nexthops that use `dev` once the device is usable again.
 *
 * The device is first tested for IFF_UP. Nexthops are then examined: the
 * visible tests cover the RTNH_F_DEAD flag, whether the nexthop's device is
 * set and up, and whether it is `dev` with DECnet state (dn_ptr) attached.
 * The RTNH_F_DEAD flag is cleared on the nexthop under
 * dn_fib_multipath_lock, and the entry's own RTNH_F_DEAD flag is cleared
 * too.
 * NOTE(review): the enclosing list walk, the skip/continue statements, the
 * condition for clearing the entry flag and the return value are not visible
 * here - confirm.
 */
721 static int dn_fib_sync_up(struct net_device *dev)
725 if (!(dev->flags&IFF_UP))
731 change_nexthops(fi) {
732 if (!(nh->nh_flags&RTNH_F_DEAD)) {
736 if (nh->nh_dev == NULL || !(nh->nh_dev->flags&IFF_UP))
738 if (nh->nh_dev != dev || dev->dn_ptr == NULL)
741 spin_lock_bh(&dn_fib_multipath_lock);
743 nh->nh_flags &= ~RTNH_F_DEAD;
744 spin_unlock_bh(&dn_fib_multipath_lock);
745 } endfor_nexthops(fi);
748 fi->fib_flags &= ~RTNH_F_DEAD;
/*
 * Notifier block routing DECnet address events to dn_fib_dnaddr_event();
 * registered in dn_fib_init() and unregistered in dn_fib_cleanup().
 */
755 static struct notifier_block dn_fib_dnaddr_notifier = {
756 .notifier_call = dn_fib_dnaddr_event,
/*
 * Module-exit teardown: cleans up the FIB tables and rules, then
 * unregisters the address notifier.
 */
759 void __exit dn_fib_cleanup(void)
761 dn_fib_table_cleanup();
762 dn_fib_rules_cleanup();
764 unregister_dnaddr_notifier(&dn_fib_dnaddr_notifier);
/*
 * Init-time setup: registers the address notifier and installs the
 * rtnetlink handlers for RTM_NEWROUTE and RTM_DELROUTE on PF_DECnet.
 * NOTE(review): any table/rules initialisation preceding these calls is not
 * visible here - confirm.
 */
768 void __init dn_fib_init(void)
773 register_dnaddr_notifier(&dn_fib_dnaddr_notifier);
775 rtnl_register(PF_DECnet, RTM_NEWROUTE, dn_fib_rtm_newroute, NULL, NULL);
776 rtnl_register(PF_DECnet, RTM_DELROUTE, dn_fib_rtm_delroute, NULL, NULL);