2 * DECnet An implementation of the DECnet protocol suite for the LINUX
3 * operating system. DECnet is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
6 * DECnet Routing Forwarding Information Base (Glue/Info List)
8 * Author: Steve Whitehouse <SteveW@ACM.org>
12 * Alexey Kuznetsov : SMP locking changes
13 * Steve Whitehouse : Rewrote it... Well to be more correct, I
14 * copied most of it from the ipv4 fib code.
15 * Steve Whitehouse : Updated it in style and fixed a few bugs
16 * which were fixed in the ipv4 code since
17 * this code was copied from it.
20 #include <linux/string.h>
21 #include <linux/net.h>
22 #include <linux/socket.h>
23 #include <linux/slab.h>
24 #include <linux/sockios.h>
25 #include <linux/init.h>
26 #include <linux/skbuff.h>
27 #include <linux/netlink.h>
28 #include <linux/rtnetlink.h>
29 #include <linux/proc_fs.h>
30 #include <linux/netdevice.h>
31 #include <linux/timer.h>
32 #include <linux/spinlock.h>
33 #include <linux/atomic.h>
34 #include <asm/uaccess.h>
35 #include <net/neighbour.h>
38 #include <net/fib_rules.h>
40 #include <net/dn_route.h>
41 #include <net/dn_fib.h>
42 #include <net/dn_neigh.h>
43 #include <net/dn_dev.h>
/* Table id that fib_magic() passes to dn_fib_get_table() for RTN_UNICAST routes. */
45 #define RT_MIN_TABLE 1
/*
 * for_fib_info() ... endfor_fib_info(): opens a brace scope that declares a
 * local cursor named fi and walks the global dn_fib_info_list through
 * fib_next. The macro itself takes no lock.
 */
47 #define for_fib_info() { struct dn_fib_info *fi;\
48 for(fi = dn_fib_info_list; fi; fi = fi->fib_next)
49 #define endfor_fib_info() }
/*
 * for_nexthops(fi) ... endfor_nexthops(fi): opens a brace scope declaring
 * nhsel (running index) and nh (const pointer), then visits the fib_nhs
 * entries of (fi)->fib_nh in order. Read-only view of each nexthop.
 */
51 #define for_nexthops(fi) { int nhsel; const struct dn_fib_nh *nh;\
52 for(nhsel = 0, nh = (fi)->fib_nh; nhsel < (fi)->fib_nhs; nh++, nhsel++)
/*
 * change_nexthops(fi): same iteration as for_nexthops(), but nh is a
 * non-const pointer so the loop body may modify each nexthop.
 */
54 #define change_nexthops(fi) { int nhsel; struct dn_fib_nh *nh;\
55 for(nhsel = 0, nh = (struct dn_fib_nh *)((fi)->fib_nh); nhsel < (fi)->fib_nhs; nh++, nhsel++)
/* Closes the scope opened by for_nexthops()/change_nexthops(); the argument is unused. */
57 #define endfor_nexthops(fi) }
/*
 * Taken with spin_lock_bh() in this file around updates to fib_power,
 * nh_power and the per-nexthop RTNH_F_DEAD flag.
 */
59 static DEFINE_SPINLOCK(dn_fib_multipath_lock
);
/* Head of the list of dn_fib_info entries, linked through fib_next/fib_prev. */
60 static struct dn_fib_info
*dn_fib_info_list
;
/* Held while entries are linked into or unlinked from dn_fib_info_list. */
61 static DEFINE_SPINLOCK(dn_fib_info_lock
);
67 } dn_fib_props
[RTN_MAX
+1] = {
/*
 * One entry per route type (RTN_*), indexed by rtm_type.
 * .error is read by dn_fib_create_info() and dn_fib_semantic_match();
 * .scope is compared against rtm_scope in dn_fib_create_info().
 * NOTE(review): the opening of this declaration (the member types) is not
 * visible in this excerpt.
 */
68 [RTN_UNSPEC
] = { .error
= 0, .scope
= RT_SCOPE_NOWHERE
},
69 [RTN_UNICAST
] = { .error
= 0, .scope
= RT_SCOPE_UNIVERSE
},
70 [RTN_LOCAL
] = { .error
= 0, .scope
= RT_SCOPE_HOST
},
71 [RTN_BROADCAST
] = { .error
= -EINVAL
, .scope
= RT_SCOPE_NOWHERE
},
72 [RTN_ANYCAST
] = { .error
= -EINVAL
, .scope
= RT_SCOPE_NOWHERE
},
73 [RTN_MULTICAST
] = { .error
= -EINVAL
, .scope
= RT_SCOPE_NOWHERE
},
74 [RTN_BLACKHOLE
] = { .error
= -EINVAL
, .scope
= RT_SCOPE_UNIVERSE
},
75 [RTN_UNREACHABLE
] = { .error
= -EHOSTUNREACH
, .scope
= RT_SCOPE_UNIVERSE
},
76 [RTN_PROHIBIT
] = { .error
= -EACCES
, .scope
= RT_SCOPE_UNIVERSE
},
77 [RTN_THROW
] = { .error
= -EAGAIN
, .scope
= RT_SCOPE_UNIVERSE
},
78 [RTN_NAT
] = { .error
= 0, .scope
= RT_SCOPE_NOWHERE
},
79 [RTN_XRESOLVE
] = { .error
= -EINVAL
, .scope
= RT_SCOPE_NOWHERE
},
/*
 * Forward declarations. Both functions are defined further down and are
 * called from the address add/delete handling code before their definitions.
 */
82 static int dn_fib_sync_down(__le16 local
, struct net_device
*dev
, int force
);
83 static int dn_fib_sync_up(struct net_device
*dev
);
/*
 * dn_fib_free_info - free a dn_fib_info.
 * @fi: entry being freed
 *
 * Emits a KERN_DEBUG diagnostic when fi->fib_dead is still 0, i.e. the
 * caller is trying to free an entry that was never marked dead. The
 * trailing endfor_nexthops() shows that a nexthop loop follows the check.
 * NOTE(review): the loop body and the release of the memory are on lines
 * not visible in this excerpt - confirm against the full file.
 */
85 void dn_fib_free_info(struct dn_fib_info
*fi
)
87 if (fi
->fib_dead
== 0) {
88 printk(KERN_DEBUG
"DECnet: BUG! Attempt to free alive dn_fib_info\n");
96 } endfor_nexthops(fi
);
/*
 * dn_fib_release_info - drop one tree reference on a dn_fib_info.
 * @fi: entry to release; NULL is tolerated by the fi && test below
 *
 * Runs under dn_fib_info_lock. When fib_treeref reaches zero the entry is
 * unlinked from dn_fib_info_list.
 * NOTE(review): the visible lines dereference fi->fib_next and fi->fib_prev
 * directly; any NULL guards sit on lines not shown here - confirm.
 */
100 void dn_fib_release_info(struct dn_fib_info
*fi
)
102 spin_lock(&dn_fib_info_lock
);
/* Pre-decrement: only the caller that drops the last tree reference unlinks. */
103 if (fi
&& --fi
->fib_treeref
== 0) {
/* Re-point the successor back at our predecessor. */
105 fi
->fib_next
->fib_prev
= fi
->fib_prev
;
/* Re-point the predecessor forward at our successor. */
107 fi
->fib_prev
->fib_next
= fi
->fib_next
;
/* If fi was the list head, advance the head. */
108 if (fi
== dn_fib_info_list
)
109 dn_fib_info_list
= fi
->fib_next
;
113 spin_unlock(&dn_fib_info_lock
);
/*
 * dn_fib_nh_comp - compare the nexthop arrays of two dn_fib_info entries.
 * @fi:  entry whose nexthops are iterated
 * @ofi: entry compared against; onh starts at ofi->fib_nh
 *
 * A pair differs when oif, gateway, scope or weight differ, or when the
 * flags differ in any bit other than RTNH_F_DEAD. The caller in
 * dn_fib_find_info() treats a return of 0 as equal.
 * NOTE(review): the loop header, the return statements and the advance of
 * onh are not visible in this excerpt.
 */
116 static inline int dn_fib_nh_comp(const struct dn_fib_info
*fi
, const struct dn_fib_info
*ofi
)
118 const struct dn_fib_nh
*onh
= ofi
->fib_nh
;
121 if (nh
->nh_oif
!= onh
->nh_oif
||
122 nh
->nh_gw
!= onh
->nh_gw
||
123 nh
->nh_scope
!= onh
->nh_scope
||
124 nh
->nh_weight
!= onh
->nh_weight
||
/* XOR exposes differing flag bits; RTNH_F_DEAD is masked out of the comparison. */
125 ((nh
->nh_flags
^onh
->nh_flags
)&~RTNH_F_DEAD
))
128 } endfor_nexthops(fi
);
/*
 * dn_fib_find_info - look for an existing entry equivalent to @nfi.
 * @nfi: candidate entry
 *
 * An entry fi is checked first on nexthop count, then on protocol, prefsrc,
 * priority, the whole fib_metrics array (memcmp), flags ignoring
 * RTNH_F_DEAD, and finally on the nexthops themselves via dn_fib_nh_comp()
 * (skipped when there are no nexthops). dn_fib_create_info() treats a
 * non-NULL result as a hit.
 * NOTE(review): the iteration header that introduces fi and the return
 * statements are not visible here; fi is presumably the for_fib_info()
 * cursor - confirm.
 */
132 static inline struct dn_fib_info
*dn_fib_find_info(const struct dn_fib_info
*nfi
)
135 if (fi
->fib_nhs
!= nfi
->fib_nhs
)
137 if (nfi
->fib_protocol
== fi
->fib_protocol
&&
138 nfi
->fib_prefsrc
== fi
->fib_prefsrc
&&
139 nfi
->fib_priority
== fi
->fib_priority
&&
140 memcmp(nfi
->fib_metrics
, fi
->fib_metrics
, sizeof(fi
->fib_metrics
)) == 0 &&
141 ((nfi
->fib_flags
^fi
->fib_flags
)&~RTNH_F_DEAD
) == 0 &&
142 (nfi
->fib_nhs
== 0 || dn_fib_nh_comp(fi
, nfi
) == 0))
/*
 * dn_fib_count_nhs - walk the rtnexthop records in a netlink attribute.
 * @attr: attribute whose payload is a sequence of struct rtnexthop
 *        (passed attrs[RTA_MULTIPATH] by dn_fib_create_info())
 *
 * nhlen tracks the bytes remaining; each iteration subtracts the record
 * length and steps to the next record with RTNH_NEXT(). The caller treats
 * a result of 0 as a failure case.
 * NOTE(review): the only visible validation of rtnh_len is that the
 * remaining length must not go negative. A record advertising a length
 * smaller than the header (for example 0) does not appear to be rejected
 * by the visible lines - confirm whether the loop can fail to make
 * progress on such input.
 */
148 static int dn_fib_count_nhs(const struct nlattr
*attr
)
150 struct rtnexthop
*nhp
= nla_data(attr
);
151 int nhs
= 0, nhlen
= nla_len(attr
);
/* Continue only while at least one full rtnexthop header remains. */
153 while(nhlen
>= (int)sizeof(struct rtnexthop
)) {
154 if ((nhlen
-= nhp
->rtnh_len
) < 0)
157 nhp
= RTNH_NEXT(nhp
);
/*
 * dn_fib_get_nhs - fill the nexthop array of @fi from a multipath attribute.
 * @fi:   entry whose fib_nh[] slots are written (iterated with change_nexthops)
 * @attr: attribute holding consecutive struct rtnexthop records
 * @r:    route message; its rtm_flags supply the upper flag bits
 *
 * The caller treats a non-zero return as an error.
 * NOTE(review): attrlen is computed from the whole remaining payload
 * (nhlen) rather than from this record's rtnh_len, so the nla_find() below
 * can search past the end of the current nexthop record - confirm whether
 * that is intended.
 */
163 static int dn_fib_get_nhs(struct dn_fib_info
*fi
, const struct nlattr
*attr
,
164 const struct rtmsg
*r
)
166 struct rtnexthop
*nhp
= nla_data(attr
);
167 int nhlen
= nla_len(attr
);
169 change_nexthops(fi
) {
170 int attrlen
= nhlen
- sizeof(struct rtnexthop
);
/* Reject when no full header remains or the record overruns the payload. */
171 if (attrlen
< 0 || (nhlen
-= nhp
->rtnh_len
) < 0)
/* Low 8 flag bits come from the nexthop record, the rest from the route message. */
174 nh
->nh_flags
= (r
->rtm_flags
&~0xFF) | nhp
->rtnh_flags
;
175 nh
->nh_oif
= nhp
->rtnh_ifindex
;
/* Stored weight is rtnh_hops + 1. */
176 nh
->nh_weight
= nhp
->rtnh_hops
+ 1;
179 struct nlattr
*gw_attr
;
/* Nested attributes start immediately after the rtnexthop header. */
181 gw_attr
= nla_find((struct nlattr
*) (nhp
+ 1), attrlen
, RTA_GATEWAY
);
/* Gateway defaults to 0 when no RTA_GATEWAY attribute is found. */
182 nh
->nh_gw
= gw_attr
? nla_get_le16(gw_attr
) : 0;
184 nhp
= RTNH_NEXT(nhp
);
185 } endfor_nexthops(fi
);
/*
 * dn_fib_check_nh - validate one nexthop and resolve its device and scope.
 * @r:  route message (rtm_scope is consulted)
 * @fi: owning entry
 * @nh: nexthop to validate; nh_scope, nh_oif and nh_dev are written
 *
 * dn_fib_create_info() treats a non-zero return as an error. Three paths
 * are visible: an on-link gateway, a gateway resolved through a FIB
 * lookup, and a device-only nexthop.
 * NOTE(review): the branch conditions separating these paths, the error
 * returns and the declarations of err and fld are on lines not visible in
 * this excerpt.
 */
191 static int dn_fib_check_nh(const struct rtmsg
*r
, struct dn_fib_info
*fi
, struct dn_fib_nh
*nh
)
197 struct dn_fib_res res
;
/* On-link gateway: check scope, gateway address type and the device directly. */
199 if (nh
->nh_flags
&RTNH_F_ONLINK
) {
200 struct net_device
*dev
;
202 if (r
->rtm_scope
>= RT_SCOPE_LINK
)
204 if (dnet_addr_type(nh
->nh_gw
) != RTN_UNICAST
)
206 if ((dev
= __dev_get_by_index(&init_net
, nh
->nh_oif
)) == NULL
)
208 if (!(dev
->flags
&IFF_UP
))
212 nh
->nh_scope
= RT_SCOPE_LINK
;
/* Otherwise build a flow key for the gateway and resolve it through the FIB. */
216 memset(&fld
, 0, sizeof(fld
));
217 fld
.daddr
= nh
->nh_gw
;
218 fld
.flowidn_oif
= nh
->nh_oif
;
/* Lookup scope is rtm_scope + 1, raised to RT_SCOPE_LINK if it would be lower. */
219 fld
.flowidn_scope
= r
->rtm_scope
+ 1;
221 if (fld
.flowidn_scope
< RT_SCOPE_LINK
)
222 fld
.flowidn_scope
= RT_SCOPE_LINK
;
224 if ((err
= dn_fib_lookup(&fld
, &res
)) != 0)
/* Only unicast or local results are accepted as a route to the gateway. */
228 if (res
.type
!= RTN_UNICAST
&& res
.type
!= RTN_LOCAL
)
/* Copy scope, output interface and device from the lookup result. */
230 nh
->nh_scope
= res
.scope
;
231 nh
->nh_oif
= DN_FIB_RES_OIF(res
);
232 nh
->nh_dev
= DN_FIB_RES_DEV(res
);
233 if (nh
->nh_dev
== NULL
)
235 dev_hold(nh
->nh_dev
);
237 if (!(nh
->nh_dev
->flags
& IFF_UP
))
/* Release the lookup result. */
241 dn_fib_res_put(&res
);
/* Device-only nexthop path. */
244 struct net_device
*dev
;
246 if (nh
->nh_flags
&(RTNH_F_PERVASIVE
|RTNH_F_ONLINK
))
249 dev
= __dev_get_by_index(&init_net
, nh
->nh_oif
);
/* The device must exist and have DECnet state attached (dn_ptr). */
250 if (dev
== NULL
|| dev
->dn_ptr
== NULL
)
252 if (!(dev
->flags
&IFF_UP
))
/* NOTE(review): the assignment of nh->nh_dev before this hold is not visible here. */
255 dev_hold(nh
->nh_dev
);
256 nh
->nh_scope
= RT_SCOPE_HOST
;
/*
 * dn_fib_create_info - build a dn_fib_info from a parsed route request.
 * @r:     route message header
 * @attrs: parsed attribute table indexed by RTA_*
 * @nlh:   netlink message header
 * @errp:  out parameter for an error code
 *
 * Visible steps: validate type and scope against dn_fib_props, count the
 * multipath nexthops, allocate the entry with room for the nexthops, copy
 * protocol/flags/priority/metrics/prefsrc, populate and validate the
 * nexthops, reuse an equivalent existing entry if dn_fib_find_info() finds
 * one, otherwise link the new entry at the head of dn_fib_info_list.
 * NOTE(review): the error labels, the return statements and the
 * declarations of err, nhs, attr and rem are on lines not visible here.
 */
263 struct dn_fib_info
*dn_fib_create_info(const struct rtmsg
*r
, struct nlattr
*attrs
[],
264 const struct nlmsghdr
*nlh
, int *errp
)
267 struct dn_fib_info
*fi
= NULL
;
268 struct dn_fib_info
*ofi
;
/* rtm_type indexes dn_fib_props, so it is bounds-checked first. */
271 if (r
->rtm_type
> RTN_MAX
)
/* The requested scope is checked against the scope listed for this route type. */
274 if (dn_fib_props
[r
->rtm_type
].scope
> r
->rtm_scope
)
/* A multipath attribute that yields zero nexthops is singled out. */
277 if (attrs
[RTA_MULTIPATH
] &&
278 (nhs
= dn_fib_count_nhs(attrs
[RTA_MULTIPATH
])) == 0)
/* Zeroed allocation: the entry followed by nhs nexthop slots. */
281 fi
= kzalloc(sizeof(*fi
)+nhs
*sizeof(struct dn_fib_nh
), GFP_KERNEL
);
286 fi
->fib_protocol
= r
->rtm_protocol
;
288 fi
->fib_flags
= r
->rtm_flags
;
290 if (attrs
[RTA_PRIORITY
])
291 fi
->fib_priority
= nla_get_u32(attrs
[RTA_PRIORITY
]);
293 if (attrs
[RTA_METRICS
]) {
297 nla_for_each_nested(attr
, attrs
[RTA_METRICS
], rem
) {
298 int type
= nla_type(attr
);
/*
 * Metric types are 1-based; the array index is type-1.
 * NOTE(review): a guard against type == 0 is not visible in this excerpt -
 * confirm it exists, otherwise the index below would be -1.
 */
301 if (type
> RTAX_MAX
|| nla_len(attr
) < 4)
304 fi
->fib_metrics
[type
-1] = nla_get_u32(attr
);
309 if (attrs
[RTA_PREFSRC
])
310 fi
->fib_prefsrc
= nla_get_le16(attrs
[RTA_PREFSRC
]);
/* Multipath: fill the nexthops, then cross-check RTA_OIF/RTA_GATEWAY against the first one. */
312 if (attrs
[RTA_MULTIPATH
]) {
313 if ((err
= dn_fib_get_nhs(fi
, attrs
[RTA_MULTIPATH
], r
)) != 0)
316 if (attrs
[RTA_OIF
] &&
317 fi
->fib_nh
->nh_oif
!= nla_get_u32(attrs
[RTA_OIF
]))
320 if (attrs
[RTA_GATEWAY
] &&
321 fi
->fib_nh
->nh_gw
!= nla_get_le16(attrs
[RTA_GATEWAY
]))
/* Single nexthop taken directly from the top-level attributes. */
324 struct dn_fib_nh
*nh
= fi
->fib_nh
;
327 nh
->nh_oif
= nla_get_u32(attrs
[RTA_OIF
]);
329 if (attrs
[RTA_GATEWAY
])
330 nh
->nh_gw
= nla_get_le16(attrs
[RTA_GATEWAY
]);
332 nh
->nh_flags
= r
->rtm_flags
;
/* NAT routes: the test flags a missing gateway, nhs != 1, or a present RTA_OIF. */
336 if (r
->rtm_type
== RTN_NAT
) {
337 if (!attrs
[RTA_GATEWAY
] || nhs
!= 1 || attrs
[RTA_OIF
])
340 fi
->fib_nh
->nh_gw
= nla_get_le16(attrs
[RTA_GATEWAY
]);
/* Route types with a non-zero error entry: gateway, oif and multipath attributes are tested for. */
344 if (dn_fib_props
[r
->rtm_type
].error
) {
345 if (attrs
[RTA_GATEWAY
] || attrs
[RTA_OIF
] || attrs
[RTA_MULTIPATH
])
351 if (r
->rtm_scope
> RT_SCOPE_HOST
)
354 if (r
->rtm_scope
== RT_SCOPE_HOST
) {
355 struct dn_fib_nh
*nh
= fi
->fib_nh
;
357 /* Local address is added */
358 if (nhs
!= 1 || nh
->nh_gw
)
360 nh
->nh_scope
= RT_SCOPE_NOWHERE
;
/* Device looked up from nh_oif; the lookup result is stored in nh_dev. */
361 nh
->nh_dev
= dev_get_by_index(&init_net
, fi
->fib_nh
->nh_oif
);
363 if (nh
->nh_dev
== NULL
)
/* Every nexthop is validated and resolved by dn_fib_check_nh(). */
366 change_nexthops(fi
) {
367 if ((err
= dn_fib_check_nh(r
, fi
, nh
)) != 0)
369 } endfor_nexthops(fi
)
/* Preferred source: compared with RTA_DST for RTN_LOCAL routes, else checked with dnet_addr_type(). */
372 if (fi
->fib_prefsrc
) {
373 if (r
->rtm_type
!= RTN_LOCAL
|| !attrs
[RTA_DST
] ||
374 fi
->fib_prefsrc
!= nla_get_le16(attrs
[RTA_DST
]))
375 if (dnet_addr_type(fi
->fib_prefsrc
) != RTN_LOCAL
)
/* An equivalent entry already exists: the freshly built one is freed. */
380 if ((ofi
= dn_fib_find_info(fi
)) != NULL
) {
382 dn_fib_free_info(fi
);
/* New entry: take a client reference and push it on the head of the global list. */
388 atomic_inc(&fi
->fib_clntref
);
389 spin_lock(&dn_fib_info_lock
);
390 fi
->fib_next
= dn_fib_info_list
;
392 if (dn_fib_info_list
)
393 dn_fib_info_list
->fib_prev
= fi
;
394 dn_fib_info_list
= fi
;
395 spin_unlock(&dn_fib_info_lock
);
/* NOTE(review): presumably the failure path; the label is not visible here. */
405 dn_fib_free_info(fi
);
/*
 * dn_fib_semantic_match - match a flow against one dn_fib_info.
 * @type: route type, used to index dn_fib_props
 * @fi:   candidate entry
 * @fld:  flow key; flowidn_oif restricts the output interface when non-zero
 * @res:  result structure, reset via DN_FIB_RES_RESET() on the visible paths
 *
 * err starts as the error listed for @type. The entry is tested for
 * RTNH_F_DEAD, as is each nexthop; a nexthop is eligible when the flow has
 * no oif or the oif equals nh_oif. fib_clntref is incremented on the
 * visible success paths.
 * NOTE(review): the switch/loop structure, the stores into res and the
 * return statements are on lines not visible in this excerpt.
 */
411 int dn_fib_semantic_match(int type
, struct dn_fib_info
*fi
, const struct flowidn
*fld
, struct dn_fib_res
*res
)
413 int err
= dn_fib_props
[type
].error
;
416 if (fi
->fib_flags
& RTNH_F_DEAD
)
423 DN_FIB_RES_RESET(*res
);
424 atomic_inc(&fi
->fib_clntref
);
429 if (nh
->nh_flags
& RTNH_F_DEAD
)
/* A zero flowidn_oif matches any nexthop interface. */
431 if (!fld
->flowidn_oif
||
432 fld
->flowidn_oif
== nh
->nh_oif
)
/* nhsel below fib_nhs means the nexthop scan stopped on a usable entry. */
435 if (nhsel
< fi
->fib_nhs
) {
437 atomic_inc(&fi
->fib_clntref
);
444 net_err_ratelimited("DECnet: impossible routing event : dn_fib_semantic_match type=%d\n",
/*
 * dn_fib_select_multipath - pick one nexthop of a multipath route.
 * @fld: flow key
 * @res: lookup result; res->fi is the entry whose nexthops are weighed
 *
 * All work happens under dn_fib_multipath_lock (bottom halves disabled).
 * When fib_power is exhausted (<= 0) it is rebuilt as the sum of the
 * weights of the live nexthops, and each live nexthop gets nh_power reset
 * to its weight. A value w = jiffies % fib_power is then walked down
 * through the live nexthops with remaining power until it drops to <= 0.
 * NOTE(review): the stores into res, the power decrements and the early
 * returns are on lines not visible in this excerpt.
 */
453 void dn_fib_select_multipath(const struct flowidn
*fld
, struct dn_fib_res
*res
)
455 struct dn_fib_info
*fi
= res
->fi
;
458 spin_lock_bh(&dn_fib_multipath_lock
);
459 if (fi
->fib_power
<= 0) {
461 change_nexthops(fi
) {
462 if (!(nh
->nh_flags
&RTNH_F_DEAD
)) {
463 power
+= nh
->nh_weight
;
464 nh
->nh_power
= nh
->nh_weight
;
466 } endfor_nexthops(fi
);
467 fi
->fib_power
= power
;
/* NOTE(review): unlock on an early-exit path whose condition is not visible here. */
469 spin_unlock_bh(&dn_fib_multipath_lock
);
/* jiffies serves as the varying input for the weighted choice. */
475 w
= jiffies
% fi
->fib_power
;
477 change_nexthops(fi
) {
478 if (!(nh
->nh_flags
&RTNH_F_DEAD
) && nh
->nh_power
) {
479 if ((w
-= nh
->nh_power
) <= 0) {
483 spin_unlock_bh(&dn_fib_multipath_lock
);
487 } endfor_nexthops(fi
);
489 spin_unlock_bh(&dn_fib_multipath_lock
);
/*
 * rtm_get_table - choose the routing table id for a request.
 * @attrs: parsed attribute table
 * @table: table id from the message header (callers pass r->rtm_table)
 *
 * When an RTA_TABLE attribute is present its u32 value overrides @table.
 * NOTE(review): @table is declared u8 while the attribute is read with
 * nla_get_u32(), so values above 255 are narrowed on assignment even
 * though the function is declared to return u32 - confirm whether this
 * truncation is intended.
 */
492 static inline u32
rtm_get_table(struct nlattr
*attrs
[], u8 table
)
494 if (attrs
[RTA_TABLE
])
495 table
= nla_get_u32(attrs
[RTA_TABLE
]);
/*
 * dn_fib_rtm_delroute - RTM_DELROUTE handler (registered in dn_fib_init()).
 * @skb: request buffer; its socket supplies the network namespace
 * @nlh: netlink message header carrying a struct rtmsg
 *
 * Checks CAP_NET_ADMIN and that the namespace is init_net, parses the
 * attributes with rtm_dn_policy, looks up the table without creating it
 * (second argument 0) and hands the request to the table delete method.
 * NOTE(review): the error returns, including the handling of a NULL table,
 * are on lines not visible in this excerpt.
 */
500 static int dn_fib_rtm_delroute(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
502 struct net
*net
= sock_net(skb
->sk
);
503 struct dn_fib_table
*tb
;
504 struct rtmsg
*r
= nlmsg_data(nlh
);
505 struct nlattr
*attrs
[RTA_MAX
+1];
508 if (!netlink_capable(skb
, CAP_NET_ADMIN
))
511 if (!net_eq(net
, &init_net
))
514 err
= nlmsg_parse(nlh
, sizeof(*r
), attrs
, RTA_MAX
, rtm_dn_policy
);
518 tb
= dn_fib_get_table(rtm_get_table(attrs
, r
->rtm_table
), 0);
522 return tb
->delete(tb
, r
, attrs
, nlh
, &NETLINK_CB(skb
));
/*
 * dn_fib_rtm_newroute - RTM_NEWROUTE handler (registered in dn_fib_init()).
 * @skb: request buffer; its socket supplies the network namespace
 * @nlh: netlink message header carrying a struct rtmsg
 *
 * Mirrors dn_fib_rtm_delroute(): capability and namespace checks, attribute
 * parsing with rtm_dn_policy, then a table lookup with second argument 1
 * (where the delete handler passes 0), and finally the table insert method.
 * NOTE(review): the error returns are on lines not visible in this excerpt.
 */
525 static int dn_fib_rtm_newroute(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
527 struct net
*net
= sock_net(skb
->sk
);
528 struct dn_fib_table
*tb
;
529 struct rtmsg
*r
= nlmsg_data(nlh
);
530 struct nlattr
*attrs
[RTA_MAX
+1];
533 if (!netlink_capable(skb
, CAP_NET_ADMIN
))
536 if (!net_eq(net
, &init_net
))
539 err
= nlmsg_parse(nlh
, sizeof(*r
), attrs
, RTA_MAX
, rtm_dn_policy
);
543 tb
= dn_fib_get_table(rtm_get_table(attrs
, r
->rtm_table
), 1);
547 return tb
->insert(tb
, r
, attrs
, nlh
, &NETLINK_CB(skb
));
/*
 * fib_magic - add or delete a kernel-originated route for an interface address.
 * @cmd:     RTM_NEWROUTE selects insert, anything else selects delete
 * @type:    route type; RTN_UNICAST uses table RT_MIN_TABLE, all other
 *           types use RT_TABLE_LOCAL
 * @dst:     destination address
 * @dst_len: destination prefix length, stored in rtm_dst_len
 * @ifa:     interface address supplying prefsrc (ifa_local) and oif (ifindex)
 *
 * Builds a synthetic request (netlink header plus rtmsg) and an attribute
 * table pointing at locally built DST, PREFSRC and OIF attributes, then
 * calls the table insert or delete method with a NULL final argument.
 * NOTE(review): the declarations of req and the three attribute objects,
 * and any NULL check on tb, are on lines not visible in this excerpt.
 */
550 static void fib_magic(int cmd
, int type
, __le16 dst
, int dst_len
, struct dn_ifaddr
*ifa
)
552 struct dn_fib_table
*tb
;
567 .prefsrc
= ifa
->ifa_local
,
573 .oif
= ifa
->ifa_dev
->dev
->ifindex
,
575 struct nlattr
*attrs
[RTA_MAX
+1] = {
576 [RTA_DST
] = (struct nlattr
*) &dst_attr
,
577 [RTA_PREFSRC
] = (struct nlattr
* ) &prefsrc_attr
,
578 [RTA_OIF
] = (struct nlattr
*) &oif_attr
,
581 memset(&req
.rtm
, 0, sizeof(req
.rtm
));
/* Both lookups pass 1 as the second argument. */
583 if (type
== RTN_UNICAST
)
584 tb
= dn_fib_get_table(RT_MIN_TABLE
, 1);
586 tb
= dn_fib_get_table(RT_TABLE_LOCAL
, 1);
591 req
.nlh
.nlmsg_len
= sizeof(req
);
592 req
.nlh
.nlmsg_type
= cmd
;
593 req
.nlh
.nlmsg_flags
= NLM_F_REQUEST
|NLM_F_CREATE
|NLM_F_APPEND
;
594 req
.nlh
.nlmsg_pid
= 0;
595 req
.nlh
.nlmsg_seq
= 0;
597 req
.rtm
.rtm_dst_len
= dst_len
;
598 req
.rtm
.rtm_table
= tb
->n
;
599 req
.rtm
.rtm_protocol
= RTPROT_KERNEL
;
/* Local routes get host scope, everything else link scope. */
600 req
.rtm
.rtm_scope
= (type
!= RTN_LOCAL
? RT_SCOPE_LINK
: RT_SCOPE_HOST
);
601 req
.rtm
.rtm_type
= type
;
603 if (cmd
== RTM_NEWROUTE
)
604 tb
->insert(tb
, &req
.rtm
, attrs
, &req
.nlh
, NULL
);
606 tb
->delete(tb
, &req
.rtm
, attrs
, &req
.nlh
, NULL
);
/*
 * dn_fib_add_ifaddr - install the local route for a new interface address.
 * @ifa: address being added
 *
 * Inserts an RTN_LOCAL route for ifa->ifa_local with prefix length 16 via
 * fib_magic(), then tests whether the device is up.
 * NOTE(review): the declaration of dev and the action taken when the
 * device is down are on lines not visible in this excerpt.
 */
609 static void dn_fib_add_ifaddr(struct dn_ifaddr
*ifa
)
612 fib_magic(RTM_NEWROUTE
, RTN_LOCAL
, ifa
->ifa_local
, 16, ifa
);
615 if (!(dev
->flags
&IFF_UP
))
617 /* In the future, we will want to add default routes here */
/*
 * dn_fib_del_ifaddr - remove the local route for a deleted interface address.
 * @ifa: address being removed
 *
 * Scans every device in init_net (RCU iteration) and each address on its
 * DECnet address list for an entry with the same ifa_local. The local
 * route is deleted through fib_magic(); afterwards, if the address is no
 * longer classified RTN_LOCAL, routes using it as preferred source are
 * marked down through dn_fib_sync_down().
 * NOTE(review): what a match in the scan sets, the condition guarding the
 * fib_magic() call, the RCU lock/unlock calls and the action on a non-zero
 * dn_fib_sync_down() result are on lines not visible in this excerpt.
 */
622 static void dn_fib_del_ifaddr(struct dn_ifaddr
*ifa
)
625 struct net_device
*dev
;
626 struct dn_dev
*dn_db
;
627 struct dn_ifaddr
*ifa2
;
631 /* Scan device list */
633 for_each_netdev_rcu(&init_net
, dev
) {
634 dn_db
= rcu_dereference(dev
->dn_ptr
);
637 for (ifa2
= rcu_dereference(dn_db
->ifa_list
);
639 ifa2
= rcu_dereference(ifa2
->ifa_next
)) {
640 if (ifa2
->ifa_local
== ifa
->ifa_local
) {
649 fib_magic(RTM_DELROUTE
, RTN_LOCAL
, ifa
->ifa_local
, 16, ifa
);
651 if (dnet_addr_type(ifa
->ifa_local
) != RTN_LOCAL
) {
652 if (dn_fib_sync_down(ifa
->ifa_local
, NULL
, 0))
/*
 * dn_fib_disable_addr - take down routing state tied to a device.
 * @dev:   device losing its addresses
 * @force: passed through to dn_fib_sync_down()
 *
 * Marks nexthops through @dev as dead, flushes the route cache and calls
 * neigh_ifdown() on the DECnet neighbour table for the device.
 * NOTE(review): the statement governed by the if below is not visible in
 * this excerpt, so which calls are conditional cannot be determined here.
 */
658 static void dn_fib_disable_addr(struct net_device
*dev
, int force
)
660 if (dn_fib_sync_down(0, dev
, force
))
662 dn_rt_cache_flush(0);
663 neigh_ifdown(&dn_neigh_table
, dev
);
/*
 * dn_fib_dnaddr_event - notifier callback for DECnet address changes.
 * @this:  notifier block
 * @event: event code
 * @ptr:   the struct dn_ifaddr the event refers to
 *
 * Two handling sequences are visible. One adds the local route, revives
 * nexthops on the device (dn_fib_sync_up) and flushes the route cache. The
 * other removes the local route, and when the device has no addresses left
 * (ifa_list == NULL) disables it with force = 1; a cache flush follows.
 * NOTE(review): the case labels selecting between the two sequences and
 * the return value are on lines not visible in this excerpt.
 */
666 static int dn_fib_dnaddr_event(struct notifier_block
*this, unsigned long event
, void *ptr
)
668 struct dn_ifaddr
*ifa
= (struct dn_ifaddr
*)ptr
;
672 dn_fib_add_ifaddr(ifa
);
673 dn_fib_sync_up(ifa
->ifa_dev
->dev
);
674 dn_rt_cache_flush(-1);
677 dn_fib_del_ifaddr(ifa
);
678 if (ifa
->ifa_dev
&& ifa
->ifa_dev
->ifa_list
== NULL
) {
679 dn_fib_disable_addr(ifa
->ifa_dev
->dev
, 1);
681 dn_rt_cache_flush(-1);
/*
 * dn_fib_sync_down - mark routes dead after an address or device goes away.
 * @local: local address being removed, or 0
 * @dev:   device going down, or NULL
 * @force: caller-supplied flag (see dn_fib_disable_addr)
 *
 * For each entry: if @local is set and equals fib_prefsrc, the whole entry
 * is flagged RTNH_F_DEAD. Otherwise, when @dev is set and the entry has
 * nexthops, each live nexthop on @dev whose scope differs from the local
 * scope variable is flagged dead under dn_fib_multipath_lock and its
 * nh_power is subtracted from fib_power. When the dead count equals
 * fib_nhs the entry itself is flagged dead. Callers test the return value
 * for non-zero.
 * NOTE(review): the entry iteration header, the use of @force, the
 * counting of dead nexthops and the return value are on lines not visible
 * in this excerpt.
 */
688 static int dn_fib_sync_down(__le16 local
, struct net_device
*dev
, int force
)
691 int scope
= RT_SCOPE_NOWHERE
;
698 * This makes no sense for DECnet.... we will almost
699 * certainly have more than one local address the same
700 * over all our interfaces. It needs thinking about
703 if (local
&& fi
->fib_prefsrc
== local
) {
704 fi
->fib_flags
|= RTNH_F_DEAD
;
706 } else if (dev
&& fi
->fib_nhs
) {
709 change_nexthops(fi
) {
710 if (nh
->nh_flags
&RTNH_F_DEAD
)
712 else if (nh
->nh_dev
== dev
&&
713 nh
->nh_scope
!= scope
) {
714 spin_lock_bh(&dn_fib_multipath_lock
);
715 nh
->nh_flags
|= RTNH_F_DEAD
;
716 fi
->fib_power
-= nh
->nh_power
;
718 spin_unlock_bh(&dn_fib_multipath_lock
);
721 } endfor_nexthops(fi
)
/* All nexthops dead means the entry as a whole is dead. */
722 if (dead
== fi
->fib_nhs
) {
723 fi
->fib_flags
|= RTNH_F_DEAD
;
/*
 * dn_fib_sync_up - revive nexthops that use a device which came up.
 * @dev: device that is now available
 *
 * Does its work only for a device with IFF_UP set. For each nexthop, the
 * visible tests look at: whether it is already alive, whether it has a
 * device that is up, and whether that device is @dev with DECnet state
 * (dn_ptr). RTNH_F_DEAD is cleared on the nexthop under
 * dn_fib_multipath_lock, and later cleared on the entry itself.
 * NOTE(review): the entry iteration header, the continue statements, the
 * alive counter and the return value are on lines not visible in this
 * excerpt.
 */
732 static int dn_fib_sync_up(struct net_device
*dev
)
736 if (!(dev
->flags
&IFF_UP
))
742 change_nexthops(fi
) {
743 if (!(nh
->nh_flags
&RTNH_F_DEAD
)) {
747 if (nh
->nh_dev
== NULL
|| !(nh
->nh_dev
->flags
&IFF_UP
))
749 if (nh
->nh_dev
!= dev
|| dev
->dn_ptr
== NULL
)
752 spin_lock_bh(&dn_fib_multipath_lock
);
754 nh
->nh_flags
&= ~RTNH_F_DEAD
;
755 spin_unlock_bh(&dn_fib_multipath_lock
);
756 } endfor_nexthops(fi
);
759 fi
->fib_flags
&= ~RTNH_F_DEAD
;
/*
 * Notifier block routing DECnet address events to dn_fib_dnaddr_event();
 * registered in dn_fib_init() and unregistered in dn_fib_cleanup().
 */
766 static struct notifier_block dn_fib_dnaddr_notifier
= {
767 .notifier_call
= dn_fib_dnaddr_event
,
/*
 * dn_fib_cleanup - module exit hook for the DECnet FIB.
 * Runs the table and rule cleanup routines, then unregisters the address
 * notifier.
 */
770 void __exit
dn_fib_cleanup(void)
772 dn_fib_table_cleanup();
773 dn_fib_rules_cleanup();
775 unregister_dnaddr_notifier(&dn_fib_dnaddr_notifier
);
/*
 * dn_fib_init - module init hook for the DECnet FIB.
 * Registers the address notifier and the PF_DECnet rtnetlink handlers for
 * RTM_NEWROUTE and RTM_DELROUTE (the remaining two callback arguments are
 * NULL).
 * NOTE(review): lines between the function header and the notifier
 * registration are not visible in this excerpt.
 */
779 void __init
dn_fib_init(void)
784 register_dnaddr_notifier(&dn_fib_dnaddr_notifier
);
786 rtnl_register(PF_DECnet
, RTM_NEWROUTE
, dn_fib_rtm_newroute
, NULL
, NULL
);
787 rtnl_register(PF_DECnet
, RTM_DELROUTE
, dn_fib_rtm_delroute
, NULL
, NULL
);