]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - net/ipv4/fib_frontend.c
netlink: add netlink_kernel_cfg parameter to netlink_kernel_create
[mirror_ubuntu-artful-kernel.git] / net / ipv4 / fib_frontend.c
CommitLineData
1da177e4
LT
1/*
2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
5 *
6 * IPv4 Forwarding Information Base: FIB frontend.
7 *
1da177e4
LT
8 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
9 *
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
14 */
15
1da177e4
LT
16#include <linux/module.h>
17#include <asm/uaccess.h>
1da177e4 18#include <linux/bitops.h>
4fc268d2 19#include <linux/capability.h>
1da177e4
LT
20#include <linux/types.h>
21#include <linux/kernel.h>
1da177e4
LT
22#include <linux/mm.h>
23#include <linux/string.h>
24#include <linux/socket.h>
25#include <linux/sockios.h>
26#include <linux/errno.h>
27#include <linux/in.h>
28#include <linux/inet.h>
14c85021 29#include <linux/inetdevice.h>
1da177e4 30#include <linux/netdevice.h>
1823730f 31#include <linux/if_addr.h>
1da177e4
LT
32#include <linux/if_arp.h>
33#include <linux/skbuff.h>
7a9bc9b8 34#include <linux/cache.h>
1da177e4 35#include <linux/init.h>
1af5a8c4 36#include <linux/list.h>
5a0e3ad6 37#include <linux/slab.h>
1da177e4
LT
38
39#include <net/ip.h>
40#include <net/protocol.h>
41#include <net/route.h>
42#include <net/tcp.h>
43#include <net/sock.h>
1da177e4
LT
44#include <net/arp.h>
45#include <net/ip_fib.h>
63f3444f 46#include <net/rtnetlink.h>
990078af 47#include <net/xfrm.h>
1da177e4 48
1da177e4
LT
49#ifndef CONFIG_IP_MULTIPLE_TABLES
50
7b1a74fd 51static int __net_init fib4_rules_init(struct net *net)
c3e9a353 52{
93456b6d
DL
53 struct fib_table *local_table, *main_table;
54
5348ba85 55 local_table = fib_trie_table(RT_TABLE_LOCAL);
93456b6d 56 if (local_table == NULL)
dbb50165
DL
57 return -ENOMEM;
58
5348ba85 59 main_table = fib_trie_table(RT_TABLE_MAIN);
93456b6d 60 if (main_table == NULL)
dbb50165
DL
61 goto fail;
62
93456b6d 63 hlist_add_head_rcu(&local_table->tb_hlist,
e4aef8ae 64 &net->ipv4.fib_table_hash[TABLE_LOCAL_INDEX]);
93456b6d 65 hlist_add_head_rcu(&main_table->tb_hlist,
e4aef8ae 66 &net->ipv4.fib_table_hash[TABLE_MAIN_INDEX]);
dbb50165
DL
67 return 0;
68
69fail:
93456b6d 70 kfree(local_table);
dbb50165 71 return -ENOMEM;
c3e9a353 72}
1af5a8c4 73#else
1da177e4 74
8ad4942c 75struct fib_table *fib_new_table(struct net *net, u32 id)
1da177e4
LT
76{
77 struct fib_table *tb;
1af5a8c4 78 unsigned int h;
1da177e4 79
1af5a8c4
PM
80 if (id == 0)
81 id = RT_TABLE_MAIN;
8ad4942c 82 tb = fib_get_table(net, id);
1af5a8c4
PM
83 if (tb)
84 return tb;
7f9b8052 85
5348ba85 86 tb = fib_trie_table(id);
1da177e4
LT
87 if (!tb)
88 return NULL;
1af5a8c4 89 h = id & (FIB_TABLE_HASHSZ - 1);
e4aef8ae 90 hlist_add_head_rcu(&tb->tb_hlist, &net->ipv4.fib_table_hash[h]);
1da177e4
LT
91 return tb;
92}
93
8ad4942c 94struct fib_table *fib_get_table(struct net *net, u32 id)
1af5a8c4
PM
95{
96 struct fib_table *tb;
97 struct hlist_node *node;
e4aef8ae 98 struct hlist_head *head;
1af5a8c4 99 unsigned int h;
1da177e4 100
1af5a8c4
PM
101 if (id == 0)
102 id = RT_TABLE_MAIN;
103 h = id & (FIB_TABLE_HASHSZ - 1);
e4aef8ae 104
1af5a8c4 105 rcu_read_lock();
e4aef8ae
DL
106 head = &net->ipv4.fib_table_hash[h];
107 hlist_for_each_entry_rcu(tb, node, head, tb_hlist) {
1af5a8c4
PM
108 if (tb->tb_id == id) {
109 rcu_read_unlock();
110 return tb;
111 }
112 }
113 rcu_read_unlock();
114 return NULL;
115}
1da177e4
LT
116#endif /* CONFIG_IP_MULTIPLE_TABLES */
117
e4aef8ae 118static void fib_flush(struct net *net)
1da177e4
LT
119{
120 int flushed = 0;
1da177e4 121 struct fib_table *tb;
1af5a8c4 122 struct hlist_node *node;
e4aef8ae 123 struct hlist_head *head;
1af5a8c4 124 unsigned int h;
1da177e4 125
1af5a8c4 126 for (h = 0; h < FIB_TABLE_HASHSZ; h++) {
e4aef8ae
DL
127 head = &net->ipv4.fib_table_hash[h];
128 hlist_for_each_entry(tb, node, head, tb_hlist)
16c6cf8b 129 flushed += fib_table_flush(tb);
1da177e4 130 }
1da177e4
LT
131
132 if (flushed)
76e6ebfb 133 rt_cache_flush(net, -1);
1da177e4
LT
134}
135
05538116
LAT
136/*
137 * Find address type as if only "dev" was present in the system. If
138 * on_dev is NULL then all interfaces are taken into consideration.
139 */
95c96174
ED
140static inline unsigned int __inet_dev_addr_type(struct net *net,
141 const struct net_device *dev,
142 __be32 addr)
1da177e4 143{
9ade2286 144 struct flowi4 fl4 = { .daddr = addr };
1da177e4 145 struct fib_result res;
95c96174 146 unsigned int ret = RTN_BROADCAST;
03cf786c 147 struct fib_table *local_table;
1da177e4 148
1e637c74 149 if (ipv4_is_zeronet(addr) || ipv4_is_lbcast(addr))
1da177e4 150 return RTN_BROADCAST;
f97c1e0c 151 if (ipv4_is_multicast(addr))
1da177e4
LT
152 return RTN_MULTICAST;
153
154#ifdef CONFIG_IP_MULTIPLE_TABLES
155 res.r = NULL;
156#endif
e905a9ed 157
6b175b26 158 local_table = fib_get_table(net, RT_TABLE_LOCAL);
03cf786c 159 if (local_table) {
1da177e4 160 ret = RTN_UNICAST;
ebc0ffae 161 rcu_read_lock();
9ade2286 162 if (!fib_table_lookup(local_table, &fl4, &res, FIB_LOOKUP_NOREF)) {
05538116
LAT
163 if (!dev || dev == res.fi->fib_dev)
164 ret = res.type;
1da177e4 165 }
ebc0ffae 166 rcu_read_unlock();
1da177e4
LT
167 }
168 return ret;
169}
170
6b175b26 171unsigned int inet_addr_type(struct net *net, __be32 addr)
05538116 172{
6b175b26 173 return __inet_dev_addr_type(net, NULL, addr);
05538116 174}
4bc2f18b 175EXPORT_SYMBOL(inet_addr_type);
05538116 176
6b175b26
EB
177unsigned int inet_dev_addr_type(struct net *net, const struct net_device *dev,
178 __be32 addr)
05538116 179{
6a31d2a9 180 return __inet_dev_addr_type(net, dev, addr);
05538116 181}
4bc2f18b 182EXPORT_SYMBOL(inet_dev_addr_type);
05538116 183
35ebf65e
DM
184__be32 fib_compute_spec_dst(struct sk_buff *skb)
185{
186 struct net_device *dev = skb->dev;
187 struct in_device *in_dev;
188 struct fib_result res;
a207a4b2 189 struct rtable *rt;
35ebf65e
DM
190 struct flowi4 fl4;
191 struct net *net;
a207a4b2 192 int scope;
35ebf65e 193
a207a4b2
DM
194 rt = skb_rtable(skb);
195 if (!(rt->rt_flags & (RTCF_BROADCAST | RTCF_MULTICAST)))
35ebf65e
DM
196 return ip_hdr(skb)->daddr;
197
198 in_dev = __in_dev_get_rcu(dev);
199 BUG_ON(!in_dev);
35ebf65e
DM
200
201 net = dev_net(dev);
a207a4b2
DM
202
203 scope = RT_SCOPE_UNIVERSE;
204 if (!ipv4_is_zeronet(ip_hdr(skb)->saddr)) {
205 fl4.flowi4_oif = 0;
206 fl4.flowi4_iif = net->loopback_dev->ifindex;
207 fl4.daddr = ip_hdr(skb)->saddr;
208 fl4.saddr = 0;
209 fl4.flowi4_tos = RT_TOS(ip_hdr(skb)->tos);
210 fl4.flowi4_scope = scope;
211 fl4.flowi4_mark = IN_DEV_SRC_VMARK(in_dev) ? skb->mark : 0;
212 if (!fib_lookup(net, &fl4, &res))
213 return FIB_RES_PREFSRC(net, res);
214 } else {
215 scope = RT_SCOPE_LINK;
216 }
217
218 return inet_select_addr(dev, ip_hdr(skb)->saddr, scope);
35ebf65e
DM
219}
220
7a9bc9b8
DM
#ifdef CONFIG_IP_ROUTE_CLASSID
/*
 * Read by fib_validate_source(): while this is zero and rp_filter is off,
 * source validation is skipped entirely.
 */
int fib_num_tclassid_users __read_mostly;
#endif
224
1da177e4 225/* Given (packet source, input interface) and optional (dst, oif, tos):
6a31d2a9
ED
226 * - (main) check, that source is valid i.e. not broadcast or our local
227 * address.
228 * - figure out what "logical" interface this packet arrived
229 * and calculate "specific destination" address.
230 * - check, that packet arrived from expected physical interface.
ebc0ffae 231 * called with rcu_read_lock()
1da177e4 232 */
7a9bc9b8
DM
233static int __fib_validate_source(struct sk_buff *skb, __be32 src, __be32 dst,
234 u8 tos, int oif, struct net_device *dev,
235 int rpf, struct in_device *idev, u32 *itag)
1da177e4 236{
7a9bc9b8 237 int ret, no_addr, accept_local;
1da177e4 238 struct fib_result res;
9e56e380 239 struct flowi4 fl4;
5b707aaa 240 struct net *net;
9e56e380 241 bool dev_match;
1da177e4 242
9ade2286
DM
243 fl4.flowi4_oif = 0;
244 fl4.flowi4_iif = oif;
9ade2286
DM
245 fl4.daddr = src;
246 fl4.saddr = dst;
247 fl4.flowi4_tos = tos;
248 fl4.flowi4_scope = RT_SCOPE_UNIVERSE;
cc7e17ea 249
7a9bc9b8 250 no_addr = accept_local = 0;
9e56e380 251 no_addr = idev->ifa_list == NULL;
990078af 252
9e56e380
DM
253 accept_local = IN_DEV_ACCEPT_LOCAL(idev);
254 fl4.flowi4_mark = IN_DEV_SRC_VMARK(idev) ? skb->mark : 0;
1da177e4 255
c346dca1 256 net = dev_net(dev);
9ade2286 257 if (fib_lookup(net, &fl4, &res))
1da177e4 258 goto last_resort;
8153a10c
PM
259 if (res.type != RTN_UNICAST) {
260 if (res.type != RTN_LOCAL || !accept_local)
ebc0ffae 261 goto e_inval;
8153a10c 262 }
1da177e4 263 fib_combine_itag(itag, &res);
6f86b325
DM
264 dev_match = false;
265
1da177e4 266#ifdef CONFIG_IP_ROUTE_MULTIPATH
6f86b325
DM
267 for (ret = 0; ret < res.fi->fib_nhs; ret++) {
268 struct fib_nh *nh = &res.fi->fib_nh[ret];
269
270 if (nh->nh_dev == dev) {
271 dev_match = true;
272 break;
273 }
274 }
1da177e4
LT
275#else
276 if (FIB_RES_DEV(res) == dev)
6f86b325 277 dev_match = true;
1da177e4 278#endif
6f86b325 279 if (dev_match) {
1da177e4 280 ret = FIB_RES_NH(res).nh_scope >= RT_SCOPE_HOST;
1da177e4
LT
281 return ret;
282 }
1da177e4
LT
283 if (no_addr)
284 goto last_resort;
c1cf8422 285 if (rpf == 1)
b5f7e755 286 goto e_rpf;
9ade2286 287 fl4.flowi4_oif = dev->ifindex;
1da177e4
LT
288
289 ret = 0;
9ade2286 290 if (fib_lookup(net, &fl4, &res) == 0) {
41347dcd 291 if (res.type == RTN_UNICAST)
1da177e4 292 ret = FIB_RES_NH(res).nh_scope >= RT_SCOPE_HOST;
1da177e4
LT
293 }
294 return ret;
295
296last_resort:
297 if (rpf)
b5f7e755 298 goto e_rpf;
1da177e4
LT
299 *itag = 0;
300 return 0;
301
1da177e4
LT
302e_inval:
303 return -EINVAL;
b5f7e755
ED
304e_rpf:
305 return -EXDEV;
1da177e4
LT
306}
307
7a9bc9b8
DM
308/* Ignore rp_filter for packets protected by IPsec. */
309int fib_validate_source(struct sk_buff *skb, __be32 src, __be32 dst,
310 u8 tos, int oif, struct net_device *dev,
311 struct in_device *idev, u32 *itag)
312{
313 int r = secpath_exists(skb) ? 0 : IN_DEV_RPFILTER(idev);
314
315 if (!r && !fib_num_tclassid_users) {
316 *itag = 0;
317 return 0;
318 }
319 return __fib_validate_source(skb, src, dst, tos, oif, dev, r, idev, itag);
320}
321
81f7bf6c 322static inline __be32 sk_extract_addr(struct sockaddr *addr)
4e902c57
TG
323{
324 return ((struct sockaddr_in *) addr)->sin_addr.s_addr;
325}
326
327static int put_rtax(struct nlattr *mx, int len, int type, u32 value)
328{
329 struct nlattr *nla;
330
331 nla = (struct nlattr *) ((char *) mx + len);
332 nla->nla_type = type;
333 nla->nla_len = nla_attr_size(4);
334 *(u32 *) nla_data(nla) = value;
335
336 return len + nla_total_size(4);
337}
338
4b5d47d4 339static int rtentry_to_fib_config(struct net *net, int cmd, struct rtentry *rt,
4e902c57
TG
340 struct fib_config *cfg)
341{
6d85c10a 342 __be32 addr;
4e902c57
TG
343 int plen;
344
345 memset(cfg, 0, sizeof(*cfg));
4b5d47d4 346 cfg->fc_nlinfo.nl_net = net;
4e902c57
TG
347
348 if (rt->rt_dst.sa_family != AF_INET)
349 return -EAFNOSUPPORT;
350
351 /*
352 * Check mask for validity:
353 * a) it must be contiguous.
354 * b) destination must have all host bits clear.
355 * c) if application forgot to set correct family (AF_INET),
356 * reject request unless it is absolutely clear i.e.
357 * both family and mask are zero.
358 */
359 plen = 32;
360 addr = sk_extract_addr(&rt->rt_dst);
361 if (!(rt->rt_flags & RTF_HOST)) {
81f7bf6c 362 __be32 mask = sk_extract_addr(&rt->rt_genmask);
4e902c57
TG
363
364 if (rt->rt_genmask.sa_family != AF_INET) {
365 if (mask || rt->rt_genmask.sa_family)
366 return -EAFNOSUPPORT;
367 }
368
369 if (bad_mask(mask, addr))
370 return -EINVAL;
371
372 plen = inet_mask_len(mask);
373 }
374
375 cfg->fc_dst_len = plen;
376 cfg->fc_dst = addr;
377
378 if (cmd != SIOCDELRT) {
379 cfg->fc_nlflags = NLM_F_CREATE;
380 cfg->fc_protocol = RTPROT_BOOT;
381 }
382
383 if (rt->rt_metric)
384 cfg->fc_priority = rt->rt_metric - 1;
385
386 if (rt->rt_flags & RTF_REJECT) {
387 cfg->fc_scope = RT_SCOPE_HOST;
388 cfg->fc_type = RTN_UNREACHABLE;
389 return 0;
390 }
391
392 cfg->fc_scope = RT_SCOPE_NOWHERE;
393 cfg->fc_type = RTN_UNICAST;
394
395 if (rt->rt_dev) {
396 char *colon;
397 struct net_device *dev;
398 char devname[IFNAMSIZ];
399
400 if (copy_from_user(devname, rt->rt_dev, IFNAMSIZ-1))
401 return -EFAULT;
402
403 devname[IFNAMSIZ-1] = 0;
404 colon = strchr(devname, ':');
405 if (colon)
406 *colon = 0;
4b5d47d4 407 dev = __dev_get_by_name(net, devname);
4e902c57
TG
408 if (!dev)
409 return -ENODEV;
410 cfg->fc_oif = dev->ifindex;
411 if (colon) {
412 struct in_ifaddr *ifa;
413 struct in_device *in_dev = __in_dev_get_rtnl(dev);
414 if (!in_dev)
415 return -ENODEV;
416 *colon = ':';
417 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next)
418 if (strcmp(ifa->ifa_label, devname) == 0)
419 break;
420 if (ifa == NULL)
421 return -ENODEV;
422 cfg->fc_prefsrc = ifa->ifa_local;
423 }
424 }
425
426 addr = sk_extract_addr(&rt->rt_gateway);
427 if (rt->rt_gateway.sa_family == AF_INET && addr) {
428 cfg->fc_gw = addr;
429 if (rt->rt_flags & RTF_GATEWAY &&
4b5d47d4 430 inet_addr_type(net, addr) == RTN_UNICAST)
4e902c57
TG
431 cfg->fc_scope = RT_SCOPE_UNIVERSE;
432 }
433
434 if (cmd == SIOCDELRT)
435 return 0;
436
437 if (rt->rt_flags & RTF_GATEWAY && !cfg->fc_gw)
438 return -EINVAL;
439
440 if (cfg->fc_scope == RT_SCOPE_NOWHERE)
441 cfg->fc_scope = RT_SCOPE_LINK;
442
443 if (rt->rt_flags & (RTF_MTU | RTF_WINDOW | RTF_IRTT)) {
444 struct nlattr *mx;
445 int len = 0;
446
447 mx = kzalloc(3 * nla_total_size(4), GFP_KERNEL);
e905a9ed 448 if (mx == NULL)
4e902c57
TG
449 return -ENOMEM;
450
451 if (rt->rt_flags & RTF_MTU)
452 len = put_rtax(mx, len, RTAX_ADVMSS, rt->rt_mtu - 40);
453
454 if (rt->rt_flags & RTF_WINDOW)
455 len = put_rtax(mx, len, RTAX_WINDOW, rt->rt_window);
456
457 if (rt->rt_flags & RTF_IRTT)
458 len = put_rtax(mx, len, RTAX_RTT, rt->rt_irtt << 3);
459
460 cfg->fc_mx = mx;
461 cfg->fc_mx_len = len;
462 }
463
464 return 0;
465}
466
1da177e4 467/*
6a31d2a9
ED
468 * Handle IP routing ioctl calls.
469 * These are used to manipulate the routing tables
1da177e4 470 */
1bad118a 471int ip_rt_ioctl(struct net *net, unsigned int cmd, void __user *arg)
1da177e4 472{
4e902c57
TG
473 struct fib_config cfg;
474 struct rtentry rt;
1da177e4 475 int err;
1da177e4
LT
476
477 switch (cmd) {
478 case SIOCADDRT: /* Add a route */
479 case SIOCDELRT: /* Delete a route */
480 if (!capable(CAP_NET_ADMIN))
481 return -EPERM;
4e902c57
TG
482
483 if (copy_from_user(&rt, arg, sizeof(rt)))
1da177e4 484 return -EFAULT;
4e902c57 485
1da177e4 486 rtnl_lock();
1bad118a 487 err = rtentry_to_fib_config(net, cmd, &rt, &cfg);
1da177e4 488 if (err == 0) {
4e902c57
TG
489 struct fib_table *tb;
490
1da177e4 491 if (cmd == SIOCDELRT) {
1bad118a 492 tb = fib_get_table(net, cfg.fc_table);
1da177e4 493 if (tb)
16c6cf8b 494 err = fib_table_delete(tb, &cfg);
4e902c57
TG
495 else
496 err = -ESRCH;
1da177e4 497 } else {
1bad118a 498 tb = fib_new_table(net, cfg.fc_table);
1da177e4 499 if (tb)
16c6cf8b 500 err = fib_table_insert(tb, &cfg);
4e902c57
TG
501 else
502 err = -ENOBUFS;
1da177e4 503 }
4e902c57
TG
504
505 /* allocated by rtentry_to_fib_config() */
506 kfree(cfg.fc_mx);
1da177e4
LT
507 }
508 rtnl_unlock();
509 return err;
510 }
511 return -EINVAL;
512}
513
6a31d2a9 514const struct nla_policy rtm_ipv4_policy[RTA_MAX + 1] = {
4e902c57
TG
515 [RTA_DST] = { .type = NLA_U32 },
516 [RTA_SRC] = { .type = NLA_U32 },
517 [RTA_IIF] = { .type = NLA_U32 },
518 [RTA_OIF] = { .type = NLA_U32 },
519 [RTA_GATEWAY] = { .type = NLA_U32 },
520 [RTA_PRIORITY] = { .type = NLA_U32 },
521 [RTA_PREFSRC] = { .type = NLA_U32 },
522 [RTA_METRICS] = { .type = NLA_NESTED },
5176f91e 523 [RTA_MULTIPATH] = { .len = sizeof(struct rtnexthop) },
4e902c57 524 [RTA_FLOW] = { .type = NLA_U32 },
4e902c57
TG
525};
526
4b5d47d4 527static int rtm_to_fib_config(struct net *net, struct sk_buff *skb,
6a31d2a9 528 struct nlmsghdr *nlh, struct fib_config *cfg)
1da177e4 529{
4e902c57
TG
530 struct nlattr *attr;
531 int err, remaining;
532 struct rtmsg *rtm;
533
534 err = nlmsg_validate(nlh, sizeof(*rtm), RTA_MAX, rtm_ipv4_policy);
535 if (err < 0)
536 goto errout;
537
538 memset(cfg, 0, sizeof(*cfg));
539
540 rtm = nlmsg_data(nlh);
4e902c57 541 cfg->fc_dst_len = rtm->rtm_dst_len;
4e902c57
TG
542 cfg->fc_tos = rtm->rtm_tos;
543 cfg->fc_table = rtm->rtm_table;
544 cfg->fc_protocol = rtm->rtm_protocol;
545 cfg->fc_scope = rtm->rtm_scope;
546 cfg->fc_type = rtm->rtm_type;
547 cfg->fc_flags = rtm->rtm_flags;
548 cfg->fc_nlflags = nlh->nlmsg_flags;
549
550 cfg->fc_nlinfo.pid = NETLINK_CB(skb).pid;
551 cfg->fc_nlinfo.nlh = nlh;
4b5d47d4 552 cfg->fc_nlinfo.nl_net = net;
4e902c57 553
a0ee18b9
TG
554 if (cfg->fc_type > RTN_MAX) {
555 err = -EINVAL;
556 goto errout;
557 }
558
4e902c57 559 nlmsg_for_each_attr(attr, nlh, sizeof(struct rtmsg), remaining) {
8f4c1f9b 560 switch (nla_type(attr)) {
4e902c57 561 case RTA_DST:
17fb2c64 562 cfg->fc_dst = nla_get_be32(attr);
4e902c57 563 break;
4e902c57
TG
564 case RTA_OIF:
565 cfg->fc_oif = nla_get_u32(attr);
566 break;
567 case RTA_GATEWAY:
17fb2c64 568 cfg->fc_gw = nla_get_be32(attr);
4e902c57
TG
569 break;
570 case RTA_PRIORITY:
571 cfg->fc_priority = nla_get_u32(attr);
572 break;
573 case RTA_PREFSRC:
17fb2c64 574 cfg->fc_prefsrc = nla_get_be32(attr);
4e902c57
TG
575 break;
576 case RTA_METRICS:
577 cfg->fc_mx = nla_data(attr);
578 cfg->fc_mx_len = nla_len(attr);
579 break;
580 case RTA_MULTIPATH:
581 cfg->fc_mp = nla_data(attr);
582 cfg->fc_mp_len = nla_len(attr);
583 break;
584 case RTA_FLOW:
585 cfg->fc_flow = nla_get_u32(attr);
586 break;
4e902c57
TG
587 case RTA_TABLE:
588 cfg->fc_table = nla_get_u32(attr);
589 break;
1da177e4
LT
590 }
591 }
4e902c57 592
1da177e4 593 return 0;
4e902c57
TG
594errout:
595 return err;
1da177e4
LT
596}
597
6ed2533e 598static int inet_rtm_delroute(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1da177e4 599{
3b1e0a65 600 struct net *net = sock_net(skb->sk);
4e902c57
TG
601 struct fib_config cfg;
602 struct fib_table *tb;
603 int err;
1da177e4 604
4b5d47d4 605 err = rtm_to_fib_config(net, skb, nlh, &cfg);
4e902c57
TG
606 if (err < 0)
607 goto errout;
1da177e4 608
8ad4942c 609 tb = fib_get_table(net, cfg.fc_table);
4e902c57
TG
610 if (tb == NULL) {
611 err = -ESRCH;
612 goto errout;
613 }
614
16c6cf8b 615 err = fib_table_delete(tb, &cfg);
4e902c57
TG
616errout:
617 return err;
1da177e4
LT
618}
619
6ed2533e 620static int inet_rtm_newroute(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1da177e4 621{
3b1e0a65 622 struct net *net = sock_net(skb->sk);
4e902c57
TG
623 struct fib_config cfg;
624 struct fib_table *tb;
625 int err;
1da177e4 626
4b5d47d4 627 err = rtm_to_fib_config(net, skb, nlh, &cfg);
4e902c57
TG
628 if (err < 0)
629 goto errout;
1da177e4 630
226b0b4a 631 tb = fib_new_table(net, cfg.fc_table);
4e902c57
TG
632 if (tb == NULL) {
633 err = -ENOBUFS;
634 goto errout;
635 }
636
16c6cf8b 637 err = fib_table_insert(tb, &cfg);
4e902c57
TG
638errout:
639 return err;
1da177e4
LT
640}
641
63f3444f 642static int inet_dump_fib(struct sk_buff *skb, struct netlink_callback *cb)
1da177e4 643{
3b1e0a65 644 struct net *net = sock_net(skb->sk);
1af5a8c4
PM
645 unsigned int h, s_h;
646 unsigned int e = 0, s_e;
1da177e4 647 struct fib_table *tb;
1af5a8c4 648 struct hlist_node *node;
e4aef8ae 649 struct hlist_head *head;
1af5a8c4 650 int dumped = 0;
1da177e4 651
be403ea1
TG
652 if (nlmsg_len(cb->nlh) >= sizeof(struct rtmsg) &&
653 ((struct rtmsg *) nlmsg_data(cb->nlh))->rtm_flags & RTM_F_CLONED)
1da177e4
LT
654 return ip_rt_dump(skb, cb);
655
1af5a8c4
PM
656 s_h = cb->args[0];
657 s_e = cb->args[1];
658
659 for (h = s_h; h < FIB_TABLE_HASHSZ; h++, s_e = 0) {
660 e = 0;
e4aef8ae
DL
661 head = &net->ipv4.fib_table_hash[h];
662 hlist_for_each_entry(tb, node, head, tb_hlist) {
1af5a8c4
PM
663 if (e < s_e)
664 goto next;
665 if (dumped)
666 memset(&cb->args[2], 0, sizeof(cb->args) -
e905a9ed 667 2 * sizeof(cb->args[0]));
16c6cf8b 668 if (fib_table_dump(tb, skb, cb) < 0)
1af5a8c4
PM
669 goto out;
670 dumped = 1;
671next:
672 e++;
673 }
1da177e4 674 }
1af5a8c4
PM
675out:
676 cb->args[1] = e;
677 cb->args[0] = h;
1da177e4
LT
678
679 return skb->len;
680}
681
682/* Prepare and feed intra-kernel routing request.
6a31d2a9
ED
683 * Really, it should be netlink message, but :-( netlink
684 * can be not configured, so that we feed it directly
685 * to fib engine. It is legal, because all events occur
686 * only when netlink is already locked.
1da177e4 687 */
81f7bf6c 688static void fib_magic(int cmd, int type, __be32 dst, int dst_len, struct in_ifaddr *ifa)
1da177e4 689{
c346dca1 690 struct net *net = dev_net(ifa->ifa_dev->dev);
4e902c57
TG
691 struct fib_table *tb;
692 struct fib_config cfg = {
693 .fc_protocol = RTPROT_KERNEL,
694 .fc_type = type,
695 .fc_dst = dst,
696 .fc_dst_len = dst_len,
697 .fc_prefsrc = ifa->ifa_local,
698 .fc_oif = ifa->ifa_dev->dev->ifindex,
699 .fc_nlflags = NLM_F_CREATE | NLM_F_APPEND,
4d1169c1 700 .fc_nlinfo = {
4b5d47d4 701 .nl_net = net,
4d1169c1 702 },
4e902c57 703 };
1da177e4
LT
704
705 if (type == RTN_UNICAST)
4b5d47d4 706 tb = fib_new_table(net, RT_TABLE_MAIN);
1da177e4 707 else
4b5d47d4 708 tb = fib_new_table(net, RT_TABLE_LOCAL);
1da177e4
LT
709
710 if (tb == NULL)
711 return;
712
4e902c57 713 cfg.fc_table = tb->tb_id;
1da177e4 714
4e902c57
TG
715 if (type != RTN_LOCAL)
716 cfg.fc_scope = RT_SCOPE_LINK;
717 else
718 cfg.fc_scope = RT_SCOPE_HOST;
1da177e4
LT
719
720 if (cmd == RTM_NEWROUTE)
16c6cf8b 721 fib_table_insert(tb, &cfg);
1da177e4 722 else
16c6cf8b 723 fib_table_delete(tb, &cfg);
1da177e4
LT
724}
725
0ff60a45 726void fib_add_ifaddr(struct in_ifaddr *ifa)
1da177e4
LT
727{
728 struct in_device *in_dev = ifa->ifa_dev;
729 struct net_device *dev = in_dev->dev;
730 struct in_ifaddr *prim = ifa;
a144ea4b
AV
731 __be32 mask = ifa->ifa_mask;
732 __be32 addr = ifa->ifa_local;
6a31d2a9 733 __be32 prefix = ifa->ifa_address & mask;
1da177e4 734
6a31d2a9 735 if (ifa->ifa_flags & IFA_F_SECONDARY) {
1da177e4
LT
736 prim = inet_ifa_byprefix(in_dev, prefix, mask);
737 if (prim == NULL) {
058bd4d2 738 pr_warn("%s: bug: prim == NULL\n", __func__);
1da177e4
LT
739 return;
740 }
741 }
742
743 fib_magic(RTM_NEWROUTE, RTN_LOCAL, addr, 32, prim);
744
6a31d2a9 745 if (!(dev->flags & IFF_UP))
1da177e4
LT
746 return;
747
748 /* Add broadcast address, if it is explicitly assigned. */
a144ea4b 749 if (ifa->ifa_broadcast && ifa->ifa_broadcast != htonl(0xFFFFFFFF))
1da177e4
LT
750 fib_magic(RTM_NEWROUTE, RTN_BROADCAST, ifa->ifa_broadcast, 32, prim);
751
6a31d2a9 752 if (!ipv4_is_zeronet(prefix) && !(ifa->ifa_flags & IFA_F_SECONDARY) &&
1da177e4 753 (prefix != addr || ifa->ifa_prefixlen < 32)) {
6a31d2a9
ED
754 fib_magic(RTM_NEWROUTE,
755 dev->flags & IFF_LOOPBACK ? RTN_LOCAL : RTN_UNICAST,
756 prefix, ifa->ifa_prefixlen, prim);
1da177e4
LT
757
758 /* Add network specific broadcasts, when it takes a sense */
759 if (ifa->ifa_prefixlen < 31) {
760 fib_magic(RTM_NEWROUTE, RTN_BROADCAST, prefix, 32, prim);
6a31d2a9
ED
761 fib_magic(RTM_NEWROUTE, RTN_BROADCAST, prefix | ~mask,
762 32, prim);
1da177e4
LT
763 }
764 }
765}
766
e6abbaa2
JA
767/* Delete primary or secondary address.
768 * Optionally, on secondary address promotion consider the addresses
769 * from subnet iprim as deleted, even if they are in device list.
770 * In this case the secondary ifa can be in device list.
771 */
772void fib_del_ifaddr(struct in_ifaddr *ifa, struct in_ifaddr *iprim)
1da177e4
LT
773{
774 struct in_device *in_dev = ifa->ifa_dev;
775 struct net_device *dev = in_dev->dev;
776 struct in_ifaddr *ifa1;
e6abbaa2 777 struct in_ifaddr *prim = ifa, *prim1 = NULL;
6a31d2a9
ED
778 __be32 brd = ifa->ifa_address | ~ifa->ifa_mask;
779 __be32 any = ifa->ifa_address & ifa->ifa_mask;
1da177e4
LT
780#define LOCAL_OK 1
781#define BRD_OK 2
782#define BRD0_OK 4
783#define BRD1_OK 8
95c96174 784 unsigned int ok = 0;
e6abbaa2
JA
785 int subnet = 0; /* Primary network */
786 int gone = 1; /* Address is missing */
787 int same_prefsrc = 0; /* Another primary with same IP */
1da177e4 788
e6abbaa2 789 if (ifa->ifa_flags & IFA_F_SECONDARY) {
1da177e4
LT
790 prim = inet_ifa_byprefix(in_dev, any, ifa->ifa_mask);
791 if (prim == NULL) {
058bd4d2 792 pr_warn("%s: bug: prim == NULL\n", __func__);
1da177e4
LT
793 return;
794 }
e6abbaa2 795 if (iprim && iprim != prim) {
058bd4d2 796 pr_warn("%s: bug: iprim != prim\n", __func__);
e6abbaa2
JA
797 return;
798 }
799 } else if (!ipv4_is_zeronet(any) &&
800 (any != ifa->ifa_local || ifa->ifa_prefixlen < 32)) {
801 fib_magic(RTM_DELROUTE,
802 dev->flags & IFF_LOOPBACK ? RTN_LOCAL : RTN_UNICAST,
803 any, ifa->ifa_prefixlen, prim);
804 subnet = 1;
1da177e4
LT
805 }
806
807 /* Deletion is more complicated than add.
6a31d2a9
ED
808 * We should take care of not to delete too much :-)
809 *
810 * Scan address list to be sure that addresses are really gone.
1da177e4
LT
811 */
812
813 for (ifa1 = in_dev->ifa_list; ifa1; ifa1 = ifa1->ifa_next) {
e6abbaa2
JA
814 if (ifa1 == ifa) {
815 /* promotion, keep the IP */
816 gone = 0;
817 continue;
818 }
819 /* Ignore IFAs from our subnet */
820 if (iprim && ifa1->ifa_mask == iprim->ifa_mask &&
821 inet_ifa_match(ifa1->ifa_address, iprim))
822 continue;
823
824 /* Ignore ifa1 if it uses different primary IP (prefsrc) */
825 if (ifa1->ifa_flags & IFA_F_SECONDARY) {
826 /* Another address from our subnet? */
827 if (ifa1->ifa_mask == prim->ifa_mask &&
828 inet_ifa_match(ifa1->ifa_address, prim))
829 prim1 = prim;
830 else {
831 /* We reached the secondaries, so
832 * same_prefsrc should be determined.
833 */
834 if (!same_prefsrc)
835 continue;
836 /* Search new prim1 if ifa1 is not
837 * using the current prim1
838 */
839 if (!prim1 ||
840 ifa1->ifa_mask != prim1->ifa_mask ||
841 !inet_ifa_match(ifa1->ifa_address, prim1))
842 prim1 = inet_ifa_byprefix(in_dev,
843 ifa1->ifa_address,
844 ifa1->ifa_mask);
845 if (!prim1)
846 continue;
847 if (prim1->ifa_local != prim->ifa_local)
848 continue;
849 }
850 } else {
851 if (prim->ifa_local != ifa1->ifa_local)
852 continue;
853 prim1 = ifa1;
854 if (prim != prim1)
855 same_prefsrc = 1;
856 }
1da177e4
LT
857 if (ifa->ifa_local == ifa1->ifa_local)
858 ok |= LOCAL_OK;
859 if (ifa->ifa_broadcast == ifa1->ifa_broadcast)
860 ok |= BRD_OK;
861 if (brd == ifa1->ifa_broadcast)
862 ok |= BRD1_OK;
863 if (any == ifa1->ifa_broadcast)
864 ok |= BRD0_OK;
e6abbaa2
JA
865 /* primary has network specific broadcasts */
866 if (prim1 == ifa1 && ifa1->ifa_prefixlen < 31) {
867 __be32 brd1 = ifa1->ifa_address | ~ifa1->ifa_mask;
868 __be32 any1 = ifa1->ifa_address & ifa1->ifa_mask;
869
870 if (!ipv4_is_zeronet(any1)) {
871 if (ifa->ifa_broadcast == brd1 ||
872 ifa->ifa_broadcast == any1)
873 ok |= BRD_OK;
874 if (brd == brd1 || brd == any1)
875 ok |= BRD1_OK;
876 if (any == brd1 || any == any1)
877 ok |= BRD0_OK;
878 }
879 }
1da177e4
LT
880 }
881
6a31d2a9 882 if (!(ok & BRD_OK))
1da177e4 883 fib_magic(RTM_DELROUTE, RTN_BROADCAST, ifa->ifa_broadcast, 32, prim);
e6abbaa2
JA
884 if (subnet && ifa->ifa_prefixlen < 31) {
885 if (!(ok & BRD1_OK))
886 fib_magic(RTM_DELROUTE, RTN_BROADCAST, brd, 32, prim);
887 if (!(ok & BRD0_OK))
888 fib_magic(RTM_DELROUTE, RTN_BROADCAST, any, 32, prim);
889 }
6a31d2a9 890 if (!(ok & LOCAL_OK)) {
1da177e4
LT
891 fib_magic(RTM_DELROUTE, RTN_LOCAL, ifa->ifa_local, 32, prim);
892
893 /* Check, that this local address finally disappeared. */
e6abbaa2
JA
894 if (gone &&
895 inet_addr_type(dev_net(dev), ifa->ifa_local) != RTN_LOCAL) {
1da177e4 896 /* And the last, but not the least thing.
6a31d2a9
ED
897 * We must flush stray FIB entries.
898 *
899 * First of all, we scan fib_info list searching
900 * for stray nexthop entries, then ignite fib_flush.
901 */
c346dca1
YH
902 if (fib_sync_down_addr(dev_net(dev), ifa->ifa_local))
903 fib_flush(dev_net(dev));
1da177e4
LT
904 }
905 }
906#undef LOCAL_OK
907#undef BRD_OK
908#undef BRD0_OK
909#undef BRD1_OK
910}
911
6a31d2a9 912static void nl_fib_lookup(struct fib_result_nl *frn, struct fib_table *tb)
246955fe 913{
e905a9ed 914
246955fe 915 struct fib_result res;
9ade2286
DM
916 struct flowi4 fl4 = {
917 .flowi4_mark = frn->fl_mark,
918 .daddr = frn->fl_addr,
919 .flowi4_tos = frn->fl_tos,
920 .flowi4_scope = frn->fl_scope,
6a31d2a9 921 };
1194ed0a 922
912a41a4
SV
923#ifdef CONFIG_IP_MULTIPLE_TABLES
924 res.r = NULL;
925#endif
926
1194ed0a 927 frn->err = -ENOENT;
246955fe
RO
928 if (tb) {
929 local_bh_disable();
930
931 frn->tb_id = tb->tb_id;
ebc0ffae 932 rcu_read_lock();
9ade2286 933 frn->err = fib_table_lookup(tb, &fl4, &res, FIB_LOOKUP_NOREF);
246955fe
RO
934
935 if (!frn->err) {
936 frn->prefixlen = res.prefixlen;
937 frn->nh_sel = res.nh_sel;
938 frn->type = res.type;
939 frn->scope = res.scope;
940 }
ebc0ffae 941 rcu_read_unlock();
246955fe
RO
942 local_bh_enable();
943 }
944}
945
28f7b036 946static void nl_fib_input(struct sk_buff *skb)
246955fe 947{
6bd48fcf 948 struct net *net;
246955fe 949 struct fib_result_nl *frn;
28f7b036 950 struct nlmsghdr *nlh;
246955fe 951 struct fib_table *tb;
28f7b036 952 u32 pid;
1194ed0a 953
3b1e0a65 954 net = sock_net(skb->sk);
b529ccf2 955 nlh = nlmsg_hdr(skb);
ea86575e 956 if (skb->len < NLMSG_SPACE(0) || skb->len < nlh->nlmsg_len ||
d883a036 957 nlh->nlmsg_len < NLMSG_LENGTH(sizeof(*frn)))
ea86575e 958 return;
d883a036
DL
959
960 skb = skb_clone(skb, GFP_KERNEL);
961 if (skb == NULL)
962 return;
963 nlh = nlmsg_hdr(skb);
e905a9ed 964
246955fe 965 frn = (struct fib_result_nl *) NLMSG_DATA(nlh);
6bd48fcf 966 tb = fib_get_table(net, frn->tb_id_in);
246955fe
RO
967
968 nl_fib_lookup(frn, tb);
e905a9ed 969
6a31d2a9
ED
970 pid = NETLINK_CB(skb).pid; /* pid of sending process */
971 NETLINK_CB(skb).pid = 0; /* from kernel */
ac6d439d 972 NETLINK_CB(skb).dst_group = 0; /* unicast */
6bd48fcf 973 netlink_unicast(net->ipv4.fibnl, skb, pid, MSG_DONTWAIT);
e905a9ed 974}
246955fe 975
2c8c1e72 976static int __net_init nl_fib_lookup_init(struct net *net)
246955fe 977{
6bd48fcf 978 struct sock *sk;
a31f2d17
PNA
979 struct netlink_kernel_cfg cfg = {
980 .input = nl_fib_input,
981 };
982
983 sk = netlink_kernel_create(net, NETLINK_FIB_LOOKUP, THIS_MODULE, &cfg);
6bd48fcf 984 if (sk == NULL)
7b1a74fd 985 return -EAFNOSUPPORT;
6bd48fcf 986 net->ipv4.fibnl = sk;
7b1a74fd
DL
987 return 0;
988}
989
990static void nl_fib_lookup_exit(struct net *net)
991{
b7c6ba6e 992 netlink_kernel_release(net->ipv4.fibnl);
775516bf 993 net->ipv4.fibnl = NULL;
246955fe
RO
994}
995
/*
 * Take IPv4 routing down on @dev: sync the FIB nexthops for the device
 * (flushing the tables when fib_sync_down_dev() returns non-zero), flush
 * the route cache with the given @delay and finally call arp_ifdown().
 * @force is passed through to fib_sync_down_dev().
 */
static void fib_disable_ip(struct net_device *dev, int force, int delay)
{
	struct net *net = dev_net(dev);

	if (fib_sync_down_dev(dev, force))
		fib_flush(net);

	rt_cache_flush(net, delay);
	arp_ifdown(dev);
}
1003
1004static int fib_inetaddr_event(struct notifier_block *this, unsigned long event, void *ptr)
1005{
6ed2533e 1006 struct in_ifaddr *ifa = (struct in_ifaddr *)ptr;
76e6ebfb 1007 struct net_device *dev = ifa->ifa_dev->dev;
436c3b66 1008 struct net *net = dev_net(dev);
1da177e4
LT
1009
1010 switch (event) {
1011 case NETDEV_UP:
1012 fib_add_ifaddr(ifa);
1013#ifdef CONFIG_IP_ROUTE_MULTIPATH
76e6ebfb 1014 fib_sync_up(dev);
1da177e4 1015#endif
436c3b66 1016 atomic_inc(&net->ipv4.dev_addr_genid);
76e6ebfb 1017 rt_cache_flush(dev_net(dev), -1);
1da177e4
LT
1018 break;
1019 case NETDEV_DOWN:
e6abbaa2 1020 fib_del_ifaddr(ifa, NULL);
436c3b66 1021 atomic_inc(&net->ipv4.dev_addr_genid);
9fcc2e8a 1022 if (ifa->ifa_dev->ifa_list == NULL) {
1da177e4 1023 /* Last address was deleted from this interface.
6a31d2a9 1024 * Disable IP.
1da177e4 1025 */
e2ce1468 1026 fib_disable_ip(dev, 1, 0);
1da177e4 1027 } else {
76e6ebfb 1028 rt_cache_flush(dev_net(dev), -1);
1da177e4
LT
1029 }
1030 break;
1031 }
1032 return NOTIFY_DONE;
1033}
1034
1035static int fib_netdev_event(struct notifier_block *this, unsigned long event, void *ptr)
1036{
1037 struct net_device *dev = ptr;
e5ed6399 1038 struct in_device *in_dev = __in_dev_get_rtnl(dev);
436c3b66 1039 struct net *net = dev_net(dev);
1da177e4
LT
1040
1041 if (event == NETDEV_UNREGISTER) {
e2ce1468 1042 fib_disable_ip(dev, 2, -1);
1da177e4
LT
1043 return NOTIFY_DONE;
1044 }
1045
1046 if (!in_dev)
1047 return NOTIFY_DONE;
1048
1049 switch (event) {
1050 case NETDEV_UP:
1051 for_ifa(in_dev) {
1052 fib_add_ifaddr(ifa);
1053 } endfor_ifa(in_dev);
1054#ifdef CONFIG_IP_ROUTE_MULTIPATH
1055 fib_sync_up(dev);
1056#endif
436c3b66 1057 atomic_inc(&net->ipv4.dev_addr_genid);
76e6ebfb 1058 rt_cache_flush(dev_net(dev), -1);
1da177e4
LT
1059 break;
1060 case NETDEV_DOWN:
e2ce1468 1061 fib_disable_ip(dev, 0, 0);
1da177e4
LT
1062 break;
1063 case NETDEV_CHANGEMTU:
1064 case NETDEV_CHANGE:
76e6ebfb 1065 rt_cache_flush(dev_net(dev), 0);
1da177e4 1066 break;
a5ee1551 1067 case NETDEV_UNREGISTER_BATCH:
6561a3b1
DM
1068 /* The batch unregister is only called on the first
1069 * device in the list of devices being unregistered.
1070 * Therefore we should not pass dev_net(dev) in here.
1071 */
1072 rt_cache_flush_batch(NULL);
a5ee1551 1073 break;
1da177e4
LT
1074 }
1075 return NOTIFY_DONE;
1076}
1077
1078static struct notifier_block fib_inetaddr_notifier = {
6ed2533e 1079 .notifier_call = fib_inetaddr_event,
1da177e4
LT
1080};
1081
1082static struct notifier_block fib_netdev_notifier = {
6ed2533e 1083 .notifier_call = fib_netdev_event,
1da177e4
LT
1084};
1085
7b1a74fd 1086static int __net_init ip_fib_net_init(struct net *net)
1da177e4 1087{
dce5cbee 1088 int err;
10da66f7
ED
1089 size_t size = sizeof(struct hlist_head) * FIB_TABLE_HASHSZ;
1090
1091 /* Avoid false sharing : Use at least a full cache line */
1092 size = max_t(size_t, size, L1_CACHE_BYTES);
1af5a8c4 1093
10da66f7 1094 net->ipv4.fib_table_hash = kzalloc(size, GFP_KERNEL);
e4aef8ae
DL
1095 if (net->ipv4.fib_table_hash == NULL)
1096 return -ENOMEM;
1097
dce5cbee
DL
1098 err = fib4_rules_init(net);
1099 if (err < 0)
1100 goto fail;
1101 return 0;
1102
1103fail:
1104 kfree(net->ipv4.fib_table_hash);
1105 return err;
7b1a74fd 1106}
1da177e4 1107
2c8c1e72 1108static void ip_fib_net_exit(struct net *net)
7b1a74fd
DL
1109{
1110 unsigned int i;
1111
1112#ifdef CONFIG_IP_MULTIPLE_TABLES
1113 fib4_rules_exit(net);
1114#endif
1115
e2666f84 1116 rtnl_lock();
7b1a74fd
DL
1117 for (i = 0; i < FIB_TABLE_HASHSZ; i++) {
1118 struct fib_table *tb;
1119 struct hlist_head *head;
1120 struct hlist_node *node, *tmp;
63f3444f 1121
e4aef8ae 1122 head = &net->ipv4.fib_table_hash[i];
7b1a74fd
DL
1123 hlist_for_each_entry_safe(tb, node, tmp, head, tb_hlist) {
1124 hlist_del(node);
16c6cf8b 1125 fib_table_flush(tb);
4aa2c466 1126 fib_free_table(tb);
7b1a74fd
DL
1127 }
1128 }
e2666f84 1129 rtnl_unlock();
e4aef8ae 1130 kfree(net->ipv4.fib_table_hash);
7b1a74fd
DL
1131}
1132
1133static int __net_init fib_net_init(struct net *net)
1134{
1135 int error;
1136
7b1a74fd
DL
1137 error = ip_fib_net_init(net);
1138 if (error < 0)
1139 goto out;
1140 error = nl_fib_lookup_init(net);
1141 if (error < 0)
1142 goto out_nlfl;
1143 error = fib_proc_init(net);
1144 if (error < 0)
1145 goto out_proc;
1146out:
1147 return error;
1148
1149out_proc:
1150 nl_fib_lookup_exit(net);
1151out_nlfl:
1152 ip_fib_net_exit(net);
1153 goto out;
1154}
1155
1156static void __net_exit fib_net_exit(struct net *net)
1157{
1158 fib_proc_exit(net);
1159 nl_fib_lookup_exit(net);
1160 ip_fib_net_exit(net);
1161}
1162
1163static struct pernet_operations fib_net_ops = {
1164 .init = fib_net_init,
1165 .exit = fib_net_exit,
1166};
1167
1168void __init ip_fib_init(void)
1169{
c7ac8679
GR
1170 rtnl_register(PF_INET, RTM_NEWROUTE, inet_rtm_newroute, NULL, NULL);
1171 rtnl_register(PF_INET, RTM_DELROUTE, inet_rtm_delroute, NULL, NULL);
1172 rtnl_register(PF_INET, RTM_GETROUTE, NULL, inet_dump_fib, NULL);
7b1a74fd
DL
1173
1174 register_pernet_subsys(&fib_net_ops);
1175 register_netdevice_notifier(&fib_netdev_notifier);
1176 register_inetaddr_notifier(&fib_inetaddr_notifier);
7f9b8052 1177
5348ba85 1178 fib_trie_init();
1da177e4 1179}