blob: 4b581c675bb2ba1f162313f0e4d717fdeff4d2b9 [file] [log] [blame]
/*
 *	Linux INET6 implementation
 *	FIB front-end.
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */
13
/*	Changes:
 *
 *	YOSHIFUJI Hideaki @USAGI
 *		reworked default router selection.
 *		- respect outgoing interface
 *		- select from (probably) reachable routers (i.e.
 *		  routers in REACHABLE, STALE, DELAY or PROBE states).
 *		- always select the same router if it is (probably)
 *		  reachable; otherwise, round-robin the list.
 *	Ville Nuorvala
 *		Fixed routing subtrees.
 */
26
Joe Perchesf3213832012-05-15 14:11:53 +000027#define pr_fmt(fmt) "IPv6: " fmt
28
Randy Dunlap4fc268d2006-01-11 12:17:47 -080029#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/errno.h>
Paul Gortmakerbc3b2d72011-07-15 11:47:34 -040031#include <linux/export.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/types.h>
33#include <linux/times.h>
34#include <linux/socket.h>
35#include <linux/sockios.h>
36#include <linux/net.h>
37#include <linux/route.h>
38#include <linux/netdevice.h>
39#include <linux/in6.h>
YOSHIFUJI Hideaki7bc570c2008-04-03 09:22:53 +090040#include <linux/mroute6.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041#include <linux/init.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#include <linux/if_arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#include <linux/proc_fs.h>
44#include <linux/seq_file.h>
Daniel Lezcano5b7c9312008-03-03 23:28:58 -080045#include <linux/nsproxy.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090046#include <linux/slab.h>
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020047#include <net/net_namespace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070048#include <net/snmp.h>
49#include <net/ipv6.h>
50#include <net/ip6_fib.h>
51#include <net/ip6_route.h>
52#include <net/ndisc.h>
53#include <net/addrconf.h>
54#include <net/tcp.h>
55#include <linux/rtnetlink.h>
56#include <net/dst.h>
57#include <net/xfrm.h>
Tom Tucker8d717402006-07-30 20:43:36 -070058#include <net/netevent.h>
Thomas Graf21713eb2006-08-15 00:35:24 -070059#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070060
61#include <asm/uaccess.h>
62
63#ifdef CONFIG_SYSCTL
64#include <linux/sysctl.h>
65#endif
66
Gao feng1716a962012-04-06 00:13:10 +000067static struct rt6_info *ip6_rt_copy(struct rt6_info *ort,
Eric Dumazet21efcfa2011-07-19 20:18:36 +000068 const struct in6_addr *dest);
Linus Torvalds1da177e2005-04-16 15:20:36 -070069static struct dst_entry *ip6_dst_check(struct dst_entry *dst, u32 cookie);
David S. Miller0dbaee32010-12-13 12:52:14 -080070static unsigned int ip6_default_advmss(const struct dst_entry *dst);
Steffen Klassertebb762f2011-11-23 02:12:51 +000071static unsigned int ip6_mtu(const struct dst_entry *dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -070072static struct dst_entry *ip6_negative_advice(struct dst_entry *);
73static void ip6_dst_destroy(struct dst_entry *);
74static void ip6_dst_ifdown(struct dst_entry *,
75 struct net_device *dev, int how);
Daniel Lezcano569d3642008-01-18 03:56:57 -080076static int ip6_dst_gc(struct dst_ops *ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -070077
78static int ip6_pkt_discard(struct sk_buff *skb);
79static int ip6_pkt_discard_out(struct sk_buff *skb);
80static void ip6_link_failure(struct sk_buff *skb);
81static void ip6_rt_update_pmtu(struct dst_entry *dst, u32 mtu);
82
#ifdef CONFIG_IPV6_ROUTE_INFO
/*
 * Helpers used by rt6_route_rcv() to create and to find a route-information
 * route identified by prefix, gateway address and interface index.
 */
static struct rt6_info *rt6_add_route_info(struct net *net,
					   const struct in6_addr *prefix,
					   int prefixlen,
					   const struct in6_addr *gwaddr,
					   int ifindex,
					   unsigned int pref);
static struct rt6_info *rt6_get_route_info(struct net *net,
					   const struct in6_addr *prefix,
					   int prefixlen,
					   const struct in6_addr *gwaddr,
					   int ifindex);
#endif
92
David S. Miller06582542011-01-27 14:58:42 -080093static u32 *ipv6_cow_metrics(struct dst_entry *dst, unsigned long old)
94{
95 struct rt6_info *rt = (struct rt6_info *) dst;
96 struct inet_peer *peer;
97 u32 *p = NULL;
98
Yan, Zheng8e2ec632011-09-05 21:34:30 +000099 if (!(rt->dst.flags & DST_HOST))
100 return NULL;
101
David S. Millerfbfe95a2012-06-08 23:24:18 -0700102 peer = rt6_get_peer_create(rt);
David S. Miller06582542011-01-27 14:58:42 -0800103 if (peer) {
104 u32 *old_p = __DST_METRICS_PTR(old);
105 unsigned long prev, new;
106
107 p = peer->metrics;
108 if (inet_metrics_new(peer))
109 memcpy(p, old_p, sizeof(u32) * RTAX_MAX);
110
111 new = (unsigned long) p;
112 prev = cmpxchg(&dst->_metrics, old, new);
113
114 if (prev != old) {
115 p = __DST_METRICS_PTR(prev);
116 if (prev & DST_METRICS_READ_ONLY)
117 p = NULL;
118 }
119 }
120 return p;
121}
122
David S. Millerf894cbf2012-07-02 21:52:24 -0700123static inline const void *choose_neigh_daddr(struct rt6_info *rt,
124 struct sk_buff *skb,
125 const void *daddr)
David S. Miller39232972012-01-26 15:22:32 -0500126{
127 struct in6_addr *p = &rt->rt6i_gateway;
128
David S. Millera7563f32012-01-26 16:29:16 -0500129 if (!ipv6_addr_any(p))
David S. Miller39232972012-01-26 15:22:32 -0500130 return (const void *) p;
David S. Millerf894cbf2012-07-02 21:52:24 -0700131 else if (skb)
132 return &ipv6_hdr(skb)->daddr;
David S. Miller39232972012-01-26 15:22:32 -0500133 return daddr;
134}
135
David S. Millerf894cbf2012-07-02 21:52:24 -0700136static struct neighbour *ip6_neigh_lookup(const struct dst_entry *dst,
137 struct sk_buff *skb,
138 const void *daddr)
David S. Millerd3aaeb32011-07-18 00:40:17 -0700139{
David S. Miller39232972012-01-26 15:22:32 -0500140 struct rt6_info *rt = (struct rt6_info *) dst;
141 struct neighbour *n;
142
David S. Millerf894cbf2012-07-02 21:52:24 -0700143 daddr = choose_neigh_daddr(rt, skb, daddr);
David S. Miller39232972012-01-26 15:22:32 -0500144 n = __ipv6_neigh_lookup(&nd_tbl, dst->dev, daddr);
David S. Millerf83c7792011-12-28 15:41:23 -0500145 if (n)
146 return n;
147 return neigh_create(&nd_tbl, daddr, dst->dev);
148}
149
David S. Miller8ade06c2011-12-29 18:51:57 -0500150static int rt6_bind_neighbour(struct rt6_info *rt, struct net_device *dev)
David S. Millerf83c7792011-12-28 15:41:23 -0500151{
David S. Miller8ade06c2011-12-29 18:51:57 -0500152 struct neighbour *n = __ipv6_neigh_lookup(&nd_tbl, dev, &rt->rt6i_gateway);
153 if (!n) {
154 n = neigh_create(&nd_tbl, &rt->rt6i_gateway, dev);
155 if (IS_ERR(n))
156 return PTR_ERR(n);
157 }
David S. Millerf83c7792011-12-28 15:41:23 -0500158 dst_set_neighbour(&rt->dst, n);
159
160 return 0;
David S. Millerd3aaeb32011-07-18 00:40:17 -0700161}
162
Daniel Lezcano9a7ec3a2008-03-04 13:48:53 -0800163static struct dst_ops ip6_dst_ops_template = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164 .family = AF_INET6,
Harvey Harrison09640e62009-02-01 00:45:17 -0800165 .protocol = cpu_to_be16(ETH_P_IPV6),
Linus Torvalds1da177e2005-04-16 15:20:36 -0700166 .gc = ip6_dst_gc,
167 .gc_thresh = 1024,
168 .check = ip6_dst_check,
David S. Miller0dbaee32010-12-13 12:52:14 -0800169 .default_advmss = ip6_default_advmss,
Steffen Klassertebb762f2011-11-23 02:12:51 +0000170 .mtu = ip6_mtu,
David S. Miller06582542011-01-27 14:58:42 -0800171 .cow_metrics = ipv6_cow_metrics,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 .destroy = ip6_dst_destroy,
173 .ifdown = ip6_dst_ifdown,
174 .negative_advice = ip6_negative_advice,
175 .link_failure = ip6_link_failure,
176 .update_pmtu = ip6_rt_update_pmtu,
Herbert Xu1ac06e02008-05-20 14:32:14 -0700177 .local_out = __ip6_local_out,
David S. Millerd3aaeb32011-07-18 00:40:17 -0700178 .neigh_lookup = ip6_neigh_lookup,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179};
180
Steffen Klassertebb762f2011-11-23 02:12:51 +0000181static unsigned int ip6_blackhole_mtu(const struct dst_entry *dst)
Roland Dreierec831ea2011-01-31 13:16:00 -0800182{
Steffen Klassert618f9bc2011-11-23 02:13:31 +0000183 unsigned int mtu = dst_metric_raw(dst, RTAX_MTU);
184
185 return mtu ? : dst->dev->mtu;
Roland Dreierec831ea2011-01-31 13:16:00 -0800186}
187
David S. Miller14e50e52007-05-24 18:17:54 -0700188static void ip6_rt_blackhole_update_pmtu(struct dst_entry *dst, u32 mtu)
189{
190}
191
Held Bernhard0972ddb2011-04-24 22:07:32 +0000192static u32 *ip6_rt_blackhole_cow_metrics(struct dst_entry *dst,
193 unsigned long old)
194{
195 return NULL;
196}
197
David S. Miller14e50e52007-05-24 18:17:54 -0700198static struct dst_ops ip6_dst_blackhole_ops = {
199 .family = AF_INET6,
Harvey Harrison09640e62009-02-01 00:45:17 -0800200 .protocol = cpu_to_be16(ETH_P_IPV6),
David S. Miller14e50e52007-05-24 18:17:54 -0700201 .destroy = ip6_dst_destroy,
202 .check = ip6_dst_check,
Steffen Klassertebb762f2011-11-23 02:12:51 +0000203 .mtu = ip6_blackhole_mtu,
Eric Dumazet214f45c2011-02-18 11:39:01 -0800204 .default_advmss = ip6_default_advmss,
David S. Miller14e50e52007-05-24 18:17:54 -0700205 .update_pmtu = ip6_rt_blackhole_update_pmtu,
Held Bernhard0972ddb2011-04-24 22:07:32 +0000206 .cow_metrics = ip6_rt_blackhole_cow_metrics,
David S. Millerd3aaeb32011-07-18 00:40:17 -0700207 .neigh_lookup = ip6_neigh_lookup,
David S. Miller14e50e52007-05-24 18:17:54 -0700208};
209
David S. Miller62fa8a82011-01-26 20:51:05 -0800210static const u32 ip6_template_metrics[RTAX_MAX] = {
211 [RTAX_HOPLIMIT - 1] = 255,
212};
213
Daniel Lezcanobdb32892008-03-04 13:48:10 -0800214static struct rt6_info ip6_null_entry_template = {
Changli Gaod8d1f302010-06-10 23:31:35 -0700215 .dst = {
216 .__refcnt = ATOMIC_INIT(1),
217 .__use = 1,
218 .obsolete = -1,
219 .error = -ENETUNREACH,
Changli Gaod8d1f302010-06-10 23:31:35 -0700220 .input = ip6_pkt_discard,
221 .output = ip6_pkt_discard_out,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222 },
223 .rt6i_flags = (RTF_REJECT | RTF_NONEXTHOP),
Jean-Mickael Guerin4f724272009-05-20 17:38:59 -0700224 .rt6i_protocol = RTPROT_KERNEL,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700225 .rt6i_metric = ~(u32) 0,
226 .rt6i_ref = ATOMIC_INIT(1),
227};
228
Thomas Graf101367c2006-08-04 03:39:02 -0700229#ifdef CONFIG_IPV6_MULTIPLE_TABLES
230
David S. Miller6723ab52006-10-18 21:20:57 -0700231static int ip6_pkt_prohibit(struct sk_buff *skb);
232static int ip6_pkt_prohibit_out(struct sk_buff *skb);
David S. Miller6723ab52006-10-18 21:20:57 -0700233
Adrian Bunk280a34c2008-04-21 02:29:32 -0700234static struct rt6_info ip6_prohibit_entry_template = {
Changli Gaod8d1f302010-06-10 23:31:35 -0700235 .dst = {
236 .__refcnt = ATOMIC_INIT(1),
237 .__use = 1,
238 .obsolete = -1,
239 .error = -EACCES,
Changli Gaod8d1f302010-06-10 23:31:35 -0700240 .input = ip6_pkt_prohibit,
241 .output = ip6_pkt_prohibit_out,
Thomas Graf101367c2006-08-04 03:39:02 -0700242 },
243 .rt6i_flags = (RTF_REJECT | RTF_NONEXTHOP),
Jean-Mickael Guerin4f724272009-05-20 17:38:59 -0700244 .rt6i_protocol = RTPROT_KERNEL,
Thomas Graf101367c2006-08-04 03:39:02 -0700245 .rt6i_metric = ~(u32) 0,
246 .rt6i_ref = ATOMIC_INIT(1),
247};
248
Daniel Lezcanobdb32892008-03-04 13:48:10 -0800249static struct rt6_info ip6_blk_hole_entry_template = {
Changli Gaod8d1f302010-06-10 23:31:35 -0700250 .dst = {
251 .__refcnt = ATOMIC_INIT(1),
252 .__use = 1,
253 .obsolete = -1,
254 .error = -EINVAL,
Changli Gaod8d1f302010-06-10 23:31:35 -0700255 .input = dst_discard,
256 .output = dst_discard,
Thomas Graf101367c2006-08-04 03:39:02 -0700257 },
258 .rt6i_flags = (RTF_REJECT | RTF_NONEXTHOP),
Jean-Mickael Guerin4f724272009-05-20 17:38:59 -0700259 .rt6i_protocol = RTPROT_KERNEL,
Thomas Graf101367c2006-08-04 03:39:02 -0700260 .rt6i_metric = ~(u32) 0,
261 .rt6i_ref = ATOMIC_INIT(1),
262};
263
264#endif
265
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266/* allocate dst with ip6_dst_ops */
David S. Miller97bab732012-06-09 22:36:36 -0700267static inline struct rt6_info *ip6_dst_alloc(struct net *net,
David S. Miller957c6652011-06-24 15:25:00 -0700268 struct net_device *dev,
David S. Miller8b96d222012-06-11 02:01:56 -0700269 int flags,
270 struct fib6_table *table)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271{
David S. Miller97bab732012-06-09 22:36:36 -0700272 struct rt6_info *rt = dst_alloc(&net->ipv6.ip6_dst_ops, dev,
273 0, 0, flags);
David S. Millercf911662011-04-28 14:31:47 -0700274
David S. Miller97bab732012-06-09 22:36:36 -0700275 if (rt) {
Madalin Bucurfbe58182011-09-26 07:04:56 +0000276 memset(&rt->rt6i_table, 0,
David S. Miller38308472011-12-03 18:02:47 -0500277 sizeof(*rt) - sizeof(struct dst_entry));
David S. Miller8b96d222012-06-11 02:01:56 -0700278 rt6_init_peer(rt, table ? &table->tb6_peers : net->ipv6.peers);
David S. Miller97bab732012-06-09 22:36:36 -0700279 }
David S. Millercf911662011-04-28 14:31:47 -0700280 return rt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281}
282
283static void ip6_dst_destroy(struct dst_entry *dst)
284{
285 struct rt6_info *rt = (struct rt6_info *)dst;
286 struct inet6_dev *idev = rt->rt6i_idev;
287
Yan, Zheng8e2ec632011-09-05 21:34:30 +0000288 if (!(rt->dst.flags & DST_HOST))
289 dst_destroy_metrics_generic(dst);
290
David S. Miller38308472011-12-03 18:02:47 -0500291 if (idev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292 rt->rt6i_idev = NULL;
293 in6_dev_put(idev);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900294 }
Gao feng1716a962012-04-06 00:13:10 +0000295
296 if (!(rt->rt6i_flags & RTF_EXPIRES) && dst->from)
297 dst_release(dst->from);
298
David S. Miller97bab732012-06-09 22:36:36 -0700299 if (rt6_has_peer(rt)) {
300 struct inet_peer *peer = rt6_peer_ptr(rt);
David S. Millerb3419362010-11-30 12:27:11 -0800301 inet_putpeer(peer);
302 }
303}
304
David S. Miller6431cbc2011-02-07 20:38:06 -0800305static atomic_t __rt6_peer_genid = ATOMIC_INIT(0);
306
307static u32 rt6_peer_genid(void)
308{
309 return atomic_read(&__rt6_peer_genid);
310}
311
David S. Millerb3419362010-11-30 12:27:11 -0800312void rt6_bind_peer(struct rt6_info *rt, int create)
313{
David S. Miller97bab732012-06-09 22:36:36 -0700314 struct inet_peer_base *base;
David S. Millerb3419362010-11-30 12:27:11 -0800315 struct inet_peer *peer;
316
David S. Miller97bab732012-06-09 22:36:36 -0700317 base = inetpeer_base_ptr(rt->_rt6i_peer);
318 if (!base)
319 return;
320
321 peer = inet_getpeer_v6(base, &rt->rt6i_dst.addr, create);
David S. Miller7b34ca22012-06-11 04:13:57 -0700322 if (peer) {
323 if (!rt6_set_peer(rt, peer))
324 inet_putpeer(peer);
325 else
326 rt->rt6i_peer_genid = rt6_peer_genid();
327 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328}
329
330static void ip6_dst_ifdown(struct dst_entry *dst, struct net_device *dev,
331 int how)
332{
333 struct rt6_info *rt = (struct rt6_info *)dst;
334 struct inet6_dev *idev = rt->rt6i_idev;
Denis V. Lunev5a3e55d2007-12-07 00:38:10 -0800335 struct net_device *loopback_dev =
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900336 dev_net(dev)->loopback_dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337
David S. Miller38308472011-12-03 18:02:47 -0500338 if (dev != loopback_dev && idev && idev->dev == dev) {
Denis V. Lunev5a3e55d2007-12-07 00:38:10 -0800339 struct inet6_dev *loopback_idev =
340 in6_dev_get(loopback_dev);
David S. Miller38308472011-12-03 18:02:47 -0500341 if (loopback_idev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 rt->rt6i_idev = loopback_idev;
343 in6_dev_put(idev);
344 }
345 }
346}
347
Eric Dumazeta50feda2012-05-18 18:57:34 +0000348static bool rt6_check_expired(const struct rt6_info *rt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349{
Gao feng1716a962012-04-06 00:13:10 +0000350 struct rt6_info *ort = NULL;
351
352 if (rt->rt6i_flags & RTF_EXPIRES) {
353 if (time_after(jiffies, rt->dst.expires))
Eric Dumazeta50feda2012-05-18 18:57:34 +0000354 return true;
Gao feng1716a962012-04-06 00:13:10 +0000355 } else if (rt->dst.from) {
356 ort = (struct rt6_info *) rt->dst.from;
357 return (ort->rt6i_flags & RTF_EXPIRES) &&
358 time_after(jiffies, ort->dst.expires);
359 }
Eric Dumazeta50feda2012-05-18 18:57:34 +0000360 return false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361}
362
Eric Dumazeta50feda2012-05-18 18:57:34 +0000363static bool rt6_need_strict(const struct in6_addr *daddr)
Thomas Grafc71099a2006-08-04 23:20:06 -0700364{
Eric Dumazeta02cec22010-09-22 20:43:57 +0000365 return ipv6_addr_type(daddr) &
366 (IPV6_ADDR_MULTICAST | IPV6_ADDR_LINKLOCAL | IPV6_ADDR_LOOPBACK);
Thomas Grafc71099a2006-08-04 23:20:06 -0700367}
368
/*
 *	Route lookup.  The caller is expected to hold table->tb6_lock.
 */
372
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800373static inline struct rt6_info *rt6_device_match(struct net *net,
374 struct rt6_info *rt,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000375 const struct in6_addr *saddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376 int oif,
YOSHIFUJI Hideakid4208952008-06-27 20:14:54 -0700377 int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700378{
379 struct rt6_info *local = NULL;
380 struct rt6_info *sprt;
381
YOSHIFUJI Hideakidd3abc42008-07-02 18:30:18 +0900382 if (!oif && ipv6_addr_any(saddr))
383 goto out;
384
Changli Gaod8d1f302010-06-10 23:31:35 -0700385 for (sprt = rt; sprt; sprt = sprt->dst.rt6_next) {
David S. Millerd1918542011-12-28 20:19:20 -0500386 struct net_device *dev = sprt->dst.dev;
YOSHIFUJI Hideakidd3abc42008-07-02 18:30:18 +0900387
388 if (oif) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700389 if (dev->ifindex == oif)
390 return sprt;
391 if (dev->flags & IFF_LOOPBACK) {
David S. Miller38308472011-12-03 18:02:47 -0500392 if (!sprt->rt6i_idev ||
Linus Torvalds1da177e2005-04-16 15:20:36 -0700393 sprt->rt6i_idev->dev->ifindex != oif) {
YOSHIFUJI Hideakid4208952008-06-27 20:14:54 -0700394 if (flags & RT6_LOOKUP_F_IFACE && oif)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395 continue;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900396 if (local && (!oif ||
Linus Torvalds1da177e2005-04-16 15:20:36 -0700397 local->rt6i_idev->dev->ifindex == oif))
398 continue;
399 }
400 local = sprt;
401 }
YOSHIFUJI Hideakidd3abc42008-07-02 18:30:18 +0900402 } else {
403 if (ipv6_chk_addr(net, saddr, dev,
404 flags & RT6_LOOKUP_F_IFACE))
405 return sprt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700406 }
YOSHIFUJI Hideakidd3abc42008-07-02 18:30:18 +0900407 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700408
YOSHIFUJI Hideakidd3abc42008-07-02 18:30:18 +0900409 if (oif) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410 if (local)
411 return local;
412
YOSHIFUJI Hideakid4208952008-06-27 20:14:54 -0700413 if (flags & RT6_LOOKUP_F_IFACE)
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800414 return net->ipv6.ip6_null_entry;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415 }
YOSHIFUJI Hideakidd3abc42008-07-02 18:30:18 +0900416out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 return rt;
418}
419
#ifdef CONFIG_IPV6_ROUTER_PREF
/*
 * Router Reachability Probing: send a Neighbour Solicitation to the
 * solicited-node multicast address of the route's neighbour when that
 * neighbour is not in a NUD_VALID state.
 *
 * Router Reachability Probes MUST be rate-limited; the interval used here
 * is the interface's cnf.rtr_probe_interval, measured from neigh->updated.
 *
 * The rate-limit test and the update of neigh->updated are done under the
 * neighbour's write lock.  A shared read lock would let two CPUs both pass
 * the time_after() test and both send a probe, and would also write
 * neigh->updated without exclusive access.
 *
 * A NULL @rt, or a route without a neighbour, is silently ignored.
 */
static void rt6_probe(struct rt6_info *rt)
{
	struct neighbour *neigh;

	rcu_read_lock();
	neigh = rt ? dst_get_neighbour_noref(&rt->dst) : NULL;
	/* Cheap unlocked pre-check; re-validated under the lock below. */
	if (!neigh || (neigh->nud_state & NUD_VALID))
		goto out;

	write_lock_bh(&neigh->lock);
	if (!(neigh->nud_state & NUD_VALID) &&
	    time_after(jiffies,
		       neigh->updated + rt->rt6i_idev->cnf.rtr_probe_interval)) {
		struct in6_addr mcaddr;
		struct in6_addr *target;

		neigh->updated = jiffies;
		/* Drop the lock before transmitting. */
		write_unlock_bh(&neigh->lock);

		target = (struct in6_addr *)&neigh->primary_key;
		addrconf_addr_solict_mult(target, &mcaddr);
		ndisc_send_ns(rt->dst.dev, NULL, target, &mcaddr, NULL);
	} else {
		write_unlock_bh(&neigh->lock);
	}
out:
	rcu_read_unlock();
}
#else
/* Router preference support is compiled out: probing is a no-op. */
static inline void rt6_probe(struct rt6_info *rt)
{
}
#endif
459
Linus Torvalds1da177e2005-04-16 15:20:36 -0700460/*
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800461 * Default Router Selection (RFC 2461 6.3.6)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700462 */
Dave Jonesb6f99a22007-03-22 12:27:49 -0700463static inline int rt6_check_dev(struct rt6_info *rt, int oif)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700464{
David S. Millerd1918542011-12-28 20:19:20 -0500465 struct net_device *dev = rt->dst.dev;
David S. Miller161980f2007-04-06 11:42:27 -0700466 if (!oif || dev->ifindex == oif)
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800467 return 2;
David S. Miller161980f2007-04-06 11:42:27 -0700468 if ((dev->flags & IFF_LOOPBACK) &&
469 rt->rt6i_idev && rt->rt6i_idev->dev->ifindex == oif)
470 return 1;
471 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700472}
473
Dave Jonesb6f99a22007-03-22 12:27:49 -0700474static inline int rt6_check_neigh(struct rt6_info *rt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700475{
Eric Dumazetf2c31e32011-07-29 19:00:53 +0000476 struct neighbour *neigh;
YOSHIFUJI Hideaki398bcbe2008-01-19 00:35:16 -0800477 int m;
Eric Dumazetf2c31e32011-07-29 19:00:53 +0000478
479 rcu_read_lock();
David Miller27217452011-12-02 16:52:08 +0000480 neigh = dst_get_neighbour_noref(&rt->dst);
YOSHIFUJI Hideaki4d0c5912006-05-26 13:23:41 -0700481 if (rt->rt6i_flags & RTF_NONEXTHOP ||
482 !(rt->rt6i_flags & RTF_GATEWAY))
483 m = 1;
484 else if (neigh) {
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800485 read_lock_bh(&neigh->lock);
486 if (neigh->nud_state & NUD_VALID)
YOSHIFUJI Hideaki4d0c5912006-05-26 13:23:41 -0700487 m = 2;
YOSHIFUJI Hideaki398bcbe2008-01-19 00:35:16 -0800488#ifdef CONFIG_IPV6_ROUTER_PREF
489 else if (neigh->nud_state & NUD_FAILED)
490 m = 0;
491#endif
492 else
YOSHIFUJI Hideakiea73ee22006-11-06 09:45:44 -0800493 m = 1;
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800494 read_unlock_bh(&neigh->lock);
YOSHIFUJI Hideaki398bcbe2008-01-19 00:35:16 -0800495 } else
496 m = 0;
Eric Dumazetf2c31e32011-07-29 19:00:53 +0000497 rcu_read_unlock();
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800498 return m;
499}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800501static int rt6_score_route(struct rt6_info *rt, int oif,
502 int strict)
503{
YOSHIFUJI Hideaki4d0c5912006-05-26 13:23:41 -0700504 int m, n;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900505
YOSHIFUJI Hideaki4d0c5912006-05-26 13:23:41 -0700506 m = rt6_check_dev(rt, oif);
YOSHIFUJI Hideaki77d16f42006-08-23 17:25:05 -0700507 if (!m && (strict & RT6_LOOKUP_F_IFACE))
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800508 return -1;
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -0800509#ifdef CONFIG_IPV6_ROUTER_PREF
510 m |= IPV6_DECODE_PREF(IPV6_EXTRACT_PREF(rt->rt6i_flags)) << 2;
511#endif
YOSHIFUJI Hideaki4d0c5912006-05-26 13:23:41 -0700512 n = rt6_check_neigh(rt);
YOSHIFUJI Hideaki557e92e2006-11-06 09:45:45 -0800513 if (!n && (strict & RT6_LOOKUP_F_REACHABLE))
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800514 return -1;
515 return m;
516}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700517
David S. Millerf11e6652007-03-24 20:36:25 -0700518static struct rt6_info *find_match(struct rt6_info *rt, int oif, int strict,
519 int *mpri, struct rt6_info *match)
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800520{
David S. Millerf11e6652007-03-24 20:36:25 -0700521 int m;
522
523 if (rt6_check_expired(rt))
524 goto out;
525
526 m = rt6_score_route(rt, oif, strict);
527 if (m < 0)
528 goto out;
529
530 if (m > *mpri) {
531 if (strict & RT6_LOOKUP_F_REACHABLE)
532 rt6_probe(match);
533 *mpri = m;
534 match = rt;
535 } else if (strict & RT6_LOOKUP_F_REACHABLE) {
536 rt6_probe(rt);
537 }
538
539out:
540 return match;
541}
542
543static struct rt6_info *find_rr_leaf(struct fib6_node *fn,
544 struct rt6_info *rr_head,
545 u32 metric, int oif, int strict)
546{
547 struct rt6_info *rt, *match;
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800548 int mpri = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700549
David S. Millerf11e6652007-03-24 20:36:25 -0700550 match = NULL;
551 for (rt = rr_head; rt && rt->rt6i_metric == metric;
Changli Gaod8d1f302010-06-10 23:31:35 -0700552 rt = rt->dst.rt6_next)
David S. Millerf11e6652007-03-24 20:36:25 -0700553 match = find_match(rt, oif, strict, &mpri, match);
554 for (rt = fn->leaf; rt && rt != rr_head && rt->rt6i_metric == metric;
Changli Gaod8d1f302010-06-10 23:31:35 -0700555 rt = rt->dst.rt6_next)
David S. Millerf11e6652007-03-24 20:36:25 -0700556 match = find_match(rt, oif, strict, &mpri, match);
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800557
David S. Millerf11e6652007-03-24 20:36:25 -0700558 return match;
559}
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800560
David S. Millerf11e6652007-03-24 20:36:25 -0700561static struct rt6_info *rt6_select(struct fib6_node *fn, int oif, int strict)
562{
563 struct rt6_info *match, *rt0;
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800564 struct net *net;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700565
David S. Millerf11e6652007-03-24 20:36:25 -0700566 rt0 = fn->rr_ptr;
567 if (!rt0)
568 fn->rr_ptr = rt0 = fn->leaf;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700569
David S. Millerf11e6652007-03-24 20:36:25 -0700570 match = find_rr_leaf(fn, rt0, rt0->rt6i_metric, oif, strict);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800572 if (!match &&
David S. Millerf11e6652007-03-24 20:36:25 -0700573 (strict & RT6_LOOKUP_F_REACHABLE)) {
Changli Gaod8d1f302010-06-10 23:31:35 -0700574 struct rt6_info *next = rt0->dst.rt6_next;
David S. Millerf11e6652007-03-24 20:36:25 -0700575
YOSHIFUJI Hideaki554cfb72006-03-20 17:00:26 -0800576 /* no entries matched; do round-robin */
David S. Millerf11e6652007-03-24 20:36:25 -0700577 if (!next || next->rt6i_metric != rt0->rt6i_metric)
578 next = fn->leaf;
579
580 if (next != rt0)
581 fn->rr_ptr = next;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700582 }
583
David S. Millerd1918542011-12-28 20:19:20 -0500584 net = dev_net(rt0->dst.dev);
Eric Dumazeta02cec22010-09-22 20:43:57 +0000585 return match ? match : net->ipv6.ip6_null_entry;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586}
587
#ifdef CONFIG_IPV6_ROUTE_INFO
/*
 * Process a received Route Information option.
 *
 * @dev:    device the option arrived on
 * @opt:    start of the option, interpreted as struct route_info
 * @len:    number of bytes available at @opt
 * @gwaddr: address of the advertising router
 *
 * Validates the option, then adds, updates or deletes the matching
 * route-information route: a zero lifetime deletes an existing route, a
 * non-zero lifetime creates a missing one, and an existing route gets its
 * preference bits refreshed.  The expiry is then set from the lifetime
 * (or cleared for a non-finite lifetime).
 *
 * Returns 0 on success or -EINVAL for a malformed option.
 */
int rt6_route_rcv(struct net_device *dev, u8 *opt, int len,
		  const struct in6_addr *gwaddr)
{
	struct net *net = dev_net(dev);
	struct route_info *rinfo = (struct route_info *) opt;
	struct in6_addr prefix_buf, *prefix;
	unsigned int pref;
	unsigned long lifetime;
	struct rt6_info *rt;

	if (len < sizeof(struct route_info))
		return -EINVAL;

	/* Sanity check for prefix_len and length */
	if (rinfo->length > 3 || rinfo->prefix_len > 128)
		return -EINVAL;
	if (rinfo->prefix_len > 64 && rinfo->length < 2)
		return -EINVAL;
	if (rinfo->prefix_len > 0 && rinfo->length < 1)
		return -EINVAL;

	pref = rinfo->route_pref;
	if (pref == ICMPV6_ROUTER_PREF_INVALID)
		return -EINVAL;

	lifetime = addrconf_timeout_fixup(ntohl(rinfo->lifetime), HZ);

	if (rinfo->length == 3) {
		/* full 128-bit prefix present: use it in place */
		prefix = (struct in6_addr *)rinfo->prefix;
	} else {
		/* this function is safe */
		ipv6_addr_prefix(&prefix_buf,
				 (struct in6_addr *)rinfo->prefix,
				 rinfo->prefix_len);
		prefix = &prefix_buf;
	}

	rt = rt6_get_route_info(net, prefix, rinfo->prefix_len, gwaddr,
				dev->ifindex);

	if (rt && !lifetime) {
		ip6_del_rt(rt);
		rt = NULL;
	}

	if (!rt) {
		if (!lifetime)
			return 0;

		rt = rt6_add_route_info(net, prefix, rinfo->prefix_len,
					gwaddr, dev->ifindex, pref);
		if (!rt)
			return 0;
	} else {
		rt->rt6i_flags = RTF_ROUTEINFO |
				 (rt->rt6i_flags & ~RTF_PREF_MASK) |
				 RTF_PREF(pref);
	}

	if (addrconf_finite_timeout(lifetime))
		rt6_set_expires(rt, jiffies + HZ * lifetime);
	else
		rt6_clean_expires(rt);

	dst_release(&rt->dst);
	return 0;
}
#endif
660
/*
 * BACKTRACK(__net, saddr) - retry a failed lookup higher up the tree.
 *
 * Relies on the enclosing function providing a 'struct rt6_info *rt', a
 * 'struct fib6_node *fn' and the labels 'out' and 'restart'.
 *
 * When 'rt' is the namespace's null entry, walk towards the root: give up
 * (goto out) at a top-level root node; otherwise step to the parent, or,
 * if the parent has a source subtree that is not the current node, to the
 * result of looking up 'saddr' in that subtree.  As soon as the new node
 * carries route information (RTN_RTINFO), goto restart.
 *
 * Both macro parameters are parenthesised so that arbitrary expressions
 * can be passed safely.
 */
#define BACKTRACK(__net, saddr)						\
do {									\
	if (rt == (__net)->ipv6.ip6_null_entry) {			\
		struct fib6_node *pn;					\
		while (1) {						\
			if (fn->fn_flags & RTN_TL_ROOT)			\
				goto out;				\
			pn = fn->parent;				\
			if (FIB6_SUBTREE(pn) && FIB6_SUBTREE(pn) != fn)	\
				fn = fib6_lookup(FIB6_SUBTREE(pn),	\
						 NULL, (saddr));	\
			else						\
				fn = pn;				\
			if (fn->fn_flags & RTN_RTINFO)			\
				goto restart;				\
		}							\
	}								\
} while (0)
Thomas Grafc71099a2006-08-04 23:20:06 -0700678
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800679static struct rt6_info *ip6_pol_route_lookup(struct net *net,
680 struct fib6_table *table,
David S. Miller4c9483b2011-03-12 16:22:43 -0500681 struct flowi6 *fl6, int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700682{
683 struct fib6_node *fn;
684 struct rt6_info *rt;
685
Thomas Grafc71099a2006-08-04 23:20:06 -0700686 read_lock_bh(&table->tb6_lock);
David S. Miller4c9483b2011-03-12 16:22:43 -0500687 fn = fib6_lookup(&table->tb6_root, &fl6->daddr, &fl6->saddr);
Thomas Grafc71099a2006-08-04 23:20:06 -0700688restart:
689 rt = fn->leaf;
David S. Miller4c9483b2011-03-12 16:22:43 -0500690 rt = rt6_device_match(net, rt, &fl6->saddr, fl6->flowi6_oif, flags);
691 BACKTRACK(net, &fl6->saddr);
Thomas Grafc71099a2006-08-04 23:20:06 -0700692out:
Changli Gaod8d1f302010-06-10 23:31:35 -0700693 dst_use(&rt->dst, jiffies);
Thomas Grafc71099a2006-08-04 23:20:06 -0700694 read_unlock_bh(&table->tb6_lock);
Thomas Grafc71099a2006-08-04 23:20:06 -0700695 return rt;
696
697}
698
Florian Westphalea6e5742011-09-05 16:05:44 +0200699struct dst_entry * ip6_route_lookup(struct net *net, struct flowi6 *fl6,
700 int flags)
701{
702 return fib6_rule_lookup(net, fl6, flags, ip6_pol_route_lookup);
703}
704EXPORT_SYMBOL_GPL(ip6_route_lookup);
705
YOSHIFUJI Hideaki9acd9f32008-04-10 15:42:10 +0900706struct rt6_info *rt6_lookup(struct net *net, const struct in6_addr *daddr,
707 const struct in6_addr *saddr, int oif, int strict)
Thomas Grafc71099a2006-08-04 23:20:06 -0700708{
David S. Miller4c9483b2011-03-12 16:22:43 -0500709 struct flowi6 fl6 = {
710 .flowi6_oif = oif,
711 .daddr = *daddr,
Thomas Grafc71099a2006-08-04 23:20:06 -0700712 };
713 struct dst_entry *dst;
YOSHIFUJI Hideaki77d16f42006-08-23 17:25:05 -0700714 int flags = strict ? RT6_LOOKUP_F_IFACE : 0;
Thomas Grafc71099a2006-08-04 23:20:06 -0700715
Thomas Grafadaa70b2006-10-13 15:01:03 -0700716 if (saddr) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500717 memcpy(&fl6.saddr, saddr, sizeof(*saddr));
Thomas Grafadaa70b2006-10-13 15:01:03 -0700718 flags |= RT6_LOOKUP_F_HAS_SADDR;
719 }
720
David S. Miller4c9483b2011-03-12 16:22:43 -0500721 dst = fib6_rule_lookup(net, &fl6, flags, ip6_pol_route_lookup);
Thomas Grafc71099a2006-08-04 23:20:06 -0700722 if (dst->error == 0)
723 return (struct rt6_info *) dst;
724
725 dst_release(dst);
726
Linus Torvalds1da177e2005-04-16 15:20:36 -0700727 return NULL;
728}
729
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +0900730EXPORT_SYMBOL(rt6_lookup);
731
/* ip6_ins_rt is called with table->tb6_lock NOT held.
   It takes a new route entry; if the addition fails for any reason,
   the route is freed. In any case, if the caller does not hold a
   reference to it, it may be destroyed.
 */
737
Thomas Graf86872cb2006-08-22 00:01:08 -0700738static int __ip6_ins_rt(struct rt6_info *rt, struct nl_info *info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700739{
740 int err;
Thomas Grafc71099a2006-08-04 23:20:06 -0700741 struct fib6_table *table;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700742
Thomas Grafc71099a2006-08-04 23:20:06 -0700743 table = rt->rt6i_table;
744 write_lock_bh(&table->tb6_lock);
Thomas Graf86872cb2006-08-22 00:01:08 -0700745 err = fib6_add(&table->tb6_root, rt, info);
Thomas Grafc71099a2006-08-04 23:20:06 -0700746 write_unlock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747
748 return err;
749}
750
Thomas Graf40e22e82006-08-22 00:00:45 -0700751int ip6_ins_rt(struct rt6_info *rt)
752{
Denis V. Lunev4d1169c2008-01-10 03:26:13 -0800753 struct nl_info info = {
David S. Millerd1918542011-12-28 20:19:20 -0500754 .nl_net = dev_net(rt->dst.dev),
Denis V. Lunev4d1169c2008-01-10 03:26:13 -0800755 };
Denis V. Lunev528c4ce2007-12-13 09:45:12 -0800756 return __ip6_ins_rt(rt, &info);
Thomas Graf40e22e82006-08-22 00:00:45 -0700757}
758
Gao feng1716a962012-04-06 00:13:10 +0000759static struct rt6_info *rt6_alloc_cow(struct rt6_info *ort,
Eric Dumazet21efcfa2011-07-19 20:18:36 +0000760 const struct in6_addr *daddr,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000761 const struct in6_addr *saddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700762{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700763 struct rt6_info *rt;
764
765 /*
766 * Clone the route.
767 */
768
Eric Dumazet21efcfa2011-07-19 20:18:36 +0000769 rt = ip6_rt_copy(ort, daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700770
771 if (rt) {
David S. Miller14deae42009-01-04 16:04:39 -0800772 int attempts = !in_softirq();
773
David S. Miller38308472011-12-03 18:02:47 -0500774 if (!(rt->rt6i_flags & RTF_GATEWAY)) {
David S. Millerbb3c3682011-12-13 17:35:06 -0500775 if (ort->rt6i_dst.plen != 128 &&
Eric Dumazet21efcfa2011-07-19 20:18:36 +0000776 ipv6_addr_equal(&ort->rt6i_dst.addr, daddr))
YOSHIFUJI Hideaki58c4fb82005-12-21 22:56:42 +0900777 rt->rt6i_flags |= RTF_ANYCAST;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000778 rt->rt6i_gateway = *daddr;
YOSHIFUJI Hideaki58c4fb82005-12-21 22:56:42 +0900779 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780
Linus Torvalds1da177e2005-04-16 15:20:36 -0700781 rt->rt6i_flags |= RTF_CACHE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700782
783#ifdef CONFIG_IPV6_SUBTREES
784 if (rt->rt6i_src.plen && saddr) {
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000785 rt->rt6i_src.addr = *saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700786 rt->rt6i_src.plen = 128;
787 }
788#endif
789
David S. Miller14deae42009-01-04 16:04:39 -0800790 retry:
David S. Miller8ade06c2011-12-29 18:51:57 -0500791 if (rt6_bind_neighbour(rt, rt->dst.dev)) {
David S. Millerd1918542011-12-28 20:19:20 -0500792 struct net *net = dev_net(rt->dst.dev);
David S. Miller14deae42009-01-04 16:04:39 -0800793 int saved_rt_min_interval =
794 net->ipv6.sysctl.ip6_rt_gc_min_interval;
795 int saved_rt_elasticity =
796 net->ipv6.sysctl.ip6_rt_gc_elasticity;
797
798 if (attempts-- > 0) {
799 net->ipv6.sysctl.ip6_rt_gc_elasticity = 1;
800 net->ipv6.sysctl.ip6_rt_gc_min_interval = 0;
801
Alexey Dobriyan86393e52009-08-29 01:34:49 +0000802 ip6_dst_gc(&net->ipv6.ip6_dst_ops);
David S. Miller14deae42009-01-04 16:04:39 -0800803
804 net->ipv6.sysctl.ip6_rt_gc_elasticity =
805 saved_rt_elasticity;
806 net->ipv6.sysctl.ip6_rt_gc_min_interval =
807 saved_rt_min_interval;
808 goto retry;
809 }
810
Joe Perchesf3213832012-05-15 14:11:53 +0000811 net_warn_ratelimited("Neighbour table overflow\n");
Changli Gaod8d1f302010-06-10 23:31:35 -0700812 dst_free(&rt->dst);
David S. Miller14deae42009-01-04 16:04:39 -0800813 return NULL;
814 }
YOSHIFUJI Hideaki95a9a5b2006-03-20 16:55:51 -0800815 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700816
YOSHIFUJI Hideaki95a9a5b2006-03-20 16:55:51 -0800817 return rt;
818}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700819
Eric Dumazet21efcfa2011-07-19 20:18:36 +0000820static struct rt6_info *rt6_alloc_clone(struct rt6_info *ort,
821 const struct in6_addr *daddr)
YOSHIFUJI Hideaki299d9932006-03-20 16:58:32 -0800822{
Eric Dumazet21efcfa2011-07-19 20:18:36 +0000823 struct rt6_info *rt = ip6_rt_copy(ort, daddr);
824
YOSHIFUJI Hideaki299d9932006-03-20 16:58:32 -0800825 if (rt) {
YOSHIFUJI Hideaki299d9932006-03-20 16:58:32 -0800826 rt->rt6i_flags |= RTF_CACHE;
David Miller27217452011-12-02 16:52:08 +0000827 dst_set_neighbour(&rt->dst, neigh_clone(dst_get_neighbour_noref_raw(&ort->dst)));
YOSHIFUJI Hideaki299d9932006-03-20 16:58:32 -0800828 }
829 return rt;
830}
831
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800832static struct rt6_info *ip6_pol_route(struct net *net, struct fib6_table *table, int oif,
David S. Miller4c9483b2011-03-12 16:22:43 -0500833 struct flowi6 *fl6, int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700834{
835 struct fib6_node *fn;
YOSHIFUJI Hideaki519fbd82006-03-20 17:00:05 -0800836 struct rt6_info *rt, *nrt;
Thomas Grafc71099a2006-08-04 23:20:06 -0700837 int strict = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700838 int attempts = 3;
YOSHIFUJI Hideaki519fbd82006-03-20 17:00:05 -0800839 int err;
YOSHIFUJI Hideaki53b79972008-07-19 22:35:03 -0700840 int reachable = net->ipv6.devconf_all->forwarding ? 0 : RT6_LOOKUP_F_REACHABLE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700841
YOSHIFUJI Hideaki77d16f42006-08-23 17:25:05 -0700842 strict |= flags & RT6_LOOKUP_F_IFACE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700843
844relookup:
Thomas Grafc71099a2006-08-04 23:20:06 -0700845 read_lock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700846
YOSHIFUJI Hideaki8238dd02006-03-20 17:04:35 -0800847restart_2:
David S. Miller4c9483b2011-03-12 16:22:43 -0500848 fn = fib6_lookup(&table->tb6_root, &fl6->daddr, &fl6->saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700849
850restart:
Pavel Emelyanov4acad722007-10-15 13:02:51 -0700851 rt = rt6_select(fn, oif, strict | reachable);
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800852
David S. Miller4c9483b2011-03-12 16:22:43 -0500853 BACKTRACK(net, &fl6->saddr);
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800854 if (rt == net->ipv6.ip6_null_entry ||
YOSHIFUJI Hideaki8238dd02006-03-20 17:04:35 -0800855 rt->rt6i_flags & RTF_CACHE)
YOSHIFUJI Hideaki1ddef0442006-03-20 17:01:24 -0800856 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700857
Changli Gaod8d1f302010-06-10 23:31:35 -0700858 dst_hold(&rt->dst);
Thomas Grafc71099a2006-08-04 23:20:06 -0700859 read_unlock_bh(&table->tb6_lock);
YOSHIFUJI Hideakifb9de912006-03-20 16:59:08 -0800860
David Miller27217452011-12-02 16:52:08 +0000861 if (!dst_get_neighbour_noref_raw(&rt->dst) && !(rt->rt6i_flags & RTF_NONEXTHOP))
David S. Miller4c9483b2011-03-12 16:22:43 -0500862 nrt = rt6_alloc_cow(rt, &fl6->daddr, &fl6->saddr);
David S. Miller7343ff32011-03-09 19:55:25 -0800863 else if (!(rt->dst.flags & DST_HOST))
David S. Miller4c9483b2011-03-12 16:22:43 -0500864 nrt = rt6_alloc_clone(rt, &fl6->daddr);
David S. Miller7343ff32011-03-09 19:55:25 -0800865 else
866 goto out2;
YOSHIFUJI Hideakie40cf352006-03-20 16:59:27 -0800867
Changli Gaod8d1f302010-06-10 23:31:35 -0700868 dst_release(&rt->dst);
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800869 rt = nrt ? : net->ipv6.ip6_null_entry;
YOSHIFUJI Hideaki519fbd82006-03-20 17:00:05 -0800870
Changli Gaod8d1f302010-06-10 23:31:35 -0700871 dst_hold(&rt->dst);
YOSHIFUJI Hideaki519fbd82006-03-20 17:00:05 -0800872 if (nrt) {
Thomas Graf40e22e82006-08-22 00:00:45 -0700873 err = ip6_ins_rt(nrt);
YOSHIFUJI Hideaki519fbd82006-03-20 17:00:05 -0800874 if (!err)
875 goto out2;
876 }
877
878 if (--attempts <= 0)
879 goto out2;
880
881 /*
Thomas Grafc71099a2006-08-04 23:20:06 -0700882 * Race condition! In the gap, when table->tb6_lock was
YOSHIFUJI Hideaki519fbd82006-03-20 17:00:05 -0800883 * released someone could insert this route. Relookup.
884 */
Changli Gaod8d1f302010-06-10 23:31:35 -0700885 dst_release(&rt->dst);
YOSHIFUJI Hideaki519fbd82006-03-20 17:00:05 -0800886 goto relookup;
887
888out:
YOSHIFUJI Hideaki8238dd02006-03-20 17:04:35 -0800889 if (reachable) {
890 reachable = 0;
891 goto restart_2;
892 }
Changli Gaod8d1f302010-06-10 23:31:35 -0700893 dst_hold(&rt->dst);
Thomas Grafc71099a2006-08-04 23:20:06 -0700894 read_unlock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895out2:
Changli Gaod8d1f302010-06-10 23:31:35 -0700896 rt->dst.lastuse = jiffies;
897 rt->dst.__use++;
Thomas Grafc71099a2006-08-04 23:20:06 -0700898
899 return rt;
900}
901
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800902static struct rt6_info *ip6_pol_route_input(struct net *net, struct fib6_table *table,
David S. Miller4c9483b2011-03-12 16:22:43 -0500903 struct flowi6 *fl6, int flags)
Pavel Emelyanov4acad722007-10-15 13:02:51 -0700904{
David S. Miller4c9483b2011-03-12 16:22:43 -0500905 return ip6_pol_route(net, table, fl6->flowi6_iif, fl6, flags);
Pavel Emelyanov4acad722007-10-15 13:02:51 -0700906}
907
Shmulik Ladkani72331bc2012-04-01 04:03:45 +0000908static struct dst_entry *ip6_route_input_lookup(struct net *net,
909 struct net_device *dev,
910 struct flowi6 *fl6, int flags)
911{
912 if (rt6_need_strict(&fl6->daddr) && dev->type != ARPHRD_PIMREG)
913 flags |= RT6_LOOKUP_F_IFACE;
914
915 return fib6_rule_lookup(net, fl6, flags, ip6_pol_route_input);
916}
917
Thomas Grafc71099a2006-08-04 23:20:06 -0700918void ip6_route_input(struct sk_buff *skb)
919{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000920 const struct ipv6hdr *iph = ipv6_hdr(skb);
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900921 struct net *net = dev_net(skb->dev);
Thomas Grafadaa70b2006-10-13 15:01:03 -0700922 int flags = RT6_LOOKUP_F_HAS_SADDR;
David S. Miller4c9483b2011-03-12 16:22:43 -0500923 struct flowi6 fl6 = {
924 .flowi6_iif = skb->dev->ifindex,
925 .daddr = iph->daddr,
926 .saddr = iph->saddr,
David S. Miller38308472011-12-03 18:02:47 -0500927 .flowlabel = (* (__be32 *) iph) & IPV6_FLOWINFO_MASK,
David S. Miller4c9483b2011-03-12 16:22:43 -0500928 .flowi6_mark = skb->mark,
929 .flowi6_proto = iph->nexthdr,
Thomas Grafc71099a2006-08-04 23:20:06 -0700930 };
Thomas Grafadaa70b2006-10-13 15:01:03 -0700931
Shmulik Ladkani72331bc2012-04-01 04:03:45 +0000932 skb_dst_set(skb, ip6_route_input_lookup(net, skb->dev, &fl6, flags));
Thomas Grafc71099a2006-08-04 23:20:06 -0700933}
934
Daniel Lezcano8ed67782008-03-04 13:48:30 -0800935static struct rt6_info *ip6_pol_route_output(struct net *net, struct fib6_table *table,
David S. Miller4c9483b2011-03-12 16:22:43 -0500936 struct flowi6 *fl6, int flags)
Thomas Grafc71099a2006-08-04 23:20:06 -0700937{
David S. Miller4c9483b2011-03-12 16:22:43 -0500938 return ip6_pol_route(net, table, fl6->flowi6_oif, fl6, flags);
Thomas Grafc71099a2006-08-04 23:20:06 -0700939}
940
Florian Westphal9c7a4f92011-03-22 19:17:36 -0700941struct dst_entry * ip6_route_output(struct net *net, const struct sock *sk,
David S. Miller4c9483b2011-03-12 16:22:43 -0500942 struct flowi6 *fl6)
Thomas Grafc71099a2006-08-04 23:20:06 -0700943{
944 int flags = 0;
945
David McCullough4dc27d1c2012-06-25 15:42:26 +0000946 fl6->flowi6_iif = net->loopback_dev->ifindex;
947
David S. Miller4c9483b2011-03-12 16:22:43 -0500948 if ((sk && sk->sk_bound_dev_if) || rt6_need_strict(&fl6->daddr))
YOSHIFUJI Hideaki77d16f42006-08-23 17:25:05 -0700949 flags |= RT6_LOOKUP_F_IFACE;
Thomas Grafc71099a2006-08-04 23:20:06 -0700950
David S. Miller4c9483b2011-03-12 16:22:43 -0500951 if (!ipv6_addr_any(&fl6->saddr))
Thomas Grafadaa70b2006-10-13 15:01:03 -0700952 flags |= RT6_LOOKUP_F_HAS_SADDR;
YOSHIFUJI Hideaki / 吉藤英明0c9a2ac2010-03-07 00:14:44 +0000953 else if (sk)
954 flags |= rt6_srcprefs2flags(inet6_sk(sk)->srcprefs);
Thomas Grafadaa70b2006-10-13 15:01:03 -0700955
David S. Miller4c9483b2011-03-12 16:22:43 -0500956 return fib6_rule_lookup(net, fl6, flags, ip6_pol_route_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700957}
958
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +0900959EXPORT_SYMBOL(ip6_route_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700960
David S. Miller2774c132011-03-01 14:59:04 -0800961struct dst_entry *ip6_blackhole_route(struct net *net, struct dst_entry *dst_orig)
David S. Miller14e50e52007-05-24 18:17:54 -0700962{
David S. Miller5c1e6aa2011-04-28 14:13:38 -0700963 struct rt6_info *rt, *ort = (struct rt6_info *) dst_orig;
David S. Miller14e50e52007-05-24 18:17:54 -0700964 struct dst_entry *new = NULL;
965
David S. Miller5c1e6aa2011-04-28 14:13:38 -0700966 rt = dst_alloc(&ip6_dst_blackhole_ops, ort->dst.dev, 1, 0, 0);
David S. Miller14e50e52007-05-24 18:17:54 -0700967 if (rt) {
David S. Millercf911662011-04-28 14:31:47 -0700968 memset(&rt->rt6i_table, 0, sizeof(*rt) - sizeof(struct dst_entry));
David S. Miller97bab732012-06-09 22:36:36 -0700969 rt6_init_peer(rt, net->ipv6.peers);
David S. Millercf911662011-04-28 14:31:47 -0700970
Changli Gaod8d1f302010-06-10 23:31:35 -0700971 new = &rt->dst;
David S. Miller14e50e52007-05-24 18:17:54 -0700972
David S. Miller14e50e52007-05-24 18:17:54 -0700973 new->__use = 1;
Herbert Xu352e5122007-11-13 21:34:06 -0800974 new->input = dst_discard;
975 new->output = dst_discard;
David S. Miller14e50e52007-05-24 18:17:54 -0700976
Eric Dumazet21efcfa2011-07-19 20:18:36 +0000977 if (dst_metrics_read_only(&ort->dst))
978 new->_metrics = ort->dst._metrics;
979 else
980 dst_copy_metrics(new, &ort->dst);
David S. Miller14e50e52007-05-24 18:17:54 -0700981 rt->rt6i_idev = ort->rt6i_idev;
982 if (rt->rt6i_idev)
983 in6_dev_hold(rt->rt6i_idev);
David S. Miller14e50e52007-05-24 18:17:54 -0700984
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000985 rt->rt6i_gateway = ort->rt6i_gateway;
Gao feng1716a962012-04-06 00:13:10 +0000986 rt->rt6i_flags = ort->rt6i_flags;
987 rt6_clean_expires(rt);
David S. Miller14e50e52007-05-24 18:17:54 -0700988 rt->rt6i_metric = 0;
989
990 memcpy(&rt->rt6i_dst, &ort->rt6i_dst, sizeof(struct rt6key));
991#ifdef CONFIG_IPV6_SUBTREES
992 memcpy(&rt->rt6i_src, &ort->rt6i_src, sizeof(struct rt6key));
993#endif
994
995 dst_free(new);
996 }
997
David S. Miller69ead7a2011-03-01 14:45:33 -0800998 dst_release(dst_orig);
999 return new ? new : ERR_PTR(-ENOMEM);
David S. Miller14e50e52007-05-24 18:17:54 -07001000}
David S. Miller14e50e52007-05-24 18:17:54 -07001001
Linus Torvalds1da177e2005-04-16 15:20:36 -07001002/*
1003 * Destination cache support functions
1004 */
1005
1006static struct dst_entry *ip6_dst_check(struct dst_entry *dst, u32 cookie)
1007{
1008 struct rt6_info *rt;
1009
1010 rt = (struct rt6_info *) dst;
1011
David S. Miller6431cbc2011-02-07 20:38:06 -08001012 if (rt->rt6i_node && (rt->rt6i_node->fn_sernum == cookie)) {
1013 if (rt->rt6i_peer_genid != rt6_peer_genid()) {
David S. Miller97bab732012-06-09 22:36:36 -07001014 if (!rt6_has_peer(rt))
David S. Miller6431cbc2011-02-07 20:38:06 -08001015 rt6_bind_peer(rt, 0);
1016 rt->rt6i_peer_genid = rt6_peer_genid();
1017 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001018 return dst;
David S. Miller6431cbc2011-02-07 20:38:06 -08001019 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001020 return NULL;
1021}
1022
1023static struct dst_entry *ip6_negative_advice(struct dst_entry *dst)
1024{
1025 struct rt6_info *rt = (struct rt6_info *) dst;
1026
1027 if (rt) {
YOSHIFUJI Hideaki / 吉藤英明54c1a852010-03-28 07:15:45 +00001028 if (rt->rt6i_flags & RTF_CACHE) {
1029 if (rt6_check_expired(rt)) {
1030 ip6_del_rt(rt);
1031 dst = NULL;
1032 }
1033 } else {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001034 dst_release(dst);
YOSHIFUJI Hideaki / 吉藤英明54c1a852010-03-28 07:15:45 +00001035 dst = NULL;
1036 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001037 }
YOSHIFUJI Hideaki / 吉藤英明54c1a852010-03-28 07:15:45 +00001038 return dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001039}
1040
1041static void ip6_link_failure(struct sk_buff *skb)
1042{
1043 struct rt6_info *rt;
1044
Alexey Dobriyan3ffe5332010-02-18 08:25:24 +00001045 icmpv6_send(skb, ICMPV6_DEST_UNREACH, ICMPV6_ADDR_UNREACH, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001046
Eric Dumazetadf30902009-06-02 05:19:30 +00001047 rt = (struct rt6_info *) skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001048 if (rt) {
Gao feng1716a962012-04-06 00:13:10 +00001049 if (rt->rt6i_flags & RTF_CACHE)
1050 rt6_update_expires(rt, 0);
1051 else if (rt->rt6i_node && (rt->rt6i_flags & RTF_DEFAULT))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001052 rt->rt6i_node->fn_sernum = -1;
1053 }
1054}
1055
1056static void ip6_rt_update_pmtu(struct dst_entry *dst, u32 mtu)
1057{
1058 struct rt6_info *rt6 = (struct rt6_info*)dst;
1059
David S. Miller81aded22012-06-15 14:54:11 -07001060 dst_confirm(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001061 if (mtu < dst_mtu(dst) && rt6->rt6i_dst.plen == 128) {
David S. Miller81aded22012-06-15 14:54:11 -07001062 struct net *net = dev_net(dst->dev);
1063
Linus Torvalds1da177e2005-04-16 15:20:36 -07001064 rt6->rt6i_flags |= RTF_MODIFIED;
1065 if (mtu < IPV6_MIN_MTU) {
David S. Millerdefb3512010-12-08 21:16:57 -08001066 u32 features = dst_metric(dst, RTAX_FEATURES);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001067 mtu = IPV6_MIN_MTU;
David S. Millerdefb3512010-12-08 21:16:57 -08001068 features |= RTAX_FEATURE_ALLFRAG;
1069 dst_metric_set(dst, RTAX_FEATURES, features);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001070 }
David S. Millerdefb3512010-12-08 21:16:57 -08001071 dst_metric_set(dst, RTAX_MTU, mtu);
David S. Miller81aded22012-06-15 14:54:11 -07001072 rt6_update_expires(rt6, net->ipv6.sysctl.ip6_rt_mtu_expires);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001073 }
1074}
1075
David S. Miller42ae66c2012-06-15 20:01:57 -07001076void ip6_update_pmtu(struct sk_buff *skb, struct net *net, __be32 mtu,
1077 int oif, u32 mark)
David S. Miller81aded22012-06-15 14:54:11 -07001078{
1079 const struct ipv6hdr *iph = (struct ipv6hdr *) skb->data;
1080 struct dst_entry *dst;
1081 struct flowi6 fl6;
1082
1083 memset(&fl6, 0, sizeof(fl6));
1084 fl6.flowi6_oif = oif;
1085 fl6.flowi6_mark = mark;
1086 fl6.flowi6_flags = FLOWI_FLAG_PRECOW_METRICS;
1087 fl6.daddr = iph->daddr;
1088 fl6.saddr = iph->saddr;
1089 fl6.flowlabel = (*(__be32 *) iph) & IPV6_FLOWINFO_MASK;
1090
1091 dst = ip6_route_output(net, NULL, &fl6);
1092 if (!dst->error)
1093 ip6_rt_update_pmtu(dst, ntohl(mtu));
1094 dst_release(dst);
1095}
1096EXPORT_SYMBOL_GPL(ip6_update_pmtu);
1097
1098void ip6_sk_update_pmtu(struct sk_buff *skb, struct sock *sk, __be32 mtu)
1099{
1100 ip6_update_pmtu(skb, sock_net(sk), mtu,
1101 sk->sk_bound_dev_if, sk->sk_mark);
1102}
1103EXPORT_SYMBOL_GPL(ip6_sk_update_pmtu);
1104
David S. Miller0dbaee32010-12-13 12:52:14 -08001105static unsigned int ip6_default_advmss(const struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001106{
David S. Miller0dbaee32010-12-13 12:52:14 -08001107 struct net_device *dev = dst->dev;
1108 unsigned int mtu = dst_mtu(dst);
1109 struct net *net = dev_net(dev);
1110
Linus Torvalds1da177e2005-04-16 15:20:36 -07001111 mtu -= sizeof(struct ipv6hdr) + sizeof(struct tcphdr);
1112
Daniel Lezcano55786892008-03-04 13:47:47 -08001113 if (mtu < net->ipv6.sysctl.ip6_rt_min_advmss)
1114 mtu = net->ipv6.sysctl.ip6_rt_min_advmss;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001115
1116 /*
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001117 * Maximal non-jumbo IPv6 payload is IPV6_MAXPLEN and
1118 * corresponding MSS is IPV6_MAXPLEN - tcp_header_size.
1119 * IPV6_MAXPLEN is also valid and means: "any MSS,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001120 * rely only on pmtu discovery"
1121 */
1122 if (mtu > IPV6_MAXPLEN - sizeof(struct tcphdr))
1123 mtu = IPV6_MAXPLEN;
1124 return mtu;
1125}
1126
Steffen Klassertebb762f2011-11-23 02:12:51 +00001127static unsigned int ip6_mtu(const struct dst_entry *dst)
David S. Millerd33e4552010-12-14 13:01:14 -08001128{
David S. Millerd33e4552010-12-14 13:01:14 -08001129 struct inet6_dev *idev;
Steffen Klassert618f9bc2011-11-23 02:13:31 +00001130 unsigned int mtu = dst_metric_raw(dst, RTAX_MTU);
1131
1132 if (mtu)
1133 return mtu;
1134
1135 mtu = IPV6_MIN_MTU;
David S. Millerd33e4552010-12-14 13:01:14 -08001136
1137 rcu_read_lock();
1138 idev = __in6_dev_get(dst->dev);
1139 if (idev)
1140 mtu = idev->cnf.mtu6;
1141 rcu_read_unlock();
1142
1143 return mtu;
1144}
1145
YOSHIFUJI Hideaki3b009442007-12-06 16:11:48 -08001146static struct dst_entry *icmp6_dst_gc_list;
1147static DEFINE_SPINLOCK(icmp6_dst_lock);
Thomas Graf5d0bbee2006-08-04 03:37:36 -07001148
YOSHIFUJI Hideaki3b009442007-12-06 16:11:48 -08001149struct dst_entry *icmp6_dst_alloc(struct net_device *dev,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001150 struct neighbour *neigh,
David S. Miller87a11572011-12-06 17:04:13 -05001151 struct flowi6 *fl6)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001152{
David S. Miller87a11572011-12-06 17:04:13 -05001153 struct dst_entry *dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001154 struct rt6_info *rt;
1155 struct inet6_dev *idev = in6_dev_get(dev);
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001156 struct net *net = dev_net(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001157
David S. Miller38308472011-12-03 18:02:47 -05001158 if (unlikely(!idev))
Eric Dumazet122bdf62012-03-14 21:13:11 +00001159 return ERR_PTR(-ENODEV);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001160
David S. Miller8b96d222012-06-11 02:01:56 -07001161 rt = ip6_dst_alloc(net, dev, 0, NULL);
David S. Miller38308472011-12-03 18:02:47 -05001162 if (unlikely(!rt)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001163 in6_dev_put(idev);
David S. Miller87a11572011-12-06 17:04:13 -05001164 dst = ERR_PTR(-ENOMEM);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001165 goto out;
1166 }
1167
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168 if (neigh)
1169 neigh_hold(neigh);
David S. Miller14deae42009-01-04 16:04:39 -08001170 else {
David S. Millerf894cbf2012-07-02 21:52:24 -07001171 neigh = ip6_neigh_lookup(&rt->dst, NULL, &fl6->daddr);
David S. Millerb43faac2011-12-13 16:48:21 -05001172 if (IS_ERR(neigh)) {
RongQing.Li252c3d82012-01-12 22:33:46 +00001173 in6_dev_put(idev);
David S. Millerb43faac2011-12-13 16:48:21 -05001174 dst_free(&rt->dst);
1175 return ERR_CAST(neigh);
1176 }
David S. Miller14deae42009-01-04 16:04:39 -08001177 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001178
Yan, Zheng8e2ec632011-09-05 21:34:30 +00001179 rt->dst.flags |= DST_HOST;
1180 rt->dst.output = ip6_output;
David S. Miller69cce1d2011-07-17 23:09:49 -07001181 dst_set_neighbour(&rt->dst, neigh);
Changli Gaod8d1f302010-06-10 23:31:35 -07001182 atomic_set(&rt->dst.__refcnt, 1);
David S. Miller87a11572011-12-06 17:04:13 -05001183 rt->rt6i_dst.addr = fl6->daddr;
Yan, Zheng8e2ec632011-09-05 21:34:30 +00001184 rt->rt6i_dst.plen = 128;
1185 rt->rt6i_idev = idev;
Gao feng70116872011-10-28 02:46:57 +00001186 dst_metric_set(&rt->dst, RTAX_HOPLIMIT, 255);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001187
YOSHIFUJI Hideaki3b009442007-12-06 16:11:48 -08001188 spin_lock_bh(&icmp6_dst_lock);
Changli Gaod8d1f302010-06-10 23:31:35 -07001189 rt->dst.next = icmp6_dst_gc_list;
1190 icmp6_dst_gc_list = &rt->dst;
YOSHIFUJI Hideaki3b009442007-12-06 16:11:48 -08001191 spin_unlock_bh(&icmp6_dst_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001192
Daniel Lezcano55786892008-03-04 13:47:47 -08001193 fib6_force_start_gc(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001194
David S. Miller87a11572011-12-06 17:04:13 -05001195 dst = xfrm_lookup(net, &rt->dst, flowi6_to_flowi(fl6), NULL, 0);
1196
Linus Torvalds1da177e2005-04-16 15:20:36 -07001197out:
David S. Miller87a11572011-12-06 17:04:13 -05001198 return dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001199}
1200
Stephen Hemminger3d0f24a2008-07-22 14:35:50 -07001201int icmp6_dst_gc(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001202{
Hagen Paul Pfeifere9476e92011-02-25 05:45:19 +00001203 struct dst_entry *dst, **pprev;
Stephen Hemminger3d0f24a2008-07-22 14:35:50 -07001204 int more = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001205
YOSHIFUJI Hideaki3b009442007-12-06 16:11:48 -08001206 spin_lock_bh(&icmp6_dst_lock);
1207 pprev = &icmp6_dst_gc_list;
Thomas Graf5d0bbee2006-08-04 03:37:36 -07001208
Linus Torvalds1da177e2005-04-16 15:20:36 -07001209 while ((dst = *pprev) != NULL) {
1210 if (!atomic_read(&dst->__refcnt)) {
1211 *pprev = dst->next;
1212 dst_free(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001213 } else {
1214 pprev = &dst->next;
Stephen Hemminger3d0f24a2008-07-22 14:35:50 -07001215 ++more;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001216 }
1217 }
1218
YOSHIFUJI Hideaki3b009442007-12-06 16:11:48 -08001219 spin_unlock_bh(&icmp6_dst_lock);
Thomas Graf5d0bbee2006-08-04 03:37:36 -07001220
Stephen Hemminger3d0f24a2008-07-22 14:35:50 -07001221 return more;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001222}
1223
David S. Miller1e493d12008-09-10 17:27:15 -07001224static void icmp6_clean_all(int (*func)(struct rt6_info *rt, void *arg),
1225 void *arg)
1226{
1227 struct dst_entry *dst, **pprev;
1228
1229 spin_lock_bh(&icmp6_dst_lock);
1230 pprev = &icmp6_dst_gc_list;
1231 while ((dst = *pprev) != NULL) {
1232 struct rt6_info *rt = (struct rt6_info *) dst;
1233 if (func(rt, arg)) {
1234 *pprev = dst->next;
1235 dst_free(dst);
1236 } else {
1237 pprev = &dst->next;
1238 }
1239 }
1240 spin_unlock_bh(&icmp6_dst_lock);
1241}
1242
Daniel Lezcano569d3642008-01-18 03:56:57 -08001243static int ip6_dst_gc(struct dst_ops *ops)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001244{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001245 unsigned long now = jiffies;
Alexey Dobriyan86393e52009-08-29 01:34:49 +00001246 struct net *net = container_of(ops, struct net, ipv6.ip6_dst_ops);
Daniel Lezcano7019b782008-03-04 13:50:14 -08001247 int rt_min_interval = net->ipv6.sysctl.ip6_rt_gc_min_interval;
1248 int rt_max_size = net->ipv6.sysctl.ip6_rt_max_size;
1249 int rt_elasticity = net->ipv6.sysctl.ip6_rt_gc_elasticity;
1250 int rt_gc_timeout = net->ipv6.sysctl.ip6_rt_gc_timeout;
1251 unsigned long rt_last_gc = net->ipv6.ip6_rt_last_gc;
Eric Dumazetfc66f952010-10-08 06:37:34 +00001252 int entries;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001253
Eric Dumazetfc66f952010-10-08 06:37:34 +00001254 entries = dst_entries_get_fast(ops);
Daniel Lezcano7019b782008-03-04 13:50:14 -08001255 if (time_after(rt_last_gc + rt_min_interval, now) &&
Eric Dumazetfc66f952010-10-08 06:37:34 +00001256 entries <= rt_max_size)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001257 goto out;
1258
Benjamin Thery6891a342008-03-04 13:49:47 -08001259 net->ipv6.ip6_rt_gc_expire++;
1260 fib6_run_gc(net->ipv6.ip6_rt_gc_expire, net);
1261 net->ipv6.ip6_rt_last_gc = now;
Eric Dumazetfc66f952010-10-08 06:37:34 +00001262 entries = dst_entries_get_slow(ops);
1263 if (entries < ops->gc_thresh)
Daniel Lezcano7019b782008-03-04 13:50:14 -08001264 net->ipv6.ip6_rt_gc_expire = rt_gc_timeout>>1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001265out:
Daniel Lezcano7019b782008-03-04 13:50:14 -08001266 net->ipv6.ip6_rt_gc_expire -= net->ipv6.ip6_rt_gc_expire>>rt_elasticity;
Eric Dumazetfc66f952010-10-08 06:37:34 +00001267 return entries > rt_max_size;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001268}
1269
1270/* Clean host part of a prefix. Not necessary in radix tree,
1271 but results in cleaner routing tables.
1272
1273 Remove it only when all the things will work!
1274 */
1275
YOSHIFUJI Hideaki6b75d092008-03-10 06:00:30 -04001276int ip6_dst_hoplimit(struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001277{
David S. Miller5170ae82010-12-12 21:35:57 -08001278 int hoplimit = dst_metric_raw(dst, RTAX_HOPLIMIT);
David S. Millera02e4b72010-12-12 21:39:02 -08001279 if (hoplimit == 0) {
YOSHIFUJI Hideaki6b75d092008-03-10 06:00:30 -04001280 struct net_device *dev = dst->dev;
Eric Dumazetc68f24c2010-06-14 04:46:20 +00001281 struct inet6_dev *idev;
1282
1283 rcu_read_lock();
1284 idev = __in6_dev_get(dev);
1285 if (idev)
YOSHIFUJI Hideaki6b75d092008-03-10 06:00:30 -04001286 hoplimit = idev->cnf.hop_limit;
Eric Dumazetc68f24c2010-06-14 04:46:20 +00001287 else
YOSHIFUJI Hideaki53b79972008-07-19 22:35:03 -07001288 hoplimit = dev_net(dev)->ipv6.devconf_all->hop_limit;
Eric Dumazetc68f24c2010-06-14 04:46:20 +00001289 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001290 }
1291 return hoplimit;
1292}
David S. Millerabbf46a2010-12-12 21:14:46 -08001293EXPORT_SYMBOL(ip6_dst_hoplimit);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001294
1295/*
1296 *
1297 */
1298
Thomas Graf86872cb2006-08-22 00:01:08 -07001299int ip6_route_add(struct fib6_config *cfg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001300{
1301 int err;
Daniel Lezcano55786892008-03-04 13:47:47 -08001302 struct net *net = cfg->fc_nlinfo.nl_net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001303 struct rt6_info *rt = NULL;
1304 struct net_device *dev = NULL;
1305 struct inet6_dev *idev = NULL;
Thomas Grafc71099a2006-08-04 23:20:06 -07001306 struct fib6_table *table;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001307 int addr_type;
1308
Thomas Graf86872cb2006-08-22 00:01:08 -07001309 if (cfg->fc_dst_len > 128 || cfg->fc_src_len > 128)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310 return -EINVAL;
1311#ifndef CONFIG_IPV6_SUBTREES
Thomas Graf86872cb2006-08-22 00:01:08 -07001312 if (cfg->fc_src_len)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001313 return -EINVAL;
1314#endif
Thomas Graf86872cb2006-08-22 00:01:08 -07001315 if (cfg->fc_ifindex) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001316 err = -ENODEV;
Daniel Lezcano55786892008-03-04 13:47:47 -08001317 dev = dev_get_by_index(net, cfg->fc_ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001318 if (!dev)
1319 goto out;
1320 idev = in6_dev_get(dev);
1321 if (!idev)
1322 goto out;
1323 }
1324
Thomas Graf86872cb2006-08-22 00:01:08 -07001325 if (cfg->fc_metric == 0)
1326 cfg->fc_metric = IP6_RT_PRIO_USER;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001327
Matti Vaittinend71314b2011-11-14 00:14:49 +00001328 err = -ENOBUFS;
David S. Miller38308472011-12-03 18:02:47 -05001329 if (cfg->fc_nlinfo.nlh &&
1330 !(cfg->fc_nlinfo.nlh->nlmsg_flags & NLM_F_CREATE)) {
Matti Vaittinend71314b2011-11-14 00:14:49 +00001331 table = fib6_get_table(net, cfg->fc_table);
David S. Miller38308472011-12-03 18:02:47 -05001332 if (!table) {
Joe Perchesf3213832012-05-15 14:11:53 +00001333 pr_warn("NLM_F_CREATE should be specified when creating new route\n");
Matti Vaittinend71314b2011-11-14 00:14:49 +00001334 table = fib6_new_table(net, cfg->fc_table);
1335 }
1336 } else {
1337 table = fib6_new_table(net, cfg->fc_table);
1338 }
David S. Miller38308472011-12-03 18:02:47 -05001339
1340 if (!table)
Thomas Grafc71099a2006-08-04 23:20:06 -07001341 goto out;
Thomas Grafc71099a2006-08-04 23:20:06 -07001342
David S. Miller8b96d222012-06-11 02:01:56 -07001343 rt = ip6_dst_alloc(net, NULL, DST_NOCOUNT, table);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001344
David S. Miller38308472011-12-03 18:02:47 -05001345 if (!rt) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001346 err = -ENOMEM;
1347 goto out;
1348 }
1349
Changli Gaod8d1f302010-06-10 23:31:35 -07001350 rt->dst.obsolete = -1;
Gao feng1716a962012-04-06 00:13:10 +00001351
1352 if (cfg->fc_flags & RTF_EXPIRES)
1353 rt6_set_expires(rt, jiffies +
1354 clock_t_to_jiffies(cfg->fc_expires));
1355 else
1356 rt6_clean_expires(rt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001357
Thomas Graf86872cb2006-08-22 00:01:08 -07001358 if (cfg->fc_protocol == RTPROT_UNSPEC)
1359 cfg->fc_protocol = RTPROT_BOOT;
1360 rt->rt6i_protocol = cfg->fc_protocol;
1361
1362 addr_type = ipv6_addr_type(&cfg->fc_dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001363
1364 if (addr_type & IPV6_ADDR_MULTICAST)
Changli Gaod8d1f302010-06-10 23:31:35 -07001365 rt->dst.input = ip6_mc_input;
Maciej Żenczykowskiab79ad12010-09-27 00:07:02 +00001366 else if (cfg->fc_flags & RTF_LOCAL)
1367 rt->dst.input = ip6_input;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001368 else
Changli Gaod8d1f302010-06-10 23:31:35 -07001369 rt->dst.input = ip6_forward;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001370
Changli Gaod8d1f302010-06-10 23:31:35 -07001371 rt->dst.output = ip6_output;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001372
Thomas Graf86872cb2006-08-22 00:01:08 -07001373 ipv6_addr_prefix(&rt->rt6i_dst.addr, &cfg->fc_dst, cfg->fc_dst_len);
1374 rt->rt6i_dst.plen = cfg->fc_dst_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001375 if (rt->rt6i_dst.plen == 128)
David S. Miller11d53b42011-06-24 15:23:34 -07001376 rt->dst.flags |= DST_HOST;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001377
Yan, Zheng8e2ec632011-09-05 21:34:30 +00001378 if (!(rt->dst.flags & DST_HOST) && cfg->fc_mx) {
1379 u32 *metrics = kzalloc(sizeof(u32) * RTAX_MAX, GFP_KERNEL);
1380 if (!metrics) {
1381 err = -ENOMEM;
1382 goto out;
1383 }
1384 dst_init_metrics(&rt->dst, metrics, 0);
1385 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001386#ifdef CONFIG_IPV6_SUBTREES
Thomas Graf86872cb2006-08-22 00:01:08 -07001387 ipv6_addr_prefix(&rt->rt6i_src.addr, &cfg->fc_src, cfg->fc_src_len);
1388 rt->rt6i_src.plen = cfg->fc_src_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001389#endif
1390
Thomas Graf86872cb2006-08-22 00:01:08 -07001391 rt->rt6i_metric = cfg->fc_metric;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001392
1393 /* We cannot add true routes via loopback here,
1394 they would result in kernel looping; promote them to reject routes
1395 */
Thomas Graf86872cb2006-08-22 00:01:08 -07001396 if ((cfg->fc_flags & RTF_REJECT) ||
David S. Miller38308472011-12-03 18:02:47 -05001397 (dev && (dev->flags & IFF_LOOPBACK) &&
1398 !(addr_type & IPV6_ADDR_LOOPBACK) &&
1399 !(cfg->fc_flags & RTF_LOCAL))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001400 /* hold loopback dev/idev if we haven't done so. */
Daniel Lezcano55786892008-03-04 13:47:47 -08001401 if (dev != net->loopback_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001402 if (dev) {
1403 dev_put(dev);
1404 in6_dev_put(idev);
1405 }
Daniel Lezcano55786892008-03-04 13:47:47 -08001406 dev = net->loopback_dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001407 dev_hold(dev);
1408 idev = in6_dev_get(dev);
1409 if (!idev) {
1410 err = -ENODEV;
1411 goto out;
1412 }
1413 }
Changli Gaod8d1f302010-06-10 23:31:35 -07001414 rt->dst.output = ip6_pkt_discard_out;
1415 rt->dst.input = ip6_pkt_discard;
1416 rt->dst.error = -ENETUNREACH;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001417 rt->rt6i_flags = RTF_REJECT|RTF_NONEXTHOP;
1418 goto install_route;
1419 }
1420
Thomas Graf86872cb2006-08-22 00:01:08 -07001421 if (cfg->fc_flags & RTF_GATEWAY) {
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001422 const struct in6_addr *gw_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001423 int gwa_type;
1424
Thomas Graf86872cb2006-08-22 00:01:08 -07001425 gw_addr = &cfg->fc_gateway;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001426 rt->rt6i_gateway = *gw_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001427 gwa_type = ipv6_addr_type(gw_addr);
1428
1429 if (gwa_type != (IPV6_ADDR_LINKLOCAL|IPV6_ADDR_UNICAST)) {
1430 struct rt6_info *grt;
1431
1432 /* IPv6 strictly inhibits using not link-local
1433 addresses as nexthop address.
1434 Otherwise, router will not able to send redirects.
1435 It is very good, but in some (rare!) circumstances
1436 (SIT, PtP, NBMA NOARP links) it is handy to allow
1437 some exceptions. --ANK
1438 */
1439 err = -EINVAL;
David S. Miller38308472011-12-03 18:02:47 -05001440 if (!(gwa_type & IPV6_ADDR_UNICAST))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001441 goto out;
1442
Daniel Lezcano55786892008-03-04 13:47:47 -08001443 grt = rt6_lookup(net, gw_addr, NULL, cfg->fc_ifindex, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001444
1445 err = -EHOSTUNREACH;
David S. Miller38308472011-12-03 18:02:47 -05001446 if (!grt)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001447 goto out;
1448 if (dev) {
David S. Millerd1918542011-12-28 20:19:20 -05001449 if (dev != grt->dst.dev) {
Changli Gaod8d1f302010-06-10 23:31:35 -07001450 dst_release(&grt->dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001451 goto out;
1452 }
1453 } else {
David S. Millerd1918542011-12-28 20:19:20 -05001454 dev = grt->dst.dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001455 idev = grt->rt6i_idev;
1456 dev_hold(dev);
1457 in6_dev_hold(grt->rt6i_idev);
1458 }
David S. Miller38308472011-12-03 18:02:47 -05001459 if (!(grt->rt6i_flags & RTF_GATEWAY))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001460 err = 0;
Changli Gaod8d1f302010-06-10 23:31:35 -07001461 dst_release(&grt->dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001462
1463 if (err)
1464 goto out;
1465 }
1466 err = -EINVAL;
David S. Miller38308472011-12-03 18:02:47 -05001467 if (!dev || (dev->flags & IFF_LOOPBACK))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001468 goto out;
1469 }
1470
1471 err = -ENODEV;
David S. Miller38308472011-12-03 18:02:47 -05001472 if (!dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001473 goto out;
1474
Daniel Walterc3968a82011-04-13 21:10:57 +00001475 if (!ipv6_addr_any(&cfg->fc_prefsrc)) {
1476 if (!ipv6_chk_addr(net, &cfg->fc_prefsrc, dev, 0)) {
1477 err = -EINVAL;
1478 goto out;
1479 }
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001480 rt->rt6i_prefsrc.addr = cfg->fc_prefsrc;
Daniel Walterc3968a82011-04-13 21:10:57 +00001481 rt->rt6i_prefsrc.plen = 128;
1482 } else
1483 rt->rt6i_prefsrc.plen = 0;
1484
Thomas Graf86872cb2006-08-22 00:01:08 -07001485 if (cfg->fc_flags & (RTF_GATEWAY | RTF_NONEXTHOP)) {
David S. Miller8ade06c2011-12-29 18:51:57 -05001486 err = rt6_bind_neighbour(rt, dev);
David S. Millerf83c7792011-12-28 15:41:23 -05001487 if (err)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001488 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001489 }
1490
Thomas Graf86872cb2006-08-22 00:01:08 -07001491 rt->rt6i_flags = cfg->fc_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001492
1493install_route:
Thomas Graf86872cb2006-08-22 00:01:08 -07001494 if (cfg->fc_mx) {
1495 struct nlattr *nla;
1496 int remaining;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001497
Thomas Graf86872cb2006-08-22 00:01:08 -07001498 nla_for_each_attr(nla, cfg->fc_mx, cfg->fc_mx_len, remaining) {
Thomas Graf8f4c1f92007-09-12 14:44:36 +02001499 int type = nla_type(nla);
Thomas Graf86872cb2006-08-22 00:01:08 -07001500
1501 if (type) {
1502 if (type > RTAX_MAX) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001503 err = -EINVAL;
1504 goto out;
1505 }
Thomas Graf86872cb2006-08-22 00:01:08 -07001506
David S. Millerdefb3512010-12-08 21:16:57 -08001507 dst_metric_set(&rt->dst, type, nla_get_u32(nla));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001508 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001509 }
1510 }
1511
Changli Gaod8d1f302010-06-10 23:31:35 -07001512 rt->dst.dev = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001513 rt->rt6i_idev = idev;
Thomas Grafc71099a2006-08-04 23:20:06 -07001514 rt->rt6i_table = table;
Daniel Lezcano63152fc2008-03-03 23:31:11 -08001515
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001516 cfg->fc_nlinfo.nl_net = dev_net(dev);
Daniel Lezcano63152fc2008-03-03 23:31:11 -08001517
Thomas Graf86872cb2006-08-22 00:01:08 -07001518 return __ip6_ins_rt(rt, &cfg->fc_nlinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001519
1520out:
1521 if (dev)
1522 dev_put(dev);
1523 if (idev)
1524 in6_dev_put(idev);
1525 if (rt)
Changli Gaod8d1f302010-06-10 23:31:35 -07001526 dst_free(&rt->dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001527 return err;
1528}
1529
Thomas Graf86872cb2006-08-22 00:01:08 -07001530static int __ip6_del_rt(struct rt6_info *rt, struct nl_info *info)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001531{
1532 int err;
Thomas Grafc71099a2006-08-04 23:20:06 -07001533 struct fib6_table *table;
David S. Millerd1918542011-12-28 20:19:20 -05001534 struct net *net = dev_net(rt->dst.dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001535
Daniel Lezcano8ed67782008-03-04 13:48:30 -08001536 if (rt == net->ipv6.ip6_null_entry)
Patrick McHardy6c813a72006-08-06 22:22:47 -07001537 return -ENOENT;
1538
Thomas Grafc71099a2006-08-04 23:20:06 -07001539 table = rt->rt6i_table;
1540 write_lock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001541
Thomas Graf86872cb2006-08-22 00:01:08 -07001542 err = fib6_del(rt, info);
Changli Gaod8d1f302010-06-10 23:31:35 -07001543 dst_release(&rt->dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001544
Thomas Grafc71099a2006-08-04 23:20:06 -07001545 write_unlock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001546
1547 return err;
1548}
1549
Thomas Grafe0a1ad732006-08-22 00:00:21 -07001550int ip6_del_rt(struct rt6_info *rt)
1551{
Denis V. Lunev4d1169c2008-01-10 03:26:13 -08001552 struct nl_info info = {
David S. Millerd1918542011-12-28 20:19:20 -05001553 .nl_net = dev_net(rt->dst.dev),
Denis V. Lunev4d1169c2008-01-10 03:26:13 -08001554 };
Denis V. Lunev528c4ce2007-12-13 09:45:12 -08001555 return __ip6_del_rt(rt, &info);
Thomas Grafe0a1ad732006-08-22 00:00:21 -07001556}
1557
Thomas Graf86872cb2006-08-22 00:01:08 -07001558static int ip6_route_del(struct fib6_config *cfg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001559{
Thomas Grafc71099a2006-08-04 23:20:06 -07001560 struct fib6_table *table;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001561 struct fib6_node *fn;
1562 struct rt6_info *rt;
1563 int err = -ESRCH;
1564
Daniel Lezcano55786892008-03-04 13:47:47 -08001565 table = fib6_get_table(cfg->fc_nlinfo.nl_net, cfg->fc_table);
David S. Miller38308472011-12-03 18:02:47 -05001566 if (!table)
Thomas Grafc71099a2006-08-04 23:20:06 -07001567 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001568
Thomas Grafc71099a2006-08-04 23:20:06 -07001569 read_lock_bh(&table->tb6_lock);
1570
1571 fn = fib6_locate(&table->tb6_root,
Thomas Graf86872cb2006-08-22 00:01:08 -07001572 &cfg->fc_dst, cfg->fc_dst_len,
1573 &cfg->fc_src, cfg->fc_src_len);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001574
Linus Torvalds1da177e2005-04-16 15:20:36 -07001575 if (fn) {
Changli Gaod8d1f302010-06-10 23:31:35 -07001576 for (rt = fn->leaf; rt; rt = rt->dst.rt6_next) {
Thomas Graf86872cb2006-08-22 00:01:08 -07001577 if (cfg->fc_ifindex &&
David S. Millerd1918542011-12-28 20:19:20 -05001578 (!rt->dst.dev ||
1579 rt->dst.dev->ifindex != cfg->fc_ifindex))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001580 continue;
Thomas Graf86872cb2006-08-22 00:01:08 -07001581 if (cfg->fc_flags & RTF_GATEWAY &&
1582 !ipv6_addr_equal(&cfg->fc_gateway, &rt->rt6i_gateway))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001583 continue;
Thomas Graf86872cb2006-08-22 00:01:08 -07001584 if (cfg->fc_metric && cfg->fc_metric != rt->rt6i_metric)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001585 continue;
Changli Gaod8d1f302010-06-10 23:31:35 -07001586 dst_hold(&rt->dst);
Thomas Grafc71099a2006-08-04 23:20:06 -07001587 read_unlock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001588
Thomas Graf86872cb2006-08-22 00:01:08 -07001589 return __ip6_del_rt(rt, &cfg->fc_nlinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001590 }
1591 }
Thomas Grafc71099a2006-08-04 23:20:06 -07001592 read_unlock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001593
1594 return err;
1595}
1596
1597/*
1598 * Handle redirects
1599 */
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001600struct ip6rd_flowi {
David S. Miller4c9483b2011-03-12 16:22:43 -05001601 struct flowi6 fl6;
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001602 struct in6_addr gateway;
1603};
Linus Torvalds1da177e2005-04-16 15:20:36 -07001604
Daniel Lezcano8ed67782008-03-04 13:48:30 -08001605static struct rt6_info *__ip6_route_redirect(struct net *net,
1606 struct fib6_table *table,
David S. Miller4c9483b2011-03-12 16:22:43 -05001607 struct flowi6 *fl6,
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001608 int flags)
1609{
David S. Miller4c9483b2011-03-12 16:22:43 -05001610 struct ip6rd_flowi *rdfl = (struct ip6rd_flowi *)fl6;
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001611 struct rt6_info *rt;
1612 struct fib6_node *fn;
Thomas Grafc71099a2006-08-04 23:20:06 -07001613
Linus Torvalds1da177e2005-04-16 15:20:36 -07001614 /*
YOSHIFUJI Hideakie843b9e2006-03-20 17:07:49 -08001615 * Get the "current" route for this destination and
1616 * check if the redirect has come from approriate router.
1617 *
1618 * RFC 2461 specifies that redirects should only be
1619 * accepted if they come from the nexthop to the target.
1620 * Due to the way the routes are chosen, this notion
1621 * is a bit fuzzy and one might need to check all possible
1622 * routes.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001623 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001624
Thomas Grafc71099a2006-08-04 23:20:06 -07001625 read_lock_bh(&table->tb6_lock);
David S. Miller4c9483b2011-03-12 16:22:43 -05001626 fn = fib6_lookup(&table->tb6_root, &fl6->daddr, &fl6->saddr);
YOSHIFUJI Hideakie843b9e2006-03-20 17:07:49 -08001627restart:
Changli Gaod8d1f302010-06-10 23:31:35 -07001628 for (rt = fn->leaf; rt; rt = rt->dst.rt6_next) {
YOSHIFUJI Hideakie843b9e2006-03-20 17:07:49 -08001629 /*
1630 * Current route is on-link; redirect is always invalid.
1631 *
1632 * Seems, previous statement is not true. It could
1633 * be node, which looks for us as on-link (f.e. proxy ndisc)
1634 * But then router serving it might decide, that we should
1635 * know truth 8)8) --ANK (980726).
1636 */
1637 if (rt6_check_expired(rt))
1638 continue;
1639 if (!(rt->rt6i_flags & RTF_GATEWAY))
1640 continue;
David S. Millerd1918542011-12-28 20:19:20 -05001641 if (fl6->flowi6_oif != rt->dst.dev->ifindex)
YOSHIFUJI Hideakie843b9e2006-03-20 17:07:49 -08001642 continue;
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001643 if (!ipv6_addr_equal(&rdfl->gateway, &rt->rt6i_gateway))
YOSHIFUJI Hideakie843b9e2006-03-20 17:07:49 -08001644 continue;
1645 break;
1646 }
YOSHIFUJI Hideakie843b9e2006-03-20 17:07:49 -08001647
YOSHIFUJI Hideakicb15d9c2006-08-23 17:23:11 -07001648 if (!rt)
Daniel Lezcano8ed67782008-03-04 13:48:30 -08001649 rt = net->ipv6.ip6_null_entry;
David S. Miller4c9483b2011-03-12 16:22:43 -05001650 BACKTRACK(net, &fl6->saddr);
YOSHIFUJI Hideakicb15d9c2006-08-23 17:23:11 -07001651out:
Changli Gaod8d1f302010-06-10 23:31:35 -07001652 dst_hold(&rt->dst);
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001653
1654 read_unlock_bh(&table->tb6_lock);
1655
1656 return rt;
1657};
1658
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001659static struct rt6_info *ip6_route_redirect(const struct in6_addr *dest,
1660 const struct in6_addr *src,
1661 const struct in6_addr *gateway,
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001662 struct net_device *dev)
1663{
Thomas Grafadaa70b2006-10-13 15:01:03 -07001664 int flags = RT6_LOOKUP_F_HAS_SADDR;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001665 struct net *net = dev_net(dev);
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001666 struct ip6rd_flowi rdfl = {
David S. Miller4c9483b2011-03-12 16:22:43 -05001667 .fl6 = {
1668 .flowi6_oif = dev->ifindex,
1669 .daddr = *dest,
1670 .saddr = *src,
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001671 },
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001672 };
Thomas Grafadaa70b2006-10-13 15:01:03 -07001673
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001674 rdfl.gateway = *gateway;
Brian Haley86c36ce2009-10-07 13:58:01 -07001675
Thomas Grafadaa70b2006-10-13 15:01:03 -07001676 if (rt6_need_strict(dest))
1677 flags |= RT6_LOOKUP_F_IFACE;
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001678
David S. Miller4c9483b2011-03-12 16:22:43 -05001679 return (struct rt6_info *)fib6_rule_lookup(net, &rdfl.fl6,
Daniel Lezcano58f09b72008-03-03 23:25:27 -08001680 flags, __ip6_route_redirect);
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001681}
1682
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001683void rt6_redirect(const struct in6_addr *dest, const struct in6_addr *src,
1684 const struct in6_addr *saddr,
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001685 struct neighbour *neigh, u8 *lladdr, int on_link)
1686{
1687 struct rt6_info *rt, *nrt = NULL;
1688 struct netevent_redirect netevent;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001689 struct net *net = dev_net(neigh->dev);
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001690
1691 rt = ip6_route_redirect(dest, src, saddr, neigh->dev);
1692
Daniel Lezcano8ed67782008-03-04 13:48:30 -08001693 if (rt == net->ipv6.ip6_null_entry) {
Joe Perchese87cc472012-05-13 21:56:26 +00001694 net_dbg_ratelimited("rt6_redirect: source isn't a valid nexthop for redirect target\n");
YOSHIFUJI Hideakia6279452006-08-23 17:18:26 -07001695 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001696 }
1697
Linus Torvalds1da177e2005-04-16 15:20:36 -07001698 /*
1699 * We have finally decided to accept it.
1700 */
1701
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001702 neigh_update(neigh, lladdr, NUD_STALE,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001703 NEIGH_UPDATE_F_WEAK_OVERRIDE|
1704 NEIGH_UPDATE_F_OVERRIDE|
1705 (on_link ? 0 : (NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
1706 NEIGH_UPDATE_F_ISROUTER))
1707 );
1708
1709 /*
1710 * Redirect received -> path was valid.
1711 * Look, redirects are sent only in response to data packets,
1712 * so that this nexthop apparently is reachable. --ANK
1713 */
Changli Gaod8d1f302010-06-10 23:31:35 -07001714 dst_confirm(&rt->dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001715
1716 /* Duplicate redirect: silently ignore. */
David Miller27217452011-12-02 16:52:08 +00001717 if (neigh == dst_get_neighbour_noref_raw(&rt->dst))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001718 goto out;
1719
Eric Dumazet21efcfa2011-07-19 20:18:36 +00001720 nrt = ip6_rt_copy(rt, dest);
David S. Miller38308472011-12-03 18:02:47 -05001721 if (!nrt)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001722 goto out;
1723
1724 nrt->rt6i_flags = RTF_GATEWAY|RTF_UP|RTF_DYNAMIC|RTF_CACHE;
1725 if (on_link)
1726 nrt->rt6i_flags &= ~RTF_GATEWAY;
1727
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001728 nrt->rt6i_gateway = *(struct in6_addr *)neigh->primary_key;
David S. Miller69cce1d2011-07-17 23:09:49 -07001729 dst_set_neighbour(&nrt->dst, neigh_clone(neigh));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001730
Thomas Graf40e22e82006-08-22 00:00:45 -07001731 if (ip6_ins_rt(nrt))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001732 goto out;
1733
Changli Gaod8d1f302010-06-10 23:31:35 -07001734 netevent.old = &rt->dst;
1735 netevent.new = &nrt->dst;
Tom Tucker8d717402006-07-30 20:43:36 -07001736 call_netevent_notifiers(NETEVENT_REDIRECT, &netevent);
1737
David S. Miller38308472011-12-03 18:02:47 -05001738 if (rt->rt6i_flags & RTF_CACHE) {
Thomas Grafe0a1ad732006-08-22 00:00:21 -07001739 ip6_del_rt(rt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001740 return;
1741 }
1742
1743out:
Changli Gaod8d1f302010-06-10 23:31:35 -07001744 dst_release(&rt->dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001745}
1746
1747/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07001748 * Misc support functions
1749 */
1750
Gao feng1716a962012-04-06 00:13:10 +00001751static struct rt6_info *ip6_rt_copy(struct rt6_info *ort,
Eric Dumazet21efcfa2011-07-19 20:18:36 +00001752 const struct in6_addr *dest)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001753{
David S. Millerd1918542011-12-28 20:19:20 -05001754 struct net *net = dev_net(ort->dst.dev);
David S. Miller8b96d222012-06-11 02:01:56 -07001755 struct rt6_info *rt = ip6_dst_alloc(net, ort->dst.dev, 0,
1756 ort->rt6i_table);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001757
1758 if (rt) {
Changli Gaod8d1f302010-06-10 23:31:35 -07001759 rt->dst.input = ort->dst.input;
1760 rt->dst.output = ort->dst.output;
Yan, Zheng8e2ec632011-09-05 21:34:30 +00001761 rt->dst.flags |= DST_HOST;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001762
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001763 rt->rt6i_dst.addr = *dest;
Yan, Zheng8e2ec632011-09-05 21:34:30 +00001764 rt->rt6i_dst.plen = 128;
David S. Millerdefb3512010-12-08 21:16:57 -08001765 dst_copy_metrics(&rt->dst, &ort->dst);
Changli Gaod8d1f302010-06-10 23:31:35 -07001766 rt->dst.error = ort->dst.error;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001767 rt->rt6i_idev = ort->rt6i_idev;
1768 if (rt->rt6i_idev)
1769 in6_dev_hold(rt->rt6i_idev);
Changli Gaod8d1f302010-06-10 23:31:35 -07001770 rt->dst.lastuse = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001771
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001772 rt->rt6i_gateway = ort->rt6i_gateway;
Gao feng1716a962012-04-06 00:13:10 +00001773 rt->rt6i_flags = ort->rt6i_flags;
1774 if ((ort->rt6i_flags & (RTF_DEFAULT | RTF_ADDRCONF)) ==
1775 (RTF_DEFAULT | RTF_ADDRCONF))
1776 rt6_set_from(rt, ort);
1777 else
1778 rt6_clean_expires(rt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001779 rt->rt6i_metric = 0;
1780
Linus Torvalds1da177e2005-04-16 15:20:36 -07001781#ifdef CONFIG_IPV6_SUBTREES
1782 memcpy(&rt->rt6i_src, &ort->rt6i_src, sizeof(struct rt6key));
1783#endif
Florian Westphal0f6c6392011-05-20 11:27:24 +00001784 memcpy(&rt->rt6i_prefsrc, &ort->rt6i_prefsrc, sizeof(struct rt6key));
Thomas Grafc71099a2006-08-04 23:20:06 -07001785 rt->rt6i_table = ort->rt6i_table;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001786 }
1787 return rt;
1788}
1789
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001790#ifdef CONFIG_IPV6_ROUTE_INFO
Daniel Lezcanoefa2cea2008-03-04 13:46:48 -08001791static struct rt6_info *rt6_get_route_info(struct net *net,
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001792 const struct in6_addr *prefix, int prefixlen,
1793 const struct in6_addr *gwaddr, int ifindex)
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001794{
1795 struct fib6_node *fn;
1796 struct rt6_info *rt = NULL;
Thomas Grafc71099a2006-08-04 23:20:06 -07001797 struct fib6_table *table;
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001798
Daniel Lezcanoefa2cea2008-03-04 13:46:48 -08001799 table = fib6_get_table(net, RT6_TABLE_INFO);
David S. Miller38308472011-12-03 18:02:47 -05001800 if (!table)
Thomas Grafc71099a2006-08-04 23:20:06 -07001801 return NULL;
1802
1803 write_lock_bh(&table->tb6_lock);
1804 fn = fib6_locate(&table->tb6_root, prefix ,prefixlen, NULL, 0);
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001805 if (!fn)
1806 goto out;
1807
Changli Gaod8d1f302010-06-10 23:31:35 -07001808 for (rt = fn->leaf; rt; rt = rt->dst.rt6_next) {
David S. Millerd1918542011-12-28 20:19:20 -05001809 if (rt->dst.dev->ifindex != ifindex)
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001810 continue;
1811 if ((rt->rt6i_flags & (RTF_ROUTEINFO|RTF_GATEWAY)) != (RTF_ROUTEINFO|RTF_GATEWAY))
1812 continue;
1813 if (!ipv6_addr_equal(&rt->rt6i_gateway, gwaddr))
1814 continue;
Changli Gaod8d1f302010-06-10 23:31:35 -07001815 dst_hold(&rt->dst);
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001816 break;
1817 }
1818out:
Thomas Grafc71099a2006-08-04 23:20:06 -07001819 write_unlock_bh(&table->tb6_lock);
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001820 return rt;
1821}
1822
Daniel Lezcanoefa2cea2008-03-04 13:46:48 -08001823static struct rt6_info *rt6_add_route_info(struct net *net,
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001824 const struct in6_addr *prefix, int prefixlen,
1825 const struct in6_addr *gwaddr, int ifindex,
Eric Dumazet95c96172012-04-15 05:58:06 +00001826 unsigned int pref)
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001827{
Thomas Graf86872cb2006-08-22 00:01:08 -07001828 struct fib6_config cfg = {
1829 .fc_table = RT6_TABLE_INFO,
Rami Rosen238fc7e2008-02-09 23:43:11 -08001830 .fc_metric = IP6_RT_PRIO_USER,
Thomas Graf86872cb2006-08-22 00:01:08 -07001831 .fc_ifindex = ifindex,
1832 .fc_dst_len = prefixlen,
1833 .fc_flags = RTF_GATEWAY | RTF_ADDRCONF | RTF_ROUTEINFO |
1834 RTF_UP | RTF_PREF(pref),
Daniel Lezcanoefa2cea2008-03-04 13:46:48 -08001835 .fc_nlinfo.pid = 0,
1836 .fc_nlinfo.nlh = NULL,
1837 .fc_nlinfo.nl_net = net,
Thomas Graf86872cb2006-08-22 00:01:08 -07001838 };
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001839
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001840 cfg.fc_dst = *prefix;
1841 cfg.fc_gateway = *gwaddr;
Thomas Graf86872cb2006-08-22 00:01:08 -07001842
YOSHIFUJI Hideakie317da92006-03-20 17:06:42 -08001843 /* We should treat it as a default route if prefix length is 0. */
1844 if (!prefixlen)
Thomas Graf86872cb2006-08-22 00:01:08 -07001845 cfg.fc_flags |= RTF_DEFAULT;
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001846
Thomas Graf86872cb2006-08-22 00:01:08 -07001847 ip6_route_add(&cfg);
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001848
Daniel Lezcanoefa2cea2008-03-04 13:46:48 -08001849 return rt6_get_route_info(net, prefix, prefixlen, gwaddr, ifindex);
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001850}
1851#endif
1852
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001853struct rt6_info *rt6_get_dflt_router(const struct in6_addr *addr, struct net_device *dev)
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001854{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001855 struct rt6_info *rt;
Thomas Grafc71099a2006-08-04 23:20:06 -07001856 struct fib6_table *table;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001857
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001858 table = fib6_get_table(dev_net(dev), RT6_TABLE_DFLT);
David S. Miller38308472011-12-03 18:02:47 -05001859 if (!table)
Thomas Grafc71099a2006-08-04 23:20:06 -07001860 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001861
Thomas Grafc71099a2006-08-04 23:20:06 -07001862 write_lock_bh(&table->tb6_lock);
Changli Gaod8d1f302010-06-10 23:31:35 -07001863 for (rt = table->tb6_root.leaf; rt; rt=rt->dst.rt6_next) {
David S. Millerd1918542011-12-28 20:19:20 -05001864 if (dev == rt->dst.dev &&
YOSHIFUJI Hideaki045927f2006-03-20 17:00:48 -08001865 ((rt->rt6i_flags & (RTF_ADDRCONF | RTF_DEFAULT)) == (RTF_ADDRCONF | RTF_DEFAULT)) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -07001866 ipv6_addr_equal(&rt->rt6i_gateway, addr))
1867 break;
1868 }
1869 if (rt)
Changli Gaod8d1f302010-06-10 23:31:35 -07001870 dst_hold(&rt->dst);
Thomas Grafc71099a2006-08-04 23:20:06 -07001871 write_unlock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001872 return rt;
1873}
1874
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001875struct rt6_info *rt6_add_dflt_router(const struct in6_addr *gwaddr,
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001876 struct net_device *dev,
1877 unsigned int pref)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001878{
Thomas Graf86872cb2006-08-22 00:01:08 -07001879 struct fib6_config cfg = {
1880 .fc_table = RT6_TABLE_DFLT,
Rami Rosen238fc7e2008-02-09 23:43:11 -08001881 .fc_metric = IP6_RT_PRIO_USER,
Thomas Graf86872cb2006-08-22 00:01:08 -07001882 .fc_ifindex = dev->ifindex,
1883 .fc_flags = RTF_GATEWAY | RTF_ADDRCONF | RTF_DEFAULT |
1884 RTF_UP | RTF_EXPIRES | RTF_PREF(pref),
Daniel Lezcano55786892008-03-04 13:47:47 -08001885 .fc_nlinfo.pid = 0,
1886 .fc_nlinfo.nlh = NULL,
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001887 .fc_nlinfo.nl_net = dev_net(dev),
Thomas Graf86872cb2006-08-22 00:01:08 -07001888 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07001889
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001890 cfg.fc_gateway = *gwaddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001891
Thomas Graf86872cb2006-08-22 00:01:08 -07001892 ip6_route_add(&cfg);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001893
Linus Torvalds1da177e2005-04-16 15:20:36 -07001894 return rt6_get_dflt_router(gwaddr, dev);
1895}
1896
Daniel Lezcano7b4da532008-03-04 13:47:14 -08001897void rt6_purge_dflt_routers(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001898{
1899 struct rt6_info *rt;
Thomas Grafc71099a2006-08-04 23:20:06 -07001900 struct fib6_table *table;
1901
1902 /* NOTE: Keep consistent with rt6_get_dflt_router */
Daniel Lezcano7b4da532008-03-04 13:47:14 -08001903 table = fib6_get_table(net, RT6_TABLE_DFLT);
David S. Miller38308472011-12-03 18:02:47 -05001904 if (!table)
Thomas Grafc71099a2006-08-04 23:20:06 -07001905 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001906
1907restart:
Thomas Grafc71099a2006-08-04 23:20:06 -07001908 read_lock_bh(&table->tb6_lock);
Changli Gaod8d1f302010-06-10 23:31:35 -07001909 for (rt = table->tb6_root.leaf; rt; rt = rt->dst.rt6_next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001910 if (rt->rt6i_flags & (RTF_DEFAULT | RTF_ADDRCONF)) {
Changli Gaod8d1f302010-06-10 23:31:35 -07001911 dst_hold(&rt->dst);
Thomas Grafc71099a2006-08-04 23:20:06 -07001912 read_unlock_bh(&table->tb6_lock);
Thomas Grafe0a1ad732006-08-22 00:00:21 -07001913 ip6_del_rt(rt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001914 goto restart;
1915 }
1916 }
Thomas Grafc71099a2006-08-04 23:20:06 -07001917 read_unlock_bh(&table->tb6_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001918}
1919
Daniel Lezcano55786892008-03-04 13:47:47 -08001920static void rtmsg_to_fib6_config(struct net *net,
1921 struct in6_rtmsg *rtmsg,
Thomas Graf86872cb2006-08-22 00:01:08 -07001922 struct fib6_config *cfg)
1923{
1924 memset(cfg, 0, sizeof(*cfg));
1925
1926 cfg->fc_table = RT6_TABLE_MAIN;
1927 cfg->fc_ifindex = rtmsg->rtmsg_ifindex;
1928 cfg->fc_metric = rtmsg->rtmsg_metric;
1929 cfg->fc_expires = rtmsg->rtmsg_info;
1930 cfg->fc_dst_len = rtmsg->rtmsg_dst_len;
1931 cfg->fc_src_len = rtmsg->rtmsg_src_len;
1932 cfg->fc_flags = rtmsg->rtmsg_flags;
1933
Daniel Lezcano55786892008-03-04 13:47:47 -08001934 cfg->fc_nlinfo.nl_net = net;
Benjamin Theryf1243c22008-02-26 18:10:03 -08001935
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001936 cfg->fc_dst = rtmsg->rtmsg_dst;
1937 cfg->fc_src = rtmsg->rtmsg_src;
1938 cfg->fc_gateway = rtmsg->rtmsg_gateway;
Thomas Graf86872cb2006-08-22 00:01:08 -07001939}
1940
Daniel Lezcano55786892008-03-04 13:47:47 -08001941int ipv6_route_ioctl(struct net *net, unsigned int cmd, void __user *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001942{
Thomas Graf86872cb2006-08-22 00:01:08 -07001943 struct fib6_config cfg;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001944 struct in6_rtmsg rtmsg;
1945 int err;
1946
1947 switch(cmd) {
1948 case SIOCADDRT: /* Add a route */
1949 case SIOCDELRT: /* Delete a route */
1950 if (!capable(CAP_NET_ADMIN))
1951 return -EPERM;
1952 err = copy_from_user(&rtmsg, arg,
1953 sizeof(struct in6_rtmsg));
1954 if (err)
1955 return -EFAULT;
Thomas Graf86872cb2006-08-22 00:01:08 -07001956
Daniel Lezcano55786892008-03-04 13:47:47 -08001957 rtmsg_to_fib6_config(net, &rtmsg, &cfg);
Thomas Graf86872cb2006-08-22 00:01:08 -07001958
Linus Torvalds1da177e2005-04-16 15:20:36 -07001959 rtnl_lock();
1960 switch (cmd) {
1961 case SIOCADDRT:
Thomas Graf86872cb2006-08-22 00:01:08 -07001962 err = ip6_route_add(&cfg);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001963 break;
1964 case SIOCDELRT:
Thomas Graf86872cb2006-08-22 00:01:08 -07001965 err = ip6_route_del(&cfg);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001966 break;
1967 default:
1968 err = -EINVAL;
1969 }
1970 rtnl_unlock();
1971
1972 return err;
Stephen Hemminger3ff50b72007-04-20 17:09:22 -07001973 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001974
1975 return -EINVAL;
1976}
1977
1978/*
1979 * Drop the packet on the floor
1980 */
1981
Brian Haleyd5fdd6b2009-06-23 04:31:07 -07001982static int ip6_pkt_drop(struct sk_buff *skb, u8 code, int ipstats_mib_noroutes)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001983{
YOSHIFUJI Hideaki612f09e2007-04-13 16:18:02 -07001984 int type;
Eric Dumazetadf30902009-06-02 05:19:30 +00001985 struct dst_entry *dst = skb_dst(skb);
YOSHIFUJI Hideaki612f09e2007-04-13 16:18:02 -07001986 switch (ipstats_mib_noroutes) {
1987 case IPSTATS_MIB_INNOROUTES:
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001988 type = ipv6_addr_type(&ipv6_hdr(skb)->daddr);
Ulrich Weber45bb0062010-02-25 23:28:58 +00001989 if (type == IPV6_ADDR_ANY) {
Denis V. Lunev3bd653c2008-10-08 10:54:51 -07001990 IP6_INC_STATS(dev_net(dst->dev), ip6_dst_idev(dst),
1991 IPSTATS_MIB_INADDRERRORS);
YOSHIFUJI Hideaki612f09e2007-04-13 16:18:02 -07001992 break;
1993 }
1994 /* FALLTHROUGH */
1995 case IPSTATS_MIB_OUTNOROUTES:
Denis V. Lunev3bd653c2008-10-08 10:54:51 -07001996 IP6_INC_STATS(dev_net(dst->dev), ip6_dst_idev(dst),
1997 ipstats_mib_noroutes);
YOSHIFUJI Hideaki612f09e2007-04-13 16:18:02 -07001998 break;
1999 }
Alexey Dobriyan3ffe5332010-02-18 08:25:24 +00002000 icmpv6_send(skb, ICMPV6_DEST_UNREACH, code, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002001 kfree_skb(skb);
2002 return 0;
2003}
2004
Thomas Graf9ce8ade2006-10-18 20:46:54 -07002005static int ip6_pkt_discard(struct sk_buff *skb)
2006{
YOSHIFUJI Hideaki612f09e2007-04-13 16:18:02 -07002007 return ip6_pkt_drop(skb, ICMPV6_NOROUTE, IPSTATS_MIB_INNOROUTES);
Thomas Graf9ce8ade2006-10-18 20:46:54 -07002008}
2009
Arnaldo Carvalho de Melo20380732005-08-16 02:18:02 -03002010static int ip6_pkt_discard_out(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002011{
Eric Dumazetadf30902009-06-02 05:19:30 +00002012 skb->dev = skb_dst(skb)->dev;
YOSHIFUJI Hideaki612f09e2007-04-13 16:18:02 -07002013 return ip6_pkt_drop(skb, ICMPV6_NOROUTE, IPSTATS_MIB_OUTNOROUTES);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002014}
2015
David S. Miller6723ab52006-10-18 21:20:57 -07002016#ifdef CONFIG_IPV6_MULTIPLE_TABLES
2017
Thomas Graf9ce8ade2006-10-18 20:46:54 -07002018static int ip6_pkt_prohibit(struct sk_buff *skb)
2019{
YOSHIFUJI Hideaki612f09e2007-04-13 16:18:02 -07002020 return ip6_pkt_drop(skb, ICMPV6_ADM_PROHIBITED, IPSTATS_MIB_INNOROUTES);
Thomas Graf9ce8ade2006-10-18 20:46:54 -07002021}
2022
2023static int ip6_pkt_prohibit_out(struct sk_buff *skb)
2024{
Eric Dumazetadf30902009-06-02 05:19:30 +00002025 skb->dev = skb_dst(skb)->dev;
YOSHIFUJI Hideaki612f09e2007-04-13 16:18:02 -07002026 return ip6_pkt_drop(skb, ICMPV6_ADM_PROHIBITED, IPSTATS_MIB_OUTNOROUTES);
Thomas Graf9ce8ade2006-10-18 20:46:54 -07002027}
2028
David S. Miller6723ab52006-10-18 21:20:57 -07002029#endif
2030
Linus Torvalds1da177e2005-04-16 15:20:36 -07002031/*
2032 * Allocate a dst for local (unicast / anycast) address.
2033 */
2034
2035struct rt6_info *addrconf_dst_alloc(struct inet6_dev *idev,
2036 const struct in6_addr *addr,
David S. Miller8f031512011-12-06 16:48:14 -05002037 bool anycast)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002038{
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002039 struct net *net = dev_net(idev->dev);
David S. Miller8b96d222012-06-11 02:01:56 -07002040 struct rt6_info *rt = ip6_dst_alloc(net, net->loopback_dev, 0, NULL);
David S. Millerf83c7792011-12-28 15:41:23 -05002041 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002042
David S. Miller38308472011-12-03 18:02:47 -05002043 if (!rt) {
Joe Perchesf3213832012-05-15 14:11:53 +00002044 net_warn_ratelimited("Maximum number of routes reached, consider increasing route/max_size\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07002045 return ERR_PTR(-ENOMEM);
Ben Greear40385652010-11-08 12:33:48 +00002046 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002047
Linus Torvalds1da177e2005-04-16 15:20:36 -07002048 in6_dev_hold(idev);
2049
David S. Miller11d53b42011-06-24 15:23:34 -07002050 rt->dst.flags |= DST_HOST;
Changli Gaod8d1f302010-06-10 23:31:35 -07002051 rt->dst.input = ip6_input;
2052 rt->dst.output = ip6_output;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002053 rt->rt6i_idev = idev;
Changli Gaod8d1f302010-06-10 23:31:35 -07002054 rt->dst.obsolete = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002055
2056 rt->rt6i_flags = RTF_UP | RTF_NONEXTHOP;
YOSHIFUJI Hideaki58c4fb82005-12-21 22:56:42 +09002057 if (anycast)
2058 rt->rt6i_flags |= RTF_ANYCAST;
2059 else
Linus Torvalds1da177e2005-04-16 15:20:36 -07002060 rt->rt6i_flags |= RTF_LOCAL;
David S. Miller8ade06c2011-12-29 18:51:57 -05002061 err = rt6_bind_neighbour(rt, rt->dst.dev);
David S. Millerf83c7792011-12-28 15:41:23 -05002062 if (err) {
Changli Gaod8d1f302010-06-10 23:31:35 -07002063 dst_free(&rt->dst);
David S. Millerf83c7792011-12-28 15:41:23 -05002064 return ERR_PTR(err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002065 }
2066
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00002067 rt->rt6i_dst.addr = *addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002068 rt->rt6i_dst.plen = 128;
Daniel Lezcano55786892008-03-04 13:47:47 -08002069 rt->rt6i_table = fib6_get_table(net, RT6_TABLE_LOCAL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002070
Changli Gaod8d1f302010-06-10 23:31:35 -07002071 atomic_set(&rt->dst.__refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002072
2073 return rt;
2074}
2075
Daniel Walterc3968a82011-04-13 21:10:57 +00002076int ip6_route_get_saddr(struct net *net,
2077 struct rt6_info *rt,
Eric Dumazetb71d1d42011-04-22 04:53:02 +00002078 const struct in6_addr *daddr,
Daniel Walterc3968a82011-04-13 21:10:57 +00002079 unsigned int prefs,
2080 struct in6_addr *saddr)
2081{
2082 struct inet6_dev *idev = ip6_dst_idev((struct dst_entry*)rt);
2083 int err = 0;
2084 if (rt->rt6i_prefsrc.plen)
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00002085 *saddr = rt->rt6i_prefsrc.addr;
Daniel Walterc3968a82011-04-13 21:10:57 +00002086 else
2087 err = ipv6_dev_get_saddr(net, idev ? idev->dev : NULL,
2088 daddr, prefs, saddr);
2089 return err;
2090}
2091
/* remove deleted ip from prefsrc entries */

/* Argument bundle handed to fib6_remove_prefsrc() through fib6_clean_all(). */
struct arg_dev_net_ip {
	struct net_device *dev;		/* only routes on this device; NULL matches all */
	struct net *net;		/* namespace whose ip6_null_entry is skipped */
	struct in6_addr *addr;		/* address compared against rt6i_prefsrc */
};
2098
2099static int fib6_remove_prefsrc(struct rt6_info *rt, void *arg)
2100{
2101 struct net_device *dev = ((struct arg_dev_net_ip *)arg)->dev;
2102 struct net *net = ((struct arg_dev_net_ip *)arg)->net;
2103 struct in6_addr *addr = ((struct arg_dev_net_ip *)arg)->addr;
2104
David S. Millerd1918542011-12-28 20:19:20 -05002105 if (((void *)rt->dst.dev == dev || !dev) &&
Daniel Walterc3968a82011-04-13 21:10:57 +00002106 rt != net->ipv6.ip6_null_entry &&
2107 ipv6_addr_equal(addr, &rt->rt6i_prefsrc.addr)) {
2108 /* remove prefsrc entry */
2109 rt->rt6i_prefsrc.plen = 0;
2110 }
2111 return 0;
2112}
2113
2114void rt6_remove_prefsrc(struct inet6_ifaddr *ifp)
2115{
2116 struct net *net = dev_net(ifp->idev->dev);
2117 struct arg_dev_net_ip adni = {
2118 .dev = ifp->idev->dev,
2119 .net = net,
2120 .addr = &ifp->addr,
2121 };
2122 fib6_clean_all(net, fib6_remove_prefsrc, 0, &adni);
2123}
2124
/* Argument bundle handed to fib6_ifdown(). */
struct arg_dev_net {
	struct net_device *dev;		/* device to match; NULL matches every route */
	struct net *net;		/* namespace whose ip6_null_entry is exempt */
};
2129
Linus Torvalds1da177e2005-04-16 15:20:36 -07002130static int fib6_ifdown(struct rt6_info *rt, void *arg)
2131{
stephen hemmingerbc3ef662010-12-16 17:42:40 +00002132 const struct arg_dev_net *adn = arg;
2133 const struct net_device *dev = adn->dev;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002134
David S. Millerd1918542011-12-28 20:19:20 -05002135 if ((rt->dst.dev == dev || !dev) &&
David S. Millerc159d302011-12-26 15:24:36 -05002136 rt != adn->net->ipv6.ip6_null_entry)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002137 return -1;
David S. Millerc159d302011-12-26 15:24:36 -05002138
Linus Torvalds1da177e2005-04-16 15:20:36 -07002139 return 0;
2140}
2141
Daniel Lezcanof3db4852008-03-03 23:27:06 -08002142void rt6_ifdown(struct net *net, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002143{
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002144 struct arg_dev_net adn = {
2145 .dev = dev,
2146 .net = net,
2147 };
2148
2149 fib6_clean_all(net, fib6_ifdown, 0, &adn);
David S. Miller1e493d12008-09-10 17:27:15 -07002150 icmp6_clean_all(fib6_ifdown, &adn);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002151}
2152
/* Argument bundle handed to rt6_mtu_change_route(). */
struct rt6_mtu_change_arg {
	struct net_device *dev;		/* device whose MTU changed */
	unsigned int mtu;		/* the new MTU value */
};
2157
2158static int rt6_mtu_change_route(struct rt6_info *rt, void *p_arg)
2159{
2160 struct rt6_mtu_change_arg *arg = (struct rt6_mtu_change_arg *) p_arg;
2161 struct inet6_dev *idev;
2162
2163 /* In IPv6 pmtu discovery is not optional,
2164 so that RTAX_MTU lock cannot disable it.
2165 We still use this lock to block changes
2166 caused by addrconf/ndisc.
2167 */
2168
2169 idev = __in6_dev_get(arg->dev);
David S. Miller38308472011-12-03 18:02:47 -05002170 if (!idev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002171 return 0;
2172
2173 /* For administrative MTU increase, there is no way to discover
2174 IPv6 PMTU increase, so PMTU increase should be updated here.
2175 Since RFC 1981 doesn't include administrative MTU increase
2176 update PMTU increase is a MUST. (i.e. jumbo frame)
2177 */
2178 /*
2179 If new MTU is less than route PMTU, this new MTU will be the
2180 lowest MTU in the path, update the route PMTU to reflect PMTU
2181 decreases; if new MTU is greater than route PMTU, and the
2182 old MTU is the lowest MTU in the path, update the route PMTU
2183 to reflect the increase. In this case if the other nodes' MTU
2184 also have the lowest MTU, TOO BIG MESSAGE will be lead to
2185 PMTU discouvery.
2186 */
David S. Millerd1918542011-12-28 20:19:20 -05002187 if (rt->dst.dev == arg->dev &&
Changli Gaod8d1f302010-06-10 23:31:35 -07002188 !dst_metric_locked(&rt->dst, RTAX_MTU) &&
2189 (dst_mtu(&rt->dst) >= arg->mtu ||
2190 (dst_mtu(&rt->dst) < arg->mtu &&
2191 dst_mtu(&rt->dst) == idev->cnf.mtu6))) {
David S. Millerdefb3512010-12-08 21:16:57 -08002192 dst_metric_set(&rt->dst, RTAX_MTU, arg->mtu);
Simon Arlott566cfd82007-07-26 00:09:55 -07002193 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002194 return 0;
2195}
2196
Eric Dumazet95c96172012-04-15 05:58:06 +00002197void rt6_mtu_change(struct net_device *dev, unsigned int mtu)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002198{
Thomas Grafc71099a2006-08-04 23:20:06 -07002199 struct rt6_mtu_change_arg arg = {
2200 .dev = dev,
2201 .mtu = mtu,
2202 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07002203
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002204 fib6_clean_all(dev_net(dev), rt6_mtu_change_route, 0, &arg);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002205}
2206
Patrick McHardyef7c79e2007-06-05 12:38:30 -07002207static const struct nla_policy rtm_ipv6_policy[RTA_MAX+1] = {
Thomas Graf5176f912006-08-26 20:13:18 -07002208 [RTA_GATEWAY] = { .len = sizeof(struct in6_addr) },
Thomas Graf86872cb2006-08-22 00:01:08 -07002209 [RTA_OIF] = { .type = NLA_U32 },
Thomas Grafab364a62006-08-22 00:01:47 -07002210 [RTA_IIF] = { .type = NLA_U32 },
Thomas Graf86872cb2006-08-22 00:01:08 -07002211 [RTA_PRIORITY] = { .type = NLA_U32 },
2212 [RTA_METRICS] = { .type = NLA_NESTED },
2213};
2214
2215static int rtm_to_fib6_config(struct sk_buff *skb, struct nlmsghdr *nlh,
2216 struct fib6_config *cfg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002217{
Thomas Graf86872cb2006-08-22 00:01:08 -07002218 struct rtmsg *rtm;
2219 struct nlattr *tb[RTA_MAX+1];
2220 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002221
Thomas Graf86872cb2006-08-22 00:01:08 -07002222 err = nlmsg_parse(nlh, sizeof(*rtm), tb, RTA_MAX, rtm_ipv6_policy);
2223 if (err < 0)
2224 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002225
Thomas Graf86872cb2006-08-22 00:01:08 -07002226 err = -EINVAL;
2227 rtm = nlmsg_data(nlh);
2228 memset(cfg, 0, sizeof(*cfg));
2229
2230 cfg->fc_table = rtm->rtm_table;
2231 cfg->fc_dst_len = rtm->rtm_dst_len;
2232 cfg->fc_src_len = rtm->rtm_src_len;
2233 cfg->fc_flags = RTF_UP;
2234 cfg->fc_protocol = rtm->rtm_protocol;
2235
2236 if (rtm->rtm_type == RTN_UNREACHABLE)
2237 cfg->fc_flags |= RTF_REJECT;
2238
Maciej Żenczykowskiab79ad12010-09-27 00:07:02 +00002239 if (rtm->rtm_type == RTN_LOCAL)
2240 cfg->fc_flags |= RTF_LOCAL;
2241
Thomas Graf86872cb2006-08-22 00:01:08 -07002242 cfg->fc_nlinfo.pid = NETLINK_CB(skb).pid;
2243 cfg->fc_nlinfo.nlh = nlh;
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09002244 cfg->fc_nlinfo.nl_net = sock_net(skb->sk);
Thomas Graf86872cb2006-08-22 00:01:08 -07002245
2246 if (tb[RTA_GATEWAY]) {
2247 nla_memcpy(&cfg->fc_gateway, tb[RTA_GATEWAY], 16);
2248 cfg->fc_flags |= RTF_GATEWAY;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002249 }
Thomas Graf86872cb2006-08-22 00:01:08 -07002250
2251 if (tb[RTA_DST]) {
2252 int plen = (rtm->rtm_dst_len + 7) >> 3;
2253
2254 if (nla_len(tb[RTA_DST]) < plen)
2255 goto errout;
2256
2257 nla_memcpy(&cfg->fc_dst, tb[RTA_DST], plen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002258 }
Thomas Graf86872cb2006-08-22 00:01:08 -07002259
2260 if (tb[RTA_SRC]) {
2261 int plen = (rtm->rtm_src_len + 7) >> 3;
2262
2263 if (nla_len(tb[RTA_SRC]) < plen)
2264 goto errout;
2265
2266 nla_memcpy(&cfg->fc_src, tb[RTA_SRC], plen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002267 }
Thomas Graf86872cb2006-08-22 00:01:08 -07002268
Daniel Walterc3968a82011-04-13 21:10:57 +00002269 if (tb[RTA_PREFSRC])
2270 nla_memcpy(&cfg->fc_prefsrc, tb[RTA_PREFSRC], 16);
2271
Thomas Graf86872cb2006-08-22 00:01:08 -07002272 if (tb[RTA_OIF])
2273 cfg->fc_ifindex = nla_get_u32(tb[RTA_OIF]);
2274
2275 if (tb[RTA_PRIORITY])
2276 cfg->fc_metric = nla_get_u32(tb[RTA_PRIORITY]);
2277
2278 if (tb[RTA_METRICS]) {
2279 cfg->fc_mx = nla_data(tb[RTA_METRICS]);
2280 cfg->fc_mx_len = nla_len(tb[RTA_METRICS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002281 }
Thomas Graf86872cb2006-08-22 00:01:08 -07002282
2283 if (tb[RTA_TABLE])
2284 cfg->fc_table = nla_get_u32(tb[RTA_TABLE]);
2285
2286 err = 0;
2287errout:
2288 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002289}
2290
Thomas Grafc127ea22007-03-22 11:58:32 -07002291static int inet6_rtm_delroute(struct sk_buff *skb, struct nlmsghdr* nlh, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002292{
Thomas Graf86872cb2006-08-22 00:01:08 -07002293 struct fib6_config cfg;
2294 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002295
Thomas Graf86872cb2006-08-22 00:01:08 -07002296 err = rtm_to_fib6_config(skb, nlh, &cfg);
2297 if (err < 0)
2298 return err;
2299
2300 return ip6_route_del(&cfg);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002301}
2302
Thomas Grafc127ea22007-03-22 11:58:32 -07002303static int inet6_rtm_newroute(struct sk_buff *skb, struct nlmsghdr* nlh, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002304{
Thomas Graf86872cb2006-08-22 00:01:08 -07002305 struct fib6_config cfg;
2306 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002307
Thomas Graf86872cb2006-08-22 00:01:08 -07002308 err = rtm_to_fib6_config(skb, nlh, &cfg);
2309 if (err < 0)
2310 return err;
2311
2312 return ip6_route_add(&cfg);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002313}
2314
Thomas Graf339bf982006-11-10 14:10:15 -08002315static inline size_t rt6_nlmsg_size(void)
2316{
2317 return NLMSG_ALIGN(sizeof(struct rtmsg))
2318 + nla_total_size(16) /* RTA_SRC */
2319 + nla_total_size(16) /* RTA_DST */
2320 + nla_total_size(16) /* RTA_GATEWAY */
2321 + nla_total_size(16) /* RTA_PREFSRC */
2322 + nla_total_size(4) /* RTA_TABLE */
2323 + nla_total_size(4) /* RTA_IIF */
2324 + nla_total_size(4) /* RTA_OIF */
2325 + nla_total_size(4) /* RTA_PRIORITY */
Noriaki TAKAMIYA6a2b9ce2007-01-23 22:09:41 -08002326 + RTAX_MAX * nla_total_size(4) /* RTA_METRICS */
Thomas Graf339bf982006-11-10 14:10:15 -08002327 + nla_total_size(sizeof(struct rta_cacheinfo));
2328}
2329
Brian Haley191cd582008-08-14 15:33:21 -07002330static int rt6_fill_node(struct net *net,
2331 struct sk_buff *skb, struct rt6_info *rt,
Jamal Hadi Salim0d51aa82005-06-21 13:51:04 -07002332 struct in6_addr *dst, struct in6_addr *src,
2333 int iif, int type, u32 pid, u32 seq,
YOSHIFUJI Hideaki7bc570c2008-04-03 09:22:53 +09002334 int prefix, int nowait, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002335{
David S. Miller346f8702011-12-29 15:22:33 -05002336 const struct inet_peer *peer;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002337 struct rtmsg *rtm;
Thomas Graf2d7202b2006-08-22 00:01:27 -07002338 struct nlmsghdr *nlh;
Thomas Grafe3703b32006-11-27 09:27:07 -08002339 long expires;
Patrick McHardy9e762a42006-08-10 23:09:48 -07002340 u32 table;
Eric Dumazetf2c31e32011-07-29 19:00:53 +00002341 struct neighbour *n;
David S. Miller346f8702011-12-29 15:22:33 -05002342 u32 ts, tsage;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002343
2344 if (prefix) { /* user wants prefix routes only */
2345 if (!(rt->rt6i_flags & RTF_PREFIX_RT)) {
2346 /* success since this is not a prefix route */
2347 return 1;
2348 }
2349 }
2350
Thomas Graf2d7202b2006-08-22 00:01:27 -07002351 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*rtm), flags);
David S. Miller38308472011-12-03 18:02:47 -05002352 if (!nlh)
Patrick McHardy26932562007-01-31 23:16:40 -08002353 return -EMSGSIZE;
Thomas Graf2d7202b2006-08-22 00:01:27 -07002354
2355 rtm = nlmsg_data(nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002356 rtm->rtm_family = AF_INET6;
2357 rtm->rtm_dst_len = rt->rt6i_dst.plen;
2358 rtm->rtm_src_len = rt->rt6i_src.plen;
2359 rtm->rtm_tos = 0;
Thomas Grafc71099a2006-08-04 23:20:06 -07002360 if (rt->rt6i_table)
Patrick McHardy9e762a42006-08-10 23:09:48 -07002361 table = rt->rt6i_table->tb6_id;
Thomas Grafc71099a2006-08-04 23:20:06 -07002362 else
Patrick McHardy9e762a42006-08-10 23:09:48 -07002363 table = RT6_TABLE_UNSPEC;
2364 rtm->rtm_table = table;
David S. Millerc78679e2012-04-01 20:27:33 -04002365 if (nla_put_u32(skb, RTA_TABLE, table))
2366 goto nla_put_failure;
David S. Miller38308472011-12-03 18:02:47 -05002367 if (rt->rt6i_flags & RTF_REJECT)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002368 rtm->rtm_type = RTN_UNREACHABLE;
David S. Miller38308472011-12-03 18:02:47 -05002369 else if (rt->rt6i_flags & RTF_LOCAL)
Maciej Żenczykowskiab79ad12010-09-27 00:07:02 +00002370 rtm->rtm_type = RTN_LOCAL;
David S. Millerd1918542011-12-28 20:19:20 -05002371 else if (rt->dst.dev && (rt->dst.dev->flags & IFF_LOOPBACK))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002372 rtm->rtm_type = RTN_LOCAL;
2373 else
2374 rtm->rtm_type = RTN_UNICAST;
2375 rtm->rtm_flags = 0;
2376 rtm->rtm_scope = RT_SCOPE_UNIVERSE;
2377 rtm->rtm_protocol = rt->rt6i_protocol;
David S. Miller38308472011-12-03 18:02:47 -05002378 if (rt->rt6i_flags & RTF_DYNAMIC)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002379 rtm->rtm_protocol = RTPROT_REDIRECT;
2380 else if (rt->rt6i_flags & RTF_ADDRCONF)
2381 rtm->rtm_protocol = RTPROT_KERNEL;
David S. Miller38308472011-12-03 18:02:47 -05002382 else if (rt->rt6i_flags & RTF_DEFAULT)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002383 rtm->rtm_protocol = RTPROT_RA;
2384
David S. Miller38308472011-12-03 18:02:47 -05002385 if (rt->rt6i_flags & RTF_CACHE)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002386 rtm->rtm_flags |= RTM_F_CLONED;
2387
2388 if (dst) {
David S. Millerc78679e2012-04-01 20:27:33 -04002389 if (nla_put(skb, RTA_DST, 16, dst))
2390 goto nla_put_failure;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09002391 rtm->rtm_dst_len = 128;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002392 } else if (rtm->rtm_dst_len)
David S. Millerc78679e2012-04-01 20:27:33 -04002393 if (nla_put(skb, RTA_DST, 16, &rt->rt6i_dst.addr))
2394 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002395#ifdef CONFIG_IPV6_SUBTREES
2396 if (src) {
David S. Millerc78679e2012-04-01 20:27:33 -04002397 if (nla_put(skb, RTA_SRC, 16, src))
2398 goto nla_put_failure;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09002399 rtm->rtm_src_len = 128;
David S. Millerc78679e2012-04-01 20:27:33 -04002400 } else if (rtm->rtm_src_len &&
2401 nla_put(skb, RTA_SRC, 16, &rt->rt6i_src.addr))
2402 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002403#endif
YOSHIFUJI Hideaki7bc570c2008-04-03 09:22:53 +09002404 if (iif) {
2405#ifdef CONFIG_IPV6_MROUTE
2406 if (ipv6_addr_is_multicast(&rt->rt6i_dst.addr)) {
Benjamin Thery8229efd2008-12-10 16:30:15 -08002407 int err = ip6mr_get_route(net, skb, rtm, nowait);
YOSHIFUJI Hideaki7bc570c2008-04-03 09:22:53 +09002408 if (err <= 0) {
2409 if (!nowait) {
2410 if (err == 0)
2411 return 0;
2412 goto nla_put_failure;
2413 } else {
2414 if (err == -EMSGSIZE)
2415 goto nla_put_failure;
2416 }
2417 }
2418 } else
2419#endif
David S. Millerc78679e2012-04-01 20:27:33 -04002420 if (nla_put_u32(skb, RTA_IIF, iif))
2421 goto nla_put_failure;
YOSHIFUJI Hideaki7bc570c2008-04-03 09:22:53 +09002422 } else if (dst) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002423 struct in6_addr saddr_buf;
David S. Millerc78679e2012-04-01 20:27:33 -04002424 if (ip6_route_get_saddr(net, rt, dst, 0, &saddr_buf) == 0 &&
2425 nla_put(skb, RTA_PREFSRC, 16, &saddr_buf))
2426 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002427 }
Thomas Graf2d7202b2006-08-22 00:01:27 -07002428
Daniel Walterc3968a82011-04-13 21:10:57 +00002429 if (rt->rt6i_prefsrc.plen) {
2430 struct in6_addr saddr_buf;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00002431 saddr_buf = rt->rt6i_prefsrc.addr;
David S. Millerc78679e2012-04-01 20:27:33 -04002432 if (nla_put(skb, RTA_PREFSRC, 16, &saddr_buf))
2433 goto nla_put_failure;
Daniel Walterc3968a82011-04-13 21:10:57 +00002434 }
2435
David S. Millerdefb3512010-12-08 21:16:57 -08002436 if (rtnetlink_put_metrics(skb, dst_metrics_ptr(&rt->dst)) < 0)
Thomas Graf2d7202b2006-08-22 00:01:27 -07002437 goto nla_put_failure;
2438
Eric Dumazetf2c31e32011-07-29 19:00:53 +00002439 rcu_read_lock();
David Miller27217452011-12-02 16:52:08 +00002440 n = dst_get_neighbour_noref(&rt->dst);
Eric Dumazet94f826b2012-03-27 09:53:52 +00002441 if (n) {
2442 if (nla_put(skb, RTA_GATEWAY, 16, &n->primary_key) < 0) {
2443 rcu_read_unlock();
2444 goto nla_put_failure;
2445 }
2446 }
Eric Dumazetf2c31e32011-07-29 19:00:53 +00002447 rcu_read_unlock();
Thomas Graf2d7202b2006-08-22 00:01:27 -07002448
David S. Millerc78679e2012-04-01 20:27:33 -04002449 if (rt->dst.dev &&
2450 nla_put_u32(skb, RTA_OIF, rt->dst.dev->ifindex))
2451 goto nla_put_failure;
2452 if (nla_put_u32(skb, RTA_PRIORITY, rt->rt6i_metric))
2453 goto nla_put_failure;
YOSHIFUJI Hideaki36e3dea2008-05-13 02:52:55 +09002454 if (!(rt->rt6i_flags & RTF_EXPIRES))
2455 expires = 0;
David S. Millerd1918542011-12-28 20:19:20 -05002456 else if (rt->dst.expires - jiffies < INT_MAX)
2457 expires = rt->dst.expires - jiffies;
YOSHIFUJI Hideaki36e3dea2008-05-13 02:52:55 +09002458 else
2459 expires = INT_MAX;
YOSHIFUJI Hideaki69cdf8f2008-05-19 16:55:13 -07002460
David S. Miller97bab732012-06-09 22:36:36 -07002461 peer = NULL;
2462 if (rt6_has_peer(rt))
2463 peer = rt6_peer_ptr(rt);
David S. Miller346f8702011-12-29 15:22:33 -05002464 ts = tsage = 0;
2465 if (peer && peer->tcp_ts_stamp) {
2466 ts = peer->tcp_ts;
2467 tsage = get_seconds() - peer->tcp_ts_stamp;
2468 }
2469
2470 if (rtnl_put_cacheinfo(skb, &rt->dst, 0, ts, tsage,
Changli Gaod8d1f302010-06-10 23:31:35 -07002471 expires, rt->dst.error) < 0)
Thomas Grafe3703b32006-11-27 09:27:07 -08002472 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002473
Thomas Graf2d7202b2006-08-22 00:01:27 -07002474 return nlmsg_end(skb, nlh);
2475
2476nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08002477 nlmsg_cancel(skb, nlh);
2478 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002479}
2480
Patrick McHardy1b43af52006-08-10 23:11:17 -07002481int rt6_dump_route(struct rt6_info *rt, void *p_arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002482{
2483 struct rt6_rtnl_dump_arg *arg = (struct rt6_rtnl_dump_arg *) p_arg;
2484 int prefix;
2485
Thomas Graf2d7202b2006-08-22 00:01:27 -07002486 if (nlmsg_len(arg->cb->nlh) >= sizeof(struct rtmsg)) {
2487 struct rtmsg *rtm = nlmsg_data(arg->cb->nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002488 prefix = (rtm->rtm_flags & RTM_F_PREFIX) != 0;
2489 } else
2490 prefix = 0;
2491
Brian Haley191cd582008-08-14 15:33:21 -07002492 return rt6_fill_node(arg->net,
2493 arg->skb, rt, NULL, NULL, 0, RTM_NEWROUTE,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002494 NETLINK_CB(arg->cb->skb).pid, arg->cb->nlh->nlmsg_seq,
YOSHIFUJI Hideaki7bc570c2008-04-03 09:22:53 +09002495 prefix, 0, NLM_F_MULTI);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002496}
2497
Thomas Grafc127ea22007-03-22 11:58:32 -07002498static int inet6_rtm_getroute(struct sk_buff *in_skb, struct nlmsghdr* nlh, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002499{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09002500 struct net *net = sock_net(in_skb->sk);
Thomas Grafab364a62006-08-22 00:01:47 -07002501 struct nlattr *tb[RTA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -07002502 struct rt6_info *rt;
Thomas Grafab364a62006-08-22 00:01:47 -07002503 struct sk_buff *skb;
2504 struct rtmsg *rtm;
David S. Miller4c9483b2011-03-12 16:22:43 -05002505 struct flowi6 fl6;
Shmulik Ladkani72331bc2012-04-01 04:03:45 +00002506 int err, iif = 0, oif = 0;
Thomas Grafab364a62006-08-22 00:01:47 -07002507
2508 err = nlmsg_parse(nlh, sizeof(*rtm), tb, RTA_MAX, rtm_ipv6_policy);
2509 if (err < 0)
2510 goto errout;
2511
2512 err = -EINVAL;
David S. Miller4c9483b2011-03-12 16:22:43 -05002513 memset(&fl6, 0, sizeof(fl6));
Thomas Grafab364a62006-08-22 00:01:47 -07002514
2515 if (tb[RTA_SRC]) {
2516 if (nla_len(tb[RTA_SRC]) < sizeof(struct in6_addr))
2517 goto errout;
2518
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00002519 fl6.saddr = *(struct in6_addr *)nla_data(tb[RTA_SRC]);
Thomas Grafab364a62006-08-22 00:01:47 -07002520 }
2521
2522 if (tb[RTA_DST]) {
2523 if (nla_len(tb[RTA_DST]) < sizeof(struct in6_addr))
2524 goto errout;
2525
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00002526 fl6.daddr = *(struct in6_addr *)nla_data(tb[RTA_DST]);
Thomas Grafab364a62006-08-22 00:01:47 -07002527 }
2528
2529 if (tb[RTA_IIF])
2530 iif = nla_get_u32(tb[RTA_IIF]);
2531
2532 if (tb[RTA_OIF])
Shmulik Ladkani72331bc2012-04-01 04:03:45 +00002533 oif = nla_get_u32(tb[RTA_OIF]);
Thomas Grafab364a62006-08-22 00:01:47 -07002534
2535 if (iif) {
2536 struct net_device *dev;
Shmulik Ladkani72331bc2012-04-01 04:03:45 +00002537 int flags = 0;
2538
Daniel Lezcano55786892008-03-04 13:47:47 -08002539 dev = __dev_get_by_index(net, iif);
Thomas Grafab364a62006-08-22 00:01:47 -07002540 if (!dev) {
2541 err = -ENODEV;
2542 goto errout;
2543 }
Shmulik Ladkani72331bc2012-04-01 04:03:45 +00002544
2545 fl6.flowi6_iif = iif;
2546
2547 if (!ipv6_addr_any(&fl6.saddr))
2548 flags |= RT6_LOOKUP_F_HAS_SADDR;
2549
2550 rt = (struct rt6_info *)ip6_route_input_lookup(net, dev, &fl6,
2551 flags);
2552 } else {
2553 fl6.flowi6_oif = oif;
2554
2555 rt = (struct rt6_info *)ip6_route_output(net, NULL, &fl6);
Thomas Grafab364a62006-08-22 00:01:47 -07002556 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002557
2558 skb = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
David S. Miller38308472011-12-03 18:02:47 -05002559 if (!skb) {
Shmulik Ladkani2173bff2012-04-03 23:13:00 +00002560 dst_release(&rt->dst);
Thomas Grafab364a62006-08-22 00:01:47 -07002561 err = -ENOBUFS;
2562 goto errout;
2563 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002564
2565 /* Reserve room for dummy headers, this skb can pass
2566 through good chunk of routing engine.
2567 */
Arnaldo Carvalho de Melo459a98e2007-03-19 15:30:44 -07002568 skb_reset_mac_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002569 skb_reserve(skb, MAX_HEADER + sizeof(struct ipv6hdr));
2570
Changli Gaod8d1f302010-06-10 23:31:35 -07002571 skb_dst_set(skb, &rt->dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002572
David S. Miller4c9483b2011-03-12 16:22:43 -05002573 err = rt6_fill_node(net, skb, rt, &fl6.daddr, &fl6.saddr, iif,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002574 RTM_NEWROUTE, NETLINK_CB(in_skb).pid,
YOSHIFUJI Hideaki7bc570c2008-04-03 09:22:53 +09002575 nlh->nlmsg_seq, 0, 0, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002576 if (err < 0) {
Thomas Grafab364a62006-08-22 00:01:47 -07002577 kfree_skb(skb);
2578 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002579 }
2580
Daniel Lezcano55786892008-03-04 13:47:47 -08002581 err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).pid);
Thomas Grafab364a62006-08-22 00:01:47 -07002582errout:
Linus Torvalds1da177e2005-04-16 15:20:36 -07002583 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002584}
2585
Thomas Graf86872cb2006-08-22 00:01:08 -07002586void inet6_rt_notify(int event, struct rt6_info *rt, struct nl_info *info)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002587{
2588 struct sk_buff *skb;
Daniel Lezcano55786892008-03-04 13:47:47 -08002589 struct net *net = info->nl_net;
Denis V. Lunev528c4ce2007-12-13 09:45:12 -08002590 u32 seq;
2591 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002592
Denis V. Lunev528c4ce2007-12-13 09:45:12 -08002593 err = -ENOBUFS;
David S. Miller38308472011-12-03 18:02:47 -05002594 seq = info->nlh ? info->nlh->nlmsg_seq : 0;
Thomas Graf86872cb2006-08-22 00:01:08 -07002595
Thomas Graf339bf982006-11-10 14:10:15 -08002596 skb = nlmsg_new(rt6_nlmsg_size(), gfp_any());
David S. Miller38308472011-12-03 18:02:47 -05002597 if (!skb)
Thomas Graf21713eb2006-08-15 00:35:24 -07002598 goto errout;
2599
Brian Haley191cd582008-08-14 15:33:21 -07002600 err = rt6_fill_node(net, skb, rt, NULL, NULL, 0,
YOSHIFUJI Hideaki7bc570c2008-04-03 09:22:53 +09002601 event, info->pid, seq, 0, 0, 0);
Patrick McHardy26932562007-01-31 23:16:40 -08002602 if (err < 0) {
2603 /* -EMSGSIZE implies BUG in rt6_nlmsg_size() */
2604 WARN_ON(err == -EMSGSIZE);
2605 kfree_skb(skb);
2606 goto errout;
2607 }
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08002608 rtnl_notify(skb, net, info->pid, RTNLGRP_IPV6_ROUTE,
2609 info->nlh, gfp_any());
2610 return;
Thomas Graf21713eb2006-08-15 00:35:24 -07002611errout:
2612 if (err < 0)
Daniel Lezcano55786892008-03-04 13:47:47 -08002613 rtnl_set_sk_err(net, RTNLGRP_IPV6_ROUTE, err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002614}
2615
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002616static int ip6_route_dev_notify(struct notifier_block *this,
2617 unsigned long event, void *data)
2618{
2619 struct net_device *dev = (struct net_device *)data;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002620 struct net *net = dev_net(dev);
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002621
2622 if (event == NETDEV_REGISTER && (dev->flags & IFF_LOOPBACK)) {
Changli Gaod8d1f302010-06-10 23:31:35 -07002623 net->ipv6.ip6_null_entry->dst.dev = dev;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002624 net->ipv6.ip6_null_entry->rt6i_idev = in6_dev_get(dev);
2625#ifdef CONFIG_IPV6_MULTIPLE_TABLES
Changli Gaod8d1f302010-06-10 23:31:35 -07002626 net->ipv6.ip6_prohibit_entry->dst.dev = dev;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002627 net->ipv6.ip6_prohibit_entry->rt6i_idev = in6_dev_get(dev);
Changli Gaod8d1f302010-06-10 23:31:35 -07002628 net->ipv6.ip6_blk_hole_entry->dst.dev = dev;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002629 net->ipv6.ip6_blk_hole_entry->rt6i_idev = in6_dev_get(dev);
2630#endif
2631 }
2632
2633 return NOTIFY_OK;
2634}
2635
Linus Torvalds1da177e2005-04-16 15:20:36 -07002636/*
2637 * /proc
2638 */
2639
2640#ifdef CONFIG_PROC_FS
2641
/*
 * Buffer/offset bookkeeping for a /proc reader.
 * NOTE(review): no user of this structure is visible in this part of the
 * file (the /proc handlers below use seq_file) -- confirm whether it is
 * still needed.
 */
struct rt6_proc_arg {
	char *buffer;
	int offset;
	int length;
	int skip;
	int len;
};
2650
2651static int rt6_info_route(struct rt6_info *rt, void *p_arg)
2652{
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002653 struct seq_file *m = p_arg;
David S. Miller69cce1d2011-07-17 23:09:49 -07002654 struct neighbour *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002655
Harvey Harrison4b7a4272008-10-29 12:50:24 -07002656 seq_printf(m, "%pi6 %02x ", &rt->rt6i_dst.addr, rt->rt6i_dst.plen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002657
2658#ifdef CONFIG_IPV6_SUBTREES
Harvey Harrison4b7a4272008-10-29 12:50:24 -07002659 seq_printf(m, "%pi6 %02x ", &rt->rt6i_src.addr, rt->rt6i_src.plen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002660#else
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002661 seq_puts(m, "00000000000000000000000000000000 00 ");
Linus Torvalds1da177e2005-04-16 15:20:36 -07002662#endif
Eric Dumazetf2c31e32011-07-29 19:00:53 +00002663 rcu_read_lock();
David Miller27217452011-12-02 16:52:08 +00002664 n = dst_get_neighbour_noref(&rt->dst);
David S. Miller69cce1d2011-07-17 23:09:49 -07002665 if (n) {
2666 seq_printf(m, "%pi6", n->primary_key);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002667 } else {
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002668 seq_puts(m, "00000000000000000000000000000000");
Linus Torvalds1da177e2005-04-16 15:20:36 -07002669 }
Eric Dumazetf2c31e32011-07-29 19:00:53 +00002670 rcu_read_unlock();
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002671 seq_printf(m, " %08x %08x %08x %08x %8s\n",
Changli Gaod8d1f302010-06-10 23:31:35 -07002672 rt->rt6i_metric, atomic_read(&rt->dst.__refcnt),
2673 rt->dst.__use, rt->rt6i_flags,
David S. Millerd1918542011-12-28 20:19:20 -05002674 rt->dst.dev ? rt->dst.dev->name : "");
Linus Torvalds1da177e2005-04-16 15:20:36 -07002675 return 0;
2676}
2677
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002678static int ipv6_route_show(struct seq_file *m, void *v)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002679{
Daniel Lezcanof3db4852008-03-03 23:27:06 -08002680 struct net *net = (struct net *)m->private;
Josh Hunt32b293a2011-12-28 13:23:07 +00002681 fib6_clean_all_ro(net, rt6_info_route, 0, m);
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002682 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002683}
2684
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002685static int ipv6_route_open(struct inode *inode, struct file *file)
2686{
Pavel Emelyanovde05c552008-07-18 04:07:21 -07002687 return single_open_net(inode, file, ipv6_route_show);
Daniel Lezcanof3db4852008-03-03 23:27:06 -08002688}
2689
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002690static const struct file_operations ipv6_route_proc_fops = {
2691 .owner = THIS_MODULE,
2692 .open = ipv6_route_open,
2693 .read = seq_read,
2694 .llseek = seq_lseek,
Pavel Emelyanovb6fcbdb2008-07-18 04:07:44 -07002695 .release = single_release_net,
Alexey Dobriyan33120b32007-11-06 05:27:11 -08002696};
2697
Linus Torvalds1da177e2005-04-16 15:20:36 -07002698static int rt6_stats_seq_show(struct seq_file *seq, void *v)
2699{
Daniel Lezcano69ddb802008-03-04 13:46:23 -08002700 struct net *net = (struct net *)seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002701 seq_printf(seq, "%04x %04x %04x %04x %04x %04x %04x\n",
Daniel Lezcano69ddb802008-03-04 13:46:23 -08002702 net->ipv6.rt6_stats->fib_nodes,
2703 net->ipv6.rt6_stats->fib_route_nodes,
2704 net->ipv6.rt6_stats->fib_rt_alloc,
2705 net->ipv6.rt6_stats->fib_rt_entries,
2706 net->ipv6.rt6_stats->fib_rt_cache,
Eric Dumazetfc66f952010-10-08 06:37:34 +00002707 dst_entries_get_slow(&net->ipv6.ip6_dst_ops),
Daniel Lezcano69ddb802008-03-04 13:46:23 -08002708 net->ipv6.rt6_stats->fib_discarded_routes);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002709
2710 return 0;
2711}
2712
2713static int rt6_stats_seq_open(struct inode *inode, struct file *file)
2714{
Pavel Emelyanovde05c552008-07-18 04:07:21 -07002715 return single_open_net(inode, file, rt6_stats_seq_show);
Daniel Lezcano69ddb802008-03-04 13:46:23 -08002716}
2717
Arjan van de Ven9a321442007-02-12 00:55:35 -08002718static const struct file_operations rt6_stats_seq_fops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002719 .owner = THIS_MODULE,
2720 .open = rt6_stats_seq_open,
2721 .read = seq_read,
2722 .llseek = seq_lseek,
Pavel Emelyanovb6fcbdb2008-07-18 04:07:44 -07002723 .release = single_release_net,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002724};
2725#endif /* CONFIG_PROC_FS */
2726
2727#ifdef CONFIG_SYSCTL
2728
Linus Torvalds1da177e2005-04-16 15:20:36 -07002729static
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002730int ipv6_sysctl_rtcache_flush(ctl_table *ctl, int write,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002731 void __user *buffer, size_t *lenp, loff_t *ppos)
2732{
Lucian Adrian Grijincuc486da32011-02-24 19:48:03 +00002733 struct net *net;
2734 int delay;
2735 if (!write)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002736 return -EINVAL;
Lucian Adrian Grijincuc486da32011-02-24 19:48:03 +00002737
2738 net = (struct net *)ctl->extra1;
2739 delay = net->ipv6.sysctl.flush_delay;
2740 proc_dointvec(ctl, write, buffer, lenp, ppos);
2741 fib6_run_gc(delay <= 0 ? ~0UL : (unsigned long)delay, net);
2742 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002743}
2744
Daniel Lezcano760f2d02008-01-10 02:53:43 -08002745ctl_table ipv6_route_table_template[] = {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09002746 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002747 .procname = "flush",
Daniel Lezcano49905092008-01-10 03:01:01 -08002748 .data = &init_net.ipv6.sysctl.flush_delay,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002749 .maxlen = sizeof(int),
Dave Jones89c8b3a12005-04-28 12:11:49 -07002750 .mode = 0200,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002751 .proc_handler = ipv6_sysctl_rtcache_flush
Linus Torvalds1da177e2005-04-16 15:20:36 -07002752 },
2753 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002754 .procname = "gc_thresh",
Daniel Lezcano9a7ec3a2008-03-04 13:48:53 -08002755 .data = &ip6_dst_ops_template.gc_thresh,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002756 .maxlen = sizeof(int),
2757 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002758 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002759 },
2760 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002761 .procname = "max_size",
Daniel Lezcano49905092008-01-10 03:01:01 -08002762 .data = &init_net.ipv6.sysctl.ip6_rt_max_size,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002763 .maxlen = sizeof(int),
2764 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002765 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002766 },
2767 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002768 .procname = "gc_min_interval",
Daniel Lezcano49905092008-01-10 03:01:01 -08002769 .data = &init_net.ipv6.sysctl.ip6_rt_gc_min_interval,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002770 .maxlen = sizeof(int),
2771 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002772 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002773 },
2774 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002775 .procname = "gc_timeout",
Daniel Lezcano49905092008-01-10 03:01:01 -08002776 .data = &init_net.ipv6.sysctl.ip6_rt_gc_timeout,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002777 .maxlen = sizeof(int),
2778 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002779 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002780 },
2781 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002782 .procname = "gc_interval",
Daniel Lezcano49905092008-01-10 03:01:01 -08002783 .data = &init_net.ipv6.sysctl.ip6_rt_gc_interval,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002784 .maxlen = sizeof(int),
2785 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002786 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002787 },
2788 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002789 .procname = "gc_elasticity",
Daniel Lezcano49905092008-01-10 03:01:01 -08002790 .data = &init_net.ipv6.sysctl.ip6_rt_gc_elasticity,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002791 .maxlen = sizeof(int),
2792 .mode = 0644,
Min Zhangf3d3f612010-08-14 22:42:51 -07002793 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002794 },
2795 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002796 .procname = "mtu_expires",
Daniel Lezcano49905092008-01-10 03:01:01 -08002797 .data = &init_net.ipv6.sysctl.ip6_rt_mtu_expires,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002798 .maxlen = sizeof(int),
2799 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002800 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002801 },
2802 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002803 .procname = "min_adv_mss",
Daniel Lezcano49905092008-01-10 03:01:01 -08002804 .data = &init_net.ipv6.sysctl.ip6_rt_min_advmss,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002805 .maxlen = sizeof(int),
2806 .mode = 0644,
Min Zhangf3d3f612010-08-14 22:42:51 -07002807 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002808 },
2809 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002810 .procname = "gc_min_interval_ms",
Daniel Lezcano49905092008-01-10 03:01:01 -08002811 .data = &init_net.ipv6.sysctl.ip6_rt_gc_min_interval,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002812 .maxlen = sizeof(int),
2813 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002814 .proc_handler = proc_dointvec_ms_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002815 },
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002816 { }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002817};
2818
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002819struct ctl_table * __net_init ipv6_route_sysctl_init(struct net *net)
Daniel Lezcano760f2d02008-01-10 02:53:43 -08002820{
2821 struct ctl_table *table;
2822
2823 table = kmemdup(ipv6_route_table_template,
2824 sizeof(ipv6_route_table_template),
2825 GFP_KERNEL);
YOSHIFUJI Hideaki5ee09102008-02-28 00:24:28 +09002826
2827 if (table) {
2828 table[0].data = &net->ipv6.sysctl.flush_delay;
Lucian Adrian Grijincuc486da32011-02-24 19:48:03 +00002829 table[0].extra1 = net;
Alexey Dobriyan86393e52009-08-29 01:34:49 +00002830 table[1].data = &net->ipv6.ip6_dst_ops.gc_thresh;
YOSHIFUJI Hideaki5ee09102008-02-28 00:24:28 +09002831 table[2].data = &net->ipv6.sysctl.ip6_rt_max_size;
2832 table[3].data = &net->ipv6.sysctl.ip6_rt_gc_min_interval;
2833 table[4].data = &net->ipv6.sysctl.ip6_rt_gc_timeout;
2834 table[5].data = &net->ipv6.sysctl.ip6_rt_gc_interval;
2835 table[6].data = &net->ipv6.sysctl.ip6_rt_gc_elasticity;
2836 table[7].data = &net->ipv6.sysctl.ip6_rt_mtu_expires;
2837 table[8].data = &net->ipv6.sysctl.ip6_rt_min_advmss;
Alexey Dobriyan9c69fab2009-12-18 20:11:03 -08002838 table[9].data = &net->ipv6.sysctl.ip6_rt_gc_min_interval;
YOSHIFUJI Hideaki5ee09102008-02-28 00:24:28 +09002839 }
2840
Daniel Lezcano760f2d02008-01-10 02:53:43 -08002841 return table;
2842}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002843#endif
2844
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002845static int __net_init ip6_route_net_init(struct net *net)
Daniel Lezcanocdb18762008-03-04 13:45:33 -08002846{
Pavel Emelyanov633d4242008-04-21 14:25:23 -07002847 int ret = -ENOMEM;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002848
Alexey Dobriyan86393e52009-08-29 01:34:49 +00002849 memcpy(&net->ipv6.ip6_dst_ops, &ip6_dst_ops_template,
2850 sizeof(net->ipv6.ip6_dst_ops));
Benjamin Theryf2fc6a52008-03-04 13:49:23 -08002851
Eric Dumazetfc66f952010-10-08 06:37:34 +00002852 if (dst_entries_init(&net->ipv6.ip6_dst_ops) < 0)
2853 goto out_ip6_dst_ops;
2854
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002855 net->ipv6.ip6_null_entry = kmemdup(&ip6_null_entry_template,
2856 sizeof(*net->ipv6.ip6_null_entry),
2857 GFP_KERNEL);
2858 if (!net->ipv6.ip6_null_entry)
Eric Dumazetfc66f952010-10-08 06:37:34 +00002859 goto out_ip6_dst_entries;
Changli Gaod8d1f302010-06-10 23:31:35 -07002860 net->ipv6.ip6_null_entry->dst.path =
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002861 (struct dst_entry *)net->ipv6.ip6_null_entry;
Changli Gaod8d1f302010-06-10 23:31:35 -07002862 net->ipv6.ip6_null_entry->dst.ops = &net->ipv6.ip6_dst_ops;
David S. Miller62fa8a82011-01-26 20:51:05 -08002863 dst_init_metrics(&net->ipv6.ip6_null_entry->dst,
2864 ip6_template_metrics, true);
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002865
2866#ifdef CONFIG_IPV6_MULTIPLE_TABLES
2867 net->ipv6.ip6_prohibit_entry = kmemdup(&ip6_prohibit_entry_template,
2868 sizeof(*net->ipv6.ip6_prohibit_entry),
2869 GFP_KERNEL);
Peter Zijlstra68fffc62008-10-07 14:12:10 -07002870 if (!net->ipv6.ip6_prohibit_entry)
2871 goto out_ip6_null_entry;
Changli Gaod8d1f302010-06-10 23:31:35 -07002872 net->ipv6.ip6_prohibit_entry->dst.path =
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002873 (struct dst_entry *)net->ipv6.ip6_prohibit_entry;
Changli Gaod8d1f302010-06-10 23:31:35 -07002874 net->ipv6.ip6_prohibit_entry->dst.ops = &net->ipv6.ip6_dst_ops;
David S. Miller62fa8a82011-01-26 20:51:05 -08002875 dst_init_metrics(&net->ipv6.ip6_prohibit_entry->dst,
2876 ip6_template_metrics, true);
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002877
2878 net->ipv6.ip6_blk_hole_entry = kmemdup(&ip6_blk_hole_entry_template,
2879 sizeof(*net->ipv6.ip6_blk_hole_entry),
2880 GFP_KERNEL);
Peter Zijlstra68fffc62008-10-07 14:12:10 -07002881 if (!net->ipv6.ip6_blk_hole_entry)
2882 goto out_ip6_prohibit_entry;
Changli Gaod8d1f302010-06-10 23:31:35 -07002883 net->ipv6.ip6_blk_hole_entry->dst.path =
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002884 (struct dst_entry *)net->ipv6.ip6_blk_hole_entry;
Changli Gaod8d1f302010-06-10 23:31:35 -07002885 net->ipv6.ip6_blk_hole_entry->dst.ops = &net->ipv6.ip6_dst_ops;
David S. Miller62fa8a82011-01-26 20:51:05 -08002886 dst_init_metrics(&net->ipv6.ip6_blk_hole_entry->dst,
2887 ip6_template_metrics, true);
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002888#endif
2889
Peter Zijlstrab339a47c2008-10-07 14:15:00 -07002890 net->ipv6.sysctl.flush_delay = 0;
2891 net->ipv6.sysctl.ip6_rt_max_size = 4096;
2892 net->ipv6.sysctl.ip6_rt_gc_min_interval = HZ / 2;
2893 net->ipv6.sysctl.ip6_rt_gc_timeout = 60*HZ;
2894 net->ipv6.sysctl.ip6_rt_gc_interval = 30*HZ;
2895 net->ipv6.sysctl.ip6_rt_gc_elasticity = 9;
2896 net->ipv6.sysctl.ip6_rt_mtu_expires = 10*60*HZ;
2897 net->ipv6.sysctl.ip6_rt_min_advmss = IPV6_MIN_MTU - 20 - 40;
2898
Benjamin Thery6891a342008-03-04 13:49:47 -08002899 net->ipv6.ip6_rt_gc_expire = 30*HZ;
2900
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002901 ret = 0;
2902out:
2903 return ret;
Benjamin Theryf2fc6a52008-03-04 13:49:23 -08002904
Peter Zijlstra68fffc62008-10-07 14:12:10 -07002905#ifdef CONFIG_IPV6_MULTIPLE_TABLES
2906out_ip6_prohibit_entry:
2907 kfree(net->ipv6.ip6_prohibit_entry);
2908out_ip6_null_entry:
2909 kfree(net->ipv6.ip6_null_entry);
2910#endif
Eric Dumazetfc66f952010-10-08 06:37:34 +00002911out_ip6_dst_entries:
2912 dst_entries_destroy(&net->ipv6.ip6_dst_ops);
Benjamin Theryf2fc6a52008-03-04 13:49:23 -08002913out_ip6_dst_ops:
Benjamin Theryf2fc6a52008-03-04 13:49:23 -08002914 goto out;
Daniel Lezcanocdb18762008-03-04 13:45:33 -08002915}
2916
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002917static void __net_exit ip6_route_net_exit(struct net *net)
Daniel Lezcanocdb18762008-03-04 13:45:33 -08002918{
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002919 kfree(net->ipv6.ip6_null_entry);
2920#ifdef CONFIG_IPV6_MULTIPLE_TABLES
2921 kfree(net->ipv6.ip6_prohibit_entry);
2922 kfree(net->ipv6.ip6_blk_hole_entry);
2923#endif
Xiaotian Feng41bb78b2010-11-02 16:11:05 +00002924 dst_entries_destroy(&net->ipv6.ip6_dst_ops);
Daniel Lezcanocdb18762008-03-04 13:45:33 -08002925}
2926
Thomas Grafd1896342012-06-18 12:08:33 +00002927static int __net_init ip6_route_net_init_late(struct net *net)
2928{
2929#ifdef CONFIG_PROC_FS
2930 proc_net_fops_create(net, "ipv6_route", 0, &ipv6_route_proc_fops);
2931 proc_net_fops_create(net, "rt6_stats", S_IRUGO, &rt6_stats_seq_fops);
2932#endif
2933 return 0;
2934}
2935
2936static void __net_exit ip6_route_net_exit_late(struct net *net)
2937{
2938#ifdef CONFIG_PROC_FS
2939 proc_net_remove(net, "ipv6_route");
2940 proc_net_remove(net, "rt6_stats");
2941#endif
2942}
2943
Daniel Lezcanocdb18762008-03-04 13:45:33 -08002944static struct pernet_operations ip6_route_net_ops = {
2945 .init = ip6_route_net_init,
2946 .exit = ip6_route_net_exit,
2947};
2948
David S. Millerc3426b42012-06-09 16:27:05 -07002949static int __net_init ipv6_inetpeer_init(struct net *net)
2950{
2951 struct inet_peer_base *bp = kmalloc(sizeof(*bp), GFP_KERNEL);
2952
2953 if (!bp)
2954 return -ENOMEM;
2955 inet_peer_base_init(bp);
2956 net->ipv6.peers = bp;
2957 return 0;
2958}
2959
2960static void __net_exit ipv6_inetpeer_exit(struct net *net)
2961{
2962 struct inet_peer_base *bp = net->ipv6.peers;
2963
2964 net->ipv6.peers = NULL;
David S. Miller56a6b242012-06-09 16:32:41 -07002965 inetpeer_invalidate_tree(bp);
David S. Millerc3426b42012-06-09 16:27:05 -07002966 kfree(bp);
2967}
2968
David S. Miller2b823f72012-06-09 19:00:16 -07002969static struct pernet_operations ipv6_inetpeer_ops = {
David S. Millerc3426b42012-06-09 16:27:05 -07002970 .init = ipv6_inetpeer_init,
2971 .exit = ipv6_inetpeer_exit,
2972};
2973
Thomas Grafd1896342012-06-18 12:08:33 +00002974static struct pernet_operations ip6_route_net_late_ops = {
2975 .init = ip6_route_net_init_late,
2976 .exit = ip6_route_net_exit_late,
2977};
2978
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002979static struct notifier_block ip6_route_dev_notifier = {
2980 .notifier_call = ip6_route_dev_notify,
2981 .priority = 0,
2982};
2983
Daniel Lezcano433d49c2007-12-07 00:43:48 -08002984int __init ip6_route_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002985{
Daniel Lezcano433d49c2007-12-07 00:43:48 -08002986 int ret;
2987
Daniel Lezcano9a7ec3a2008-03-04 13:48:53 -08002988 ret = -ENOMEM;
2989 ip6_dst_ops_template.kmem_cachep =
2990 kmem_cache_create("ip6_dst_cache", sizeof(struct rt6_info), 0,
2991 SLAB_HWCACHE_ALIGN, NULL);
2992 if (!ip6_dst_ops_template.kmem_cachep)
Fernando Carrijoc19a28e2009-01-07 18:09:08 -08002993 goto out;
David S. Miller14e50e52007-05-24 18:17:54 -07002994
Eric Dumazetfc66f952010-10-08 06:37:34 +00002995 ret = dst_entries_init(&ip6_dst_blackhole_ops);
Daniel Lezcano8ed67782008-03-04 13:48:30 -08002996 if (ret)
Daniel Lezcanobdb32892008-03-04 13:48:10 -08002997 goto out_kmem_cache;
Daniel Lezcanobdb32892008-03-04 13:48:10 -08002998
David S. Millerc3426b42012-06-09 16:27:05 -07002999 ret = register_pernet_subsys(&ipv6_inetpeer_ops);
3000 if (ret)
David S. Millere8803b62012-06-16 01:12:19 -07003001 goto out_dst_entries;
Thomas Graf2a0c4512012-06-14 23:00:17 +00003002
David S. Miller7e52b332012-06-15 15:51:55 -07003003 ret = register_pernet_subsys(&ip6_route_net_ops);
3004 if (ret)
3005 goto out_register_inetpeer;
David S. Millerc3426b42012-06-09 16:27:05 -07003006
Arnaud Ebalard5dc121e2008-10-01 02:37:56 -07003007 ip6_dst_blackhole_ops.kmem_cachep = ip6_dst_ops_template.kmem_cachep;
3008
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003009 /* Registering of the loopback is done before this portion of code,
3010 * the loopback reference in rt6_info will not be taken, do it
3011 * manually for init_net */
Changli Gaod8d1f302010-06-10 23:31:35 -07003012 init_net.ipv6.ip6_null_entry->dst.dev = init_net.loopback_dev;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003013 init_net.ipv6.ip6_null_entry->rt6i_idev = in6_dev_get(init_net.loopback_dev);
3014 #ifdef CONFIG_IPV6_MULTIPLE_TABLES
Changli Gaod8d1f302010-06-10 23:31:35 -07003015 init_net.ipv6.ip6_prohibit_entry->dst.dev = init_net.loopback_dev;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003016 init_net.ipv6.ip6_prohibit_entry->rt6i_idev = in6_dev_get(init_net.loopback_dev);
Changli Gaod8d1f302010-06-10 23:31:35 -07003017 init_net.ipv6.ip6_blk_hole_entry->dst.dev = init_net.loopback_dev;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003018 init_net.ipv6.ip6_blk_hole_entry->rt6i_idev = in6_dev_get(init_net.loopback_dev);
3019 #endif
David S. Millere8803b62012-06-16 01:12:19 -07003020 ret = fib6_init();
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003021 if (ret)
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003022 goto out_register_subsys;
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003023
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003024 ret = xfrm6_init();
3025 if (ret)
David S. Millere8803b62012-06-16 01:12:19 -07003026 goto out_fib6_init;
Daniel Lezcanoc35b7e72007-12-08 00:14:11 -08003027
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003028 ret = fib6_rules_init();
3029 if (ret)
3030 goto xfrm6_init;
Daniel Lezcano7e5449c2007-12-08 00:14:54 -08003031
Thomas Grafd1896342012-06-18 12:08:33 +00003032 ret = register_pernet_subsys(&ip6_route_net_late_ops);
3033 if (ret)
3034 goto fib6_rules_init;
3035
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003036 ret = -ENOBUFS;
Greg Rosec7ac8672011-06-10 01:27:09 +00003037 if (__rtnl_register(PF_INET6, RTM_NEWROUTE, inet6_rtm_newroute, NULL, NULL) ||
3038 __rtnl_register(PF_INET6, RTM_DELROUTE, inet6_rtm_delroute, NULL, NULL) ||
3039 __rtnl_register(PF_INET6, RTM_GETROUTE, inet6_rtm_getroute, NULL, NULL))
Thomas Grafd1896342012-06-18 12:08:33 +00003040 goto out_register_late_subsys;
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003041
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003042 ret = register_netdevice_notifier(&ip6_route_dev_notifier);
Daniel Lezcanocdb18762008-03-04 13:45:33 -08003043 if (ret)
Thomas Grafd1896342012-06-18 12:08:33 +00003044 goto out_register_late_subsys;
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003045
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003046out:
3047 return ret;
3048
Thomas Grafd1896342012-06-18 12:08:33 +00003049out_register_late_subsys:
3050 unregister_pernet_subsys(&ip6_route_net_late_ops);
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003051fib6_rules_init:
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003052 fib6_rules_cleanup();
3053xfrm6_init:
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003054 xfrm6_fini();
Thomas Graf2a0c4512012-06-14 23:00:17 +00003055out_fib6_init:
3056 fib6_gc_cleanup();
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003057out_register_subsys:
3058 unregister_pernet_subsys(&ip6_route_net_ops);
David S. Miller7e52b332012-06-15 15:51:55 -07003059out_register_inetpeer:
3060 unregister_pernet_subsys(&ipv6_inetpeer_ops);
Eric Dumazetfc66f952010-10-08 06:37:34 +00003061out_dst_entries:
3062 dst_entries_destroy(&ip6_dst_blackhole_ops);
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003063out_kmem_cache:
Benjamin Theryf2fc6a52008-03-04 13:49:23 -08003064 kmem_cache_destroy(ip6_dst_ops_template.kmem_cachep);
Daniel Lezcano433d49c2007-12-07 00:43:48 -08003065 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003066}
3067
3068void ip6_route_cleanup(void)
3069{
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003070 unregister_netdevice_notifier(&ip6_route_dev_notifier);
Thomas Grafd1896342012-06-18 12:08:33 +00003071 unregister_pernet_subsys(&ip6_route_net_late_ops);
Thomas Graf101367c2006-08-04 03:39:02 -07003072 fib6_rules_cleanup();
Linus Torvalds1da177e2005-04-16 15:20:36 -07003073 xfrm6_fini();
Linus Torvalds1da177e2005-04-16 15:20:36 -07003074 fib6_gc_cleanup();
David S. Millerc3426b42012-06-09 16:27:05 -07003075 unregister_pernet_subsys(&ipv6_inetpeer_ops);
Daniel Lezcano8ed67782008-03-04 13:48:30 -08003076 unregister_pernet_subsys(&ip6_route_net_ops);
Xiaotian Feng41bb78b2010-11-02 16:11:05 +00003077 dst_entries_destroy(&ip6_dst_blackhole_ops);
Benjamin Theryf2fc6a52008-03-04 13:49:23 -08003078 kmem_cache_destroy(ip6_dst_ops_template.kmem_cachep);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003079}