blob: c4864c1e8f1363aa898293bf5461a488c200ffb0 [file] [log] [blame]
/*
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */
12
13#ifndef _IP6_FIB_H
14#define _IP6_FIB_H
15
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/ipv6_route.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/rtnetlink.h>
18#include <linux/spinlock.h>
Ido Schimmel16ab6d72017-08-03 13:28:16 +020019#include <linux/notifier.h>
Thomas Graf86872cb2006-08-22 00:01:08 -070020#include <net/dst.h>
21#include <net/flow.h>
22#include <net/netlink.h>
David S. Millerb3419362010-11-30 12:27:11 -080023#include <net/inetpeer.h>
Ido Schimmel16ab6d72017-08-03 13:28:16 +020024#include <net/fib_notifier.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025
/*
 * FIB6 table hash size: 256 when CONFIG_IPV6_MULTIPLE_TABLES is enabled,
 * otherwise 1.
 */
#ifdef CONFIG_IPV6_MULTIPLE_TABLES
#define FIB6_TABLE_HASHSZ 256
#else
#define FIB6_TABLE_HASHSZ 1
#endif

/* Forward declaration; the full definition appears later in this header. */
struct rt6_info;
33
Eric Dumazetfd2c3ef2009-11-03 03:26:03 +000034struct fib6_config {
Thomas Graf86872cb2006-08-22 00:01:08 -070035 u32 fc_table;
36 u32 fc_metric;
37 int fc_dst_len;
38 int fc_src_len;
39 int fc_ifindex;
40 u32 fc_flags;
41 u32 fc_protocol;
David Ahern0ae81332017-02-02 12:37:08 -080042 u16 fc_type; /* only 8 bits are used */
43 u16 fc_delete_all_nh : 1,
44 __unused : 15;
Thomas Graf86872cb2006-08-22 00:01:08 -070045
46 struct in6_addr fc_dst;
47 struct in6_addr fc_src;
Daniel Walterc3968a82011-04-13 21:10:57 +000048 struct in6_addr fc_prefsrc;
Thomas Graf86872cb2006-08-22 00:01:08 -070049 struct in6_addr fc_gateway;
50
51 unsigned long fc_expires;
52 struct nlattr *fc_mx;
53 int fc_mx_len;
Nicolas Dichtel51ebd3182012-10-22 03:42:09 +000054 int fc_mp_len;
55 struct nlattr *fc_mp;
Thomas Graf86872cb2006-08-22 00:01:08 -070056
57 struct nl_info fc_nlinfo;
Roopa Prabhu19e42e42015-07-21 10:43:48 +020058 struct nlattr *fc_encap;
59 u16 fc_encap_type;
Thomas Graf86872cb2006-08-22 00:01:08 -070060};
61
Eric Dumazetfd2c3ef2009-11-03 03:26:03 +000062struct fib6_node {
Linus Torvalds1da177e2005-04-16 15:20:36 -070063 struct fib6_node *parent;
64 struct fib6_node *left;
65 struct fib6_node *right;
Kim Nordlund8bce65b2006-12-13 16:38:29 -080066#ifdef CONFIG_IPV6_SUBTREES
Linus Torvalds1da177e2005-04-16 15:20:36 -070067 struct fib6_node *subtree;
Kim Nordlund8bce65b2006-12-13 16:38:29 -080068#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070069 struct rt6_info *leaf;
70
71 __u16 fn_bit; /* bit key */
72 __u16 fn_flags;
Hannes Frederic Sowa42b18702014-10-06 19:58:35 +020073 int fn_sernum;
David S. Millerf11e6652007-03-24 20:36:25 -070074 struct rt6_info *rr_ptr;
Wei Wangc5cff852017-08-21 09:47:10 -070075 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070076};
77
/*
 * Accessor for a node's subtree pointer.  Without CONFIG_IPV6_SUBTREES the
 * member does not exist, so the macro evaluates to NULL and ignores @fn.
 */
#ifndef CONFIG_IPV6_SUBTREES
#define FIB6_SUBTREE(fn)	NULL
#else
#define FIB6_SUBTREE(fn)	((fn)->subtree)
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070083
Florian Westphale715b6d2015-01-05 23:57:44 +010084struct mx6_config {
85 const u32 *mx;
86 DECLARE_BITMAP(mx_valid, RTAX_MAX);
87};
88
Linus Torvalds1da177e2005-04-16 15:20:36 -070089/*
90 * routing information
91 *
92 */
93
Eric Dumazetfd2c3ef2009-11-03 03:26:03 +000094struct rt6key {
Linus Torvalds1da177e2005-04-16 15:20:36 -070095 struct in6_addr addr;
96 int plen;
97};
98
Thomas Grafc71099a2006-08-04 23:20:06 -070099struct fib6_table;
100
Wei Wang35732d02017-10-06 12:05:57 -0700101struct rt6_exception_bucket {
102 struct hlist_head chain;
103 int depth;
104};
105
106struct rt6_exception {
107 struct hlist_node hlist;
108 struct rt6_info *rt6i;
109 unsigned long stamp;
110 struct rcu_head rcu;
111};
112
/*
 * Exception table sizing: the bucket size is 1 << 10 = 1024.
 * FIB6_MAX_DEPTH is 5 (presumably the per-bucket chain limit - verify).
 */
#define FIB6_EXCEPTION_BUCKET_SIZE_SHIFT 10
#define FIB6_EXCEPTION_BUCKET_SIZE (1 << FIB6_EXCEPTION_BUCKET_SIZE_SHIFT)
#define FIB6_MAX_DEPTH 5
116
Eric Dumazetfd2c3ef2009-11-03 03:26:03 +0000117struct rt6_info {
Changli Gaod8d1f302010-06-10 23:31:35 -0700118 struct dst_entry dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119
YOSHIFUJI Hideaki / 吉藤英明bd2c77a2010-03-31 22:24:22 +0000120 /*
121 * Tail elements of dst_entry (__refcnt etc.)
122 * and these elements (rarely used in hot path) are in
123 * the same cache line.
124 */
125 struct fib6_table *rt6i_table;
Wei Wang4e587ea2017-08-25 15:03:10 -0700126 struct fib6_node __rcu *rt6i_node;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127
128 struct in6_addr rt6i_gateway;
YOSHIFUJI Hideaki / 吉藤英明bd2c77a2010-03-31 22:24:22 +0000129
Nicolas Dichtel51ebd3182012-10-22 03:42:09 +0000130 /* Multipath routes:
131 * siblings is a list of rt6_info that have the the same metric/weight,
132 * destination, but not the same gateway. nsiblings is just a cache
133 * to speed up lookup.
134 */
135 struct list_head rt6i_siblings;
136 unsigned int rt6i_nsiblings;
137
Linus Torvalds1da177e2005-04-16 15:20:36 -0700138 atomic_t rt6i_ref;
Herbert Xub4ce9272007-11-13 21:33:32 -0800139
Ido Schimmelfe400792017-08-15 09:09:49 +0200140 unsigned int rt6i_nh_flags;
141
YOSHIFUJI Hideaki / 吉藤英明bd2c77a2010-03-31 22:24:22 +0000142 /* These are in a separate cache line. */
143 struct rt6key rt6i_dst ____cacheline_aligned_in_smp;
144 u32 rt6i_flags;
145 struct rt6key rt6i_src;
Daniel Walterc3968a82011-04-13 21:10:57 +0000146 struct rt6key rt6i_prefsrc;
Herbert Xub4ce9272007-11-13 21:33:32 -0800147
Martin KaFai Lau8d0b94a2015-05-22 20:56:04 -0700148 struct list_head rt6i_uncached;
149 struct uncached_list *rt6i_uncached_list;
150
YOSHIFUJI Hideaki / 吉藤英明bd2c77a2010-03-31 22:24:22 +0000151 struct inet6_dev *rt6i_idev;
Martin KaFai Laud52d3992015-05-22 20:56:06 -0700152 struct rt6_info * __percpu *rt6i_pcpu;
Wei Wang35732d02017-10-06 12:05:57 -0700153 struct rt6_exception_bucket __rcu *rt6i_exception_bucket;
Noriaki TAKAMIYAa47ed4c2007-09-06 03:31:25 -0700154
Hannes Frederic Sowa705f1c82014-09-28 00:46:06 +0200155 u32 rt6i_metric;
Martin KaFai Lau4b32b5a2015-04-28 13:03:06 -0700156 u32 rt6i_pmtu;
YOSHIFUJI Hideaki / 吉藤英明bd2c77a2010-03-31 22:24:22 +0000157 /* more non-fragment space at head required */
158 unsigned short rt6i_nfheader_len;
YOSHIFUJI Hideaki / 吉藤英明bd2c77a2010-03-31 22:24:22 +0000159 u8 rt6i_protocol;
Wei Wang35732d02017-10-06 12:05:57 -0700160 u8 exception_bucket_flushed:1,
161 unused:7;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700162};
163
YOSHIFUJI Hideaki7a3025b2006-10-13 16:17:25 +0900164static inline struct inet6_dev *ip6_dst_idev(struct dst_entry *dst)
165{
166 return ((struct rt6_info *)dst)->rt6i_idev;
167}
168
Gao feng1716a962012-04-06 00:13:10 +0000169static inline void rt6_clean_expires(struct rt6_info *rt)
170{
Gao feng1716a962012-04-06 00:13:10 +0000171 rt->rt6i_flags &= ~RTF_EXPIRES;
Hannes Frederic Sowa01ba16d2013-10-24 10:14:27 +0200172 rt->dst.expires = 0;
Gao feng1716a962012-04-06 00:13:10 +0000173}
174
175static inline void rt6_set_expires(struct rt6_info *rt, unsigned long expires)
176{
Gao feng1716a962012-04-06 00:13:10 +0000177 rt->dst.expires = expires;
YOSHIFUJI Hideaki / 吉藤英明ecd98832013-02-20 00:29:08 +0000178 rt->rt6i_flags |= RTF_EXPIRES;
Gao feng1716a962012-04-06 00:13:10 +0000179}
180
YOSHIFUJI Hideaki / 吉藤英明ecd98832013-02-20 00:29:08 +0000181static inline void rt6_update_expires(struct rt6_info *rt0, int timeout)
Gao feng1716a962012-04-06 00:13:10 +0000182{
YOSHIFUJI Hideaki / 吉藤英明ecd98832013-02-20 00:29:08 +0000183 struct rt6_info *rt;
Gao feng1716a962012-04-06 00:13:10 +0000184
YOSHIFUJI Hideaki / 吉藤英明ecd98832013-02-20 00:29:08 +0000185 for (rt = rt0; rt && !(rt->rt6i_flags & RTF_EXPIRES);
186 rt = (struct rt6_info *)rt->dst.from);
187 if (rt && rt != rt0)
188 rt0->dst.expires = rt->dst.expires;
189
190 dst_set_expires(&rt0->dst, timeout);
191 rt0->rt6i_flags |= RTF_EXPIRES;
Gao feng1716a962012-04-06 00:13:10 +0000192}
193
Wei Wangc5cff852017-08-21 09:47:10 -0700194/* Function to safely get fn->sernum for passed in rt
195 * and store result in passed in cookie.
196 * Return true if we can get cookie safely
197 * Return false if not
198 */
199static inline bool rt6_get_cookie_safe(const struct rt6_info *rt,
200 u32 *cookie)
201{
202 struct fib6_node *fn;
203 bool status = false;
204
205 rcu_read_lock();
206 fn = rcu_dereference(rt->rt6i_node);
207
208 if (fn) {
209 *cookie = fn->fn_sernum;
210 status = true;
211 }
212
213 rcu_read_unlock();
214 return status;
215}
216
Martin KaFai Laub197df42015-05-22 20:56:01 -0700217static inline u32 rt6_get_cookie(const struct rt6_info *rt)
218{
Wei Wangc5cff852017-08-21 09:47:10 -0700219 u32 cookie = 0;
220
Martin KaFai Lau02bcf4e2015-11-11 11:51:08 -0800221 if (rt->rt6i_flags & RTF_PCPU ||
Wei Wanga4c2fd72017-06-17 10:42:42 -0700222 (unlikely(!list_empty(&rt->rt6i_uncached)) && rt->dst.from))
Martin KaFai Lau3da59bd2015-05-22 20:56:03 -0700223 rt = (struct rt6_info *)(rt->dst.from);
224
Wei Wangc5cff852017-08-21 09:47:10 -0700225 rt6_get_cookie_safe(rt, &cookie);
226
227 return cookie;
Martin KaFai Laub197df42015-05-22 20:56:01 -0700228}
229
Amerigo Wang94e187c2012-10-29 00:13:19 +0000230static inline void ip6_rt_put(struct rt6_info *rt)
231{
232 /* dst_release() accepts a NULL parameter.
233 * We rely on dst being first structure in struct rt6_info
234 */
235 BUILD_BUG_ON(offsetof(struct rt6_info, dst) != 0);
236 dst_release(&rt->dst);
237}
238
/* Defined elsewhere; called by rt6_release() when the last reference drops. */
void rt6_free_pcpu(struct rt6_info *non_pcpu_rt);
240
241static inline void rt6_hold(struct rt6_info *rt)
242{
243 atomic_inc(&rt->rt6i_ref);
244}
245
246static inline void rt6_release(struct rt6_info *rt)
247{
248 if (atomic_dec_and_test(&rt->rt6i_ref)) {
249 rt6_free_pcpu(rt);
250 dst_dev_put(&rt->dst);
251 dst_release(&rt->dst);
252 }
253}
254
/*
 * States stored in fib6_walker.state.  FWS_S exists only with
 * CONFIG_IPV6_SUBTREES, so the numeric values of the remaining states
 * depend on that option.
 */
enum fib6_walk_state {
#ifdef CONFIG_IPV6_SUBTREES
	FWS_S,
#endif
	FWS_L,
	FWS_R,
	FWS_C,
	FWS_U
};
264
265struct fib6_walker {
Alexey Dobriyanbbef49d2010-02-18 08:13:30 +0000266 struct list_head lh;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267 struct fib6_node *root, *node;
268 struct rt6_info *leaf;
Hannes Frederic Sowa94b2cfe2014-10-06 19:58:34 +0200269 enum fib6_walk_state state;
270 bool prune;
Patrick McHardy2bec5a32010-02-08 05:19:03 +0000271 unsigned int skip;
272 unsigned int count;
Hannes Frederic Sowa94b2cfe2014-10-06 19:58:34 +0200273 int (*func)(struct fib6_walker *);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274 void *args;
275};
276
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277struct rt6_statistics {
278 __u32 fib_nodes;
279 __u32 fib_route_nodes;
280 __u32 fib_rt_alloc; /* permanent routes */
281 __u32 fib_rt_entries; /* rt entries in table */
282 __u32 fib_rt_cache; /* cache routes */
283 __u32 fib_discarded_routes;
284};
285
/* Node flag bits (distinct single-bit values). */
#define RTN_TL_ROOT	0x0001
#define RTN_ROOT	0x0002		/* tree root node		*/
#define RTN_RTINFO	0x0004		/* node with valid routing info	*/
289
/*
 *	priority levels (or metrics)
 *
 */
294
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295
Thomas Grafc71099a2006-08-04 23:20:06 -0700296struct fib6_table {
297 struct hlist_node tb6_hlist;
298 u32 tb6_id;
299 rwlock_t tb6_lock;
300 struct fib6_node tb6_root;
David S. Miller8e773272012-06-11 00:01:52 -0700301 struct inet_peer_base tb6_peers;
David Ahern830218c2016-10-24 10:52:35 -0700302 unsigned int flags;
Ido Schimmele1ee0a52017-08-03 13:28:19 +0200303 unsigned int fib_seq;
David Ahern830218c2016-10-24 10:52:35 -0700304#define RT6_TABLE_HAS_DFLT_ROUTER BIT(0)
Thomas Grafc71099a2006-08-04 23:20:06 -0700305};
306
/*
 * Table identifiers.  DFLT, INFO and PREFIX all alias the main table.
 * Without CONFIG_IPV6_MULTIPLE_TABLES only the main table exists, so
 * FIB6_TABLE_MIN == FIB6_TABLE_MAX == RT_TABLE_MAIN and the local table
 * aliases the main table as well.
 */
#define RT6_TABLE_UNSPEC	RT_TABLE_UNSPEC
#define RT6_TABLE_MAIN		RT_TABLE_MAIN
#define RT6_TABLE_DFLT		RT6_TABLE_MAIN
#define RT6_TABLE_INFO		RT6_TABLE_MAIN
#define RT6_TABLE_PREFIX	RT6_TABLE_MAIN

#ifdef CONFIG_IPV6_MULTIPLE_TABLES
#define FIB6_TABLE_MIN		1
#define FIB6_TABLE_MAX		RT_TABLE_MAX
#define RT6_TABLE_LOCAL		RT_TABLE_LOCAL
#else
#define FIB6_TABLE_MIN		RT_TABLE_MAIN
#define FIB6_TABLE_MAX		FIB6_TABLE_MIN
#define RT6_TABLE_LOCAL		RT6_TABLE_MAIN
#endif
322
/*
 * Lookup callback type passed to fib6_rule_lookup(): takes a net, a table,
 * a flow and an int (presumably lookup flags) and returns an rt6_info.
 */
typedef struct rt6_info *(*pol_lookup_t)(struct net *,
					 struct fib6_table *,
					 struct flowi6 *, int);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700326
Ido Schimmeldf77fe42017-08-03 13:28:17 +0200327struct fib6_entry_notifier_info {
328 struct fib_notifier_info info; /* must be first */
329 struct rt6_info *rt;
330};
331
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332/*
333 * exported functions
334 */
335
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700336struct fib6_table *fib6_get_table(struct net *net, u32 id);
337struct fib6_table *fib6_new_table(struct net *net, u32 id);
338struct dst_entry *fib6_rule_lookup(struct net *net, struct flowi6 *fl6,
339 int flags, pol_lookup_t lookup);
Thomas Grafc71099a2006-08-04 23:20:06 -0700340
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700341struct fib6_node *fib6_lookup(struct fib6_node *root,
342 const struct in6_addr *daddr,
343 const struct in6_addr *saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700345struct fib6_node *fib6_locate(struct fib6_node *root,
346 const struct in6_addr *daddr, int dst_len,
347 const struct in6_addr *saddr, int src_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700349void fib6_clean_all(struct net *net, int (*func)(struct rt6_info *, void *arg),
Li RongQing0c3584d2013-12-27 16:32:38 +0800350 void *arg);
Thomas Grafc71099a2006-08-04 23:20:06 -0700351
Florian Westphale715b6d2015-01-05 23:57:44 +0100352int fib6_add(struct fib6_node *root, struct rt6_info *rt,
David Ahern333c4302017-05-21 10:12:04 -0600353 struct nl_info *info, struct mx6_config *mxc,
354 struct netlink_ext_ack *extack);
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700355int fib6_del(struct rt6_info *rt, struct nl_info *info);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356
Roopa Prabhu37a1d362015-09-13 10:18:33 -0700357void inet6_rt_notify(int event, struct rt6_info *rt, struct nl_info *info,
358 unsigned int flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700360void fib6_run_gc(unsigned long expires, struct net *net, bool force);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700362void fib6_gc_cleanup(void);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700364int fib6_init(void);
Thomas Graf101367c2006-08-04 03:39:02 -0700365
Hannes Frederic Sowa8d2ca1d2013-09-21 16:55:59 +0200366int ipv6_route_open(struct inode *inode, struct file *file);
367
Ido Schimmel16ab6d72017-08-03 13:28:16 +0200368int call_fib6_notifier(struct notifier_block *nb, struct net *net,
369 enum fib_event_type event_type,
370 struct fib_notifier_info *info);
371int call_fib6_notifiers(struct net *net, enum fib_event_type event_type,
372 struct fib_notifier_info *info);
373
374int __net_init fib6_notifier_init(struct net *net);
375void __net_exit fib6_notifier_exit(struct net *net);
376
Ido Schimmele1ee0a52017-08-03 13:28:19 +0200377unsigned int fib6_tables_seq_read(struct net *net);
378int fib6_tables_dump(struct net *net, struct notifier_block *nb);
379
Wei Wang180ca442017-10-06 12:05:56 -0700380void fib6_update_sernum(struct rt6_info *rt);
381
/*
 * Policy-rule hooks.  With CONFIG_IPV6_MULTIPLE_TABLES these are only
 * declared here.  Without it, inline stubs are provided: init and dump
 * return 0, cleanup does nothing, every rule is reported as default, and
 * the sequence counter reads as 0.
 */
#ifdef CONFIG_IPV6_MULTIPLE_TABLES
int fib6_rules_init(void);
void fib6_rules_cleanup(void);
bool fib6_rule_default(const struct fib_rule *rule);
int fib6_rules_dump(struct net *net, struct notifier_block *nb);
unsigned int fib6_rules_seq_read(struct net *net);
#else
static inline int               fib6_rules_init(void)
{
	return 0;
}
static inline void              fib6_rules_cleanup(void)
{
}
static inline bool fib6_rule_default(const struct fib_rule *rule)
{
	return true;
}
static inline int fib6_rules_dump(struct net *net, struct notifier_block *nb)
{
	return 0;
}
static inline unsigned int fib6_rules_seq_read(struct net *net)
{
	return 0;
}
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410#endif