Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* |
| 2 | * net/dst.h Protocol independent destination cache definitions. |
| 3 | * |
| 4 | * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru> |
| 5 | * |
| 6 | */ |
| 7 | |
| 8 | #ifndef _NET_DST_H |
| 9 | #define _NET_DST_H |
| 10 | |
Alexey Dobriyan | 86393e5 | 2009-08-29 01:34:49 +0000 | [diff] [blame] | 11 | #include <net/dst_ops.h> |
Arnaldo Carvalho de Melo | 14c8502 | 2005-12-27 02:43:12 -0200 | [diff] [blame] | 12 | #include <linux/netdevice.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 13 | #include <linux/rtnetlink.h> |
| 14 | #include <linux/rcupdate.h> |
Paul Gortmaker | 187f188 | 2011-11-23 20:12:59 -0500 | [diff] [blame] | 15 | #include <linux/bug.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 16 | #include <linux/jiffies.h> |
| 17 | #include <net/neighbour.h> |
| 18 | #include <asm/processor.h> |
| 19 | |
/*
 * Time constants expressed in jiffies (HZ is the number of ticks per second):
 * a tenth of a second, half a second and two minutes respectively.
 * NOTE(review): presumably the min/increment/max interval of the dst garbage
 * collector; the users are not visible in this header.
 */
#define DST_GC_MIN	(HZ / 10)
#define DST_GC_INC	(HZ / 2)
#define DST_GC_MAX	(120 * HZ)
| 23 | |
/* Each dst_entry has a reference count and sits in some parent list(s).
 * When it is removed from its parent list, it is "freed" (dst_free).
 * After this it enters the dead state (dst->obsolete > 0) and, if its refcnt
 * is zero, it can be destroyed immediately; otherwise it is added
 * to the gc list and the garbage collector periodically checks the refcnt.
 */
| 30 | |
| 31 | struct sk_buff; |
| 32 | |
/*
 * struct dst_entry - protocol independent destination cache entry.
 *
 * The field order and the explicit padding members are deliberate: on 64-bit
 * builds __refcnt must start at a 64-byte aligned offset (dst_hold() enforces
 * this at build time), so do not reorder, add or remove members without
 * re-checking the padding.
 */
struct dst_entry {
	struct rcu_head		rcu_head;	/* used by dst_rcu_free() to find the entry */
	struct dst_entry	*child;
	struct net_device	*dev;
	struct dst_ops		*ops;		/* per-protocol callbacks (mtu, check, ...) */
	/*
	 * Pointer to the u32 metrics array with DST_METRICS_* flag bits stored
	 * in the low bits; always access through DST_METRICS_PTR() and the
	 * dst_metrics_*() helpers.
	 */
	unsigned long		_metrics;
	/* Expiry time in jiffies; 0 is treated as "not set" by dst_set_expires(). */
	unsigned long		expires;
	struct dst_entry	*path;
	struct dst_entry	*from;
#ifdef CONFIG_XFRM
	struct xfrm_state	*xfrm;		/* returned by dst_xfrm() */
#else
	void			*__pad1;	/* keeps the layout identical without XFRM */
#endif
	/* Packet handlers invoked by dst_input() and dst_output(). */
	int			(*input)(struct sk_buff *);
	int			(*output)(struct net *net, struct sock *sk, struct sk_buff *skb);

	unsigned short		flags;		/* bitmask of the DST_* values below */
#define DST_HOST		0x0001
#define DST_NOXFRM		0x0002
#define DST_NOPOLICY		0x0004
#define DST_NOHASH		0x0008
#define DST_NOCACHE		0x0010
#define DST_NOCOUNT		0x0020
#define DST_FAKE_RTABLE		0x0040
#define DST_XFRM_TUNNEL		0x0080
#define DST_XFRM_QUEUE		0x0100
#define DST_METADATA		0x0200

	/* Set by dst_confirm(), consumed and cleared by dst_neigh_output(). */
	unsigned short		pending_confirm;

	short			error;

	/* A non-zero value of dst->obsolete forces by-hand validation
	 * of the route entry.  Positive values are set by the generic
	 * dst layer to indicate that the entry has been forcefully
	 * destroyed.
	 *
	 * Negative values are used by the implementation layer code to
	 * force invocation of the dst_ops->check() method.
	 */
	short			obsolete;
#define DST_OBSOLETE_NONE	0
#define DST_OBSOLETE_DEAD	2
#define DST_OBSOLETE_FORCE_CHK	-1
#define DST_OBSOLETE_KILL	-2
	unsigned short		header_len;	/* more space at head required */
	unsigned short		trailer_len;	/* space to reserve at tail */
#ifdef CONFIG_IP_ROUTE_CLASSID
	__u32			tclassid;	/* returned by dst_tclassid() */
#else
	__u32			__pad2;		/* keeps the layout identical without classid */
#endif

#ifdef CONFIG_64BIT
	/*
	 * Align __refcnt to a 64 bytes alignment
	 * (L1_CACHE_SIZE would be too much)
	 */
	long			__pad_to_align_refcnt[2];
#endif
	/*
	 * __refcnt wants to be on a different cache line from
	 * input/output/ops or performance tanks badly
	 */
	atomic_t		__refcnt;	/* client references */
	int			__use;		/* incremented by dst_use()/dst_use_noref() */
	unsigned long		lastuse;	/* timestamp passed to dst_use()/dst_use_noref() */
	struct lwtunnel_state	*lwtstate;
	/* Next-entry link, viewed through whichever route type embeds this dst. */
	union {
		struct dst_entry	*next;
		struct rtable __rcu	*rt_next;
		struct rt6_info		*rt6_next;
		struct dn_route __rcu	*dn_next;
	};
};
| 109 | |
Joe Perches | a4023dd | 2013-09-20 11:23:21 -0700 | [diff] [blame] | 110 | u32 *dst_cow_metrics_generic(struct dst_entry *dst, unsigned long old); |
Eric Dumazet | a37e6e3 | 2012-08-07 10:55:45 +0000 | [diff] [blame] | 111 | extern const u32 dst_default_metrics[]; |
David S. Miller | 62fa8a8 | 2011-01-26 20:51:05 -0800 | [diff] [blame] | 112 | |
/*
 * dst->_metrics packs a pointer to a u32 array together with flag bits in
 * its two least significant bits.
 *
 * DST_METRICS_READ_ONLY - flag bit tested before writing to the array.
 * DST_METRICS_FLAGS     - mask of all flag bits, stripped to get the pointer.
 */
#define DST_METRICS_READ_ONLY	0x1UL
#define DST_METRICS_FLAGS	0x3UL

/* Strip the flag bits from a raw _metrics word Y and return the array. */
#define __DST_METRICS_PTR(Y)	((u32 *)((Y) & ~DST_METRICS_FLAGS))

/* Same as above, starting from a dst_entry pointer X. */
#define DST_METRICS_PTR(X)	__DST_METRICS_PTR((X)->_metrics)
| 118 | |
| 119 | static inline bool dst_metrics_read_only(const struct dst_entry *dst) |
| 120 | { |
| 121 | return dst->_metrics & DST_METRICS_READ_ONLY; |
| 122 | } |
| 123 | |
Joe Perches | a4023dd | 2013-09-20 11:23:21 -0700 | [diff] [blame] | 124 | void __dst_destroy_metrics_generic(struct dst_entry *dst, unsigned long old); |
David S. Miller | 62fa8a8 | 2011-01-26 20:51:05 -0800 | [diff] [blame] | 125 | |
| 126 | static inline void dst_destroy_metrics_generic(struct dst_entry *dst) |
| 127 | { |
| 128 | unsigned long val = dst->_metrics; |
| 129 | if (!(val & DST_METRICS_READ_ONLY)) |
| 130 | __dst_destroy_metrics_generic(dst, val); |
| 131 | } |
| 132 | |
| 133 | static inline u32 *dst_metrics_write_ptr(struct dst_entry *dst) |
| 134 | { |
| 135 | unsigned long p = dst->_metrics; |
| 136 | |
Stephen Hemminger | 1f37070 | 2011-05-24 13:50:52 -0400 | [diff] [blame] | 137 | BUG_ON(!p); |
| 138 | |
David S. Miller | 62fa8a8 | 2011-01-26 20:51:05 -0800 | [diff] [blame] | 139 | if (p & DST_METRICS_READ_ONLY) |
| 140 | return dst->ops->cow_metrics(dst, p); |
| 141 | return __DST_METRICS_PTR(p); |
| 142 | } |
| 143 | |
| 144 | /* This may only be invoked before the entry has reached global |
| 145 | * visibility. |
| 146 | */ |
| 147 | static inline void dst_init_metrics(struct dst_entry *dst, |
| 148 | const u32 *src_metrics, |
| 149 | bool read_only) |
| 150 | { |
| 151 | dst->_metrics = ((unsigned long) src_metrics) | |
| 152 | (read_only ? DST_METRICS_READ_ONLY : 0); |
| 153 | } |
| 154 | |
| 155 | static inline void dst_copy_metrics(struct dst_entry *dest, const struct dst_entry *src) |
| 156 | { |
| 157 | u32 *dst_metrics = dst_metrics_write_ptr(dest); |
| 158 | |
| 159 | if (dst_metrics) { |
| 160 | u32 *src_metrics = DST_METRICS_PTR(src); |
| 161 | |
| 162 | memcpy(dst_metrics, src_metrics, RTAX_MAX * sizeof(u32)); |
| 163 | } |
| 164 | } |
| 165 | |
| 166 | static inline u32 *dst_metrics_ptr(struct dst_entry *dst) |
| 167 | { |
| 168 | return DST_METRICS_PTR(dst); |
| 169 | } |
| 170 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 171 | static inline u32 |
David S. Miller | 5170ae8 | 2010-12-12 21:35:57 -0800 | [diff] [blame] | 172 | dst_metric_raw(const struct dst_entry *dst, const int metric) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 173 | { |
David S. Miller | 62fa8a8 | 2011-01-26 20:51:05 -0800 | [diff] [blame] | 174 | u32 *p = DST_METRICS_PTR(dst); |
| 175 | |
| 176 | return p[metric-1]; |
David S. Miller | defb351 | 2010-12-08 21:16:57 -0800 | [diff] [blame] | 177 | } |
| 178 | |
David S. Miller | 5170ae8 | 2010-12-12 21:35:57 -0800 | [diff] [blame] | 179 | static inline u32 |
| 180 | dst_metric(const struct dst_entry *dst, const int metric) |
| 181 | { |
David S. Miller | 0dbaee3 | 2010-12-13 12:52:14 -0800 | [diff] [blame] | 182 | WARN_ON_ONCE(metric == RTAX_HOPLIMIT || |
David S. Miller | d33e455 | 2010-12-14 13:01:14 -0800 | [diff] [blame] | 183 | metric == RTAX_ADVMSS || |
| 184 | metric == RTAX_MTU); |
David S. Miller | 5170ae8 | 2010-12-12 21:35:57 -0800 | [diff] [blame] | 185 | return dst_metric_raw(dst, metric); |
| 186 | } |
| 187 | |
David S. Miller | 0dbaee3 | 2010-12-13 12:52:14 -0800 | [diff] [blame] | 188 | static inline u32 |
| 189 | dst_metric_advmss(const struct dst_entry *dst) |
| 190 | { |
| 191 | u32 advmss = dst_metric_raw(dst, RTAX_ADVMSS); |
| 192 | |
| 193 | if (!advmss) |
| 194 | advmss = dst->ops->default_advmss(dst); |
| 195 | |
| 196 | return advmss; |
| 197 | } |
| 198 | |
David S. Miller | defb351 | 2010-12-08 21:16:57 -0800 | [diff] [blame] | 199 | static inline void dst_metric_set(struct dst_entry *dst, int metric, u32 val) |
| 200 | { |
David S. Miller | 62fa8a8 | 2011-01-26 20:51:05 -0800 | [diff] [blame] | 201 | u32 *p = dst_metrics_write_ptr(dst); |
David S. Miller | defb351 | 2010-12-08 21:16:57 -0800 | [diff] [blame] | 202 | |
David S. Miller | 62fa8a8 | 2011-01-26 20:51:05 -0800 | [diff] [blame] | 203 | if (p) |
| 204 | p[metric-1] = val; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 205 | } |
| 206 | |
/*
 * Kernel-internal feature bits that are unallocated in user space.
 *
 * The constant is unsigned on purpose: shifting a signed 1 into bit 31
 * overflows int, which is undefined behaviour and yields a negative value
 * that sign-extends when widened.
 */
#define DST_FEATURE_ECN_CA	(1U << 31)

/* All kernel-internal feature bits. */
#define DST_FEATURE_MASK	(DST_FEATURE_ECN_CA)
/* Kernel-internal ECN bit combined with the RTAX_FEATURE_ECN bit. */
#define DST_FEATURE_ECN_MASK	(DST_FEATURE_ECN_CA | RTAX_FEATURE_ECN)
| 212 | |
Gilad Ben-Yossef | 0c3adfb | 2009-10-28 04:15:23 +0000 | [diff] [blame] | 213 | static inline u32 |
| 214 | dst_feature(const struct dst_entry *dst, u32 feature) |
| 215 | { |
David S. Miller | bb5b7c1 | 2009-12-15 20:56:42 -0800 | [diff] [blame] | 216 | return dst_metric(dst, RTAX_FEATURES) & feature; |
Gilad Ben-Yossef | 0c3adfb | 2009-10-28 04:15:23 +0000 | [diff] [blame] | 217 | } |
| 218 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 219 | static inline u32 dst_mtu(const struct dst_entry *dst) |
| 220 | { |
Steffen Klassert | 618f9bc | 2011-11-23 02:13:31 +0000 | [diff] [blame] | 221 | return dst->ops->mtu(dst); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 222 | } |
| 223 | |
Stephen Hemminger | c1e20f7 | 2008-07-18 23:02:15 -0700 | [diff] [blame] | 224 | /* RTT metrics are stored in milliseconds for user ABI, but used as jiffies */ |
| 225 | static inline unsigned long dst_metric_rtt(const struct dst_entry *dst, int metric) |
| 226 | { |
| 227 | return msecs_to_jiffies(dst_metric(dst, metric)); |
| 228 | } |
| 229 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 230 | static inline u32 |
| 231 | dst_allfrag(const struct dst_entry *dst) |
| 232 | { |
Gilad Ben-Yossef | 0c3adfb | 2009-10-28 04:15:23 +0000 | [diff] [blame] | 233 | int ret = dst_feature(dst, RTAX_FEATURE_ALLFRAG); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 234 | return ret; |
| 235 | } |
| 236 | |
| 237 | static inline int |
David S. Miller | d33e455 | 2010-12-14 13:01:14 -0800 | [diff] [blame] | 238 | dst_metric_locked(const struct dst_entry *dst, int metric) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 239 | { |
| 240 | return dst_metric(dst, RTAX_LOCK) & (1<<metric); |
| 241 | } |
| 242 | |
Eldad Zack | 7f95e18 | 2012-06-16 15:14:49 +0200 | [diff] [blame] | 243 | static inline void dst_hold(struct dst_entry *dst) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 244 | { |
Eric Dumazet | 5635c10 | 2008-11-16 19:46:36 -0800 | [diff] [blame] | 245 | /* |
| 246 | * If your kernel compilation stops here, please check |
| 247 | * __pad_to_align_refcnt declaration in struct dst_entry |
| 248 | */ |
| 249 | BUILD_BUG_ON(offsetof(struct dst_entry, __refcnt) & 63); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 250 | atomic_inc(&dst->__refcnt); |
| 251 | } |
| 252 | |
Pavel Emelyanov | 03f49f3 | 2007-11-10 21:28:34 -0800 | [diff] [blame] | 253 | static inline void dst_use(struct dst_entry *dst, unsigned long time) |
| 254 | { |
| 255 | dst_hold(dst); |
| 256 | dst->__use++; |
| 257 | dst->lastuse = time; |
| 258 | } |
| 259 | |
Eric Dumazet | 7fee226 | 2010-05-11 23:19:48 +0000 | [diff] [blame] | 260 | static inline void dst_use_noref(struct dst_entry *dst, unsigned long time) |
| 261 | { |
| 262 | dst->__use++; |
| 263 | dst->lastuse = time; |
| 264 | } |
| 265 | |
Eldad Zack | 7f95e18 | 2012-06-16 15:14:49 +0200 | [diff] [blame] | 266 | static inline struct dst_entry *dst_clone(struct dst_entry *dst) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 267 | { |
| 268 | if (dst) |
| 269 | atomic_inc(&dst->__refcnt); |
| 270 | return dst; |
| 271 | } |
| 272 | |
Joe Perches | a4023dd | 2013-09-20 11:23:21 -0700 | [diff] [blame] | 273 | void dst_release(struct dst_entry *dst); |
Eric Dumazet | 7fee226 | 2010-05-11 23:19:48 +0000 | [diff] [blame] | 274 | |
| 275 | static inline void refdst_drop(unsigned long refdst) |
| 276 | { |
| 277 | if (!(refdst & SKB_DST_NOREF)) |
| 278 | dst_release((struct dst_entry *)(refdst & SKB_DST_PTRMASK)); |
| 279 | } |
| 280 | |
| 281 | /** |
| 282 | * skb_dst_drop - drops skb dst |
| 283 | * @skb: buffer |
| 284 | * |
| 285 | * Drops dst reference count if a reference was taken. |
| 286 | */ |
Eric Dumazet | adf3090 | 2009-06-02 05:19:30 +0000 | [diff] [blame] | 287 | static inline void skb_dst_drop(struct sk_buff *skb) |
| 288 | { |
Eric Dumazet | 7fee226 | 2010-05-11 23:19:48 +0000 | [diff] [blame] | 289 | if (skb->_skb_refdst) { |
| 290 | refdst_drop(skb->_skb_refdst); |
| 291 | skb->_skb_refdst = 0UL; |
| 292 | } |
| 293 | } |
| 294 | |
Joe Stringer | e79e259 | 2015-08-26 11:31:47 -0700 | [diff] [blame] | 295 | static inline void __skb_dst_copy(struct sk_buff *nskb, unsigned long refdst) |
Eric Dumazet | 7fee226 | 2010-05-11 23:19:48 +0000 | [diff] [blame] | 296 | { |
Joe Stringer | e79e259 | 2015-08-26 11:31:47 -0700 | [diff] [blame] | 297 | nskb->_skb_refdst = refdst; |
Eric Dumazet | 7fee226 | 2010-05-11 23:19:48 +0000 | [diff] [blame] | 298 | if (!(nskb->_skb_refdst & SKB_DST_NOREF)) |
| 299 | dst_clone(skb_dst(nskb)); |
| 300 | } |
| 301 | |
Joe Stringer | e79e259 | 2015-08-26 11:31:47 -0700 | [diff] [blame] | 302 | static inline void skb_dst_copy(struct sk_buff *nskb, const struct sk_buff *oskb) |
| 303 | { |
| 304 | __skb_dst_copy(nskb, oskb->_skb_refdst); |
| 305 | } |
| 306 | |
Eric Dumazet | 7fee226 | 2010-05-11 23:19:48 +0000 | [diff] [blame] | 307 | /** |
| 308 | * skb_dst_force - makes sure skb dst is refcounted |
| 309 | * @skb: buffer |
| 310 | * |
| 311 | * If dst is not yet refcounted, let's do it |
| 312 | */ |
| 313 | static inline void skb_dst_force(struct sk_buff *skb) |
| 314 | { |
| 315 | if (skb_dst_is_noref(skb)) { |
| 316 | WARN_ON(!rcu_read_lock_held()); |
| 317 | skb->_skb_refdst &= ~SKB_DST_NOREF; |
| 318 | dst_clone(skb_dst(skb)); |
| 319 | } |
Eric Dumazet | adf3090 | 2009-06-02 05:19:30 +0000 | [diff] [blame] | 320 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 321 | |
Eric Dumazet | 5037e9e | 2015-12-14 14:08:53 -0800 | [diff] [blame] | 322 | /** |
| 323 | * dst_hold_safe - Take a reference on a dst if possible |
| 324 | * @dst: pointer to dst entry |
| 325 | * |
| 326 | * This helper returns false if it could not safely |
| 327 | * take a reference on a dst. |
| 328 | */ |
| 329 | static inline bool dst_hold_safe(struct dst_entry *dst) |
| 330 | { |
| 331 | if (dst->flags & DST_NOCACHE) |
| 332 | return atomic_inc_not_zero(&dst->__refcnt); |
| 333 | dst_hold(dst); |
| 334 | return true; |
| 335 | } |
| 336 | |
| 337 | /** |
| 338 | * skb_dst_force_safe - makes sure skb dst is refcounted |
| 339 | * @skb: buffer |
| 340 | * |
| 341 | * If dst is not yet refcounted and not destroyed, grab a ref on it. |
| 342 | */ |
| 343 | static inline void skb_dst_force_safe(struct sk_buff *skb) |
| 344 | { |
| 345 | if (skb_dst_is_noref(skb)) { |
| 346 | struct dst_entry *dst = skb_dst(skb); |
| 347 | |
| 348 | if (!dst_hold_safe(dst)) |
| 349 | dst = NULL; |
| 350 | |
| 351 | skb->_skb_refdst = (unsigned long)dst; |
| 352 | } |
| 353 | } |
| 354 | |
Eric Dumazet | d19d56d | 2010-05-17 22:36:55 -0700 | [diff] [blame] | 355 | |
| 356 | /** |
Eric Dumazet | 290b895 | 2010-09-27 00:33:35 +0000 | [diff] [blame] | 357 | * __skb_tunnel_rx - prepare skb for rx reinsert |
| 358 | * @skb: buffer |
| 359 | * @dev: tunnel device |
Nicolas Dichtel | ea23192 | 2013-09-02 15:34:58 +0200 | [diff] [blame] | 360 | * @net: netns for packet i/o |
Eric Dumazet | 290b895 | 2010-09-27 00:33:35 +0000 | [diff] [blame] | 361 | * |
| 362 | * After decapsulation, packet is going to re-enter (netif_rx()) our stack, |
| 363 | * so make some cleanups. (no accounting done) |
| 364 | */ |
Nicolas Dichtel | ea23192 | 2013-09-02 15:34:58 +0200 | [diff] [blame] | 365 | static inline void __skb_tunnel_rx(struct sk_buff *skb, struct net_device *dev, |
| 366 | struct net *net) |
Eric Dumazet | 290b895 | 2010-09-27 00:33:35 +0000 | [diff] [blame] | 367 | { |
| 368 | skb->dev = dev; |
Tom Herbert | bdeab99 | 2011-08-14 19:45:55 +0000 | [diff] [blame] | 369 | |
| 370 | /* |
Tom Herbert | 7539fad | 2013-12-15 22:12:18 -0800 | [diff] [blame] | 371 | * Clear hash so that we can recalulate the hash for the |
Tom Herbert | bdeab99 | 2011-08-14 19:45:55 +0000 | [diff] [blame] | 372 | * encapsulated packet, unless we have already determine the hash |
| 373 | * over the L4 4-tuple. |
| 374 | */ |
Tom Herbert | 7539fad | 2013-12-15 22:12:18 -0800 | [diff] [blame] | 375 | skb_clear_hash_if_not_l4(skb); |
Eric Dumazet | 290b895 | 2010-09-27 00:33:35 +0000 | [diff] [blame] | 376 | skb_set_queue_mapping(skb, 0); |
Nicolas Dichtel | ea23192 | 2013-09-02 15:34:58 +0200 | [diff] [blame] | 377 | skb_scrub_packet(skb, !net_eq(net, dev_net(dev))); |
Eric Dumazet | 290b895 | 2010-09-27 00:33:35 +0000 | [diff] [blame] | 378 | } |
| 379 | |
| 380 | /** |
Eric Dumazet | d19d56d | 2010-05-17 22:36:55 -0700 | [diff] [blame] | 381 | * skb_tunnel_rx - prepare skb for rx reinsert |
| 382 | * @skb: buffer |
| 383 | * @dev: tunnel device |
| 384 | * |
| 385 | * After decapsulation, packet is going to re-enter (netif_rx()) our stack, |
| 386 | * so make some cleanups, and perform accounting. |
Eric Dumazet | 290b895 | 2010-09-27 00:33:35 +0000 | [diff] [blame] | 387 | * Note: this accounting is not SMP safe. |
Eric Dumazet | d19d56d | 2010-05-17 22:36:55 -0700 | [diff] [blame] | 388 | */ |
Nicolas Dichtel | ea23192 | 2013-09-02 15:34:58 +0200 | [diff] [blame] | 389 | static inline void skb_tunnel_rx(struct sk_buff *skb, struct net_device *dev, |
| 390 | struct net *net) |
Eric Dumazet | d19d56d | 2010-05-17 22:36:55 -0700 | [diff] [blame] | 391 | { |
Eric Dumazet | d19d56d | 2010-05-17 22:36:55 -0700 | [diff] [blame] | 392 | /* TODO : stats should be SMP safe */ |
| 393 | dev->stats.rx_packets++; |
| 394 | dev->stats.rx_bytes += skb->len; |
Nicolas Dichtel | ea23192 | 2013-09-02 15:34:58 +0200 | [diff] [blame] | 395 | __skb_tunnel_rx(skb, dev, net); |
Eric Dumazet | d19d56d | 2010-05-17 22:36:55 -0700 | [diff] [blame] | 396 | } |
| 397 | |
Daniel Borkmann | 808c1b6 | 2016-03-16 01:42:50 +0100 | [diff] [blame] | 398 | static inline u32 dst_tclassid(const struct sk_buff *skb) |
| 399 | { |
| 400 | #ifdef CONFIG_IP_ROUTE_CLASSID |
| 401 | const struct dst_entry *dst; |
| 402 | |
| 403 | dst = skb_dst(skb); |
| 404 | if (dst) |
| 405 | return dst->tclassid; |
| 406 | #endif |
| 407 | return 0; |
| 408 | } |
| 409 | |
Eric W. Biederman | ede2059 | 2015-10-07 16:48:47 -0500 | [diff] [blame] | 410 | int dst_discard_out(struct net *net, struct sock *sk, struct sk_buff *skb); |
Eric Dumazet | aad8872 | 2014-04-15 13:47:15 -0400 | [diff] [blame] | 411 | static inline int dst_discard(struct sk_buff *skb) |
| 412 | { |
Eric W. Biederman | ede2059 | 2015-10-07 16:48:47 -0500 | [diff] [blame] | 413 | return dst_discard_out(&init_net, skb->sk, skb); |
Eric Dumazet | aad8872 | 2014-04-15 13:47:15 -0400 | [diff] [blame] | 414 | } |
/*
 * Allocation, initialisation and teardown entry points; all are defined
 * outside this header.
 */
void *dst_alloc(struct dst_ops *ops, struct net_device *dev,
		int initial_ref, int initial_obsolete,
		unsigned short flags);
void dst_init(struct dst_entry *dst, struct dst_ops *ops,
	      struct net_device *dev,
	      int initial_ref, int initial_obsolete,
	      unsigned short flags);
void __dst_free(struct dst_entry *dst);
/* dst_free() treats a NULL return as "nothing left to free". */
struct dst_entry *dst_destroy(struct dst_entry *dst);
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 422 | |
Eldad Zack | 7f95e18 | 2012-06-16 15:14:49 +0200 | [diff] [blame] | 423 | static inline void dst_free(struct dst_entry *dst) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 424 | { |
David S. Miller | f5b0a87 | 2012-07-19 12:31:33 -0700 | [diff] [blame] | 425 | if (dst->obsolete > 0) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 426 | return; |
| 427 | if (!atomic_read(&dst->__refcnt)) { |
| 428 | dst = dst_destroy(dst); |
| 429 | if (!dst) |
| 430 | return; |
| 431 | } |
| 432 | __dst_free(dst); |
| 433 | } |
| 434 | |
| 435 | static inline void dst_rcu_free(struct rcu_head *head) |
| 436 | { |
| 437 | struct dst_entry *dst = container_of(head, struct dst_entry, rcu_head); |
| 438 | dst_free(dst); |
| 439 | } |
| 440 | |
| 441 | static inline void dst_confirm(struct dst_entry *dst) |
| 442 | { |
David S. Miller | 5110effe | 2012-07-02 02:21:03 -0700 | [diff] [blame] | 443 | dst->pending_confirm = 1; |
| 444 | } |
Eric Dumazet | f2c31e3 | 2011-07-29 19:00:53 +0000 | [diff] [blame] | 445 | |
David S. Miller | 5110effe | 2012-07-02 02:21:03 -0700 | [diff] [blame] | 446 | static inline int dst_neigh_output(struct dst_entry *dst, struct neighbour *n, |
| 447 | struct sk_buff *skb) |
| 448 | { |
Eric Dumazet | 425f09a | 2012-08-07 02:19:56 +0000 | [diff] [blame] | 449 | const struct hh_cache *hh; |
David S. Miller | 5110effe | 2012-07-02 02:21:03 -0700 | [diff] [blame] | 450 | |
Eric Dumazet | 425f09a | 2012-08-07 02:19:56 +0000 | [diff] [blame] | 451 | if (dst->pending_confirm) { |
| 452 | unsigned long now = jiffies; |
| 453 | |
David S. Miller | 5110effe | 2012-07-02 02:21:03 -0700 | [diff] [blame] | 454 | dst->pending_confirm = 0; |
Eric Dumazet | 425f09a | 2012-08-07 02:19:56 +0000 | [diff] [blame] | 455 | /* avoid dirtying neighbour */ |
| 456 | if (n->confirmed != now) |
| 457 | n->confirmed = now; |
David S. Miller | 69cce1d | 2011-07-17 23:09:49 -0700 | [diff] [blame] | 458 | } |
David S. Miller | 5110effe | 2012-07-02 02:21:03 -0700 | [diff] [blame] | 459 | |
| 460 | hh = &n->hh; |
| 461 | if ((n->nud_state & NUD_CONNECTED) && hh->hh_len) |
| 462 | return neigh_hh_output(hh, skb); |
| 463 | else |
| 464 | return n->output(n, skb); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 465 | } |
| 466 | |
David S. Miller | d3aaeb3 | 2011-07-18 00:40:17 -0700 | [diff] [blame] | 467 | static inline struct neighbour *dst_neigh_lookup(const struct dst_entry *dst, const void *daddr) |
| 468 | { |
Zhouyi Zhou | aaa0c23 | 2013-03-14 17:21:50 +0000 | [diff] [blame] | 469 | struct neighbour *n = dst->ops->neigh_lookup(dst, NULL, daddr); |
| 470 | return IS_ERR(n) ? NULL : n; |
David S. Miller | f894cbf | 2012-07-02 21:52:24 -0700 | [diff] [blame] | 471 | } |
| 472 | |
| 473 | static inline struct neighbour *dst_neigh_lookup_skb(const struct dst_entry *dst, |
| 474 | struct sk_buff *skb) |
| 475 | { |
Zhouyi Zhou | aaa0c23 | 2013-03-14 17:21:50 +0000 | [diff] [blame] | 476 | struct neighbour *n = dst->ops->neigh_lookup(dst, skb, NULL); |
| 477 | return IS_ERR(n) ? NULL : n; |
David S. Miller | d3aaeb3 | 2011-07-18 00:40:17 -0700 | [diff] [blame] | 478 | } |
| 479 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 480 | static inline void dst_link_failure(struct sk_buff *skb) |
| 481 | { |
Eric Dumazet | adf3090 | 2009-06-02 05:19:30 +0000 | [diff] [blame] | 482 | struct dst_entry *dst = skb_dst(skb); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 483 | if (dst && dst->ops && dst->ops->link_failure) |
| 484 | dst->ops->link_failure(skb); |
| 485 | } |
| 486 | |
| 487 | static inline void dst_set_expires(struct dst_entry *dst, int timeout) |
| 488 | { |
| 489 | unsigned long expires = jiffies + timeout; |
| 490 | |
| 491 | if (expires == 0) |
| 492 | expires = 1; |
| 493 | |
| 494 | if (dst->expires == 0 || time_before(expires, dst->expires)) |
| 495 | dst->expires = expires; |
| 496 | } |
| 497 | |
| 498 | /* Output packet to network from transport. */ |
Eric W. Biederman | 13206b6 | 2015-10-07 16:48:35 -0500 | [diff] [blame] | 499 | static inline int dst_output(struct net *net, struct sock *sk, struct sk_buff *skb) |
Eric Dumazet | aad8872 | 2014-04-15 13:47:15 -0400 | [diff] [blame] | 500 | { |
Eric W. Biederman | ede2059 | 2015-10-07 16:48:47 -0500 | [diff] [blame] | 501 | return skb_dst(skb)->output(net, sk, skb); |
Eric Dumazet | aad8872 | 2014-04-15 13:47:15 -0400 | [diff] [blame] | 502 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 503 | |
| 504 | /* Input packet from network to transport. */ |
| 505 | static inline int dst_input(struct sk_buff *skb) |
| 506 | { |
Eric Dumazet | adf3090 | 2009-06-02 05:19:30 +0000 | [diff] [blame] | 507 | return skb_dst(skb)->input(skb); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 508 | } |
| 509 | |
| 510 | static inline struct dst_entry *dst_check(struct dst_entry *dst, u32 cookie) |
| 511 | { |
| 512 | if (dst->obsolete) |
| 513 | dst = dst->ops->check(dst, cookie); |
| 514 | return dst; |
| 515 | } |
| 516 | |
/* Initialisation hook of the dst subsystem; defined outside this header. */
void dst_subsys_init(void);
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 518 | |
/* Flags for xfrm_lookup flags argument (one bit each, may be OR-ed). */
enum {
	XFRM_LOOKUP_ICMP		= (1 << 0),
	XFRM_LOOKUP_QUEUE		= (1 << 1),
	XFRM_LOOKUP_KEEP_DST_REF	= (1 << 2),
};
| 525 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 526 | struct flowi; |
| 527 | #ifndef CONFIG_XFRM |
/*
 * Stub used when CONFIG_XFRM is disabled: no transformation is applied
 * and @dst_orig is returned unchanged.
 */
static inline struct dst_entry *xfrm_lookup(struct net *net,
					    struct dst_entry *dst_orig,
					    const struct flowi *fl,
					    const struct sock *sk,
					    int flags)
{
	struct dst_entry *unchanged = dst_orig;

	return unchanged;
}
| 536 | |
/*
 * Stub used when CONFIG_XFRM is disabled: no transformation is applied
 * and @dst_orig is returned unchanged.
 */
static inline struct dst_entry *xfrm_lookup_route(struct net *net,
						  struct dst_entry *dst_orig,
						  const struct flowi *fl,
						  const struct sock *sk,
						  int flags)
{
	struct dst_entry *unchanged = dst_orig;

	return unchanged;
}
Vlad Yasevich | e87b399 | 2013-10-15 22:01:29 -0400 | [diff] [blame] | 545 | |
/* Stub used when CONFIG_XFRM is disabled: a dst never has an xfrm state. */
static inline struct xfrm_state *dst_xfrm(const struct dst_entry *dst)
{
	struct xfrm_state *none = NULL;

	return none;
}
| 550 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 551 | #else |
/*
 * Real lookup entry points, used when CONFIG_XFRM is enabled and defined
 * outside this header.  @flags takes the XFRM_LOOKUP_* values.
 */
struct dst_entry *xfrm_lookup(struct net *net,
			      struct dst_entry *dst_orig,
			      const struct flowi *fl,
			      const struct sock *sk,
			      int flags);

struct dst_entry *xfrm_lookup_route(struct net *net,
				    struct dst_entry *dst_orig,
				    const struct flowi *fl,
				    const struct sock *sk,
				    int flags);
| 559 | |
Vlad Yasevich | e87b399 | 2013-10-15 22:01:29 -0400 | [diff] [blame] | 560 | /* skb attached with this dst needs transformation if dst->xfrm is valid */ |
| 561 | static inline struct xfrm_state *dst_xfrm(const struct dst_entry *dst) |
| 562 | { |
| 563 | return dst->xfrm; |
| 564 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 565 | #endif |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 566 | |
| 567 | #endif /* _NET_DST_H */ |