blob: 0933c7455a3014656b0d0b7dd5fc44dffb5c4563 [file] [log] [blame]
Eric W. Biederman5f256be2007-09-12 11:50:50 +02001/*
2 * Operations on the network namespace
3 */
4#ifndef __NET_NET_NAMESPACE_H
5#define __NET_NET_NAMESPACE_H
6
Arun Sharma600634972011-07-26 16:09:06 -07007#include <linux/atomic.h>
Eric W. Biederman5f256be2007-09-12 11:50:50 +02008#include <linux/workqueue.h>
9#include <linux/list.h>
David S. Millerbee95252011-05-26 16:40:37 -040010#include <linux/sysctl.h>
Eric W. Biederman5f256be2007-09-12 11:50:50 +020011
Cong Wang6a662712014-04-15 16:25:34 -070012#include <net/flow.h>
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -070013#include <net/netns/core.h>
Pavel Emelyanov852566f52008-07-18 04:01:24 -070014#include <net/netns/mib.h>
Denis V. Luneva0a53c82007-12-11 04:19:17 -080015#include <net/netns/unix.h>
Denis V. Lunev2aaef4e2007-12-11 04:19:54 -080016#include <net/netns/packet.h>
Pavel Emelyanov8afd3512007-12-16 13:29:36 -080017#include <net/netns/ipv4.h>
Daniel Lezcanob0f159d2008-01-10 02:49:06 -080018#include <net/netns/ipv6.h>
Alexander Aring633fc862014-02-28 07:32:49 +010019#include <net/netns/ieee802154_6lowpan.h>
Eric W. Biederman4db67e82012-08-06 08:42:04 +000020#include <net/netns/sctp.h>
Pavel Emelyanov67019cc2008-04-13 22:28:42 -070021#include <net/netns/dccp.h>
Gao fengf3c1a442013-03-24 23:50:39 +000022#include <net/netns/netfilter.h>
Alexey Dobriyan8d870052008-01-31 04:02:13 -080023#include <net/netns/x_tables.h>
Alexey Dobriyandfdb8d72008-10-08 11:35:02 +020024#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
25#include <net/netns/conntrack.h>
26#endif
Pablo Neira Ayuso99633ab2013-10-10 23:28:33 +020027#include <net/netns/nftables.h>
Alexey Dobriyand62ddc22008-11-25 17:14:31 -080028#include <net/netns/xfrm.h>
Eric W. Biederman01891972015-03-03 19:10:47 -060029#include <net/netns/mpls.h>
Al Viro435d5f42014-10-31 22:56:04 -040030#include <linux/ns_common.h>
Pablo Neira Ayuso04c52de2015-06-17 10:28:25 -050031#include <linux/idr.h>
32#include <linux/skbuff.h>
Denis V. Luneva0a53c82007-12-11 04:19:17 -080033
/*
 * Types this header refers to only through pointers; a forward
 * declaration is enough, so their full definitions are not pulled in.
 * Each type is declared exactly once.
 */
struct user_namespace;
struct proc_dir_entry;
struct net_device;
struct sock;
struct ctl_table_header;
struct net_generic;
struct netns_ipvs;
Pavel Emelyanov1597fbc2007-12-01 23:51:01 +110042
Eric Dumazet7c28bd02009-10-24 06:13:17 -070043
/* Width, in bits, of the per-namespace net_device hash tables. */
#define NETDEV_HASHBITS		8
/* Bucket count derived from the bit width (2^NETDEV_HASHBITS). */
#define NETDEV_HASHENTRIES	(1 << NETDEV_HASHBITS)
46
Eric W. Biederman5f256be2007-09-12 11:50:50 +020047struct net {
Al Viroa685e082011-06-08 21:13:01 -040048 atomic_t passive; /* To decided when the network
49 * namespace should be freed.
50 */
Eric W. Biederman5f256be2007-09-12 11:50:50 +020051 atomic_t count; /* To decided when the network
Al Viroa685e082011-06-08 21:13:01 -040052 * namespace should be shut down.
Eric W. Biederman5f256be2007-09-12 11:50:50 +020053 */
Eric Dumazet8e602ce2010-10-14 05:56:18 +000054 spinlock_t rules_mod_lock;
55
Eric Dumazet33cf7c92015-03-11 18:53:14 -070056 atomic64_t cookie_gen;
57
Eric W. Biederman5f256be2007-09-12 11:50:50 +020058 struct list_head list; /* list of network namespaces */
Eric W. Biederman2b035b32009-11-29 22:25:27 +000059 struct list_head cleanup_list; /* namespaces on death row */
Eric W. Biederman72ad9372009-12-03 02:29:03 +000060 struct list_head exit_list; /* Use only net_mutex */
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020061
Eric W. Biederman038e7332012-06-14 02:31:10 -070062 struct user_namespace *user_ns; /* Owning user namespace */
WANG Congde133462015-05-15 14:47:32 -070063 spinlock_t nsid_lock;
Nicolas Dichtel0c7aecd2015-01-15 15:11:15 +010064 struct idr netns_ids;
Eric W. Biederman038e7332012-06-14 02:31:10 -070065
Al Viro435d5f42014-10-31 22:56:04 -040066 struct ns_common ns;
Eric W. Biederman98f842e2011-06-15 10:21:48 -070067
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020068 struct proc_dir_entry *proc_net;
69 struct proc_dir_entry *proc_net_stat;
Eric W. Biederman881d9662007-09-17 11:56:21 -070070
Al Viro73455092008-07-14 21:22:20 -040071#ifdef CONFIG_SYSCTL
72 struct ctl_table_set sysctls;
73#endif
Eric W. Biederman95bdfcc2007-11-30 23:55:42 +110074
Eric Dumazet8e602ce2010-10-14 05:56:18 +000075 struct sock *rtnl; /* rtnetlink socket */
76 struct sock *genl_sock;
Eric W. Biederman2774c7a2007-09-26 22:10:56 -070077
Eric W. Biederman881d9662007-09-17 11:56:21 -070078 struct list_head dev_base_head;
79 struct hlist_head *dev_name_head;
80 struct hlist_head *dev_index_head;
Thomas Graf4e985ad2011-06-21 03:11:20 +000081 unsigned int dev_base_seq; /* protected by rtnl_mutex */
Pavel Emelyanovaa79e662012-08-08 21:53:19 +000082 int ifindex;
Eric W. Biederman50624c92013-09-23 21:19:49 -070083 unsigned int dev_unreg_count;
Denis V. Lunev97c53ca2007-11-19 22:26:51 -080084
Denis V. Lunev5fd30ee2008-01-10 03:20:28 -080085 /* core fib_rules */
86 struct list_head rules_ops;
Denis V. Lunev5fd30ee2008-01-10 03:20:28 -080087
Denis V. Lunevd12d01d2007-11-19 22:28:35 -080088
Eric Dumazet8e602ce2010-10-14 05:56:18 +000089 struct net_device *loopback_dev; /* The loopback */
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -070090 struct netns_core core;
Pavel Emelyanov852566f52008-07-18 04:01:24 -070091 struct netns_mib mib;
Denis V. Lunev2aaef4e2007-12-11 04:19:54 -080092 struct netns_packet packet;
Denis V. Luneva0a53c82007-12-11 04:19:17 -080093 struct netns_unix unx;
Pavel Emelyanov8afd3512007-12-16 13:29:36 -080094 struct netns_ipv4 ipv4;
Eric Dumazetdfd56b82011-12-10 09:48:31 +000095#if IS_ENABLED(CONFIG_IPV6)
Daniel Lezcanob0f159d2008-01-10 02:49:06 -080096 struct netns_ipv6 ipv6;
97#endif
Alexander Aring633fc862014-02-28 07:32:49 +010098#if IS_ENABLED(CONFIG_IEEE802154_6LOWPAN)
99 struct netns_ieee802154_lowpan ieee802154_lowpan;
100#endif
Eric W. Biederman4db67e82012-08-06 08:42:04 +0000101#if defined(CONFIG_IP_SCTP) || defined(CONFIG_IP_SCTP_MODULE)
102 struct netns_sctp sctp;
103#endif
Pavel Emelyanov67019cc2008-04-13 22:28:42 -0700104#if defined(CONFIG_IP_DCCP) || defined(CONFIG_IP_DCCP_MODULE)
105 struct netns_dccp dccp;
106#endif
Alexey Dobriyan8d870052008-01-31 04:02:13 -0800107#ifdef CONFIG_NETFILTER
Gao fengf3c1a442013-03-24 23:50:39 +0000108 struct netns_nf nf;
Alexey Dobriyan8d870052008-01-31 04:02:13 -0800109 struct netns_xt xt;
Alexey Dobriyandfdb8d72008-10-08 11:35:02 +0200110#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
111 struct netns_ct ct;
112#endif
Pablo Neira Ayuso99633ab2013-10-10 23:28:33 +0200113#if defined(CONFIG_NF_TABLES) || defined(CONFIG_NF_TABLES_MODULE)
114 struct netns_nftables nft;
115#endif
Amerigo Wangc038a762012-09-18 16:50:08 +0000116#if IS_ENABLED(CONFIG_NF_DEFRAG_IPV6)
117 struct netns_nf_frag nf_frag;
118#endif
Alexey Dobriyancd8c20b2010-01-13 16:02:14 +0100119 struct sock *nfnl;
120 struct sock *nfnl_stash;
Andreas Schultz3499abb2015-08-05 17:51:45 +0200121#if IS_ENABLED(CONFIG_NETFILTER_NETLINK_ACCT)
122 struct list_head nfnl_acct_list;
123#endif
Pablo Neira19576c92015-12-09 14:07:40 +0100124#if IS_ENABLED(CONFIG_NF_CT_NETLINK_TIMEOUT)
125 struct list_head nfct_timeout_list;
126#endif
Alexey Dobriyan8d870052008-01-31 04:02:13 -0800127#endif
Johannes Berg3d23e342009-09-29 23:27:28 +0200128#ifdef CONFIG_WEXT_CORE
Johannes Bergb333b3d222009-06-24 01:34:48 +0000129 struct sk_buff_head wext_nlevents;
130#endif
Eric Dumazet1c877332010-10-25 03:20:11 +0000131 struct net_generic __rcu *gen;
Eric Dumazet8e602ce2010-10-14 05:56:18 +0000132
133 /* Note : following structs are cache line aligned */
134#ifdef CONFIG_XFRM
135 struct netns_xfrm xfrm;
136#endif
JunweiZhang8b4d14d2013-06-26 16:40:06 +0800137#if IS_ENABLED(CONFIG_IP_VS)
Hans Schillstrom61b1ab42011-01-03 14:44:42 +0100138 struct netns_ipvs *ipvs;
JunweiZhang8b4d14d2013-06-26 16:40:06 +0800139#endif
Eric W. Biederman01891972015-03-03 19:10:47 -0600140#if IS_ENABLED(CONFIG_MPLS)
141 struct netns_mpls mpls;
142#endif
Andrey Vagin51d7ccc2012-07-16 04:28:49 +0000143 struct sock *diag_nlsk;
Timo Teräs5aad1de2013-05-27 20:46:33 +0000144 atomic_t fnhe_genid;
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200145};
146
Denis V. Lunevc0f39322008-04-02 00:10:28 -0700147#include <linux/seq_file_net.h>
148
Daniel Lezcano4fabcd72007-09-13 09:16:29 +0200149/* Init's network namespace */
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200150extern struct net init_net;
Denis V. Luneva4aa8342008-04-03 13:04:33 -0700151
Eric W. Biedermand727abc2012-06-14 02:16:42 -0700152#ifdef CONFIG_NET_NS
Joe Perchese67e16e2013-09-21 10:22:48 -0700153struct net *copy_net_ns(unsigned long flags, struct user_namespace *user_ns,
154 struct net *old_net);
Denis V. Lunev225c0a02008-04-02 00:09:29 -0700155
Eric W. Biedermand727abc2012-06-14 02:16:42 -0700156#else /* CONFIG_NET_NS */
157#include <linux/sched.h>
158#include <linux/nsproxy.h>
Eric W. Biederman038e7332012-06-14 02:31:10 -0700159static inline struct net *copy_net_ns(unsigned long flags,
160 struct user_namespace *user_ns, struct net *old_net)
Eric W. Biederman9dd776b2007-09-26 22:04:26 -0700161{
Eric W. Biedermand727abc2012-06-14 02:16:42 -0700162 if (flags & CLONE_NEWNET)
163 return ERR_PTR(-EINVAL);
164 return old_net;
Eric W. Biederman9dd776b2007-09-26 22:04:26 -0700165}
Eric W. Biedermand727abc2012-06-14 02:16:42 -0700166#endif /* CONFIG_NET_NS */
Denis V. Lunev225c0a02008-04-02 00:09:29 -0700167
168
169extern struct list_head net_namespace_list;
Eric W. Biederman9dd776b2007-09-26 22:04:26 -0700170
/* Look up a network namespace from a process id. */
struct net *get_net_ns_by_pid(pid_t pid);
/* Look up a network namespace from a file descriptor. */
struct net *get_net_ns_by_fd(int fd);
Johannes Berg30ffee82009-07-10 09:51:35 +0000173
/*
 * IPX sysctl hooks.  They are real functions when CONFIG_SYSCTL is set
 * and expand to nothing otherwise, so callers need no #ifdef.
 */
#ifndef CONFIG_SYSCTL
#define ipx_register_sysctl()
#define ipx_unregister_sysctl()
#else
void ipx_register_sysctl(void);
void ipx_unregister_sysctl(void);
#endif
181
Pavel Emelyanovd4655792007-11-01 00:43:49 -0700182#ifdef CONFIG_NET_NS
Joe Perchese67e16e2013-09-21 10:22:48 -0700183void __put_net(struct net *net);
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200184
185static inline struct net *get_net(struct net *net)
186{
187 atomic_inc(&net->count);
188 return net;
189}
190
Eric W. Biederman077130c2007-09-13 09:18:57 +0200191static inline struct net *maybe_get_net(struct net *net)
192{
193 /* Used when we know struct net exists but we
194 * aren't guaranteed a previous reference count
195 * exists. If the reference count is zero this
196 * function fails and returns NULL.
197 */
198 if (!atomic_inc_not_zero(&net->count))
199 net = NULL;
200 return net;
201}
202
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200203static inline void put_net(struct net *net)
204{
205 if (atomic_dec_and_test(&net->count))
206 __put_net(net);
207}
208
/* net_eq - return 1 when both pointers name the same namespace, else 0. */
static inline int net_eq(const struct net *net1, const struct net *net2)
{
	if (net1 != net2)
		return 0;

	return 1;
}
Al Viroa685e082011-06-08 21:13:01 -0400214
Joe Perchese67e16e2013-09-21 10:22:48 -0700215void net_drop_ns(void *);
Al Viroa685e082011-06-08 21:13:01 -0400216
Pavel Emelyanovd4655792007-11-01 00:43:49 -0700217#else
Eric W. Biedermanb9f75f42008-06-20 22:16:51 -0700218
/*
 * !CONFIG_NET_NS variants of the reference helpers.  No counting is
 * done: the getters return their argument unchanged, put_net() does
 * nothing and any two namespaces compare equal.
 */
static inline struct net *get_net(struct net *net)
{
	return net;
}

static inline struct net *maybe_get_net(struct net *net)
{
	return net;
}

static inline void put_net(struct net *net)
{
}

static inline int net_eq(const struct net *net1, const struct net *net2)
{
	return 1;
}

/* No drop callback is provided in this configuration. */
#define net_drop_ns NULL
Pavel Emelyanovd4655792007-11-01 00:43:49 -0700240#endif
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200241
Denis V. Lunev5d1e4462008-04-16 01:58:04 -0700242
Eric W. Biederman0c5c9fb2015-03-11 23:06:44 -0500243typedef struct {
Eric Dumazet8f424b52008-11-12 00:53:30 -0800244#ifdef CONFIG_NET_NS
Eric W. Biederman0c5c9fb2015-03-11 23:06:44 -0500245 struct net *net;
Eric Dumazet8f424b52008-11-12 00:53:30 -0800246#endif
Eric W. Biederman0c5c9fb2015-03-11 23:06:44 -0500247} possible_net_t;
248
249static inline void write_pnet(possible_net_t *pnet, struct net *net)
250{
251#ifdef CONFIG_NET_NS
252 pnet->net = net;
253#endif
254}
255
256static inline struct net *read_pnet(const possible_net_t *pnet)
257{
258#ifdef CONFIG_NET_NS
259 return pnet->net;
260#else
261 return &init_net;
262#endif
263}
Denis V. Lunev5d1e4462008-04-16 01:58:04 -0700264
/* Walk every entry of net_namespace_list, binding each one to VAR. */
#define for_each_net(VAR) list_for_each_entry(VAR, &net_namespace_list, list)

/* Same walk, using the RCU list iterator. */
#define for_each_net_rcu(VAR) list_for_each_entry_rcu(VAR, &net_namespace_list, list)
270
/*
 * Section annotations for per-namespace init/exit code and data.
 * Without CONFIG_NET_NS they map onto the regular __init family (with
 * __ref for exit code); with it they expand to nothing.
 */
#ifndef CONFIG_NET_NS
#define __net_init	__init
#define __net_exit	__ref
#define __net_initdata	__initdata
#define __net_initconst	__initconst
#else
#define __net_init
#define __net_exit
#define __net_initdata
#define __net_initconst
#endif
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200282
/*
 * Id <-> peer namespace helpers, defined out of line.  The ids are
 * presumably the ones tracked in net->netns_ids (confirm against the
 * implementation).
 */
int peernet2id_alloc(struct net *net, struct net *peer);
int peernet2id(struct net *net, struct net *peer);
bool peernet_has_id(struct net *net, struct net *peer);

struct net *get_net_ns_by_id(struct net *net, int id);
287
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200288struct pernet_operations {
289 struct list_head list;
290 int (*init)(struct net *net);
291 void (*exit)(struct net *net);
Eric W. Biederman72ad9372009-12-03 02:29:03 +0000292 void (*exit_batch)(struct list_head *net_exit_list);
Eric W. Biedermanf875bae2009-11-29 22:25:28 +0000293 int *id;
294 size_t size;
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200295};
296
/*
 * Choosing between the two registration flavours matters:
 *
 *  - a network device driver that needs per-namespace operations must
 *    use the "device" variants;
 *  - everything else must use the "subsys" variants.
 *
 * Network interfaces have to be removed from a dying netns _before_ the
 * subsys notifiers run.  Most network cleanup code (which is driven from
 * subsys notifiers) assumes dev_remove_pack has been called, so that no
 * new packets arrive during or after cleanup.  dev_remove_pack is not
 * per namespace; the "no more packets" guarantee is instead provided by
 * making sure all network devices and all sockets have left the
 * namespace before the cleanup methods are called.
 *
 * For a long time the ipv4 icmp code was registered as a pernet device,
 * which caused kernel oopses and panics during namespace cleanup.  So
 * please don't get this wrong.
 */
int register_pernet_subsys(struct pernet_operations *ops);
void unregister_pernet_subsys(struct pernet_operations *ops);

int register_pernet_device(struct pernet_operations *ops);
void unregister_pernet_device(struct pernet_operations *ops);
Eric W. Biedermanf875bae2009-11-29 22:25:28 +0000320
struct ctl_table;
struct ctl_table_header;

/*
 * Network sysctl registration API.  Without CONFIG_SYSCTL the calls turn
 * into inline stubs: initialisation reports success (0), registration
 * returns NULL and unregistration does nothing.
 */
#ifndef CONFIG_SYSCTL
static inline int net_sysctl_init(void)
{
	return 0;
}

static inline struct ctl_table_header *register_net_sysctl(struct net *net,
	const char *path, struct ctl_table *table)
{
	return NULL;
}

static inline void unregister_net_sysctl_table(struct ctl_table_header *header)
{
}
#else
int net_sysctl_init(void);
struct ctl_table_header *register_net_sysctl(struct net *net, const char *path,
					     struct ctl_table *table);
void unregister_net_sysctl_table(struct ctl_table_header *header);
#endif
340
fan.duca4c3fc2013-07-30 08:33:53 +0800341static inline int rt_genid_ipv4(struct net *net)
Nicolas Dichtelb42664f2012-09-10 22:09:44 +0000342{
fan.duca4c3fc2013-07-30 08:33:53 +0800343 return atomic_read(&net->ipv4.rt_genid);
Nicolas Dichtelb42664f2012-09-10 22:09:44 +0000344}
345
fan.duca4c3fc2013-07-30 08:33:53 +0800346static inline void rt_genid_bump_ipv4(struct net *net)
Nicolas Dichtelb42664f2012-09-10 22:09:44 +0000347{
fan.duca4c3fc2013-07-30 08:33:53 +0800348 atomic_inc(&net->ipv4.rt_genid);
349}
350
/* Hook defined elsewhere; it may be NULL, which is why it is tested first. */
extern void (*__fib6_flush_trees)(struct net *net);

/*
 * rt_genid_bump_ipv6 - invoke the __fib6_flush_trees hook for @net, or do
 * nothing when no hook is installed.
 */
static inline void rt_genid_bump_ipv6(struct net *net)
{
	if (!__fib6_flush_trees)
		return;

	__fib6_flush_trees(net);
}
fan.duca4c3fc2013-07-30 08:33:53 +0800357
Luis R. Rodriguez599018a2014-04-17 18:22:54 -0700358#if IS_ENABLED(CONFIG_IEEE802154_6LOWPAN)
359static inline struct netns_ieee802154_lowpan *
360net_ieee802154_lowpan(struct net *net)
361{
362 return &net->ieee802154_lowpan;
363}
Luis R. Rodriguez599018a2014-04-17 18:22:54 -0700364#endif
365
/*
 * rt_genid_bump_all - bump for both address families, for callers that do
 * not care whether the change concerns IPv4 or IPv6.  IPv4 is handled
 * first, then IPv6.
 */
static inline void rt_genid_bump_all(struct net *net)
{
	rt_genid_bump_ipv4(net);
	rt_genid_bump_ipv6(net);
}
Eric W. Biederman95bdfcc2007-11-30 23:55:42 +1100372
Timo Teräs5aad1de2013-05-27 20:46:33 +0000373static inline int fnhe_genid(struct net *net)
374{
375 return atomic_read(&net->fnhe_genid);
376}
377
378static inline void fnhe_genid_bump(struct net *net)
379{
380 atomic_inc(&net->fnhe_genid);
381}
382
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200383#endif /* __NET_NET_NAMESPACE_H */