/*
 * Operations on the network namespace
 */
4#ifndef __NET_NET_NAMESPACE_H
5#define __NET_NET_NAMESPACE_H
6
Arun Sharma600634972011-07-26 16:09:06 -07007#include <linux/atomic.h>
Eric W. Biederman5f256be2007-09-12 11:50:50 +02008#include <linux/workqueue.h>
9#include <linux/list.h>
David S. Millerbee95252011-05-26 16:40:37 -040010#include <linux/sysctl.h>
Eric W. Biederman5f256be2007-09-12 11:50:50 +020011
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -070012#include <net/netns/core.h>
Pavel Emelyanov852566f52008-07-18 04:01:24 -070013#include <net/netns/mib.h>
Denis V. Luneva0a53c82007-12-11 04:19:17 -080014#include <net/netns/unix.h>
Denis V. Lunev2aaef4e2007-12-11 04:19:54 -080015#include <net/netns/packet.h>
Pavel Emelyanov8afd3512007-12-16 13:29:36 -080016#include <net/netns/ipv4.h>
Daniel Lezcanob0f159d2008-01-10 02:49:06 -080017#include <net/netns/ipv6.h>
Eric W. Biederman4db67e82012-08-06 08:42:04 +000018#include <net/netns/sctp.h>
Pavel Emelyanov67019cc2008-04-13 22:28:42 -070019#include <net/netns/dccp.h>
Alexey Dobriyan8d870052008-01-31 04:02:13 -080020#include <net/netns/x_tables.h>
Alexey Dobriyandfdb8d72008-10-08 11:35:02 +020021#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
22#include <net/netns/conntrack.h>
23#endif
Alexey Dobriyand62ddc22008-11-25 17:14:31 -080024#include <net/netns/xfrm.h>
Denis V. Luneva0a53c82007-12-11 04:19:17 -080025
/*
 * Forward declarations for types that this header only refers to
 * through pointers.
 */
struct proc_dir_entry;
struct net_device;
struct sock;
struct ctl_table_header;
struct net_generic;
struct netns_ipvs;
Pavel Emelyanov1597fbc2007-12-01 23:51:01 +110033
Eric Dumazet7c28bd02009-10-24 06:13:17 -070034
/* Number of hash bits, and the resulting bucket count (2^bits). */
#define NETDEV_HASHBITS    8
#define NETDEV_HASHENTRIES (1 << NETDEV_HASHBITS)
37
Eric W. Biederman5f256be2007-09-12 11:50:50 +020038struct net {
Al Viroa685e082011-06-08 21:13:01 -040039 atomic_t passive; /* To decided when the network
40 * namespace should be freed.
41 */
Eric W. Biederman5f256be2007-09-12 11:50:50 +020042 atomic_t count; /* To decided when the network
Al Viroa685e082011-06-08 21:13:01 -040043 * namespace should be shut down.
Eric W. Biederman5f256be2007-09-12 11:50:50 +020044 */
Denis V. Lunev5d1e4462008-04-16 01:58:04 -070045#ifdef NETNS_REFCNT_DEBUG
Eric W. Biederman5f256be2007-09-12 11:50:50 +020046 atomic_t use_count; /* To track references we
47 * destroy on demand
48 */
Denis V. Lunev5d1e4462008-04-16 01:58:04 -070049#endif
Eric Dumazet8e602ce2010-10-14 05:56:18 +000050 spinlock_t rules_mod_lock;
51
Eric W. Biederman5f256be2007-09-12 11:50:50 +020052 struct list_head list; /* list of network namespaces */
Eric W. Biederman2b035b32009-11-29 22:25:27 +000053 struct list_head cleanup_list; /* namespaces on death row */
Eric W. Biederman72ad9372009-12-03 02:29:03 +000054 struct list_head exit_list; /* Use only net_mutex */
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020055
56 struct proc_dir_entry *proc_net;
57 struct proc_dir_entry *proc_net_stat;
Eric W. Biederman881d9662007-09-17 11:56:21 -070058
Al Viro73455092008-07-14 21:22:20 -040059#ifdef CONFIG_SYSCTL
60 struct ctl_table_set sysctls;
61#endif
Eric W. Biederman95bdfcc2007-11-30 23:55:42 +110062
Eric Dumazet8e602ce2010-10-14 05:56:18 +000063 struct sock *rtnl; /* rtnetlink socket */
64 struct sock *genl_sock;
Eric W. Biederman2774c7a2007-09-26 22:10:56 -070065
Eric W. Biederman881d9662007-09-17 11:56:21 -070066 struct list_head dev_base_head;
67 struct hlist_head *dev_name_head;
68 struct hlist_head *dev_index_head;
Thomas Graf4e985ad2011-06-21 03:11:20 +000069 unsigned int dev_base_seq; /* protected by rtnl_mutex */
Pavel Emelyanovaa79e662012-08-08 21:53:19 +000070 int ifindex;
Denis V. Lunev97c53ca2007-11-19 22:26:51 -080071
Denis V. Lunev5fd30ee2008-01-10 03:20:28 -080072 /* core fib_rules */
73 struct list_head rules_ops;
Denis V. Lunev5fd30ee2008-01-10 03:20:28 -080074
Denis V. Lunevd12d01d2007-11-19 22:28:35 -080075
Eric Dumazet8e602ce2010-10-14 05:56:18 +000076 struct net_device *loopback_dev; /* The loopback */
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -070077 struct netns_core core;
Pavel Emelyanov852566f52008-07-18 04:01:24 -070078 struct netns_mib mib;
Denis V. Lunev2aaef4e2007-12-11 04:19:54 -080079 struct netns_packet packet;
Denis V. Luneva0a53c82007-12-11 04:19:17 -080080 struct netns_unix unx;
Pavel Emelyanov8afd3512007-12-16 13:29:36 -080081 struct netns_ipv4 ipv4;
Eric Dumazetdfd56b82011-12-10 09:48:31 +000082#if IS_ENABLED(CONFIG_IPV6)
Daniel Lezcanob0f159d2008-01-10 02:49:06 -080083 struct netns_ipv6 ipv6;
84#endif
Eric W. Biederman4db67e82012-08-06 08:42:04 +000085#if defined(CONFIG_IP_SCTP) || defined(CONFIG_IP_SCTP_MODULE)
86 struct netns_sctp sctp;
87#endif
Pavel Emelyanov67019cc2008-04-13 22:28:42 -070088#if defined(CONFIG_IP_DCCP) || defined(CONFIG_IP_DCCP_MODULE)
89 struct netns_dccp dccp;
90#endif
Alexey Dobriyan8d870052008-01-31 04:02:13 -080091#ifdef CONFIG_NETFILTER
92 struct netns_xt xt;
Alexey Dobriyandfdb8d72008-10-08 11:35:02 +020093#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
94 struct netns_ct ct;
95#endif
Alexey Dobriyancd8c20b2010-01-13 16:02:14 +010096 struct sock *nfnl;
97 struct sock *nfnl_stash;
Alexey Dobriyan8d870052008-01-31 04:02:13 -080098#endif
Johannes Berg3d23e342009-09-29 23:27:28 +020099#ifdef CONFIG_WEXT_CORE
Johannes Bergb333b3d222009-06-24 01:34:48 +0000100 struct sk_buff_head wext_nlevents;
101#endif
Eric Dumazet1c877332010-10-25 03:20:11 +0000102 struct net_generic __rcu *gen;
Eric Dumazet8e602ce2010-10-14 05:56:18 +0000103
104 /* Note : following structs are cache line aligned */
105#ifdef CONFIG_XFRM
106 struct netns_xfrm xfrm;
107#endif
Hans Schillstrom61b1ab42011-01-03 14:44:42 +0100108 struct netns_ipvs *ipvs;
Andrey Vagin51d7ccc2012-07-16 04:28:49 +0000109 struct sock *diag_nlsk;
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200110};
111
/*
 * ifindex generation is per-net namespace, and loopback is
 * always the 1st device in ns (see net_dev_init), thus any
 * loopback device should get ifindex 1
 */

#define LOOPBACK_IFINDEX	1
Denis V. Lunev225c0a02008-04-02 00:09:29 -0700119
Denis V. Lunevc0f39322008-04-02 00:10:28 -0700120#include <linux/seq_file_net.h>
121
/* Init's network namespace */
extern struct net init_net;
Denis V. Luneva4aa8342008-04-03 13:04:33 -0700124
#ifdef CONFIG_NET
/* Defined out of line when networking is built in. */
extern struct net *copy_net_ns(unsigned long flags, struct net *net_ns);

#else /* CONFIG_NET */
/*
 * Stub used when CONFIG_NET is off: @flags is ignored and @net_ns is
 * returned unchanged.
 */
static inline struct net *copy_net_ns(unsigned long flags, struct net *net_ns)
{
	/* There is nothing to copy so this is a noop */
	return net_ns;
}
#endif /* CONFIG_NET */
135
136
/* List head walked by for_each_net() and for_each_net_rcu(). */
extern struct list_head net_namespace_list;

/* Namespace lookups keyed by a process id and by a file descriptor. */
extern struct net *get_net_ns_by_pid(pid_t pid);
extern struct net *get_net_ns_by_fd(int fd);
Johannes Berg30ffee82009-07-10 09:51:35 +0000141
#ifdef CONFIG_NET_NS
/* Defined out of line; put_net() calls it once net->count reaches zero. */
extern void __put_net(struct net *net);

/* Take a reference on @net by incrementing net->count; returns @net. */
static inline struct net *get_net(struct net *net)
{
	atomic_inc(&net->count);
	return net;
}

static inline struct net *maybe_get_net(struct net *net)
{
	/* Used when we know struct net exists but we
	 * aren't guaranteed a previous reference count
	 * exists.  If the reference count is zero this
	 * function fails and returns NULL.
	 */
	if (!atomic_inc_not_zero(&net->count))
		net = NULL;
	return net;
}

/* Drop a reference on @net; call __put_net() when the count hits zero. */
static inline void put_net(struct net *net)
{
	if (atomic_dec_and_test(&net->count))
		__put_net(net);
}

/* Two namespaces are equal only when they are the same object. */
static inline
int net_eq(const struct net *net1, const struct net *net2)
{
	return net1 == net2;
}

extern void net_drop_ns(void *);

#else

/*
 * Without CONFIG_NET_NS the helpers below do no reference counting:
 * the getters hand back their argument and put_net() is empty.
 */
static inline struct net *get_net(struct net *net)
{
	return net;
}

static inline void put_net(struct net *net)
{
}

static inline struct net *maybe_get_net(struct net *net)
{
	return net;
}

/* Without CONFIG_NET_NS every pair of namespaces compares equal. */
static inline
int net_eq(const struct net *net1, const struct net *net2)
{
	return 1;
}

#define net_drop_ns NULL
#endif
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200201
Denis V. Lunev5d1e4462008-04-16 01:58:04 -0700202
#ifdef NETNS_REFCNT_DEBUG
/* Increment net->use_count when @net is non-NULL; returns @net. */
static inline struct net *hold_net(struct net *net)
{
	if (net)
		atomic_inc(&net->use_count);
	return net;
}

/* Decrement net->use_count when @net is non-NULL. */
static inline void release_net(struct net *net)
{
	if (net)
		atomic_dec(&net->use_count);
}
#else
/* Without NETNS_REFCNT_DEBUG nothing is tracked; @net is returned as is. */
static inline struct net *hold_net(struct net *net)
{
	return net;
}

static inline void release_net(struct net *net)
{
}
#endif
226
#ifdef CONFIG_NET_NS

/* Store @net into the namespace pointer slot @pnet. */
static inline void write_pnet(struct net **pnet, struct net *net)
{
	*pnet = net;
}

/* Load the namespace pointer held in the slot @pnet. */
static inline struct net *read_pnet(struct net * const *pnet)
{
	return *pnet;
}

#else

/*
 * Without CONFIG_NET_NS nothing is stored: write_pnet() only evaluates
 * @net, and read_pnet() always yields &init_net.
 */
#define write_pnet(pnet, net)	do { (void)(net); } while (0)
#define read_pnet(pnet)		(&init_net)

#endif
Denis V. Lunev5d1e4462008-04-16 01:58:04 -0700245
/* Iterate VAR over net_namespace_list through each entry's 'list' member. */
#define for_each_net(VAR)				\
	list_for_each_entry(VAR, &net_namespace_list, list)

/* Same walk, using the _rcu list iterator. */
#define for_each_net_rcu(VAR)				\
	list_for_each_entry_rcu(VAR, &net_namespace_list, list)
251
/*
 * Section annotations for per-namespace code and data.  With
 * CONFIG_NET_NS they expand to nothing; otherwise they map onto the
 * corresponding __init/__exit_refok/__initdata annotations.
 */
#ifdef CONFIG_NET_NS
#define __net_init
#define __net_exit
#define __net_initdata
#else
#define __net_init	__init
#define __net_exit	__exit_refok
#define __net_initdata	__initdata
#endif
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200261
262struct pernet_operations {
263 struct list_head list;
264 int (*init)(struct net *net);
265 void (*exit)(struct net *net);
Eric W. Biederman72ad9372009-12-03 02:29:03 +0000266 void (*exit_batch)(struct list_head *net_exit_list);
Eric W. Biedermanf875bae2009-11-29 22:25:28 +0000267 int *id;
268 size_t size;
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200269};
270
/*
 * Use these carefully.  If you implement a network device and it
 * needs per network namespace operations use device pernet operations,
 * otherwise use pernet subsys operations.
 *
 * Network interfaces need to be removed from a dying netns _before_
 * subsys notifiers can be called, as most of the network code cleanup
 * (which is done from subsys notifiers) runs with the assumption that
 * dev_remove_pack has been called so no new packets will arrive during
 * and after the cleanup functions have been called.  dev_remove_pack
 * is not per namespace so instead the guarantee of no more packets
 * arriving in a network namespace is provided by ensuring that all
 * network devices and all sockets have left the network namespace
 * before the cleanup methods are called.
 *
 * For the longest time the ipv4 icmp code was registered as a pernet
 * device which caused kernel oops, and panics during network
 * namespace cleanup.   So please don't get this wrong.
 */
extern int register_pernet_subsys(struct pernet_operations *ops);
extern void unregister_pernet_subsys(struct pernet_operations *ops);
extern int register_pernet_device(struct pernet_operations *ops);
extern void unregister_pernet_device(struct pernet_operations *ops);
Eric W. Biedermanf875bae2009-11-29 22:25:28 +0000294
struct ctl_table;
struct ctl_table_header;

#ifdef CONFIG_SYSCTL
/* Defined out of line when sysctl support is built in. */
extern int net_sysctl_init(void);
extern struct ctl_table_header *register_net_sysctl(struct net *net,
	const char *path, struct ctl_table *table);
extern void unregister_net_sysctl_table(struct ctl_table_header *header);
#else
/*
 * Stubs used when CONFIG_SYSCTL is off: initialisation returns 0,
 * registration returns NULL and unregistration does nothing.
 */
static inline int net_sysctl_init(void) { return 0; }
static inline struct ctl_table_header *register_net_sysctl(struct net *net,
	const char *path, struct ctl_table *table)
{
	return NULL;
}
static inline void unregister_net_sysctl_table(struct ctl_table_header *header)
{
}
#endif
314
Eric W. Biederman95bdfcc2007-11-30 23:55:42 +1100315
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200316#endif /* __NET_NET_NAMESPACE_H */