net_namespace.h 7.9 KB
Newer Older
1 2 3 4 5 6
/*
 * Operations on the network namespace
 */
#ifndef __NET_NET_NAMESPACE_H
#define __NET_NET_NAMESPACE_H

A
Arun Sharma 已提交
7
#include <linux/atomic.h>
8 9
#include <linux/workqueue.h>
#include <linux/list.h>
10
#include <linux/sysctl.h>
11

12
#include <net/netns/core.h>
P
Pavel Emelyanov 已提交
13
#include <net/netns/mib.h>
14
#include <net/netns/unix.h>
15
#include <net/netns/packet.h>
16
#include <net/netns/ipv4.h>
17
#include <net/netns/ipv6.h>
18
#include <net/netns/sctp.h>
19
#include <net/netns/dccp.h>
20
#include <net/netns/x_tables.h>
21 22 23
#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
#include <net/netns/conntrack.h>
#endif
24
#include <net/netns/xfrm.h>
25

26
struct user_namespace;
27
struct proc_dir_entry;
28
struct net_device;
29
struct sock;
30
struct ctl_table_header;
31
struct net_generic;
J
Johannes Berg 已提交
32
struct sock;
J
Julian Anastasov 已提交
33
struct netns_ipvs;
34

35 36 37 38

#define NETDEV_HASHBITS    8
#define NETDEV_HASHENTRIES (1 << NETDEV_HASHBITS)

39
struct net {
40 41 42
	atomic_t		passive;	/* To decided when the network
						 * namespace should be freed.
						 */
43
	atomic_t		count;		/* To decided when the network
44
						 *  namespace should be shut down.
45
						 */
46
#ifdef NETNS_REFCNT_DEBUG
47 48 49
	atomic_t		use_count;	/* To track references we
						 * destroy on demand
						 */
50
#endif
E
Eric Dumazet 已提交
51 52
	spinlock_t		rules_mod_lock;

53
	struct list_head	list;		/* list of network namespaces */
54
	struct list_head	cleanup_list;	/* namespaces on death row */
55
	struct list_head	exit_list;	/* Use only net_mutex */
56

57 58
	struct user_namespace   *user_ns;	/* Owning user namespace */

59 60
	struct proc_dir_entry 	*proc_net;
	struct proc_dir_entry 	*proc_net_stat;
61

62 63 64
#ifdef CONFIG_SYSCTL
	struct ctl_table_set	sysctls;
#endif
65

E
Eric Dumazet 已提交
66 67
	struct sock 		*rtnl;			/* rtnetlink socket */
	struct sock		*genl_sock;
68

69 70 71
	struct list_head 	dev_base_head;
	struct hlist_head 	*dev_name_head;
	struct hlist_head	*dev_index_head;
72
	unsigned int		dev_base_seq;	/* protected by rtnl_mutex */
73
	int			ifindex;
74

75 76 77
	/* core fib_rules */
	struct list_head	rules_ops;

78

E
Eric Dumazet 已提交
79
	struct net_device       *loopback_dev;          /* The loopback */
80
	struct netns_core	core;
P
Pavel Emelyanov 已提交
81
	struct netns_mib	mib;
82
	struct netns_packet	packet;
83
	struct netns_unix	unx;
84
	struct netns_ipv4	ipv4;
E
Eric Dumazet 已提交
85
#if IS_ENABLED(CONFIG_IPV6)
86 87
	struct netns_ipv6	ipv6;
#endif
88 89 90
#if defined(CONFIG_IP_SCTP) || defined(CONFIG_IP_SCTP_MODULE)
	struct netns_sctp	sctp;
#endif
91 92 93
#if defined(CONFIG_IP_DCCP) || defined(CONFIG_IP_DCCP_MODULE)
	struct netns_dccp	dccp;
#endif
94 95
#ifdef CONFIG_NETFILTER
	struct netns_xt		xt;
96 97
#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
	struct netns_ct		ct;
98 99 100
#endif
#if IS_ENABLED(CONFIG_NF_DEFRAG_IPV6)
	struct netns_nf_frag	nf_frag;
101
#endif
102 103
	struct sock		*nfnl;
	struct sock		*nfnl_stash;
104
#endif
J
Johannes Berg 已提交
105
#ifdef CONFIG_WEXT_CORE
106
	struct sk_buff_head	wext_nlevents;
107
#endif
E
Eric Dumazet 已提交
108
	struct net_generic __rcu	*gen;
E
Eric Dumazet 已提交
109 110 111 112 113

	/* Note : following structs are cache line aligned */
#ifdef CONFIG_XFRM
	struct netns_xfrm	xfrm;
#endif
114
	struct netns_ipvs	*ipvs;
A
Andrey Vagin 已提交
115
	struct sock		*diag_nlsk;
116
	atomic_t		rt_genid;
117 118
};

119 120 121 122 123 124 125
/*
 * ifindex generation is per-net namespace, and loopback is
 * always the 1st device in ns (see net_dev_init), thus any
 * loopback device should get ifindex 1
 */

#define LOOPBACK_IFINDEX	1
126

127 128
#include <linux/seq_file_net.h>

129
/* Init's network namespace */
130
extern struct net init_net;
131

132
#ifdef CONFIG_NET_NS
133 134
extern struct net *copy_net_ns(unsigned long flags,
	struct user_namespace *user_ns, struct net *old_net);
135

136 137 138
#else /* CONFIG_NET_NS */
#include <linux/sched.h>
#include <linux/nsproxy.h>
139 140
static inline struct net *copy_net_ns(unsigned long flags,
	struct user_namespace *user_ns, struct net *old_net)
141
{
142 143 144
	if (flags & CLONE_NEWNET)
		return ERR_PTR(-EINVAL);
	return old_net;
145
}
146
#endif /* CONFIG_NET_NS */
147 148 149


extern struct list_head net_namespace_list;
150

151
extern struct net *get_net_ns_by_pid(pid_t pid);
152
/* Counterpart of get_net_ns_by_pid() keyed by a file descriptor. */
extern struct net *get_net_ns_by_fd(int fd);
153

154
#ifdef CONFIG_NET_NS
155 156 157 158 159 160 161 162
extern void __put_net(struct net *net);

/*
 * Take a reference on @net by atomically incrementing net->count.
 * Returns @net so the call can be used directly in an expression.
 */
static inline struct net *get_net(struct net *net)
{
	atomic_inc(&net->count);
	return net;
}

163 164 165 166 167 168 169 170 171 172 173 174
/*
 * Conditionally take a reference on @net.
 *
 * For callers that know the struct net exists but cannot be sure
 * somebody still holds a reference on it.  net->count is only
 * incremented if it is not already zero.
 *
 * Returns @net when the reference was taken, NULL when the count
 * was zero.
 */
static inline struct net *maybe_get_net(struct net *net)
{
	if (atomic_inc_not_zero(&net->count))
		return net;

	return NULL;
}

175 176 177 178 179 180
/*
 * Drop one reference on @net.  When atomic_dec_and_test() reports that
 * net->count reached zero, the namespace is handed to __put_net().
 */
static inline void put_net(struct net *net)
{
	if (!atomic_dec_and_test(&net->count))
		return;

	__put_net(net);
}

181 182 183 184 185
/*
 * Compare two namespaces by pointer identity.
 * Returns 1 when @net1 and @net2 are the same object, 0 otherwise.
 */
static inline int net_eq(const struct net *net1, const struct net *net2)
{
	if (net1 != net2)
		return 0;

	return 1;
}
186 187 188

extern void net_drop_ns(void *);

189
#else
190

191 192 193 194 195 196 197 198 199
/* !CONFIG_NET_NS stub: no reference is taken, @net is returned as is. */
static inline struct net *get_net(struct net *net)
{
	return net;
}

/* !CONFIG_NET_NS stub: there is no reference to drop, so this does nothing. */
static inline void put_net(struct net *net)
{
}

200 201 202 203 204 205 206 207 208 209
/*
 * !CONFIG_NET_NS stub: unlike the refcounting variant this never turns
 * a non-NULL @net into NULL; @net is returned unchanged.
 */
static inline struct net *maybe_get_net(struct net *net)
{
	return net;
}

/*
 * !CONFIG_NET_NS stub: always returns 1, whatever @net1 and @net2 are.
 * NOTE(review): presumably because init_net is the only namespace in
 * this configuration -- confirm.
 */
static inline
int net_eq(const struct net *net1, const struct net *net2)
{
	return 1;
}
210 211

#define net_drop_ns NULL
212 213 214 215
#endif


#ifdef NETNS_REFCNT_DEBUG
216 217
static inline struct net *hold_net(struct net *net)
{
218 219
	if (net)
		atomic_inc(&net->use_count);
220 221 222 223 224
	return net;
}

static inline void release_net(struct net *net)
{
225 226
	if (net)
		atomic_dec(&net->use_count);
227
}
228 229
#else
/* !NETNS_REFCNT_DEBUG stub: nothing is counted, @net is returned as is. */
static inline struct net *hold_net(struct net *net)
{
	return net;
}
233

234
/* !NETNS_REFCNT_DEBUG stub: nothing was counted, so nothing to undo. */
static inline void release_net(struct net *net)
{
}
237
#endif
238

239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256
#ifdef CONFIG_NET_NS

/* Store @net into the namespace pointer slot that @pnet points to. */
static inline void write_pnet(struct net **pnet, struct net *net)
{
	*pnet = net;
}

/* Return the namespace pointer currently stored in the slot @pnet points to. */
static inline struct net *read_pnet(struct net * const *pnet)
{
	return *pnet;
}

#else

#define write_pnet(pnet, net)	do { (void)(net);} while (0)
#define read_pnet(pnet)		(&init_net)

#endif
257

258 259 260
/*
 * Iterate over net_namespace_list with VAR as the cursor; entries are
 * linked through their 'list' member.
 */
#define for_each_net(VAR)				\
	list_for_each_entry(VAR, &net_namespace_list, list)

261 262 263
/*
 * Same walk as for_each_net(), but built on list_for_each_entry_rcu().
 * NOTE(review): callers presumably need to be inside an RCU read-side
 * critical section -- confirm against the users.
 */
#define for_each_net_rcu(VAR)				\
	list_for_each_entry_rcu(VAR, &net_namespace_list, list)

264 265 266
#ifdef CONFIG_NET_NS
#define __net_init
#define __net_exit
267
#define __net_initdata
268
#define __net_initconst
269 270 271
#else
#define __net_init	__init
#define __net_exit	__exit_refok
272
#define __net_initdata	__initdata
273
#define __net_initconst	__initconst
274
#endif
275 276 277 278 279

/*
 * Set of per network namespace callbacks.  Instances are handed to
 * register_pernet_subsys() / register_pernet_device() and their
 * unregister counterparts.
 */
struct pernet_operations {
	struct list_head list;
	/* Callbacks taking a single namespace. */
	int (*init)(struct net *net);
	void (*exit)(struct net *net);
	/* Callback taking a list head named net_exit_list. */
	void (*exit_batch)(struct list_head *net_exit_list);
	/*
	 * NOTE(review): id/size are presumably used for per-namespace
	 * private data handled by the registration code -- confirm there.
	 */
	int *id;
	size_t size;
};

E
Eric W. Biederman 已提交
285 286 287 288 289
/*
 * Use these carefully.  If you implement a network device and it
 * needs per network namespace operations use device pernet operations,
 * otherwise use pernet subsys operations.
 *
 * Network interfaces need to be removed from a dying netns _before_
 * subsys notifiers can be called, as most of the network code cleanup
 * (which is done from subsys notifiers) runs with the assumption that
 * dev_remove_pack has been called so no new packets will arrive during
 * and after the cleanup functions have been called.  dev_remove_pack
 * is not per namespace so instead the guarantee of no more packets
 * arriving in a network namespace is provided by ensuring that all
 * network devices and all sockets have left the network namespace
 * before the cleanup methods are called.
 *
 * For the longest time the ipv4 icmp code was registered as a pernet
 * device, which caused kernel oopses and panics during network
 * namespace cleanup.  So please don't get this wrong.
 */
304 305 306 307
extern int register_pernet_subsys(struct pernet_operations *);
extern void unregister_pernet_subsys(struct pernet_operations *);
extern int register_pernet_device(struct pernet_operations *);
extern void unregister_pernet_device(struct pernet_operations *);
308

309 310
struct ctl_table;
struct ctl_table_header;
311

312 313
#ifdef CONFIG_SYSCTL
extern int net_sysctl_init(void);
314 315
extern struct ctl_table_header *register_net_sysctl(struct net *net,
	const char *path, struct ctl_table *table);
316
extern void unregister_net_sysctl_table(struct ctl_table_header *header);
317 318 319 320 321 322 323 324 325 326 327 328
#else
/* !CONFIG_SYSCTL stub: nothing to set up, always returns 0. */
static inline int net_sysctl_init(void) { return 0; }
/*
 * !CONFIG_SYSCTL stub: registers nothing and always returns NULL,
 * ignoring @net, @path and @table.
 */
static inline struct ctl_table_header *register_net_sysctl(struct net *net,
	const char *path, struct ctl_table *table)
{
	return NULL;
}
/* !CONFIG_SYSCTL stub: nothing was registered, so this does nothing. */
static inline void unregister_net_sysctl_table(struct ctl_table_header *header)
{
}
#endif

329 330 331 332 333 334 335 336 337
/* Return the current value of the namespace's rt_genid counter. */
static inline int rt_genid(struct net *net)
{
	return atomic_read(&net->rt_genid);
}

/* Atomically increment the namespace's rt_genid counter. */
static inline void rt_genid_bump(struct net *net)
{
	atomic_inc(&net->rt_genid);
}
338

339
#endif /* __NET_NET_NAMESPACE_H */