blob: 3f6d37deac4505f6bf75d4a43749fc08b3013091 [file] [log] [blame]
Eric W. Biederman5f256be2007-09-12 11:50:50 +02001#include <linux/workqueue.h>
2#include <linux/rtnetlink.h>
3#include <linux/cache.h>
4#include <linux/slab.h>
5#include <linux/list.h>
6#include <linux/delay.h>
Eric W. Biederman9dd776b2007-09-26 22:04:26 -07007#include <linux/sched.h>
Eric W. Biederman5f256be2007-09-12 11:50:50 +02008#include <net/net_namespace.h>
9
10/*
11 * Our network namespace constructor/destructor lists
12 */
13
14static LIST_HEAD(pernet_list);
15static struct list_head *first_device = &pernet_list;
16static DEFINE_MUTEX(net_mutex);
17
Eric W. Biederman5f256be2007-09-12 11:50:50 +020018LIST_HEAD(net_namespace_list);
19
Eric W. Biederman5f256be2007-09-12 11:50:50 +020020struct net init_net;
21EXPORT_SYMBOL_GPL(init_net);
22
Pavel Emelyanov6a1a3b92007-11-01 00:44:50 -070023/*
24 * setup_net runs the initializers for the network namespace object.
25 */
Pavel Emelyanov1a2ee932007-11-01 00:45:59 -070026static __net_init int setup_net(struct net *net)
Pavel Emelyanov6a1a3b92007-11-01 00:44:50 -070027{
28 /* Must be called with net_mutex held */
29 struct pernet_operations *ops;
30 int error;
31
32 atomic_set(&net->count, 1);
33 atomic_set(&net->use_count, 0);
34
35 error = 0;
36 list_for_each_entry(ops, &pernet_list, list) {
37 if (ops->init) {
38 error = ops->init(net);
39 if (error < 0)
40 goto out_undo;
41 }
42 }
43out:
44 return error;
45
46out_undo:
47 /* Walk through the list backwards calling the exit functions
48 * for the pernet modules whose init functions did not fail.
49 */
50 list_for_each_entry_continue_reverse(ops, &pernet_list, list) {
51 if (ops->exit)
52 ops->exit(net);
53 }
54
55 rcu_barrier();
56 goto out;
57}
58
59#ifdef CONFIG_NET_NS
Pavel Emelyanovd57a9212007-11-01 00:46:50 -070060static struct kmem_cache *net_cachep;
61
Eric W. Biederman5f256be2007-09-12 11:50:50 +020062static struct net *net_alloc(void)
63{
Pavel Emelyanov32f0c4c2007-10-09 13:02:17 -070064 return kmem_cache_zalloc(net_cachep, GFP_KERNEL);
Eric W. Biederman5f256be2007-09-12 11:50:50 +020065}
Eric W. Biederman5f256be2007-09-12 11:50:50 +020066
Johann Felix Soden45a19b02007-11-07 01:30:30 -080067static void net_free(struct net *net)
68{
69 if (!net)
70 return;
71
72 if (unlikely(atomic_read(&net->use_count) != 0)) {
73 printk(KERN_EMERG "network namespace not free! Usage: %d\n",
74 atomic_read(&net->use_count));
75 return;
76 }
77
78 kmem_cache_free(net_cachep, net);
79}
80
Pavel Emelyanov6a1a3b92007-11-01 00:44:50 -070081struct net *copy_net_ns(unsigned long flags, struct net *old_net)
82{
83 struct net *new_net = NULL;
84 int err;
85
86 get_net(old_net);
87
88 if (!(flags & CLONE_NEWNET))
89 return old_net;
90
91 err = -ENOMEM;
92 new_net = net_alloc();
93 if (!new_net)
94 goto out;
95
96 mutex_lock(&net_mutex);
97 err = setup_net(new_net);
98 if (err)
99 goto out_unlock;
100
101 rtnl_lock();
102 list_add_tail(&new_net->list, &net_namespace_list);
103 rtnl_unlock();
104
105
106out_unlock:
107 mutex_unlock(&net_mutex);
108out:
109 put_net(old_net);
110 if (err) {
111 net_free(new_net);
112 new_net = ERR_PTR(err);
113 }
114 return new_net;
115}
116
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200117static void cleanup_net(struct work_struct *work)
118{
119 struct pernet_operations *ops;
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200120 struct net *net;
121
122 net = container_of(work, struct net, work);
123
124 mutex_lock(&net_mutex);
125
126 /* Don't let anyone else find us. */
Eric W. Biedermanf4618d32007-09-26 22:40:08 -0700127 rtnl_lock();
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200128 list_del(&net->list);
Eric W. Biedermanf4618d32007-09-26 22:40:08 -0700129 rtnl_unlock();
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200130
131 /* Run all of the network namespace exit methods */
Pavel Emelyanov768f35912007-09-18 13:20:41 -0700132 list_for_each_entry_reverse(ops, &pernet_list, list) {
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200133 if (ops->exit)
134 ops->exit(net);
135 }
136
137 mutex_unlock(&net_mutex);
138
139 /* Ensure there are no outstanding rcu callbacks using this
140 * network namespace.
141 */
142 rcu_barrier();
143
144 /* Finally it is safe to free my network namespace structure */
145 net_free(net);
146}
147
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200148void __put_net(struct net *net)
149{
150 /* Cleanup the network namespace in process context */
151 INIT_WORK(&net->work, cleanup_net);
152 schedule_work(&net->work);
153}
154EXPORT_SYMBOL_GPL(__put_net);
155
Pavel Emelyanov6a1a3b92007-11-01 00:44:50 -0700156#else
Eric W. Biederman9dd776b2007-09-26 22:04:26 -0700157struct net *copy_net_ns(unsigned long flags, struct net *old_net)
158{
Pavel Emelyanov6a1a3b92007-11-01 00:44:50 -0700159 if (flags & CLONE_NEWNET)
160 return ERR_PTR(-EINVAL);
161 return old_net;
Eric W. Biederman9dd776b2007-09-26 22:04:26 -0700162}
Pavel Emelyanov6a1a3b92007-11-01 00:44:50 -0700163#endif
Eric W. Biederman9dd776b2007-09-26 22:04:26 -0700164
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200165static int __init net_ns_init(void)
166{
167 int err;
168
169 printk(KERN_INFO "net_namespace: %zd bytes\n", sizeof(struct net));
Pavel Emelyanovd57a9212007-11-01 00:46:50 -0700170#ifdef CONFIG_NET_NS
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200171 net_cachep = kmem_cache_create("net_namespace", sizeof(struct net),
172 SMP_CACHE_BYTES,
173 SLAB_PANIC, NULL);
Pavel Emelyanovd57a9212007-11-01 00:46:50 -0700174#endif
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200175 mutex_lock(&net_mutex);
176 err = setup_net(&init_net);
177
Eric W. Biedermanf4618d32007-09-26 22:40:08 -0700178 rtnl_lock();
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200179 list_add_tail(&init_net.list, &net_namespace_list);
Eric W. Biedermanf4618d32007-09-26 22:40:08 -0700180 rtnl_unlock();
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200181
182 mutex_unlock(&net_mutex);
183 if (err)
184 panic("Could not setup the initial network namespace");
185
186 return 0;
187}
188
189pure_initcall(net_ns_init);
190
191static int register_pernet_operations(struct list_head *list,
192 struct pernet_operations *ops)
193{
194 struct net *net, *undo_net;
195 int error;
196
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200197 list_add_tail(&ops->list, list);
Pavel Emelyanov1dba3232007-11-01 00:42:43 -0700198 if (ops->init) {
199 for_each_net(net) {
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200200 error = ops->init(net);
201 if (error)
202 goto out_undo;
203 }
204 }
Pavel Emelyanov1dba3232007-11-01 00:42:43 -0700205 return 0;
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200206
207out_undo:
208 /* If I have an error cleanup all namespaces I initialized */
209 list_del(&ops->list);
Pavel Emelyanov1dba3232007-11-01 00:42:43 -0700210 if (ops->exit) {
211 for_each_net(undo_net) {
212 if (undo_net == net)
213 goto undone;
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200214 ops->exit(undo_net);
Pavel Emelyanov1dba3232007-11-01 00:42:43 -0700215 }
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200216 }
217undone:
Pavel Emelyanov1dba3232007-11-01 00:42:43 -0700218 return error;
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200219}
220
221static void unregister_pernet_operations(struct pernet_operations *ops)
222{
223 struct net *net;
224
225 list_del(&ops->list);
Pavel Emelyanov1dba3232007-11-01 00:42:43 -0700226 if (ops->exit)
227 for_each_net(net)
Eric W. Biederman5f256be2007-09-12 11:50:50 +0200228 ops->exit(net);
229}
230
231/**
232 * register_pernet_subsys - register a network namespace subsystem
233 * @ops: pernet operations structure for the subsystem
234 *
235 * Register a subsystem which has init and exit functions
236 * that are called when network namespaces are created and
237 * destroyed respectively.
238 *
239 * When registered all network namespace init functions are
240 * called for every existing network namespace. Allowing kernel
241 * modules to have a race free view of the set of network namespaces.
242 *
243 * When a new network namespace is created all of the init
244 * methods are called in the order in which they were registered.
245 *
246 * When a network namespace is destroyed all of the exit methods
247 * are called in the reverse of the order with which they were
248 * registered.
249 */
250int register_pernet_subsys(struct pernet_operations *ops)
251{
252 int error;
253 mutex_lock(&net_mutex);
254 error = register_pernet_operations(first_device, ops);
255 mutex_unlock(&net_mutex);
256 return error;
257}
258EXPORT_SYMBOL_GPL(register_pernet_subsys);
259
260/**
261 * unregister_pernet_subsys - unregister a network namespace subsystem
262 * @ops: pernet operations structure to manipulate
263 *
264 * Remove the pernet operations structure from the list to be
265 * used when network namespaces are created or destoryed. In
266 * addition run the exit method for all existing network
267 * namespaces.
268 */
269void unregister_pernet_subsys(struct pernet_operations *module)
270{
271 mutex_lock(&net_mutex);
272 unregister_pernet_operations(module);
273 mutex_unlock(&net_mutex);
274}
275EXPORT_SYMBOL_GPL(unregister_pernet_subsys);
276
277/**
278 * register_pernet_device - register a network namespace device
279 * @ops: pernet operations structure for the subsystem
280 *
281 * Register a device which has init and exit functions
282 * that are called when network namespaces are created and
283 * destroyed respectively.
284 *
285 * When registered all network namespace init functions are
286 * called for every existing network namespace. Allowing kernel
287 * modules to have a race free view of the set of network namespaces.
288 *
289 * When a new network namespace is created all of the init
290 * methods are called in the order in which they were registered.
291 *
292 * When a network namespace is destroyed all of the exit methods
293 * are called in the reverse of the order with which they were
294 * registered.
295 */
296int register_pernet_device(struct pernet_operations *ops)
297{
298 int error;
299 mutex_lock(&net_mutex);
300 error = register_pernet_operations(&pernet_list, ops);
301 if (!error && (first_device == &pernet_list))
302 first_device = &ops->list;
303 mutex_unlock(&net_mutex);
304 return error;
305}
306EXPORT_SYMBOL_GPL(register_pernet_device);
307
308/**
309 * unregister_pernet_device - unregister a network namespace netdevice
310 * @ops: pernet operations structure to manipulate
311 *
312 * Remove the pernet operations structure from the list to be
313 * used when network namespaces are created or destoryed. In
314 * addition run the exit method for all existing network
315 * namespaces.
316 */
317void unregister_pernet_device(struct pernet_operations *ops)
318{
319 mutex_lock(&net_mutex);
320 if (&ops->list == first_device)
321 first_device = first_device->next;
322 unregister_pernet_operations(ops);
323 mutex_unlock(&net_mutex);
324}
325EXPORT_SYMBOL_GPL(unregister_pernet_device);