blob: 3346829ea07f09e28107c4b227d8b5d5763be30b [file] [log] [blame]
/* netfilter.c: look after the filters for various protocols.
 * Heavily influenced by the old firewall.c by David Bonn and Alan Cox.
 *
 * Thanks to Rob `CmdrTaco' Malda for not influencing this code in any
 * way.
 *
 * Rusty Russell (C)2000 -- This code is GPL.
 */
Harald Weltef6ebe772005-08-09 20:21:49 -07009#include <linux/kernel.h>
10#include <linux/netfilter.h>
11#include <net/protocol.h>
12#include <linux/init.h>
13#include <linux/skbuff.h>
14#include <linux/wait.h>
15#include <linux/module.h>
16#include <linux/interrupt.h>
17#include <linux/if.h>
18#include <linux/netdevice.h>
19#include <linux/inetdevice.h>
20#include <linux/proc_fs.h>
Patrick McHardyd486dd12007-02-12 11:09:55 -080021#include <linux/mutex.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090022#include <linux/slab.h>
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020023#include <net/net_namespace.h>
Harald Weltef6ebe772005-08-09 20:21:49 -070024#include <net/sock.h>
25
26#include "nf_internals.h"
27
Patrick McHardyd486dd12007-02-12 11:09:55 -080028static DEFINE_MUTEX(afinfo_mutex);
Patrick McHardybce80322006-04-06 14:18:09 -070029
Arnd Bergmann0906a372010-03-09 20:59:15 +010030const struct nf_afinfo __rcu *nf_afinfo[NFPROTO_NUMPROTO] __read_mostly;
Patrick McHardybce80322006-04-06 14:18:09 -070031EXPORT_SYMBOL(nf_afinfo);
32
Patrick McHardy1e796fd2007-12-17 22:42:27 -080033int nf_register_afinfo(const struct nf_afinfo *afinfo)
Patrick McHardybce80322006-04-06 14:18:09 -070034{
Patrick McHardyd486dd12007-02-12 11:09:55 -080035 int err;
36
37 err = mutex_lock_interruptible(&afinfo_mutex);
38 if (err < 0)
39 return err;
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +000040 RCU_INIT_POINTER(nf_afinfo[afinfo->family], afinfo);
Patrick McHardyd486dd12007-02-12 11:09:55 -080041 mutex_unlock(&afinfo_mutex);
Patrick McHardybce80322006-04-06 14:18:09 -070042 return 0;
43}
44EXPORT_SYMBOL_GPL(nf_register_afinfo);
45
Patrick McHardy1e796fd2007-12-17 22:42:27 -080046void nf_unregister_afinfo(const struct nf_afinfo *afinfo)
Patrick McHardybce80322006-04-06 14:18:09 -070047{
Patrick McHardyd486dd12007-02-12 11:09:55 -080048 mutex_lock(&afinfo_mutex);
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +000049 RCU_INIT_POINTER(nf_afinfo[afinfo->family], NULL);
Patrick McHardyd486dd12007-02-12 11:09:55 -080050 mutex_unlock(&afinfo_mutex);
Patrick McHardybce80322006-04-06 14:18:09 -070051 synchronize_rcu();
52}
53EXPORT_SYMBOL_GPL(nf_unregister_afinfo);
54
Jan Engelhardt7e9c6ee2008-10-08 11:35:00 +020055struct list_head nf_hooks[NFPROTO_NUMPROTO][NF_MAX_HOOKS] __read_mostly;
Harald Weltef6ebe772005-08-09 20:21:49 -070056EXPORT_SYMBOL(nf_hooks);
Patrick McHardyfd706d62007-02-12 11:10:14 -080057static DEFINE_MUTEX(nf_hook_mutex);
Harald Weltef6ebe772005-08-09 20:21:49 -070058
59int nf_register_hook(struct nf_hook_ops *reg)
60{
Li Zefan4c610972007-12-04 23:22:26 -080061 struct nf_hook_ops *elem;
Patrick McHardyfd706d62007-02-12 11:10:14 -080062 int err;
Harald Weltef6ebe772005-08-09 20:21:49 -070063
Patrick McHardyfd706d62007-02-12 11:10:14 -080064 err = mutex_lock_interruptible(&nf_hook_mutex);
65 if (err < 0)
66 return err;
Li Zefan4c610972007-12-04 23:22:26 -080067 list_for_each_entry(elem, &nf_hooks[reg->pf][reg->hooknum], list) {
68 if (reg->priority < elem->priority)
Harald Weltef6ebe772005-08-09 20:21:49 -070069 break;
70 }
Li Zefan4c610972007-12-04 23:22:26 -080071 list_add_rcu(&reg->list, elem->list.prev);
Patrick McHardyfd706d62007-02-12 11:10:14 -080072 mutex_unlock(&nf_hook_mutex);
Harald Weltef6ebe772005-08-09 20:21:49 -070073 return 0;
74}
75EXPORT_SYMBOL(nf_register_hook);
76
77void nf_unregister_hook(struct nf_hook_ops *reg)
78{
Patrick McHardyfd706d62007-02-12 11:10:14 -080079 mutex_lock(&nf_hook_mutex);
Harald Weltef6ebe772005-08-09 20:21:49 -070080 list_del_rcu(&reg->list);
Patrick McHardyfd706d62007-02-12 11:10:14 -080081 mutex_unlock(&nf_hook_mutex);
Harald Weltef6ebe772005-08-09 20:21:49 -070082
83 synchronize_net();
84}
85EXPORT_SYMBOL(nf_unregister_hook);
86
Patrick McHardy972d1cb2006-04-06 14:09:12 -070087int nf_register_hooks(struct nf_hook_ops *reg, unsigned int n)
88{
89 unsigned int i;
90 int err = 0;
91
92 for (i = 0; i < n; i++) {
93 err = nf_register_hook(&reg[i]);
94 if (err)
95 goto err;
96 }
97 return err;
98
99err:
100 if (i > 0)
101 nf_unregister_hooks(reg, i);
102 return err;
103}
104EXPORT_SYMBOL(nf_register_hooks);
105
106void nf_unregister_hooks(struct nf_hook_ops *reg, unsigned int n)
107{
Changli Gaof68c5302010-10-04 22:24:12 +0200108 while (n-- > 0)
109 nf_unregister_hook(&reg[n]);
Patrick McHardy972d1cb2006-04-06 14:09:12 -0700110}
111EXPORT_SYMBOL(nf_unregister_hooks);
112
Harald Weltef6ebe772005-08-09 20:21:49 -0700113unsigned int nf_iterate(struct list_head *head,
Herbert Xu3db05fe2007-10-15 00:53:15 -0700114 struct sk_buff *skb,
Jan Engelhardt76108ce2008-10-08 11:35:00 +0200115 unsigned int hook,
Harald Weltef6ebe772005-08-09 20:21:49 -0700116 const struct net_device *indev,
117 const struct net_device *outdev,
118 struct list_head **i,
119 int (*okfn)(struct sk_buff *),
120 int hook_thresh)
121{
122 unsigned int verdict;
123
124 /*
125 * The caller must not block between calls to this
126 * function because of risk of continuing from deleted element.
127 */
128 list_for_each_continue_rcu(*i, head) {
129 struct nf_hook_ops *elem = (struct nf_hook_ops *)*i;
130
131 if (hook_thresh > elem->priority)
132 continue;
133
134 /* Optimization: we don't need to hold module
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800135 reference here, since function can't sleep. --RR */
Patrick McHardyde9963f2011-02-14 17:35:07 +0100136repeat:
Harald Weltef6ebe772005-08-09 20:21:49 -0700137 verdict = elem->hook(hook, skb, indev, outdev, okfn);
138 if (verdict != NF_ACCEPT) {
139#ifdef CONFIG_NETFILTER_DEBUG
140 if (unlikely((verdict & NF_VERDICT_MASK)
141 > NF_MAX_VERDICT)) {
142 NFDEBUG("Evil return from %p(%u).\n",
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800143 elem->hook, hook);
Harald Weltef6ebe772005-08-09 20:21:49 -0700144 continue;
145 }
146#endif
147 if (verdict != NF_REPEAT)
148 return verdict;
Patrick McHardyde9963f2011-02-14 17:35:07 +0100149 goto repeat;
Harald Weltef6ebe772005-08-09 20:21:49 -0700150 }
151 }
152 return NF_ACCEPT;
153}
154
155
156/* Returns 1 if okfn() needs to be executed by the caller,
157 * -EPERM for NF_DROP, 0 otherwise. */
Jan Engelhardt76108ce2008-10-08 11:35:00 +0200158int nf_hook_slow(u_int8_t pf, unsigned int hook, struct sk_buff *skb,
Harald Weltef6ebe772005-08-09 20:21:49 -0700159 struct net_device *indev,
160 struct net_device *outdev,
161 int (*okfn)(struct sk_buff *),
162 int hook_thresh)
163{
164 struct list_head *elem;
165 unsigned int verdict;
166 int ret = 0;
167
168 /* We may already have this, but read-locks nest anyway */
169 rcu_read_lock();
170
171 elem = &nf_hooks[pf][hook];
172next_hook:
Herbert Xu3db05fe2007-10-15 00:53:15 -0700173 verdict = nf_iterate(&nf_hooks[pf][hook], skb, hook, indev,
Harald Weltef6ebe772005-08-09 20:21:49 -0700174 outdev, &elem, okfn, hook_thresh);
175 if (verdict == NF_ACCEPT || verdict == NF_STOP) {
176 ret = 1;
Eric Parisda683652010-11-16 11:52:38 +0000177 } else if ((verdict & NF_VERDICT_MASK) == NF_DROP) {
Herbert Xu3db05fe2007-10-15 00:53:15 -0700178 kfree_skb(skb);
Florian Westphalf615df72011-01-18 15:52:14 +0100179 ret = NF_DROP_GETERR(verdict);
Eric Parisda683652010-11-16 11:52:38 +0000180 if (ret == 0)
181 ret = -EPERM;
Patrick McHardyf9c63992007-12-05 01:27:46 -0800182 } else if ((verdict & NF_VERDICT_MASK) == NF_QUEUE) {
Florian Westphalf1585082011-01-18 15:27:28 +0100183 ret = nf_queue(skb, elem, pf, hook, indev, outdev, okfn,
Florian Westphalf615df72011-01-18 15:52:14 +0100184 verdict >> NF_VERDICT_QBITS);
Florian Westphal06cdb632011-01-18 15:28:38 +0100185 if (ret < 0) {
186 if (ret == -ECANCELED)
187 goto next_hook;
Florian Westphal94b27cc2011-01-18 16:08:30 +0100188 if (ret == -ESRCH &&
189 (verdict & NF_VERDICT_FLAG_QUEUE_BYPASS))
190 goto next_hook;
Florian Westphal06cdb632011-01-18 15:28:38 +0100191 kfree_skb(skb);
192 }
Florian Westphalf1585082011-01-18 15:27:28 +0100193 ret = 0;
Harald Weltef6ebe772005-08-09 20:21:49 -0700194 }
Harald Weltef6ebe772005-08-09 20:21:49 -0700195 rcu_read_unlock();
196 return ret;
197}
198EXPORT_SYMBOL(nf_hook_slow);
199
200
Herbert Xu37d41872007-10-14 00:39:18 -0700201int skb_make_writable(struct sk_buff *skb, unsigned int writable_len)
Harald Weltef6ebe772005-08-09 20:21:49 -0700202{
Herbert Xu37d41872007-10-14 00:39:18 -0700203 if (writable_len > skb->len)
Harald Weltef6ebe772005-08-09 20:21:49 -0700204 return 0;
205
206 /* Not exclusive use of packet? Must copy. */
Herbert Xu37d41872007-10-14 00:39:18 -0700207 if (!skb_cloned(skb)) {
208 if (writable_len <= skb_headlen(skb))
209 return 1;
210 } else if (skb_clone_writable(skb, writable_len))
211 return 1;
Harald Weltef6ebe772005-08-09 20:21:49 -0700212
Herbert Xu37d41872007-10-14 00:39:18 -0700213 if (writable_len <= skb_headlen(skb))
214 writable_len = 0;
215 else
216 writable_len -= skb_headlen(skb);
Harald Weltef6ebe772005-08-09 20:21:49 -0700217
Herbert Xu37d41872007-10-14 00:39:18 -0700218 return !!__pskb_pull_tail(skb, writable_len);
Harald Weltef6ebe772005-08-09 20:21:49 -0700219}
220EXPORT_SYMBOL(skb_make_writable);
221
Yasuyuki Kozakai5f79e0f2007-03-23 11:17:07 -0700222#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
Harald Weltef6ebe772005-08-09 20:21:49 -0700223/* This does not belong here, but locally generated errors need it if connection
224 tracking in use: without this, connection may not be in hash table, and hence
225 manufactured ICMP or RST packets will not be associated with it. */
Eric Dumazet0e60ebe2010-11-15 18:17:21 +0100226void (*ip_ct_attach)(struct sk_buff *, struct sk_buff *) __rcu __read_mostly;
Harald Weltef6ebe772005-08-09 20:21:49 -0700227EXPORT_SYMBOL(ip_ct_attach);
228
229void nf_ct_attach(struct sk_buff *new, struct sk_buff *skb)
230{
231 void (*attach)(struct sk_buff *, struct sk_buff *);
232
Patrick McHardyc3a47ab2007-02-12 11:09:19 -0800233 if (skb->nfct) {
234 rcu_read_lock();
235 attach = rcu_dereference(ip_ct_attach);
236 if (attach)
237 attach(new, skb);
238 rcu_read_unlock();
Harald Weltef6ebe772005-08-09 20:21:49 -0700239 }
240}
241EXPORT_SYMBOL(nf_ct_attach);
Yasuyuki Kozakaide6e05c2007-03-23 11:17:27 -0700242
Eric Dumazet0e60ebe2010-11-15 18:17:21 +0100243void (*nf_ct_destroy)(struct nf_conntrack *) __rcu __read_mostly;
Yasuyuki Kozakaide6e05c2007-03-23 11:17:27 -0700244EXPORT_SYMBOL(nf_ct_destroy);
245
246void nf_conntrack_destroy(struct nf_conntrack *nfct)
247{
248 void (*destroy)(struct nf_conntrack *);
249
250 rcu_read_lock();
251 destroy = rcu_dereference(nf_ct_destroy);
252 BUG_ON(destroy == NULL);
253 destroy(nfct);
254 rcu_read_unlock();
255}
256EXPORT_SYMBOL(nf_conntrack_destroy);
257#endif /* CONFIG_NF_CONNTRACK */
Harald Weltef6ebe772005-08-09 20:21:49 -0700258
259#ifdef CONFIG_PROC_FS
260struct proc_dir_entry *proc_net_netfilter;
261EXPORT_SYMBOL(proc_net_netfilter);
262#endif
263
264void __init netfilter_init(void)
265{
266 int i, h;
Jan Engelhardt7e9c6ee2008-10-08 11:35:00 +0200267 for (i = 0; i < ARRAY_SIZE(nf_hooks); i++) {
Harald Weltef6ebe772005-08-09 20:21:49 -0700268 for (h = 0; h < NF_MAX_HOOKS; h++)
269 INIT_LIST_HEAD(&nf_hooks[i][h]);
270 }
271
272#ifdef CONFIG_PROC_FS
Eric W. Biederman457c4cb2007-09-12 12:01:34 +0200273 proc_net_netfilter = proc_mkdir("netfilter", init_net.proc_net);
Harald Weltef6ebe772005-08-09 20:21:49 -0700274 if (!proc_net_netfilter)
275 panic("cannot create netfilter proc entry");
276#endif
277
278 if (netfilter_queue_init() < 0)
279 panic("cannot initialize nf_queue");
280 if (netfilter_log_init() < 0)
281 panic("cannot initialize nf_log");
282}
Patrick McHardy4f536522008-01-14 23:48:39 -0800283
#ifdef CONFIG_SYSCTL
/* sysctl path components "net" / "netfilter", ended by an empty entry. */
struct ctl_path nf_net_netfilter_sysctl_path[] = {
	{ .procname = "net" },
	{ .procname = "netfilter" },
	{ }
};
EXPORT_SYMBOL_GPL(nf_net_netfilter_sysctl_path);
#endif /* CONFIG_SYSCTL */