/*
 * Packet matching code.
 *
 * Copyright (C) 1999 Paul `Rusty' Russell & Michael J. Neuling
 * Copyright (C) 2000-2005 Netfilter Core Team <coreteam@netfilter.org>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 * 19 Jan 2002 Harald Welte <laforge@gnumonks.org>
 * 	- increase module usage count as soon as we have rules inside
 * 	  a table
 * 08 Oct 2005 Harald Welte <laforge@netfilter.org>
 * 	- Generalize into "x_tables" layer and "{ip,ip6,arp}_tables"
 */
17#include <linux/config.h>
18#include <linux/cache.h>
Randy Dunlap4fc268d2006-01-11 12:17:47 -080019#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/skbuff.h>
21#include <linux/kmod.h>
22#include <linux/vmalloc.h>
23#include <linux/netdevice.h>
24#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/icmp.h>
26#include <net/ip.h>
27#include <asm/uaccess.h>
Ingo Molnar57b47a52006-03-20 22:35:41 -080028#include <linux/mutex.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070029#include <linux/proc_fs.h>
30#include <linux/err.h>
David S. Millerc8923c62005-10-13 14:41:23 -070031#include <linux/cpumask.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032
Harald Welte2e4e6a12006-01-12 13:30:04 -080033#include <linux/netfilter/x_tables.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070034#include <linux/netfilter_ipv4/ip_tables.h>
35
36MODULE_LICENSE("GPL");
37MODULE_AUTHOR("Netfilter Core Team <coreteam@netfilter.org>");
38MODULE_DESCRIPTION("IPv4 packet filter");
39
40/*#define DEBUG_IP_FIREWALL*/
41/*#define DEBUG_ALLOW_ALL*/ /* Useful for remote debugging */
42/*#define DEBUG_IP_FIREWALL_USER*/
43
44#ifdef DEBUG_IP_FIREWALL
45#define dprintf(format, args...) printk(format , ## args)
46#else
47#define dprintf(format, args...)
48#endif
49
50#ifdef DEBUG_IP_FIREWALL_USER
51#define duprintf(format, args...) printk(format , ## args)
52#else
53#define duprintf(format, args...)
54#endif
55
56#ifdef CONFIG_NETFILTER_DEBUG
57#define IP_NF_ASSERT(x) \
58do { \
59 if (!(x)) \
60 printk("IP_NF_ASSERT: %s:%s:%u\n", \
61 __FUNCTION__, __FILE__, __LINE__); \
62} while(0)
63#else
64#define IP_NF_ASSERT(x)
65#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
67#if 0
68/* All the better to debug you with... */
69#define static
70#define inline
71#endif
72
/*
   We keep a set of rules for each CPU, so we can avoid write-locking
   them in the softirq when updating the counters and therefore
   only need to read-lock in the softirq; doing a write_lock_bh() in user
   context stops packets coming through and allows user context to read
   the counters or update the rules.

   Hence the start of any table is given by get_table() below.  */
81
Linus Torvalds1da177e2005-04-16 15:20:36 -070082/* Returns whether matches rule or not. */
83static inline int
84ip_packet_match(const struct iphdr *ip,
85 const char *indev,
86 const char *outdev,
87 const struct ipt_ip *ipinfo,
88 int isfrag)
89{
90 size_t i;
91 unsigned long ret;
92
93#define FWINV(bool,invflg) ((bool) ^ !!(ipinfo->invflags & invflg))
94
95 if (FWINV((ip->saddr&ipinfo->smsk.s_addr) != ipinfo->src.s_addr,
96 IPT_INV_SRCIP)
97 || FWINV((ip->daddr&ipinfo->dmsk.s_addr) != ipinfo->dst.s_addr,
98 IPT_INV_DSTIP)) {
99 dprintf("Source or dest mismatch.\n");
100
101 dprintf("SRC: %u.%u.%u.%u. Mask: %u.%u.%u.%u. Target: %u.%u.%u.%u.%s\n",
102 NIPQUAD(ip->saddr),
103 NIPQUAD(ipinfo->smsk.s_addr),
104 NIPQUAD(ipinfo->src.s_addr),
105 ipinfo->invflags & IPT_INV_SRCIP ? " (INV)" : "");
106 dprintf("DST: %u.%u.%u.%u Mask: %u.%u.%u.%u Target: %u.%u.%u.%u.%s\n",
107 NIPQUAD(ip->daddr),
108 NIPQUAD(ipinfo->dmsk.s_addr),
109 NIPQUAD(ipinfo->dst.s_addr),
110 ipinfo->invflags & IPT_INV_DSTIP ? " (INV)" : "");
111 return 0;
112 }
113
114 /* Look for ifname matches; this should unroll nicely. */
115 for (i = 0, ret = 0; i < IFNAMSIZ/sizeof(unsigned long); i++) {
116 ret |= (((const unsigned long *)indev)[i]
117 ^ ((const unsigned long *)ipinfo->iniface)[i])
118 & ((const unsigned long *)ipinfo->iniface_mask)[i];
119 }
120
121 if (FWINV(ret != 0, IPT_INV_VIA_IN)) {
122 dprintf("VIA in mismatch (%s vs %s).%s\n",
123 indev, ipinfo->iniface,
124 ipinfo->invflags&IPT_INV_VIA_IN ?" (INV)":"");
125 return 0;
126 }
127
128 for (i = 0, ret = 0; i < IFNAMSIZ/sizeof(unsigned long); i++) {
129 ret |= (((const unsigned long *)outdev)[i]
130 ^ ((const unsigned long *)ipinfo->outiface)[i])
131 & ((const unsigned long *)ipinfo->outiface_mask)[i];
132 }
133
134 if (FWINV(ret != 0, IPT_INV_VIA_OUT)) {
135 dprintf("VIA out mismatch (%s vs %s).%s\n",
136 outdev, ipinfo->outiface,
137 ipinfo->invflags&IPT_INV_VIA_OUT ?" (INV)":"");
138 return 0;
139 }
140
141 /* Check specific protocol */
142 if (ipinfo->proto
143 && FWINV(ip->protocol != ipinfo->proto, IPT_INV_PROTO)) {
144 dprintf("Packet protocol %hi does not match %hi.%s\n",
145 ip->protocol, ipinfo->proto,
146 ipinfo->invflags&IPT_INV_PROTO ? " (INV)":"");
147 return 0;
148 }
149
150 /* If we have a fragment rule but the packet is not a fragment
151 * then we return zero */
152 if (FWINV((ipinfo->flags&IPT_F_FRAG) && !isfrag, IPT_INV_FRAG)) {
153 dprintf("Fragment rule but not fragment.%s\n",
154 ipinfo->invflags & IPT_INV_FRAG ? " (INV)" : "");
155 return 0;
156 }
157
158 return 1;
159}
160
161static inline int
162ip_checkentry(const struct ipt_ip *ip)
163{
164 if (ip->flags & ~IPT_F_MASK) {
165 duprintf("Unknown flag bits set: %08X\n",
166 ip->flags & ~IPT_F_MASK);
167 return 0;
168 }
169 if (ip->invflags & ~IPT_INV_MASK) {
170 duprintf("Unknown invflag bits set: %08X\n",
171 ip->invflags & ~IPT_INV_MASK);
172 return 0;
173 }
174 return 1;
175}
176
177static unsigned int
178ipt_error(struct sk_buff **pskb,
179 const struct net_device *in,
180 const struct net_device *out,
181 unsigned int hooknum,
Patrick McHardyc4986732006-03-20 18:02:56 -0800182 const struct xt_target *target,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183 const void *targinfo,
184 void *userinfo)
185{
186 if (net_ratelimit())
187 printk("ip_tables: error: `%s'\n", (char *)targinfo);
188
189 return NF_DROP;
190}
191
192static inline
193int do_match(struct ipt_entry_match *m,
194 const struct sk_buff *skb,
195 const struct net_device *in,
196 const struct net_device *out,
197 int offset,
198 int *hotdrop)
199{
200 /* Stop iteration if it doesn't match */
Patrick McHardy1c524832006-03-20 18:02:15 -0800201 if (!m->u.kernel.match->match(skb, in, out, m->u.kernel.match, m->data,
202 offset, skb->nh.iph->ihl*4, hotdrop))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 return 1;
204 else
205 return 0;
206}
207
/* Return the rule entry located `offset' bytes past `base'. */
static inline struct ipt_entry *
get_entry(void *base, unsigned int offset)
{
	char *addr = (char *)base + offset;

	return (struct ipt_entry *)addr;
}
213
214/* Returns one of the generic firewall policies, like NF_ACCEPT. */
215unsigned int
216ipt_do_table(struct sk_buff **pskb,
217 unsigned int hook,
218 const struct net_device *in,
219 const struct net_device *out,
220 struct ipt_table *table,
221 void *userdata)
222{
223 static const char nulldevname[IFNAMSIZ] __attribute__((aligned(sizeof(long))));
224 u_int16_t offset;
225 struct iphdr *ip;
226 u_int16_t datalen;
227 int hotdrop = 0;
228 /* Initializing verdict to NF_DROP keeps gcc happy. */
229 unsigned int verdict = NF_DROP;
230 const char *indev, *outdev;
231 void *table_base;
232 struct ipt_entry *e, *back;
Harald Welte2e4e6a12006-01-12 13:30:04 -0800233 struct xt_table_info *private = table->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234
235 /* Initialization */
236 ip = (*pskb)->nh.iph;
237 datalen = (*pskb)->len - ip->ihl * 4;
238 indev = in ? in->name : nulldevname;
239 outdev = out ? out->name : nulldevname;
240 /* We handle fragments by dealing with the first fragment as
241 * if it was a normal packet. All other fragments are treated
242 * normally, except that they will NEVER match rules that ask
243 * things we don't know, ie. tcp syn flag or ports). If the
244 * rule is also a fragment-specific rule, non-fragments won't
245 * match it. */
246 offset = ntohs(ip->frag_off) & IP_OFFSET;
247
248 read_lock_bh(&table->lock);
249 IP_NF_ASSERT(table->valid_hooks & (1 << hook));
Harald Welte2e4e6a12006-01-12 13:30:04 -0800250 table_base = (void *)private->entries[smp_processor_id()];
251 e = get_entry(table_base, private->hook_entry[hook]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252
253 /* For return from builtin chain */
Harald Welte2e4e6a12006-01-12 13:30:04 -0800254 back = get_entry(table_base, private->underflow[hook]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255
256 do {
257 IP_NF_ASSERT(e);
258 IP_NF_ASSERT(back);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700259 if (ip_packet_match(ip, indev, outdev, &e->ip, offset)) {
260 struct ipt_entry_target *t;
261
262 if (IPT_MATCH_ITERATE(e, do_match,
263 *pskb, in, out,
264 offset, &hotdrop) != 0)
265 goto no_match;
266
267 ADD_COUNTER(e->counters, ntohs(ip->tot_len), 1);
268
269 t = ipt_get_target(e);
270 IP_NF_ASSERT(t->u.kernel.target);
271 /* Standard target? */
272 if (!t->u.kernel.target->target) {
273 int v;
274
275 v = ((struct ipt_standard_target *)t)->verdict;
276 if (v < 0) {
277 /* Pop from stack? */
278 if (v != IPT_RETURN) {
279 verdict = (unsigned)(-v) - 1;
280 break;
281 }
282 e = back;
283 back = get_entry(table_base,
284 back->comefrom);
285 continue;
286 }
Patrick McHardy05465342005-08-21 23:31:43 -0700287 if (table_base + v != (void *)e + e->next_offset
288 && !(e->ip.flags & IPT_F_GOTO)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289 /* Save old back ptr in next entry */
290 struct ipt_entry *next
291 = (void *)e + e->next_offset;
292 next->comefrom
293 = (void *)back - table_base;
294 /* set back pointer to next entry */
295 back = next;
296 }
297
298 e = get_entry(table_base, v);
299 } else {
300 /* Targets which reenter must return
301 abs. verdicts */
302#ifdef CONFIG_NETFILTER_DEBUG
303 ((struct ipt_entry *)table_base)->comefrom
304 = 0xeeeeeeec;
305#endif
306 verdict = t->u.kernel.target->target(pskb,
307 in, out,
308 hook,
Patrick McHardy1c524832006-03-20 18:02:15 -0800309 t->u.kernel.target,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310 t->data,
311 userdata);
312
313#ifdef CONFIG_NETFILTER_DEBUG
314 if (((struct ipt_entry *)table_base)->comefrom
315 != 0xeeeeeeec
316 && verdict == IPT_CONTINUE) {
317 printk("Target %s reentered!\n",
318 t->u.kernel.target->name);
319 verdict = NF_DROP;
320 }
321 ((struct ipt_entry *)table_base)->comefrom
322 = 0x57acc001;
323#endif
324 /* Target might have changed stuff. */
325 ip = (*pskb)->nh.iph;
326 datalen = (*pskb)->len - ip->ihl * 4;
327
328 if (verdict == IPT_CONTINUE)
329 e = (void *)e + e->next_offset;
330 else
331 /* Verdict */
332 break;
333 }
334 } else {
335
336 no_match:
337 e = (void *)e + e->next_offset;
338 }
339 } while (!hotdrop);
340
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 read_unlock_bh(&table->lock);
342
343#ifdef DEBUG_ALLOW_ALL
344 return NF_ACCEPT;
345#else
346 if (hotdrop)
347 return NF_DROP;
348 else return verdict;
349#endif
350}
351
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352/* All zeroes == unconditional rule. */
353static inline int
354unconditional(const struct ipt_ip *ip)
355{
356 unsigned int i;
357
358 for (i = 0; i < sizeof(*ip)/sizeof(__u32); i++)
359 if (((__u32 *)ip)[i])
360 return 0;
361
362 return 1;
363}
364
365/* Figures out from what hook each rule can be called: returns 0 if
366 there are loops. Puts hook bitmask in comefrom. */
367static int
Harald Welte2e4e6a12006-01-12 13:30:04 -0800368mark_source_chains(struct xt_table_info *newinfo,
Eric Dumazet31836062005-12-13 23:13:48 -0800369 unsigned int valid_hooks, void *entry0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370{
371 unsigned int hook;
372
373 /* No recursion; use packet counter to save back ptrs (reset
374 to 0 as we leave), and comefrom to save source hook bitmask */
375 for (hook = 0; hook < NF_IP_NUMHOOKS; hook++) {
376 unsigned int pos = newinfo->hook_entry[hook];
377 struct ipt_entry *e
Eric Dumazet31836062005-12-13 23:13:48 -0800378 = (struct ipt_entry *)(entry0 + pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379
380 if (!(valid_hooks & (1 << hook)))
381 continue;
382
383 /* Set initial back pointer. */
384 e->counters.pcnt = pos;
385
386 for (;;) {
387 struct ipt_standard_target *t
388 = (void *)ipt_get_target(e);
389
390 if (e->comefrom & (1 << NF_IP_NUMHOOKS)) {
391 printk("iptables: loop hook %u pos %u %08X.\n",
392 hook, pos, e->comefrom);
393 return 0;
394 }
395 e->comefrom
396 |= ((1 << hook) | (1 << NF_IP_NUMHOOKS));
397
398 /* Unconditional return/END. */
399 if (e->target_offset == sizeof(struct ipt_entry)
400 && (strcmp(t->target.u.user.name,
401 IPT_STANDARD_TARGET) == 0)
402 && t->verdict < 0
403 && unconditional(&e->ip)) {
404 unsigned int oldpos, size;
405
406 /* Return: backtrack through the last
407 big jump. */
408 do {
409 e->comefrom ^= (1<<NF_IP_NUMHOOKS);
410#ifdef DEBUG_IP_FIREWALL_USER
411 if (e->comefrom
412 & (1 << NF_IP_NUMHOOKS)) {
413 duprintf("Back unset "
414 "on hook %u "
415 "rule %u\n",
416 hook, pos);
417 }
418#endif
419 oldpos = pos;
420 pos = e->counters.pcnt;
421 e->counters.pcnt = 0;
422
423 /* We're at the start. */
424 if (pos == oldpos)
425 goto next;
426
427 e = (struct ipt_entry *)
Eric Dumazet31836062005-12-13 23:13:48 -0800428 (entry0 + pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700429 } while (oldpos == pos + e->next_offset);
430
431 /* Move along one */
432 size = e->next_offset;
433 e = (struct ipt_entry *)
Eric Dumazet31836062005-12-13 23:13:48 -0800434 (entry0 + pos + size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435 e->counters.pcnt = pos;
436 pos += size;
437 } else {
438 int newpos = t->verdict;
439
440 if (strcmp(t->target.u.user.name,
441 IPT_STANDARD_TARGET) == 0
442 && newpos >= 0) {
443 /* This a jump; chase it. */
444 duprintf("Jump rule %u -> %u\n",
445 pos, newpos);
446 } else {
447 /* ... this is a fallthru */
448 newpos = pos + e->next_offset;
449 }
450 e = (struct ipt_entry *)
Eric Dumazet31836062005-12-13 23:13:48 -0800451 (entry0 + newpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452 e->counters.pcnt = pos;
453 pos = newpos;
454 }
455 }
456 next:
457 duprintf("Finished chain %u\n", hook);
458 }
459 return 1;
460}
461
462static inline int
463cleanup_match(struct ipt_entry_match *m, unsigned int *i)
464{
465 if (i && (*i)-- == 0)
466 return 1;
467
468 if (m->u.kernel.match->destroy)
Patrick McHardy1c524832006-03-20 18:02:15 -0800469 m->u.kernel.match->destroy(m->u.kernel.match, m->data,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700470 m->u.match_size - sizeof(*m));
471 module_put(m->u.kernel.match->me);
472 return 0;
473}
474
475static inline int
476standard_check(const struct ipt_entry_target *t,
477 unsigned int max_offset)
478{
479 struct ipt_standard_target *targ = (void *)t;
480
481 /* Check standard info. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700482 if (targ->verdict >= 0
483 && targ->verdict > max_offset - sizeof(struct ipt_entry)) {
484 duprintf("ipt_standard_check: bad verdict (%i)\n",
485 targ->verdict);
486 return 0;
487 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700488 if (targ->verdict < -NF_MAX_VERDICT - 1) {
489 duprintf("ipt_standard_check: bad negative verdict (%i)\n",
490 targ->verdict);
491 return 0;
492 }
493 return 1;
494}
495
496static inline int
497check_match(struct ipt_entry_match *m,
498 const char *name,
499 const struct ipt_ip *ip,
500 unsigned int hookmask,
501 unsigned int *i)
502{
503 struct ipt_match *match;
Patrick McHardy3cdc7c92006-03-20 18:00:36 -0800504 int ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505
Harald Welte2e4e6a12006-01-12 13:30:04 -0800506 match = try_then_request_module(xt_find_match(AF_INET, m->u.user.name,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700507 m->u.user.revision),
508 "ipt_%s", m->u.user.name);
509 if (IS_ERR(match) || !match) {
510 duprintf("check_match: `%s' not found\n", m->u.user.name);
511 return match ? PTR_ERR(match) : -ENOENT;
512 }
513 m->u.kernel.match = match;
514
Patrick McHardy3cdc7c92006-03-20 18:00:36 -0800515 ret = xt_check_match(match, AF_INET, m->u.match_size - sizeof(*m),
516 name, hookmask, ip->proto,
517 ip->invflags & IPT_INV_PROTO);
518 if (ret)
519 goto err;
520
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 if (m->u.kernel.match->checkentry
Patrick McHardy1c524832006-03-20 18:02:15 -0800522 && !m->u.kernel.match->checkentry(name, ip, match, m->data,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700523 m->u.match_size - sizeof(*m),
524 hookmask)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700525 duprintf("ip_tables: check failed for `%s'.\n",
526 m->u.kernel.match->name);
Patrick McHardy3cdc7c92006-03-20 18:00:36 -0800527 ret = -EINVAL;
528 goto err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700529 }
530
531 (*i)++;
532 return 0;
Patrick McHardy3cdc7c92006-03-20 18:00:36 -0800533err:
534 module_put(m->u.kernel.match->me);
535 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536}
537
538static struct ipt_target ipt_standard_target;
539
540static inline int
541check_entry(struct ipt_entry *e, const char *name, unsigned int size,
542 unsigned int *i)
543{
544 struct ipt_entry_target *t;
545 struct ipt_target *target;
546 int ret;
547 unsigned int j;
548
549 if (!ip_checkentry(&e->ip)) {
550 duprintf("ip_tables: ip check failed %p %s.\n", e, name);
551 return -EINVAL;
552 }
553
554 j = 0;
555 ret = IPT_MATCH_ITERATE(e, check_match, name, &e->ip, e->comefrom, &j);
556 if (ret != 0)
557 goto cleanup_matches;
558
559 t = ipt_get_target(e);
Harald Welte2e4e6a12006-01-12 13:30:04 -0800560 target = try_then_request_module(xt_find_target(AF_INET,
561 t->u.user.name,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700562 t->u.user.revision),
563 "ipt_%s", t->u.user.name);
564 if (IS_ERR(target) || !target) {
565 duprintf("check_entry: `%s' not found\n", t->u.user.name);
566 ret = target ? PTR_ERR(target) : -ENOENT;
567 goto cleanup_matches;
568 }
569 t->u.kernel.target = target;
570
Patrick McHardy3cdc7c92006-03-20 18:00:36 -0800571 ret = xt_check_target(target, AF_INET, t->u.target_size - sizeof(*t),
572 name, e->comefrom, e->ip.proto,
573 e->ip.invflags & IPT_INV_PROTO);
574 if (ret)
575 goto err;
576
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577 if (t->u.kernel.target == &ipt_standard_target) {
578 if (!standard_check(t, size)) {
579 ret = -EINVAL;
580 goto cleanup_matches;
581 }
582 } else if (t->u.kernel.target->checkentry
Patrick McHardy1c524832006-03-20 18:02:15 -0800583 && !t->u.kernel.target->checkentry(name, e, target, t->data,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700584 t->u.target_size
585 - sizeof(*t),
586 e->comefrom)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700587 duprintf("ip_tables: check failed for `%s'.\n",
588 t->u.kernel.target->name);
589 ret = -EINVAL;
Patrick McHardy3cdc7c92006-03-20 18:00:36 -0800590 goto err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700591 }
592
593 (*i)++;
594 return 0;
Patrick McHardy3cdc7c92006-03-20 18:00:36 -0800595 err:
596 module_put(t->u.kernel.target->me);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597 cleanup_matches:
598 IPT_MATCH_ITERATE(e, cleanup_match, &j);
599 return ret;
600}
601
602static inline int
603check_entry_size_and_hooks(struct ipt_entry *e,
Harald Welte2e4e6a12006-01-12 13:30:04 -0800604 struct xt_table_info *newinfo,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700605 unsigned char *base,
606 unsigned char *limit,
607 const unsigned int *hook_entries,
608 const unsigned int *underflows,
609 unsigned int *i)
610{
611 unsigned int h;
612
613 if ((unsigned long)e % __alignof__(struct ipt_entry) != 0
614 || (unsigned char *)e + sizeof(struct ipt_entry) >= limit) {
615 duprintf("Bad offset %p\n", e);
616 return -EINVAL;
617 }
618
619 if (e->next_offset
620 < sizeof(struct ipt_entry) + sizeof(struct ipt_entry_target)) {
621 duprintf("checking: element %p size %u\n",
622 e, e->next_offset);
623 return -EINVAL;
624 }
625
626 /* Check hooks & underflows */
627 for (h = 0; h < NF_IP_NUMHOOKS; h++) {
628 if ((unsigned char *)e - base == hook_entries[h])
629 newinfo->hook_entry[h] = hook_entries[h];
630 if ((unsigned char *)e - base == underflows[h])
631 newinfo->underflow[h] = underflows[h];
632 }
633
634 /* FIXME: underflows must be unconditional, standard verdicts
635 < 0 (not IPT_RETURN). --RR */
636
637 /* Clear counters and comefrom */
Harald Welte2e4e6a12006-01-12 13:30:04 -0800638 e->counters = ((struct xt_counters) { 0, 0 });
Linus Torvalds1da177e2005-04-16 15:20:36 -0700639 e->comefrom = 0;
640
641 (*i)++;
642 return 0;
643}
644
645static inline int
646cleanup_entry(struct ipt_entry *e, unsigned int *i)
647{
648 struct ipt_entry_target *t;
649
650 if (i && (*i)-- == 0)
651 return 1;
652
653 /* Cleanup all matches */
654 IPT_MATCH_ITERATE(e, cleanup_match, NULL);
655 t = ipt_get_target(e);
656 if (t->u.kernel.target->destroy)
Patrick McHardy1c524832006-03-20 18:02:15 -0800657 t->u.kernel.target->destroy(t->u.kernel.target, t->data,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700658 t->u.target_size - sizeof(*t));
659 module_put(t->u.kernel.target->me);
660 return 0;
661}
662
663/* Checks and translates the user-supplied table segment (held in
664 newinfo) */
665static int
666translate_table(const char *name,
667 unsigned int valid_hooks,
Harald Welte2e4e6a12006-01-12 13:30:04 -0800668 struct xt_table_info *newinfo,
Eric Dumazet31836062005-12-13 23:13:48 -0800669 void *entry0,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700670 unsigned int size,
671 unsigned int number,
672 const unsigned int *hook_entries,
673 const unsigned int *underflows)
674{
675 unsigned int i;
676 int ret;
677
678 newinfo->size = size;
679 newinfo->number = number;
680
681 /* Init all hooks to impossible value. */
682 for (i = 0; i < NF_IP_NUMHOOKS; i++) {
683 newinfo->hook_entry[i] = 0xFFFFFFFF;
684 newinfo->underflow[i] = 0xFFFFFFFF;
685 }
686
687 duprintf("translate_table: size %u\n", newinfo->size);
688 i = 0;
689 /* Walk through entries, checking offsets. */
Eric Dumazet31836062005-12-13 23:13:48 -0800690 ret = IPT_ENTRY_ITERATE(entry0, newinfo->size,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691 check_entry_size_and_hooks,
692 newinfo,
Eric Dumazet31836062005-12-13 23:13:48 -0800693 entry0,
694 entry0 + size,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700695 hook_entries, underflows, &i);
696 if (ret != 0)
697 return ret;
698
699 if (i != number) {
700 duprintf("translate_table: %u not %u entries\n",
701 i, number);
702 return -EINVAL;
703 }
704
705 /* Check hooks all assigned */
706 for (i = 0; i < NF_IP_NUMHOOKS; i++) {
707 /* Only hooks which are valid */
708 if (!(valid_hooks & (1 << i)))
709 continue;
710 if (newinfo->hook_entry[i] == 0xFFFFFFFF) {
711 duprintf("Invalid hook entry %u %u\n",
712 i, hook_entries[i]);
713 return -EINVAL;
714 }
715 if (newinfo->underflow[i] == 0xFFFFFFFF) {
716 duprintf("Invalid underflow %u %u\n",
717 i, underflows[i]);
718 return -EINVAL;
719 }
720 }
721
Eric Dumazet31836062005-12-13 23:13:48 -0800722 if (!mark_source_chains(newinfo, valid_hooks, entry0))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723 return -ELOOP;
724
725 /* Finally, each sanity check must pass */
726 i = 0;
Eric Dumazet31836062005-12-13 23:13:48 -0800727 ret = IPT_ENTRY_ITERATE(entry0, newinfo->size,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700728 check_entry, name, size, &i);
729
730 if (ret != 0) {
Eric Dumazet31836062005-12-13 23:13:48 -0800731 IPT_ENTRY_ITERATE(entry0, newinfo->size,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700732 cleanup_entry, &i);
733 return ret;
734 }
735
736 /* And one copy for every other CPU */
David S. Millerc8923c62005-10-13 14:41:23 -0700737 for_each_cpu(i) {
Eric Dumazet31836062005-12-13 23:13:48 -0800738 if (newinfo->entries[i] && newinfo->entries[i] != entry0)
739 memcpy(newinfo->entries[i], entry0, newinfo->size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700740 }
741
742 return ret;
743}
744
Linus Torvalds1da177e2005-04-16 15:20:36 -0700745/* Gets counters. */
746static inline int
747add_entry_to_counter(const struct ipt_entry *e,
Harald Welte2e4e6a12006-01-12 13:30:04 -0800748 struct xt_counters total[],
Linus Torvalds1da177e2005-04-16 15:20:36 -0700749 unsigned int *i)
750{
751 ADD_COUNTER(total[*i], e->counters.bcnt, e->counters.pcnt);
752
753 (*i)++;
754 return 0;
755}
756
Eric Dumazet31836062005-12-13 23:13:48 -0800757static inline int
758set_entry_to_counter(const struct ipt_entry *e,
759 struct ipt_counters total[],
760 unsigned int *i)
761{
762 SET_COUNTER(total[*i], e->counters.bcnt, e->counters.pcnt);
763
764 (*i)++;
765 return 0;
766}
767
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768static void
Harald Welte2e4e6a12006-01-12 13:30:04 -0800769get_counters(const struct xt_table_info *t,
770 struct xt_counters counters[])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700771{
772 unsigned int cpu;
773 unsigned int i;
Eric Dumazet31836062005-12-13 23:13:48 -0800774 unsigned int curcpu;
775
776 /* Instead of clearing (by a previous call to memset())
777 * the counters and using adds, we set the counters
778 * with data used by 'current' CPU
779 * We dont care about preemption here.
780 */
781 curcpu = raw_smp_processor_id();
782
783 i = 0;
784 IPT_ENTRY_ITERATE(t->entries[curcpu],
785 t->size,
786 set_entry_to_counter,
787 counters,
788 &i);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700789
David S. Millerc8923c62005-10-13 14:41:23 -0700790 for_each_cpu(cpu) {
Eric Dumazet31836062005-12-13 23:13:48 -0800791 if (cpu == curcpu)
792 continue;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700793 i = 0;
Eric Dumazet31836062005-12-13 23:13:48 -0800794 IPT_ENTRY_ITERATE(t->entries[cpu],
Linus Torvalds1da177e2005-04-16 15:20:36 -0700795 t->size,
796 add_entry_to_counter,
797 counters,
798 &i);
799 }
800}
801
802static int
803copy_entries_to_user(unsigned int total_size,
804 struct ipt_table *table,
805 void __user *userptr)
806{
807 unsigned int off, num, countersize;
808 struct ipt_entry *e;
Harald Welte2e4e6a12006-01-12 13:30:04 -0800809 struct xt_counters *counters;
810 struct xt_table_info *private = table->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700811 int ret = 0;
Eric Dumazet31836062005-12-13 23:13:48 -0800812 void *loc_cpu_entry;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700813
814 /* We need atomic snapshot of counters: rest doesn't change
815 (other than comefrom, which userspace doesn't care
816 about). */
Harald Welte2e4e6a12006-01-12 13:30:04 -0800817 countersize = sizeof(struct xt_counters) * private->number;
Eric Dumazet31836062005-12-13 23:13:48 -0800818 counters = vmalloc_node(countersize, numa_node_id());
Linus Torvalds1da177e2005-04-16 15:20:36 -0700819
820 if (counters == NULL)
821 return -ENOMEM;
822
823 /* First, sum counters... */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700824 write_lock_bh(&table->lock);
Harald Welte2e4e6a12006-01-12 13:30:04 -0800825 get_counters(private, counters);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700826 write_unlock_bh(&table->lock);
827
Eric Dumazet31836062005-12-13 23:13:48 -0800828 /* choose the copy that is on our node/cpu, ...
829 * This choice is lazy (because current thread is
830 * allowed to migrate to another cpu)
831 */
Harald Welte2e4e6a12006-01-12 13:30:04 -0800832 loc_cpu_entry = private->entries[raw_smp_processor_id()];
Eric Dumazet31836062005-12-13 23:13:48 -0800833 /* ... then copy entire thing ... */
834 if (copy_to_user(userptr, loc_cpu_entry, total_size) != 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700835 ret = -EFAULT;
836 goto free_counters;
837 }
838
839 /* FIXME: use iterator macros --RR */
840 /* ... then go back and fix counters and names */
841 for (off = 0, num = 0; off < total_size; off += e->next_offset, num++){
842 unsigned int i;
843 struct ipt_entry_match *m;
844 struct ipt_entry_target *t;
845
Eric Dumazet31836062005-12-13 23:13:48 -0800846 e = (struct ipt_entry *)(loc_cpu_entry + off);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700847 if (copy_to_user(userptr + off
848 + offsetof(struct ipt_entry, counters),
849 &counters[num],
850 sizeof(counters[num])) != 0) {
851 ret = -EFAULT;
852 goto free_counters;
853 }
854
855 for (i = sizeof(struct ipt_entry);
856 i < e->target_offset;
857 i += m->u.match_size) {
858 m = (void *)e + i;
859
860 if (copy_to_user(userptr + off + i
861 + offsetof(struct ipt_entry_match,
862 u.user.name),
863 m->u.kernel.match->name,
864 strlen(m->u.kernel.match->name)+1)
865 != 0) {
866 ret = -EFAULT;
867 goto free_counters;
868 }
869 }
870
871 t = ipt_get_target(e);
872 if (copy_to_user(userptr + off + e->target_offset
873 + offsetof(struct ipt_entry_target,
874 u.user.name),
875 t->u.kernel.target->name,
876 strlen(t->u.kernel.target->name)+1) != 0) {
877 ret = -EFAULT;
878 goto free_counters;
879 }
880 }
881
882 free_counters:
883 vfree(counters);
884 return ret;
885}
886
887static int
888get_entries(const struct ipt_get_entries *entries,
889 struct ipt_get_entries __user *uptr)
890{
891 int ret;
892 struct ipt_table *t;
893
Harald Welte2e4e6a12006-01-12 13:30:04 -0800894 t = xt_find_table_lock(AF_INET, entries->name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895 if (t && !IS_ERR(t)) {
Harald Welte2e4e6a12006-01-12 13:30:04 -0800896 struct xt_table_info *private = t->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700897 duprintf("t->private->number = %u\n",
Harald Welte2e4e6a12006-01-12 13:30:04 -0800898 private->number);
899 if (entries->size == private->size)
900 ret = copy_entries_to_user(private->size,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700901 t, uptr->entrytable);
902 else {
903 duprintf("get_entries: I've got %u not %u!\n",
Harald Welte2e4e6a12006-01-12 13:30:04 -0800904 private->size,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700905 entries->size);
906 ret = -EINVAL;
907 }
908 module_put(t->me);
Harald Welte2e4e6a12006-01-12 13:30:04 -0800909 xt_table_unlock(t);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700910 } else
911 ret = t ? PTR_ERR(t) : -ENOENT;
912
913 return ret;
914}
915
916static int
917do_replace(void __user *user, unsigned int len)
918{
919 int ret;
920 struct ipt_replace tmp;
921 struct ipt_table *t;
Harald Welte2e4e6a12006-01-12 13:30:04 -0800922 struct xt_table_info *newinfo, *oldinfo;
923 struct xt_counters *counters;
Eric Dumazet31836062005-12-13 23:13:48 -0800924 void *loc_cpu_entry, *loc_cpu_old_entry;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700925
926 if (copy_from_user(&tmp, user, sizeof(tmp)) != 0)
927 return -EFAULT;
928
929 /* Hack: Causes ipchains to give correct error msg --RR */
930 if (len != sizeof(tmp) + tmp.size)
931 return -ENOPROTOOPT;
932
Kirill Korotaevee4bb812006-02-04 02:16:56 -0800933 /* overflow check */
934 if (tmp.size >= (INT_MAX - sizeof(struct xt_table_info)) / NR_CPUS -
935 SMP_CACHE_BYTES)
936 return -ENOMEM;
937 if (tmp.num_counters >= INT_MAX / sizeof(struct xt_counters))
938 return -ENOMEM;
939
Harald Welte2e4e6a12006-01-12 13:30:04 -0800940 newinfo = xt_alloc_table_info(tmp.size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700941 if (!newinfo)
942 return -ENOMEM;
943
Eric Dumazet31836062005-12-13 23:13:48 -0800944 /* choose the copy that is our node/cpu */
945 loc_cpu_entry = newinfo->entries[raw_smp_processor_id()];
946 if (copy_from_user(loc_cpu_entry, user + sizeof(tmp),
Linus Torvalds1da177e2005-04-16 15:20:36 -0700947 tmp.size) != 0) {
948 ret = -EFAULT;
949 goto free_newinfo;
950 }
951
Harald Welte2e4e6a12006-01-12 13:30:04 -0800952 counters = vmalloc(tmp.num_counters * sizeof(struct xt_counters));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700953 if (!counters) {
954 ret = -ENOMEM;
955 goto free_newinfo;
956 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700957
958 ret = translate_table(tmp.name, tmp.valid_hooks,
Eric Dumazet31836062005-12-13 23:13:48 -0800959 newinfo, loc_cpu_entry, tmp.size, tmp.num_entries,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700960 tmp.hook_entry, tmp.underflow);
961 if (ret != 0)
962 goto free_newinfo_counters;
963
964 duprintf("ip_tables: Translated table\n");
965
Harald Welte2e4e6a12006-01-12 13:30:04 -0800966 t = try_then_request_module(xt_find_table_lock(AF_INET, tmp.name),
Linus Torvalds1da177e2005-04-16 15:20:36 -0700967 "iptable_%s", tmp.name);
968 if (!t || IS_ERR(t)) {
969 ret = t ? PTR_ERR(t) : -ENOENT;
970 goto free_newinfo_counters_untrans;
971 }
972
973 /* You lied! */
974 if (tmp.valid_hooks != t->valid_hooks) {
975 duprintf("Valid hook crap: %08X vs %08X\n",
976 tmp.valid_hooks, t->valid_hooks);
977 ret = -EINVAL;
978 goto put_module;
979 }
980
Harald Welte2e4e6a12006-01-12 13:30:04 -0800981 oldinfo = xt_replace_table(t, tmp.num_counters, newinfo, &ret);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700982 if (!oldinfo)
983 goto put_module;
984
985 /* Update module usage count based on number of rules */
986 duprintf("do_replace: oldnum=%u, initnum=%u, newnum=%u\n",
987 oldinfo->number, oldinfo->initial_entries, newinfo->number);
988 if ((oldinfo->number > oldinfo->initial_entries) ||
989 (newinfo->number <= oldinfo->initial_entries))
990 module_put(t->me);
991 if ((oldinfo->number > oldinfo->initial_entries) &&
992 (newinfo->number <= oldinfo->initial_entries))
993 module_put(t->me);
994
995 /* Get the old counters. */
996 get_counters(oldinfo, counters);
997 /* Decrease module usage counts and free resource */
Eric Dumazet31836062005-12-13 23:13:48 -0800998 loc_cpu_old_entry = oldinfo->entries[raw_smp_processor_id()];
999 IPT_ENTRY_ITERATE(loc_cpu_old_entry, oldinfo->size, cleanup_entry,NULL);
Harald Welte2e4e6a12006-01-12 13:30:04 -08001000 xt_free_table_info(oldinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001001 if (copy_to_user(tmp.counters, counters,
Harald Welte2e4e6a12006-01-12 13:30:04 -08001002 sizeof(struct xt_counters) * tmp.num_counters) != 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001003 ret = -EFAULT;
1004 vfree(counters);
Harald Welte2e4e6a12006-01-12 13:30:04 -08001005 xt_table_unlock(t);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001006 return ret;
1007
1008 put_module:
1009 module_put(t->me);
Harald Welte2e4e6a12006-01-12 13:30:04 -08001010 xt_table_unlock(t);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001011 free_newinfo_counters_untrans:
Eric Dumazet31836062005-12-13 23:13:48 -08001012 IPT_ENTRY_ITERATE(loc_cpu_entry, newinfo->size, cleanup_entry,NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001013 free_newinfo_counters:
1014 vfree(counters);
1015 free_newinfo:
Harald Welte2e4e6a12006-01-12 13:30:04 -08001016 xt_free_table_info(newinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001017 return ret;
1018}
1019
1020/* We're lazy, and add to the first CPU; overflow works its fey magic
1021 * and everything is OK. */
1022static inline int
1023add_counter_to_entry(struct ipt_entry *e,
Harald Welte2e4e6a12006-01-12 13:30:04 -08001024 const struct xt_counters addme[],
Linus Torvalds1da177e2005-04-16 15:20:36 -07001025 unsigned int *i)
1026{
1027#if 0
1028 duprintf("add_counter: Entry %u %lu/%lu + %lu/%lu\n",
1029 *i,
1030 (long unsigned int)e->counters.pcnt,
1031 (long unsigned int)e->counters.bcnt,
1032 (long unsigned int)addme[*i].pcnt,
1033 (long unsigned int)addme[*i].bcnt);
1034#endif
1035
1036 ADD_COUNTER(e->counters, addme[*i].bcnt, addme[*i].pcnt);
1037
1038 (*i)++;
1039 return 0;
1040}
1041
1042static int
1043do_add_counters(void __user *user, unsigned int len)
1044{
1045 unsigned int i;
Harald Welte2e4e6a12006-01-12 13:30:04 -08001046 struct xt_counters_info tmp, *paddc;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001047 struct ipt_table *t;
Harald Welte2e4e6a12006-01-12 13:30:04 -08001048 struct xt_table_info *private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001049 int ret = 0;
Eric Dumazet31836062005-12-13 23:13:48 -08001050 void *loc_cpu_entry;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001051
1052 if (copy_from_user(&tmp, user, sizeof(tmp)) != 0)
1053 return -EFAULT;
1054
Harald Welte2e4e6a12006-01-12 13:30:04 -08001055 if (len != sizeof(tmp) + tmp.num_counters*sizeof(struct xt_counters))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001056 return -EINVAL;
1057
Eric Dumazet31836062005-12-13 23:13:48 -08001058 paddc = vmalloc_node(len, numa_node_id());
Linus Torvalds1da177e2005-04-16 15:20:36 -07001059 if (!paddc)
1060 return -ENOMEM;
1061
1062 if (copy_from_user(paddc, user, len) != 0) {
1063 ret = -EFAULT;
1064 goto free;
1065 }
1066
Harald Welte2e4e6a12006-01-12 13:30:04 -08001067 t = xt_find_table_lock(AF_INET, tmp.name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001068 if (!t || IS_ERR(t)) {
1069 ret = t ? PTR_ERR(t) : -ENOENT;
1070 goto free;
1071 }
1072
1073 write_lock_bh(&t->lock);
Harald Welte2e4e6a12006-01-12 13:30:04 -08001074 private = t->private;
1075 if (private->number != paddc->num_counters) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001076 ret = -EINVAL;
1077 goto unlock_up_free;
1078 }
1079
1080 i = 0;
Eric Dumazet31836062005-12-13 23:13:48 -08001081 /* Choose the copy that is on our node */
Harald Welte2e4e6a12006-01-12 13:30:04 -08001082 loc_cpu_entry = private->entries[raw_smp_processor_id()];
Eric Dumazet31836062005-12-13 23:13:48 -08001083 IPT_ENTRY_ITERATE(loc_cpu_entry,
Harald Welte2e4e6a12006-01-12 13:30:04 -08001084 private->size,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001085 add_counter_to_entry,
1086 paddc->counters,
1087 &i);
1088 unlock_up_free:
1089 write_unlock_bh(&t->lock);
Harald Welte2e4e6a12006-01-12 13:30:04 -08001090 xt_table_unlock(t);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001091 module_put(t->me);
1092 free:
1093 vfree(paddc);
1094
1095 return ret;
1096}
1097
1098static int
1099do_ipt_set_ctl(struct sock *sk, int cmd, void __user *user, unsigned int len)
1100{
1101 int ret;
1102
1103 if (!capable(CAP_NET_ADMIN))
1104 return -EPERM;
1105
1106 switch (cmd) {
1107 case IPT_SO_SET_REPLACE:
1108 ret = do_replace(user, len);
1109 break;
1110
1111 case IPT_SO_SET_ADD_COUNTERS:
1112 ret = do_add_counters(user, len);
1113 break;
1114
1115 default:
1116 duprintf("do_ipt_set_ctl: unknown request %i\n", cmd);
1117 ret = -EINVAL;
1118 }
1119
1120 return ret;
1121}
1122
1123static int
1124do_ipt_get_ctl(struct sock *sk, int cmd, void __user *user, int *len)
1125{
1126 int ret;
1127
1128 if (!capable(CAP_NET_ADMIN))
1129 return -EPERM;
1130
1131 switch (cmd) {
1132 case IPT_SO_GET_INFO: {
1133 char name[IPT_TABLE_MAXNAMELEN];
1134 struct ipt_table *t;
1135
1136 if (*len != sizeof(struct ipt_getinfo)) {
1137 duprintf("length %u != %u\n", *len,
1138 sizeof(struct ipt_getinfo));
1139 ret = -EINVAL;
1140 break;
1141 }
1142
1143 if (copy_from_user(name, user, sizeof(name)) != 0) {
1144 ret = -EFAULT;
1145 break;
1146 }
1147 name[IPT_TABLE_MAXNAMELEN-1] = '\0';
1148
Harald Welte2e4e6a12006-01-12 13:30:04 -08001149 t = try_then_request_module(xt_find_table_lock(AF_INET, name),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001150 "iptable_%s", name);
1151 if (t && !IS_ERR(t)) {
1152 struct ipt_getinfo info;
Harald Welte2e4e6a12006-01-12 13:30:04 -08001153 struct xt_table_info *private = t->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001154
1155 info.valid_hooks = t->valid_hooks;
Harald Welte2e4e6a12006-01-12 13:30:04 -08001156 memcpy(info.hook_entry, private->hook_entry,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001157 sizeof(info.hook_entry));
Harald Welte2e4e6a12006-01-12 13:30:04 -08001158 memcpy(info.underflow, private->underflow,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001159 sizeof(info.underflow));
Harald Welte2e4e6a12006-01-12 13:30:04 -08001160 info.num_entries = private->number;
1161 info.size = private->size;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001162 memcpy(info.name, name, sizeof(info.name));
1163
1164 if (copy_to_user(user, &info, *len) != 0)
1165 ret = -EFAULT;
1166 else
1167 ret = 0;
Harald Welte2e4e6a12006-01-12 13:30:04 -08001168 xt_table_unlock(t);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001169 module_put(t->me);
1170 } else
1171 ret = t ? PTR_ERR(t) : -ENOENT;
1172 }
1173 break;
1174
1175 case IPT_SO_GET_ENTRIES: {
1176 struct ipt_get_entries get;
1177
1178 if (*len < sizeof(get)) {
1179 duprintf("get_entries: %u < %u\n", *len, sizeof(get));
1180 ret = -EINVAL;
1181 } else if (copy_from_user(&get, user, sizeof(get)) != 0) {
1182 ret = -EFAULT;
1183 } else if (*len != sizeof(struct ipt_get_entries) + get.size) {
1184 duprintf("get_entries: %u != %u\n", *len,
1185 sizeof(struct ipt_get_entries) + get.size);
1186 ret = -EINVAL;
1187 } else
1188 ret = get_entries(&get, user);
1189 break;
1190 }
1191
1192 case IPT_SO_GET_REVISION_MATCH:
1193 case IPT_SO_GET_REVISION_TARGET: {
1194 struct ipt_get_revision rev;
Harald Welte2e4e6a12006-01-12 13:30:04 -08001195 int target;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001196
1197 if (*len != sizeof(rev)) {
1198 ret = -EINVAL;
1199 break;
1200 }
1201 if (copy_from_user(&rev, user, sizeof(rev)) != 0) {
1202 ret = -EFAULT;
1203 break;
1204 }
1205
1206 if (cmd == IPT_SO_GET_REVISION_TARGET)
Harald Welte2e4e6a12006-01-12 13:30:04 -08001207 target = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001208 else
Harald Welte2e4e6a12006-01-12 13:30:04 -08001209 target = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001210
Harald Welte2e4e6a12006-01-12 13:30:04 -08001211 try_then_request_module(xt_find_revision(AF_INET, rev.name,
1212 rev.revision,
1213 target, &ret),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001214 "ipt_%s", rev.name);
1215 break;
1216 }
1217
1218 default:
1219 duprintf("do_ipt_get_ctl: unknown request %i\n", cmd);
1220 ret = -EINVAL;
1221 }
1222
1223 return ret;
1224}
1225
Harald Welte2e4e6a12006-01-12 13:30:04 -08001226int ipt_register_table(struct xt_table *table, const struct ipt_replace *repl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227{
1228 int ret;
Harald Welte2e4e6a12006-01-12 13:30:04 -08001229 struct xt_table_info *newinfo;
1230 static struct xt_table_info bootstrap
Linus Torvalds1da177e2005-04-16 15:20:36 -07001231 = { 0, 0, 0, { 0 }, { 0 }, { } };
Eric Dumazet31836062005-12-13 23:13:48 -08001232 void *loc_cpu_entry;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001233
Harald Welte2e4e6a12006-01-12 13:30:04 -08001234 newinfo = xt_alloc_table_info(repl->size);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001235 if (!newinfo)
1236 return -ENOMEM;
1237
Eric Dumazet31836062005-12-13 23:13:48 -08001238 /* choose the copy on our node/cpu
1239 * but dont care of preemption
1240 */
1241 loc_cpu_entry = newinfo->entries[raw_smp_processor_id()];
1242 memcpy(loc_cpu_entry, repl->entries, repl->size);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001243
1244 ret = translate_table(table->name, table->valid_hooks,
Eric Dumazet31836062005-12-13 23:13:48 -08001245 newinfo, loc_cpu_entry, repl->size,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246 repl->num_entries,
1247 repl->hook_entry,
1248 repl->underflow);
1249 if (ret != 0) {
Harald Welte2e4e6a12006-01-12 13:30:04 -08001250 xt_free_table_info(newinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001251 return ret;
1252 }
1253
Harald Welte2e4e6a12006-01-12 13:30:04 -08001254 if (xt_register_table(table, &bootstrap, newinfo) != 0) {
1255 xt_free_table_info(newinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001256 return ret;
1257 }
1258
Harald Welte2e4e6a12006-01-12 13:30:04 -08001259 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001260}
1261
1262void ipt_unregister_table(struct ipt_table *table)
1263{
Harald Welte2e4e6a12006-01-12 13:30:04 -08001264 struct xt_table_info *private;
Eric Dumazet31836062005-12-13 23:13:48 -08001265 void *loc_cpu_entry;
1266
Harald Welte2e4e6a12006-01-12 13:30:04 -08001267 private = xt_unregister_table(table);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001268
1269 /* Decrease module usage counts and free resources */
Harald Welte2e4e6a12006-01-12 13:30:04 -08001270 loc_cpu_entry = private->entries[raw_smp_processor_id()];
1271 IPT_ENTRY_ITERATE(loc_cpu_entry, private->size, cleanup_entry, NULL);
1272 xt_free_table_info(private);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001273}
1274
/* Test an ICMP type/code pair against a rule.
 *
 * A rule type of 0xFF matches every packet; otherwise the packet type must
 * equal test_type and its code must lie in [min_code, max_code].  The
 * outcome is XORed with 'invert', so invert == 1 flips a 1/0 result. */
static inline int
icmp_type_code_match(u_int8_t test_type, u_int8_t min_code, u_int8_t max_code,
		     u_int8_t type, u_int8_t code,
		     int invert)
{
	int hit = 1;

	if (test_type != 0xFF)
		hit = (type == test_type) &&
		      (min_code <= code) && (code <= max_code);

	return hit ^ invert;
}
1284
1285static int
1286icmp_match(const struct sk_buff *skb,
1287 const struct net_device *in,
1288 const struct net_device *out,
Patrick McHardyc4986732006-03-20 18:02:56 -08001289 const struct xt_match *match,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001290 const void *matchinfo,
1291 int offset,
Harald Welte2e4e6a12006-01-12 13:30:04 -08001292 unsigned int protoff,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293 int *hotdrop)
1294{
1295 struct icmphdr _icmph, *ic;
1296 const struct ipt_icmp *icmpinfo = matchinfo;
1297
1298 /* Must not be a fragment. */
1299 if (offset)
1300 return 0;
1301
Harald Welte2e4e6a12006-01-12 13:30:04 -08001302 ic = skb_header_pointer(skb, protoff, sizeof(_icmph), &_icmph);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001303 if (ic == NULL) {
1304 /* We've been asked to examine this packet, and we
1305 * can't. Hence, no choice but to drop.
1306 */
1307 duprintf("Dropping evil ICMP tinygram.\n");
1308 *hotdrop = 1;
1309 return 0;
1310 }
1311
1312 return icmp_type_code_match(icmpinfo->type,
1313 icmpinfo->code[0],
1314 icmpinfo->code[1],
1315 ic->type, ic->code,
1316 !!(icmpinfo->invflags&IPT_ICMP_INV));
1317}
1318
1319/* Called when user tries to insert an entry of this type. */
1320static int
1321icmp_checkentry(const char *tablename,
Harald Welte2e4e6a12006-01-12 13:30:04 -08001322 const void *info,
Patrick McHardyc4986732006-03-20 18:02:56 -08001323 const struct xt_match *match,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324 void *matchinfo,
1325 unsigned int matchsize,
1326 unsigned int hook_mask)
1327{
1328 const struct ipt_icmp *icmpinfo = matchinfo;
1329
Patrick McHardy1d5cd902006-03-20 18:01:14 -08001330 /* Must specify no unknown invflags */
1331 return !(icmpinfo->invflags & ~IPT_ICMP_INV);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001332}
1333
1334/* The built-in targets: standard (NULL) and error. */
1335static struct ipt_target ipt_standard_target = {
1336 .name = IPT_STANDARD_TARGET,
Patrick McHardy1d5cd902006-03-20 18:01:14 -08001337 .targetsize = sizeof(int),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001338};
1339
1340static struct ipt_target ipt_error_target = {
1341 .name = IPT_ERROR_TARGET,
1342 .target = ipt_error,
Patrick McHardy1d5cd902006-03-20 18:01:14 -08001343 .targetsize = IPT_FUNCTION_MAXNAMELEN,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001344};
1345
1346static struct nf_sockopt_ops ipt_sockopts = {
1347 .pf = PF_INET,
1348 .set_optmin = IPT_BASE_CTL,
1349 .set_optmax = IPT_SO_SET_MAX+1,
1350 .set = do_ipt_set_ctl,
1351 .get_optmin = IPT_BASE_CTL,
1352 .get_optmax = IPT_SO_GET_MAX+1,
1353 .get = do_ipt_get_ctl,
1354};
1355
Linus Torvalds1da177e2005-04-16 15:20:36 -07001356static struct ipt_match icmp_matchstruct = {
1357 .name = "icmp",
Patrick McHardy1d5cd902006-03-20 18:01:14 -08001358 .match = icmp_match,
1359 .matchsize = sizeof(struct ipt_icmp),
1360 .proto = IPPROTO_ICMP,
1361 .checkentry = icmp_checkentry,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001362};
1363
Linus Torvalds1da177e2005-04-16 15:20:36 -07001364static int __init init(void)
1365{
1366 int ret;
1367
Harald Welte2e4e6a12006-01-12 13:30:04 -08001368 xt_proto_init(AF_INET);
1369
Linus Torvalds1da177e2005-04-16 15:20:36 -07001370 /* Noone else will be downing sem now, so we won't sleep */
Harald Welte2e4e6a12006-01-12 13:30:04 -08001371 xt_register_target(AF_INET, &ipt_standard_target);
1372 xt_register_target(AF_INET, &ipt_error_target);
1373 xt_register_match(AF_INET, &icmp_matchstruct);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001374
1375 /* Register setsockopt */
1376 ret = nf_register_sockopt(&ipt_sockopts);
1377 if (ret < 0) {
1378 duprintf("Unable to register sockopts.\n");
1379 return ret;
1380 }
1381
Harald Welte2e4e6a12006-01-12 13:30:04 -08001382 printk("ip_tables: (C) 2000-2006 Netfilter Core Team\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001383 return 0;
1384}
1385
1386static void __exit fini(void)
1387{
1388 nf_unregister_sockopt(&ipt_sockopts);
Harald Welte2e4e6a12006-01-12 13:30:04 -08001389
1390 xt_unregister_match(AF_INET, &icmp_matchstruct);
1391 xt_unregister_target(AF_INET, &ipt_error_target);
1392 xt_unregister_target(AF_INET, &ipt_standard_target);
1393
1394 xt_proto_fini(AF_INET);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001395}
1396
1397EXPORT_SYMBOL(ipt_register_table);
1398EXPORT_SYMBOL(ipt_unregister_table);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001399EXPORT_SYMBOL(ipt_do_table);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001400module_init(init);
1401module_exit(fini);