/*
 * Packet matching code.
 *
 * Copyright (C) 1999 Paul `Rusty' Russell & Michael J. Neuling
 * Copyright (C) 2000-2005 Netfilter Core Team <coreteam@netfilter.org>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
#include <linux/cache.h>
#include <linux/capability.h>
#include <linux/skbuff.h>
#include <linux/kmod.h>
#include <linux/vmalloc.h>
#include <linux/netdevice.h>
#include <linux/module.h>
#include <linux/icmp.h>
#include <net/ip.h>
#include <net/compat.h>
#include <asm/uaccess.h>
#include <linux/mutex.h>
#include <linux/proc_fs.h>
#include <linux/err.h>
#include <linux/cpumask.h>

#include <linux/netfilter/x_tables.h>
#include <linux/netfilter_ipv4/ip_tables.h>
#include <net/netfilter/nf_log.h>
#include "../../netfilter/xt_repldata.h"

MODULE_LICENSE("GPL");
MODULE_AUTHOR("Netfilter Core Team <coreteam@netfilter.org>");
MODULE_DESCRIPTION("IPv4 packet filter");

/*#define DEBUG_IP_FIREWALL*/
/*#define DEBUG_ALLOW_ALL*/ /* Useful for remote debugging */
/*#define DEBUG_IP_FIREWALL_USER*/

#ifdef DEBUG_IP_FIREWALL
#define dprintf(format, args...) pr_info(format , ## args)
#else
#define dprintf(format, args...)
#endif

#ifdef DEBUG_IP_FIREWALL_USER
#define duprintf(format, args...) pr_info(format , ## args)
#else
#define duprintf(format, args...)
#endif

#ifdef CONFIG_NETFILTER_DEBUG
#define IP_NF_ASSERT(x)	WARN_ON(!(x))
#else
#define IP_NF_ASSERT(x)
#endif

#if 0
/* All the better to debug you with... */
#define static
#define inline
#endif

void *ipt_alloc_initial_table(const struct xt_table *info)
{
	return xt_alloc_initial_table(ipt, IPT);
}
EXPORT_SYMBOL_GPL(ipt_alloc_initial_table);

/*
   We keep a set of rules for each CPU, so we can avoid write-locking
   them in the softirq when updating the counters and therefore
   only need to read-lock in the softirq; doing a write_lock_bh() in user
   context stops packets coming through and allows user context to read
   the counters or update the rules.

   Hence the start of any table is given by get_table() below.  */

/* Returns whether matches rule or not. */
/* Performance critical - called for every packet */
static inline bool
ip_packet_match(const struct iphdr *ip,
		const char *indev,
		const char *outdev,
		const struct ipt_ip *ipinfo,
		int isfrag)
{
	unsigned long ret;

#define FWINV(bool, invflg) ((bool) ^ !!(ipinfo->invflags & (invflg)))

	if (FWINV((ip->saddr&ipinfo->smsk.s_addr) != ipinfo->src.s_addr,
		  IPT_INV_SRCIP) ||
	    FWINV((ip->daddr&ipinfo->dmsk.s_addr) != ipinfo->dst.s_addr,
		  IPT_INV_DSTIP)) {
		dprintf("Source or dest mismatch.\n");

		dprintf("SRC: %pI4. Mask: %pI4. Target: %pI4.%s\n",
			&ip->saddr, &ipinfo->smsk.s_addr, &ipinfo->src.s_addr,
			ipinfo->invflags & IPT_INV_SRCIP ? " (INV)" : "");
		dprintf("DST: %pI4 Mask: %pI4 Target: %pI4.%s\n",
			&ip->daddr, &ipinfo->dmsk.s_addr, &ipinfo->dst.s_addr,
			ipinfo->invflags & IPT_INV_DSTIP ? " (INV)" : "");
		return false;
	}

	ret = ifname_compare_aligned(indev, ipinfo->iniface, ipinfo->iniface_mask);

	if (FWINV(ret != 0, IPT_INV_VIA_IN)) {
		dprintf("VIA in mismatch (%s vs %s).%s\n",
			indev, ipinfo->iniface,
			ipinfo->invflags&IPT_INV_VIA_IN ?" (INV)":"");
		return false;
	}

	ret = ifname_compare_aligned(outdev, ipinfo->outiface, ipinfo->outiface_mask);

	if (FWINV(ret != 0, IPT_INV_VIA_OUT)) {
		dprintf("VIA out mismatch (%s vs %s).%s\n",
			outdev, ipinfo->outiface,
			ipinfo->invflags&IPT_INV_VIA_OUT ?" (INV)":"");
		return false;
	}

	/* Check specific protocol */
	if (ipinfo->proto &&
	    FWINV(ip->protocol != ipinfo->proto, IPT_INV_PROTO)) {
		dprintf("Packet protocol %hi does not match %hi.%s\n",
			ip->protocol, ipinfo->proto,
			ipinfo->invflags&IPT_INV_PROTO ? " (INV)":"");
		return false;
	}

	/* If we have a fragment rule but the packet is not a fragment
	 * then we return zero */
	if (FWINV((ipinfo->flags&IPT_F_FRAG) && !isfrag, IPT_INV_FRAG)) {
		dprintf("Fragment rule but not fragment.%s\n",
			ipinfo->invflags & IPT_INV_FRAG ? " (INV)" : "");
		return false;
	}

	return true;
}

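/* Validate the ipt_ip part of a rule from userspace: reject any flag
 * or inversion-flag bits this kernel does not understand. */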
static bool
ip_checkentry(const struct ipt_ip *ip)
{
	if (ip->flags & ~IPT_F_MASK) {
		duprintf("Unknown flag bits set: %08X\n",
			 ip->flags & ~IPT_F_MASK);
		return false;
	}
	if (ip->invflags & ~IPT_INV_MASK) {
		duprintf("Unknown invflag bits set: %08X\n",
			 ip->invflags & ~IPT_INV_MASK);
		return false;
	}
	return true;
}

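/* Target used by the built-in ERROR entries that terminate each table:
 * log the error name (ratelimited) and drop the packet. */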
static unsigned int
ipt_error(struct sk_buff *skb, const struct xt_action_param *par)
{
	if (net_ratelimit())
		pr_info("error: `%s'\n", (const char *)par->targinfo);

	return NF_DROP;
}

/* Performance critical */
static inline struct ipt_entry *
get_entry(const void *base, unsigned int offset)
{
	return (struct ipt_entry *)(base + offset);
}

/* All zeroes == unconditional rule. */
/* Mildly perf critical (only if packet tracing is on) */
static inline bool unconditional(const struct ipt_ip *ip)
{
	static const struct ipt_ip uncond;

	return memcmp(ip, &uncond, sizeof(uncond)) == 0;
#undef FWINV
}

/* for const-correctness */
static inline const struct ipt_entry_target *
ipt_get_target_c(const struct ipt_entry *e)
{
	return ipt_get_target((struct ipt_entry *)e);
}

#if defined(CONFIG_NETFILTER_XT_TARGET_TRACE) || \
    defined(CONFIG_NETFILTER_XT_TARGET_TRACE_MODULE)
static const char *const hooknames[] = {
	[NF_INET_PRE_ROUTING]	= "PREROUTING",
	[NF_INET_LOCAL_IN]	= "INPUT",
	[NF_INET_FORWARD]	= "FORWARD",
	[NF_INET_LOCAL_OUT]	= "OUTPUT",
	[NF_INET_POST_ROUTING]	= "POSTROUTING",
};

enum nf_ip_trace_comments {
	NF_IP_TRACE_COMMENT_RULE,
	NF_IP_TRACE_COMMENT_RETURN,
	NF_IP_TRACE_COMMENT_POLICY,
};

static const char *const comments[] = {
	[NF_IP_TRACE_COMMENT_RULE]	= "rule",
	[NF_IP_TRACE_COMMENT_RETURN]	= "return",
	[NF_IP_TRACE_COMMENT_POLICY]	= "policy",
};

static struct nf_loginfo trace_loginfo = {
	.type = NF_LOG_TYPE_LOG,
	.u = {
		.log = {
			.level = 4,
			.logflags = NF_LOG_MASK,
		},
	},
};

/* Mildly perf critical (only if packet tracing is on) */
static inline int
get_chainname_rulenum(const struct ipt_entry *s, const struct ipt_entry *e,
		      const char *hookname, const char **chainname,
		      const char **comment, unsigned int *rulenum)
{
	const struct ipt_standard_target *t = (void *)ipt_get_target_c(s);

	if (strcmp(t->target.u.kernel.target->name, IPT_ERROR_TARGET) == 0) {
		/* Head of user chain: ERROR target with chainname */
		*chainname = t->target.data;
		(*rulenum) = 0;
	} else if (s == e) {
		(*rulenum)++;

		if (s->target_offset == sizeof(struct ipt_entry) &&
		    strcmp(t->target.u.kernel.target->name,
			   IPT_STANDARD_TARGET) == 0 &&
		    t->verdict < 0 &&
		    unconditional(&s->ip)) {
			/* Tail of chains: STANDARD target (return/policy) */
			*comment = *chainname == hookname
				? comments[NF_IP_TRACE_COMMENT_POLICY]
				: comments[NF_IP_TRACE_COMMENT_RETURN];
		}
		return 1;
	} else
		(*rulenum)++;

	return 0;
}

static void trace_packet(const struct sk_buff *skb,
			 unsigned int hook,
			 const struct net_device *in,
			 const struct net_device *out,
			 const char *tablename,
			 const struct xt_table_info *private,
			 const struct ipt_entry *e)
{
	const void *table_base;
	const struct ipt_entry *root;
	const char *hookname, *chainname, *comment;
	const struct ipt_entry *iter;
	unsigned int rulenum = 0;

	table_base = private->entries[smp_processor_id()];
	root = get_entry(table_base, private->hook_entry[hook]);

	hookname = chainname = hooknames[hook];
	comment = comments[NF_IP_TRACE_COMMENT_RULE];

	xt_entry_foreach(iter, root, private->size - private->hook_entry[hook])
		if (get_chainname_rulenum(iter, e, hookname,
		    &chainname, &comment, &rulenum) != 0)
			break;

	nf_log_packet(AF_INET, hook, skb, in, out, &trace_loginfo,
		      "TRACE: %s:%s:%s:%u ",
		      tablename, chainname, comment, rulenum);
}
#endif

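/* Entries are laid out back to back; next_offset is the distance to
 * the following entry. */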
static inline __pure
struct ipt_entry *ipt_next_entry(const struct ipt_entry *entry)
{
	return (void *)entry + entry->next_offset;
}

/* Returns one of the generic firewall policies, like NF_ACCEPT. */
unsigned int
ipt_do_table(struct sk_buff *skb,
	     unsigned int hook,
	     const struct net_device *in,
	     const struct net_device *out,
	     struct xt_table *table)
{
	static const char nulldevname[IFNAMSIZ] __attribute__((aligned(sizeof(long))));
	const struct iphdr *ip;
	/* Initializing verdict to NF_DROP keeps gcc happy. */
	unsigned int verdict = NF_DROP;
	const char *indev, *outdev;
	const void *table_base;
	struct ipt_entry *e, **jumpstack;
	unsigned int *stackptr, origptr, cpu;
	const struct xt_table_info *private;
	struct xt_action_param acpar;

	/* Initialization */
	ip = ip_hdr(skb);
	indev = in ? in->name : nulldevname;
	outdev = out ? out->name : nulldevname;
	/* We handle fragments by dealing with the first fragment as
	 * if it was a normal packet.  All other fragments are treated
	 * normally, except that they will NEVER match rules that ask
	 * things we don't know, ie. tcp syn flag or ports).  If the
	 * rule is also a fragment-specific rule, non-fragments won't
	 * match it. */
	acpar.fragoff = ntohs(ip->frag_off) & IP_OFFSET;
	acpar.thoff   = ip_hdrlen(skb);
	acpar.hotdrop = false;
	acpar.in      = in;
	acpar.out     = out;
	acpar.family  = NFPROTO_IPV4;
	acpar.hooknum = hook;

	IP_NF_ASSERT(table->valid_hooks & (1 << hook));
	xt_info_rdlock_bh();
	private = table->private;
	cpu        = smp_processor_id();
	table_base = private->entries[cpu];
	jumpstack  = (struct ipt_entry **)private->jumpstack[cpu];
	stackptr   = per_cpu_ptr(private->stackptr, cpu);
	origptr    = *stackptr;

	e = get_entry(table_base, private->hook_entry[hook]);

	pr_debug("Entering %s(hook %u); sp at %u (UF %p)\n",
		 table->name, hook, origptr,
		 get_entry(table_base, private->underflow[hook]));

	do {
		const struct ipt_entry_target *t;
		const struct xt_entry_match *ematch;

		IP_NF_ASSERT(e);
		if (!ip_packet_match(ip, indev, outdev,
		    &e->ip, acpar.fragoff)) {
 no_match:
			e = ipt_next_entry(e);
			continue;
		}

		xt_ematch_foreach(ematch, e) {
			acpar.match     = ematch->u.kernel.match;
			acpar.matchinfo = ematch->data;
			if (!acpar.match->match(skb, &acpar))
				goto no_match;
		}

		ADD_COUNTER(e->counters, ntohs(ip->tot_len), 1);

		t = ipt_get_target(e);
		IP_NF_ASSERT(t->u.kernel.target);

#if defined(CONFIG_NETFILTER_XT_TARGET_TRACE) || \
    defined(CONFIG_NETFILTER_XT_TARGET_TRACE_MODULE)
		/* The packet is traced: log it */
		if (unlikely(skb->nf_trace))
			trace_packet(skb, hook, in, out,
				     table->name, private, e);
#endif
		/* Standard target? */
		if (!t->u.kernel.target->target) {
			int v;

			v = ((struct ipt_standard_target *)t)->verdict;
			if (v < 0) {
				/* Pop from stack? */
				if (v != IPT_RETURN) {
					verdict = (unsigned)(-v) - 1;
					break;
				}
				if (*stackptr == 0) {
					e = get_entry(table_base,
					    private->underflow[hook]);
					pr_debug("Underflow (this is normal) "
						 "to %p\n", e);
				} else {
					e = jumpstack[--*stackptr];
					pr_debug("Pulled %p out from pos %u\n",
						 e, *stackptr);
					e = ipt_next_entry(e);
				}
				continue;
			}
			if (table_base + v != ipt_next_entry(e) &&
			    !(e->ip.flags & IPT_F_GOTO)) {
				if (*stackptr >= private->stacksize) {
					verdict = NF_DROP;
					break;
				}
				jumpstack[(*stackptr)++] = e;
				pr_debug("Pushed %p into pos %u\n",
					 e, *stackptr - 1);
			}

			e = get_entry(table_base, v);
			continue;
		}

		acpar.target   = t->u.kernel.target;
		acpar.targinfo = t->data;

		verdict = t->u.kernel.target->target(skb, &acpar);
		/* Target might have changed stuff. */
		ip = ip_hdr(skb);
		if (verdict == IPT_CONTINUE)
			e = ipt_next_entry(e);
		else
			/* Verdict */
			break;
	} while (!acpar.hotdrop);
	xt_info_rdunlock_bh();
	pr_debug("Exiting %s; resetting sp from %u to %u\n",
		 __func__, *stackptr, origptr);
	*stackptr = origptr;
#ifdef DEBUG_ALLOW_ALL
	return NF_ACCEPT;
#else
	if (acpar.hotdrop)
		return NF_DROP;
	else return verdict;
#endif
}

/* Figures out from what hook each rule can be called: returns 0 if
   there are loops.  Puts hook bitmask in comefrom. */
static int
mark_source_chains(const struct xt_table_info *newinfo,
		   unsigned int valid_hooks, void *entry0)
{
	unsigned int hook;

	/* No recursion; use packet counter to save back ptrs (reset
	   to 0 as we leave), and comefrom to save source hook bitmask */
	for (hook = 0; hook < NF_INET_NUMHOOKS; hook++) {
		unsigned int pos = newinfo->hook_entry[hook];
		struct ipt_entry *e = (struct ipt_entry *)(entry0 + pos);

		if (!(valid_hooks & (1 << hook)))
			continue;

		/* Set initial back pointer. */
		e->counters.pcnt = pos;

		for (;;) {
			const struct ipt_standard_target *t
				= (void *)ipt_get_target_c(e);
			int visited = e->comefrom & (1 << hook);

			if (e->comefrom & (1 << NF_INET_NUMHOOKS)) {
				pr_err("iptables: loop hook %u pos %u %08X.\n",
				       hook, pos, e->comefrom);
				return 0;
			}
			e->comefrom |= ((1 << hook) | (1 << NF_INET_NUMHOOKS));

			/* Unconditional return/END. */
			if ((e->target_offset == sizeof(struct ipt_entry) &&
			     (strcmp(t->target.u.user.name,
				     IPT_STANDARD_TARGET) == 0) &&
			     t->verdict < 0 && unconditional(&e->ip)) ||
			    visited) {
				unsigned int oldpos, size;

				if ((strcmp(t->target.u.user.name,
					    IPT_STANDARD_TARGET) == 0) &&
				    t->verdict < -NF_MAX_VERDICT - 1) {
					duprintf("mark_source_chains: bad "
						"negative verdict (%i)\n",
								t->verdict);
					return 0;
				}

				/* Return: backtrack through the last
				   big jump. */
				do {
					e->comefrom ^= (1<<NF_INET_NUMHOOKS);
#ifdef DEBUG_IP_FIREWALL_USER
					if (e->comefrom
					    & (1 << NF_INET_NUMHOOKS)) {
						duprintf("Back unset "
							 "on hook %u "
							 "rule %u\n",
							 hook, pos);
					}
#endif
					oldpos = pos;
					pos = e->counters.pcnt;
					e->counters.pcnt = 0;

					/* We're at the start. */
					if (pos == oldpos)
						goto next;

					e = (struct ipt_entry *)
						(entry0 + pos);
				} while (oldpos == pos + e->next_offset);

				/* Move along one */
				size = e->next_offset;
				e = (struct ipt_entry *)
					(entry0 + pos + size);
				e->counters.pcnt = pos;
				pos += size;
			} else {
				int newpos = t->verdict;

				if (strcmp(t->target.u.user.name,
					   IPT_STANDARD_TARGET) == 0 &&
				    newpos >= 0) {
					if (newpos > newinfo->size -
						sizeof(struct ipt_entry)) {
						duprintf("mark_source_chains: "
							"bad verdict (%i)\n",
								newpos);
						return 0;
					}
					/* This a jump; chase it. */
					duprintf("Jump rule %u -> %u\n",
						 pos, newpos);
				} else {
					/* ... this is a fallthru */
					newpos = pos + e->next_offset;
				}
				e = (struct ipt_entry *)
					(entry0 + newpos);
				e->counters.pcnt = pos;
				pos = newpos;
			}
		}
		next:
		duprintf("Finished chain %u\n", hook);
	}
	return 1;
}

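/* Undo a successful match check: run the match's destructor (if any)
 * and drop the module reference taken when it was looked up. */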
static void cleanup_match(struct ipt_entry_match *m, struct net *net)
{
	struct xt_mtdtor_param par;

	par.net       = net;
	par.match     = m->u.kernel.match;
	par.matchinfo = m->data;
	par.family    = NFPROTO_IPV4;
	if (par.match->destroy != NULL)
		par.match->destroy(&par);
	module_put(par.match->me);
}

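/* Minimal per-entry sanity check: valid ipt_ip bits and a target that
 * fits between target_offset and next_offset. */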
static int
check_entry(const struct ipt_entry *e, const char *name)
{
	const struct ipt_entry_target *t;

	if (!ip_checkentry(&e->ip)) {
		duprintf("ip check failed %p %s.\n", e, name);
		return -EINVAL;
	}

	if (e->target_offset + sizeof(struct ipt_entry_target) >
	    e->next_offset)
		return -EINVAL;

	t = ipt_get_target_c(e);
	if (e->target_offset + t->u.target_size > e->next_offset)
		return -EINVAL;

	return 0;
}

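/* Run the table/hook validation of an already-resolved match via
 * xt_check_match(). */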
static int
check_match(struct ipt_entry_match *m, struct xt_mtchk_param *par)
{
	const struct ipt_ip *ip = par->entryinfo;
	int ret;

	par->match     = m->u.kernel.match;
	par->matchinfo = m->data;

	ret = xt_check_match(par, m->u.match_size - sizeof(*m),
	      ip->proto, ip->invflags & IPT_INV_PROTO);
	if (ret < 0) {
		duprintf("check failed for `%s'.\n", par->match->name);
		return ret;
	}
	return 0;
}

static int
find_check_match(struct ipt_entry_match *m, struct xt_mtchk_param *par)
{
	struct xt_match *match;
	int ret;

	match = xt_request_find_match(NFPROTO_IPV4, m->u.user.name,
				      m->u.user.revision);
	if (IS_ERR(match)) {
		duprintf("find_check_match: `%s' not found\n", m->u.user.name);
		return PTR_ERR(match);
	}
	m->u.kernel.match = match;

	ret = check_match(m, par);
	if (ret)
		goto err;

	return 0;
err:
	module_put(m->u.kernel.match->me);
	return ret;
}

static int check_target(struct ipt_entry *e, struct net *net, const char *name)
{
	struct ipt_entry_target *t = ipt_get_target(e);
	struct xt_tgchk_param par = {
		.net       = net,
		.table     = name,
		.entryinfo = e,
		.target    = t->u.kernel.target,
		.targinfo  = t->data,
		.hook_mask = e->comefrom,
		.family    = NFPROTO_IPV4,
	};
	int ret;

	ret = xt_check_target(&par, t->u.target_size - sizeof(*t),
	      e->ip.proto, e->ip.invflags & IPT_INV_PROTO);
	if (ret < 0) {
		duprintf("check failed for `%s'.\n",
			 t->u.kernel.target->name);
		return ret;
	}
	return 0;
}

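/* Resolve and check all matches and the target of one entry, taking
 * module references; releases the matches again on failure. */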
static int
find_check_entry(struct ipt_entry *e, struct net *net, const char *name,
		 unsigned int size)
{
	struct ipt_entry_target *t;
	struct xt_target *target;
	int ret;
	unsigned int j;
	struct xt_mtchk_param mtpar;
	struct xt_entry_match *ematch;

	ret = check_entry(e, name);
	if (ret)
		return ret;

	j = 0;
	mtpar.net	= net;
	mtpar.table     = name;
	mtpar.entryinfo = &e->ip;
	mtpar.hook_mask = e->comefrom;
	mtpar.family    = NFPROTO_IPV4;
	xt_ematch_foreach(ematch, e) {
		ret = find_check_match(ematch, &mtpar);
		if (ret != 0)
			goto cleanup_matches;
		++j;
	}

	t = ipt_get_target(e);
	target = xt_request_find_target(NFPROTO_IPV4, t->u.user.name,
					t->u.user.revision);
	if (IS_ERR(target)) {
		duprintf("find_check_entry: `%s' not found\n", t->u.user.name);
		ret = PTR_ERR(target);
		goto cleanup_matches;
	}
	t->u.kernel.target = target;

	ret = check_target(e, net, name);
	if (ret)
		goto err;
	return 0;
 err:
	module_put(t->u.kernel.target->me);
 cleanup_matches:
	xt_ematch_foreach(ematch, e) {
		if (j-- == 0)
			break;
		cleanup_match(ematch, net);
	}
	return ret;
}

static bool check_underflow(const struct ipt_entry *e)
{
	const struct ipt_entry_target *t;
	unsigned int verdict;

	if (!unconditional(&e->ip))
		return false;
	t = ipt_get_target_c(e);
	if (strcmp(t->u.user.name, XT_STANDARD_TARGET) != 0)
		return false;
	verdict = ((struct ipt_standard_target *)t)->verdict;
	verdict = -verdict - 1;
	return verdict == NF_DROP || verdict == NF_ACCEPT;
}

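/* Check an entry's alignment and size, record hook entry points and
 * underflows, and clear its counters and comefrom field. */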
static int
check_entry_size_and_hooks(struct ipt_entry *e,
			   struct xt_table_info *newinfo,
			   const unsigned char *base,
			   const unsigned char *limit,
			   const unsigned int *hook_entries,
			   const unsigned int *underflows,
			   unsigned int valid_hooks)
{
	unsigned int h;

	if ((unsigned long)e % __alignof__(struct ipt_entry) != 0 ||
	    (unsigned char *)e + sizeof(struct ipt_entry) >= limit) {
		duprintf("Bad offset %p\n", e);
		return -EINVAL;
	}

	if (e->next_offset
	    < sizeof(struct ipt_entry) + sizeof(struct ipt_entry_target)) {
		duprintf("checking: element %p size %u\n",
			 e, e->next_offset);
		return -EINVAL;
	}

	/* Check hooks & underflows */
	for (h = 0; h < NF_INET_NUMHOOKS; h++) {
		if (!(valid_hooks & (1 << h)))
			continue;
		if ((unsigned char *)e - base == hook_entries[h])
			newinfo->hook_entry[h] = hook_entries[h];
		if ((unsigned char *)e - base == underflows[h]) {
			if (!check_underflow(e)) {
				pr_err("Underflows must be unconditional and "
				       "use the STANDARD target with "
				       "ACCEPT/DROP\n");
				return -EINVAL;
			}
			newinfo->underflow[h] = underflows[h];
		}
	}

	/* Clear counters and comefrom */
	e->counters = ((struct xt_counters) { 0, 0 });
	e->comefrom = 0;
	return 0;
}

static void
cleanup_entry(struct ipt_entry *e, struct net *net)
{
	struct xt_tgdtor_param par;
	struct ipt_entry_target *t;
	struct xt_entry_match *ematch;

	/* Cleanup all matches */
	xt_ematch_foreach(ematch, e)
		cleanup_match(ematch, net);
	t = ipt_get_target(e);

	par.net      = net;
	par.target   = t->u.kernel.target;
	par.targinfo = t->data;
	par.family   = NFPROTO_IPV4;
	if (par.target->destroy != NULL)
		par.target->destroy(&par);
	module_put(par.target->me);
}

/* Checks and translates the user-supplied table segment (held in
   newinfo) */
static int
translate_table(struct net *net, struct xt_table_info *newinfo, void *entry0,
		const struct ipt_replace *repl)
{
	struct ipt_entry *iter;
	unsigned int i;
	int ret = 0;

	newinfo->size = repl->size;
	newinfo->number = repl->num_entries;

	/* Init all hooks to impossible value. */
	for (i = 0; i < NF_INET_NUMHOOKS; i++) {
		newinfo->hook_entry[i] = 0xFFFFFFFF;
		newinfo->underflow[i] = 0xFFFFFFFF;
	}

	duprintf("translate_table: size %u\n", newinfo->size);
	i = 0;
	/* Walk through entries, checking offsets. */
	xt_entry_foreach(iter, entry0, newinfo->size) {
		ret = check_entry_size_and_hooks(iter, newinfo, entry0,
						 entry0 + repl->size,
						 repl->hook_entry,
						 repl->underflow,
						 repl->valid_hooks);
		if (ret != 0)
			return ret;
		++i;
		if (strcmp(ipt_get_target(iter)->u.user.name,
		    XT_ERROR_TARGET) == 0)
			++newinfo->stacksize;
	}

	if (i != repl->num_entries) {
		duprintf("translate_table: %u not %u entries\n",
			 i, repl->num_entries);
		return -EINVAL;
	}

	/* Check hooks all assigned */
	for (i = 0; i < NF_INET_NUMHOOKS; i++) {
		/* Only hooks which are valid */
		if (!(repl->valid_hooks & (1 << i)))
			continue;
		if (newinfo->hook_entry[i] == 0xFFFFFFFF) {
			duprintf("Invalid hook entry %u %u\n",
				 i, repl->hook_entry[i]);
			return -EINVAL;
		}
		if (newinfo->underflow[i] == 0xFFFFFFFF) {
			duprintf("Invalid underflow %u %u\n",
				 i, repl->underflow[i]);
			return -EINVAL;
		}
	}

	if (!mark_source_chains(newinfo, repl->valid_hooks, entry0))
		return -ELOOP;

	/* Finally, each sanity check must pass */
	i = 0;
	xt_entry_foreach(iter, entry0, newinfo->size) {
		ret = find_check_entry(iter, net, repl->name, repl->size);
		if (ret != 0)
			break;
		++i;
	}

	if (ret != 0) {
		xt_entry_foreach(iter, entry0, newinfo->size) {
			if (i-- == 0)
				break;
			cleanup_entry(iter, net);
		}
		return ret;
	}

	/* And one copy for every other CPU */
	for_each_possible_cpu(i) {
		if (newinfo->entries[i] && newinfo->entries[i] != entry0)
			memcpy(newinfo->entries[i], entry0, newinfo->size);
	}

	return ret;
}

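/* Sum the per-cpu rule counters into the caller-supplied array, taking
 * the per-cpu xt_info locks for all CPUs other than the current one. */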
static void
get_counters(const struct xt_table_info *t,
	     struct xt_counters counters[])
{
	struct ipt_entry *iter;
	unsigned int cpu;
	unsigned int i;
	unsigned int curcpu;

	/* Instead of clearing (by a previous call to memset())
	 * the counters and using adds, we set the counters
	 * with data used by 'current' CPU.
	 *
	 * Bottom half has to be disabled to prevent deadlock
	 * if new softirq were to run and call ipt_do_table
	 */
	local_bh_disable();
	curcpu = smp_processor_id();

	i = 0;
	xt_entry_foreach(iter, t->entries[curcpu], t->size) {
		SET_COUNTER(counters[i], iter->counters.bcnt,
			    iter->counters.pcnt);
		++i;
	}

	for_each_possible_cpu(cpu) {
		if (cpu == curcpu)
			continue;
		i = 0;
		xt_info_wrlock(cpu);
		xt_entry_foreach(iter, t->entries[cpu], t->size) {
			ADD_COUNTER(counters[i], iter->counters.bcnt,
				    iter->counters.pcnt);
			++i; /* macro does multi eval of i */
		}
		xt_info_wrunlock(cpu);
	}
	local_bh_enable();
}

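/* Allocate and fill an atomic snapshot of the table's counters. */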
static struct xt_counters *alloc_counters(const struct xt_table *table)
{
	unsigned int countersize;
	struct xt_counters *counters;
	const struct xt_table_info *private = table->private;

	/* We need atomic snapshot of counters: rest doesn't change
	   (other than comefrom, which userspace doesn't care
	   about). */
	countersize = sizeof(struct xt_counters) * private->number;
	counters = vmalloc_node(countersize, numa_node_id());

	if (counters == NULL)
		return ERR_PTR(-ENOMEM);

	get_counters(private, counters);

	return counters;
}

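/* Copy the table's rules back to userspace, together with a counter
 * snapshot and the kernel's match/target names. */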
static int
copy_entries_to_user(unsigned int total_size,
		     const struct xt_table *table,
		     void __user *userptr)
{
	unsigned int off, num;
	const struct ipt_entry *e;
	struct xt_counters *counters;
	const struct xt_table_info *private = table->private;
	int ret = 0;
	const void *loc_cpu_entry;

	counters = alloc_counters(table);
	if (IS_ERR(counters))
		return PTR_ERR(counters);

	/* choose the copy that is on our node/cpu, ...
	 * This choice is lazy (because current thread is
	 * allowed to migrate to another cpu)
	 */
	loc_cpu_entry = private->entries[raw_smp_processor_id()];
	if (copy_to_user(userptr, loc_cpu_entry, total_size) != 0) {
		ret = -EFAULT;
		goto free_counters;
	}

	/* FIXME: use iterator macros --RR */
	/* ... then go back and fix counters and names */
	for (off = 0, num = 0; off < total_size; off += e->next_offset, num++){
		unsigned int i;
		const struct ipt_entry_match *m;
		const struct ipt_entry_target *t;

		e = (struct ipt_entry *)(loc_cpu_entry + off);
		if (copy_to_user(userptr + off
				 + offsetof(struct ipt_entry, counters),
				 &counters[num],
				 sizeof(counters[num])) != 0) {
			ret = -EFAULT;
			goto free_counters;
		}

		for (i = sizeof(struct ipt_entry);
		     i < e->target_offset;
		     i += m->u.match_size) {
			m = (void *)e + i;

			if (copy_to_user(userptr + off + i
					 + offsetof(struct ipt_entry_match,
						    u.user.name),
					 m->u.kernel.match->name,
					 strlen(m->u.kernel.match->name)+1)
			    != 0) {
				ret = -EFAULT;
				goto free_counters;
			}
		}

		t = ipt_get_target_c(e);
		if (copy_to_user(userptr + off + e->target_offset
				 + offsetof(struct ipt_entry_target,
					    u.user.name),
				 t->u.kernel.target->name,
				 strlen(t->u.kernel.target->name)+1) != 0) {
			ret = -EFAULT;
			goto free_counters;
		}
	}

 free_counters:
	vfree(counters);
	return ret;
}

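/* The helpers below translate between the native layout and the 32-bit
 * (compat) userspace layout of entries, offsets and verdicts. */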
#ifdef CONFIG_COMPAT
static void compat_standard_from_user(void *dst, const void *src)
{
	int v = *(compat_int_t *)src;

	if (v > 0)
		v += xt_compat_calc_jump(AF_INET, v);
	memcpy(dst, &v, sizeof(v));
}

static int compat_standard_to_user(void __user *dst, const void *src)
{
	compat_int_t cv = *(int *)src;

	if (cv > 0)
		cv -= xt_compat_calc_jump(AF_INET, cv);
	return copy_to_user(dst, &cv, sizeof(cv)) ? -EFAULT : 0;
}

static int compat_calc_entry(const struct ipt_entry *e,
			     const struct xt_table_info *info,
			     const void *base, struct xt_table_info *newinfo)
{
	const struct xt_entry_match *ematch;
	const struct ipt_entry_target *t;
	unsigned int entry_offset;
	int off, i, ret;

	off = sizeof(struct ipt_entry) - sizeof(struct compat_ipt_entry);
	entry_offset = (void *)e - base;
	xt_ematch_foreach(ematch, e)
		off += xt_compat_match_offset(ematch->u.kernel.match);
	t = ipt_get_target_c(e);
	off += xt_compat_target_offset(t->u.kernel.target);
	newinfo->size -= off;
	ret = xt_compat_add_offset(AF_INET, entry_offset, off);
	if (ret)
		return ret;

	for (i = 0; i < NF_INET_NUMHOOKS; i++) {
		if (info->hook_entry[i] &&
		    (e < (struct ipt_entry *)(base + info->hook_entry[i])))
			newinfo->hook_entry[i] -= off;
		if (info->underflow[i] &&
		    (e < (struct ipt_entry *)(base + info->underflow[i])))
			newinfo->underflow[i] -= off;
	}
	return 0;
}

static int compat_table_info(const struct xt_table_info *info,
			     struct xt_table_info *newinfo)
{
	struct ipt_entry *iter;
	void *loc_cpu_entry;
	int ret;

	if (!newinfo || !info)
		return -EINVAL;

	/* we dont care about newinfo->entries[] */
	memcpy(newinfo, info, offsetof(struct xt_table_info, entries));
	newinfo->initial_entries = 0;
	loc_cpu_entry = info->entries[raw_smp_processor_id()];
	xt_entry_foreach(iter, loc_cpu_entry, info->size) {
		ret = compat_calc_entry(iter, info, loc_cpu_entry, newinfo);
		if (ret != 0)
			return ret;
	}
	return 0;
}
#endif

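/* Handle the IPT_SO_GET_INFO getsockopt: report hook entry points,
 * underflows and sizes of the named table. */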
static int get_info(struct net *net, void __user *user,
		    const int *len, int compat)
{
	char name[IPT_TABLE_MAXNAMELEN];
	struct xt_table *t;
	int ret;

	if (*len != sizeof(struct ipt_getinfo)) {
		duprintf("length %u != %zu\n", *len,
			 sizeof(struct ipt_getinfo));
		return -EINVAL;
	}

	if (copy_from_user(name, user, sizeof(name)) != 0)
		return -EFAULT;

	name[IPT_TABLE_MAXNAMELEN-1] = '\0';
#ifdef CONFIG_COMPAT
	if (compat)
		xt_compat_lock(AF_INET);
#endif
	t = try_then_request_module(xt_find_table_lock(net, AF_INET, name),
				    "iptable_%s", name);
	if (t && !IS_ERR(t)) {
		struct ipt_getinfo info;
		const struct xt_table_info *private = t->private;
#ifdef CONFIG_COMPAT
		struct xt_table_info tmp;

		if (compat) {
			ret = compat_table_info(private, &tmp);
			xt_compat_flush_offsets(AF_INET);
			private = &tmp;
		}
#endif
		info.valid_hooks = t->valid_hooks;
		memcpy(info.hook_entry, private->hook_entry,
		       sizeof(info.hook_entry));
		memcpy(info.underflow, private->underflow,
		       sizeof(info.underflow));
		info.num_entries = private->number;
		info.size = private->size;
		strcpy(info.name, name);

		if (copy_to_user(user, &info, *len) != 0)
			ret = -EFAULT;
		else
			ret = 0;

		xt_table_unlock(t);
		module_put(t->me);
	} else
		ret = t ? PTR_ERR(t) : -ENOENT;
#ifdef CONFIG_COMPAT
	if (compat)
		xt_compat_unlock(AF_INET);
#endif
	return ret;
}

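/* Handle the IPT_SO_GET_ENTRIES getsockopt: copy the named table's
 * rules to userspace. */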
static int
get_entries(struct net *net, struct ipt_get_entries __user *uptr,
	    const int *len)
{
	int ret;
	struct ipt_get_entries get;
	struct xt_table *t;

	if (*len < sizeof(get)) {
		duprintf("get_entries: %u < %zu\n", *len, sizeof(get));
		return -EINVAL;
	}
	if (copy_from_user(&get, uptr, sizeof(get)) != 0)
		return -EFAULT;
	if (*len != sizeof(struct ipt_get_entries) + get.size) {
		duprintf("get_entries: %u != %zu\n",
			 *len, sizeof(get) + get.size);
		return -EINVAL;
	}

	t = xt_find_table_lock(net, AF_INET, get.name);
	if (t && !IS_ERR(t)) {
		const struct xt_table_info *private = t->private;
		duprintf("t->private->number = %u\n", private->number);
		if (get.size == private->size)
			ret = copy_entries_to_user(private->size,
						   t, uptr->entrytable);
		else {
			duprintf("get_entries: I've got %u not %u!\n",
				 private->size, get.size);
			ret = -EAGAIN;
		}
		module_put(t->me);
		xt_table_unlock(t);
	} else
		ret = t ? PTR_ERR(t) : -ENOENT;

	return ret;
}

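/* Common part of a table replacement: swap in the new xt_table_info,
 * hand the old counters back to userspace and free the old rules. */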
static int
__do_replace(struct net *net, const char *name, unsigned int valid_hooks,
	     struct xt_table_info *newinfo, unsigned int num_counters,
	     void __user *counters_ptr)
{
	int ret;
	struct xt_table *t;
	struct xt_table_info *oldinfo;
	struct xt_counters *counters;
	void *loc_cpu_old_entry;
	struct ipt_entry *iter;

	ret = 0;
	counters = vmalloc(num_counters * sizeof(struct xt_counters));
	if (!counters) {
		ret = -ENOMEM;
		goto out;
	}

	t = try_then_request_module(xt_find_table_lock(net, AF_INET, name),
				    "iptable_%s", name);
	if (!t || IS_ERR(t)) {
		ret = t ? PTR_ERR(t) : -ENOENT;
		goto free_newinfo_counters_untrans;
	}

	/* You lied! */
	if (valid_hooks != t->valid_hooks) {
		duprintf("Valid hook crap: %08X vs %08X\n",
			 valid_hooks, t->valid_hooks);
		ret = -EINVAL;
		goto put_module;
	}

	oldinfo = xt_replace_table(t, num_counters, newinfo, &ret);
	if (!oldinfo)
		goto put_module;

	/* Update module usage count based on number of rules */
	duprintf("do_replace: oldnum=%u, initnum=%u, newnum=%u\n",
		oldinfo->number, oldinfo->initial_entries, newinfo->number);
	if ((oldinfo->number > oldinfo->initial_entries) ||
	    (newinfo->number <= oldinfo->initial_entries))
		module_put(t->me);
	if ((oldinfo->number > oldinfo->initial_entries) &&
	    (newinfo->number <= oldinfo->initial_entries))
		module_put(t->me);

	/* Get the old counters, and synchronize with replace */
	get_counters(oldinfo, counters);

	/* Decrease module usage counts and free resource */
	loc_cpu_old_entry = oldinfo->entries[raw_smp_processor_id()];
	xt_entry_foreach(iter, loc_cpu_old_entry, oldinfo->size)
		cleanup_entry(iter, net);

	xt_free_table_info(oldinfo);
	if (copy_to_user(counters_ptr, counters,
			 sizeof(struct xt_counters) * num_counters) != 0)
		ret = -EFAULT;
	vfree(counters);
	xt_table_unlock(t);
	return ret;

 put_module:
	module_put(t->me);
	xt_table_unlock(t);
 free_newinfo_counters_untrans:
	vfree(counters);
 out:
	return ret;
}

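/* Handle IPT_SO_SET_REPLACE: copy the new table from userspace,
 * translate it and install it via __do_replace(). */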
static int
do_replace(struct net *net, const void __user *user, unsigned int len)
{
	int ret;
	struct ipt_replace tmp;
	struct xt_table_info *newinfo;
	void *loc_cpu_entry;
	struct ipt_entry *iter;

	if (copy_from_user(&tmp, user, sizeof(tmp)) != 0)
		return -EFAULT;

	/* overflow check */
	if (tmp.num_counters >= INT_MAX / sizeof(struct xt_counters))
		return -ENOMEM;

	newinfo = xt_alloc_table_info(tmp.size);
	if (!newinfo)
		return -ENOMEM;

	/* choose the copy that is on our node/cpu */
	loc_cpu_entry = newinfo->entries[raw_smp_processor_id()];
	if (copy_from_user(loc_cpu_entry, user + sizeof(tmp),
			   tmp.size) != 0) {
		ret = -EFAULT;
		goto free_newinfo;
	}

	ret = translate_table(net, newinfo, loc_cpu_entry, &tmp);
	if (ret != 0)
		goto free_newinfo;

	duprintf("Translated table\n");

	ret = __do_replace(net, tmp.name, tmp.valid_hooks, newinfo,
			   tmp.num_counters, tmp.counters);
	if (ret)
		goto free_newinfo_untrans;
	return 0;

 free_newinfo_untrans:
	xt_entry_foreach(iter, loc_cpu_entry, newinfo->size)
		cleanup_entry(iter, net);
 free_newinfo:
	xt_free_table_info(newinfo);
	return ret;
}

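/* Handle IPT_SO_SET_ADD_COUNTERS: add user-supplied byte/packet counts
 * onto the current CPU's counters of the named table. */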
static int
do_add_counters(struct net *net, const void __user *user,
		unsigned int len, int compat)
{
	unsigned int i, curcpu;
	struct xt_counters_info tmp;
	struct xt_counters *paddc;
	unsigned int num_counters;
	const char *name;
	int size;
	void *ptmp;
	struct xt_table *t;
	const struct xt_table_info *private;
	int ret = 0;
	void *loc_cpu_entry;
	struct ipt_entry *iter;
#ifdef CONFIG_COMPAT
	struct compat_xt_counters_info compat_tmp;

	if (compat) {
		ptmp = &compat_tmp;
		size = sizeof(struct compat_xt_counters_info);
	} else
#endif
	{
		ptmp = &tmp;
		size = sizeof(struct xt_counters_info);
	}

	if (copy_from_user(ptmp, user, size) != 0)
		return -EFAULT;

#ifdef CONFIG_COMPAT
	if (compat) {
		num_counters = compat_tmp.num_counters;
		name = compat_tmp.name;
	} else
#endif
	{
		num_counters = tmp.num_counters;
		name = tmp.name;
	}

	if (len != size + num_counters * sizeof(struct xt_counters))
		return -EINVAL;

	paddc = vmalloc_node(len - size, numa_node_id());
	if (!paddc)
		return -ENOMEM;

	if (copy_from_user(paddc, user + size, len - size) != 0) {
		ret = -EFAULT;
		goto free;
	}

	t = xt_find_table_lock(net, AF_INET, name);
	if (!t || IS_ERR(t)) {
		ret = t ? PTR_ERR(t) : -ENOENT;
		goto free;
	}

	local_bh_disable();
	private = t->private;
	if (private->number != num_counters) {
		ret = -EINVAL;
		goto unlock_up_free;
	}

	i = 0;
	/* Choose the copy that is on our node */
	curcpu = smp_processor_id();
	loc_cpu_entry = private->entries[curcpu];
	xt_info_wrlock(curcpu);
	xt_entry_foreach(iter, loc_cpu_entry, private->size) {
		ADD_COUNTER(iter->counters, paddc[i].bcnt, paddc[i].pcnt);
		++i;
	}
	xt_info_wrunlock(curcpu);
 unlock_up_free:
	local_bh_enable();
	xt_table_unlock(t);
	module_put(t->me);
 free:
	vfree(paddc);

	return ret;
}

#ifdef CONFIG_COMPAT
struct compat_ipt_replace {
	char			name[IPT_TABLE_MAXNAMELEN];
	u32			valid_hooks;
	u32			num_entries;
	u32			size;
	u32			hook_entry[NF_INET_NUMHOOKS];
	u32			underflow[NF_INET_NUMHOOKS];
	u32			num_counters;
	compat_uptr_t		counters;	/* struct ipt_counters * */
	struct compat_ipt_entry	entries[0];
};

static int
compat_copy_entry_to_user(struct ipt_entry *e, void __user **dstptr,
			  unsigned int *size, struct xt_counters *counters,
			  unsigned int i)
{
	struct ipt_entry_target *t;
	struct compat_ipt_entry __user *ce;
	u_int16_t target_offset, next_offset;
	compat_uint_t origsize;
	const struct xt_entry_match *ematch;
	int ret = 0;

	origsize = *size;
	ce = (struct compat_ipt_entry __user *)*dstptr;
	if (copy_to_user(ce, e, sizeof(struct ipt_entry)) != 0 ||
	    copy_to_user(&ce->counters, &counters[i],
	    sizeof(counters[i])) != 0)
		return -EFAULT;

	*dstptr += sizeof(struct compat_ipt_entry);
	*size -= sizeof(struct ipt_entry) - sizeof(struct compat_ipt_entry);

	xt_ematch_foreach(ematch, e) {
		ret = xt_compat_match_to_user(ematch, dstptr, size);
		if (ret != 0)
			return ret;
	}
	target_offset = e->target_offset - (origsize - *size);
	t = ipt_get_target(e);
	ret = xt_compat_target_to_user(t, dstptr, size);
	if (ret)
		return ret;
	next_offset = e->next_offset - (origsize - *size);
	if (put_user(target_offset, &ce->target_offset) != 0 ||
	    put_user(next_offset, &ce->next_offset) != 0)
		return -EFAULT;
	return 0;
}

static int
compat_find_calc_match(struct ipt_entry_match *m,
		       const char *name,
		       const struct ipt_ip *ip,
		       unsigned int hookmask,
		       int *size)
{
	struct xt_match *match;

	match = xt_request_find_match(NFPROTO_IPV4, m->u.user.name,
				      m->u.user.revision);
	if (IS_ERR(match)) {
		duprintf("compat_check_calc_match: `%s' not found\n",
			 m->u.user.name);
		return PTR_ERR(match);
	}
	m->u.kernel.match = match;
	*size += xt_compat_match_offset(match);
	return 0;
}

static void compat_release_entry(struct compat_ipt_entry *e)
{
	struct ipt_entry_target *t;
	struct xt_entry_match *ematch;

	/* Cleanup all matches */
	xt_ematch_foreach(ematch, e)
		module_put(ematch->u.kernel.match->me);
	t = compat_ipt_get_target(e);
	module_put(t->u.kernel.target->me);
}

static int
check_compat_entry_size_and_hooks(struct compat_ipt_entry *e,
				  struct xt_table_info *newinfo,
				  unsigned int *size,
				  const unsigned char *base,
				  const unsigned char *limit,
				  const unsigned int *hook_entries,
				  const unsigned int *underflows,
				  const char *name)
{
	struct xt_entry_match *ematch;
	struct ipt_entry_target *t;
	struct xt_target *target;
	unsigned int entry_offset;
	unsigned int j;
	int ret, off, h;

	duprintf("check_compat_entry_size_and_hooks %p\n", e);
	if ((unsigned long)e % __alignof__(struct compat_ipt_entry) != 0 ||
	    (unsigned char *)e + sizeof(struct compat_ipt_entry) >= limit) {
		duprintf("Bad offset %p, limit = %p\n", e, limit);
		return -EINVAL;
	}

	if (e->next_offset < sizeof(struct compat_ipt_entry) +
			     sizeof(struct compat_xt_entry_target)) {
		duprintf("checking: element %p size %u\n",
			 e, e->next_offset);
		return -EINVAL;
	}

	/* For purposes of check_entry casting the compat entry is fine */
	ret = check_entry((struct ipt_entry *)e, name);
	if (ret)
		return ret;

	off = sizeof(struct ipt_entry) - sizeof(struct compat_ipt_entry);
	entry_offset = (void *)e - (void *)base;
	j = 0;
	xt_ematch_foreach(ematch, e) {
		ret = compat_find_calc_match(ematch, name,
					     &e->ip, e->comefrom, &off);
		if (ret != 0)
			goto release_matches;
		++j;
	}

	t = compat_ipt_get_target(e);
	target = xt_request_find_target(NFPROTO_IPV4, t->u.user.name,
					t->u.user.revision);
	if (IS_ERR(target)) {
		duprintf("check_compat_entry_size_and_hooks: `%s' not found\n",
			 t->u.user.name);
		ret = PTR_ERR(target);
		goto release_matches;
	}
	t->u.kernel.target = target;

	off += xt_compat_target_offset(target);
	*size += off;
	ret = xt_compat_add_offset(AF_INET, entry_offset, off);
	if (ret)
		goto out;

	/* Check hooks & underflows */
	for (h = 0; h < NF_INET_NUMHOOKS; h++) {
		if ((unsigned char *)e - base == hook_entries[h])
			newinfo->hook_entry[h] = hook_entries[h];
		if ((unsigned char *)e - base == underflows[h])
			newinfo->underflow[h] = underflows[h];
	}

	/* Clear counters and comefrom */
	memset(&e->counters, 0, sizeof(e->counters));
	e->comefrom = 0;
	return 0;

out:
	module_put(t->u.kernel.target->me);
release_matches:
	xt_ematch_foreach(ematch, e) {
		if (j-- == 0)
			break;
		module_put(ematch->u.kernel.match->me);
	}
	return ret;
}

static int
compat_copy_entry_from_user(struct compat_ipt_entry *e, void **dstptr,
			    unsigned int *size, const char *name,
			    struct xt_table_info *newinfo, unsigned char *base)
{
	struct ipt_entry_target *t;
	struct xt_target *target;
	struct ipt_entry *de;
	unsigned int origsize;
	int ret, h;
	struct xt_entry_match *ematch;

	ret = 0;
	origsize = *size;
	de = (struct ipt_entry *)*dstptr;
	memcpy(de, e, sizeof(struct ipt_entry));
	memcpy(&de->counters, &e->counters, sizeof(e->counters));

	*dstptr += sizeof(struct ipt_entry);
	*size += sizeof(struct ipt_entry) - sizeof(struct compat_ipt_entry);

	xt_ematch_foreach(ematch, e) {
		ret = xt_compat_match_from_user(ematch, dstptr, size);
		if (ret != 0)
			return ret;
	}
	de->target_offset = e->target_offset - (origsize - *size);
	t = compat_ipt_get_target(e);
	target = t->u.kernel.target;
	xt_compat_target_from_user(t, dstptr, size);

	de->next_offset = e->next_offset - (origsize - *size);
	for (h = 0; h < NF_INET_NUMHOOKS; h++) {
		if ((unsigned char *)de - base < newinfo->hook_entry[h])
			newinfo->hook_entry[h] -= origsize - *size;
		if ((unsigned char *)de - base < newinfo->underflow[h])
			newinfo->underflow[h] -= origsize - *size;
	}
	return ret;
}

static int
compat_check_entry(struct ipt_entry *e, struct net *net, const char *name)
{
	struct xt_entry_match *ematch;
	struct xt_mtchk_param mtpar;
	unsigned int j;
	int ret = 0;

	j = 0;
	mtpar.net	= net;
	mtpar.table     = name;
	mtpar.entryinfo = &e->ip;
	mtpar.hook_mask = e->comefrom;
	mtpar.family    = NFPROTO_IPV4;
	xt_ematch_foreach(ematch, e) {
		ret = check_match(ematch, &mtpar);
		if (ret != 0)
			goto cleanup_matches;
		++j;
	}

	ret = check_target(e, net, name);
	if (ret)
		goto cleanup_matches;
	return 0;

 cleanup_matches:
	xt_ematch_foreach(ematch, e) {
		if (j-- == 0)
			break;
		cleanup_match(ematch, net);
	}
	return ret;
}

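/* Convert a 32-bit (compat) table image into the native layout while
 * checking it; on success *pinfo and *pentry0 are replaced. */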
1da177e4 1646static int
a83d8e8d
AD
1647translate_compat_table(struct net *net,
1648 const char *name,
4b478248
PM
1649 unsigned int valid_hooks,
1650 struct xt_table_info **pinfo,
1651 void **pentry0,
1652 unsigned int total_size,
1653 unsigned int number,
1654 unsigned int *hook_entries,
1655 unsigned int *underflows)
1da177e4 1656{
920b868a 1657 unsigned int i, j;
2722971c
DM
1658 struct xt_table_info *newinfo, *info;
1659 void *pos, *entry0, *entry1;
72b2b1dd
JE
1660 struct compat_ipt_entry *iter0;
1661 struct ipt_entry *iter1;
2722971c 1662 unsigned int size;
0559518b 1663 int ret;
1da177e4 1664
2722971c
DM
1665 info = *pinfo;
1666 entry0 = *pentry0;
1667 size = total_size;
1668 info->number = number;
1669
1670 /* Init all hooks to impossible value. */
6e23ae2a 1671 for (i = 0; i < NF_INET_NUMHOOKS; i++) {
2722971c
DM
1672 info->hook_entry[i] = 0xFFFFFFFF;
1673 info->underflow[i] = 0xFFFFFFFF;
1674 }
1675
1676 duprintf("translate_compat_table: size %u\n", info->size);
920b868a 1677 j = 0;
2722971c
DM
1678 xt_compat_lock(AF_INET);
1679 /* Walk through entries, checking offsets. */
72b2b1dd
JE
1680 xt_entry_foreach(iter0, entry0, total_size) {
1681 ret = check_compat_entry_size_and_hooks(iter0, info, &size,
6b4ff2d7
JE
1682 entry0,
1683 entry0 + total_size,
1684 hook_entries,
1685 underflows,
1686 name);
72b2b1dd 1687 if (ret != 0)
0559518b
JE
1688 goto out_unlock;
1689 ++j;
72b2b1dd 1690 }
2722971c
DM
1691
1692 ret = -EINVAL;
920b868a 1693 if (j != number) {
2722971c 1694 duprintf("translate_compat_table: %u not %u entries\n",
920b868a 1695 j, number);
2722971c
DM
1696 goto out_unlock;
1697 }
1698
1699 /* Check hooks all assigned */
6e23ae2a 1700 for (i = 0; i < NF_INET_NUMHOOKS; i++) {
2722971c
DM
1701 /* Only hooks which are valid */
1702 if (!(valid_hooks & (1 << i)))
1703 continue;
1704 if (info->hook_entry[i] == 0xFFFFFFFF) {
1705 duprintf("Invalid hook entry %u %u\n",
1706 i, hook_entries[i]);
1707 goto out_unlock;
1da177e4 1708 }
2722971c
DM
1709 if (info->underflow[i] == 0xFFFFFFFF) {
1710 duprintf("Invalid underflow %u %u\n",
1711 i, underflows[i]);
1712 goto out_unlock;
1713 }
1714 }
1715
1716 ret = -ENOMEM;
1717 newinfo = xt_alloc_table_info(size);
1718 if (!newinfo)
1719 goto out_unlock;
1720
1721 newinfo->number = number;
6e23ae2a 1722 for (i = 0; i < NF_INET_NUMHOOKS; i++) {
2722971c
DM
1723 newinfo->hook_entry[i] = info->hook_entry[i];
1724 newinfo->underflow[i] = info->underflow[i];
1725 }
1726 entry1 = newinfo->entries[raw_smp_processor_id()];
1727 pos = entry1;
4b478248 1728 size = total_size;
72b2b1dd 1729 xt_entry_foreach(iter0, entry0, total_size) {
6b4ff2d7
JE
1730 ret = compat_copy_entry_from_user(iter0, &pos, &size,
1731 name, newinfo, entry1);
72b2b1dd
JE
1732 if (ret != 0)
1733 break;
1734 }
b386d9f5 1735 xt_compat_flush_offsets(AF_INET);
2722971c
DM
1736 xt_compat_unlock(AF_INET);
1737 if (ret)
1738 goto free_newinfo;
1739
1740 ret = -ELOOP;
1741 if (!mark_source_chains(newinfo, valid_hooks, entry1))
1742 goto free_newinfo;
1743
4c1b52bc 1744 i = 0;
72b2b1dd 1745 xt_entry_foreach(iter1, entry1, newinfo->size) {
0559518b 1746 ret = compat_check_entry(iter1, net, name);
72b2b1dd
JE
1747 if (ret != 0)
1748 break;
0559518b 1749 ++i;
72b2b1dd 1750 }
4c1b52bc 1751 if (ret) {
72b2b1dd
JE
1752 /*
1753 		 * The first i entries need cleanup_entry() (which calls ->destroy)
1754 		 * because their ->check hooks already ran. The remaining j-i
1755 		 * entries only need their references released.
1756 */
1757 int skip = i;
4c1b52bc 1758 j -= i;
72b2b1dd
JE
1759 xt_entry_foreach(iter0, entry0, newinfo->size) {
1760 if (skip-- > 0)
1761 continue;
0559518b 1762 if (j-- == 0)
72b2b1dd 1763 break;
0559518b 1764 compat_release_entry(iter0);
72b2b1dd 1765 }
0559518b
JE
1766 xt_entry_foreach(iter1, entry1, newinfo->size) {
1767 if (i-- == 0)
72b2b1dd 1768 break;
0559518b
JE
1769 cleanup_entry(iter1, net);
1770 }
4c1b52bc
DM
1771 xt_free_table_info(newinfo);
1772 return ret;
1773 }
f6677f43 1774
2722971c 1775 /* And one copy for every other CPU */
fb1bb34d 1776 for_each_possible_cpu(i)
2722971c
DM
1777 if (newinfo->entries[i] && newinfo->entries[i] != entry1)
1778 memcpy(newinfo->entries[i], entry1, newinfo->size);
1779
1780 *pinfo = newinfo;
1781 *pentry0 = entry1;
1782 xt_free_table_info(info);
1783 return 0;
1da177e4 1784
2722971c
DM
1785free_newinfo:
1786 xt_free_table_info(newinfo);
1787out:
0559518b
JE
1788 xt_entry_foreach(iter0, entry0, total_size) {
1789 if (j-- == 0)
72b2b1dd 1790 break;
0559518b
JE
1791 compat_release_entry(iter0);
1792 }
1da177e4 1793 return ret;
2722971c 1794out_unlock:
b386d9f5 1795 xt_compat_flush_offsets(AF_INET);
2722971c
DM
1796 xt_compat_unlock(AF_INET);
1797 goto out;
1da177e4
LT
1798}
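/* Editor's note on the function above: translation runs in two passes.
 * Pass one walks the 32-bit blob under xt_compat_lock(AF_INET), validating
 * each compat entry and recording how much it grows when converted to the
 * native layout (x_tables provides helpers such as xt_compat_match_offset()
 * and xt_compat_target_offset(); the recorded offsets are discarded with
 * xt_compat_flush_offsets() above).  Pass two copies every rule into the
 * freshly allocated native table, after which mark_source_chains() and
 * compat_check_entry() validate the result before it replaces *pinfo.
 */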
1799
1800static int
34bd137b 1801compat_do_replace(struct net *net, void __user *user, unsigned int len)
1da177e4
LT
1802{
1803 int ret;
2722971c
DM
1804 struct compat_ipt_replace tmp;
1805 struct xt_table_info *newinfo;
1806 void *loc_cpu_entry;
72b2b1dd 1807 struct ipt_entry *iter;
1da177e4
LT
1808
1809 if (copy_from_user(&tmp, user, sizeof(tmp)) != 0)
1810 return -EFAULT;
1811
ee4bb818 1812 /* overflow check */
259d4e41 1813 if (tmp.size >= INT_MAX / num_possible_cpus())
ee4bb818
KK
1814 return -ENOMEM;
1815 if (tmp.num_counters >= INT_MAX / sizeof(struct xt_counters))
1816 return -ENOMEM;
1817
2e4e6a17 1818 newinfo = xt_alloc_table_info(tmp.size);
1da177e4
LT
1819 if (!newinfo)
1820 return -ENOMEM;
1821
9c547959 1822 /* choose the copy that is on our node/cpu */
31836064
ED
1823 loc_cpu_entry = newinfo->entries[raw_smp_processor_id()];
1824 if (copy_from_user(loc_cpu_entry, user + sizeof(tmp),
1da177e4
LT
1825 tmp.size) != 0) {
1826 ret = -EFAULT;
1827 goto free_newinfo;
1828 }
1829
a83d8e8d 1830 ret = translate_compat_table(net, tmp.name, tmp.valid_hooks,
4b478248
PM
1831 &newinfo, &loc_cpu_entry, tmp.size,
1832 tmp.num_entries, tmp.hook_entry,
1833 tmp.underflow);
2722971c 1834 if (ret != 0)
1da177e4 1835 goto free_newinfo;
1da177e4 1836
2722971c 1837 duprintf("compat_do_replace: Translated table\n");
1da177e4 1838
34bd137b 1839 ret = __do_replace(net, tmp.name, tmp.valid_hooks, newinfo,
4b478248 1840 tmp.num_counters, compat_ptr(tmp.counters));
2722971c
DM
1841 if (ret)
1842 goto free_newinfo_untrans;
1843 return 0;
1da177e4 1844
2722971c 1845 free_newinfo_untrans:
72b2b1dd 1846 xt_entry_foreach(iter, loc_cpu_entry, newinfo->size)
0559518b 1847 cleanup_entry(iter, net);
2722971c
DM
1848 free_newinfo:
1849 xt_free_table_info(newinfo);
1850 return ret;
1851}
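/* Editor's sketch (userspace, hypothetical wrapper): how a ruleset replace
 * reaches this code.  iptables serialises a struct ipt_replace followed by
 * repl->size bytes of entries and issues IPT_SO_SET_REPLACE on an inet
 * socket; a 32-bit binary on a 64-bit kernel is routed to
 * compat_do_replace() above, a native binary to do_replace().
 */
#include <sys/socket.h>
#include <netinet/in.h>
#include <linux/netfilter_ipv4/ip_tables.h>

static int replace_table(int sock, struct ipt_replace *repl)
{
        /* sock is e.g. socket(AF_INET, SOCK_RAW, IPPROTO_RAW),
         * and the caller needs CAP_NET_ADMIN */
        return setsockopt(sock, IPPROTO_IP, IPT_SO_SET_REPLACE,
                          repl, sizeof(*repl) + repl->size);
}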
1da177e4 1852
2722971c
DM
1853static int
1854compat_do_ipt_set_ctl(struct sock *sk, int cmd, void __user *user,
4b478248 1855 unsigned int len)
2722971c
DM
1856{
1857 int ret;
1da177e4 1858
2722971c
DM
1859 if (!capable(CAP_NET_ADMIN))
1860 return -EPERM;
1da177e4 1861
2722971c
DM
1862 switch (cmd) {
1863 case IPT_SO_SET_REPLACE:
3b1e0a65 1864 ret = compat_do_replace(sock_net(sk), user, len);
2722971c 1865 break;
1da177e4 1866
2722971c 1867 case IPT_SO_SET_ADD_COUNTERS:
3b1e0a65 1868 ret = do_add_counters(sock_net(sk), user, len, 1);
2722971c
DM
1869 break;
1870
1871 default:
1872 duprintf("do_ipt_set_ctl: unknown request %i\n", cmd);
1873 ret = -EINVAL;
1874 }
1da177e4 1875
1da177e4
LT
1876 return ret;
1877}
1878
4b478248 1879struct compat_ipt_get_entries {
2722971c
DM
1880 char name[IPT_TABLE_MAXNAMELEN];
1881 compat_uint_t size;
1882 struct compat_ipt_entry entrytable[0];
1883};
1da177e4 1884
4b478248
PM
1885static int
1886compat_copy_entries_to_user(unsigned int total_size, struct xt_table *table,
1887 void __user *userptr)
2722971c 1888{
2722971c 1889 struct xt_counters *counters;
5452e425 1890 const struct xt_table_info *private = table->private;
2722971c
DM
1891 void __user *pos;
1892 unsigned int size;
1893 int ret = 0;
5452e425 1894 const void *loc_cpu_entry;
a18aa31b 1895 unsigned int i = 0;
72b2b1dd 1896 struct ipt_entry *iter;
1da177e4 1897
2722971c
DM
1898 counters = alloc_counters(table);
1899 if (IS_ERR(counters))
1900 return PTR_ERR(counters);
1901
1902 /* choose the copy that is on our node/cpu, ...
1903 	 * This choice is lazy (because the current thread is
1904 	 * allowed to migrate to another cpu).
1905 */
1906 loc_cpu_entry = private->entries[raw_smp_processor_id()];
1907 pos = userptr;
1908 size = total_size;
72b2b1dd
JE
1909 xt_entry_foreach(iter, loc_cpu_entry, total_size) {
1910 ret = compat_copy_entry_to_user(iter, &pos,
6b4ff2d7 1911 &size, counters, i++);
72b2b1dd
JE
1912 if (ret != 0)
1913 break;
1914 }
2722971c 1915
2722971c
DM
1916 vfree(counters);
1917 return ret;
1da177e4
LT
1918}
1919
1920static int
34bd137b
AD
1921compat_get_entries(struct net *net, struct compat_ipt_get_entries __user *uptr,
1922 int *len)
1da177e4 1923{
2722971c
DM
1924 int ret;
1925 struct compat_ipt_get_entries get;
e60a13e0 1926 struct xt_table *t;
1da177e4 1927
2722971c 1928 if (*len < sizeof(get)) {
c9d8fe13 1929 duprintf("compat_get_entries: %u < %zu\n", *len, sizeof(get));
1da177e4 1930 return -EINVAL;
2722971c 1931 }
1da177e4 1932
2722971c
DM
1933 if (copy_from_user(&get, uptr, sizeof(get)) != 0)
1934 return -EFAULT;
1da177e4 1935
2722971c 1936 if (*len != sizeof(struct compat_ipt_get_entries) + get.size) {
c9d8fe13
PM
1937 duprintf("compat_get_entries: %u != %zu\n",
1938 *len, sizeof(get) + get.size);
2722971c 1939 return -EINVAL;
1da177e4
LT
1940 }
1941
2722971c 1942 xt_compat_lock(AF_INET);
34bd137b 1943 t = xt_find_table_lock(net, AF_INET, get.name);
2722971c 1944 if (t && !IS_ERR(t)) {
5452e425 1945 const struct xt_table_info *private = t->private;
2722971c 1946 struct xt_table_info info;
9c547959 1947 duprintf("t->private->number = %u\n", private->number);
2722971c
DM
1948 ret = compat_table_info(private, &info);
1949 if (!ret && get.size == info.size) {
1950 ret = compat_copy_entries_to_user(private->size,
4b478248 1951 t, uptr->entrytable);
2722971c
DM
1952 } else if (!ret) {
1953 duprintf("compat_get_entries: I've got %u not %u!\n",
9c547959 1954 private->size, get.size);
544473c1 1955 ret = -EAGAIN;
2722971c 1956 }
b386d9f5 1957 xt_compat_flush_offsets(AF_INET);
2722971c
DM
1958 module_put(t->me);
1959 xt_table_unlock(t);
1960 } else
1da177e4 1961 ret = t ? PTR_ERR(t) : -ENOENT;
1da177e4 1962
2722971c
DM
1963 xt_compat_unlock(AF_INET);
1964 return ret;
1965}
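/* Editor's note on compat_get_entries(): the caller's get.size must equal
 * the table's current size as converted to the 32-bit layout by
 * compat_table_info(); if the ruleset changed since the caller's
 * IPT_SO_GET_INFO, -EAGAIN is returned so it can re-query and retry with
 * the new size.
 */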
1da177e4 1966
79030ed0
PM
1967static int do_ipt_get_ctl(struct sock *, int, void __user *, int *);
1968
2722971c
DM
1969static int
1970compat_do_ipt_get_ctl(struct sock *sk, int cmd, void __user *user, int *len)
1971{
1972 int ret;
1da177e4 1973
82fac054
BS
1974 if (!capable(CAP_NET_ADMIN))
1975 return -EPERM;
1976
2722971c
DM
1977 switch (cmd) {
1978 case IPT_SO_GET_INFO:
3b1e0a65 1979 ret = get_info(sock_net(sk), user, len, 1);
2722971c
DM
1980 break;
1981 case IPT_SO_GET_ENTRIES:
3b1e0a65 1982 ret = compat_get_entries(sock_net(sk), user, len);
2722971c
DM
1983 break;
1984 default:
79030ed0 1985 ret = do_ipt_get_ctl(sk, cmd, user, len);
2722971c 1986 }
1da177e4
LT
1987 return ret;
1988}
2722971c 1989#endif
1da177e4
LT
1990
1991static int
9c547959 1992do_ipt_set_ctl(struct sock *sk, int cmd, void __user *user, unsigned int len)
1da177e4
LT
1993{
1994 int ret;
1995
1996 if (!capable(CAP_NET_ADMIN))
1997 return -EPERM;
1998
1999 switch (cmd) {
2000 case IPT_SO_SET_REPLACE:
3b1e0a65 2001 ret = do_replace(sock_net(sk), user, len);
1da177e4
LT
2002 break;
2003
2004 case IPT_SO_SET_ADD_COUNTERS:
3b1e0a65 2005 ret = do_add_counters(sock_net(sk), user, len, 0);
1da177e4
LT
2006 break;
2007
2008 default:
2009 duprintf("do_ipt_set_ctl: unknown request %i\n", cmd);
2010 ret = -EINVAL;
2011 }
2012
2013 return ret;
2014}
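/* Editor's sketch (userspace, hypothetical wrapper): the other set command,
 * IPT_SO_SET_ADD_COUNTERS, takes a struct xt_counters_info header followed
 * by num_counters packet/byte pairs that are added to the live table.
 */
#include <sys/socket.h>
#include <netinet/in.h>
#include <linux/netfilter/x_tables.h>
#include <linux/netfilter_ipv4/ip_tables.h>

static int add_counters(int sock, struct xt_counters_info *info)
{
        size_t len = sizeof(*info) +
                     info->num_counters * sizeof(struct xt_counters);

        return setsockopt(sock, IPPROTO_IP, IPT_SO_SET_ADD_COUNTERS,
                          info, len);
}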
2015
2016static int
2017do_ipt_get_ctl(struct sock *sk, int cmd, void __user *user, int *len)
2018{
2019 int ret;
2020
2021 if (!capable(CAP_NET_ADMIN))
2022 return -EPERM;
2023
2024 switch (cmd) {
2722971c 2025 case IPT_SO_GET_INFO:
3b1e0a65 2026 ret = get_info(sock_net(sk), user, len, 0);
2722971c 2027 break;
1da177e4 2028
2722971c 2029 case IPT_SO_GET_ENTRIES:
3b1e0a65 2030 ret = get_entries(sock_net(sk), user, len);
1da177e4 2031 break;
1da177e4
LT
2032
2033 case IPT_SO_GET_REVISION_MATCH:
2034 case IPT_SO_GET_REVISION_TARGET: {
2035 struct ipt_get_revision rev;
2e4e6a17 2036 int target;
1da177e4
LT
2037
2038 if (*len != sizeof(rev)) {
2039 ret = -EINVAL;
2040 break;
2041 }
2042 if (copy_from_user(&rev, user, sizeof(rev)) != 0) {
2043 ret = -EFAULT;
2044 break;
2045 }
2046
2047 if (cmd == IPT_SO_GET_REVISION_TARGET)
2e4e6a17 2048 target = 1;
1da177e4 2049 else
2e4e6a17 2050 target = 0;
1da177e4 2051
2e4e6a17
HW
2052 try_then_request_module(xt_find_revision(AF_INET, rev.name,
2053 rev.revision,
2054 target, &ret),
1da177e4
LT
2055 "ipt_%s", rev.name);
2056 break;
2057 }
2058
2059 default:
2060 duprintf("do_ipt_get_ctl: unknown request %i\n", cmd);
2061 ret = -EINVAL;
2062 }
2063
2064 return ret;
2065}
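/* Editor's sketch (userspace, hypothetical names): the two-step read that
 * iptables-save style tools perform.  get_info() above reports the blob
 * size; get_entries() then returns the serialised rules.
 */
#include <stdlib.h>
#include <string.h>
#include <sys/socket.h>
#include <netinet/in.h>
#include <linux/netfilter_ipv4/ip_tables.h>

static struct ipt_get_entries *dump_table(int sock, const char *table)
{
        struct ipt_getinfo info;
        struct ipt_get_entries *entries;
        socklen_t len = sizeof(info);

        memset(&info, 0, sizeof(info));
        strncpy(info.name, table, sizeof(info.name) - 1);
        if (getsockopt(sock, IPPROTO_IP, IPT_SO_GET_INFO, &info, &len) < 0)
                return NULL;

        len = sizeof(*entries) + info.size;
        entries = malloc(len);
        if (!entries)
                return NULL;
        strcpy(entries->name, info.name);
        entries->size = info.size;
        if (getsockopt(sock, IPPROTO_IP, IPT_SO_GET_ENTRIES,
                       entries, &len) < 0) {
                free(entries);
                return NULL;
        }
        return entries;
}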
2066
35aad0ff
JE
2067struct xt_table *ipt_register_table(struct net *net,
2068 const struct xt_table *table,
44d34e72 2069 const struct ipt_replace *repl)
1da177e4
LT
2070{
2071 int ret;
2e4e6a17 2072 struct xt_table_info *newinfo;
f3c5c1bf 2073 struct xt_table_info bootstrap = {0};
31836064 2074 void *loc_cpu_entry;
a98da11d 2075 struct xt_table *new_table;
1da177e4 2076
2e4e6a17 2077 newinfo = xt_alloc_table_info(repl->size);
44d34e72
AD
2078 if (!newinfo) {
2079 ret = -ENOMEM;
2080 goto out;
2081 }
1da177e4 2082
9c547959 2083 /* choose the copy on our node/cpu, but don't care about preemption */
31836064
ED
2084 loc_cpu_entry = newinfo->entries[raw_smp_processor_id()];
2085 memcpy(loc_cpu_entry, repl->entries, repl->size);
1da177e4 2086
0f234214 2087 ret = translate_table(net, newinfo, loc_cpu_entry, repl);
44d34e72
AD
2088 if (ret != 0)
2089 goto out_free;
1da177e4 2090
44d34e72 2091 new_table = xt_register_table(net, table, &bootstrap, newinfo);
a98da11d 2092 if (IS_ERR(new_table)) {
44d34e72
AD
2093 ret = PTR_ERR(new_table);
2094 goto out_free;
1da177e4
LT
2095 }
2096
44d34e72
AD
2097 return new_table;
2098
2099out_free:
2100 xt_free_table_info(newinfo);
2101out:
2102 return ERR_PTR(ret);
1da177e4
LT
2103}
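/* Editor's sketch (hypothetical "myfilter" module, modelled on in-tree table
 * modules such as iptable_filter): a table is registered per network
 * namespace by handing ipt_register_table() an initial ruleset built with
 * ipt_alloc_initial_table().  A single static pointer is used purely for
 * illustration; a real module keeps one table pointer per struct net and
 * must also attach netfilter hooks that call ipt_do_table(), both of which
 * are omitted here.
 */
static const struct xt_table my_packet_filter = {
        .name           = "myfilter",
        .valid_hooks    = (1 << NF_INET_LOCAL_IN) | (1 << NF_INET_FORWARD) |
                          (1 << NF_INET_LOCAL_OUT),
        .me             = THIS_MODULE,
        .af             = NFPROTO_IPV4,
};

static struct xt_table *myfilter_table __read_mostly;

static int __net_init myfilter_net_init(struct net *net)
{
        struct ipt_replace *repl;

        repl = ipt_alloc_initial_table(&my_packet_filter);
        if (repl == NULL)
                return -ENOMEM;
        myfilter_table = ipt_register_table(net, &my_packet_filter, repl);
        kfree(repl);    /* the replace blob is copied, so free it */
        return IS_ERR(myfilter_table) ? PTR_ERR(myfilter_table) : 0;
}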
2104
f54e9367 2105void ipt_unregister_table(struct net *net, struct xt_table *table)
1da177e4 2106{
2e4e6a17 2107 struct xt_table_info *private;
31836064 2108 void *loc_cpu_entry;
df200969 2109 struct module *table_owner = table->me;
72b2b1dd 2110 struct ipt_entry *iter;
31836064 2111
e905a9ed 2112 private = xt_unregister_table(table);
1da177e4
LT
2113
2114 /* Decrease module usage counts and free resources */
2e4e6a17 2115 loc_cpu_entry = private->entries[raw_smp_processor_id()];
72b2b1dd 2116 xt_entry_foreach(iter, loc_cpu_entry, private->size)
0559518b 2117 cleanup_entry(iter, net);
df200969
AD
2118 if (private->number > private->initial_entries)
2119 module_put(table_owner);
2e4e6a17 2120 xt_free_table_info(private);
1da177e4
LT
2121}
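/* Editor's sketch, continuing the hypothetical "myfilter" module above:
 * the matching pernet teardown simply hands the table back.
 */
static void __net_exit myfilter_net_exit(struct net *net)
{
        ipt_unregister_table(net, myfilter_table);
}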
2122
2123 /* Returns true if the type and code are matched by the range, false otherwise */
1d93a9cb 2124static inline bool
1da177e4
LT
2125icmp_type_code_match(u_int8_t test_type, u_int8_t min_code, u_int8_t max_code,
2126 u_int8_t type, u_int8_t code,
1d93a9cb 2127 bool invert)
1da177e4 2128{
9c547959
PM
2129 return ((test_type == 0xFF) ||
2130 (type == test_type && code >= min_code && code <= max_code))
1da177e4
LT
2131 ^ invert;
2132}
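/* Editor's illustration (hypothetical constant): how "-p icmp --icmp-type
 * echo-request" is encoded for the match above -- type 8 with the full code
 * range, so only the type has to agree.  A test_type of 0xFF is the
 * wildcard userspace uses when no --icmp-type is given, and "!" sets
 * IPT_ICMP_INV in invflags.
 */
static const struct ipt_icmp icmp_echo_request_example = {
        .type           = ICMP_ECHO,    /* 8 */
        .code           = { 0, 0xFF },  /* min and max code: any code */
        .invflags       = 0,
};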
2133
1d93a9cb 2134static bool
62fc8051 2135icmp_match(const struct sk_buff *skb, struct xt_action_param *par)
1da177e4 2136{
5452e425
JE
2137 const struct icmphdr *ic;
2138 struct icmphdr _icmph;
f7108a20 2139 const struct ipt_icmp *icmpinfo = par->matchinfo;
1da177e4
LT
2140
2141 /* Must not be a fragment. */
f7108a20 2142 if (par->fragoff != 0)
1d93a9cb 2143 return false;
1da177e4 2144
f7108a20 2145 ic = skb_header_pointer(skb, par->thoff, sizeof(_icmph), &_icmph);
1da177e4
LT
2146 if (ic == NULL) {
2147 /* We've been asked to examine this packet, and we
2148 * can't. Hence, no choice but to drop.
2149 */
2150 duprintf("Dropping evil ICMP tinygram.\n");
b4ba2611 2151 par->hotdrop = true;
1d93a9cb 2152 return false;
1da177e4
LT
2153 }
2154
2155 return icmp_type_code_match(icmpinfo->type,
2156 icmpinfo->code[0],
2157 icmpinfo->code[1],
2158 ic->type, ic->code,
2159 !!(icmpinfo->invflags&IPT_ICMP_INV));
2160}
2161
b0f38452 2162static int icmp_checkentry(const struct xt_mtchk_param *par)
1da177e4 2163{
9b4fce7a 2164 const struct ipt_icmp *icmpinfo = par->matchinfo;
1da177e4 2165
1d5cd909 2166 /* Must specify no unknown invflags */
bd414ee6 2167 return (icmpinfo->invflags & ~IPT_ICMP_INV) ? -EINVAL : 0;
1da177e4
LT
2168}
2169
4538506b
JE
2170static struct xt_target ipt_builtin_tg[] __read_mostly = {
2171 {
2172 .name = IPT_STANDARD_TARGET,
2173 .targetsize = sizeof(int),
2174 .family = NFPROTO_IPV4,
2722971c 2175#ifdef CONFIG_COMPAT
4538506b
JE
2176 .compatsize = sizeof(compat_int_t),
2177 .compat_from_user = compat_standard_from_user,
2178 .compat_to_user = compat_standard_to_user,
2722971c 2179#endif
4538506b
JE
2180 },
2181 {
2182 .name = IPT_ERROR_TARGET,
2183 .target = ipt_error,
2184 .targetsize = IPT_FUNCTION_MAXNAMELEN,
2185 .family = NFPROTO_IPV4,
2186 },
1da177e4
LT
2187};
2188
2189static struct nf_sockopt_ops ipt_sockopts = {
2190 .pf = PF_INET,
2191 .set_optmin = IPT_BASE_CTL,
2192 .set_optmax = IPT_SO_SET_MAX+1,
2193 .set = do_ipt_set_ctl,
2722971c
DM
2194#ifdef CONFIG_COMPAT
2195 .compat_set = compat_do_ipt_set_ctl,
2196#endif
1da177e4
LT
2197 .get_optmin = IPT_BASE_CTL,
2198 .get_optmax = IPT_SO_GET_MAX+1,
2199 .get = do_ipt_get_ctl,
2722971c
DM
2200#ifdef CONFIG_COMPAT
2201 .compat_get = compat_do_ipt_get_ctl,
2202#endif
16fcec35 2203 .owner = THIS_MODULE,
1da177e4
LT
2204};
2205
4538506b
JE
2206static struct xt_match ipt_builtin_mt[] __read_mostly = {
2207 {
2208 .name = "icmp",
2209 .match = icmp_match,
2210 .matchsize = sizeof(struct ipt_icmp),
2211 .checkentry = icmp_checkentry,
2212 .proto = IPPROTO_ICMP,
2213 .family = NFPROTO_IPV4,
2214 },
1da177e4
LT
2215};
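/* Editor's sketch (hypothetical "example" match): additional matches are
 * plugged in through the same struct xt_match interface as the built-in
 * "icmp" match above, registered with xt_register_match() (or
 * xt_register_matches() for an array) from a module's init routine.  Using
 * it from the iptables binary would also require a matching userspace
 * extension, which is not shown.
 */
static bool example_mt(const struct sk_buff *skb, struct xt_action_param *par)
{
        /* match any IPv4 packet whose TTL is greater than one */
        return ip_hdr(skb)->ttl > 1;
}

static struct xt_match example_mt_reg __read_mostly = {
        .name           = "example",
        .revision       = 0,
        .family         = NFPROTO_IPV4,
        .match          = example_mt,
        .matchsize      = 0,    /* no per-rule match data */
        .me             = THIS_MODULE,
};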
2216
3cb609d5
AD
2217static int __net_init ip_tables_net_init(struct net *net)
2218{
383ca5b8 2219 return xt_proto_init(net, NFPROTO_IPV4);
3cb609d5
AD
2220}
2221
2222static void __net_exit ip_tables_net_exit(struct net *net)
2223{
383ca5b8 2224 xt_proto_fini(net, NFPROTO_IPV4);
3cb609d5
AD
2225}
2226
2227static struct pernet_operations ip_tables_net_ops = {
2228 .init = ip_tables_net_init,
2229 .exit = ip_tables_net_exit,
2230};
2231
65b4b4e8 2232static int __init ip_tables_init(void)
1da177e4
LT
2233{
2234 int ret;
2235
3cb609d5 2236 ret = register_pernet_subsys(&ip_tables_net_ops);
0eff66e6
PM
2237 if (ret < 0)
2238 goto err1;
2e4e6a17 2239
1da177e4 2240 /* No one else will be downing sem now, so we won't sleep */
4538506b 2241 ret = xt_register_targets(ipt_builtin_tg, ARRAY_SIZE(ipt_builtin_tg));
0eff66e6
PM
2242 if (ret < 0)
2243 goto err2;
4538506b 2244 ret = xt_register_matches(ipt_builtin_mt, ARRAY_SIZE(ipt_builtin_mt));
0eff66e6
PM
2245 if (ret < 0)
2246 goto err4;
1da177e4
LT
2247
2248 /* Register setsockopt */
2249 ret = nf_register_sockopt(&ipt_sockopts);
0eff66e6
PM
2250 if (ret < 0)
2251 goto err5;
1da177e4 2252
ff67e4e4 2253 pr_info("(C) 2000-2006 Netfilter Core Team\n");
1da177e4 2254 return 0;
0eff66e6
PM
2255
2256err5:
4538506b 2257 xt_unregister_matches(ipt_builtin_mt, ARRAY_SIZE(ipt_builtin_mt));
0eff66e6 2258err4:
4538506b 2259 xt_unregister_targets(ipt_builtin_tg, ARRAY_SIZE(ipt_builtin_tg));
0eff66e6 2260err2:
3cb609d5 2261 unregister_pernet_subsys(&ip_tables_net_ops);
0eff66e6
PM
2262err1:
2263 return ret;
1da177e4
LT
2264}
2265
65b4b4e8 2266static void __exit ip_tables_fini(void)
1da177e4
LT
2267{
2268 nf_unregister_sockopt(&ipt_sockopts);
2e4e6a17 2269
4538506b
JE
2270 xt_unregister_matches(ipt_builtin_mt, ARRAY_SIZE(ipt_builtin_mt));
2271 xt_unregister_targets(ipt_builtin_tg, ARRAY_SIZE(ipt_builtin_tg));
3cb609d5 2272 unregister_pernet_subsys(&ip_tables_net_ops);
1da177e4
LT
2273}
2274
2275EXPORT_SYMBOL(ipt_register_table);
2276EXPORT_SYMBOL(ipt_unregister_table);
1da177e4 2277EXPORT_SYMBOL(ipt_do_table);
65b4b4e8
AM
2278module_init(ip_tables_init);
2279module_exit(ip_tables_fini);