]> bbs.cooldavid.org Git - net-next-2.6.git/blame - net/ipv4/devinet.c
[IPv4]: Use rtnl registration interface
[net-next-2.6.git] / net / ipv4 / devinet.c
CommitLineData
1da177e4
LT
1/*
2 * NET3 IP device support routines.
3 *
4 * Version: $Id: devinet.c,v 1.44 2001/10/31 21:55:54 davem Exp $
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 * Derived from the IP parts of dev.c 1.0.19
02c30a84 12 * Authors: Ross Biro
1da177e4
LT
13 * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
14 * Mark Evans, <evansmp@uhura.aston.ac.uk>
15 *
16 * Additional Authors:
17 * Alan Cox, <gw4pts@gw4pts.ampr.org>
18 * Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
19 *
20 * Changes:
21 * Alexey Kuznetsov: pa_* fields are replaced with ifaddr
22 * lists.
23 * Cyrus Durgin: updated for kmod
24 * Matthias Andree: in devinet_ioctl, compare label and
25 * address (4.4BSD alias style support),
26 * fall back to comparing just the label
27 * if no match found.
28 */
29
1da177e4
LT
30
31#include <asm/uaccess.h>
32#include <asm/system.h>
33#include <linux/bitops.h>
4fc268d2 34#include <linux/capability.h>
1da177e4
LT
35#include <linux/module.h>
36#include <linux/types.h>
37#include <linux/kernel.h>
1da177e4
LT
38#include <linux/string.h>
39#include <linux/mm.h>
40#include <linux/socket.h>
41#include <linux/sockios.h>
42#include <linux/in.h>
43#include <linux/errno.h>
44#include <linux/interrupt.h>
1823730f 45#include <linux/if_addr.h>
1da177e4
LT
46#include <linux/if_ether.h>
47#include <linux/inet.h>
48#include <linux/netdevice.h>
49#include <linux/etherdevice.h>
50#include <linux/skbuff.h>
1da177e4
LT
51#include <linux/init.h>
52#include <linux/notifier.h>
53#include <linux/inetdevice.h>
54#include <linux/igmp.h>
55#ifdef CONFIG_SYSCTL
56#include <linux/sysctl.h>
57#endif
58#include <linux/kmod.h>
59
14c85021 60#include <net/arp.h>
1da177e4
LT
61#include <net/ip.h>
62#include <net/route.h>
63#include <net/ip_fib.h>
63f3444f 64#include <net/rtnetlink.h>
1da177e4
LT
65
66struct ipv4_devconf ipv4_devconf = {
67 .accept_redirects = 1,
68 .send_redirects = 1,
69 .secure_redirects = 1,
70 .shared_media = 1,
71};
72
73static struct ipv4_devconf ipv4_devconf_dflt = {
74 .accept_redirects = 1,
75 .send_redirects = 1,
76 .secure_redirects = 1,
77 .shared_media = 1,
78 .accept_source_route = 1,
79};
80
5c753978
TG
81static struct nla_policy ifa_ipv4_policy[IFA_MAX+1] __read_mostly = {
82 [IFA_LOCAL] = { .type = NLA_U32 },
83 [IFA_ADDRESS] = { .type = NLA_U32 },
84 [IFA_BROADCAST] = { .type = NLA_U32 },
85 [IFA_ANYCAST] = { .type = NLA_U32 },
5176f91e 86 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 },
5c753978
TG
87};
88
d6062cbb 89static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32);
1da177e4 90
e041c683 91static BLOCKING_NOTIFIER_HEAD(inetaddr_chain);
1da177e4
LT
92static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
93 int destroy);
94#ifdef CONFIG_SYSCTL
95static void devinet_sysctl_register(struct in_device *in_dev,
96 struct ipv4_devconf *p);
97static void devinet_sysctl_unregister(struct ipv4_devconf *p);
98#endif
99
100/* Locks all the inet devices. */
101
102static struct in_ifaddr *inet_alloc_ifa(void)
103{
0da974f4 104 struct in_ifaddr *ifa = kzalloc(sizeof(*ifa), GFP_KERNEL);
1da177e4
LT
105
106 if (ifa) {
1da177e4
LT
107 INIT_RCU_HEAD(&ifa->rcu_head);
108 }
109
110 return ifa;
111}
112
113static void inet_rcu_free_ifa(struct rcu_head *head)
114{
115 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head);
116 if (ifa->ifa_dev)
117 in_dev_put(ifa->ifa_dev);
118 kfree(ifa);
119}
120
121static inline void inet_free_ifa(struct in_ifaddr *ifa)
122{
123 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa);
124}
125
126void in_dev_finish_destroy(struct in_device *idev)
127{
128 struct net_device *dev = idev->dev;
129
130 BUG_TRAP(!idev->ifa_list);
131 BUG_TRAP(!idev->mc_list);
132#ifdef NET_REFCNT_DEBUG
133 printk(KERN_DEBUG "in_dev_finish_destroy: %p=%s\n",
134 idev, dev ? dev->name : "NIL");
135#endif
136 dev_put(dev);
137 if (!idev->dead)
138 printk("Freeing alive in_device %p\n", idev);
139 else {
140 kfree(idev);
141 }
142}
143
144struct in_device *inetdev_init(struct net_device *dev)
145{
146 struct in_device *in_dev;
147
148 ASSERT_RTNL();
149
0da974f4 150 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL);
1da177e4
LT
151 if (!in_dev)
152 goto out;
1da177e4
LT
153 INIT_RCU_HEAD(&in_dev->rcu_head);
154 memcpy(&in_dev->cnf, &ipv4_devconf_dflt, sizeof(in_dev->cnf));
155 in_dev->cnf.sysctl = NULL;
156 in_dev->dev = dev;
157 if ((in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl)) == NULL)
158 goto out_kfree;
159 /* Reference in_dev->dev */
160 dev_hold(dev);
161#ifdef CONFIG_SYSCTL
162 neigh_sysctl_register(dev, in_dev->arp_parms, NET_IPV4,
163 NET_IPV4_NEIGH, "ipv4", NULL, NULL);
164#endif
165
30c4cf57 166 /* Account for reference dev->ip_ptr (below) */
1da177e4 167 in_dev_hold(in_dev);
1da177e4
LT
168
169#ifdef CONFIG_SYSCTL
170 devinet_sysctl_register(in_dev, &in_dev->cnf);
171#endif
172 ip_mc_init_dev(in_dev);
173 if (dev->flags & IFF_UP)
174 ip_mc_up(in_dev);
483479ec 175
30c4cf57
DS
176 /* we can receive as soon as ip_ptr is set -- do this last */
177 rcu_assign_pointer(dev->ip_ptr, in_dev);
483479ec 178out:
1da177e4
LT
179 return in_dev;
180out_kfree:
181 kfree(in_dev);
182 in_dev = NULL;
183 goto out;
184}
185
186static void in_dev_rcu_put(struct rcu_head *head)
187{
188 struct in_device *idev = container_of(head, struct in_device, rcu_head);
189 in_dev_put(idev);
190}
191
192static void inetdev_destroy(struct in_device *in_dev)
193{
194 struct in_ifaddr *ifa;
195 struct net_device *dev;
196
197 ASSERT_RTNL();
198
199 dev = in_dev->dev;
200 if (dev == &loopback_dev)
201 return;
202
203 in_dev->dead = 1;
204
205 ip_mc_destroy_dev(in_dev);
206
207 while ((ifa = in_dev->ifa_list) != NULL) {
208 inet_del_ifa(in_dev, &in_dev->ifa_list, 0);
209 inet_free_ifa(ifa);
210 }
211
212#ifdef CONFIG_SYSCTL
213 devinet_sysctl_unregister(&in_dev->cnf);
214#endif
215
216 dev->ip_ptr = NULL;
217
218#ifdef CONFIG_SYSCTL
219 neigh_sysctl_unregister(in_dev->arp_parms);
220#endif
221 neigh_parms_release(&arp_tbl, in_dev->arp_parms);
222 arp_ifdown(dev);
223
224 call_rcu(&in_dev->rcu_head, in_dev_rcu_put);
225}
226
ff428d72 227int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b)
1da177e4
LT
228{
229 rcu_read_lock();
230 for_primary_ifa(in_dev) {
231 if (inet_ifa_match(a, ifa)) {
232 if (!b || inet_ifa_match(b, ifa)) {
233 rcu_read_unlock();
234 return 1;
235 }
236 }
237 } endfor_ifa(in_dev);
238 rcu_read_unlock();
239 return 0;
240}
241
d6062cbb
TG
242static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
243 int destroy, struct nlmsghdr *nlh, u32 pid)
1da177e4 244{
8f937c60 245 struct in_ifaddr *promote = NULL;
0ff60a45
JHS
246 struct in_ifaddr *ifa, *ifa1 = *ifap;
247 struct in_ifaddr *last_prim = in_dev->ifa_list;
248 struct in_ifaddr *prev_prom = NULL;
249 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev);
1da177e4
LT
250
251 ASSERT_RTNL();
252
e905a9ed 253 /* 1. Deleting primary ifaddr forces deletion all secondaries
8f937c60
HW
254 * unless alias promotion is set
255 **/
1da177e4
LT
256
257 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) {
1da177e4
LT
258 struct in_ifaddr **ifap1 = &ifa1->ifa_next;
259
260 while ((ifa = *ifap1) != NULL) {
e905a9ed 261 if (!(ifa->ifa_flags & IFA_F_SECONDARY) &&
0ff60a45
JHS
262 ifa1->ifa_scope <= ifa->ifa_scope)
263 last_prim = ifa;
264
1da177e4
LT
265 if (!(ifa->ifa_flags & IFA_F_SECONDARY) ||
266 ifa1->ifa_mask != ifa->ifa_mask ||
267 !inet_ifa_match(ifa1->ifa_address, ifa)) {
268 ifap1 = &ifa->ifa_next;
0ff60a45 269 prev_prom = ifa;
1da177e4
LT
270 continue;
271 }
272
0ff60a45 273 if (!do_promote) {
8f937c60 274 *ifap1 = ifa->ifa_next;
1da177e4 275
d6062cbb 276 rtmsg_ifa(RTM_DELADDR, ifa, nlh, pid);
e041c683
AS
277 blocking_notifier_call_chain(&inetaddr_chain,
278 NETDEV_DOWN, ifa);
8f937c60
HW
279 inet_free_ifa(ifa);
280 } else {
281 promote = ifa;
282 break;
283 }
1da177e4
LT
284 }
285 }
286
287 /* 2. Unlink it */
288
289 *ifap = ifa1->ifa_next;
290
291 /* 3. Announce address deletion */
292
293 /* Send message first, then call notifier.
294 At first sight, FIB update triggered by notifier
295 will refer to already deleted ifaddr, that could confuse
296 netlink listeners. It is not true: look, gated sees
297 that route deleted and if it still thinks that ifaddr
298 is valid, it will try to restore deleted routes... Grr.
299 So that, this order is correct.
300 */
d6062cbb 301 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, pid);
e041c683 302 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1);
1da177e4 303
0ff60a45
JHS
304 if (promote) {
305
306 if (prev_prom) {
307 prev_prom->ifa_next = promote->ifa_next;
308 promote->ifa_next = last_prim->ifa_next;
309 last_prim->ifa_next = promote;
310 }
8f937c60 311
8f937c60 312 promote->ifa_flags &= ~IFA_F_SECONDARY;
d6062cbb 313 rtmsg_ifa(RTM_NEWADDR, promote, nlh, pid);
e041c683
AS
314 blocking_notifier_call_chain(&inetaddr_chain,
315 NETDEV_UP, promote);
0ff60a45
JHS
316 for (ifa = promote->ifa_next; ifa; ifa = ifa->ifa_next) {
317 if (ifa1->ifa_mask != ifa->ifa_mask ||
318 !inet_ifa_match(ifa1->ifa_address, ifa))
319 continue;
320 fib_add_ifaddr(ifa);
321 }
322
323 }
324 if (destroy) {
325 inet_free_ifa(ifa1);
326
327 if (!in_dev->ifa_list)
328 inetdev_destroy(in_dev);
8f937c60 329 }
1da177e4
LT
330}
331
d6062cbb
TG
332static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
333 int destroy)
334{
335 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0);
336}
337
338static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh,
339 u32 pid)
1da177e4
LT
340{
341 struct in_device *in_dev = ifa->ifa_dev;
342 struct in_ifaddr *ifa1, **ifap, **last_primary;
343
344 ASSERT_RTNL();
345
346 if (!ifa->ifa_local) {
347 inet_free_ifa(ifa);
348 return 0;
349 }
350
351 ifa->ifa_flags &= ~IFA_F_SECONDARY;
352 last_primary = &in_dev->ifa_list;
353
354 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
355 ifap = &ifa1->ifa_next) {
356 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) &&
357 ifa->ifa_scope <= ifa1->ifa_scope)
358 last_primary = &ifa1->ifa_next;
359 if (ifa1->ifa_mask == ifa->ifa_mask &&
360 inet_ifa_match(ifa1->ifa_address, ifa)) {
361 if (ifa1->ifa_local == ifa->ifa_local) {
362 inet_free_ifa(ifa);
363 return -EEXIST;
364 }
365 if (ifa1->ifa_scope != ifa->ifa_scope) {
366 inet_free_ifa(ifa);
367 return -EINVAL;
368 }
369 ifa->ifa_flags |= IFA_F_SECONDARY;
370 }
371 }
372
373 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) {
374 net_srandom(ifa->ifa_local);
375 ifap = last_primary;
376 }
377
378 ifa->ifa_next = *ifap;
379 *ifap = ifa;
380
381 /* Send message first, then call notifier.
382 Notifier will trigger FIB update, so that
383 listeners of netlink will know about new ifaddr */
d6062cbb 384 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, pid);
e041c683 385 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
1da177e4
LT
386
387 return 0;
388}
389
d6062cbb
TG
390static int inet_insert_ifa(struct in_ifaddr *ifa)
391{
392 return __inet_insert_ifa(ifa, NULL, 0);
393}
394
1da177e4
LT
395static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa)
396{
e5ed6399 397 struct in_device *in_dev = __in_dev_get_rtnl(dev);
1da177e4
LT
398
399 ASSERT_RTNL();
400
401 if (!in_dev) {
402 in_dev = inetdev_init(dev);
403 if (!in_dev) {
404 inet_free_ifa(ifa);
405 return -ENOBUFS;
406 }
407 }
408 if (ifa->ifa_dev != in_dev) {
409 BUG_TRAP(!ifa->ifa_dev);
410 in_dev_hold(in_dev);
411 ifa->ifa_dev = in_dev;
412 }
413 if (LOOPBACK(ifa->ifa_local))
414 ifa->ifa_scope = RT_SCOPE_HOST;
415 return inet_insert_ifa(ifa);
416}
417
418struct in_device *inetdev_by_index(int ifindex)
419{
420 struct net_device *dev;
421 struct in_device *in_dev = NULL;
422 read_lock(&dev_base_lock);
423 dev = __dev_get_by_index(ifindex);
424 if (dev)
425 in_dev = in_dev_get(dev);
426 read_unlock(&dev_base_lock);
427 return in_dev;
428}
429
430/* Called only from RTNL semaphored context. No locks. */
431
60cad5da
AV
432struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix,
433 __be32 mask)
1da177e4
LT
434{
435 ASSERT_RTNL();
436
437 for_primary_ifa(in_dev) {
438 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa))
439 return ifa;
440 } endfor_ifa(in_dev);
441 return NULL;
442}
443
444static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
445{
dfdd5fd4 446 struct nlattr *tb[IFA_MAX+1];
1da177e4 447 struct in_device *in_dev;
dfdd5fd4 448 struct ifaddrmsg *ifm;
1da177e4 449 struct in_ifaddr *ifa, **ifap;
dfdd5fd4 450 int err = -EINVAL;
1da177e4
LT
451
452 ASSERT_RTNL();
453
dfdd5fd4
TG
454 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
455 if (err < 0)
456 goto errout;
457
458 ifm = nlmsg_data(nlh);
459 in_dev = inetdev_by_index(ifm->ifa_index);
460 if (in_dev == NULL) {
461 err = -ENODEV;
462 goto errout;
463 }
464
1da177e4
LT
465 __in_dev_put(in_dev);
466
467 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
468 ifap = &ifa->ifa_next) {
dfdd5fd4 469 if (tb[IFA_LOCAL] &&
a7a628c4 470 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL]))
dfdd5fd4
TG
471 continue;
472
473 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label))
1da177e4 474 continue;
dfdd5fd4
TG
475
476 if (tb[IFA_ADDRESS] &&
477 (ifm->ifa_prefixlen != ifa->ifa_prefixlen ||
a7a628c4 478 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa)))
dfdd5fd4
TG
479 continue;
480
d6062cbb 481 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).pid);
1da177e4
LT
482 return 0;
483 }
dfdd5fd4
TG
484
485 err = -EADDRNOTAVAIL;
486errout:
487 return err;
1da177e4
LT
488}
489
5c753978 490static struct in_ifaddr *rtm_to_ifaddr(struct nlmsghdr *nlh)
1da177e4 491{
5c753978
TG
492 struct nlattr *tb[IFA_MAX+1];
493 struct in_ifaddr *ifa;
494 struct ifaddrmsg *ifm;
1da177e4
LT
495 struct net_device *dev;
496 struct in_device *in_dev;
5c753978 497 int err = -EINVAL;
1da177e4 498
5c753978
TG
499 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
500 if (err < 0)
501 goto errout;
1da177e4 502
5c753978 503 ifm = nlmsg_data(nlh);
c4e38f41
EP
504 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL) {
505 err = -EINVAL;
5c753978 506 goto errout;
c4e38f41 507 }
1da177e4 508
5c753978
TG
509 dev = __dev_get_by_index(ifm->ifa_index);
510 if (dev == NULL) {
511 err = -ENODEV;
512 goto errout;
513 }
1da177e4 514
5c753978
TG
515 in_dev = __in_dev_get_rtnl(dev);
516 if (in_dev == NULL) {
1da177e4 517 in_dev = inetdev_init(dev);
5c753978
TG
518 if (in_dev == NULL) {
519 err = -ENOBUFS;
520 goto errout;
521 }
1da177e4
LT
522 }
523
5c753978
TG
524 ifa = inet_alloc_ifa();
525 if (ifa == NULL) {
526 /*
527 * A potential indev allocation can be left alive, it stays
528 * assigned to its device and is destroy with it.
529 */
530 err = -ENOBUFS;
531 goto errout;
532 }
533
534 in_dev_hold(in_dev);
535
536 if (tb[IFA_ADDRESS] == NULL)
537 tb[IFA_ADDRESS] = tb[IFA_LOCAL];
1da177e4 538
1da177e4
LT
539 ifa->ifa_prefixlen = ifm->ifa_prefixlen;
540 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen);
1da177e4
LT
541 ifa->ifa_flags = ifm->ifa_flags;
542 ifa->ifa_scope = ifm->ifa_scope;
5c753978
TG
543 ifa->ifa_dev = in_dev;
544
a7a628c4
AV
545 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]);
546 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]);
5c753978
TG
547
548 if (tb[IFA_BROADCAST])
a7a628c4 549 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]);
5c753978
TG
550
551 if (tb[IFA_ANYCAST])
a7a628c4 552 ifa->ifa_anycast = nla_get_be32(tb[IFA_ANYCAST]);
5c753978
TG
553
554 if (tb[IFA_LABEL])
555 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ);
1da177e4
LT
556 else
557 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
558
5c753978
TG
559 return ifa;
560
561errout:
562 return ERR_PTR(err);
563}
564
565static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
566{
567 struct in_ifaddr *ifa;
568
569 ASSERT_RTNL();
570
571 ifa = rtm_to_ifaddr(nlh);
572 if (IS_ERR(ifa))
573 return PTR_ERR(ifa);
574
d6062cbb 575 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).pid);
1da177e4
LT
576}
577
578/*
579 * Determine a default network mask, based on the IP address.
580 */
581
714e85be 582static __inline__ int inet_abc_len(__be32 addr)
1da177e4
LT
583{
584 int rc = -1; /* Something else, probably a multicast. */
585
e905a9ed
YH
586 if (ZERONET(addr))
587 rc = 0;
1da177e4 588 else {
714e85be 589 __u32 haddr = ntohl(addr);
1da177e4 590
714e85be 591 if (IN_CLASSA(haddr))
1da177e4 592 rc = 8;
714e85be 593 else if (IN_CLASSB(haddr))
1da177e4 594 rc = 16;
714e85be 595 else if (IN_CLASSC(haddr))
1da177e4
LT
596 rc = 24;
597 }
598
e905a9ed 599 return rc;
1da177e4
LT
600}
601
602
603int devinet_ioctl(unsigned int cmd, void __user *arg)
604{
605 struct ifreq ifr;
606 struct sockaddr_in sin_orig;
607 struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr;
608 struct in_device *in_dev;
609 struct in_ifaddr **ifap = NULL;
610 struct in_ifaddr *ifa = NULL;
611 struct net_device *dev;
612 char *colon;
613 int ret = -EFAULT;
614 int tryaddrmatch = 0;
615
616 /*
617 * Fetch the caller's info block into kernel space
618 */
619
620 if (copy_from_user(&ifr, arg, sizeof(struct ifreq)))
621 goto out;
622 ifr.ifr_name[IFNAMSIZ - 1] = 0;
623
624 /* save original address for comparison */
625 memcpy(&sin_orig, sin, sizeof(*sin));
626
627 colon = strchr(ifr.ifr_name, ':');
628 if (colon)
629 *colon = 0;
630
631#ifdef CONFIG_KMOD
632 dev_load(ifr.ifr_name);
633#endif
634
132adf54 635 switch (cmd) {
1da177e4
LT
636 case SIOCGIFADDR: /* Get interface address */
637 case SIOCGIFBRDADDR: /* Get the broadcast address */
638 case SIOCGIFDSTADDR: /* Get the destination address */
639 case SIOCGIFNETMASK: /* Get the netmask for the interface */
640 /* Note that these ioctls will not sleep,
641 so that we do not impose a lock.
642 One day we will be forced to put shlock here (I mean SMP)
643 */
644 tryaddrmatch = (sin_orig.sin_family == AF_INET);
645 memset(sin, 0, sizeof(*sin));
646 sin->sin_family = AF_INET;
647 break;
648
649 case SIOCSIFFLAGS:
650 ret = -EACCES;
651 if (!capable(CAP_NET_ADMIN))
652 goto out;
653 break;
654 case SIOCSIFADDR: /* Set interface address (and family) */
655 case SIOCSIFBRDADDR: /* Set the broadcast address */
656 case SIOCSIFDSTADDR: /* Set the destination address */
657 case SIOCSIFNETMASK: /* Set the netmask for the interface */
658 ret = -EACCES;
659 if (!capable(CAP_NET_ADMIN))
660 goto out;
661 ret = -EINVAL;
662 if (sin->sin_family != AF_INET)
663 goto out;
664 break;
665 default:
666 ret = -EINVAL;
667 goto out;
668 }
669
670 rtnl_lock();
671
672 ret = -ENODEV;
673 if ((dev = __dev_get_by_name(ifr.ifr_name)) == NULL)
674 goto done;
675
676 if (colon)
677 *colon = ':';
678
e5ed6399 679 if ((in_dev = __in_dev_get_rtnl(dev)) != NULL) {
1da177e4
LT
680 if (tryaddrmatch) {
681 /* Matthias Andree */
682 /* compare label and address (4.4BSD style) */
683 /* note: we only do this for a limited set of ioctls
684 and only if the original address family was AF_INET.
685 This is checked above. */
686 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
687 ifap = &ifa->ifa_next) {
688 if (!strcmp(ifr.ifr_name, ifa->ifa_label) &&
689 sin_orig.sin_addr.s_addr ==
690 ifa->ifa_address) {
691 break; /* found */
692 }
693 }
694 }
695 /* we didn't get a match, maybe the application is
696 4.3BSD-style and passed in junk so we fall back to
697 comparing just the label */
698 if (!ifa) {
699 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
700 ifap = &ifa->ifa_next)
701 if (!strcmp(ifr.ifr_name, ifa->ifa_label))
702 break;
703 }
704 }
705
706 ret = -EADDRNOTAVAIL;
707 if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS)
708 goto done;
709
132adf54 710 switch (cmd) {
1da177e4
LT
711 case SIOCGIFADDR: /* Get interface address */
712 sin->sin_addr.s_addr = ifa->ifa_local;
713 goto rarok;
714
715 case SIOCGIFBRDADDR: /* Get the broadcast address */
716 sin->sin_addr.s_addr = ifa->ifa_broadcast;
717 goto rarok;
718
719 case SIOCGIFDSTADDR: /* Get the destination address */
720 sin->sin_addr.s_addr = ifa->ifa_address;
721 goto rarok;
722
723 case SIOCGIFNETMASK: /* Get the netmask for the interface */
724 sin->sin_addr.s_addr = ifa->ifa_mask;
725 goto rarok;
726
727 case SIOCSIFFLAGS:
728 if (colon) {
729 ret = -EADDRNOTAVAIL;
730 if (!ifa)
731 break;
732 ret = 0;
733 if (!(ifr.ifr_flags & IFF_UP))
734 inet_del_ifa(in_dev, ifap, 1);
735 break;
736 }
737 ret = dev_change_flags(dev, ifr.ifr_flags);
738 break;
739
740 case SIOCSIFADDR: /* Set interface address (and family) */
741 ret = -EINVAL;
742 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
743 break;
744
745 if (!ifa) {
746 ret = -ENOBUFS;
747 if ((ifa = inet_alloc_ifa()) == NULL)
748 break;
749 if (colon)
750 memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ);
751 else
752 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
753 } else {
754 ret = 0;
755 if (ifa->ifa_local == sin->sin_addr.s_addr)
756 break;
757 inet_del_ifa(in_dev, ifap, 0);
758 ifa->ifa_broadcast = 0;
759 ifa->ifa_anycast = 0;
760 }
761
762 ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr;
763
764 if (!(dev->flags & IFF_POINTOPOINT)) {
765 ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address);
766 ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen);
767 if ((dev->flags & IFF_BROADCAST) &&
768 ifa->ifa_prefixlen < 31)
769 ifa->ifa_broadcast = ifa->ifa_address |
770 ~ifa->ifa_mask;
771 } else {
772 ifa->ifa_prefixlen = 32;
773 ifa->ifa_mask = inet_make_mask(32);
774 }
775 ret = inet_set_ifa(dev, ifa);
776 break;
777
778 case SIOCSIFBRDADDR: /* Set the broadcast address */
779 ret = 0;
780 if (ifa->ifa_broadcast != sin->sin_addr.s_addr) {
781 inet_del_ifa(in_dev, ifap, 0);
782 ifa->ifa_broadcast = sin->sin_addr.s_addr;
783 inet_insert_ifa(ifa);
784 }
785 break;
786
787 case SIOCSIFDSTADDR: /* Set the destination address */
788 ret = 0;
789 if (ifa->ifa_address == sin->sin_addr.s_addr)
790 break;
791 ret = -EINVAL;
792 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
793 break;
794 ret = 0;
795 inet_del_ifa(in_dev, ifap, 0);
796 ifa->ifa_address = sin->sin_addr.s_addr;
797 inet_insert_ifa(ifa);
798 break;
799
800 case SIOCSIFNETMASK: /* Set the netmask for the interface */
801
802 /*
803 * The mask we set must be legal.
804 */
805 ret = -EINVAL;
806 if (bad_mask(sin->sin_addr.s_addr, 0))
807 break;
808 ret = 0;
809 if (ifa->ifa_mask != sin->sin_addr.s_addr) {
a144ea4b 810 __be32 old_mask = ifa->ifa_mask;
1da177e4
LT
811 inet_del_ifa(in_dev, ifap, 0);
812 ifa->ifa_mask = sin->sin_addr.s_addr;
813 ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask);
814
815 /* See if current broadcast address matches
816 * with current netmask, then recalculate
817 * the broadcast address. Otherwise it's a
818 * funny address, so don't touch it since
819 * the user seems to know what (s)he's doing...
820 */
821 if ((dev->flags & IFF_BROADCAST) &&
822 (ifa->ifa_prefixlen < 31) &&
823 (ifa->ifa_broadcast ==
dcab5e1e 824 (ifa->ifa_local|~old_mask))) {
1da177e4
LT
825 ifa->ifa_broadcast = (ifa->ifa_local |
826 ~sin->sin_addr.s_addr);
827 }
828 inet_insert_ifa(ifa);
829 }
830 break;
831 }
832done:
833 rtnl_unlock();
834out:
835 return ret;
836rarok:
837 rtnl_unlock();
838 ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0;
839 goto out;
840}
841
842static int inet_gifconf(struct net_device *dev, char __user *buf, int len)
843{
e5ed6399 844 struct in_device *in_dev = __in_dev_get_rtnl(dev);
1da177e4
LT
845 struct in_ifaddr *ifa;
846 struct ifreq ifr;
847 int done = 0;
848
849 if (!in_dev || (ifa = in_dev->ifa_list) == NULL)
850 goto out;
851
852 for (; ifa; ifa = ifa->ifa_next) {
853 if (!buf) {
854 done += sizeof(ifr);
855 continue;
856 }
857 if (len < (int) sizeof(ifr))
858 break;
859 memset(&ifr, 0, sizeof(struct ifreq));
860 if (ifa->ifa_label)
861 strcpy(ifr.ifr_name, ifa->ifa_label);
862 else
863 strcpy(ifr.ifr_name, dev->name);
864
865 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET;
866 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr =
867 ifa->ifa_local;
868
869 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) {
870 done = -EFAULT;
871 break;
872 }
873 buf += sizeof(struct ifreq);
874 len -= sizeof(struct ifreq);
875 done += sizeof(struct ifreq);
876 }
877out:
878 return done;
879}
880
a61ced5d 881__be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope)
1da177e4 882{
a61ced5d 883 __be32 addr = 0;
1da177e4
LT
884 struct in_device *in_dev;
885
886 rcu_read_lock();
e5ed6399 887 in_dev = __in_dev_get_rcu(dev);
1da177e4
LT
888 if (!in_dev)
889 goto no_in_dev;
890
891 for_primary_ifa(in_dev) {
892 if (ifa->ifa_scope > scope)
893 continue;
894 if (!dst || inet_ifa_match(dst, ifa)) {
895 addr = ifa->ifa_local;
896 break;
897 }
898 if (!addr)
899 addr = ifa->ifa_local;
900 } endfor_ifa(in_dev);
901no_in_dev:
902 rcu_read_unlock();
903
904 if (addr)
905 goto out;
906
907 /* Not loopback addresses on loopback should be preferred
908 in this case. It is importnat that lo is the first interface
909 in dev_base list.
910 */
911 read_lock(&dev_base_lock);
912 rcu_read_lock();
913 for (dev = dev_base; dev; dev = dev->next) {
e5ed6399 914 if ((in_dev = __in_dev_get_rcu(dev)) == NULL)
1da177e4
LT
915 continue;
916
917 for_primary_ifa(in_dev) {
918 if (ifa->ifa_scope != RT_SCOPE_LINK &&
919 ifa->ifa_scope <= scope) {
920 addr = ifa->ifa_local;
921 goto out_unlock_both;
922 }
923 } endfor_ifa(in_dev);
924 }
925out_unlock_both:
926 read_unlock(&dev_base_lock);
927 rcu_read_unlock();
928out:
929 return addr;
930}
931
60cad5da
AV
932static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst,
933 __be32 local, int scope)
1da177e4
LT
934{
935 int same = 0;
a144ea4b 936 __be32 addr = 0;
1da177e4
LT
937
938 for_ifa(in_dev) {
939 if (!addr &&
940 (local == ifa->ifa_local || !local) &&
941 ifa->ifa_scope <= scope) {
942 addr = ifa->ifa_local;
943 if (same)
944 break;
945 }
946 if (!same) {
947 same = (!local || inet_ifa_match(local, ifa)) &&
948 (!dst || inet_ifa_match(dst, ifa));
949 if (same && addr) {
950 if (local || !dst)
951 break;
952 /* Is the selected addr into dst subnet? */
953 if (inet_ifa_match(addr, ifa))
954 break;
955 /* No, then can we use new local src? */
956 if (ifa->ifa_scope <= scope) {
957 addr = ifa->ifa_local;
958 break;
959 }
960 /* search for large dst subnet for addr */
961 same = 0;
962 }
963 }
964 } endfor_ifa(in_dev);
965
966 return same? addr : 0;
967}
968
969/*
970 * Confirm that local IP address exists using wildcards:
971 * - dev: only on this interface, 0=any interface
972 * - dst: only in the same subnet as dst, 0=any dst
973 * - local: address, 0=autoselect the local address
974 * - scope: maximum allowed scope value for the local address
975 */
60cad5da 976__be32 inet_confirm_addr(const struct net_device *dev, __be32 dst, __be32 local, int scope)
1da177e4 977{
60cad5da 978 __be32 addr = 0;
1da177e4
LT
979 struct in_device *in_dev;
980
981 if (dev) {
982 rcu_read_lock();
e5ed6399 983 if ((in_dev = __in_dev_get_rcu(dev)))
1da177e4
LT
984 addr = confirm_addr_indev(in_dev, dst, local, scope);
985 rcu_read_unlock();
986
987 return addr;
988 }
989
990 read_lock(&dev_base_lock);
991 rcu_read_lock();
992 for (dev = dev_base; dev; dev = dev->next) {
e5ed6399 993 if ((in_dev = __in_dev_get_rcu(dev))) {
1da177e4
LT
994 addr = confirm_addr_indev(in_dev, dst, local, scope);
995 if (addr)
996 break;
997 }
998 }
999 rcu_read_unlock();
1000 read_unlock(&dev_base_lock);
1001
1002 return addr;
1003}
1004
1005/*
1006 * Device notifier
1007 */
1008
1009int register_inetaddr_notifier(struct notifier_block *nb)
1010{
e041c683 1011 return blocking_notifier_chain_register(&inetaddr_chain, nb);
1da177e4
LT
1012}
1013
1014int unregister_inetaddr_notifier(struct notifier_block *nb)
1015{
e041c683 1016 return blocking_notifier_chain_unregister(&inetaddr_chain, nb);
1da177e4
LT
1017}
1018
1019/* Rename ifa_labels for a device name change. Make some effort to preserve existing
1020 * alias numbering and to create unique labels if possible.
1021*/
1022static void inetdev_changename(struct net_device *dev, struct in_device *in_dev)
e905a9ed 1023{
1da177e4
LT
1024 struct in_ifaddr *ifa;
1025 int named = 0;
1026
e905a9ed
YH
1027 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
1028 char old[IFNAMSIZ], *dot;
1da177e4
LT
1029
1030 memcpy(old, ifa->ifa_label, IFNAMSIZ);
e905a9ed 1031 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1da177e4
LT
1032 if (named++ == 0)
1033 continue;
1034 dot = strchr(ifa->ifa_label, ':');
e905a9ed
YH
1035 if (dot == NULL) {
1036 sprintf(old, ":%d", named);
1da177e4
LT
1037 dot = old;
1038 }
e905a9ed
YH
1039 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ) {
1040 strcat(ifa->ifa_label, dot);
1041 } else {
1042 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot);
1043 }
1044 }
1045}
1da177e4
LT
1046
1047/* Called only under RTNL semaphore */
1048
1049static int inetdev_event(struct notifier_block *this, unsigned long event,
1050 void *ptr)
1051{
1052 struct net_device *dev = ptr;
e5ed6399 1053 struct in_device *in_dev = __in_dev_get_rtnl(dev);
1da177e4
LT
1054
1055 ASSERT_RTNL();
1056
1057 if (!in_dev) {
8030f544 1058 if (event == NETDEV_REGISTER) {
1da177e4
LT
1059 in_dev = inetdev_init(dev);
1060 if (!in_dev)
1061 panic("devinet: Failed to create loopback\n");
8030f544
HX
1062 if (dev == &loopback_dev) {
1063 in_dev->cnf.no_xfrm = 1;
1064 in_dev->cnf.no_policy = 1;
1065 }
1da177e4
LT
1066 }
1067 goto out;
1068 }
1069
1070 switch (event) {
1071 case NETDEV_REGISTER:
1072 printk(KERN_DEBUG "inetdev_event: bug\n");
1073 dev->ip_ptr = NULL;
1074 break;
1075 case NETDEV_UP:
1076 if (dev->mtu < 68)
1077 break;
1078 if (dev == &loopback_dev) {
1079 struct in_ifaddr *ifa;
1080 if ((ifa = inet_alloc_ifa()) != NULL) {
1081 ifa->ifa_local =
1082 ifa->ifa_address = htonl(INADDR_LOOPBACK);
1083 ifa->ifa_prefixlen = 8;
1084 ifa->ifa_mask = inet_make_mask(8);
1085 in_dev_hold(in_dev);
1086 ifa->ifa_dev = in_dev;
1087 ifa->ifa_scope = RT_SCOPE_HOST;
1088 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1089 inet_insert_ifa(ifa);
1090 }
1091 }
1092 ip_mc_up(in_dev);
1093 break;
1094 case NETDEV_DOWN:
1095 ip_mc_down(in_dev);
1096 break;
1097 case NETDEV_CHANGEMTU:
1098 if (dev->mtu >= 68)
1099 break;
1100 /* MTU falled under 68, disable IP */
1101 case NETDEV_UNREGISTER:
1102 inetdev_destroy(in_dev);
1103 break;
1104 case NETDEV_CHANGENAME:
1105 /* Do not notify about label change, this event is
1106 * not interesting to applications using netlink.
1107 */
1108 inetdev_changename(dev, in_dev);
1109
1110#ifdef CONFIG_SYSCTL
1111 devinet_sysctl_unregister(&in_dev->cnf);
1112 neigh_sysctl_unregister(in_dev->arp_parms);
1113 neigh_sysctl_register(dev, in_dev->arp_parms, NET_IPV4,
1114 NET_IPV4_NEIGH, "ipv4", NULL, NULL);
1115 devinet_sysctl_register(in_dev, &in_dev->cnf);
1116#endif
1117 break;
1118 }
1119out:
1120 return NOTIFY_DONE;
1121}
1122
1123static struct notifier_block ip_netdev_notifier = {
1124 .notifier_call =inetdev_event,
1125};
1126
339bf98f
TG
1127static inline size_t inet_nlmsg_size(void)
1128{
1129 return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
1130 + nla_total_size(4) /* IFA_ADDRESS */
1131 + nla_total_size(4) /* IFA_LOCAL */
1132 + nla_total_size(4) /* IFA_BROADCAST */
1133 + nla_total_size(4) /* IFA_ANYCAST */
1134 + nla_total_size(IFNAMSIZ); /* IFA_LABEL */
1135}
1136
1da177e4 1137static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa,
b6544c0b 1138 u32 pid, u32 seq, int event, unsigned int flags)
1da177e4
LT
1139{
1140 struct ifaddrmsg *ifm;
1141 struct nlmsghdr *nlh;
1da177e4 1142
47f68512
TG
1143 nlh = nlmsg_put(skb, pid, seq, event, sizeof(*ifm), flags);
1144 if (nlh == NULL)
26932566 1145 return -EMSGSIZE;
47f68512
TG
1146
1147 ifm = nlmsg_data(nlh);
1da177e4
LT
1148 ifm->ifa_family = AF_INET;
1149 ifm->ifa_prefixlen = ifa->ifa_prefixlen;
1150 ifm->ifa_flags = ifa->ifa_flags|IFA_F_PERMANENT;
1151 ifm->ifa_scope = ifa->ifa_scope;
1152 ifm->ifa_index = ifa->ifa_dev->dev->ifindex;
47f68512 1153
1da177e4 1154 if (ifa->ifa_address)
a7a628c4 1155 NLA_PUT_BE32(skb, IFA_ADDRESS, ifa->ifa_address);
47f68512 1156
1da177e4 1157 if (ifa->ifa_local)
a7a628c4 1158 NLA_PUT_BE32(skb, IFA_LOCAL, ifa->ifa_local);
47f68512 1159
1da177e4 1160 if (ifa->ifa_broadcast)
a7a628c4 1161 NLA_PUT_BE32(skb, IFA_BROADCAST, ifa->ifa_broadcast);
47f68512 1162
1da177e4 1163 if (ifa->ifa_anycast)
a7a628c4 1164 NLA_PUT_BE32(skb, IFA_ANYCAST, ifa->ifa_anycast);
47f68512 1165
1da177e4 1166 if (ifa->ifa_label[0])
47f68512 1167 NLA_PUT_STRING(skb, IFA_LABEL, ifa->ifa_label);
1da177e4 1168
47f68512
TG
1169 return nlmsg_end(skb, nlh);
1170
1171nla_put_failure:
26932566
PM
1172 nlmsg_cancel(skb, nlh);
1173 return -EMSGSIZE;
1da177e4
LT
1174}
1175
1176static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
1177{
1178 int idx, ip_idx;
1179 struct net_device *dev;
1180 struct in_device *in_dev;
1181 struct in_ifaddr *ifa;
1182 int s_ip_idx, s_idx = cb->args[0];
1183
1184 s_ip_idx = ip_idx = cb->args[1];
1185 read_lock(&dev_base_lock);
1186 for (dev = dev_base, idx = 0; dev; dev = dev->next, idx++) {
1187 if (idx < s_idx)
1188 continue;
1189 if (idx > s_idx)
1190 s_ip_idx = 0;
1191 rcu_read_lock();
e5ed6399 1192 if ((in_dev = __in_dev_get_rcu(dev)) == NULL) {
1da177e4
LT
1193 rcu_read_unlock();
1194 continue;
1195 }
1196
1197 for (ifa = in_dev->ifa_list, ip_idx = 0; ifa;
1198 ifa = ifa->ifa_next, ip_idx++) {
1199 if (ip_idx < s_ip_idx)
1200 continue;
1201 if (inet_fill_ifaddr(skb, ifa, NETLINK_CB(cb->skb).pid,
1202 cb->nlh->nlmsg_seq,
b6544c0b 1203 RTM_NEWADDR, NLM_F_MULTI) <= 0) {
1da177e4
LT
1204 rcu_read_unlock();
1205 goto done;
1206 }
1207 }
1208 rcu_read_unlock();
1209 }
1210
1211done:
1212 read_unlock(&dev_base_lock);
1213 cb->args[0] = idx;
1214 cb->args[1] = ip_idx;
1215
1216 return skb->len;
1217}
1218
d6062cbb
TG
1219static void rtmsg_ifa(int event, struct in_ifaddr* ifa, struct nlmsghdr *nlh,
1220 u32 pid)
1da177e4 1221{
47f68512 1222 struct sk_buff *skb;
d6062cbb
TG
1223 u32 seq = nlh ? nlh->nlmsg_seq : 0;
1224 int err = -ENOBUFS;
1da177e4 1225
339bf98f 1226 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL);
47f68512 1227 if (skb == NULL)
d6062cbb
TG
1228 goto errout;
1229
1230 err = inet_fill_ifaddr(skb, ifa, pid, seq, event, 0);
26932566
PM
1231 if (err < 0) {
1232 /* -EMSGSIZE implies BUG in inet_nlmsg_size() */
1233 WARN_ON(err == -EMSGSIZE);
1234 kfree_skb(skb);
1235 goto errout;
1236 }
d6062cbb
TG
1237 err = rtnl_notify(skb, pid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL);
1238errout:
1239 if (err < 0)
1240 rtnl_set_sk_err(RTNLGRP_IPV4_IFADDR, err);
1da177e4
LT
1241}
1242
1da177e4
LT
1243#ifdef CONFIG_SYSCTL
1244
1245void inet_forward_change(void)
1246{
1247 struct net_device *dev;
1248 int on = ipv4_devconf.forwarding;
1249
1250 ipv4_devconf.accept_redirects = !on;
1251 ipv4_devconf_dflt.forwarding = on;
1252
1253 read_lock(&dev_base_lock);
1254 for (dev = dev_base; dev; dev = dev->next) {
1255 struct in_device *in_dev;
1256 rcu_read_lock();
e5ed6399 1257 in_dev = __in_dev_get_rcu(dev);
1da177e4
LT
1258 if (in_dev)
1259 in_dev->cnf.forwarding = on;
1260 rcu_read_unlock();
1261 }
1262 read_unlock(&dev_base_lock);
1263
1264 rt_cache_flush(0);
1265}
1266
1267static int devinet_sysctl_forward(ctl_table *ctl, int write,
1268 struct file* filp, void __user *buffer,
1269 size_t *lenp, loff_t *ppos)
1270{
1271 int *valp = ctl->data;
1272 int val = *valp;
1273 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1274
1275 if (write && *valp != val) {
1276 if (valp == &ipv4_devconf.forwarding)
1277 inet_forward_change();
1278 else if (valp != &ipv4_devconf_dflt.forwarding)
1279 rt_cache_flush(0);
1280 }
1281
1282 return ret;
1283}
1284
1285int ipv4_doint_and_flush(ctl_table *ctl, int write,
1286 struct file* filp, void __user *buffer,
1287 size_t *lenp, loff_t *ppos)
1288{
1289 int *valp = ctl->data;
1290 int val = *valp;
1291 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1292
1293 if (write && *valp != val)
1294 rt_cache_flush(0);
1295
1296 return ret;
1297}
1298
1299int ipv4_doint_and_flush_strategy(ctl_table *table, int __user *name, int nlen,
1300 void __user *oldval, size_t __user *oldlenp,
1f29bcd7 1301 void __user *newval, size_t newlen)
1da177e4
LT
1302{
1303 int *valp = table->data;
1304 int new;
1305
1306 if (!newval || !newlen)
1307 return 0;
1308
1309 if (newlen != sizeof(int))
1310 return -EINVAL;
1311
1312 if (get_user(new, (int __user *)newval))
1313 return -EFAULT;
1314
1315 if (new == *valp)
1316 return 0;
1317
1318 if (oldval && oldlenp) {
1319 size_t len;
1320
1321 if (get_user(len, oldlenp))
1322 return -EFAULT;
1323
1324 if (len) {
1325 if (len > table->maxlen)
1326 len = table->maxlen;
1327 if (copy_to_user(oldval, valp, len))
1328 return -EFAULT;
1329 if (put_user(len, oldlenp))
1330 return -EFAULT;
1331 }
1332 }
1333
1334 *valp = new;
1335 rt_cache_flush(0);
1336 return 1;
1337}
1338
1339
1340static struct devinet_sysctl_table {
1341 struct ctl_table_header *sysctl_header;
1342 ctl_table devinet_vars[__NET_IPV4_CONF_MAX];
1343 ctl_table devinet_dev[2];
1344 ctl_table devinet_conf_dir[2];
1345 ctl_table devinet_proto_dir[2];
1346 ctl_table devinet_root_dir[2];
1347} devinet_sysctl = {
1348 .devinet_vars = {
1349 {
1350 .ctl_name = NET_IPV4_CONF_FORWARDING,
1351 .procname = "forwarding",
1352 .data = &ipv4_devconf.forwarding,
1353 .maxlen = sizeof(int),
1354 .mode = 0644,
1355 .proc_handler = &devinet_sysctl_forward,
1356 },
1357 {
1358 .ctl_name = NET_IPV4_CONF_MC_FORWARDING,
1359 .procname = "mc_forwarding",
1360 .data = &ipv4_devconf.mc_forwarding,
1361 .maxlen = sizeof(int),
1362 .mode = 0444,
1363 .proc_handler = &proc_dointvec,
1364 },
1365 {
1366 .ctl_name = NET_IPV4_CONF_ACCEPT_REDIRECTS,
1367 .procname = "accept_redirects",
1368 .data = &ipv4_devconf.accept_redirects,
1369 .maxlen = sizeof(int),
1370 .mode = 0644,
1371 .proc_handler = &proc_dointvec,
1372 },
1373 {
1374 .ctl_name = NET_IPV4_CONF_SECURE_REDIRECTS,
1375 .procname = "secure_redirects",
1376 .data = &ipv4_devconf.secure_redirects,
1377 .maxlen = sizeof(int),
1378 .mode = 0644,
1379 .proc_handler = &proc_dointvec,
1380 },
1381 {
1382 .ctl_name = NET_IPV4_CONF_SHARED_MEDIA,
1383 .procname = "shared_media",
1384 .data = &ipv4_devconf.shared_media,
1385 .maxlen = sizeof(int),
1386 .mode = 0644,
1387 .proc_handler = &proc_dointvec,
1388 },
1389 {
1390 .ctl_name = NET_IPV4_CONF_RP_FILTER,
1391 .procname = "rp_filter",
1392 .data = &ipv4_devconf.rp_filter,
1393 .maxlen = sizeof(int),
1394 .mode = 0644,
1395 .proc_handler = &proc_dointvec,
1396 },
1397 {
1398 .ctl_name = NET_IPV4_CONF_SEND_REDIRECTS,
1399 .procname = "send_redirects",
1400 .data = &ipv4_devconf.send_redirects,
1401 .maxlen = sizeof(int),
1402 .mode = 0644,
1403 .proc_handler = &proc_dointvec,
1404 },
1405 {
1406 .ctl_name = NET_IPV4_CONF_ACCEPT_SOURCE_ROUTE,
1407 .procname = "accept_source_route",
1408 .data = &ipv4_devconf.accept_source_route,
1409 .maxlen = sizeof(int),
1410 .mode = 0644,
1411 .proc_handler = &proc_dointvec,
1412 },
1413 {
1414 .ctl_name = NET_IPV4_CONF_PROXY_ARP,
1415 .procname = "proxy_arp",
1416 .data = &ipv4_devconf.proxy_arp,
1417 .maxlen = sizeof(int),
1418 .mode = 0644,
1419 .proc_handler = &proc_dointvec,
1420 },
1421 {
1422 .ctl_name = NET_IPV4_CONF_MEDIUM_ID,
1423 .procname = "medium_id",
1424 .data = &ipv4_devconf.medium_id,
1425 .maxlen = sizeof(int),
1426 .mode = 0644,
1427 .proc_handler = &proc_dointvec,
1428 },
1429 {
1430 .ctl_name = NET_IPV4_CONF_BOOTP_RELAY,
1431 .procname = "bootp_relay",
1432 .data = &ipv4_devconf.bootp_relay,
1433 .maxlen = sizeof(int),
1434 .mode = 0644,
1435 .proc_handler = &proc_dointvec,
1436 },
1437 {
1438 .ctl_name = NET_IPV4_CONF_LOG_MARTIANS,
1439 .procname = "log_martians",
1440 .data = &ipv4_devconf.log_martians,
1441 .maxlen = sizeof(int),
1442 .mode = 0644,
1443 .proc_handler = &proc_dointvec,
1444 },
1445 {
1446 .ctl_name = NET_IPV4_CONF_TAG,
1447 .procname = "tag",
1448 .data = &ipv4_devconf.tag,
1449 .maxlen = sizeof(int),
1450 .mode = 0644,
1451 .proc_handler = &proc_dointvec,
1452 },
1453 {
1454 .ctl_name = NET_IPV4_CONF_ARPFILTER,
1455 .procname = "arp_filter",
1456 .data = &ipv4_devconf.arp_filter,
1457 .maxlen = sizeof(int),
1458 .mode = 0644,
1459 .proc_handler = &proc_dointvec,
1460 },
1461 {
1462 .ctl_name = NET_IPV4_CONF_ARP_ANNOUNCE,
1463 .procname = "arp_announce",
1464 .data = &ipv4_devconf.arp_announce,
1465 .maxlen = sizeof(int),
1466 .mode = 0644,
1467 .proc_handler = &proc_dointvec,
1468 },
1469 {
1470 .ctl_name = NET_IPV4_CONF_ARP_IGNORE,
1471 .procname = "arp_ignore",
1472 .data = &ipv4_devconf.arp_ignore,
1473 .maxlen = sizeof(int),
abd596a4
NH
1474 .mode = 0644,
1475 .proc_handler = &proc_dointvec,
1476 },
1477 {
1478 .ctl_name = NET_IPV4_CONF_ARP_ACCEPT,
1479 .procname = "arp_accept",
1480 .data = &ipv4_devconf.arp_accept,
1481 .maxlen = sizeof(int),
1da177e4
LT
1482 .mode = 0644,
1483 .proc_handler = &proc_dointvec,
1484 },
1485 {
1486 .ctl_name = NET_IPV4_CONF_NOXFRM,
1487 .procname = "disable_xfrm",
1488 .data = &ipv4_devconf.no_xfrm,
1489 .maxlen = sizeof(int),
1490 .mode = 0644,
1491 .proc_handler = &ipv4_doint_and_flush,
1492 .strategy = &ipv4_doint_and_flush_strategy,
1493 },
1494 {
1495 .ctl_name = NET_IPV4_CONF_NOPOLICY,
1496 .procname = "disable_policy",
1497 .data = &ipv4_devconf.no_policy,
1498 .maxlen = sizeof(int),
1499 .mode = 0644,
1500 .proc_handler = &ipv4_doint_and_flush,
1501 .strategy = &ipv4_doint_and_flush_strategy,
1502 },
1503 {
1504 .ctl_name = NET_IPV4_CONF_FORCE_IGMP_VERSION,
1505 .procname = "force_igmp_version",
1506 .data = &ipv4_devconf.force_igmp_version,
1507 .maxlen = sizeof(int),
1508 .mode = 0644,
8f937c60
HW
1509 .proc_handler = &ipv4_doint_and_flush,
1510 .strategy = &ipv4_doint_and_flush_strategy,
1511 },
1512 {
1513 .ctl_name = NET_IPV4_CONF_PROMOTE_SECONDARIES,
1514 .procname = "promote_secondaries",
1515 .data = &ipv4_devconf.promote_secondaries,
1516 .maxlen = sizeof(int),
1517 .mode = 0644,
1da177e4
LT
1518 .proc_handler = &ipv4_doint_and_flush,
1519 .strategy = &ipv4_doint_and_flush_strategy,
1520 },
1521 },
1522 .devinet_dev = {
1523 {
1524 .ctl_name = NET_PROTO_CONF_ALL,
1525 .procname = "all",
1526 .mode = 0555,
1527 .child = devinet_sysctl.devinet_vars,
1528 },
1529 },
1530 .devinet_conf_dir = {
e905a9ed 1531 {
1da177e4
LT
1532 .ctl_name = NET_IPV4_CONF,
1533 .procname = "conf",
1534 .mode = 0555,
1535 .child = devinet_sysctl.devinet_dev,
1536 },
1537 },
1538 .devinet_proto_dir = {
1539 {
1540 .ctl_name = NET_IPV4,
1541 .procname = "ipv4",
1542 .mode = 0555,
1543 .child = devinet_sysctl.devinet_conf_dir,
1544 },
1545 },
1546 .devinet_root_dir = {
1547 {
1548 .ctl_name = CTL_NET,
1549 .procname = "net",
1550 .mode = 0555,
1551 .child = devinet_sysctl.devinet_proto_dir,
1552 },
1553 },
1554};
1555
1556static void devinet_sysctl_register(struct in_device *in_dev,
1557 struct ipv4_devconf *p)
1558{
1559 int i;
1560 struct net_device *dev = in_dev ? in_dev->dev : NULL;
42e5ea46
ACM
1561 struct devinet_sysctl_table *t = kmemdup(&devinet_sysctl, sizeof(*t),
1562 GFP_KERNEL);
1da177e4
LT
1563 char *dev_name = NULL;
1564
1565 if (!t)
1566 return;
1da177e4
LT
1567 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) {
1568 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf;
1da177e4
LT
1569 }
1570
1571 if (dev) {
e905a9ed 1572 dev_name = dev->name;
1da177e4
LT
1573 t->devinet_dev[0].ctl_name = dev->ifindex;
1574 } else {
1575 dev_name = "default";
1576 t->devinet_dev[0].ctl_name = NET_PROTO_CONF_DEFAULT;
1577 }
1578
e905a9ed
YH
1579 /*
1580 * Make a copy of dev_name, because '.procname' is regarded as const
1da177e4
LT
1581 * by sysctl and we wouldn't want anyone to change it under our feet
1582 * (see SIOCSIFNAME).
e905a9ed 1583 */
543537bd 1584 dev_name = kstrdup(dev_name, GFP_KERNEL);
1da177e4
LT
1585 if (!dev_name)
1586 goto free;
1587
1588 t->devinet_dev[0].procname = dev_name;
1589 t->devinet_dev[0].child = t->devinet_vars;
1da177e4 1590 t->devinet_conf_dir[0].child = t->devinet_dev;
1da177e4 1591 t->devinet_proto_dir[0].child = t->devinet_conf_dir;
1da177e4 1592 t->devinet_root_dir[0].child = t->devinet_proto_dir;
1da177e4 1593
0b4d4147 1594 t->sysctl_header = register_sysctl_table(t->devinet_root_dir);
1da177e4
LT
1595 if (!t->sysctl_header)
1596 goto free_procname;
1597
1598 p->sysctl = t;
1599 return;
1600
1601 /* error path */
1602 free_procname:
1603 kfree(dev_name);
1604 free:
1605 kfree(t);
1606 return;
1607}
1608
1609static void devinet_sysctl_unregister(struct ipv4_devconf *p)
1610{
1611 if (p->sysctl) {
1612 struct devinet_sysctl_table *t = p->sysctl;
1613 p->sysctl = NULL;
1614 unregister_sysctl_table(t->sysctl_header);
1615 kfree(t->devinet_dev[0].procname);
1616 kfree(t);
1617 }
1618}
1619#endif
1620
1621void __init devinet_init(void)
1622{
1623 register_gifconf(PF_INET, inet_gifconf);
1624 register_netdevice_notifier(&ip_netdev_notifier);
63f3444f
TG
1625
1626 rtnl_register(PF_INET, RTM_NEWADDR, inet_rtm_newaddr, NULL);
1627 rtnl_register(PF_INET, RTM_DELADDR, inet_rtm_deladdr, NULL);
1628 rtnl_register(PF_INET, RTM_GETADDR, NULL, inet_dump_ifaddr);
1da177e4
LT
1629#ifdef CONFIG_SYSCTL
1630 devinet_sysctl.sysctl_header =
0b4d4147 1631 register_sysctl_table(devinet_sysctl.devinet_root_dir);
1da177e4
LT
1632 devinet_sysctl_register(NULL, &ipv4_devconf_dflt);
1633#endif
1634}
1635
1da177e4
LT
1636EXPORT_SYMBOL(in_dev_finish_destroy);
1637EXPORT_SYMBOL(inet_select_addr);
1638EXPORT_SYMBOL(inetdev_by_index);
1639EXPORT_SYMBOL(register_inetaddr_notifier);
1640EXPORT_SYMBOL(unregister_inetaddr_notifier);