]> bbs.cooldavid.org Git - net-next-2.6.git/blame_incremental - net/core/rtnetlink.c
net: fib_rules: decouple address families from real address families
[net-next-2.6.git] / net / core / rtnetlink.c
... / ...
CommitLineData
1/*
2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
5 *
6 * Routing netlink socket interface: protocol independent part.
7 *
8 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
9 *
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
14 *
15 * Fixes:
16 * Vitaly E. Lavrov RTA_OK arithmetics was wrong.
17 */
18
19#include <linux/errno.h>
20#include <linux/module.h>
21#include <linux/types.h>
22#include <linux/socket.h>
23#include <linux/kernel.h>
24#include <linux/timer.h>
25#include <linux/string.h>
26#include <linux/sockios.h>
27#include <linux/net.h>
28#include <linux/fcntl.h>
29#include <linux/mm.h>
30#include <linux/slab.h>
31#include <linux/interrupt.h>
32#include <linux/capability.h>
33#include <linux/skbuff.h>
34#include <linux/init.h>
35#include <linux/security.h>
36#include <linux/mutex.h>
37#include <linux/if_addr.h>
38#include <linux/pci.h>
39
40#include <asm/uaccess.h>
41#include <asm/system.h>
42
43#include <linux/inet.h>
44#include <linux/netdevice.h>
45#include <net/ip.h>
46#include <net/protocol.h>
47#include <net/arp.h>
48#include <net/route.h>
49#include <net/udp.h>
50#include <net/sock.h>
51#include <net/pkt_sched.h>
52#include <net/fib_rules.h>
53#include <net/rtnetlink.h>
54#include <net/net_namespace.h>
55
56struct rtnl_link {
57 rtnl_doit_func doit;
58 rtnl_dumpit_func dumpit;
59};
60
61static DEFINE_MUTEX(rtnl_mutex);
62
63void rtnl_lock(void)
64{
65 mutex_lock(&rtnl_mutex);
66}
67EXPORT_SYMBOL(rtnl_lock);
68
69void __rtnl_unlock(void)
70{
71 mutex_unlock(&rtnl_mutex);
72}
73
/*
 * Release the rtnl lock. The mutex is not dropped here directly:
 * netdev_run_todo() is responsible for unlocking it for us.
 */
void rtnl_unlock(void)
{
	netdev_run_todo();
}
EXPORT_SYMBOL(rtnl_unlock);
80
81int rtnl_trylock(void)
82{
83 return mutex_trylock(&rtnl_mutex);
84}
85EXPORT_SYMBOL(rtnl_trylock);
86
87int rtnl_is_locked(void)
88{
89 return mutex_is_locked(&rtnl_mutex);
90}
91EXPORT_SYMBOL(rtnl_is_locked);
92
#ifdef CONFIG_PROVE_LOCKING
/*
 * Lockdep helper: returns the result of lockdep_is_held() for
 * rtnl_mutex. Only built when CONFIG_PROVE_LOCKING is enabled.
 */
int lockdep_rtnl_is_held(void)
{
	return lockdep_is_held(&rtnl_mutex);
}
EXPORT_SYMBOL(lockdep_rtnl_is_held);
#endif /* CONFIG_PROVE_LOCKING */
100
101static struct rtnl_link *rtnl_msg_handlers[NPROTO];
102
103static inline int rtm_msgindex(int msgtype)
104{
105 int msgindex = msgtype - RTM_BASE;
106
107 /*
108 * msgindex < 0 implies someone tried to register a netlink
109 * control code. msgindex >= RTM_NR_MSGTYPES may indicate that
110 * the message type has not been added to linux/rtnetlink.h
111 */
112 BUG_ON(msgindex < 0 || msgindex >= RTM_NR_MSGTYPES);
113
114 return msgindex;
115}
116
117static rtnl_doit_func rtnl_get_doit(int protocol, int msgindex)
118{
119 struct rtnl_link *tab;
120
121 if (protocol < NPROTO)
122 tab = rtnl_msg_handlers[protocol];
123 else
124 tab = NULL;
125
126 if (tab == NULL || tab[msgindex].doit == NULL)
127 tab = rtnl_msg_handlers[PF_UNSPEC];
128
129 return tab ? tab[msgindex].doit : NULL;
130}
131
132static rtnl_dumpit_func rtnl_get_dumpit(int protocol, int msgindex)
133{
134 struct rtnl_link *tab;
135
136 if (protocol < NPROTO)
137 tab = rtnl_msg_handlers[protocol];
138 else
139 tab = NULL;
140
141 if (tab == NULL || tab[msgindex].dumpit == NULL)
142 tab = rtnl_msg_handlers[PF_UNSPEC];
143
144 return tab ? tab[msgindex].dumpit : NULL;
145}
146
147/**
148 * __rtnl_register - Register a rtnetlink message type
149 * @protocol: Protocol family or PF_UNSPEC
150 * @msgtype: rtnetlink message type
151 * @doit: Function pointer called for each request message
152 * @dumpit: Function pointer called for each dump request (NLM_F_DUMP) message
153 *
154 * Registers the specified function pointers (at least one of them has
155 * to be non-NULL) to be called whenever a request message for the
156 * specified protocol family and message type is received.
157 *
158 * The special protocol family PF_UNSPEC may be used to define fallback
159 * function pointers for the case when no entry for the specific protocol
160 * family exists.
161 *
162 * Returns 0 on success or a negative error code.
163 */
164int __rtnl_register(int protocol, int msgtype,
165 rtnl_doit_func doit, rtnl_dumpit_func dumpit)
166{
167 struct rtnl_link *tab;
168 int msgindex;
169
170 BUG_ON(protocol < 0 || protocol >= NPROTO);
171 msgindex = rtm_msgindex(msgtype);
172
173 tab = rtnl_msg_handlers[protocol];
174 if (tab == NULL) {
175 tab = kcalloc(RTM_NR_MSGTYPES, sizeof(*tab), GFP_KERNEL);
176 if (tab == NULL)
177 return -ENOBUFS;
178
179 rtnl_msg_handlers[protocol] = tab;
180 }
181
182 if (doit)
183 tab[msgindex].doit = doit;
184
185 if (dumpit)
186 tab[msgindex].dumpit = dumpit;
187
188 return 0;
189}
190EXPORT_SYMBOL_GPL(__rtnl_register);
191
192/**
193 * rtnl_register - Register a rtnetlink message type
194 *
195 * Identical to __rtnl_register() but panics on failure. This is useful
196 * as failure of this function is very unlikely, it can only happen due
197 * to lack of memory when allocating the chain to store all message
198 * handlers for a protocol. Meant for use in init functions where lack
199 * of memory implies no sense in continueing.
200 */
201void rtnl_register(int protocol, int msgtype,
202 rtnl_doit_func doit, rtnl_dumpit_func dumpit)
203{
204 if (__rtnl_register(protocol, msgtype, doit, dumpit) < 0)
205 panic("Unable to register rtnetlink message handler, "
206 "protocol = %d, message type = %d\n",
207 protocol, msgtype);
208}
209EXPORT_SYMBOL_GPL(rtnl_register);
210
211/**
212 * rtnl_unregister - Unregister a rtnetlink message type
213 * @protocol: Protocol family or PF_UNSPEC
214 * @msgtype: rtnetlink message type
215 *
216 * Returns 0 on success or a negative error code.
217 */
218int rtnl_unregister(int protocol, int msgtype)
219{
220 int msgindex;
221
222 BUG_ON(protocol < 0 || protocol >= NPROTO);
223 msgindex = rtm_msgindex(msgtype);
224
225 if (rtnl_msg_handlers[protocol] == NULL)
226 return -ENOENT;
227
228 rtnl_msg_handlers[protocol][msgindex].doit = NULL;
229 rtnl_msg_handlers[protocol][msgindex].dumpit = NULL;
230
231 return 0;
232}
233EXPORT_SYMBOL_GPL(rtnl_unregister);
234
235/**
236 * rtnl_unregister_all - Unregister all rtnetlink message type of a protocol
237 * @protocol : Protocol family or PF_UNSPEC
238 *
239 * Identical to calling rtnl_unregster() for all registered message types
240 * of a certain protocol family.
241 */
242void rtnl_unregister_all(int protocol)
243{
244 BUG_ON(protocol < 0 || protocol >= NPROTO);
245
246 kfree(rtnl_msg_handlers[protocol]);
247 rtnl_msg_handlers[protocol] = NULL;
248}
249EXPORT_SYMBOL_GPL(rtnl_unregister_all);
250
251static LIST_HEAD(link_ops);
252
253/**
254 * __rtnl_link_register - Register rtnl_link_ops with rtnetlink.
255 * @ops: struct rtnl_link_ops * to register
256 *
257 * The caller must hold the rtnl_mutex. This function should be used
258 * by drivers that create devices during module initialization. It
259 * must be called before registering the devices.
260 *
261 * Returns 0 on success or a negative error code.
262 */
263int __rtnl_link_register(struct rtnl_link_ops *ops)
264{
265 if (!ops->dellink)
266 ops->dellink = unregister_netdevice_queue;
267
268 list_add_tail(&ops->list, &link_ops);
269 return 0;
270}
271EXPORT_SYMBOL_GPL(__rtnl_link_register);
272
/**
 * rtnl_link_register - Register rtnl_link_ops with rtnetlink.
 * @ops: struct rtnl_link_ops * to register
 *
 * Locked wrapper around __rtnl_link_register(): takes the rtnl lock,
 * registers @ops and drops the lock again.
 *
 * Returns 0 on success or a negative error code.
 */
int rtnl_link_register(struct rtnl_link_ops *ops)
{
	int ret;

	rtnl_lock();
	ret = __rtnl_link_register(ops);
	rtnl_unlock();

	return ret;
}
EXPORT_SYMBOL_GPL(rtnl_link_register);
289
290static void __rtnl_kill_links(struct net *net, struct rtnl_link_ops *ops)
291{
292 struct net_device *dev;
293 LIST_HEAD(list_kill);
294
295 for_each_netdev(net, dev) {
296 if (dev->rtnl_link_ops == ops)
297 ops->dellink(dev, &list_kill);
298 }
299 unregister_netdevice_many(&list_kill);
300}
301
/*
 * Locked wrapper around __rtnl_kill_links(): removes all devices of
 * @ops from @net while holding the rtnl lock.
 */
void rtnl_kill_links(struct net *net, struct rtnl_link_ops *ops)
{
	rtnl_lock();
	__rtnl_kill_links(net, ops);
	rtnl_unlock();
}
EXPORT_SYMBOL_GPL(rtnl_kill_links);
309
310/**
311 * __rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
312 * @ops: struct rtnl_link_ops * to unregister
313 *
314 * The caller must hold the rtnl_mutex.
315 */
316void __rtnl_link_unregister(struct rtnl_link_ops *ops)
317{
318 struct net *net;
319
320 for_each_net(net) {
321 __rtnl_kill_links(net, ops);
322 }
323 list_del(&ops->list);
324}
325EXPORT_SYMBOL_GPL(__rtnl_link_unregister);
326
/**
 * rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
 * @ops: struct rtnl_link_ops * to unregister
 *
 * Locked wrapper around __rtnl_link_unregister().
 */
void rtnl_link_unregister(struct rtnl_link_ops *ops)
{
	rtnl_lock();
	__rtnl_link_unregister(ops);
	rtnl_unlock();
}
EXPORT_SYMBOL_GPL(rtnl_link_unregister);
338
339static const struct rtnl_link_ops *rtnl_link_ops_get(const char *kind)
340{
341 const struct rtnl_link_ops *ops;
342
343 list_for_each_entry(ops, &link_ops, list) {
344 if (!strcmp(ops->kind, kind))
345 return ops;
346 }
347 return NULL;
348}
349
350static size_t rtnl_link_get_size(const struct net_device *dev)
351{
352 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
353 size_t size;
354
355 if (!ops)
356 return 0;
357
358 size = nlmsg_total_size(sizeof(struct nlattr)) + /* IFLA_LINKINFO */
359 nlmsg_total_size(strlen(ops->kind) + 1); /* IFLA_INFO_KIND */
360
361 if (ops->get_size)
362 /* IFLA_INFO_DATA + nested data */
363 size += nlmsg_total_size(sizeof(struct nlattr)) +
364 ops->get_size(dev);
365
366 if (ops->get_xstats_size)
367 size += ops->get_xstats_size(dev); /* IFLA_INFO_XSTATS */
368
369 return size;
370}
371
372static int rtnl_link_fill(struct sk_buff *skb, const struct net_device *dev)
373{
374 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
375 struct nlattr *linkinfo, *data;
376 int err = -EMSGSIZE;
377
378 linkinfo = nla_nest_start(skb, IFLA_LINKINFO);
379 if (linkinfo == NULL)
380 goto out;
381
382 if (nla_put_string(skb, IFLA_INFO_KIND, ops->kind) < 0)
383 goto err_cancel_link;
384 if (ops->fill_xstats) {
385 err = ops->fill_xstats(skb, dev);
386 if (err < 0)
387 goto err_cancel_link;
388 }
389 if (ops->fill_info) {
390 data = nla_nest_start(skb, IFLA_INFO_DATA);
391 if (data == NULL)
392 goto err_cancel_link;
393 err = ops->fill_info(skb, dev);
394 if (err < 0)
395 goto err_cancel_data;
396 nla_nest_end(skb, data);
397 }
398
399 nla_nest_end(skb, linkinfo);
400 return 0;
401
402err_cancel_data:
403 nla_nest_cancel(skb, data);
404err_cancel_link:
405 nla_nest_cancel(skb, linkinfo);
406out:
407 return err;
408}
409
410static const int rtm_min[RTM_NR_FAMILIES] =
411{
412 [RTM_FAM(RTM_NEWLINK)] = NLMSG_LENGTH(sizeof(struct ifinfomsg)),
413 [RTM_FAM(RTM_NEWADDR)] = NLMSG_LENGTH(sizeof(struct ifaddrmsg)),
414 [RTM_FAM(RTM_NEWROUTE)] = NLMSG_LENGTH(sizeof(struct rtmsg)),
415 [RTM_FAM(RTM_NEWRULE)] = NLMSG_LENGTH(sizeof(struct fib_rule_hdr)),
416 [RTM_FAM(RTM_NEWQDISC)] = NLMSG_LENGTH(sizeof(struct tcmsg)),
417 [RTM_FAM(RTM_NEWTCLASS)] = NLMSG_LENGTH(sizeof(struct tcmsg)),
418 [RTM_FAM(RTM_NEWTFILTER)] = NLMSG_LENGTH(sizeof(struct tcmsg)),
419 [RTM_FAM(RTM_NEWACTION)] = NLMSG_LENGTH(sizeof(struct tcamsg)),
420 [RTM_FAM(RTM_GETMULTICAST)] = NLMSG_LENGTH(sizeof(struct rtgenmsg)),
421 [RTM_FAM(RTM_GETANYCAST)] = NLMSG_LENGTH(sizeof(struct rtgenmsg)),
422};
423
424static const int rta_max[RTM_NR_FAMILIES] =
425{
426 [RTM_FAM(RTM_NEWLINK)] = IFLA_MAX,
427 [RTM_FAM(RTM_NEWADDR)] = IFA_MAX,
428 [RTM_FAM(RTM_NEWROUTE)] = RTA_MAX,
429 [RTM_FAM(RTM_NEWRULE)] = FRA_MAX,
430 [RTM_FAM(RTM_NEWQDISC)] = TCA_MAX,
431 [RTM_FAM(RTM_NEWTCLASS)] = TCA_MAX,
432 [RTM_FAM(RTM_NEWTFILTER)] = TCA_MAX,
433 [RTM_FAM(RTM_NEWACTION)] = TCAA_MAX,
434};
435
436void __rta_fill(struct sk_buff *skb, int attrtype, int attrlen, const void *data)
437{
438 struct rtattr *rta;
439 int size = RTA_LENGTH(attrlen);
440
441 rta = (struct rtattr *)skb_put(skb, RTA_ALIGN(size));
442 rta->rta_type = attrtype;
443 rta->rta_len = size;
444 memcpy(RTA_DATA(rta), data, attrlen);
445 memset(RTA_DATA(rta) + attrlen, 0, RTA_ALIGN(size) - size);
446}
447EXPORT_SYMBOL(__rta_fill);
448
449int rtnetlink_send(struct sk_buff *skb, struct net *net, u32 pid, unsigned group, int echo)
450{
451 struct sock *rtnl = net->rtnl;
452 int err = 0;
453
454 NETLINK_CB(skb).dst_group = group;
455 if (echo)
456 atomic_inc(&skb->users);
457 netlink_broadcast(rtnl, skb, pid, group, GFP_KERNEL);
458 if (echo)
459 err = netlink_unicast(rtnl, skb, pid, MSG_DONTWAIT);
460 return err;
461}
462
463int rtnl_unicast(struct sk_buff *skb, struct net *net, u32 pid)
464{
465 struct sock *rtnl = net->rtnl;
466
467 return nlmsg_unicast(rtnl, skb, pid);
468}
469EXPORT_SYMBOL(rtnl_unicast);
470
471void rtnl_notify(struct sk_buff *skb, struct net *net, u32 pid, u32 group,
472 struct nlmsghdr *nlh, gfp_t flags)
473{
474 struct sock *rtnl = net->rtnl;
475 int report = 0;
476
477 if (nlh)
478 report = nlmsg_report(nlh);
479
480 nlmsg_notify(rtnl, skb, pid, group, report, flags);
481}
482EXPORT_SYMBOL(rtnl_notify);
483
484void rtnl_set_sk_err(struct net *net, u32 group, int error)
485{
486 struct sock *rtnl = net->rtnl;
487
488 netlink_set_err(rtnl, 0, group, error);
489}
490EXPORT_SYMBOL(rtnl_set_sk_err);
491
492int rtnetlink_put_metrics(struct sk_buff *skb, u32 *metrics)
493{
494 struct nlattr *mx;
495 int i, valid = 0;
496
497 mx = nla_nest_start(skb, RTA_METRICS);
498 if (mx == NULL)
499 return -ENOBUFS;
500
501 for (i = 0; i < RTAX_MAX; i++) {
502 if (metrics[i]) {
503 valid++;
504 NLA_PUT_U32(skb, i+1, metrics[i]);
505 }
506 }
507
508 if (!valid) {
509 nla_nest_cancel(skb, mx);
510 return 0;
511 }
512
513 return nla_nest_end(skb, mx);
514
515nla_put_failure:
516 nla_nest_cancel(skb, mx);
517 return -EMSGSIZE;
518}
519EXPORT_SYMBOL(rtnetlink_put_metrics);
520
521int rtnl_put_cacheinfo(struct sk_buff *skb, struct dst_entry *dst, u32 id,
522 u32 ts, u32 tsage, long expires, u32 error)
523{
524 struct rta_cacheinfo ci = {
525 .rta_lastuse = jiffies_to_clock_t(jiffies - dst->lastuse),
526 .rta_used = dst->__use,
527 .rta_clntref = atomic_read(&(dst->__refcnt)),
528 .rta_error = error,
529 .rta_id = id,
530 .rta_ts = ts,
531 .rta_tsage = tsage,
532 };
533
534 if (expires)
535 ci.rta_expires = jiffies_to_clock_t(expires);
536
537 return nla_put(skb, RTA_CACHEINFO, sizeof(ci), &ci);
538}
539EXPORT_SYMBOL_GPL(rtnl_put_cacheinfo);
540
541static void set_operstate(struct net_device *dev, unsigned char transition)
542{
543 unsigned char operstate = dev->operstate;
544
545 switch (transition) {
546 case IF_OPER_UP:
547 if ((operstate == IF_OPER_DORMANT ||
548 operstate == IF_OPER_UNKNOWN) &&
549 !netif_dormant(dev))
550 operstate = IF_OPER_UP;
551 break;
552
553 case IF_OPER_DORMANT:
554 if (operstate == IF_OPER_UP ||
555 operstate == IF_OPER_UNKNOWN)
556 operstate = IF_OPER_DORMANT;
557 break;
558 }
559
560 if (dev->operstate != operstate) {
561 write_lock_bh(&dev_base_lock);
562 dev->operstate = operstate;
563 write_unlock_bh(&dev_base_lock);
564 netdev_state_change(dev);
565 }
566}
567
568static unsigned int rtnl_dev_combine_flags(const struct net_device *dev,
569 const struct ifinfomsg *ifm)
570{
571 unsigned int flags = ifm->ifi_flags;
572
573 /* bugwards compatibility: ifi_change == 0 is treated as ~0 */
574 if (ifm->ifi_change)
575 flags = (flags & ifm->ifi_change) |
576 (dev->flags & ~ifm->ifi_change);
577
578 return flags;
579}
580
581static void copy_rtnl_link_stats(struct rtnl_link_stats *a,
582 const struct net_device_stats *b)
583{
584 a->rx_packets = b->rx_packets;
585 a->tx_packets = b->tx_packets;
586 a->rx_bytes = b->rx_bytes;
587 a->tx_bytes = b->tx_bytes;
588 a->rx_errors = b->rx_errors;
589 a->tx_errors = b->tx_errors;
590 a->rx_dropped = b->rx_dropped;
591 a->tx_dropped = b->tx_dropped;
592
593 a->multicast = b->multicast;
594 a->collisions = b->collisions;
595
596 a->rx_length_errors = b->rx_length_errors;
597 a->rx_over_errors = b->rx_over_errors;
598 a->rx_crc_errors = b->rx_crc_errors;
599 a->rx_frame_errors = b->rx_frame_errors;
600 a->rx_fifo_errors = b->rx_fifo_errors;
601 a->rx_missed_errors = b->rx_missed_errors;
602
603 a->tx_aborted_errors = b->tx_aborted_errors;
604 a->tx_carrier_errors = b->tx_carrier_errors;
605 a->tx_fifo_errors = b->tx_fifo_errors;
606 a->tx_heartbeat_errors = b->tx_heartbeat_errors;
607 a->tx_window_errors = b->tx_window_errors;
608
609 a->rx_compressed = b->rx_compressed;
610 a->tx_compressed = b->tx_compressed;
611}
612
613static void copy_rtnl_link_stats64(void *v, const struct net_device_stats *b)
614{
615 struct rtnl_link_stats64 a;
616
617 a.rx_packets = b->rx_packets;
618 a.tx_packets = b->tx_packets;
619 a.rx_bytes = b->rx_bytes;
620 a.tx_bytes = b->tx_bytes;
621 a.rx_errors = b->rx_errors;
622 a.tx_errors = b->tx_errors;
623 a.rx_dropped = b->rx_dropped;
624 a.tx_dropped = b->tx_dropped;
625
626 a.multicast = b->multicast;
627 a.collisions = b->collisions;
628
629 a.rx_length_errors = b->rx_length_errors;
630 a.rx_over_errors = b->rx_over_errors;
631 a.rx_crc_errors = b->rx_crc_errors;
632 a.rx_frame_errors = b->rx_frame_errors;
633 a.rx_fifo_errors = b->rx_fifo_errors;
634 a.rx_missed_errors = b->rx_missed_errors;
635
636 a.tx_aborted_errors = b->tx_aborted_errors;
637 a.tx_carrier_errors = b->tx_carrier_errors;
638 a.tx_fifo_errors = b->tx_fifo_errors;
639 a.tx_heartbeat_errors = b->tx_heartbeat_errors;
640 a.tx_window_errors = b->tx_window_errors;
641
642 a.rx_compressed = b->rx_compressed;
643 a.tx_compressed = b->tx_compressed;
644 memcpy(v, &a, sizeof(a));
645}
646
647static inline int rtnl_vfinfo_size(const struct net_device *dev)
648{
649 if (dev->dev.parent && dev_is_pci(dev->dev.parent))
650 return dev_num_vf(dev->dev.parent) *
651 sizeof(struct ifla_vf_info);
652 else
653 return 0;
654}
655
656static inline size_t if_nlmsg_size(const struct net_device *dev)
657{
658 return NLMSG_ALIGN(sizeof(struct ifinfomsg))
659 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
660 + nla_total_size(IFALIASZ) /* IFLA_IFALIAS */
661 + nla_total_size(IFNAMSIZ) /* IFLA_QDISC */
662 + nla_total_size(sizeof(struct rtnl_link_ifmap))
663 + nla_total_size(sizeof(struct rtnl_link_stats))
664 + nla_total_size(sizeof(struct rtnl_link_stats64))
665 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
666 + nla_total_size(MAX_ADDR_LEN) /* IFLA_BROADCAST */
667 + nla_total_size(4) /* IFLA_TXQLEN */
668 + nla_total_size(4) /* IFLA_WEIGHT */
669 + nla_total_size(4) /* IFLA_MTU */
670 + nla_total_size(4) /* IFLA_LINK */
671 + nla_total_size(4) /* IFLA_MASTER */
672 + nla_total_size(1) /* IFLA_OPERSTATE */
673 + nla_total_size(1) /* IFLA_LINKMODE */
674 + nla_total_size(4) /* IFLA_NUM_VF */
675 + nla_total_size(rtnl_vfinfo_size(dev)) /* IFLA_VFINFO */
676 + rtnl_link_get_size(dev); /* IFLA_LINKINFO */
677}
678
679static int rtnl_fill_ifinfo(struct sk_buff *skb, struct net_device *dev,
680 int type, u32 pid, u32 seq, u32 change,
681 unsigned int flags)
682{
683 struct ifinfomsg *ifm;
684 struct nlmsghdr *nlh;
685 const struct net_device_stats *stats;
686 struct nlattr *attr;
687
688 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ifm), flags);
689 if (nlh == NULL)
690 return -EMSGSIZE;
691
692 ifm = nlmsg_data(nlh);
693 ifm->ifi_family = AF_UNSPEC;
694 ifm->__ifi_pad = 0;
695 ifm->ifi_type = dev->type;
696 ifm->ifi_index = dev->ifindex;
697 ifm->ifi_flags = dev_get_flags(dev);
698 ifm->ifi_change = change;
699
700 NLA_PUT_STRING(skb, IFLA_IFNAME, dev->name);
701 NLA_PUT_U32(skb, IFLA_TXQLEN, dev->tx_queue_len);
702 NLA_PUT_U8(skb, IFLA_OPERSTATE,
703 netif_running(dev) ? dev->operstate : IF_OPER_DOWN);
704 NLA_PUT_U8(skb, IFLA_LINKMODE, dev->link_mode);
705 NLA_PUT_U32(skb, IFLA_MTU, dev->mtu);
706
707 if (dev->ifindex != dev->iflink)
708 NLA_PUT_U32(skb, IFLA_LINK, dev->iflink);
709
710 if (dev->master)
711 NLA_PUT_U32(skb, IFLA_MASTER, dev->master->ifindex);
712
713 if (dev->qdisc)
714 NLA_PUT_STRING(skb, IFLA_QDISC, dev->qdisc->ops->id);
715
716 if (dev->ifalias)
717 NLA_PUT_STRING(skb, IFLA_IFALIAS, dev->ifalias);
718
719 if (1) {
720 struct rtnl_link_ifmap map = {
721 .mem_start = dev->mem_start,
722 .mem_end = dev->mem_end,
723 .base_addr = dev->base_addr,
724 .irq = dev->irq,
725 .dma = dev->dma,
726 .port = dev->if_port,
727 };
728 NLA_PUT(skb, IFLA_MAP, sizeof(map), &map);
729 }
730
731 if (dev->addr_len) {
732 NLA_PUT(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr);
733 NLA_PUT(skb, IFLA_BROADCAST, dev->addr_len, dev->broadcast);
734 }
735
736 attr = nla_reserve(skb, IFLA_STATS,
737 sizeof(struct rtnl_link_stats));
738 if (attr == NULL)
739 goto nla_put_failure;
740
741 stats = dev_get_stats(dev);
742 copy_rtnl_link_stats(nla_data(attr), stats);
743
744 attr = nla_reserve(skb, IFLA_STATS64,
745 sizeof(struct rtnl_link_stats64));
746 if (attr == NULL)
747 goto nla_put_failure;
748 copy_rtnl_link_stats64(nla_data(attr), stats);
749
750 if (dev->netdev_ops->ndo_get_vf_config && dev->dev.parent) {
751 int i;
752 struct ifla_vf_info ivi;
753
754 NLA_PUT_U32(skb, IFLA_NUM_VF, dev_num_vf(dev->dev.parent));
755 for (i = 0; i < dev_num_vf(dev->dev.parent); i++) {
756 if (dev->netdev_ops->ndo_get_vf_config(dev, i, &ivi))
757 break;
758 NLA_PUT(skb, IFLA_VFINFO, sizeof(ivi), &ivi);
759 }
760 }
761 if (dev->rtnl_link_ops) {
762 if (rtnl_link_fill(skb, dev) < 0)
763 goto nla_put_failure;
764 }
765
766 return nlmsg_end(skb, nlh);
767
768nla_put_failure:
769 nlmsg_cancel(skb, nlh);
770 return -EMSGSIZE;
771}
772
773static int rtnl_dump_ifinfo(struct sk_buff *skb, struct netlink_callback *cb)
774{
775 struct net *net = sock_net(skb->sk);
776 int h, s_h;
777 int idx = 0, s_idx;
778 struct net_device *dev;
779 struct hlist_head *head;
780 struct hlist_node *node;
781
782 s_h = cb->args[0];
783 s_idx = cb->args[1];
784
785 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
786 idx = 0;
787 head = &net->dev_index_head[h];
788 hlist_for_each_entry(dev, node, head, index_hlist) {
789 if (idx < s_idx)
790 goto cont;
791 if (rtnl_fill_ifinfo(skb, dev, RTM_NEWLINK,
792 NETLINK_CB(cb->skb).pid,
793 cb->nlh->nlmsg_seq, 0,
794 NLM_F_MULTI) <= 0)
795 goto out;
796cont:
797 idx++;
798 }
799 }
800out:
801 cb->args[1] = idx;
802 cb->args[0] = h;
803
804 return skb->len;
805}
806
807const struct nla_policy ifla_policy[IFLA_MAX+1] = {
808 [IFLA_IFNAME] = { .type = NLA_STRING, .len = IFNAMSIZ-1 },
809 [IFLA_ADDRESS] = { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
810 [IFLA_BROADCAST] = { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
811 [IFLA_MAP] = { .len = sizeof(struct rtnl_link_ifmap) },
812 [IFLA_MTU] = { .type = NLA_U32 },
813 [IFLA_LINK] = { .type = NLA_U32 },
814 [IFLA_TXQLEN] = { .type = NLA_U32 },
815 [IFLA_WEIGHT] = { .type = NLA_U32 },
816 [IFLA_OPERSTATE] = { .type = NLA_U8 },
817 [IFLA_LINKMODE] = { .type = NLA_U8 },
818 [IFLA_LINKINFO] = { .type = NLA_NESTED },
819 [IFLA_NET_NS_PID] = { .type = NLA_U32 },
820 [IFLA_IFALIAS] = { .type = NLA_STRING, .len = IFALIASZ-1 },
821 [IFLA_VF_MAC] = { .type = NLA_BINARY,
822 .len = sizeof(struct ifla_vf_mac) },
823 [IFLA_VF_VLAN] = { .type = NLA_BINARY,
824 .len = sizeof(struct ifla_vf_vlan) },
825 [IFLA_VF_TX_RATE] = { .type = NLA_BINARY,
826 .len = sizeof(struct ifla_vf_tx_rate) },
827};
828EXPORT_SYMBOL(ifla_policy);
829
830static const struct nla_policy ifla_info_policy[IFLA_INFO_MAX+1] = {
831 [IFLA_INFO_KIND] = { .type = NLA_STRING },
832 [IFLA_INFO_DATA] = { .type = NLA_NESTED },
833};
834
835struct net *rtnl_link_get_net(struct net *src_net, struct nlattr *tb[])
836{
837 struct net *net;
838 /* Examine the link attributes and figure out which
839 * network namespace we are talking about.
840 */
841 if (tb[IFLA_NET_NS_PID])
842 net = get_net_ns_by_pid(nla_get_u32(tb[IFLA_NET_NS_PID]));
843 else
844 net = get_net(src_net);
845 return net;
846}
847EXPORT_SYMBOL(rtnl_link_get_net);
848
849static int validate_linkmsg(struct net_device *dev, struct nlattr *tb[])
850{
851 if (dev) {
852 if (tb[IFLA_ADDRESS] &&
853 nla_len(tb[IFLA_ADDRESS]) < dev->addr_len)
854 return -EINVAL;
855
856 if (tb[IFLA_BROADCAST] &&
857 nla_len(tb[IFLA_BROADCAST]) < dev->addr_len)
858 return -EINVAL;
859 }
860
861 return 0;
862}
863
864static int do_setlink(struct net_device *dev, struct ifinfomsg *ifm,
865 struct nlattr **tb, char *ifname, int modified)
866{
867 const struct net_device_ops *ops = dev->netdev_ops;
868 int send_addr_notify = 0;
869 int err;
870
871 if (tb[IFLA_NET_NS_PID]) {
872 struct net *net = rtnl_link_get_net(dev_net(dev), tb);
873 if (IS_ERR(net)) {
874 err = PTR_ERR(net);
875 goto errout;
876 }
877 err = dev_change_net_namespace(dev, net, ifname);
878 put_net(net);
879 if (err)
880 goto errout;
881 modified = 1;
882 }
883
884 if (tb[IFLA_MAP]) {
885 struct rtnl_link_ifmap *u_map;
886 struct ifmap k_map;
887
888 if (!ops->ndo_set_config) {
889 err = -EOPNOTSUPP;
890 goto errout;
891 }
892
893 if (!netif_device_present(dev)) {
894 err = -ENODEV;
895 goto errout;
896 }
897
898 u_map = nla_data(tb[IFLA_MAP]);
899 k_map.mem_start = (unsigned long) u_map->mem_start;
900 k_map.mem_end = (unsigned long) u_map->mem_end;
901 k_map.base_addr = (unsigned short) u_map->base_addr;
902 k_map.irq = (unsigned char) u_map->irq;
903 k_map.dma = (unsigned char) u_map->dma;
904 k_map.port = (unsigned char) u_map->port;
905
906 err = ops->ndo_set_config(dev, &k_map);
907 if (err < 0)
908 goto errout;
909
910 modified = 1;
911 }
912
913 if (tb[IFLA_ADDRESS]) {
914 struct sockaddr *sa;
915 int len;
916
917 if (!ops->ndo_set_mac_address) {
918 err = -EOPNOTSUPP;
919 goto errout;
920 }
921
922 if (!netif_device_present(dev)) {
923 err = -ENODEV;
924 goto errout;
925 }
926
927 len = sizeof(sa_family_t) + dev->addr_len;
928 sa = kmalloc(len, GFP_KERNEL);
929 if (!sa) {
930 err = -ENOMEM;
931 goto errout;
932 }
933 sa->sa_family = dev->type;
934 memcpy(sa->sa_data, nla_data(tb[IFLA_ADDRESS]),
935 dev->addr_len);
936 err = ops->ndo_set_mac_address(dev, sa);
937 kfree(sa);
938 if (err)
939 goto errout;
940 send_addr_notify = 1;
941 modified = 1;
942 }
943
944 if (tb[IFLA_MTU]) {
945 err = dev_set_mtu(dev, nla_get_u32(tb[IFLA_MTU]));
946 if (err < 0)
947 goto errout;
948 modified = 1;
949 }
950
951 /*
952 * Interface selected by interface index but interface
953 * name provided implies that a name change has been
954 * requested.
955 */
956 if (ifm->ifi_index > 0 && ifname[0]) {
957 err = dev_change_name(dev, ifname);
958 if (err < 0)
959 goto errout;
960 modified = 1;
961 }
962
963 if (tb[IFLA_IFALIAS]) {
964 err = dev_set_alias(dev, nla_data(tb[IFLA_IFALIAS]),
965 nla_len(tb[IFLA_IFALIAS]));
966 if (err < 0)
967 goto errout;
968 modified = 1;
969 }
970
971 if (tb[IFLA_BROADCAST]) {
972 nla_memcpy(dev->broadcast, tb[IFLA_BROADCAST], dev->addr_len);
973 send_addr_notify = 1;
974 }
975
976 if (ifm->ifi_flags || ifm->ifi_change) {
977 err = dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm));
978 if (err < 0)
979 goto errout;
980 }
981
982 if (tb[IFLA_TXQLEN])
983 dev->tx_queue_len = nla_get_u32(tb[IFLA_TXQLEN]);
984
985 if (tb[IFLA_OPERSTATE])
986 set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
987
988 if (tb[IFLA_LINKMODE]) {
989 write_lock_bh(&dev_base_lock);
990 dev->link_mode = nla_get_u8(tb[IFLA_LINKMODE]);
991 write_unlock_bh(&dev_base_lock);
992 }
993
994 if (tb[IFLA_VF_MAC]) {
995 struct ifla_vf_mac *ivm;
996 ivm = nla_data(tb[IFLA_VF_MAC]);
997 err = -EOPNOTSUPP;
998 if (ops->ndo_set_vf_mac)
999 err = ops->ndo_set_vf_mac(dev, ivm->vf, ivm->mac);
1000 if (err < 0)
1001 goto errout;
1002 modified = 1;
1003 }
1004
1005 if (tb[IFLA_VF_VLAN]) {
1006 struct ifla_vf_vlan *ivv;
1007 ivv = nla_data(tb[IFLA_VF_VLAN]);
1008 err = -EOPNOTSUPP;
1009 if (ops->ndo_set_vf_vlan)
1010 err = ops->ndo_set_vf_vlan(dev, ivv->vf,
1011 ivv->vlan,
1012 ivv->qos);
1013 if (err < 0)
1014 goto errout;
1015 modified = 1;
1016 }
1017 err = 0;
1018
1019 if (tb[IFLA_VF_TX_RATE]) {
1020 struct ifla_vf_tx_rate *ivt;
1021 ivt = nla_data(tb[IFLA_VF_TX_RATE]);
1022 err = -EOPNOTSUPP;
1023 if (ops->ndo_set_vf_tx_rate)
1024 err = ops->ndo_set_vf_tx_rate(dev, ivt->vf, ivt->rate);
1025 if (err < 0)
1026 goto errout;
1027 modified = 1;
1028 }
1029 err = 0;
1030
1031errout:
1032 if (err < 0 && modified && net_ratelimit())
1033 printk(KERN_WARNING "A link change request failed with "
1034 "some changes comitted already. Interface %s may "
1035 "have been left with an inconsistent configuration, "
1036 "please check.\n", dev->name);
1037
1038 if (send_addr_notify)
1039 call_netdevice_notifiers(NETDEV_CHANGEADDR, dev);
1040 return err;
1041}
1042
1043static int rtnl_setlink(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1044{
1045 struct net *net = sock_net(skb->sk);
1046 struct ifinfomsg *ifm;
1047 struct net_device *dev;
1048 int err;
1049 struct nlattr *tb[IFLA_MAX+1];
1050 char ifname[IFNAMSIZ];
1051
1052 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy);
1053 if (err < 0)
1054 goto errout;
1055
1056 if (tb[IFLA_IFNAME])
1057 nla_strlcpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
1058 else
1059 ifname[0] = '\0';
1060
1061 err = -EINVAL;
1062 ifm = nlmsg_data(nlh);
1063 if (ifm->ifi_index > 0)
1064 dev = __dev_get_by_index(net, ifm->ifi_index);
1065 else if (tb[IFLA_IFNAME])
1066 dev = __dev_get_by_name(net, ifname);
1067 else
1068 goto errout;
1069
1070 if (dev == NULL) {
1071 err = -ENODEV;
1072 goto errout;
1073 }
1074
1075 err = validate_linkmsg(dev, tb);
1076 if (err < 0)
1077 goto errout;
1078
1079 err = do_setlink(dev, ifm, tb, ifname, 0);
1080errout:
1081 return err;
1082}
1083
1084static int rtnl_dellink(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1085{
1086 struct net *net = sock_net(skb->sk);
1087 const struct rtnl_link_ops *ops;
1088 struct net_device *dev;
1089 struct ifinfomsg *ifm;
1090 char ifname[IFNAMSIZ];
1091 struct nlattr *tb[IFLA_MAX+1];
1092 int err;
1093
1094 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy);
1095 if (err < 0)
1096 return err;
1097
1098 if (tb[IFLA_IFNAME])
1099 nla_strlcpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
1100
1101 ifm = nlmsg_data(nlh);
1102 if (ifm->ifi_index > 0)
1103 dev = __dev_get_by_index(net, ifm->ifi_index);
1104 else if (tb[IFLA_IFNAME])
1105 dev = __dev_get_by_name(net, ifname);
1106 else
1107 return -EINVAL;
1108
1109 if (!dev)
1110 return -ENODEV;
1111
1112 ops = dev->rtnl_link_ops;
1113 if (!ops)
1114 return -EOPNOTSUPP;
1115
1116 ops->dellink(dev, NULL);
1117 return 0;
1118}
1119
1120int rtnl_configure_link(struct net_device *dev, const struct ifinfomsg *ifm)
1121{
1122 unsigned int old_flags;
1123 int err;
1124
1125 old_flags = dev->flags;
1126 if (ifm && (ifm->ifi_flags || ifm->ifi_change)) {
1127 err = __dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm));
1128 if (err < 0)
1129 return err;
1130 }
1131
1132 dev->rtnl_link_state = RTNL_LINK_INITIALIZED;
1133 rtmsg_ifinfo(RTM_NEWLINK, dev, ~0U);
1134
1135 __dev_notify_flags(dev, old_flags);
1136 return 0;
1137}
1138EXPORT_SYMBOL(rtnl_configure_link);
1139
1140struct net_device *rtnl_create_link(struct net *src_net, struct net *net,
1141 char *ifname, const struct rtnl_link_ops *ops, struct nlattr *tb[])
1142{
1143 int err;
1144 struct net_device *dev;
1145 unsigned int num_queues = 1;
1146 unsigned int real_num_queues = 1;
1147
1148 if (ops->get_tx_queues) {
1149 err = ops->get_tx_queues(src_net, tb, &num_queues,
1150 &real_num_queues);
1151 if (err)
1152 goto err;
1153 }
1154 err = -ENOMEM;
1155 dev = alloc_netdev_mq(ops->priv_size, ifname, ops->setup, num_queues);
1156 if (!dev)
1157 goto err;
1158
1159 dev_net_set(dev, net);
1160 dev->rtnl_link_ops = ops;
1161 dev->rtnl_link_state = RTNL_LINK_INITIALIZING;
1162 dev->real_num_tx_queues = real_num_queues;
1163
1164 if (strchr(dev->name, '%')) {
1165 err = dev_alloc_name(dev, dev->name);
1166 if (err < 0)
1167 goto err_free;
1168 }
1169
1170 if (tb[IFLA_MTU])
1171 dev->mtu = nla_get_u32(tb[IFLA_MTU]);
1172 if (tb[IFLA_ADDRESS])
1173 memcpy(dev->dev_addr, nla_data(tb[IFLA_ADDRESS]),
1174 nla_len(tb[IFLA_ADDRESS]));
1175 if (tb[IFLA_BROADCAST])
1176 memcpy(dev->broadcast, nla_data(tb[IFLA_BROADCAST]),
1177 nla_len(tb[IFLA_BROADCAST]));
1178 if (tb[IFLA_TXQLEN])
1179 dev->tx_queue_len = nla_get_u32(tb[IFLA_TXQLEN]);
1180 if (tb[IFLA_OPERSTATE])
1181 set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
1182 if (tb[IFLA_LINKMODE])
1183 dev->link_mode = nla_get_u8(tb[IFLA_LINKMODE]);
1184
1185 return dev;
1186
1187err_free:
1188 free_netdev(dev);
1189err:
1190 return ERR_PTR(err);
1191}
1192EXPORT_SYMBOL(rtnl_create_link);
1193
1194static int rtnl_newlink(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1195{
1196 struct net *net = sock_net(skb->sk);
1197 const struct rtnl_link_ops *ops;
1198 struct net_device *dev;
1199 struct ifinfomsg *ifm;
1200 char kind[MODULE_NAME_LEN];
1201 char ifname[IFNAMSIZ];
1202 struct nlattr *tb[IFLA_MAX+1];
1203 struct nlattr *linkinfo[IFLA_INFO_MAX+1];
1204 int err;
1205
1206#ifdef CONFIG_MODULES
1207replay:
1208#endif
1209 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy);
1210 if (err < 0)
1211 return err;
1212
1213 if (tb[IFLA_IFNAME])
1214 nla_strlcpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
1215 else
1216 ifname[0] = '\0';
1217
1218 ifm = nlmsg_data(nlh);
1219 if (ifm->ifi_index > 0)
1220 dev = __dev_get_by_index(net, ifm->ifi_index);
1221 else if (ifname[0])
1222 dev = __dev_get_by_name(net, ifname);
1223 else
1224 dev = NULL;
1225
1226 err = validate_linkmsg(dev, tb);
1227 if (err < 0)
1228 return err;
1229
1230 if (tb[IFLA_LINKINFO]) {
1231 err = nla_parse_nested(linkinfo, IFLA_INFO_MAX,
1232 tb[IFLA_LINKINFO], ifla_info_policy);
1233 if (err < 0)
1234 return err;
1235 } else
1236 memset(linkinfo, 0, sizeof(linkinfo));
1237
1238 if (linkinfo[IFLA_INFO_KIND]) {
1239 nla_strlcpy(kind, linkinfo[IFLA_INFO_KIND], sizeof(kind));
1240 ops = rtnl_link_ops_get(kind);
1241 } else {
1242 kind[0] = '\0';
1243 ops = NULL;
1244 }
1245
1246 if (1) {
1247 struct nlattr *attr[ops ? ops->maxtype + 1 : 0], **data = NULL;
1248 struct net *dest_net;
1249
1250 if (ops) {
1251 if (ops->maxtype && linkinfo[IFLA_INFO_DATA]) {
1252 err = nla_parse_nested(attr, ops->maxtype,
1253 linkinfo[IFLA_INFO_DATA],
1254 ops->policy);
1255 if (err < 0)
1256 return err;
1257 data = attr;
1258 }
1259 if (ops->validate) {
1260 err = ops->validate(tb, data);
1261 if (err < 0)
1262 return err;
1263 }
1264 }
1265
1266 if (dev) {
1267 int modified = 0;
1268
1269 if (nlh->nlmsg_flags & NLM_F_EXCL)
1270 return -EEXIST;
1271 if (nlh->nlmsg_flags & NLM_F_REPLACE)
1272 return -EOPNOTSUPP;
1273
1274 if (linkinfo[IFLA_INFO_DATA]) {
1275 if (!ops || ops != dev->rtnl_link_ops ||
1276 !ops->changelink)
1277 return -EOPNOTSUPP;
1278
1279 err = ops->changelink(dev, tb, data);
1280 if (err < 0)
1281 return err;
1282 modified = 1;
1283 }
1284
1285 return do_setlink(dev, ifm, tb, ifname, modified);
1286 }
1287
1288 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
1289 return -ENODEV;
1290
1291 if (ifm->ifi_index)
1292 return -EOPNOTSUPP;
1293 if (tb[IFLA_MAP] || tb[IFLA_MASTER] || tb[IFLA_PROTINFO])
1294 return -EOPNOTSUPP;
1295
1296 if (!ops) {
1297#ifdef CONFIG_MODULES
1298 if (kind[0]) {
1299 __rtnl_unlock();
1300 request_module("rtnl-link-%s", kind);
1301 rtnl_lock();
1302 ops = rtnl_link_ops_get(kind);
1303 if (ops)
1304 goto replay;
1305 }
1306#endif
1307 return -EOPNOTSUPP;
1308 }
1309
1310 if (!ifname[0])
1311 snprintf(ifname, IFNAMSIZ, "%s%%d", ops->kind);
1312
1313 dest_net = rtnl_link_get_net(net, tb);
1314 dev = rtnl_create_link(net, dest_net, ifname, ops, tb);
1315
1316 if (IS_ERR(dev))
1317 err = PTR_ERR(dev);
1318 else if (ops->newlink)
1319 err = ops->newlink(net, dev, tb, data);
1320 else
1321 err = register_netdevice(dev);
1322 if (err < 0 && !IS_ERR(dev)) {
1323 free_netdev(dev);
1324 goto out;
1325 }
1326
1327 err = rtnl_configure_link(dev, ifm);
1328 if (err < 0)
1329 unregister_netdevice(dev);
1330out:
1331 put_net(dest_net);
1332 return err;
1333 }
1334}
1335
1336static int rtnl_getlink(struct sk_buff *skb, struct nlmsghdr* nlh, void *arg)
1337{
1338 struct net *net = sock_net(skb->sk);
1339 struct ifinfomsg *ifm;
1340 char ifname[IFNAMSIZ];
1341 struct nlattr *tb[IFLA_MAX+1];
1342 struct net_device *dev = NULL;
1343 struct sk_buff *nskb;
1344 int err;
1345
1346 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy);
1347 if (err < 0)
1348 return err;
1349
1350 if (tb[IFLA_IFNAME])
1351 nla_strlcpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
1352
1353 ifm = nlmsg_data(nlh);
1354 if (ifm->ifi_index > 0)
1355 dev = __dev_get_by_index(net, ifm->ifi_index);
1356 else if (tb[IFLA_IFNAME])
1357 dev = __dev_get_by_name(net, ifname);
1358 else
1359 return -EINVAL;
1360
1361 if (dev == NULL)
1362 return -ENODEV;
1363
1364 nskb = nlmsg_new(if_nlmsg_size(dev), GFP_KERNEL);
1365 if (nskb == NULL)
1366 return -ENOBUFS;
1367
1368 err = rtnl_fill_ifinfo(nskb, dev, RTM_NEWLINK, NETLINK_CB(skb).pid,
1369 nlh->nlmsg_seq, 0, 0);
1370 if (err < 0) {
1371 /* -EMSGSIZE implies BUG in if_nlmsg_size */
1372 WARN_ON(err == -EMSGSIZE);
1373 kfree_skb(nskb);
1374 } else
1375 err = rtnl_unicast(nskb, net, NETLINK_CB(skb).pid);
1376
1377 return err;
1378}
1379
1380static int rtnl_dump_all(struct sk_buff *skb, struct netlink_callback *cb)
1381{
1382 int idx;
1383 int s_idx = cb->family;
1384
1385 if (s_idx == 0)
1386 s_idx = 1;
1387 for (idx = 1; idx < NPROTO; idx++) {
1388 int type = cb->nlh->nlmsg_type-RTM_BASE;
1389 if (idx < s_idx || idx == PF_PACKET)
1390 continue;
1391 if (rtnl_msg_handlers[idx] == NULL ||
1392 rtnl_msg_handlers[idx][type].dumpit == NULL)
1393 continue;
1394 if (idx > s_idx)
1395 memset(&cb->args[0], 0, sizeof(cb->args));
1396 if (rtnl_msg_handlers[idx][type].dumpit(skb, cb))
1397 break;
1398 }
1399 cb->family = idx;
1400
1401 return skb->len;
1402}
1403
1404void rtmsg_ifinfo(int type, struct net_device *dev, unsigned change)
1405{
1406 struct net *net = dev_net(dev);
1407 struct sk_buff *skb;
1408 int err = -ENOBUFS;
1409
1410 skb = nlmsg_new(if_nlmsg_size(dev), GFP_KERNEL);
1411 if (skb == NULL)
1412 goto errout;
1413
1414 err = rtnl_fill_ifinfo(skb, dev, type, 0, 0, change, 0);
1415 if (err < 0) {
1416 /* -EMSGSIZE implies BUG in if_nlmsg_size() */
1417 WARN_ON(err == -EMSGSIZE);
1418 kfree_skb(skb);
1419 goto errout;
1420 }
1421 rtnl_notify(skb, net, 0, RTNLGRP_LINK, NULL, GFP_KERNEL);
1422 return;
1423errout:
1424 if (err < 0)
1425 rtnl_set_sk_err(net, RTNLGRP_LINK, err);
1426}
1427
/*
 * Scratch table of attribute pointers handed to doit handlers, and the
 * number of entries it holds.  rtnetlink_init() sizes the table to the
 * largest rta_max[] value; rtnetlink_rcv_msg() clears and refills it for
 * each message.
 *
 * Protected by RTNL semaphore.
 */
static struct rtattr **rta_buf;
static int rtattr_max;
1431
1432/* Process one rtnetlink message. */
1433
1434static int rtnetlink_rcv_msg(struct sk_buff *skb, struct nlmsghdr *nlh)
1435{
1436 struct net *net = sock_net(skb->sk);
1437 rtnl_doit_func doit;
1438 int sz_idx, kind;
1439 int min_len;
1440 int family;
1441 int type;
1442 int err;
1443
1444 type = nlh->nlmsg_type;
1445 if (type > RTM_MAX)
1446 return -EOPNOTSUPP;
1447
1448 type -= RTM_BASE;
1449
1450 /* All the messages must have at least 1 byte length */
1451 if (nlh->nlmsg_len < NLMSG_LENGTH(sizeof(struct rtgenmsg)))
1452 return 0;
1453
1454 family = ((struct rtgenmsg *)NLMSG_DATA(nlh))->rtgen_family;
1455 sz_idx = type>>2;
1456 kind = type&3;
1457
1458 if (kind != 2 && security_netlink_recv(skb, CAP_NET_ADMIN))
1459 return -EPERM;
1460
1461 if (kind == 2 && nlh->nlmsg_flags&NLM_F_DUMP) {
1462 struct sock *rtnl;
1463 rtnl_dumpit_func dumpit;
1464
1465 dumpit = rtnl_get_dumpit(family, type);
1466 if (dumpit == NULL)
1467 return -EOPNOTSUPP;
1468
1469 __rtnl_unlock();
1470 rtnl = net->rtnl;
1471 err = netlink_dump_start(rtnl, skb, nlh, dumpit, NULL);
1472 rtnl_lock();
1473 return err;
1474 }
1475
1476 memset(rta_buf, 0, (rtattr_max * sizeof(struct rtattr *)));
1477
1478 min_len = rtm_min[sz_idx];
1479 if (nlh->nlmsg_len < min_len)
1480 return -EINVAL;
1481
1482 if (nlh->nlmsg_len > min_len) {
1483 int attrlen = nlh->nlmsg_len - NLMSG_ALIGN(min_len);
1484 struct rtattr *attr = (void *)nlh + NLMSG_ALIGN(min_len);
1485
1486 while (RTA_OK(attr, attrlen)) {
1487 unsigned flavor = attr->rta_type;
1488 if (flavor) {
1489 if (flavor > rta_max[sz_idx])
1490 return -EINVAL;
1491 rta_buf[flavor-1] = attr;
1492 }
1493 attr = RTA_NEXT(attr, attrlen);
1494 }
1495 }
1496
1497 doit = rtnl_get_doit(family, type);
1498 if (doit == NULL)
1499 return -EOPNOTSUPP;
1500
1501 return doit(skb, nlh, (void *)&rta_buf[0]);
1502}
1503
1504static void rtnetlink_rcv(struct sk_buff *skb)
1505{
1506 rtnl_lock();
1507 netlink_rcv_skb(skb, &rtnetlink_rcv_msg);
1508 rtnl_unlock();
1509}
1510
1511static int rtnetlink_event(struct notifier_block *this, unsigned long event, void *ptr)
1512{
1513 struct net_device *dev = ptr;
1514
1515 switch (event) {
1516 case NETDEV_UP:
1517 case NETDEV_DOWN:
1518 case NETDEV_PRE_UP:
1519 case NETDEV_POST_INIT:
1520 case NETDEV_REGISTER:
1521 case NETDEV_CHANGE:
1522 case NETDEV_PRE_TYPE_CHANGE:
1523 case NETDEV_GOING_DOWN:
1524 case NETDEV_UNREGISTER:
1525 case NETDEV_UNREGISTER_BATCH:
1526 break;
1527 default:
1528 rtmsg_ifinfo(RTM_NEWLINK, dev, 0);
1529 break;
1530 }
1531 return NOTIFY_DONE;
1532}
1533
/* Notifier block that routes netdevice events to rtnetlink_event(). */
static struct notifier_block rtnetlink_dev_notifier = {
	.notifier_call	= rtnetlink_event,
};
1537
1538
1539static int __net_init rtnetlink_net_init(struct net *net)
1540{
1541 struct sock *sk;
1542 sk = netlink_kernel_create(net, NETLINK_ROUTE, RTNLGRP_MAX,
1543 rtnetlink_rcv, &rtnl_mutex, THIS_MODULE);
1544 if (!sk)
1545 return -ENOMEM;
1546 net->rtnl = sk;
1547 return 0;
1548}
1549
1550static void __net_exit rtnetlink_net_exit(struct net *net)
1551{
1552 netlink_kernel_release(net->rtnl);
1553 net->rtnl = NULL;
1554}
1555
/* Per-namespace hooks that create and release the rtnetlink socket. */
static struct pernet_operations rtnetlink_net_ops = {
	.init = rtnetlink_net_init,
	.exit = rtnetlink_net_exit,
};
1560
1561void __init rtnetlink_init(void)
1562{
1563 int i;
1564
1565 rtattr_max = 0;
1566 for (i = 0; i < ARRAY_SIZE(rta_max); i++)
1567 if (rta_max[i] > rtattr_max)
1568 rtattr_max = rta_max[i];
1569 rta_buf = kmalloc(rtattr_max * sizeof(struct rtattr *), GFP_KERNEL);
1570 if (!rta_buf)
1571 panic("rtnetlink_init: cannot allocate rta_buf\n");
1572
1573 if (register_pernet_subsys(&rtnetlink_net_ops))
1574 panic("rtnetlink_init: cannot initialize rtnetlink\n");
1575
1576 netlink_set_nonroot(NETLINK_ROUTE, NL_NONROOT_RECV);
1577 register_netdevice_notifier(&rtnetlink_dev_notifier);
1578
1579 rtnl_register(PF_UNSPEC, RTM_GETLINK, rtnl_getlink, rtnl_dump_ifinfo);
1580 rtnl_register(PF_UNSPEC, RTM_SETLINK, rtnl_setlink, NULL);
1581 rtnl_register(PF_UNSPEC, RTM_NEWLINK, rtnl_newlink, NULL);
1582 rtnl_register(PF_UNSPEC, RTM_DELLINK, rtnl_dellink, NULL);
1583
1584 rtnl_register(PF_UNSPEC, RTM_GETADDR, NULL, rtnl_dump_all);
1585 rtnl_register(PF_UNSPEC, RTM_GETROUTE, NULL, rtnl_dump_all);
1586}
1587