]> bbs.cooldavid.org Git - net-next-2.6.git/blame - net/ipv6/ip6_tunnel.c
[IP_TUNNEL]: Don't limit the number of tunnels with generic name explicitly.
[net-next-2.6.git] / net / ipv6 / ip6_tunnel.c
CommitLineData
1da177e4 1/*
c4d3efaf 2 * IPv6 tunneling device
1da177e4
LT
3 * Linux INET6 implementation
4 *
5 * Authors:
1ab1457c 6 * Ville Nuorvala <vnuorval@tcs.hut.fi>
c4d3efaf 7 * Yasuyuki Kozakai <kozakai@linux-ipv6.org>
1da177e4
LT
8 *
9 * $Id$
10 *
11 * Based on:
c4d3efaf 12 * linux/net/ipv6/sit.c and linux/net/ipv4/ipip.c
1da177e4
LT
13 *
14 * RFC 2473
15 *
16 * This program is free software; you can redistribute it and/or
17 * modify it under the terms of the GNU General Public License
18 * as published by the Free Software Foundation; either version
19 * 2 of the License, or (at your option) any later version.
20 *
21 */
22
1da177e4 23#include <linux/module.h>
4fc268d2 24#include <linux/capability.h>
1da177e4
LT
25#include <linux/errno.h>
26#include <linux/types.h>
27#include <linux/sockios.h>
c4d3efaf 28#include <linux/icmp.h>
1da177e4
LT
29#include <linux/if.h>
30#include <linux/in.h>
31#include <linux/ip.h>
32#include <linux/if_tunnel.h>
33#include <linux/net.h>
34#include <linux/in6.h>
35#include <linux/netdevice.h>
36#include <linux/if_arp.h>
37#include <linux/icmpv6.h>
38#include <linux/init.h>
39#include <linux/route.h>
40#include <linux/rtnetlink.h>
41#include <linux/netfilter_ipv6.h>
42
43#include <asm/uaccess.h>
44#include <asm/atomic.h>
45
c4d3efaf 46#include <net/icmp.h>
1da177e4
LT
47#include <net/ip.h>
48#include <net/ipv6.h>
1da177e4
LT
49#include <net/ip6_route.h>
50#include <net/addrconf.h>
51#include <net/ip6_tunnel.h>
52#include <net/xfrm.h>
53#include <net/dsfield.h>
54#include <net/inet_ecn.h>
55
56MODULE_AUTHOR("Ville Nuorvala");
c4d3efaf 57MODULE_DESCRIPTION("IPv6 tunneling device");
1da177e4
LT
58MODULE_LICENSE("GPL");
59
60#define IPV6_TLV_TEL_DST_SIZE 8
61
62#ifdef IP6_TNL_DEBUG
63#define IP6_TNL_TRACE(x...) printk(KERN_DEBUG "%s:" x "\n", __FUNCTION__)
64#else
65#define IP6_TNL_TRACE(x...) do {;} while(0)
66#endif
67
68#define IPV6_TCLASS_MASK (IPV6_FLOWINFO_MASK & ~IPV6_FLOWLABEL_MASK)
c4d3efaf 69#define IPV6_TCLASS_SHIFT 20
1da177e4
LT
70
71#define HASH_SIZE 32
72
e69a4adc 73#define HASH(addr) ((__force u32)((addr)->s6_addr32[0] ^ (addr)->s6_addr32[1] ^ \
1ab1457c
YH
74 (addr)->s6_addr32[2] ^ (addr)->s6_addr32[3]) & \
75 (HASH_SIZE - 1))
1da177e4 76
3144581c
YK
77static int ip6_fb_tnl_dev_init(struct net_device *dev);
78static int ip6_tnl_dev_init(struct net_device *dev);
79static void ip6_tnl_dev_setup(struct net_device *dev);
1da177e4
LT
80
81/* the IPv6 tunnel fallback device */
3144581c 82static struct net_device *ip6_fb_tnl_dev;
1da177e4
LT
83
84
85/* lists for storing tunnels in use */
86static struct ip6_tnl *tnls_r_l[HASH_SIZE];
87static struct ip6_tnl *tnls_wc[1];
88static struct ip6_tnl **tnls[2] = { tnls_wc, tnls_r_l };
89
90/* lock for the tunnel lists */
3144581c 91static DEFINE_RWLOCK(ip6_tnl_lock);
1da177e4
LT
92
93static inline struct dst_entry *ip6_tnl_dst_check(struct ip6_tnl *t)
94{
95 struct dst_entry *dst = t->dst_cache;
96
1ab1457c 97 if (dst && dst->obsolete &&
1da177e4
LT
98 dst->ops->check(dst, t->dst_cookie) == NULL) {
99 t->dst_cache = NULL;
100 dst_release(dst);
101 return NULL;
102 }
103
104 return dst;
105}
106
107static inline void ip6_tnl_dst_reset(struct ip6_tnl *t)
108{
109 dst_release(t->dst_cache);
110 t->dst_cache = NULL;
111}
112
113static inline void ip6_tnl_dst_store(struct ip6_tnl *t, struct dst_entry *dst)
114{
115 struct rt6_info *rt = (struct rt6_info *) dst;
116 t->dst_cookie = rt->rt6i_node ? rt->rt6i_node->fn_sernum : 0;
117 dst_release(t->dst_cache);
118 t->dst_cache = dst;
119}
120
121/**
3144581c 122 * ip6_tnl_lookup - fetch tunnel matching the end-point addresses
1ab1457c
YH
123 * @remote: the address of the tunnel exit-point
124 * @local: the address of the tunnel entry-point
1da177e4 125 *
1ab1457c 126 * Return:
1da177e4 127 * tunnel matching given end-points if found,
1ab1457c 128 * else fallback tunnel if its device is up,
1da177e4
LT
129 * else %NULL
130 **/
131
132static struct ip6_tnl *
3144581c 133ip6_tnl_lookup(struct in6_addr *remote, struct in6_addr *local)
1da177e4
LT
134{
135 unsigned h0 = HASH(remote);
136 unsigned h1 = HASH(local);
137 struct ip6_tnl *t;
138
139 for (t = tnls_r_l[h0 ^ h1]; t; t = t->next) {
140 if (ipv6_addr_equal(local, &t->parms.laddr) &&
141 ipv6_addr_equal(remote, &t->parms.raddr) &&
142 (t->dev->flags & IFF_UP))
143 return t;
144 }
145 if ((t = tnls_wc[0]) != NULL && (t->dev->flags & IFF_UP))
146 return t;
147
148 return NULL;
149}
150
151/**
3144581c 152 * ip6_tnl_bucket - get head of list matching given tunnel parameters
1ab1457c 153 * @p: parameters containing tunnel end-points
1da177e4
LT
154 *
155 * Description:
3144581c 156 * ip6_tnl_bucket() returns the head of the list matching the
1da177e4
LT
157 * &struct in6_addr entries laddr and raddr in @p.
158 *
1ab1457c 159 * Return: head of IPv6 tunnel list
1da177e4
LT
160 **/
161
162static struct ip6_tnl **
3144581c 163ip6_tnl_bucket(struct ip6_tnl_parm *p)
1da177e4
LT
164{
165 struct in6_addr *remote = &p->raddr;
166 struct in6_addr *local = &p->laddr;
167 unsigned h = 0;
168 int prio = 0;
169
170 if (!ipv6_addr_any(remote) || !ipv6_addr_any(local)) {
171 prio = 1;
172 h = HASH(remote) ^ HASH(local);
173 }
174 return &tnls[prio][h];
175}
176
177/**
3144581c 178 * ip6_tnl_link - add tunnel to hash table
1da177e4
LT
179 * @t: tunnel to be added
180 **/
181
182static void
3144581c 183ip6_tnl_link(struct ip6_tnl *t)
1da177e4 184{
3144581c 185 struct ip6_tnl **tp = ip6_tnl_bucket(&t->parms);
1da177e4
LT
186
187 t->next = *tp;
3144581c 188 write_lock_bh(&ip6_tnl_lock);
1da177e4 189 *tp = t;
3144581c 190 write_unlock_bh(&ip6_tnl_lock);
1da177e4
LT
191}
192
193/**
3144581c 194 * ip6_tnl_unlink - remove tunnel from hash table
1da177e4
LT
195 * @t: tunnel to be removed
196 **/
197
198static void
3144581c 199ip6_tnl_unlink(struct ip6_tnl *t)
1da177e4
LT
200{
201 struct ip6_tnl **tp;
202
3144581c 203 for (tp = ip6_tnl_bucket(&t->parms); *tp; tp = &(*tp)->next) {
1da177e4 204 if (t == *tp) {
3144581c 205 write_lock_bh(&ip6_tnl_lock);
1da177e4 206 *tp = t->next;
3144581c 207 write_unlock_bh(&ip6_tnl_lock);
1da177e4
LT
208 break;
209 }
210 }
211}
212
213/**
214 * ip6_tnl_create() - create a new tunnel
215 * @p: tunnel parameters
216 * @pt: pointer to new tunnel
217 *
218 * Description:
219 * Create tunnel matching given parameters.
1ab1457c
YH
220 *
221 * Return:
567131a7 222 * created tunnel or NULL
1da177e4
LT
223 **/
224
567131a7 225static struct ip6_tnl *ip6_tnl_create(struct ip6_tnl_parm *p)
1da177e4
LT
226{
227 struct net_device *dev;
228 struct ip6_tnl *t;
229 char name[IFNAMSIZ];
230 int err;
231
34cc7ba6 232 if (p->name[0])
1da177e4 233 strlcpy(name, p->name, IFNAMSIZ);
34cc7ba6
PE
234 else
235 sprintf(name, "ip6tnl%%d");
236
3144581c 237 dev = alloc_netdev(sizeof (*t), name, ip6_tnl_dev_setup);
1da177e4 238 if (dev == NULL)
567131a7 239 goto failed;
1da177e4 240
2941a486 241 t = netdev_priv(dev);
3144581c 242 dev->init = ip6_tnl_dev_init;
1da177e4
LT
243 t->parms = *p;
244
245 if ((err = register_netdevice(dev)) < 0) {
246 free_netdev(dev);
567131a7 247 goto failed;
1da177e4
LT
248 }
249 dev_hold(dev);
3144581c 250 ip6_tnl_link(t);
567131a7
VN
251 return t;
252failed:
253 return NULL;
1da177e4
LT
254}
255
256/**
3144581c 257 * ip6_tnl_locate - find or create tunnel matching given parameters
1ab1457c 258 * @p: tunnel parameters
1da177e4
LT
259 * @create: != 0 if allowed to create new tunnel if no match found
260 *
261 * Description:
3144581c 262 * ip6_tnl_locate() first tries to locate an existing tunnel
1da177e4
LT
263 * based on @parms. If this is unsuccessful, but @create is set a new
264 * tunnel device is created and registered for use.
265 *
266 * Return:
567131a7 267 * matching tunnel or NULL
1da177e4
LT
268 **/
269
3144581c 270static struct ip6_tnl *ip6_tnl_locate(struct ip6_tnl_parm *p, int create)
1da177e4
LT
271{
272 struct in6_addr *remote = &p->raddr;
273 struct in6_addr *local = &p->laddr;
274 struct ip6_tnl *t;
275
3144581c 276 for (t = *ip6_tnl_bucket(p); t; t = t->next) {
1da177e4 277 if (ipv6_addr_equal(local, &t->parms.laddr) &&
567131a7
VN
278 ipv6_addr_equal(remote, &t->parms.raddr))
279 return t;
1da177e4
LT
280 }
281 if (!create)
567131a7
VN
282 return NULL;
283 return ip6_tnl_create(p);
1da177e4
LT
284}
285
286/**
3144581c 287 * ip6_tnl_dev_uninit - tunnel device uninitializer
1da177e4 288 * @dev: the device to be destroyed
1ab1457c 289 *
1da177e4 290 * Description:
3144581c 291 * ip6_tnl_dev_uninit() removes tunnel from its list
1da177e4
LT
292 **/
293
294static void
3144581c 295ip6_tnl_dev_uninit(struct net_device *dev)
1da177e4 296{
2941a486 297 struct ip6_tnl *t = netdev_priv(dev);
1da177e4 298
3144581c
YK
299 if (dev == ip6_fb_tnl_dev) {
300 write_lock_bh(&ip6_tnl_lock);
1da177e4 301 tnls_wc[0] = NULL;
3144581c 302 write_unlock_bh(&ip6_tnl_lock);
1da177e4 303 } else {
3144581c 304 ip6_tnl_unlink(t);
1da177e4
LT
305 }
306 ip6_tnl_dst_reset(t);
307 dev_put(dev);
308}
309
310/**
311 * parse_tvl_tnl_enc_lim - handle encapsulation limit option
312 * @skb: received socket buffer
313 *
1ab1457c
YH
314 * Return:
315 * 0 if none was found,
1da177e4
LT
316 * else index to encapsulation limit
317 **/
318
319static __u16
320parse_tlv_tnl_enc_lim(struct sk_buff *skb, __u8 * raw)
321{
322 struct ipv6hdr *ipv6h = (struct ipv6hdr *) raw;
323 __u8 nexthdr = ipv6h->nexthdr;
324 __u16 off = sizeof (*ipv6h);
325
326 while (ipv6_ext_hdr(nexthdr) && nexthdr != NEXTHDR_NONE) {
327 __u16 optlen = 0;
328 struct ipv6_opt_hdr *hdr;
329 if (raw + off + sizeof (*hdr) > skb->data &&
330 !pskb_may_pull(skb, raw - skb->data + off + sizeof (*hdr)))
331 break;
332
333 hdr = (struct ipv6_opt_hdr *) (raw + off);
334 if (nexthdr == NEXTHDR_FRAGMENT) {
335 struct frag_hdr *frag_hdr = (struct frag_hdr *) hdr;
336 if (frag_hdr->frag_off)
337 break;
338 optlen = 8;
339 } else if (nexthdr == NEXTHDR_AUTH) {
340 optlen = (hdr->hdrlen + 2) << 2;
341 } else {
342 optlen = ipv6_optlen(hdr);
343 }
344 if (nexthdr == NEXTHDR_DEST) {
345 __u16 i = off + 2;
346 while (1) {
347 struct ipv6_tlv_tnl_enc_lim *tel;
348
349 /* No more room for encapsulation limit */
350 if (i + sizeof (*tel) > off + optlen)
351 break;
352
353 tel = (struct ipv6_tlv_tnl_enc_lim *) &raw[i];
354 /* return index of option if found and valid */
355 if (tel->type == IPV6_TLV_TNL_ENCAP_LIMIT &&
356 tel->length == 1)
357 return i;
358 /* else jump to next option */
359 if (tel->type)
360 i += tel->length + 2;
361 else
362 i++;
363 }
364 }
365 nexthdr = hdr->nexthdr;
366 off += optlen;
367 }
368 return 0;
369}
370
371/**
e490d1d8 372 * ip6_tnl_err - tunnel error handler
1da177e4
LT
373 *
374 * Description:
e490d1d8 375 * ip6_tnl_err() should handle errors in the tunnel according
1da177e4
LT
376 * to the specifications in RFC 2473.
377 **/
378
d2acc347 379static int
502b0935 380ip6_tnl_err(struct sk_buff *skb, __u8 ipproto, struct inet6_skb_parm *opt,
704eae1f 381 int *type, int *code, int *msg, __u32 *info, int offset)
1da177e4
LT
382{
383 struct ipv6hdr *ipv6h = (struct ipv6hdr *) skb->data;
384 struct ip6_tnl *t;
385 int rel_msg = 0;
386 int rel_type = ICMPV6_DEST_UNREACH;
387 int rel_code = ICMPV6_ADDR_UNREACH;
388 __u32 rel_info = 0;
389 __u16 len;
d2acc347 390 int err = -ENOENT;
1da177e4 391
1ab1457c
YH
392 /* If the packet doesn't contain the original IPv6 header we are
393 in trouble since we might need the source address for further
1da177e4
LT
394 processing of the error. */
395
3144581c
YK
396 read_lock(&ip6_tnl_lock);
397 if ((t = ip6_tnl_lookup(&ipv6h->daddr, &ipv6h->saddr)) == NULL)
1da177e4
LT
398 goto out;
399
502b0935
YK
400 if (t->parms.proto != ipproto && t->parms.proto != 0)
401 goto out;
402
d2acc347
HX
403 err = 0;
404
e490d1d8 405 switch (*type) {
1da177e4
LT
406 __u32 teli;
407 struct ipv6_tlv_tnl_enc_lim *tel;
408 __u32 mtu;
409 case ICMPV6_DEST_UNREACH:
410 if (net_ratelimit())
411 printk(KERN_WARNING
412 "%s: Path to destination invalid "
413 "or inactive!\n", t->parms.name);
414 rel_msg = 1;
415 break;
416 case ICMPV6_TIME_EXCEED:
e490d1d8 417 if ((*code) == ICMPV6_EXC_HOPLIMIT) {
1da177e4
LT
418 if (net_ratelimit())
419 printk(KERN_WARNING
420 "%s: Too small hop limit or "
1ab1457c 421 "routing loop in tunnel!\n",
1da177e4
LT
422 t->parms.name);
423 rel_msg = 1;
424 }
425 break;
426 case ICMPV6_PARAMPROB:
107a5fe6 427 teli = 0;
e490d1d8 428 if ((*code) == ICMPV6_HDR_FIELD)
107a5fe6 429 teli = parse_tlv_tnl_enc_lim(skb, skb->data);
1da177e4 430
704eae1f 431 if (teli && teli == *info - 2) {
1da177e4
LT
432 tel = (struct ipv6_tlv_tnl_enc_lim *) &skb->data[teli];
433 if (tel->encap_limit == 0) {
434 if (net_ratelimit())
435 printk(KERN_WARNING
436 "%s: Too small encapsulation "
437 "limit or routing loop in "
438 "tunnel!\n", t->parms.name);
439 rel_msg = 1;
440 }
107a5fe6
VN
441 } else if (net_ratelimit()) {
442 printk(KERN_WARNING
443 "%s: Recipient unable to parse tunneled "
444 "packet!\n ", t->parms.name);
1da177e4
LT
445 }
446 break;
447 case ICMPV6_PKT_TOOBIG:
704eae1f 448 mtu = *info - offset;
1da177e4
LT
449 if (mtu < IPV6_MIN_MTU)
450 mtu = IPV6_MIN_MTU;
451 t->dev->mtu = mtu;
452
cc6cdac0 453 if ((len = sizeof (*ipv6h) + ntohs(ipv6h->payload_len)) > mtu) {
1da177e4
LT
454 rel_type = ICMPV6_PKT_TOOBIG;
455 rel_code = 0;
456 rel_info = mtu;
457 rel_msg = 1;
458 }
459 break;
460 }
e490d1d8
YK
461
462 *type = rel_type;
463 *code = rel_code;
464 *info = rel_info;
465 *msg = rel_msg;
466
467out:
3144581c 468 read_unlock(&ip6_tnl_lock);
e490d1d8
YK
469 return err;
470}
471
c4d3efaf
YK
472static int
473ip4ip6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
704eae1f 474 int type, int code, int offset, __be32 info)
c4d3efaf
YK
475{
476 int rel_msg = 0;
477 int rel_type = type;
478 int rel_code = code;
704eae1f 479 __u32 rel_info = ntohl(info);
c4d3efaf
YK
480 int err;
481 struct sk_buff *skb2;
482 struct iphdr *eiph;
483 struct flowi fl;
484 struct rtable *rt;
485
502b0935
YK
486 err = ip6_tnl_err(skb, IPPROTO_IPIP, opt, &rel_type, &rel_code,
487 &rel_msg, &rel_info, offset);
c4d3efaf
YK
488 if (err < 0)
489 return err;
490
491 if (rel_msg == 0)
492 return 0;
493
494 switch (rel_type) {
495 case ICMPV6_DEST_UNREACH:
496 if (rel_code != ICMPV6_ADDR_UNREACH)
497 return 0;
498 rel_type = ICMP_DEST_UNREACH;
499 rel_code = ICMP_HOST_UNREACH;
500 break;
501 case ICMPV6_PKT_TOOBIG:
502 if (rel_code != 0)
503 return 0;
504 rel_type = ICMP_DEST_UNREACH;
505 rel_code = ICMP_FRAG_NEEDED;
506 break;
507 default:
508 return 0;
509 }
510
511 if (!pskb_may_pull(skb, offset + sizeof(struct iphdr)))
512 return 0;
513
514 skb2 = skb_clone(skb, GFP_ATOMIC);
515 if (!skb2)
516 return 0;
517
518 dst_release(skb2->dst);
519 skb2->dst = NULL;
520 skb_pull(skb2, offset);
c1d2bbe1 521 skb_reset_network_header(skb2);
eddc9ec5 522 eiph = ip_hdr(skb2);
c4d3efaf
YK
523
524 /* Try to guess incoming interface */
525 memset(&fl, 0, sizeof(fl));
526 fl.fl4_dst = eiph->saddr;
527 fl.fl4_tos = RT_TOS(eiph->tos);
528 fl.proto = IPPROTO_IPIP;
f206351a 529 if (ip_route_output_key(&init_net, &rt, &fl))
c4d3efaf
YK
530 goto out;
531
532 skb2->dev = rt->u.dst.dev;
533
534 /* route "incoming" packet */
535 if (rt->rt_flags & RTCF_LOCAL) {
536 ip_rt_put(rt);
537 rt = NULL;
538 fl.fl4_dst = eiph->daddr;
539 fl.fl4_src = eiph->saddr;
540 fl.fl4_tos = eiph->tos;
f206351a 541 if (ip_route_output_key(&init_net, &rt, &fl) ||
c4d3efaf
YK
542 rt->u.dst.dev->type != ARPHRD_TUNNEL) {
543 ip_rt_put(rt);
544 goto out;
545 }
9937ded8 546 skb2->dst = (struct dst_entry *)rt;
c4d3efaf
YK
547 } else {
548 ip_rt_put(rt);
549 if (ip_route_input(skb2, eiph->daddr, eiph->saddr, eiph->tos,
550 skb2->dev) ||
551 skb2->dst->dev->type != ARPHRD_TUNNEL)
552 goto out;
553 }
554
555 /* change mtu on this route */
556 if (rel_type == ICMP_DEST_UNREACH && rel_code == ICMP_FRAG_NEEDED) {
557 if (rel_info > dst_mtu(skb2->dst))
558 goto out;
559
560 skb2->dst->ops->update_pmtu(skb2->dst, rel_info);
c4d3efaf
YK
561 }
562
704eae1f 563 icmp_send(skb2, rel_type, rel_code, htonl(rel_info));
c4d3efaf
YK
564
565out:
566 kfree_skb(skb2);
567 return 0;
568}
569
e490d1d8
YK
570static int
571ip6ip6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
704eae1f 572 int type, int code, int offset, __be32 info)
e490d1d8
YK
573{
574 int rel_msg = 0;
575 int rel_type = type;
576 int rel_code = code;
704eae1f 577 __u32 rel_info = ntohl(info);
e490d1d8
YK
578 int err;
579
502b0935
YK
580 err = ip6_tnl_err(skb, IPPROTO_IPV6, opt, &rel_type, &rel_code,
581 &rel_msg, &rel_info, offset);
e490d1d8
YK
582 if (err < 0)
583 return err;
584
585 if (rel_msg && pskb_may_pull(skb, offset + sizeof(struct ipv6hdr))) {
1da177e4
LT
586 struct rt6_info *rt;
587 struct sk_buff *skb2 = skb_clone(skb, GFP_ATOMIC);
305d4b3c 588
1da177e4 589 if (!skb2)
e490d1d8 590 return 0;
1da177e4
LT
591
592 dst_release(skb2->dst);
593 skb2->dst = NULL;
594 skb_pull(skb2, offset);
c1d2bbe1 595 skb_reset_network_header(skb2);
1da177e4
LT
596
597 /* Try to guess incoming interface */
0660e03f 598 rt = rt6_lookup(&ipv6_hdr(skb2)->saddr, NULL, 0, 0);
1da177e4
LT
599
600 if (rt && rt->rt6i_dev)
601 skb2->dev = rt->rt6i_dev;
602
603 icmpv6_send(skb2, rel_type, rel_code, rel_info, skb2->dev);
604
605 if (rt)
606 dst_release(&rt->u.dst);
607
608 kfree_skb(skb2);
609 }
e490d1d8
YK
610
611 return 0;
1da177e4
LT
612}
613
c4d3efaf
YK
614static void ip4ip6_dscp_ecn_decapsulate(struct ip6_tnl *t,
615 struct ipv6hdr *ipv6h,
616 struct sk_buff *skb)
617{
618 __u8 dsfield = ipv6_get_dsfield(ipv6h) & ~INET_ECN_MASK;
619
620 if (t->parms.flags & IP6_TNL_F_RCV_DSCP_COPY)
eddc9ec5 621 ipv4_change_dsfield(ip_hdr(skb), INET_ECN_MASK, dsfield);
c4d3efaf
YK
622
623 if (INET_ECN_is_ce(dsfield))
eddc9ec5 624 IP_ECN_set_ce(ip_hdr(skb));
c4d3efaf
YK
625}
626
8359925b
YK
627static void ip6ip6_dscp_ecn_decapsulate(struct ip6_tnl *t,
628 struct ipv6hdr *ipv6h,
629 struct sk_buff *skb)
1da177e4 630{
8359925b 631 if (t->parms.flags & IP6_TNL_F_RCV_DSCP_COPY)
29bb43b4 632 ipv6_copy_dscp(ipv6_get_dsfield(ipv6h), ipv6_hdr(skb));
1da177e4 633
8359925b 634 if (INET_ECN_is_ce(ipv6_get_dsfield(ipv6h)))
0660e03f 635 IP6_ECN_set_ce(ipv6_hdr(skb));
1da177e4 636}
8359925b 637
09c6bbf0
VN
638static inline int ip6_tnl_rcv_ctl(struct ip6_tnl *t)
639{
640 struct ip6_tnl_parm *p = &t->parms;
641 int ret = 0;
642
643 if (p->flags & IP6_TNL_F_CAP_RCV) {
1ab1457c 644 struct net_device *ldev = NULL;
09c6bbf0
VN
645
646 if (p->link)
881d966b 647 ldev = dev_get_by_index(&init_net, p->link);
09c6bbf0
VN
648
649 if ((ipv6_addr_is_multicast(&p->laddr) ||
bfeade08
DL
650 likely(ipv6_chk_addr(&init_net, &p->laddr, ldev, 0))) &&
651 likely(!ipv6_chk_addr(&init_net, &p->raddr, NULL, 0)))
09c6bbf0
VN
652 ret = 1;
653
654 if (ldev)
655 dev_put(ldev);
656 }
657 return ret;
658}
1da177e4
LT
659
660/**
3144581c 661 * ip6_tnl_rcv - decapsulate IPv6 packet and retransmit it locally
1da177e4 662 * @skb: received socket buffer
8359925b
YK
663 * @protocol: ethernet protocol ID
664 * @dscp_ecn_decapsulate: the function to decapsulate DSCP code and ECN
1da177e4
LT
665 *
666 * Return: 0
667 **/
668
8359925b 669static int ip6_tnl_rcv(struct sk_buff *skb, __u16 protocol,
502b0935 670 __u8 ipproto,
8359925b
YK
671 void (*dscp_ecn_decapsulate)(struct ip6_tnl *t,
672 struct ipv6hdr *ipv6h,
673 struct sk_buff *skb))
1da177e4 674{
1da177e4 675 struct ip6_tnl *t;
0660e03f 676 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
1da177e4 677
3144581c 678 read_lock(&ip6_tnl_lock);
1da177e4 679
3144581c 680 if ((t = ip6_tnl_lookup(&ipv6h->saddr, &ipv6h->daddr)) != NULL) {
502b0935
YK
681 if (t->parms.proto != ipproto && t->parms.proto != 0) {
682 read_unlock(&ip6_tnl_lock);
683 goto discard;
684 }
685
1da177e4 686 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
3144581c 687 read_unlock(&ip6_tnl_lock);
50fba2aa 688 goto discard;
1da177e4
LT
689 }
690
09c6bbf0 691 if (!ip6_tnl_rcv_ctl(t)) {
1da177e4 692 t->stat.rx_dropped++;
3144581c 693 read_unlock(&ip6_tnl_lock);
1da177e4
LT
694 goto discard;
695 }
696 secpath_reset(skb);
b0e380b1 697 skb->mac_header = skb->network_header;
c1d2bbe1 698 skb_reset_network_header(skb);
8359925b 699 skb->protocol = htons(protocol);
1da177e4
LT
700 skb->pkt_type = PACKET_HOST;
701 memset(skb->cb, 0, sizeof(struct inet6_skb_parm));
702 skb->dev = t->dev;
703 dst_release(skb->dst);
704 skb->dst = NULL;
53ab61c6 705 nf_reset(skb);
8359925b
YK
706
707 dscp_ecn_decapsulate(t, ipv6h, skb);
708
1da177e4
LT
709 t->stat.rx_packets++;
710 t->stat.rx_bytes += skb->len;
711 netif_rx(skb);
3144581c 712 read_unlock(&ip6_tnl_lock);
1da177e4
LT
713 return 0;
714 }
3144581c 715 read_unlock(&ip6_tnl_lock);
1da177e4 716 return 1;
50fba2aa
HX
717
718discard:
719 kfree_skb(skb);
720 return 0;
1da177e4
LT
721}
722
c4d3efaf
YK
723static int ip4ip6_rcv(struct sk_buff *skb)
724{
502b0935
YK
725 return ip6_tnl_rcv(skb, ETH_P_IP, IPPROTO_IPIP,
726 ip4ip6_dscp_ecn_decapsulate);
c4d3efaf
YK
727}
728
8359925b
YK
729static int ip6ip6_rcv(struct sk_buff *skb)
730{
502b0935
YK
731 return ip6_tnl_rcv(skb, ETH_P_IPV6, IPPROTO_IPV6,
732 ip6ip6_dscp_ecn_decapsulate);
8359925b
YK
733}
734
6fb32dde
VN
735struct ipv6_tel_txoption {
736 struct ipv6_txoptions ops;
737 __u8 dst_opt[8];
738};
1da177e4 739
6fb32dde
VN
740static void init_tel_txopt(struct ipv6_tel_txoption *opt, __u8 encap_limit)
741{
742 memset(opt, 0, sizeof(struct ipv6_tel_txoption));
1da177e4 743
6fb32dde
VN
744 opt->dst_opt[2] = IPV6_TLV_TNL_ENCAP_LIMIT;
745 opt->dst_opt[3] = 1;
746 opt->dst_opt[4] = encap_limit;
747 opt->dst_opt[5] = IPV6_TLV_PADN;
748 opt->dst_opt[6] = 1;
1da177e4 749
6fb32dde
VN
750 opt->ops.dst0opt = (struct ipv6_opt_hdr *) opt->dst_opt;
751 opt->ops.opt_nflen = 8;
1da177e4
LT
752}
753
754/**
3144581c 755 * ip6_tnl_addr_conflict - compare packet addresses to tunnel's own
1da177e4 756 * @t: the outgoing tunnel device
1ab1457c 757 * @hdr: IPv6 header from the incoming packet
1da177e4
LT
758 *
759 * Description:
1ab1457c 760 * Avoid trivial tunneling loop by checking that tunnel exit-point
1da177e4
LT
761 * doesn't match source of incoming packet.
762 *
1ab1457c 763 * Return:
1da177e4
LT
764 * 1 if conflict,
765 * 0 else
766 **/
767
768static inline int
3144581c 769ip6_tnl_addr_conflict(struct ip6_tnl *t, struct ipv6hdr *hdr)
1da177e4
LT
770{
771 return ipv6_addr_equal(&t->parms.raddr, &hdr->saddr);
772}
773
09c6bbf0
VN
774static inline int ip6_tnl_xmit_ctl(struct ip6_tnl *t)
775{
776 struct ip6_tnl_parm *p = &t->parms;
777 int ret = 0;
778
1ab1457c 779 if (p->flags & IP6_TNL_F_CAP_XMIT) {
09c6bbf0
VN
780 struct net_device *ldev = NULL;
781
782 if (p->link)
881d966b 783 ldev = dev_get_by_index(&init_net, p->link);
09c6bbf0 784
bfeade08 785 if (unlikely(!ipv6_chk_addr(&init_net, &p->laddr, ldev, 0)))
09c6bbf0
VN
786 printk(KERN_WARNING
787 "%s xmit: Local address not yet configured!\n",
788 p->name);
789 else if (!ipv6_addr_is_multicast(&p->raddr) &&
bfeade08 790 unlikely(ipv6_chk_addr(&init_net, &p->raddr, NULL, 0)))
09c6bbf0
VN
791 printk(KERN_WARNING
792 "%s xmit: Routing loop! "
793 "Remote address found on this node!\n",
794 p->name);
795 else
796 ret = 1;
797 if (ldev)
798 dev_put(ldev);
799 }
800 return ret;
801}
1da177e4 802/**
61ec2aec 803 * ip6_tnl_xmit2 - encapsulate packet and send
1da177e4 804 * @skb: the outgoing socket buffer
1ab1457c 805 * @dev: the outgoing tunnel device
61ec2aec
YK
806 * @dsfield: dscp code for outer header
807 * @fl: flow of tunneled packet
808 * @encap_limit: encapsulation limit
809 * @pmtu: Path MTU is stored if packet is too big
1da177e4
LT
810 *
811 * Description:
812 * Build new header and do some sanity checks on the packet before sending
813 * it.
814 *
1ab1457c 815 * Return:
c4d3efaf 816 * 0 on success
61ec2aec
YK
817 * -1 fail
818 * %-EMSGSIZE message too big. return mtu in this case.
1da177e4
LT
819 **/
820
61ec2aec
YK
821static int ip6_tnl_xmit2(struct sk_buff *skb,
822 struct net_device *dev,
823 __u8 dsfield,
824 struct flowi *fl,
825 int encap_limit,
826 __u32 *pmtu)
1da177e4 827{
2941a486 828 struct ip6_tnl *t = netdev_priv(dev);
1da177e4 829 struct net_device_stats *stats = &t->stat;
0660e03f 830 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
6fb32dde 831 struct ipv6_tel_txoption opt;
1da177e4
LT
832 struct dst_entry *dst;
833 struct net_device *tdev;
834 int mtu;
c2636b4d 835 unsigned int max_headroom = sizeof(struct ipv6hdr);
1da177e4 836 u8 proto;
61ec2aec 837 int err = -1;
1da177e4 838 int pkt_len;
1da177e4 839
1da177e4
LT
840 if ((dst = ip6_tnl_dst_check(t)) != NULL)
841 dst_hold(dst);
a57ebc90 842 else {
61ec2aec 843 dst = ip6_route_output(NULL, fl);
1da177e4 844
61ec2aec 845 if (dst->error || xfrm_lookup(&dst, fl, NULL, 0) < 0)
a57ebc90
PM
846 goto tx_err_link_failure;
847 }
1da177e4
LT
848
849 tdev = dst->dev;
850
851 if (tdev == dev) {
852 stats->collisions++;
853 if (net_ratelimit())
1ab1457c 854 printk(KERN_WARNING
1da177e4
LT
855 "%s: Local routing loop detected!\n",
856 t->parms.name);
857 goto tx_err_dst_release;
858 }
859 mtu = dst_mtu(dst) - sizeof (*ipv6h);
6fb32dde 860 if (encap_limit >= 0) {
1da177e4
LT
861 max_headroom += 8;
862 mtu -= 8;
863 }
864 if (mtu < IPV6_MIN_MTU)
865 mtu = IPV6_MIN_MTU;
26892058
YK
866 if (skb->dst)
867 skb->dst->ops->update_pmtu(skb->dst, mtu);
1da177e4 868 if (skb->len > mtu) {
61ec2aec
YK
869 *pmtu = mtu;
870 err = -EMSGSIZE;
1da177e4
LT
871 goto tx_err_dst_release;
872 }
873
874 /*
875 * Okay, now see if we can stuff it in the buffer as-is.
876 */
877 max_headroom += LL_RESERVED_SPACE(tdev);
1ab1457c 878
cfbba49d
PM
879 if (skb_headroom(skb) < max_headroom || skb_shared(skb) ||
880 (skb_cloned(skb) && !skb_clone_writable(skb, 0))) {
1da177e4 881 struct sk_buff *new_skb;
1ab1457c 882
1da177e4
LT
883 if (!(new_skb = skb_realloc_headroom(skb, max_headroom)))
884 goto tx_err_dst_release;
885
886 if (skb->sk)
887 skb_set_owner_w(new_skb, skb->sk);
888 kfree_skb(skb);
889 skb = new_skb;
890 }
891 dst_release(skb->dst);
892 skb->dst = dst_clone(dst);
893
b0e380b1 894 skb->transport_header = skb->network_header;
1da177e4 895
61ec2aec 896 proto = fl->proto;
6fb32dde
VN
897 if (encap_limit >= 0) {
898 init_tel_txopt(&opt, encap_limit);
899 ipv6_push_nfrag_opts(skb, &opt.ops, &proto, NULL);
900 }
e2d1bca7
ACM
901 skb_push(skb, sizeof(struct ipv6hdr));
902 skb_reset_network_header(skb);
0660e03f 903 ipv6h = ipv6_hdr(skb);
61ec2aec 904 *(__be32*)ipv6h = fl->fl6_flowlabel | htonl(0x60000000);
1da177e4
LT
905 dsfield = INET_ECN_encapsulate(0, dsfield);
906 ipv6_change_dsfield(ipv6h, ~INET_ECN_MASK, dsfield);
1da177e4
LT
907 ipv6h->hop_limit = t->parms.hop_limit;
908 ipv6h->nexthdr = proto;
61ec2aec
YK
909 ipv6_addr_copy(&ipv6h->saddr, &fl->fl6_src);
910 ipv6_addr_copy(&ipv6h->daddr, &fl->fl6_dst);
1da177e4
LT
911 nf_reset(skb);
912 pkt_len = skb->len;
ef76bc23 913 err = ip6_local_out(skb);
1da177e4 914
b9df3cb8 915 if (net_xmit_eval(err) == 0) {
1da177e4
LT
916 stats->tx_bytes += pkt_len;
917 stats->tx_packets++;
918 } else {
919 stats->tx_errors++;
920 stats->tx_aborted_errors++;
921 }
922 ip6_tnl_dst_store(t, dst);
1da177e4
LT
923 return 0;
924tx_err_link_failure:
925 stats->tx_carrier_errors++;
926 dst_link_failure(skb);
927tx_err_dst_release:
928 dst_release(dst);
61ec2aec
YK
929 return err;
930}
931
c4d3efaf
YK
932static inline int
933ip4ip6_tnl_xmit(struct sk_buff *skb, struct net_device *dev)
934{
935 struct ip6_tnl *t = netdev_priv(dev);
eddc9ec5 936 struct iphdr *iph = ip_hdr(skb);
c4d3efaf
YK
937 int encap_limit = -1;
938 struct flowi fl;
939 __u8 dsfield;
940 __u32 mtu;
941 int err;
942
502b0935
YK
943 if ((t->parms.proto != IPPROTO_IPIP && t->parms.proto != 0) ||
944 !ip6_tnl_xmit_ctl(t))
c4d3efaf
YK
945 return -1;
946
947 if (!(t->parms.flags & IP6_TNL_F_IGN_ENCAP_LIMIT))
948 encap_limit = t->parms.encap_limit;
949
950 memcpy(&fl, &t->fl, sizeof (fl));
951 fl.proto = IPPROTO_IPIP;
952
953 dsfield = ipv4_get_dsfield(iph);
954
955 if ((t->parms.flags & IP6_TNL_F_USE_ORIG_TCLASS))
b77f2fa6
AV
956 fl.fl6_flowlabel |= htonl((__u32)iph->tos << IPV6_TCLASS_SHIFT)
957 & IPV6_TCLASS_MASK;
c4d3efaf
YK
958
959 err = ip6_tnl_xmit2(skb, dev, dsfield, &fl, encap_limit, &mtu);
960 if (err != 0) {
961 /* XXX: send ICMP error even if DF is not set. */
962 if (err == -EMSGSIZE)
963 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_FRAG_NEEDED,
964 htonl(mtu));
965 return -1;
966 }
967
968 return 0;
969}
970
61ec2aec
YK
971static inline int
972ip6ip6_tnl_xmit(struct sk_buff *skb, struct net_device *dev)
973{
974 struct ip6_tnl *t = netdev_priv(dev);
0660e03f 975 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
61ec2aec
YK
976 int encap_limit = -1;
977 __u16 offset;
978 struct flowi fl;
979 __u8 dsfield;
980 __u32 mtu;
981 int err;
982
502b0935
YK
983 if ((t->parms.proto != IPPROTO_IPV6 && t->parms.proto != 0) ||
984 !ip6_tnl_xmit_ctl(t) || ip6_tnl_addr_conflict(t, ipv6h))
61ec2aec
YK
985 return -1;
986
d56f90a7
ACM
987 offset = parse_tlv_tnl_enc_lim(skb, skb_network_header(skb));
988 if (offset > 0) {
61ec2aec 989 struct ipv6_tlv_tnl_enc_lim *tel;
d56f90a7 990 tel = (struct ipv6_tlv_tnl_enc_lim *)&skb_network_header(skb)[offset];
61ec2aec
YK
991 if (tel->encap_limit == 0) {
992 icmpv6_send(skb, ICMPV6_PARAMPROB,
993 ICMPV6_HDR_FIELD, offset + 2, skb->dev);
994 return -1;
995 }
996 encap_limit = tel->encap_limit - 1;
997 } else if (!(t->parms.flags & IP6_TNL_F_IGN_ENCAP_LIMIT))
998 encap_limit = t->parms.encap_limit;
999
1000 memcpy(&fl, &t->fl, sizeof (fl));
1001 fl.proto = IPPROTO_IPV6;
1002
1003 dsfield = ipv6_get_dsfield(ipv6h);
1004 if ((t->parms.flags & IP6_TNL_F_USE_ORIG_TCLASS))
1005 fl.fl6_flowlabel |= (*(__be32 *) ipv6h & IPV6_TCLASS_MASK);
1006 if ((t->parms.flags & IP6_TNL_F_USE_ORIG_FLOWLABEL))
1007 fl.fl6_flowlabel |= (*(__be32 *) ipv6h & IPV6_FLOWLABEL_MASK);
1008
1009 err = ip6_tnl_xmit2(skb, dev, dsfield, &fl, encap_limit, &mtu);
1010 if (err != 0) {
1011 if (err == -EMSGSIZE)
1012 icmpv6_send(skb, ICMPV6_PKT_TOOBIG, 0, mtu, dev);
1013 return -1;
1014 }
1015
1016 return 0;
1017}
1018
1019static int
1020ip6_tnl_xmit(struct sk_buff *skb, struct net_device *dev)
1021{
1022 struct ip6_tnl *t = netdev_priv(dev);
1023 struct net_device_stats *stats = &t->stat;
1024 int ret;
1025
1026 if (t->recursion++) {
1027 t->stat.collisions++;
1028 goto tx_err;
1029 }
1030
1031 switch (skb->protocol) {
c4d3efaf
YK
1032 case __constant_htons(ETH_P_IP):
1033 ret = ip4ip6_tnl_xmit(skb, dev);
1034 break;
61ec2aec
YK
1035 case __constant_htons(ETH_P_IPV6):
1036 ret = ip6ip6_tnl_xmit(skb, dev);
1037 break;
1038 default:
1039 goto tx_err;
1040 }
1041
1042 if (ret < 0)
1043 goto tx_err;
1044
1045 t->recursion--;
1046 return 0;
1047
1da177e4
LT
1048tx_err:
1049 stats->tx_errors++;
1050 stats->tx_dropped++;
1051 kfree_skb(skb);
1052 t->recursion--;
1053 return 0;
1054}
1055
1056static void ip6_tnl_set_cap(struct ip6_tnl *t)
1057{
1058 struct ip6_tnl_parm *p = &t->parms;
09c6bbf0
VN
1059 int ltype = ipv6_addr_type(&p->laddr);
1060 int rtype = ipv6_addr_type(&p->raddr);
1da177e4
LT
1061
1062 p->flags &= ~(IP6_TNL_F_CAP_XMIT|IP6_TNL_F_CAP_RCV);
1063
09c6bbf0
VN
1064 if (ltype & (IPV6_ADDR_UNICAST|IPV6_ADDR_MULTICAST) &&
1065 rtype & (IPV6_ADDR_UNICAST|IPV6_ADDR_MULTICAST) &&
1066 !((ltype|rtype) & IPV6_ADDR_LOOPBACK) &&
305d4b3c 1067 (!((ltype|rtype) & IPV6_ADDR_LINKLOCAL) || p->link)) {
09c6bbf0
VN
1068 if (ltype&IPV6_ADDR_UNICAST)
1069 p->flags |= IP6_TNL_F_CAP_XMIT;
1070 if (rtype&IPV6_ADDR_UNICAST)
1071 p->flags |= IP6_TNL_F_CAP_RCV;
1da177e4
LT
1072 }
1073}
1074
3144581c 1075static void ip6_tnl_link_config(struct ip6_tnl *t)
1da177e4
LT
1076{
1077 struct net_device *dev = t->dev;
1078 struct ip6_tnl_parm *p = &t->parms;
1079 struct flowi *fl = &t->fl;
1080
1081 memcpy(&dev->dev_addr, &p->laddr, sizeof(struct in6_addr));
1082 memcpy(&dev->broadcast, &p->raddr, sizeof(struct in6_addr));
1083
1084 /* Set up flowi template */
1085 ipv6_addr_copy(&fl->fl6_src, &p->laddr);
1086 ipv6_addr_copy(&fl->fl6_dst, &p->raddr);
1087 fl->oif = p->link;
1088 fl->fl6_flowlabel = 0;
1089
1090 if (!(p->flags&IP6_TNL_F_USE_ORIG_TCLASS))
1091 fl->fl6_flowlabel |= IPV6_TCLASS_MASK & p->flowinfo;
1092 if (!(p->flags&IP6_TNL_F_USE_ORIG_FLOWLABEL))
1093 fl->fl6_flowlabel |= IPV6_FLOWLABEL_MASK & p->flowinfo;
1094
1095 ip6_tnl_set_cap(t);
1096
1097 if (p->flags&IP6_TNL_F_CAP_XMIT && p->flags&IP6_TNL_F_CAP_RCV)
1098 dev->flags |= IFF_POINTOPOINT;
1099 else
1100 dev->flags &= ~IFF_POINTOPOINT;
1101
1102 dev->iflink = p->link;
1103
1104 if (p->flags & IP6_TNL_F_CAP_XMIT) {
305d4b3c
VN
1105 int strict = (ipv6_addr_type(&p->raddr) &
1106 (IPV6_ADDR_MULTICAST|IPV6_ADDR_LINKLOCAL));
1107
1da177e4 1108 struct rt6_info *rt = rt6_lookup(&p->raddr, &p->laddr,
305d4b3c 1109 p->link, strict);
1da177e4
LT
1110
1111 if (rt == NULL)
1112 return;
1113
1114 if (rt->rt6i_dev) {
1115 dev->hard_header_len = rt->rt6i_dev->hard_header_len +
1116 sizeof (struct ipv6hdr);
1117
1118 dev->mtu = rt->rt6i_dev->mtu - sizeof (struct ipv6hdr);
1119
1120 if (dev->mtu < IPV6_MIN_MTU)
1121 dev->mtu = IPV6_MIN_MTU;
1122 }
1123 dst_release(&rt->u.dst);
1124 }
1125}
1126
1127/**
3144581c 1128 * ip6_tnl_change - update the tunnel parameters
1da177e4
LT
1129 * @t: tunnel to be changed
1130 * @p: tunnel configuration parameters
1131 * @active: != 0 if tunnel is ready for use
1132 *
1133 * Description:
3144581c 1134 * ip6_tnl_change() updates the tunnel parameters
1da177e4
LT
1135 **/
1136
1137static int
3144581c 1138ip6_tnl_change(struct ip6_tnl *t, struct ip6_tnl_parm *p)
1da177e4
LT
1139{
1140 ipv6_addr_copy(&t->parms.laddr, &p->laddr);
1141 ipv6_addr_copy(&t->parms.raddr, &p->raddr);
1142 t->parms.flags = p->flags;
1143 t->parms.hop_limit = p->hop_limit;
1144 t->parms.encap_limit = p->encap_limit;
1145 t->parms.flowinfo = p->flowinfo;
8181b8c1 1146 t->parms.link = p->link;
502b0935 1147 t->parms.proto = p->proto;
0c088890 1148 ip6_tnl_dst_reset(t);
3144581c 1149 ip6_tnl_link_config(t);
1da177e4
LT
1150 return 0;
1151}
1152
1153/**
3144581c 1154 * ip6_tnl_ioctl - configure ipv6 tunnels from userspace
1da177e4
LT
1155 * @dev: virtual device associated with tunnel
1156 * @ifr: parameters passed from userspace
1157 * @cmd: command to be performed
1158 *
1159 * Description:
3144581c 1160 * ip6_tnl_ioctl() is used for managing IPv6 tunnels
1ab1457c 1161 * from userspace.
1da177e4
LT
1162 *
1163 * The possible commands are the following:
1164 * %SIOCGETTUNNEL: get tunnel parameters for device
1165 * %SIOCADDTUNNEL: add tunnel matching given tunnel parameters
1166 * %SIOCCHGTUNNEL: change tunnel parameters to those given
1167 * %SIOCDELTUNNEL: delete tunnel
1168 *
1ab1457c 1169 * The fallback device "ip6tnl0", created during module
1da177e4
LT
1170 * initialization, can be used for creating other tunnel devices.
1171 *
1172 * Return:
1173 * 0 on success,
1174 * %-EFAULT if unable to copy data to or from userspace,
1175 * %-EPERM if current process hasn't %CAP_NET_ADMIN set
1176 * %-EINVAL if passed tunnel parameters are invalid,
1177 * %-EEXIST if changing a tunnel's parameters would cause a conflict
1178 * %-ENODEV if attempting to change or delete a nonexisting device
1179 **/
1180
1181static int
3144581c 1182ip6_tnl_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
1da177e4
LT
1183{
1184 int err = 0;
1da177e4
LT
1185 struct ip6_tnl_parm p;
1186 struct ip6_tnl *t = NULL;
1187
1188 switch (cmd) {
1189 case SIOCGETTUNNEL:
3144581c 1190 if (dev == ip6_fb_tnl_dev) {
567131a7 1191 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof (p))) {
1da177e4
LT
1192 err = -EFAULT;
1193 break;
1194 }
3144581c 1195 t = ip6_tnl_locate(&p, 0);
567131a7
VN
1196 }
1197 if (t == NULL)
2941a486 1198 t = netdev_priv(dev);
1da177e4
LT
1199 memcpy(&p, &t->parms, sizeof (p));
1200 if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof (p))) {
1201 err = -EFAULT;
1202 }
1203 break;
1204 case SIOCADDTUNNEL:
1205 case SIOCCHGTUNNEL:
1206 err = -EPERM;
1da177e4
LT
1207 if (!capable(CAP_NET_ADMIN))
1208 break;
567131a7
VN
1209 err = -EFAULT;
1210 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof (p)))
1da177e4 1211 break;
567131a7 1212 err = -EINVAL;
502b0935
YK
1213 if (p.proto != IPPROTO_IPV6 && p.proto != IPPROTO_IPIP &&
1214 p.proto != 0)
1da177e4 1215 break;
3144581c
YK
1216 t = ip6_tnl_locate(&p, cmd == SIOCADDTUNNEL);
1217 if (dev != ip6_fb_tnl_dev && cmd == SIOCCHGTUNNEL) {
567131a7
VN
1218 if (t != NULL) {
1219 if (t->dev != dev) {
1220 err = -EEXIST;
1221 break;
1222 }
1223 } else
1224 t = netdev_priv(dev);
1225
3144581c
YK
1226 ip6_tnl_unlink(t);
1227 err = ip6_tnl_change(t, &p);
1228 ip6_tnl_link(t);
1da177e4
LT
1229 netdev_state_change(dev);
1230 }
567131a7 1231 if (t) {
1da177e4 1232 err = 0;
567131a7
VN
1233 if (copy_to_user(ifr->ifr_ifru.ifru_data, &t->parms, sizeof (p)))
1234 err = -EFAULT;
1235
1236 } else
1237 err = (cmd == SIOCADDTUNNEL ? -ENOBUFS : -ENOENT);
1da177e4
LT
1238 break;
1239 case SIOCDELTUNNEL:
1240 err = -EPERM;
1241 if (!capable(CAP_NET_ADMIN))
1242 break;
1243
3144581c 1244 if (dev == ip6_fb_tnl_dev) {
567131a7
VN
1245 err = -EFAULT;
1246 if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof (p)))
1da177e4 1247 break;
567131a7 1248 err = -ENOENT;
3144581c 1249 if ((t = ip6_tnl_locate(&p, 0)) == NULL)
1da177e4 1250 break;
567131a7 1251 err = -EPERM;
3144581c 1252 if (t->dev == ip6_fb_tnl_dev)
1da177e4 1253 break;
567131a7 1254 dev = t->dev;
1da177e4 1255 }
22f8cde5
SH
1256 err = 0;
1257 unregister_netdevice(dev);
1da177e4
LT
1258 break;
1259 default:
1260 err = -EINVAL;
1261 }
1262 return err;
1263}
1264
1265/**
3144581c 1266 * ip6_tnl_get_stats - return the stats for tunnel device
1da177e4
LT
1267 * @dev: virtual device associated with tunnel
1268 *
1269 * Return: stats for device
1270 **/
1271
1272static struct net_device_stats *
3144581c 1273ip6_tnl_get_stats(struct net_device *dev)
1da177e4 1274{
2941a486 1275 return &(((struct ip6_tnl *)netdev_priv(dev))->stat);
1da177e4
LT
1276}
1277
1278/**
3144581c 1279 * ip6_tnl_change_mtu - change mtu manually for tunnel device
1da177e4
LT
1280 * @dev: virtual device associated with tunnel
1281 * @new_mtu: the new mtu
1282 *
1283 * Return:
1284 * 0 on success,
1285 * %-EINVAL if mtu too small
1286 **/
1287
1288static int
3144581c 1289ip6_tnl_change_mtu(struct net_device *dev, int new_mtu)
1da177e4
LT
1290{
1291 if (new_mtu < IPV6_MIN_MTU) {
1292 return -EINVAL;
1293 }
1294 dev->mtu = new_mtu;
1295 return 0;
1296}
1297
1298/**
3144581c 1299 * ip6_tnl_dev_setup - setup virtual tunnel device
1da177e4
LT
1300 * @dev: virtual device associated with tunnel
1301 *
1302 * Description:
1303 * Initialize function pointers and device parameters
1304 **/
1305
3144581c 1306static void ip6_tnl_dev_setup(struct net_device *dev)
1da177e4 1307{
3144581c 1308 dev->uninit = ip6_tnl_dev_uninit;
1da177e4 1309 dev->destructor = free_netdev;
61ec2aec 1310 dev->hard_start_xmit = ip6_tnl_xmit;
3144581c
YK
1311 dev->get_stats = ip6_tnl_get_stats;
1312 dev->do_ioctl = ip6_tnl_ioctl;
1313 dev->change_mtu = ip6_tnl_change_mtu;
1da177e4
LT
1314
1315 dev->type = ARPHRD_TUNNEL6;
1316 dev->hard_header_len = LL_MAX_HEADER + sizeof (struct ipv6hdr);
1317 dev->mtu = ETH_DATA_LEN - sizeof (struct ipv6hdr);
1318 dev->flags |= IFF_NOARP;
1319 dev->addr_len = sizeof(struct in6_addr);
1320}
1321
1322
1323/**
3144581c 1324 * ip6_tnl_dev_init_gen - general initializer for all tunnel devices
1da177e4
LT
1325 * @dev: virtual device associated with tunnel
1326 **/
1327
1328static inline void
3144581c 1329ip6_tnl_dev_init_gen(struct net_device *dev)
1da177e4 1330{
2941a486 1331 struct ip6_tnl *t = netdev_priv(dev);
1da177e4
LT
1332 t->dev = dev;
1333 strcpy(t->parms.name, dev->name);
1334}
1335
/**
 * ip6_tnl_dev_init - initializer for all non fallback tunnel devices
 *   @dev: virtual device associated with tunnel
 *
 * Description:
 *   Runs the general initializer and then configures the link from
 *   the tunnel's parameters.
 *
 * Return: 0
 **/

static int
ip6_tnl_dev_init(struct net_device *dev)
{
	ip6_tnl_dev_init_gen(dev);
	ip6_tnl_link_config(netdev_priv(dev));

	return 0;
}
1349
1350/**
3144581c 1351 * ip6_fb_tnl_dev_init - initializer for fallback tunnel device
1da177e4
LT
1352 * @dev: fallback device
1353 *
1354 * Return: 0
1355 **/
1356
1ab1457c 1357static int
3144581c 1358ip6_fb_tnl_dev_init(struct net_device *dev)
1da177e4 1359{
2941a486 1360 struct ip6_tnl *t = netdev_priv(dev);
3144581c 1361 ip6_tnl_dev_init_gen(dev);
502b0935 1362 t->parms.proto = IPPROTO_IPV6;
1da177e4
LT
1363 dev_hold(dev);
1364 tnls_wc[0] = t;
1365 return 0;
1366}
1367
c4d3efaf
YK
1368static struct xfrm6_tunnel ip4ip6_handler = {
1369 .handler = ip4ip6_rcv,
1370 .err_handler = ip4ip6_err,
1371 .priority = 1,
1372};
1373
1da177e4 1374static struct xfrm6_tunnel ip6ip6_handler = {
0303770d
PM
1375 .handler = ip6ip6_rcv,
1376 .err_handler = ip6ip6_err,
d2acc347 1377 .priority = 1,
1da177e4
LT
1378};
1379
1380/**
1381 * ip6_tunnel_init - register protocol and reserve needed resources
1382 *
1383 * Return: 0 on success
1384 **/
1385
1386static int __init ip6_tunnel_init(void)
1387{
1388 int err;
1389
c4d3efaf 1390 if (xfrm6_tunnel_register(&ip4ip6_handler, AF_INET)) {
3144581c 1391 printk(KERN_ERR "ip6_tunnel init: can't register ip4ip6\n");
c4d3efaf
YK
1392 err = -EAGAIN;
1393 goto out;
1394 }
1395
73d605d1 1396 if (xfrm6_tunnel_register(&ip6ip6_handler, AF_INET6)) {
3144581c 1397 printk(KERN_ERR "ip6_tunnel init: can't register ip6ip6\n");
c4d3efaf
YK
1398 err = -EAGAIN;
1399 goto unreg_ip4ip6;
1da177e4 1400 }
3144581c
YK
1401 ip6_fb_tnl_dev = alloc_netdev(sizeof(struct ip6_tnl), "ip6tnl0",
1402 ip6_tnl_dev_setup);
1da177e4 1403
3144581c 1404 if (!ip6_fb_tnl_dev) {
1da177e4
LT
1405 err = -ENOMEM;
1406 goto fail;
1407 }
3144581c 1408 ip6_fb_tnl_dev->init = ip6_fb_tnl_dev_init;
1da177e4 1409
3144581c
YK
1410 if ((err = register_netdev(ip6_fb_tnl_dev))) {
1411 free_netdev(ip6_fb_tnl_dev);
1da177e4
LT
1412 goto fail;
1413 }
1414 return 0;
1415fail:
73d605d1 1416 xfrm6_tunnel_deregister(&ip6ip6_handler, AF_INET6);
c4d3efaf
YK
1417unreg_ip4ip6:
1418 xfrm6_tunnel_deregister(&ip4ip6_handler, AF_INET);
1419out:
1da177e4
LT
1420 return err;
1421}
1422
3144581c 1423static void __exit ip6_tnl_destroy_tunnels(void)
b3fdd9f1
YK
1424{
1425 int h;
1426 struct ip6_tnl *t;
1427
1428 for (h = 0; h < HASH_SIZE; h++) {
1429 while ((t = tnls_r_l[h]) != NULL)
1430 unregister_netdevice(t->dev);
1431 }
1432
1433 t = tnls_wc[0];
1434 unregister_netdevice(t->dev);
1435}
1436
1da177e4
LT
1437/**
1438 * ip6_tunnel_cleanup - free resources and unregister protocol
1439 **/
1440
1441static void __exit ip6_tunnel_cleanup(void)
1442{
c4d3efaf 1443 if (xfrm6_tunnel_deregister(&ip4ip6_handler, AF_INET))
3144581c 1444 printk(KERN_INFO "ip6_tunnel close: can't deregister ip4ip6\n");
c4d3efaf 1445
73d605d1 1446 if (xfrm6_tunnel_deregister(&ip6ip6_handler, AF_INET6))
3144581c 1447 printk(KERN_INFO "ip6_tunnel close: can't deregister ip6ip6\n");
1da177e4 1448
b3fdd9f1 1449 rtnl_lock();
3144581c 1450 ip6_tnl_destroy_tunnels();
b3fdd9f1 1451 rtnl_unlock();
1da177e4
LT
1452}
1453
/* Module entry point is ip6_tunnel_init(), exit point is ip6_tunnel_cleanup(). */
1454module_init(ip6_tunnel_init);
1455module_exit(ip6_tunnel_cleanup);