]> bbs.cooldavid.org Git - net-next-2.6.git/blame - net/ipv6/icmp.c
net: constify struct inet6_protocol
[net-next-2.6.git] / net / ipv6 / icmp.c
CommitLineData
1da177e4
LT
1/*
2 * Internet Control Message Protocol (ICMPv6)
3 * Linux INET6 implementation
4 *
5 * Authors:
6 * Pedro Roque <roque@di.fc.ul.pt>
7 *
1da177e4
LT
8 * Based on net/ipv4/icmp.c
9 *
10 * RFC 1885
11 *
12 * This program is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU General Public License
14 * as published by the Free Software Foundation; either version
15 * 2 of the License, or (at your option) any later version.
16 */
17
18/*
19 * Changes:
20 *
21 * Andi Kleen : exception handling
22 * Andi Kleen add rate limits. never reply to a icmp.
23 * add more length checks and other fixes.
24 * yoshfuji : ensure to sent parameter problem for
25 * fragments.
26 * YOSHIFUJI Hideaki @USAGI: added sysctl for icmp rate limit.
27 * Randy Dunlap and
28 * YOSHIFUJI Hideaki @USAGI: Per-interface statistics support
29 * Kazunori MIYAZAWA @USAGI: change output process to use ip6_append_data
30 */
31
32#include <linux/module.h>
33#include <linux/errno.h>
34#include <linux/types.h>
35#include <linux/socket.h>
36#include <linux/in.h>
37#include <linux/kernel.h>
1da177e4
LT
38#include <linux/sockios.h>
39#include <linux/net.h>
40#include <linux/skbuff.h>
41#include <linux/init.h>
763ecff1 42#include <linux/netfilter.h>
1da177e4
LT
43
44#ifdef CONFIG_SYSCTL
45#include <linux/sysctl.h>
46#endif
47
48#include <linux/inet.h>
49#include <linux/netdevice.h>
50#include <linux/icmpv6.h>
51
52#include <net/ip.h>
53#include <net/sock.h>
54
55#include <net/ipv6.h>
56#include <net/ip6_checksum.h>
57#include <net/protocol.h>
58#include <net/raw.h>
59#include <net/rawv6.h>
60#include <net/transp_v6.h>
61#include <net/ip6_route.h>
62#include <net/addrconf.h>
63#include <net/icmp.h>
8b7817f3 64#include <net/xfrm.h>
1ed8516f 65#include <net/inet_common.h>
1da177e4
LT
66
67#include <asm/uaccess.h>
68#include <asm/system.h>
69
ba89966c 70DEFINE_SNMP_STAT(struct icmpv6_mib, icmpv6_statistics) __read_mostly;
7159039a 71EXPORT_SYMBOL(icmpv6_statistics);
14878f75
DS
72DEFINE_SNMP_STAT(struct icmpv6msg_mib, icmpv6msg_statistics) __read_mostly;
73EXPORT_SYMBOL(icmpv6msg_statistics);
1da177e4
LT
74
75/*
76 * The ICMP socket(s). This is the most convenient way to flow control
77 * our ICMP output as well as maintain a clean interface throughout
78 * all layers. All Socketless IP sends will soon be gone.
79 *
80 * On SMP we have one ICMP socket per-cpu.
81 */
98c6d1b2
DL
82static inline struct sock *icmpv6_sk(struct net *net)
83{
84 return net->ipv6.icmp_sk[smp_processor_id()];
85}
1da177e4 86
e5bbef20 87static int icmpv6_rcv(struct sk_buff *skb);
1da177e4 88
41135cc8 89static const struct inet6_protocol icmpv6_protocol = {
1da177e4 90 .handler = icmpv6_rcv,
8b7817f3 91 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1da177e4
LT
92};
93
fdc0bde9 94static __inline__ struct sock *icmpv6_xmit_lock(struct net *net)
1da177e4 95{
fdc0bde9
DL
96 struct sock *sk;
97
1da177e4
LT
98 local_bh_disable();
99
fdc0bde9 100 sk = icmpv6_sk(net);
405666db 101 if (unlikely(!spin_trylock(&sk->sk_lock.slock))) {
1da177e4
LT
102 /* This can happen if the output path (f.e. SIT or
103 * ip6ip6 tunnel) signals dst_link_failure() for an
104 * outgoing ICMP6 packet.
105 */
106 local_bh_enable();
fdc0bde9 107 return NULL;
1da177e4 108 }
fdc0bde9 109 return sk;
1da177e4
LT
110}
111
405666db 112static __inline__ void icmpv6_xmit_unlock(struct sock *sk)
1da177e4 113{
405666db 114 spin_unlock_bh(&sk->sk_lock.slock);
1da177e4
LT
115}
116
1ab1457c 117/*
1da177e4
LT
118 * Slightly more convenient version of icmpv6_send.
119 */
d5fdd6ba 120void icmpv6_param_prob(struct sk_buff *skb, u8 code, int pos)
1da177e4
LT
121{
122 icmpv6_send(skb, ICMPV6_PARAMPROB, code, pos, skb->dev);
123 kfree_skb(skb);
124}
125
126/*
127 * Figure out, may we reply to this packet with icmp error.
128 *
129 * We do not reply, if:
130 * - it was icmp error message.
131 * - it is truncated, so that it is known, that protocol is ICMPV6
132 * (i.e. in the middle of some exthdr)
133 *
134 * --ANK (980726)
135 */
136
137static int is_ineligible(struct sk_buff *skb)
138{
0660e03f 139 int ptr = (u8 *)(ipv6_hdr(skb) + 1) - skb->data;
1da177e4 140 int len = skb->len - ptr;
0660e03f 141 __u8 nexthdr = ipv6_hdr(skb)->nexthdr;
1da177e4
LT
142
143 if (len < 0)
144 return 1;
145
0d3d077c 146 ptr = ipv6_skip_exthdr(skb, ptr, &nexthdr);
1da177e4
LT
147 if (ptr < 0)
148 return 0;
149 if (nexthdr == IPPROTO_ICMPV6) {
150 u8 _type, *tp;
151 tp = skb_header_pointer(skb,
152 ptr+offsetof(struct icmp6hdr, icmp6_type),
153 sizeof(_type), &_type);
154 if (tp == NULL ||
155 !(*tp & ICMPV6_INFOMSG_MASK))
156 return 1;
157 }
158 return 0;
159}
160
1ab1457c
YH
161/*
162 * Check the ICMP output rate limit
1da177e4 163 */
d5fdd6ba 164static inline int icmpv6_xrlim_allow(struct sock *sk, u8 type,
1da177e4
LT
165 struct flowi *fl)
166{
167 struct dst_entry *dst;
3b1e0a65 168 struct net *net = sock_net(sk);
1da177e4
LT
169 int res = 0;
170
171 /* Informational messages are not limited. */
172 if (type & ICMPV6_INFOMSG_MASK)
173 return 1;
174
175 /* Do not limit pmtu discovery, it would break it. */
176 if (type == ICMPV6_PKT_TOOBIG)
177 return 1;
178
1ab1457c 179 /*
1da177e4
LT
180 * Look up the output route.
181 * XXX: perhaps the expire for routing entries cloned by
182 * this lookup should be more aggressive (not longer than timeout).
183 */
9a43b709 184 dst = ip6_route_output(net, sk, fl);
1da177e4 185 if (dst->error) {
3bd653c8 186 IP6_INC_STATS(net, ip6_dst_idev(dst),
a11d206d 187 IPSTATS_MIB_OUTNOROUTES);
1da177e4
LT
188 } else if (dst->dev && (dst->dev->flags&IFF_LOOPBACK)) {
189 res = 1;
190 } else {
191 struct rt6_info *rt = (struct rt6_info *)dst;
9a43b709 192 int tmo = net->ipv6.sysctl.icmpv6_time;
1da177e4
LT
193
194 /* Give more bandwidth to wider prefixes. */
195 if (rt->rt6i_dst.plen < 128)
196 tmo >>= ((128 - rt->rt6i_dst.plen)>>5);
197
198 res = xrlim_allow(dst, tmo);
199 }
200 dst_release(dst);
201 return res;
202}
203
204/*
205 * an inline helper for the "simple" if statement below
206 * checks if parameter problem report is caused by an
1ab1457c 207 * unrecognized IPv6 option that has the Option Type
1da177e4
LT
208 * highest-order two bits set to 10
209 */
210
211static __inline__ int opt_unrec(struct sk_buff *skb, __u32 offset)
212{
213 u8 _optval, *op;
214
bbe735e4 215 offset += skb_network_offset(skb);
1da177e4
LT
216 op = skb_header_pointer(skb, offset, sizeof(_optval), &_optval);
217 if (op == NULL)
218 return 1;
219 return (*op & 0xC0) == 0x80;
220}
221
222static int icmpv6_push_pending_frames(struct sock *sk, struct flowi *fl, struct icmp6hdr *thdr, int len)
223{
224 struct sk_buff *skb;
225 struct icmp6hdr *icmp6h;
226 int err = 0;
227
228 if ((skb = skb_peek(&sk->sk_write_queue)) == NULL)
229 goto out;
230
cc70ab26 231 icmp6h = icmp6_hdr(skb);
1da177e4
LT
232 memcpy(icmp6h, thdr, sizeof(struct icmp6hdr));
233 icmp6h->icmp6_cksum = 0;
234
235 if (skb_queue_len(&sk->sk_write_queue) == 1) {
07f0757a 236 skb->csum = csum_partial(icmp6h,
1da177e4
LT
237 sizeof(struct icmp6hdr), skb->csum);
238 icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
239 &fl->fl6_dst,
240 len, fl->proto,
241 skb->csum);
242 } else {
868c86bc 243 __wsum tmp_csum = 0;
1da177e4
LT
244
245 skb_queue_walk(&sk->sk_write_queue, skb) {
246 tmp_csum = csum_add(tmp_csum, skb->csum);
247 }
248
07f0757a 249 tmp_csum = csum_partial(icmp6h,
1da177e4 250 sizeof(struct icmp6hdr), tmp_csum);
868c86bc
AV
251 icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
252 &fl->fl6_dst,
253 len, fl->proto,
254 tmp_csum);
1da177e4 255 }
1da177e4
LT
256 ip6_push_pending_frames(sk);
257out:
258 return err;
259}
260
261struct icmpv6_msg {
262 struct sk_buff *skb;
263 int offset;
763ecff1 264 uint8_t type;
1da177e4
LT
265};
266
267static int icmpv6_getfrag(void *from, char *to, int offset, int len, int odd, struct sk_buff *skb)
268{
269 struct icmpv6_msg *msg = (struct icmpv6_msg *) from;
270 struct sk_buff *org_skb = msg->skb;
5f92a738 271 __wsum csum = 0;
1da177e4
LT
272
273 csum = skb_copy_and_csum_bits(org_skb, msg->offset + offset,
274 to, len, csum);
275 skb->csum = csum_block_add(skb->csum, csum, odd);
763ecff1
YK
276 if (!(msg->type & ICMPV6_INFOMSG_MASK))
277 nf_ct_attach(skb, org_skb);
1da177e4
LT
278 return 0;
279}
280
#if defined(CONFIG_IPV6_MIP6) || defined(CONFIG_IPV6_MIP6_MODULE)
/*
 * If the packet carries a Home Address destination option (opt->dsthao is
 * set and the TLV is found), exchange the address stored in that option
 * with the source address of the IPv6 header, in place.
 */
static void mip6_addr_swap(struct sk_buff *skb)
{
	struct ipv6hdr *iph = ipv6_hdr(skb);
	struct inet6_skb_parm *opt = IP6CB(skb);
	struct ipv6_destopt_hao *hao;
	struct in6_addr tmp;
	int off;

	if (!opt->dsthao)
		return;

	off = ipv6_find_tlv(skb, opt->dsthao, IPV6_TLV_HAO);
	if (unlikely(off < 0))
		return;

	/* off is relative to the network header. */
	hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) + off);

	ipv6_addr_copy(&tmp, &iph->saddr);
	ipv6_addr_copy(&iph->saddr, &hao->addr);
	ipv6_addr_copy(&hao->addr, &tmp);
}
#else
/* Mobile IPv6 is not configured: nothing to swap. */
static inline void mip6_addr_swap(struct sk_buff *skb) {}
#endif
304
1da177e4
LT
305/*
306 * Send an ICMP message in response to a packet in error
307 */
d5fdd6ba 308void icmpv6_send(struct sk_buff *skb, u8 type, u8 code, __u32 info,
1da177e4
LT
309 struct net_device *dev)
310{
c346dca1 311 struct net *net = dev_net(skb->dev);
1da177e4 312 struct inet6_dev *idev = NULL;
0660e03f 313 struct ipv6hdr *hdr = ipv6_hdr(skb);
84427d53
YH
314 struct sock *sk;
315 struct ipv6_pinfo *np;
1da177e4
LT
316 struct in6_addr *saddr = NULL;
317 struct dst_entry *dst;
8b7817f3 318 struct dst_entry *dst2;
1da177e4
LT
319 struct icmp6hdr tmp_hdr;
320 struct flowi fl;
8b7817f3 321 struct flowi fl2;
1da177e4
LT
322 struct icmpv6_msg msg;
323 int iif = 0;
324 int addr_type = 0;
325 int len;
e651f03a 326 int hlimit;
1da177e4
LT
327 int err = 0;
328
27a884dc
ACM
329 if ((u8 *)hdr < skb->head ||
330 (skb->network_header + sizeof(*hdr)) > skb->tail)
1da177e4
LT
331 return;
332
333 /*
1ab1457c 334 * Make sure we respect the rules
1da177e4
LT
335 * i.e. RFC 1885 2.4(e)
336 * Rule (e.1) is enforced by not using icmpv6_send
337 * in any code that processes icmp errors.
338 */
339 addr_type = ipv6_addr_type(&hdr->daddr);
340
9a43b709 341 if (ipv6_chk_addr(net, &hdr->daddr, skb->dev, 0))
1da177e4
LT
342 saddr = &hdr->daddr;
343
344 /*
345 * Dest addr check
346 */
347
348 if ((addr_type & IPV6_ADDR_MULTICAST || skb->pkt_type != PACKET_HOST)) {
349 if (type != ICMPV6_PKT_TOOBIG &&
1ab1457c
YH
350 !(type == ICMPV6_PARAMPROB &&
351 code == ICMPV6_UNK_OPTION &&
1da177e4
LT
352 (opt_unrec(skb, info))))
353 return;
354
355 saddr = NULL;
356 }
357
358 addr_type = ipv6_addr_type(&hdr->saddr);
359
360 /*
361 * Source addr check
362 */
363
364 if (addr_type & IPV6_ADDR_LINKLOCAL)
365 iif = skb->dev->ifindex;
366
367 /*
8de3351e
YH
368 * Must not send error if the source does not uniquely
369 * identify a single node (RFC2463 Section 2.4).
370 * We check unspecified / multicast addresses here,
371 * and anycast addresses will be checked later.
1da177e4
LT
372 */
373 if ((addr_type == IPV6_ADDR_ANY) || (addr_type & IPV6_ADDR_MULTICAST)) {
64ce2073 374 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: addr_any/mcast source\n");
1da177e4
LT
375 return;
376 }
377
1ab1457c 378 /*
1da177e4
LT
379 * Never answer to a ICMP packet.
380 */
381 if (is_ineligible(skb)) {
64ce2073 382 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: no reply to icmp error\n");
1da177e4
LT
383 return;
384 }
385
79383236
MN
386 mip6_addr_swap(skb);
387
1da177e4
LT
388 memset(&fl, 0, sizeof(fl));
389 fl.proto = IPPROTO_ICMPV6;
390 ipv6_addr_copy(&fl.fl6_dst, &hdr->saddr);
391 if (saddr)
392 ipv6_addr_copy(&fl.fl6_src, saddr);
393 fl.oif = iif;
394 fl.fl_icmp_type = type;
395 fl.fl_icmp_code = code;
beb8d13b 396 security_skb_classify_flow(skb, &fl);
1da177e4 397
fdc0bde9
DL
398 sk = icmpv6_xmit_lock(net);
399 if (sk == NULL)
405666db 400 return;
fdc0bde9 401 np = inet6_sk(sk);
405666db 402
1da177e4
LT
403 if (!icmpv6_xrlim_allow(sk, type, &fl))
404 goto out;
405
406 tmp_hdr.icmp6_type = type;
407 tmp_hdr.icmp6_code = code;
408 tmp_hdr.icmp6_cksum = 0;
409 tmp_hdr.icmp6_pointer = htonl(info);
410
411 if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
412 fl.oif = np->mcast_oif;
413
414 err = ip6_dst_lookup(sk, &dst, &fl);
415 if (err)
416 goto out;
8de3351e
YH
417
418 /*
419 * We won't send icmp if the destination is known
420 * anycast.
421 */
422 if (((struct rt6_info *)dst)->rt6i_flags & RTF_ANYCAST) {
423 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: acast source\n");
424 goto out_dst_release;
425 }
426
8b7817f3
HX
427 /* No need to clone since we're just using its address. */
428 dst2 = dst;
429
52479b62 430 err = xfrm_lookup(net, &dst, &fl, sk, 0);
8b7817f3
HX
431 switch (err) {
432 case 0:
433 if (dst != dst2)
434 goto route_done;
435 break;
436 case -EPERM:
437 dst = NULL;
438 break;
439 default:
440 goto out;
441 }
442
443 if (xfrm_decode_session_reverse(skb, &fl2, AF_INET6))
af268182 444 goto relookup_failed;
8b7817f3 445
6c06a478 446 if (ip6_dst_lookup(sk, &dst2, &fl2))
af268182 447 goto relookup_failed;
1da177e4 448
6c06a478 449 err = xfrm_lookup(net, &dst2, &fl2, sk, XFRM_LOOKUP_ICMP);
af268182
HX
450 switch (err) {
451 case 0:
452 dst_release(dst);
453 dst = dst2;
454 break;
455 case -EPERM:
456 goto out_dst_release;
457 default:
458relookup_failed:
8b7817f3
HX
459 if (!dst)
460 goto out;
af268182 461 break;
8b7817f3
HX
462 }
463
8b7817f3 464route_done:
1da177e4
LT
465 if (ipv6_addr_is_multicast(&fl.fl6_dst))
466 hlimit = np->mcast_hops;
467 else
468 hlimit = np->hop_limit;
469 if (hlimit < 0)
6b75d090 470 hlimit = ip6_dst_hoplimit(dst);
1da177e4
LT
471
472 msg.skb = skb;
bbe735e4 473 msg.offset = skb_network_offset(skb);
763ecff1 474 msg.type = type;
1da177e4
LT
475
476 len = skb->len - msg.offset;
477 len = min_t(unsigned int, len, IPV6_MIN_MTU - sizeof(struct ipv6hdr) -sizeof(struct icmp6hdr));
478 if (len < 0) {
64ce2073 479 LIMIT_NETDEBUG(KERN_DEBUG "icmp: len problem\n");
1da177e4
LT
480 goto out_dst_release;
481 }
482
483 idev = in6_dev_get(skb->dev);
484
485 err = ip6_append_data(sk, icmpv6_getfrag, &msg,
486 len + sizeof(struct icmp6hdr),
e651f03a
GR
487 sizeof(struct icmp6hdr), hlimit,
488 np->tclass, NULL, &fl, (struct rt6_info*)dst,
1da177e4
LT
489 MSG_DONTWAIT);
490 if (err) {
491 ip6_flush_pending_frames(sk);
492 goto out_put;
493 }
494 err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, len + sizeof(struct icmp6hdr));
495
1da177e4
LT
496out_put:
497 if (likely(idev != NULL))
498 in6_dev_put(idev);
499out_dst_release:
500 dst_release(dst);
501out:
405666db 502 icmpv6_xmit_unlock(sk);
1da177e4
LT
503}
504
7159039a
YH
505EXPORT_SYMBOL(icmpv6_send);
506
1da177e4
LT
507static void icmpv6_echo_reply(struct sk_buff *skb)
508{
c346dca1 509 struct net *net = dev_net(skb->dev);
84427d53 510 struct sock *sk;
1da177e4 511 struct inet6_dev *idev;
84427d53 512 struct ipv6_pinfo *np;
1da177e4 513 struct in6_addr *saddr = NULL;
cc70ab26 514 struct icmp6hdr *icmph = icmp6_hdr(skb);
1da177e4
LT
515 struct icmp6hdr tmp_hdr;
516 struct flowi fl;
517 struct icmpv6_msg msg;
518 struct dst_entry *dst;
519 int err = 0;
520 int hlimit;
521
0660e03f 522 saddr = &ipv6_hdr(skb)->daddr;
1da177e4
LT
523
524 if (!ipv6_unicast_destination(skb))
525 saddr = NULL;
526
527 memcpy(&tmp_hdr, icmph, sizeof(tmp_hdr));
528 tmp_hdr.icmp6_type = ICMPV6_ECHO_REPLY;
529
530 memset(&fl, 0, sizeof(fl));
531 fl.proto = IPPROTO_ICMPV6;
0660e03f 532 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
1da177e4
LT
533 if (saddr)
534 ipv6_addr_copy(&fl.fl6_src, saddr);
535 fl.oif = skb->dev->ifindex;
536 fl.fl_icmp_type = ICMPV6_ECHO_REPLY;
beb8d13b 537 security_skb_classify_flow(skb, &fl);
1da177e4 538
fdc0bde9
DL
539 sk = icmpv6_xmit_lock(net);
540 if (sk == NULL)
405666db 541 return;
fdc0bde9 542 np = inet6_sk(sk);
405666db 543
1da177e4
LT
544 if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
545 fl.oif = np->mcast_oif;
546
547 err = ip6_dst_lookup(sk, &dst, &fl);
548 if (err)
549 goto out;
52479b62 550 if ((err = xfrm_lookup(net, &dst, &fl, sk, 0)) < 0)
e104411b 551 goto out;
1da177e4
LT
552
553 if (ipv6_addr_is_multicast(&fl.fl6_dst))
554 hlimit = np->mcast_hops;
555 else
556 hlimit = np->hop_limit;
557 if (hlimit < 0)
6b75d090 558 hlimit = ip6_dst_hoplimit(dst);
1da177e4
LT
559
560 idev = in6_dev_get(skb->dev);
561
562 msg.skb = skb;
563 msg.offset = 0;
763ecff1 564 msg.type = ICMPV6_ECHO_REPLY;
1da177e4
LT
565
566 err = ip6_append_data(sk, icmpv6_getfrag, &msg, skb->len + sizeof(struct icmp6hdr),
e651f03a 567 sizeof(struct icmp6hdr), hlimit, np->tclass, NULL, &fl,
1da177e4
LT
568 (struct rt6_info*)dst, MSG_DONTWAIT);
569
570 if (err) {
571 ip6_flush_pending_frames(sk);
572 goto out_put;
573 }
574 err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, skb->len + sizeof(struct icmp6hdr));
575
1ab1457c 576out_put:
1da177e4
LT
577 if (likely(idev != NULL))
578 in6_dev_put(idev);
1da177e4 579 dst_release(dst);
1ab1457c 580out:
405666db 581 icmpv6_xmit_unlock(sk);
1da177e4
LT
582}
583
d5fdd6ba 584static void icmpv6_notify(struct sk_buff *skb, u8 type, u8 code, __be32 info)
1da177e4 585{
41135cc8 586 const struct inet6_protocol *ipprot;
1da177e4
LT
587 int inner_offset;
588 int hash;
589 u8 nexthdr;
590
591 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
592 return;
593
594 nexthdr = ((struct ipv6hdr *)skb->data)->nexthdr;
595 if (ipv6_ext_hdr(nexthdr)) {
596 /* now skip over extension headers */
0d3d077c 597 inner_offset = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &nexthdr);
1da177e4
LT
598 if (inner_offset<0)
599 return;
600 } else {
601 inner_offset = sizeof(struct ipv6hdr);
602 }
603
604 /* Checkin header including 8 bytes of inner protocol header. */
605 if (!pskb_may_pull(skb, inner_offset+8))
606 return;
607
1da177e4
LT
608 /* BUGGG_FUTURE: we should try to parse exthdrs in this packet.
609 Without this we will not able f.e. to make source routed
610 pmtu discovery.
611 Corresponding argument (opt) to notifiers is already added.
612 --ANK (980726)
613 */
614
615 hash = nexthdr & (MAX_INET_PROTOS - 1);
616
617 rcu_read_lock();
618 ipprot = rcu_dereference(inet6_protos[hash]);
619 if (ipprot && ipprot->err_handler)
620 ipprot->err_handler(skb, NULL, type, code, inner_offset, info);
621 rcu_read_unlock();
622
69d6da0b 623 raw6_icmp_error(skb, nexthdr, type, code, inner_offset, info);
1da177e4 624}
1ab1457c 625
1da177e4
LT
626/*
627 * Handle icmp messages
628 */
629
e5bbef20 630static int icmpv6_rcv(struct sk_buff *skb)
1da177e4 631{
1da177e4
LT
632 struct net_device *dev = skb->dev;
633 struct inet6_dev *idev = __in6_dev_get(dev);
634 struct in6_addr *saddr, *daddr;
635 struct ipv6hdr *orig_hdr;
636 struct icmp6hdr *hdr;
d5fdd6ba 637 u8 type;
1da177e4 638
aebcf82c 639 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
def8b4fa 640 struct sec_path *sp = skb_sec_path(skb);
8b7817f3
HX
641 int nh;
642
def8b4fa 643 if (!(sp && sp->xvec[sp->len - 1]->props.flags &
aebcf82c
HX
644 XFRM_STATE_ICMP))
645 goto drop_no_count;
646
8b7817f3
HX
647 if (!pskb_may_pull(skb, sizeof(*hdr) + sizeof(*orig_hdr)))
648 goto drop_no_count;
649
650 nh = skb_network_offset(skb);
651 skb_set_network_header(skb, sizeof(*hdr));
652
653 if (!xfrm6_policy_check_reverse(NULL, XFRM_POLICY_IN, skb))
654 goto drop_no_count;
655
656 skb_set_network_header(skb, nh);
657 }
658
e41b5368 659 ICMP6_INC_STATS_BH(dev_net(dev), idev, ICMP6_MIB_INMSGS);
1da177e4 660
0660e03f
ACM
661 saddr = &ipv6_hdr(skb)->saddr;
662 daddr = &ipv6_hdr(skb)->daddr;
1da177e4
LT
663
664 /* Perform checksum. */
fb286bb2 665 switch (skb->ip_summed) {
84fa7933 666 case CHECKSUM_COMPLETE:
fb286bb2
HX
667 if (!csum_ipv6_magic(saddr, daddr, skb->len, IPPROTO_ICMPV6,
668 skb->csum))
669 break;
670 /* fall through */
671 case CHECKSUM_NONE:
868c86bc
AV
672 skb->csum = ~csum_unfold(csum_ipv6_magic(saddr, daddr, skb->len,
673 IPPROTO_ICMPV6, 0));
fb286bb2 674 if (__skb_checksum_complete(skb)) {
5b095d98 675 LIMIT_NETDEBUG(KERN_DEBUG "ICMPv6 checksum failed [%pI6 > %pI6]\n",
0c6ce78a 676 saddr, daddr);
1da177e4
LT
677 goto discard_it;
678 }
679 }
680
8cf22943
HX
681 if (!pskb_pull(skb, sizeof(*hdr)))
682 goto discard_it;
1da177e4 683
cc70ab26 684 hdr = icmp6_hdr(skb);
1da177e4
LT
685
686 type = hdr->icmp6_type;
687
55d43808 688 ICMP6MSGIN_INC_STATS_BH(dev_net(dev), idev, type);
1da177e4
LT
689
690 switch (type) {
691 case ICMPV6_ECHO_REQUEST:
692 icmpv6_echo_reply(skb);
693 break;
694
695 case ICMPV6_ECHO_REPLY:
696 /* we couldn't care less */
697 break;
698
699 case ICMPV6_PKT_TOOBIG:
700 /* BUGGG_FUTURE: if packet contains rthdr, we cannot update
701 standard destination cache. Seems, only "advanced"
702 destination cache will allow to solve this problem
703 --ANK (980726)
704 */
705 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
706 goto discard_it;
cc70ab26 707 hdr = icmp6_hdr(skb);
1da177e4
LT
708 orig_hdr = (struct ipv6hdr *) (hdr + 1);
709 rt6_pmtu_discovery(&orig_hdr->daddr, &orig_hdr->saddr, dev,
710 ntohl(hdr->icmp6_mtu));
711
712 /*
713 * Drop through to notify
714 */
715
716 case ICMPV6_DEST_UNREACH:
717 case ICMPV6_TIME_EXCEED:
718 case ICMPV6_PARAMPROB:
719 icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
720 break;
721
722 case NDISC_ROUTER_SOLICITATION:
723 case NDISC_ROUTER_ADVERTISEMENT:
724 case NDISC_NEIGHBOUR_SOLICITATION:
725 case NDISC_NEIGHBOUR_ADVERTISEMENT:
726 case NDISC_REDIRECT:
727 ndisc_rcv(skb);
728 break;
729
730 case ICMPV6_MGM_QUERY:
731 igmp6_event_query(skb);
732 break;
733
734 case ICMPV6_MGM_REPORT:
735 igmp6_event_report(skb);
736 break;
737
738 case ICMPV6_MGM_REDUCTION:
739 case ICMPV6_NI_QUERY:
740 case ICMPV6_NI_REPLY:
741 case ICMPV6_MLD2_REPORT:
742 case ICMPV6_DHAAD_REQUEST:
743 case ICMPV6_DHAAD_REPLY:
744 case ICMPV6_MOBILE_PREFIX_SOL:
745 case ICMPV6_MOBILE_PREFIX_ADV:
746 break;
747
748 default:
64ce2073 749 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6: msg of unknown type\n");
1da177e4
LT
750
751 /* informational */
752 if (type & ICMPV6_INFOMSG_MASK)
753 break;
754
1ab1457c
YH
755 /*
756 * error of unknown type.
757 * must pass to upper level
1da177e4
LT
758 */
759
760 icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
3ff50b79
SH
761 }
762
1da177e4
LT
763 kfree_skb(skb);
764 return 0;
765
766discard_it:
e41b5368 767 ICMP6_INC_STATS_BH(dev_net(dev), idev, ICMP6_MIB_INERRORS);
8b7817f3 768drop_no_count:
1da177e4
LT
769 kfree_skb(skb);
770 return 0;
771}
772
95e41e93
YH
773void icmpv6_flow_init(struct sock *sk, struct flowi *fl,
774 u8 type,
775 const struct in6_addr *saddr,
776 const struct in6_addr *daddr,
777 int oif)
778{
779 memset(fl, 0, sizeof(*fl));
780 ipv6_addr_copy(&fl->fl6_src, saddr);
781 ipv6_addr_copy(&fl->fl6_dst, daddr);
782 fl->proto = IPPROTO_ICMPV6;
783 fl->fl_icmp_type = type;
784 fl->fl_icmp_code = 0;
785 fl->oif = oif;
786 security_sk_classify_flow(sk, fl);
787}
788
640c41c7 789/*
b7e729c4 790 * Special lock-class for __icmpv6_sk:
640c41c7
IM
791 */
792static struct lock_class_key icmpv6_socket_sk_dst_lock_key;
793
98c6d1b2 794static int __net_init icmpv6_sk_init(struct net *net)
1da177e4
LT
795{
796 struct sock *sk;
797 int err, i, j;
798
98c6d1b2
DL
799 net->ipv6.icmp_sk =
800 kzalloc(nr_cpu_ids * sizeof(struct sock *), GFP_KERNEL);
801 if (net->ipv6.icmp_sk == NULL)
79c91159
DL
802 return -ENOMEM;
803
6f912042 804 for_each_possible_cpu(i) {
1ed8516f
DL
805 err = inet_ctl_sock_create(&sk, PF_INET6,
806 SOCK_RAW, IPPROTO_ICMPV6, net);
1da177e4
LT
807 if (err < 0) {
808 printk(KERN_ERR
809 "Failed to initialize the ICMP6 control socket "
810 "(err %d).\n",
811 err);
812 goto fail;
813 }
814
1ed8516f 815 net->ipv6.icmp_sk[i] = sk;
5c8cafd6 816
640c41c7
IM
817 /*
818 * Split off their lock-class, because sk->sk_dst_lock
819 * gets used from softirqs, which is safe for
b7e729c4 820 * __icmpv6_sk (because those never get directly used
640c41c7
IM
821 * via userspace syscalls), but unsafe for normal sockets.
822 */
823 lockdep_set_class(&sk->sk_dst_lock,
824 &icmpv6_socket_sk_dst_lock_key);
1da177e4
LT
825
826 /* Enough space for 2 64K ICMP packets, including
827 * sk_buff struct overhead.
828 */
829 sk->sk_sndbuf =
830 (2 * ((64 * 1024) + sizeof(struct sk_buff)));
1da177e4 831 }
1da177e4
LT
832 return 0;
833
834 fail:
5c8cafd6 835 for (j = 0; j < i; j++)
1ed8516f 836 inet_ctl_sock_destroy(net->ipv6.icmp_sk[j]);
98c6d1b2 837 kfree(net->ipv6.icmp_sk);
1da177e4
LT
838 return err;
839}
840
98c6d1b2 841static void __net_exit icmpv6_sk_exit(struct net *net)
1da177e4
LT
842{
843 int i;
844
6f912042 845 for_each_possible_cpu(i) {
1ed8516f 846 inet_ctl_sock_destroy(net->ipv6.icmp_sk[i]);
1da177e4 847 }
98c6d1b2
DL
848 kfree(net->ipv6.icmp_sk);
849}
850
8ed7edce 851static struct pernet_operations icmpv6_sk_ops = {
98c6d1b2
DL
852 .init = icmpv6_sk_init,
853 .exit = icmpv6_sk_exit,
854};
855
856int __init icmpv6_init(void)
857{
858 int err;
859
860 err = register_pernet_subsys(&icmpv6_sk_ops);
861 if (err < 0)
862 return err;
863
864 err = -EAGAIN;
865 if (inet6_add_protocol(&icmpv6_protocol, IPPROTO_ICMPV6) < 0)
866 goto fail;
867 return 0;
868
869fail:
870 printk(KERN_ERR "Failed to register ICMP6 protocol\n");
871 unregister_pernet_subsys(&icmpv6_sk_ops);
872 return err;
873}
874
8ed7edce 875void icmpv6_cleanup(void)
98c6d1b2
DL
876{
877 unregister_pernet_subsys(&icmpv6_sk_ops);
1da177e4
LT
878 inet6_del_protocol(&icmpv6_protocol, IPPROTO_ICMPV6);
879}
880
98c6d1b2 881
/*
 * Translation table for ICMPV6_DEST_UNREACH, indexed by the ICMPv6 code:
 * the errno value to report and whether the error is fatal.
 */
static const struct icmp6_err {
	int err;
	int fatal;
} tab_unreach[] = {
	{ .err = ENETUNREACH,	.fatal = 0 },	/* NOROUTE */
	{ .err = EACCES,	.fatal = 1 },	/* ADM_PROHIBITED */
	{ .err = EHOSTUNREACH,	.fatal = 0 },	/* Was NOT_NEIGHBOUR, now reserved */
	{ .err = EHOSTUNREACH,	.fatal = 0 },	/* ADDR_UNREACH */
	{ .err = ECONNREFUSED,	.fatal = 1 },	/* PORT_UNREACH */
};
907
d5fdd6ba 908int icmpv6_err_convert(u8 type, u8 code, int *err)
1da177e4
LT
909{
910 int fatal = 0;
911
912 *err = EPROTO;
913
914 switch (type) {
915 case ICMPV6_DEST_UNREACH:
916 fatal = 1;
917 if (code <= ICMPV6_PORT_UNREACH) {
918 *err = tab_unreach[code].err;
919 fatal = tab_unreach[code].fatal;
920 }
921 break;
922
923 case ICMPV6_PKT_TOOBIG:
924 *err = EMSGSIZE;
925 break;
1ab1457c 926
1da177e4
LT
927 case ICMPV6_PARAMPROB:
928 *err = EPROTO;
929 fatal = 1;
930 break;
931
932 case ICMPV6_TIME_EXCEED:
933 *err = EHOSTUNREACH;
934 break;
3ff50b79 935 }
1da177e4
LT
936
937 return fatal;
938}
939
7159039a
YH
940EXPORT_SYMBOL(icmpv6_err_convert);
941
#ifdef CONFIG_SYSCTL
/*
 * Template for the ICMPv6 sysctl table. Its single "ratelimit" entry points
 * at init_net's icmpv6_time and is handled as milliseconds <-> jiffies.
 */
ctl_table ipv6_icmp_table_template[] = {
	{
		.ctl_name	= NET_IPV6_ICMP_RATELIMIT,
		.procname	= "ratelimit",
		.data		= &init_net.ipv6.sysctl.icmpv6_time,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_ms_jiffies,
		.strategy	= sysctl_ms_jiffies
	},
	{ .ctl_name = 0 },
};

/*
 * Duplicate the template for @net and redirect its "ratelimit" entry to
 * that namespace's icmpv6_time. Returns the new table, or NULL if the
 * copy could not be allocated; the caller owns the returned memory.
 */
struct ctl_table *ipv6_icmp_sysctl_init(struct net *net)
{
	struct ctl_table *table;

	table = kmemdup(ipv6_icmp_table_template,
			sizeof(ipv6_icmp_table_template),
			GFP_KERNEL);
	if (table == NULL)
		return NULL;

	table[0].data = &net->ipv6.sysctl.icmpv6_time;
	return table;
}
#endif
970