]> bbs.cooldavid.org Git - net-next-2.6.git/blame - net/ipv6/tcp_ipv6.c
ipv6: Add GRO support
[net-next-2.6.git] / net / ipv6 / tcp_ipv6.c
CommitLineData
1da177e4
LT
1/*
2 * TCP over IPv6
1ab1457c 3 * Linux INET6 implementation
1da177e4
LT
4 *
5 * Authors:
1ab1457c 6 * Pedro Roque <roque@di.fc.ul.pt>
1da177e4 7 *
1ab1457c 8 * Based on:
1da177e4
LT
9 * linux/net/ipv4/tcp.c
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
12 *
13 * Fixes:
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allow both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 */
25
eb4dea58 26#include <linux/bottom_half.h>
1da177e4 27#include <linux/module.h>
1da177e4
LT
28#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
41
42#include <linux/ipv6.h>
43#include <linux/icmpv6.h>
44#include <linux/random.h>
45
46#include <net/tcp.h>
47#include <net/ndisc.h>
5324a040 48#include <net/inet6_hashtables.h>
8129765a 49#include <net/inet6_connection_sock.h>
1da177e4
LT
50#include <net/ipv6.h>
51#include <net/transp_v6.h>
52#include <net/addrconf.h>
53#include <net/ip6_route.h>
54#include <net/ip6_checksum.h>
55#include <net/inet_ecn.h>
56#include <net/protocol.h>
57#include <net/xfrm.h>
1da177e4
LT
58#include <net/snmp.h>
59#include <net/dsfield.h>
6d6ee43e 60#include <net/timewait_sock.h>
18134bed 61#include <net/netdma.h>
3d58b5fa 62#include <net/inet_common.h>
1da177e4
LT
63
64#include <asm/uaccess.h>
65
66#include <linux/proc_fs.h>
67#include <linux/seq_file.h>
68
cfb6eeb4
YH
69#include <linux/crypto.h>
70#include <linux/scatterlist.h>
71
cfb6eeb4 72static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
6edafaaf
GJ
73static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
74 struct request_sock *req);
1da177e4
LT
75
76static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
1da177e4 77
8292a17a
ACM
78static struct inet_connection_sock_af_ops ipv6_mapped;
79static struct inet_connection_sock_af_ops ipv6_specific;
a928630a 80#ifdef CONFIG_TCP_MD5SIG
cfb6eeb4
YH
81static struct tcp_sock_af_ops tcp_sock_ipv6_specific;
82static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
9501f972
YH
83#else
84static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
85 struct in6_addr *addr)
86{
87 return NULL;
88}
a928630a 89#endif
1da177e4 90
1da177e4
LT
91static void tcp_v6_hash(struct sock *sk)
92{
93 if (sk->sk_state != TCP_CLOSE) {
8292a17a 94 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
1da177e4
LT
95 tcp_prot.hash(sk);
96 return;
97 }
98 local_bh_disable();
ab1e0a13 99 __inet6_hash(sk);
1da177e4
LT
100 local_bh_enable();
101 }
102}
103
868c86bc 104static __inline__ __sum16 tcp_v6_check(struct tcphdr *th, int len,
1ab1457c
YH
105 struct in6_addr *saddr,
106 struct in6_addr *daddr,
868c86bc 107 __wsum base)
1da177e4
LT
108{
109 return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
110}
111
a94f723d 112static __u32 tcp_v6_init_sequence(struct sk_buff *skb)
1da177e4 113{
0660e03f
ACM
114 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
115 ipv6_hdr(skb)->saddr.s6_addr32,
aa8223c7
ACM
116 tcp_hdr(skb)->dest,
117 tcp_hdr(skb)->source);
1da177e4
LT
118}
119
1ab1457c 120static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
1da177e4
LT
121 int addr_len)
122{
123 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
1ab1457c 124 struct inet_sock *inet = inet_sk(sk);
d83d8461 125 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
126 struct ipv6_pinfo *np = inet6_sk(sk);
127 struct tcp_sock *tp = tcp_sk(sk);
128 struct in6_addr *saddr = NULL, *final_p = NULL, final;
129 struct flowi fl;
130 struct dst_entry *dst;
131 int addr_type;
132 int err;
133
1ab1457c 134 if (addr_len < SIN6_LEN_RFC2133)
1da177e4
LT
135 return -EINVAL;
136
1ab1457c 137 if (usin->sin6_family != AF_INET6)
1da177e4
LT
138 return(-EAFNOSUPPORT);
139
140 memset(&fl, 0, sizeof(fl));
141
142 if (np->sndflow) {
143 fl.fl6_flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
144 IP6_ECN_flow_init(fl.fl6_flowlabel);
145 if (fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) {
146 struct ip6_flowlabel *flowlabel;
147 flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
148 if (flowlabel == NULL)
149 return -EINVAL;
150 ipv6_addr_copy(&usin->sin6_addr, &flowlabel->dst);
151 fl6_sock_release(flowlabel);
152 }
153 }
154
155 /*
1ab1457c
YH
156 * connect() to INADDR_ANY means loopback (BSD'ism).
157 */
158
159 if(ipv6_addr_any(&usin->sin6_addr))
160 usin->sin6_addr.s6_addr[15] = 0x1;
1da177e4
LT
161
162 addr_type = ipv6_addr_type(&usin->sin6_addr);
163
164 if(addr_type & IPV6_ADDR_MULTICAST)
165 return -ENETUNREACH;
166
167 if (addr_type&IPV6_ADDR_LINKLOCAL) {
168 if (addr_len >= sizeof(struct sockaddr_in6) &&
169 usin->sin6_scope_id) {
170 /* If interface is set while binding, indices
171 * must coincide.
172 */
173 if (sk->sk_bound_dev_if &&
174 sk->sk_bound_dev_if != usin->sin6_scope_id)
175 return -EINVAL;
176
177 sk->sk_bound_dev_if = usin->sin6_scope_id;
178 }
179
180 /* Connect to link-local address requires an interface */
181 if (!sk->sk_bound_dev_if)
182 return -EINVAL;
183 }
184
185 if (tp->rx_opt.ts_recent_stamp &&
186 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
187 tp->rx_opt.ts_recent = 0;
188 tp->rx_opt.ts_recent_stamp = 0;
189 tp->write_seq = 0;
190 }
191
192 ipv6_addr_copy(&np->daddr, &usin->sin6_addr);
193 np->flow_label = fl.fl6_flowlabel;
194
195 /*
196 * TCP over IPv4
197 */
198
199 if (addr_type == IPV6_ADDR_MAPPED) {
d83d8461 200 u32 exthdrlen = icsk->icsk_ext_hdr_len;
1da177e4
LT
201 struct sockaddr_in sin;
202
203 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
204
205 if (__ipv6_only_sock(sk))
206 return -ENETUNREACH;
207
208 sin.sin_family = AF_INET;
209 sin.sin_port = usin->sin6_port;
210 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
211
d83d8461 212 icsk->icsk_af_ops = &ipv6_mapped;
1da177e4 213 sk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
214#ifdef CONFIG_TCP_MD5SIG
215 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
216#endif
1da177e4
LT
217
218 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
219
220 if (err) {
d83d8461
ACM
221 icsk->icsk_ext_hdr_len = exthdrlen;
222 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 223 sk->sk_backlog_rcv = tcp_v6_do_rcv;
cfb6eeb4
YH
224#ifdef CONFIG_TCP_MD5SIG
225 tp->af_specific = &tcp_sock_ipv6_specific;
226#endif
1da177e4
LT
227 goto failure;
228 } else {
229 ipv6_addr_set(&np->saddr, 0, 0, htonl(0x0000FFFF),
230 inet->saddr);
231 ipv6_addr_set(&np->rcv_saddr, 0, 0, htonl(0x0000FFFF),
232 inet->rcv_saddr);
233 }
234
235 return err;
236 }
237
238 if (!ipv6_addr_any(&np->rcv_saddr))
239 saddr = &np->rcv_saddr;
240
241 fl.proto = IPPROTO_TCP;
242 ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
243 ipv6_addr_copy(&fl.fl6_src,
244 (saddr ? saddr : &np->saddr));
245 fl.oif = sk->sk_bound_dev_if;
246 fl.fl_ip_dport = usin->sin6_port;
247 fl.fl_ip_sport = inet->sport;
248
249 if (np->opt && np->opt->srcrt) {
250 struct rt0_hdr *rt0 = (struct rt0_hdr *)np->opt->srcrt;
251 ipv6_addr_copy(&final, &fl.fl6_dst);
252 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
253 final_p = &final;
254 }
255
beb8d13b
VY
256 security_sk_classify_flow(sk, &fl);
257
1da177e4
LT
258 err = ip6_dst_lookup(sk, &dst, &fl);
259 if (err)
260 goto failure;
261 if (final_p)
262 ipv6_addr_copy(&fl.fl6_dst, final_p);
263
52479b62
AD
264 err = __xfrm_lookup(sock_net(sk), &dst, &fl, sk, XFRM_LOOKUP_WAIT);
265 if (err < 0) {
14e50e57
DM
266 if (err == -EREMOTE)
267 err = ip6_dst_blackhole(sk, &dst, &fl);
268 if (err < 0)
269 goto failure;
270 }
1da177e4
LT
271
272 if (saddr == NULL) {
273 saddr = &fl.fl6_src;
274 ipv6_addr_copy(&np->rcv_saddr, saddr);
275 }
276
277 /* set the source address */
278 ipv6_addr_copy(&np->saddr, saddr);
279 inet->rcv_saddr = LOOPBACK4_IPV6;
280
f83ef8c0 281 sk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 282 __ip6_dst_store(sk, dst, NULL, NULL);
1da177e4 283
d83d8461 284 icsk->icsk_ext_hdr_len = 0;
1da177e4 285 if (np->opt)
d83d8461
ACM
286 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
287 np->opt->opt_nflen);
1da177e4
LT
288
289 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
290
291 inet->dport = usin->sin6_port;
292
293 tcp_set_state(sk, TCP_SYN_SENT);
d8313f5c 294 err = inet6_hash_connect(&tcp_death_row, sk);
1da177e4
LT
295 if (err)
296 goto late_failure;
297
298 if (!tp->write_seq)
299 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
300 np->daddr.s6_addr32,
301 inet->sport,
302 inet->dport);
303
304 err = tcp_connect(sk);
305 if (err)
306 goto late_failure;
307
308 return 0;
309
310late_failure:
311 tcp_set_state(sk, TCP_CLOSE);
312 __sk_dst_reset(sk);
313failure:
314 inet->dport = 0;
315 sk->sk_route_caps = 0;
316 return err;
317}
318
319static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
04ce6909 320 int type, int code, int offset, __be32 info)
1da177e4
LT
321{
322 struct ipv6hdr *hdr = (struct ipv6hdr*)skb->data;
505cbfc5 323 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
1da177e4
LT
324 struct ipv6_pinfo *np;
325 struct sock *sk;
326 int err;
1ab1457c 327 struct tcp_sock *tp;
1da177e4 328 __u32 seq;
ca12a1a4 329 struct net *net = dev_net(skb->dev);
1da177e4 330
ca12a1a4 331 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
d86e0dac 332 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
1da177e4
LT
333
334 if (sk == NULL) {
e41b5368
DL
335 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
336 ICMP6_MIB_INERRORS);
1da177e4
LT
337 return;
338 }
339
340 if (sk->sk_state == TCP_TIME_WAIT) {
9469c7b4 341 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
342 return;
343 }
344
345 bh_lock_sock(sk);
346 if (sock_owned_by_user(sk))
de0744af 347 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
1da177e4
LT
348
349 if (sk->sk_state == TCP_CLOSE)
350 goto out;
351
352 tp = tcp_sk(sk);
1ab1457c 353 seq = ntohl(th->seq);
1da177e4
LT
354 if (sk->sk_state != TCP_LISTEN &&
355 !between(seq, tp->snd_una, tp->snd_nxt)) {
de0744af 356 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
357 goto out;
358 }
359
360 np = inet6_sk(sk);
361
362 if (type == ICMPV6_PKT_TOOBIG) {
363 struct dst_entry *dst = NULL;
364
365 if (sock_owned_by_user(sk))
366 goto out;
367 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
368 goto out;
369
370 /* icmp should have updated the destination cache entry */
371 dst = __sk_dst_check(sk, np->dst_cookie);
372
373 if (dst == NULL) {
374 struct inet_sock *inet = inet_sk(sk);
375 struct flowi fl;
376
377 /* BUGGG_FUTURE: Again, it is not clear how
378 to handle rthdr case. Ignore this complexity
379 for now.
380 */
381 memset(&fl, 0, sizeof(fl));
382 fl.proto = IPPROTO_TCP;
383 ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
384 ipv6_addr_copy(&fl.fl6_src, &np->saddr);
385 fl.oif = sk->sk_bound_dev_if;
386 fl.fl_ip_dport = inet->dport;
387 fl.fl_ip_sport = inet->sport;
beb8d13b 388 security_skb_classify_flow(skb, &fl);
1da177e4
LT
389
390 if ((err = ip6_dst_lookup(sk, &dst, &fl))) {
391 sk->sk_err_soft = -err;
392 goto out;
393 }
394
52479b62 395 if ((err = xfrm_lookup(net, &dst, &fl, sk, 0)) < 0) {
1da177e4
LT
396 sk->sk_err_soft = -err;
397 goto out;
398 }
399
400 } else
401 dst_hold(dst);
402
d83d8461 403 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
1da177e4
LT
404 tcp_sync_mss(sk, dst_mtu(dst));
405 tcp_simple_retransmit(sk);
406 } /* else let the usual retransmit timer handle it */
407 dst_release(dst);
408 goto out;
409 }
410
411 icmpv6_err_convert(type, code, &err);
412
60236fdd 413 /* Might be for an request_sock */
1da177e4 414 switch (sk->sk_state) {
60236fdd 415 struct request_sock *req, **prev;
1da177e4
LT
416 case TCP_LISTEN:
417 if (sock_owned_by_user(sk))
418 goto out;
419
8129765a
ACM
420 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
421 &hdr->saddr, inet6_iif(skb));
1da177e4
LT
422 if (!req)
423 goto out;
424
425 /* ICMPs are not backlogged, hence we cannot get
426 * an established socket here.
427 */
547b792c 428 WARN_ON(req->sk != NULL);
1da177e4 429
2e6599cb 430 if (seq != tcp_rsk(req)->snt_isn) {
de0744af 431 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
432 goto out;
433 }
434
463c84b9 435 inet_csk_reqsk_queue_drop(sk, req, prev);
1da177e4
LT
436 goto out;
437
438 case TCP_SYN_SENT:
439 case TCP_SYN_RECV: /* Cannot happen.
1ab1457c 440 It can, it SYNs are crossed. --ANK */
1da177e4 441 if (!sock_owned_by_user(sk)) {
1da177e4
LT
442 sk->sk_err = err;
443 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
444
445 tcp_done(sk);
446 } else
447 sk->sk_err_soft = err;
448 goto out;
449 }
450
451 if (!sock_owned_by_user(sk) && np->recverr) {
452 sk->sk_err = err;
453 sk->sk_error_report(sk);
454 } else
455 sk->sk_err_soft = err;
456
457out:
458 bh_unlock_sock(sk);
459 sock_put(sk);
460}
461
462
fd80eb94 463static int tcp_v6_send_synack(struct sock *sk, struct request_sock *req)
1da177e4 464{
ca304b61 465 struct inet6_request_sock *treq = inet6_rsk(req);
1da177e4
LT
466 struct ipv6_pinfo *np = inet6_sk(sk);
467 struct sk_buff * skb;
468 struct ipv6_txoptions *opt = NULL;
469 struct in6_addr * final_p = NULL, final;
470 struct flowi fl;
fd80eb94 471 struct dst_entry *dst;
1da177e4
LT
472 int err = -1;
473
474 memset(&fl, 0, sizeof(fl));
475 fl.proto = IPPROTO_TCP;
2e6599cb
ACM
476 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
477 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
1da177e4 478 fl.fl6_flowlabel = 0;
2e6599cb
ACM
479 fl.oif = treq->iif;
480 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
fd507037 481 fl.fl_ip_sport = inet_rsk(req)->loc_port;
4237c75c 482 security_req_classify_flow(req, &fl);
1da177e4 483
fd80eb94
DL
484 opt = np->opt;
485 if (opt && opt->srcrt) {
486 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
487 ipv6_addr_copy(&final, &fl.fl6_dst);
488 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
489 final_p = &final;
1da177e4
LT
490 }
491
fd80eb94
DL
492 err = ip6_dst_lookup(sk, &dst, &fl);
493 if (err)
494 goto done;
495 if (final_p)
496 ipv6_addr_copy(&fl.fl6_dst, final_p);
52479b62 497 if ((err = xfrm_lookup(sock_net(sk), &dst, &fl, sk, 0)) < 0)
fd80eb94
DL
498 goto done;
499
1da177e4
LT
500 skb = tcp_make_synack(sk, dst, req);
501 if (skb) {
aa8223c7 502 struct tcphdr *th = tcp_hdr(skb);
1da177e4
LT
503
504 th->check = tcp_v6_check(th, skb->len,
2e6599cb 505 &treq->loc_addr, &treq->rmt_addr,
07f0757a 506 csum_partial(th, skb->len, skb->csum));
1da177e4 507
2e6599cb 508 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
1da177e4 509 err = ip6_xmit(sk, skb, &fl, opt, 0);
b9df3cb8 510 err = net_xmit_eval(err);
1da177e4
LT
511 }
512
513done:
1ab1457c 514 if (opt && opt != np->opt)
1da177e4 515 sock_kfree_s(sk, opt, opt->tot_len);
78b91042 516 dst_release(dst);
1da177e4
LT
517 return err;
518}
519
c6aefafb
GG
520static inline void syn_flood_warning(struct sk_buff *skb)
521{
522#ifdef CONFIG_SYN_COOKIES
523 if (sysctl_tcp_syncookies)
524 printk(KERN_INFO
525 "TCPv6: Possible SYN flooding on port %d. "
526 "Sending cookies.\n", ntohs(tcp_hdr(skb)->dest));
527 else
528#endif
529 printk(KERN_INFO
530 "TCPv6: Possible SYN flooding on port %d. "
531 "Dropping request.\n", ntohs(tcp_hdr(skb)->dest));
532}
533
60236fdd 534static void tcp_v6_reqsk_destructor(struct request_sock *req)
1da177e4 535{
ca304b61
ACM
536 if (inet6_rsk(req)->pktopts)
537 kfree_skb(inet6_rsk(req)->pktopts);
1da177e4
LT
538}
539
cfb6eeb4
YH
540#ifdef CONFIG_TCP_MD5SIG
541static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
542 struct in6_addr *addr)
543{
544 struct tcp_sock *tp = tcp_sk(sk);
545 int i;
546
547 BUG_ON(tp == NULL);
548
549 if (!tp->md5sig_info || !tp->md5sig_info->entries6)
550 return NULL;
551
552 for (i = 0; i < tp->md5sig_info->entries6; i++) {
caad295f 553 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, addr))
f8ab18d2 554 return &tp->md5sig_info->keys6[i].base;
cfb6eeb4
YH
555 }
556 return NULL;
557}
558
559static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
560 struct sock *addr_sk)
561{
562 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
563}
564
565static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
566 struct request_sock *req)
567{
568 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
569}
570
571static int tcp_v6_md5_do_add(struct sock *sk, struct in6_addr *peer,
572 char *newkey, u8 newkeylen)
573{
574 /* Add key to the list */
b0a713e9 575 struct tcp_md5sig_key *key;
cfb6eeb4
YH
576 struct tcp_sock *tp = tcp_sk(sk);
577 struct tcp6_md5sig_key *keys;
578
b0a713e9 579 key = tcp_v6_md5_do_lookup(sk, peer);
cfb6eeb4
YH
580 if (key) {
581 /* modify existing entry - just update that one */
b0a713e9
MD
582 kfree(key->key);
583 key->key = newkey;
584 key->keylen = newkeylen;
cfb6eeb4
YH
585 } else {
586 /* reallocate new list if current one is full. */
587 if (!tp->md5sig_info) {
588 tp->md5sig_info = kzalloc(sizeof(*tp->md5sig_info), GFP_ATOMIC);
589 if (!tp->md5sig_info) {
590 kfree(newkey);
591 return -ENOMEM;
592 }
3d7dbeac 593 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
cfb6eeb4 594 }
aacbe8c8
YH
595 if (tcp_alloc_md5sig_pool() == NULL) {
596 kfree(newkey);
597 return -ENOMEM;
598 }
cfb6eeb4
YH
599 if (tp->md5sig_info->alloced6 == tp->md5sig_info->entries6) {
600 keys = kmalloc((sizeof (tp->md5sig_info->keys6[0]) *
601 (tp->md5sig_info->entries6 + 1)), GFP_ATOMIC);
602
603 if (!keys) {
604 tcp_free_md5sig_pool();
605 kfree(newkey);
606 return -ENOMEM;
607 }
608
609 if (tp->md5sig_info->entries6)
610 memmove(keys, tp->md5sig_info->keys6,
611 (sizeof (tp->md5sig_info->keys6[0]) *
612 tp->md5sig_info->entries6));
613
614 kfree(tp->md5sig_info->keys6);
615 tp->md5sig_info->keys6 = keys;
616 tp->md5sig_info->alloced6++;
617 }
618
619 ipv6_addr_copy(&tp->md5sig_info->keys6[tp->md5sig_info->entries6].addr,
620 peer);
f8ab18d2
DM
621 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.key = newkey;
622 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.keylen = newkeylen;
cfb6eeb4
YH
623
624 tp->md5sig_info->entries6++;
625 }
626 return 0;
627}
628
629static int tcp_v6_md5_add_func(struct sock *sk, struct sock *addr_sk,
630 u8 *newkey, __u8 newkeylen)
631{
632 return tcp_v6_md5_do_add(sk, &inet6_sk(addr_sk)->daddr,
633 newkey, newkeylen);
634}
635
636static int tcp_v6_md5_do_del(struct sock *sk, struct in6_addr *peer)
637{
638 struct tcp_sock *tp = tcp_sk(sk);
639 int i;
640
641 for (i = 0; i < tp->md5sig_info->entries6; i++) {
caad295f 642 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, peer)) {
cfb6eeb4 643 /* Free the key */
f8ab18d2 644 kfree(tp->md5sig_info->keys6[i].base.key);
cfb6eeb4
YH
645 tp->md5sig_info->entries6--;
646
647 if (tp->md5sig_info->entries6 == 0) {
648 kfree(tp->md5sig_info->keys6);
649 tp->md5sig_info->keys6 = NULL;
ca983cef 650 tp->md5sig_info->alloced6 = 0;
cfb6eeb4
YH
651 } else {
652 /* shrink the database */
653 if (tp->md5sig_info->entries6 != i)
654 memmove(&tp->md5sig_info->keys6[i],
655 &tp->md5sig_info->keys6[i+1],
656 (tp->md5sig_info->entries6 - i)
657 * sizeof (tp->md5sig_info->keys6[0]));
658 }
77adefdc
YH
659 tcp_free_md5sig_pool();
660 return 0;
cfb6eeb4
YH
661 }
662 }
663 return -ENOENT;
664}
665
666static void tcp_v6_clear_md5_list (struct sock *sk)
667{
668 struct tcp_sock *tp = tcp_sk(sk);
669 int i;
670
671 if (tp->md5sig_info->entries6) {
672 for (i = 0; i < tp->md5sig_info->entries6; i++)
f8ab18d2 673 kfree(tp->md5sig_info->keys6[i].base.key);
cfb6eeb4
YH
674 tp->md5sig_info->entries6 = 0;
675 tcp_free_md5sig_pool();
676 }
677
678 kfree(tp->md5sig_info->keys6);
679 tp->md5sig_info->keys6 = NULL;
680 tp->md5sig_info->alloced6 = 0;
681
682 if (tp->md5sig_info->entries4) {
683 for (i = 0; i < tp->md5sig_info->entries4; i++)
f8ab18d2 684 kfree(tp->md5sig_info->keys4[i].base.key);
cfb6eeb4
YH
685 tp->md5sig_info->entries4 = 0;
686 tcp_free_md5sig_pool();
687 }
688
689 kfree(tp->md5sig_info->keys4);
690 tp->md5sig_info->keys4 = NULL;
691 tp->md5sig_info->alloced4 = 0;
692}
693
694static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
695 int optlen)
696{
697 struct tcp_md5sig cmd;
698 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
699 u8 *newkey;
700
701 if (optlen < sizeof(cmd))
702 return -EINVAL;
703
704 if (copy_from_user(&cmd, optval, sizeof(cmd)))
705 return -EFAULT;
706
707 if (sin6->sin6_family != AF_INET6)
708 return -EINVAL;
709
710 if (!cmd.tcpm_keylen) {
711 if (!tcp_sk(sk)->md5sig_info)
712 return -ENOENT;
e773e4fa 713 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
cfb6eeb4
YH
714 return tcp_v4_md5_do_del(sk, sin6->sin6_addr.s6_addr32[3]);
715 return tcp_v6_md5_do_del(sk, &sin6->sin6_addr);
716 }
717
718 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
719 return -EINVAL;
720
721 if (!tcp_sk(sk)->md5sig_info) {
722 struct tcp_sock *tp = tcp_sk(sk);
723 struct tcp_md5sig_info *p;
724
725 p = kzalloc(sizeof(struct tcp_md5sig_info), GFP_KERNEL);
726 if (!p)
727 return -ENOMEM;
728
729 tp->md5sig_info = p;
3d7dbeac 730 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
cfb6eeb4
YH
731 }
732
af879cc7 733 newkey = kmemdup(cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4
YH
734 if (!newkey)
735 return -ENOMEM;
e773e4fa 736 if (ipv6_addr_v4mapped(&sin6->sin6_addr)) {
cfb6eeb4
YH
737 return tcp_v4_md5_do_add(sk, sin6->sin6_addr.s6_addr32[3],
738 newkey, cmd.tcpm_keylen);
739 }
740 return tcp_v6_md5_do_add(sk, &sin6->sin6_addr, newkey, cmd.tcpm_keylen);
741}
742
49a72dfb
AL
743static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
744 struct in6_addr *daddr,
745 struct in6_addr *saddr, int nbytes)
cfb6eeb4 746{
cfb6eeb4 747 struct tcp6_pseudohdr *bp;
49a72dfb 748 struct scatterlist sg;
8d26d76d 749
cfb6eeb4 750 bp = &hp->md5_blk.ip6;
cfb6eeb4
YH
751 /* 1. TCP pseudo-header (RFC2460) */
752 ipv6_addr_copy(&bp->saddr, saddr);
753 ipv6_addr_copy(&bp->daddr, daddr);
49a72dfb 754 bp->protocol = cpu_to_be32(IPPROTO_TCP);
00b1304c 755 bp->len = cpu_to_be32(nbytes);
cfb6eeb4 756
49a72dfb
AL
757 sg_init_one(&sg, bp, sizeof(*bp));
758 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
759}
c7da57a1 760
49a72dfb
AL
761static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
762 struct in6_addr *daddr, struct in6_addr *saddr,
763 struct tcphdr *th)
764{
765 struct tcp_md5sig_pool *hp;
766 struct hash_desc *desc;
767
768 hp = tcp_get_md5sig_pool();
769 if (!hp)
770 goto clear_hash_noput;
771 desc = &hp->md5_desc;
772
773 if (crypto_hash_init(desc))
774 goto clear_hash;
775 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
776 goto clear_hash;
777 if (tcp_md5_hash_header(hp, th))
778 goto clear_hash;
779 if (tcp_md5_hash_key(hp, key))
780 goto clear_hash;
781 if (crypto_hash_final(desc, md5_hash))
cfb6eeb4 782 goto clear_hash;
cfb6eeb4 783
cfb6eeb4 784 tcp_put_md5sig_pool();
cfb6eeb4 785 return 0;
49a72dfb 786
cfb6eeb4
YH
787clear_hash:
788 tcp_put_md5sig_pool();
789clear_hash_noput:
790 memset(md5_hash, 0, 16);
49a72dfb 791 return 1;
cfb6eeb4
YH
792}
793
49a72dfb
AL
794static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
795 struct sock *sk, struct request_sock *req,
796 struct sk_buff *skb)
cfb6eeb4
YH
797{
798 struct in6_addr *saddr, *daddr;
49a72dfb
AL
799 struct tcp_md5sig_pool *hp;
800 struct hash_desc *desc;
801 struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4
YH
802
803 if (sk) {
804 saddr = &inet6_sk(sk)->saddr;
805 daddr = &inet6_sk(sk)->daddr;
49a72dfb 806 } else if (req) {
cfb6eeb4
YH
807 saddr = &inet6_rsk(req)->loc_addr;
808 daddr = &inet6_rsk(req)->rmt_addr;
49a72dfb
AL
809 } else {
810 struct ipv6hdr *ip6h = ipv6_hdr(skb);
811 saddr = &ip6h->saddr;
812 daddr = &ip6h->daddr;
cfb6eeb4 813 }
49a72dfb
AL
814
815 hp = tcp_get_md5sig_pool();
816 if (!hp)
817 goto clear_hash_noput;
818 desc = &hp->md5_desc;
819
820 if (crypto_hash_init(desc))
821 goto clear_hash;
822
823 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
824 goto clear_hash;
825 if (tcp_md5_hash_header(hp, th))
826 goto clear_hash;
827 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
828 goto clear_hash;
829 if (tcp_md5_hash_key(hp, key))
830 goto clear_hash;
831 if (crypto_hash_final(desc, md5_hash))
832 goto clear_hash;
833
834 tcp_put_md5sig_pool();
835 return 0;
836
837clear_hash:
838 tcp_put_md5sig_pool();
839clear_hash_noput:
840 memset(md5_hash, 0, 16);
841 return 1;
cfb6eeb4
YH
842}
843
844static int tcp_v6_inbound_md5_hash (struct sock *sk, struct sk_buff *skb)
845{
846 __u8 *hash_location = NULL;
847 struct tcp_md5sig_key *hash_expected;
0660e03f 848 struct ipv6hdr *ip6h = ipv6_hdr(skb);
aa8223c7 849 struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4 850 int genhash;
cfb6eeb4
YH
851 u8 newhash[16];
852
853 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
7d5d5525 854 hash_location = tcp_parse_md5sig_option(th);
cfb6eeb4 855
785957d3
DM
856 /* We've parsed the options - do we have a hash? */
857 if (!hash_expected && !hash_location)
858 return 0;
859
860 if (hash_expected && !hash_location) {
861 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
cfb6eeb4
YH
862 return 1;
863 }
864
785957d3
DM
865 if (!hash_expected && hash_location) {
866 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
cfb6eeb4
YH
867 return 1;
868 }
869
870 /* check the signature */
49a72dfb
AL
871 genhash = tcp_v6_md5_hash_skb(newhash,
872 hash_expected,
873 NULL, NULL, skb);
874
cfb6eeb4
YH
875 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
876 if (net_ratelimit()) {
5b095d98 877 printk(KERN_INFO "MD5 Hash %s for (%pI6, %u)->(%pI6, %u)\n",
cfb6eeb4 878 genhash ? "failed" : "mismatch",
0c6ce78a
HH
879 &ip6h->saddr, ntohs(th->source),
880 &ip6h->daddr, ntohs(th->dest));
cfb6eeb4
YH
881 }
882 return 1;
883 }
884 return 0;
885}
886#endif
887
c6aefafb 888struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
1da177e4 889 .family = AF_INET6,
2e6599cb 890 .obj_size = sizeof(struct tcp6_request_sock),
1da177e4 891 .rtx_syn_ack = tcp_v6_send_synack,
60236fdd
ACM
892 .send_ack = tcp_v6_reqsk_send_ack,
893 .destructor = tcp_v6_reqsk_destructor,
1da177e4
LT
894 .send_reset = tcp_v6_send_reset
895};
896
cfb6eeb4 897#ifdef CONFIG_TCP_MD5SIG
b6332e6c 898static struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
cfb6eeb4 899 .md5_lookup = tcp_v6_reqsk_md5_lookup,
cfb6eeb4 900};
b6332e6c 901#endif
cfb6eeb4 902
6d6ee43e
ACM
903static struct timewait_sock_ops tcp6_timewait_sock_ops = {
904 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
905 .twsk_unique = tcp_twsk_unique,
cfb6eeb4 906 .twsk_destructor= tcp_twsk_destructor,
6d6ee43e
ACM
907};
908
8292a17a 909static void tcp_v6_send_check(struct sock *sk, int len, struct sk_buff *skb)
1da177e4
LT
910{
911 struct ipv6_pinfo *np = inet6_sk(sk);
aa8223c7 912 struct tcphdr *th = tcp_hdr(skb);
1da177e4 913
84fa7933 914 if (skb->ip_summed == CHECKSUM_PARTIAL) {
1da177e4 915 th->check = ~csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP, 0);
663ead3b 916 skb->csum_start = skb_transport_header(skb) - skb->head;
ff1dcadb 917 skb->csum_offset = offsetof(struct tcphdr, check);
1da177e4 918 } else {
1ab1457c 919 th->check = csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP,
07f0757a 920 csum_partial(th, th->doff<<2,
1da177e4
LT
921 skb->csum));
922 }
923}
924
a430a43d
HX
925static int tcp_v6_gso_send_check(struct sk_buff *skb)
926{
927 struct ipv6hdr *ipv6h;
928 struct tcphdr *th;
929
930 if (!pskb_may_pull(skb, sizeof(*th)))
931 return -EINVAL;
932
0660e03f 933 ipv6h = ipv6_hdr(skb);
aa8223c7 934 th = tcp_hdr(skb);
a430a43d
HX
935
936 th->check = 0;
937 th->check = ~csum_ipv6_magic(&ipv6h->saddr, &ipv6h->daddr, skb->len,
938 IPPROTO_TCP, 0);
663ead3b 939 skb->csum_start = skb_transport_header(skb) - skb->head;
ff1dcadb 940 skb->csum_offset = offsetof(struct tcphdr, check);
84fa7933 941 skb->ip_summed = CHECKSUM_PARTIAL;
a430a43d
HX
942 return 0;
943}
1da177e4 944
626e264d
IJ
945static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
946 u32 ts, struct tcp_md5sig_key *key, int rst)
1da177e4 947{
aa8223c7 948 struct tcphdr *th = tcp_hdr(skb), *t1;
1da177e4
LT
949 struct sk_buff *buff;
950 struct flowi fl;
c346dca1 951 struct net *net = dev_net(skb->dst->dev);
e5047992 952 struct sock *ctl_sk = net->ipv6.tcp_sk;
77c676da 953 unsigned int tot_len = sizeof(struct tcphdr);
81ada62d 954 __be32 *topt;
1da177e4 955
626e264d
IJ
956 if (ts)
957 tot_len += TCPOLEN_TSTAMP_ALIGNED;
cfb6eeb4 958#ifdef CONFIG_TCP_MD5SIG
cfb6eeb4
YH
959 if (key)
960 tot_len += TCPOLEN_MD5SIG_ALIGNED;
961#endif
962
cfb6eeb4 963 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1da177e4 964 GFP_ATOMIC);
1ab1457c
YH
965 if (buff == NULL)
966 return;
1da177e4 967
cfb6eeb4 968 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1da177e4 969
cfb6eeb4 970 t1 = (struct tcphdr *) skb_push(buff, tot_len);
1da177e4
LT
971
972 /* Swap the send and the receive. */
973 memset(t1, 0, sizeof(*t1));
974 t1->dest = th->source;
975 t1->source = th->dest;
cfb6eeb4 976 t1->doff = tot_len / 4;
626e264d
IJ
977 t1->seq = htonl(seq);
978 t1->ack_seq = htonl(ack);
979 t1->ack = !rst || !th->ack;
980 t1->rst = rst;
981 t1->window = htons(win);
1da177e4 982
81ada62d
IJ
983 topt = (__be32 *)(t1 + 1);
984
626e264d
IJ
985 if (ts) {
986 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
987 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
988 *topt++ = htonl(tcp_time_stamp);
989 *topt++ = htonl(ts);
990 }
991
cfb6eeb4
YH
992#ifdef CONFIG_TCP_MD5SIG
993 if (key) {
81ada62d
IJ
994 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
995 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
996 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
78e645cb
IJ
997 &ipv6_hdr(skb)->saddr,
998 &ipv6_hdr(skb)->daddr, t1);
cfb6eeb4
YH
999 }
1000#endif
1001
07f0757a 1002 buff->csum = csum_partial(t1, tot_len, 0);
1da177e4
LT
1003
1004 memset(&fl, 0, sizeof(fl));
0660e03f
ACM
1005 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
1006 ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
1da177e4
LT
1007
1008 t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
52cd5750 1009 tot_len, IPPROTO_TCP,
1da177e4
LT
1010 buff->csum);
1011
1012 fl.proto = IPPROTO_TCP;
505cbfc5 1013 fl.oif = inet6_iif(skb);
1da177e4
LT
1014 fl.fl_ip_dport = t1->dest;
1015 fl.fl_ip_sport = t1->source;
beb8d13b 1016 security_skb_classify_flow(skb, &fl);
1da177e4 1017
c20121ae
DL
1018 /* Pass a socket to ip6_dst_lookup either it is for RST
1019 * Underlying function will use this to retrieve the network
1020 * namespace
1021 */
e5047992 1022 if (!ip6_dst_lookup(ctl_sk, &buff->dst, &fl)) {
52479b62 1023 if (xfrm_lookup(net, &buff->dst, &fl, NULL, 0) >= 0) {
e5047992 1024 ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
63231bdd 1025 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
626e264d
IJ
1026 if (rst)
1027 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
1da177e4 1028 return;
ecc51b6d 1029 }
1da177e4
LT
1030 }
1031
1032 kfree_skb(buff);
1033}
1034
626e264d 1035static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1da177e4 1036{
626e264d
IJ
1037 struct tcphdr *th = tcp_hdr(skb);
1038 u32 seq = 0, ack_seq = 0;
fa3e5b4e 1039 struct tcp_md5sig_key *key = NULL;
1da177e4 1040
626e264d 1041 if (th->rst)
1da177e4
LT
1042 return;
1043
626e264d
IJ
1044 if (!ipv6_unicast_destination(skb))
1045 return;
1da177e4 1046
cfb6eeb4 1047#ifdef CONFIG_TCP_MD5SIG
626e264d
IJ
1048 if (sk)
1049 key = tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr);
cfb6eeb4
YH
1050#endif
1051
626e264d
IJ
1052 if (th->ack)
1053 seq = ntohl(th->ack_seq);
1054 else
1055 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
1056 (th->doff << 2);
1da177e4 1057
626e264d
IJ
1058 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, key, 1);
1059}
1da177e4 1060
626e264d
IJ
1061static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
1062 struct tcp_md5sig_key *key)
1063{
1064 tcp_v6_send_response(skb, seq, ack, win, ts, key, 0);
1da177e4
LT
1065}
1066
1067static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
1068{
8feaf0c0 1069 struct inet_timewait_sock *tw = inet_twsk(sk);
cfb6eeb4 1070 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1da177e4 1071
9501f972 1072 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
8feaf0c0 1073 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
9501f972 1074 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw));
1da177e4 1075
8feaf0c0 1076 inet_twsk_put(tw);
1da177e4
LT
1077}
1078
6edafaaf
GJ
1079static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
1080 struct request_sock *req)
1da177e4 1081{
9501f972 1082 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
6edafaaf 1083 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr));
1da177e4
LT
1084}
1085
1086
1087static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
1088{
60236fdd 1089 struct request_sock *req, **prev;
aa8223c7 1090 const struct tcphdr *th = tcp_hdr(skb);
1da177e4
LT
1091 struct sock *nsk;
1092
1093 /* Find possible connection requests. */
8129765a 1094 req = inet6_csk_search_req(sk, &prev, th->source,
0660e03f
ACM
1095 &ipv6_hdr(skb)->saddr,
1096 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1da177e4
LT
1097 if (req)
1098 return tcp_check_req(sk, skb, req, prev);
1099
3b1e0a65 1100 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
d86e0dac
PE
1101 &ipv6_hdr(skb)->saddr, th->source,
1102 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1da177e4
LT
1103
1104 if (nsk) {
1105 if (nsk->sk_state != TCP_TIME_WAIT) {
1106 bh_lock_sock(nsk);
1107 return nsk;
1108 }
9469c7b4 1109 inet_twsk_put(inet_twsk(nsk));
1da177e4
LT
1110 return NULL;
1111 }
1112
c6aefafb 1113#ifdef CONFIG_SYN_COOKIES
1da177e4 1114 if (!th->rst && !th->syn && th->ack)
c6aefafb 1115 sk = cookie_v6_check(sk, skb);
1da177e4
LT
1116#endif
1117 return sk;
1118}
1119
1da177e4
LT
1120/* FIXME: this is substantially similar to the ipv4 code.
1121 * Can some kind of merge be done? -- erics
1122 */
1123static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1124{
ca304b61 1125 struct inet6_request_sock *treq;
1da177e4
LT
1126 struct ipv6_pinfo *np = inet6_sk(sk);
1127 struct tcp_options_received tmp_opt;
1128 struct tcp_sock *tp = tcp_sk(sk);
60236fdd 1129 struct request_sock *req = NULL;
1da177e4 1130 __u32 isn = TCP_SKB_CB(skb)->when;
c6aefafb
GG
1131#ifdef CONFIG_SYN_COOKIES
1132 int want_cookie = 0;
1133#else
1134#define want_cookie 0
1135#endif
1da177e4
LT
1136
1137 if (skb->protocol == htons(ETH_P_IP))
1138 return tcp_v4_conn_request(sk, skb);
1139
1140 if (!ipv6_unicast_destination(skb))
1ab1457c 1141 goto drop;
1da177e4 1142
463c84b9 1143 if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
1da177e4 1144 if (net_ratelimit())
c6aefafb
GG
1145 syn_flood_warning(skb);
1146#ifdef CONFIG_SYN_COOKIES
1147 if (sysctl_tcp_syncookies)
1148 want_cookie = 1;
1149 else
1150#endif
1ab1457c 1151 goto drop;
1da177e4
LT
1152 }
1153
463c84b9 1154 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
1da177e4
LT
1155 goto drop;
1156
ca304b61 1157 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1da177e4
LT
1158 if (req == NULL)
1159 goto drop;
1160
cfb6eeb4
YH
1161#ifdef CONFIG_TCP_MD5SIG
1162 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1163#endif
1164
1da177e4
LT
1165 tcp_clear_options(&tmp_opt);
1166 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1167 tmp_opt.user_mss = tp->rx_opt.user_mss;
1168
1169 tcp_parse_options(skb, &tmp_opt, 0);
1170
4dfc2817 1171 if (want_cookie && !tmp_opt.saw_tstamp)
c6aefafb 1172 tcp_clear_options(&tmp_opt);
c6aefafb 1173
1da177e4
LT
1174 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1175 tcp_openreq_init(req, &tmp_opt, skb);
1176
ca304b61 1177 treq = inet6_rsk(req);
0660e03f
ACM
1178 ipv6_addr_copy(&treq->rmt_addr, &ipv6_hdr(skb)->saddr);
1179 ipv6_addr_copy(&treq->loc_addr, &ipv6_hdr(skb)->daddr);
c6aefafb
GG
1180 if (!want_cookie)
1181 TCP_ECN_create_request(req, tcp_hdr(skb));
1182
1183 if (want_cookie) {
1184 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
4dfc2817 1185 req->cookie_ts = tmp_opt.tstamp_ok;
c6aefafb
GG
1186 } else if (!isn) {
1187 if (ipv6_opt_accepted(sk, skb) ||
1188 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1189 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1190 atomic_inc(&skb->users);
1191 treq->pktopts = skb;
1192 }
1193 treq->iif = sk->sk_bound_dev_if;
1da177e4 1194
c6aefafb
GG
1195 /* So that link locals have meaning */
1196 if (!sk->sk_bound_dev_if &&
1197 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1198 treq->iif = inet6_iif(skb);
1da177e4 1199
a94f723d 1200 isn = tcp_v6_init_sequence(skb);
c6aefafb 1201 }
1da177e4 1202
2e6599cb 1203 tcp_rsk(req)->snt_isn = isn;
1da177e4 1204
4237c75c
VY
1205 security_inet_conn_request(sk, skb, req);
1206
fd80eb94 1207 if (tcp_v6_send_synack(sk, req))
1da177e4
LT
1208 goto drop;
1209
c6aefafb
GG
1210 if (!want_cookie) {
1211 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1212 return 0;
1213 }
1da177e4
LT
1214
1215drop:
1216 if (req)
60236fdd 1217 reqsk_free(req);
1da177e4 1218
1da177e4
LT
1219 return 0; /* don't send reset */
1220}
1221
1222static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
60236fdd 1223 struct request_sock *req,
1da177e4
LT
1224 struct dst_entry *dst)
1225{
78d15e82 1226 struct inet6_request_sock *treq;
1da177e4
LT
1227 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1228 struct tcp6_sock *newtcp6sk;
1229 struct inet_sock *newinet;
1230 struct tcp_sock *newtp;
1231 struct sock *newsk;
1232 struct ipv6_txoptions *opt;
cfb6eeb4
YH
1233#ifdef CONFIG_TCP_MD5SIG
1234 struct tcp_md5sig_key *key;
1235#endif
1da177e4
LT
1236
1237 if (skb->protocol == htons(ETH_P_IP)) {
1238 /*
1239 * v6 mapped
1240 */
1241
1242 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1243
1ab1457c 1244 if (newsk == NULL)
1da177e4
LT
1245 return NULL;
1246
1247 newtcp6sk = (struct tcp6_sock *)newsk;
1248 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1249
1250 newinet = inet_sk(newsk);
1251 newnp = inet6_sk(newsk);
1252 newtp = tcp_sk(newsk);
1253
1254 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1255
1256 ipv6_addr_set(&newnp->daddr, 0, 0, htonl(0x0000FFFF),
1257 newinet->daddr);
1258
1259 ipv6_addr_set(&newnp->saddr, 0, 0, htonl(0x0000FFFF),
1260 newinet->saddr);
1261
1262 ipv6_addr_copy(&newnp->rcv_saddr, &newnp->saddr);
1263
8292a17a 1264 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1da177e4 1265 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
1266#ifdef CONFIG_TCP_MD5SIG
1267 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1268#endif
1269
1da177e4
LT
1270 newnp->pktoptions = NULL;
1271 newnp->opt = NULL;
505cbfc5 1272 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1273 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1da177e4 1274
e6848976
ACM
1275 /*
1276 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1277 * here, tcp_create_openreq_child now does this for us, see the comment in
1278 * that function for the gory details. -acme
1da177e4 1279 */
1da177e4
LT
1280
1281 /* It is tricky place. Until this moment IPv4 tcp
8292a17a 1282 worked with IPv6 icsk.icsk_af_ops.
1da177e4
LT
1283 Sync it now.
1284 */
d83d8461 1285 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1da177e4
LT
1286
1287 return newsk;
1288 }
1289
78d15e82 1290 treq = inet6_rsk(req);
1da177e4
LT
1291 opt = np->opt;
1292
1293 if (sk_acceptq_is_full(sk))
1294 goto out_overflow;
1295
1da177e4
LT
1296 if (dst == NULL) {
1297 struct in6_addr *final_p = NULL, final;
1298 struct flowi fl;
1299
1300 memset(&fl, 0, sizeof(fl));
1301 fl.proto = IPPROTO_TCP;
2e6599cb 1302 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
1da177e4
LT
1303 if (opt && opt->srcrt) {
1304 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
1305 ipv6_addr_copy(&final, &fl.fl6_dst);
1306 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
1307 final_p = &final;
1308 }
2e6599cb 1309 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
1da177e4 1310 fl.oif = sk->sk_bound_dev_if;
2e6599cb 1311 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
fd507037 1312 fl.fl_ip_sport = inet_rsk(req)->loc_port;
4237c75c 1313 security_req_classify_flow(req, &fl);
1da177e4
LT
1314
1315 if (ip6_dst_lookup(sk, &dst, &fl))
1316 goto out;
1317
1318 if (final_p)
1319 ipv6_addr_copy(&fl.fl6_dst, final_p);
1320
52479b62 1321 if ((xfrm_lookup(sock_net(sk), &dst, &fl, sk, 0)) < 0)
1da177e4 1322 goto out;
1ab1457c 1323 }
1da177e4
LT
1324
1325 newsk = tcp_create_openreq_child(sk, req, skb);
1326 if (newsk == NULL)
1327 goto out;
1328
e6848976
ACM
1329 /*
1330 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1331 * count here, tcp_create_openreq_child now does this for us, see the
1332 * comment in that function for the gory details. -acme
1333 */
1da177e4 1334
59eed279 1335 newsk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 1336 __ip6_dst_store(newsk, dst, NULL, NULL);
1da177e4
LT
1337
1338 newtcp6sk = (struct tcp6_sock *)newsk;
1339 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1340
1341 newtp = tcp_sk(newsk);
1342 newinet = inet_sk(newsk);
1343 newnp = inet6_sk(newsk);
1344
1345 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1346
2e6599cb
ACM
1347 ipv6_addr_copy(&newnp->daddr, &treq->rmt_addr);
1348 ipv6_addr_copy(&newnp->saddr, &treq->loc_addr);
1349 ipv6_addr_copy(&newnp->rcv_saddr, &treq->loc_addr);
1350 newsk->sk_bound_dev_if = treq->iif;
1da177e4 1351
1ab1457c 1352 /* Now IPv6 options...
1da177e4
LT
1353
1354 First: no IPv4 options.
1355 */
1356 newinet->opt = NULL;
d35690be 1357 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1358
1359 /* Clone RX bits */
1360 newnp->rxopt.all = np->rxopt.all;
1361
1362 /* Clone pktoptions received with SYN */
1363 newnp->pktoptions = NULL;
2e6599cb
ACM
1364 if (treq->pktopts != NULL) {
1365 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
1366 kfree_skb(treq->pktopts);
1367 treq->pktopts = NULL;
1da177e4
LT
1368 if (newnp->pktoptions)
1369 skb_set_owner_r(newnp->pktoptions, newsk);
1370 }
1371 newnp->opt = NULL;
505cbfc5 1372 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1373 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1da177e4
LT
1374
1375 /* Clone native IPv6 options from listening socket (if any)
1376
1377 Yes, keeping reference count would be much more clever,
1378 but we make one more one thing there: reattach optmem
1379 to newsk.
1380 */
1381 if (opt) {
1382 newnp->opt = ipv6_dup_options(newsk, opt);
1383 if (opt != np->opt)
1384 sock_kfree_s(sk, opt, opt->tot_len);
1385 }
1386
d83d8461 1387 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1da177e4 1388 if (newnp->opt)
d83d8461
ACM
1389 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1390 newnp->opt->opt_flen);
1da177e4 1391
5d424d5a 1392 tcp_mtup_init(newsk);
1da177e4
LT
1393 tcp_sync_mss(newsk, dst_mtu(dst));
1394 newtp->advmss = dst_metric(dst, RTAX_ADVMSS);
1395 tcp_initialize_rcv_mss(newsk);
1396
1397 newinet->daddr = newinet->saddr = newinet->rcv_saddr = LOOPBACK4_IPV6;
1398
cfb6eeb4
YH
1399#ifdef CONFIG_TCP_MD5SIG
1400 /* Copy over the MD5 key from the original socket */
1401 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1402 /* We're using one, so create a matching key
1403 * on the newsk structure. If we fail to get
1404 * memory, then we end up not copying the key
1405 * across. Shucks.
1406 */
af879cc7
ACM
1407 char *newkey = kmemdup(key->key, key->keylen, GFP_ATOMIC);
1408 if (newkey != NULL)
cfb6eeb4
YH
1409 tcp_v6_md5_do_add(newsk, &inet6_sk(sk)->daddr,
1410 newkey, key->keylen);
cfb6eeb4
YH
1411 }
1412#endif
1413
ab1e0a13 1414 __inet6_hash(newsk);
e56d8b8a 1415 __inet_inherit_port(sk, newsk);
1da177e4
LT
1416
1417 return newsk;
1418
1419out_overflow:
de0744af 1420 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1da177e4 1421out:
de0744af 1422 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1423 if (opt && opt != np->opt)
1424 sock_kfree_s(sk, opt, opt->tot_len);
1425 dst_release(dst);
1426 return NULL;
1427}
1428
b51655b9 1429static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1da177e4 1430{
84fa7933 1431 if (skb->ip_summed == CHECKSUM_COMPLETE) {
aa8223c7 1432 if (!tcp_v6_check(tcp_hdr(skb), skb->len, &ipv6_hdr(skb)->saddr,
0660e03f 1433 &ipv6_hdr(skb)->daddr, skb->csum)) {
fb286bb2 1434 skb->ip_summed = CHECKSUM_UNNECESSARY;
1da177e4 1435 return 0;
fb286bb2 1436 }
1da177e4 1437 }
fb286bb2 1438
aa8223c7 1439 skb->csum = ~csum_unfold(tcp_v6_check(tcp_hdr(skb), skb->len,
0660e03f
ACM
1440 &ipv6_hdr(skb)->saddr,
1441 &ipv6_hdr(skb)->daddr, 0));
fb286bb2 1442
1da177e4 1443 if (skb->len <= 76) {
fb286bb2 1444 return __skb_checksum_complete(skb);
1da177e4
LT
1445 }
1446 return 0;
1447}
1448
1449/* The socket must have it's spinlock held when we get
1450 * here.
1451 *
1452 * We have a potential double-lock case here, so even when
1453 * doing backlog processing we use the BH locking scheme.
1454 * This is because we cannot sleep with the original spinlock
1455 * held.
1456 */
1457static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1458{
1459 struct ipv6_pinfo *np = inet6_sk(sk);
1460 struct tcp_sock *tp;
1461 struct sk_buff *opt_skb = NULL;
1462
1463 /* Imagine: socket is IPv6. IPv4 packet arrives,
1464 goes to IPv4 receive handler and backlogged.
1465 From backlog it always goes here. Kerboom...
1466 Fortunately, tcp_rcv_established and rcv_established
1467 handle them correctly, but it is not case with
1468 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1469 */
1470
1471 if (skb->protocol == htons(ETH_P_IP))
1472 return tcp_v4_do_rcv(sk, skb);
1473
cfb6eeb4
YH
1474#ifdef CONFIG_TCP_MD5SIG
1475 if (tcp_v6_inbound_md5_hash (sk, skb))
1476 goto discard;
1477#endif
1478
fda9ef5d 1479 if (sk_filter(sk, skb))
1da177e4
LT
1480 goto discard;
1481
1482 /*
1483 * socket locking is here for SMP purposes as backlog rcv
1484 * is currently called with bh processing disabled.
1485 */
1486
1487 /* Do Stevens' IPV6_PKTOPTIONS.
1488
1489 Yes, guys, it is the only place in our code, where we
1490 may make it not affecting IPv4.
1491 The rest of code is protocol independent,
1492 and I do not like idea to uglify IPv4.
1493
1494 Actually, all the idea behind IPV6_PKTOPTIONS
1495 looks not very well thought. For now we latch
1496 options, received in the last packet, enqueued
1497 by tcp. Feel free to propose better solution.
1ab1457c 1498 --ANK (980728)
1da177e4
LT
1499 */
1500 if (np->rxopt.all)
1501 opt_skb = skb_clone(skb, GFP_ATOMIC);
1502
1503 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1504 TCP_CHECK_TIMER(sk);
aa8223c7 1505 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1da177e4
LT
1506 goto reset;
1507 TCP_CHECK_TIMER(sk);
1508 if (opt_skb)
1509 goto ipv6_pktoptions;
1510 return 0;
1511 }
1512
ab6a5bb6 1513 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1da177e4
LT
1514 goto csum_err;
1515
1ab1457c 1516 if (sk->sk_state == TCP_LISTEN) {
1da177e4
LT
1517 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1518 if (!nsk)
1519 goto discard;
1520
1521 /*
1522 * Queue it on the new socket if the new socket is active,
1523 * otherwise we just shortcircuit this and continue with
1524 * the new socket..
1525 */
1ab1457c 1526 if(nsk != sk) {
1da177e4
LT
1527 if (tcp_child_process(sk, nsk, skb))
1528 goto reset;
1529 if (opt_skb)
1530 __kfree_skb(opt_skb);
1531 return 0;
1532 }
1533 }
1534
1535 TCP_CHECK_TIMER(sk);
aa8223c7 1536 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1da177e4
LT
1537 goto reset;
1538 TCP_CHECK_TIMER(sk);
1539 if (opt_skb)
1540 goto ipv6_pktoptions;
1541 return 0;
1542
1543reset:
cfb6eeb4 1544 tcp_v6_send_reset(sk, skb);
1da177e4
LT
1545discard:
1546 if (opt_skb)
1547 __kfree_skb(opt_skb);
1548 kfree_skb(skb);
1549 return 0;
1550csum_err:
63231bdd 1551 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1da177e4
LT
1552 goto discard;
1553
1554
1555ipv6_pktoptions:
1556 /* Do you ask, what is it?
1557
1558 1. skb was enqueued by tcp.
1559 2. skb is added to tail of read queue, rather than out of order.
1560 3. socket is not in passive state.
1561 4. Finally, it really contains options, which user wants to receive.
1562 */
1563 tp = tcp_sk(sk);
1564 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1565 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
333fad53 1566 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
505cbfc5 1567 np->mcast_oif = inet6_iif(opt_skb);
333fad53 1568 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
0660e03f 1569 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
1da177e4
LT
1570 if (ipv6_opt_accepted(sk, opt_skb)) {
1571 skb_set_owner_r(opt_skb, sk);
1572 opt_skb = xchg(&np->pktoptions, opt_skb);
1573 } else {
1574 __kfree_skb(opt_skb);
1575 opt_skb = xchg(&np->pktoptions, NULL);
1576 }
1577 }
1578
1579 if (opt_skb)
1580 kfree_skb(opt_skb);
1581 return 0;
1582}
1583
e5bbef20 1584static int tcp_v6_rcv(struct sk_buff *skb)
1da177e4 1585{
1ab1457c 1586 struct tcphdr *th;
1da177e4
LT
1587 struct sock *sk;
1588 int ret;
a86b1e30 1589 struct net *net = dev_net(skb->dev);
1da177e4
LT
1590
1591 if (skb->pkt_type != PACKET_HOST)
1592 goto discard_it;
1593
1594 /*
1595 * Count it even if it's bad.
1596 */
63231bdd 1597 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1da177e4
LT
1598
1599 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1600 goto discard_it;
1601
aa8223c7 1602 th = tcp_hdr(skb);
1da177e4
LT
1603
1604 if (th->doff < sizeof(struct tcphdr)/4)
1605 goto bad_packet;
1606 if (!pskb_may_pull(skb, th->doff*4))
1607 goto discard_it;
1608
60476372 1609 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1da177e4
LT
1610 goto bad_packet;
1611
aa8223c7 1612 th = tcp_hdr(skb);
1da177e4
LT
1613 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1614 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1615 skb->len - th->doff*4);
1616 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1617 TCP_SKB_CB(skb)->when = 0;
0660e03f 1618 TCP_SKB_CB(skb)->flags = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4
LT
1619 TCP_SKB_CB(skb)->sacked = 0;
1620
9a1f27c4 1621 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1da177e4
LT
1622 if (!sk)
1623 goto no_tcp_socket;
1624
1625process:
1626 if (sk->sk_state == TCP_TIME_WAIT)
1627 goto do_time_wait;
1628
1629 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1630 goto discard_and_relse;
1631
fda9ef5d 1632 if (sk_filter(sk, skb))
1da177e4
LT
1633 goto discard_and_relse;
1634
1635 skb->dev = NULL;
1636
293b9c42 1637 bh_lock_sock_nested(sk);
1da177e4
LT
1638 ret = 0;
1639 if (!sock_owned_by_user(sk)) {
1a2449a8 1640#ifdef CONFIG_NET_DMA
1ab1457c 1641 struct tcp_sock *tp = tcp_sk(sk);
b4caea8a
DM
1642 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
1643 tp->ucopy.dma_chan = get_softnet_dma();
1ab1457c
YH
1644 if (tp->ucopy.dma_chan)
1645 ret = tcp_v6_do_rcv(sk, skb);
1646 else
1a2449a8
CL
1647#endif
1648 {
1649 if (!tcp_prequeue(sk, skb))
1650 ret = tcp_v6_do_rcv(sk, skb);
1651 }
1da177e4
LT
1652 } else
1653 sk_add_backlog(sk, skb);
1654 bh_unlock_sock(sk);
1655
1656 sock_put(sk);
1657 return ret ? -1 : 0;
1658
1659no_tcp_socket:
1660 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1661 goto discard_it;
1662
1663 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1664bad_packet:
63231bdd 1665 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1da177e4 1666 } else {
cfb6eeb4 1667 tcp_v6_send_reset(NULL, skb);
1da177e4
LT
1668 }
1669
1670discard_it:
1671
1672 /*
1673 * Discard frame
1674 */
1675
1676 kfree_skb(skb);
1677 return 0;
1678
1679discard_and_relse:
1680 sock_put(sk);
1681 goto discard_it;
1682
1683do_time_wait:
1684 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
9469c7b4 1685 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1686 goto discard_it;
1687 }
1688
1689 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
63231bdd 1690 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
9469c7b4 1691 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1692 goto discard_it;
1693 }
1694
9469c7b4 1695 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1da177e4
LT
1696 case TCP_TW_SYN:
1697 {
1698 struct sock *sk2;
1699
c346dca1 1700 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
0660e03f 1701 &ipv6_hdr(skb)->daddr,
505cbfc5 1702 ntohs(th->dest), inet6_iif(skb));
1da177e4 1703 if (sk2 != NULL) {
295ff7ed
ACM
1704 struct inet_timewait_sock *tw = inet_twsk(sk);
1705 inet_twsk_deschedule(tw, &tcp_death_row);
1706 inet_twsk_put(tw);
1da177e4
LT
1707 sk = sk2;
1708 goto process;
1709 }
1710 /* Fall through to ACK */
1711 }
1712 case TCP_TW_ACK:
1713 tcp_v6_timewait_ack(sk, skb);
1714 break;
1715 case TCP_TW_RST:
1716 goto no_tcp_socket;
1717 case TCP_TW_SUCCESS:;
1718 }
1719 goto discard_it;
1720}
1721
1da177e4
LT
1722static int tcp_v6_remember_stamp(struct sock *sk)
1723{
1724 /* Alas, not yet... */
1725 return 0;
1726}
1727
8292a17a 1728static struct inet_connection_sock_af_ops ipv6_specific = {
543d9cfe
ACM
1729 .queue_xmit = inet6_csk_xmit,
1730 .send_check = tcp_v6_send_check,
1731 .rebuild_header = inet6_sk_rebuild_header,
1732 .conn_request = tcp_v6_conn_request,
1733 .syn_recv_sock = tcp_v6_syn_recv_sock,
1734 .remember_stamp = tcp_v6_remember_stamp,
1735 .net_header_len = sizeof(struct ipv6hdr),
1736 .setsockopt = ipv6_setsockopt,
1737 .getsockopt = ipv6_getsockopt,
1738 .addr2sockaddr = inet6_csk_addr2sockaddr,
1739 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1740 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1741#ifdef CONFIG_COMPAT
543d9cfe
ACM
1742 .compat_setsockopt = compat_ipv6_setsockopt,
1743 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1744#endif
1da177e4
LT
1745};
1746
cfb6eeb4 1747#ifdef CONFIG_TCP_MD5SIG
a928630a 1748static struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
cfb6eeb4 1749 .md5_lookup = tcp_v6_md5_lookup,
49a72dfb 1750 .calc_md5_hash = tcp_v6_md5_hash_skb,
cfb6eeb4
YH
1751 .md5_add = tcp_v6_md5_add_func,
1752 .md5_parse = tcp_v6_parse_md5_keys,
cfb6eeb4 1753};
a928630a 1754#endif
cfb6eeb4 1755
1da177e4
LT
1756/*
1757 * TCP over IPv4 via INET6 API
1758 */
1759
8292a17a 1760static struct inet_connection_sock_af_ops ipv6_mapped = {
543d9cfe
ACM
1761 .queue_xmit = ip_queue_xmit,
1762 .send_check = tcp_v4_send_check,
1763 .rebuild_header = inet_sk_rebuild_header,
1764 .conn_request = tcp_v6_conn_request,
1765 .syn_recv_sock = tcp_v6_syn_recv_sock,
1766 .remember_stamp = tcp_v4_remember_stamp,
1767 .net_header_len = sizeof(struct iphdr),
1768 .setsockopt = ipv6_setsockopt,
1769 .getsockopt = ipv6_getsockopt,
1770 .addr2sockaddr = inet6_csk_addr2sockaddr,
1771 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1772 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1773#ifdef CONFIG_COMPAT
543d9cfe
ACM
1774 .compat_setsockopt = compat_ipv6_setsockopt,
1775 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1776#endif
1da177e4
LT
1777};
1778
cfb6eeb4 1779#ifdef CONFIG_TCP_MD5SIG
a928630a 1780static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
cfb6eeb4 1781 .md5_lookup = tcp_v4_md5_lookup,
49a72dfb 1782 .calc_md5_hash = tcp_v4_md5_hash_skb,
cfb6eeb4
YH
1783 .md5_add = tcp_v6_md5_add_func,
1784 .md5_parse = tcp_v6_parse_md5_keys,
cfb6eeb4 1785};
a928630a 1786#endif
cfb6eeb4 1787
1da177e4
LT
1788/* NOTE: A lot of things set to zero explicitly by call to
1789 * sk_alloc() so need not be done here.
1790 */
1791static int tcp_v6_init_sock(struct sock *sk)
1792{
6687e988 1793 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
1794 struct tcp_sock *tp = tcp_sk(sk);
1795
1796 skb_queue_head_init(&tp->out_of_order_queue);
1797 tcp_init_xmit_timers(sk);
1798 tcp_prequeue_init(tp);
1799
6687e988 1800 icsk->icsk_rto = TCP_TIMEOUT_INIT;
1da177e4
LT
1801 tp->mdev = TCP_TIMEOUT_INIT;
1802
1803 /* So many TCP implementations out there (incorrectly) count the
1804 * initial SYN frame in their delayed-ACK and congestion control
1805 * algorithms that we must have the following bandaid to talk
1806 * efficiently to them. -DaveM
1807 */
1808 tp->snd_cwnd = 2;
1809
1810 /* See draft-stevens-tcpca-spec-01 for discussion of the
1811 * initialization of these values.
1812 */
1813 tp->snd_ssthresh = 0x7fffffff;
1814 tp->snd_cwnd_clamp = ~0;
c1b4a7e6 1815 tp->mss_cache = 536;
1da177e4
LT
1816
1817 tp->reordering = sysctl_tcp_reordering;
1818
1819 sk->sk_state = TCP_CLOSE;
1820
8292a17a 1821 icsk->icsk_af_ops = &ipv6_specific;
6687e988 1822 icsk->icsk_ca_ops = &tcp_init_congestion_ops;
d83d8461 1823 icsk->icsk_sync_mss = tcp_sync_mss;
1da177e4
LT
1824 sk->sk_write_space = sk_stream_write_space;
1825 sock_set_flag(sk, SOCK_USE_WRITE_QUEUE);
1826
cfb6eeb4
YH
1827#ifdef CONFIG_TCP_MD5SIG
1828 tp->af_specific = &tcp_sock_ipv6_specific;
1829#endif
1830
1da177e4
LT
1831 sk->sk_sndbuf = sysctl_tcp_wmem[1];
1832 sk->sk_rcvbuf = sysctl_tcp_rmem[1];
1833
eb4dea58 1834 local_bh_disable();
1748376b 1835 percpu_counter_inc(&tcp_sockets_allocated);
eb4dea58 1836 local_bh_enable();
1da177e4
LT
1837
1838 return 0;
1839}
1840
7d06b2e0 1841static void tcp_v6_destroy_sock(struct sock *sk)
1da177e4 1842{
cfb6eeb4
YH
1843#ifdef CONFIG_TCP_MD5SIG
1844 /* Clean up the MD5 key list */
1845 if (tcp_sk(sk)->md5sig_info)
1846 tcp_v6_clear_md5_list(sk);
1847#endif
1da177e4 1848 tcp_v4_destroy_sock(sk);
7d06b2e0 1849 inet6_destroy_sock(sk);
1da177e4
LT
1850}
1851
952a10be 1852#ifdef CONFIG_PROC_FS
1da177e4 1853/* Proc filesystem TCPv6 sock list dumping. */
1ab1457c 1854static void get_openreq6(struct seq_file *seq,
60236fdd 1855 struct sock *sk, struct request_sock *req, int i, int uid)
1da177e4 1856{
1da177e4 1857 int ttd = req->expires - jiffies;
ca304b61
ACM
1858 struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1859 struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1da177e4
LT
1860
1861 if (ttd < 0)
1862 ttd = 0;
1863
1da177e4
LT
1864 seq_printf(seq,
1865 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1866 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1867 i,
1868 src->s6_addr32[0], src->s6_addr32[1],
1869 src->s6_addr32[2], src->s6_addr32[3],
fd507037 1870 ntohs(inet_rsk(req)->loc_port),
1da177e4
LT
1871 dest->s6_addr32[0], dest->s6_addr32[1],
1872 dest->s6_addr32[2], dest->s6_addr32[3],
2e6599cb 1873 ntohs(inet_rsk(req)->rmt_port),
1da177e4
LT
1874 TCP_SYN_RECV,
1875 0,0, /* could print option size, but that is af dependent. */
1ab1457c
YH
1876 1, /* timers active (only the expire timer) */
1877 jiffies_to_clock_t(ttd),
1da177e4
LT
1878 req->retrans,
1879 uid,
1ab1457c 1880 0, /* non standard timer */
1da177e4
LT
1881 0, /* open_requests have no inode */
1882 0, req);
1883}
1884
1885static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1886{
1887 struct in6_addr *dest, *src;
1888 __u16 destp, srcp;
1889 int timer_active;
1890 unsigned long timer_expires;
1891 struct inet_sock *inet = inet_sk(sp);
1892 struct tcp_sock *tp = tcp_sk(sp);
463c84b9 1893 const struct inet_connection_sock *icsk = inet_csk(sp);
1da177e4
LT
1894 struct ipv6_pinfo *np = inet6_sk(sp);
1895
1896 dest = &np->daddr;
1897 src = &np->rcv_saddr;
1898 destp = ntohs(inet->dport);
1899 srcp = ntohs(inet->sport);
463c84b9
ACM
1900
1901 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1da177e4 1902 timer_active = 1;
463c84b9
ACM
1903 timer_expires = icsk->icsk_timeout;
1904 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1da177e4 1905 timer_active = 4;
463c84b9 1906 timer_expires = icsk->icsk_timeout;
1da177e4
LT
1907 } else if (timer_pending(&sp->sk_timer)) {
1908 timer_active = 2;
1909 timer_expires = sp->sk_timer.expires;
1910 } else {
1911 timer_active = 0;
1912 timer_expires = jiffies;
1913 }
1914
1915 seq_printf(seq,
1916 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
7be87351 1917 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %p %lu %lu %u %u %d\n",
1da177e4
LT
1918 i,
1919 src->s6_addr32[0], src->s6_addr32[1],
1920 src->s6_addr32[2], src->s6_addr32[3], srcp,
1921 dest->s6_addr32[0], dest->s6_addr32[1],
1922 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1ab1457c 1923 sp->sk_state,
47da8ee6
SS
1924 tp->write_seq-tp->snd_una,
1925 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1da177e4
LT
1926 timer_active,
1927 jiffies_to_clock_t(timer_expires - jiffies),
463c84b9 1928 icsk->icsk_retransmits,
1da177e4 1929 sock_i_uid(sp),
6687e988 1930 icsk->icsk_probes_out,
1da177e4
LT
1931 sock_i_ino(sp),
1932 atomic_read(&sp->sk_refcnt), sp,
7be87351
SH
1933 jiffies_to_clock_t(icsk->icsk_rto),
1934 jiffies_to_clock_t(icsk->icsk_ack.ato),
463c84b9 1935 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
1da177e4
LT
1936 tp->snd_cwnd, tp->snd_ssthresh>=0xFFFF?-1:tp->snd_ssthresh
1937 );
1938}
1939
1ab1457c 1940static void get_timewait6_sock(struct seq_file *seq,
8feaf0c0 1941 struct inet_timewait_sock *tw, int i)
1da177e4
LT
1942{
1943 struct in6_addr *dest, *src;
1944 __u16 destp, srcp;
0fa1a53e 1945 struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
1da177e4
LT
1946 int ttd = tw->tw_ttd - jiffies;
1947
1948 if (ttd < 0)
1949 ttd = 0;
1950
0fa1a53e
ACM
1951 dest = &tw6->tw_v6_daddr;
1952 src = &tw6->tw_v6_rcv_saddr;
1da177e4
LT
1953 destp = ntohs(tw->tw_dport);
1954 srcp = ntohs(tw->tw_sport);
1955
1956 seq_printf(seq,
1957 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1958 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1959 i,
1960 src->s6_addr32[0], src->s6_addr32[1],
1961 src->s6_addr32[2], src->s6_addr32[3], srcp,
1962 dest->s6_addr32[0], dest->s6_addr32[1],
1963 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1964 tw->tw_substate, 0, 0,
1965 3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
1966 atomic_read(&tw->tw_refcnt), tw);
1967}
1968
1da177e4
LT
1969static int tcp6_seq_show(struct seq_file *seq, void *v)
1970{
1971 struct tcp_iter_state *st;
1972
1973 if (v == SEQ_START_TOKEN) {
1974 seq_puts(seq,
1975 " sl "
1976 "local_address "
1977 "remote_address "
1978 "st tx_queue rx_queue tr tm->when retrnsmt"
1979 " uid timeout inode\n");
1980 goto out;
1981 }
1982 st = seq->private;
1983
1984 switch (st->state) {
1985 case TCP_SEQ_STATE_LISTENING:
1986 case TCP_SEQ_STATE_ESTABLISHED:
1987 get_tcp6_sock(seq, v, st->num);
1988 break;
1989 case TCP_SEQ_STATE_OPENREQ:
1990 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1991 break;
1992 case TCP_SEQ_STATE_TIME_WAIT:
1993 get_timewait6_sock(seq, v, st->num);
1994 break;
1995 }
1996out:
1997 return 0;
1998}
1999
1da177e4 2000static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1da177e4
LT
2001 .name = "tcp6",
2002 .family = AF_INET6,
5f4472c5
DL
2003 .seq_fops = {
2004 .owner = THIS_MODULE,
2005 },
9427c4b3
DL
2006 .seq_ops = {
2007 .show = tcp6_seq_show,
2008 },
1da177e4
LT
2009};
2010
6f8b13bc 2011int tcp6_proc_init(struct net *net)
1da177e4 2012{
6f8b13bc 2013 return tcp_proc_register(net, &tcp6_seq_afinfo);
1da177e4
LT
2014}
2015
6f8b13bc 2016void tcp6_proc_exit(struct net *net)
1da177e4 2017{
6f8b13bc 2018 tcp_proc_unregister(net, &tcp6_seq_afinfo);
1da177e4
LT
2019}
2020#endif
2021
2022struct proto tcpv6_prot = {
2023 .name = "TCPv6",
2024 .owner = THIS_MODULE,
2025 .close = tcp_close,
2026 .connect = tcp_v6_connect,
2027 .disconnect = tcp_disconnect,
463c84b9 2028 .accept = inet_csk_accept,
1da177e4
LT
2029 .ioctl = tcp_ioctl,
2030 .init = tcp_v6_init_sock,
2031 .destroy = tcp_v6_destroy_sock,
2032 .shutdown = tcp_shutdown,
2033 .setsockopt = tcp_setsockopt,
2034 .getsockopt = tcp_getsockopt,
1da177e4
LT
2035 .recvmsg = tcp_recvmsg,
2036 .backlog_rcv = tcp_v6_do_rcv,
2037 .hash = tcp_v6_hash,
ab1e0a13
ACM
2038 .unhash = inet_unhash,
2039 .get_port = inet_csk_get_port,
1da177e4
LT
2040 .enter_memory_pressure = tcp_enter_memory_pressure,
2041 .sockets_allocated = &tcp_sockets_allocated,
2042 .memory_allocated = &tcp_memory_allocated,
2043 .memory_pressure = &tcp_memory_pressure,
0a5578cf 2044 .orphan_count = &tcp_orphan_count,
1da177e4
LT
2045 .sysctl_mem = sysctl_tcp_mem,
2046 .sysctl_wmem = sysctl_tcp_wmem,
2047 .sysctl_rmem = sysctl_tcp_rmem,
2048 .max_header = MAX_TCP_HEADER,
2049 .obj_size = sizeof(struct tcp6_sock),
3ab5aee7 2050 .slab_flags = SLAB_DESTROY_BY_RCU,
6d6ee43e 2051 .twsk_prot = &tcp6_timewait_sock_ops,
60236fdd 2052 .rsk_prot = &tcp6_request_sock_ops,
39d8cda7 2053 .h.hashinfo = &tcp_hashinfo,
543d9cfe
ACM
2054#ifdef CONFIG_COMPAT
2055 .compat_setsockopt = compat_tcp_setsockopt,
2056 .compat_getsockopt = compat_tcp_getsockopt,
2057#endif
1da177e4
LT
2058};
2059
2060static struct inet6_protocol tcpv6_protocol = {
2061 .handler = tcp_v6_rcv,
2062 .err_handler = tcp_v6_err,
a430a43d 2063 .gso_send_check = tcp_v6_gso_send_check,
adcfc7d0 2064 .gso_segment = tcp_tso_segment,
1da177e4
LT
2065 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
2066};
2067
1da177e4
LT
2068static struct inet_protosw tcpv6_protosw = {
2069 .type = SOCK_STREAM,
2070 .protocol = IPPROTO_TCP,
2071 .prot = &tcpv6_prot,
2072 .ops = &inet6_stream_ops,
2073 .capability = -1,
2074 .no_check = 0,
d83d8461
ACM
2075 .flags = INET_PROTOSW_PERMANENT |
2076 INET_PROTOSW_ICSK,
1da177e4
LT
2077};
2078
93ec926b
DL
2079static int tcpv6_net_init(struct net *net)
2080{
5677242f
DL
2081 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2082 SOCK_RAW, IPPROTO_TCP, net);
93ec926b
DL
2083}
2084
2085static void tcpv6_net_exit(struct net *net)
2086{
5677242f 2087 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
d315492b 2088 inet_twsk_purge(net, &tcp_hashinfo, &tcp_death_row, AF_INET6);
93ec926b
DL
2089}
2090
2091static struct pernet_operations tcpv6_net_ops = {
2092 .init = tcpv6_net_init,
2093 .exit = tcpv6_net_exit,
2094};
2095
7f4e4868 2096int __init tcpv6_init(void)
1da177e4 2097{
7f4e4868
DL
2098 int ret;
2099
2100 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2101 if (ret)
2102 goto out;
2103
1da177e4 2104 /* register inet6 protocol */
7f4e4868
DL
2105 ret = inet6_register_protosw(&tcpv6_protosw);
2106 if (ret)
2107 goto out_tcpv6_protocol;
2108
93ec926b 2109 ret = register_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2110 if (ret)
2111 goto out_tcpv6_protosw;
2112out:
2113 return ret;
ae0f7d5f 2114
7f4e4868
DL
2115out_tcpv6_protocol:
2116 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2117out_tcpv6_protosw:
2118 inet6_unregister_protosw(&tcpv6_protosw);
2119 goto out;
2120}
2121
09f7709f 2122void tcpv6_exit(void)
7f4e4868 2123{
93ec926b 2124 unregister_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2125 inet6_unregister_protosw(&tcpv6_protosw);
2126 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
1da177e4 2127}