]> bbs.cooldavid.org Git - net-next-2.6.git/blame - net/ipv6/tcp_ipv6.c
TCPCT part 1f: Initiator Cookie => Responder
[net-next-2.6.git] / net / ipv6 / tcp_ipv6.c
CommitLineData
1da177e4
LT
1/*
2 * TCP over IPv6
1ab1457c 3 * Linux INET6 implementation
1da177e4
LT
4 *
5 * Authors:
1ab1457c 6 * Pedro Roque <roque@di.fc.ul.pt>
1da177e4 7 *
1ab1457c 8 * Based on:
1da177e4
LT
9 * linux/net/ipv4/tcp.c
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
12 *
13 * Fixes:
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allow both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 */
25
eb4dea58 26#include <linux/bottom_half.h>
1da177e4 27#include <linux/module.h>
1da177e4
LT
28#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
41
42#include <linux/ipv6.h>
43#include <linux/icmpv6.h>
44#include <linux/random.h>
45
46#include <net/tcp.h>
47#include <net/ndisc.h>
5324a040 48#include <net/inet6_hashtables.h>
8129765a 49#include <net/inet6_connection_sock.h>
1da177e4
LT
50#include <net/ipv6.h>
51#include <net/transp_v6.h>
52#include <net/addrconf.h>
53#include <net/ip6_route.h>
54#include <net/ip6_checksum.h>
55#include <net/inet_ecn.h>
56#include <net/protocol.h>
57#include <net/xfrm.h>
1da177e4
LT
58#include <net/snmp.h>
59#include <net/dsfield.h>
6d6ee43e 60#include <net/timewait_sock.h>
18134bed 61#include <net/netdma.h>
3d58b5fa 62#include <net/inet_common.h>
1da177e4
LT
63
64#include <asm/uaccess.h>
65
66#include <linux/proc_fs.h>
67#include <linux/seq_file.h>
68
cfb6eeb4
YH
69#include <linux/crypto.h>
70#include <linux/scatterlist.h>
71
cfb6eeb4 72static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
6edafaaf
GJ
73static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
74 struct request_sock *req);
1da177e4
LT
75
76static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
1da177e4 77
3b401a81
SH
78static const struct inet_connection_sock_af_ops ipv6_mapped;
79static const struct inet_connection_sock_af_ops ipv6_specific;
a928630a 80#ifdef CONFIG_TCP_MD5SIG
b2e4b3de
SH
81static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
82static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
9501f972
YH
83#else
84static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
85 struct in6_addr *addr)
86{
87 return NULL;
88}
a928630a 89#endif
1da177e4 90
1da177e4
LT
91static void tcp_v6_hash(struct sock *sk)
92{
93 if (sk->sk_state != TCP_CLOSE) {
8292a17a 94 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
1da177e4
LT
95 tcp_prot.hash(sk);
96 return;
97 }
98 local_bh_disable();
ab1e0a13 99 __inet6_hash(sk);
1da177e4
LT
100 local_bh_enable();
101 }
102}
103
684f2176 104static __inline__ __sum16 tcp_v6_check(int len,
1ab1457c
YH
105 struct in6_addr *saddr,
106 struct in6_addr *daddr,
868c86bc 107 __wsum base)
1da177e4
LT
108{
109 return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
110}
111
a94f723d 112static __u32 tcp_v6_init_sequence(struct sk_buff *skb)
1da177e4 113{
0660e03f
ACM
114 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
115 ipv6_hdr(skb)->saddr.s6_addr32,
aa8223c7
ACM
116 tcp_hdr(skb)->dest,
117 tcp_hdr(skb)->source);
1da177e4
LT
118}
119
1ab1457c 120static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
1da177e4
LT
121 int addr_len)
122{
123 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
1ab1457c 124 struct inet_sock *inet = inet_sk(sk);
d83d8461 125 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
126 struct ipv6_pinfo *np = inet6_sk(sk);
127 struct tcp_sock *tp = tcp_sk(sk);
128 struct in6_addr *saddr = NULL, *final_p = NULL, final;
129 struct flowi fl;
130 struct dst_entry *dst;
131 int addr_type;
132 int err;
133
1ab1457c 134 if (addr_len < SIN6_LEN_RFC2133)
1da177e4
LT
135 return -EINVAL;
136
1ab1457c 137 if (usin->sin6_family != AF_INET6)
1da177e4
LT
138 return(-EAFNOSUPPORT);
139
140 memset(&fl, 0, sizeof(fl));
141
142 if (np->sndflow) {
143 fl.fl6_flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
144 IP6_ECN_flow_init(fl.fl6_flowlabel);
145 if (fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) {
146 struct ip6_flowlabel *flowlabel;
147 flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
148 if (flowlabel == NULL)
149 return -EINVAL;
150 ipv6_addr_copy(&usin->sin6_addr, &flowlabel->dst);
151 fl6_sock_release(flowlabel);
152 }
153 }
154
155 /*
1ab1457c
YH
156 * connect() to INADDR_ANY means loopback (BSD'ism).
157 */
158
159 if(ipv6_addr_any(&usin->sin6_addr))
160 usin->sin6_addr.s6_addr[15] = 0x1;
1da177e4
LT
161
162 addr_type = ipv6_addr_type(&usin->sin6_addr);
163
164 if(addr_type & IPV6_ADDR_MULTICAST)
165 return -ENETUNREACH;
166
167 if (addr_type&IPV6_ADDR_LINKLOCAL) {
168 if (addr_len >= sizeof(struct sockaddr_in6) &&
169 usin->sin6_scope_id) {
170 /* If interface is set while binding, indices
171 * must coincide.
172 */
173 if (sk->sk_bound_dev_if &&
174 sk->sk_bound_dev_if != usin->sin6_scope_id)
175 return -EINVAL;
176
177 sk->sk_bound_dev_if = usin->sin6_scope_id;
178 }
179
180 /* Connect to link-local address requires an interface */
181 if (!sk->sk_bound_dev_if)
182 return -EINVAL;
183 }
184
185 if (tp->rx_opt.ts_recent_stamp &&
186 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
187 tp->rx_opt.ts_recent = 0;
188 tp->rx_opt.ts_recent_stamp = 0;
189 tp->write_seq = 0;
190 }
191
192 ipv6_addr_copy(&np->daddr, &usin->sin6_addr);
193 np->flow_label = fl.fl6_flowlabel;
194
195 /*
196 * TCP over IPv4
197 */
198
199 if (addr_type == IPV6_ADDR_MAPPED) {
d83d8461 200 u32 exthdrlen = icsk->icsk_ext_hdr_len;
1da177e4
LT
201 struct sockaddr_in sin;
202
203 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
204
205 if (__ipv6_only_sock(sk))
206 return -ENETUNREACH;
207
208 sin.sin_family = AF_INET;
209 sin.sin_port = usin->sin6_port;
210 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
211
d83d8461 212 icsk->icsk_af_ops = &ipv6_mapped;
1da177e4 213 sk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
214#ifdef CONFIG_TCP_MD5SIG
215 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
216#endif
1da177e4
LT
217
218 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
219
220 if (err) {
d83d8461
ACM
221 icsk->icsk_ext_hdr_len = exthdrlen;
222 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 223 sk->sk_backlog_rcv = tcp_v6_do_rcv;
cfb6eeb4
YH
224#ifdef CONFIG_TCP_MD5SIG
225 tp->af_specific = &tcp_sock_ipv6_specific;
226#endif
1da177e4
LT
227 goto failure;
228 } else {
c720c7e8
ED
229 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
230 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
231 &np->rcv_saddr);
1da177e4
LT
232 }
233
234 return err;
235 }
236
237 if (!ipv6_addr_any(&np->rcv_saddr))
238 saddr = &np->rcv_saddr;
239
240 fl.proto = IPPROTO_TCP;
241 ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
242 ipv6_addr_copy(&fl.fl6_src,
243 (saddr ? saddr : &np->saddr));
244 fl.oif = sk->sk_bound_dev_if;
51953d5b 245 fl.mark = sk->sk_mark;
1da177e4 246 fl.fl_ip_dport = usin->sin6_port;
c720c7e8 247 fl.fl_ip_sport = inet->inet_sport;
1da177e4
LT
248
249 if (np->opt && np->opt->srcrt) {
250 struct rt0_hdr *rt0 = (struct rt0_hdr *)np->opt->srcrt;
251 ipv6_addr_copy(&final, &fl.fl6_dst);
252 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
253 final_p = &final;
254 }
255
beb8d13b
VY
256 security_sk_classify_flow(sk, &fl);
257
1da177e4
LT
258 err = ip6_dst_lookup(sk, &dst, &fl);
259 if (err)
260 goto failure;
261 if (final_p)
262 ipv6_addr_copy(&fl.fl6_dst, final_p);
263
52479b62
AD
264 err = __xfrm_lookup(sock_net(sk), &dst, &fl, sk, XFRM_LOOKUP_WAIT);
265 if (err < 0) {
14e50e57
DM
266 if (err == -EREMOTE)
267 err = ip6_dst_blackhole(sk, &dst, &fl);
268 if (err < 0)
269 goto failure;
270 }
1da177e4
LT
271
272 if (saddr == NULL) {
273 saddr = &fl.fl6_src;
274 ipv6_addr_copy(&np->rcv_saddr, saddr);
275 }
276
277 /* set the source address */
278 ipv6_addr_copy(&np->saddr, saddr);
c720c7e8 279 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 280
f83ef8c0 281 sk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 282 __ip6_dst_store(sk, dst, NULL, NULL);
1da177e4 283
d83d8461 284 icsk->icsk_ext_hdr_len = 0;
1da177e4 285 if (np->opt)
d83d8461
ACM
286 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
287 np->opt->opt_nflen);
1da177e4
LT
288
289 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
290
c720c7e8 291 inet->inet_dport = usin->sin6_port;
1da177e4
LT
292
293 tcp_set_state(sk, TCP_SYN_SENT);
d8313f5c 294 err = inet6_hash_connect(&tcp_death_row, sk);
1da177e4
LT
295 if (err)
296 goto late_failure;
297
298 if (!tp->write_seq)
299 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
300 np->daddr.s6_addr32,
c720c7e8
ED
301 inet->inet_sport,
302 inet->inet_dport);
1da177e4
LT
303
304 err = tcp_connect(sk);
305 if (err)
306 goto late_failure;
307
308 return 0;
309
310late_failure:
311 tcp_set_state(sk, TCP_CLOSE);
312 __sk_dst_reset(sk);
313failure:
c720c7e8 314 inet->inet_dport = 0;
1da177e4
LT
315 sk->sk_route_caps = 0;
316 return err;
317}
318
319static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
d5fdd6ba 320 u8 type, u8 code, int offset, __be32 info)
1da177e4
LT
321{
322 struct ipv6hdr *hdr = (struct ipv6hdr*)skb->data;
505cbfc5 323 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
1da177e4
LT
324 struct ipv6_pinfo *np;
325 struct sock *sk;
326 int err;
1ab1457c 327 struct tcp_sock *tp;
1da177e4 328 __u32 seq;
ca12a1a4 329 struct net *net = dev_net(skb->dev);
1da177e4 330
ca12a1a4 331 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
d86e0dac 332 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
1da177e4
LT
333
334 if (sk == NULL) {
e41b5368
DL
335 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
336 ICMP6_MIB_INERRORS);
1da177e4
LT
337 return;
338 }
339
340 if (sk->sk_state == TCP_TIME_WAIT) {
9469c7b4 341 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
342 return;
343 }
344
345 bh_lock_sock(sk);
346 if (sock_owned_by_user(sk))
de0744af 347 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
1da177e4
LT
348
349 if (sk->sk_state == TCP_CLOSE)
350 goto out;
351
352 tp = tcp_sk(sk);
1ab1457c 353 seq = ntohl(th->seq);
1da177e4
LT
354 if (sk->sk_state != TCP_LISTEN &&
355 !between(seq, tp->snd_una, tp->snd_nxt)) {
de0744af 356 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
357 goto out;
358 }
359
360 np = inet6_sk(sk);
361
362 if (type == ICMPV6_PKT_TOOBIG) {
363 struct dst_entry *dst = NULL;
364
365 if (sock_owned_by_user(sk))
366 goto out;
367 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
368 goto out;
369
370 /* icmp should have updated the destination cache entry */
371 dst = __sk_dst_check(sk, np->dst_cookie);
372
373 if (dst == NULL) {
374 struct inet_sock *inet = inet_sk(sk);
375 struct flowi fl;
376
377 /* BUGGG_FUTURE: Again, it is not clear how
378 to handle rthdr case. Ignore this complexity
379 for now.
380 */
381 memset(&fl, 0, sizeof(fl));
382 fl.proto = IPPROTO_TCP;
383 ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
384 ipv6_addr_copy(&fl.fl6_src, &np->saddr);
385 fl.oif = sk->sk_bound_dev_if;
51953d5b 386 fl.mark = sk->sk_mark;
c720c7e8
ED
387 fl.fl_ip_dport = inet->inet_dport;
388 fl.fl_ip_sport = inet->inet_sport;
beb8d13b 389 security_skb_classify_flow(skb, &fl);
1da177e4
LT
390
391 if ((err = ip6_dst_lookup(sk, &dst, &fl))) {
392 sk->sk_err_soft = -err;
393 goto out;
394 }
395
52479b62 396 if ((err = xfrm_lookup(net, &dst, &fl, sk, 0)) < 0) {
1da177e4
LT
397 sk->sk_err_soft = -err;
398 goto out;
399 }
400
401 } else
402 dst_hold(dst);
403
d83d8461 404 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
1da177e4
LT
405 tcp_sync_mss(sk, dst_mtu(dst));
406 tcp_simple_retransmit(sk);
407 } /* else let the usual retransmit timer handle it */
408 dst_release(dst);
409 goto out;
410 }
411
412 icmpv6_err_convert(type, code, &err);
413
60236fdd 414 /* Might be for an request_sock */
1da177e4 415 switch (sk->sk_state) {
60236fdd 416 struct request_sock *req, **prev;
1da177e4
LT
417 case TCP_LISTEN:
418 if (sock_owned_by_user(sk))
419 goto out;
420
8129765a
ACM
421 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
422 &hdr->saddr, inet6_iif(skb));
1da177e4
LT
423 if (!req)
424 goto out;
425
426 /* ICMPs are not backlogged, hence we cannot get
427 * an established socket here.
428 */
547b792c 429 WARN_ON(req->sk != NULL);
1da177e4 430
2e6599cb 431 if (seq != tcp_rsk(req)->snt_isn) {
de0744af 432 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
433 goto out;
434 }
435
463c84b9 436 inet_csk_reqsk_queue_drop(sk, req, prev);
1da177e4
LT
437 goto out;
438
439 case TCP_SYN_SENT:
440 case TCP_SYN_RECV: /* Cannot happen.
1ab1457c 441 It can, it SYNs are crossed. --ANK */
1da177e4 442 if (!sock_owned_by_user(sk)) {
1da177e4
LT
443 sk->sk_err = err;
444 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
445
446 tcp_done(sk);
447 } else
448 sk->sk_err_soft = err;
449 goto out;
450 }
451
452 if (!sock_owned_by_user(sk) && np->recverr) {
453 sk->sk_err = err;
454 sk->sk_error_report(sk);
455 } else
456 sk->sk_err_soft = err;
457
458out:
459 bh_unlock_sock(sk);
460 sock_put(sk);
461}
462
463
e6b4d113
WAS
464static int tcp_v6_send_synack(struct sock *sk, struct request_sock *req,
465 struct request_values *rvp)
1da177e4 466{
ca304b61 467 struct inet6_request_sock *treq = inet6_rsk(req);
1da177e4
LT
468 struct ipv6_pinfo *np = inet6_sk(sk);
469 struct sk_buff * skb;
470 struct ipv6_txoptions *opt = NULL;
471 struct in6_addr * final_p = NULL, final;
472 struct flowi fl;
fd80eb94 473 struct dst_entry *dst;
1da177e4
LT
474 int err = -1;
475
476 memset(&fl, 0, sizeof(fl));
477 fl.proto = IPPROTO_TCP;
2e6599cb
ACM
478 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
479 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
1da177e4 480 fl.fl6_flowlabel = 0;
2e6599cb 481 fl.oif = treq->iif;
51953d5b 482 fl.mark = sk->sk_mark;
2e6599cb 483 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
fd507037 484 fl.fl_ip_sport = inet_rsk(req)->loc_port;
4237c75c 485 security_req_classify_flow(req, &fl);
1da177e4 486
fd80eb94
DL
487 opt = np->opt;
488 if (opt && opt->srcrt) {
489 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
490 ipv6_addr_copy(&final, &fl.fl6_dst);
491 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
492 final_p = &final;
1da177e4
LT
493 }
494
fd80eb94
DL
495 err = ip6_dst_lookup(sk, &dst, &fl);
496 if (err)
497 goto done;
498 if (final_p)
499 ipv6_addr_copy(&fl.fl6_dst, final_p);
52479b62 500 if ((err = xfrm_lookup(sock_net(sk), &dst, &fl, sk, 0)) < 0)
fd80eb94
DL
501 goto done;
502
e6b4d113 503 skb = tcp_make_synack(sk, dst, req, rvp);
1da177e4 504 if (skb) {
aa8223c7 505 struct tcphdr *th = tcp_hdr(skb);
1da177e4 506
684f2176 507 th->check = tcp_v6_check(skb->len,
2e6599cb 508 &treq->loc_addr, &treq->rmt_addr,
07f0757a 509 csum_partial(th, skb->len, skb->csum));
1da177e4 510
2e6599cb 511 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
1da177e4 512 err = ip6_xmit(sk, skb, &fl, opt, 0);
b9df3cb8 513 err = net_xmit_eval(err);
1da177e4
LT
514 }
515
516done:
1ab1457c 517 if (opt && opt != np->opt)
1da177e4 518 sock_kfree_s(sk, opt, opt->tot_len);
78b91042 519 dst_release(dst);
1da177e4
LT
520 return err;
521}
522
c6aefafb
GG
523static inline void syn_flood_warning(struct sk_buff *skb)
524{
525#ifdef CONFIG_SYN_COOKIES
526 if (sysctl_tcp_syncookies)
527 printk(KERN_INFO
528 "TCPv6: Possible SYN flooding on port %d. "
529 "Sending cookies.\n", ntohs(tcp_hdr(skb)->dest));
530 else
531#endif
532 printk(KERN_INFO
533 "TCPv6: Possible SYN flooding on port %d. "
534 "Dropping request.\n", ntohs(tcp_hdr(skb)->dest));
535}
536
60236fdd 537static void tcp_v6_reqsk_destructor(struct request_sock *req)
1da177e4 538{
800d55f1 539 kfree_skb(inet6_rsk(req)->pktopts);
1da177e4
LT
540}
541
cfb6eeb4
YH
542#ifdef CONFIG_TCP_MD5SIG
543static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
544 struct in6_addr *addr)
545{
546 struct tcp_sock *tp = tcp_sk(sk);
547 int i;
548
549 BUG_ON(tp == NULL);
550
551 if (!tp->md5sig_info || !tp->md5sig_info->entries6)
552 return NULL;
553
554 for (i = 0; i < tp->md5sig_info->entries6; i++) {
caad295f 555 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, addr))
f8ab18d2 556 return &tp->md5sig_info->keys6[i].base;
cfb6eeb4
YH
557 }
558 return NULL;
559}
560
561static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
562 struct sock *addr_sk)
563{
564 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
565}
566
567static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
568 struct request_sock *req)
569{
570 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
571}
572
573static int tcp_v6_md5_do_add(struct sock *sk, struct in6_addr *peer,
574 char *newkey, u8 newkeylen)
575{
576 /* Add key to the list */
b0a713e9 577 struct tcp_md5sig_key *key;
cfb6eeb4
YH
578 struct tcp_sock *tp = tcp_sk(sk);
579 struct tcp6_md5sig_key *keys;
580
b0a713e9 581 key = tcp_v6_md5_do_lookup(sk, peer);
cfb6eeb4
YH
582 if (key) {
583 /* modify existing entry - just update that one */
b0a713e9
MD
584 kfree(key->key);
585 key->key = newkey;
586 key->keylen = newkeylen;
cfb6eeb4
YH
587 } else {
588 /* reallocate new list if current one is full. */
589 if (!tp->md5sig_info) {
590 tp->md5sig_info = kzalloc(sizeof(*tp->md5sig_info), GFP_ATOMIC);
591 if (!tp->md5sig_info) {
592 kfree(newkey);
593 return -ENOMEM;
594 }
3d7dbeac 595 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
cfb6eeb4 596 }
aa133076 597 if (tcp_alloc_md5sig_pool(sk) == NULL) {
aacbe8c8
YH
598 kfree(newkey);
599 return -ENOMEM;
600 }
cfb6eeb4
YH
601 if (tp->md5sig_info->alloced6 == tp->md5sig_info->entries6) {
602 keys = kmalloc((sizeof (tp->md5sig_info->keys6[0]) *
603 (tp->md5sig_info->entries6 + 1)), GFP_ATOMIC);
604
605 if (!keys) {
606 tcp_free_md5sig_pool();
607 kfree(newkey);
608 return -ENOMEM;
609 }
610
611 if (tp->md5sig_info->entries6)
612 memmove(keys, tp->md5sig_info->keys6,
613 (sizeof (tp->md5sig_info->keys6[0]) *
614 tp->md5sig_info->entries6));
615
616 kfree(tp->md5sig_info->keys6);
617 tp->md5sig_info->keys6 = keys;
618 tp->md5sig_info->alloced6++;
619 }
620
621 ipv6_addr_copy(&tp->md5sig_info->keys6[tp->md5sig_info->entries6].addr,
622 peer);
f8ab18d2
DM
623 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.key = newkey;
624 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.keylen = newkeylen;
cfb6eeb4
YH
625
626 tp->md5sig_info->entries6++;
627 }
628 return 0;
629}
630
631static int tcp_v6_md5_add_func(struct sock *sk, struct sock *addr_sk,
632 u8 *newkey, __u8 newkeylen)
633{
634 return tcp_v6_md5_do_add(sk, &inet6_sk(addr_sk)->daddr,
635 newkey, newkeylen);
636}
637
638static int tcp_v6_md5_do_del(struct sock *sk, struct in6_addr *peer)
639{
640 struct tcp_sock *tp = tcp_sk(sk);
641 int i;
642
643 for (i = 0; i < tp->md5sig_info->entries6; i++) {
caad295f 644 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, peer)) {
cfb6eeb4 645 /* Free the key */
f8ab18d2 646 kfree(tp->md5sig_info->keys6[i].base.key);
cfb6eeb4
YH
647 tp->md5sig_info->entries6--;
648
649 if (tp->md5sig_info->entries6 == 0) {
650 kfree(tp->md5sig_info->keys6);
651 tp->md5sig_info->keys6 = NULL;
ca983cef 652 tp->md5sig_info->alloced6 = 0;
cfb6eeb4
YH
653 } else {
654 /* shrink the database */
655 if (tp->md5sig_info->entries6 != i)
656 memmove(&tp->md5sig_info->keys6[i],
657 &tp->md5sig_info->keys6[i+1],
658 (tp->md5sig_info->entries6 - i)
659 * sizeof (tp->md5sig_info->keys6[0]));
660 }
77adefdc
YH
661 tcp_free_md5sig_pool();
662 return 0;
cfb6eeb4
YH
663 }
664 }
665 return -ENOENT;
666}
667
668static void tcp_v6_clear_md5_list (struct sock *sk)
669{
670 struct tcp_sock *tp = tcp_sk(sk);
671 int i;
672
673 if (tp->md5sig_info->entries6) {
674 for (i = 0; i < tp->md5sig_info->entries6; i++)
f8ab18d2 675 kfree(tp->md5sig_info->keys6[i].base.key);
cfb6eeb4
YH
676 tp->md5sig_info->entries6 = 0;
677 tcp_free_md5sig_pool();
678 }
679
680 kfree(tp->md5sig_info->keys6);
681 tp->md5sig_info->keys6 = NULL;
682 tp->md5sig_info->alloced6 = 0;
683
684 if (tp->md5sig_info->entries4) {
685 for (i = 0; i < tp->md5sig_info->entries4; i++)
f8ab18d2 686 kfree(tp->md5sig_info->keys4[i].base.key);
cfb6eeb4
YH
687 tp->md5sig_info->entries4 = 0;
688 tcp_free_md5sig_pool();
689 }
690
691 kfree(tp->md5sig_info->keys4);
692 tp->md5sig_info->keys4 = NULL;
693 tp->md5sig_info->alloced4 = 0;
694}
695
696static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
697 int optlen)
698{
699 struct tcp_md5sig cmd;
700 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
701 u8 *newkey;
702
703 if (optlen < sizeof(cmd))
704 return -EINVAL;
705
706 if (copy_from_user(&cmd, optval, sizeof(cmd)))
707 return -EFAULT;
708
709 if (sin6->sin6_family != AF_INET6)
710 return -EINVAL;
711
712 if (!cmd.tcpm_keylen) {
713 if (!tcp_sk(sk)->md5sig_info)
714 return -ENOENT;
e773e4fa 715 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
cfb6eeb4
YH
716 return tcp_v4_md5_do_del(sk, sin6->sin6_addr.s6_addr32[3]);
717 return tcp_v6_md5_do_del(sk, &sin6->sin6_addr);
718 }
719
720 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
721 return -EINVAL;
722
723 if (!tcp_sk(sk)->md5sig_info) {
724 struct tcp_sock *tp = tcp_sk(sk);
725 struct tcp_md5sig_info *p;
726
727 p = kzalloc(sizeof(struct tcp_md5sig_info), GFP_KERNEL);
728 if (!p)
729 return -ENOMEM;
730
731 tp->md5sig_info = p;
3d7dbeac 732 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
cfb6eeb4
YH
733 }
734
af879cc7 735 newkey = kmemdup(cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4
YH
736 if (!newkey)
737 return -ENOMEM;
e773e4fa 738 if (ipv6_addr_v4mapped(&sin6->sin6_addr)) {
cfb6eeb4
YH
739 return tcp_v4_md5_do_add(sk, sin6->sin6_addr.s6_addr32[3],
740 newkey, cmd.tcpm_keylen);
741 }
742 return tcp_v6_md5_do_add(sk, &sin6->sin6_addr, newkey, cmd.tcpm_keylen);
743}
744
49a72dfb
AL
745static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
746 struct in6_addr *daddr,
747 struct in6_addr *saddr, int nbytes)
cfb6eeb4 748{
cfb6eeb4 749 struct tcp6_pseudohdr *bp;
49a72dfb 750 struct scatterlist sg;
8d26d76d 751
cfb6eeb4 752 bp = &hp->md5_blk.ip6;
cfb6eeb4
YH
753 /* 1. TCP pseudo-header (RFC2460) */
754 ipv6_addr_copy(&bp->saddr, saddr);
755 ipv6_addr_copy(&bp->daddr, daddr);
49a72dfb 756 bp->protocol = cpu_to_be32(IPPROTO_TCP);
00b1304c 757 bp->len = cpu_to_be32(nbytes);
cfb6eeb4 758
49a72dfb
AL
759 sg_init_one(&sg, bp, sizeof(*bp));
760 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
761}
c7da57a1 762
49a72dfb
AL
763static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
764 struct in6_addr *daddr, struct in6_addr *saddr,
765 struct tcphdr *th)
766{
767 struct tcp_md5sig_pool *hp;
768 struct hash_desc *desc;
769
770 hp = tcp_get_md5sig_pool();
771 if (!hp)
772 goto clear_hash_noput;
773 desc = &hp->md5_desc;
774
775 if (crypto_hash_init(desc))
776 goto clear_hash;
777 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
778 goto clear_hash;
779 if (tcp_md5_hash_header(hp, th))
780 goto clear_hash;
781 if (tcp_md5_hash_key(hp, key))
782 goto clear_hash;
783 if (crypto_hash_final(desc, md5_hash))
cfb6eeb4 784 goto clear_hash;
cfb6eeb4 785
cfb6eeb4 786 tcp_put_md5sig_pool();
cfb6eeb4 787 return 0;
49a72dfb 788
cfb6eeb4
YH
789clear_hash:
790 tcp_put_md5sig_pool();
791clear_hash_noput:
792 memset(md5_hash, 0, 16);
49a72dfb 793 return 1;
cfb6eeb4
YH
794}
795
49a72dfb
AL
796static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
797 struct sock *sk, struct request_sock *req,
798 struct sk_buff *skb)
cfb6eeb4
YH
799{
800 struct in6_addr *saddr, *daddr;
49a72dfb
AL
801 struct tcp_md5sig_pool *hp;
802 struct hash_desc *desc;
803 struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4
YH
804
805 if (sk) {
806 saddr = &inet6_sk(sk)->saddr;
807 daddr = &inet6_sk(sk)->daddr;
49a72dfb 808 } else if (req) {
cfb6eeb4
YH
809 saddr = &inet6_rsk(req)->loc_addr;
810 daddr = &inet6_rsk(req)->rmt_addr;
49a72dfb
AL
811 } else {
812 struct ipv6hdr *ip6h = ipv6_hdr(skb);
813 saddr = &ip6h->saddr;
814 daddr = &ip6h->daddr;
cfb6eeb4 815 }
49a72dfb
AL
816
817 hp = tcp_get_md5sig_pool();
818 if (!hp)
819 goto clear_hash_noput;
820 desc = &hp->md5_desc;
821
822 if (crypto_hash_init(desc))
823 goto clear_hash;
824
825 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
826 goto clear_hash;
827 if (tcp_md5_hash_header(hp, th))
828 goto clear_hash;
829 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
830 goto clear_hash;
831 if (tcp_md5_hash_key(hp, key))
832 goto clear_hash;
833 if (crypto_hash_final(desc, md5_hash))
834 goto clear_hash;
835
836 tcp_put_md5sig_pool();
837 return 0;
838
839clear_hash:
840 tcp_put_md5sig_pool();
841clear_hash_noput:
842 memset(md5_hash, 0, 16);
843 return 1;
cfb6eeb4
YH
844}
845
846static int tcp_v6_inbound_md5_hash (struct sock *sk, struct sk_buff *skb)
847{
848 __u8 *hash_location = NULL;
849 struct tcp_md5sig_key *hash_expected;
0660e03f 850 struct ipv6hdr *ip6h = ipv6_hdr(skb);
aa8223c7 851 struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4 852 int genhash;
cfb6eeb4
YH
853 u8 newhash[16];
854
855 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
7d5d5525 856 hash_location = tcp_parse_md5sig_option(th);
cfb6eeb4 857
785957d3
DM
858 /* We've parsed the options - do we have a hash? */
859 if (!hash_expected && !hash_location)
860 return 0;
861
862 if (hash_expected && !hash_location) {
863 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
cfb6eeb4
YH
864 return 1;
865 }
866
785957d3
DM
867 if (!hash_expected && hash_location) {
868 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
cfb6eeb4
YH
869 return 1;
870 }
871
872 /* check the signature */
49a72dfb
AL
873 genhash = tcp_v6_md5_hash_skb(newhash,
874 hash_expected,
875 NULL, NULL, skb);
876
cfb6eeb4
YH
877 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
878 if (net_ratelimit()) {
5b095d98 879 printk(KERN_INFO "MD5 Hash %s for (%pI6, %u)->(%pI6, %u)\n",
cfb6eeb4 880 genhash ? "failed" : "mismatch",
0c6ce78a
HH
881 &ip6h->saddr, ntohs(th->source),
882 &ip6h->daddr, ntohs(th->dest));
cfb6eeb4
YH
883 }
884 return 1;
885 }
886 return 0;
887}
888#endif
889
c6aefafb 890struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
1da177e4 891 .family = AF_INET6,
2e6599cb 892 .obj_size = sizeof(struct tcp6_request_sock),
1da177e4 893 .rtx_syn_ack = tcp_v6_send_synack,
60236fdd
ACM
894 .send_ack = tcp_v6_reqsk_send_ack,
895 .destructor = tcp_v6_reqsk_destructor,
1da177e4
LT
896 .send_reset = tcp_v6_send_reset
897};
898
cfb6eeb4 899#ifdef CONFIG_TCP_MD5SIG
b2e4b3de 900static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
cfb6eeb4 901 .md5_lookup = tcp_v6_reqsk_md5_lookup,
e3afe7b7 902 .calc_md5_hash = tcp_v6_md5_hash_skb,
cfb6eeb4 903};
b6332e6c 904#endif
cfb6eeb4 905
6d6ee43e
ACM
906static struct timewait_sock_ops tcp6_timewait_sock_ops = {
907 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
908 .twsk_unique = tcp_twsk_unique,
cfb6eeb4 909 .twsk_destructor= tcp_twsk_destructor,
6d6ee43e
ACM
910};
911
8292a17a 912static void tcp_v6_send_check(struct sock *sk, int len, struct sk_buff *skb)
1da177e4
LT
913{
914 struct ipv6_pinfo *np = inet6_sk(sk);
aa8223c7 915 struct tcphdr *th = tcp_hdr(skb);
1da177e4 916
84fa7933 917 if (skb->ip_summed == CHECKSUM_PARTIAL) {
1da177e4 918 th->check = ~csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP, 0);
663ead3b 919 skb->csum_start = skb_transport_header(skb) - skb->head;
ff1dcadb 920 skb->csum_offset = offsetof(struct tcphdr, check);
1da177e4 921 } else {
1ab1457c 922 th->check = csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP,
07f0757a 923 csum_partial(th, th->doff<<2,
1da177e4
LT
924 skb->csum));
925 }
926}
927
a430a43d
HX
928static int tcp_v6_gso_send_check(struct sk_buff *skb)
929{
930 struct ipv6hdr *ipv6h;
931 struct tcphdr *th;
932
933 if (!pskb_may_pull(skb, sizeof(*th)))
934 return -EINVAL;
935
0660e03f 936 ipv6h = ipv6_hdr(skb);
aa8223c7 937 th = tcp_hdr(skb);
a430a43d
HX
938
939 th->check = 0;
940 th->check = ~csum_ipv6_magic(&ipv6h->saddr, &ipv6h->daddr, skb->len,
941 IPPROTO_TCP, 0);
663ead3b 942 skb->csum_start = skb_transport_header(skb) - skb->head;
ff1dcadb 943 skb->csum_offset = offsetof(struct tcphdr, check);
84fa7933 944 skb->ip_summed = CHECKSUM_PARTIAL;
a430a43d
HX
945 return 0;
946}
1da177e4 947
36990673
HX
948static struct sk_buff **tcp6_gro_receive(struct sk_buff **head,
949 struct sk_buff *skb)
684f2176 950{
36e7b1b8 951 struct ipv6hdr *iph = skb_gro_network_header(skb);
684f2176
HX
952
953 switch (skb->ip_summed) {
954 case CHECKSUM_COMPLETE:
86911732 955 if (!tcp_v6_check(skb_gro_len(skb), &iph->saddr, &iph->daddr,
684f2176
HX
956 skb->csum)) {
957 skb->ip_summed = CHECKSUM_UNNECESSARY;
958 break;
959 }
960
961 /* fall through */
962 case CHECKSUM_NONE:
963 NAPI_GRO_CB(skb)->flush = 1;
964 return NULL;
965 }
966
967 return tcp_gro_receive(head, skb);
968}
684f2176 969
36990673 970static int tcp6_gro_complete(struct sk_buff *skb)
684f2176
HX
971{
972 struct ipv6hdr *iph = ipv6_hdr(skb);
973 struct tcphdr *th = tcp_hdr(skb);
974
975 th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
976 &iph->saddr, &iph->daddr, 0);
977 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
978
979 return tcp_gro_complete(skb);
980}
684f2176 981
626e264d
IJ
982static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
983 u32 ts, struct tcp_md5sig_key *key, int rst)
1da177e4 984{
aa8223c7 985 struct tcphdr *th = tcp_hdr(skb), *t1;
1da177e4
LT
986 struct sk_buff *buff;
987 struct flowi fl;
adf30907 988 struct net *net = dev_net(skb_dst(skb)->dev);
e5047992 989 struct sock *ctl_sk = net->ipv6.tcp_sk;
77c676da 990 unsigned int tot_len = sizeof(struct tcphdr);
adf30907 991 struct dst_entry *dst;
81ada62d 992 __be32 *topt;
1da177e4 993
626e264d
IJ
994 if (ts)
995 tot_len += TCPOLEN_TSTAMP_ALIGNED;
cfb6eeb4 996#ifdef CONFIG_TCP_MD5SIG
cfb6eeb4
YH
997 if (key)
998 tot_len += TCPOLEN_MD5SIG_ALIGNED;
999#endif
1000
cfb6eeb4 1001 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1da177e4 1002 GFP_ATOMIC);
1ab1457c
YH
1003 if (buff == NULL)
1004 return;
1da177e4 1005
cfb6eeb4 1006 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1da177e4 1007
cfb6eeb4 1008 t1 = (struct tcphdr *) skb_push(buff, tot_len);
a8fdf2b3 1009 skb_reset_transport_header(skb);
1da177e4
LT
1010
1011 /* Swap the send and the receive. */
1012 memset(t1, 0, sizeof(*t1));
1013 t1->dest = th->source;
1014 t1->source = th->dest;
cfb6eeb4 1015 t1->doff = tot_len / 4;
626e264d
IJ
1016 t1->seq = htonl(seq);
1017 t1->ack_seq = htonl(ack);
1018 t1->ack = !rst || !th->ack;
1019 t1->rst = rst;
1020 t1->window = htons(win);
1da177e4 1021
81ada62d
IJ
1022 topt = (__be32 *)(t1 + 1);
1023
626e264d
IJ
1024 if (ts) {
1025 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1026 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
1027 *topt++ = htonl(tcp_time_stamp);
1028 *topt++ = htonl(ts);
1029 }
1030
cfb6eeb4
YH
1031#ifdef CONFIG_TCP_MD5SIG
1032 if (key) {
81ada62d
IJ
1033 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1034 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
1035 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
78e645cb
IJ
1036 &ipv6_hdr(skb)->saddr,
1037 &ipv6_hdr(skb)->daddr, t1);
cfb6eeb4
YH
1038 }
1039#endif
1040
07f0757a 1041 buff->csum = csum_partial(t1, tot_len, 0);
1da177e4
LT
1042
1043 memset(&fl, 0, sizeof(fl));
0660e03f
ACM
1044 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
1045 ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
1da177e4
LT
1046
1047 t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
52cd5750 1048 tot_len, IPPROTO_TCP,
1da177e4
LT
1049 buff->csum);
1050
1051 fl.proto = IPPROTO_TCP;
505cbfc5 1052 fl.oif = inet6_iif(skb);
1da177e4
LT
1053 fl.fl_ip_dport = t1->dest;
1054 fl.fl_ip_sport = t1->source;
beb8d13b 1055 security_skb_classify_flow(skb, &fl);
1da177e4 1056
c20121ae
DL
1057 /* Pass a socket to ip6_dst_lookup either it is for RST
1058 * Underlying function will use this to retrieve the network
1059 * namespace
1060 */
adf30907
ED
1061 if (!ip6_dst_lookup(ctl_sk, &dst, &fl)) {
1062 if (xfrm_lookup(net, &dst, &fl, NULL, 0) >= 0) {
1063 skb_dst_set(buff, dst);
e5047992 1064 ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
63231bdd 1065 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
626e264d
IJ
1066 if (rst)
1067 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
1da177e4 1068 return;
ecc51b6d 1069 }
1da177e4
LT
1070 }
1071
1072 kfree_skb(buff);
1073}
1074
626e264d 1075static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1da177e4 1076{
626e264d
IJ
1077 struct tcphdr *th = tcp_hdr(skb);
1078 u32 seq = 0, ack_seq = 0;
fa3e5b4e 1079 struct tcp_md5sig_key *key = NULL;
1da177e4 1080
626e264d 1081 if (th->rst)
1da177e4
LT
1082 return;
1083
626e264d
IJ
1084 if (!ipv6_unicast_destination(skb))
1085 return;
1da177e4 1086
cfb6eeb4 1087#ifdef CONFIG_TCP_MD5SIG
626e264d
IJ
1088 if (sk)
1089 key = tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr);
cfb6eeb4
YH
1090#endif
1091
626e264d
IJ
1092 if (th->ack)
1093 seq = ntohl(th->ack_seq);
1094 else
1095 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
1096 (th->doff << 2);
1da177e4 1097
626e264d
IJ
1098 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, key, 1);
1099}
1da177e4 1100
626e264d
IJ
1101static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
1102 struct tcp_md5sig_key *key)
1103{
1104 tcp_v6_send_response(skb, seq, ack, win, ts, key, 0);
1da177e4
LT
1105}
1106
1107static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
1108{
8feaf0c0 1109 struct inet_timewait_sock *tw = inet_twsk(sk);
cfb6eeb4 1110 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1da177e4 1111
9501f972 1112 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
8feaf0c0 1113 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
9501f972 1114 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw));
1da177e4 1115
8feaf0c0 1116 inet_twsk_put(tw);
1da177e4
LT
1117}
1118
6edafaaf
GJ
1119static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
1120 struct request_sock *req)
1da177e4 1121{
9501f972 1122 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
6edafaaf 1123 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr));
1da177e4
LT
1124}
1125
1126
1127static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
1128{
60236fdd 1129 struct request_sock *req, **prev;
aa8223c7 1130 const struct tcphdr *th = tcp_hdr(skb);
1da177e4
LT
1131 struct sock *nsk;
1132
1133 /* Find possible connection requests. */
8129765a 1134 req = inet6_csk_search_req(sk, &prev, th->source,
0660e03f
ACM
1135 &ipv6_hdr(skb)->saddr,
1136 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1da177e4
LT
1137 if (req)
1138 return tcp_check_req(sk, skb, req, prev);
1139
3b1e0a65 1140 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
d86e0dac
PE
1141 &ipv6_hdr(skb)->saddr, th->source,
1142 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1da177e4
LT
1143
1144 if (nsk) {
1145 if (nsk->sk_state != TCP_TIME_WAIT) {
1146 bh_lock_sock(nsk);
1147 return nsk;
1148 }
9469c7b4 1149 inet_twsk_put(inet_twsk(nsk));
1da177e4
LT
1150 return NULL;
1151 }
1152
c6aefafb 1153#ifdef CONFIG_SYN_COOKIES
1da177e4 1154 if (!th->rst && !th->syn && th->ack)
c6aefafb 1155 sk = cookie_v6_check(sk, skb);
1da177e4
LT
1156#endif
1157 return sk;
1158}
1159
1da177e4
LT
1160/* FIXME: this is substantially similar to the ipv4 code.
1161 * Can some kind of merge be done? -- erics
1162 */
1163static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1164{
e6b4d113
WAS
1165 struct tcp_options_received tmp_opt;
1166 struct request_sock *req;
ca304b61 1167 struct inet6_request_sock *treq;
1da177e4 1168 struct ipv6_pinfo *np = inet6_sk(sk);
1da177e4 1169 struct tcp_sock *tp = tcp_sk(sk);
022c3f7d 1170 struct dst_entry *dst = __sk_dst_get(sk);
e6b4d113 1171 __u32 isn = TCP_SKB_CB(skb)->when;
c6aefafb
GG
1172#ifdef CONFIG_SYN_COOKIES
1173 int want_cookie = 0;
1174#else
1175#define want_cookie 0
1176#endif
1da177e4
LT
1177
1178 if (skb->protocol == htons(ETH_P_IP))
1179 return tcp_v4_conn_request(sk, skb);
1180
1181 if (!ipv6_unicast_destination(skb))
1ab1457c 1182 goto drop;
1da177e4 1183
463c84b9 1184 if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
1da177e4 1185 if (net_ratelimit())
c6aefafb
GG
1186 syn_flood_warning(skb);
1187#ifdef CONFIG_SYN_COOKIES
1188 if (sysctl_tcp_syncookies)
1189 want_cookie = 1;
1190 else
1191#endif
1ab1457c 1192 goto drop;
1da177e4
LT
1193 }
1194
463c84b9 1195 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
1da177e4
LT
1196 goto drop;
1197
ca304b61 1198 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1da177e4
LT
1199 if (req == NULL)
1200 goto drop;
1201
cfb6eeb4
YH
1202#ifdef CONFIG_TCP_MD5SIG
1203 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1204#endif
1205
1da177e4
LT
1206 tcp_clear_options(&tmp_opt);
1207 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1208 tmp_opt.user_mss = tp->rx_opt.user_mss;
1209
022c3f7d 1210 tcp_parse_options(skb, &tmp_opt, 0, dst);
1da177e4 1211
4dfc2817 1212 if (want_cookie && !tmp_opt.saw_tstamp)
c6aefafb 1213 tcp_clear_options(&tmp_opt);
c6aefafb 1214
1da177e4
LT
1215 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1216 tcp_openreq_init(req, &tmp_opt, skb);
1217
ca304b61 1218 treq = inet6_rsk(req);
0660e03f
ACM
1219 ipv6_addr_copy(&treq->rmt_addr, &ipv6_hdr(skb)->saddr);
1220 ipv6_addr_copy(&treq->loc_addr, &ipv6_hdr(skb)->daddr);
c6aefafb
GG
1221 if (!want_cookie)
1222 TCP_ECN_create_request(req, tcp_hdr(skb));
1223
1224 if (want_cookie) {
1225 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
4dfc2817 1226 req->cookie_ts = tmp_opt.tstamp_ok;
c6aefafb
GG
1227 } else if (!isn) {
1228 if (ipv6_opt_accepted(sk, skb) ||
1229 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1230 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1231 atomic_inc(&skb->users);
1232 treq->pktopts = skb;
1233 }
1234 treq->iif = sk->sk_bound_dev_if;
1da177e4 1235
c6aefafb
GG
1236 /* So that link locals have meaning */
1237 if (!sk->sk_bound_dev_if &&
1238 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1239 treq->iif = inet6_iif(skb);
1da177e4 1240
a94f723d 1241 isn = tcp_v6_init_sequence(skb);
c6aefafb 1242 }
2e6599cb 1243 tcp_rsk(req)->snt_isn = isn;
1da177e4 1244
4237c75c
VY
1245 security_inet_conn_request(sk, skb, req);
1246
e6b4d113
WAS
1247 if (tcp_v6_send_synack(sk, req, NULL) || want_cookie)
1248 goto drop_and_free;
1da177e4 1249
e6b4d113
WAS
1250 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1251 return 0;
1da177e4 1252
e6b4d113
WAS
1253drop_and_free:
1254 reqsk_free(req);
1da177e4 1255drop:
1da177e4
LT
1256 return 0; /* don't send reset */
1257}
1258
1259static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
60236fdd 1260 struct request_sock *req,
1da177e4
LT
1261 struct dst_entry *dst)
1262{
78d15e82 1263 struct inet6_request_sock *treq;
1da177e4
LT
1264 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1265 struct tcp6_sock *newtcp6sk;
1266 struct inet_sock *newinet;
1267 struct tcp_sock *newtp;
1268 struct sock *newsk;
1269 struct ipv6_txoptions *opt;
cfb6eeb4
YH
1270#ifdef CONFIG_TCP_MD5SIG
1271 struct tcp_md5sig_key *key;
1272#endif
1da177e4
LT
1273
1274 if (skb->protocol == htons(ETH_P_IP)) {
1275 /*
1276 * v6 mapped
1277 */
1278
1279 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1280
1ab1457c 1281 if (newsk == NULL)
1da177e4
LT
1282 return NULL;
1283
1284 newtcp6sk = (struct tcp6_sock *)newsk;
1285 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1286
1287 newinet = inet_sk(newsk);
1288 newnp = inet6_sk(newsk);
1289 newtp = tcp_sk(newsk);
1290
1291 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1292
c720c7e8 1293 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newnp->daddr);
1da177e4 1294
c720c7e8 1295 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1da177e4
LT
1296
1297 ipv6_addr_copy(&newnp->rcv_saddr, &newnp->saddr);
1298
8292a17a 1299 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1da177e4 1300 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
1301#ifdef CONFIG_TCP_MD5SIG
1302 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1303#endif
1304
1da177e4
LT
1305 newnp->pktoptions = NULL;
1306 newnp->opt = NULL;
505cbfc5 1307 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1308 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1da177e4 1309
e6848976
ACM
1310 /*
1311 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1312 * here, tcp_create_openreq_child now does this for us, see the comment in
1313 * that function for the gory details. -acme
1da177e4 1314 */
1da177e4
LT
1315
1316 /* It is tricky place. Until this moment IPv4 tcp
8292a17a 1317 worked with IPv6 icsk.icsk_af_ops.
1da177e4
LT
1318 Sync it now.
1319 */
d83d8461 1320 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1da177e4
LT
1321
1322 return newsk;
1323 }
1324
78d15e82 1325 treq = inet6_rsk(req);
1da177e4
LT
1326 opt = np->opt;
1327
1328 if (sk_acceptq_is_full(sk))
1329 goto out_overflow;
1330
1da177e4
LT
1331 if (dst == NULL) {
1332 struct in6_addr *final_p = NULL, final;
1333 struct flowi fl;
1334
1335 memset(&fl, 0, sizeof(fl));
1336 fl.proto = IPPROTO_TCP;
2e6599cb 1337 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
1da177e4
LT
1338 if (opt && opt->srcrt) {
1339 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
1340 ipv6_addr_copy(&final, &fl.fl6_dst);
1341 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
1342 final_p = &final;
1343 }
2e6599cb 1344 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
1da177e4 1345 fl.oif = sk->sk_bound_dev_if;
51953d5b 1346 fl.mark = sk->sk_mark;
2e6599cb 1347 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
fd507037 1348 fl.fl_ip_sport = inet_rsk(req)->loc_port;
4237c75c 1349 security_req_classify_flow(req, &fl);
1da177e4
LT
1350
1351 if (ip6_dst_lookup(sk, &dst, &fl))
1352 goto out;
1353
1354 if (final_p)
1355 ipv6_addr_copy(&fl.fl6_dst, final_p);
1356
52479b62 1357 if ((xfrm_lookup(sock_net(sk), &dst, &fl, sk, 0)) < 0)
1da177e4 1358 goto out;
1ab1457c 1359 }
1da177e4
LT
1360
1361 newsk = tcp_create_openreq_child(sk, req, skb);
1362 if (newsk == NULL)
1363 goto out;
1364
e6848976
ACM
1365 /*
1366 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1367 * count here, tcp_create_openreq_child now does this for us, see the
1368 * comment in that function for the gory details. -acme
1369 */
1da177e4 1370
59eed279 1371 newsk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 1372 __ip6_dst_store(newsk, dst, NULL, NULL);
1da177e4
LT
1373
1374 newtcp6sk = (struct tcp6_sock *)newsk;
1375 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1376
1377 newtp = tcp_sk(newsk);
1378 newinet = inet_sk(newsk);
1379 newnp = inet6_sk(newsk);
1380
1381 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1382
2e6599cb
ACM
1383 ipv6_addr_copy(&newnp->daddr, &treq->rmt_addr);
1384 ipv6_addr_copy(&newnp->saddr, &treq->loc_addr);
1385 ipv6_addr_copy(&newnp->rcv_saddr, &treq->loc_addr);
1386 newsk->sk_bound_dev_if = treq->iif;
1da177e4 1387
1ab1457c 1388 /* Now IPv6 options...
1da177e4
LT
1389
1390 First: no IPv4 options.
1391 */
1392 newinet->opt = NULL;
d35690be 1393 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1394
1395 /* Clone RX bits */
1396 newnp->rxopt.all = np->rxopt.all;
1397
1398 /* Clone pktoptions received with SYN */
1399 newnp->pktoptions = NULL;
2e6599cb
ACM
1400 if (treq->pktopts != NULL) {
1401 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
1402 kfree_skb(treq->pktopts);
1403 treq->pktopts = NULL;
1da177e4
LT
1404 if (newnp->pktoptions)
1405 skb_set_owner_r(newnp->pktoptions, newsk);
1406 }
1407 newnp->opt = NULL;
505cbfc5 1408 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1409 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1da177e4
LT
1410
1411 /* Clone native IPv6 options from listening socket (if any)
1412
1413 Yes, keeping reference count would be much more clever,
1414 but we make one more one thing there: reattach optmem
1415 to newsk.
1416 */
1417 if (opt) {
1418 newnp->opt = ipv6_dup_options(newsk, opt);
1419 if (opt != np->opt)
1420 sock_kfree_s(sk, opt, opt->tot_len);
1421 }
1422
d83d8461 1423 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1da177e4 1424 if (newnp->opt)
d83d8461
ACM
1425 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1426 newnp->opt->opt_flen);
1da177e4 1427
5d424d5a 1428 tcp_mtup_init(newsk);
1da177e4
LT
1429 tcp_sync_mss(newsk, dst_mtu(dst));
1430 newtp->advmss = dst_metric(dst, RTAX_ADVMSS);
1431 tcp_initialize_rcv_mss(newsk);
1432
c720c7e8
ED
1433 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1434 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 1435
cfb6eeb4
YH
1436#ifdef CONFIG_TCP_MD5SIG
1437 /* Copy over the MD5 key from the original socket */
1438 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1439 /* We're using one, so create a matching key
1440 * on the newsk structure. If we fail to get
1441 * memory, then we end up not copying the key
1442 * across. Shucks.
1443 */
af879cc7
ACM
1444 char *newkey = kmemdup(key->key, key->keylen, GFP_ATOMIC);
1445 if (newkey != NULL)
e547bc1e 1446 tcp_v6_md5_do_add(newsk, &newnp->daddr,
cfb6eeb4 1447 newkey, key->keylen);
cfb6eeb4
YH
1448 }
1449#endif
1450
ab1e0a13 1451 __inet6_hash(newsk);
e56d8b8a 1452 __inet_inherit_port(sk, newsk);
1da177e4
LT
1453
1454 return newsk;
1455
1456out_overflow:
de0744af 1457 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1da177e4 1458out:
de0744af 1459 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1460 if (opt && opt != np->opt)
1461 sock_kfree_s(sk, opt, opt->tot_len);
1462 dst_release(dst);
1463 return NULL;
1464}
1465
b51655b9 1466static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1da177e4 1467{
84fa7933 1468 if (skb->ip_summed == CHECKSUM_COMPLETE) {
684f2176 1469 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
0660e03f 1470 &ipv6_hdr(skb)->daddr, skb->csum)) {
fb286bb2 1471 skb->ip_summed = CHECKSUM_UNNECESSARY;
1da177e4 1472 return 0;
fb286bb2 1473 }
1da177e4 1474 }
fb286bb2 1475
684f2176 1476 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
0660e03f
ACM
1477 &ipv6_hdr(skb)->saddr,
1478 &ipv6_hdr(skb)->daddr, 0));
fb286bb2 1479
1da177e4 1480 if (skb->len <= 76) {
fb286bb2 1481 return __skb_checksum_complete(skb);
1da177e4
LT
1482 }
1483 return 0;
1484}
1485
1486/* The socket must have it's spinlock held when we get
1487 * here.
1488 *
1489 * We have a potential double-lock case here, so even when
1490 * doing backlog processing we use the BH locking scheme.
1491 * This is because we cannot sleep with the original spinlock
1492 * held.
1493 */
1494static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1495{
1496 struct ipv6_pinfo *np = inet6_sk(sk);
1497 struct tcp_sock *tp;
1498 struct sk_buff *opt_skb = NULL;
1499
1500 /* Imagine: socket is IPv6. IPv4 packet arrives,
1501 goes to IPv4 receive handler and backlogged.
1502 From backlog it always goes here. Kerboom...
1503 Fortunately, tcp_rcv_established and rcv_established
1504 handle them correctly, but it is not case with
1505 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1506 */
1507
1508 if (skb->protocol == htons(ETH_P_IP))
1509 return tcp_v4_do_rcv(sk, skb);
1510
cfb6eeb4
YH
1511#ifdef CONFIG_TCP_MD5SIG
1512 if (tcp_v6_inbound_md5_hash (sk, skb))
1513 goto discard;
1514#endif
1515
fda9ef5d 1516 if (sk_filter(sk, skb))
1da177e4
LT
1517 goto discard;
1518
1519 /*
1520 * socket locking is here for SMP purposes as backlog rcv
1521 * is currently called with bh processing disabled.
1522 */
1523
1524 /* Do Stevens' IPV6_PKTOPTIONS.
1525
1526 Yes, guys, it is the only place in our code, where we
1527 may make it not affecting IPv4.
1528 The rest of code is protocol independent,
1529 and I do not like idea to uglify IPv4.
1530
1531 Actually, all the idea behind IPV6_PKTOPTIONS
1532 looks not very well thought. For now we latch
1533 options, received in the last packet, enqueued
1534 by tcp. Feel free to propose better solution.
1ab1457c 1535 --ANK (980728)
1da177e4
LT
1536 */
1537 if (np->rxopt.all)
1538 opt_skb = skb_clone(skb, GFP_ATOMIC);
1539
1540 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1541 TCP_CHECK_TIMER(sk);
aa8223c7 1542 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1da177e4
LT
1543 goto reset;
1544 TCP_CHECK_TIMER(sk);
1545 if (opt_skb)
1546 goto ipv6_pktoptions;
1547 return 0;
1548 }
1549
ab6a5bb6 1550 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1da177e4
LT
1551 goto csum_err;
1552
1ab1457c 1553 if (sk->sk_state == TCP_LISTEN) {
1da177e4
LT
1554 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1555 if (!nsk)
1556 goto discard;
1557
1558 /*
1559 * Queue it on the new socket if the new socket is active,
1560 * otherwise we just shortcircuit this and continue with
1561 * the new socket..
1562 */
1ab1457c 1563 if(nsk != sk) {
1da177e4
LT
1564 if (tcp_child_process(sk, nsk, skb))
1565 goto reset;
1566 if (opt_skb)
1567 __kfree_skb(opt_skb);
1568 return 0;
1569 }
1570 }
1571
1572 TCP_CHECK_TIMER(sk);
aa8223c7 1573 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1da177e4
LT
1574 goto reset;
1575 TCP_CHECK_TIMER(sk);
1576 if (opt_skb)
1577 goto ipv6_pktoptions;
1578 return 0;
1579
1580reset:
cfb6eeb4 1581 tcp_v6_send_reset(sk, skb);
1da177e4
LT
1582discard:
1583 if (opt_skb)
1584 __kfree_skb(opt_skb);
1585 kfree_skb(skb);
1586 return 0;
1587csum_err:
63231bdd 1588 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1da177e4
LT
1589 goto discard;
1590
1591
1592ipv6_pktoptions:
1593 /* Do you ask, what is it?
1594
1595 1. skb was enqueued by tcp.
1596 2. skb is added to tail of read queue, rather than out of order.
1597 3. socket is not in passive state.
1598 4. Finally, it really contains options, which user wants to receive.
1599 */
1600 tp = tcp_sk(sk);
1601 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1602 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
333fad53 1603 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
505cbfc5 1604 np->mcast_oif = inet6_iif(opt_skb);
333fad53 1605 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
0660e03f 1606 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
1da177e4
LT
1607 if (ipv6_opt_accepted(sk, opt_skb)) {
1608 skb_set_owner_r(opt_skb, sk);
1609 opt_skb = xchg(&np->pktoptions, opt_skb);
1610 } else {
1611 __kfree_skb(opt_skb);
1612 opt_skb = xchg(&np->pktoptions, NULL);
1613 }
1614 }
1615
800d55f1 1616 kfree_skb(opt_skb);
1da177e4
LT
1617 return 0;
1618}
1619
e5bbef20 1620static int tcp_v6_rcv(struct sk_buff *skb)
1da177e4 1621{
1ab1457c 1622 struct tcphdr *th;
1da177e4
LT
1623 struct sock *sk;
1624 int ret;
a86b1e30 1625 struct net *net = dev_net(skb->dev);
1da177e4
LT
1626
1627 if (skb->pkt_type != PACKET_HOST)
1628 goto discard_it;
1629
1630 /*
1631 * Count it even if it's bad.
1632 */
63231bdd 1633 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1da177e4
LT
1634
1635 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1636 goto discard_it;
1637
aa8223c7 1638 th = tcp_hdr(skb);
1da177e4
LT
1639
1640 if (th->doff < sizeof(struct tcphdr)/4)
1641 goto bad_packet;
1642 if (!pskb_may_pull(skb, th->doff*4))
1643 goto discard_it;
1644
60476372 1645 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1da177e4
LT
1646 goto bad_packet;
1647
aa8223c7 1648 th = tcp_hdr(skb);
1da177e4
LT
1649 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1650 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1651 skb->len - th->doff*4);
1652 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1653 TCP_SKB_CB(skb)->when = 0;
0660e03f 1654 TCP_SKB_CB(skb)->flags = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4
LT
1655 TCP_SKB_CB(skb)->sacked = 0;
1656
9a1f27c4 1657 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1da177e4
LT
1658 if (!sk)
1659 goto no_tcp_socket;
1660
1661process:
1662 if (sk->sk_state == TCP_TIME_WAIT)
1663 goto do_time_wait;
1664
1665 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1666 goto discard_and_relse;
1667
fda9ef5d 1668 if (sk_filter(sk, skb))
1da177e4
LT
1669 goto discard_and_relse;
1670
1671 skb->dev = NULL;
1672
293b9c42 1673 bh_lock_sock_nested(sk);
1da177e4
LT
1674 ret = 0;
1675 if (!sock_owned_by_user(sk)) {
1a2449a8 1676#ifdef CONFIG_NET_DMA
1ab1457c 1677 struct tcp_sock *tp = tcp_sk(sk);
b4caea8a 1678 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
f67b4599 1679 tp->ucopy.dma_chan = dma_find_channel(DMA_MEMCPY);
1ab1457c
YH
1680 if (tp->ucopy.dma_chan)
1681 ret = tcp_v6_do_rcv(sk, skb);
1682 else
1a2449a8
CL
1683#endif
1684 {
1685 if (!tcp_prequeue(sk, skb))
1686 ret = tcp_v6_do_rcv(sk, skb);
1687 }
1da177e4
LT
1688 } else
1689 sk_add_backlog(sk, skb);
1690 bh_unlock_sock(sk);
1691
1692 sock_put(sk);
1693 return ret ? -1 : 0;
1694
1695no_tcp_socket:
1696 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1697 goto discard_it;
1698
1699 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1700bad_packet:
63231bdd 1701 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1da177e4 1702 } else {
cfb6eeb4 1703 tcp_v6_send_reset(NULL, skb);
1da177e4
LT
1704 }
1705
1706discard_it:
1707
1708 /*
1709 * Discard frame
1710 */
1711
1712 kfree_skb(skb);
1713 return 0;
1714
1715discard_and_relse:
1716 sock_put(sk);
1717 goto discard_it;
1718
1719do_time_wait:
1720 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
9469c7b4 1721 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1722 goto discard_it;
1723 }
1724
1725 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
63231bdd 1726 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
9469c7b4 1727 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1728 goto discard_it;
1729 }
1730
9469c7b4 1731 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1da177e4
LT
1732 case TCP_TW_SYN:
1733 {
1734 struct sock *sk2;
1735
c346dca1 1736 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
0660e03f 1737 &ipv6_hdr(skb)->daddr,
505cbfc5 1738 ntohs(th->dest), inet6_iif(skb));
1da177e4 1739 if (sk2 != NULL) {
295ff7ed
ACM
1740 struct inet_timewait_sock *tw = inet_twsk(sk);
1741 inet_twsk_deschedule(tw, &tcp_death_row);
1742 inet_twsk_put(tw);
1da177e4
LT
1743 sk = sk2;
1744 goto process;
1745 }
1746 /* Fall through to ACK */
1747 }
1748 case TCP_TW_ACK:
1749 tcp_v6_timewait_ack(sk, skb);
1750 break;
1751 case TCP_TW_RST:
1752 goto no_tcp_socket;
1753 case TCP_TW_SUCCESS:;
1754 }
1755 goto discard_it;
1756}
1757
1da177e4
LT
/*
 * ->remember_stamp hook for native IPv6 sockets.  Not implemented yet:
 * it does nothing with @sk and always returns 0.
 */
static int tcp_v6_remember_stamp(struct sock *sk)
{
	/* Alas, not yet... */
	return 0;
}
1763
3b401a81 1764static const struct inet_connection_sock_af_ops ipv6_specific = {
543d9cfe
ACM
1765 .queue_xmit = inet6_csk_xmit,
1766 .send_check = tcp_v6_send_check,
1767 .rebuild_header = inet6_sk_rebuild_header,
1768 .conn_request = tcp_v6_conn_request,
1769 .syn_recv_sock = tcp_v6_syn_recv_sock,
1770 .remember_stamp = tcp_v6_remember_stamp,
1771 .net_header_len = sizeof(struct ipv6hdr),
1772 .setsockopt = ipv6_setsockopt,
1773 .getsockopt = ipv6_getsockopt,
1774 .addr2sockaddr = inet6_csk_addr2sockaddr,
1775 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1776 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1777#ifdef CONFIG_COMPAT
543d9cfe
ACM
1778 .compat_setsockopt = compat_ipv6_setsockopt,
1779 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1780#endif
1da177e4
LT
1781};
1782
#ifdef CONFIG_TCP_MD5SIG
/*
 * MD5 signature operations for native IPv6 sockets; installed as
 * tp->af_specific by tcp_v6_init_sock().
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_lookup	= tcp_v6_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_add	= tcp_v6_md5_add_func,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1791
1da177e4
LT
1792/*
1793 * TCP over IPv4 via INET6 API
1794 */
1795
3b401a81 1796static const struct inet_connection_sock_af_ops ipv6_mapped = {
543d9cfe
ACM
1797 .queue_xmit = ip_queue_xmit,
1798 .send_check = tcp_v4_send_check,
1799 .rebuild_header = inet_sk_rebuild_header,
1800 .conn_request = tcp_v6_conn_request,
1801 .syn_recv_sock = tcp_v6_syn_recv_sock,
1802 .remember_stamp = tcp_v4_remember_stamp,
1803 .net_header_len = sizeof(struct iphdr),
1804 .setsockopt = ipv6_setsockopt,
1805 .getsockopt = ipv6_getsockopt,
1806 .addr2sockaddr = inet6_csk_addr2sockaddr,
1807 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1808 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1809#ifdef CONFIG_COMPAT
543d9cfe
ACM
1810 .compat_setsockopt = compat_ipv6_setsockopt,
1811 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1812#endif
1da177e4
LT
1813};
1814
#ifdef CONFIG_TCP_MD5SIG
/*
 * MD5 signature operations for v4-mapped sockets: key lookup and hashing
 * use the IPv4 routines, key management goes through the IPv6 ones.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_lookup	= tcp_v4_md5_lookup,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,
	.md5_add	= tcp_v6_md5_add_func,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1823
1da177e4
LT
1824/* NOTE: A lot of things set to zero explicitly by call to
1825 * sk_alloc() so need not be done here.
1826 */
1827static int tcp_v6_init_sock(struct sock *sk)
1828{
6687e988 1829 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
1830 struct tcp_sock *tp = tcp_sk(sk);
1831
1832 skb_queue_head_init(&tp->out_of_order_queue);
1833 tcp_init_xmit_timers(sk);
1834 tcp_prequeue_init(tp);
1835
6687e988 1836 icsk->icsk_rto = TCP_TIMEOUT_INIT;
1da177e4
LT
1837 tp->mdev = TCP_TIMEOUT_INIT;
1838
1839 /* So many TCP implementations out there (incorrectly) count the
1840 * initial SYN frame in their delayed-ACK and congestion control
1841 * algorithms that we must have the following bandaid to talk
1842 * efficiently to them. -DaveM
1843 */
1844 tp->snd_cwnd = 2;
1845
1846 /* See draft-stevens-tcpca-spec-01 for discussion of the
1847 * initialization of these values.
1848 */
0b6a05c1 1849 tp->snd_ssthresh = TCP_INFINITE_SSTHRESH;
1da177e4 1850 tp->snd_cwnd_clamp = ~0;
bee7ca9e 1851 tp->mss_cache = TCP_MSS_DEFAULT;
1da177e4
LT
1852
1853 tp->reordering = sysctl_tcp_reordering;
1854
1855 sk->sk_state = TCP_CLOSE;
1856
8292a17a 1857 icsk->icsk_af_ops = &ipv6_specific;
6687e988 1858 icsk->icsk_ca_ops = &tcp_init_congestion_ops;
d83d8461 1859 icsk->icsk_sync_mss = tcp_sync_mss;
1da177e4
LT
1860 sk->sk_write_space = sk_stream_write_space;
1861 sock_set_flag(sk, SOCK_USE_WRITE_QUEUE);
1862
cfb6eeb4
YH
1863#ifdef CONFIG_TCP_MD5SIG
1864 tp->af_specific = &tcp_sock_ipv6_specific;
1865#endif
1866
435cf559
WAS
1867 /* TCP Cookie Transactions */
1868 if (sysctl_tcp_cookie_size > 0) {
1869 /* Default, cookies without s_data_payload. */
1870 tp->cookie_values =
1871 kzalloc(sizeof(*tp->cookie_values),
1872 sk->sk_allocation);
1873 if (tp->cookie_values != NULL)
1874 kref_init(&tp->cookie_values->kref);
1875 }
1876 /* Presumed zeroed, in order of appearance:
1877 * cookie_in_always, cookie_out_never,
1878 * s_data_constant, s_data_in, s_data_out
1879 */
1da177e4
LT
1880 sk->sk_sndbuf = sysctl_tcp_wmem[1];
1881 sk->sk_rcvbuf = sysctl_tcp_rmem[1];
1882
eb4dea58 1883 local_bh_disable();
1748376b 1884 percpu_counter_inc(&tcp_sockets_allocated);
eb4dea58 1885 local_bh_enable();
1da177e4
LT
1886
1887 return 0;
1888}
1889
/*
 * Tear down an IPv6 TCP socket: drop its MD5 keys (if any), then run the
 * generic TCP destructor followed by the IPv6-level one.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
#ifdef CONFIG_TCP_MD5SIG
	/* Clean up the MD5 key list */
	if (tcp_sk(sk)->md5sig_info)
		tcp_v6_clear_md5_list(sk);
#endif
	tcp_v4_destroy_sock(sk);
	inet6_destroy_sock(sk);
}
1900
952a10be 1901#ifdef CONFIG_PROC_FS
1da177e4 1902/* Proc filesystem TCPv6 sock list dumping. */
1ab1457c 1903static void get_openreq6(struct seq_file *seq,
60236fdd 1904 struct sock *sk, struct request_sock *req, int i, int uid)
1da177e4 1905{
1da177e4 1906 int ttd = req->expires - jiffies;
ca304b61
ACM
1907 struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1908 struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1da177e4
LT
1909
1910 if (ttd < 0)
1911 ttd = 0;
1912
1da177e4
LT
1913 seq_printf(seq,
1914 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1915 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1916 i,
1917 src->s6_addr32[0], src->s6_addr32[1],
1918 src->s6_addr32[2], src->s6_addr32[3],
fd507037 1919 ntohs(inet_rsk(req)->loc_port),
1da177e4
LT
1920 dest->s6_addr32[0], dest->s6_addr32[1],
1921 dest->s6_addr32[2], dest->s6_addr32[3],
2e6599cb 1922 ntohs(inet_rsk(req)->rmt_port),
1da177e4
LT
1923 TCP_SYN_RECV,
1924 0,0, /* could print option size, but that is af dependent. */
1ab1457c
YH
1925 1, /* timers active (only the expire timer) */
1926 jiffies_to_clock_t(ttd),
1da177e4
LT
1927 req->retrans,
1928 uid,
1ab1457c 1929 0, /* non standard timer */
1da177e4
LT
1930 0, /* open_requests have no inode */
1931 0, req);
1932}
1933
1934static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1935{
1936 struct in6_addr *dest, *src;
1937 __u16 destp, srcp;
1938 int timer_active;
1939 unsigned long timer_expires;
1940 struct inet_sock *inet = inet_sk(sp);
1941 struct tcp_sock *tp = tcp_sk(sp);
463c84b9 1942 const struct inet_connection_sock *icsk = inet_csk(sp);
1da177e4
LT
1943 struct ipv6_pinfo *np = inet6_sk(sp);
1944
1945 dest = &np->daddr;
1946 src = &np->rcv_saddr;
c720c7e8
ED
1947 destp = ntohs(inet->inet_dport);
1948 srcp = ntohs(inet->inet_sport);
463c84b9
ACM
1949
1950 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1da177e4 1951 timer_active = 1;
463c84b9
ACM
1952 timer_expires = icsk->icsk_timeout;
1953 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1da177e4 1954 timer_active = 4;
463c84b9 1955 timer_expires = icsk->icsk_timeout;
1da177e4
LT
1956 } else if (timer_pending(&sp->sk_timer)) {
1957 timer_active = 2;
1958 timer_expires = sp->sk_timer.expires;
1959 } else {
1960 timer_active = 0;
1961 timer_expires = jiffies;
1962 }
1963
1964 seq_printf(seq,
1965 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
7be87351 1966 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %p %lu %lu %u %u %d\n",
1da177e4
LT
1967 i,
1968 src->s6_addr32[0], src->s6_addr32[1],
1969 src->s6_addr32[2], src->s6_addr32[3], srcp,
1970 dest->s6_addr32[0], dest->s6_addr32[1],
1971 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1ab1457c 1972 sp->sk_state,
47da8ee6
SS
1973 tp->write_seq-tp->snd_una,
1974 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1da177e4
LT
1975 timer_active,
1976 jiffies_to_clock_t(timer_expires - jiffies),
463c84b9 1977 icsk->icsk_retransmits,
1da177e4 1978 sock_i_uid(sp),
6687e988 1979 icsk->icsk_probes_out,
1da177e4
LT
1980 sock_i_ino(sp),
1981 atomic_read(&sp->sk_refcnt), sp,
7be87351
SH
1982 jiffies_to_clock_t(icsk->icsk_rto),
1983 jiffies_to_clock_t(icsk->icsk_ack.ato),
463c84b9 1984 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
0b6a05c1
IJ
1985 tp->snd_cwnd,
1986 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
1da177e4
LT
1987 );
1988}
1989
1ab1457c 1990static void get_timewait6_sock(struct seq_file *seq,
8feaf0c0 1991 struct inet_timewait_sock *tw, int i)
1da177e4
LT
1992{
1993 struct in6_addr *dest, *src;
1994 __u16 destp, srcp;
0fa1a53e 1995 struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
1da177e4
LT
1996 int ttd = tw->tw_ttd - jiffies;
1997
1998 if (ttd < 0)
1999 ttd = 0;
2000
0fa1a53e
ACM
2001 dest = &tw6->tw_v6_daddr;
2002 src = &tw6->tw_v6_rcv_saddr;
1da177e4
LT
2003 destp = ntohs(tw->tw_dport);
2004 srcp = ntohs(tw->tw_sport);
2005
2006 seq_printf(seq,
2007 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
2008 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
2009 i,
2010 src->s6_addr32[0], src->s6_addr32[1],
2011 src->s6_addr32[2], src->s6_addr32[3], srcp,
2012 dest->s6_addr32[0], dest->s6_addr32[1],
2013 dest->s6_addr32[2], dest->s6_addr32[3], destp,
2014 tw->tw_substate, 0, 0,
2015 3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
2016 atomic_read(&tw->tw_refcnt), tw);
2017}
2018
1da177e4
LT
2019static int tcp6_seq_show(struct seq_file *seq, void *v)
2020{
2021 struct tcp_iter_state *st;
2022
2023 if (v == SEQ_START_TOKEN) {
2024 seq_puts(seq,
2025 " sl "
2026 "local_address "
2027 "remote_address "
2028 "st tx_queue rx_queue tr tm->when retrnsmt"
2029 " uid timeout inode\n");
2030 goto out;
2031 }
2032 st = seq->private;
2033
2034 switch (st->state) {
2035 case TCP_SEQ_STATE_LISTENING:
2036 case TCP_SEQ_STATE_ESTABLISHED:
2037 get_tcp6_sock(seq, v, st->num);
2038 break;
2039 case TCP_SEQ_STATE_OPENREQ:
2040 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
2041 break;
2042 case TCP_SEQ_STATE_TIME_WAIT:
2043 get_timewait6_sock(seq, v, st->num);
2044 break;
2045 }
2046out:
2047 return 0;
2048}
2049
1da177e4 2050static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1da177e4
LT
2051 .name = "tcp6",
2052 .family = AF_INET6,
5f4472c5
DL
2053 .seq_fops = {
2054 .owner = THIS_MODULE,
2055 },
9427c4b3
DL
2056 .seq_ops = {
2057 .show = tcp6_seq_show,
2058 },
1da177e4
LT
2059};
2060
6f8b13bc 2061int tcp6_proc_init(struct net *net)
1da177e4 2062{
6f8b13bc 2063 return tcp_proc_register(net, &tcp6_seq_afinfo);
1da177e4
LT
2064}
2065
6f8b13bc 2066void tcp6_proc_exit(struct net *net)
1da177e4 2067{
6f8b13bc 2068 tcp_proc_unregister(net, &tcp6_seq_afinfo);
1da177e4
LT
2069}
2070#endif
2071
2072struct proto tcpv6_prot = {
2073 .name = "TCPv6",
2074 .owner = THIS_MODULE,
2075 .close = tcp_close,
2076 .connect = tcp_v6_connect,
2077 .disconnect = tcp_disconnect,
463c84b9 2078 .accept = inet_csk_accept,
1da177e4
LT
2079 .ioctl = tcp_ioctl,
2080 .init = tcp_v6_init_sock,
2081 .destroy = tcp_v6_destroy_sock,
2082 .shutdown = tcp_shutdown,
2083 .setsockopt = tcp_setsockopt,
2084 .getsockopt = tcp_getsockopt,
1da177e4
LT
2085 .recvmsg = tcp_recvmsg,
2086 .backlog_rcv = tcp_v6_do_rcv,
2087 .hash = tcp_v6_hash,
ab1e0a13
ACM
2088 .unhash = inet_unhash,
2089 .get_port = inet_csk_get_port,
1da177e4
LT
2090 .enter_memory_pressure = tcp_enter_memory_pressure,
2091 .sockets_allocated = &tcp_sockets_allocated,
2092 .memory_allocated = &tcp_memory_allocated,
2093 .memory_pressure = &tcp_memory_pressure,
0a5578cf 2094 .orphan_count = &tcp_orphan_count,
1da177e4
LT
2095 .sysctl_mem = sysctl_tcp_mem,
2096 .sysctl_wmem = sysctl_tcp_wmem,
2097 .sysctl_rmem = sysctl_tcp_rmem,
2098 .max_header = MAX_TCP_HEADER,
2099 .obj_size = sizeof(struct tcp6_sock),
3ab5aee7 2100 .slab_flags = SLAB_DESTROY_BY_RCU,
6d6ee43e 2101 .twsk_prot = &tcp6_timewait_sock_ops,
60236fdd 2102 .rsk_prot = &tcp6_request_sock_ops,
39d8cda7 2103 .h.hashinfo = &tcp_hashinfo,
543d9cfe
ACM
2104#ifdef CONFIG_COMPAT
2105 .compat_setsockopt = compat_tcp_setsockopt,
2106 .compat_getsockopt = compat_tcp_getsockopt,
2107#endif
1da177e4
LT
2108};
2109
41135cc8 2110static const struct inet6_protocol tcpv6_protocol = {
1da177e4
LT
2111 .handler = tcp_v6_rcv,
2112 .err_handler = tcp_v6_err,
a430a43d 2113 .gso_send_check = tcp_v6_gso_send_check,
adcfc7d0 2114 .gso_segment = tcp_tso_segment,
684f2176
HX
2115 .gro_receive = tcp6_gro_receive,
2116 .gro_complete = tcp6_gro_complete,
1da177e4
LT
2117 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
2118};
2119
1da177e4
LT
2120static struct inet_protosw tcpv6_protosw = {
2121 .type = SOCK_STREAM,
2122 .protocol = IPPROTO_TCP,
2123 .prot = &tcpv6_prot,
2124 .ops = &inet6_stream_ops,
1da177e4 2125 .no_check = 0,
d83d8461
ACM
2126 .flags = INET_PROTOSW_PERMANENT |
2127 INET_PROTOSW_ICSK,
1da177e4
LT
2128};
2129
93ec926b
DL
2130static int tcpv6_net_init(struct net *net)
2131{
5677242f
DL
2132 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2133 SOCK_RAW, IPPROTO_TCP, net);
93ec926b
DL
2134}
2135
2136static void tcpv6_net_exit(struct net *net)
2137{
5677242f 2138 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
d315492b 2139 inet_twsk_purge(net, &tcp_hashinfo, &tcp_death_row, AF_INET6);
93ec926b
DL
2140}
2141
2142static struct pernet_operations tcpv6_net_ops = {
2143 .init = tcpv6_net_init,
2144 .exit = tcpv6_net_exit,
2145};
2146
7f4e4868 2147int __init tcpv6_init(void)
1da177e4 2148{
7f4e4868
DL
2149 int ret;
2150
2151 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2152 if (ret)
2153 goto out;
2154
1da177e4 2155 /* register inet6 protocol */
7f4e4868
DL
2156 ret = inet6_register_protosw(&tcpv6_protosw);
2157 if (ret)
2158 goto out_tcpv6_protocol;
2159
93ec926b 2160 ret = register_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2161 if (ret)
2162 goto out_tcpv6_protosw;
2163out:
2164 return ret;
ae0f7d5f 2165
7f4e4868
DL
2166out_tcpv6_protocol:
2167 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2168out_tcpv6_protosw:
2169 inet6_unregister_protosw(&tcpv6_protosw);
2170 goto out;
2171}
2172
09f7709f 2173void tcpv6_exit(void)
7f4e4868 2174{
93ec926b 2175 unregister_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2176 inet6_unregister_protosw(&tcpv6_protosw);
2177 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
1da177e4 2178}