net: add sk_stream_is_writeable() helper
[linux-2.6-block.git] / net / ipv6 / tcp_ipv6.c
CommitLineData
1da177e4
LT
1/*
2 * TCP over IPv6
1ab1457c 3 * Linux INET6 implementation
1da177e4
LT
4 *
5 * Authors:
1ab1457c 6 * Pedro Roque <roque@di.fc.ul.pt>
1da177e4 7 *
1ab1457c 8 * Based on:
1da177e4
LT
9 * linux/net/ipv4/tcp.c
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
12 *
13 * Fixes:
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allow both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 */
25
eb4dea58 26#include <linux/bottom_half.h>
1da177e4 27#include <linux/module.h>
1da177e4
LT
28#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
5a0e3ad6 41#include <linux/slab.h>
1da177e4
LT
42
43#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
5324a040 49#include <net/inet6_hashtables.h>
8129765a 50#include <net/inet6_connection_sock.h>
1da177e4
LT
51#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
1da177e4
LT
59#include <net/snmp.h>
60#include <net/dsfield.h>
6d6ee43e 61#include <net/timewait_sock.h>
18134bed 62#include <net/netdma.h>
3d58b5fa 63#include <net/inet_common.h>
6e5714ea 64#include <net/secure_seq.h>
d1a4c0b3 65#include <net/tcp_memcontrol.h>
076bb0c8 66#include <net/busy_poll.h>
1da177e4
LT
67
68#include <asm/uaccess.h>
69
70#include <linux/proc_fs.h>
71#include <linux/seq_file.h>
72
cfb6eeb4
YH
73#include <linux/crypto.h>
74#include <linux/scatterlist.h>
75
cfb6eeb4 76static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
6edafaaf
GJ
77static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
78 struct request_sock *req);
1da177e4
LT
79
80static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
1da177e4 81
3b401a81
SH
82static const struct inet_connection_sock_af_ops ipv6_mapped;
83static const struct inet_connection_sock_af_ops ipv6_specific;
a928630a 84#ifdef CONFIG_TCP_MD5SIG
b2e4b3de
SH
85static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
86static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
9501f972
YH
87#else
88static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 89 const struct in6_addr *addr)
9501f972
YH
90{
91 return NULL;
92}
a928630a 93#endif
1da177e4 94
fae6ef87
NC
95static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
96{
97 struct dst_entry *dst = skb_dst(skb);
98 const struct rt6_info *rt = (const struct rt6_info *)dst;
99
100 dst_hold(dst);
101 sk->sk_rx_dst = dst;
102 inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
103 if (rt->rt6i_node)
104 inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
105}
106
1da177e4
LT
107static void tcp_v6_hash(struct sock *sk)
108{
109 if (sk->sk_state != TCP_CLOSE) {
8292a17a 110 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
1da177e4
LT
111 tcp_prot.hash(sk);
112 return;
113 }
114 local_bh_disable();
9327f705 115 __inet6_hash(sk, NULL);
1da177e4
LT
116 local_bh_enable();
117 }
118}
119
cf533ea5 120static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
1da177e4 121{
0660e03f
ACM
122 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
123 ipv6_hdr(skb)->saddr.s6_addr32,
aa8223c7
ACM
124 tcp_hdr(skb)->dest,
125 tcp_hdr(skb)->source);
1da177e4
LT
126}
127
1ab1457c 128static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
1da177e4
LT
129 int addr_len)
130{
131 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
1ab1457c 132 struct inet_sock *inet = inet_sk(sk);
d83d8461 133 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
134 struct ipv6_pinfo *np = inet6_sk(sk);
135 struct tcp_sock *tp = tcp_sk(sk);
20c59de2 136 struct in6_addr *saddr = NULL, *final_p, final;
493f377d 137 struct rt6_info *rt;
4c9483b2 138 struct flowi6 fl6;
1da177e4
LT
139 struct dst_entry *dst;
140 int addr_type;
141 int err;
142
1ab1457c 143 if (addr_len < SIN6_LEN_RFC2133)
1da177e4
LT
144 return -EINVAL;
145
1ab1457c 146 if (usin->sin6_family != AF_INET6)
a02cec21 147 return -EAFNOSUPPORT;
1da177e4 148
4c9483b2 149 memset(&fl6, 0, sizeof(fl6));
1da177e4
LT
150
151 if (np->sndflow) {
4c9483b2
DM
152 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
153 IP6_ECN_flow_init(fl6.flowlabel);
154 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
1da177e4 155 struct ip6_flowlabel *flowlabel;
4c9483b2 156 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
1da177e4
LT
157 if (flowlabel == NULL)
158 return -EINVAL;
4e3fd7a0 159 usin->sin6_addr = flowlabel->dst;
1da177e4
LT
160 fl6_sock_release(flowlabel);
161 }
162 }
163
164 /*
1ab1457c
YH
165 * connect() to INADDR_ANY means loopback (BSD'ism).
166 */
167
168 if(ipv6_addr_any(&usin->sin6_addr))
169 usin->sin6_addr.s6_addr[15] = 0x1;
1da177e4
LT
170
171 addr_type = ipv6_addr_type(&usin->sin6_addr);
172
173 if(addr_type & IPV6_ADDR_MULTICAST)
174 return -ENETUNREACH;
175
176 if (addr_type&IPV6_ADDR_LINKLOCAL) {
177 if (addr_len >= sizeof(struct sockaddr_in6) &&
178 usin->sin6_scope_id) {
179 /* If interface is set while binding, indices
180 * must coincide.
181 */
182 if (sk->sk_bound_dev_if &&
183 sk->sk_bound_dev_if != usin->sin6_scope_id)
184 return -EINVAL;
185
186 sk->sk_bound_dev_if = usin->sin6_scope_id;
187 }
188
189 /* Connect to link-local address requires an interface */
190 if (!sk->sk_bound_dev_if)
191 return -EINVAL;
192 }
193
194 if (tp->rx_opt.ts_recent_stamp &&
195 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
196 tp->rx_opt.ts_recent = 0;
197 tp->rx_opt.ts_recent_stamp = 0;
198 tp->write_seq = 0;
199 }
200
4e3fd7a0 201 np->daddr = usin->sin6_addr;
4c9483b2 202 np->flow_label = fl6.flowlabel;
1da177e4
LT
203
204 /*
205 * TCP over IPv4
206 */
207
208 if (addr_type == IPV6_ADDR_MAPPED) {
d83d8461 209 u32 exthdrlen = icsk->icsk_ext_hdr_len;
1da177e4
LT
210 struct sockaddr_in sin;
211
212 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
213
214 if (__ipv6_only_sock(sk))
215 return -ENETUNREACH;
216
217 sin.sin_family = AF_INET;
218 sin.sin_port = usin->sin6_port;
219 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
220
d83d8461 221 icsk->icsk_af_ops = &ipv6_mapped;
1da177e4 222 sk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
223#ifdef CONFIG_TCP_MD5SIG
224 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
225#endif
1da177e4
LT
226
227 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
228
229 if (err) {
d83d8461
ACM
230 icsk->icsk_ext_hdr_len = exthdrlen;
231 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 232 sk->sk_backlog_rcv = tcp_v6_do_rcv;
cfb6eeb4
YH
233#ifdef CONFIG_TCP_MD5SIG
234 tp->af_specific = &tcp_sock_ipv6_specific;
235#endif
1da177e4
LT
236 goto failure;
237 } else {
c720c7e8
ED
238 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
239 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
240 &np->rcv_saddr);
1da177e4
LT
241 }
242
243 return err;
244 }
245
246 if (!ipv6_addr_any(&np->rcv_saddr))
247 saddr = &np->rcv_saddr;
248
4c9483b2 249 fl6.flowi6_proto = IPPROTO_TCP;
4e3fd7a0
AD
250 fl6.daddr = np->daddr;
251 fl6.saddr = saddr ? *saddr : np->saddr;
4c9483b2
DM
252 fl6.flowi6_oif = sk->sk_bound_dev_if;
253 fl6.flowi6_mark = sk->sk_mark;
1958b856
DM
254 fl6.fl6_dport = usin->sin6_port;
255 fl6.fl6_sport = inet->inet_sport;
1da177e4 256
4c9483b2 257 final_p = fl6_update_dst(&fl6, np->opt, &final);
1da177e4 258
4c9483b2 259 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
beb8d13b 260
4c9483b2 261 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
68d0c6d3
DM
262 if (IS_ERR(dst)) {
263 err = PTR_ERR(dst);
1da177e4 264 goto failure;
14e50e57 265 }
1da177e4
LT
266
267 if (saddr == NULL) {
4c9483b2 268 saddr = &fl6.saddr;
4e3fd7a0 269 np->rcv_saddr = *saddr;
1da177e4
LT
270 }
271
272 /* set the source address */
4e3fd7a0 273 np->saddr = *saddr;
c720c7e8 274 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 275
f83ef8c0 276 sk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 277 __ip6_dst_store(sk, dst, NULL, NULL);
1da177e4 278
493f377d
DM
279 rt = (struct rt6_info *) dst;
280 if (tcp_death_row.sysctl_tw_recycle &&
281 !tp->rx_opt.ts_recent_stamp &&
81166dd6
DM
282 ipv6_addr_equal(&rt->rt6i_dst.addr, &np->daddr))
283 tcp_fetch_timewait_stamp(sk, dst);
493f377d 284
d83d8461 285 icsk->icsk_ext_hdr_len = 0;
1da177e4 286 if (np->opt)
d83d8461
ACM
287 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
288 np->opt->opt_nflen);
1da177e4
LT
289
290 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
291
c720c7e8 292 inet->inet_dport = usin->sin6_port;
1da177e4
LT
293
294 tcp_set_state(sk, TCP_SYN_SENT);
d8313f5c 295 err = inet6_hash_connect(&tcp_death_row, sk);
1da177e4
LT
296 if (err)
297 goto late_failure;
298
2b916477 299 if (!tp->write_seq && likely(!tp->repair))
1da177e4
LT
300 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
301 np->daddr.s6_addr32,
c720c7e8
ED
302 inet->inet_sport,
303 inet->inet_dport);
1da177e4
LT
304
305 err = tcp_connect(sk);
306 if (err)
307 goto late_failure;
308
309 return 0;
310
311late_failure:
312 tcp_set_state(sk, TCP_CLOSE);
313 __sk_dst_reset(sk);
314failure:
c720c7e8 315 inet->inet_dport = 0;
1da177e4
LT
316 sk->sk_route_caps = 0;
317 return err;
318}
319
563d34d0
ED
320static void tcp_v6_mtu_reduced(struct sock *sk)
321{
322 struct dst_entry *dst;
323
324 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
325 return;
326
327 dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
328 if (!dst)
329 return;
330
331 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
332 tcp_sync_mss(sk, dst_mtu(dst));
333 tcp_simple_retransmit(sk);
334 }
335}
336
1da177e4 337static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
d5fdd6ba 338 u8 type, u8 code, int offset, __be32 info)
1da177e4 339{
b71d1d42 340 const struct ipv6hdr *hdr = (const struct ipv6hdr*)skb->data;
505cbfc5 341 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
1da177e4
LT
342 struct ipv6_pinfo *np;
343 struct sock *sk;
344 int err;
1ab1457c 345 struct tcp_sock *tp;
1da177e4 346 __u32 seq;
ca12a1a4 347 struct net *net = dev_net(skb->dev);
1da177e4 348
ca12a1a4 349 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
d86e0dac 350 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
1da177e4
LT
351
352 if (sk == NULL) {
e41b5368
DL
353 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
354 ICMP6_MIB_INERRORS);
1da177e4
LT
355 return;
356 }
357
358 if (sk->sk_state == TCP_TIME_WAIT) {
9469c7b4 359 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
360 return;
361 }
362
363 bh_lock_sock(sk);
563d34d0 364 if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
de0744af 365 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
1da177e4
LT
366
367 if (sk->sk_state == TCP_CLOSE)
368 goto out;
369
e802af9c
SH
370 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
371 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
372 goto out;
373 }
374
1da177e4 375 tp = tcp_sk(sk);
1ab1457c 376 seq = ntohl(th->seq);
1da177e4
LT
377 if (sk->sk_state != TCP_LISTEN &&
378 !between(seq, tp->snd_una, tp->snd_nxt)) {
de0744af 379 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
380 goto out;
381 }
382
383 np = inet6_sk(sk);
384
ec18d9a2
DM
385 if (type == NDISC_REDIRECT) {
386 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
387
1ed5c48f 388 if (dst)
6700c270 389 dst->ops->redirect(dst, sk, skb);
50a75a89 390 goto out;
ec18d9a2
DM
391 }
392
1da177e4 393 if (type == ICMPV6_PKT_TOOBIG) {
0d4f0608
ED
394 /* We are not interested in TCP_LISTEN and open_requests
395 * (SYN-ACKs send out by Linux are always <576bytes so
396 * they should go through unfragmented).
397 */
398 if (sk->sk_state == TCP_LISTEN)
399 goto out;
400
563d34d0
ED
401 tp->mtu_info = ntohl(info);
402 if (!sock_owned_by_user(sk))
403 tcp_v6_mtu_reduced(sk);
d013ef2a
JA
404 else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
405 &tp->tsq_flags))
406 sock_hold(sk);
1da177e4
LT
407 goto out;
408 }
409
410 icmpv6_err_convert(type, code, &err);
411
60236fdd 412 /* Might be for an request_sock */
1da177e4 413 switch (sk->sk_state) {
60236fdd 414 struct request_sock *req, **prev;
1da177e4
LT
415 case TCP_LISTEN:
416 if (sock_owned_by_user(sk))
417 goto out;
418
8129765a
ACM
419 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
420 &hdr->saddr, inet6_iif(skb));
1da177e4
LT
421 if (!req)
422 goto out;
423
424 /* ICMPs are not backlogged, hence we cannot get
425 * an established socket here.
426 */
547b792c 427 WARN_ON(req->sk != NULL);
1da177e4 428
2e6599cb 429 if (seq != tcp_rsk(req)->snt_isn) {
de0744af 430 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
431 goto out;
432 }
433
463c84b9 434 inet_csk_reqsk_queue_drop(sk, req, prev);
5f1e942c 435 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
436 goto out;
437
438 case TCP_SYN_SENT:
439 case TCP_SYN_RECV: /* Cannot happen.
1ab1457c 440 It can, it SYNs are crossed. --ANK */
1da177e4 441 if (!sock_owned_by_user(sk)) {
1da177e4
LT
442 sk->sk_err = err;
443 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
444
445 tcp_done(sk);
446 } else
447 sk->sk_err_soft = err;
448 goto out;
449 }
450
451 if (!sock_owned_by_user(sk) && np->recverr) {
452 sk->sk_err = err;
453 sk->sk_error_report(sk);
454 } else
455 sk->sk_err_soft = err;
456
457out:
458 bh_unlock_sock(sk);
459 sock_put(sk);
460}
461
462
9f10d3f6
NC
463static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
464 struct flowi6 *fl6,
3840a06e 465 struct request_sock *req,
fff32699 466 u16 queue_mapping)
1da177e4 467{
ca304b61 468 struct inet6_request_sock *treq = inet6_rsk(req);
1da177e4
LT
469 struct ipv6_pinfo *np = inet6_sk(sk);
470 struct sk_buff * skb;
9494218f 471 int err = -ENOMEM;
1da177e4 472
9f10d3f6
NC
473 /* First, grab a route. */
474 if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
fd80eb94 475 goto done;
9494218f 476
1a2c6181 477 skb = tcp_make_synack(sk, dst, req, NULL);
9494218f 478
1da177e4 479 if (skb) {
8ad50d96 480 __tcp_v6_send_check(skb, &treq->loc_addr, &treq->rmt_addr);
1da177e4 481
9f10d3f6 482 fl6->daddr = treq->rmt_addr;
fff32699 483 skb_set_queue_mapping(skb, queue_mapping);
43264e0b 484 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
b9df3cb8 485 err = net_xmit_eval(err);
1da177e4
LT
486 }
487
488done:
1da177e4
LT
489 return err;
490}
491
1a2c6181 492static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req)
72659ecc 493{
9f10d3f6 494 struct flowi6 fl6;
e6c022a4 495 int res;
9f10d3f6 496
1a2c6181 497 res = tcp_v6_send_synack(sk, NULL, &fl6, req, 0);
e6c022a4
ED
498 if (!res)
499 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
500 return res;
72659ecc
OP
501}
502
60236fdd 503static void tcp_v6_reqsk_destructor(struct request_sock *req)
1da177e4 504{
800d55f1 505 kfree_skb(inet6_rsk(req)->pktopts);
1da177e4
LT
506}
507
cfb6eeb4
YH
508#ifdef CONFIG_TCP_MD5SIG
509static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 510 const struct in6_addr *addr)
cfb6eeb4 511{
a915da9b 512 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
cfb6eeb4
YH
513}
514
515static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
516 struct sock *addr_sk)
517{
518 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
519}
520
521static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
522 struct request_sock *req)
523{
524 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
525}
526
cfb6eeb4
YH
527static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
528 int optlen)
529{
530 struct tcp_md5sig cmd;
531 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
cfb6eeb4
YH
532
533 if (optlen < sizeof(cmd))
534 return -EINVAL;
535
536 if (copy_from_user(&cmd, optval, sizeof(cmd)))
537 return -EFAULT;
538
539 if (sin6->sin6_family != AF_INET6)
540 return -EINVAL;
541
542 if (!cmd.tcpm_keylen) {
e773e4fa 543 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
a915da9b
ED
544 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
545 AF_INET);
546 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
547 AF_INET6);
cfb6eeb4
YH
548 }
549
550 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
551 return -EINVAL;
552
a915da9b
ED
553 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
554 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
555 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4 556
a915da9b
ED
557 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
558 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4
YH
559}
560
49a72dfb 561static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
b71d1d42
ED
562 const struct in6_addr *daddr,
563 const struct in6_addr *saddr, int nbytes)
cfb6eeb4 564{
cfb6eeb4 565 struct tcp6_pseudohdr *bp;
49a72dfb 566 struct scatterlist sg;
8d26d76d 567
cfb6eeb4 568 bp = &hp->md5_blk.ip6;
cfb6eeb4 569 /* 1. TCP pseudo-header (RFC2460) */
4e3fd7a0
AD
570 bp->saddr = *saddr;
571 bp->daddr = *daddr;
49a72dfb 572 bp->protocol = cpu_to_be32(IPPROTO_TCP);
00b1304c 573 bp->len = cpu_to_be32(nbytes);
cfb6eeb4 574
49a72dfb
AL
575 sg_init_one(&sg, bp, sizeof(*bp));
576 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
577}
c7da57a1 578
49a72dfb 579static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
b71d1d42 580 const struct in6_addr *daddr, struct in6_addr *saddr,
318cf7aa 581 const struct tcphdr *th)
49a72dfb
AL
582{
583 struct tcp_md5sig_pool *hp;
584 struct hash_desc *desc;
585
586 hp = tcp_get_md5sig_pool();
587 if (!hp)
588 goto clear_hash_noput;
589 desc = &hp->md5_desc;
590
591 if (crypto_hash_init(desc))
592 goto clear_hash;
593 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
594 goto clear_hash;
595 if (tcp_md5_hash_header(hp, th))
596 goto clear_hash;
597 if (tcp_md5_hash_key(hp, key))
598 goto clear_hash;
599 if (crypto_hash_final(desc, md5_hash))
cfb6eeb4 600 goto clear_hash;
cfb6eeb4 601
cfb6eeb4 602 tcp_put_md5sig_pool();
cfb6eeb4 603 return 0;
49a72dfb 604
cfb6eeb4
YH
605clear_hash:
606 tcp_put_md5sig_pool();
607clear_hash_noput:
608 memset(md5_hash, 0, 16);
49a72dfb 609 return 1;
cfb6eeb4
YH
610}
611
49a72dfb 612static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
318cf7aa
ED
613 const struct sock *sk,
614 const struct request_sock *req,
615 const struct sk_buff *skb)
cfb6eeb4 616{
b71d1d42 617 const struct in6_addr *saddr, *daddr;
49a72dfb
AL
618 struct tcp_md5sig_pool *hp;
619 struct hash_desc *desc;
318cf7aa 620 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4
YH
621
622 if (sk) {
623 saddr = &inet6_sk(sk)->saddr;
624 daddr = &inet6_sk(sk)->daddr;
49a72dfb 625 } else if (req) {
cfb6eeb4
YH
626 saddr = &inet6_rsk(req)->loc_addr;
627 daddr = &inet6_rsk(req)->rmt_addr;
49a72dfb 628 } else {
b71d1d42 629 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
49a72dfb
AL
630 saddr = &ip6h->saddr;
631 daddr = &ip6h->daddr;
cfb6eeb4 632 }
49a72dfb
AL
633
634 hp = tcp_get_md5sig_pool();
635 if (!hp)
636 goto clear_hash_noput;
637 desc = &hp->md5_desc;
638
639 if (crypto_hash_init(desc))
640 goto clear_hash;
641
642 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
643 goto clear_hash;
644 if (tcp_md5_hash_header(hp, th))
645 goto clear_hash;
646 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
647 goto clear_hash;
648 if (tcp_md5_hash_key(hp, key))
649 goto clear_hash;
650 if (crypto_hash_final(desc, md5_hash))
651 goto clear_hash;
652
653 tcp_put_md5sig_pool();
654 return 0;
655
656clear_hash:
657 tcp_put_md5sig_pool();
658clear_hash_noput:
659 memset(md5_hash, 0, 16);
660 return 1;
cfb6eeb4
YH
661}
662
318cf7aa 663static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
cfb6eeb4 664{
cf533ea5 665 const __u8 *hash_location = NULL;
cfb6eeb4 666 struct tcp_md5sig_key *hash_expected;
b71d1d42 667 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
318cf7aa 668 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4 669 int genhash;
cfb6eeb4
YH
670 u8 newhash[16];
671
672 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
7d5d5525 673 hash_location = tcp_parse_md5sig_option(th);
cfb6eeb4 674
785957d3
DM
675 /* We've parsed the options - do we have a hash? */
676 if (!hash_expected && !hash_location)
677 return 0;
678
679 if (hash_expected && !hash_location) {
680 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
cfb6eeb4
YH
681 return 1;
682 }
683
785957d3
DM
684 if (!hash_expected && hash_location) {
685 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
cfb6eeb4
YH
686 return 1;
687 }
688
689 /* check the signature */
49a72dfb
AL
690 genhash = tcp_v6_md5_hash_skb(newhash,
691 hash_expected,
692 NULL, NULL, skb);
693
cfb6eeb4 694 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
e87cc472
JP
695 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
696 genhash ? "failed" : "mismatch",
697 &ip6h->saddr, ntohs(th->source),
698 &ip6h->daddr, ntohs(th->dest));
cfb6eeb4
YH
699 return 1;
700 }
701 return 0;
702}
703#endif
704
c6aefafb 705struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
1da177e4 706 .family = AF_INET6,
2e6599cb 707 .obj_size = sizeof(struct tcp6_request_sock),
72659ecc 708 .rtx_syn_ack = tcp_v6_rtx_synack,
60236fdd
ACM
709 .send_ack = tcp_v6_reqsk_send_ack,
710 .destructor = tcp_v6_reqsk_destructor,
72659ecc
OP
711 .send_reset = tcp_v6_send_reset,
712 .syn_ack_timeout = tcp_syn_ack_timeout,
1da177e4
LT
713};
714
#ifdef CONFIG_TCP_MD5SIG
/* MD5 hooks attached to IPv6 TCP request socks. */
static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
	.md5_lookup	= tcp_v6_reqsk_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
};
#endif
cfb6eeb4 721
626e264d 722static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
ee684b6f
AV
723 u32 tsval, u32 tsecr,
724 struct tcp_md5sig_key *key, int rst, u8 tclass)
1da177e4 725{
cf533ea5
ED
726 const struct tcphdr *th = tcp_hdr(skb);
727 struct tcphdr *t1;
1da177e4 728 struct sk_buff *buff;
4c9483b2 729 struct flowi6 fl6;
adf30907 730 struct net *net = dev_net(skb_dst(skb)->dev);
e5047992 731 struct sock *ctl_sk = net->ipv6.tcp_sk;
77c676da 732 unsigned int tot_len = sizeof(struct tcphdr);
adf30907 733 struct dst_entry *dst;
81ada62d 734 __be32 *topt;
1da177e4 735
ee684b6f 736 if (tsecr)
626e264d 737 tot_len += TCPOLEN_TSTAMP_ALIGNED;
cfb6eeb4 738#ifdef CONFIG_TCP_MD5SIG
cfb6eeb4
YH
739 if (key)
740 tot_len += TCPOLEN_MD5SIG_ALIGNED;
741#endif
742
cfb6eeb4 743 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1da177e4 744 GFP_ATOMIC);
1ab1457c
YH
745 if (buff == NULL)
746 return;
1da177e4 747
cfb6eeb4 748 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1da177e4 749
cfb6eeb4 750 t1 = (struct tcphdr *) skb_push(buff, tot_len);
6651ffc8 751 skb_reset_transport_header(buff);
1da177e4
LT
752
753 /* Swap the send and the receive. */
754 memset(t1, 0, sizeof(*t1));
755 t1->dest = th->source;
756 t1->source = th->dest;
cfb6eeb4 757 t1->doff = tot_len / 4;
626e264d
IJ
758 t1->seq = htonl(seq);
759 t1->ack_seq = htonl(ack);
760 t1->ack = !rst || !th->ack;
761 t1->rst = rst;
762 t1->window = htons(win);
1da177e4 763
81ada62d
IJ
764 topt = (__be32 *)(t1 + 1);
765
ee684b6f 766 if (tsecr) {
626e264d
IJ
767 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
768 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
ee684b6f
AV
769 *topt++ = htonl(tsval);
770 *topt++ = htonl(tsecr);
626e264d
IJ
771 }
772
cfb6eeb4
YH
773#ifdef CONFIG_TCP_MD5SIG
774 if (key) {
81ada62d
IJ
775 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
776 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
777 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
78e645cb
IJ
778 &ipv6_hdr(skb)->saddr,
779 &ipv6_hdr(skb)->daddr, t1);
cfb6eeb4
YH
780 }
781#endif
782
4c9483b2 783 memset(&fl6, 0, sizeof(fl6));
4e3fd7a0
AD
784 fl6.daddr = ipv6_hdr(skb)->saddr;
785 fl6.saddr = ipv6_hdr(skb)->daddr;
1da177e4 786
e5700aff
DM
787 buff->ip_summed = CHECKSUM_PARTIAL;
788 buff->csum = 0;
789
4c9483b2 790 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
1da177e4 791
4c9483b2 792 fl6.flowi6_proto = IPPROTO_TCP;
4c675258
AK
793 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
794 fl6.flowi6_oif = inet6_iif(skb);
1958b856
DM
795 fl6.fl6_dport = t1->dest;
796 fl6.fl6_sport = t1->source;
4c9483b2 797 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
1da177e4 798
c20121ae
DL
799 /* Pass a socket to ip6_dst_lookup either it is for RST
800 * Underlying function will use this to retrieve the network
801 * namespace
802 */
4c9483b2 803 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL, false);
68d0c6d3
DM
804 if (!IS_ERR(dst)) {
805 skb_dst_set(buff, dst);
b903d324 806 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
68d0c6d3
DM
807 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
808 if (rst)
809 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
810 return;
1da177e4
LT
811 }
812
813 kfree_skb(buff);
814}
815
626e264d 816static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1da177e4 817{
cf533ea5 818 const struct tcphdr *th = tcp_hdr(skb);
626e264d 819 u32 seq = 0, ack_seq = 0;
fa3e5b4e 820 struct tcp_md5sig_key *key = NULL;
658ddaaf
SL
821#ifdef CONFIG_TCP_MD5SIG
822 const __u8 *hash_location = NULL;
823 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
824 unsigned char newhash[16];
825 int genhash;
826 struct sock *sk1 = NULL;
827#endif
1da177e4 828
626e264d 829 if (th->rst)
1da177e4
LT
830 return;
831
626e264d
IJ
832 if (!ipv6_unicast_destination(skb))
833 return;
1da177e4 834
cfb6eeb4 835#ifdef CONFIG_TCP_MD5SIG
658ddaaf
SL
836 hash_location = tcp_parse_md5sig_option(th);
837 if (!sk && hash_location) {
838 /*
839 * active side is lost. Try to find listening socket through
840 * source port, and then find md5 key through listening socket.
841 * we are not loose security here:
842 * Incoming packet is checked with md5 hash with finding key,
843 * no RST generated if md5 hash doesn't match.
844 */
845 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
5ba24953
TH
846 &tcp_hashinfo, &ipv6h->saddr,
847 th->source, &ipv6h->daddr,
658ddaaf
SL
848 ntohs(th->source), inet6_iif(skb));
849 if (!sk1)
850 return;
851
852 rcu_read_lock();
853 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
854 if (!key)
855 goto release_sk1;
856
857 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
858 if (genhash || memcmp(hash_location, newhash, 16) != 0)
859 goto release_sk1;
860 } else {
861 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
862 }
cfb6eeb4
YH
863#endif
864
626e264d
IJ
865 if (th->ack)
866 seq = ntohl(th->ack_seq);
867 else
868 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
869 (th->doff << 2);
1da177e4 870
ee684b6f 871 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, key, 1, 0);
658ddaaf
SL
872
873#ifdef CONFIG_TCP_MD5SIG
874release_sk1:
875 if (sk1) {
876 rcu_read_unlock();
877 sock_put(sk1);
878 }
879#endif
626e264d 880}
1da177e4 881
ee684b6f
AV
882static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
883 u32 win, u32 tsval, u32 tsecr,
b903d324 884 struct tcp_md5sig_key *key, u8 tclass)
626e264d 885{
ee684b6f 886 tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, key, 0, tclass);
1da177e4
LT
887}
888
889static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
890{
8feaf0c0 891 struct inet_timewait_sock *tw = inet_twsk(sk);
cfb6eeb4 892 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1da177e4 893
9501f972 894 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
8feaf0c0 895 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
ee684b6f 896 tcp_time_stamp + tcptw->tw_ts_offset,
b903d324
ED
897 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
898 tw->tw_tclass);
1da177e4 899
8feaf0c0 900 inet_twsk_put(tw);
1da177e4
LT
901}
902
6edafaaf
GJ
903static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
904 struct request_sock *req)
1da177e4 905{
ee684b6f
AV
906 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1,
907 req->rcv_wnd, tcp_time_stamp, req->ts_recent,
b903d324 908 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr), 0);
1da177e4
LT
909}
910
911
912static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
913{
60236fdd 914 struct request_sock *req, **prev;
aa8223c7 915 const struct tcphdr *th = tcp_hdr(skb);
1da177e4
LT
916 struct sock *nsk;
917
918 /* Find possible connection requests. */
8129765a 919 req = inet6_csk_search_req(sk, &prev, th->source,
0660e03f
ACM
920 &ipv6_hdr(skb)->saddr,
921 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1da177e4 922 if (req)
8336886f 923 return tcp_check_req(sk, skb, req, prev, false);
1da177e4 924
3b1e0a65 925 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
d86e0dac
PE
926 &ipv6_hdr(skb)->saddr, th->source,
927 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1da177e4
LT
928
929 if (nsk) {
930 if (nsk->sk_state != TCP_TIME_WAIT) {
931 bh_lock_sock(nsk);
932 return nsk;
933 }
9469c7b4 934 inet_twsk_put(inet_twsk(nsk));
1da177e4
LT
935 return NULL;
936 }
937
c6aefafb 938#ifdef CONFIG_SYN_COOKIES
af9b4738 939 if (!th->syn)
c6aefafb 940 sk = cookie_v6_check(sk, skb);
1da177e4
LT
941#endif
942 return sk;
943}
944
1da177e4
LT
945/* FIXME: this is substantially similar to the ipv4 code.
946 * Can some kind of merge be done? -- erics
947 */
948static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
949{
e6b4d113
WAS
950 struct tcp_options_received tmp_opt;
951 struct request_sock *req;
ca304b61 952 struct inet6_request_sock *treq;
1da177e4 953 struct ipv6_pinfo *np = inet6_sk(sk);
1da177e4 954 struct tcp_sock *tp = tcp_sk(sk);
e6b4d113 955 __u32 isn = TCP_SKB_CB(skb)->when;
493f377d 956 struct dst_entry *dst = NULL;
3840a06e 957 struct flowi6 fl6;
a2a385d6 958 bool want_cookie = false;
1da177e4
LT
959
960 if (skb->protocol == htons(ETH_P_IP))
961 return tcp_v4_conn_request(sk, skb);
962
963 if (!ipv6_unicast_destination(skb))
1ab1457c 964 goto drop;
1da177e4 965
463c84b9 966 if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
946cedcc
ED
967 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
968 if (!want_cookie)
969 goto drop;
1da177e4
LT
970 }
971
5f1e942c
VS
972 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
973 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1da177e4 974 goto drop;
5f1e942c 975 }
1da177e4 976
ca304b61 977 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1da177e4
LT
978 if (req == NULL)
979 goto drop;
980
cfb6eeb4
YH
981#ifdef CONFIG_TCP_MD5SIG
982 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
983#endif
984
1da177e4
LT
985 tcp_clear_options(&tmp_opt);
986 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
987 tmp_opt.user_mss = tp->rx_opt.user_mss;
1a2c6181 988 tcp_parse_options(skb, &tmp_opt, 0, NULL);
1da177e4 989
4dfc2817 990 if (want_cookie && !tmp_opt.saw_tstamp)
c6aefafb 991 tcp_clear_options(&tmp_opt);
c6aefafb 992
1da177e4
LT
993 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
994 tcp_openreq_init(req, &tmp_opt, skb);
995
ca304b61 996 treq = inet6_rsk(req);
4e3fd7a0
AD
997 treq->rmt_addr = ipv6_hdr(skb)->saddr;
998 treq->loc_addr = ipv6_hdr(skb)->daddr;
172d69e6 999 if (!want_cookie || tmp_opt.tstamp_ok)
5d134f1c 1000 TCP_ECN_create_request(req, skb, sock_net(sk));
c6aefafb 1001
4d0fe50c
ED
1002 treq->iif = sk->sk_bound_dev_if;
1003
1004 /* So that link locals have meaning */
1005 if (!sk->sk_bound_dev_if &&
1006 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1007 treq->iif = inet6_iif(skb);
1008
2bbdf389 1009 if (!isn) {
c6aefafb
GG
1010 if (ipv6_opt_accepted(sk, skb) ||
1011 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1012 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1013 atomic_inc(&skb->users);
1014 treq->pktopts = skb;
1015 }
493f377d
DM
1016
1017 if (want_cookie) {
2bbdf389
FW
1018 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1019 req->cookie_ts = tmp_opt.tstamp_ok;
493f377d
DM
1020 goto have_isn;
1021 }
1022
1023 /* VJ's idea. We save last timestamp seen
1024 * from the destination in peer table, when entering
1025 * state TIME-WAIT, and check against it before
1026 * accepting new connection request.
1027 *
1028 * If "isn" is not zero, this request hit alive
1029 * timewait bucket, so that all the necessary checks
1030 * are made in the function processing timewait state.
1031 */
1032 if (tmp_opt.saw_tstamp &&
1033 tcp_death_row.sysctl_tw_recycle &&
81166dd6
DM
1034 (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1035 if (!tcp_peer_is_proven(req, dst, true)) {
493f377d
DM
1036 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1037 goto drop_and_release;
1038 }
1039 }
1040 /* Kill the following clause, if you dislike this way. */
1041 else if (!sysctl_tcp_syncookies &&
1042 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1043 (sysctl_max_syn_backlog >> 2)) &&
81166dd6 1044 !tcp_peer_is_proven(req, dst, false)) {
493f377d
DM
1045 /* Without syncookies last quarter of
1046 * backlog is filled with destinations,
1047 * proven to be alive.
1048 * It means that we continue to communicate
1049 * to destinations, already remembered
1050 * to the moment of synflood.
1051 */
1052 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
1053 &treq->rmt_addr, ntohs(tcp_hdr(skb)->source));
1054 goto drop_and_release;
2bbdf389 1055 }
493f377d
DM
1056
1057 isn = tcp_v6_init_sequence(skb);
c6aefafb 1058 }
493f377d 1059have_isn:
2e6599cb 1060 tcp_rsk(req)->snt_isn = isn;
1da177e4 1061
437c5b53
NC
1062 if (security_inet_conn_request(sk, skb, req))
1063 goto drop_and_release;
4237c75c 1064
9f10d3f6 1065 if (tcp_v6_send_synack(sk, dst, &fl6, req,
fff32699 1066 skb_get_queue_mapping(skb)) ||
4957faad 1067 want_cookie)
e6b4d113 1068 goto drop_and_free;
1da177e4 1069
016818d0 1070 tcp_rsk(req)->snt_synack = tcp_time_stamp;
8336886f 1071 tcp_rsk(req)->listener = NULL;
e6b4d113
WAS
1072 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1073 return 0;
1da177e4 1074
493f377d
DM
1075drop_and_release:
1076 dst_release(dst);
e6b4d113
WAS
1077drop_and_free:
1078 reqsk_free(req);
1da177e4 1079drop:
5f1e942c 1080 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1081 return 0; /* don't send reset */
1082}
1083
1084static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
60236fdd 1085 struct request_sock *req,
1da177e4
LT
1086 struct dst_entry *dst)
1087{
78d15e82 1088 struct inet6_request_sock *treq;
1da177e4
LT
1089 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1090 struct tcp6_sock *newtcp6sk;
1091 struct inet_sock *newinet;
1092 struct tcp_sock *newtp;
1093 struct sock *newsk;
cfb6eeb4
YH
1094#ifdef CONFIG_TCP_MD5SIG
1095 struct tcp_md5sig_key *key;
1096#endif
3840a06e 1097 struct flowi6 fl6;
1da177e4
LT
1098
1099 if (skb->protocol == htons(ETH_P_IP)) {
1100 /*
1101 * v6 mapped
1102 */
1103
1104 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1105
1ab1457c 1106 if (newsk == NULL)
1da177e4
LT
1107 return NULL;
1108
1109 newtcp6sk = (struct tcp6_sock *)newsk;
1110 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1111
1112 newinet = inet_sk(newsk);
1113 newnp = inet6_sk(newsk);
1114 newtp = tcp_sk(newsk);
1115
1116 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1117
c720c7e8 1118 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newnp->daddr);
1da177e4 1119
c720c7e8 1120 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1da177e4 1121
4e3fd7a0 1122 newnp->rcv_saddr = newnp->saddr;
1da177e4 1123
8292a17a 1124 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1da177e4 1125 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
1126#ifdef CONFIG_TCP_MD5SIG
1127 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1128#endif
1129
676a1184
YZ
1130 newnp->ipv6_ac_list = NULL;
1131 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1132 newnp->pktoptions = NULL;
1133 newnp->opt = NULL;
505cbfc5 1134 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1135 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
e7219858 1136 newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4 1137
e6848976
ACM
1138 /*
1139 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1140 * here, tcp_create_openreq_child now does this for us, see the comment in
1141 * that function for the gory details. -acme
1da177e4 1142 */
1da177e4
LT
1143
1144 /* It is tricky place. Until this moment IPv4 tcp
8292a17a 1145 worked with IPv6 icsk.icsk_af_ops.
1da177e4
LT
1146 Sync it now.
1147 */
d83d8461 1148 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1da177e4
LT
1149
1150 return newsk;
1151 }
1152
78d15e82 1153 treq = inet6_rsk(req);
1da177e4
LT
1154
1155 if (sk_acceptq_is_full(sk))
1156 goto out_overflow;
1157
493f377d 1158 if (!dst) {
3840a06e 1159 dst = inet6_csk_route_req(sk, &fl6, req);
493f377d 1160 if (!dst)
1da177e4 1161 goto out;
1ab1457c 1162 }
1da177e4
LT
1163
1164 newsk = tcp_create_openreq_child(sk, req, skb);
1165 if (newsk == NULL)
093d2823 1166 goto out_nonewsk;
1da177e4 1167
e6848976
ACM
1168 /*
1169 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1170 * count here, tcp_create_openreq_child now does this for us, see the
1171 * comment in that function for the gory details. -acme
1172 */
1da177e4 1173
59eed279 1174 newsk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 1175 __ip6_dst_store(newsk, dst, NULL, NULL);
fae6ef87 1176 inet6_sk_rx_dst_set(newsk, skb);
1da177e4
LT
1177
1178 newtcp6sk = (struct tcp6_sock *)newsk;
1179 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1180
1181 newtp = tcp_sk(newsk);
1182 newinet = inet_sk(newsk);
1183 newnp = inet6_sk(newsk);
1184
1185 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1186
4e3fd7a0
AD
1187 newnp->daddr = treq->rmt_addr;
1188 newnp->saddr = treq->loc_addr;
1189 newnp->rcv_saddr = treq->loc_addr;
2e6599cb 1190 newsk->sk_bound_dev_if = treq->iif;
1da177e4 1191
1ab1457c 1192 /* Now IPv6 options...
1da177e4
LT
1193
1194 First: no IPv4 options.
1195 */
f6d8bd05 1196 newinet->inet_opt = NULL;
676a1184 1197 newnp->ipv6_ac_list = NULL;
d35690be 1198 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1199
1200 /* Clone RX bits */
1201 newnp->rxopt.all = np->rxopt.all;
1202
1203 /* Clone pktoptions received with SYN */
1204 newnp->pktoptions = NULL;
2e6599cb 1205 if (treq->pktopts != NULL) {
99a1dec7
MG
1206 newnp->pktoptions = skb_clone(treq->pktopts,
1207 sk_gfp_atomic(sk, GFP_ATOMIC));
ab185d7b 1208 consume_skb(treq->pktopts);
2e6599cb 1209 treq->pktopts = NULL;
1da177e4
LT
1210 if (newnp->pktoptions)
1211 skb_set_owner_r(newnp->pktoptions, newsk);
1212 }
1213 newnp->opt = NULL;
505cbfc5 1214 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1215 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
e7219858 1216 newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4
LT
1217
1218 /* Clone native IPv6 options from listening socket (if any)
1219
1220 Yes, keeping reference count would be much more clever,
1221 but we make one more one thing there: reattach optmem
1222 to newsk.
1223 */
43264e0b
RL
1224 if (np->opt)
1225 newnp->opt = ipv6_dup_options(newsk, np->opt);
1da177e4 1226
d83d8461 1227 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1da177e4 1228 if (newnp->opt)
d83d8461
ACM
1229 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1230 newnp->opt->opt_flen);
1da177e4 1231
5d424d5a 1232 tcp_mtup_init(newsk);
1da177e4 1233 tcp_sync_mss(newsk, dst_mtu(dst));
0dbaee3b 1234 newtp->advmss = dst_metric_advmss(dst);
d135c522
NC
1235 if (tcp_sk(sk)->rx_opt.user_mss &&
1236 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1237 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1238
1da177e4
LT
1239 tcp_initialize_rcv_mss(newsk);
1240
c720c7e8
ED
1241 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1242 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 1243
cfb6eeb4
YH
1244#ifdef CONFIG_TCP_MD5SIG
1245 /* Copy over the MD5 key from the original socket */
1246 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1247 /* We're using one, so create a matching key
1248 * on the newsk structure. If we fail to get
1249 * memory, then we end up not copying the key
1250 * across. Shucks.
1251 */
a915da9b 1252 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newnp->daddr,
99a1dec7
MG
1253 AF_INET6, key->key, key->keylen,
1254 sk_gfp_atomic(sk, GFP_ATOMIC));
cfb6eeb4
YH
1255 }
1256#endif
1257
093d2823 1258 if (__inet_inherit_port(sk, newsk) < 0) {
e337e24d
CP
1259 inet_csk_prepare_forced_close(newsk);
1260 tcp_done(newsk);
093d2823
BS
1261 goto out;
1262 }
9327f705 1263 __inet6_hash(newsk, NULL);
1da177e4
LT
1264
1265 return newsk;
1266
1267out_overflow:
de0744af 1268 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
093d2823 1269out_nonewsk:
1da177e4 1270 dst_release(dst);
093d2823
BS
1271out:
1272 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1273 return NULL;
1274}
1275
b51655b9 1276static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1da177e4 1277{
84fa7933 1278 if (skb->ip_summed == CHECKSUM_COMPLETE) {
684f2176 1279 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
0660e03f 1280 &ipv6_hdr(skb)->daddr, skb->csum)) {
fb286bb2 1281 skb->ip_summed = CHECKSUM_UNNECESSARY;
1da177e4 1282 return 0;
fb286bb2 1283 }
1da177e4 1284 }
fb286bb2 1285
684f2176 1286 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
0660e03f
ACM
1287 &ipv6_hdr(skb)->saddr,
1288 &ipv6_hdr(skb)->daddr, 0));
fb286bb2 1289
1da177e4 1290 if (skb->len <= 76) {
fb286bb2 1291 return __skb_checksum_complete(skb);
1da177e4
LT
1292 }
1293 return 0;
1294}
1295
1296/* The socket must have it's spinlock held when we get
1297 * here.
1298 *
1299 * We have a potential double-lock case here, so even when
1300 * doing backlog processing we use the BH locking scheme.
1301 * This is because we cannot sleep with the original spinlock
1302 * held.
1303 */
1304static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1305{
1306 struct ipv6_pinfo *np = inet6_sk(sk);
1307 struct tcp_sock *tp;
1308 struct sk_buff *opt_skb = NULL;
1309
1310 /* Imagine: socket is IPv6. IPv4 packet arrives,
1311 goes to IPv4 receive handler and backlogged.
1312 From backlog it always goes here. Kerboom...
1313 Fortunately, tcp_rcv_established and rcv_established
1314 handle them correctly, but it is not case with
1315 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1316 */
1317
1318 if (skb->protocol == htons(ETH_P_IP))
1319 return tcp_v4_do_rcv(sk, skb);
1320
cfb6eeb4
YH
1321#ifdef CONFIG_TCP_MD5SIG
1322 if (tcp_v6_inbound_md5_hash (sk, skb))
1323 goto discard;
1324#endif
1325
fda9ef5d 1326 if (sk_filter(sk, skb))
1da177e4
LT
1327 goto discard;
1328
1329 /*
1330 * socket locking is here for SMP purposes as backlog rcv
1331 * is currently called with bh processing disabled.
1332 */
1333
1334 /* Do Stevens' IPV6_PKTOPTIONS.
1335
1336 Yes, guys, it is the only place in our code, where we
1337 may make it not affecting IPv4.
1338 The rest of code is protocol independent,
1339 and I do not like idea to uglify IPv4.
1340
1341 Actually, all the idea behind IPV6_PKTOPTIONS
1342 looks not very well thought. For now we latch
1343 options, received in the last packet, enqueued
1344 by tcp. Feel free to propose better solution.
1ab1457c 1345 --ANK (980728)
1da177e4
LT
1346 */
1347 if (np->rxopt.all)
99a1dec7 1348 opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
1da177e4
LT
1349
1350 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
5d299f3d
ED
1351 struct dst_entry *dst = sk->sk_rx_dst;
1352
bdeab991 1353 sock_rps_save_rxhash(sk, skb);
5d299f3d
ED
1354 if (dst) {
1355 if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1356 dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1357 dst_release(dst);
1358 sk->sk_rx_dst = NULL;
1359 }
1360 }
1361
aa8223c7 1362 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1da177e4 1363 goto reset;
1da177e4
LT
1364 if (opt_skb)
1365 goto ipv6_pktoptions;
1366 return 0;
1367 }
1368
ab6a5bb6 1369 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1da177e4
LT
1370 goto csum_err;
1371
1ab1457c 1372 if (sk->sk_state == TCP_LISTEN) {
1da177e4
LT
1373 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1374 if (!nsk)
1375 goto discard;
1376
1377 /*
1378 * Queue it on the new socket if the new socket is active,
1379 * otherwise we just shortcircuit this and continue with
1380 * the new socket..
1381 */
1ab1457c 1382 if(nsk != sk) {
bdeab991 1383 sock_rps_save_rxhash(nsk, skb);
1da177e4
LT
1384 if (tcp_child_process(sk, nsk, skb))
1385 goto reset;
1386 if (opt_skb)
1387 __kfree_skb(opt_skb);
1388 return 0;
1389 }
47482f13 1390 } else
bdeab991 1391 sock_rps_save_rxhash(sk, skb);
1da177e4 1392
aa8223c7 1393 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1da177e4 1394 goto reset;
1da177e4
LT
1395 if (opt_skb)
1396 goto ipv6_pktoptions;
1397 return 0;
1398
1399reset:
cfb6eeb4 1400 tcp_v6_send_reset(sk, skb);
1da177e4
LT
1401discard:
1402 if (opt_skb)
1403 __kfree_skb(opt_skb);
1404 kfree_skb(skb);
1405 return 0;
1406csum_err:
6a5dc9e5 1407 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
63231bdd 1408 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1da177e4
LT
1409 goto discard;
1410
1411
1412ipv6_pktoptions:
1413 /* Do you ask, what is it?
1414
1415 1. skb was enqueued by tcp.
1416 2. skb is added to tail of read queue, rather than out of order.
1417 3. socket is not in passive state.
1418 4. Finally, it really contains options, which user wants to receive.
1419 */
1420 tp = tcp_sk(sk);
1421 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1422 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
333fad53 1423 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
505cbfc5 1424 np->mcast_oif = inet6_iif(opt_skb);
333fad53 1425 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
0660e03f 1426 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
4c507d28 1427 if (np->rxopt.bits.rxtclass)
e7219858 1428 np->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4
LT
1429 if (ipv6_opt_accepted(sk, opt_skb)) {
1430 skb_set_owner_r(opt_skb, sk);
1431 opt_skb = xchg(&np->pktoptions, opt_skb);
1432 } else {
1433 __kfree_skb(opt_skb);
1434 opt_skb = xchg(&np->pktoptions, NULL);
1435 }
1436 }
1437
800d55f1 1438 kfree_skb(opt_skb);
1da177e4
LT
1439 return 0;
1440}
1441
e5bbef20 1442static int tcp_v6_rcv(struct sk_buff *skb)
1da177e4 1443{
cf533ea5 1444 const struct tcphdr *th;
b71d1d42 1445 const struct ipv6hdr *hdr;
1da177e4
LT
1446 struct sock *sk;
1447 int ret;
a86b1e30 1448 struct net *net = dev_net(skb->dev);
1da177e4
LT
1449
1450 if (skb->pkt_type != PACKET_HOST)
1451 goto discard_it;
1452
1453 /*
1454 * Count it even if it's bad.
1455 */
63231bdd 1456 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1da177e4
LT
1457
1458 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1459 goto discard_it;
1460
aa8223c7 1461 th = tcp_hdr(skb);
1da177e4
LT
1462
1463 if (th->doff < sizeof(struct tcphdr)/4)
1464 goto bad_packet;
1465 if (!pskb_may_pull(skb, th->doff*4))
1466 goto discard_it;
1467
60476372 1468 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
6a5dc9e5 1469 goto csum_error;
1da177e4 1470
aa8223c7 1471 th = tcp_hdr(skb);
e802af9c 1472 hdr = ipv6_hdr(skb);
1da177e4
LT
1473 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1474 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1475 skb->len - th->doff*4);
1476 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1477 TCP_SKB_CB(skb)->when = 0;
b82d1bb4 1478 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
1da177e4
LT
1479 TCP_SKB_CB(skb)->sacked = 0;
1480
9a1f27c4 1481 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1da177e4
LT
1482 if (!sk)
1483 goto no_tcp_socket;
1484
1485process:
1486 if (sk->sk_state == TCP_TIME_WAIT)
1487 goto do_time_wait;
1488
e802af9c
SH
1489 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1490 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1491 goto discard_and_relse;
1492 }
1493
1da177e4
LT
1494 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1495 goto discard_and_relse;
1496
fda9ef5d 1497 if (sk_filter(sk, skb))
1da177e4
LT
1498 goto discard_and_relse;
1499
8b80cda5 1500 sk_mark_napi_id(sk, skb);
1da177e4
LT
1501 skb->dev = NULL;
1502
293b9c42 1503 bh_lock_sock_nested(sk);
1da177e4
LT
1504 ret = 0;
1505 if (!sock_owned_by_user(sk)) {
1a2449a8 1506#ifdef CONFIG_NET_DMA
1ab1457c 1507 struct tcp_sock *tp = tcp_sk(sk);
b4caea8a 1508 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
a2bd1140 1509 tp->ucopy.dma_chan = net_dma_find_channel();
1ab1457c
YH
1510 if (tp->ucopy.dma_chan)
1511 ret = tcp_v6_do_rcv(sk, skb);
1512 else
1a2449a8
CL
1513#endif
1514 {
1515 if (!tcp_prequeue(sk, skb))
1516 ret = tcp_v6_do_rcv(sk, skb);
1517 }
da882c1f
ED
1518 } else if (unlikely(sk_add_backlog(sk, skb,
1519 sk->sk_rcvbuf + sk->sk_sndbuf))) {
6b03a53a 1520 bh_unlock_sock(sk);
6cce09f8 1521 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
6b03a53a
ZY
1522 goto discard_and_relse;
1523 }
1da177e4
LT
1524 bh_unlock_sock(sk);
1525
1526 sock_put(sk);
1527 return ret ? -1 : 0;
1528
1529no_tcp_socket:
1530 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1531 goto discard_it;
1532
1533 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
6a5dc9e5
ED
1534csum_error:
1535 TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
1da177e4 1536bad_packet:
63231bdd 1537 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1da177e4 1538 } else {
cfb6eeb4 1539 tcp_v6_send_reset(NULL, skb);
1da177e4
LT
1540 }
1541
1542discard_it:
1da177e4
LT
1543 kfree_skb(skb);
1544 return 0;
1545
1546discard_and_relse:
1547 sock_put(sk);
1548 goto discard_it;
1549
1550do_time_wait:
1551 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
9469c7b4 1552 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1553 goto discard_it;
1554 }
1555
6a5dc9e5 1556 if (skb->len < (th->doff<<2)) {
9469c7b4 1557 inet_twsk_put(inet_twsk(sk));
6a5dc9e5
ED
1558 goto bad_packet;
1559 }
1560 if (tcp_checksum_complete(skb)) {
1561 inet_twsk_put(inet_twsk(sk));
1562 goto csum_error;
1da177e4
LT
1563 }
1564
9469c7b4 1565 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1da177e4
LT
1566 case TCP_TW_SYN:
1567 {
1568 struct sock *sk2;
1569
c346dca1 1570 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
5ba24953 1571 &ipv6_hdr(skb)->saddr, th->source,
0660e03f 1572 &ipv6_hdr(skb)->daddr,
505cbfc5 1573 ntohs(th->dest), inet6_iif(skb));
1da177e4 1574 if (sk2 != NULL) {
295ff7ed
ACM
1575 struct inet_timewait_sock *tw = inet_twsk(sk);
1576 inet_twsk_deschedule(tw, &tcp_death_row);
1577 inet_twsk_put(tw);
1da177e4
LT
1578 sk = sk2;
1579 goto process;
1580 }
1581 /* Fall through to ACK */
1582 }
1583 case TCP_TW_ACK:
1584 tcp_v6_timewait_ack(sk, skb);
1585 break;
1586 case TCP_TW_RST:
1587 goto no_tcp_socket;
1588 case TCP_TW_SUCCESS:;
1589 }
1590 goto discard_it;
1591}
1592
c7109986
ED
1593static void tcp_v6_early_demux(struct sk_buff *skb)
1594{
1595 const struct ipv6hdr *hdr;
1596 const struct tcphdr *th;
1597 struct sock *sk;
1598
1599 if (skb->pkt_type != PACKET_HOST)
1600 return;
1601
1602 if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1603 return;
1604
1605 hdr = ipv6_hdr(skb);
1606 th = tcp_hdr(skb);
1607
1608 if (th->doff < sizeof(struct tcphdr) / 4)
1609 return;
1610
1611 sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1612 &hdr->saddr, th->source,
1613 &hdr->daddr, ntohs(th->dest),
1614 inet6_iif(skb));
1615 if (sk) {
1616 skb->sk = sk;
1617 skb->destructor = sock_edemux;
1618 if (sk->sk_state != TCP_TIME_WAIT) {
1619 struct dst_entry *dst = sk->sk_rx_dst;
f3f12135 1620
c7109986 1621 if (dst)
5d299f3d 1622 dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
c7109986 1623 if (dst &&
f3f12135 1624 inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
c7109986
ED
1625 skb_dst_set_noref(skb, dst);
1626 }
1627 }
1628}
1629
ccb7c410
DM
1630static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1631 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1632 .twsk_unique = tcp_twsk_unique,
1633 .twsk_destructor= tcp_twsk_destructor,
ccb7c410
DM
1634};
1635
3b401a81 1636static const struct inet_connection_sock_af_ops ipv6_specific = {
543d9cfe
ACM
1637 .queue_xmit = inet6_csk_xmit,
1638 .send_check = tcp_v6_send_check,
1639 .rebuild_header = inet6_sk_rebuild_header,
5d299f3d 1640 .sk_rx_dst_set = inet6_sk_rx_dst_set,
543d9cfe
ACM
1641 .conn_request = tcp_v6_conn_request,
1642 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe 1643 .net_header_len = sizeof(struct ipv6hdr),
67469601 1644 .net_frag_header_len = sizeof(struct frag_hdr),
543d9cfe
ACM
1645 .setsockopt = ipv6_setsockopt,
1646 .getsockopt = ipv6_getsockopt,
1647 .addr2sockaddr = inet6_csk_addr2sockaddr,
1648 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1649 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1650#ifdef CONFIG_COMPAT
543d9cfe
ACM
1651 .compat_setsockopt = compat_ipv6_setsockopt,
1652 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1653#endif
1da177e4
LT
1654};
1655
#ifdef CONFIG_TCP_MD5SIG
/* TCP MD5 signature hooks for native IPv6 sockets. */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_lookup	= tcp_v6_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1663
1da177e4
LT
1664/*
1665 * TCP over IPv4 via INET6 API
1666 */
1667
3b401a81 1668static const struct inet_connection_sock_af_ops ipv6_mapped = {
543d9cfe
ACM
1669 .queue_xmit = ip_queue_xmit,
1670 .send_check = tcp_v4_send_check,
1671 .rebuild_header = inet_sk_rebuild_header,
63d02d15 1672 .sk_rx_dst_set = inet_sk_rx_dst_set,
543d9cfe
ACM
1673 .conn_request = tcp_v6_conn_request,
1674 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe
ACM
1675 .net_header_len = sizeof(struct iphdr),
1676 .setsockopt = ipv6_setsockopt,
1677 .getsockopt = ipv6_getsockopt,
1678 .addr2sockaddr = inet6_csk_addr2sockaddr,
1679 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1680 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1681#ifdef CONFIG_COMPAT
543d9cfe
ACM
1682 .compat_setsockopt = compat_ipv6_setsockopt,
1683 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1684#endif
1da177e4
LT
1685};
1686
#ifdef CONFIG_TCP_MD5SIG
/*
 * TCP MD5 signature hooks for v4-mapped sockets: lookup and hashing use
 * the IPv4 routines, key parsing uses the IPv6 one.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_lookup	= tcp_v4_md5_lookup,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1694
1da177e4
LT
1695/* NOTE: A lot of things set to zero explicitly by call to
1696 * sk_alloc() so need not be done here.
1697 */
1698static int tcp_v6_init_sock(struct sock *sk)
1699{
6687e988 1700 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4 1701
900f65d3 1702 tcp_init_sock(sk);
1da177e4 1703
8292a17a 1704 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 1705
cfb6eeb4 1706#ifdef CONFIG_TCP_MD5SIG
ac807fa8 1707 tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
cfb6eeb4
YH
1708#endif
1709
1da177e4
LT
1710 return 0;
1711}
1712
/*
 * Socket teardown for TCPv6 (the .destroy hook of tcpv6_prot): TCP-level
 * cleanup first, then the IPv6-specific cleanup.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
	tcp_v4_destroy_sock(sk);
	inet6_destroy_sock(sk);
}
1718
952a10be 1719#ifdef CONFIG_PROC_FS
1da177e4 1720/* Proc filesystem TCPv6 sock list dumping. */
1ab1457c 1721static void get_openreq6(struct seq_file *seq,
a7cb5a49 1722 const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
1da177e4 1723{
1da177e4 1724 int ttd = req->expires - jiffies;
b71d1d42
ED
1725 const struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1726 const struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1da177e4
LT
1727
1728 if (ttd < 0)
1729 ttd = 0;
1730
1da177e4
LT
1731 seq_printf(seq,
1732 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1733 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1da177e4
LT
1734 i,
1735 src->s6_addr32[0], src->s6_addr32[1],
1736 src->s6_addr32[2], src->s6_addr32[3],
fd507037 1737 ntohs(inet_rsk(req)->loc_port),
1da177e4
LT
1738 dest->s6_addr32[0], dest->s6_addr32[1],
1739 dest->s6_addr32[2], dest->s6_addr32[3],
2e6599cb 1740 ntohs(inet_rsk(req)->rmt_port),
1da177e4
LT
1741 TCP_SYN_RECV,
1742 0,0, /* could print option size, but that is af dependent. */
1ab1457c
YH
1743 1, /* timers active (only the expire timer) */
1744 jiffies_to_clock_t(ttd),
e6c022a4 1745 req->num_timeout,
a7cb5a49 1746 from_kuid_munged(seq_user_ns(seq), uid),
1ab1457c 1747 0, /* non standard timer */
1da177e4
LT
1748 0, /* open_requests have no inode */
1749 0, req);
1750}
1751
1752static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1753{
b71d1d42 1754 const struct in6_addr *dest, *src;
1da177e4
LT
1755 __u16 destp, srcp;
1756 int timer_active;
1757 unsigned long timer_expires;
cf533ea5
ED
1758 const struct inet_sock *inet = inet_sk(sp);
1759 const struct tcp_sock *tp = tcp_sk(sp);
463c84b9 1760 const struct inet_connection_sock *icsk = inet_csk(sp);
cf533ea5 1761 const struct ipv6_pinfo *np = inet6_sk(sp);
1da177e4
LT
1762
1763 dest = &np->daddr;
1764 src = &np->rcv_saddr;
c720c7e8
ED
1765 destp = ntohs(inet->inet_dport);
1766 srcp = ntohs(inet->inet_sport);
463c84b9
ACM
1767
1768 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1da177e4 1769 timer_active = 1;
463c84b9
ACM
1770 timer_expires = icsk->icsk_timeout;
1771 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1da177e4 1772 timer_active = 4;
463c84b9 1773 timer_expires = icsk->icsk_timeout;
1da177e4
LT
1774 } else if (timer_pending(&sp->sk_timer)) {
1775 timer_active = 2;
1776 timer_expires = sp->sk_timer.expires;
1777 } else {
1778 timer_active = 0;
1779 timer_expires = jiffies;
1780 }
1781
1782 seq_printf(seq,
1783 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1784 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %pK %lu %lu %u %u %d\n",
1da177e4
LT
1785 i,
1786 src->s6_addr32[0], src->s6_addr32[1],
1787 src->s6_addr32[2], src->s6_addr32[3], srcp,
1788 dest->s6_addr32[0], dest->s6_addr32[1],
1789 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1ab1457c 1790 sp->sk_state,
47da8ee6
SS
1791 tp->write_seq-tp->snd_una,
1792 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1da177e4 1793 timer_active,
a399a805 1794 jiffies_delta_to_clock_t(timer_expires - jiffies),
463c84b9 1795 icsk->icsk_retransmits,
a7cb5a49 1796 from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
6687e988 1797 icsk->icsk_probes_out,
1da177e4
LT
1798 sock_i_ino(sp),
1799 atomic_read(&sp->sk_refcnt), sp,
7be87351
SH
1800 jiffies_to_clock_t(icsk->icsk_rto),
1801 jiffies_to_clock_t(icsk->icsk_ack.ato),
463c84b9 1802 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
0b6a05c1
IJ
1803 tp->snd_cwnd,
1804 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
1da177e4
LT
1805 );
1806}
1807
1ab1457c 1808static void get_timewait6_sock(struct seq_file *seq,
8feaf0c0 1809 struct inet_timewait_sock *tw, int i)
1da177e4 1810{
b71d1d42 1811 const struct in6_addr *dest, *src;
1da177e4 1812 __u16 destp, srcp;
cf533ea5 1813 const struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
a399a805 1814 long delta = tw->tw_ttd - jiffies;
1da177e4 1815
0fa1a53e
ACM
1816 dest = &tw6->tw_v6_daddr;
1817 src = &tw6->tw_v6_rcv_saddr;
1da177e4
LT
1818 destp = ntohs(tw->tw_dport);
1819 srcp = ntohs(tw->tw_sport);
1820
1821 seq_printf(seq,
1822 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1823 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1da177e4
LT
1824 i,
1825 src->s6_addr32[0], src->s6_addr32[1],
1826 src->s6_addr32[2], src->s6_addr32[3], srcp,
1827 dest->s6_addr32[0], dest->s6_addr32[1],
1828 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1829 tw->tw_substate, 0, 0,
a399a805 1830 3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
1da177e4
LT
1831 atomic_read(&tw->tw_refcnt), tw);
1832}
1833
1da177e4
LT
1834static int tcp6_seq_show(struct seq_file *seq, void *v)
1835{
1836 struct tcp_iter_state *st;
1837
1838 if (v == SEQ_START_TOKEN) {
1839 seq_puts(seq,
1840 " sl "
1841 "local_address "
1842 "remote_address "
1843 "st tx_queue rx_queue tr tm->when retrnsmt"
1844 " uid timeout inode\n");
1845 goto out;
1846 }
1847 st = seq->private;
1848
1849 switch (st->state) {
1850 case TCP_SEQ_STATE_LISTENING:
1851 case TCP_SEQ_STATE_ESTABLISHED:
1852 get_tcp6_sock(seq, v, st->num);
1853 break;
1854 case TCP_SEQ_STATE_OPENREQ:
1855 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1856 break;
1857 case TCP_SEQ_STATE_TIME_WAIT:
1858 get_timewait6_sock(seq, v, st->num);
1859 break;
1860 }
1861out:
1862 return 0;
1863}
1864
73cb88ec
AV
1865static const struct file_operations tcp6_afinfo_seq_fops = {
1866 .owner = THIS_MODULE,
1867 .open = tcp_seq_open,
1868 .read = seq_read,
1869 .llseek = seq_lseek,
1870 .release = seq_release_net
1871};
1872
1da177e4 1873static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1da177e4
LT
1874 .name = "tcp6",
1875 .family = AF_INET6,
73cb88ec 1876 .seq_fops = &tcp6_afinfo_seq_fops,
9427c4b3
DL
1877 .seq_ops = {
1878 .show = tcp6_seq_show,
1879 },
1da177e4
LT
1880};
1881
2c8c1e72 1882int __net_init tcp6_proc_init(struct net *net)
1da177e4 1883{
6f8b13bc 1884 return tcp_proc_register(net, &tcp6_seq_afinfo);
1da177e4
LT
1885}
1886
6f8b13bc 1887void tcp6_proc_exit(struct net *net)
1da177e4 1888{
6f8b13bc 1889 tcp_proc_unregister(net, &tcp6_seq_afinfo);
1da177e4
LT
1890}
1891#endif
1892
f77d6021
ED
1893static void tcp_v6_clear_sk(struct sock *sk, int size)
1894{
1895 struct inet_sock *inet = inet_sk(sk);
1896
1897 /* we do not want to clear pinet6 field, because of RCU lookups */
1898 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1899
1900 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1901 memset(&inet->pinet6 + 1, 0, size);
1902}
1903
1da177e4
LT
1904struct proto tcpv6_prot = {
1905 .name = "TCPv6",
1906 .owner = THIS_MODULE,
1907 .close = tcp_close,
1908 .connect = tcp_v6_connect,
1909 .disconnect = tcp_disconnect,
463c84b9 1910 .accept = inet_csk_accept,
1da177e4
LT
1911 .ioctl = tcp_ioctl,
1912 .init = tcp_v6_init_sock,
1913 .destroy = tcp_v6_destroy_sock,
1914 .shutdown = tcp_shutdown,
1915 .setsockopt = tcp_setsockopt,
1916 .getsockopt = tcp_getsockopt,
1da177e4 1917 .recvmsg = tcp_recvmsg,
7ba42910
CG
1918 .sendmsg = tcp_sendmsg,
1919 .sendpage = tcp_sendpage,
1da177e4 1920 .backlog_rcv = tcp_v6_do_rcv,
46d3ceab 1921 .release_cb = tcp_release_cb,
563d34d0 1922 .mtu_reduced = tcp_v6_mtu_reduced,
1da177e4 1923 .hash = tcp_v6_hash,
ab1e0a13
ACM
1924 .unhash = inet_unhash,
1925 .get_port = inet_csk_get_port,
1da177e4
LT
1926 .enter_memory_pressure = tcp_enter_memory_pressure,
1927 .sockets_allocated = &tcp_sockets_allocated,
1928 .memory_allocated = &tcp_memory_allocated,
1929 .memory_pressure = &tcp_memory_pressure,
0a5578cf 1930 .orphan_count = &tcp_orphan_count,
1da177e4
LT
1931 .sysctl_wmem = sysctl_tcp_wmem,
1932 .sysctl_rmem = sysctl_tcp_rmem,
1933 .max_header = MAX_TCP_HEADER,
1934 .obj_size = sizeof(struct tcp6_sock),
3ab5aee7 1935 .slab_flags = SLAB_DESTROY_BY_RCU,
6d6ee43e 1936 .twsk_prot = &tcp6_timewait_sock_ops,
60236fdd 1937 .rsk_prot = &tcp6_request_sock_ops,
39d8cda7 1938 .h.hashinfo = &tcp_hashinfo,
7ba42910 1939 .no_autobind = true,
543d9cfe
ACM
1940#ifdef CONFIG_COMPAT
1941 .compat_setsockopt = compat_tcp_setsockopt,
1942 .compat_getsockopt = compat_tcp_getsockopt,
1943#endif
c255a458 1944#ifdef CONFIG_MEMCG_KMEM
d1a4c0b3
GC
1945 .proto_cgroup = tcp_proto_cgroup,
1946#endif
f77d6021 1947 .clear_sk = tcp_v6_clear_sk,
1da177e4
LT
1948};
1949
41135cc8 1950static const struct inet6_protocol tcpv6_protocol = {
c7109986 1951 .early_demux = tcp_v6_early_demux,
1da177e4
LT
1952 .handler = tcp_v6_rcv,
1953 .err_handler = tcp_v6_err,
1954 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1955};
1956
1da177e4
LT
1957static struct inet_protosw tcpv6_protosw = {
1958 .type = SOCK_STREAM,
1959 .protocol = IPPROTO_TCP,
1960 .prot = &tcpv6_prot,
1961 .ops = &inet6_stream_ops,
1da177e4 1962 .no_check = 0,
d83d8461
ACM
1963 .flags = INET_PROTOSW_PERMANENT |
1964 INET_PROTOSW_ICSK,
1da177e4
LT
1965};
1966
2c8c1e72 1967static int __net_init tcpv6_net_init(struct net *net)
93ec926b 1968{
5677242f
DL
1969 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
1970 SOCK_RAW, IPPROTO_TCP, net);
93ec926b
DL
1971}
1972
2c8c1e72 1973static void __net_exit tcpv6_net_exit(struct net *net)
93ec926b 1974{
5677242f 1975 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
b099ce26
EB
1976}
1977
2c8c1e72 1978static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
b099ce26
EB
1979{
1980 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
93ec926b
DL
1981}
1982
1983static struct pernet_operations tcpv6_net_ops = {
b099ce26
EB
1984 .init = tcpv6_net_init,
1985 .exit = tcpv6_net_exit,
1986 .exit_batch = tcpv6_net_exit_batch,
93ec926b
DL
1987};
1988
7f4e4868 1989int __init tcpv6_init(void)
1da177e4 1990{
7f4e4868
DL
1991 int ret;
1992
3336288a
VY
1993 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
1994 if (ret)
c6b641a4 1995 goto out;
3336288a 1996
1da177e4 1997 /* register inet6 protocol */
7f4e4868
DL
1998 ret = inet6_register_protosw(&tcpv6_protosw);
1999 if (ret)
2000 goto out_tcpv6_protocol;
2001
93ec926b 2002 ret = register_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2003 if (ret)
2004 goto out_tcpv6_protosw;
2005out:
2006 return ret;
ae0f7d5f 2007
7f4e4868
DL
2008out_tcpv6_protosw:
2009 inet6_unregister_protosw(&tcpv6_protosw);
3336288a
VY
2010out_tcpv6_protocol:
2011 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
7f4e4868
DL
2012 goto out;
2013}
2014
09f7709f 2015void tcpv6_exit(void)
7f4e4868 2016{
93ec926b 2017 unregister_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2018 inet6_unregister_protosw(&tcpv6_protosw);
2019 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
1da177e4 2020}