net/usb/r8152: enable interrupt transfer
[linux-2.6-block.git] / net / ipv6 / tcp_ipv6.c
CommitLineData
1da177e4
LT
1/*
2 * TCP over IPv6
1ab1457c 3 * Linux INET6 implementation
1da177e4
LT
4 *
5 * Authors:
1ab1457c 6 * Pedro Roque <roque@di.fc.ul.pt>
1da177e4 7 *
1ab1457c 8 * Based on:
1da177e4
LT
9 * linux/net/ipv4/tcp.c
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
12 *
13 * Fixes:
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allow both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 */
25
eb4dea58 26#include <linux/bottom_half.h>
1da177e4 27#include <linux/module.h>
1da177e4
LT
28#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
5a0e3ad6 41#include <linux/slab.h>
1da177e4
LT
42
43#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
5324a040 49#include <net/inet6_hashtables.h>
8129765a 50#include <net/inet6_connection_sock.h>
1da177e4
LT
51#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
1da177e4
LT
59#include <net/snmp.h>
60#include <net/dsfield.h>
6d6ee43e 61#include <net/timewait_sock.h>
18134bed 62#include <net/netdma.h>
3d58b5fa 63#include <net/inet_common.h>
6e5714ea 64#include <net/secure_seq.h>
d1a4c0b3 65#include <net/tcp_memcontrol.h>
076bb0c8 66#include <net/busy_poll.h>
1da177e4
LT
67
68#include <asm/uaccess.h>
69
70#include <linux/proc_fs.h>
71#include <linux/seq_file.h>
72
cfb6eeb4
YH
73#include <linux/crypto.h>
74#include <linux/scatterlist.h>
75
cfb6eeb4 76static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
6edafaaf
GJ
77static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
78 struct request_sock *req);
1da177e4
LT
79
80static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
1da177e4 81
3b401a81
SH
82static const struct inet_connection_sock_af_ops ipv6_mapped;
83static const struct inet_connection_sock_af_ops ipv6_specific;
a928630a 84#ifdef CONFIG_TCP_MD5SIG
b2e4b3de
SH
85static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
86static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
9501f972
YH
87#else
88static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 89 const struct in6_addr *addr)
9501f972
YH
90{
91 return NULL;
92}
a928630a 93#endif
1da177e4 94
fae6ef87
NC
95static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
96{
97 struct dst_entry *dst = skb_dst(skb);
98 const struct rt6_info *rt = (const struct rt6_info *)dst;
99
100 dst_hold(dst);
101 sk->sk_rx_dst = dst;
102 inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
103 if (rt->rt6i_node)
104 inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
105}
106
1da177e4
LT
107static void tcp_v6_hash(struct sock *sk)
108{
109 if (sk->sk_state != TCP_CLOSE) {
8292a17a 110 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
1da177e4
LT
111 tcp_prot.hash(sk);
112 return;
113 }
114 local_bh_disable();
9327f705 115 __inet6_hash(sk, NULL);
1da177e4
LT
116 local_bh_enable();
117 }
118}
119
cf533ea5 120static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
1da177e4 121{
0660e03f
ACM
122 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
123 ipv6_hdr(skb)->saddr.s6_addr32,
aa8223c7
ACM
124 tcp_hdr(skb)->dest,
125 tcp_hdr(skb)->source);
1da177e4
LT
126}
127
1ab1457c 128static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
1da177e4
LT
129 int addr_len)
130{
131 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
1ab1457c 132 struct inet_sock *inet = inet_sk(sk);
d83d8461 133 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
134 struct ipv6_pinfo *np = inet6_sk(sk);
135 struct tcp_sock *tp = tcp_sk(sk);
20c59de2 136 struct in6_addr *saddr = NULL, *final_p, final;
493f377d 137 struct rt6_info *rt;
4c9483b2 138 struct flowi6 fl6;
1da177e4
LT
139 struct dst_entry *dst;
140 int addr_type;
141 int err;
142
1ab1457c 143 if (addr_len < SIN6_LEN_RFC2133)
1da177e4
LT
144 return -EINVAL;
145
1ab1457c 146 if (usin->sin6_family != AF_INET6)
a02cec21 147 return -EAFNOSUPPORT;
1da177e4 148
4c9483b2 149 memset(&fl6, 0, sizeof(fl6));
1da177e4
LT
150
151 if (np->sndflow) {
4c9483b2
DM
152 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
153 IP6_ECN_flow_init(fl6.flowlabel);
154 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
1da177e4 155 struct ip6_flowlabel *flowlabel;
4c9483b2 156 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
1da177e4
LT
157 if (flowlabel == NULL)
158 return -EINVAL;
4e3fd7a0 159 usin->sin6_addr = flowlabel->dst;
1da177e4
LT
160 fl6_sock_release(flowlabel);
161 }
162 }
163
164 /*
1ab1457c
YH
165 * connect() to INADDR_ANY means loopback (BSD'ism).
166 */
167
168 if(ipv6_addr_any(&usin->sin6_addr))
169 usin->sin6_addr.s6_addr[15] = 0x1;
1da177e4
LT
170
171 addr_type = ipv6_addr_type(&usin->sin6_addr);
172
173 if(addr_type & IPV6_ADDR_MULTICAST)
174 return -ENETUNREACH;
175
176 if (addr_type&IPV6_ADDR_LINKLOCAL) {
177 if (addr_len >= sizeof(struct sockaddr_in6) &&
178 usin->sin6_scope_id) {
179 /* If interface is set while binding, indices
180 * must coincide.
181 */
182 if (sk->sk_bound_dev_if &&
183 sk->sk_bound_dev_if != usin->sin6_scope_id)
184 return -EINVAL;
185
186 sk->sk_bound_dev_if = usin->sin6_scope_id;
187 }
188
189 /* Connect to link-local address requires an interface */
190 if (!sk->sk_bound_dev_if)
191 return -EINVAL;
192 }
193
194 if (tp->rx_opt.ts_recent_stamp &&
195 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
196 tp->rx_opt.ts_recent = 0;
197 tp->rx_opt.ts_recent_stamp = 0;
198 tp->write_seq = 0;
199 }
200
4e3fd7a0 201 np->daddr = usin->sin6_addr;
4c9483b2 202 np->flow_label = fl6.flowlabel;
1da177e4
LT
203
204 /*
205 * TCP over IPv4
206 */
207
208 if (addr_type == IPV6_ADDR_MAPPED) {
d83d8461 209 u32 exthdrlen = icsk->icsk_ext_hdr_len;
1da177e4
LT
210 struct sockaddr_in sin;
211
212 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
213
214 if (__ipv6_only_sock(sk))
215 return -ENETUNREACH;
216
217 sin.sin_family = AF_INET;
218 sin.sin_port = usin->sin6_port;
219 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
220
d83d8461 221 icsk->icsk_af_ops = &ipv6_mapped;
1da177e4 222 sk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
223#ifdef CONFIG_TCP_MD5SIG
224 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
225#endif
1da177e4
LT
226
227 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
228
229 if (err) {
d83d8461
ACM
230 icsk->icsk_ext_hdr_len = exthdrlen;
231 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 232 sk->sk_backlog_rcv = tcp_v6_do_rcv;
cfb6eeb4
YH
233#ifdef CONFIG_TCP_MD5SIG
234 tp->af_specific = &tcp_sock_ipv6_specific;
235#endif
1da177e4
LT
236 goto failure;
237 } else {
c720c7e8
ED
238 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
239 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
240 &np->rcv_saddr);
1da177e4
LT
241 }
242
243 return err;
244 }
245
246 if (!ipv6_addr_any(&np->rcv_saddr))
247 saddr = &np->rcv_saddr;
248
4c9483b2 249 fl6.flowi6_proto = IPPROTO_TCP;
4e3fd7a0
AD
250 fl6.daddr = np->daddr;
251 fl6.saddr = saddr ? *saddr : np->saddr;
4c9483b2
DM
252 fl6.flowi6_oif = sk->sk_bound_dev_if;
253 fl6.flowi6_mark = sk->sk_mark;
1958b856
DM
254 fl6.fl6_dport = usin->sin6_port;
255 fl6.fl6_sport = inet->inet_sport;
1da177e4 256
4c9483b2 257 final_p = fl6_update_dst(&fl6, np->opt, &final);
1da177e4 258
4c9483b2 259 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
beb8d13b 260
4c9483b2 261 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
68d0c6d3
DM
262 if (IS_ERR(dst)) {
263 err = PTR_ERR(dst);
1da177e4 264 goto failure;
14e50e57 265 }
1da177e4
LT
266
267 if (saddr == NULL) {
4c9483b2 268 saddr = &fl6.saddr;
4e3fd7a0 269 np->rcv_saddr = *saddr;
1da177e4
LT
270 }
271
272 /* set the source address */
4e3fd7a0 273 np->saddr = *saddr;
c720c7e8 274 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 275
f83ef8c0 276 sk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 277 __ip6_dst_store(sk, dst, NULL, NULL);
1da177e4 278
493f377d
DM
279 rt = (struct rt6_info *) dst;
280 if (tcp_death_row.sysctl_tw_recycle &&
281 !tp->rx_opt.ts_recent_stamp &&
81166dd6
DM
282 ipv6_addr_equal(&rt->rt6i_dst.addr, &np->daddr))
283 tcp_fetch_timewait_stamp(sk, dst);
493f377d 284
d83d8461 285 icsk->icsk_ext_hdr_len = 0;
1da177e4 286 if (np->opt)
d83d8461
ACM
287 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
288 np->opt->opt_nflen);
1da177e4
LT
289
290 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
291
c720c7e8 292 inet->inet_dport = usin->sin6_port;
1da177e4
LT
293
294 tcp_set_state(sk, TCP_SYN_SENT);
d8313f5c 295 err = inet6_hash_connect(&tcp_death_row, sk);
1da177e4
LT
296 if (err)
297 goto late_failure;
298
2b916477 299 if (!tp->write_seq && likely(!tp->repair))
1da177e4
LT
300 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
301 np->daddr.s6_addr32,
c720c7e8
ED
302 inet->inet_sport,
303 inet->inet_dport);
1da177e4
LT
304
305 err = tcp_connect(sk);
306 if (err)
307 goto late_failure;
308
309 return 0;
310
311late_failure:
312 tcp_set_state(sk, TCP_CLOSE);
313 __sk_dst_reset(sk);
314failure:
c720c7e8 315 inet->inet_dport = 0;
1da177e4
LT
316 sk->sk_route_caps = 0;
317 return err;
318}
319
563d34d0
ED
320static void tcp_v6_mtu_reduced(struct sock *sk)
321{
322 struct dst_entry *dst;
323
324 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
325 return;
326
327 dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
328 if (!dst)
329 return;
330
331 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
332 tcp_sync_mss(sk, dst_mtu(dst));
333 tcp_simple_retransmit(sk);
334 }
335}
336
1da177e4 337static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
d5fdd6ba 338 u8 type, u8 code, int offset, __be32 info)
1da177e4 339{
b71d1d42 340 const struct ipv6hdr *hdr = (const struct ipv6hdr*)skb->data;
505cbfc5 341 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
1da177e4
LT
342 struct ipv6_pinfo *np;
343 struct sock *sk;
344 int err;
1ab1457c 345 struct tcp_sock *tp;
1da177e4 346 __u32 seq;
ca12a1a4 347 struct net *net = dev_net(skb->dev);
1da177e4 348
ca12a1a4 349 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
d86e0dac 350 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
1da177e4
LT
351
352 if (sk == NULL) {
e41b5368
DL
353 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
354 ICMP6_MIB_INERRORS);
1da177e4
LT
355 return;
356 }
357
358 if (sk->sk_state == TCP_TIME_WAIT) {
9469c7b4 359 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
360 return;
361 }
362
363 bh_lock_sock(sk);
563d34d0 364 if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
de0744af 365 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
1da177e4
LT
366
367 if (sk->sk_state == TCP_CLOSE)
368 goto out;
369
e802af9c
SH
370 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
371 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
372 goto out;
373 }
374
1da177e4 375 tp = tcp_sk(sk);
1ab1457c 376 seq = ntohl(th->seq);
1da177e4
LT
377 if (sk->sk_state != TCP_LISTEN &&
378 !between(seq, tp->snd_una, tp->snd_nxt)) {
de0744af 379 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
380 goto out;
381 }
382
383 np = inet6_sk(sk);
384
ec18d9a2
DM
385 if (type == NDISC_REDIRECT) {
386 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
387
1ed5c48f 388 if (dst)
6700c270 389 dst->ops->redirect(dst, sk, skb);
50a75a89 390 goto out;
ec18d9a2
DM
391 }
392
1da177e4 393 if (type == ICMPV6_PKT_TOOBIG) {
0d4f0608
ED
394 /* We are not interested in TCP_LISTEN and open_requests
395 * (SYN-ACKs send out by Linux are always <576bytes so
396 * they should go through unfragmented).
397 */
398 if (sk->sk_state == TCP_LISTEN)
399 goto out;
400
563d34d0
ED
401 tp->mtu_info = ntohl(info);
402 if (!sock_owned_by_user(sk))
403 tcp_v6_mtu_reduced(sk);
d013ef2a
JA
404 else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
405 &tp->tsq_flags))
406 sock_hold(sk);
1da177e4
LT
407 goto out;
408 }
409
410 icmpv6_err_convert(type, code, &err);
411
60236fdd 412 /* Might be for an request_sock */
1da177e4 413 switch (sk->sk_state) {
60236fdd 414 struct request_sock *req, **prev;
1da177e4
LT
415 case TCP_LISTEN:
416 if (sock_owned_by_user(sk))
417 goto out;
418
8129765a
ACM
419 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
420 &hdr->saddr, inet6_iif(skb));
1da177e4
LT
421 if (!req)
422 goto out;
423
424 /* ICMPs are not backlogged, hence we cannot get
425 * an established socket here.
426 */
547b792c 427 WARN_ON(req->sk != NULL);
1da177e4 428
2e6599cb 429 if (seq != tcp_rsk(req)->snt_isn) {
de0744af 430 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
431 goto out;
432 }
433
463c84b9 434 inet_csk_reqsk_queue_drop(sk, req, prev);
5f1e942c 435 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
436 goto out;
437
438 case TCP_SYN_SENT:
439 case TCP_SYN_RECV: /* Cannot happen.
1ab1457c 440 It can, it SYNs are crossed. --ANK */
1da177e4 441 if (!sock_owned_by_user(sk)) {
1da177e4
LT
442 sk->sk_err = err;
443 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
444
445 tcp_done(sk);
446 } else
447 sk->sk_err_soft = err;
448 goto out;
449 }
450
451 if (!sock_owned_by_user(sk) && np->recverr) {
452 sk->sk_err = err;
453 sk->sk_error_report(sk);
454 } else
455 sk->sk_err_soft = err;
456
457out:
458 bh_unlock_sock(sk);
459 sock_put(sk);
460}
461
462
9f10d3f6
NC
463static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
464 struct flowi6 *fl6,
3840a06e 465 struct request_sock *req,
fff32699 466 u16 queue_mapping)
1da177e4 467{
ca304b61 468 struct inet6_request_sock *treq = inet6_rsk(req);
1da177e4
LT
469 struct ipv6_pinfo *np = inet6_sk(sk);
470 struct sk_buff * skb;
9494218f 471 int err = -ENOMEM;
1da177e4 472
9f10d3f6
NC
473 /* First, grab a route. */
474 if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
fd80eb94 475 goto done;
9494218f 476
1a2c6181 477 skb = tcp_make_synack(sk, dst, req, NULL);
9494218f 478
1da177e4 479 if (skb) {
8ad50d96 480 __tcp_v6_send_check(skb, &treq->loc_addr, &treq->rmt_addr);
1da177e4 481
9f10d3f6 482 fl6->daddr = treq->rmt_addr;
fff32699 483 skb_set_queue_mapping(skb, queue_mapping);
43264e0b 484 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
b9df3cb8 485 err = net_xmit_eval(err);
1da177e4
LT
486 }
487
488done:
1da177e4
LT
489 return err;
490}
491
1a2c6181 492static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req)
72659ecc 493{
9f10d3f6 494 struct flowi6 fl6;
e6c022a4 495 int res;
9f10d3f6 496
1a2c6181 497 res = tcp_v6_send_synack(sk, NULL, &fl6, req, 0);
e6c022a4
ED
498 if (!res)
499 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
500 return res;
72659ecc
OP
501}
502
60236fdd 503static void tcp_v6_reqsk_destructor(struct request_sock *req)
1da177e4 504{
800d55f1 505 kfree_skb(inet6_rsk(req)->pktopts);
1da177e4
LT
506}
507
cfb6eeb4
YH
508#ifdef CONFIG_TCP_MD5SIG
509static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 510 const struct in6_addr *addr)
cfb6eeb4 511{
a915da9b 512 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
cfb6eeb4
YH
513}
514
515static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
516 struct sock *addr_sk)
517{
518 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
519}
520
521static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
522 struct request_sock *req)
523{
524 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
525}
526
cfb6eeb4
YH
527static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
528 int optlen)
529{
530 struct tcp_md5sig cmd;
531 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
cfb6eeb4
YH
532
533 if (optlen < sizeof(cmd))
534 return -EINVAL;
535
536 if (copy_from_user(&cmd, optval, sizeof(cmd)))
537 return -EFAULT;
538
539 if (sin6->sin6_family != AF_INET6)
540 return -EINVAL;
541
542 if (!cmd.tcpm_keylen) {
e773e4fa 543 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
a915da9b
ED
544 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
545 AF_INET);
546 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
547 AF_INET6);
cfb6eeb4
YH
548 }
549
550 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
551 return -EINVAL;
552
a915da9b
ED
553 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
554 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
555 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4 556
a915da9b
ED
557 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
558 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4
YH
559}
560
49a72dfb 561static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
b71d1d42
ED
562 const struct in6_addr *daddr,
563 const struct in6_addr *saddr, int nbytes)
cfb6eeb4 564{
cfb6eeb4 565 struct tcp6_pseudohdr *bp;
49a72dfb 566 struct scatterlist sg;
8d26d76d 567
cfb6eeb4 568 bp = &hp->md5_blk.ip6;
cfb6eeb4 569 /* 1. TCP pseudo-header (RFC2460) */
4e3fd7a0
AD
570 bp->saddr = *saddr;
571 bp->daddr = *daddr;
49a72dfb 572 bp->protocol = cpu_to_be32(IPPROTO_TCP);
00b1304c 573 bp->len = cpu_to_be32(nbytes);
cfb6eeb4 574
49a72dfb
AL
575 sg_init_one(&sg, bp, sizeof(*bp));
576 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
577}
c7da57a1 578
49a72dfb 579static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
b71d1d42 580 const struct in6_addr *daddr, struct in6_addr *saddr,
318cf7aa 581 const struct tcphdr *th)
49a72dfb
AL
582{
583 struct tcp_md5sig_pool *hp;
584 struct hash_desc *desc;
585
586 hp = tcp_get_md5sig_pool();
587 if (!hp)
588 goto clear_hash_noput;
589 desc = &hp->md5_desc;
590
591 if (crypto_hash_init(desc))
592 goto clear_hash;
593 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
594 goto clear_hash;
595 if (tcp_md5_hash_header(hp, th))
596 goto clear_hash;
597 if (tcp_md5_hash_key(hp, key))
598 goto clear_hash;
599 if (crypto_hash_final(desc, md5_hash))
cfb6eeb4 600 goto clear_hash;
cfb6eeb4 601
cfb6eeb4 602 tcp_put_md5sig_pool();
cfb6eeb4 603 return 0;
49a72dfb 604
cfb6eeb4
YH
605clear_hash:
606 tcp_put_md5sig_pool();
607clear_hash_noput:
608 memset(md5_hash, 0, 16);
49a72dfb 609 return 1;
cfb6eeb4
YH
610}
611
49a72dfb 612static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
318cf7aa
ED
613 const struct sock *sk,
614 const struct request_sock *req,
615 const struct sk_buff *skb)
cfb6eeb4 616{
b71d1d42 617 const struct in6_addr *saddr, *daddr;
49a72dfb
AL
618 struct tcp_md5sig_pool *hp;
619 struct hash_desc *desc;
318cf7aa 620 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4
YH
621
622 if (sk) {
623 saddr = &inet6_sk(sk)->saddr;
624 daddr = &inet6_sk(sk)->daddr;
49a72dfb 625 } else if (req) {
cfb6eeb4
YH
626 saddr = &inet6_rsk(req)->loc_addr;
627 daddr = &inet6_rsk(req)->rmt_addr;
49a72dfb 628 } else {
b71d1d42 629 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
49a72dfb
AL
630 saddr = &ip6h->saddr;
631 daddr = &ip6h->daddr;
cfb6eeb4 632 }
49a72dfb
AL
633
634 hp = tcp_get_md5sig_pool();
635 if (!hp)
636 goto clear_hash_noput;
637 desc = &hp->md5_desc;
638
639 if (crypto_hash_init(desc))
640 goto clear_hash;
641
642 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
643 goto clear_hash;
644 if (tcp_md5_hash_header(hp, th))
645 goto clear_hash;
646 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
647 goto clear_hash;
648 if (tcp_md5_hash_key(hp, key))
649 goto clear_hash;
650 if (crypto_hash_final(desc, md5_hash))
651 goto clear_hash;
652
653 tcp_put_md5sig_pool();
654 return 0;
655
656clear_hash:
657 tcp_put_md5sig_pool();
658clear_hash_noput:
659 memset(md5_hash, 0, 16);
660 return 1;
cfb6eeb4
YH
661}
662
318cf7aa 663static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
cfb6eeb4 664{
cf533ea5 665 const __u8 *hash_location = NULL;
cfb6eeb4 666 struct tcp_md5sig_key *hash_expected;
b71d1d42 667 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
318cf7aa 668 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4 669 int genhash;
cfb6eeb4
YH
670 u8 newhash[16];
671
672 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
7d5d5525 673 hash_location = tcp_parse_md5sig_option(th);
cfb6eeb4 674
785957d3
DM
675 /* We've parsed the options - do we have a hash? */
676 if (!hash_expected && !hash_location)
677 return 0;
678
679 if (hash_expected && !hash_location) {
680 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
cfb6eeb4
YH
681 return 1;
682 }
683
785957d3
DM
684 if (!hash_expected && hash_location) {
685 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
cfb6eeb4
YH
686 return 1;
687 }
688
689 /* check the signature */
49a72dfb
AL
690 genhash = tcp_v6_md5_hash_skb(newhash,
691 hash_expected,
692 NULL, NULL, skb);
693
cfb6eeb4 694 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
e87cc472
JP
695 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
696 genhash ? "failed" : "mismatch",
697 &ip6h->saddr, ntohs(th->source),
698 &ip6h->daddr, ntohs(th->dest));
cfb6eeb4
YH
699 return 1;
700 }
701 return 0;
702}
703#endif
704
c6aefafb 705struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
1da177e4 706 .family = AF_INET6,
2e6599cb 707 .obj_size = sizeof(struct tcp6_request_sock),
72659ecc 708 .rtx_syn_ack = tcp_v6_rtx_synack,
60236fdd
ACM
709 .send_ack = tcp_v6_reqsk_send_ack,
710 .destructor = tcp_v6_reqsk_destructor,
72659ecc
OP
711 .send_reset = tcp_v6_send_reset,
712 .syn_ack_timeout = tcp_syn_ack_timeout,
1da177e4
LT
713};
714
cfb6eeb4 715#ifdef CONFIG_TCP_MD5SIG
b2e4b3de 716static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
cfb6eeb4 717 .md5_lookup = tcp_v6_reqsk_md5_lookup,
e3afe7b7 718 .calc_md5_hash = tcp_v6_md5_hash_skb,
cfb6eeb4 719};
b6332e6c 720#endif
cfb6eeb4 721
626e264d 722static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
ee684b6f
AV
723 u32 tsval, u32 tsecr,
724 struct tcp_md5sig_key *key, int rst, u8 tclass)
1da177e4 725{
cf533ea5
ED
726 const struct tcphdr *th = tcp_hdr(skb);
727 struct tcphdr *t1;
1da177e4 728 struct sk_buff *buff;
4c9483b2 729 struct flowi6 fl6;
adf30907 730 struct net *net = dev_net(skb_dst(skb)->dev);
e5047992 731 struct sock *ctl_sk = net->ipv6.tcp_sk;
77c676da 732 unsigned int tot_len = sizeof(struct tcphdr);
adf30907 733 struct dst_entry *dst;
81ada62d 734 __be32 *topt;
1da177e4 735
ee684b6f 736 if (tsecr)
626e264d 737 tot_len += TCPOLEN_TSTAMP_ALIGNED;
cfb6eeb4 738#ifdef CONFIG_TCP_MD5SIG
cfb6eeb4
YH
739 if (key)
740 tot_len += TCPOLEN_MD5SIG_ALIGNED;
741#endif
742
cfb6eeb4 743 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1da177e4 744 GFP_ATOMIC);
1ab1457c
YH
745 if (buff == NULL)
746 return;
1da177e4 747
cfb6eeb4 748 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1da177e4 749
cfb6eeb4 750 t1 = (struct tcphdr *) skb_push(buff, tot_len);
6651ffc8 751 skb_reset_transport_header(buff);
1da177e4
LT
752
753 /* Swap the send and the receive. */
754 memset(t1, 0, sizeof(*t1));
755 t1->dest = th->source;
756 t1->source = th->dest;
cfb6eeb4 757 t1->doff = tot_len / 4;
626e264d
IJ
758 t1->seq = htonl(seq);
759 t1->ack_seq = htonl(ack);
760 t1->ack = !rst || !th->ack;
761 t1->rst = rst;
762 t1->window = htons(win);
1da177e4 763
81ada62d
IJ
764 topt = (__be32 *)(t1 + 1);
765
ee684b6f 766 if (tsecr) {
626e264d
IJ
767 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
768 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
ee684b6f
AV
769 *topt++ = htonl(tsval);
770 *topt++ = htonl(tsecr);
626e264d
IJ
771 }
772
cfb6eeb4
YH
773#ifdef CONFIG_TCP_MD5SIG
774 if (key) {
81ada62d
IJ
775 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
776 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
777 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
78e645cb
IJ
778 &ipv6_hdr(skb)->saddr,
779 &ipv6_hdr(skb)->daddr, t1);
cfb6eeb4
YH
780 }
781#endif
782
4c9483b2 783 memset(&fl6, 0, sizeof(fl6));
4e3fd7a0
AD
784 fl6.daddr = ipv6_hdr(skb)->saddr;
785 fl6.saddr = ipv6_hdr(skb)->daddr;
1da177e4 786
e5700aff
DM
787 buff->ip_summed = CHECKSUM_PARTIAL;
788 buff->csum = 0;
789
4c9483b2 790 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
1da177e4 791
4c9483b2 792 fl6.flowi6_proto = IPPROTO_TCP;
4c675258
AK
793 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
794 fl6.flowi6_oif = inet6_iif(skb);
1958b856
DM
795 fl6.fl6_dport = t1->dest;
796 fl6.fl6_sport = t1->source;
4c9483b2 797 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
1da177e4 798
c20121ae
DL
799 /* Pass a socket to ip6_dst_lookup either it is for RST
800 * Underlying function will use this to retrieve the network
801 * namespace
802 */
4c9483b2 803 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL, false);
68d0c6d3
DM
804 if (!IS_ERR(dst)) {
805 skb_dst_set(buff, dst);
b903d324 806 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
68d0c6d3
DM
807 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
808 if (rst)
809 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
810 return;
1da177e4
LT
811 }
812
813 kfree_skb(buff);
814}
815
626e264d 816static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1da177e4 817{
cf533ea5 818 const struct tcphdr *th = tcp_hdr(skb);
626e264d 819 u32 seq = 0, ack_seq = 0;
fa3e5b4e 820 struct tcp_md5sig_key *key = NULL;
658ddaaf
SL
821#ifdef CONFIG_TCP_MD5SIG
822 const __u8 *hash_location = NULL;
823 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
824 unsigned char newhash[16];
825 int genhash;
826 struct sock *sk1 = NULL;
827#endif
1da177e4 828
626e264d 829 if (th->rst)
1da177e4
LT
830 return;
831
626e264d
IJ
832 if (!ipv6_unicast_destination(skb))
833 return;
1da177e4 834
cfb6eeb4 835#ifdef CONFIG_TCP_MD5SIG
658ddaaf
SL
836 hash_location = tcp_parse_md5sig_option(th);
837 if (!sk && hash_location) {
838 /*
839 * active side is lost. Try to find listening socket through
840 * source port, and then find md5 key through listening socket.
841 * we are not loose security here:
842 * Incoming packet is checked with md5 hash with finding key,
843 * no RST generated if md5 hash doesn't match.
844 */
845 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
5ba24953
TH
846 &tcp_hashinfo, &ipv6h->saddr,
847 th->source, &ipv6h->daddr,
658ddaaf
SL
848 ntohs(th->source), inet6_iif(skb));
849 if (!sk1)
850 return;
851
852 rcu_read_lock();
853 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
854 if (!key)
855 goto release_sk1;
856
857 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
858 if (genhash || memcmp(hash_location, newhash, 16) != 0)
859 goto release_sk1;
860 } else {
861 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
862 }
cfb6eeb4
YH
863#endif
864
626e264d
IJ
865 if (th->ack)
866 seq = ntohl(th->ack_seq);
867 else
868 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
869 (th->doff << 2);
1da177e4 870
ee684b6f 871 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, key, 1, 0);
658ddaaf
SL
872
873#ifdef CONFIG_TCP_MD5SIG
874release_sk1:
875 if (sk1) {
876 rcu_read_unlock();
877 sock_put(sk1);
878 }
879#endif
626e264d 880}
1da177e4 881
ee684b6f
AV
882static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
883 u32 win, u32 tsval, u32 tsecr,
b903d324 884 struct tcp_md5sig_key *key, u8 tclass)
626e264d 885{
ee684b6f 886 tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, key, 0, tclass);
1da177e4
LT
887}
888
889static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
890{
8feaf0c0 891 struct inet_timewait_sock *tw = inet_twsk(sk);
cfb6eeb4 892 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1da177e4 893
9501f972 894 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
8feaf0c0 895 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
ee684b6f 896 tcp_time_stamp + tcptw->tw_ts_offset,
b903d324
ED
897 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
898 tw->tw_tclass);
1da177e4 899
8feaf0c0 900 inet_twsk_put(tw);
1da177e4
LT
901}
902
6edafaaf
GJ
903static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
904 struct request_sock *req)
1da177e4 905{
ee684b6f
AV
906 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1,
907 req->rcv_wnd, tcp_time_stamp, req->ts_recent,
b903d324 908 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr), 0);
1da177e4
LT
909}
910
911
912static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
913{
60236fdd 914 struct request_sock *req, **prev;
aa8223c7 915 const struct tcphdr *th = tcp_hdr(skb);
1da177e4
LT
916 struct sock *nsk;
917
918 /* Find possible connection requests. */
8129765a 919 req = inet6_csk_search_req(sk, &prev, th->source,
0660e03f
ACM
920 &ipv6_hdr(skb)->saddr,
921 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1da177e4 922 if (req)
8336886f 923 return tcp_check_req(sk, skb, req, prev, false);
1da177e4 924
3b1e0a65 925 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
d86e0dac
PE
926 &ipv6_hdr(skb)->saddr, th->source,
927 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1da177e4
LT
928
929 if (nsk) {
930 if (nsk->sk_state != TCP_TIME_WAIT) {
931 bh_lock_sock(nsk);
932 return nsk;
933 }
9469c7b4 934 inet_twsk_put(inet_twsk(nsk));
1da177e4
LT
935 return NULL;
936 }
937
c6aefafb 938#ifdef CONFIG_SYN_COOKIES
af9b4738 939 if (!th->syn)
c6aefafb 940 sk = cookie_v6_check(sk, skb);
1da177e4
LT
941#endif
942 return sk;
943}
944
1da177e4
LT
945/* FIXME: this is substantially similar to the ipv4 code.
946 * Can some kind of merge be done? -- erics
947 */
948static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
949{
e6b4d113
WAS
950 struct tcp_options_received tmp_opt;
951 struct request_sock *req;
ca304b61 952 struct inet6_request_sock *treq;
1da177e4 953 struct ipv6_pinfo *np = inet6_sk(sk);
1da177e4 954 struct tcp_sock *tp = tcp_sk(sk);
e6b4d113 955 __u32 isn = TCP_SKB_CB(skb)->when;
493f377d 956 struct dst_entry *dst = NULL;
3840a06e 957 struct flowi6 fl6;
a2a385d6 958 bool want_cookie = false;
1da177e4
LT
959
960 if (skb->protocol == htons(ETH_P_IP))
961 return tcp_v4_conn_request(sk, skb);
962
963 if (!ipv6_unicast_destination(skb))
1ab1457c 964 goto drop;
1da177e4 965
5ad37d5d
HFS
966 if ((sysctl_tcp_syncookies == 2 ||
967 inet_csk_reqsk_queue_is_full(sk)) && !isn) {
946cedcc
ED
968 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
969 if (!want_cookie)
970 goto drop;
1da177e4
LT
971 }
972
5f1e942c
VS
973 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
974 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1da177e4 975 goto drop;
5f1e942c 976 }
1da177e4 977
ca304b61 978 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1da177e4
LT
979 if (req == NULL)
980 goto drop;
981
cfb6eeb4
YH
982#ifdef CONFIG_TCP_MD5SIG
983 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
984#endif
985
1da177e4
LT
986 tcp_clear_options(&tmp_opt);
987 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
988 tmp_opt.user_mss = tp->rx_opt.user_mss;
1a2c6181 989 tcp_parse_options(skb, &tmp_opt, 0, NULL);
1da177e4 990
4dfc2817 991 if (want_cookie && !tmp_opt.saw_tstamp)
c6aefafb 992 tcp_clear_options(&tmp_opt);
c6aefafb 993
1da177e4
LT
994 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
995 tcp_openreq_init(req, &tmp_opt, skb);
996
ca304b61 997 treq = inet6_rsk(req);
4e3fd7a0
AD
998 treq->rmt_addr = ipv6_hdr(skb)->saddr;
999 treq->loc_addr = ipv6_hdr(skb)->daddr;
172d69e6 1000 if (!want_cookie || tmp_opt.tstamp_ok)
5d134f1c 1001 TCP_ECN_create_request(req, skb, sock_net(sk));
c6aefafb 1002
4d0fe50c
ED
1003 treq->iif = sk->sk_bound_dev_if;
1004
1005 /* So that link locals have meaning */
1006 if (!sk->sk_bound_dev_if &&
1007 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1008 treq->iif = inet6_iif(skb);
1009
2bbdf389 1010 if (!isn) {
c6aefafb
GG
1011 if (ipv6_opt_accepted(sk, skb) ||
1012 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1013 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1014 atomic_inc(&skb->users);
1015 treq->pktopts = skb;
1016 }
493f377d
DM
1017
1018 if (want_cookie) {
2bbdf389
FW
1019 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1020 req->cookie_ts = tmp_opt.tstamp_ok;
493f377d
DM
1021 goto have_isn;
1022 }
1023
1024 /* VJ's idea. We save last timestamp seen
1025 * from the destination in peer table, when entering
1026 * state TIME-WAIT, and check against it before
1027 * accepting new connection request.
1028 *
1029 * If "isn" is not zero, this request hit alive
1030 * timewait bucket, so that all the necessary checks
1031 * are made in the function processing timewait state.
1032 */
1033 if (tmp_opt.saw_tstamp &&
1034 tcp_death_row.sysctl_tw_recycle &&
81166dd6
DM
1035 (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1036 if (!tcp_peer_is_proven(req, dst, true)) {
493f377d
DM
1037 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1038 goto drop_and_release;
1039 }
1040 }
1041 /* Kill the following clause, if you dislike this way. */
1042 else if (!sysctl_tcp_syncookies &&
1043 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1044 (sysctl_max_syn_backlog >> 2)) &&
81166dd6 1045 !tcp_peer_is_proven(req, dst, false)) {
493f377d
DM
1046 /* Without syncookies last quarter of
1047 * backlog is filled with destinations,
1048 * proven to be alive.
1049 * It means that we continue to communicate
1050 * to destinations, already remembered
1051 * to the moment of synflood.
1052 */
1053 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
1054 &treq->rmt_addr, ntohs(tcp_hdr(skb)->source));
1055 goto drop_and_release;
2bbdf389 1056 }
493f377d
DM
1057
1058 isn = tcp_v6_init_sequence(skb);
c6aefafb 1059 }
493f377d 1060have_isn:
2e6599cb 1061 tcp_rsk(req)->snt_isn = isn;
1da177e4 1062
437c5b53
NC
1063 if (security_inet_conn_request(sk, skb, req))
1064 goto drop_and_release;
4237c75c 1065
9f10d3f6 1066 if (tcp_v6_send_synack(sk, dst, &fl6, req,
fff32699 1067 skb_get_queue_mapping(skb)) ||
4957faad 1068 want_cookie)
e6b4d113 1069 goto drop_and_free;
1da177e4 1070
016818d0 1071 tcp_rsk(req)->snt_synack = tcp_time_stamp;
8336886f 1072 tcp_rsk(req)->listener = NULL;
e6b4d113
WAS
1073 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1074 return 0;
1da177e4 1075
493f377d
DM
1076drop_and_release:
1077 dst_release(dst);
e6b4d113
WAS
1078drop_and_free:
1079 reqsk_free(req);
1da177e4 1080drop:
5f1e942c 1081 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1082 return 0; /* don't send reset */
1083}
1084
1085static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
60236fdd 1086 struct request_sock *req,
1da177e4
LT
1087 struct dst_entry *dst)
1088{
78d15e82 1089 struct inet6_request_sock *treq;
1da177e4
LT
1090 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1091 struct tcp6_sock *newtcp6sk;
1092 struct inet_sock *newinet;
1093 struct tcp_sock *newtp;
1094 struct sock *newsk;
cfb6eeb4
YH
1095#ifdef CONFIG_TCP_MD5SIG
1096 struct tcp_md5sig_key *key;
1097#endif
3840a06e 1098 struct flowi6 fl6;
1da177e4
LT
1099
1100 if (skb->protocol == htons(ETH_P_IP)) {
1101 /*
1102 * v6 mapped
1103 */
1104
1105 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1106
1ab1457c 1107 if (newsk == NULL)
1da177e4
LT
1108 return NULL;
1109
1110 newtcp6sk = (struct tcp6_sock *)newsk;
1111 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1112
1113 newinet = inet_sk(newsk);
1114 newnp = inet6_sk(newsk);
1115 newtp = tcp_sk(newsk);
1116
1117 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1118
c720c7e8 1119 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newnp->daddr);
1da177e4 1120
c720c7e8 1121 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1da177e4 1122
4e3fd7a0 1123 newnp->rcv_saddr = newnp->saddr;
1da177e4 1124
8292a17a 1125 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1da177e4 1126 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
1127#ifdef CONFIG_TCP_MD5SIG
1128 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1129#endif
1130
676a1184
YZ
1131 newnp->ipv6_ac_list = NULL;
1132 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1133 newnp->pktoptions = NULL;
1134 newnp->opt = NULL;
505cbfc5 1135 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1136 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
e7219858 1137 newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4 1138
e6848976
ACM
1139 /*
1140 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1141 * here, tcp_create_openreq_child now does this for us, see the comment in
1142 * that function for the gory details. -acme
1da177e4 1143 */
1da177e4
LT
1144
1145 /* It is tricky place. Until this moment IPv4 tcp
8292a17a 1146 worked with IPv6 icsk.icsk_af_ops.
1da177e4
LT
1147 Sync it now.
1148 */
d83d8461 1149 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1da177e4
LT
1150
1151 return newsk;
1152 }
1153
78d15e82 1154 treq = inet6_rsk(req);
1da177e4
LT
1155
1156 if (sk_acceptq_is_full(sk))
1157 goto out_overflow;
1158
493f377d 1159 if (!dst) {
3840a06e 1160 dst = inet6_csk_route_req(sk, &fl6, req);
493f377d 1161 if (!dst)
1da177e4 1162 goto out;
1ab1457c 1163 }
1da177e4
LT
1164
1165 newsk = tcp_create_openreq_child(sk, req, skb);
1166 if (newsk == NULL)
093d2823 1167 goto out_nonewsk;
1da177e4 1168
e6848976
ACM
1169 /*
1170 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1171 * count here, tcp_create_openreq_child now does this for us, see the
1172 * comment in that function for the gory details. -acme
1173 */
1da177e4 1174
59eed279 1175 newsk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 1176 __ip6_dst_store(newsk, dst, NULL, NULL);
fae6ef87 1177 inet6_sk_rx_dst_set(newsk, skb);
1da177e4
LT
1178
1179 newtcp6sk = (struct tcp6_sock *)newsk;
1180 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1181
1182 newtp = tcp_sk(newsk);
1183 newinet = inet_sk(newsk);
1184 newnp = inet6_sk(newsk);
1185
1186 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1187
4e3fd7a0
AD
1188 newnp->daddr = treq->rmt_addr;
1189 newnp->saddr = treq->loc_addr;
1190 newnp->rcv_saddr = treq->loc_addr;
2e6599cb 1191 newsk->sk_bound_dev_if = treq->iif;
1da177e4 1192
1ab1457c 1193 /* Now IPv6 options...
1da177e4
LT
1194
1195 First: no IPv4 options.
1196 */
f6d8bd05 1197 newinet->inet_opt = NULL;
676a1184 1198 newnp->ipv6_ac_list = NULL;
d35690be 1199 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1200
1201 /* Clone RX bits */
1202 newnp->rxopt.all = np->rxopt.all;
1203
1204 /* Clone pktoptions received with SYN */
1205 newnp->pktoptions = NULL;
2e6599cb 1206 if (treq->pktopts != NULL) {
99a1dec7
MG
1207 newnp->pktoptions = skb_clone(treq->pktopts,
1208 sk_gfp_atomic(sk, GFP_ATOMIC));
ab185d7b 1209 consume_skb(treq->pktopts);
2e6599cb 1210 treq->pktopts = NULL;
1da177e4
LT
1211 if (newnp->pktoptions)
1212 skb_set_owner_r(newnp->pktoptions, newsk);
1213 }
1214 newnp->opt = NULL;
505cbfc5 1215 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1216 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
e7219858 1217 newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4
LT
1218
1219 /* Clone native IPv6 options from listening socket (if any)
1220
1221 Yes, keeping reference count would be much more clever,
1222 but we make one more one thing there: reattach optmem
1223 to newsk.
1224 */
43264e0b
RL
1225 if (np->opt)
1226 newnp->opt = ipv6_dup_options(newsk, np->opt);
1da177e4 1227
d83d8461 1228 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1da177e4 1229 if (newnp->opt)
d83d8461
ACM
1230 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1231 newnp->opt->opt_flen);
1da177e4 1232
5d424d5a 1233 tcp_mtup_init(newsk);
1da177e4 1234 tcp_sync_mss(newsk, dst_mtu(dst));
0dbaee3b 1235 newtp->advmss = dst_metric_advmss(dst);
d135c522
NC
1236 if (tcp_sk(sk)->rx_opt.user_mss &&
1237 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1238 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1239
1da177e4
LT
1240 tcp_initialize_rcv_mss(newsk);
1241
c720c7e8
ED
1242 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1243 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 1244
cfb6eeb4
YH
1245#ifdef CONFIG_TCP_MD5SIG
1246 /* Copy over the MD5 key from the original socket */
1247 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1248 /* We're using one, so create a matching key
1249 * on the newsk structure. If we fail to get
1250 * memory, then we end up not copying the key
1251 * across. Shucks.
1252 */
a915da9b 1253 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newnp->daddr,
99a1dec7
MG
1254 AF_INET6, key->key, key->keylen,
1255 sk_gfp_atomic(sk, GFP_ATOMIC));
cfb6eeb4
YH
1256 }
1257#endif
1258
093d2823 1259 if (__inet_inherit_port(sk, newsk) < 0) {
e337e24d
CP
1260 inet_csk_prepare_forced_close(newsk);
1261 tcp_done(newsk);
093d2823
BS
1262 goto out;
1263 }
9327f705 1264 __inet6_hash(newsk, NULL);
1da177e4
LT
1265
1266 return newsk;
1267
1268out_overflow:
de0744af 1269 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
093d2823 1270out_nonewsk:
1da177e4 1271 dst_release(dst);
093d2823
BS
1272out:
1273 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1274 return NULL;
1275}
1276
b51655b9 1277static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1da177e4 1278{
84fa7933 1279 if (skb->ip_summed == CHECKSUM_COMPLETE) {
684f2176 1280 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
0660e03f 1281 &ipv6_hdr(skb)->daddr, skb->csum)) {
fb286bb2 1282 skb->ip_summed = CHECKSUM_UNNECESSARY;
1da177e4 1283 return 0;
fb286bb2 1284 }
1da177e4 1285 }
fb286bb2 1286
684f2176 1287 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
0660e03f
ACM
1288 &ipv6_hdr(skb)->saddr,
1289 &ipv6_hdr(skb)->daddr, 0));
fb286bb2 1290
1da177e4 1291 if (skb->len <= 76) {
fb286bb2 1292 return __skb_checksum_complete(skb);
1da177e4
LT
1293 }
1294 return 0;
1295}
1296
1297/* The socket must have it's spinlock held when we get
1298 * here.
1299 *
1300 * We have a potential double-lock case here, so even when
1301 * doing backlog processing we use the BH locking scheme.
1302 * This is because we cannot sleep with the original spinlock
1303 * held.
1304 */
1305static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1306{
1307 struct ipv6_pinfo *np = inet6_sk(sk);
1308 struct tcp_sock *tp;
1309 struct sk_buff *opt_skb = NULL;
1310
1311 /* Imagine: socket is IPv6. IPv4 packet arrives,
1312 goes to IPv4 receive handler and backlogged.
1313 From backlog it always goes here. Kerboom...
1314 Fortunately, tcp_rcv_established and rcv_established
1315 handle them correctly, but it is not case with
1316 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1317 */
1318
1319 if (skb->protocol == htons(ETH_P_IP))
1320 return tcp_v4_do_rcv(sk, skb);
1321
cfb6eeb4
YH
1322#ifdef CONFIG_TCP_MD5SIG
1323 if (tcp_v6_inbound_md5_hash (sk, skb))
1324 goto discard;
1325#endif
1326
fda9ef5d 1327 if (sk_filter(sk, skb))
1da177e4
LT
1328 goto discard;
1329
1330 /*
1331 * socket locking is here for SMP purposes as backlog rcv
1332 * is currently called with bh processing disabled.
1333 */
1334
1335 /* Do Stevens' IPV6_PKTOPTIONS.
1336
1337 Yes, guys, it is the only place in our code, where we
1338 may make it not affecting IPv4.
1339 The rest of code is protocol independent,
1340 and I do not like idea to uglify IPv4.
1341
1342 Actually, all the idea behind IPV6_PKTOPTIONS
1343 looks not very well thought. For now we latch
1344 options, received in the last packet, enqueued
1345 by tcp. Feel free to propose better solution.
1ab1457c 1346 --ANK (980728)
1da177e4
LT
1347 */
1348 if (np->rxopt.all)
99a1dec7 1349 opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
1da177e4
LT
1350
1351 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
5d299f3d
ED
1352 struct dst_entry *dst = sk->sk_rx_dst;
1353
bdeab991 1354 sock_rps_save_rxhash(sk, skb);
5d299f3d
ED
1355 if (dst) {
1356 if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1357 dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1358 dst_release(dst);
1359 sk->sk_rx_dst = NULL;
1360 }
1361 }
1362
aa8223c7 1363 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1da177e4 1364 goto reset;
1da177e4
LT
1365 if (opt_skb)
1366 goto ipv6_pktoptions;
1367 return 0;
1368 }
1369
ab6a5bb6 1370 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1da177e4
LT
1371 goto csum_err;
1372
1ab1457c 1373 if (sk->sk_state == TCP_LISTEN) {
1da177e4
LT
1374 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1375 if (!nsk)
1376 goto discard;
1377
1378 /*
1379 * Queue it on the new socket if the new socket is active,
1380 * otherwise we just shortcircuit this and continue with
1381 * the new socket..
1382 */
1ab1457c 1383 if(nsk != sk) {
bdeab991 1384 sock_rps_save_rxhash(nsk, skb);
1da177e4
LT
1385 if (tcp_child_process(sk, nsk, skb))
1386 goto reset;
1387 if (opt_skb)
1388 __kfree_skb(opt_skb);
1389 return 0;
1390 }
47482f13 1391 } else
bdeab991 1392 sock_rps_save_rxhash(sk, skb);
1da177e4 1393
aa8223c7 1394 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1da177e4 1395 goto reset;
1da177e4
LT
1396 if (opt_skb)
1397 goto ipv6_pktoptions;
1398 return 0;
1399
1400reset:
cfb6eeb4 1401 tcp_v6_send_reset(sk, skb);
1da177e4
LT
1402discard:
1403 if (opt_skb)
1404 __kfree_skb(opt_skb);
1405 kfree_skb(skb);
1406 return 0;
1407csum_err:
6a5dc9e5 1408 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
63231bdd 1409 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1da177e4
LT
1410 goto discard;
1411
1412
1413ipv6_pktoptions:
1414 /* Do you ask, what is it?
1415
1416 1. skb was enqueued by tcp.
1417 2. skb is added to tail of read queue, rather than out of order.
1418 3. socket is not in passive state.
1419 4. Finally, it really contains options, which user wants to receive.
1420 */
1421 tp = tcp_sk(sk);
1422 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1423 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
333fad53 1424 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
505cbfc5 1425 np->mcast_oif = inet6_iif(opt_skb);
333fad53 1426 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
0660e03f 1427 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
4c507d28 1428 if (np->rxopt.bits.rxtclass)
e7219858 1429 np->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4
LT
1430 if (ipv6_opt_accepted(sk, opt_skb)) {
1431 skb_set_owner_r(opt_skb, sk);
1432 opt_skb = xchg(&np->pktoptions, opt_skb);
1433 } else {
1434 __kfree_skb(opt_skb);
1435 opt_skb = xchg(&np->pktoptions, NULL);
1436 }
1437 }
1438
800d55f1 1439 kfree_skb(opt_skb);
1da177e4
LT
1440 return 0;
1441}
1442
e5bbef20 1443static int tcp_v6_rcv(struct sk_buff *skb)
1da177e4 1444{
cf533ea5 1445 const struct tcphdr *th;
b71d1d42 1446 const struct ipv6hdr *hdr;
1da177e4
LT
1447 struct sock *sk;
1448 int ret;
a86b1e30 1449 struct net *net = dev_net(skb->dev);
1da177e4
LT
1450
1451 if (skb->pkt_type != PACKET_HOST)
1452 goto discard_it;
1453
1454 /*
1455 * Count it even if it's bad.
1456 */
63231bdd 1457 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1da177e4
LT
1458
1459 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1460 goto discard_it;
1461
aa8223c7 1462 th = tcp_hdr(skb);
1da177e4
LT
1463
1464 if (th->doff < sizeof(struct tcphdr)/4)
1465 goto bad_packet;
1466 if (!pskb_may_pull(skb, th->doff*4))
1467 goto discard_it;
1468
60476372 1469 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
6a5dc9e5 1470 goto csum_error;
1da177e4 1471
aa8223c7 1472 th = tcp_hdr(skb);
e802af9c 1473 hdr = ipv6_hdr(skb);
1da177e4
LT
1474 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1475 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1476 skb->len - th->doff*4);
1477 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1478 TCP_SKB_CB(skb)->when = 0;
b82d1bb4 1479 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
1da177e4
LT
1480 TCP_SKB_CB(skb)->sacked = 0;
1481
9a1f27c4 1482 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1da177e4
LT
1483 if (!sk)
1484 goto no_tcp_socket;
1485
1486process:
1487 if (sk->sk_state == TCP_TIME_WAIT)
1488 goto do_time_wait;
1489
e802af9c
SH
1490 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1491 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1492 goto discard_and_relse;
1493 }
1494
1da177e4
LT
1495 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1496 goto discard_and_relse;
1497
fda9ef5d 1498 if (sk_filter(sk, skb))
1da177e4
LT
1499 goto discard_and_relse;
1500
8b80cda5 1501 sk_mark_napi_id(sk, skb);
1da177e4
LT
1502 skb->dev = NULL;
1503
293b9c42 1504 bh_lock_sock_nested(sk);
1da177e4
LT
1505 ret = 0;
1506 if (!sock_owned_by_user(sk)) {
1a2449a8 1507#ifdef CONFIG_NET_DMA
1ab1457c 1508 struct tcp_sock *tp = tcp_sk(sk);
b4caea8a 1509 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
a2bd1140 1510 tp->ucopy.dma_chan = net_dma_find_channel();
1ab1457c
YH
1511 if (tp->ucopy.dma_chan)
1512 ret = tcp_v6_do_rcv(sk, skb);
1513 else
1a2449a8
CL
1514#endif
1515 {
1516 if (!tcp_prequeue(sk, skb))
1517 ret = tcp_v6_do_rcv(sk, skb);
1518 }
da882c1f
ED
1519 } else if (unlikely(sk_add_backlog(sk, skb,
1520 sk->sk_rcvbuf + sk->sk_sndbuf))) {
6b03a53a 1521 bh_unlock_sock(sk);
6cce09f8 1522 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
6b03a53a
ZY
1523 goto discard_and_relse;
1524 }
1da177e4
LT
1525 bh_unlock_sock(sk);
1526
1527 sock_put(sk);
1528 return ret ? -1 : 0;
1529
1530no_tcp_socket:
1531 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1532 goto discard_it;
1533
1534 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
6a5dc9e5
ED
1535csum_error:
1536 TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
1da177e4 1537bad_packet:
63231bdd 1538 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1da177e4 1539 } else {
cfb6eeb4 1540 tcp_v6_send_reset(NULL, skb);
1da177e4
LT
1541 }
1542
1543discard_it:
1da177e4
LT
1544 kfree_skb(skb);
1545 return 0;
1546
1547discard_and_relse:
1548 sock_put(sk);
1549 goto discard_it;
1550
1551do_time_wait:
1552 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
9469c7b4 1553 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1554 goto discard_it;
1555 }
1556
6a5dc9e5 1557 if (skb->len < (th->doff<<2)) {
9469c7b4 1558 inet_twsk_put(inet_twsk(sk));
6a5dc9e5
ED
1559 goto bad_packet;
1560 }
1561 if (tcp_checksum_complete(skb)) {
1562 inet_twsk_put(inet_twsk(sk));
1563 goto csum_error;
1da177e4
LT
1564 }
1565
9469c7b4 1566 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1da177e4
LT
1567 case TCP_TW_SYN:
1568 {
1569 struct sock *sk2;
1570
c346dca1 1571 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
5ba24953 1572 &ipv6_hdr(skb)->saddr, th->source,
0660e03f 1573 &ipv6_hdr(skb)->daddr,
505cbfc5 1574 ntohs(th->dest), inet6_iif(skb));
1da177e4 1575 if (sk2 != NULL) {
295ff7ed
ACM
1576 struct inet_timewait_sock *tw = inet_twsk(sk);
1577 inet_twsk_deschedule(tw, &tcp_death_row);
1578 inet_twsk_put(tw);
1da177e4
LT
1579 sk = sk2;
1580 goto process;
1581 }
1582 /* Fall through to ACK */
1583 }
1584 case TCP_TW_ACK:
1585 tcp_v6_timewait_ack(sk, skb);
1586 break;
1587 case TCP_TW_RST:
1588 goto no_tcp_socket;
1589 case TCP_TW_SUCCESS:;
1590 }
1591 goto discard_it;
1592}
1593
c7109986
ED
1594static void tcp_v6_early_demux(struct sk_buff *skb)
1595{
1596 const struct ipv6hdr *hdr;
1597 const struct tcphdr *th;
1598 struct sock *sk;
1599
1600 if (skb->pkt_type != PACKET_HOST)
1601 return;
1602
1603 if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1604 return;
1605
1606 hdr = ipv6_hdr(skb);
1607 th = tcp_hdr(skb);
1608
1609 if (th->doff < sizeof(struct tcphdr) / 4)
1610 return;
1611
1612 sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1613 &hdr->saddr, th->source,
1614 &hdr->daddr, ntohs(th->dest),
1615 inet6_iif(skb));
1616 if (sk) {
1617 skb->sk = sk;
1618 skb->destructor = sock_edemux;
1619 if (sk->sk_state != TCP_TIME_WAIT) {
1620 struct dst_entry *dst = sk->sk_rx_dst;
f3f12135 1621
c7109986 1622 if (dst)
5d299f3d 1623 dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
c7109986 1624 if (dst &&
f3f12135 1625 inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
c7109986
ED
1626 skb_dst_set_noref(skb, dst);
1627 }
1628 }
1629}
1630
ccb7c410
DM
1631static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1632 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1633 .twsk_unique = tcp_twsk_unique,
1634 .twsk_destructor= tcp_twsk_destructor,
ccb7c410
DM
1635};
1636
3b401a81 1637static const struct inet_connection_sock_af_ops ipv6_specific = {
543d9cfe
ACM
1638 .queue_xmit = inet6_csk_xmit,
1639 .send_check = tcp_v6_send_check,
1640 .rebuild_header = inet6_sk_rebuild_header,
5d299f3d 1641 .sk_rx_dst_set = inet6_sk_rx_dst_set,
543d9cfe
ACM
1642 .conn_request = tcp_v6_conn_request,
1643 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe 1644 .net_header_len = sizeof(struct ipv6hdr),
67469601 1645 .net_frag_header_len = sizeof(struct frag_hdr),
543d9cfe
ACM
1646 .setsockopt = ipv6_setsockopt,
1647 .getsockopt = ipv6_getsockopt,
1648 .addr2sockaddr = inet6_csk_addr2sockaddr,
1649 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1650 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1651#ifdef CONFIG_COMPAT
543d9cfe
ACM
1652 .compat_setsockopt = compat_ipv6_setsockopt,
1653 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1654#endif
1da177e4
LT
1655};
1656
#ifdef CONFIG_TCP_MD5SIG
/* TCP MD5 signature hooks for native IPv6 sockets. */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_lookup	= tcp_v6_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1664
1da177e4
LT
1665/*
1666 * TCP over IPv4 via INET6 API
1667 */
1668
3b401a81 1669static const struct inet_connection_sock_af_ops ipv6_mapped = {
543d9cfe
ACM
1670 .queue_xmit = ip_queue_xmit,
1671 .send_check = tcp_v4_send_check,
1672 .rebuild_header = inet_sk_rebuild_header,
63d02d15 1673 .sk_rx_dst_set = inet_sk_rx_dst_set,
543d9cfe
ACM
1674 .conn_request = tcp_v6_conn_request,
1675 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe
ACM
1676 .net_header_len = sizeof(struct iphdr),
1677 .setsockopt = ipv6_setsockopt,
1678 .getsockopt = ipv6_getsockopt,
1679 .addr2sockaddr = inet6_csk_addr2sockaddr,
1680 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1681 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1682#ifdef CONFIG_COMPAT
543d9cfe
ACM
1683 .compat_setsockopt = compat_ipv6_setsockopt,
1684 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1685#endif
1da177e4
LT
1686};
1687
#ifdef CONFIG_TCP_MD5SIG
/*
 * TCP MD5 signature hooks for v6-mapped sockets: lookup and hashing use
 * the IPv4 routines, key parsing the IPv6 one.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_lookup	= tcp_v4_md5_lookup,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1695
1da177e4
LT
1696/* NOTE: A lot of things set to zero explicitly by call to
1697 * sk_alloc() so need not be done here.
1698 */
1699static int tcp_v6_init_sock(struct sock *sk)
1700{
6687e988 1701 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4 1702
900f65d3 1703 tcp_init_sock(sk);
1da177e4 1704
8292a17a 1705 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 1706
cfb6eeb4 1707#ifdef CONFIG_TCP_MD5SIG
ac807fa8 1708 tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
cfb6eeb4
YH
1709#endif
1710
1da177e4
LT
1711 return 0;
1712}
1713
/* Tear down a TCPv6 socket: the common TCP state first, then the IPv6 part. */
static void tcp_v6_destroy_sock(struct sock *sk)
{
	tcp_v4_destroy_sock(sk);
	inet6_destroy_sock(sk);
}
1719
952a10be 1720#ifdef CONFIG_PROC_FS
1da177e4 1721/* Proc filesystem TCPv6 sock list dumping. */
1ab1457c 1722static void get_openreq6(struct seq_file *seq,
a7cb5a49 1723 const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
1da177e4 1724{
1da177e4 1725 int ttd = req->expires - jiffies;
b71d1d42
ED
1726 const struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1727 const struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1da177e4
LT
1728
1729 if (ttd < 0)
1730 ttd = 0;
1731
1da177e4
LT
1732 seq_printf(seq,
1733 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1734 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1da177e4
LT
1735 i,
1736 src->s6_addr32[0], src->s6_addr32[1],
1737 src->s6_addr32[2], src->s6_addr32[3],
fd507037 1738 ntohs(inet_rsk(req)->loc_port),
1da177e4
LT
1739 dest->s6_addr32[0], dest->s6_addr32[1],
1740 dest->s6_addr32[2], dest->s6_addr32[3],
2e6599cb 1741 ntohs(inet_rsk(req)->rmt_port),
1da177e4
LT
1742 TCP_SYN_RECV,
1743 0,0, /* could print option size, but that is af dependent. */
1ab1457c
YH
1744 1, /* timers active (only the expire timer) */
1745 jiffies_to_clock_t(ttd),
e6c022a4 1746 req->num_timeout,
a7cb5a49 1747 from_kuid_munged(seq_user_ns(seq), uid),
1ab1457c 1748 0, /* non standard timer */
1da177e4
LT
1749 0, /* open_requests have no inode */
1750 0, req);
1751}
1752
1753static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1754{
b71d1d42 1755 const struct in6_addr *dest, *src;
1da177e4
LT
1756 __u16 destp, srcp;
1757 int timer_active;
1758 unsigned long timer_expires;
cf533ea5
ED
1759 const struct inet_sock *inet = inet_sk(sp);
1760 const struct tcp_sock *tp = tcp_sk(sp);
463c84b9 1761 const struct inet_connection_sock *icsk = inet_csk(sp);
cf533ea5 1762 const struct ipv6_pinfo *np = inet6_sk(sp);
1da177e4
LT
1763
1764 dest = &np->daddr;
1765 src = &np->rcv_saddr;
c720c7e8
ED
1766 destp = ntohs(inet->inet_dport);
1767 srcp = ntohs(inet->inet_sport);
463c84b9
ACM
1768
1769 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1da177e4 1770 timer_active = 1;
463c84b9
ACM
1771 timer_expires = icsk->icsk_timeout;
1772 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1da177e4 1773 timer_active = 4;
463c84b9 1774 timer_expires = icsk->icsk_timeout;
1da177e4
LT
1775 } else if (timer_pending(&sp->sk_timer)) {
1776 timer_active = 2;
1777 timer_expires = sp->sk_timer.expires;
1778 } else {
1779 timer_active = 0;
1780 timer_expires = jiffies;
1781 }
1782
1783 seq_printf(seq,
1784 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1785 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %pK %lu %lu %u %u %d\n",
1da177e4
LT
1786 i,
1787 src->s6_addr32[0], src->s6_addr32[1],
1788 src->s6_addr32[2], src->s6_addr32[3], srcp,
1789 dest->s6_addr32[0], dest->s6_addr32[1],
1790 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1ab1457c 1791 sp->sk_state,
47da8ee6
SS
1792 tp->write_seq-tp->snd_una,
1793 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1da177e4 1794 timer_active,
a399a805 1795 jiffies_delta_to_clock_t(timer_expires - jiffies),
463c84b9 1796 icsk->icsk_retransmits,
a7cb5a49 1797 from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
6687e988 1798 icsk->icsk_probes_out,
1da177e4
LT
1799 sock_i_ino(sp),
1800 atomic_read(&sp->sk_refcnt), sp,
7be87351
SH
1801 jiffies_to_clock_t(icsk->icsk_rto),
1802 jiffies_to_clock_t(icsk->icsk_ack.ato),
463c84b9 1803 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
0b6a05c1
IJ
1804 tp->snd_cwnd,
1805 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
1da177e4
LT
1806 );
1807}
1808
1ab1457c 1809static void get_timewait6_sock(struct seq_file *seq,
8feaf0c0 1810 struct inet_timewait_sock *tw, int i)
1da177e4 1811{
b71d1d42 1812 const struct in6_addr *dest, *src;
1da177e4 1813 __u16 destp, srcp;
cf533ea5 1814 const struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
a399a805 1815 long delta = tw->tw_ttd - jiffies;
1da177e4 1816
0fa1a53e
ACM
1817 dest = &tw6->tw_v6_daddr;
1818 src = &tw6->tw_v6_rcv_saddr;
1da177e4
LT
1819 destp = ntohs(tw->tw_dport);
1820 srcp = ntohs(tw->tw_sport);
1821
1822 seq_printf(seq,
1823 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1824 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1da177e4
LT
1825 i,
1826 src->s6_addr32[0], src->s6_addr32[1],
1827 src->s6_addr32[2], src->s6_addr32[3], srcp,
1828 dest->s6_addr32[0], dest->s6_addr32[1],
1829 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1830 tw->tw_substate, 0, 0,
a399a805 1831 3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
1da177e4
LT
1832 atomic_read(&tw->tw_refcnt), tw);
1833}
1834
1da177e4
LT
1835static int tcp6_seq_show(struct seq_file *seq, void *v)
1836{
1837 struct tcp_iter_state *st;
1838
1839 if (v == SEQ_START_TOKEN) {
1840 seq_puts(seq,
1841 " sl "
1842 "local_address "
1843 "remote_address "
1844 "st tx_queue rx_queue tr tm->when retrnsmt"
1845 " uid timeout inode\n");
1846 goto out;
1847 }
1848 st = seq->private;
1849
1850 switch (st->state) {
1851 case TCP_SEQ_STATE_LISTENING:
1852 case TCP_SEQ_STATE_ESTABLISHED:
1853 get_tcp6_sock(seq, v, st->num);
1854 break;
1855 case TCP_SEQ_STATE_OPENREQ:
1856 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1857 break;
1858 case TCP_SEQ_STATE_TIME_WAIT:
1859 get_timewait6_sock(seq, v, st->num);
1860 break;
1861 }
1862out:
1863 return 0;
1864}
1865
73cb88ec
AV
1866static const struct file_operations tcp6_afinfo_seq_fops = {
1867 .owner = THIS_MODULE,
1868 .open = tcp_seq_open,
1869 .read = seq_read,
1870 .llseek = seq_lseek,
1871 .release = seq_release_net
1872};
1873
1da177e4 1874static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1da177e4
LT
1875 .name = "tcp6",
1876 .family = AF_INET6,
73cb88ec 1877 .seq_fops = &tcp6_afinfo_seq_fops,
9427c4b3
DL
1878 .seq_ops = {
1879 .show = tcp6_seq_show,
1880 },
1da177e4
LT
1881};
1882
2c8c1e72 1883int __net_init tcp6_proc_init(struct net *net)
1da177e4 1884{
6f8b13bc 1885 return tcp_proc_register(net, &tcp6_seq_afinfo);
1da177e4
LT
1886}
1887
6f8b13bc 1888void tcp6_proc_exit(struct net *net)
1da177e4 1889{
6f8b13bc 1890 tcp_proc_unregister(net, &tcp6_seq_afinfo);
1da177e4
LT
1891}
1892#endif
1893
f77d6021
ED
1894static void tcp_v6_clear_sk(struct sock *sk, int size)
1895{
1896 struct inet_sock *inet = inet_sk(sk);
1897
1898 /* we do not want to clear pinet6 field, because of RCU lookups */
1899 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1900
1901 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1902 memset(&inet->pinet6 + 1, 0, size);
1903}
1904
1da177e4
LT
1905struct proto tcpv6_prot = {
1906 .name = "TCPv6",
1907 .owner = THIS_MODULE,
1908 .close = tcp_close,
1909 .connect = tcp_v6_connect,
1910 .disconnect = tcp_disconnect,
463c84b9 1911 .accept = inet_csk_accept,
1da177e4
LT
1912 .ioctl = tcp_ioctl,
1913 .init = tcp_v6_init_sock,
1914 .destroy = tcp_v6_destroy_sock,
1915 .shutdown = tcp_shutdown,
1916 .setsockopt = tcp_setsockopt,
1917 .getsockopt = tcp_getsockopt,
1da177e4 1918 .recvmsg = tcp_recvmsg,
7ba42910
CG
1919 .sendmsg = tcp_sendmsg,
1920 .sendpage = tcp_sendpage,
1da177e4 1921 .backlog_rcv = tcp_v6_do_rcv,
46d3ceab 1922 .release_cb = tcp_release_cb,
563d34d0 1923 .mtu_reduced = tcp_v6_mtu_reduced,
1da177e4 1924 .hash = tcp_v6_hash,
ab1e0a13
ACM
1925 .unhash = inet_unhash,
1926 .get_port = inet_csk_get_port,
1da177e4 1927 .enter_memory_pressure = tcp_enter_memory_pressure,
c9bee3b7 1928 .stream_memory_free = tcp_stream_memory_free,
1da177e4
LT
1929 .sockets_allocated = &tcp_sockets_allocated,
1930 .memory_allocated = &tcp_memory_allocated,
1931 .memory_pressure = &tcp_memory_pressure,
0a5578cf 1932 .orphan_count = &tcp_orphan_count,
1da177e4
LT
1933 .sysctl_wmem = sysctl_tcp_wmem,
1934 .sysctl_rmem = sysctl_tcp_rmem,
1935 .max_header = MAX_TCP_HEADER,
1936 .obj_size = sizeof(struct tcp6_sock),
3ab5aee7 1937 .slab_flags = SLAB_DESTROY_BY_RCU,
6d6ee43e 1938 .twsk_prot = &tcp6_timewait_sock_ops,
60236fdd 1939 .rsk_prot = &tcp6_request_sock_ops,
39d8cda7 1940 .h.hashinfo = &tcp_hashinfo,
7ba42910 1941 .no_autobind = true,
543d9cfe
ACM
1942#ifdef CONFIG_COMPAT
1943 .compat_setsockopt = compat_tcp_setsockopt,
1944 .compat_getsockopt = compat_tcp_getsockopt,
1945#endif
c255a458 1946#ifdef CONFIG_MEMCG_KMEM
d1a4c0b3
GC
1947 .proto_cgroup = tcp_proto_cgroup,
1948#endif
f77d6021 1949 .clear_sk = tcp_v6_clear_sk,
1da177e4
LT
1950};
1951
41135cc8 1952static const struct inet6_protocol tcpv6_protocol = {
c7109986 1953 .early_demux = tcp_v6_early_demux,
1da177e4
LT
1954 .handler = tcp_v6_rcv,
1955 .err_handler = tcp_v6_err,
1956 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1957};
1958
1da177e4
LT
1959static struct inet_protosw tcpv6_protosw = {
1960 .type = SOCK_STREAM,
1961 .protocol = IPPROTO_TCP,
1962 .prot = &tcpv6_prot,
1963 .ops = &inet6_stream_ops,
1da177e4 1964 .no_check = 0,
d83d8461
ACM
1965 .flags = INET_PROTOSW_PERMANENT |
1966 INET_PROTOSW_ICSK,
1da177e4
LT
1967};
1968
2c8c1e72 1969static int __net_init tcpv6_net_init(struct net *net)
93ec926b 1970{
5677242f
DL
1971 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
1972 SOCK_RAW, IPPROTO_TCP, net);
93ec926b
DL
1973}
1974
2c8c1e72 1975static void __net_exit tcpv6_net_exit(struct net *net)
93ec926b 1976{
5677242f 1977 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
b099ce26
EB
1978}
1979
2c8c1e72 1980static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
b099ce26
EB
1981{
1982 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
93ec926b
DL
1983}
1984
1985static struct pernet_operations tcpv6_net_ops = {
b099ce26
EB
1986 .init = tcpv6_net_init,
1987 .exit = tcpv6_net_exit,
1988 .exit_batch = tcpv6_net_exit_batch,
93ec926b
DL
1989};
1990
7f4e4868 1991int __init tcpv6_init(void)
1da177e4 1992{
7f4e4868
DL
1993 int ret;
1994
3336288a
VY
1995 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
1996 if (ret)
c6b641a4 1997 goto out;
3336288a 1998
1da177e4 1999 /* register inet6 protocol */
7f4e4868
DL
2000 ret = inet6_register_protosw(&tcpv6_protosw);
2001 if (ret)
2002 goto out_tcpv6_protocol;
2003
93ec926b 2004 ret = register_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2005 if (ret)
2006 goto out_tcpv6_protosw;
2007out:
2008 return ret;
ae0f7d5f 2009
7f4e4868
DL
2010out_tcpv6_protosw:
2011 inet6_unregister_protosw(&tcpv6_protosw);
3336288a
VY
2012out_tcpv6_protocol:
2013 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
7f4e4868
DL
2014 goto out;
2015}
2016
09f7709f 2017void tcpv6_exit(void)
7f4e4868 2018{
93ec926b 2019 unregister_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2020 inet6_unregister_protosw(&tcpv6_protosw);
2021 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
1da177e4 2022}