net: gro: allow to build full sized skb
[linux-2.6-block.git] / net / ipv6 / tcp_ipv6.c
CommitLineData
1da177e4
LT
/*
 *	TCP over IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	Based on:
 *	linux/net/ipv4/tcp.c
 *	linux/net/ipv4/tcp_input.c
 *	linux/net/ipv4/tcp_output.c
 *
 *	Fixes:
 *	Hideaki YOSHIFUJI	:	sin6_scope_id support
 *	YOSHIFUJI Hideaki @USAGI and:	Support IPV6_V6ONLY socket option, which
 *	Alexey Kuznetsov		allow both IPv4 and IPv6 sockets to bind
 *					a single port at the same time.
 *	YOSHIFUJI Hideaki @USAGI:	convert /proc/net/tcp6 to seq_file.
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */
25
eb4dea58 26#include <linux/bottom_half.h>
1da177e4 27#include <linux/module.h>
1da177e4
LT
28#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
5a0e3ad6 41#include <linux/slab.h>
1da177e4
LT
42
43#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
5324a040 49#include <net/inet6_hashtables.h>
8129765a 50#include <net/inet6_connection_sock.h>
1da177e4
LT
51#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
1da177e4
LT
59#include <net/snmp.h>
60#include <net/dsfield.h>
6d6ee43e 61#include <net/timewait_sock.h>
18134bed 62#include <net/netdma.h>
3d58b5fa 63#include <net/inet_common.h>
6e5714ea 64#include <net/secure_seq.h>
d1a4c0b3 65#include <net/tcp_memcontrol.h>
076bb0c8 66#include <net/busy_poll.h>
1da177e4
LT
67
68#include <asm/uaccess.h>
69
70#include <linux/proc_fs.h>
71#include <linux/seq_file.h>
72
cfb6eeb4
YH
73#include <linux/crypto.h>
74#include <linux/scatterlist.h>
75
cfb6eeb4 76static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
6edafaaf
GJ
77static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
78 struct request_sock *req);
1da177e4
LT
79
80static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
1da177e4 81
3b401a81
SH
82static const struct inet_connection_sock_af_ops ipv6_mapped;
83static const struct inet_connection_sock_af_ops ipv6_specific;
a928630a 84#ifdef CONFIG_TCP_MD5SIG
b2e4b3de
SH
85static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
86static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
9501f972
YH
87#else
88static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 89 const struct in6_addr *addr)
9501f972
YH
90{
91 return NULL;
92}
a928630a 93#endif
1da177e4 94
fae6ef87
NC
95static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
96{
97 struct dst_entry *dst = skb_dst(skb);
98 const struct rt6_info *rt = (const struct rt6_info *)dst;
99
100 dst_hold(dst);
101 sk->sk_rx_dst = dst;
102 inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
103 if (rt->rt6i_node)
104 inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
105}
106
1da177e4
LT
107static void tcp_v6_hash(struct sock *sk)
108{
109 if (sk->sk_state != TCP_CLOSE) {
8292a17a 110 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
1da177e4
LT
111 tcp_prot.hash(sk);
112 return;
113 }
114 local_bh_disable();
9327f705 115 __inet6_hash(sk, NULL);
1da177e4
LT
116 local_bh_enable();
117 }
118}
119
cf533ea5 120static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
1da177e4 121{
0660e03f
ACM
122 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
123 ipv6_hdr(skb)->saddr.s6_addr32,
aa8223c7
ACM
124 tcp_hdr(skb)->dest,
125 tcp_hdr(skb)->source);
1da177e4
LT
126}
127
1ab1457c 128static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
1da177e4
LT
129 int addr_len)
130{
131 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
1ab1457c 132 struct inet_sock *inet = inet_sk(sk);
d83d8461 133 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
134 struct ipv6_pinfo *np = inet6_sk(sk);
135 struct tcp_sock *tp = tcp_sk(sk);
20c59de2 136 struct in6_addr *saddr = NULL, *final_p, final;
493f377d 137 struct rt6_info *rt;
4c9483b2 138 struct flowi6 fl6;
1da177e4
LT
139 struct dst_entry *dst;
140 int addr_type;
141 int err;
142
1ab1457c 143 if (addr_len < SIN6_LEN_RFC2133)
1da177e4
LT
144 return -EINVAL;
145
1ab1457c 146 if (usin->sin6_family != AF_INET6)
a02cec21 147 return -EAFNOSUPPORT;
1da177e4 148
4c9483b2 149 memset(&fl6, 0, sizeof(fl6));
1da177e4
LT
150
151 if (np->sndflow) {
4c9483b2
DM
152 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
153 IP6_ECN_flow_init(fl6.flowlabel);
154 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
1da177e4 155 struct ip6_flowlabel *flowlabel;
4c9483b2 156 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
1da177e4
LT
157 if (flowlabel == NULL)
158 return -EINVAL;
4e3fd7a0 159 usin->sin6_addr = flowlabel->dst;
1da177e4
LT
160 fl6_sock_release(flowlabel);
161 }
162 }
163
164 /*
1ab1457c
YH
165 * connect() to INADDR_ANY means loopback (BSD'ism).
166 */
167
168 if(ipv6_addr_any(&usin->sin6_addr))
169 usin->sin6_addr.s6_addr[15] = 0x1;
1da177e4
LT
170
171 addr_type = ipv6_addr_type(&usin->sin6_addr);
172
173 if(addr_type & IPV6_ADDR_MULTICAST)
174 return -ENETUNREACH;
175
176 if (addr_type&IPV6_ADDR_LINKLOCAL) {
177 if (addr_len >= sizeof(struct sockaddr_in6) &&
178 usin->sin6_scope_id) {
179 /* If interface is set while binding, indices
180 * must coincide.
181 */
182 if (sk->sk_bound_dev_if &&
183 sk->sk_bound_dev_if != usin->sin6_scope_id)
184 return -EINVAL;
185
186 sk->sk_bound_dev_if = usin->sin6_scope_id;
187 }
188
189 /* Connect to link-local address requires an interface */
190 if (!sk->sk_bound_dev_if)
191 return -EINVAL;
192 }
193
194 if (tp->rx_opt.ts_recent_stamp &&
efe4208f 195 !ipv6_addr_equal(&sk->sk_v6_daddr, &usin->sin6_addr)) {
1da177e4
LT
196 tp->rx_opt.ts_recent = 0;
197 tp->rx_opt.ts_recent_stamp = 0;
198 tp->write_seq = 0;
199 }
200
efe4208f 201 sk->sk_v6_daddr = usin->sin6_addr;
4c9483b2 202 np->flow_label = fl6.flowlabel;
1da177e4
LT
203
204 /*
205 * TCP over IPv4
206 */
207
208 if (addr_type == IPV6_ADDR_MAPPED) {
d83d8461 209 u32 exthdrlen = icsk->icsk_ext_hdr_len;
1da177e4
LT
210 struct sockaddr_in sin;
211
212 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
213
214 if (__ipv6_only_sock(sk))
215 return -ENETUNREACH;
216
217 sin.sin_family = AF_INET;
218 sin.sin_port = usin->sin6_port;
219 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
220
d83d8461 221 icsk->icsk_af_ops = &ipv6_mapped;
1da177e4 222 sk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
223#ifdef CONFIG_TCP_MD5SIG
224 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
225#endif
1da177e4
LT
226
227 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
228
229 if (err) {
d83d8461
ACM
230 icsk->icsk_ext_hdr_len = exthdrlen;
231 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 232 sk->sk_backlog_rcv = tcp_v6_do_rcv;
cfb6eeb4
YH
233#ifdef CONFIG_TCP_MD5SIG
234 tp->af_specific = &tcp_sock_ipv6_specific;
235#endif
1da177e4
LT
236 goto failure;
237 } else {
c720c7e8
ED
238 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
239 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
efe4208f 240 &sk->sk_v6_rcv_saddr);
1da177e4
LT
241 }
242
243 return err;
244 }
245
efe4208f
ED
246 if (!ipv6_addr_any(&sk->sk_v6_rcv_saddr))
247 saddr = &sk->sk_v6_rcv_saddr;
1da177e4 248
4c9483b2 249 fl6.flowi6_proto = IPPROTO_TCP;
efe4208f 250 fl6.daddr = sk->sk_v6_daddr;
4e3fd7a0 251 fl6.saddr = saddr ? *saddr : np->saddr;
4c9483b2
DM
252 fl6.flowi6_oif = sk->sk_bound_dev_if;
253 fl6.flowi6_mark = sk->sk_mark;
1958b856
DM
254 fl6.fl6_dport = usin->sin6_port;
255 fl6.fl6_sport = inet->inet_sport;
1da177e4 256
4c9483b2 257 final_p = fl6_update_dst(&fl6, np->opt, &final);
1da177e4 258
4c9483b2 259 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
beb8d13b 260
4c9483b2 261 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
68d0c6d3
DM
262 if (IS_ERR(dst)) {
263 err = PTR_ERR(dst);
1da177e4 264 goto failure;
14e50e57 265 }
1da177e4
LT
266
267 if (saddr == NULL) {
4c9483b2 268 saddr = &fl6.saddr;
efe4208f 269 sk->sk_v6_rcv_saddr = *saddr;
1da177e4
LT
270 }
271
272 /* set the source address */
4e3fd7a0 273 np->saddr = *saddr;
c720c7e8 274 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 275
f83ef8c0 276 sk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 277 __ip6_dst_store(sk, dst, NULL, NULL);
1da177e4 278
493f377d
DM
279 rt = (struct rt6_info *) dst;
280 if (tcp_death_row.sysctl_tw_recycle &&
281 !tp->rx_opt.ts_recent_stamp &&
efe4208f 282 ipv6_addr_equal(&rt->rt6i_dst.addr, &sk->sk_v6_daddr))
81166dd6 283 tcp_fetch_timewait_stamp(sk, dst);
493f377d 284
d83d8461 285 icsk->icsk_ext_hdr_len = 0;
1da177e4 286 if (np->opt)
d83d8461
ACM
287 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
288 np->opt->opt_nflen);
1da177e4
LT
289
290 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
291
c720c7e8 292 inet->inet_dport = usin->sin6_port;
1da177e4
LT
293
294 tcp_set_state(sk, TCP_SYN_SENT);
d8313f5c 295 err = inet6_hash_connect(&tcp_death_row, sk);
1da177e4
LT
296 if (err)
297 goto late_failure;
298
2b916477 299 if (!tp->write_seq && likely(!tp->repair))
1da177e4 300 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
efe4208f 301 sk->sk_v6_daddr.s6_addr32,
c720c7e8
ED
302 inet->inet_sport,
303 inet->inet_dport);
1da177e4
LT
304
305 err = tcp_connect(sk);
306 if (err)
307 goto late_failure;
308
309 return 0;
310
311late_failure:
312 tcp_set_state(sk, TCP_CLOSE);
313 __sk_dst_reset(sk);
314failure:
c720c7e8 315 inet->inet_dport = 0;
1da177e4
LT
316 sk->sk_route_caps = 0;
317 return err;
318}
319
563d34d0
ED
320static void tcp_v6_mtu_reduced(struct sock *sk)
321{
322 struct dst_entry *dst;
323
324 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
325 return;
326
327 dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
328 if (!dst)
329 return;
330
331 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
332 tcp_sync_mss(sk, dst_mtu(dst));
333 tcp_simple_retransmit(sk);
334 }
335}
336
1da177e4 337static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
d5fdd6ba 338 u8 type, u8 code, int offset, __be32 info)
1da177e4 339{
b71d1d42 340 const struct ipv6hdr *hdr = (const struct ipv6hdr*)skb->data;
505cbfc5 341 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
1da177e4
LT
342 struct ipv6_pinfo *np;
343 struct sock *sk;
344 int err;
1ab1457c 345 struct tcp_sock *tp;
1da177e4 346 __u32 seq;
ca12a1a4 347 struct net *net = dev_net(skb->dev);
1da177e4 348
ca12a1a4 349 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
d86e0dac 350 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
1da177e4
LT
351
352 if (sk == NULL) {
e41b5368
DL
353 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
354 ICMP6_MIB_INERRORS);
1da177e4
LT
355 return;
356 }
357
358 if (sk->sk_state == TCP_TIME_WAIT) {
9469c7b4 359 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
360 return;
361 }
362
363 bh_lock_sock(sk);
563d34d0 364 if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
de0744af 365 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
1da177e4
LT
366
367 if (sk->sk_state == TCP_CLOSE)
368 goto out;
369
e802af9c
SH
370 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
371 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
372 goto out;
373 }
374
1da177e4 375 tp = tcp_sk(sk);
1ab1457c 376 seq = ntohl(th->seq);
1da177e4
LT
377 if (sk->sk_state != TCP_LISTEN &&
378 !between(seq, tp->snd_una, tp->snd_nxt)) {
de0744af 379 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
380 goto out;
381 }
382
383 np = inet6_sk(sk);
384
ec18d9a2
DM
385 if (type == NDISC_REDIRECT) {
386 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
387
1ed5c48f 388 if (dst)
6700c270 389 dst->ops->redirect(dst, sk, skb);
50a75a89 390 goto out;
ec18d9a2
DM
391 }
392
1da177e4 393 if (type == ICMPV6_PKT_TOOBIG) {
0d4f0608
ED
394 /* We are not interested in TCP_LISTEN and open_requests
395 * (SYN-ACKs send out by Linux are always <576bytes so
396 * they should go through unfragmented).
397 */
398 if (sk->sk_state == TCP_LISTEN)
399 goto out;
400
563d34d0
ED
401 tp->mtu_info = ntohl(info);
402 if (!sock_owned_by_user(sk))
403 tcp_v6_mtu_reduced(sk);
d013ef2a
JA
404 else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
405 &tp->tsq_flags))
406 sock_hold(sk);
1da177e4
LT
407 goto out;
408 }
409
410 icmpv6_err_convert(type, code, &err);
411
60236fdd 412 /* Might be for an request_sock */
1da177e4 413 switch (sk->sk_state) {
60236fdd 414 struct request_sock *req, **prev;
1da177e4
LT
415 case TCP_LISTEN:
416 if (sock_owned_by_user(sk))
417 goto out;
418
8129765a
ACM
419 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
420 &hdr->saddr, inet6_iif(skb));
1da177e4
LT
421 if (!req)
422 goto out;
423
424 /* ICMPs are not backlogged, hence we cannot get
425 * an established socket here.
426 */
547b792c 427 WARN_ON(req->sk != NULL);
1da177e4 428
2e6599cb 429 if (seq != tcp_rsk(req)->snt_isn) {
de0744af 430 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
431 goto out;
432 }
433
463c84b9 434 inet_csk_reqsk_queue_drop(sk, req, prev);
5f1e942c 435 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
436 goto out;
437
438 case TCP_SYN_SENT:
439 case TCP_SYN_RECV: /* Cannot happen.
1ab1457c 440 It can, it SYNs are crossed. --ANK */
1da177e4 441 if (!sock_owned_by_user(sk)) {
1da177e4
LT
442 sk->sk_err = err;
443 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
444
445 tcp_done(sk);
446 } else
447 sk->sk_err_soft = err;
448 goto out;
449 }
450
451 if (!sock_owned_by_user(sk) && np->recverr) {
452 sk->sk_err = err;
453 sk->sk_error_report(sk);
454 } else
455 sk->sk_err_soft = err;
456
457out:
458 bh_unlock_sock(sk);
459 sock_put(sk);
460}
461
462
9f10d3f6
NC
463static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
464 struct flowi6 *fl6,
3840a06e 465 struct request_sock *req,
fff32699 466 u16 queue_mapping)
1da177e4 467{
ca304b61 468 struct inet6_request_sock *treq = inet6_rsk(req);
1da177e4
LT
469 struct ipv6_pinfo *np = inet6_sk(sk);
470 struct sk_buff * skb;
9494218f 471 int err = -ENOMEM;
1da177e4 472
9f10d3f6
NC
473 /* First, grab a route. */
474 if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
fd80eb94 475 goto done;
9494218f 476
1a2c6181 477 skb = tcp_make_synack(sk, dst, req, NULL);
9494218f 478
1da177e4 479 if (skb) {
8ad50d96 480 __tcp_v6_send_check(skb, &treq->loc_addr, &treq->rmt_addr);
1da177e4 481
9f10d3f6 482 fl6->daddr = treq->rmt_addr;
fff32699 483 skb_set_queue_mapping(skb, queue_mapping);
43264e0b 484 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
b9df3cb8 485 err = net_xmit_eval(err);
1da177e4
LT
486 }
487
488done:
1da177e4
LT
489 return err;
490}
491
1a2c6181 492static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req)
72659ecc 493{
9f10d3f6 494 struct flowi6 fl6;
e6c022a4 495 int res;
9f10d3f6 496
1a2c6181 497 res = tcp_v6_send_synack(sk, NULL, &fl6, req, 0);
e6c022a4
ED
498 if (!res)
499 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
500 return res;
72659ecc
OP
501}
502
60236fdd 503static void tcp_v6_reqsk_destructor(struct request_sock *req)
1da177e4 504{
800d55f1 505 kfree_skb(inet6_rsk(req)->pktopts);
1da177e4
LT
506}
507
cfb6eeb4
YH
508#ifdef CONFIG_TCP_MD5SIG
509static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 510 const struct in6_addr *addr)
cfb6eeb4 511{
a915da9b 512 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
cfb6eeb4
YH
513}
514
515static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
516 struct sock *addr_sk)
517{
efe4208f 518 return tcp_v6_md5_do_lookup(sk, &addr_sk->sk_v6_daddr);
cfb6eeb4
YH
519}
520
521static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
522 struct request_sock *req)
523{
524 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
525}
526
cfb6eeb4
YH
527static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
528 int optlen)
529{
530 struct tcp_md5sig cmd;
531 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
cfb6eeb4
YH
532
533 if (optlen < sizeof(cmd))
534 return -EINVAL;
535
536 if (copy_from_user(&cmd, optval, sizeof(cmd)))
537 return -EFAULT;
538
539 if (sin6->sin6_family != AF_INET6)
540 return -EINVAL;
541
542 if (!cmd.tcpm_keylen) {
e773e4fa 543 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
a915da9b
ED
544 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
545 AF_INET);
546 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
547 AF_INET6);
cfb6eeb4
YH
548 }
549
550 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
551 return -EINVAL;
552
a915da9b
ED
553 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
554 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
555 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4 556
a915da9b
ED
557 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
558 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4
YH
559}
560
49a72dfb 561static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
b71d1d42
ED
562 const struct in6_addr *daddr,
563 const struct in6_addr *saddr, int nbytes)
cfb6eeb4 564{
cfb6eeb4 565 struct tcp6_pseudohdr *bp;
49a72dfb 566 struct scatterlist sg;
8d26d76d 567
cfb6eeb4 568 bp = &hp->md5_blk.ip6;
cfb6eeb4 569 /* 1. TCP pseudo-header (RFC2460) */
4e3fd7a0
AD
570 bp->saddr = *saddr;
571 bp->daddr = *daddr;
49a72dfb 572 bp->protocol = cpu_to_be32(IPPROTO_TCP);
00b1304c 573 bp->len = cpu_to_be32(nbytes);
cfb6eeb4 574
49a72dfb
AL
575 sg_init_one(&sg, bp, sizeof(*bp));
576 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
577}
c7da57a1 578
49a72dfb 579static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
b71d1d42 580 const struct in6_addr *daddr, struct in6_addr *saddr,
318cf7aa 581 const struct tcphdr *th)
49a72dfb
AL
582{
583 struct tcp_md5sig_pool *hp;
584 struct hash_desc *desc;
585
586 hp = tcp_get_md5sig_pool();
587 if (!hp)
588 goto clear_hash_noput;
589 desc = &hp->md5_desc;
590
591 if (crypto_hash_init(desc))
592 goto clear_hash;
593 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
594 goto clear_hash;
595 if (tcp_md5_hash_header(hp, th))
596 goto clear_hash;
597 if (tcp_md5_hash_key(hp, key))
598 goto clear_hash;
599 if (crypto_hash_final(desc, md5_hash))
cfb6eeb4 600 goto clear_hash;
cfb6eeb4 601
cfb6eeb4 602 tcp_put_md5sig_pool();
cfb6eeb4 603 return 0;
49a72dfb 604
cfb6eeb4
YH
605clear_hash:
606 tcp_put_md5sig_pool();
607clear_hash_noput:
608 memset(md5_hash, 0, 16);
49a72dfb 609 return 1;
cfb6eeb4
YH
610}
611
49a72dfb 612static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
318cf7aa
ED
613 const struct sock *sk,
614 const struct request_sock *req,
615 const struct sk_buff *skb)
cfb6eeb4 616{
b71d1d42 617 const struct in6_addr *saddr, *daddr;
49a72dfb
AL
618 struct tcp_md5sig_pool *hp;
619 struct hash_desc *desc;
318cf7aa 620 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4
YH
621
622 if (sk) {
623 saddr = &inet6_sk(sk)->saddr;
efe4208f 624 daddr = &sk->sk_v6_daddr;
49a72dfb 625 } else if (req) {
cfb6eeb4
YH
626 saddr = &inet6_rsk(req)->loc_addr;
627 daddr = &inet6_rsk(req)->rmt_addr;
49a72dfb 628 } else {
b71d1d42 629 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
49a72dfb
AL
630 saddr = &ip6h->saddr;
631 daddr = &ip6h->daddr;
cfb6eeb4 632 }
49a72dfb
AL
633
634 hp = tcp_get_md5sig_pool();
635 if (!hp)
636 goto clear_hash_noput;
637 desc = &hp->md5_desc;
638
639 if (crypto_hash_init(desc))
640 goto clear_hash;
641
642 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
643 goto clear_hash;
644 if (tcp_md5_hash_header(hp, th))
645 goto clear_hash;
646 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
647 goto clear_hash;
648 if (tcp_md5_hash_key(hp, key))
649 goto clear_hash;
650 if (crypto_hash_final(desc, md5_hash))
651 goto clear_hash;
652
653 tcp_put_md5sig_pool();
654 return 0;
655
656clear_hash:
657 tcp_put_md5sig_pool();
658clear_hash_noput:
659 memset(md5_hash, 0, 16);
660 return 1;
cfb6eeb4
YH
661}
662
318cf7aa 663static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
cfb6eeb4 664{
cf533ea5 665 const __u8 *hash_location = NULL;
cfb6eeb4 666 struct tcp_md5sig_key *hash_expected;
b71d1d42 667 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
318cf7aa 668 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4 669 int genhash;
cfb6eeb4
YH
670 u8 newhash[16];
671
672 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
7d5d5525 673 hash_location = tcp_parse_md5sig_option(th);
cfb6eeb4 674
785957d3
DM
675 /* We've parsed the options - do we have a hash? */
676 if (!hash_expected && !hash_location)
677 return 0;
678
679 if (hash_expected && !hash_location) {
680 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
cfb6eeb4
YH
681 return 1;
682 }
683
785957d3
DM
684 if (!hash_expected && hash_location) {
685 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
cfb6eeb4
YH
686 return 1;
687 }
688
689 /* check the signature */
49a72dfb
AL
690 genhash = tcp_v6_md5_hash_skb(newhash,
691 hash_expected,
692 NULL, NULL, skb);
693
cfb6eeb4 694 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
e87cc472
JP
695 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
696 genhash ? "failed" : "mismatch",
697 &ip6h->saddr, ntohs(th->source),
698 &ip6h->daddr, ntohs(th->dest));
cfb6eeb4
YH
699 return 1;
700 }
701 return 0;
702}
703#endif
704
c6aefafb 705struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
1da177e4 706 .family = AF_INET6,
2e6599cb 707 .obj_size = sizeof(struct tcp6_request_sock),
72659ecc 708 .rtx_syn_ack = tcp_v6_rtx_synack,
60236fdd
ACM
709 .send_ack = tcp_v6_reqsk_send_ack,
710 .destructor = tcp_v6_reqsk_destructor,
72659ecc
OP
711 .send_reset = tcp_v6_send_reset,
712 .syn_ack_timeout = tcp_syn_ack_timeout,
1da177e4
LT
713};
714
cfb6eeb4 715#ifdef CONFIG_TCP_MD5SIG
b2e4b3de 716static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
cfb6eeb4 717 .md5_lookup = tcp_v6_reqsk_md5_lookup,
e3afe7b7 718 .calc_md5_hash = tcp_v6_md5_hash_skb,
cfb6eeb4 719};
b6332e6c 720#endif
cfb6eeb4 721
626e264d 722static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
ee684b6f
AV
723 u32 tsval, u32 tsecr,
724 struct tcp_md5sig_key *key, int rst, u8 tclass)
1da177e4 725{
cf533ea5
ED
726 const struct tcphdr *th = tcp_hdr(skb);
727 struct tcphdr *t1;
1da177e4 728 struct sk_buff *buff;
4c9483b2 729 struct flowi6 fl6;
adf30907 730 struct net *net = dev_net(skb_dst(skb)->dev);
e5047992 731 struct sock *ctl_sk = net->ipv6.tcp_sk;
77c676da 732 unsigned int tot_len = sizeof(struct tcphdr);
adf30907 733 struct dst_entry *dst;
81ada62d 734 __be32 *topt;
1da177e4 735
ee684b6f 736 if (tsecr)
626e264d 737 tot_len += TCPOLEN_TSTAMP_ALIGNED;
cfb6eeb4 738#ifdef CONFIG_TCP_MD5SIG
cfb6eeb4
YH
739 if (key)
740 tot_len += TCPOLEN_MD5SIG_ALIGNED;
741#endif
742
cfb6eeb4 743 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1da177e4 744 GFP_ATOMIC);
1ab1457c
YH
745 if (buff == NULL)
746 return;
1da177e4 747
cfb6eeb4 748 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1da177e4 749
cfb6eeb4 750 t1 = (struct tcphdr *) skb_push(buff, tot_len);
6651ffc8 751 skb_reset_transport_header(buff);
1da177e4
LT
752
753 /* Swap the send and the receive. */
754 memset(t1, 0, sizeof(*t1));
755 t1->dest = th->source;
756 t1->source = th->dest;
cfb6eeb4 757 t1->doff = tot_len / 4;
626e264d
IJ
758 t1->seq = htonl(seq);
759 t1->ack_seq = htonl(ack);
760 t1->ack = !rst || !th->ack;
761 t1->rst = rst;
762 t1->window = htons(win);
1da177e4 763
81ada62d
IJ
764 topt = (__be32 *)(t1 + 1);
765
ee684b6f 766 if (tsecr) {
626e264d
IJ
767 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
768 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
ee684b6f
AV
769 *topt++ = htonl(tsval);
770 *topt++ = htonl(tsecr);
626e264d
IJ
771 }
772
cfb6eeb4
YH
773#ifdef CONFIG_TCP_MD5SIG
774 if (key) {
81ada62d
IJ
775 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
776 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
777 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
78e645cb
IJ
778 &ipv6_hdr(skb)->saddr,
779 &ipv6_hdr(skb)->daddr, t1);
cfb6eeb4
YH
780 }
781#endif
782
4c9483b2 783 memset(&fl6, 0, sizeof(fl6));
4e3fd7a0
AD
784 fl6.daddr = ipv6_hdr(skb)->saddr;
785 fl6.saddr = ipv6_hdr(skb)->daddr;
1da177e4 786
e5700aff
DM
787 buff->ip_summed = CHECKSUM_PARTIAL;
788 buff->csum = 0;
789
4c9483b2 790 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
1da177e4 791
4c9483b2 792 fl6.flowi6_proto = IPPROTO_TCP;
4c675258
AK
793 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
794 fl6.flowi6_oif = inet6_iif(skb);
1958b856
DM
795 fl6.fl6_dport = t1->dest;
796 fl6.fl6_sport = t1->source;
4c9483b2 797 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
1da177e4 798
c20121ae
DL
799 /* Pass a socket to ip6_dst_lookup either it is for RST
800 * Underlying function will use this to retrieve the network
801 * namespace
802 */
4c9483b2 803 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL, false);
68d0c6d3
DM
804 if (!IS_ERR(dst)) {
805 skb_dst_set(buff, dst);
b903d324 806 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
68d0c6d3
DM
807 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
808 if (rst)
809 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
810 return;
1da177e4
LT
811 }
812
813 kfree_skb(buff);
814}
815
626e264d 816static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1da177e4 817{
cf533ea5 818 const struct tcphdr *th = tcp_hdr(skb);
626e264d 819 u32 seq = 0, ack_seq = 0;
fa3e5b4e 820 struct tcp_md5sig_key *key = NULL;
658ddaaf
SL
821#ifdef CONFIG_TCP_MD5SIG
822 const __u8 *hash_location = NULL;
823 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
824 unsigned char newhash[16];
825 int genhash;
826 struct sock *sk1 = NULL;
827#endif
1da177e4 828
626e264d 829 if (th->rst)
1da177e4
LT
830 return;
831
626e264d
IJ
832 if (!ipv6_unicast_destination(skb))
833 return;
1da177e4 834
cfb6eeb4 835#ifdef CONFIG_TCP_MD5SIG
658ddaaf
SL
836 hash_location = tcp_parse_md5sig_option(th);
837 if (!sk && hash_location) {
838 /*
839 * active side is lost. Try to find listening socket through
840 * source port, and then find md5 key through listening socket.
841 * we are not loose security here:
842 * Incoming packet is checked with md5 hash with finding key,
843 * no RST generated if md5 hash doesn't match.
844 */
845 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
5ba24953
TH
846 &tcp_hashinfo, &ipv6h->saddr,
847 th->source, &ipv6h->daddr,
658ddaaf
SL
848 ntohs(th->source), inet6_iif(skb));
849 if (!sk1)
850 return;
851
852 rcu_read_lock();
853 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
854 if (!key)
855 goto release_sk1;
856
857 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
858 if (genhash || memcmp(hash_location, newhash, 16) != 0)
859 goto release_sk1;
860 } else {
861 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
862 }
cfb6eeb4
YH
863#endif
864
626e264d
IJ
865 if (th->ack)
866 seq = ntohl(th->ack_seq);
867 else
868 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
869 (th->doff << 2);
1da177e4 870
ee684b6f 871 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, key, 1, 0);
658ddaaf
SL
872
873#ifdef CONFIG_TCP_MD5SIG
874release_sk1:
875 if (sk1) {
876 rcu_read_unlock();
877 sock_put(sk1);
878 }
879#endif
626e264d 880}
1da177e4 881
ee684b6f
AV
882static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
883 u32 win, u32 tsval, u32 tsecr,
b903d324 884 struct tcp_md5sig_key *key, u8 tclass)
626e264d 885{
ee684b6f 886 tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, key, 0, tclass);
1da177e4
LT
887}
888
889static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
890{
8feaf0c0 891 struct inet_timewait_sock *tw = inet_twsk(sk);
cfb6eeb4 892 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1da177e4 893
9501f972 894 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
8feaf0c0 895 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
ee684b6f 896 tcp_time_stamp + tcptw->tw_ts_offset,
b903d324
ED
897 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
898 tw->tw_tclass);
1da177e4 899
8feaf0c0 900 inet_twsk_put(tw);
1da177e4
LT
901}
902
6edafaaf
GJ
903static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
904 struct request_sock *req)
1da177e4 905{
ee684b6f
AV
906 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1,
907 req->rcv_wnd, tcp_time_stamp, req->ts_recent,
b903d324 908 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr), 0);
1da177e4
LT
909}
910
911
912static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
913{
60236fdd 914 struct request_sock *req, **prev;
aa8223c7 915 const struct tcphdr *th = tcp_hdr(skb);
1da177e4
LT
916 struct sock *nsk;
917
918 /* Find possible connection requests. */
8129765a 919 req = inet6_csk_search_req(sk, &prev, th->source,
0660e03f
ACM
920 &ipv6_hdr(skb)->saddr,
921 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1da177e4 922 if (req)
8336886f 923 return tcp_check_req(sk, skb, req, prev, false);
1da177e4 924
3b1e0a65 925 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
d86e0dac
PE
926 &ipv6_hdr(skb)->saddr, th->source,
927 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1da177e4
LT
928
929 if (nsk) {
930 if (nsk->sk_state != TCP_TIME_WAIT) {
931 bh_lock_sock(nsk);
932 return nsk;
933 }
9469c7b4 934 inet_twsk_put(inet_twsk(nsk));
1da177e4
LT
935 return NULL;
936 }
937
c6aefafb 938#ifdef CONFIG_SYN_COOKIES
af9b4738 939 if (!th->syn)
c6aefafb 940 sk = cookie_v6_check(sk, skb);
1da177e4
LT
941#endif
942 return sk;
943}
944
1da177e4
LT
945/* FIXME: this is substantially similar to the ipv4 code.
946 * Can some kind of merge be done? -- erics
947 */
948static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
949{
e6b4d113
WAS
950 struct tcp_options_received tmp_opt;
951 struct request_sock *req;
ca304b61 952 struct inet6_request_sock *treq;
1da177e4 953 struct ipv6_pinfo *np = inet6_sk(sk);
1da177e4 954 struct tcp_sock *tp = tcp_sk(sk);
e6b4d113 955 __u32 isn = TCP_SKB_CB(skb)->when;
493f377d 956 struct dst_entry *dst = NULL;
3840a06e 957 struct flowi6 fl6;
a2a385d6 958 bool want_cookie = false;
1da177e4
LT
959
960 if (skb->protocol == htons(ETH_P_IP))
961 return tcp_v4_conn_request(sk, skb);
962
963 if (!ipv6_unicast_destination(skb))
1ab1457c 964 goto drop;
1da177e4 965
5ad37d5d
HFS
966 if ((sysctl_tcp_syncookies == 2 ||
967 inet_csk_reqsk_queue_is_full(sk)) && !isn) {
946cedcc
ED
968 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
969 if (!want_cookie)
970 goto drop;
1da177e4
LT
971 }
972
5f1e942c
VS
973 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
974 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1da177e4 975 goto drop;
5f1e942c 976 }
1da177e4 977
ca304b61 978 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1da177e4
LT
979 if (req == NULL)
980 goto drop;
981
cfb6eeb4
YH
982#ifdef CONFIG_TCP_MD5SIG
983 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
984#endif
985
1da177e4
LT
986 tcp_clear_options(&tmp_opt);
987 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
988 tmp_opt.user_mss = tp->rx_opt.user_mss;
1a2c6181 989 tcp_parse_options(skb, &tmp_opt, 0, NULL);
1da177e4 990
4dfc2817 991 if (want_cookie && !tmp_opt.saw_tstamp)
c6aefafb 992 tcp_clear_options(&tmp_opt);
c6aefafb 993
1da177e4
LT
994 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
995 tcp_openreq_init(req, &tmp_opt, skb);
996
ca304b61 997 treq = inet6_rsk(req);
4e3fd7a0
AD
998 treq->rmt_addr = ipv6_hdr(skb)->saddr;
999 treq->loc_addr = ipv6_hdr(skb)->daddr;
172d69e6 1000 if (!want_cookie || tmp_opt.tstamp_ok)
5d134f1c 1001 TCP_ECN_create_request(req, skb, sock_net(sk));
c6aefafb 1002
4d0fe50c
ED
1003 treq->iif = sk->sk_bound_dev_if;
1004
1005 /* So that link locals have meaning */
1006 if (!sk->sk_bound_dev_if &&
1007 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1008 treq->iif = inet6_iif(skb);
1009
2bbdf389 1010 if (!isn) {
c6aefafb
GG
1011 if (ipv6_opt_accepted(sk, skb) ||
1012 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1013 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1014 atomic_inc(&skb->users);
1015 treq->pktopts = skb;
1016 }
493f377d
DM
1017
1018 if (want_cookie) {
2bbdf389
FW
1019 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1020 req->cookie_ts = tmp_opt.tstamp_ok;
493f377d
DM
1021 goto have_isn;
1022 }
1023
1024 /* VJ's idea. We save last timestamp seen
1025 * from the destination in peer table, when entering
1026 * state TIME-WAIT, and check against it before
1027 * accepting new connection request.
1028 *
1029 * If "isn" is not zero, this request hit alive
1030 * timewait bucket, so that all the necessary checks
1031 * are made in the function processing timewait state.
1032 */
1033 if (tmp_opt.saw_tstamp &&
1034 tcp_death_row.sysctl_tw_recycle &&
81166dd6
DM
1035 (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1036 if (!tcp_peer_is_proven(req, dst, true)) {
493f377d
DM
1037 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1038 goto drop_and_release;
1039 }
1040 }
1041 /* Kill the following clause, if you dislike this way. */
1042 else if (!sysctl_tcp_syncookies &&
1043 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1044 (sysctl_max_syn_backlog >> 2)) &&
81166dd6 1045 !tcp_peer_is_proven(req, dst, false)) {
493f377d
DM
1046 /* Without syncookies last quarter of
1047 * backlog is filled with destinations,
1048 * proven to be alive.
1049 * It means that we continue to communicate
1050 * to destinations, already remembered
1051 * to the moment of synflood.
1052 */
1053 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
1054 &treq->rmt_addr, ntohs(tcp_hdr(skb)->source));
1055 goto drop_and_release;
2bbdf389 1056 }
493f377d
DM
1057
1058 isn = tcp_v6_init_sequence(skb);
c6aefafb 1059 }
493f377d 1060have_isn:
2e6599cb 1061 tcp_rsk(req)->snt_isn = isn;
1da177e4 1062
437c5b53
NC
1063 if (security_inet_conn_request(sk, skb, req))
1064 goto drop_and_release;
4237c75c 1065
9f10d3f6 1066 if (tcp_v6_send_synack(sk, dst, &fl6, req,
fff32699 1067 skb_get_queue_mapping(skb)) ||
4957faad 1068 want_cookie)
e6b4d113 1069 goto drop_and_free;
1da177e4 1070
016818d0 1071 tcp_rsk(req)->snt_synack = tcp_time_stamp;
8336886f 1072 tcp_rsk(req)->listener = NULL;
e6b4d113
WAS
1073 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1074 return 0;
1da177e4 1075
493f377d
DM
1076drop_and_release:
1077 dst_release(dst);
e6b4d113
WAS
1078drop_and_free:
1079 reqsk_free(req);
1da177e4 1080drop:
5f1e942c 1081 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1082 return 0; /* don't send reset */
1083}
1084
1085static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
60236fdd 1086 struct request_sock *req,
1da177e4
LT
1087 struct dst_entry *dst)
1088{
78d15e82 1089 struct inet6_request_sock *treq;
1da177e4
LT
1090 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1091 struct tcp6_sock *newtcp6sk;
1092 struct inet_sock *newinet;
1093 struct tcp_sock *newtp;
1094 struct sock *newsk;
cfb6eeb4
YH
1095#ifdef CONFIG_TCP_MD5SIG
1096 struct tcp_md5sig_key *key;
1097#endif
3840a06e 1098 struct flowi6 fl6;
1da177e4
LT
1099
1100 if (skb->protocol == htons(ETH_P_IP)) {
1101 /*
1102 * v6 mapped
1103 */
1104
1105 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1106
1ab1457c 1107 if (newsk == NULL)
1da177e4
LT
1108 return NULL;
1109
1110 newtcp6sk = (struct tcp6_sock *)newsk;
1111 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1112
1113 newinet = inet_sk(newsk);
1114 newnp = inet6_sk(newsk);
1115 newtp = tcp_sk(newsk);
1116
1117 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1118
efe4208f 1119 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newsk->sk_v6_daddr);
1da177e4 1120
c720c7e8 1121 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1da177e4 1122
efe4208f 1123 newsk->sk_v6_rcv_saddr = newnp->saddr;
1da177e4 1124
8292a17a 1125 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1da177e4 1126 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
1127#ifdef CONFIG_TCP_MD5SIG
1128 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1129#endif
1130
676a1184
YZ
1131 newnp->ipv6_ac_list = NULL;
1132 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1133 newnp->pktoptions = NULL;
1134 newnp->opt = NULL;
505cbfc5 1135 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1136 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
e7219858 1137 newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4 1138
e6848976
ACM
1139 /*
1140 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1141 * here, tcp_create_openreq_child now does this for us, see the comment in
1142 * that function for the gory details. -acme
1da177e4 1143 */
1da177e4
LT
1144
1145 /* It is tricky place. Until this moment IPv4 tcp
8292a17a 1146 worked with IPv6 icsk.icsk_af_ops.
1da177e4
LT
1147 Sync it now.
1148 */
d83d8461 1149 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1da177e4
LT
1150
1151 return newsk;
1152 }
1153
78d15e82 1154 treq = inet6_rsk(req);
1da177e4
LT
1155
1156 if (sk_acceptq_is_full(sk))
1157 goto out_overflow;
1158
493f377d 1159 if (!dst) {
3840a06e 1160 dst = inet6_csk_route_req(sk, &fl6, req);
493f377d 1161 if (!dst)
1da177e4 1162 goto out;
1ab1457c 1163 }
1da177e4
LT
1164
1165 newsk = tcp_create_openreq_child(sk, req, skb);
1166 if (newsk == NULL)
093d2823 1167 goto out_nonewsk;
1da177e4 1168
e6848976
ACM
1169 /*
1170 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1171 * count here, tcp_create_openreq_child now does this for us, see the
1172 * comment in that function for the gory details. -acme
1173 */
1da177e4 1174
59eed279 1175 newsk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 1176 __ip6_dst_store(newsk, dst, NULL, NULL);
fae6ef87 1177 inet6_sk_rx_dst_set(newsk, skb);
1da177e4
LT
1178
1179 newtcp6sk = (struct tcp6_sock *)newsk;
1180 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1181
1182 newtp = tcp_sk(newsk);
1183 newinet = inet_sk(newsk);
1184 newnp = inet6_sk(newsk);
1185
1186 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1187
efe4208f 1188 newsk->sk_v6_daddr = treq->rmt_addr;
4e3fd7a0 1189 newnp->saddr = treq->loc_addr;
efe4208f 1190 newsk->sk_v6_rcv_saddr = treq->loc_addr;
2e6599cb 1191 newsk->sk_bound_dev_if = treq->iif;
1da177e4 1192
1ab1457c 1193 /* Now IPv6 options...
1da177e4
LT
1194
1195 First: no IPv4 options.
1196 */
f6d8bd05 1197 newinet->inet_opt = NULL;
676a1184 1198 newnp->ipv6_ac_list = NULL;
d35690be 1199 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1200
1201 /* Clone RX bits */
1202 newnp->rxopt.all = np->rxopt.all;
1203
1204 /* Clone pktoptions received with SYN */
1205 newnp->pktoptions = NULL;
2e6599cb 1206 if (treq->pktopts != NULL) {
99a1dec7
MG
1207 newnp->pktoptions = skb_clone(treq->pktopts,
1208 sk_gfp_atomic(sk, GFP_ATOMIC));
ab185d7b 1209 consume_skb(treq->pktopts);
2e6599cb 1210 treq->pktopts = NULL;
1da177e4
LT
1211 if (newnp->pktoptions)
1212 skb_set_owner_r(newnp->pktoptions, newsk);
1213 }
1214 newnp->opt = NULL;
505cbfc5 1215 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1216 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
e7219858 1217 newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4
LT
1218
1219 /* Clone native IPv6 options from listening socket (if any)
1220
1221 Yes, keeping reference count would be much more clever,
1222 but we make one more one thing there: reattach optmem
1223 to newsk.
1224 */
43264e0b
RL
1225 if (np->opt)
1226 newnp->opt = ipv6_dup_options(newsk, np->opt);
1da177e4 1227
d83d8461 1228 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1da177e4 1229 if (newnp->opt)
d83d8461
ACM
1230 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1231 newnp->opt->opt_flen);
1da177e4 1232
5d424d5a 1233 tcp_mtup_init(newsk);
1da177e4 1234 tcp_sync_mss(newsk, dst_mtu(dst));
0dbaee3b 1235 newtp->advmss = dst_metric_advmss(dst);
d135c522
NC
1236 if (tcp_sk(sk)->rx_opt.user_mss &&
1237 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1238 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1239
1da177e4
LT
1240 tcp_initialize_rcv_mss(newsk);
1241
c720c7e8
ED
1242 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1243 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 1244
cfb6eeb4
YH
1245#ifdef CONFIG_TCP_MD5SIG
1246 /* Copy over the MD5 key from the original socket */
efe4208f 1247 if ((key = tcp_v6_md5_do_lookup(sk, &newsk->sk_v6_daddr)) != NULL) {
cfb6eeb4
YH
1248 /* We're using one, so create a matching key
1249 * on the newsk structure. If we fail to get
1250 * memory, then we end up not copying the key
1251 * across. Shucks.
1252 */
efe4208f 1253 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newsk->sk_v6_daddr,
99a1dec7
MG
1254 AF_INET6, key->key, key->keylen,
1255 sk_gfp_atomic(sk, GFP_ATOMIC));
cfb6eeb4
YH
1256 }
1257#endif
1258
093d2823 1259 if (__inet_inherit_port(sk, newsk) < 0) {
e337e24d
CP
1260 inet_csk_prepare_forced_close(newsk);
1261 tcp_done(newsk);
093d2823
BS
1262 goto out;
1263 }
9327f705 1264 __inet6_hash(newsk, NULL);
1da177e4
LT
1265
1266 return newsk;
1267
1268out_overflow:
de0744af 1269 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
093d2823 1270out_nonewsk:
1da177e4 1271 dst_release(dst);
093d2823
BS
1272out:
1273 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1274 return NULL;
1275}
1276
b51655b9 1277static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1da177e4 1278{
84fa7933 1279 if (skb->ip_summed == CHECKSUM_COMPLETE) {
684f2176 1280 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
0660e03f 1281 &ipv6_hdr(skb)->daddr, skb->csum)) {
fb286bb2 1282 skb->ip_summed = CHECKSUM_UNNECESSARY;
1da177e4 1283 return 0;
fb286bb2 1284 }
1da177e4 1285 }
fb286bb2 1286
684f2176 1287 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
0660e03f
ACM
1288 &ipv6_hdr(skb)->saddr,
1289 &ipv6_hdr(skb)->daddr, 0));
fb286bb2 1290
1da177e4 1291 if (skb->len <= 76) {
fb286bb2 1292 return __skb_checksum_complete(skb);
1da177e4
LT
1293 }
1294 return 0;
1295}
1296
1297/* The socket must have it's spinlock held when we get
1298 * here.
1299 *
1300 * We have a potential double-lock case here, so even when
1301 * doing backlog processing we use the BH locking scheme.
1302 * This is because we cannot sleep with the original spinlock
1303 * held.
1304 */
1305static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1306{
1307 struct ipv6_pinfo *np = inet6_sk(sk);
1308 struct tcp_sock *tp;
1309 struct sk_buff *opt_skb = NULL;
1310
1311 /* Imagine: socket is IPv6. IPv4 packet arrives,
1312 goes to IPv4 receive handler and backlogged.
1313 From backlog it always goes here. Kerboom...
1314 Fortunately, tcp_rcv_established and rcv_established
1315 handle them correctly, but it is not case with
1316 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1317 */
1318
1319 if (skb->protocol == htons(ETH_P_IP))
1320 return tcp_v4_do_rcv(sk, skb);
1321
cfb6eeb4
YH
1322#ifdef CONFIG_TCP_MD5SIG
1323 if (tcp_v6_inbound_md5_hash (sk, skb))
1324 goto discard;
1325#endif
1326
fda9ef5d 1327 if (sk_filter(sk, skb))
1da177e4
LT
1328 goto discard;
1329
1330 /*
1331 * socket locking is here for SMP purposes as backlog rcv
1332 * is currently called with bh processing disabled.
1333 */
1334
1335 /* Do Stevens' IPV6_PKTOPTIONS.
1336
1337 Yes, guys, it is the only place in our code, where we
1338 may make it not affecting IPv4.
1339 The rest of code is protocol independent,
1340 and I do not like idea to uglify IPv4.
1341
1342 Actually, all the idea behind IPV6_PKTOPTIONS
1343 looks not very well thought. For now we latch
1344 options, received in the last packet, enqueued
1345 by tcp. Feel free to propose better solution.
1ab1457c 1346 --ANK (980728)
1da177e4
LT
1347 */
1348 if (np->rxopt.all)
99a1dec7 1349 opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
1da177e4
LT
1350
1351 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
5d299f3d
ED
1352 struct dst_entry *dst = sk->sk_rx_dst;
1353
bdeab991 1354 sock_rps_save_rxhash(sk, skb);
5d299f3d
ED
1355 if (dst) {
1356 if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1357 dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1358 dst_release(dst);
1359 sk->sk_rx_dst = NULL;
1360 }
1361 }
1362
c995ae22 1363 tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len);
1da177e4
LT
1364 if (opt_skb)
1365 goto ipv6_pktoptions;
1366 return 0;
1367 }
1368
ab6a5bb6 1369 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1da177e4
LT
1370 goto csum_err;
1371
1ab1457c 1372 if (sk->sk_state == TCP_LISTEN) {
1da177e4
LT
1373 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1374 if (!nsk)
1375 goto discard;
1376
1377 /*
1378 * Queue it on the new socket if the new socket is active,
1379 * otherwise we just shortcircuit this and continue with
1380 * the new socket..
1381 */
1ab1457c 1382 if(nsk != sk) {
bdeab991 1383 sock_rps_save_rxhash(nsk, skb);
1da177e4
LT
1384 if (tcp_child_process(sk, nsk, skb))
1385 goto reset;
1386 if (opt_skb)
1387 __kfree_skb(opt_skb);
1388 return 0;
1389 }
47482f13 1390 } else
bdeab991 1391 sock_rps_save_rxhash(sk, skb);
1da177e4 1392
aa8223c7 1393 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1da177e4 1394 goto reset;
1da177e4
LT
1395 if (opt_skb)
1396 goto ipv6_pktoptions;
1397 return 0;
1398
1399reset:
cfb6eeb4 1400 tcp_v6_send_reset(sk, skb);
1da177e4
LT
1401discard:
1402 if (opt_skb)
1403 __kfree_skb(opt_skb);
1404 kfree_skb(skb);
1405 return 0;
1406csum_err:
6a5dc9e5 1407 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
63231bdd 1408 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1da177e4
LT
1409 goto discard;
1410
1411
1412ipv6_pktoptions:
1413 /* Do you ask, what is it?
1414
1415 1. skb was enqueued by tcp.
1416 2. skb is added to tail of read queue, rather than out of order.
1417 3. socket is not in passive state.
1418 4. Finally, it really contains options, which user wants to receive.
1419 */
1420 tp = tcp_sk(sk);
1421 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1422 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
333fad53 1423 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
505cbfc5 1424 np->mcast_oif = inet6_iif(opt_skb);
333fad53 1425 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
0660e03f 1426 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
4c507d28 1427 if (np->rxopt.bits.rxtclass)
3a1c7565 1428 np->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(opt_skb));
1da177e4
LT
1429 if (ipv6_opt_accepted(sk, opt_skb)) {
1430 skb_set_owner_r(opt_skb, sk);
1431 opt_skb = xchg(&np->pktoptions, opt_skb);
1432 } else {
1433 __kfree_skb(opt_skb);
1434 opt_skb = xchg(&np->pktoptions, NULL);
1435 }
1436 }
1437
800d55f1 1438 kfree_skb(opt_skb);
1da177e4
LT
1439 return 0;
1440}
1441
e5bbef20 1442static int tcp_v6_rcv(struct sk_buff *skb)
1da177e4 1443{
cf533ea5 1444 const struct tcphdr *th;
b71d1d42 1445 const struct ipv6hdr *hdr;
1da177e4
LT
1446 struct sock *sk;
1447 int ret;
a86b1e30 1448 struct net *net = dev_net(skb->dev);
1da177e4
LT
1449
1450 if (skb->pkt_type != PACKET_HOST)
1451 goto discard_it;
1452
1453 /*
1454 * Count it even if it's bad.
1455 */
63231bdd 1456 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1da177e4
LT
1457
1458 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1459 goto discard_it;
1460
aa8223c7 1461 th = tcp_hdr(skb);
1da177e4
LT
1462
1463 if (th->doff < sizeof(struct tcphdr)/4)
1464 goto bad_packet;
1465 if (!pskb_may_pull(skb, th->doff*4))
1466 goto discard_it;
1467
60476372 1468 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
6a5dc9e5 1469 goto csum_error;
1da177e4 1470
aa8223c7 1471 th = tcp_hdr(skb);
e802af9c 1472 hdr = ipv6_hdr(skb);
1da177e4
LT
1473 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1474 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1475 skb->len - th->doff*4);
1476 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1477 TCP_SKB_CB(skb)->when = 0;
b82d1bb4 1478 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
1da177e4
LT
1479 TCP_SKB_CB(skb)->sacked = 0;
1480
9a1f27c4 1481 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1da177e4
LT
1482 if (!sk)
1483 goto no_tcp_socket;
1484
1485process:
1486 if (sk->sk_state == TCP_TIME_WAIT)
1487 goto do_time_wait;
1488
e802af9c
SH
1489 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1490 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1491 goto discard_and_relse;
1492 }
1493
1da177e4
LT
1494 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1495 goto discard_and_relse;
1496
fda9ef5d 1497 if (sk_filter(sk, skb))
1da177e4
LT
1498 goto discard_and_relse;
1499
8b80cda5 1500 sk_mark_napi_id(sk, skb);
1da177e4
LT
1501 skb->dev = NULL;
1502
293b9c42 1503 bh_lock_sock_nested(sk);
1da177e4
LT
1504 ret = 0;
1505 if (!sock_owned_by_user(sk)) {
1a2449a8 1506#ifdef CONFIG_NET_DMA
1ab1457c 1507 struct tcp_sock *tp = tcp_sk(sk);
b4caea8a 1508 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
a2bd1140 1509 tp->ucopy.dma_chan = net_dma_find_channel();
1ab1457c
YH
1510 if (tp->ucopy.dma_chan)
1511 ret = tcp_v6_do_rcv(sk, skb);
1512 else
1a2449a8
CL
1513#endif
1514 {
1515 if (!tcp_prequeue(sk, skb))
1516 ret = tcp_v6_do_rcv(sk, skb);
1517 }
da882c1f
ED
1518 } else if (unlikely(sk_add_backlog(sk, skb,
1519 sk->sk_rcvbuf + sk->sk_sndbuf))) {
6b03a53a 1520 bh_unlock_sock(sk);
6cce09f8 1521 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
6b03a53a
ZY
1522 goto discard_and_relse;
1523 }
1da177e4
LT
1524 bh_unlock_sock(sk);
1525
1526 sock_put(sk);
1527 return ret ? -1 : 0;
1528
1529no_tcp_socket:
1530 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1531 goto discard_it;
1532
1533 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
6a5dc9e5
ED
1534csum_error:
1535 TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
1da177e4 1536bad_packet:
63231bdd 1537 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1da177e4 1538 } else {
cfb6eeb4 1539 tcp_v6_send_reset(NULL, skb);
1da177e4
LT
1540 }
1541
1542discard_it:
1da177e4
LT
1543 kfree_skb(skb);
1544 return 0;
1545
1546discard_and_relse:
1547 sock_put(sk);
1548 goto discard_it;
1549
1550do_time_wait:
1551 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
9469c7b4 1552 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1553 goto discard_it;
1554 }
1555
6a5dc9e5 1556 if (skb->len < (th->doff<<2)) {
9469c7b4 1557 inet_twsk_put(inet_twsk(sk));
6a5dc9e5
ED
1558 goto bad_packet;
1559 }
1560 if (tcp_checksum_complete(skb)) {
1561 inet_twsk_put(inet_twsk(sk));
1562 goto csum_error;
1da177e4
LT
1563 }
1564
9469c7b4 1565 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1da177e4
LT
1566 case TCP_TW_SYN:
1567 {
1568 struct sock *sk2;
1569
c346dca1 1570 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
5ba24953 1571 &ipv6_hdr(skb)->saddr, th->source,
0660e03f 1572 &ipv6_hdr(skb)->daddr,
505cbfc5 1573 ntohs(th->dest), inet6_iif(skb));
1da177e4 1574 if (sk2 != NULL) {
295ff7ed
ACM
1575 struct inet_timewait_sock *tw = inet_twsk(sk);
1576 inet_twsk_deschedule(tw, &tcp_death_row);
1577 inet_twsk_put(tw);
1da177e4
LT
1578 sk = sk2;
1579 goto process;
1580 }
1581 /* Fall through to ACK */
1582 }
1583 case TCP_TW_ACK:
1584 tcp_v6_timewait_ack(sk, skb);
1585 break;
1586 case TCP_TW_RST:
1587 goto no_tcp_socket;
1588 case TCP_TW_SUCCESS:;
1589 }
1590 goto discard_it;
1591}
1592
c7109986
ED
1593static void tcp_v6_early_demux(struct sk_buff *skb)
1594{
1595 const struct ipv6hdr *hdr;
1596 const struct tcphdr *th;
1597 struct sock *sk;
1598
1599 if (skb->pkt_type != PACKET_HOST)
1600 return;
1601
1602 if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1603 return;
1604
1605 hdr = ipv6_hdr(skb);
1606 th = tcp_hdr(skb);
1607
1608 if (th->doff < sizeof(struct tcphdr) / 4)
1609 return;
1610
1611 sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1612 &hdr->saddr, th->source,
1613 &hdr->daddr, ntohs(th->dest),
1614 inet6_iif(skb));
1615 if (sk) {
1616 skb->sk = sk;
1617 skb->destructor = sock_edemux;
1618 if (sk->sk_state != TCP_TIME_WAIT) {
1619 struct dst_entry *dst = sk->sk_rx_dst;
f3f12135 1620
c7109986 1621 if (dst)
5d299f3d 1622 dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
c7109986 1623 if (dst &&
f3f12135 1624 inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
c7109986
ED
1625 skb_dst_set_noref(skb, dst);
1626 }
1627 }
1628}
1629
ccb7c410
DM
1630static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1631 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1632 .twsk_unique = tcp_twsk_unique,
1633 .twsk_destructor= tcp_twsk_destructor,
ccb7c410
DM
1634};
1635
3b401a81 1636static const struct inet_connection_sock_af_ops ipv6_specific = {
543d9cfe
ACM
1637 .queue_xmit = inet6_csk_xmit,
1638 .send_check = tcp_v6_send_check,
1639 .rebuild_header = inet6_sk_rebuild_header,
5d299f3d 1640 .sk_rx_dst_set = inet6_sk_rx_dst_set,
543d9cfe
ACM
1641 .conn_request = tcp_v6_conn_request,
1642 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe 1643 .net_header_len = sizeof(struct ipv6hdr),
67469601 1644 .net_frag_header_len = sizeof(struct frag_hdr),
543d9cfe
ACM
1645 .setsockopt = ipv6_setsockopt,
1646 .getsockopt = ipv6_getsockopt,
1647 .addr2sockaddr = inet6_csk_addr2sockaddr,
1648 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1649 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1650#ifdef CONFIG_COMPAT
543d9cfe
ACM
1651 .compat_setsockopt = compat_ipv6_setsockopt,
1652 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1653#endif
1da177e4
LT
1654};
1655
#ifdef CONFIG_TCP_MD5SIG
/* TCP MD5 signature hooks for native IPv6 sockets (see tcp_v6_init_sock()). */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_lookup	= tcp_v6_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1663
1da177e4
LT
1664/*
1665 * TCP over IPv4 via INET6 API
1666 */
1667
3b401a81 1668static const struct inet_connection_sock_af_ops ipv6_mapped = {
543d9cfe
ACM
1669 .queue_xmit = ip_queue_xmit,
1670 .send_check = tcp_v4_send_check,
1671 .rebuild_header = inet_sk_rebuild_header,
63d02d15 1672 .sk_rx_dst_set = inet_sk_rx_dst_set,
543d9cfe
ACM
1673 .conn_request = tcp_v6_conn_request,
1674 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe
ACM
1675 .net_header_len = sizeof(struct iphdr),
1676 .setsockopt = ipv6_setsockopt,
1677 .getsockopt = ipv6_getsockopt,
1678 .addr2sockaddr = inet6_csk_addr2sockaddr,
1679 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1680 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1681#ifdef CONFIG_COMPAT
543d9cfe
ACM
1682 .compat_setsockopt = compat_ipv6_setsockopt,
1683 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1684#endif
1da177e4
LT
1685};
1686
#ifdef CONFIG_TCP_MD5SIG
/*
 * TCP MD5 signature hooks for v4-mapped sockets: lookup and hashing use
 * the IPv4 helpers, key parsing uses the IPv6 one.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_lookup	= tcp_v4_md5_lookup,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1694
1da177e4
LT
1695/* NOTE: A lot of things set to zero explicitly by call to
1696 * sk_alloc() so need not be done here.
1697 */
1698static int tcp_v6_init_sock(struct sock *sk)
1699{
6687e988 1700 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4 1701
900f65d3 1702 tcp_init_sock(sk);
1da177e4 1703
8292a17a 1704 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 1705
cfb6eeb4 1706#ifdef CONFIG_TCP_MD5SIG
ac807fa8 1707 tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
cfb6eeb4
YH
1708#endif
1709
1da177e4
LT
1710 return 0;
1711}
1712
/*
 * Socket destroy hook (tcpv6_prot.destroy): tear down the TCP state via
 * the IPv4 helper first, then the IPv6-specific state.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
	tcp_v4_destroy_sock(sk);
	inet6_destroy_sock(sk);
}
1718
952a10be 1719#ifdef CONFIG_PROC_FS
1da177e4 1720/* Proc filesystem TCPv6 sock list dumping. */
1ab1457c 1721static void get_openreq6(struct seq_file *seq,
a7cb5a49 1722 const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
1da177e4 1723{
1da177e4 1724 int ttd = req->expires - jiffies;
b71d1d42
ED
1725 const struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1726 const struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1da177e4
LT
1727
1728 if (ttd < 0)
1729 ttd = 0;
1730
1da177e4
LT
1731 seq_printf(seq,
1732 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
d14c5ab6 1733 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %d %d %pK\n",
1da177e4
LT
1734 i,
1735 src->s6_addr32[0], src->s6_addr32[1],
1736 src->s6_addr32[2], src->s6_addr32[3],
fd507037 1737 ntohs(inet_rsk(req)->loc_port),
1da177e4
LT
1738 dest->s6_addr32[0], dest->s6_addr32[1],
1739 dest->s6_addr32[2], dest->s6_addr32[3],
2e6599cb 1740 ntohs(inet_rsk(req)->rmt_port),
1da177e4
LT
1741 TCP_SYN_RECV,
1742 0,0, /* could print option size, but that is af dependent. */
1ab1457c
YH
1743 1, /* timers active (only the expire timer) */
1744 jiffies_to_clock_t(ttd),
e6c022a4 1745 req->num_timeout,
a7cb5a49 1746 from_kuid_munged(seq_user_ns(seq), uid),
1ab1457c 1747 0, /* non standard timer */
1da177e4
LT
1748 0, /* open_requests have no inode */
1749 0, req);
1750}
1751
1752static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1753{
b71d1d42 1754 const struct in6_addr *dest, *src;
1da177e4
LT
1755 __u16 destp, srcp;
1756 int timer_active;
1757 unsigned long timer_expires;
cf533ea5
ED
1758 const struct inet_sock *inet = inet_sk(sp);
1759 const struct tcp_sock *tp = tcp_sk(sp);
463c84b9 1760 const struct inet_connection_sock *icsk = inet_csk(sp);
1da177e4 1761
efe4208f
ED
1762 dest = &sp->sk_v6_daddr;
1763 src = &sp->sk_v6_rcv_saddr;
c720c7e8
ED
1764 destp = ntohs(inet->inet_dport);
1765 srcp = ntohs(inet->inet_sport);
463c84b9
ACM
1766
1767 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1da177e4 1768 timer_active = 1;
463c84b9
ACM
1769 timer_expires = icsk->icsk_timeout;
1770 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1da177e4 1771 timer_active = 4;
463c84b9 1772 timer_expires = icsk->icsk_timeout;
1da177e4
LT
1773 } else if (timer_pending(&sp->sk_timer)) {
1774 timer_active = 2;
1775 timer_expires = sp->sk_timer.expires;
1776 } else {
1777 timer_active = 0;
1778 timer_expires = jiffies;
1779 }
1780
1781 seq_printf(seq,
1782 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
d14c5ab6 1783 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %lu %d %pK %lu %lu %u %u %d\n",
1da177e4
LT
1784 i,
1785 src->s6_addr32[0], src->s6_addr32[1],
1786 src->s6_addr32[2], src->s6_addr32[3], srcp,
1787 dest->s6_addr32[0], dest->s6_addr32[1],
1788 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1ab1457c 1789 sp->sk_state,
47da8ee6
SS
1790 tp->write_seq-tp->snd_una,
1791 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1da177e4 1792 timer_active,
a399a805 1793 jiffies_delta_to_clock_t(timer_expires - jiffies),
463c84b9 1794 icsk->icsk_retransmits,
a7cb5a49 1795 from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
6687e988 1796 icsk->icsk_probes_out,
1da177e4
LT
1797 sock_i_ino(sp),
1798 atomic_read(&sp->sk_refcnt), sp,
7be87351
SH
1799 jiffies_to_clock_t(icsk->icsk_rto),
1800 jiffies_to_clock_t(icsk->icsk_ack.ato),
463c84b9 1801 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
0b6a05c1
IJ
1802 tp->snd_cwnd,
1803 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
1da177e4
LT
1804 );
1805}
1806
1ab1457c 1807static void get_timewait6_sock(struct seq_file *seq,
8feaf0c0 1808 struct inet_timewait_sock *tw, int i)
1da177e4 1809{
b71d1d42 1810 const struct in6_addr *dest, *src;
1da177e4 1811 __u16 destp, srcp;
96f817fe 1812 s32 delta = tw->tw_ttd - inet_tw_time_stamp();
1da177e4 1813
efe4208f
ED
1814 dest = &tw->tw_v6_daddr;
1815 src = &tw->tw_v6_rcv_saddr;
1da177e4
LT
1816 destp = ntohs(tw->tw_dport);
1817 srcp = ntohs(tw->tw_sport);
1818
1819 seq_printf(seq,
1820 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1821 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1da177e4
LT
1822 i,
1823 src->s6_addr32[0], src->s6_addr32[1],
1824 src->s6_addr32[2], src->s6_addr32[3], srcp,
1825 dest->s6_addr32[0], dest->s6_addr32[1],
1826 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1827 tw->tw_substate, 0, 0,
a399a805 1828 3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
1da177e4
LT
1829 atomic_read(&tw->tw_refcnt), tw);
1830}
1831
1da177e4
LT
1832static int tcp6_seq_show(struct seq_file *seq, void *v)
1833{
1834 struct tcp_iter_state *st;
05dbc7b5 1835 struct sock *sk = v;
1da177e4
LT
1836
1837 if (v == SEQ_START_TOKEN) {
1838 seq_puts(seq,
1839 " sl "
1840 "local_address "
1841 "remote_address "
1842 "st tx_queue rx_queue tr tm->when retrnsmt"
1843 " uid timeout inode\n");
1844 goto out;
1845 }
1846 st = seq->private;
1847
1848 switch (st->state) {
1849 case TCP_SEQ_STATE_LISTENING:
1850 case TCP_SEQ_STATE_ESTABLISHED:
05dbc7b5
ED
1851 if (sk->sk_state == TCP_TIME_WAIT)
1852 get_timewait6_sock(seq, v, st->num);
1853 else
1854 get_tcp6_sock(seq, v, st->num);
1da177e4
LT
1855 break;
1856 case TCP_SEQ_STATE_OPENREQ:
1857 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1858 break;
1da177e4
LT
1859 }
1860out:
1861 return 0;
1862}
1863
73cb88ec
AV
1864static const struct file_operations tcp6_afinfo_seq_fops = {
1865 .owner = THIS_MODULE,
1866 .open = tcp_seq_open,
1867 .read = seq_read,
1868 .llseek = seq_lseek,
1869 .release = seq_release_net
1870};
1871
1da177e4 1872static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1da177e4
LT
1873 .name = "tcp6",
1874 .family = AF_INET6,
73cb88ec 1875 .seq_fops = &tcp6_afinfo_seq_fops,
9427c4b3
DL
1876 .seq_ops = {
1877 .show = tcp6_seq_show,
1878 },
1da177e4
LT
1879};
1880
2c8c1e72 1881int __net_init tcp6_proc_init(struct net *net)
1da177e4 1882{
6f8b13bc 1883 return tcp_proc_register(net, &tcp6_seq_afinfo);
1da177e4
LT
1884}
1885
6f8b13bc 1886void tcp6_proc_exit(struct net *net)
1da177e4 1887{
6f8b13bc 1888 tcp_proc_unregister(net, &tcp6_seq_afinfo);
1da177e4
LT
1889}
1890#endif
1891
f77d6021
ED
1892static void tcp_v6_clear_sk(struct sock *sk, int size)
1893{
1894 struct inet_sock *inet = inet_sk(sk);
1895
1896 /* we do not want to clear pinet6 field, because of RCU lookups */
1897 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1898
1899 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1900 memset(&inet->pinet6 + 1, 0, size);
1901}
1902
1da177e4
LT
1903struct proto tcpv6_prot = {
1904 .name = "TCPv6",
1905 .owner = THIS_MODULE,
1906 .close = tcp_close,
1907 .connect = tcp_v6_connect,
1908 .disconnect = tcp_disconnect,
463c84b9 1909 .accept = inet_csk_accept,
1da177e4
LT
1910 .ioctl = tcp_ioctl,
1911 .init = tcp_v6_init_sock,
1912 .destroy = tcp_v6_destroy_sock,
1913 .shutdown = tcp_shutdown,
1914 .setsockopt = tcp_setsockopt,
1915 .getsockopt = tcp_getsockopt,
1da177e4 1916 .recvmsg = tcp_recvmsg,
7ba42910
CG
1917 .sendmsg = tcp_sendmsg,
1918 .sendpage = tcp_sendpage,
1da177e4 1919 .backlog_rcv = tcp_v6_do_rcv,
46d3ceab 1920 .release_cb = tcp_release_cb,
563d34d0 1921 .mtu_reduced = tcp_v6_mtu_reduced,
1da177e4 1922 .hash = tcp_v6_hash,
ab1e0a13
ACM
1923 .unhash = inet_unhash,
1924 .get_port = inet_csk_get_port,
1da177e4 1925 .enter_memory_pressure = tcp_enter_memory_pressure,
c9bee3b7 1926 .stream_memory_free = tcp_stream_memory_free,
1da177e4
LT
1927 .sockets_allocated = &tcp_sockets_allocated,
1928 .memory_allocated = &tcp_memory_allocated,
1929 .memory_pressure = &tcp_memory_pressure,
0a5578cf 1930 .orphan_count = &tcp_orphan_count,
1da177e4
LT
1931 .sysctl_wmem = sysctl_tcp_wmem,
1932 .sysctl_rmem = sysctl_tcp_rmem,
1933 .max_header = MAX_TCP_HEADER,
1934 .obj_size = sizeof(struct tcp6_sock),
3ab5aee7 1935 .slab_flags = SLAB_DESTROY_BY_RCU,
6d6ee43e 1936 .twsk_prot = &tcp6_timewait_sock_ops,
60236fdd 1937 .rsk_prot = &tcp6_request_sock_ops,
39d8cda7 1938 .h.hashinfo = &tcp_hashinfo,
7ba42910 1939 .no_autobind = true,
543d9cfe
ACM
1940#ifdef CONFIG_COMPAT
1941 .compat_setsockopt = compat_tcp_setsockopt,
1942 .compat_getsockopt = compat_tcp_getsockopt,
1943#endif
c255a458 1944#ifdef CONFIG_MEMCG_KMEM
d1a4c0b3
GC
1945 .proto_cgroup = tcp_proto_cgroup,
1946#endif
f77d6021 1947 .clear_sk = tcp_v6_clear_sk,
1da177e4
LT
1948};
1949
41135cc8 1950static const struct inet6_protocol tcpv6_protocol = {
c7109986 1951 .early_demux = tcp_v6_early_demux,
1da177e4
LT
1952 .handler = tcp_v6_rcv,
1953 .err_handler = tcp_v6_err,
1954 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1955};
1956
1da177e4
LT
1957static struct inet_protosw tcpv6_protosw = {
1958 .type = SOCK_STREAM,
1959 .protocol = IPPROTO_TCP,
1960 .prot = &tcpv6_prot,
1961 .ops = &inet6_stream_ops,
1da177e4 1962 .no_check = 0,
d83d8461
ACM
1963 .flags = INET_PROTOSW_PERMANENT |
1964 INET_PROTOSW_ICSK,
1da177e4
LT
1965};
1966
2c8c1e72 1967static int __net_init tcpv6_net_init(struct net *net)
93ec926b 1968{
5677242f
DL
1969 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
1970 SOCK_RAW, IPPROTO_TCP, net);
93ec926b
DL
1971}
1972
2c8c1e72 1973static void __net_exit tcpv6_net_exit(struct net *net)
93ec926b 1974{
5677242f 1975 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
b099ce26
EB
1976}
1977
2c8c1e72 1978static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
b099ce26
EB
1979{
1980 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
93ec926b
DL
1981}
1982
1983static struct pernet_operations tcpv6_net_ops = {
b099ce26
EB
1984 .init = tcpv6_net_init,
1985 .exit = tcpv6_net_exit,
1986 .exit_batch = tcpv6_net_exit_batch,
93ec926b
DL
1987};
1988
7f4e4868 1989int __init tcpv6_init(void)
1da177e4 1990{
7f4e4868
DL
1991 int ret;
1992
3336288a
VY
1993 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
1994 if (ret)
c6b641a4 1995 goto out;
3336288a 1996
1da177e4 1997 /* register inet6 protocol */
7f4e4868
DL
1998 ret = inet6_register_protosw(&tcpv6_protosw);
1999 if (ret)
2000 goto out_tcpv6_protocol;
2001
93ec926b 2002 ret = register_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2003 if (ret)
2004 goto out_tcpv6_protosw;
2005out:
2006 return ret;
ae0f7d5f 2007
7f4e4868
DL
2008out_tcpv6_protosw:
2009 inet6_unregister_protosw(&tcpv6_protosw);
3336288a
VY
2010out_tcpv6_protocol:
2011 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
7f4e4868
DL
2012 goto out;
2013}
2014
09f7709f 2015void tcpv6_exit(void)
7f4e4868 2016{
93ec926b 2017 unregister_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2018 inet6_unregister_protosw(&tcpv6_protosw);
2019 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
1da177e4 2020}