tcp: dont drop MTU reduction indications
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / net / ipv6 / tcp_ipv6.c
CommitLineData
1da177e4
LT
1/*
2 * TCP over IPv6
1ab1457c 3 * Linux INET6 implementation
1da177e4
LT
4 *
5 * Authors:
1ab1457c 6 * Pedro Roque <roque@di.fc.ul.pt>
1da177e4 7 *
1ab1457c 8 * Based on:
1da177e4
LT
9 * linux/net/ipv4/tcp.c
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
12 *
13 * Fixes:
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allow both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 */
25
eb4dea58 26#include <linux/bottom_half.h>
1da177e4 27#include <linux/module.h>
1da177e4
LT
28#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
5a0e3ad6 41#include <linux/slab.h>
1da177e4
LT
42
43#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
5324a040 49#include <net/inet6_hashtables.h>
8129765a 50#include <net/inet6_connection_sock.h>
1da177e4
LT
51#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
1da177e4
LT
59#include <net/snmp.h>
60#include <net/dsfield.h>
6d6ee43e 61#include <net/timewait_sock.h>
18134bed 62#include <net/netdma.h>
3d58b5fa 63#include <net/inet_common.h>
6e5714ea 64#include <net/secure_seq.h>
d1a4c0b3 65#include <net/tcp_memcontrol.h>
1da177e4
LT
66
67#include <asm/uaccess.h>
68
69#include <linux/proc_fs.h>
70#include <linux/seq_file.h>
71
cfb6eeb4
YH
72#include <linux/crypto.h>
73#include <linux/scatterlist.h>
74
cfb6eeb4 75static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
6edafaaf
GJ
76static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
77 struct request_sock *req);
1da177e4
LT
78
79static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
8ad50d96 80static void __tcp_v6_send_check(struct sk_buff *skb,
b71d1d42
ED
81 const struct in6_addr *saddr,
82 const struct in6_addr *daddr);
1da177e4 83
3b401a81
SH
84static const struct inet_connection_sock_af_ops ipv6_mapped;
85static const struct inet_connection_sock_af_ops ipv6_specific;
a928630a 86#ifdef CONFIG_TCP_MD5SIG
b2e4b3de
SH
87static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
88static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
9501f972
YH
89#else
90static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 91 const struct in6_addr *addr)
9501f972
YH
92{
93 return NULL;
94}
a928630a 95#endif
1da177e4 96
1da177e4
LT
97static void tcp_v6_hash(struct sock *sk)
98{
99 if (sk->sk_state != TCP_CLOSE) {
8292a17a 100 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
1da177e4
LT
101 tcp_prot.hash(sk);
102 return;
103 }
104 local_bh_disable();
9327f705 105 __inet6_hash(sk, NULL);
1da177e4
LT
106 local_bh_enable();
107 }
108}
109
684f2176 110static __inline__ __sum16 tcp_v6_check(int len,
b71d1d42
ED
111 const struct in6_addr *saddr,
112 const struct in6_addr *daddr,
868c86bc 113 __wsum base)
1da177e4
LT
114{
115 return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
116}
117
cf533ea5 118static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
1da177e4 119{
0660e03f
ACM
120 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
121 ipv6_hdr(skb)->saddr.s6_addr32,
aa8223c7
ACM
122 tcp_hdr(skb)->dest,
123 tcp_hdr(skb)->source);
1da177e4
LT
124}
125
1ab1457c 126static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
1da177e4
LT
127 int addr_len)
128{
129 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
1ab1457c 130 struct inet_sock *inet = inet_sk(sk);
d83d8461 131 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
132 struct ipv6_pinfo *np = inet6_sk(sk);
133 struct tcp_sock *tp = tcp_sk(sk);
20c59de2 134 struct in6_addr *saddr = NULL, *final_p, final;
493f377d 135 struct rt6_info *rt;
4c9483b2 136 struct flowi6 fl6;
1da177e4
LT
137 struct dst_entry *dst;
138 int addr_type;
139 int err;
140
1ab1457c 141 if (addr_len < SIN6_LEN_RFC2133)
1da177e4
LT
142 return -EINVAL;
143
1ab1457c 144 if (usin->sin6_family != AF_INET6)
a02cec21 145 return -EAFNOSUPPORT;
1da177e4 146
4c9483b2 147 memset(&fl6, 0, sizeof(fl6));
1da177e4
LT
148
149 if (np->sndflow) {
4c9483b2
DM
150 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
151 IP6_ECN_flow_init(fl6.flowlabel);
152 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
1da177e4 153 struct ip6_flowlabel *flowlabel;
4c9483b2 154 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
1da177e4
LT
155 if (flowlabel == NULL)
156 return -EINVAL;
4e3fd7a0 157 usin->sin6_addr = flowlabel->dst;
1da177e4
LT
158 fl6_sock_release(flowlabel);
159 }
160 }
161
162 /*
1ab1457c
YH
163 * connect() to INADDR_ANY means loopback (BSD'ism).
164 */
165
166 if(ipv6_addr_any(&usin->sin6_addr))
167 usin->sin6_addr.s6_addr[15] = 0x1;
1da177e4
LT
168
169 addr_type = ipv6_addr_type(&usin->sin6_addr);
170
171 if(addr_type & IPV6_ADDR_MULTICAST)
172 return -ENETUNREACH;
173
174 if (addr_type&IPV6_ADDR_LINKLOCAL) {
175 if (addr_len >= sizeof(struct sockaddr_in6) &&
176 usin->sin6_scope_id) {
177 /* If interface is set while binding, indices
178 * must coincide.
179 */
180 if (sk->sk_bound_dev_if &&
181 sk->sk_bound_dev_if != usin->sin6_scope_id)
182 return -EINVAL;
183
184 sk->sk_bound_dev_if = usin->sin6_scope_id;
185 }
186
187 /* Connect to link-local address requires an interface */
188 if (!sk->sk_bound_dev_if)
189 return -EINVAL;
190 }
191
192 if (tp->rx_opt.ts_recent_stamp &&
193 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
194 tp->rx_opt.ts_recent = 0;
195 tp->rx_opt.ts_recent_stamp = 0;
196 tp->write_seq = 0;
197 }
198
4e3fd7a0 199 np->daddr = usin->sin6_addr;
4c9483b2 200 np->flow_label = fl6.flowlabel;
1da177e4
LT
201
202 /*
203 * TCP over IPv4
204 */
205
206 if (addr_type == IPV6_ADDR_MAPPED) {
d83d8461 207 u32 exthdrlen = icsk->icsk_ext_hdr_len;
1da177e4
LT
208 struct sockaddr_in sin;
209
210 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
211
212 if (__ipv6_only_sock(sk))
213 return -ENETUNREACH;
214
215 sin.sin_family = AF_INET;
216 sin.sin_port = usin->sin6_port;
217 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
218
d83d8461 219 icsk->icsk_af_ops = &ipv6_mapped;
1da177e4 220 sk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
221#ifdef CONFIG_TCP_MD5SIG
222 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
223#endif
1da177e4
LT
224
225 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
226
227 if (err) {
d83d8461
ACM
228 icsk->icsk_ext_hdr_len = exthdrlen;
229 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 230 sk->sk_backlog_rcv = tcp_v6_do_rcv;
cfb6eeb4
YH
231#ifdef CONFIG_TCP_MD5SIG
232 tp->af_specific = &tcp_sock_ipv6_specific;
233#endif
1da177e4
LT
234 goto failure;
235 } else {
c720c7e8
ED
236 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
237 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
238 &np->rcv_saddr);
1da177e4
LT
239 }
240
241 return err;
242 }
243
244 if (!ipv6_addr_any(&np->rcv_saddr))
245 saddr = &np->rcv_saddr;
246
4c9483b2 247 fl6.flowi6_proto = IPPROTO_TCP;
4e3fd7a0
AD
248 fl6.daddr = np->daddr;
249 fl6.saddr = saddr ? *saddr : np->saddr;
4c9483b2
DM
250 fl6.flowi6_oif = sk->sk_bound_dev_if;
251 fl6.flowi6_mark = sk->sk_mark;
1958b856
DM
252 fl6.fl6_dport = usin->sin6_port;
253 fl6.fl6_sport = inet->inet_sport;
1da177e4 254
4c9483b2 255 final_p = fl6_update_dst(&fl6, np->opt, &final);
1da177e4 256
4c9483b2 257 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
beb8d13b 258
4c9483b2 259 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
68d0c6d3
DM
260 if (IS_ERR(dst)) {
261 err = PTR_ERR(dst);
1da177e4 262 goto failure;
14e50e57 263 }
1da177e4
LT
264
265 if (saddr == NULL) {
4c9483b2 266 saddr = &fl6.saddr;
4e3fd7a0 267 np->rcv_saddr = *saddr;
1da177e4
LT
268 }
269
270 /* set the source address */
4e3fd7a0 271 np->saddr = *saddr;
c720c7e8 272 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 273
f83ef8c0 274 sk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 275 __ip6_dst_store(sk, dst, NULL, NULL);
1da177e4 276
493f377d
DM
277 rt = (struct rt6_info *) dst;
278 if (tcp_death_row.sysctl_tw_recycle &&
279 !tp->rx_opt.ts_recent_stamp &&
81166dd6
DM
280 ipv6_addr_equal(&rt->rt6i_dst.addr, &np->daddr))
281 tcp_fetch_timewait_stamp(sk, dst);
493f377d 282
d83d8461 283 icsk->icsk_ext_hdr_len = 0;
1da177e4 284 if (np->opt)
d83d8461
ACM
285 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
286 np->opt->opt_nflen);
1da177e4
LT
287
288 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
289
c720c7e8 290 inet->inet_dport = usin->sin6_port;
1da177e4
LT
291
292 tcp_set_state(sk, TCP_SYN_SENT);
d8313f5c 293 err = inet6_hash_connect(&tcp_death_row, sk);
1da177e4
LT
294 if (err)
295 goto late_failure;
296
297 if (!tp->write_seq)
298 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
299 np->daddr.s6_addr32,
c720c7e8
ED
300 inet->inet_sport,
301 inet->inet_dport);
1da177e4
LT
302
303 err = tcp_connect(sk);
304 if (err)
305 goto late_failure;
306
307 return 0;
308
309late_failure:
310 tcp_set_state(sk, TCP_CLOSE);
311 __sk_dst_reset(sk);
312failure:
c720c7e8 313 inet->inet_dport = 0;
1da177e4
LT
314 sk->sk_route_caps = 0;
315 return err;
316}
317
563d34d0
ED
318static void tcp_v6_mtu_reduced(struct sock *sk)
319{
320 struct dst_entry *dst;
321
322 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
323 return;
324
325 dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
326 if (!dst)
327 return;
328
329 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
330 tcp_sync_mss(sk, dst_mtu(dst));
331 tcp_simple_retransmit(sk);
332 }
333}
334
1da177e4 335static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
d5fdd6ba 336 u8 type, u8 code, int offset, __be32 info)
1da177e4 337{
b71d1d42 338 const struct ipv6hdr *hdr = (const struct ipv6hdr*)skb->data;
505cbfc5 339 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
1da177e4
LT
340 struct ipv6_pinfo *np;
341 struct sock *sk;
342 int err;
1ab1457c 343 struct tcp_sock *tp;
1da177e4 344 __u32 seq;
ca12a1a4 345 struct net *net = dev_net(skb->dev);
1da177e4 346
ca12a1a4 347 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
d86e0dac 348 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
1da177e4
LT
349
350 if (sk == NULL) {
e41b5368
DL
351 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
352 ICMP6_MIB_INERRORS);
1da177e4
LT
353 return;
354 }
355
356 if (sk->sk_state == TCP_TIME_WAIT) {
9469c7b4 357 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
358 return;
359 }
360
361 bh_lock_sock(sk);
563d34d0 362 if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
de0744af 363 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
1da177e4
LT
364
365 if (sk->sk_state == TCP_CLOSE)
366 goto out;
367
e802af9c
SH
368 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
369 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
370 goto out;
371 }
372
1da177e4 373 tp = tcp_sk(sk);
1ab1457c 374 seq = ntohl(th->seq);
1da177e4
LT
375 if (sk->sk_state != TCP_LISTEN &&
376 !between(seq, tp->snd_una, tp->snd_nxt)) {
de0744af 377 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
378 goto out;
379 }
380
381 np = inet6_sk(sk);
382
ec18d9a2
DM
383 if (type == NDISC_REDIRECT) {
384 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
385
1ed5c48f 386 if (dst)
6700c270 387 dst->ops->redirect(dst, sk, skb);
ec18d9a2
DM
388 }
389
1da177e4 390 if (type == ICMPV6_PKT_TOOBIG) {
563d34d0
ED
391 tp->mtu_info = ntohl(info);
392 if (!sock_owned_by_user(sk))
393 tcp_v6_mtu_reduced(sk);
394 else
395 set_bit(TCP_MTU_REDUCED_DEFERRED, &tp->tsq_flags);
1da177e4
LT
396 goto out;
397 }
398
399 icmpv6_err_convert(type, code, &err);
400
60236fdd 401 /* Might be for an request_sock */
1da177e4 402 switch (sk->sk_state) {
60236fdd 403 struct request_sock *req, **prev;
1da177e4
LT
404 case TCP_LISTEN:
405 if (sock_owned_by_user(sk))
406 goto out;
407
8129765a
ACM
408 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
409 &hdr->saddr, inet6_iif(skb));
1da177e4
LT
410 if (!req)
411 goto out;
412
413 /* ICMPs are not backlogged, hence we cannot get
414 * an established socket here.
415 */
547b792c 416 WARN_ON(req->sk != NULL);
1da177e4 417
2e6599cb 418 if (seq != tcp_rsk(req)->snt_isn) {
de0744af 419 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
420 goto out;
421 }
422
463c84b9 423 inet_csk_reqsk_queue_drop(sk, req, prev);
1da177e4
LT
424 goto out;
425
426 case TCP_SYN_SENT:
427 case TCP_SYN_RECV: /* Cannot happen.
1ab1457c 428 It can, it SYNs are crossed. --ANK */
1da177e4 429 if (!sock_owned_by_user(sk)) {
1da177e4
LT
430 sk->sk_err = err;
431 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
432
433 tcp_done(sk);
434 } else
435 sk->sk_err_soft = err;
436 goto out;
437 }
438
439 if (!sock_owned_by_user(sk) && np->recverr) {
440 sk->sk_err = err;
441 sk->sk_error_report(sk);
442 } else
443 sk->sk_err_soft = err;
444
445out:
446 bh_unlock_sock(sk);
447 sock_put(sk);
448}
449
450
9f10d3f6
NC
451static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
452 struct flowi6 *fl6,
3840a06e 453 struct request_sock *req,
fff32699
ED
454 struct request_values *rvp,
455 u16 queue_mapping)
1da177e4 456{
ca304b61 457 struct inet6_request_sock *treq = inet6_rsk(req);
1da177e4
LT
458 struct ipv6_pinfo *np = inet6_sk(sk);
459 struct sk_buff * skb;
9494218f 460 int err = -ENOMEM;
1da177e4 461
9f10d3f6
NC
462 /* First, grab a route. */
463 if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
fd80eb94 464 goto done;
9494218f 465
e6b4d113 466 skb = tcp_make_synack(sk, dst, req, rvp);
9494218f 467
1da177e4 468 if (skb) {
8ad50d96 469 __tcp_v6_send_check(skb, &treq->loc_addr, &treq->rmt_addr);
1da177e4 470
9f10d3f6 471 fl6->daddr = treq->rmt_addr;
fff32699 472 skb_set_queue_mapping(skb, queue_mapping);
43264e0b 473 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
b9df3cb8 474 err = net_xmit_eval(err);
1da177e4
LT
475 }
476
477done:
1da177e4
LT
478 return err;
479}
480
72659ecc
OP
481static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req,
482 struct request_values *rvp)
483{
9f10d3f6
NC
484 struct flowi6 fl6;
485
72659ecc 486 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
9f10d3f6 487 return tcp_v6_send_synack(sk, NULL, &fl6, req, rvp, 0);
72659ecc
OP
488}
489
60236fdd 490static void tcp_v6_reqsk_destructor(struct request_sock *req)
1da177e4 491{
800d55f1 492 kfree_skb(inet6_rsk(req)->pktopts);
1da177e4
LT
493}
494
cfb6eeb4
YH
495#ifdef CONFIG_TCP_MD5SIG
496static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 497 const struct in6_addr *addr)
cfb6eeb4 498{
a915da9b 499 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
cfb6eeb4
YH
500}
501
502static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
503 struct sock *addr_sk)
504{
505 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
506}
507
508static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
509 struct request_sock *req)
510{
511 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
512}
513
cfb6eeb4
YH
514static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
515 int optlen)
516{
517 struct tcp_md5sig cmd;
518 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
cfb6eeb4
YH
519
520 if (optlen < sizeof(cmd))
521 return -EINVAL;
522
523 if (copy_from_user(&cmd, optval, sizeof(cmd)))
524 return -EFAULT;
525
526 if (sin6->sin6_family != AF_INET6)
527 return -EINVAL;
528
529 if (!cmd.tcpm_keylen) {
e773e4fa 530 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
a915da9b
ED
531 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
532 AF_INET);
533 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
534 AF_INET6);
cfb6eeb4
YH
535 }
536
537 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
538 return -EINVAL;
539
a915da9b
ED
540 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
541 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
542 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4 543
a915da9b
ED
544 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
545 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4
YH
546}
547
49a72dfb 548static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
b71d1d42
ED
549 const struct in6_addr *daddr,
550 const struct in6_addr *saddr, int nbytes)
cfb6eeb4 551{
cfb6eeb4 552 struct tcp6_pseudohdr *bp;
49a72dfb 553 struct scatterlist sg;
8d26d76d 554
cfb6eeb4 555 bp = &hp->md5_blk.ip6;
cfb6eeb4 556 /* 1. TCP pseudo-header (RFC2460) */
4e3fd7a0
AD
557 bp->saddr = *saddr;
558 bp->daddr = *daddr;
49a72dfb 559 bp->protocol = cpu_to_be32(IPPROTO_TCP);
00b1304c 560 bp->len = cpu_to_be32(nbytes);
cfb6eeb4 561
49a72dfb
AL
562 sg_init_one(&sg, bp, sizeof(*bp));
563 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
564}
c7da57a1 565
49a72dfb 566static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
b71d1d42 567 const struct in6_addr *daddr, struct in6_addr *saddr,
318cf7aa 568 const struct tcphdr *th)
49a72dfb
AL
569{
570 struct tcp_md5sig_pool *hp;
571 struct hash_desc *desc;
572
573 hp = tcp_get_md5sig_pool();
574 if (!hp)
575 goto clear_hash_noput;
576 desc = &hp->md5_desc;
577
578 if (crypto_hash_init(desc))
579 goto clear_hash;
580 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
581 goto clear_hash;
582 if (tcp_md5_hash_header(hp, th))
583 goto clear_hash;
584 if (tcp_md5_hash_key(hp, key))
585 goto clear_hash;
586 if (crypto_hash_final(desc, md5_hash))
cfb6eeb4 587 goto clear_hash;
cfb6eeb4 588
cfb6eeb4 589 tcp_put_md5sig_pool();
cfb6eeb4 590 return 0;
49a72dfb 591
cfb6eeb4
YH
592clear_hash:
593 tcp_put_md5sig_pool();
594clear_hash_noput:
595 memset(md5_hash, 0, 16);
49a72dfb 596 return 1;
cfb6eeb4
YH
597}
598
49a72dfb 599static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
318cf7aa
ED
600 const struct sock *sk,
601 const struct request_sock *req,
602 const struct sk_buff *skb)
cfb6eeb4 603{
b71d1d42 604 const struct in6_addr *saddr, *daddr;
49a72dfb
AL
605 struct tcp_md5sig_pool *hp;
606 struct hash_desc *desc;
318cf7aa 607 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4
YH
608
609 if (sk) {
610 saddr = &inet6_sk(sk)->saddr;
611 daddr = &inet6_sk(sk)->daddr;
49a72dfb 612 } else if (req) {
cfb6eeb4
YH
613 saddr = &inet6_rsk(req)->loc_addr;
614 daddr = &inet6_rsk(req)->rmt_addr;
49a72dfb 615 } else {
b71d1d42 616 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
49a72dfb
AL
617 saddr = &ip6h->saddr;
618 daddr = &ip6h->daddr;
cfb6eeb4 619 }
49a72dfb
AL
620
621 hp = tcp_get_md5sig_pool();
622 if (!hp)
623 goto clear_hash_noput;
624 desc = &hp->md5_desc;
625
626 if (crypto_hash_init(desc))
627 goto clear_hash;
628
629 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
630 goto clear_hash;
631 if (tcp_md5_hash_header(hp, th))
632 goto clear_hash;
633 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
634 goto clear_hash;
635 if (tcp_md5_hash_key(hp, key))
636 goto clear_hash;
637 if (crypto_hash_final(desc, md5_hash))
638 goto clear_hash;
639
640 tcp_put_md5sig_pool();
641 return 0;
642
643clear_hash:
644 tcp_put_md5sig_pool();
645clear_hash_noput:
646 memset(md5_hash, 0, 16);
647 return 1;
cfb6eeb4
YH
648}
649
318cf7aa 650static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
cfb6eeb4 651{
cf533ea5 652 const __u8 *hash_location = NULL;
cfb6eeb4 653 struct tcp_md5sig_key *hash_expected;
b71d1d42 654 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
318cf7aa 655 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4 656 int genhash;
cfb6eeb4
YH
657 u8 newhash[16];
658
659 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
7d5d5525 660 hash_location = tcp_parse_md5sig_option(th);
cfb6eeb4 661
785957d3
DM
662 /* We've parsed the options - do we have a hash? */
663 if (!hash_expected && !hash_location)
664 return 0;
665
666 if (hash_expected && !hash_location) {
667 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
cfb6eeb4
YH
668 return 1;
669 }
670
785957d3
DM
671 if (!hash_expected && hash_location) {
672 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
cfb6eeb4
YH
673 return 1;
674 }
675
676 /* check the signature */
49a72dfb
AL
677 genhash = tcp_v6_md5_hash_skb(newhash,
678 hash_expected,
679 NULL, NULL, skb);
680
cfb6eeb4 681 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
e87cc472
JP
682 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
683 genhash ? "failed" : "mismatch",
684 &ip6h->saddr, ntohs(th->source),
685 &ip6h->daddr, ntohs(th->dest));
cfb6eeb4
YH
686 return 1;
687 }
688 return 0;
689}
690#endif
691
c6aefafb 692struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
1da177e4 693 .family = AF_INET6,
2e6599cb 694 .obj_size = sizeof(struct tcp6_request_sock),
72659ecc 695 .rtx_syn_ack = tcp_v6_rtx_synack,
60236fdd
ACM
696 .send_ack = tcp_v6_reqsk_send_ack,
697 .destructor = tcp_v6_reqsk_destructor,
72659ecc
OP
698 .send_reset = tcp_v6_send_reset,
699 .syn_ack_timeout = tcp_syn_ack_timeout,
1da177e4
LT
700};
701
cfb6eeb4 702#ifdef CONFIG_TCP_MD5SIG
b2e4b3de 703static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
cfb6eeb4 704 .md5_lookup = tcp_v6_reqsk_md5_lookup,
e3afe7b7 705 .calc_md5_hash = tcp_v6_md5_hash_skb,
cfb6eeb4 706};
b6332e6c 707#endif
cfb6eeb4 708
8ad50d96 709static void __tcp_v6_send_check(struct sk_buff *skb,
b71d1d42 710 const struct in6_addr *saddr, const struct in6_addr *daddr)
1da177e4 711{
aa8223c7 712 struct tcphdr *th = tcp_hdr(skb);
1da177e4 713
84fa7933 714 if (skb->ip_summed == CHECKSUM_PARTIAL) {
8ad50d96 715 th->check = ~tcp_v6_check(skb->len, saddr, daddr, 0);
663ead3b 716 skb->csum_start = skb_transport_header(skb) - skb->head;
ff1dcadb 717 skb->csum_offset = offsetof(struct tcphdr, check);
1da177e4 718 } else {
8ad50d96
HX
719 th->check = tcp_v6_check(skb->len, saddr, daddr,
720 csum_partial(th, th->doff << 2,
721 skb->csum));
1da177e4
LT
722 }
723}
724
bb296246 725static void tcp_v6_send_check(struct sock *sk, struct sk_buff *skb)
8ad50d96
HX
726{
727 struct ipv6_pinfo *np = inet6_sk(sk);
728
729 __tcp_v6_send_check(skb, &np->saddr, &np->daddr);
730}
731
a430a43d
HX
732static int tcp_v6_gso_send_check(struct sk_buff *skb)
733{
b71d1d42 734 const struct ipv6hdr *ipv6h;
a430a43d
HX
735 struct tcphdr *th;
736
737 if (!pskb_may_pull(skb, sizeof(*th)))
738 return -EINVAL;
739
0660e03f 740 ipv6h = ipv6_hdr(skb);
aa8223c7 741 th = tcp_hdr(skb);
a430a43d
HX
742
743 th->check = 0;
84fa7933 744 skb->ip_summed = CHECKSUM_PARTIAL;
8ad50d96 745 __tcp_v6_send_check(skb, &ipv6h->saddr, &ipv6h->daddr);
a430a43d
HX
746 return 0;
747}
1da177e4 748
36990673
HX
749static struct sk_buff **tcp6_gro_receive(struct sk_buff **head,
750 struct sk_buff *skb)
684f2176 751{
b71d1d42 752 const struct ipv6hdr *iph = skb_gro_network_header(skb);
684f2176
HX
753
754 switch (skb->ip_summed) {
755 case CHECKSUM_COMPLETE:
86911732 756 if (!tcp_v6_check(skb_gro_len(skb), &iph->saddr, &iph->daddr,
684f2176
HX
757 skb->csum)) {
758 skb->ip_summed = CHECKSUM_UNNECESSARY;
759 break;
760 }
761
762 /* fall through */
763 case CHECKSUM_NONE:
764 NAPI_GRO_CB(skb)->flush = 1;
765 return NULL;
766 }
767
768 return tcp_gro_receive(head, skb);
769}
684f2176 770
36990673 771static int tcp6_gro_complete(struct sk_buff *skb)
684f2176 772{
b71d1d42 773 const struct ipv6hdr *iph = ipv6_hdr(skb);
684f2176
HX
774 struct tcphdr *th = tcp_hdr(skb);
775
776 th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
777 &iph->saddr, &iph->daddr, 0);
778 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
779
780 return tcp_gro_complete(skb);
781}
684f2176 782
626e264d 783static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
b903d324 784 u32 ts, struct tcp_md5sig_key *key, int rst, u8 tclass)
1da177e4 785{
cf533ea5
ED
786 const struct tcphdr *th = tcp_hdr(skb);
787 struct tcphdr *t1;
1da177e4 788 struct sk_buff *buff;
4c9483b2 789 struct flowi6 fl6;
adf30907 790 struct net *net = dev_net(skb_dst(skb)->dev);
e5047992 791 struct sock *ctl_sk = net->ipv6.tcp_sk;
77c676da 792 unsigned int tot_len = sizeof(struct tcphdr);
adf30907 793 struct dst_entry *dst;
81ada62d 794 __be32 *topt;
1da177e4 795
626e264d
IJ
796 if (ts)
797 tot_len += TCPOLEN_TSTAMP_ALIGNED;
cfb6eeb4 798#ifdef CONFIG_TCP_MD5SIG
cfb6eeb4
YH
799 if (key)
800 tot_len += TCPOLEN_MD5SIG_ALIGNED;
801#endif
802
cfb6eeb4 803 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1da177e4 804 GFP_ATOMIC);
1ab1457c
YH
805 if (buff == NULL)
806 return;
1da177e4 807
cfb6eeb4 808 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1da177e4 809
cfb6eeb4 810 t1 = (struct tcphdr *) skb_push(buff, tot_len);
6651ffc8 811 skb_reset_transport_header(buff);
1da177e4
LT
812
813 /* Swap the send and the receive. */
814 memset(t1, 0, sizeof(*t1));
815 t1->dest = th->source;
816 t1->source = th->dest;
cfb6eeb4 817 t1->doff = tot_len / 4;
626e264d
IJ
818 t1->seq = htonl(seq);
819 t1->ack_seq = htonl(ack);
820 t1->ack = !rst || !th->ack;
821 t1->rst = rst;
822 t1->window = htons(win);
1da177e4 823
81ada62d
IJ
824 topt = (__be32 *)(t1 + 1);
825
626e264d
IJ
826 if (ts) {
827 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
828 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
829 *topt++ = htonl(tcp_time_stamp);
830 *topt++ = htonl(ts);
831 }
832
cfb6eeb4
YH
833#ifdef CONFIG_TCP_MD5SIG
834 if (key) {
81ada62d
IJ
835 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
836 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
837 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
78e645cb
IJ
838 &ipv6_hdr(skb)->saddr,
839 &ipv6_hdr(skb)->daddr, t1);
cfb6eeb4
YH
840 }
841#endif
842
4c9483b2 843 memset(&fl6, 0, sizeof(fl6));
4e3fd7a0
AD
844 fl6.daddr = ipv6_hdr(skb)->saddr;
845 fl6.saddr = ipv6_hdr(skb)->daddr;
1da177e4 846
e5700aff
DM
847 buff->ip_summed = CHECKSUM_PARTIAL;
848 buff->csum = 0;
849
4c9483b2 850 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
1da177e4 851
4c9483b2
DM
852 fl6.flowi6_proto = IPPROTO_TCP;
853 fl6.flowi6_oif = inet6_iif(skb);
1958b856
DM
854 fl6.fl6_dport = t1->dest;
855 fl6.fl6_sport = t1->source;
4c9483b2 856 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
1da177e4 857
c20121ae
DL
858 /* Pass a socket to ip6_dst_lookup either it is for RST
859 * Underlying function will use this to retrieve the network
860 * namespace
861 */
4c9483b2 862 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL, false);
68d0c6d3
DM
863 if (!IS_ERR(dst)) {
864 skb_dst_set(buff, dst);
b903d324 865 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
68d0c6d3
DM
866 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
867 if (rst)
868 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
869 return;
1da177e4
LT
870 }
871
872 kfree_skb(buff);
873}
874
626e264d 875static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1da177e4 876{
cf533ea5 877 const struct tcphdr *th = tcp_hdr(skb);
626e264d 878 u32 seq = 0, ack_seq = 0;
fa3e5b4e 879 struct tcp_md5sig_key *key = NULL;
658ddaaf
SL
880#ifdef CONFIG_TCP_MD5SIG
881 const __u8 *hash_location = NULL;
882 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
883 unsigned char newhash[16];
884 int genhash;
885 struct sock *sk1 = NULL;
886#endif
1da177e4 887
626e264d 888 if (th->rst)
1da177e4
LT
889 return;
890
626e264d
IJ
891 if (!ipv6_unicast_destination(skb))
892 return;
1da177e4 893
cfb6eeb4 894#ifdef CONFIG_TCP_MD5SIG
658ddaaf
SL
895 hash_location = tcp_parse_md5sig_option(th);
896 if (!sk && hash_location) {
897 /*
898 * active side is lost. Try to find listening socket through
899 * source port, and then find md5 key through listening socket.
900 * we are not loose security here:
901 * Incoming packet is checked with md5 hash with finding key,
902 * no RST generated if md5 hash doesn't match.
903 */
904 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
905 &tcp_hashinfo, &ipv6h->daddr,
906 ntohs(th->source), inet6_iif(skb));
907 if (!sk1)
908 return;
909
910 rcu_read_lock();
911 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
912 if (!key)
913 goto release_sk1;
914
915 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
916 if (genhash || memcmp(hash_location, newhash, 16) != 0)
917 goto release_sk1;
918 } else {
919 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
920 }
cfb6eeb4
YH
921#endif
922
626e264d
IJ
923 if (th->ack)
924 seq = ntohl(th->ack_seq);
925 else
926 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
927 (th->doff << 2);
1da177e4 928
b903d324 929 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, key, 1, 0);
658ddaaf
SL
930
931#ifdef CONFIG_TCP_MD5SIG
932release_sk1:
933 if (sk1) {
934 rcu_read_unlock();
935 sock_put(sk1);
936 }
937#endif
626e264d 938}
1da177e4 939
626e264d 940static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
b903d324 941 struct tcp_md5sig_key *key, u8 tclass)
626e264d 942{
b903d324 943 tcp_v6_send_response(skb, seq, ack, win, ts, key, 0, tclass);
1da177e4
LT
944}
945
946static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
947{
8feaf0c0 948 struct inet_timewait_sock *tw = inet_twsk(sk);
cfb6eeb4 949 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1da177e4 950
9501f972 951 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
8feaf0c0 952 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
b903d324
ED
953 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
954 tw->tw_tclass);
1da177e4 955
8feaf0c0 956 inet_twsk_put(tw);
1da177e4
LT
957}
958
6edafaaf
GJ
959static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
960 struct request_sock *req)
1da177e4 961{
9501f972 962 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
b903d324 963 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr), 0);
1da177e4
LT
964}
965
966
967static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
968{
60236fdd 969 struct request_sock *req, **prev;
aa8223c7 970 const struct tcphdr *th = tcp_hdr(skb);
1da177e4
LT
971 struct sock *nsk;
972
973 /* Find possible connection requests. */
8129765a 974 req = inet6_csk_search_req(sk, &prev, th->source,
0660e03f
ACM
975 &ipv6_hdr(skb)->saddr,
976 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1da177e4
LT
977 if (req)
978 return tcp_check_req(sk, skb, req, prev);
979
3b1e0a65 980 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
d86e0dac
PE
981 &ipv6_hdr(skb)->saddr, th->source,
982 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1da177e4
LT
983
984 if (nsk) {
985 if (nsk->sk_state != TCP_TIME_WAIT) {
986 bh_lock_sock(nsk);
987 return nsk;
988 }
9469c7b4 989 inet_twsk_put(inet_twsk(nsk));
1da177e4
LT
990 return NULL;
991 }
992
c6aefafb 993#ifdef CONFIG_SYN_COOKIES
af9b4738 994 if (!th->syn)
c6aefafb 995 sk = cookie_v6_check(sk, skb);
1da177e4
LT
996#endif
997 return sk;
998}
999
1da177e4
LT
1000/* FIXME: this is substantially similar to the ipv4 code.
1001 * Can some kind of merge be done? -- erics
1002 */
1003static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1004{
4957faad 1005 struct tcp_extend_values tmp_ext;
e6b4d113 1006 struct tcp_options_received tmp_opt;
cf533ea5 1007 const u8 *hash_location;
e6b4d113 1008 struct request_sock *req;
ca304b61 1009 struct inet6_request_sock *treq;
1da177e4 1010 struct ipv6_pinfo *np = inet6_sk(sk);
1da177e4 1011 struct tcp_sock *tp = tcp_sk(sk);
e6b4d113 1012 __u32 isn = TCP_SKB_CB(skb)->when;
493f377d 1013 struct dst_entry *dst = NULL;
3840a06e 1014 struct flowi6 fl6;
a2a385d6 1015 bool want_cookie = false;
1da177e4
LT
1016
1017 if (skb->protocol == htons(ETH_P_IP))
1018 return tcp_v4_conn_request(sk, skb);
1019
1020 if (!ipv6_unicast_destination(skb))
1ab1457c 1021 goto drop;
1da177e4 1022
463c84b9 1023 if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
946cedcc
ED
1024 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
1025 if (!want_cookie)
1026 goto drop;
1da177e4
LT
1027 }
1028
463c84b9 1029 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
1da177e4
LT
1030 goto drop;
1031
ca304b61 1032 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1da177e4
LT
1033 if (req == NULL)
1034 goto drop;
1035
cfb6eeb4
YH
1036#ifdef CONFIG_TCP_MD5SIG
1037 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1038#endif
1039
1da177e4
LT
1040 tcp_clear_options(&tmp_opt);
1041 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1042 tmp_opt.user_mss = tp->rx_opt.user_mss;
2100c8d2 1043 tcp_parse_options(skb, &tmp_opt, &hash_location, 0, NULL);
4957faad
WAS
1044
1045 if (tmp_opt.cookie_plus > 0 &&
1046 tmp_opt.saw_tstamp &&
1047 !tp->rx_opt.cookie_out_never &&
1048 (sysctl_tcp_cookie_size > 0 ||
1049 (tp->cookie_values != NULL &&
1050 tp->cookie_values->cookie_desired > 0))) {
1051 u8 *c;
1052 u32 *d;
1053 u32 *mess = &tmp_ext.cookie_bakery[COOKIE_DIGEST_WORDS];
1054 int l = tmp_opt.cookie_plus - TCPOLEN_COOKIE_BASE;
1055
1056 if (tcp_cookie_generator(&tmp_ext.cookie_bakery[0]) != 0)
1057 goto drop_and_free;
1058
1059 /* Secret recipe starts with IP addresses */
0eae88f3 1060 d = (__force u32 *)&ipv6_hdr(skb)->daddr.s6_addr32[0];
4957faad
WAS
1061 *mess++ ^= *d++;
1062 *mess++ ^= *d++;
1063 *mess++ ^= *d++;
1064 *mess++ ^= *d++;
0eae88f3 1065 d = (__force u32 *)&ipv6_hdr(skb)->saddr.s6_addr32[0];
4957faad
WAS
1066 *mess++ ^= *d++;
1067 *mess++ ^= *d++;
1068 *mess++ ^= *d++;
1069 *mess++ ^= *d++;
1070
1071 /* plus variable length Initiator Cookie */
1072 c = (u8 *)mess;
1073 while (l-- > 0)
1074 *c++ ^= *hash_location++;
1da177e4 1075
a2a385d6 1076 want_cookie = false; /* not our kind of cookie */
4957faad
WAS
1077 tmp_ext.cookie_out_never = 0; /* false */
1078 tmp_ext.cookie_plus = tmp_opt.cookie_plus;
1079 } else if (!tp->rx_opt.cookie_in_always) {
1080 /* redundant indications, but ensure initialization. */
1081 tmp_ext.cookie_out_never = 1; /* true */
1082 tmp_ext.cookie_plus = 0;
1083 } else {
1084 goto drop_and_free;
1085 }
1086 tmp_ext.cookie_in_always = tp->rx_opt.cookie_in_always;
1da177e4 1087
4dfc2817 1088 if (want_cookie && !tmp_opt.saw_tstamp)
c6aefafb 1089 tcp_clear_options(&tmp_opt);
c6aefafb 1090
1da177e4
LT
1091 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1092 tcp_openreq_init(req, &tmp_opt, skb);
1093
ca304b61 1094 treq = inet6_rsk(req);
4e3fd7a0
AD
1095 treq->rmt_addr = ipv6_hdr(skb)->saddr;
1096 treq->loc_addr = ipv6_hdr(skb)->daddr;
172d69e6 1097 if (!want_cookie || tmp_opt.tstamp_ok)
bd14b1b2 1098 TCP_ECN_create_request(req, skb);
c6aefafb 1099
4d0fe50c
ED
1100 treq->iif = sk->sk_bound_dev_if;
1101
1102 /* So that link locals have meaning */
1103 if (!sk->sk_bound_dev_if &&
1104 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1105 treq->iif = inet6_iif(skb);
1106
2bbdf389 1107 if (!isn) {
c6aefafb
GG
1108 if (ipv6_opt_accepted(sk, skb) ||
1109 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1110 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1111 atomic_inc(&skb->users);
1112 treq->pktopts = skb;
1113 }
493f377d
DM
1114
1115 if (want_cookie) {
2bbdf389
FW
1116 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1117 req->cookie_ts = tmp_opt.tstamp_ok;
493f377d
DM
1118 goto have_isn;
1119 }
1120
1121 /* VJ's idea. We save last timestamp seen
1122 * from the destination in peer table, when entering
1123 * state TIME-WAIT, and check against it before
1124 * accepting new connection request.
1125 *
1126 * If "isn" is not zero, this request hit alive
1127 * timewait bucket, so that all the necessary checks
1128 * are made in the function processing timewait state.
1129 */
1130 if (tmp_opt.saw_tstamp &&
1131 tcp_death_row.sysctl_tw_recycle &&
81166dd6
DM
1132 (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1133 if (!tcp_peer_is_proven(req, dst, true)) {
493f377d
DM
1134 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1135 goto drop_and_release;
1136 }
1137 }
1138 /* Kill the following clause, if you dislike this way. */
1139 else if (!sysctl_tcp_syncookies &&
1140 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1141 (sysctl_max_syn_backlog >> 2)) &&
81166dd6 1142 !tcp_peer_is_proven(req, dst, false)) {
493f377d
DM
1143 /* Without syncookies last quarter of
1144 * backlog is filled with destinations,
1145 * proven to be alive.
1146 * It means that we continue to communicate
1147 * to destinations, already remembered
1148 * to the moment of synflood.
1149 */
1150 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
1151 &treq->rmt_addr, ntohs(tcp_hdr(skb)->source));
1152 goto drop_and_release;
2bbdf389 1153 }
493f377d
DM
1154
1155 isn = tcp_v6_init_sequence(skb);
c6aefafb 1156 }
493f377d 1157have_isn:
2e6599cb 1158 tcp_rsk(req)->snt_isn = isn;
9ad7c049 1159 tcp_rsk(req)->snt_synack = tcp_time_stamp;
1da177e4 1160
437c5b53
NC
1161 if (security_inet_conn_request(sk, skb, req))
1162 goto drop_and_release;
4237c75c 1163
9f10d3f6 1164 if (tcp_v6_send_synack(sk, dst, &fl6, req,
fff32699
ED
1165 (struct request_values *)&tmp_ext,
1166 skb_get_queue_mapping(skb)) ||
4957faad 1167 want_cookie)
e6b4d113 1168 goto drop_and_free;
1da177e4 1169
e6b4d113
WAS
1170 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1171 return 0;
1da177e4 1172
493f377d
DM
1173drop_and_release:
1174 dst_release(dst);
e6b4d113
WAS
1175drop_and_free:
1176 reqsk_free(req);
1da177e4 1177drop:
1da177e4
LT
1178 return 0; /* don't send reset */
1179}
1180
1181static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
60236fdd 1182 struct request_sock *req,
1da177e4
LT
1183 struct dst_entry *dst)
1184{
78d15e82 1185 struct inet6_request_sock *treq;
1da177e4
LT
1186 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1187 struct tcp6_sock *newtcp6sk;
1188 struct inet_sock *newinet;
1189 struct tcp_sock *newtp;
1190 struct sock *newsk;
cfb6eeb4
YH
1191#ifdef CONFIG_TCP_MD5SIG
1192 struct tcp_md5sig_key *key;
1193#endif
3840a06e 1194 struct flowi6 fl6;
1da177e4
LT
1195
1196 if (skb->protocol == htons(ETH_P_IP)) {
1197 /*
1198 * v6 mapped
1199 */
1200
1201 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1202
1ab1457c 1203 if (newsk == NULL)
1da177e4
LT
1204 return NULL;
1205
1206 newtcp6sk = (struct tcp6_sock *)newsk;
1207 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1208
1209 newinet = inet_sk(newsk);
1210 newnp = inet6_sk(newsk);
1211 newtp = tcp_sk(newsk);
1212
1213 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1214
c720c7e8 1215 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newnp->daddr);
1da177e4 1216
c720c7e8 1217 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1da177e4 1218
4e3fd7a0 1219 newnp->rcv_saddr = newnp->saddr;
1da177e4 1220
8292a17a 1221 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1da177e4 1222 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
1223#ifdef CONFIG_TCP_MD5SIG
1224 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1225#endif
1226
676a1184
YZ
1227 newnp->ipv6_ac_list = NULL;
1228 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1229 newnp->pktoptions = NULL;
1230 newnp->opt = NULL;
505cbfc5 1231 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1232 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
4c507d28 1233 newnp->rcv_tclass = ipv6_tclass(ipv6_hdr(skb));
1da177e4 1234
e6848976
ACM
1235 /*
1236 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1237 * here, tcp_create_openreq_child now does this for us, see the comment in
1238 * that function for the gory details. -acme
1da177e4 1239 */
1da177e4
LT
1240
1241 /* It is tricky place. Until this moment IPv4 tcp
8292a17a 1242 worked with IPv6 icsk.icsk_af_ops.
1da177e4
LT
1243 Sync it now.
1244 */
d83d8461 1245 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1da177e4
LT
1246
1247 return newsk;
1248 }
1249
78d15e82 1250 treq = inet6_rsk(req);
1da177e4
LT
1251
1252 if (sk_acceptq_is_full(sk))
1253 goto out_overflow;
1254
493f377d 1255 if (!dst) {
3840a06e 1256 dst = inet6_csk_route_req(sk, &fl6, req);
493f377d 1257 if (!dst)
1da177e4 1258 goto out;
1ab1457c 1259 }
1da177e4
LT
1260
1261 newsk = tcp_create_openreq_child(sk, req, skb);
1262 if (newsk == NULL)
093d2823 1263 goto out_nonewsk;
1da177e4 1264
e6848976
ACM
1265 /*
1266 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1267 * count here, tcp_create_openreq_child now does this for us, see the
1268 * comment in that function for the gory details. -acme
1269 */
1da177e4 1270
59eed279 1271 newsk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 1272 __ip6_dst_store(newsk, dst, NULL, NULL);
1da177e4
LT
1273
1274 newtcp6sk = (struct tcp6_sock *)newsk;
1275 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1276
1277 newtp = tcp_sk(newsk);
1278 newinet = inet_sk(newsk);
1279 newnp = inet6_sk(newsk);
1280
1281 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1282
4e3fd7a0
AD
1283 newnp->daddr = treq->rmt_addr;
1284 newnp->saddr = treq->loc_addr;
1285 newnp->rcv_saddr = treq->loc_addr;
2e6599cb 1286 newsk->sk_bound_dev_if = treq->iif;
1da177e4 1287
1ab1457c 1288 /* Now IPv6 options...
1da177e4
LT
1289
1290 First: no IPv4 options.
1291 */
f6d8bd05 1292 newinet->inet_opt = NULL;
676a1184 1293 newnp->ipv6_ac_list = NULL;
d35690be 1294 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1295
1296 /* Clone RX bits */
1297 newnp->rxopt.all = np->rxopt.all;
1298
1299 /* Clone pktoptions received with SYN */
1300 newnp->pktoptions = NULL;
2e6599cb
ACM
1301 if (treq->pktopts != NULL) {
1302 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
ab185d7b 1303 consume_skb(treq->pktopts);
2e6599cb 1304 treq->pktopts = NULL;
1da177e4
LT
1305 if (newnp->pktoptions)
1306 skb_set_owner_r(newnp->pktoptions, newsk);
1307 }
1308 newnp->opt = NULL;
505cbfc5 1309 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1310 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
4c507d28 1311 newnp->rcv_tclass = ipv6_tclass(ipv6_hdr(skb));
1da177e4
LT
1312
1313 /* Clone native IPv6 options from listening socket (if any)
1314
1315 Yes, keeping reference count would be much more clever,
1316 but we make one more one thing there: reattach optmem
1317 to newsk.
1318 */
43264e0b
RL
1319 if (np->opt)
1320 newnp->opt = ipv6_dup_options(newsk, np->opt);
1da177e4 1321
d83d8461 1322 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1da177e4 1323 if (newnp->opt)
d83d8461
ACM
1324 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1325 newnp->opt->opt_flen);
1da177e4 1326
5d424d5a 1327 tcp_mtup_init(newsk);
1da177e4 1328 tcp_sync_mss(newsk, dst_mtu(dst));
0dbaee3b 1329 newtp->advmss = dst_metric_advmss(dst);
d135c522
NC
1330 if (tcp_sk(sk)->rx_opt.user_mss &&
1331 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1332 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1333
1da177e4 1334 tcp_initialize_rcv_mss(newsk);
9ad7c049
JC
1335 if (tcp_rsk(req)->snt_synack)
1336 tcp_valid_rtt_meas(newsk,
1337 tcp_time_stamp - tcp_rsk(req)->snt_synack);
1338 newtp->total_retrans = req->retrans;
1da177e4 1339
c720c7e8
ED
1340 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1341 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 1342
cfb6eeb4
YH
1343#ifdef CONFIG_TCP_MD5SIG
1344 /* Copy over the MD5 key from the original socket */
1345 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1346 /* We're using one, so create a matching key
1347 * on the newsk structure. If we fail to get
1348 * memory, then we end up not copying the key
1349 * across. Shucks.
1350 */
a915da9b
ED
1351 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newnp->daddr,
1352 AF_INET6, key->key, key->keylen, GFP_ATOMIC);
cfb6eeb4
YH
1353 }
1354#endif
1355
093d2823
BS
1356 if (__inet_inherit_port(sk, newsk) < 0) {
1357 sock_put(newsk);
1358 goto out;
1359 }
9327f705 1360 __inet6_hash(newsk, NULL);
1da177e4
LT
1361
1362 return newsk;
1363
1364out_overflow:
de0744af 1365 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
093d2823 1366out_nonewsk:
1da177e4 1367 dst_release(dst);
093d2823
BS
1368out:
1369 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1370 return NULL;
1371}
1372
b51655b9 1373static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1da177e4 1374{
84fa7933 1375 if (skb->ip_summed == CHECKSUM_COMPLETE) {
684f2176 1376 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
0660e03f 1377 &ipv6_hdr(skb)->daddr, skb->csum)) {
fb286bb2 1378 skb->ip_summed = CHECKSUM_UNNECESSARY;
1da177e4 1379 return 0;
fb286bb2 1380 }
1da177e4 1381 }
fb286bb2 1382
684f2176 1383 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
0660e03f
ACM
1384 &ipv6_hdr(skb)->saddr,
1385 &ipv6_hdr(skb)->daddr, 0));
fb286bb2 1386
1da177e4 1387 if (skb->len <= 76) {
fb286bb2 1388 return __skb_checksum_complete(skb);
1da177e4
LT
1389 }
1390 return 0;
1391}
1392
1393/* The socket must have it's spinlock held when we get
1394 * here.
1395 *
1396 * We have a potential double-lock case here, so even when
1397 * doing backlog processing we use the BH locking scheme.
1398 * This is because we cannot sleep with the original spinlock
1399 * held.
1400 */
1401static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1402{
1403 struct ipv6_pinfo *np = inet6_sk(sk);
1404 struct tcp_sock *tp;
1405 struct sk_buff *opt_skb = NULL;
1406
1407 /* Imagine: socket is IPv6. IPv4 packet arrives,
1408 goes to IPv4 receive handler and backlogged.
1409 From backlog it always goes here. Kerboom...
1410 Fortunately, tcp_rcv_established and rcv_established
1411 handle them correctly, but it is not case with
1412 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1413 */
1414
1415 if (skb->protocol == htons(ETH_P_IP))
1416 return tcp_v4_do_rcv(sk, skb);
1417
cfb6eeb4
YH
1418#ifdef CONFIG_TCP_MD5SIG
1419 if (tcp_v6_inbound_md5_hash (sk, skb))
1420 goto discard;
1421#endif
1422
fda9ef5d 1423 if (sk_filter(sk, skb))
1da177e4
LT
1424 goto discard;
1425
1426 /*
1427 * socket locking is here for SMP purposes as backlog rcv
1428 * is currently called with bh processing disabled.
1429 */
1430
1431 /* Do Stevens' IPV6_PKTOPTIONS.
1432
1433 Yes, guys, it is the only place in our code, where we
1434 may make it not affecting IPv4.
1435 The rest of code is protocol independent,
1436 and I do not like idea to uglify IPv4.
1437
1438 Actually, all the idea behind IPV6_PKTOPTIONS
1439 looks not very well thought. For now we latch
1440 options, received in the last packet, enqueued
1441 by tcp. Feel free to propose better solution.
1ab1457c 1442 --ANK (980728)
1da177e4
LT
1443 */
1444 if (np->rxopt.all)
1445 opt_skb = skb_clone(skb, GFP_ATOMIC);
1446
1447 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
bdeab991 1448 sock_rps_save_rxhash(sk, skb);
aa8223c7 1449 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1da177e4 1450 goto reset;
1da177e4
LT
1451 if (opt_skb)
1452 goto ipv6_pktoptions;
1453 return 0;
1454 }
1455
ab6a5bb6 1456 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1da177e4
LT
1457 goto csum_err;
1458
1ab1457c 1459 if (sk->sk_state == TCP_LISTEN) {
1da177e4
LT
1460 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1461 if (!nsk)
1462 goto discard;
1463
1464 /*
1465 * Queue it on the new socket if the new socket is active,
1466 * otherwise we just shortcircuit this and continue with
1467 * the new socket..
1468 */
1ab1457c 1469 if(nsk != sk) {
bdeab991 1470 sock_rps_save_rxhash(nsk, skb);
1da177e4
LT
1471 if (tcp_child_process(sk, nsk, skb))
1472 goto reset;
1473 if (opt_skb)
1474 __kfree_skb(opt_skb);
1475 return 0;
1476 }
47482f13 1477 } else
bdeab991 1478 sock_rps_save_rxhash(sk, skb);
1da177e4 1479
aa8223c7 1480 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1da177e4 1481 goto reset;
1da177e4
LT
1482 if (opt_skb)
1483 goto ipv6_pktoptions;
1484 return 0;
1485
1486reset:
cfb6eeb4 1487 tcp_v6_send_reset(sk, skb);
1da177e4
LT
1488discard:
1489 if (opt_skb)
1490 __kfree_skb(opt_skb);
1491 kfree_skb(skb);
1492 return 0;
1493csum_err:
63231bdd 1494 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1da177e4
LT
1495 goto discard;
1496
1497
1498ipv6_pktoptions:
1499 /* Do you ask, what is it?
1500
1501 1. skb was enqueued by tcp.
1502 2. skb is added to tail of read queue, rather than out of order.
1503 3. socket is not in passive state.
1504 4. Finally, it really contains options, which user wants to receive.
1505 */
1506 tp = tcp_sk(sk);
1507 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1508 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
333fad53 1509 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
505cbfc5 1510 np->mcast_oif = inet6_iif(opt_skb);
333fad53 1511 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
0660e03f 1512 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
4c507d28
JB
1513 if (np->rxopt.bits.rxtclass)
1514 np->rcv_tclass = ipv6_tclass(ipv6_hdr(skb));
1da177e4
LT
1515 if (ipv6_opt_accepted(sk, opt_skb)) {
1516 skb_set_owner_r(opt_skb, sk);
1517 opt_skb = xchg(&np->pktoptions, opt_skb);
1518 } else {
1519 __kfree_skb(opt_skb);
1520 opt_skb = xchg(&np->pktoptions, NULL);
1521 }
1522 }
1523
800d55f1 1524 kfree_skb(opt_skb);
1da177e4
LT
1525 return 0;
1526}
1527
e5bbef20 1528static int tcp_v6_rcv(struct sk_buff *skb)
1da177e4 1529{
cf533ea5 1530 const struct tcphdr *th;
b71d1d42 1531 const struct ipv6hdr *hdr;
1da177e4
LT
1532 struct sock *sk;
1533 int ret;
a86b1e30 1534 struct net *net = dev_net(skb->dev);
1da177e4
LT
1535
1536 if (skb->pkt_type != PACKET_HOST)
1537 goto discard_it;
1538
1539 /*
1540 * Count it even if it's bad.
1541 */
63231bdd 1542 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1da177e4
LT
1543
1544 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1545 goto discard_it;
1546
aa8223c7 1547 th = tcp_hdr(skb);
1da177e4
LT
1548
1549 if (th->doff < sizeof(struct tcphdr)/4)
1550 goto bad_packet;
1551 if (!pskb_may_pull(skb, th->doff*4))
1552 goto discard_it;
1553
60476372 1554 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1da177e4
LT
1555 goto bad_packet;
1556
aa8223c7 1557 th = tcp_hdr(skb);
e802af9c 1558 hdr = ipv6_hdr(skb);
1da177e4
LT
1559 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1560 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1561 skb->len - th->doff*4);
1562 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1563 TCP_SKB_CB(skb)->when = 0;
b82d1bb4 1564 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
1da177e4
LT
1565 TCP_SKB_CB(skb)->sacked = 0;
1566
9a1f27c4 1567 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1da177e4
LT
1568 if (!sk)
1569 goto no_tcp_socket;
1570
1571process:
1572 if (sk->sk_state == TCP_TIME_WAIT)
1573 goto do_time_wait;
1574
e802af9c
SH
1575 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1576 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1577 goto discard_and_relse;
1578 }
1579
1da177e4
LT
1580 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1581 goto discard_and_relse;
1582
fda9ef5d 1583 if (sk_filter(sk, skb))
1da177e4
LT
1584 goto discard_and_relse;
1585
1586 skb->dev = NULL;
1587
293b9c42 1588 bh_lock_sock_nested(sk);
1da177e4
LT
1589 ret = 0;
1590 if (!sock_owned_by_user(sk)) {
1a2449a8 1591#ifdef CONFIG_NET_DMA
1ab1457c 1592 struct tcp_sock *tp = tcp_sk(sk);
b4caea8a 1593 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
a2bd1140 1594 tp->ucopy.dma_chan = net_dma_find_channel();
1ab1457c
YH
1595 if (tp->ucopy.dma_chan)
1596 ret = tcp_v6_do_rcv(sk, skb);
1597 else
1a2449a8
CL
1598#endif
1599 {
1600 if (!tcp_prequeue(sk, skb))
1601 ret = tcp_v6_do_rcv(sk, skb);
1602 }
da882c1f
ED
1603 } else if (unlikely(sk_add_backlog(sk, skb,
1604 sk->sk_rcvbuf + sk->sk_sndbuf))) {
6b03a53a 1605 bh_unlock_sock(sk);
6cce09f8 1606 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
6b03a53a
ZY
1607 goto discard_and_relse;
1608 }
1da177e4
LT
1609 bh_unlock_sock(sk);
1610
1611 sock_put(sk);
1612 return ret ? -1 : 0;
1613
1614no_tcp_socket:
1615 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1616 goto discard_it;
1617
1618 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1619bad_packet:
63231bdd 1620 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1da177e4 1621 } else {
cfb6eeb4 1622 tcp_v6_send_reset(NULL, skb);
1da177e4
LT
1623 }
1624
1625discard_it:
1626
1627 /*
1628 * Discard frame
1629 */
1630
1631 kfree_skb(skb);
1632 return 0;
1633
1634discard_and_relse:
1635 sock_put(sk);
1636 goto discard_it;
1637
1638do_time_wait:
1639 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
9469c7b4 1640 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1641 goto discard_it;
1642 }
1643
1644 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
63231bdd 1645 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
9469c7b4 1646 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1647 goto discard_it;
1648 }
1649
9469c7b4 1650 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1da177e4
LT
1651 case TCP_TW_SYN:
1652 {
1653 struct sock *sk2;
1654
c346dca1 1655 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
0660e03f 1656 &ipv6_hdr(skb)->daddr,
505cbfc5 1657 ntohs(th->dest), inet6_iif(skb));
1da177e4 1658 if (sk2 != NULL) {
295ff7ed
ACM
1659 struct inet_timewait_sock *tw = inet_twsk(sk);
1660 inet_twsk_deschedule(tw, &tcp_death_row);
1661 inet_twsk_put(tw);
1da177e4
LT
1662 sk = sk2;
1663 goto process;
1664 }
1665 /* Fall through to ACK */
1666 }
1667 case TCP_TW_ACK:
1668 tcp_v6_timewait_ack(sk, skb);
1669 break;
1670 case TCP_TW_RST:
1671 goto no_tcp_socket;
1672 case TCP_TW_SUCCESS:;
1673 }
1674 goto discard_it;
1675}
1676
ccb7c410
DM
1677static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1678 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1679 .twsk_unique = tcp_twsk_unique,
1680 .twsk_destructor= tcp_twsk_destructor,
ccb7c410
DM
1681};
1682
3b401a81 1683static const struct inet_connection_sock_af_ops ipv6_specific = {
543d9cfe
ACM
1684 .queue_xmit = inet6_csk_xmit,
1685 .send_check = tcp_v6_send_check,
1686 .rebuild_header = inet6_sk_rebuild_header,
1687 .conn_request = tcp_v6_conn_request,
1688 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe 1689 .net_header_len = sizeof(struct ipv6hdr),
67469601 1690 .net_frag_header_len = sizeof(struct frag_hdr),
543d9cfe
ACM
1691 .setsockopt = ipv6_setsockopt,
1692 .getsockopt = ipv6_getsockopt,
1693 .addr2sockaddr = inet6_csk_addr2sockaddr,
1694 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1695 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1696#ifdef CONFIG_COMPAT
543d9cfe
ACM
1697 .compat_setsockopt = compat_ipv6_setsockopt,
1698 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1699#endif
1da177e4
LT
1700};
1701
#ifdef CONFIG_TCP_MD5SIG
/* MD5 signature hooks for native IPv6 sockets; set in tcp_v6_init_sock(). */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_lookup	= tcp_v6_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1709
1da177e4
LT
1710/*
1711 * TCP over IPv4 via INET6 API
1712 */
1713
3b401a81 1714static const struct inet_connection_sock_af_ops ipv6_mapped = {
543d9cfe
ACM
1715 .queue_xmit = ip_queue_xmit,
1716 .send_check = tcp_v4_send_check,
1717 .rebuild_header = inet_sk_rebuild_header,
1718 .conn_request = tcp_v6_conn_request,
1719 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe
ACM
1720 .net_header_len = sizeof(struct iphdr),
1721 .setsockopt = ipv6_setsockopt,
1722 .getsockopt = ipv6_getsockopt,
1723 .addr2sockaddr = inet6_csk_addr2sockaddr,
1724 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1725 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1726#ifdef CONFIG_COMPAT
543d9cfe
ACM
1727 .compat_setsockopt = compat_ipv6_setsockopt,
1728 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1729#endif
1da177e4
LT
1730};
1731
#ifdef CONFIG_TCP_MD5SIG
/*
 * MD5 signature hooks for v4-mapped sockets: lookup and hashing use the
 * IPv4 routines, key parsing stays with the IPv6 one.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_lookup	= tcp_v4_md5_lookup,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
cfb6eeb4 1739
1da177e4
LT
1740/* NOTE: A lot of things set to zero explicitly by call to
1741 * sk_alloc() so need not be done here.
1742 */
1743static int tcp_v6_init_sock(struct sock *sk)
1744{
6687e988 1745 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4 1746
900f65d3 1747 tcp_init_sock(sk);
1da177e4 1748
8292a17a 1749 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 1750
cfb6eeb4 1751#ifdef CONFIG_TCP_MD5SIG
ac807fa8 1752 tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
cfb6eeb4
YH
1753#endif
1754
1da177e4
LT
1755 return 0;
1756}
1757
/*
 * Tear down a TCPv6 socket: the shared TCP teardown runs first
 * (tcp_v4_destroy_sock()), followed by the IPv6 socket teardown.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
	tcp_v4_destroy_sock(sk);
	inet6_destroy_sock(sk);
}
1763
952a10be 1764#ifdef CONFIG_PROC_FS
1da177e4 1765/* Proc filesystem TCPv6 sock list dumping. */
1ab1457c 1766static void get_openreq6(struct seq_file *seq,
cf533ea5 1767 const struct sock *sk, struct request_sock *req, int i, int uid)
1da177e4 1768{
1da177e4 1769 int ttd = req->expires - jiffies;
b71d1d42
ED
1770 const struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1771 const struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1da177e4
LT
1772
1773 if (ttd < 0)
1774 ttd = 0;
1775
1da177e4
LT
1776 seq_printf(seq,
1777 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1778 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1da177e4
LT
1779 i,
1780 src->s6_addr32[0], src->s6_addr32[1],
1781 src->s6_addr32[2], src->s6_addr32[3],
fd507037 1782 ntohs(inet_rsk(req)->loc_port),
1da177e4
LT
1783 dest->s6_addr32[0], dest->s6_addr32[1],
1784 dest->s6_addr32[2], dest->s6_addr32[3],
2e6599cb 1785 ntohs(inet_rsk(req)->rmt_port),
1da177e4
LT
1786 TCP_SYN_RECV,
1787 0,0, /* could print option size, but that is af dependent. */
1ab1457c
YH
1788 1, /* timers active (only the expire timer) */
1789 jiffies_to_clock_t(ttd),
1da177e4
LT
1790 req->retrans,
1791 uid,
1ab1457c 1792 0, /* non standard timer */
1da177e4
LT
1793 0, /* open_requests have no inode */
1794 0, req);
1795}
1796
1797static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1798{
b71d1d42 1799 const struct in6_addr *dest, *src;
1da177e4
LT
1800 __u16 destp, srcp;
1801 int timer_active;
1802 unsigned long timer_expires;
cf533ea5
ED
1803 const struct inet_sock *inet = inet_sk(sp);
1804 const struct tcp_sock *tp = tcp_sk(sp);
463c84b9 1805 const struct inet_connection_sock *icsk = inet_csk(sp);
cf533ea5 1806 const struct ipv6_pinfo *np = inet6_sk(sp);
1da177e4
LT
1807
1808 dest = &np->daddr;
1809 src = &np->rcv_saddr;
c720c7e8
ED
1810 destp = ntohs(inet->inet_dport);
1811 srcp = ntohs(inet->inet_sport);
463c84b9
ACM
1812
1813 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1da177e4 1814 timer_active = 1;
463c84b9
ACM
1815 timer_expires = icsk->icsk_timeout;
1816 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1da177e4 1817 timer_active = 4;
463c84b9 1818 timer_expires = icsk->icsk_timeout;
1da177e4
LT
1819 } else if (timer_pending(&sp->sk_timer)) {
1820 timer_active = 2;
1821 timer_expires = sp->sk_timer.expires;
1822 } else {
1823 timer_active = 0;
1824 timer_expires = jiffies;
1825 }
1826
1827 seq_printf(seq,
1828 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1829 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %pK %lu %lu %u %u %d\n",
1da177e4
LT
1830 i,
1831 src->s6_addr32[0], src->s6_addr32[1],
1832 src->s6_addr32[2], src->s6_addr32[3], srcp,
1833 dest->s6_addr32[0], dest->s6_addr32[1],
1834 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1ab1457c 1835 sp->sk_state,
47da8ee6
SS
1836 tp->write_seq-tp->snd_una,
1837 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1da177e4
LT
1838 timer_active,
1839 jiffies_to_clock_t(timer_expires - jiffies),
463c84b9 1840 icsk->icsk_retransmits,
1da177e4 1841 sock_i_uid(sp),
6687e988 1842 icsk->icsk_probes_out,
1da177e4
LT
1843 sock_i_ino(sp),
1844 atomic_read(&sp->sk_refcnt), sp,
7be87351
SH
1845 jiffies_to_clock_t(icsk->icsk_rto),
1846 jiffies_to_clock_t(icsk->icsk_ack.ato),
463c84b9 1847 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
0b6a05c1
IJ
1848 tp->snd_cwnd,
1849 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
1da177e4
LT
1850 );
1851}
1852
1ab1457c 1853static void get_timewait6_sock(struct seq_file *seq,
8feaf0c0 1854 struct inet_timewait_sock *tw, int i)
1da177e4 1855{
b71d1d42 1856 const struct in6_addr *dest, *src;
1da177e4 1857 __u16 destp, srcp;
cf533ea5 1858 const struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
1da177e4
LT
1859 int ttd = tw->tw_ttd - jiffies;
1860
1861 if (ttd < 0)
1862 ttd = 0;
1863
0fa1a53e
ACM
1864 dest = &tw6->tw_v6_daddr;
1865 src = &tw6->tw_v6_rcv_saddr;
1da177e4
LT
1866 destp = ntohs(tw->tw_dport);
1867 srcp = ntohs(tw->tw_sport);
1868
1869 seq_printf(seq,
1870 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1871 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1da177e4
LT
1872 i,
1873 src->s6_addr32[0], src->s6_addr32[1],
1874 src->s6_addr32[2], src->s6_addr32[3], srcp,
1875 dest->s6_addr32[0], dest->s6_addr32[1],
1876 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1877 tw->tw_substate, 0, 0,
1878 3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
1879 atomic_read(&tw->tw_refcnt), tw);
1880}
1881
1da177e4
LT
1882static int tcp6_seq_show(struct seq_file *seq, void *v)
1883{
1884 struct tcp_iter_state *st;
1885
1886 if (v == SEQ_START_TOKEN) {
1887 seq_puts(seq,
1888 " sl "
1889 "local_address "
1890 "remote_address "
1891 "st tx_queue rx_queue tr tm->when retrnsmt"
1892 " uid timeout inode\n");
1893 goto out;
1894 }
1895 st = seq->private;
1896
1897 switch (st->state) {
1898 case TCP_SEQ_STATE_LISTENING:
1899 case TCP_SEQ_STATE_ESTABLISHED:
1900 get_tcp6_sock(seq, v, st->num);
1901 break;
1902 case TCP_SEQ_STATE_OPENREQ:
1903 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1904 break;
1905 case TCP_SEQ_STATE_TIME_WAIT:
1906 get_timewait6_sock(seq, v, st->num);
1907 break;
1908 }
1909out:
1910 return 0;
1911}
1912
73cb88ec
AV
1913static const struct file_operations tcp6_afinfo_seq_fops = {
1914 .owner = THIS_MODULE,
1915 .open = tcp_seq_open,
1916 .read = seq_read,
1917 .llseek = seq_lseek,
1918 .release = seq_release_net
1919};
1920
1da177e4 1921static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1da177e4
LT
1922 .name = "tcp6",
1923 .family = AF_INET6,
73cb88ec 1924 .seq_fops = &tcp6_afinfo_seq_fops,
9427c4b3
DL
1925 .seq_ops = {
1926 .show = tcp6_seq_show,
1927 },
1da177e4
LT
1928};
1929
2c8c1e72 1930int __net_init tcp6_proc_init(struct net *net)
1da177e4 1931{
6f8b13bc 1932 return tcp_proc_register(net, &tcp6_seq_afinfo);
1da177e4
LT
1933}
1934
6f8b13bc 1935void tcp6_proc_exit(struct net *net)
1da177e4 1936{
6f8b13bc 1937 tcp_proc_unregister(net, &tcp6_seq_afinfo);
1da177e4
LT
1938}
1939#endif
1940
1941struct proto tcpv6_prot = {
1942 .name = "TCPv6",
1943 .owner = THIS_MODULE,
1944 .close = tcp_close,
1945 .connect = tcp_v6_connect,
1946 .disconnect = tcp_disconnect,
463c84b9 1947 .accept = inet_csk_accept,
1da177e4
LT
1948 .ioctl = tcp_ioctl,
1949 .init = tcp_v6_init_sock,
1950 .destroy = tcp_v6_destroy_sock,
1951 .shutdown = tcp_shutdown,
1952 .setsockopt = tcp_setsockopt,
1953 .getsockopt = tcp_getsockopt,
1da177e4 1954 .recvmsg = tcp_recvmsg,
7ba42910
CG
1955 .sendmsg = tcp_sendmsg,
1956 .sendpage = tcp_sendpage,
1da177e4 1957 .backlog_rcv = tcp_v6_do_rcv,
46d3ceab 1958 .release_cb = tcp_release_cb,
563d34d0 1959 .mtu_reduced = tcp_v6_mtu_reduced,
1da177e4 1960 .hash = tcp_v6_hash,
ab1e0a13
ACM
1961 .unhash = inet_unhash,
1962 .get_port = inet_csk_get_port,
1da177e4
LT
1963 .enter_memory_pressure = tcp_enter_memory_pressure,
1964 .sockets_allocated = &tcp_sockets_allocated,
1965 .memory_allocated = &tcp_memory_allocated,
1966 .memory_pressure = &tcp_memory_pressure,
0a5578cf 1967 .orphan_count = &tcp_orphan_count,
1da177e4
LT
1968 .sysctl_wmem = sysctl_tcp_wmem,
1969 .sysctl_rmem = sysctl_tcp_rmem,
1970 .max_header = MAX_TCP_HEADER,
1971 .obj_size = sizeof(struct tcp6_sock),
3ab5aee7 1972 .slab_flags = SLAB_DESTROY_BY_RCU,
6d6ee43e 1973 .twsk_prot = &tcp6_timewait_sock_ops,
60236fdd 1974 .rsk_prot = &tcp6_request_sock_ops,
39d8cda7 1975 .h.hashinfo = &tcp_hashinfo,
7ba42910 1976 .no_autobind = true,
543d9cfe
ACM
1977#ifdef CONFIG_COMPAT
1978 .compat_setsockopt = compat_tcp_setsockopt,
1979 .compat_getsockopt = compat_tcp_getsockopt,
1980#endif
d1a4c0b3
GC
1981#ifdef CONFIG_CGROUP_MEM_RES_CTLR_KMEM
1982 .proto_cgroup = tcp_proto_cgroup,
1983#endif
1da177e4
LT
1984};
1985
41135cc8 1986static const struct inet6_protocol tcpv6_protocol = {
1da177e4
LT
1987 .handler = tcp_v6_rcv,
1988 .err_handler = tcp_v6_err,
a430a43d 1989 .gso_send_check = tcp_v6_gso_send_check,
adcfc7d0 1990 .gso_segment = tcp_tso_segment,
684f2176
HX
1991 .gro_receive = tcp6_gro_receive,
1992 .gro_complete = tcp6_gro_complete,
1da177e4
LT
1993 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1994};
1995
1da177e4
LT
1996static struct inet_protosw tcpv6_protosw = {
1997 .type = SOCK_STREAM,
1998 .protocol = IPPROTO_TCP,
1999 .prot = &tcpv6_prot,
2000 .ops = &inet6_stream_ops,
1da177e4 2001 .no_check = 0,
d83d8461
ACM
2002 .flags = INET_PROTOSW_PERMANENT |
2003 INET_PROTOSW_ICSK,
1da177e4
LT
2004};
2005
2c8c1e72 2006static int __net_init tcpv6_net_init(struct net *net)
93ec926b 2007{
5677242f
DL
2008 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2009 SOCK_RAW, IPPROTO_TCP, net);
93ec926b
DL
2010}
2011
2c8c1e72 2012static void __net_exit tcpv6_net_exit(struct net *net)
93ec926b 2013{
5677242f 2014 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
b099ce26
EB
2015}
2016
2c8c1e72 2017static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
b099ce26
EB
2018{
2019 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
93ec926b
DL
2020}
2021
2022static struct pernet_operations tcpv6_net_ops = {
b099ce26
EB
2023 .init = tcpv6_net_init,
2024 .exit = tcpv6_net_exit,
2025 .exit_batch = tcpv6_net_exit_batch,
93ec926b
DL
2026};
2027
7f4e4868 2028int __init tcpv6_init(void)
1da177e4 2029{
7f4e4868
DL
2030 int ret;
2031
2032 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2033 if (ret)
2034 goto out;
2035
1da177e4 2036 /* register inet6 protocol */
7f4e4868
DL
2037 ret = inet6_register_protosw(&tcpv6_protosw);
2038 if (ret)
2039 goto out_tcpv6_protocol;
2040
93ec926b 2041 ret = register_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2042 if (ret)
2043 goto out_tcpv6_protosw;
2044out:
2045 return ret;
ae0f7d5f 2046
7f4e4868
DL
2047out_tcpv6_protocol:
2048 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2049out_tcpv6_protosw:
2050 inet6_unregister_protosw(&tcpv6_protosw);
2051 goto out;
2052}
2053
09f7709f 2054void tcpv6_exit(void)
7f4e4868 2055{
93ec926b 2056 unregister_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2057 inet6_unregister_protosw(&tcpv6_protosw);
2058 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
1da177e4 2059}