]> git.ipfire.org Git - people/ms/linux.git/blame - net/ipv6/tcp_ipv6.c
bgmac: connect to PHY and make use of PHY device
[people/ms/linux.git] / net / ipv6 / tcp_ipv6.c
CommitLineData
1da177e4
LT
1/*
2 * TCP over IPv6
1ab1457c 3 * Linux INET6 implementation
1da177e4
LT
4 *
5 * Authors:
1ab1457c 6 * Pedro Roque <roque@di.fc.ul.pt>
1da177e4 7 *
1ab1457c 8 * Based on:
1da177e4
LT
9 * linux/net/ipv4/tcp.c
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
12 *
13 * Fixes:
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allow both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 */
25
eb4dea58 26#include <linux/bottom_half.h>
1da177e4 27#include <linux/module.h>
1da177e4
LT
28#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
5a0e3ad6 41#include <linux/slab.h>
1da177e4
LT
42
43#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
5324a040 49#include <net/inet6_hashtables.h>
8129765a 50#include <net/inet6_connection_sock.h>
1da177e4
LT
51#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
1da177e4
LT
59#include <net/snmp.h>
60#include <net/dsfield.h>
6d6ee43e 61#include <net/timewait_sock.h>
18134bed 62#include <net/netdma.h>
3d58b5fa 63#include <net/inet_common.h>
6e5714ea 64#include <net/secure_seq.h>
d1a4c0b3 65#include <net/tcp_memcontrol.h>
076bb0c8 66#include <net/busy_poll.h>
1da177e4
LT
67
68#include <asm/uaccess.h>
69
70#include <linux/proc_fs.h>
71#include <linux/seq_file.h>
72
cfb6eeb4
YH
73#include <linux/crypto.h>
74#include <linux/scatterlist.h>
75
cfb6eeb4 76static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
6edafaaf
GJ
77static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
78 struct request_sock *req);
1da177e4
LT
79
80static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
1da177e4 81
3b401a81
SH
82static const struct inet_connection_sock_af_ops ipv6_mapped;
83static const struct inet_connection_sock_af_ops ipv6_specific;
a928630a 84#ifdef CONFIG_TCP_MD5SIG
b2e4b3de
SH
85static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
86static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
9501f972
YH
87#else
88static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 89 const struct in6_addr *addr)
9501f972
YH
90{
91 return NULL;
92}
a928630a 93#endif
1da177e4 94
fae6ef87
NC
95static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
96{
97 struct dst_entry *dst = skb_dst(skb);
98 const struct rt6_info *rt = (const struct rt6_info *)dst;
99
100 dst_hold(dst);
101 sk->sk_rx_dst = dst;
102 inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
103 if (rt->rt6i_node)
104 inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
105}
106
1da177e4
LT
107static void tcp_v6_hash(struct sock *sk)
108{
109 if (sk->sk_state != TCP_CLOSE) {
8292a17a 110 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
1da177e4
LT
111 tcp_prot.hash(sk);
112 return;
113 }
114 local_bh_disable();
9327f705 115 __inet6_hash(sk, NULL);
1da177e4
LT
116 local_bh_enable();
117 }
118}
119
cf533ea5 120static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
1da177e4 121{
0660e03f
ACM
122 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
123 ipv6_hdr(skb)->saddr.s6_addr32,
aa8223c7
ACM
124 tcp_hdr(skb)->dest,
125 tcp_hdr(skb)->source);
1da177e4
LT
126}
127
1ab1457c 128static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
1da177e4
LT
129 int addr_len)
130{
131 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
1ab1457c 132 struct inet_sock *inet = inet_sk(sk);
d83d8461 133 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4
LT
134 struct ipv6_pinfo *np = inet6_sk(sk);
135 struct tcp_sock *tp = tcp_sk(sk);
20c59de2 136 struct in6_addr *saddr = NULL, *final_p, final;
493f377d 137 struct rt6_info *rt;
4c9483b2 138 struct flowi6 fl6;
1da177e4
LT
139 struct dst_entry *dst;
140 int addr_type;
141 int err;
142
1ab1457c 143 if (addr_len < SIN6_LEN_RFC2133)
1da177e4
LT
144 return -EINVAL;
145
1ab1457c 146 if (usin->sin6_family != AF_INET6)
a02cec21 147 return -EAFNOSUPPORT;
1da177e4 148
4c9483b2 149 memset(&fl6, 0, sizeof(fl6));
1da177e4
LT
150
151 if (np->sndflow) {
4c9483b2
DM
152 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
153 IP6_ECN_flow_init(fl6.flowlabel);
154 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
1da177e4 155 struct ip6_flowlabel *flowlabel;
4c9483b2 156 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
1da177e4
LT
157 if (flowlabel == NULL)
158 return -EINVAL;
4e3fd7a0 159 usin->sin6_addr = flowlabel->dst;
1da177e4
LT
160 fl6_sock_release(flowlabel);
161 }
162 }
163
164 /*
1ab1457c
YH
165 * connect() to INADDR_ANY means loopback (BSD'ism).
166 */
167
168 if(ipv6_addr_any(&usin->sin6_addr))
169 usin->sin6_addr.s6_addr[15] = 0x1;
1da177e4
LT
170
171 addr_type = ipv6_addr_type(&usin->sin6_addr);
172
173 if(addr_type & IPV6_ADDR_MULTICAST)
174 return -ENETUNREACH;
175
176 if (addr_type&IPV6_ADDR_LINKLOCAL) {
177 if (addr_len >= sizeof(struct sockaddr_in6) &&
178 usin->sin6_scope_id) {
179 /* If interface is set while binding, indices
180 * must coincide.
181 */
182 if (sk->sk_bound_dev_if &&
183 sk->sk_bound_dev_if != usin->sin6_scope_id)
184 return -EINVAL;
185
186 sk->sk_bound_dev_if = usin->sin6_scope_id;
187 }
188
189 /* Connect to link-local address requires an interface */
190 if (!sk->sk_bound_dev_if)
191 return -EINVAL;
192 }
193
194 if (tp->rx_opt.ts_recent_stamp &&
efe4208f 195 !ipv6_addr_equal(&sk->sk_v6_daddr, &usin->sin6_addr)) {
1da177e4
LT
196 tp->rx_opt.ts_recent = 0;
197 tp->rx_opt.ts_recent_stamp = 0;
198 tp->write_seq = 0;
199 }
200
efe4208f 201 sk->sk_v6_daddr = usin->sin6_addr;
4c9483b2 202 np->flow_label = fl6.flowlabel;
1da177e4
LT
203
204 /*
205 * TCP over IPv4
206 */
207
208 if (addr_type == IPV6_ADDR_MAPPED) {
d83d8461 209 u32 exthdrlen = icsk->icsk_ext_hdr_len;
1da177e4
LT
210 struct sockaddr_in sin;
211
212 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
213
214 if (__ipv6_only_sock(sk))
215 return -ENETUNREACH;
216
217 sin.sin_family = AF_INET;
218 sin.sin_port = usin->sin6_port;
219 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
220
d83d8461 221 icsk->icsk_af_ops = &ipv6_mapped;
1da177e4 222 sk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
223#ifdef CONFIG_TCP_MD5SIG
224 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
225#endif
1da177e4
LT
226
227 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
228
229 if (err) {
d83d8461
ACM
230 icsk->icsk_ext_hdr_len = exthdrlen;
231 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 232 sk->sk_backlog_rcv = tcp_v6_do_rcv;
cfb6eeb4
YH
233#ifdef CONFIG_TCP_MD5SIG
234 tp->af_specific = &tcp_sock_ipv6_specific;
235#endif
1da177e4
LT
236 goto failure;
237 } else {
c720c7e8
ED
238 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
239 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
efe4208f 240 &sk->sk_v6_rcv_saddr);
1da177e4
LT
241 }
242
243 return err;
244 }
245
efe4208f
ED
246 if (!ipv6_addr_any(&sk->sk_v6_rcv_saddr))
247 saddr = &sk->sk_v6_rcv_saddr;
1da177e4 248
4c9483b2 249 fl6.flowi6_proto = IPPROTO_TCP;
efe4208f 250 fl6.daddr = sk->sk_v6_daddr;
4e3fd7a0 251 fl6.saddr = saddr ? *saddr : np->saddr;
4c9483b2
DM
252 fl6.flowi6_oif = sk->sk_bound_dev_if;
253 fl6.flowi6_mark = sk->sk_mark;
1958b856
DM
254 fl6.fl6_dport = usin->sin6_port;
255 fl6.fl6_sport = inet->inet_sport;
1da177e4 256
4c9483b2 257 final_p = fl6_update_dst(&fl6, np->opt, &final);
1da177e4 258
4c9483b2 259 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
beb8d13b 260
4c9483b2 261 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
68d0c6d3
DM
262 if (IS_ERR(dst)) {
263 err = PTR_ERR(dst);
1da177e4 264 goto failure;
14e50e57 265 }
1da177e4
LT
266
267 if (saddr == NULL) {
4c9483b2 268 saddr = &fl6.saddr;
efe4208f 269 sk->sk_v6_rcv_saddr = *saddr;
1da177e4
LT
270 }
271
272 /* set the source address */
4e3fd7a0 273 np->saddr = *saddr;
c720c7e8 274 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 275
f83ef8c0 276 sk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 277 __ip6_dst_store(sk, dst, NULL, NULL);
1da177e4 278
493f377d
DM
279 rt = (struct rt6_info *) dst;
280 if (tcp_death_row.sysctl_tw_recycle &&
281 !tp->rx_opt.ts_recent_stamp &&
efe4208f 282 ipv6_addr_equal(&rt->rt6i_dst.addr, &sk->sk_v6_daddr))
81166dd6 283 tcp_fetch_timewait_stamp(sk, dst);
493f377d 284
d83d8461 285 icsk->icsk_ext_hdr_len = 0;
1da177e4 286 if (np->opt)
d83d8461
ACM
287 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
288 np->opt->opt_nflen);
1da177e4
LT
289
290 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
291
c720c7e8 292 inet->inet_dport = usin->sin6_port;
1da177e4
LT
293
294 tcp_set_state(sk, TCP_SYN_SENT);
d8313f5c 295 err = inet6_hash_connect(&tcp_death_row, sk);
1da177e4
LT
296 if (err)
297 goto late_failure;
298
2b916477 299 if (!tp->write_seq && likely(!tp->repair))
1da177e4 300 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
efe4208f 301 sk->sk_v6_daddr.s6_addr32,
c720c7e8
ED
302 inet->inet_sport,
303 inet->inet_dport);
1da177e4
LT
304
305 err = tcp_connect(sk);
306 if (err)
307 goto late_failure;
308
309 return 0;
310
311late_failure:
312 tcp_set_state(sk, TCP_CLOSE);
313 __sk_dst_reset(sk);
314failure:
c720c7e8 315 inet->inet_dport = 0;
1da177e4
LT
316 sk->sk_route_caps = 0;
317 return err;
318}
319
563d34d0
ED
320static void tcp_v6_mtu_reduced(struct sock *sk)
321{
322 struct dst_entry *dst;
323
324 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
325 return;
326
327 dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
328 if (!dst)
329 return;
330
331 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
332 tcp_sync_mss(sk, dst_mtu(dst));
333 tcp_simple_retransmit(sk);
334 }
335}
336
1da177e4 337static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
d5fdd6ba 338 u8 type, u8 code, int offset, __be32 info)
1da177e4 339{
b71d1d42 340 const struct ipv6hdr *hdr = (const struct ipv6hdr*)skb->data;
505cbfc5 341 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
1da177e4
LT
342 struct ipv6_pinfo *np;
343 struct sock *sk;
344 int err;
1ab1457c 345 struct tcp_sock *tp;
1da177e4 346 __u32 seq;
ca12a1a4 347 struct net *net = dev_net(skb->dev);
1da177e4 348
ca12a1a4 349 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
d86e0dac 350 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
1da177e4
LT
351
352 if (sk == NULL) {
e41b5368
DL
353 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
354 ICMP6_MIB_INERRORS);
1da177e4
LT
355 return;
356 }
357
358 if (sk->sk_state == TCP_TIME_WAIT) {
9469c7b4 359 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
360 return;
361 }
362
363 bh_lock_sock(sk);
563d34d0 364 if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
de0744af 365 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
1da177e4
LT
366
367 if (sk->sk_state == TCP_CLOSE)
368 goto out;
369
e802af9c
SH
370 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
371 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
372 goto out;
373 }
374
1da177e4 375 tp = tcp_sk(sk);
1ab1457c 376 seq = ntohl(th->seq);
1da177e4
LT
377 if (sk->sk_state != TCP_LISTEN &&
378 !between(seq, tp->snd_una, tp->snd_nxt)) {
de0744af 379 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
380 goto out;
381 }
382
383 np = inet6_sk(sk);
384
ec18d9a2
DM
385 if (type == NDISC_REDIRECT) {
386 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
387
1ed5c48f 388 if (dst)
6700c270 389 dst->ops->redirect(dst, sk, skb);
50a75a89 390 goto out;
ec18d9a2
DM
391 }
392
1da177e4 393 if (type == ICMPV6_PKT_TOOBIG) {
0d4f0608
ED
394 /* We are not interested in TCP_LISTEN and open_requests
395 * (SYN-ACKs send out by Linux are always <576bytes so
396 * they should go through unfragmented).
397 */
398 if (sk->sk_state == TCP_LISTEN)
399 goto out;
400
563d34d0
ED
401 tp->mtu_info = ntohl(info);
402 if (!sock_owned_by_user(sk))
403 tcp_v6_mtu_reduced(sk);
d013ef2a
JA
404 else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
405 &tp->tsq_flags))
406 sock_hold(sk);
1da177e4
LT
407 goto out;
408 }
409
410 icmpv6_err_convert(type, code, &err);
411
60236fdd 412 /* Might be for an request_sock */
1da177e4 413 switch (sk->sk_state) {
60236fdd 414 struct request_sock *req, **prev;
1da177e4
LT
415 case TCP_LISTEN:
416 if (sock_owned_by_user(sk))
417 goto out;
418
8129765a
ACM
419 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
420 &hdr->saddr, inet6_iif(skb));
1da177e4
LT
421 if (!req)
422 goto out;
423
424 /* ICMPs are not backlogged, hence we cannot get
425 * an established socket here.
426 */
547b792c 427 WARN_ON(req->sk != NULL);
1da177e4 428
2e6599cb 429 if (seq != tcp_rsk(req)->snt_isn) {
de0744af 430 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
1da177e4
LT
431 goto out;
432 }
433
463c84b9 434 inet_csk_reqsk_queue_drop(sk, req, prev);
5f1e942c 435 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
436 goto out;
437
438 case TCP_SYN_SENT:
439 case TCP_SYN_RECV: /* Cannot happen.
1ab1457c 440 It can, it SYNs are crossed. --ANK */
1da177e4 441 if (!sock_owned_by_user(sk)) {
1da177e4
LT
442 sk->sk_err = err;
443 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
444
445 tcp_done(sk);
446 } else
447 sk->sk_err_soft = err;
448 goto out;
449 }
450
451 if (!sock_owned_by_user(sk) && np->recverr) {
452 sk->sk_err = err;
453 sk->sk_error_report(sk);
454 } else
455 sk->sk_err_soft = err;
456
457out:
458 bh_unlock_sock(sk);
459 sock_put(sk);
460}
461
462
9f10d3f6
NC
463static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
464 struct flowi6 *fl6,
3840a06e 465 struct request_sock *req,
fff32699 466 u16 queue_mapping)
1da177e4 467{
634fb979 468 struct inet_request_sock *ireq = inet_rsk(req);
1da177e4
LT
469 struct ipv6_pinfo *np = inet6_sk(sk);
470 struct sk_buff * skb;
9494218f 471 int err = -ENOMEM;
1da177e4 472
9f10d3f6
NC
473 /* First, grab a route. */
474 if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
fd80eb94 475 goto done;
9494218f 476
1a2c6181 477 skb = tcp_make_synack(sk, dst, req, NULL);
9494218f 478
1da177e4 479 if (skb) {
634fb979
ED
480 __tcp_v6_send_check(skb, &ireq->ir_v6_loc_addr,
481 &ireq->ir_v6_rmt_addr);
1da177e4 482
634fb979 483 fl6->daddr = ireq->ir_v6_rmt_addr;
fff32699 484 skb_set_queue_mapping(skb, queue_mapping);
43264e0b 485 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
b9df3cb8 486 err = net_xmit_eval(err);
1da177e4
LT
487 }
488
489done:
1da177e4
LT
490 return err;
491}
492
1a2c6181 493static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req)
72659ecc 494{
9f10d3f6 495 struct flowi6 fl6;
e6c022a4 496 int res;
9f10d3f6 497
1a2c6181 498 res = tcp_v6_send_synack(sk, NULL, &fl6, req, 0);
e6c022a4
ED
499 if (!res)
500 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
501 return res;
72659ecc
OP
502}
503
60236fdd 504static void tcp_v6_reqsk_destructor(struct request_sock *req)
1da177e4 505{
634fb979 506 kfree_skb(inet_rsk(req)->pktopts);
1da177e4
LT
507}
508
cfb6eeb4
YH
509#ifdef CONFIG_TCP_MD5SIG
510static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
b71d1d42 511 const struct in6_addr *addr)
cfb6eeb4 512{
a915da9b 513 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
cfb6eeb4
YH
514}
515
516static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
517 struct sock *addr_sk)
518{
efe4208f 519 return tcp_v6_md5_do_lookup(sk, &addr_sk->sk_v6_daddr);
cfb6eeb4
YH
520}
521
522static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
523 struct request_sock *req)
524{
634fb979 525 return tcp_v6_md5_do_lookup(sk, &inet_rsk(req)->ir_v6_rmt_addr);
cfb6eeb4
YH
526}
527
cfb6eeb4
YH
528static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
529 int optlen)
530{
531 struct tcp_md5sig cmd;
532 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
cfb6eeb4
YH
533
534 if (optlen < sizeof(cmd))
535 return -EINVAL;
536
537 if (copy_from_user(&cmd, optval, sizeof(cmd)))
538 return -EFAULT;
539
540 if (sin6->sin6_family != AF_INET6)
541 return -EINVAL;
542
543 if (!cmd.tcpm_keylen) {
e773e4fa 544 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
a915da9b
ED
545 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
546 AF_INET);
547 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
548 AF_INET6);
cfb6eeb4
YH
549 }
550
551 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
552 return -EINVAL;
553
a915da9b
ED
554 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
555 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
556 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4 557
a915da9b
ED
558 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
559 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
cfb6eeb4
YH
560}
561
49a72dfb 562static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
b71d1d42
ED
563 const struct in6_addr *daddr,
564 const struct in6_addr *saddr, int nbytes)
cfb6eeb4 565{
cfb6eeb4 566 struct tcp6_pseudohdr *bp;
49a72dfb 567 struct scatterlist sg;
8d26d76d 568
cfb6eeb4 569 bp = &hp->md5_blk.ip6;
cfb6eeb4 570 /* 1. TCP pseudo-header (RFC2460) */
4e3fd7a0
AD
571 bp->saddr = *saddr;
572 bp->daddr = *daddr;
49a72dfb 573 bp->protocol = cpu_to_be32(IPPROTO_TCP);
00b1304c 574 bp->len = cpu_to_be32(nbytes);
cfb6eeb4 575
49a72dfb
AL
576 sg_init_one(&sg, bp, sizeof(*bp));
577 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
578}
c7da57a1 579
49a72dfb 580static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
b71d1d42 581 const struct in6_addr *daddr, struct in6_addr *saddr,
318cf7aa 582 const struct tcphdr *th)
49a72dfb
AL
583{
584 struct tcp_md5sig_pool *hp;
585 struct hash_desc *desc;
586
587 hp = tcp_get_md5sig_pool();
588 if (!hp)
589 goto clear_hash_noput;
590 desc = &hp->md5_desc;
591
592 if (crypto_hash_init(desc))
593 goto clear_hash;
594 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
595 goto clear_hash;
596 if (tcp_md5_hash_header(hp, th))
597 goto clear_hash;
598 if (tcp_md5_hash_key(hp, key))
599 goto clear_hash;
600 if (crypto_hash_final(desc, md5_hash))
cfb6eeb4 601 goto clear_hash;
cfb6eeb4 602
cfb6eeb4 603 tcp_put_md5sig_pool();
cfb6eeb4 604 return 0;
49a72dfb 605
cfb6eeb4
YH
606clear_hash:
607 tcp_put_md5sig_pool();
608clear_hash_noput:
609 memset(md5_hash, 0, 16);
49a72dfb 610 return 1;
cfb6eeb4
YH
611}
612
49a72dfb 613static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
318cf7aa
ED
614 const struct sock *sk,
615 const struct request_sock *req,
616 const struct sk_buff *skb)
cfb6eeb4 617{
b71d1d42 618 const struct in6_addr *saddr, *daddr;
49a72dfb
AL
619 struct tcp_md5sig_pool *hp;
620 struct hash_desc *desc;
318cf7aa 621 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4
YH
622
623 if (sk) {
624 saddr = &inet6_sk(sk)->saddr;
efe4208f 625 daddr = &sk->sk_v6_daddr;
49a72dfb 626 } else if (req) {
634fb979
ED
627 saddr = &inet_rsk(req)->ir_v6_loc_addr;
628 daddr = &inet_rsk(req)->ir_v6_rmt_addr;
49a72dfb 629 } else {
b71d1d42 630 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
49a72dfb
AL
631 saddr = &ip6h->saddr;
632 daddr = &ip6h->daddr;
cfb6eeb4 633 }
49a72dfb
AL
634
635 hp = tcp_get_md5sig_pool();
636 if (!hp)
637 goto clear_hash_noput;
638 desc = &hp->md5_desc;
639
640 if (crypto_hash_init(desc))
641 goto clear_hash;
642
643 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
644 goto clear_hash;
645 if (tcp_md5_hash_header(hp, th))
646 goto clear_hash;
647 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
648 goto clear_hash;
649 if (tcp_md5_hash_key(hp, key))
650 goto clear_hash;
651 if (crypto_hash_final(desc, md5_hash))
652 goto clear_hash;
653
654 tcp_put_md5sig_pool();
655 return 0;
656
657clear_hash:
658 tcp_put_md5sig_pool();
659clear_hash_noput:
660 memset(md5_hash, 0, 16);
661 return 1;
cfb6eeb4
YH
662}
663
318cf7aa 664static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
cfb6eeb4 665{
cf533ea5 666 const __u8 *hash_location = NULL;
cfb6eeb4 667 struct tcp_md5sig_key *hash_expected;
b71d1d42 668 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
318cf7aa 669 const struct tcphdr *th = tcp_hdr(skb);
cfb6eeb4 670 int genhash;
cfb6eeb4
YH
671 u8 newhash[16];
672
673 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
7d5d5525 674 hash_location = tcp_parse_md5sig_option(th);
cfb6eeb4 675
785957d3
DM
676 /* We've parsed the options - do we have a hash? */
677 if (!hash_expected && !hash_location)
678 return 0;
679
680 if (hash_expected && !hash_location) {
681 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
cfb6eeb4
YH
682 return 1;
683 }
684
785957d3
DM
685 if (!hash_expected && hash_location) {
686 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
cfb6eeb4
YH
687 return 1;
688 }
689
690 /* check the signature */
49a72dfb
AL
691 genhash = tcp_v6_md5_hash_skb(newhash,
692 hash_expected,
693 NULL, NULL, skb);
694
cfb6eeb4 695 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
e87cc472
JP
696 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
697 genhash ? "failed" : "mismatch",
698 &ip6h->saddr, ntohs(th->source),
699 &ip6h->daddr, ntohs(th->dest));
cfb6eeb4
YH
700 return 1;
701 }
702 return 0;
703}
704#endif
705
c6aefafb 706struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
1da177e4 707 .family = AF_INET6,
2e6599cb 708 .obj_size = sizeof(struct tcp6_request_sock),
72659ecc 709 .rtx_syn_ack = tcp_v6_rtx_synack,
60236fdd
ACM
710 .send_ack = tcp_v6_reqsk_send_ack,
711 .destructor = tcp_v6_reqsk_destructor,
72659ecc
OP
712 .send_reset = tcp_v6_send_reset,
713 .syn_ack_timeout = tcp_syn_ack_timeout,
1da177e4
LT
714};
715
cfb6eeb4 716#ifdef CONFIG_TCP_MD5SIG
b2e4b3de 717static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
cfb6eeb4 718 .md5_lookup = tcp_v6_reqsk_md5_lookup,
e3afe7b7 719 .calc_md5_hash = tcp_v6_md5_hash_skb,
cfb6eeb4 720};
b6332e6c 721#endif
cfb6eeb4 722
626e264d 723static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
ee684b6f
AV
724 u32 tsval, u32 tsecr,
725 struct tcp_md5sig_key *key, int rst, u8 tclass)
1da177e4 726{
cf533ea5
ED
727 const struct tcphdr *th = tcp_hdr(skb);
728 struct tcphdr *t1;
1da177e4 729 struct sk_buff *buff;
4c9483b2 730 struct flowi6 fl6;
adf30907 731 struct net *net = dev_net(skb_dst(skb)->dev);
e5047992 732 struct sock *ctl_sk = net->ipv6.tcp_sk;
77c676da 733 unsigned int tot_len = sizeof(struct tcphdr);
adf30907 734 struct dst_entry *dst;
81ada62d 735 __be32 *topt;
1da177e4 736
ee684b6f 737 if (tsecr)
626e264d 738 tot_len += TCPOLEN_TSTAMP_ALIGNED;
cfb6eeb4 739#ifdef CONFIG_TCP_MD5SIG
cfb6eeb4
YH
740 if (key)
741 tot_len += TCPOLEN_MD5SIG_ALIGNED;
742#endif
743
cfb6eeb4 744 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1da177e4 745 GFP_ATOMIC);
1ab1457c
YH
746 if (buff == NULL)
747 return;
1da177e4 748
cfb6eeb4 749 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1da177e4 750
cfb6eeb4 751 t1 = (struct tcphdr *) skb_push(buff, tot_len);
6651ffc8 752 skb_reset_transport_header(buff);
1da177e4
LT
753
754 /* Swap the send and the receive. */
755 memset(t1, 0, sizeof(*t1));
756 t1->dest = th->source;
757 t1->source = th->dest;
cfb6eeb4 758 t1->doff = tot_len / 4;
626e264d
IJ
759 t1->seq = htonl(seq);
760 t1->ack_seq = htonl(ack);
761 t1->ack = !rst || !th->ack;
762 t1->rst = rst;
763 t1->window = htons(win);
1da177e4 764
81ada62d
IJ
765 topt = (__be32 *)(t1 + 1);
766
ee684b6f 767 if (tsecr) {
626e264d
IJ
768 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
769 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
ee684b6f
AV
770 *topt++ = htonl(tsval);
771 *topt++ = htonl(tsecr);
626e264d
IJ
772 }
773
cfb6eeb4
YH
774#ifdef CONFIG_TCP_MD5SIG
775 if (key) {
81ada62d
IJ
776 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
777 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
778 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
78e645cb
IJ
779 &ipv6_hdr(skb)->saddr,
780 &ipv6_hdr(skb)->daddr, t1);
cfb6eeb4
YH
781 }
782#endif
783
4c9483b2 784 memset(&fl6, 0, sizeof(fl6));
4e3fd7a0
AD
785 fl6.daddr = ipv6_hdr(skb)->saddr;
786 fl6.saddr = ipv6_hdr(skb)->daddr;
1da177e4 787
e5700aff
DM
788 buff->ip_summed = CHECKSUM_PARTIAL;
789 buff->csum = 0;
790
4c9483b2 791 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
1da177e4 792
4c9483b2 793 fl6.flowi6_proto = IPPROTO_TCP;
4c675258
AK
794 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
795 fl6.flowi6_oif = inet6_iif(skb);
1958b856
DM
796 fl6.fl6_dport = t1->dest;
797 fl6.fl6_sport = t1->source;
4c9483b2 798 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
1da177e4 799
c20121ae
DL
800 /* Pass a socket to ip6_dst_lookup either it is for RST
801 * Underlying function will use this to retrieve the network
802 * namespace
803 */
4c9483b2 804 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL, false);
68d0c6d3
DM
805 if (!IS_ERR(dst)) {
806 skb_dst_set(buff, dst);
b903d324 807 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
68d0c6d3
DM
808 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
809 if (rst)
810 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
811 return;
1da177e4
LT
812 }
813
814 kfree_skb(buff);
815}
816
626e264d 817static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1da177e4 818{
cf533ea5 819 const struct tcphdr *th = tcp_hdr(skb);
626e264d 820 u32 seq = 0, ack_seq = 0;
fa3e5b4e 821 struct tcp_md5sig_key *key = NULL;
658ddaaf
SL
822#ifdef CONFIG_TCP_MD5SIG
823 const __u8 *hash_location = NULL;
824 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
825 unsigned char newhash[16];
826 int genhash;
827 struct sock *sk1 = NULL;
828#endif
1da177e4 829
626e264d 830 if (th->rst)
1da177e4
LT
831 return;
832
626e264d
IJ
833 if (!ipv6_unicast_destination(skb))
834 return;
1da177e4 835
cfb6eeb4 836#ifdef CONFIG_TCP_MD5SIG
658ddaaf
SL
837 hash_location = tcp_parse_md5sig_option(th);
838 if (!sk && hash_location) {
839 /*
840 * active side is lost. Try to find listening socket through
841 * source port, and then find md5 key through listening socket.
842 * we are not loose security here:
843 * Incoming packet is checked with md5 hash with finding key,
844 * no RST generated if md5 hash doesn't match.
845 */
846 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
5ba24953
TH
847 &tcp_hashinfo, &ipv6h->saddr,
848 th->source, &ipv6h->daddr,
658ddaaf
SL
849 ntohs(th->source), inet6_iif(skb));
850 if (!sk1)
851 return;
852
853 rcu_read_lock();
854 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
855 if (!key)
856 goto release_sk1;
857
858 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
859 if (genhash || memcmp(hash_location, newhash, 16) != 0)
860 goto release_sk1;
861 } else {
862 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
863 }
cfb6eeb4
YH
864#endif
865
626e264d
IJ
866 if (th->ack)
867 seq = ntohl(th->ack_seq);
868 else
869 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
870 (th->doff << 2);
1da177e4 871
ee684b6f 872 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, key, 1, 0);
658ddaaf
SL
873
874#ifdef CONFIG_TCP_MD5SIG
875release_sk1:
876 if (sk1) {
877 rcu_read_unlock();
878 sock_put(sk1);
879 }
880#endif
626e264d 881}
1da177e4 882
ee684b6f
AV
883static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
884 u32 win, u32 tsval, u32 tsecr,
b903d324 885 struct tcp_md5sig_key *key, u8 tclass)
626e264d 886{
ee684b6f 887 tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, key, 0, tclass);
1da177e4
LT
888}
889
890static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
891{
8feaf0c0 892 struct inet_timewait_sock *tw = inet_twsk(sk);
cfb6eeb4 893 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1da177e4 894
9501f972 895 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
8feaf0c0 896 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
ee684b6f 897 tcp_time_stamp + tcptw->tw_ts_offset,
b903d324
ED
898 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
899 tw->tw_tclass);
1da177e4 900
8feaf0c0 901 inet_twsk_put(tw);
1da177e4
LT
902}
903
6edafaaf
GJ
904static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
905 struct request_sock *req)
1da177e4 906{
ee684b6f
AV
907 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1,
908 req->rcv_wnd, tcp_time_stamp, req->ts_recent,
b903d324 909 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr), 0);
1da177e4
LT
910}
911
912
913static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
914{
60236fdd 915 struct request_sock *req, **prev;
aa8223c7 916 const struct tcphdr *th = tcp_hdr(skb);
1da177e4
LT
917 struct sock *nsk;
918
919 /* Find possible connection requests. */
8129765a 920 req = inet6_csk_search_req(sk, &prev, th->source,
0660e03f
ACM
921 &ipv6_hdr(skb)->saddr,
922 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1da177e4 923 if (req)
8336886f 924 return tcp_check_req(sk, skb, req, prev, false);
1da177e4 925
3b1e0a65 926 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
d86e0dac
PE
927 &ipv6_hdr(skb)->saddr, th->source,
928 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1da177e4
LT
929
930 if (nsk) {
931 if (nsk->sk_state != TCP_TIME_WAIT) {
932 bh_lock_sock(nsk);
933 return nsk;
934 }
9469c7b4 935 inet_twsk_put(inet_twsk(nsk));
1da177e4
LT
936 return NULL;
937 }
938
c6aefafb 939#ifdef CONFIG_SYN_COOKIES
af9b4738 940 if (!th->syn)
c6aefafb 941 sk = cookie_v6_check(sk, skb);
1da177e4
LT
942#endif
943 return sk;
944}
945
1da177e4
LT
946/* FIXME: this is substantially similar to the ipv4 code.
947 * Can some kind of merge be done? -- erics
948 */
949static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
950{
e6b4d113
WAS
951 struct tcp_options_received tmp_opt;
952 struct request_sock *req;
634fb979 953 struct inet_request_sock *ireq;
1da177e4 954 struct ipv6_pinfo *np = inet6_sk(sk);
1da177e4 955 struct tcp_sock *tp = tcp_sk(sk);
e6b4d113 956 __u32 isn = TCP_SKB_CB(skb)->when;
493f377d 957 struct dst_entry *dst = NULL;
3840a06e 958 struct flowi6 fl6;
a2a385d6 959 bool want_cookie = false;
1da177e4
LT
960
961 if (skb->protocol == htons(ETH_P_IP))
962 return tcp_v4_conn_request(sk, skb);
963
964 if (!ipv6_unicast_destination(skb))
1ab1457c 965 goto drop;
1da177e4 966
5ad37d5d
HFS
967 if ((sysctl_tcp_syncookies == 2 ||
968 inet_csk_reqsk_queue_is_full(sk)) && !isn) {
946cedcc
ED
969 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
970 if (!want_cookie)
971 goto drop;
1da177e4
LT
972 }
973
5f1e942c
VS
974 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
975 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1da177e4 976 goto drop;
5f1e942c 977 }
1da177e4 978
ca304b61 979 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1da177e4
LT
980 if (req == NULL)
981 goto drop;
982
cfb6eeb4
YH
983#ifdef CONFIG_TCP_MD5SIG
984 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
985#endif
986
1da177e4
LT
987 tcp_clear_options(&tmp_opt);
988 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
989 tmp_opt.user_mss = tp->rx_opt.user_mss;
1a2c6181 990 tcp_parse_options(skb, &tmp_opt, 0, NULL);
1da177e4 991
4dfc2817 992 if (want_cookie && !tmp_opt.saw_tstamp)
c6aefafb 993 tcp_clear_options(&tmp_opt);
c6aefafb 994
1da177e4
LT
995 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
996 tcp_openreq_init(req, &tmp_opt, skb);
997
634fb979
ED
998 ireq = inet_rsk(req);
999 ireq->ir_v6_rmt_addr = ipv6_hdr(skb)->saddr;
1000 ireq->ir_v6_loc_addr = ipv6_hdr(skb)->daddr;
172d69e6 1001 if (!want_cookie || tmp_opt.tstamp_ok)
5d134f1c 1002 TCP_ECN_create_request(req, skb, sock_net(sk));
c6aefafb 1003
634fb979 1004 ireq->ir_iif = sk->sk_bound_dev_if;
4d0fe50c
ED
1005
1006 /* So that link locals have meaning */
1007 if (!sk->sk_bound_dev_if &&
634fb979
ED
1008 ipv6_addr_type(&ireq->ir_v6_rmt_addr) & IPV6_ADDR_LINKLOCAL)
1009 ireq->ir_iif = inet6_iif(skb);
4d0fe50c 1010
2bbdf389 1011 if (!isn) {
c6aefafb
GG
1012 if (ipv6_opt_accepted(sk, skb) ||
1013 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1014 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1015 atomic_inc(&skb->users);
634fb979 1016 ireq->pktopts = skb;
c6aefafb 1017 }
493f377d
DM
1018
1019 if (want_cookie) {
2bbdf389
FW
1020 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1021 req->cookie_ts = tmp_opt.tstamp_ok;
493f377d
DM
1022 goto have_isn;
1023 }
1024
1025 /* VJ's idea. We save last timestamp seen
1026 * from the destination in peer table, when entering
1027 * state TIME-WAIT, and check against it before
1028 * accepting new connection request.
1029 *
1030 * If "isn" is not zero, this request hit alive
1031 * timewait bucket, so that all the necessary checks
1032 * are made in the function processing timewait state.
1033 */
1034 if (tmp_opt.saw_tstamp &&
1035 tcp_death_row.sysctl_tw_recycle &&
81166dd6
DM
1036 (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1037 if (!tcp_peer_is_proven(req, dst, true)) {
493f377d
DM
1038 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1039 goto drop_and_release;
1040 }
1041 }
1042 /* Kill the following clause, if you dislike this way. */
1043 else if (!sysctl_tcp_syncookies &&
1044 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1045 (sysctl_max_syn_backlog >> 2)) &&
81166dd6 1046 !tcp_peer_is_proven(req, dst, false)) {
493f377d
DM
1047 /* Without syncookies last quarter of
1048 * backlog is filled with destinations,
1049 * proven to be alive.
1050 * It means that we continue to communicate
1051 * to destinations, already remembered
1052 * to the moment of synflood.
1053 */
1054 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
634fb979 1055 &ireq->ir_v6_rmt_addr, ntohs(tcp_hdr(skb)->source));
493f377d 1056 goto drop_and_release;
2bbdf389 1057 }
493f377d
DM
1058
1059 isn = tcp_v6_init_sequence(skb);
c6aefafb 1060 }
493f377d 1061have_isn:
2e6599cb 1062 tcp_rsk(req)->snt_isn = isn;
1da177e4 1063
437c5b53
NC
1064 if (security_inet_conn_request(sk, skb, req))
1065 goto drop_and_release;
4237c75c 1066
9f10d3f6 1067 if (tcp_v6_send_synack(sk, dst, &fl6, req,
fff32699 1068 skb_get_queue_mapping(skb)) ||
4957faad 1069 want_cookie)
e6b4d113 1070 goto drop_and_free;
1da177e4 1071
016818d0 1072 tcp_rsk(req)->snt_synack = tcp_time_stamp;
8336886f 1073 tcp_rsk(req)->listener = NULL;
e6b4d113
WAS
1074 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1075 return 0;
1da177e4 1076
493f377d
DM
1077drop_and_release:
1078 dst_release(dst);
e6b4d113
WAS
1079drop_and_free:
1080 reqsk_free(req);
1da177e4 1081drop:
5f1e942c 1082 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1083 return 0; /* don't send reset */
1084}
1085
1086static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
60236fdd 1087 struct request_sock *req,
1da177e4
LT
1088 struct dst_entry *dst)
1089{
634fb979 1090 struct inet_request_sock *ireq;
1da177e4
LT
1091 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1092 struct tcp6_sock *newtcp6sk;
1093 struct inet_sock *newinet;
1094 struct tcp_sock *newtp;
1095 struct sock *newsk;
cfb6eeb4
YH
1096#ifdef CONFIG_TCP_MD5SIG
1097 struct tcp_md5sig_key *key;
1098#endif
3840a06e 1099 struct flowi6 fl6;
1da177e4
LT
1100
1101 if (skb->protocol == htons(ETH_P_IP)) {
1102 /*
1103 * v6 mapped
1104 */
1105
1106 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1107
1ab1457c 1108 if (newsk == NULL)
1da177e4
LT
1109 return NULL;
1110
1111 newtcp6sk = (struct tcp6_sock *)newsk;
1112 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1113
1114 newinet = inet_sk(newsk);
1115 newnp = inet6_sk(newsk);
1116 newtp = tcp_sk(newsk);
1117
1118 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1119
efe4208f 1120 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newsk->sk_v6_daddr);
1da177e4 1121
c720c7e8 1122 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1da177e4 1123
efe4208f 1124 newsk->sk_v6_rcv_saddr = newnp->saddr;
1da177e4 1125
8292a17a 1126 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1da177e4 1127 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
cfb6eeb4
YH
1128#ifdef CONFIG_TCP_MD5SIG
1129 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1130#endif
1131
676a1184
YZ
1132 newnp->ipv6_ac_list = NULL;
1133 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1134 newnp->pktoptions = NULL;
1135 newnp->opt = NULL;
505cbfc5 1136 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1137 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
e7219858 1138 newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4 1139
e6848976
ACM
1140 /*
1141 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1142 * here, tcp_create_openreq_child now does this for us, see the comment in
1143 * that function for the gory details. -acme
1da177e4 1144 */
1da177e4
LT
1145
1146 /* It is tricky place. Until this moment IPv4 tcp
8292a17a 1147 worked with IPv6 icsk.icsk_af_ops.
1da177e4
LT
1148 Sync it now.
1149 */
d83d8461 1150 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1da177e4
LT
1151
1152 return newsk;
1153 }
1154
634fb979 1155 ireq = inet_rsk(req);
1da177e4
LT
1156
1157 if (sk_acceptq_is_full(sk))
1158 goto out_overflow;
1159
493f377d 1160 if (!dst) {
3840a06e 1161 dst = inet6_csk_route_req(sk, &fl6, req);
493f377d 1162 if (!dst)
1da177e4 1163 goto out;
1ab1457c 1164 }
1da177e4
LT
1165
1166 newsk = tcp_create_openreq_child(sk, req, skb);
1167 if (newsk == NULL)
093d2823 1168 goto out_nonewsk;
1da177e4 1169
e6848976
ACM
1170 /*
1171 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1172 * count here, tcp_create_openreq_child now does this for us, see the
1173 * comment in that function for the gory details. -acme
1174 */
1da177e4 1175
59eed279 1176 newsk->sk_gso_type = SKB_GSO_TCPV6;
8e1ef0a9 1177 __ip6_dst_store(newsk, dst, NULL, NULL);
fae6ef87 1178 inet6_sk_rx_dst_set(newsk, skb);
1da177e4
LT
1179
1180 newtcp6sk = (struct tcp6_sock *)newsk;
1181 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1182
1183 newtp = tcp_sk(newsk);
1184 newinet = inet_sk(newsk);
1185 newnp = inet6_sk(newsk);
1186
1187 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1188
634fb979
ED
1189 newsk->sk_v6_daddr = ireq->ir_v6_rmt_addr;
1190 newnp->saddr = ireq->ir_v6_loc_addr;
1191 newsk->sk_v6_rcv_saddr = ireq->ir_v6_loc_addr;
1192 newsk->sk_bound_dev_if = ireq->ir_iif;
1da177e4 1193
1ab1457c 1194 /* Now IPv6 options...
1da177e4
LT
1195
1196 First: no IPv4 options.
1197 */
f6d8bd05 1198 newinet->inet_opt = NULL;
676a1184 1199 newnp->ipv6_ac_list = NULL;
d35690be 1200 newnp->ipv6_fl_list = NULL;
1da177e4
LT
1201
1202 /* Clone RX bits */
1203 newnp->rxopt.all = np->rxopt.all;
1204
1205 /* Clone pktoptions received with SYN */
1206 newnp->pktoptions = NULL;
634fb979
ED
1207 if (ireq->pktopts != NULL) {
1208 newnp->pktoptions = skb_clone(ireq->pktopts,
99a1dec7 1209 sk_gfp_atomic(sk, GFP_ATOMIC));
634fb979
ED
1210 consume_skb(ireq->pktopts);
1211 ireq->pktopts = NULL;
1da177e4
LT
1212 if (newnp->pktoptions)
1213 skb_set_owner_r(newnp->pktoptions, newsk);
1214 }
1215 newnp->opt = NULL;
505cbfc5 1216 newnp->mcast_oif = inet6_iif(skb);
0660e03f 1217 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
e7219858 1218 newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1da177e4
LT
1219
1220 /* Clone native IPv6 options from listening socket (if any)
1221
1222 Yes, keeping reference count would be much more clever,
1223 but we make one more one thing there: reattach optmem
1224 to newsk.
1225 */
43264e0b
RL
1226 if (np->opt)
1227 newnp->opt = ipv6_dup_options(newsk, np->opt);
1da177e4 1228
d83d8461 1229 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1da177e4 1230 if (newnp->opt)
d83d8461
ACM
1231 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1232 newnp->opt->opt_flen);
1da177e4 1233
5d424d5a 1234 tcp_mtup_init(newsk);
1da177e4 1235 tcp_sync_mss(newsk, dst_mtu(dst));
0dbaee3b 1236 newtp->advmss = dst_metric_advmss(dst);
d135c522
NC
1237 if (tcp_sk(sk)->rx_opt.user_mss &&
1238 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1239 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1240
1da177e4
LT
1241 tcp_initialize_rcv_mss(newsk);
1242
c720c7e8
ED
1243 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1244 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1da177e4 1245
cfb6eeb4
YH
1246#ifdef CONFIG_TCP_MD5SIG
1247 /* Copy over the MD5 key from the original socket */
efe4208f 1248 if ((key = tcp_v6_md5_do_lookup(sk, &newsk->sk_v6_daddr)) != NULL) {
cfb6eeb4
YH
1249 /* We're using one, so create a matching key
1250 * on the newsk structure. If we fail to get
1251 * memory, then we end up not copying the key
1252 * across. Shucks.
1253 */
efe4208f 1254 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newsk->sk_v6_daddr,
99a1dec7
MG
1255 AF_INET6, key->key, key->keylen,
1256 sk_gfp_atomic(sk, GFP_ATOMIC));
cfb6eeb4
YH
1257 }
1258#endif
1259
093d2823 1260 if (__inet_inherit_port(sk, newsk) < 0) {
e337e24d
CP
1261 inet_csk_prepare_forced_close(newsk);
1262 tcp_done(newsk);
093d2823
BS
1263 goto out;
1264 }
9327f705 1265 __inet6_hash(newsk, NULL);
1da177e4
LT
1266
1267 return newsk;
1268
1269out_overflow:
de0744af 1270 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
093d2823 1271out_nonewsk:
1da177e4 1272 dst_release(dst);
093d2823
BS
1273out:
1274 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1da177e4
LT
1275 return NULL;
1276}
1277
b51655b9 1278static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1da177e4 1279{
84fa7933 1280 if (skb->ip_summed == CHECKSUM_COMPLETE) {
684f2176 1281 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
0660e03f 1282 &ipv6_hdr(skb)->daddr, skb->csum)) {
fb286bb2 1283 skb->ip_summed = CHECKSUM_UNNECESSARY;
1da177e4 1284 return 0;
fb286bb2 1285 }
1da177e4 1286 }
fb286bb2 1287
684f2176 1288 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
0660e03f
ACM
1289 &ipv6_hdr(skb)->saddr,
1290 &ipv6_hdr(skb)->daddr, 0));
fb286bb2 1291
1da177e4 1292 if (skb->len <= 76) {
fb286bb2 1293 return __skb_checksum_complete(skb);
1da177e4
LT
1294 }
1295 return 0;
1296}
1297
1298/* The socket must have it's spinlock held when we get
1299 * here.
1300 *
1301 * We have a potential double-lock case here, so even when
1302 * doing backlog processing we use the BH locking scheme.
1303 * This is because we cannot sleep with the original spinlock
1304 * held.
1305 */
1306static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1307{
1308 struct ipv6_pinfo *np = inet6_sk(sk);
1309 struct tcp_sock *tp;
1310 struct sk_buff *opt_skb = NULL;
1311
1312 /* Imagine: socket is IPv6. IPv4 packet arrives,
1313 goes to IPv4 receive handler and backlogged.
1314 From backlog it always goes here. Kerboom...
1315 Fortunately, tcp_rcv_established and rcv_established
1316 handle them correctly, but it is not case with
1317 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1318 */
1319
1320 if (skb->protocol == htons(ETH_P_IP))
1321 return tcp_v4_do_rcv(sk, skb);
1322
cfb6eeb4
YH
1323#ifdef CONFIG_TCP_MD5SIG
1324 if (tcp_v6_inbound_md5_hash (sk, skb))
1325 goto discard;
1326#endif
1327
fda9ef5d 1328 if (sk_filter(sk, skb))
1da177e4
LT
1329 goto discard;
1330
1331 /*
1332 * socket locking is here for SMP purposes as backlog rcv
1333 * is currently called with bh processing disabled.
1334 */
1335
1336 /* Do Stevens' IPV6_PKTOPTIONS.
1337
1338 Yes, guys, it is the only place in our code, where we
1339 may make it not affecting IPv4.
1340 The rest of code is protocol independent,
1341 and I do not like idea to uglify IPv4.
1342
1343 Actually, all the idea behind IPV6_PKTOPTIONS
1344 looks not very well thought. For now we latch
1345 options, received in the last packet, enqueued
1346 by tcp. Feel free to propose better solution.
1ab1457c 1347 --ANK (980728)
1da177e4
LT
1348 */
1349 if (np->rxopt.all)
99a1dec7 1350 opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
1da177e4
LT
1351
1352 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
5d299f3d
ED
1353 struct dst_entry *dst = sk->sk_rx_dst;
1354
bdeab991 1355 sock_rps_save_rxhash(sk, skb);
5d299f3d
ED
1356 if (dst) {
1357 if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1358 dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1359 dst_release(dst);
1360 sk->sk_rx_dst = NULL;
1361 }
1362 }
1363
c995ae22 1364 tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len);
1da177e4
LT
1365 if (opt_skb)
1366 goto ipv6_pktoptions;
1367 return 0;
1368 }
1369
ab6a5bb6 1370 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1da177e4
LT
1371 goto csum_err;
1372
1ab1457c 1373 if (sk->sk_state == TCP_LISTEN) {
1da177e4
LT
1374 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1375 if (!nsk)
1376 goto discard;
1377
1378 /*
1379 * Queue it on the new socket if the new socket is active,
1380 * otherwise we just shortcircuit this and continue with
1381 * the new socket..
1382 */
1ab1457c 1383 if(nsk != sk) {
bdeab991 1384 sock_rps_save_rxhash(nsk, skb);
1da177e4
LT
1385 if (tcp_child_process(sk, nsk, skb))
1386 goto reset;
1387 if (opt_skb)
1388 __kfree_skb(opt_skb);
1389 return 0;
1390 }
47482f13 1391 } else
bdeab991 1392 sock_rps_save_rxhash(sk, skb);
1da177e4 1393
aa8223c7 1394 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1da177e4 1395 goto reset;
1da177e4
LT
1396 if (opt_skb)
1397 goto ipv6_pktoptions;
1398 return 0;
1399
1400reset:
cfb6eeb4 1401 tcp_v6_send_reset(sk, skb);
1da177e4
LT
1402discard:
1403 if (opt_skb)
1404 __kfree_skb(opt_skb);
1405 kfree_skb(skb);
1406 return 0;
1407csum_err:
6a5dc9e5 1408 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
63231bdd 1409 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1da177e4
LT
1410 goto discard;
1411
1412
1413ipv6_pktoptions:
1414 /* Do you ask, what is it?
1415
1416 1. skb was enqueued by tcp.
1417 2. skb is added to tail of read queue, rather than out of order.
1418 3. socket is not in passive state.
1419 4. Finally, it really contains options, which user wants to receive.
1420 */
1421 tp = tcp_sk(sk);
1422 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1423 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
333fad53 1424 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
505cbfc5 1425 np->mcast_oif = inet6_iif(opt_skb);
333fad53 1426 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
0660e03f 1427 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
4c507d28 1428 if (np->rxopt.bits.rxtclass)
3a1c7565 1429 np->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(opt_skb));
1da177e4
LT
1430 if (ipv6_opt_accepted(sk, opt_skb)) {
1431 skb_set_owner_r(opt_skb, sk);
1432 opt_skb = xchg(&np->pktoptions, opt_skb);
1433 } else {
1434 __kfree_skb(opt_skb);
1435 opt_skb = xchg(&np->pktoptions, NULL);
1436 }
1437 }
1438
800d55f1 1439 kfree_skb(opt_skb);
1da177e4
LT
1440 return 0;
1441}
1442
e5bbef20 1443static int tcp_v6_rcv(struct sk_buff *skb)
1da177e4 1444{
cf533ea5 1445 const struct tcphdr *th;
b71d1d42 1446 const struct ipv6hdr *hdr;
1da177e4
LT
1447 struct sock *sk;
1448 int ret;
a86b1e30 1449 struct net *net = dev_net(skb->dev);
1da177e4
LT
1450
1451 if (skb->pkt_type != PACKET_HOST)
1452 goto discard_it;
1453
1454 /*
1455 * Count it even if it's bad.
1456 */
63231bdd 1457 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1da177e4
LT
1458
1459 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1460 goto discard_it;
1461
aa8223c7 1462 th = tcp_hdr(skb);
1da177e4
LT
1463
1464 if (th->doff < sizeof(struct tcphdr)/4)
1465 goto bad_packet;
1466 if (!pskb_may_pull(skb, th->doff*4))
1467 goto discard_it;
1468
60476372 1469 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
6a5dc9e5 1470 goto csum_error;
1da177e4 1471
aa8223c7 1472 th = tcp_hdr(skb);
e802af9c 1473 hdr = ipv6_hdr(skb);
1da177e4
LT
1474 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1475 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1476 skb->len - th->doff*4);
1477 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1478 TCP_SKB_CB(skb)->when = 0;
b82d1bb4 1479 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
1da177e4
LT
1480 TCP_SKB_CB(skb)->sacked = 0;
1481
9a1f27c4 1482 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1da177e4
LT
1483 if (!sk)
1484 goto no_tcp_socket;
1485
1486process:
1487 if (sk->sk_state == TCP_TIME_WAIT)
1488 goto do_time_wait;
1489
e802af9c
SH
1490 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1491 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1492 goto discard_and_relse;
1493 }
1494
1da177e4
LT
1495 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1496 goto discard_and_relse;
1497
fda9ef5d 1498 if (sk_filter(sk, skb))
1da177e4
LT
1499 goto discard_and_relse;
1500
8b80cda5 1501 sk_mark_napi_id(sk, skb);
1da177e4
LT
1502 skb->dev = NULL;
1503
293b9c42 1504 bh_lock_sock_nested(sk);
1da177e4
LT
1505 ret = 0;
1506 if (!sock_owned_by_user(sk)) {
1a2449a8 1507#ifdef CONFIG_NET_DMA
1ab1457c 1508 struct tcp_sock *tp = tcp_sk(sk);
b4caea8a 1509 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
a2bd1140 1510 tp->ucopy.dma_chan = net_dma_find_channel();
1ab1457c
YH
1511 if (tp->ucopy.dma_chan)
1512 ret = tcp_v6_do_rcv(sk, skb);
1513 else
1a2449a8
CL
1514#endif
1515 {
1516 if (!tcp_prequeue(sk, skb))
1517 ret = tcp_v6_do_rcv(sk, skb);
1518 }
da882c1f
ED
1519 } else if (unlikely(sk_add_backlog(sk, skb,
1520 sk->sk_rcvbuf + sk->sk_sndbuf))) {
6b03a53a 1521 bh_unlock_sock(sk);
6cce09f8 1522 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
6b03a53a
ZY
1523 goto discard_and_relse;
1524 }
1da177e4
LT
1525 bh_unlock_sock(sk);
1526
1527 sock_put(sk);
1528 return ret ? -1 : 0;
1529
1530no_tcp_socket:
1531 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1532 goto discard_it;
1533
1534 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
6a5dc9e5
ED
1535csum_error:
1536 TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
1da177e4 1537bad_packet:
63231bdd 1538 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1da177e4 1539 } else {
cfb6eeb4 1540 tcp_v6_send_reset(NULL, skb);
1da177e4
LT
1541 }
1542
1543discard_it:
1da177e4
LT
1544 kfree_skb(skb);
1545 return 0;
1546
1547discard_and_relse:
1548 sock_put(sk);
1549 goto discard_it;
1550
1551do_time_wait:
1552 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
9469c7b4 1553 inet_twsk_put(inet_twsk(sk));
1da177e4
LT
1554 goto discard_it;
1555 }
1556
6a5dc9e5 1557 if (skb->len < (th->doff<<2)) {
9469c7b4 1558 inet_twsk_put(inet_twsk(sk));
6a5dc9e5
ED
1559 goto bad_packet;
1560 }
1561 if (tcp_checksum_complete(skb)) {
1562 inet_twsk_put(inet_twsk(sk));
1563 goto csum_error;
1da177e4
LT
1564 }
1565
9469c7b4 1566 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1da177e4
LT
1567 case TCP_TW_SYN:
1568 {
1569 struct sock *sk2;
1570
c346dca1 1571 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
5ba24953 1572 &ipv6_hdr(skb)->saddr, th->source,
0660e03f 1573 &ipv6_hdr(skb)->daddr,
505cbfc5 1574 ntohs(th->dest), inet6_iif(skb));
1da177e4 1575 if (sk2 != NULL) {
295ff7ed
ACM
1576 struct inet_timewait_sock *tw = inet_twsk(sk);
1577 inet_twsk_deschedule(tw, &tcp_death_row);
1578 inet_twsk_put(tw);
1da177e4
LT
1579 sk = sk2;
1580 goto process;
1581 }
1582 /* Fall through to ACK */
1583 }
1584 case TCP_TW_ACK:
1585 tcp_v6_timewait_ack(sk, skb);
1586 break;
1587 case TCP_TW_RST:
1588 goto no_tcp_socket;
1589 case TCP_TW_SUCCESS:;
1590 }
1591 goto discard_it;
1592}
1593
c7109986
ED
1594static void tcp_v6_early_demux(struct sk_buff *skb)
1595{
1596 const struct ipv6hdr *hdr;
1597 const struct tcphdr *th;
1598 struct sock *sk;
1599
1600 if (skb->pkt_type != PACKET_HOST)
1601 return;
1602
1603 if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1604 return;
1605
1606 hdr = ipv6_hdr(skb);
1607 th = tcp_hdr(skb);
1608
1609 if (th->doff < sizeof(struct tcphdr) / 4)
1610 return;
1611
1612 sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1613 &hdr->saddr, th->source,
1614 &hdr->daddr, ntohs(th->dest),
1615 inet6_iif(skb));
1616 if (sk) {
1617 skb->sk = sk;
1618 skb->destructor = sock_edemux;
1619 if (sk->sk_state != TCP_TIME_WAIT) {
1620 struct dst_entry *dst = sk->sk_rx_dst;
f3f12135 1621
c7109986 1622 if (dst)
5d299f3d 1623 dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
c7109986 1624 if (dst &&
f3f12135 1625 inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
c7109986
ED
1626 skb_dst_set_noref(skb, dst);
1627 }
1628 }
1629}
1630
ccb7c410
DM
1631static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1632 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1633 .twsk_unique = tcp_twsk_unique,
1634 .twsk_destructor= tcp_twsk_destructor,
ccb7c410
DM
1635};
1636
3b401a81 1637static const struct inet_connection_sock_af_ops ipv6_specific = {
543d9cfe
ACM
1638 .queue_xmit = inet6_csk_xmit,
1639 .send_check = tcp_v6_send_check,
1640 .rebuild_header = inet6_sk_rebuild_header,
5d299f3d 1641 .sk_rx_dst_set = inet6_sk_rx_dst_set,
543d9cfe
ACM
1642 .conn_request = tcp_v6_conn_request,
1643 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe 1644 .net_header_len = sizeof(struct ipv6hdr),
67469601 1645 .net_frag_header_len = sizeof(struct frag_hdr),
543d9cfe
ACM
1646 .setsockopt = ipv6_setsockopt,
1647 .getsockopt = ipv6_getsockopt,
1648 .addr2sockaddr = inet6_csk_addr2sockaddr,
1649 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1650 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1651#ifdef CONFIG_COMPAT
543d9cfe
ACM
1652 .compat_setsockopt = compat_ipv6_setsockopt,
1653 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1654#endif
1da177e4
LT
1655};
1656
cfb6eeb4 1657#ifdef CONFIG_TCP_MD5SIG
b2e4b3de 1658static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
cfb6eeb4 1659 .md5_lookup = tcp_v6_md5_lookup,
49a72dfb 1660 .calc_md5_hash = tcp_v6_md5_hash_skb,
cfb6eeb4 1661 .md5_parse = tcp_v6_parse_md5_keys,
cfb6eeb4 1662};
a928630a 1663#endif
cfb6eeb4 1664
1da177e4
LT
1665/*
1666 * TCP over IPv4 via INET6 API
1667 */
1668
3b401a81 1669static const struct inet_connection_sock_af_ops ipv6_mapped = {
543d9cfe
ACM
1670 .queue_xmit = ip_queue_xmit,
1671 .send_check = tcp_v4_send_check,
1672 .rebuild_header = inet_sk_rebuild_header,
63d02d15 1673 .sk_rx_dst_set = inet_sk_rx_dst_set,
543d9cfe
ACM
1674 .conn_request = tcp_v6_conn_request,
1675 .syn_recv_sock = tcp_v6_syn_recv_sock,
543d9cfe
ACM
1676 .net_header_len = sizeof(struct iphdr),
1677 .setsockopt = ipv6_setsockopt,
1678 .getsockopt = ipv6_getsockopt,
1679 .addr2sockaddr = inet6_csk_addr2sockaddr,
1680 .sockaddr_len = sizeof(struct sockaddr_in6),
ab1e0a13 1681 .bind_conflict = inet6_csk_bind_conflict,
3fdadf7d 1682#ifdef CONFIG_COMPAT
543d9cfe
ACM
1683 .compat_setsockopt = compat_ipv6_setsockopt,
1684 .compat_getsockopt = compat_ipv6_getsockopt,
3fdadf7d 1685#endif
1da177e4
LT
1686};
1687
cfb6eeb4 1688#ifdef CONFIG_TCP_MD5SIG
b2e4b3de 1689static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
cfb6eeb4 1690 .md5_lookup = tcp_v4_md5_lookup,
49a72dfb 1691 .calc_md5_hash = tcp_v4_md5_hash_skb,
cfb6eeb4 1692 .md5_parse = tcp_v6_parse_md5_keys,
cfb6eeb4 1693};
a928630a 1694#endif
cfb6eeb4 1695
1da177e4
LT
1696/* NOTE: A lot of things set to zero explicitly by call to
1697 * sk_alloc() so need not be done here.
1698 */
1699static int tcp_v6_init_sock(struct sock *sk)
1700{
6687e988 1701 struct inet_connection_sock *icsk = inet_csk(sk);
1da177e4 1702
900f65d3 1703 tcp_init_sock(sk);
1da177e4 1704
8292a17a 1705 icsk->icsk_af_ops = &ipv6_specific;
1da177e4 1706
cfb6eeb4 1707#ifdef CONFIG_TCP_MD5SIG
ac807fa8 1708 tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
cfb6eeb4
YH
1709#endif
1710
1da177e4
LT
1711 return 0;
1712}
1713
7d06b2e0 1714static void tcp_v6_destroy_sock(struct sock *sk)
1da177e4 1715{
1da177e4 1716 tcp_v4_destroy_sock(sk);
7d06b2e0 1717 inet6_destroy_sock(sk);
1da177e4
LT
1718}
1719
952a10be 1720#ifdef CONFIG_PROC_FS
1da177e4 1721/* Proc filesystem TCPv6 sock list dumping. */
1ab1457c 1722static void get_openreq6(struct seq_file *seq,
a7cb5a49 1723 const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
1da177e4 1724{
1da177e4 1725 int ttd = req->expires - jiffies;
634fb979
ED
1726 const struct in6_addr *src = &inet_rsk(req)->ir_v6_loc_addr;
1727 const struct in6_addr *dest = &inet_rsk(req)->ir_v6_rmt_addr;
1da177e4
LT
1728
1729 if (ttd < 0)
1730 ttd = 0;
1731
1da177e4
LT
1732 seq_printf(seq,
1733 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
d14c5ab6 1734 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %d %d %pK\n",
1da177e4
LT
1735 i,
1736 src->s6_addr32[0], src->s6_addr32[1],
1737 src->s6_addr32[2], src->s6_addr32[3],
b44084c2 1738 inet_rsk(req)->ir_num,
1da177e4
LT
1739 dest->s6_addr32[0], dest->s6_addr32[1],
1740 dest->s6_addr32[2], dest->s6_addr32[3],
634fb979 1741 ntohs(inet_rsk(req)->ir_rmt_port),
1da177e4
LT
1742 TCP_SYN_RECV,
1743 0,0, /* could print option size, but that is af dependent. */
1ab1457c
YH
1744 1, /* timers active (only the expire timer) */
1745 jiffies_to_clock_t(ttd),
e6c022a4 1746 req->num_timeout,
a7cb5a49 1747 from_kuid_munged(seq_user_ns(seq), uid),
1ab1457c 1748 0, /* non standard timer */
1da177e4
LT
1749 0, /* open_requests have no inode */
1750 0, req);
1751}
1752
1753static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1754{
b71d1d42 1755 const struct in6_addr *dest, *src;
1da177e4
LT
1756 __u16 destp, srcp;
1757 int timer_active;
1758 unsigned long timer_expires;
cf533ea5
ED
1759 const struct inet_sock *inet = inet_sk(sp);
1760 const struct tcp_sock *tp = tcp_sk(sp);
463c84b9 1761 const struct inet_connection_sock *icsk = inet_csk(sp);
1da177e4 1762
efe4208f
ED
1763 dest = &sp->sk_v6_daddr;
1764 src = &sp->sk_v6_rcv_saddr;
c720c7e8
ED
1765 destp = ntohs(inet->inet_dport);
1766 srcp = ntohs(inet->inet_sport);
463c84b9
ACM
1767
1768 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1da177e4 1769 timer_active = 1;
463c84b9
ACM
1770 timer_expires = icsk->icsk_timeout;
1771 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1da177e4 1772 timer_active = 4;
463c84b9 1773 timer_expires = icsk->icsk_timeout;
1da177e4
LT
1774 } else if (timer_pending(&sp->sk_timer)) {
1775 timer_active = 2;
1776 timer_expires = sp->sk_timer.expires;
1777 } else {
1778 timer_active = 0;
1779 timer_expires = jiffies;
1780 }
1781
1782 seq_printf(seq,
1783 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
d14c5ab6 1784 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %lu %d %pK %lu %lu %u %u %d\n",
1da177e4
LT
1785 i,
1786 src->s6_addr32[0], src->s6_addr32[1],
1787 src->s6_addr32[2], src->s6_addr32[3], srcp,
1788 dest->s6_addr32[0], dest->s6_addr32[1],
1789 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1ab1457c 1790 sp->sk_state,
47da8ee6
SS
1791 tp->write_seq-tp->snd_una,
1792 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1da177e4 1793 timer_active,
a399a805 1794 jiffies_delta_to_clock_t(timer_expires - jiffies),
463c84b9 1795 icsk->icsk_retransmits,
a7cb5a49 1796 from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
6687e988 1797 icsk->icsk_probes_out,
1da177e4
LT
1798 sock_i_ino(sp),
1799 atomic_read(&sp->sk_refcnt), sp,
7be87351
SH
1800 jiffies_to_clock_t(icsk->icsk_rto),
1801 jiffies_to_clock_t(icsk->icsk_ack.ato),
463c84b9 1802 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
0b6a05c1
IJ
1803 tp->snd_cwnd,
1804 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
1da177e4
LT
1805 );
1806}
1807
1ab1457c 1808static void get_timewait6_sock(struct seq_file *seq,
8feaf0c0 1809 struct inet_timewait_sock *tw, int i)
1da177e4 1810{
b71d1d42 1811 const struct in6_addr *dest, *src;
1da177e4 1812 __u16 destp, srcp;
96f817fe 1813 s32 delta = tw->tw_ttd - inet_tw_time_stamp();
1da177e4 1814
efe4208f
ED
1815 dest = &tw->tw_v6_daddr;
1816 src = &tw->tw_v6_rcv_saddr;
1da177e4
LT
1817 destp = ntohs(tw->tw_dport);
1818 srcp = ntohs(tw->tw_sport);
1819
1820 seq_printf(seq,
1821 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
71338aa7 1822 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1da177e4
LT
1823 i,
1824 src->s6_addr32[0], src->s6_addr32[1],
1825 src->s6_addr32[2], src->s6_addr32[3], srcp,
1826 dest->s6_addr32[0], dest->s6_addr32[1],
1827 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1828 tw->tw_substate, 0, 0,
a399a805 1829 3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
1da177e4
LT
1830 atomic_read(&tw->tw_refcnt), tw);
1831}
1832
1da177e4
LT
1833static int tcp6_seq_show(struct seq_file *seq, void *v)
1834{
1835 struct tcp_iter_state *st;
05dbc7b5 1836 struct sock *sk = v;
1da177e4
LT
1837
1838 if (v == SEQ_START_TOKEN) {
1839 seq_puts(seq,
1840 " sl "
1841 "local_address "
1842 "remote_address "
1843 "st tx_queue rx_queue tr tm->when retrnsmt"
1844 " uid timeout inode\n");
1845 goto out;
1846 }
1847 st = seq->private;
1848
1849 switch (st->state) {
1850 case TCP_SEQ_STATE_LISTENING:
1851 case TCP_SEQ_STATE_ESTABLISHED:
05dbc7b5
ED
1852 if (sk->sk_state == TCP_TIME_WAIT)
1853 get_timewait6_sock(seq, v, st->num);
1854 else
1855 get_tcp6_sock(seq, v, st->num);
1da177e4
LT
1856 break;
1857 case TCP_SEQ_STATE_OPENREQ:
1858 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1859 break;
1da177e4
LT
1860 }
1861out:
1862 return 0;
1863}
1864
73cb88ec
AV
1865static const struct file_operations tcp6_afinfo_seq_fops = {
1866 .owner = THIS_MODULE,
1867 .open = tcp_seq_open,
1868 .read = seq_read,
1869 .llseek = seq_lseek,
1870 .release = seq_release_net
1871};
1872
1da177e4 1873static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1da177e4
LT
1874 .name = "tcp6",
1875 .family = AF_INET6,
73cb88ec 1876 .seq_fops = &tcp6_afinfo_seq_fops,
9427c4b3
DL
1877 .seq_ops = {
1878 .show = tcp6_seq_show,
1879 },
1da177e4
LT
1880};
1881
2c8c1e72 1882int __net_init tcp6_proc_init(struct net *net)
1da177e4 1883{
6f8b13bc 1884 return tcp_proc_register(net, &tcp6_seq_afinfo);
1da177e4
LT
1885}
1886
6f8b13bc 1887void tcp6_proc_exit(struct net *net)
1da177e4 1888{
6f8b13bc 1889 tcp_proc_unregister(net, &tcp6_seq_afinfo);
1da177e4
LT
1890}
1891#endif
1892
f77d6021
ED
1893static void tcp_v6_clear_sk(struct sock *sk, int size)
1894{
1895 struct inet_sock *inet = inet_sk(sk);
1896
1897 /* we do not want to clear pinet6 field, because of RCU lookups */
1898 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1899
1900 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1901 memset(&inet->pinet6 + 1, 0, size);
1902}
1903
1da177e4
LT
1904struct proto tcpv6_prot = {
1905 .name = "TCPv6",
1906 .owner = THIS_MODULE,
1907 .close = tcp_close,
1908 .connect = tcp_v6_connect,
1909 .disconnect = tcp_disconnect,
463c84b9 1910 .accept = inet_csk_accept,
1da177e4
LT
1911 .ioctl = tcp_ioctl,
1912 .init = tcp_v6_init_sock,
1913 .destroy = tcp_v6_destroy_sock,
1914 .shutdown = tcp_shutdown,
1915 .setsockopt = tcp_setsockopt,
1916 .getsockopt = tcp_getsockopt,
1da177e4 1917 .recvmsg = tcp_recvmsg,
7ba42910
CG
1918 .sendmsg = tcp_sendmsg,
1919 .sendpage = tcp_sendpage,
1da177e4 1920 .backlog_rcv = tcp_v6_do_rcv,
46d3ceab 1921 .release_cb = tcp_release_cb,
563d34d0 1922 .mtu_reduced = tcp_v6_mtu_reduced,
1da177e4 1923 .hash = tcp_v6_hash,
ab1e0a13
ACM
1924 .unhash = inet_unhash,
1925 .get_port = inet_csk_get_port,
1da177e4 1926 .enter_memory_pressure = tcp_enter_memory_pressure,
c9bee3b7 1927 .stream_memory_free = tcp_stream_memory_free,
1da177e4
LT
1928 .sockets_allocated = &tcp_sockets_allocated,
1929 .memory_allocated = &tcp_memory_allocated,
1930 .memory_pressure = &tcp_memory_pressure,
0a5578cf 1931 .orphan_count = &tcp_orphan_count,
a4fe34bf 1932 .sysctl_mem = sysctl_tcp_mem,
1da177e4
LT
1933 .sysctl_wmem = sysctl_tcp_wmem,
1934 .sysctl_rmem = sysctl_tcp_rmem,
1935 .max_header = MAX_TCP_HEADER,
1936 .obj_size = sizeof(struct tcp6_sock),
3ab5aee7 1937 .slab_flags = SLAB_DESTROY_BY_RCU,
6d6ee43e 1938 .twsk_prot = &tcp6_timewait_sock_ops,
60236fdd 1939 .rsk_prot = &tcp6_request_sock_ops,
39d8cda7 1940 .h.hashinfo = &tcp_hashinfo,
7ba42910 1941 .no_autobind = true,
543d9cfe
ACM
1942#ifdef CONFIG_COMPAT
1943 .compat_setsockopt = compat_tcp_setsockopt,
1944 .compat_getsockopt = compat_tcp_getsockopt,
1945#endif
c255a458 1946#ifdef CONFIG_MEMCG_KMEM
d1a4c0b3
GC
1947 .proto_cgroup = tcp_proto_cgroup,
1948#endif
f77d6021 1949 .clear_sk = tcp_v6_clear_sk,
1da177e4
LT
1950};
1951
41135cc8 1952static const struct inet6_protocol tcpv6_protocol = {
c7109986 1953 .early_demux = tcp_v6_early_demux,
1da177e4
LT
1954 .handler = tcp_v6_rcv,
1955 .err_handler = tcp_v6_err,
1956 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1957};
1958
1da177e4
LT
1959static struct inet_protosw tcpv6_protosw = {
1960 .type = SOCK_STREAM,
1961 .protocol = IPPROTO_TCP,
1962 .prot = &tcpv6_prot,
1963 .ops = &inet6_stream_ops,
1da177e4 1964 .no_check = 0,
d83d8461
ACM
1965 .flags = INET_PROTOSW_PERMANENT |
1966 INET_PROTOSW_ICSK,
1da177e4
LT
1967};
1968
2c8c1e72 1969static int __net_init tcpv6_net_init(struct net *net)
93ec926b 1970{
5677242f
DL
1971 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
1972 SOCK_RAW, IPPROTO_TCP, net);
93ec926b
DL
1973}
1974
2c8c1e72 1975static void __net_exit tcpv6_net_exit(struct net *net)
93ec926b 1976{
5677242f 1977 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
b099ce26
EB
1978}
1979
2c8c1e72 1980static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
b099ce26
EB
1981{
1982 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
93ec926b
DL
1983}
1984
1985static struct pernet_operations tcpv6_net_ops = {
b099ce26
EB
1986 .init = tcpv6_net_init,
1987 .exit = tcpv6_net_exit,
1988 .exit_batch = tcpv6_net_exit_batch,
93ec926b
DL
1989};
1990
7f4e4868 1991int __init tcpv6_init(void)
1da177e4 1992{
7f4e4868
DL
1993 int ret;
1994
3336288a
VY
1995 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
1996 if (ret)
c6b641a4 1997 goto out;
3336288a 1998
1da177e4 1999 /* register inet6 protocol */
7f4e4868
DL
2000 ret = inet6_register_protosw(&tcpv6_protosw);
2001 if (ret)
2002 goto out_tcpv6_protocol;
2003
93ec926b 2004 ret = register_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2005 if (ret)
2006 goto out_tcpv6_protosw;
2007out:
2008 return ret;
ae0f7d5f 2009
7f4e4868
DL
2010out_tcpv6_protosw:
2011 inet6_unregister_protosw(&tcpv6_protosw);
3336288a
VY
2012out_tcpv6_protocol:
2013 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
7f4e4868
DL
2014 goto out;
2015}
2016
09f7709f 2017void tcpv6_exit(void)
7f4e4868 2018{
93ec926b 2019 unregister_pernet_subsys(&tcpv6_net_ops);
7f4e4868
DL
2020 inet6_unregister_protosw(&tcpv6_protosw);
2021 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
1da177e4 2022}