blob: a7a62ce12b3f4fd896a372a459ddc2696d00c5a3 [file] [log] [blame]
/*
 *	TCP over IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	Based on:
 *	linux/net/ipv4/tcp.c
 *	linux/net/ipv4/tcp_input.c
 *	linux/net/ipv4/tcp_output.c
 *
 *	Fixes:
 *	Hideaki YOSHIFUJI	:	sin6_scope_id support
 *	YOSHIFUJI Hideaki @USAGI and:	Support IPV6_V6ONLY socket option, which
 *	Alexey Kuznetsov		allows both IPv4 and IPv6 sockets to bind
 *					a single port at the same time.
 *	YOSHIFUJI Hideaki @USAGI:	convert /proc/net/tcp6 to seq_file.
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */
25
Herbert Xueb4dea52008-12-29 23:04:08 -080026#include <linux/bottom_half.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070027#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090041#include <linux/slab.h>
Wang Yufen4aa956d2014-03-29 09:27:29 +080042#include <linux/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
Arnaldo Carvalho de Melo5324a042005-08-12 09:26:18 -030049#include <net/inet6_hashtables.h>
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -080050#include <net/inet6_connection_sock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070059#include <net/snmp.h>
60#include <net/dsfield.h>
Arnaldo Carvalho de Melo6d6ee432005-12-13 23:25:19 -080061#include <net/timewait_sock.h>
Jeff Garzik18134be2007-10-26 22:53:14 -070062#include <net/netdma.h>
Denis V. Lunev3d58b5f2008-04-03 14:22:32 -070063#include <net/inet_common.h>
David S. Miller6e5714e2011-08-03 20:50:44 -070064#include <net/secure_seq.h>
Glauber Costad1a4c0b2011-12-11 21:47:04 +000065#include <net/tcp_memcontrol.h>
Eliezer Tamir076bb0c2013-07-10 17:13:17 +030066#include <net/busy_poll.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
Linus Torvalds1da177e2005-04-16 15:20:36 -070068#include <linux/proc_fs.h>
69#include <linux/seq_file.h>
70
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -080071#include <linux/crypto.h>
72#include <linux/scatterlist.h>
73
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -080074static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
Gui Jianfeng6edafaa2008-08-06 23:50:04 -070075static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
76 struct request_sock *req);
Linus Torvalds1da177e2005-04-16 15:20:36 -070077
78static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
Stephen Hemminger3b401a82009-09-01 19:25:04 +000080static const struct inet_connection_sock_af_ops ipv6_mapped;
81static const struct inet_connection_sock_af_ops ipv6_specific;
David S. Millera9286302006-11-14 19:53:22 -080082#ifdef CONFIG_TCP_MD5SIG
Stephen Hemmingerb2e4b3de2009-09-01 19:25:03 +000083static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
84static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +090085#else
86static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
Eric Dumazetb71d1d42011-04-22 04:53:02 +000087 const struct in6_addr *addr)
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +090088{
89 return NULL;
90}
David S. Millera9286302006-11-14 19:53:22 -080091#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070092
Neal Cardwellfae6ef82012-08-19 03:30:38 +000093static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
94{
95 struct dst_entry *dst = skb_dst(skb);
96 const struct rt6_info *rt = (const struct rt6_info *)dst;
97
98 dst_hold(dst);
99 sk->sk_rx_dst = dst;
100 inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
101 if (rt->rt6i_node)
102 inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
103}
104
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105static void tcp_v6_hash(struct sock *sk)
106{
107 if (sk->sk_state != TCP_CLOSE) {
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -0800108 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109 tcp_prot.hash(sk);
110 return;
111 }
112 local_bh_disable();
Eric Dumazet9327f702009-12-04 03:46:54 +0000113 __inet6_hash(sk, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 local_bh_enable();
115 }
116}
117
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400118static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119{
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700120 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
121 ipv6_hdr(skb)->saddr.s6_addr32,
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700122 tcp_hdr(skb)->dest,
123 tcp_hdr(skb)->source);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124}
125
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900126static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127 int addr_len)
128{
129 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900130 struct inet_sock *inet = inet_sk(sk);
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800131 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132 struct ipv6_pinfo *np = inet6_sk(sk);
133 struct tcp_sock *tp = tcp_sk(sk);
Arnaud Ebalard20c59de2010-06-01 21:35:01 +0000134 struct in6_addr *saddr = NULL, *final_p, final;
David S. Miller493f3772010-12-02 12:14:29 -0800135 struct rt6_info *rt;
David S. Miller4c9483b2011-03-12 16:22:43 -0500136 struct flowi6 fl6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137 struct dst_entry *dst;
138 int addr_type;
139 int err;
140
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900141 if (addr_len < SIN6_LEN_RFC2133)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142 return -EINVAL;
143
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900144 if (usin->sin6_family != AF_INET6)
Eric Dumazeta02cec22010-09-22 20:43:57 +0000145 return -EAFNOSUPPORT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700146
David S. Miller4c9483b2011-03-12 16:22:43 -0500147 memset(&fl6, 0, sizeof(fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148
149 if (np->sndflow) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500150 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
151 IP6_ECN_flow_init(fl6.flowlabel);
152 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 struct ip6_flowlabel *flowlabel;
David S. Miller4c9483b2011-03-12 16:22:43 -0500154 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 if (flowlabel == NULL)
156 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157 fl6_sock_release(flowlabel);
158 }
159 }
160
161 /*
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900162 * connect() to INADDR_ANY means loopback (BSD'ism).
163 */
164
Weilong Chen4c99aa42013-12-19 18:44:34 +0800165 if (ipv6_addr_any(&usin->sin6_addr))
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900166 usin->sin6_addr.s6_addr[15] = 0x1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167
168 addr_type = ipv6_addr_type(&usin->sin6_addr);
169
Weilong Chen4c99aa42013-12-19 18:44:34 +0800170 if (addr_type & IPV6_ADDR_MULTICAST)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171 return -ENETUNREACH;
172
173 if (addr_type&IPV6_ADDR_LINKLOCAL) {
174 if (addr_len >= sizeof(struct sockaddr_in6) &&
175 usin->sin6_scope_id) {
176 /* If interface is set while binding, indices
177 * must coincide.
178 */
179 if (sk->sk_bound_dev_if &&
180 sk->sk_bound_dev_if != usin->sin6_scope_id)
181 return -EINVAL;
182
183 sk->sk_bound_dev_if = usin->sin6_scope_id;
184 }
185
186 /* Connect to link-local address requires an interface */
187 if (!sk->sk_bound_dev_if)
188 return -EINVAL;
189 }
190
191 if (tp->rx_opt.ts_recent_stamp &&
Eric Dumazetefe42082013-10-03 15:42:29 -0700192 !ipv6_addr_equal(&sk->sk_v6_daddr, &usin->sin6_addr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193 tp->rx_opt.ts_recent = 0;
194 tp->rx_opt.ts_recent_stamp = 0;
195 tp->write_seq = 0;
196 }
197
Eric Dumazetefe42082013-10-03 15:42:29 -0700198 sk->sk_v6_daddr = usin->sin6_addr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500199 np->flow_label = fl6.flowlabel;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200
201 /*
202 * TCP over IPv4
203 */
204
205 if (addr_type == IPV6_ADDR_MAPPED) {
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800206 u32 exthdrlen = icsk->icsk_ext_hdr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207 struct sockaddr_in sin;
208
209 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
210
211 if (__ipv6_only_sock(sk))
212 return -ENETUNREACH;
213
214 sin.sin_family = AF_INET;
215 sin.sin_port = usin->sin6_port;
216 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
217
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800218 icsk->icsk_af_ops = &ipv6_mapped;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219 sk->sk_backlog_rcv = tcp_v4_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800220#ifdef CONFIG_TCP_MD5SIG
221 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
222#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223
224 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
225
226 if (err) {
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800227 icsk->icsk_ext_hdr_len = exthdrlen;
228 icsk->icsk_af_ops = &ipv6_specific;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 sk->sk_backlog_rcv = tcp_v6_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800230#ifdef CONFIG_TCP_MD5SIG
231 tp->af_specific = &tcp_sock_ipv6_specific;
232#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233 goto failure;
234 } else {
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000235 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
236 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
Eric Dumazetefe42082013-10-03 15:42:29 -0700237 &sk->sk_v6_rcv_saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238 }
239
240 return err;
241 }
242
Eric Dumazetefe42082013-10-03 15:42:29 -0700243 if (!ipv6_addr_any(&sk->sk_v6_rcv_saddr))
244 saddr = &sk->sk_v6_rcv_saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245
David S. Miller4c9483b2011-03-12 16:22:43 -0500246 fl6.flowi6_proto = IPPROTO_TCP;
Eric Dumazetefe42082013-10-03 15:42:29 -0700247 fl6.daddr = sk->sk_v6_daddr;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000248 fl6.saddr = saddr ? *saddr : np->saddr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500249 fl6.flowi6_oif = sk->sk_bound_dev_if;
250 fl6.flowi6_mark = sk->sk_mark;
David S. Miller1958b852011-03-12 16:36:19 -0500251 fl6.fl6_dport = usin->sin6_port;
252 fl6.fl6_sport = inet->inet_sport;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253
David S. Miller4c9483b2011-03-12 16:22:43 -0500254 final_p = fl6_update_dst(&fl6, np->opt, &final);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255
David S. Miller4c9483b2011-03-12 16:22:43 -0500256 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
Venkat Yekkiralabeb8d132006-08-04 23:12:42 -0700257
Steffen Klassert0e0d44a2013-08-28 08:04:14 +0200258 dst = ip6_dst_lookup_flow(sk, &fl6, final_p);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800259 if (IS_ERR(dst)) {
260 err = PTR_ERR(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261 goto failure;
David S. Miller14e50e52007-05-24 18:17:54 -0700262 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263
264 if (saddr == NULL) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500265 saddr = &fl6.saddr;
Eric Dumazetefe42082013-10-03 15:42:29 -0700266 sk->sk_v6_rcv_saddr = *saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267 }
268
269 /* set the source address */
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000270 np->saddr = *saddr;
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000271 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272
Herbert Xuf83ef8c2006-06-30 13:37:03 -0700273 sk->sk_gso_type = SKB_GSO_TCPV6;
YOSHIFUJI Hideaki8e1ef0a2006-08-29 17:15:09 -0700274 __ip6_dst_store(sk, dst, NULL, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275
David S. Miller493f3772010-12-02 12:14:29 -0800276 rt = (struct rt6_info *) dst;
277 if (tcp_death_row.sysctl_tw_recycle &&
278 !tp->rx_opt.ts_recent_stamp &&
Eric Dumazetefe42082013-10-03 15:42:29 -0700279 ipv6_addr_equal(&rt->rt6i_dst.addr, &sk->sk_v6_daddr))
David S. Miller81166dd2012-07-10 03:14:24 -0700280 tcp_fetch_timewait_stamp(sk, dst);
David S. Miller493f3772010-12-02 12:14:29 -0800281
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800282 icsk->icsk_ext_hdr_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283 if (np->opt)
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800284 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
285 np->opt->opt_nflen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286
287 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
288
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000289 inet->inet_dport = usin->sin6_port;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290
291 tcp_set_state(sk, TCP_SYN_SENT);
Arnaldo Carvalho de Melod8313f52005-12-13 23:25:44 -0800292 err = inet6_hash_connect(&tcp_death_row, sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293 if (err)
294 goto late_failure;
295
Andrey Vagin2b916472012-11-22 01:13:58 +0000296 if (!tp->write_seq && likely(!tp->repair))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
Eric Dumazetefe42082013-10-03 15:42:29 -0700298 sk->sk_v6_daddr.s6_addr32,
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000299 inet->inet_sport,
300 inet->inet_dport);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301
302 err = tcp_connect(sk);
303 if (err)
304 goto late_failure;
305
306 return 0;
307
308late_failure:
309 tcp_set_state(sk, TCP_CLOSE);
310 __sk_dst_reset(sk);
311failure:
Eric Dumazetc720c7e82009-10-15 06:30:45 +0000312 inet->inet_dport = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700313 sk->sk_route_caps = 0;
314 return err;
315}
316
Eric Dumazet563d34d2012-07-23 09:48:52 +0200317static void tcp_v6_mtu_reduced(struct sock *sk)
318{
319 struct dst_entry *dst;
320
321 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
322 return;
323
324 dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
325 if (!dst)
326 return;
327
328 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
329 tcp_sync_mss(sk, dst_mtu(dst));
330 tcp_simple_retransmit(sk);
331 }
332}
333
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
Brian Haleyd5fdd6b2009-06-23 04:31:07 -0700335 u8 type, u8 code, int offset, __be32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336{
Weilong Chen4c99aa42013-12-19 18:44:34 +0800337 const struct ipv6hdr *hdr = (const struct ipv6hdr *)skb->data;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -0300338 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 struct ipv6_pinfo *np;
340 struct sock *sk;
341 int err;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900342 struct tcp_sock *tp;
Yuchung Cheng0a672f742014-05-11 20:22:12 -0700343 struct request_sock *fastopen;
344 __u32 seq, snd_una;
Pavel Emelyanovca12a1a2008-07-16 20:28:42 -0700345 struct net *net = dev_net(skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346
Pavel Emelyanovca12a1a2008-07-16 20:28:42 -0700347 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
Pavel Emelyanovd86e0da2008-01-31 05:07:21 -0800348 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
350 if (sk == NULL) {
Denis V. Luneve41b5362008-10-08 10:33:26 -0700351 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
352 ICMP6_MIB_INERRORS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353 return;
354 }
355
356 if (sk->sk_state == TCP_TIME_WAIT) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -0700357 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700358 return;
359 }
360
361 bh_lock_sock(sk);
Eric Dumazet563d34d2012-07-23 09:48:52 +0200362 if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700363 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364
365 if (sk->sk_state == TCP_CLOSE)
366 goto out;
367
Stephen Hemmingere802af92010-04-22 15:24:53 -0700368 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
369 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
370 goto out;
371 }
372
Linus Torvalds1da177e2005-04-16 15:20:36 -0700373 tp = tcp_sk(sk);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900374 seq = ntohl(th->seq);
Yuchung Cheng0a672f742014-05-11 20:22:12 -0700375 /* XXX (TFO) - tp->snd_una should be ISN (tcp_create_openreq_child() */
376 fastopen = tp->fastopen_rsk;
377 snd_una = fastopen ? tcp_rsk(fastopen)->snt_isn : tp->snd_una;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700378 if (sk->sk_state != TCP_LISTEN &&
Yuchung Cheng0a672f742014-05-11 20:22:12 -0700379 !between(seq, snd_una, tp->snd_nxt)) {
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700380 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381 goto out;
382 }
383
384 np = inet6_sk(sk);
385
David S. Millerec18d9a2012-07-12 00:25:15 -0700386 if (type == NDISC_REDIRECT) {
387 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
388
David S. Miller1ed5c482012-07-12 00:41:25 -0700389 if (dst)
David S. Miller6700c272012-07-17 03:29:28 -0700390 dst->ops->redirect(dst, sk, skb);
Christoph Paasch50a75a82013-04-07 04:53:15 +0000391 goto out;
David S. Millerec18d9a2012-07-12 00:25:15 -0700392 }
393
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394 if (type == ICMPV6_PKT_TOOBIG) {
Eric Dumazet0d4f0602013-03-18 07:01:28 +0000395 /* We are not interested in TCP_LISTEN and open_requests
396 * (SYN-ACKs send out by Linux are always <576bytes so
397 * they should go through unfragmented).
398 */
399 if (sk->sk_state == TCP_LISTEN)
400 goto out;
401
Hannes Frederic Sowa93b36cf2013-12-15 03:41:14 +0100402 if (!ip6_sk_accept_pmtu(sk))
403 goto out;
404
Eric Dumazet563d34d2012-07-23 09:48:52 +0200405 tp->mtu_info = ntohl(info);
406 if (!sock_owned_by_user(sk))
407 tcp_v6_mtu_reduced(sk);
Julian Anastasovd013ef2a2012-09-05 10:53:18 +0000408 else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
409 &tp->tsq_flags))
410 sock_hold(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700411 goto out;
412 }
413
414 icmpv6_err_convert(type, code, &err);
415
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700416 /* Might be for an request_sock */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 switch (sk->sk_state) {
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700418 struct request_sock *req, **prev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700419 case TCP_LISTEN:
420 if (sock_owned_by_user(sk))
421 goto out;
422
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -0800423 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
424 &hdr->saddr, inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700425 if (!req)
426 goto out;
427
428 /* ICMPs are not backlogged, hence we cannot get
429 * an established socket here.
430 */
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700431 WARN_ON(req->sk != NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -0700433 if (seq != tcp_rsk(req)->snt_isn) {
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700434 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435 goto out;
436 }
437
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -0700438 inet_csk_reqsk_queue_drop(sk, req, prev);
Vijay Subramanian5f1e9422013-01-31 08:24:19 +0000439 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700440 goto out;
441
442 case TCP_SYN_SENT:
Yuchung Cheng0a672f742014-05-11 20:22:12 -0700443 case TCP_SYN_RECV:
444 /* Only in fast or simultaneous open. If a fast open socket is
445 * is already accepted it is treated as a connected one below.
446 */
447 if (fastopen && fastopen->sk == NULL)
448 break;
449
Linus Torvalds1da177e2005-04-16 15:20:36 -0700450 if (!sock_owned_by_user(sk)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700451 sk->sk_err = err;
452 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
453
454 tcp_done(sk);
455 } else
456 sk->sk_err_soft = err;
457 goto out;
458 }
459
460 if (!sock_owned_by_user(sk) && np->recverr) {
461 sk->sk_err = err;
462 sk->sk_error_report(sk);
463 } else
464 sk->sk_err_soft = err;
465
466out:
467 bh_unlock_sock(sk);
468 sock_put(sk);
469}
470
471
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000472static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
473 struct flowi6 *fl6,
Neal Cardwell3840a062012-06-28 12:34:19 +0000474 struct request_sock *req,
Eric Dumazetfff32692012-06-01 01:47:50 +0000475 u16 queue_mapping)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700476{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700477 struct inet_request_sock *ireq = inet_rsk(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700478 struct ipv6_pinfo *np = inet6_sk(sk);
Weilong Chen4c99aa42013-12-19 18:44:34 +0800479 struct sk_buff *skb;
Neal Cardwell94942182012-06-28 12:34:20 +0000480 int err = -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000482 /* First, grab a route. */
483 if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
Denis V. Lunevfd80eb92008-02-29 11:43:03 -0800484 goto done;
Neal Cardwell94942182012-06-28 12:34:20 +0000485
Christoph Paasch1a2c6182013-03-17 08:23:34 +0000486 skb = tcp_make_synack(sk, dst, req, NULL);
Neal Cardwell94942182012-06-28 12:34:20 +0000487
Linus Torvalds1da177e2005-04-16 15:20:36 -0700488 if (skb) {
Eric Dumazet634fb9792013-10-09 15:21:29 -0700489 __tcp_v6_send_check(skb, &ireq->ir_v6_loc_addr,
490 &ireq->ir_v6_rmt_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700491
Eric Dumazet634fb9792013-10-09 15:21:29 -0700492 fl6->daddr = ireq->ir_v6_rmt_addr;
Florent Fourcotdf3687f2014-01-17 17:15:03 +0100493 if (np->repflow && (ireq->pktopts != NULL))
494 fl6->flowlabel = ip6_flowlabel(ipv6_hdr(ireq->pktopts));
495
Eric Dumazetfff32692012-06-01 01:47:50 +0000496 skb_set_queue_mapping(skb, queue_mapping);
RongQing.Li43264e02012-07-01 17:18:59 +0000497 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
Gerrit Renkerb9df3cb2006-11-14 11:21:36 -0200498 err = net_xmit_eval(err);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499 }
500
501done:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700502 return err;
503}
504
Christoph Paasch1a2c6182013-03-17 08:23:34 +0000505static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req)
Octavian Purdila72659ec2010-01-17 19:09:39 -0800506{
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000507 struct flowi6 fl6;
Eric Dumazete6c022a2012-10-27 23:16:46 +0000508 int res;
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000509
Christoph Paasch1a2c6182013-03-17 08:23:34 +0000510 res = tcp_v6_send_synack(sk, NULL, &fl6, req, 0);
Yuchung Chengf19c29e2014-03-03 12:31:36 -0800511 if (!res) {
Eric Dumazete6c022a2012-10-27 23:16:46 +0000512 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
Yuchung Chengf19c29e2014-03-03 12:31:36 -0800513 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPSYNRETRANS);
514 }
Eric Dumazete6c022a2012-10-27 23:16:46 +0000515 return res;
Octavian Purdila72659ec2010-01-17 19:09:39 -0800516}
517
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700518static void tcp_v6_reqsk_destructor(struct request_sock *req)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700519{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700520 kfree_skb(inet_rsk(req)->pktopts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521}
522
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800523#ifdef CONFIG_TCP_MD5SIG
524static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000525 const struct in6_addr *addr)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800526{
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000527 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800528}
529
530static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
531 struct sock *addr_sk)
532{
Eric Dumazetefe42082013-10-03 15:42:29 -0700533 return tcp_v6_md5_do_lookup(sk, &addr_sk->sk_v6_daddr);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800534}
535
536static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
537 struct request_sock *req)
538{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700539 return tcp_v6_md5_do_lookup(sk, &inet_rsk(req)->ir_v6_rmt_addr);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800540}
541
Wang Yufen4aa956d2014-03-29 09:27:29 +0800542static int tcp_v6_parse_md5_keys(struct sock *sk, char __user *optval,
543 int optlen)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800544{
545 struct tcp_md5sig cmd;
546 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800547
548 if (optlen < sizeof(cmd))
549 return -EINVAL;
550
551 if (copy_from_user(&cmd, optval, sizeof(cmd)))
552 return -EFAULT;
553
554 if (sin6->sin6_family != AF_INET6)
555 return -EINVAL;
556
557 if (!cmd.tcpm_keylen) {
Brian Haleye773e4f2007-08-24 23:16:08 -0700558 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000559 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
560 AF_INET);
561 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
562 AF_INET6);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800563 }
564
565 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
566 return -EINVAL;
567
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000568 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
569 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
570 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800571
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000572 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
573 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800574}
575
Adam Langley49a72df2008-07-19 00:01:42 -0700576static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000577 const struct in6_addr *daddr,
578 const struct in6_addr *saddr, int nbytes)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800579{
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800580 struct tcp6_pseudohdr *bp;
Adam Langley49a72df2008-07-19 00:01:42 -0700581 struct scatterlist sg;
YOSHIFUJI Hideaki8d26d762008-04-17 13:19:16 +0900582
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800583 bp = &hp->md5_blk.ip6;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800584 /* 1. TCP pseudo-header (RFC2460) */
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000585 bp->saddr = *saddr;
586 bp->daddr = *daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700587 bp->protocol = cpu_to_be32(IPPROTO_TCP);
Adam Langley00b13042008-07-31 21:36:07 -0700588 bp->len = cpu_to_be32(nbytes);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800589
Adam Langley49a72df2008-07-19 00:01:42 -0700590 sg_init_one(&sg, bp, sizeof(*bp));
591 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
592}
David S. Millerc7da57a2007-10-26 00:41:21 -0700593
Adam Langley49a72df2008-07-19 00:01:42 -0700594static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000595 const struct in6_addr *daddr, struct in6_addr *saddr,
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400596 const struct tcphdr *th)
Adam Langley49a72df2008-07-19 00:01:42 -0700597{
598 struct tcp_md5sig_pool *hp;
599 struct hash_desc *desc;
600
601 hp = tcp_get_md5sig_pool();
602 if (!hp)
603 goto clear_hash_noput;
604 desc = &hp->md5_desc;
605
606 if (crypto_hash_init(desc))
607 goto clear_hash;
608 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
609 goto clear_hash;
610 if (tcp_md5_hash_header(hp, th))
611 goto clear_hash;
612 if (tcp_md5_hash_key(hp, key))
613 goto clear_hash;
614 if (crypto_hash_final(desc, md5_hash))
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800615 goto clear_hash;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800616
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800617 tcp_put_md5sig_pool();
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800618 return 0;
Adam Langley49a72df2008-07-19 00:01:42 -0700619
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800620clear_hash:
621 tcp_put_md5sig_pool();
622clear_hash_noput:
623 memset(md5_hash, 0, 16);
Adam Langley49a72df2008-07-19 00:01:42 -0700624 return 1;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800625}
626
Adam Langley49a72df2008-07-19 00:01:42 -0700627static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400628 const struct sock *sk,
629 const struct request_sock *req,
630 const struct sk_buff *skb)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800631{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000632 const struct in6_addr *saddr, *daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700633 struct tcp_md5sig_pool *hp;
634 struct hash_desc *desc;
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400635 const struct tcphdr *th = tcp_hdr(skb);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800636
637 if (sk) {
638 saddr = &inet6_sk(sk)->saddr;
Eric Dumazetefe42082013-10-03 15:42:29 -0700639 daddr = &sk->sk_v6_daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700640 } else if (req) {
Eric Dumazet634fb9792013-10-09 15:21:29 -0700641 saddr = &inet_rsk(req)->ir_v6_loc_addr;
642 daddr = &inet_rsk(req)->ir_v6_rmt_addr;
Adam Langley49a72df2008-07-19 00:01:42 -0700643 } else {
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000644 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
Adam Langley49a72df2008-07-19 00:01:42 -0700645 saddr = &ip6h->saddr;
646 daddr = &ip6h->daddr;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800647 }
Adam Langley49a72df2008-07-19 00:01:42 -0700648
649 hp = tcp_get_md5sig_pool();
650 if (!hp)
651 goto clear_hash_noput;
652 desc = &hp->md5_desc;
653
654 if (crypto_hash_init(desc))
655 goto clear_hash;
656
657 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
658 goto clear_hash;
659 if (tcp_md5_hash_header(hp, th))
660 goto clear_hash;
661 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
662 goto clear_hash;
663 if (tcp_md5_hash_key(hp, key))
664 goto clear_hash;
665 if (crypto_hash_final(desc, md5_hash))
666 goto clear_hash;
667
668 tcp_put_md5sig_pool();
669 return 0;
670
671clear_hash:
672 tcp_put_md5sig_pool();
673clear_hash_noput:
674 memset(md5_hash, 0, 16);
675 return 1;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800676}
677
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400678static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800679{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400680 const __u8 *hash_location = NULL;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800681 struct tcp_md5sig_key *hash_expected;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000682 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400683 const struct tcphdr *th = tcp_hdr(skb);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800684 int genhash;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800685 u8 newhash[16];
686
687 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
YOSHIFUJI Hideaki7d5d5522008-04-17 12:29:53 +0900688 hash_location = tcp_parse_md5sig_option(th);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800689
David S. Miller785957d2008-07-30 03:03:15 -0700690 /* We've parsed the options - do we have a hash? */
691 if (!hash_expected && !hash_location)
692 return 0;
693
694 if (hash_expected && !hash_location) {
695 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800696 return 1;
697 }
698
David S. Miller785957d2008-07-30 03:03:15 -0700699 if (!hash_expected && hash_location) {
700 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800701 return 1;
702 }
703
704 /* check the signature */
Adam Langley49a72df2008-07-19 00:01:42 -0700705 genhash = tcp_v6_md5_hash_skb(newhash,
706 hash_expected,
707 NULL, NULL, skb);
708
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800709 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
Joe Perchese87cc472012-05-13 21:56:26 +0000710 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
711 genhash ? "failed" : "mismatch",
712 &ip6h->saddr, ntohs(th->source),
713 &ip6h->daddr, ntohs(th->dest));
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800714 return 1;
715 }
716 return 0;
717}
718#endif
719
Glenn Griffinc6aefaf2008-02-07 21:49:26 -0800720struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700721 .family = AF_INET6,
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -0700722 .obj_size = sizeof(struct tcp6_request_sock),
Octavian Purdila72659ec2010-01-17 19:09:39 -0800723 .rtx_syn_ack = tcp_v6_rtx_synack,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700724 .send_ack = tcp_v6_reqsk_send_ack,
725 .destructor = tcp_v6_reqsk_destructor,
Octavian Purdila72659ec2010-01-17 19:09:39 -0800726 .send_reset = tcp_v6_send_reset,
Wang Yufen4aa956d2014-03-29 09:27:29 +0800727 .syn_ack_timeout = tcp_syn_ack_timeout,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700728};
729
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800730#ifdef CONFIG_TCP_MD5SIG
Stephen Hemmingerb2e4b3de2009-09-01 19:25:03 +0000731static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800732 .md5_lookup = tcp_v6_reqsk_md5_lookup,
John Dykstrae3afe7b2009-07-16 05:04:51 +0000733 .calc_md5_hash = tcp_v6_md5_hash_skb,
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800734};
Andrew Mortonb6332e62006-11-30 19:16:28 -0800735#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800736
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700737static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
Wang Yufen9c76a112014-03-29 09:27:31 +0800738 u32 tsval, u32 tsecr, int oif,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100739 struct tcp_md5sig_key *key, int rst, u8 tclass,
740 u32 label)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400742 const struct tcphdr *th = tcp_hdr(skb);
743 struct tcphdr *t1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700744 struct sk_buff *buff;
David S. Miller4c9483b2011-03-12 16:22:43 -0500745 struct flowi6 fl6;
Eric Dumazetadf30902009-06-02 05:19:30 +0000746 struct net *net = dev_net(skb_dst(skb)->dev);
Daniel Lezcanoe5047992008-03-07 11:16:26 -0800747 struct sock *ctl_sk = net->ipv6.tcp_sk;
YOSHIFUJI Hideaki9cb5734e2008-01-12 02:16:03 -0800748 unsigned int tot_len = sizeof(struct tcphdr);
Eric Dumazetadf30902009-06-02 05:19:30 +0000749 struct dst_entry *dst;
Al Viroe69a4adc2006-11-14 20:56:00 -0800750 __be32 *topt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751
Andrey Vaginee684b62013-02-11 05:50:19 +0000752 if (tsecr)
YOSHIFUJI Hideaki4244f8a2006-10-10 19:40:50 -0700753 tot_len += TCPOLEN_TSTAMP_ALIGNED;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800754#ifdef CONFIG_TCP_MD5SIG
755 if (key)
756 tot_len += TCPOLEN_MD5SIG_ALIGNED;
757#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758
759 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
760 GFP_ATOMIC);
761 if (buff == NULL)
762 return;
763
764 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
765
Ilpo Järvinen77c676d2008-10-09 14:41:38 -0700766 t1 = (struct tcphdr *) skb_push(buff, tot_len);
Herbert Xu6651ffc2010-04-21 00:47:15 -0700767 skb_reset_transport_header(buff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768
769 /* Swap the send and the receive. */
770 memset(t1, 0, sizeof(*t1));
771 t1->dest = th->source;
772 t1->source = th->dest;
Ilpo Järvinen77c676d2008-10-09 14:41:38 -0700773 t1->doff = tot_len / 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700774 t1->seq = htonl(seq);
775 t1->ack_seq = htonl(ack);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700776 t1->ack = !rst || !th->ack;
777 t1->rst = rst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700778 t1->window = htons(win);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800779
Al Viroe69a4adc2006-11-14 20:56:00 -0800780 topt = (__be32 *)(t1 + 1);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900781
Andrey Vaginee684b62013-02-11 05:50:19 +0000782 if (tsecr) {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800783 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
784 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
Andrey Vaginee684b62013-02-11 05:50:19 +0000785 *topt++ = htonl(tsval);
786 *topt++ = htonl(tsecr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700787 }
788
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800789#ifdef CONFIG_TCP_MD5SIG
790 if (key) {
791 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
792 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
Adam Langley49a72df2008-07-19 00:01:42 -0700793 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
Adam Langley90b7e112008-07-31 20:49:48 -0700794 &ipv6_hdr(skb)->saddr,
795 &ipv6_hdr(skb)->daddr, t1);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800796 }
797#endif
798
David S. Miller4c9483b2011-03-12 16:22:43 -0500799 memset(&fl6, 0, sizeof(fl6));
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000800 fl6.daddr = ipv6_hdr(skb)->saddr;
801 fl6.saddr = ipv6_hdr(skb)->daddr;
Florent Fourcot1d13a962014-01-16 17:21:22 +0100802 fl6.flowlabel = label;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700803
David S. Millere5700af2010-04-21 14:59:20 -0700804 buff->ip_summed = CHECKSUM_PARTIAL;
805 buff->csum = 0;
806
David S. Miller4c9483b2011-03-12 16:22:43 -0500807 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700808
David S. Miller4c9483b2011-03-12 16:22:43 -0500809 fl6.flowi6_proto = IPPROTO_TCP;
Lorenzo Colittia36dbdb2014-04-11 13:19:12 +0900810 if (rt6_need_strict(&fl6.daddr) && !oif)
Alexey Kuznetsov4c675252012-10-12 04:34:17 +0000811 fl6.flowi6_oif = inet6_iif(skb);
Wang Yufen9c76a112014-03-29 09:27:31 +0800812 else
813 fl6.flowi6_oif = oif;
David S. Miller1958b852011-03-12 16:36:19 -0500814 fl6.fl6_dport = t1->dest;
815 fl6.fl6_sport = t1->source;
David S. Miller4c9483b2011-03-12 16:22:43 -0500816 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700818 /* Pass a socket to ip6_dst_lookup either it is for RST
819 * Underlying function will use this to retrieve the network
820 * namespace
821 */
Steffen Klassert0e0d44a2013-08-28 08:04:14 +0200822 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800823 if (!IS_ERR(dst)) {
824 skb_dst_set(buff, dst);
Eric Dumazetb903d322011-10-27 00:44:35 -0400825 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800826 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
827 if (rst)
828 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
829 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700830 }
831
832 kfree_skb(buff);
833}
834
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700835static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
836{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400837 const struct tcphdr *th = tcp_hdr(skb);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700838 u32 seq = 0, ack_seq = 0;
Guo-Fu Tsengfa3e5b42008-10-09 21:11:56 -0700839 struct tcp_md5sig_key *key = NULL;
Shawn Lu658ddaa2012-01-31 22:35:48 +0000840#ifdef CONFIG_TCP_MD5SIG
841 const __u8 *hash_location = NULL;
842 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
843 unsigned char newhash[16];
844 int genhash;
845 struct sock *sk1 = NULL;
846#endif
Wang Yufen9c76a112014-03-29 09:27:31 +0800847 int oif;
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700848
849 if (th->rst)
850 return;
851
852 if (!ipv6_unicast_destination(skb))
853 return;
854
855#ifdef CONFIG_TCP_MD5SIG
Shawn Lu658ddaa2012-01-31 22:35:48 +0000856 hash_location = tcp_parse_md5sig_option(th);
857 if (!sk && hash_location) {
858 /*
859 * active side is lost. Try to find listening socket through
860 * source port, and then find md5 key through listening socket.
861 * we are not loose security here:
862 * Incoming packet is checked with md5 hash with finding key,
863 * no RST generated if md5 hash doesn't match.
864 */
865 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
Tom Herbert5ba24952013-01-22 09:50:39 +0000866 &tcp_hashinfo, &ipv6h->saddr,
867 th->source, &ipv6h->daddr,
Shawn Lu658ddaa2012-01-31 22:35:48 +0000868 ntohs(th->source), inet6_iif(skb));
869 if (!sk1)
870 return;
871
872 rcu_read_lock();
873 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
874 if (!key)
875 goto release_sk1;
876
877 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
878 if (genhash || memcmp(hash_location, newhash, 16) != 0)
879 goto release_sk1;
880 } else {
881 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
882 }
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700883#endif
884
885 if (th->ack)
886 seq = ntohl(th->ack_seq);
887 else
888 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
889 (th->doff << 2);
890
Wang Yufen9c76a112014-03-29 09:27:31 +0800891 oif = sk ? sk->sk_bound_dev_if : 0;
892 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, oif, key, 1, 0, 0);
Shawn Lu658ddaa2012-01-31 22:35:48 +0000893
894#ifdef CONFIG_TCP_MD5SIG
895release_sk1:
896 if (sk1) {
897 rcu_read_unlock();
898 sock_put(sk1);
899 }
900#endif
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700901}
902
Andrey Vaginee684b62013-02-11 05:50:19 +0000903static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
Wang Yufen9c76a112014-03-29 09:27:31 +0800904 u32 win, u32 tsval, u32 tsecr, int oif,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100905 struct tcp_md5sig_key *key, u8 tclass,
906 u32 label)
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700907{
Wang Yufen9c76a112014-03-29 09:27:31 +0800908 tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, oif, key, 0, tclass,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100909 label);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700910}
911
Linus Torvalds1da177e2005-04-16 15:20:36 -0700912static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
913{
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700914 struct inet_timewait_sock *tw = inet_twsk(sk);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800915 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700916
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +0900917 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700918 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
Andrey Vaginee684b62013-02-11 05:50:19 +0000919 tcp_time_stamp + tcptw->tw_ts_offset,
Wang Yufen9c76a112014-03-29 09:27:31 +0800920 tcptw->tw_ts_recent, tw->tw_bound_dev_if, tcp_twsk_md5_key(tcptw),
Florent Fourcot1d13a962014-01-16 17:21:22 +0100921 tw->tw_tclass, (tw->tw_flowlabel << 12));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700922
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700923 inet_twsk_put(tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700924}
925
Gui Jianfeng6edafaa2008-08-06 23:50:04 -0700926static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
927 struct request_sock *req)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700928{
Andrey Vaginee684b62013-02-11 05:50:19 +0000929 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1,
Wang Yufen9c76a112014-03-29 09:27:31 +0800930 req->rcv_wnd, tcp_time_stamp, req->ts_recent, sk->sk_bound_dev_if,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100931 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr),
932 0, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700933}
934
935
Weilong Chen4c99aa42013-12-19 18:44:34 +0800936static struct sock *tcp_v6_hnd_req(struct sock *sk, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700937{
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700938 struct request_sock *req, **prev;
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700939 const struct tcphdr *th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700940 struct sock *nsk;
941
942 /* Find possible connection requests. */
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -0800943 req = inet6_csk_search_req(sk, &prev, th->source,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700944 &ipv6_hdr(skb)->saddr,
945 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700946 if (req)
Jerry Chu83368862012-08-31 12:29:12 +0000947 return tcp_check_req(sk, skb, req, prev, false);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700948
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900949 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
Pavel Emelyanovd86e0da2008-01-31 05:07:21 -0800950 &ipv6_hdr(skb)->saddr, th->source,
951 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700952
953 if (nsk) {
954 if (nsk->sk_state != TCP_TIME_WAIT) {
955 bh_lock_sock(nsk);
956 return nsk;
957 }
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -0700958 inet_twsk_put(inet_twsk(nsk));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700959 return NULL;
960 }
961
Glenn Griffinc6aefaf2008-02-07 21:49:26 -0800962#ifdef CONFIG_SYN_COOKIES
Florian Westphalaf9b4732010-06-03 00:43:44 +0000963 if (!th->syn)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -0800964 sk = cookie_v6_check(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700965#endif
966 return sk;
967}
968
Linus Torvalds1da177e2005-04-16 15:20:36 -0700969/* FIXME: this is substantially similar to the ipv4 code.
970 * Can some kind of merge be done? -- erics
971 */
972static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
973{
William Allen Simpsone6b4d112009-12-02 18:07:39 +0000974 struct tcp_options_received tmp_opt;
975 struct request_sock *req;
Eric Dumazet634fb9792013-10-09 15:21:29 -0700976 struct inet_request_sock *ireq;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700977 struct ipv6_pinfo *np = inet6_sk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700978 struct tcp_sock *tp = tcp_sk(sk);
William Allen Simpsone6b4d112009-12-02 18:07:39 +0000979 __u32 isn = TCP_SKB_CB(skb)->when;
David S. Miller493f3772010-12-02 12:14:29 -0800980 struct dst_entry *dst = NULL;
Neal Cardwell3840a062012-06-28 12:34:19 +0000981 struct flowi6 fl6;
Eric Dumazeta2a385d2012-05-16 23:15:34 +0000982 bool want_cookie = false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700983
984 if (skb->protocol == htons(ETH_P_IP))
985 return tcp_v4_conn_request(sk, skb);
986
987 if (!ipv6_unicast_destination(skb))
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900988 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700989
Hannes Frederic Sowa5ad37d52013-07-26 17:43:23 +0200990 if ((sysctl_tcp_syncookies == 2 ||
991 inet_csk_reqsk_queue_is_full(sk)) && !isn) {
Eric Dumazet946cedc2011-08-30 03:21:44 +0000992 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
993 if (!want_cookie)
994 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700995 }
996
Vijay Subramanian5f1e9422013-01-31 08:24:19 +0000997 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
998 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700999 goto drop;
Vijay Subramanian5f1e9422013-01-31 08:24:19 +00001000 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001001
Arnaldo Carvalho de Meloca304b62005-12-13 23:15:40 -08001002 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001003 if (req == NULL)
1004 goto drop;
1005
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001006#ifdef CONFIG_TCP_MD5SIG
1007 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1008#endif
1009
Linus Torvalds1da177e2005-04-16 15:20:36 -07001010 tcp_clear_options(&tmp_opt);
1011 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1012 tmp_opt.user_mss = tp->rx_opt.user_mss;
Christoph Paasch1a2c6182013-03-17 08:23:34 +00001013 tcp_parse_options(skb, &tmp_opt, 0, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001014
Florian Westphal4dfc2812008-04-10 03:12:40 -07001015 if (want_cookie && !tmp_opt.saw_tstamp)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001016 tcp_clear_options(&tmp_opt);
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001017
Linus Torvalds1da177e2005-04-16 15:20:36 -07001018 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1019 tcp_openreq_init(req, &tmp_opt, skb);
1020
Eric Dumazet634fb9792013-10-09 15:21:29 -07001021 ireq = inet_rsk(req);
1022 ireq->ir_v6_rmt_addr = ipv6_hdr(skb)->saddr;
1023 ireq->ir_v6_loc_addr = ipv6_hdr(skb)->daddr;
Florian Westphal172d69e2010-06-21 11:48:45 +00001024 if (!want_cookie || tmp_opt.tstamp_ok)
Hannes Frederic Sowa5d134f12013-01-05 16:10:48 +00001025 TCP_ECN_create_request(req, skb, sock_net(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001026
Eric Dumazet634fb9792013-10-09 15:21:29 -07001027 ireq->ir_iif = sk->sk_bound_dev_if;
Eric Dumazet4d0fe502011-11-23 17:29:23 -05001028
1029 /* So that link locals have meaning */
1030 if (!sk->sk_bound_dev_if &&
Eric Dumazet634fb9792013-10-09 15:21:29 -07001031 ipv6_addr_type(&ireq->ir_v6_rmt_addr) & IPV6_ADDR_LINKLOCAL)
1032 ireq->ir_iif = inet6_iif(skb);
Eric Dumazet4d0fe502011-11-23 17:29:23 -05001033
Florian Westphal2bbdf382010-06-13 11:29:39 +00001034 if (!isn) {
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001035 if (ipv6_opt_accepted(sk, skb) ||
1036 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001037 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim ||
1038 np->repflow) {
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001039 atomic_inc(&skb->users);
Eric Dumazet634fb9792013-10-09 15:21:29 -07001040 ireq->pktopts = skb;
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001041 }
David S. Miller493f3772010-12-02 12:14:29 -08001042
1043 if (want_cookie) {
Florian Westphal2bbdf382010-06-13 11:29:39 +00001044 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1045 req->cookie_ts = tmp_opt.tstamp_ok;
David S. Miller493f3772010-12-02 12:14:29 -08001046 goto have_isn;
Florian Westphal2bbdf382010-06-13 11:29:39 +00001047 }
David S. Miller493f3772010-12-02 12:14:29 -08001048
1049 /* VJ's idea. We save last timestamp seen
1050 * from the destination in peer table, when entering
1051 * state TIME-WAIT, and check against it before
1052 * accepting new connection request.
1053 *
1054 * If "isn" is not zero, this request hit alive
1055 * timewait bucket, so that all the necessary checks
1056 * are made in the function processing timewait state.
1057 */
1058 if (tmp_opt.saw_tstamp &&
1059 tcp_death_row.sysctl_tw_recycle &&
David S. Miller81166dd2012-07-10 03:14:24 -07001060 (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1061 if (!tcp_peer_is_proven(req, dst, true)) {
David S. Miller493f3772010-12-02 12:14:29 -08001062 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1063 goto drop_and_release;
1064 }
1065 }
1066 /* Kill the following clause, if you dislike this way. */
1067 else if (!sysctl_tcp_syncookies &&
1068 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1069 (sysctl_max_syn_backlog >> 2)) &&
David S. Miller81166dd2012-07-10 03:14:24 -07001070 !tcp_peer_is_proven(req, dst, false)) {
David S. Miller493f3772010-12-02 12:14:29 -08001071 /* Without syncookies last quarter of
1072 * backlog is filled with destinations,
1073 * proven to be alive.
1074 * It means that we continue to communicate
1075 * to destinations, already remembered
1076 * to the moment of synflood.
1077 */
1078 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
Eric Dumazet634fb9792013-10-09 15:21:29 -07001079 &ireq->ir_v6_rmt_addr, ntohs(tcp_hdr(skb)->source));
David S. Miller493f3772010-12-02 12:14:29 -08001080 goto drop_and_release;
1081 }
1082
1083 isn = tcp_v6_init_sequence(skb);
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001084 }
David S. Miller493f3772010-12-02 12:14:29 -08001085have_isn:
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -07001086 tcp_rsk(req)->snt_isn = isn;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001087
Neal Cardwell437c5b52012-06-23 19:22:00 +00001088 if (security_inet_conn_request(sk, skb, req))
1089 goto drop_and_release;
Venkat Yekkirala4237c752006-07-24 23:32:50 -07001090
Neal Cardwell9f10d3f2012-06-28 12:34:21 +00001091 if (tcp_v6_send_synack(sk, dst, &fl6, req,
Eric Dumazetfff32692012-06-01 01:47:50 +00001092 skb_get_queue_mapping(skb)) ||
William Allen Simpson4957faade2009-12-02 18:25:27 +00001093 want_cookie)
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001094 goto drop_and_free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001095
Neal Cardwell016818d2012-09-22 04:18:55 +00001096 tcp_rsk(req)->snt_synack = tcp_time_stamp;
Jerry Chu83368862012-08-31 12:29:12 +00001097 tcp_rsk(req)->listener = NULL;
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001098 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1099 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001100
David S. Miller493f3772010-12-02 12:14:29 -08001101drop_and_release:
1102 dst_release(dst);
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001103drop_and_free:
1104 reqsk_free(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001105drop:
Vijay Subramanian5f1e9422013-01-31 08:24:19 +00001106 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001107 return 0; /* don't send reset */
1108}
1109
Weilong Chen4c99aa42013-12-19 18:44:34 +08001110static struct sock *tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1111 struct request_sock *req,
1112 struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001113{
Eric Dumazet634fb9792013-10-09 15:21:29 -07001114 struct inet_request_sock *ireq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001115 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1116 struct tcp6_sock *newtcp6sk;
1117 struct inet_sock *newinet;
1118 struct tcp_sock *newtp;
1119 struct sock *newsk;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001120#ifdef CONFIG_TCP_MD5SIG
1121 struct tcp_md5sig_key *key;
1122#endif
Neal Cardwell3840a062012-06-28 12:34:19 +00001123 struct flowi6 fl6;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001124
1125 if (skb->protocol == htons(ETH_P_IP)) {
1126 /*
1127 * v6 mapped
1128 */
1129
1130 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1131
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001132 if (newsk == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001133 return NULL;
1134
1135 newtcp6sk = (struct tcp6_sock *)newsk;
1136 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1137
1138 newinet = inet_sk(newsk);
1139 newnp = inet6_sk(newsk);
1140 newtp = tcp_sk(newsk);
1141
1142 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1143
Eric Dumazetefe42082013-10-03 15:42:29 -07001144 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newsk->sk_v6_daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001145
Eric Dumazetc720c7e82009-10-15 06:30:45 +00001146 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001147
Eric Dumazetefe42082013-10-03 15:42:29 -07001148 newsk->sk_v6_rcv_saddr = newnp->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001149
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001150 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001151 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001152#ifdef CONFIG_TCP_MD5SIG
1153 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1154#endif
1155
Yan, Zheng676a1182011-09-25 02:21:30 +00001156 newnp->ipv6_ac_list = NULL;
1157 newnp->ipv6_fl_list = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001158 newnp->pktoptions = NULL;
1159 newnp->opt = NULL;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001160 newnp->mcast_oif = inet6_iif(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001161 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
Florent Fourcot1397ed32013-12-08 15:46:57 +01001162 newnp->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001163 if (np->repflow)
1164 newnp->flow_label = ip6_flowlabel(ipv6_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001165
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -07001166 /*
1167 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1168 * here, tcp_create_openreq_child now does this for us, see the comment in
1169 * that function for the gory details. -acme
Linus Torvalds1da177e2005-04-16 15:20:36 -07001170 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001171
1172 /* It is tricky place. Until this moment IPv4 tcp
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001173 worked with IPv6 icsk.icsk_af_ops.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001174 Sync it now.
1175 */
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001176 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001177
1178 return newsk;
1179 }
1180
Eric Dumazet634fb9792013-10-09 15:21:29 -07001181 ireq = inet_rsk(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001182
1183 if (sk_acceptq_is_full(sk))
1184 goto out_overflow;
1185
David S. Miller493f3772010-12-02 12:14:29 -08001186 if (!dst) {
Neal Cardwell3840a062012-06-28 12:34:19 +00001187 dst = inet6_csk_route_req(sk, &fl6, req);
David S. Miller493f3772010-12-02 12:14:29 -08001188 if (!dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001189 goto out;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001190 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001191
1192 newsk = tcp_create_openreq_child(sk, req, skb);
1193 if (newsk == NULL)
Balazs Scheidler093d2822010-10-21 13:06:43 +02001194 goto out_nonewsk;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001195
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -07001196 /*
1197 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1198 * count here, tcp_create_openreq_child now does this for us, see the
1199 * comment in that function for the gory details. -acme
1200 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201
Stephen Hemminger59eed272006-08-25 15:55:43 -07001202 newsk->sk_gso_type = SKB_GSO_TCPV6;
YOSHIFUJI Hideaki8e1ef0a2006-08-29 17:15:09 -07001203 __ip6_dst_store(newsk, dst, NULL, NULL);
Neal Cardwellfae6ef82012-08-19 03:30:38 +00001204 inet6_sk_rx_dst_set(newsk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001205
1206 newtcp6sk = (struct tcp6_sock *)newsk;
1207 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1208
1209 newtp = tcp_sk(newsk);
1210 newinet = inet_sk(newsk);
1211 newnp = inet6_sk(newsk);
1212
1213 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1214
Eric Dumazet634fb9792013-10-09 15:21:29 -07001215 newsk->sk_v6_daddr = ireq->ir_v6_rmt_addr;
1216 newnp->saddr = ireq->ir_v6_loc_addr;
1217 newsk->sk_v6_rcv_saddr = ireq->ir_v6_loc_addr;
1218 newsk->sk_bound_dev_if = ireq->ir_iif;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001219
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001220 /* Now IPv6 options...
Linus Torvalds1da177e2005-04-16 15:20:36 -07001221
1222 First: no IPv4 options.
1223 */
Eric Dumazetf6d8bd02011-04-21 09:45:37 +00001224 newinet->inet_opt = NULL;
Yan, Zheng676a1182011-09-25 02:21:30 +00001225 newnp->ipv6_ac_list = NULL;
Masayuki Nakagawad35690b2007-03-16 16:14:03 -07001226 newnp->ipv6_fl_list = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227
1228 /* Clone RX bits */
1229 newnp->rxopt.all = np->rxopt.all;
1230
1231 /* Clone pktoptions received with SYN */
1232 newnp->pktoptions = NULL;
Eric Dumazet634fb9792013-10-09 15:21:29 -07001233 if (ireq->pktopts != NULL) {
1234 newnp->pktoptions = skb_clone(ireq->pktopts,
Mel Gorman99a1dec2012-07-31 16:44:14 -07001235 sk_gfp_atomic(sk, GFP_ATOMIC));
Eric Dumazet634fb9792013-10-09 15:21:29 -07001236 consume_skb(ireq->pktopts);
1237 ireq->pktopts = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001238 if (newnp->pktoptions)
1239 skb_set_owner_r(newnp->pktoptions, newsk);
1240 }
1241 newnp->opt = NULL;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001242 newnp->mcast_oif = inet6_iif(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001243 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
Florent Fourcot1397ed32013-12-08 15:46:57 +01001244 newnp->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001245 if (np->repflow)
1246 newnp->flow_label = ip6_flowlabel(ipv6_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001247
1248 /* Clone native IPv6 options from listening socket (if any)
1249
1250 Yes, keeping reference count would be much more clever,
1251 but we make one more one thing there: reattach optmem
1252 to newsk.
1253 */
RongQing.Li43264e02012-07-01 17:18:59 +00001254 if (np->opt)
1255 newnp->opt = ipv6_dup_options(newsk, np->opt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001256
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001257 inet_csk(newsk)->icsk_ext_hdr_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001258 if (newnp->opt)
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001259 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1260 newnp->opt->opt_flen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001261
1262 tcp_sync_mss(newsk, dst_mtu(dst));
David S. Miller0dbaee32010-12-13 12:52:14 -08001263 newtp->advmss = dst_metric_advmss(dst);
Neal Cardwelld135c522012-04-22 09:45:47 +00001264 if (tcp_sk(sk)->rx_opt.user_mss &&
1265 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1266 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1267
Linus Torvalds1da177e2005-04-16 15:20:36 -07001268 tcp_initialize_rcv_mss(newsk);
1269
Eric Dumazetc720c7e82009-10-15 06:30:45 +00001270 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1271 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001272
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001273#ifdef CONFIG_TCP_MD5SIG
1274 /* Copy over the MD5 key from the original socket */
Wang Yufen4aa956d2014-03-29 09:27:29 +08001275 key = tcp_v6_md5_do_lookup(sk, &newsk->sk_v6_daddr);
1276 if (key != NULL) {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001277 /* We're using one, so create a matching key
1278 * on the newsk structure. If we fail to get
1279 * memory, then we end up not copying the key
1280 * across. Shucks.
1281 */
Eric Dumazetefe42082013-10-03 15:42:29 -07001282 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newsk->sk_v6_daddr,
Mel Gorman99a1dec2012-07-31 16:44:14 -07001283 AF_INET6, key->key, key->keylen,
1284 sk_gfp_atomic(sk, GFP_ATOMIC));
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001285 }
1286#endif
1287
Balazs Scheidler093d2822010-10-21 13:06:43 +02001288 if (__inet_inherit_port(sk, newsk) < 0) {
Christoph Paasche337e242012-12-14 04:07:58 +00001289 inet_csk_prepare_forced_close(newsk);
1290 tcp_done(newsk);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001291 goto out;
1292 }
Eric Dumazet9327f702009-12-04 03:46:54 +00001293 __inet6_hash(newsk, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001294
1295 return newsk;
1296
1297out_overflow:
Pavel Emelyanovde0744a2008-07-16 20:31:16 -07001298 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001299out_nonewsk:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001300 dst_release(dst);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001301out:
1302 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001303 return NULL;
1304}
1305
Linus Torvalds1da177e2005-04-16 15:20:36 -07001306/* The socket must have its spinlock held when we get
1307 * here.
1308 *
1309 * We have a potential double-lock case here, so even when
1310 * doing backlog processing we use the BH locking scheme.
1311 * This is because we cannot sleep with the original spinlock
1312 * held.
1313 */
/*
 * tcp_v6_do_rcv - process one segment for socket @sk.
 *
 * Packets whose skb->protocol is ETH_P_IP are handed to tcp_v4_do_rcv().
 * Otherwise the segment is dispatched on sk->sk_state:
 *   - TCP_ESTABLISHED: tcp_rcv_established() (fast path);
 *   - TCP_LISTEN: tcp_v6_hnd_req(), then tcp_child_process() when a
 *     different socket is returned;
 *   - anything else (or LISTEN returning @sk itself):
 *     tcp_rcv_state_process().
 *
 * When np->rxopt.all is set, a clone of @skb (opt_skb) is taken up front
 * so the ipv6_pktoptions tail can latch it into np->pktoptions.
 *
 * Returns the result of tcp_v4_do_rcv() for IPv4 packets, 0 otherwise.
 */
1314static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1315{
1316 struct ipv6_pinfo *np = inet6_sk(sk);
1317 struct tcp_sock *tp;
1318 struct sk_buff *opt_skb = NULL;
1319
1320 /* Imagine: socket is IPv6. IPv4 packet arrives,
1321 goes to IPv4 receive handler and backlogged.
1322 From backlog it always goes here. Kerboom...
1323 Fortunately, tcp_rcv_established and rcv_established
1324 handle them correctly, but it is not case with
1325 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1326 */
1327
1328 if (skb->protocol == htons(ETH_P_IP))
1329 return tcp_v4_do_rcv(sk, skb);
1330
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001331#ifdef CONFIG_TCP_MD5SIG
Wang Yufen4aa956d2014-03-29 09:27:29 +08001332 if (tcp_v6_inbound_md5_hash(sk, skb))
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001333 goto discard;
1334#endif
1335
Dmitry Mishinfda9ef52006-08-31 15:28:39 -07001336 if (sk_filter(sk, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001337 goto discard;
1338
1339 /*
1340 * socket locking is here for SMP purposes as backlog rcv
1341 * is currently called with bh processing disabled.
1342 */
1343
1344 /* Do Stevens' IPV6_PKTOPTIONS.
1345
1346 Yes, guys, it is the only place in our code, where we
1347 may make it not affecting IPv4.
1348 The rest of code is protocol independent,
1349 and I do not like idea to uglify IPv4.
1350
1351 Actually, all the idea behind IPV6_PKTOPTIONS
1352 looks not very well thought. For now we latch
1353 options, received in the last packet, enqueued
1354 by tcp. Feel free to propose better solution.
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001355 --ANK (980728)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001356 */
1357 if (np->rxopt.all)
Mel Gorman99a1dec2012-07-31 16:44:14 -07001358 opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001359
1360 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
Eric Dumazet5d299f32012-08-06 05:09:33 +00001361 struct dst_entry *dst = sk->sk_rx_dst;
1362
Tom Herbertbdeab992011-08-14 19:45:55 +00001363 sock_rps_save_rxhash(sk, skb);
/* Drop the cached rx dst when the packet arrived on a different
 * interface than the one recorded, or when the dst's check() op
 * returns NULL for the stored cookie.
 */
Eric Dumazet5d299f32012-08-06 05:09:33 +00001364 if (dst) {
1365 if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1366 dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1367 dst_release(dst);
1368 sk->sk_rx_dst = NULL;
1369 }
1370 }
1371
Vijay Subramanianc995ae22013-09-03 12:23:22 -07001372 tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001373 if (opt_skb)
1374 goto ipv6_pktoptions;
1375 return 0;
1376 }
1377
/* Slow path: reject segments shorter than their TCP header or with a
 * bad checksum before any state processing.
 */
Arnaldo Carvalho de Meloab6a5bb2007-03-18 17:43:48 -07001378 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001379 goto csum_err;
1380
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001381 if (sk->sk_state == TCP_LISTEN) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001382 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1383 if (!nsk)
1384 goto discard;
1385
1386 /*
1387 * Queue it on the new socket if the new socket is active,
1388 * otherwise we just shortcircuit this and continue with
1389 * the new socket..
1390 */
Weilong Chen4c99aa42013-12-19 18:44:34 +08001391 if (nsk != sk) {
Tom Herbertbdeab992011-08-14 19:45:55 +00001392 sock_rps_save_rxhash(nsk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001393 if (tcp_child_process(sk, nsk, skb))
1394 goto reset;
/* The clone is not latched on this path; just free it. */
1395 if (opt_skb)
1396 __kfree_skb(opt_skb);
1397 return 0;
1398 }
Neil Horman47482f132011-04-06 13:07:09 -07001399 } else
Tom Herbertbdeab992011-08-14 19:45:55 +00001400 sock_rps_save_rxhash(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001401
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001402 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403 goto reset;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001404 if (opt_skb)
1405 goto ipv6_pktoptions;
1406 return 0;
1407
/* reset falls through into discard: send a reset, then free the clone
 * (if any) and the original skb.
 */
1408reset:
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001409 tcp_v6_send_reset(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001410discard:
1411 if (opt_skb)
1412 __kfree_skb(opt_skb);
1413 kfree_skb(skb);
1414 return 0;
/* Count the error in both CSUMERRORS and INERRS, then discard. */
1415csum_err:
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001416 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001417 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001418 goto discard;
1419
1420
1421ipv6_pktoptions:
1422 /* Do you ask, what is it?
1423
1424 1. skb was enqueued by tcp.
1425 2. skb is added to tail of read queue, rather than out of order.
1426 3. socket is not in passive state.
1427 4. Finally, it really contains options, which user wants to receive.
1428 */
1429 tp = tcp_sk(sk);
1430 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1431 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
YOSHIFUJI Hideaki333fad52005-09-08 09:59:17 +09001432 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001433 np->mcast_oif = inet6_iif(opt_skb);
YOSHIFUJI Hideaki333fad52005-09-08 09:59:17 +09001434 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001435 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
Florent Fourcot82e9f102013-12-08 15:46:59 +01001436 if (np->rxopt.bits.rxflow || np->rxopt.bits.rxtclass)
Florent Fourcot1397ed32013-12-08 15:46:57 +01001437 np->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(opt_skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001438 if (np->repflow)
1439 np->flow_label = ip6_flowlabel(ipv6_hdr(opt_skb));
/* xchg() stores either the new clone or NULL in np->pktoptions and
 * hands back the previous value in opt_skb, which is freed below.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001440 if (ipv6_opt_accepted(sk, opt_skb)) {
1441 skb_set_owner_r(opt_skb, sk);
1442 opt_skb = xchg(&np->pktoptions, opt_skb);
1443 } else {
1444 __kfree_skb(opt_skb);
1445 opt_skb = xchg(&np->pktoptions, NULL);
1446 }
1447 }
1448
/* Frees the previous pktoptions skb, or the unused clone when the
 * condition above did not hold.
 */
Wei Yongjun800d55f2009-02-23 21:45:33 +00001449 kfree_skb(opt_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001450 return 0;
1451}
1452
/*
 * tcp_v6_rcv - handle an incoming TCP segment carried in @skb.
 *
 * Only PACKET_HOST packets are accepted. The TCP header length is checked,
 * skb_checksum_init() is run, TCP_SKB_CB(skb) is filled in and the owning
 * socket is looked up. With the socket held under bh_lock_sock_nested():
 *   - if it is not owned by user context, the segment is processed via
 *     tcp_v6_do_rcv() (unless tcp_prequeue() takes it);
 *   - otherwise it is added to the socket backlog.
 * Segments with no matching socket get tcp_v6_send_reset() unless they are
 * too short or fail the checksum. TIME_WAIT sockets are handled at the
 * do_time_wait label.
 *
 * Returns -1 if tcp_v6_do_rcv() returned non-zero, 0 in every other case.
 */
Herbert Xue5bbef22007-10-15 12:50:28 -07001453static int tcp_v6_rcv(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001454{
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001455 const struct tcphdr *th;
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001456 const struct ipv6hdr *hdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001457 struct sock *sk;
1458 int ret;
Pavel Emelyanova86b1e32008-07-16 20:20:58 -07001459 struct net *net = dev_net(skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001460
1461 if (skb->pkt_type != PACKET_HOST)
1462 goto discard_it;
1463
1464 /*
1465 * Count it even if it's bad.
1466 */
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001467 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001468
1469 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1470 goto discard_it;
1471
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001472 th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001473
/* doff counts 32-bit words; it must cover at least the fixed header. */
1474 if (th->doff < sizeof(struct tcphdr)/4)
1475 goto bad_packet;
1476 if (!pskb_may_pull(skb, th->doff*4))
1477 goto discard_it;
1478
Tom Herberte4f45b72014-05-02 16:29:51 -07001479 if (skb_checksum_init(skb, IPPROTO_TCP, ip6_compute_pseudo))
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001480 goto csum_error;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001481
/* Header pointers are fetched again after the second pskb_may_pull(). */
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001482 th = tcp_hdr(skb);
Stephen Hemmingere802af92010-04-22 15:24:53 -07001483 hdr = ipv6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001484 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1485 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1486 skb->len - th->doff*4);
1487 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1488 TCP_SKB_CB(skb)->when = 0;
Eric Dumazetb82d1bb2011-09-27 02:20:08 -04001489 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001490 TCP_SKB_CB(skb)->sacked = 0;
1491
Arnaldo Carvalho de Melo9a1f27c2008-10-07 11:41:57 -07001492 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001493 if (!sk)
1494 goto no_tcp_socket;
1495
/* Also re-entered from do_time_wait once a listener replaces the
 * timewait socket.
 */
1496process:
1497 if (sk->sk_state == TCP_TIME_WAIT)
1498 goto do_time_wait;
1499
Stephen Hemmingere802af92010-04-22 15:24:53 -07001500 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1501 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1502 goto discard_and_relse;
1503 }
1504
Linus Torvalds1da177e2005-04-16 15:20:36 -07001505 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1506 goto discard_and_relse;
1507
Dmitry Mishinfda9ef52006-08-31 15:28:39 -07001508 if (sk_filter(sk, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001509 goto discard_and_relse;
1510
Eliezer Tamir8b80cda52013-07-10 17:13:26 +03001511 sk_mark_napi_id(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001512 skb->dev = NULL;
1513
Fabio Olive Leite293b9c42006-09-25 22:28:47 -07001514 bh_lock_sock_nested(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001515 ret = 0;
1516 if (!sock_owned_by_user(sk)) {
Chris Leech1a2449a2006-05-23 18:05:53 -07001517#ifdef CONFIG_NET_DMA
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001518 struct tcp_sock *tp = tcp_sk(sk);
David S. Millerb4caea82007-10-26 04:20:13 -07001519 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
Dave Jianga2bd1142012-04-04 16:10:46 -07001520 tp->ucopy.dma_chan = net_dma_find_channel();
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001521 if (tp->ucopy.dma_chan)
1522 ret = tcp_v6_do_rcv(sk, skb);
1523 else
Chris Leech1a2449a2006-05-23 18:05:53 -07001524#endif
1525 {
1526 if (!tcp_prequeue(sk, skb))
1527 ret = tcp_v6_do_rcv(sk, skb);
1528 }
/* Socket is owned by user context: queue to the backlog. On failure
 * (limit passed is sk_rcvbuf + sk_sndbuf) unlock, count the drop and
 * discard.
 */
Eric Dumazetda882c12012-04-22 23:38:54 +00001529 } else if (unlikely(sk_add_backlog(sk, skb,
1530 sk->sk_rcvbuf + sk->sk_sndbuf))) {
Zhu Yi6b03a532010-03-04 18:01:41 +00001531 bh_unlock_sock(sk);
Eric Dumazet6cce09f2010-03-07 23:21:57 +00001532 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
Zhu Yi6b03a532010-03-04 18:01:41 +00001533 goto discard_and_relse;
1534 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001535 bh_unlock_sock(sk);
1536
1537 sock_put(sk);
1538 return ret ? -1 : 0;
1539
1540no_tcp_socket:
1541 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1542 goto discard_it;
1543
/* csum_error and bad_packet live inside this if-body but are also goto
 * targets from earlier in the function and from do_time_wait;
 * csum_error falls through into bad_packet.
 */
1544 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001545csum_error:
1546 TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001547bad_packet:
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001548 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001549 } else {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001550 tcp_v6_send_reset(NULL, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001551 }
1552
1553discard_it:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001554 kfree_skb(skb);
1555 return 0;
1556
1557discard_and_relse:
1558 sock_put(sk);
1559 goto discard_it;
1560
/* TIME_WAIT handling: every exit that does not continue with the
 * timewait sock drops its reference with inet_twsk_put() first.
 */
1561do_time_wait:
1562 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001563 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001564 goto discard_it;
1565 }
1566
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001567 if (skb->len < (th->doff<<2)) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001568 inet_twsk_put(inet_twsk(sk));
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001569 goto bad_packet;
1570 }
1571 if (tcp_checksum_complete(skb)) {
1572 inet_twsk_put(inet_twsk(sk));
1573 goto csum_error;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001574 }
1575
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001576 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001577 case TCP_TW_SYN:
1578 {
1579 struct sock *sk2;
1580
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001581 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
Tom Herbert5ba24952013-01-22 09:50:39 +00001582 &ipv6_hdr(skb)->saddr, th->source,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001583 &ipv6_hdr(skb)->daddr,
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001584 ntohs(th->dest), inet6_iif(skb));
/* A listener was found: deschedule and release the timewait sock,
 * then process the segment against the listener instead.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001585 if (sk2 != NULL) {
Arnaldo Carvalho de Melo295ff7e2005-08-09 20:44:40 -07001586 struct inet_timewait_sock *tw = inet_twsk(sk);
1587 inet_twsk_deschedule(tw, &tcp_death_row);
1588 inet_twsk_put(tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001589 sk = sk2;
1590 goto process;
1591 }
1592 /* Fall through to ACK */
1593 }
1594 case TCP_TW_ACK:
1595 tcp_v6_timewait_ack(sk, skb);
1596 break;
1597 case TCP_TW_RST:
1598 goto no_tcp_socket;
Wang Yufen4aa956d2014-03-29 09:27:29 +08001599 case TCP_TW_SUCCESS:
1600 ;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001601 }
1602 goto discard_it;
1603}
1604
Eric Dumazetc7109982012-07-26 12:18:11 +00001605static void tcp_v6_early_demux(struct sk_buff *skb)
1606{
1607 const struct ipv6hdr *hdr;
1608 const struct tcphdr *th;
1609 struct sock *sk;
1610
1611 if (skb->pkt_type != PACKET_HOST)
1612 return;
1613
1614 if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1615 return;
1616
1617 hdr = ipv6_hdr(skb);
1618 th = tcp_hdr(skb);
1619
1620 if (th->doff < sizeof(struct tcphdr) / 4)
1621 return;
1622
1623 sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1624 &hdr->saddr, th->source,
1625 &hdr->daddr, ntohs(th->dest),
1626 inet6_iif(skb));
1627 if (sk) {
1628 skb->sk = sk;
1629 skb->destructor = sock_edemux;
1630 if (sk->sk_state != TCP_TIME_WAIT) {
1631 struct dst_entry *dst = sk->sk_rx_dst;
Neal Cardwellf3f12132012-10-22 21:41:48 +00001632
Eric Dumazetc7109982012-07-26 12:18:11 +00001633 if (dst)
Eric Dumazet5d299f32012-08-06 05:09:33 +00001634 dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
Eric Dumazetc7109982012-07-26 12:18:11 +00001635 if (dst &&
Neal Cardwellf3f12132012-10-22 21:41:48 +00001636 inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
Eric Dumazetc7109982012-07-26 12:18:11 +00001637 skb_dst_set_noref(skb, dst);
1638 }
1639 }
1640}
1641
David S. Millerccb7c412010-12-01 18:09:13 -08001642static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1643 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1644 .twsk_unique = tcp_twsk_unique,
Wang Yufen4aa956d2014-03-29 09:27:29 +08001645 .twsk_destructor = tcp_twsk_destructor,
David S. Millerccb7c412010-12-01 18:09:13 -08001646};
1647
Stephen Hemminger3b401a82009-09-01 19:25:04 +00001648static const struct inet_connection_sock_af_ops ipv6_specific = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001649 .queue_xmit = inet6_csk_xmit,
1650 .send_check = tcp_v6_send_check,
1651 .rebuild_header = inet6_sk_rebuild_header,
Eric Dumazet5d299f32012-08-06 05:09:33 +00001652 .sk_rx_dst_set = inet6_sk_rx_dst_set,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001653 .conn_request = tcp_v6_conn_request,
1654 .syn_recv_sock = tcp_v6_syn_recv_sock,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001655 .net_header_len = sizeof(struct ipv6hdr),
Eric Dumazet67469602012-04-24 07:37:38 +00001656 .net_frag_header_len = sizeof(struct frag_hdr),
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001657 .setsockopt = ipv6_setsockopt,
1658 .getsockopt = ipv6_getsockopt,
1659 .addr2sockaddr = inet6_csk_addr2sockaddr,
1660 .sockaddr_len = sizeof(struct sockaddr_in6),
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001661 .bind_conflict = inet6_csk_bind_conflict,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001662#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001663 .compat_setsockopt = compat_ipv6_setsockopt,
1664 .compat_getsockopt = compat_ipv6_getsockopt,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001665#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001666};
1667
#ifdef CONFIG_TCP_MD5SIG
/* MD5 signature hooks for native IPv6 TCP sockets. */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_parse	= tcp_v6_parse_md5_keys,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_lookup	= tcp_v6_md5_lookup,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001675
Linus Torvalds1da177e2005-04-16 15:20:36 -07001676/*
1677 * TCP over IPv4 via INET6 API
1678 */
Stephen Hemminger3b401a82009-09-01 19:25:04 +00001679static const struct inet_connection_sock_af_ops ipv6_mapped = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001680 .queue_xmit = ip_queue_xmit,
1681 .send_check = tcp_v4_send_check,
1682 .rebuild_header = inet_sk_rebuild_header,
Eric Dumazet63d02d12012-08-09 14:11:00 +00001683 .sk_rx_dst_set = inet_sk_rx_dst_set,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001684 .conn_request = tcp_v6_conn_request,
1685 .syn_recv_sock = tcp_v6_syn_recv_sock,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001686 .net_header_len = sizeof(struct iphdr),
1687 .setsockopt = ipv6_setsockopt,
1688 .getsockopt = ipv6_getsockopt,
1689 .addr2sockaddr = inet6_csk_addr2sockaddr,
1690 .sockaddr_len = sizeof(struct sockaddr_in6),
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001691 .bind_conflict = inet6_csk_bind_conflict,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001692#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001693 .compat_setsockopt = compat_ipv6_setsockopt,
1694 .compat_getsockopt = compat_ipv6_getsockopt,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001695#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001696};
1697
#ifdef CONFIG_TCP_MD5SIG
/*
 * MD5 signature hooks for the v4-mapped case: lookup and hashing use the
 * IPv4 helpers, key parsing uses the IPv6 one.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_parse	= tcp_v6_parse_md5_keys,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,
	.md5_lookup	= tcp_v4_md5_lookup,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001705
Linus Torvalds1da177e2005-04-16 15:20:36 -07001706/* NOTE: A lot of things set to zero explicitly by call to
1707 * sk_alloc() so need not be done here.
1708 */
1709static int tcp_v6_init_sock(struct sock *sk)
1710{
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001711 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001712
Neal Cardwell900f65d2012-04-19 09:55:21 +00001713 tcp_init_sock(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001714
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001715 icsk->icsk_af_ops = &ipv6_specific;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001716
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001717#ifdef CONFIG_TCP_MD5SIG
David S. Millerac807fa2012-04-23 03:21:58 -04001718 tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001719#endif
1720
Linus Torvalds1da177e2005-04-16 15:20:36 -07001721 return 0;
1722}
1723
/*
 * tcp_v6_destroy_sock - tear down a TCPv6 socket: the TCP-level destroy
 * (tcp_v4_destroy_sock) runs first, followed by the IPv6-level
 * inet6_destroy_sock().
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
	tcp_v4_destroy_sock(sk);	/* TCP state first ... */
	inet6_destroy_sock(sk);		/* ... then the IPv6 part */
}
1729
YOSHIFUJI Hideaki952a10b2007-04-21 20:13:44 +09001730#ifdef CONFIG_PROC_FS
Linus Torvalds1da177e2005-04-16 15:20:36 -07001731/* Proc filesystem TCPv6 sock list dumping. */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001732static void get_openreq6(struct seq_file *seq,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001733 const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001734{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001735 int ttd = req->expires - jiffies;
Eric Dumazet634fb9792013-10-09 15:21:29 -07001736 const struct in6_addr *src = &inet_rsk(req)->ir_v6_loc_addr;
1737 const struct in6_addr *dest = &inet_rsk(req)->ir_v6_rmt_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001738
1739 if (ttd < 0)
1740 ttd = 0;
1741
Linus Torvalds1da177e2005-04-16 15:20:36 -07001742 seq_printf(seq,
1743 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Francesco Fuscod14c5ab2013-08-15 13:42:14 +02001744 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %d %d %pK\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001745 i,
1746 src->s6_addr32[0], src->s6_addr32[1],
1747 src->s6_addr32[2], src->s6_addr32[3],
Eric Dumazetb44084c2013-10-10 00:04:37 -07001748 inet_rsk(req)->ir_num,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001749 dest->s6_addr32[0], dest->s6_addr32[1],
1750 dest->s6_addr32[2], dest->s6_addr32[3],
Eric Dumazet634fb9792013-10-09 15:21:29 -07001751 ntohs(inet_rsk(req)->ir_rmt_port),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001752 TCP_SYN_RECV,
Weilong Chen4c99aa42013-12-19 18:44:34 +08001753 0, 0, /* could print option size, but that is af dependent. */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001754 1, /* timers active (only the expire timer) */
1755 jiffies_to_clock_t(ttd),
Eric Dumazete6c022a2012-10-27 23:16:46 +00001756 req->num_timeout,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001757 from_kuid_munged(seq_user_ns(seq), uid),
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001758 0, /* non standard timer */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001759 0, /* open_requests have no inode */
1760 0, req);
1761}
1762
1763static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1764{
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001765 const struct in6_addr *dest, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001766 __u16 destp, srcp;
1767 int timer_active;
1768 unsigned long timer_expires;
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001769 const struct inet_sock *inet = inet_sk(sp);
1770 const struct tcp_sock *tp = tcp_sk(sp);
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001771 const struct inet_connection_sock *icsk = inet_csk(sp);
Yuchung Cheng0a672f742014-05-11 20:22:12 -07001772 struct fastopen_queue *fastopenq = icsk->icsk_accept_queue.fastopenq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001773
Eric Dumazetefe42082013-10-03 15:42:29 -07001774 dest = &sp->sk_v6_daddr;
1775 src = &sp->sk_v6_rcv_saddr;
Eric Dumazetc720c7e82009-10-15 06:30:45 +00001776 destp = ntohs(inet->inet_dport);
1777 srcp = ntohs(inet->inet_sport);
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001778
1779 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001780 timer_active = 1;
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001781 timer_expires = icsk->icsk_timeout;
1782 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001783 timer_active = 4;
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001784 timer_expires = icsk->icsk_timeout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001785 } else if (timer_pending(&sp->sk_timer)) {
1786 timer_active = 2;
1787 timer_expires = sp->sk_timer.expires;
1788 } else {
1789 timer_active = 0;
1790 timer_expires = jiffies;
1791 }
1792
1793 seq_printf(seq,
1794 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Francesco Fuscod14c5ab2013-08-15 13:42:14 +02001795 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %lu %d %pK %lu %lu %u %u %d\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001796 i,
1797 src->s6_addr32[0], src->s6_addr32[1],
1798 src->s6_addr32[2], src->s6_addr32[3], srcp,
1799 dest->s6_addr32[0], dest->s6_addr32[1],
1800 dest->s6_addr32[2], dest->s6_addr32[3], destp,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001801 sp->sk_state,
Sridhar Samudrala47da8ee2006-06-27 13:29:00 -07001802 tp->write_seq-tp->snd_una,
1803 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001804 timer_active,
Eric Dumazeta399a802012-08-08 21:13:53 +00001805 jiffies_delta_to_clock_t(timer_expires - jiffies),
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001806 icsk->icsk_retransmits,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001807 from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001808 icsk->icsk_probes_out,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001809 sock_i_ino(sp),
1810 atomic_read(&sp->sk_refcnt), sp,
Stephen Hemminger7be87352008-06-27 20:00:19 -07001811 jiffies_to_clock_t(icsk->icsk_rto),
1812 jiffies_to_clock_t(icsk->icsk_ack.ato),
Weilong Chen4c99aa42013-12-19 18:44:34 +08001813 (icsk->icsk_ack.quick << 1) | icsk->icsk_ack.pingpong,
Ilpo Järvinen0b6a05c2009-09-15 01:30:10 -07001814 tp->snd_cwnd,
Yuchung Cheng0a672f742014-05-11 20:22:12 -07001815 sp->sk_state == TCP_LISTEN ?
1816 (fastopenq ? fastopenq->max_qlen : 0) :
1817 (tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001818 );
1819}
1820
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001821static void get_timewait6_sock(struct seq_file *seq,
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -07001822 struct inet_timewait_sock *tw, int i)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001823{
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001824 const struct in6_addr *dest, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001825 __u16 destp, srcp;
Eric Dumazet96f817f2013-10-03 14:27:25 -07001826 s32 delta = tw->tw_ttd - inet_tw_time_stamp();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001827
Eric Dumazetefe42082013-10-03 15:42:29 -07001828 dest = &tw->tw_v6_daddr;
1829 src = &tw->tw_v6_rcv_saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001830 destp = ntohs(tw->tw_dport);
1831 srcp = ntohs(tw->tw_sport);
1832
1833 seq_printf(seq,
1834 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Dan Rosenberg71338aa2011-05-23 12:17:35 +00001835 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001836 i,
1837 src->s6_addr32[0], src->s6_addr32[1],
1838 src->s6_addr32[2], src->s6_addr32[3], srcp,
1839 dest->s6_addr32[0], dest->s6_addr32[1],
1840 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1841 tw->tw_substate, 0, 0,
Eric Dumazeta399a802012-08-08 21:13:53 +00001842 3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001843 atomic_read(&tw->tw_refcnt), tw);
1844}
1845
Linus Torvalds1da177e2005-04-16 15:20:36 -07001846static int tcp6_seq_show(struct seq_file *seq, void *v)
1847{
1848 struct tcp_iter_state *st;
Eric Dumazet05dbc7b2013-10-03 00:22:02 -07001849 struct sock *sk = v;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001850
1851 if (v == SEQ_START_TOKEN) {
1852 seq_puts(seq,
1853 " sl "
1854 "local_address "
1855 "remote_address "
1856 "st tx_queue rx_queue tr tm->when retrnsmt"
1857 " uid timeout inode\n");
1858 goto out;
1859 }
1860 st = seq->private;
1861
1862 switch (st->state) {
1863 case TCP_SEQ_STATE_LISTENING:
1864 case TCP_SEQ_STATE_ESTABLISHED:
Eric Dumazet05dbc7b2013-10-03 00:22:02 -07001865 if (sk->sk_state == TCP_TIME_WAIT)
1866 get_timewait6_sock(seq, v, st->num);
1867 else
1868 get_tcp6_sock(seq, v, st->num);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001869 break;
1870 case TCP_SEQ_STATE_OPENREQ:
1871 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1872 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001873 }
1874out:
1875 return 0;
1876}
1877
Arjan van de Ven73cb88e2011-10-30 06:46:30 +00001878static const struct file_operations tcp6_afinfo_seq_fops = {
1879 .owner = THIS_MODULE,
1880 .open = tcp_seq_open,
1881 .read = seq_read,
1882 .llseek = seq_lseek,
1883 .release = seq_release_net
1884};
1885
Linus Torvalds1da177e2005-04-16 15:20:36 -07001886static struct tcp_seq_afinfo tcp6_seq_afinfo = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001887 .name = "tcp6",
1888 .family = AF_INET6,
Arjan van de Ven73cb88e2011-10-30 06:46:30 +00001889 .seq_fops = &tcp6_afinfo_seq_fops,
Denis V. Lunev9427c4b2008-04-13 22:12:13 -07001890 .seq_ops = {
1891 .show = tcp6_seq_show,
1892 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07001893};
1894
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001895int __net_init tcp6_proc_init(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001896{
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001897 return tcp_proc_register(net, &tcp6_seq_afinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001898}
1899
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001900void tcp6_proc_exit(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001901{
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001902 tcp_proc_unregister(net, &tcp6_seq_afinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001903}
1904#endif
1905
Eric Dumazetf77d6022013-05-09 10:28:16 +00001906static void tcp_v6_clear_sk(struct sock *sk, int size)
1907{
1908 struct inet_sock *inet = inet_sk(sk);
1909
1910 /* we do not want to clear pinet6 field, because of RCU lookups */
1911 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1912
1913 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1914 memset(&inet->pinet6 + 1, 0, size);
1915}
1916
Linus Torvalds1da177e2005-04-16 15:20:36 -07001917struct proto tcpv6_prot = {
1918 .name = "TCPv6",
1919 .owner = THIS_MODULE,
1920 .close = tcp_close,
1921 .connect = tcp_v6_connect,
1922 .disconnect = tcp_disconnect,
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001923 .accept = inet_csk_accept,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001924 .ioctl = tcp_ioctl,
1925 .init = tcp_v6_init_sock,
1926 .destroy = tcp_v6_destroy_sock,
1927 .shutdown = tcp_shutdown,
1928 .setsockopt = tcp_setsockopt,
1929 .getsockopt = tcp_getsockopt,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001930 .recvmsg = tcp_recvmsg,
Changli Gao7ba42912010-07-10 20:41:55 +00001931 .sendmsg = tcp_sendmsg,
1932 .sendpage = tcp_sendpage,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001933 .backlog_rcv = tcp_v6_do_rcv,
Eric Dumazet46d3cea2012-07-11 05:50:31 +00001934 .release_cb = tcp_release_cb,
Eric Dumazet563d34d2012-07-23 09:48:52 +02001935 .mtu_reduced = tcp_v6_mtu_reduced,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001936 .hash = tcp_v6_hash,
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001937 .unhash = inet_unhash,
1938 .get_port = inet_csk_get_port,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001939 .enter_memory_pressure = tcp_enter_memory_pressure,
Eric Dumazetc9bee3b72013-07-22 20:27:07 -07001940 .stream_memory_free = tcp_stream_memory_free,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001941 .sockets_allocated = &tcp_sockets_allocated,
1942 .memory_allocated = &tcp_memory_allocated,
1943 .memory_pressure = &tcp_memory_pressure,
Arnaldo Carvalho de Melo0a5578c2005-08-09 20:11:41 -07001944 .orphan_count = &tcp_orphan_count,
Eric W. Biedermana4fe34b2013-10-19 16:25:36 -07001945 .sysctl_mem = sysctl_tcp_mem,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001946 .sysctl_wmem = sysctl_tcp_wmem,
1947 .sysctl_rmem = sysctl_tcp_rmem,
1948 .max_header = MAX_TCP_HEADER,
1949 .obj_size = sizeof(struct tcp6_sock),
Eric Dumazet3ab5aee2008-11-16 19:40:17 -08001950 .slab_flags = SLAB_DESTROY_BY_RCU,
Arnaldo Carvalho de Melo6d6ee432005-12-13 23:25:19 -08001951 .twsk_prot = &tcp6_timewait_sock_ops,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -07001952 .rsk_prot = &tcp6_request_sock_ops,
Pavel Emelyanov39d8cda2008-03-22 16:50:58 -07001953 .h.hashinfo = &tcp_hashinfo,
Changli Gao7ba42912010-07-10 20:41:55 +00001954 .no_autobind = true,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001955#ifdef CONFIG_COMPAT
1956 .compat_setsockopt = compat_tcp_setsockopt,
1957 .compat_getsockopt = compat_tcp_getsockopt,
1958#endif
Andrew Mortonc255a452012-07-31 16:43:02 -07001959#ifdef CONFIG_MEMCG_KMEM
Glauber Costad1a4c0b2011-12-11 21:47:04 +00001960 .proto_cgroup = tcp_proto_cgroup,
1961#endif
Eric Dumazetf77d6022013-05-09 10:28:16 +00001962 .clear_sk = tcp_v6_clear_sk,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001963};
1964
Alexey Dobriyan41135cc2009-09-14 12:22:28 +00001965static const struct inet6_protocol tcpv6_protocol = {
Eric Dumazetc7109982012-07-26 12:18:11 +00001966 .early_demux = tcp_v6_early_demux,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001967 .handler = tcp_v6_rcv,
1968 .err_handler = tcp_v6_err,
1969 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1970};
1971
Linus Torvalds1da177e2005-04-16 15:20:36 -07001972static struct inet_protosw tcpv6_protosw = {
1973 .type = SOCK_STREAM,
1974 .protocol = IPPROTO_TCP,
1975 .prot = &tcpv6_prot,
1976 .ops = &inet6_stream_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001977 .no_check = 0,
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001978 .flags = INET_PROTOSW_PERMANENT |
1979 INET_PROTOSW_ICSK,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001980};
1981
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001982static int __net_init tcpv6_net_init(struct net *net)
Daniel Lezcano93ec9262008-03-07 11:16:02 -08001983{
Denis V. Lunev56772422008-04-03 14:28:30 -07001984 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
1985 SOCK_RAW, IPPROTO_TCP, net);
Daniel Lezcano93ec9262008-03-07 11:16:02 -08001986}
1987
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001988static void __net_exit tcpv6_net_exit(struct net *net)
Daniel Lezcano93ec9262008-03-07 11:16:02 -08001989{
Denis V. Lunev56772422008-04-03 14:28:30 -07001990 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00001991}
1992
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001993static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00001994{
1995 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
Daniel Lezcano93ec9262008-03-07 11:16:02 -08001996}
1997
1998static struct pernet_operations tcpv6_net_ops = {
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00001999 .init = tcpv6_net_init,
2000 .exit = tcpv6_net_exit,
2001 .exit_batch = tcpv6_net_exit_batch,
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002002};
2003
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002004int __init tcpv6_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002005{
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002006 int ret;
David Woodhouseae0f7d52006-01-11 15:53:04 -08002007
Vlad Yasevich33362882012-11-15 08:49:15 +00002008 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2009 if (ret)
Vlad Yasevichc6b641a2012-11-15 08:49:22 +00002010 goto out;
Vlad Yasevich33362882012-11-15 08:49:15 +00002011
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002012 /* register inet6 protocol */
2013 ret = inet6_register_protosw(&tcpv6_protosw);
2014 if (ret)
2015 goto out_tcpv6_protocol;
2016
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002017 ret = register_pernet_subsys(&tcpv6_net_ops);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002018 if (ret)
2019 goto out_tcpv6_protosw;
2020out:
2021 return ret;
2022
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002023out_tcpv6_protosw:
2024 inet6_unregister_protosw(&tcpv6_protosw);
Vlad Yasevich33362882012-11-15 08:49:15 +00002025out_tcpv6_protocol:
2026 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002027 goto out;
2028}
2029
Daniel Lezcano09f77092007-12-13 05:34:58 -08002030void tcpv6_exit(void)
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002031{
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002032 unregister_pernet_subsys(&tcpv6_net_ops);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002033 inet6_unregister_protosw(&tcpv6_protosw);
2034 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002035}