/*
 *	TCP over IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	Based on:
 *	linux/net/ipv4/tcp.c
 *	linux/net/ipv4/tcp_input.c
 *	linux/net/ipv4/tcp_output.c
 *
 *	Fixes:
 *	Hideaki YOSHIFUJI	:	sin6_scope_id support
 *	YOSHIFUJI Hideaki @USAGI and:	Support IPV6_V6ONLY socket option, which
 *	Alexey Kuznetsov		allow both IPv4 and IPv6 sockets to bind
 *					a single port at the same time.
 *	YOSHIFUJI Hideaki @USAGI:	convert /proc/net/tcp6 to seq_file.
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */
25
Herbert Xueb4dea52008-12-29 23:04:08 -080026#include <linux/bottom_half.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070027#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090041#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042
43#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
Arnaldo Carvalho de Melo5324a042005-08-12 09:26:18 -030049#include <net/inet6_hashtables.h>
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -080050#include <net/inet6_connection_sock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070059#include <net/snmp.h>
60#include <net/dsfield.h>
Arnaldo Carvalho de Melo6d6ee432005-12-13 23:25:19 -080061#include <net/timewait_sock.h>
Jeff Garzik18134be2007-10-26 22:53:14 -070062#include <net/netdma.h>
Denis V. Lunev3d58b5f2008-04-03 14:22:32 -070063#include <net/inet_common.h>
David S. Miller6e5714e2011-08-03 20:50:44 -070064#include <net/secure_seq.h>
Glauber Costad1a4c0b2011-12-11 21:47:04 +000065#include <net/tcp_memcontrol.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
67#include <asm/uaccess.h>
68
69#include <linux/proc_fs.h>
70#include <linux/seq_file.h>
71
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -080072#include <linux/crypto.h>
73#include <linux/scatterlist.h>
74
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -080075static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
Gui Jianfeng6edafaa2008-08-06 23:50:04 -070076static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
77 struct request_sock *req);
Linus Torvalds1da177e2005-04-16 15:20:36 -070078
79static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
Herbert Xu8ad50d92010-04-11 02:15:54 +000080static void __tcp_v6_send_check(struct sk_buff *skb,
Eric Dumazetb71d1d42011-04-22 04:53:02 +000081 const struct in6_addr *saddr,
82 const struct in6_addr *daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -070083
Stephen Hemminger3b401a82009-09-01 19:25:04 +000084static const struct inet_connection_sock_af_ops ipv6_mapped;
85static const struct inet_connection_sock_af_ops ipv6_specific;
David S. Millera9286302006-11-14 19:53:22 -080086#ifdef CONFIG_TCP_MD5SIG
Stephen Hemmingerb2e4b3d2009-09-01 19:25:03 +000087static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
88static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +090089#else
90static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
Eric Dumazetb71d1d42011-04-22 04:53:02 +000091 const struct in6_addr *addr)
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +090092{
93 return NULL;
94}
David S. Millera9286302006-11-14 19:53:22 -080095#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070096
Linus Torvalds1da177e2005-04-16 15:20:36 -070097static void tcp_v6_hash(struct sock *sk)
98{
99 if (sk->sk_state != TCP_CLOSE) {
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -0800100 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101 tcp_prot.hash(sk);
102 return;
103 }
104 local_bh_disable();
Eric Dumazet9327f702009-12-04 03:46:54 +0000105 __inet6_hash(sk, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106 local_bh_enable();
107 }
108}
109
Herbert Xu684f2172009-01-08 10:41:23 -0800110static __inline__ __sum16 tcp_v6_check(int len,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000111 const struct in6_addr *saddr,
112 const struct in6_addr *daddr,
Al Viro868c86b2006-11-14 21:35:48 -0800113 __wsum base)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114{
115 return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
116}
117
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400118static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119{
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700120 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
121 ipv6_hdr(skb)->saddr.s6_addr32,
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700122 tcp_hdr(skb)->dest,
123 tcp_hdr(skb)->source);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124}
125
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900126static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127 int addr_len)
128{
129 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900130 struct inet_sock *inet = inet_sk(sk);
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800131 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132 struct ipv6_pinfo *np = inet6_sk(sk);
133 struct tcp_sock *tp = tcp_sk(sk);
Arnaud Ebalard20c59de2010-06-01 21:35:01 +0000134 struct in6_addr *saddr = NULL, *final_p, final;
David S. Miller493f3772010-12-02 12:14:29 -0800135 struct rt6_info *rt;
David S. Miller4c9483b2011-03-12 16:22:43 -0500136 struct flowi6 fl6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137 struct dst_entry *dst;
138 int addr_type;
139 int err;
140
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900141 if (addr_len < SIN6_LEN_RFC2133)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142 return -EINVAL;
143
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900144 if (usin->sin6_family != AF_INET6)
Eric Dumazeta02cec22010-09-22 20:43:57 +0000145 return -EAFNOSUPPORT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700146
David S. Miller4c9483b2011-03-12 16:22:43 -0500147 memset(&fl6, 0, sizeof(fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148
149 if (np->sndflow) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500150 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
151 IP6_ECN_flow_init(fl6.flowlabel);
152 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 struct ip6_flowlabel *flowlabel;
David S. Miller4c9483b2011-03-12 16:22:43 -0500154 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 if (flowlabel == NULL)
156 return -EINVAL;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000157 usin->sin6_addr = flowlabel->dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158 fl6_sock_release(flowlabel);
159 }
160 }
161
162 /*
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900163 * connect() to INADDR_ANY means loopback (BSD'ism).
164 */
165
166 if(ipv6_addr_any(&usin->sin6_addr))
167 usin->sin6_addr.s6_addr[15] = 0x1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168
169 addr_type = ipv6_addr_type(&usin->sin6_addr);
170
171 if(addr_type & IPV6_ADDR_MULTICAST)
172 return -ENETUNREACH;
173
174 if (addr_type&IPV6_ADDR_LINKLOCAL) {
175 if (addr_len >= sizeof(struct sockaddr_in6) &&
176 usin->sin6_scope_id) {
177 /* If interface is set while binding, indices
178 * must coincide.
179 */
180 if (sk->sk_bound_dev_if &&
181 sk->sk_bound_dev_if != usin->sin6_scope_id)
182 return -EINVAL;
183
184 sk->sk_bound_dev_if = usin->sin6_scope_id;
185 }
186
187 /* Connect to link-local address requires an interface */
188 if (!sk->sk_bound_dev_if)
189 return -EINVAL;
190 }
191
192 if (tp->rx_opt.ts_recent_stamp &&
193 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
194 tp->rx_opt.ts_recent = 0;
195 tp->rx_opt.ts_recent_stamp = 0;
196 tp->write_seq = 0;
197 }
198
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000199 np->daddr = usin->sin6_addr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500200 np->flow_label = fl6.flowlabel;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700201
202 /*
203 * TCP over IPv4
204 */
205
206 if (addr_type == IPV6_ADDR_MAPPED) {
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800207 u32 exthdrlen = icsk->icsk_ext_hdr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208 struct sockaddr_in sin;
209
210 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
211
212 if (__ipv6_only_sock(sk))
213 return -ENETUNREACH;
214
215 sin.sin_family = AF_INET;
216 sin.sin_port = usin->sin6_port;
217 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
218
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800219 icsk->icsk_af_ops = &ipv6_mapped;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 sk->sk_backlog_rcv = tcp_v4_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800221#ifdef CONFIG_TCP_MD5SIG
222 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
223#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224
225 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
226
227 if (err) {
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800228 icsk->icsk_ext_hdr_len = exthdrlen;
229 icsk->icsk_af_ops = &ipv6_specific;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230 sk->sk_backlog_rcv = tcp_v6_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800231#ifdef CONFIG_TCP_MD5SIG
232 tp->af_specific = &tcp_sock_ipv6_specific;
233#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234 goto failure;
235 } else {
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000236 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
237 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
238 &np->rcv_saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239 }
240
241 return err;
242 }
243
244 if (!ipv6_addr_any(&np->rcv_saddr))
245 saddr = &np->rcv_saddr;
246
David S. Miller4c9483b2011-03-12 16:22:43 -0500247 fl6.flowi6_proto = IPPROTO_TCP;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000248 fl6.daddr = np->daddr;
249 fl6.saddr = saddr ? *saddr : np->saddr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500250 fl6.flowi6_oif = sk->sk_bound_dev_if;
251 fl6.flowi6_mark = sk->sk_mark;
David S. Miller1958b852011-03-12 16:36:19 -0500252 fl6.fl6_dport = usin->sin6_port;
253 fl6.fl6_sport = inet->inet_sport;
Lorenzo Colitti462ce7c2014-03-31 16:23:51 +0900254 fl6.flowi6_uid = sock_i_uid(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255
David S. Miller4c9483b2011-03-12 16:22:43 -0500256 final_p = fl6_update_dst(&fl6, np->opt, &final);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257
David S. Miller4c9483b2011-03-12 16:22:43 -0500258 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
Venkat Yekkiralabeb8d132006-08-04 23:12:42 -0700259
David S. Miller4c9483b2011-03-12 16:22:43 -0500260 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800261 if (IS_ERR(dst)) {
262 err = PTR_ERR(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263 goto failure;
David S. Miller14e50e52007-05-24 18:17:54 -0700264 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265
266 if (saddr == NULL) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500267 saddr = &fl6.saddr;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000268 np->rcv_saddr = *saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269 }
270
271 /* set the source address */
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000272 np->saddr = *saddr;
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000273 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274
Herbert Xuf83ef8c2006-06-30 13:37:03 -0700275 sk->sk_gso_type = SKB_GSO_TCPV6;
YOSHIFUJI Hideaki8e1ef0a2006-08-29 17:15:09 -0700276 __ip6_dst_store(sk, dst, NULL, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277
David S. Miller493f3772010-12-02 12:14:29 -0800278 rt = (struct rt6_info *) dst;
279 if (tcp_death_row.sysctl_tw_recycle &&
280 !tp->rx_opt.ts_recent_stamp &&
281 ipv6_addr_equal(&rt->rt6i_dst.addr, &np->daddr)) {
282 struct inet_peer *peer = rt6_get_peer(rt);
283 /*
284 * VJ's idea. We save last timestamp seen from
285 * the destination in peer table, when entering state
286 * TIME-WAIT * and initialize rx_opt.ts_recent from it,
287 * when trying new connection.
288 */
289 if (peer) {
290 inet_peer_refcheck(peer);
291 if ((u32)get_seconds() - peer->tcp_ts_stamp <= TCP_PAWS_MSL) {
292 tp->rx_opt.ts_recent_stamp = peer->tcp_ts_stamp;
293 tp->rx_opt.ts_recent = peer->tcp_ts;
294 }
295 }
296 }
297
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800298 icsk->icsk_ext_hdr_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299 if (np->opt)
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800300 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
301 np->opt->opt_nflen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302
303 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
304
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000305 inet->inet_dport = usin->sin6_port;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306
307 tcp_set_state(sk, TCP_SYN_SENT);
Arnaldo Carvalho de Melod8313f52005-12-13 23:25:44 -0800308 err = inet6_hash_connect(&tcp_death_row, sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700309 if (err)
310 goto late_failure;
311
312 if (!tp->write_seq)
313 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
314 np->daddr.s6_addr32,
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000315 inet->inet_sport,
316 inet->inet_dport);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317
318 err = tcp_connect(sk);
319 if (err)
320 goto late_failure;
321
322 return 0;
323
324late_failure:
325 tcp_set_state(sk, TCP_CLOSE);
326 __sk_dst_reset(sk);
327failure:
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000328 inet->inet_dport = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700329 sk->sk_route_caps = 0;
330 return err;
331}
332
333static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
Brian Haleyd5fdd6b2009-06-23 04:31:07 -0700334 u8 type, u8 code, int offset, __be32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000336 const struct ipv6hdr *hdr = (const struct ipv6hdr*)skb->data;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -0300337 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338 struct ipv6_pinfo *np;
339 struct sock *sk;
340 int err;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900341 struct tcp_sock *tp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 __u32 seq;
Pavel Emelyanovca12a1a2008-07-16 20:28:42 -0700343 struct net *net = dev_net(skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
Pavel Emelyanovca12a1a2008-07-16 20:28:42 -0700345 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
Pavel Emelyanovd86e0da2008-01-31 05:07:21 -0800346 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700347
348 if (sk == NULL) {
Denis V. Luneve41b5362008-10-08 10:33:26 -0700349 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
350 ICMP6_MIB_INERRORS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351 return;
352 }
353
354 if (sk->sk_state == TCP_TIME_WAIT) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -0700355 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 return;
357 }
358
359 bh_lock_sock(sk);
360 if (sock_owned_by_user(sk))
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700361 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362
363 if (sk->sk_state == TCP_CLOSE)
364 goto out;
365
Stephen Hemmingere802af92010-04-22 15:24:53 -0700366 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
367 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
368 goto out;
369 }
370
Linus Torvalds1da177e2005-04-16 15:20:36 -0700371 tp = tcp_sk(sk);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900372 seq = ntohl(th->seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700373 if (sk->sk_state != TCP_LISTEN &&
374 !between(seq, tp->snd_una, tp->snd_nxt)) {
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700375 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376 goto out;
377 }
378
379 np = inet6_sk(sk);
380
381 if (type == ICMPV6_PKT_TOOBIG) {
David S. Miller68d0c6d2011-03-01 13:19:07 -0800382 struct dst_entry *dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383
384 if (sock_owned_by_user(sk))
385 goto out;
386 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
387 goto out;
388
389 /* icmp should have updated the destination cache entry */
390 dst = __sk_dst_check(sk, np->dst_cookie);
391
392 if (dst == NULL) {
393 struct inet_sock *inet = inet_sk(sk);
David S. Miller4c9483b2011-03-12 16:22:43 -0500394 struct flowi6 fl6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395
396 /* BUGGG_FUTURE: Again, it is not clear how
397 to handle rthdr case. Ignore this complexity
398 for now.
399 */
David S. Miller4c9483b2011-03-12 16:22:43 -0500400 memset(&fl6, 0, sizeof(fl6));
401 fl6.flowi6_proto = IPPROTO_TCP;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000402 fl6.daddr = np->daddr;
403 fl6.saddr = np->saddr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500404 fl6.flowi6_oif = sk->sk_bound_dev_if;
405 fl6.flowi6_mark = sk->sk_mark;
David S. Miller1958b852011-03-12 16:36:19 -0500406 fl6.fl6_dport = inet->inet_dport;
407 fl6.fl6_sport = inet->inet_sport;
Lorenzo Colitti462ce7c2014-03-31 16:23:51 +0900408 fl6.flowi6_uid = sock_i_uid(sk);
David S. Miller4c9483b2011-03-12 16:22:43 -0500409 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410
David S. Miller4c9483b2011-03-12 16:22:43 -0500411 dst = ip6_dst_lookup_flow(sk, &fl6, NULL, false);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800412 if (IS_ERR(dst)) {
413 sk->sk_err_soft = -PTR_ERR(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 goto out;
415 }
416
417 } else
418 dst_hold(dst);
419
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800420 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700421 tcp_sync_mss(sk, dst_mtu(dst));
422 tcp_simple_retransmit(sk);
423 } /* else let the usual retransmit timer handle it */
424 dst_release(dst);
425 goto out;
426 }
427
428 icmpv6_err_convert(type, code, &err);
429
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700430 /* Might be for an request_sock */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700431 switch (sk->sk_state) {
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700432 struct request_sock *req, **prev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700433 case TCP_LISTEN:
434 if (sock_owned_by_user(sk))
435 goto out;
436
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -0800437 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
438 &hdr->saddr, inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700439 if (!req)
440 goto out;
441
442 /* ICMPs are not backlogged, hence we cannot get
443 * an established socket here.
444 */
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700445 WARN_ON(req->sk != NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700446
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -0700447 if (seq != tcp_rsk(req)->snt_isn) {
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700448 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700449 goto out;
450 }
451
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -0700452 inet_csk_reqsk_queue_drop(sk, req, prev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700453 goto out;
454
455 case TCP_SYN_SENT:
456 case TCP_SYN_RECV: /* Cannot happen.
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900457 It can, it SYNs are crossed. --ANK */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700458 if (!sock_owned_by_user(sk)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700459 sk->sk_err = err;
460 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
461
462 tcp_done(sk);
463 } else
464 sk->sk_err_soft = err;
465 goto out;
466 }
467
468 if (!sock_owned_by_user(sk) && np->recverr) {
469 sk->sk_err = err;
470 sk->sk_error_report(sk);
471 } else
472 sk->sk_err_soft = err;
473
474out:
475 bh_unlock_sock(sk);
476 sock_put(sk);
477}
478
479
William Allen Simpsone6b4d112009-12-02 18:07:39 +0000480static int tcp_v6_send_synack(struct sock *sk, struct request_sock *req,
481 struct request_values *rvp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700482{
Arnaldo Carvalho de Meloca304b62005-12-13 23:15:40 -0800483 struct inet6_request_sock *treq = inet6_rsk(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700484 struct ipv6_pinfo *np = inet6_sk(sk);
485 struct sk_buff * skb;
486 struct ipv6_txoptions *opt = NULL;
Arnaud Ebalard20c59de2010-06-01 21:35:01 +0000487 struct in6_addr * final_p, final;
David S. Miller4c9483b2011-03-12 16:22:43 -0500488 struct flowi6 fl6;
Denis V. Lunevfd80eb92008-02-29 11:43:03 -0800489 struct dst_entry *dst;
David S. Miller68d0c6d2011-03-01 13:19:07 -0800490 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700491
David S. Miller4c9483b2011-03-12 16:22:43 -0500492 memset(&fl6, 0, sizeof(fl6));
493 fl6.flowi6_proto = IPPROTO_TCP;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000494 fl6.daddr = treq->rmt_addr;
495 fl6.saddr = treq->loc_addr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500496 fl6.flowlabel = 0;
497 fl6.flowi6_oif = treq->iif;
Lorenzo Colitti8cb56e32014-03-26 13:03:12 +0900498 fl6.flowi6_mark = inet_rsk(req)->ir_mark;
David S. Miller1958b852011-03-12 16:36:19 -0500499 fl6.fl6_dport = inet_rsk(req)->rmt_port;
500 fl6.fl6_sport = inet_rsk(req)->loc_port;
Lorenzo Colitti462ce7c2014-03-31 16:23:51 +0900501 fl6.flowi6_uid = sock_i_uid(sk);
David S. Miller4c9483b2011-03-12 16:22:43 -0500502 security_req_classify_flow(req, flowi6_to_flowi(&fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700503
Denis V. Lunevfd80eb92008-02-29 11:43:03 -0800504 opt = np->opt;
David S. Miller4c9483b2011-03-12 16:22:43 -0500505 final_p = fl6_update_dst(&fl6, opt, &final);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700506
David S. Miller4c9483b2011-03-12 16:22:43 -0500507 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, false);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800508 if (IS_ERR(dst)) {
509 err = PTR_ERR(dst);
Boris Ostrovsky738faca2011-04-04 13:07:26 -0700510 dst = NULL;
Denis V. Lunevfd80eb92008-02-29 11:43:03 -0800511 goto done;
David S. Miller68d0c6d2011-03-01 13:19:07 -0800512 }
William Allen Simpsone6b4d112009-12-02 18:07:39 +0000513 skb = tcp_make_synack(sk, dst, req, rvp);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800514 err = -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515 if (skb) {
Herbert Xu8ad50d92010-04-11 02:15:54 +0000516 __tcp_v6_send_check(skb, &treq->loc_addr, &treq->rmt_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700517
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000518 fl6.daddr = treq->rmt_addr;
Eric Dumazetb903d322011-10-27 00:44:35 -0400519 err = ip6_xmit(sk, skb, &fl6, opt, np->tclass);
Gerrit Renkerb9df3cb2006-11-14 11:21:36 -0200520 err = net_xmit_eval(err);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 }
522
523done:
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900524 if (opt && opt != np->opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700525 sock_kfree_s(sk, opt, opt->tot_len);
Eric W. Biederman78b91042006-01-31 17:51:44 -0800526 dst_release(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700527 return err;
528}
529
Octavian Purdila72659ec2010-01-17 19:09:39 -0800530static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req,
531 struct request_values *rvp)
532{
533 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
534 return tcp_v6_send_synack(sk, req, rvp);
535}
536
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700537static void tcp_v6_reqsk_destructor(struct request_sock *req)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700538{
Wei Yongjun800d55f2009-02-23 21:45:33 +0000539 kfree_skb(inet6_rsk(req)->pktopts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540}
541
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800542#ifdef CONFIG_TCP_MD5SIG
543static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000544 const struct in6_addr *addr)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800545{
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000546 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800547}
548
549static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
550 struct sock *addr_sk)
551{
552 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
553}
554
555static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
556 struct request_sock *req)
557{
558 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
559}
560
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800561static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
562 int optlen)
563{
564 struct tcp_md5sig cmd;
565 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800566
567 if (optlen < sizeof(cmd))
568 return -EINVAL;
569
570 if (copy_from_user(&cmd, optval, sizeof(cmd)))
571 return -EFAULT;
572
573 if (sin6->sin6_family != AF_INET6)
574 return -EINVAL;
575
576 if (!cmd.tcpm_keylen) {
Brian Haleye773e4f2007-08-24 23:16:08 -0700577 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000578 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
579 AF_INET);
580 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
581 AF_INET6);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800582 }
583
584 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
585 return -EINVAL;
586
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000587 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
588 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
589 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800590
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000591 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
592 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800593}
594
Adam Langley49a72df2008-07-19 00:01:42 -0700595static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000596 const struct in6_addr *daddr,
597 const struct in6_addr *saddr, int nbytes)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800598{
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800599 struct tcp6_pseudohdr *bp;
Adam Langley49a72df2008-07-19 00:01:42 -0700600 struct scatterlist sg;
YOSHIFUJI Hideaki8d26d762008-04-17 13:19:16 +0900601
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800602 bp = &hp->md5_blk.ip6;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800603 /* 1. TCP pseudo-header (RFC2460) */
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000604 bp->saddr = *saddr;
605 bp->daddr = *daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700606 bp->protocol = cpu_to_be32(IPPROTO_TCP);
Adam Langley00b13042008-07-31 21:36:07 -0700607 bp->len = cpu_to_be32(nbytes);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800608
Adam Langley49a72df2008-07-19 00:01:42 -0700609 sg_init_one(&sg, bp, sizeof(*bp));
610 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
611}
David S. Millerc7da57a2007-10-26 00:41:21 -0700612
Adam Langley49a72df2008-07-19 00:01:42 -0700613static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000614 const struct in6_addr *daddr, struct in6_addr *saddr,
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400615 const struct tcphdr *th)
Adam Langley49a72df2008-07-19 00:01:42 -0700616{
617 struct tcp_md5sig_pool *hp;
618 struct hash_desc *desc;
619
620 hp = tcp_get_md5sig_pool();
621 if (!hp)
622 goto clear_hash_noput;
623 desc = &hp->md5_desc;
624
625 if (crypto_hash_init(desc))
626 goto clear_hash;
627 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
628 goto clear_hash;
629 if (tcp_md5_hash_header(hp, th))
630 goto clear_hash;
631 if (tcp_md5_hash_key(hp, key))
632 goto clear_hash;
633 if (crypto_hash_final(desc, md5_hash))
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800634 goto clear_hash;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800635
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800636 tcp_put_md5sig_pool();
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800637 return 0;
Adam Langley49a72df2008-07-19 00:01:42 -0700638
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800639clear_hash:
640 tcp_put_md5sig_pool();
641clear_hash_noput:
642 memset(md5_hash, 0, 16);
Adam Langley49a72df2008-07-19 00:01:42 -0700643 return 1;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800644}
645
Adam Langley49a72df2008-07-19 00:01:42 -0700646static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400647 const struct sock *sk,
648 const struct request_sock *req,
649 const struct sk_buff *skb)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800650{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000651 const struct in6_addr *saddr, *daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700652 struct tcp_md5sig_pool *hp;
653 struct hash_desc *desc;
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400654 const struct tcphdr *th = tcp_hdr(skb);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800655
656 if (sk) {
657 saddr = &inet6_sk(sk)->saddr;
658 daddr = &inet6_sk(sk)->daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700659 } else if (req) {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800660 saddr = &inet6_rsk(req)->loc_addr;
661 daddr = &inet6_rsk(req)->rmt_addr;
Adam Langley49a72df2008-07-19 00:01:42 -0700662 } else {
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000663 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
Adam Langley49a72df2008-07-19 00:01:42 -0700664 saddr = &ip6h->saddr;
665 daddr = &ip6h->daddr;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800666 }
Adam Langley49a72df2008-07-19 00:01:42 -0700667
668 hp = tcp_get_md5sig_pool();
669 if (!hp)
670 goto clear_hash_noput;
671 desc = &hp->md5_desc;
672
673 if (crypto_hash_init(desc))
674 goto clear_hash;
675
676 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
677 goto clear_hash;
678 if (tcp_md5_hash_header(hp, th))
679 goto clear_hash;
680 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
681 goto clear_hash;
682 if (tcp_md5_hash_key(hp, key))
683 goto clear_hash;
684 if (crypto_hash_final(desc, md5_hash))
685 goto clear_hash;
686
687 tcp_put_md5sig_pool();
688 return 0;
689
690clear_hash:
691 tcp_put_md5sig_pool();
692clear_hash_noput:
693 memset(md5_hash, 0, 16);
694 return 1;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800695}
696
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400697static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800698{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400699 const __u8 *hash_location = NULL;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800700 struct tcp_md5sig_key *hash_expected;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000701 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400702 const struct tcphdr *th = tcp_hdr(skb);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800703 int genhash;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800704 u8 newhash[16];
705
706 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
YOSHIFUJI Hideaki7d5d5522008-04-17 12:29:53 +0900707 hash_location = tcp_parse_md5sig_option(th);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800708
David S. Miller785957d2008-07-30 03:03:15 -0700709 /* We've parsed the options - do we have a hash? */
710 if (!hash_expected && !hash_location)
711 return 0;
712
713 if (hash_expected && !hash_location) {
714 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800715 return 1;
716 }
717
David S. Miller785957d2008-07-30 03:03:15 -0700718 if (!hash_expected && hash_location) {
719 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800720 return 1;
721 }
722
723 /* check the signature */
Adam Langley49a72df2008-07-19 00:01:42 -0700724 genhash = tcp_v6_md5_hash_skb(newhash,
725 hash_expected,
726 NULL, NULL, skb);
727
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800728 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
729 if (net_ratelimit()) {
Joe Perches5856b602010-01-08 00:59:52 -0800730 printk(KERN_INFO "MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800731 genhash ? "failed" : "mismatch",
Harvey Harrison0c6ce782008-10-28 16:09:23 -0700732 &ip6h->saddr, ntohs(th->source),
733 &ip6h->daddr, ntohs(th->dest));
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800734 }
735 return 1;
736 }
737 return 0;
738}
739#endif
740
Glenn Griffinc6aefaf2008-02-07 21:49:26 -0800741struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700742 .family = AF_INET6,
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -0700743 .obj_size = sizeof(struct tcp6_request_sock),
Octavian Purdila72659ec2010-01-17 19:09:39 -0800744 .rtx_syn_ack = tcp_v6_rtx_synack,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700745 .send_ack = tcp_v6_reqsk_send_ack,
746 .destructor = tcp_v6_reqsk_destructor,
Octavian Purdila72659ec2010-01-17 19:09:39 -0800747 .send_reset = tcp_v6_send_reset,
748 .syn_ack_timeout = tcp_syn_ack_timeout,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700749};
750
#ifdef CONFIG_TCP_MD5SIG
/*
 * TCP-MD5 helpers for IPv6 connection requests; tcp_v6_conn_request()
 * installs this table as the request's af_specific pointer.
 */
static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_lookup	= tcp_v6_reqsk_md5_lookup,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800757
Herbert Xu8ad50d92010-04-11 02:15:54 +0000758static void __tcp_v6_send_check(struct sk_buff *skb,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000759 const struct in6_addr *saddr, const struct in6_addr *daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700760{
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700761 struct tcphdr *th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700762
Patrick McHardy84fa7932006-08-29 16:44:56 -0700763 if (skb->ip_summed == CHECKSUM_PARTIAL) {
Herbert Xu8ad50d92010-04-11 02:15:54 +0000764 th->check = ~tcp_v6_check(skb->len, saddr, daddr, 0);
Herbert Xu663ead32007-04-09 11:59:07 -0700765 skb->csum_start = skb_transport_header(skb) - skb->head;
Al Viroff1dcad2006-11-20 18:07:29 -0800766 skb->csum_offset = offsetof(struct tcphdr, check);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700767 } else {
Herbert Xu8ad50d92010-04-11 02:15:54 +0000768 th->check = tcp_v6_check(skb->len, saddr, daddr,
769 csum_partial(th, th->doff << 2,
770 skb->csum));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700771 }
772}
773
Herbert Xubb296242010-04-11 02:15:55 +0000774static void tcp_v6_send_check(struct sock *sk, struct sk_buff *skb)
Herbert Xu8ad50d92010-04-11 02:15:54 +0000775{
776 struct ipv6_pinfo *np = inet6_sk(sk);
777
778 __tcp_v6_send_check(skb, &np->saddr, &np->daddr);
779}
780
Herbert Xua430a432006-07-08 13:34:56 -0700781static int tcp_v6_gso_send_check(struct sk_buff *skb)
782{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000783 const struct ipv6hdr *ipv6h;
Herbert Xua430a432006-07-08 13:34:56 -0700784 struct tcphdr *th;
785
786 if (!pskb_may_pull(skb, sizeof(*th)))
787 return -EINVAL;
788
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700789 ipv6h = ipv6_hdr(skb);
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700790 th = tcp_hdr(skb);
Herbert Xua430a432006-07-08 13:34:56 -0700791
792 th->check = 0;
Patrick McHardy84fa7932006-08-29 16:44:56 -0700793 skb->ip_summed = CHECKSUM_PARTIAL;
Herbert Xu8ad50d92010-04-11 02:15:54 +0000794 __tcp_v6_send_check(skb, &ipv6h->saddr, &ipv6h->daddr);
Herbert Xua430a432006-07-08 13:34:56 -0700795 return 0;
796}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700797
Herbert Xu36990672009-05-22 00:45:28 -0700798static struct sk_buff **tcp6_gro_receive(struct sk_buff **head,
799 struct sk_buff *skb)
Herbert Xu684f2172009-01-08 10:41:23 -0800800{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000801 const struct ipv6hdr *iph = skb_gro_network_header(skb);
Herbert Xu684f2172009-01-08 10:41:23 -0800802
803 switch (skb->ip_summed) {
804 case CHECKSUM_COMPLETE:
Herbert Xu86911732009-01-29 14:19:50 +0000805 if (!tcp_v6_check(skb_gro_len(skb), &iph->saddr, &iph->daddr,
Herbert Xu684f2172009-01-08 10:41:23 -0800806 skb->csum)) {
807 skb->ip_summed = CHECKSUM_UNNECESSARY;
808 break;
809 }
810
811 /* fall through */
812 case CHECKSUM_NONE:
813 NAPI_GRO_CB(skb)->flush = 1;
814 return NULL;
815 }
816
817 return tcp_gro_receive(head, skb);
818}
Herbert Xu684f2172009-01-08 10:41:23 -0800819
Herbert Xu36990672009-05-22 00:45:28 -0700820static int tcp6_gro_complete(struct sk_buff *skb)
Herbert Xu684f2172009-01-08 10:41:23 -0800821{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000822 const struct ipv6hdr *iph = ipv6_hdr(skb);
Herbert Xu684f2172009-01-08 10:41:23 -0800823 struct tcphdr *th = tcp_hdr(skb);
824
825 th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
826 &iph->saddr, &iph->daddr, 0);
827 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
828
829 return tcp_gro_complete(skb);
830}
Herbert Xu684f2172009-01-08 10:41:23 -0800831
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700832static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
Eric Dumazetb903d322011-10-27 00:44:35 -0400833 u32 ts, struct tcp_md5sig_key *key, int rst, u8 tclass)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700834{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400835 const struct tcphdr *th = tcp_hdr(skb);
836 struct tcphdr *t1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700837 struct sk_buff *buff;
David S. Miller4c9483b2011-03-12 16:22:43 -0500838 struct flowi6 fl6;
Eric Dumazetadf30902009-06-02 05:19:30 +0000839 struct net *net = dev_net(skb_dst(skb)->dev);
Daniel Lezcanoe5047992008-03-07 11:16:26 -0800840 struct sock *ctl_sk = net->ipv6.tcp_sk;
YOSHIFUJI Hideaki9cb57342008-01-12 02:16:03 -0800841 unsigned int tot_len = sizeof(struct tcphdr);
Eric Dumazetadf30902009-06-02 05:19:30 +0000842 struct dst_entry *dst;
Al Viroe69a4ad2006-11-14 20:56:00 -0800843 __be32 *topt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700844
845 if (ts)
YOSHIFUJI Hideaki4244f8a2006-10-10 19:40:50 -0700846 tot_len += TCPOLEN_TSTAMP_ALIGNED;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800847#ifdef CONFIG_TCP_MD5SIG
848 if (key)
849 tot_len += TCPOLEN_MD5SIG_ALIGNED;
850#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700851
852 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
853 GFP_ATOMIC);
854 if (buff == NULL)
855 return;
856
857 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
858
Ilpo Järvinen77c676d2008-10-09 14:41:38 -0700859 t1 = (struct tcphdr *) skb_push(buff, tot_len);
Herbert Xu6651ffc2010-04-21 00:47:15 -0700860 skb_reset_transport_header(buff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700861
862 /* Swap the send and the receive. */
863 memset(t1, 0, sizeof(*t1));
864 t1->dest = th->source;
865 t1->source = th->dest;
Ilpo Järvinen77c676d2008-10-09 14:41:38 -0700866 t1->doff = tot_len / 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700867 t1->seq = htonl(seq);
868 t1->ack_seq = htonl(ack);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700869 t1->ack = !rst || !th->ack;
870 t1->rst = rst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700871 t1->window = htons(win);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800872
Al Viroe69a4ad2006-11-14 20:56:00 -0800873 topt = (__be32 *)(t1 + 1);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900874
Linus Torvalds1da177e2005-04-16 15:20:36 -0700875 if (ts) {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800876 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
877 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
878 *topt++ = htonl(tcp_time_stamp);
Ilpo Järvinen53b12572008-10-08 14:36:33 -0700879 *topt++ = htonl(ts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700880 }
881
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800882#ifdef CONFIG_TCP_MD5SIG
883 if (key) {
884 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
885 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
Adam Langley49a72df2008-07-19 00:01:42 -0700886 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
Adam Langley90b7e112008-07-31 20:49:48 -0700887 &ipv6_hdr(skb)->saddr,
888 &ipv6_hdr(skb)->daddr, t1);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800889 }
890#endif
891
David S. Miller4c9483b2011-03-12 16:22:43 -0500892 memset(&fl6, 0, sizeof(fl6));
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000893 fl6.daddr = ipv6_hdr(skb)->saddr;
894 fl6.saddr = ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895
David S. Millere5700af2010-04-21 14:59:20 -0700896 buff->ip_summed = CHECKSUM_PARTIAL;
897 buff->csum = 0;
898
David S. Miller4c9483b2011-03-12 16:22:43 -0500899 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700900
David S. Miller4c9483b2011-03-12 16:22:43 -0500901 fl6.flowi6_proto = IPPROTO_TCP;
Alexey Kuznetsov259c5a72012-10-12 04:34:17 +0000902 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
903 fl6.flowi6_oif = inet6_iif(skb);
Lorenzo Colitti2887dec2014-03-18 20:52:27 +0900904 fl6.flowi6_mark = IP6_REPLY_MARK(net, skb->mark);
David S. Miller1958b852011-03-12 16:36:19 -0500905 fl6.fl6_dport = t1->dest;
906 fl6.fl6_sport = t1->source;
David S. Miller4c9483b2011-03-12 16:22:43 -0500907 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700908
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700909 /* Pass a socket to ip6_dst_lookup either it is for RST
910 * Underlying function will use this to retrieve the network
911 * namespace
912 */
David S. Miller4c9483b2011-03-12 16:22:43 -0500913 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL, false);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800914 if (!IS_ERR(dst)) {
915 skb_dst_set(buff, dst);
Eric Dumazetb903d322011-10-27 00:44:35 -0400916 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800917 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
918 if (rst)
919 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
920 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700921 }
922
923 kfree_skb(buff);
924}
925
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700926static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
927{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400928 const struct tcphdr *th = tcp_hdr(skb);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700929 u32 seq = 0, ack_seq = 0;
Guo-Fu Tsengfa3e5b42008-10-09 21:11:56 -0700930 struct tcp_md5sig_key *key = NULL;
Shawn Lu658ddaa2012-01-31 22:35:48 +0000931#ifdef CONFIG_TCP_MD5SIG
932 const __u8 *hash_location = NULL;
933 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
934 unsigned char newhash[16];
935 int genhash;
936 struct sock *sk1 = NULL;
937#endif
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700938
939 if (th->rst)
940 return;
941
942 if (!ipv6_unicast_destination(skb))
943 return;
944
945#ifdef CONFIG_TCP_MD5SIG
Shawn Lu658ddaa2012-01-31 22:35:48 +0000946 hash_location = tcp_parse_md5sig_option(th);
947 if (!sk && hash_location) {
948 /*
949 * active side is lost. Try to find listening socket through
950 * source port, and then find md5 key through listening socket.
951 * we are not loose security here:
952 * Incoming packet is checked with md5 hash with finding key,
953 * no RST generated if md5 hash doesn't match.
954 */
955 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
956 &tcp_hashinfo, &ipv6h->daddr,
957 ntohs(th->source), inet6_iif(skb));
958 if (!sk1)
959 return;
960
961 rcu_read_lock();
962 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
963 if (!key)
964 goto release_sk1;
965
966 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
967 if (genhash || memcmp(hash_location, newhash, 16) != 0)
968 goto release_sk1;
969 } else {
970 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
971 }
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700972#endif
973
974 if (th->ack)
975 seq = ntohl(th->ack_seq);
976 else
977 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
978 (th->doff << 2);
979
Eric Dumazetb903d322011-10-27 00:44:35 -0400980 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, key, 1, 0);
Shawn Lu658ddaa2012-01-31 22:35:48 +0000981
982#ifdef CONFIG_TCP_MD5SIG
983release_sk1:
984 if (sk1) {
985 rcu_read_unlock();
986 sock_put(sk1);
987 }
988#endif
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700989}
990
991static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
Eric Dumazetb903d322011-10-27 00:44:35 -0400992 struct tcp_md5sig_key *key, u8 tclass)
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700993{
Eric Dumazetb903d322011-10-27 00:44:35 -0400994 tcp_v6_send_response(skb, seq, ack, win, ts, key, 0, tclass);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700995}
996
Linus Torvalds1da177e2005-04-16 15:20:36 -0700997static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
998{
Arnaldo Carvalho de Melo8feaf0c2005-08-09 20:09:30 -0700999 struct inet_timewait_sock *tw = inet_twsk(sk);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001000 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001001
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +09001002 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
Arnaldo Carvalho de Melo8feaf0c2005-08-09 20:09:30 -07001003 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
Eric Dumazetb903d322011-10-27 00:44:35 -04001004 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
1005 tw->tw_tclass);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001006
Arnaldo Carvalho de Melo8feaf0c2005-08-09 20:09:30 -07001007 inet_twsk_put(tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001008}
1009
Gui Jianfeng6edafaa2008-08-06 23:50:04 -07001010static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
1011 struct request_sock *req)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001012{
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +09001013 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
Eric Dumazetb903d322011-10-27 00:44:35 -04001014 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr), 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015}
1016
1017
1018static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
1019{
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -07001020 struct request_sock *req, **prev;
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001021 const struct tcphdr *th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001022 struct sock *nsk;
1023
1024 /* Find possible connection requests. */
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -08001025 req = inet6_csk_search_req(sk, &prev, th->source,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001026 &ipv6_hdr(skb)->saddr,
1027 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001028 if (req)
1029 return tcp_check_req(sk, skb, req, prev);
1030
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001031 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
Pavel Emelyanovd86e0da2008-01-31 05:07:21 -08001032 &ipv6_hdr(skb)->saddr, th->source,
1033 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001034
1035 if (nsk) {
1036 if (nsk->sk_state != TCP_TIME_WAIT) {
1037 bh_lock_sock(nsk);
1038 return nsk;
1039 }
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001040 inet_twsk_put(inet_twsk(nsk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001041 return NULL;
1042 }
1043
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001044#ifdef CONFIG_SYN_COOKIES
Florian Westphalaf9b4732010-06-03 00:43:44 +00001045 if (!th->syn)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001046 sk = cookie_v6_check(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001047#endif
1048 return sk;
1049}
1050
Linus Torvalds1da177e2005-04-16 15:20:36 -07001051/* FIXME: this is substantially similar to the ipv4 code.
1052 * Can some kind of merge be done? -- erics
1053 */
1054static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1055{
William Allen Simpson4957faa2009-12-02 18:25:27 +00001056 struct tcp_extend_values tmp_ext;
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001057 struct tcp_options_received tmp_opt;
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001058 const u8 *hash_location;
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001059 struct request_sock *req;
Arnaldo Carvalho de Meloca304b62005-12-13 23:15:40 -08001060 struct inet6_request_sock *treq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001061 struct ipv6_pinfo *np = inet6_sk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001062 struct tcp_sock *tp = tcp_sk(sk);
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001063 __u32 isn = TCP_SKB_CB(skb)->when;
David S. Miller493f3772010-12-02 12:14:29 -08001064 struct dst_entry *dst = NULL;
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001065 int want_cookie = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001066
1067 if (skb->protocol == htons(ETH_P_IP))
1068 return tcp_v4_conn_request(sk, skb);
1069
1070 if (!ipv6_unicast_destination(skb))
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001071 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001072
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001073 if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
Eric Dumazet946cedc2011-08-30 03:21:44 +00001074 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
1075 if (!want_cookie)
1076 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001077 }
1078
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001079 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001080 goto drop;
1081
Arnaldo Carvalho de Meloca304b62005-12-13 23:15:40 -08001082 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001083 if (req == NULL)
1084 goto drop;
1085
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001086#ifdef CONFIG_TCP_MD5SIG
1087 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1088#endif
1089
Linus Torvalds1da177e2005-04-16 15:20:36 -07001090 tcp_clear_options(&tmp_opt);
1091 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1092 tmp_opt.user_mss = tp->rx_opt.user_mss;
David S. Millerbb5b7c12009-12-15 20:56:42 -08001093 tcp_parse_options(skb, &tmp_opt, &hash_location, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001094
William Allen Simpson4957faa2009-12-02 18:25:27 +00001095 if (tmp_opt.cookie_plus > 0 &&
1096 tmp_opt.saw_tstamp &&
1097 !tp->rx_opt.cookie_out_never &&
1098 (sysctl_tcp_cookie_size > 0 ||
1099 (tp->cookie_values != NULL &&
1100 tp->cookie_values->cookie_desired > 0))) {
1101 u8 *c;
1102 u32 *d;
1103 u32 *mess = &tmp_ext.cookie_bakery[COOKIE_DIGEST_WORDS];
1104 int l = tmp_opt.cookie_plus - TCPOLEN_COOKIE_BASE;
1105
1106 if (tcp_cookie_generator(&tmp_ext.cookie_bakery[0]) != 0)
1107 goto drop_and_free;
1108
1109 /* Secret recipe starts with IP addresses */
Eric Dumazet0eae88f2010-04-20 19:06:52 -07001110 d = (__force u32 *)&ipv6_hdr(skb)->daddr.s6_addr32[0];
William Allen Simpson4957faa2009-12-02 18:25:27 +00001111 *mess++ ^= *d++;
1112 *mess++ ^= *d++;
1113 *mess++ ^= *d++;
1114 *mess++ ^= *d++;
Eric Dumazet0eae88f2010-04-20 19:06:52 -07001115 d = (__force u32 *)&ipv6_hdr(skb)->saddr.s6_addr32[0];
William Allen Simpson4957faa2009-12-02 18:25:27 +00001116 *mess++ ^= *d++;
1117 *mess++ ^= *d++;
1118 *mess++ ^= *d++;
1119 *mess++ ^= *d++;
1120
1121 /* plus variable length Initiator Cookie */
1122 c = (u8 *)mess;
1123 while (l-- > 0)
1124 *c++ ^= *hash_location++;
1125
William Allen Simpson4957faa2009-12-02 18:25:27 +00001126 want_cookie = 0; /* not our kind of cookie */
William Allen Simpson4957faa2009-12-02 18:25:27 +00001127 tmp_ext.cookie_out_never = 0; /* false */
1128 tmp_ext.cookie_plus = tmp_opt.cookie_plus;
1129 } else if (!tp->rx_opt.cookie_in_always) {
1130 /* redundant indications, but ensure initialization. */
1131 tmp_ext.cookie_out_never = 1; /* true */
1132 tmp_ext.cookie_plus = 0;
1133 } else {
1134 goto drop_and_free;
1135 }
1136 tmp_ext.cookie_in_always = tp->rx_opt.cookie_in_always;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001137
Florian Westphal4dfc2812008-04-10 03:12:40 -07001138 if (want_cookie && !tmp_opt.saw_tstamp)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001139 tcp_clear_options(&tmp_opt);
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001140
Linus Torvalds1da177e2005-04-16 15:20:36 -07001141 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1142 tcp_openreq_init(req, &tmp_opt, skb);
1143
Arnaldo Carvalho de Meloca304b62005-12-13 23:15:40 -08001144 treq = inet6_rsk(req);
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001145 treq->rmt_addr = ipv6_hdr(skb)->saddr;
1146 treq->loc_addr = ipv6_hdr(skb)->daddr;
Florian Westphal172d69e2010-06-21 11:48:45 +00001147 if (!want_cookie || tmp_opt.tstamp_ok)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001148 TCP_ECN_create_request(req, tcp_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001149
Eric Dumazet4d0fe502011-11-23 17:29:23 -05001150 treq->iif = sk->sk_bound_dev_if;
Lorenzo Colitti8cb56e32014-03-26 13:03:12 +09001151 inet_rsk(req)->ir_mark = inet_request_mark(sk, skb);
Eric Dumazet4d0fe502011-11-23 17:29:23 -05001152
1153 /* So that link locals have meaning */
1154 if (!sk->sk_bound_dev_if &&
1155 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1156 treq->iif = inet6_iif(skb);
1157
Florian Westphal2bbdf382010-06-13 11:29:39 +00001158 if (!isn) {
David S. Miller493f3772010-12-02 12:14:29 -08001159 struct inet_peer *peer = NULL;
1160
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001161 if (ipv6_opt_accepted(sk, skb) ||
1162 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1163 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1164 atomic_inc(&skb->users);
1165 treq->pktopts = skb;
1166 }
David S. Miller493f3772010-12-02 12:14:29 -08001167
1168 if (want_cookie) {
Florian Westphal2bbdf382010-06-13 11:29:39 +00001169 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1170 req->cookie_ts = tmp_opt.tstamp_ok;
David S. Miller493f3772010-12-02 12:14:29 -08001171 goto have_isn;
Florian Westphal2bbdf382010-06-13 11:29:39 +00001172 }
David S. Miller493f3772010-12-02 12:14:29 -08001173
1174 /* VJ's idea. We save last timestamp seen
1175 * from the destination in peer table, when entering
1176 * state TIME-WAIT, and check against it before
1177 * accepting new connection request.
1178 *
1179 * If "isn" is not zero, this request hit alive
1180 * timewait bucket, so that all the necessary checks
1181 * are made in the function processing timewait state.
1182 */
1183 if (tmp_opt.saw_tstamp &&
1184 tcp_death_row.sysctl_tw_recycle &&
1185 (dst = inet6_csk_route_req(sk, req)) != NULL &&
1186 (peer = rt6_get_peer((struct rt6_info *)dst)) != NULL &&
David S. Miller7a71ed82011-02-09 14:30:26 -08001187 ipv6_addr_equal((struct in6_addr *)peer->daddr.addr.a6,
David S. Miller493f3772010-12-02 12:14:29 -08001188 &treq->rmt_addr)) {
1189 inet_peer_refcheck(peer);
1190 if ((u32)get_seconds() - peer->tcp_ts_stamp < TCP_PAWS_MSL &&
1191 (s32)(peer->tcp_ts - req->ts_recent) >
1192 TCP_PAWS_WINDOW) {
1193 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1194 goto drop_and_release;
1195 }
1196 }
1197 /* Kill the following clause, if you dislike this way. */
1198 else if (!sysctl_tcp_syncookies &&
1199 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1200 (sysctl_max_syn_backlog >> 2)) &&
1201 (!peer || !peer->tcp_ts_stamp) &&
1202 (!dst || !dst_metric(dst, RTAX_RTT))) {
1203 /* Without syncookies last quarter of
1204 * backlog is filled with destinations,
1205 * proven to be alive.
1206 * It means that we continue to communicate
1207 * to destinations, already remembered
1208 * to the moment of synflood.
1209 */
1210 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
1211 &treq->rmt_addr, ntohs(tcp_hdr(skb)->source));
1212 goto drop_and_release;
1213 }
1214
1215 isn = tcp_v6_init_sequence(skb);
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001216 }
David S. Miller493f3772010-12-02 12:14:29 -08001217have_isn:
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -07001218 tcp_rsk(req)->snt_isn = isn;
Jerry Chu9ad7c042011-06-08 11:08:38 +00001219 tcp_rsk(req)->snt_synack = tcp_time_stamp;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001220
Venkat Yekkirala4237c752006-07-24 23:32:50 -07001221 security_inet_conn_request(sk, skb, req);
1222
William Allen Simpson4957faa2009-12-02 18:25:27 +00001223 if (tcp_v6_send_synack(sk, req,
1224 (struct request_values *)&tmp_ext) ||
1225 want_cookie)
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001226 goto drop_and_free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001228 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1229 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001230
David S. Miller493f3772010-12-02 12:14:29 -08001231drop_and_release:
1232 dst_release(dst);
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001233drop_and_free:
1234 reqsk_free(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001235drop:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001236 return 0; /* don't send reset */
1237}
1238
1239static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -07001240 struct request_sock *req,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001241 struct dst_entry *dst)
1242{
Vegard Nossum78d15e82008-09-12 16:17:43 -07001243 struct inet6_request_sock *treq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001244 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1245 struct tcp6_sock *newtcp6sk;
1246 struct inet_sock *newinet;
1247 struct tcp_sock *newtp;
1248 struct sock *newsk;
1249 struct ipv6_txoptions *opt;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001250#ifdef CONFIG_TCP_MD5SIG
1251 struct tcp_md5sig_key *key;
1252#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001253
1254 if (skb->protocol == htons(ETH_P_IP)) {
1255 /*
1256 * v6 mapped
1257 */
1258
1259 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1260
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001261 if (newsk == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001262 return NULL;
1263
1264 newtcp6sk = (struct tcp6_sock *)newsk;
1265 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1266
1267 newinet = inet_sk(newsk);
1268 newnp = inet6_sk(newsk);
1269 newtp = tcp_sk(newsk);
1270
1271 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1272
Eric Dumazetc720c7e2009-10-15 06:30:45 +00001273 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newnp->daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001274
Eric Dumazetc720c7e2009-10-15 06:30:45 +00001275 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001276
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001277 newnp->rcv_saddr = newnp->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001278
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001279 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001280 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001281#ifdef CONFIG_TCP_MD5SIG
1282 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1283#endif
1284
Yan, Zheng676a1182011-09-25 02:21:30 +00001285 newnp->ipv6_ac_list = NULL;
1286 newnp->ipv6_fl_list = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287 newnp->pktoptions = NULL;
1288 newnp->opt = NULL;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001289 newnp->mcast_oif = inet6_iif(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001290 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
Jiri Benc4c507d22012-02-09 09:35:49 +00001291 newnp->rcv_tclass = ipv6_tclass(ipv6_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001292
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -07001293 /*
1294 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1295 * here, tcp_create_openreq_child now does this for us, see the comment in
1296 * that function for the gory details. -acme
Linus Torvalds1da177e2005-04-16 15:20:36 -07001297 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001298
1299 /* It is tricky place. Until this moment IPv4 tcp
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001300 worked with IPv6 icsk.icsk_af_ops.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001301 Sync it now.
1302 */
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001303 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001304
1305 return newsk;
1306 }
1307
Vegard Nossum78d15e82008-09-12 16:17:43 -07001308 treq = inet6_rsk(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001309 opt = np->opt;
1310
1311 if (sk_acceptq_is_full(sk))
1312 goto out_overflow;
1313
David S. Miller493f3772010-12-02 12:14:29 -08001314 if (!dst) {
1315 dst = inet6_csk_route_req(sk, req);
1316 if (!dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001317 goto out;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001318 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001319
1320 newsk = tcp_create_openreq_child(sk, req, skb);
1321 if (newsk == NULL)
Balazs Scheidler093d2822010-10-21 13:06:43 +02001322 goto out_nonewsk;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001323
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -07001324 /*
1325 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1326 * count here, tcp_create_openreq_child now does this for us, see the
1327 * comment in that function for the gory details. -acme
1328 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001329
Stephen Hemminger59eed272006-08-25 15:55:43 -07001330 newsk->sk_gso_type = SKB_GSO_TCPV6;
YOSHIFUJI Hideaki8e1ef0a2006-08-29 17:15:09 -07001331 __ip6_dst_store(newsk, dst, NULL, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001332
1333 newtcp6sk = (struct tcp6_sock *)newsk;
1334 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1335
1336 newtp = tcp_sk(newsk);
1337 newinet = inet_sk(newsk);
1338 newnp = inet6_sk(newsk);
1339
1340 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1341
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +00001342 newnp->daddr = treq->rmt_addr;
1343 newnp->saddr = treq->loc_addr;
1344 newnp->rcv_saddr = treq->loc_addr;
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -07001345 newsk->sk_bound_dev_if = treq->iif;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001346
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001347 /* Now IPv6 options...
Linus Torvalds1da177e2005-04-16 15:20:36 -07001348
1349 First: no IPv4 options.
1350 */
Eric Dumazetf6d8bd02011-04-21 09:45:37 +00001351 newinet->inet_opt = NULL;
Yan, Zheng676a1182011-09-25 02:21:30 +00001352 newnp->ipv6_ac_list = NULL;
Masayuki Nakagawad35690b2007-03-16 16:14:03 -07001353 newnp->ipv6_fl_list = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001354
1355 /* Clone RX bits */
1356 newnp->rxopt.all = np->rxopt.all;
1357
1358 /* Clone pktoptions received with SYN */
1359 newnp->pktoptions = NULL;
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -07001360 if (treq->pktopts != NULL) {
1361 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
1362 kfree_skb(treq->pktopts);
1363 treq->pktopts = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001364 if (newnp->pktoptions)
1365 skb_set_owner_r(newnp->pktoptions, newsk);
1366 }
1367 newnp->opt = NULL;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001368 newnp->mcast_oif = inet6_iif(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001369 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
Jiri Benc4c507d22012-02-09 09:35:49 +00001370 newnp->rcv_tclass = ipv6_tclass(ipv6_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001371
1372 /* Clone native IPv6 options from listening socket (if any)
1373
1374 Yes, keeping reference count would be much more clever,
1375 but we make one more one thing there: reattach optmem
1376 to newsk.
1377 */
1378 if (opt) {
1379 newnp->opt = ipv6_dup_options(newsk, opt);
1380 if (opt != np->opt)
1381 sock_kfree_s(sk, opt, opt->tot_len);
1382 }
1383
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001384 inet_csk(newsk)->icsk_ext_hdr_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001385 if (newnp->opt)
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001386 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1387 newnp->opt->opt_flen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001388
John Heffner5d424d52006-03-20 17:53:41 -08001389 tcp_mtup_init(newsk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001390 tcp_sync_mss(newsk, dst_mtu(dst));
David S. Miller0dbaee32010-12-13 12:52:14 -08001391 newtp->advmss = dst_metric_advmss(dst);
Neal Cardwelld135c522012-04-22 09:45:47 +00001392 if (tcp_sk(sk)->rx_opt.user_mss &&
1393 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1394 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1395
Linus Torvalds1da177e2005-04-16 15:20:36 -07001396 tcp_initialize_rcv_mss(newsk);
Jerry Chu9ad7c042011-06-08 11:08:38 +00001397 if (tcp_rsk(req)->snt_synack)
1398 tcp_valid_rtt_meas(newsk,
1399 tcp_time_stamp - tcp_rsk(req)->snt_synack);
1400 newtp->total_retrans = req->retrans;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001401
Eric Dumazetc720c7e2009-10-15 06:30:45 +00001402 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1403 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001404
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001405#ifdef CONFIG_TCP_MD5SIG
1406 /* Copy over the MD5 key from the original socket */
1407 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1408 /* We're using one, so create a matching key
1409 * on the newsk structure. If we fail to get
1410 * memory, then we end up not copying the key
1411 * across. Shucks.
1412 */
Eric Dumazeta915da9b2012-01-31 05:18:33 +00001413 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newnp->daddr,
1414 AF_INET6, key->key, key->keylen, GFP_ATOMIC);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001415 }
1416#endif
1417
Balazs Scheidler093d2822010-10-21 13:06:43 +02001418 if (__inet_inherit_port(sk, newsk) < 0) {
Christoph Paaschd46699a2012-12-14 04:07:58 +00001419 inet_csk_prepare_forced_close(newsk);
1420 tcp_done(newsk);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001421 goto out;
1422 }
Eric Dumazet9327f702009-12-04 03:46:54 +00001423 __inet6_hash(newsk, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001424
1425 return newsk;
1426
1427out_overflow:
Pavel Emelyanovde0744a2008-07-16 20:31:16 -07001428 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001429out_nonewsk:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001430 if (opt && opt != np->opt)
1431 sock_kfree_s(sk, opt, opt->tot_len);
1432 dst_release(dst);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001433out:
1434 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001435 return NULL;
1436}
1437
Al Virob51655b2006-11-14 21:40:42 -08001438static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001439{
Patrick McHardy84fa7932006-08-29 16:44:56 -07001440 if (skb->ip_summed == CHECKSUM_COMPLETE) {
Herbert Xu684f2172009-01-08 10:41:23 -08001441 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001442 &ipv6_hdr(skb)->daddr, skb->csum)) {
Herbert Xufb286bb2005-11-10 13:01:24 -08001443 skb->ip_summed = CHECKSUM_UNNECESSARY;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001444 return 0;
Herbert Xufb286bb2005-11-10 13:01:24 -08001445 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001446 }
Herbert Xufb286bb2005-11-10 13:01:24 -08001447
Herbert Xu684f2172009-01-08 10:41:23 -08001448 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001449 &ipv6_hdr(skb)->saddr,
1450 &ipv6_hdr(skb)->daddr, 0));
Herbert Xufb286bb2005-11-10 13:01:24 -08001451
Linus Torvalds1da177e2005-04-16 15:20:36 -07001452 if (skb->len <= 76) {
Herbert Xufb286bb2005-11-10 13:01:24 -08001453 return __skb_checksum_complete(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001454 }
1455 return 0;
1456}
1457
1458/* The socket must have it's spinlock held when we get
1459 * here.
1460 *
1461 * We have a potential double-lock case here, so even when
1462 * doing backlog processing we use the BH locking scheme.
1463 * This is because we cannot sleep with the original spinlock
1464 * held.
1465 */
1466static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1467{
1468 struct ipv6_pinfo *np = inet6_sk(sk);
1469 struct tcp_sock *tp;
1470 struct sk_buff *opt_skb = NULL;
1471
1472 /* Imagine: socket is IPv6. IPv4 packet arrives,
1473 goes to IPv4 receive handler and backlogged.
1474 From backlog it always goes here. Kerboom...
1475 Fortunately, tcp_rcv_established and rcv_established
1476 handle them correctly, but it is not case with
1477 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1478 */
1479
1480 if (skb->protocol == htons(ETH_P_IP))
1481 return tcp_v4_do_rcv(sk, skb);
1482
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001483#ifdef CONFIG_TCP_MD5SIG
1484 if (tcp_v6_inbound_md5_hash (sk, skb))
1485 goto discard;
1486#endif
1487
Dmitry Mishinfda9ef52006-08-31 15:28:39 -07001488 if (sk_filter(sk, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001489 goto discard;
1490
1491 /*
1492 * socket locking is here for SMP purposes as backlog rcv
1493 * is currently called with bh processing disabled.
1494 */
1495
1496 /* Do Stevens' IPV6_PKTOPTIONS.
1497
1498 Yes, guys, it is the only place in our code, where we
1499 may make it not affecting IPv4.
1500 The rest of code is protocol independent,
1501 and I do not like idea to uglify IPv4.
1502
1503 Actually, all the idea behind IPV6_PKTOPTIONS
1504 looks not very well thought. For now we latch
1505 options, received in the last packet, enqueued
1506 by tcp. Feel free to propose better solution.
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001507 --ANK (980728)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001508 */
1509 if (np->rxopt.all)
1510 opt_skb = skb_clone(skb, GFP_ATOMIC);
1511
1512 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
Tom Herbertbdeab992011-08-14 19:45:55 +00001513 sock_rps_save_rxhash(sk, skb);
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001514 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001515 goto reset;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001516 if (opt_skb)
1517 goto ipv6_pktoptions;
1518 return 0;
1519 }
1520
Arnaldo Carvalho de Meloab6a5bb2007-03-18 17:43:48 -07001521 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001522 goto csum_err;
1523
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001524 if (sk->sk_state == TCP_LISTEN) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001525 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1526 if (!nsk)
1527 goto discard;
1528
1529 /*
1530 * Queue it on the new socket if the new socket is active,
1531 * otherwise we just shortcircuit this and continue with
1532 * the new socket..
1533 */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001534 if(nsk != sk) {
Tom Herbertbdeab992011-08-14 19:45:55 +00001535 sock_rps_save_rxhash(nsk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001536 if (tcp_child_process(sk, nsk, skb))
1537 goto reset;
1538 if (opt_skb)
1539 __kfree_skb(opt_skb);
1540 return 0;
1541 }
Neil Horman47482f12011-04-06 13:07:09 -07001542 } else
Tom Herbertbdeab992011-08-14 19:45:55 +00001543 sock_rps_save_rxhash(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001544
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001545 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001546 goto reset;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001547 if (opt_skb)
1548 goto ipv6_pktoptions;
1549 return 0;
1550
1551reset:
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001552 tcp_v6_send_reset(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001553discard:
1554 if (opt_skb)
1555 __kfree_skb(opt_skb);
1556 kfree_skb(skb);
1557 return 0;
1558csum_err:
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001559 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001560 goto discard;
1561
1562
1563ipv6_pktoptions:
1564 /* Do you ask, what is it?
1565
1566 1. skb was enqueued by tcp.
1567 2. skb is added to tail of read queue, rather than out of order.
1568 3. socket is not in passive state.
1569 4. Finally, it really contains options, which user wants to receive.
1570 */
1571 tp = tcp_sk(sk);
1572 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1573 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
YOSHIFUJI Hideaki333fad52005-09-08 09:59:17 +09001574 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001575 np->mcast_oif = inet6_iif(opt_skb);
YOSHIFUJI Hideaki333fad52005-09-08 09:59:17 +09001576 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001577 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
Jiri Benc4c507d22012-02-09 09:35:49 +00001578 if (np->rxopt.bits.rxtclass)
Daniel Borkmannd22586f2013-09-03 19:29:12 +02001579 np->rcv_tclass = ipv6_tclass(ipv6_hdr(opt_skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001580 if (ipv6_opt_accepted(sk, opt_skb)) {
1581 skb_set_owner_r(opt_skb, sk);
1582 opt_skb = xchg(&np->pktoptions, opt_skb);
1583 } else {
1584 __kfree_skb(opt_skb);
1585 opt_skb = xchg(&np->pktoptions, NULL);
1586 }
1587 }
1588
Wei Yongjun800d55f2009-02-23 21:45:33 +00001589 kfree_skb(opt_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001590 return 0;
1591}
1592
Herbert Xue5bbef22007-10-15 12:50:28 -07001593static int tcp_v6_rcv(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001594{
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001595 const struct tcphdr *th;
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001596 const struct ipv6hdr *hdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001597 struct sock *sk;
1598 int ret;
Pavel Emelyanova86b1e32008-07-16 20:20:58 -07001599 struct net *net = dev_net(skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001600
1601 if (skb->pkt_type != PACKET_HOST)
1602 goto discard_it;
1603
1604 /*
1605 * Count it even if it's bad.
1606 */
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001607 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001608
1609 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1610 goto discard_it;
1611
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001612 th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001613
1614 if (th->doff < sizeof(struct tcphdr)/4)
1615 goto bad_packet;
1616 if (!pskb_may_pull(skb, th->doff*4))
1617 goto discard_it;
1618
Herbert Xu60476372007-04-09 11:59:39 -07001619 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001620 goto bad_packet;
1621
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001622 th = tcp_hdr(skb);
Stephen Hemmingere802af92010-04-22 15:24:53 -07001623 hdr = ipv6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001624 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1625 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1626 skb->len - th->doff*4);
1627 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1628 TCP_SKB_CB(skb)->when = 0;
Eric Dumazetb82d1bb2011-09-27 02:20:08 -04001629 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001630 TCP_SKB_CB(skb)->sacked = 0;
1631
Arnaldo Carvalho de Melo9a1f27c2008-10-07 11:41:57 -07001632 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001633 if (!sk)
1634 goto no_tcp_socket;
1635
1636process:
1637 if (sk->sk_state == TCP_TIME_WAIT)
1638 goto do_time_wait;
1639
Stephen Hemmingere802af92010-04-22 15:24:53 -07001640 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1641 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1642 goto discard_and_relse;
1643 }
1644
Linus Torvalds1da177e2005-04-16 15:20:36 -07001645 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1646 goto discard_and_relse;
1647
Dmitry Mishinfda9ef52006-08-31 15:28:39 -07001648 if (sk_filter(sk, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001649 goto discard_and_relse;
1650
1651 skb->dev = NULL;
1652
Fabio Olive Leite293b9c42006-09-25 22:28:47 -07001653 bh_lock_sock_nested(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001654 ret = 0;
1655 if (!sock_owned_by_user(sk)) {
Chris Leech1a2449a2006-05-23 18:05:53 -07001656#ifdef CONFIG_NET_DMA
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001657 struct tcp_sock *tp = tcp_sk(sk);
David S. Millerb4caea82007-10-26 04:20:13 -07001658 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
Dave Jianga2bd1142012-04-04 16:10:46 -07001659 tp->ucopy.dma_chan = net_dma_find_channel();
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001660 if (tp->ucopy.dma_chan)
1661 ret = tcp_v6_do_rcv(sk, skb);
1662 else
Chris Leech1a2449a2006-05-23 18:05:53 -07001663#endif
1664 {
1665 if (!tcp_prequeue(sk, skb))
1666 ret = tcp_v6_do_rcv(sk, skb);
1667 }
Eric Dumazet6cce09f2010-03-07 23:21:57 +00001668 } else if (unlikely(sk_add_backlog(sk, skb))) {
Zhu Yi6b03a532010-03-04 18:01:41 +00001669 bh_unlock_sock(sk);
Eric Dumazet6cce09f2010-03-07 23:21:57 +00001670 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
Zhu Yi6b03a532010-03-04 18:01:41 +00001671 goto discard_and_relse;
1672 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001673 bh_unlock_sock(sk);
1674
1675 sock_put(sk);
1676 return ret ? -1 : 0;
1677
1678no_tcp_socket:
1679 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1680 goto discard_it;
1681
1682 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1683bad_packet:
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001684 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001685 } else {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001686 tcp_v6_send_reset(NULL, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001687 }
1688
1689discard_it:
1690
1691 /*
1692 * Discard frame
1693 */
1694
1695 kfree_skb(skb);
1696 return 0;
1697
1698discard_and_relse:
1699 sock_put(sk);
1700 goto discard_it;
1701
1702do_time_wait:
1703 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001704 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001705 goto discard_it;
1706 }
1707
1708 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001709 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001710 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001711 goto discard_it;
1712 }
1713
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001714 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001715 case TCP_TW_SYN:
1716 {
1717 struct sock *sk2;
1718
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001719 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001720 &ipv6_hdr(skb)->daddr,
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001721 ntohs(th->dest), inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001722 if (sk2 != NULL) {
Arnaldo Carvalho de Melo295ff7e2005-08-09 20:44:40 -07001723 struct inet_timewait_sock *tw = inet_twsk(sk);
1724 inet_twsk_deschedule(tw, &tcp_death_row);
1725 inet_twsk_put(tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001726 sk = sk2;
1727 goto process;
1728 }
1729 /* Fall through to ACK */
1730 }
1731 case TCP_TW_ACK:
1732 tcp_v6_timewait_ack(sk, skb);
1733 break;
1734 case TCP_TW_RST:
1735 goto no_tcp_socket;
1736 case TCP_TW_SUCCESS:;
1737 }
1738 goto discard_it;
1739}
1740
David S. Millerccb7c412010-12-01 18:09:13 -08001741static struct inet_peer *tcp_v6_get_peer(struct sock *sk, bool *release_it)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001742{
David S. Millerdb3949c2010-12-02 11:52:07 -08001743 struct rt6_info *rt = (struct rt6_info *) __sk_dst_get(sk);
1744 struct ipv6_pinfo *np = inet6_sk(sk);
1745 struct inet_peer *peer;
1746
1747 if (!rt ||
1748 !ipv6_addr_equal(&np->daddr, &rt->rt6i_dst.addr)) {
1749 peer = inet_getpeer_v6(&np->daddr, 1);
1750 *release_it = true;
1751 } else {
1752 if (!rt->rt6i_peer)
1753 rt6_bind_peer(rt, 1);
1754 peer = rt->rt6i_peer;
David S. Miller457de432010-12-10 13:16:09 -08001755 *release_it = false;
David S. Millerdb3949c2010-12-02 11:52:07 -08001756 }
1757
1758 return peer;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001759}
1760
David S. Millerccb7c412010-12-01 18:09:13 -08001761static void *tcp_v6_tw_get_peer(struct sock *sk)
1762{
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001763 const struct inet6_timewait_sock *tw6 = inet6_twsk(sk);
1764 const struct inet_timewait_sock *tw = inet_twsk(sk);
David S. Millerccb7c412010-12-01 18:09:13 -08001765
1766 if (tw->tw_family == AF_INET)
1767 return tcp_v4_tw_get_peer(sk);
1768
David S. Millerdb3949c2010-12-02 11:52:07 -08001769 return inet_getpeer_v6(&tw6->tw_v6_daddr, 1);
David S. Millerccb7c412010-12-01 18:09:13 -08001770}
1771
1772static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1773 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1774 .twsk_unique = tcp_twsk_unique,
1775 .twsk_destructor= tcp_twsk_destructor,
1776 .twsk_getpeer = tcp_v6_tw_get_peer,
1777};
1778
Stephen Hemminger3b401a82009-09-01 19:25:04 +00001779static const struct inet_connection_sock_af_ops ipv6_specific = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001780 .queue_xmit = inet6_csk_xmit,
1781 .send_check = tcp_v6_send_check,
1782 .rebuild_header = inet6_sk_rebuild_header,
1783 .conn_request = tcp_v6_conn_request,
1784 .syn_recv_sock = tcp_v6_syn_recv_sock,
David S. Miller3f419d22010-11-29 13:37:14 -08001785 .get_peer = tcp_v6_get_peer,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001786 .net_header_len = sizeof(struct ipv6hdr),
1787 .setsockopt = ipv6_setsockopt,
1788 .getsockopt = ipv6_getsockopt,
1789 .addr2sockaddr = inet6_csk_addr2sockaddr,
1790 .sockaddr_len = sizeof(struct sockaddr_in6),
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001791 .bind_conflict = inet6_csk_bind_conflict,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001792#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001793 .compat_setsockopt = compat_ipv6_setsockopt,
1794 .compat_getsockopt = compat_ipv6_getsockopt,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001795#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001796};
1797
#ifdef CONFIG_TCP_MD5SIG
/* TCP MD5 signature hooks for native IPv6 sockets; installed as
 * tp->af_specific by tcp_v6_init_sock().
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_lookup	=	tcp_v6_md5_lookup,
	.calc_md5_hash	=	tcp_v6_md5_hash_skb,
	.md5_parse	=	tcp_v6_parse_md5_keys,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001805
Linus Torvalds1da177e2005-04-16 15:20:36 -07001806/*
1807 * TCP over IPv4 via INET6 API
1808 */
1809
Stephen Hemminger3b401a82009-09-01 19:25:04 +00001810static const struct inet_connection_sock_af_ops ipv6_mapped = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001811 .queue_xmit = ip_queue_xmit,
1812 .send_check = tcp_v4_send_check,
1813 .rebuild_header = inet_sk_rebuild_header,
1814 .conn_request = tcp_v6_conn_request,
1815 .syn_recv_sock = tcp_v6_syn_recv_sock,
David S. Miller3f419d22010-11-29 13:37:14 -08001816 .get_peer = tcp_v4_get_peer,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001817 .net_header_len = sizeof(struct iphdr),
1818 .setsockopt = ipv6_setsockopt,
1819 .getsockopt = ipv6_getsockopt,
1820 .addr2sockaddr = inet6_csk_addr2sockaddr,
1821 .sockaddr_len = sizeof(struct sockaddr_in6),
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001822 .bind_conflict = inet6_csk_bind_conflict,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001823#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001824 .compat_setsockopt = compat_ipv6_setsockopt,
1825 .compat_getsockopt = compat_ipv6_getsockopt,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001826#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001827};
1828
#ifdef CONFIG_TCP_MD5SIG
/* TCP MD5 signature hooks for TCP over IPv4 via the INET6 API: key lookup
 * and hashing use the IPv4 routines, key parsing stays with the IPv6 one.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_lookup	=	tcp_v4_md5_lookup,
	.calc_md5_hash	=	tcp_v4_md5_hash_skb,
	.md5_parse	=	tcp_v6_parse_md5_keys,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001836
Linus Torvalds1da177e2005-04-16 15:20:36 -07001837/* NOTE: A lot of things set to zero explicitly by call to
1838 * sk_alloc() so need not be done here.
1839 */
1840static int tcp_v6_init_sock(struct sock *sk)
1841{
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001842 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001843 struct tcp_sock *tp = tcp_sk(sk);
1844
1845 skb_queue_head_init(&tp->out_of_order_queue);
1846 tcp_init_xmit_timers(sk);
1847 tcp_prequeue_init(tp);
1848
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001849 icsk->icsk_rto = TCP_TIMEOUT_INIT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001850 tp->mdev = TCP_TIMEOUT_INIT;
1851
1852 /* So many TCP implementations out there (incorrectly) count the
1853 * initial SYN frame in their delayed-ACK and congestion control
1854 * algorithms that we must have the following bandaid to talk
1855 * efficiently to them. -DaveM
1856 */
1857 tp->snd_cwnd = 2;
1858
1859 /* See draft-stevens-tcpca-spec-01 for discussion of the
1860 * initialization of these values.
1861 */
Ilpo Järvinen0b6a05c2009-09-15 01:30:10 -07001862 tp->snd_ssthresh = TCP_INFINITE_SSTHRESH;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001863 tp->snd_cwnd_clamp = ~0;
William Allen Simpsonbee7ca92009-11-10 09:51:18 +00001864 tp->mss_cache = TCP_MSS_DEFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001865
1866 tp->reordering = sysctl_tcp_reordering;
1867
1868 sk->sk_state = TCP_CLOSE;
1869
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001870 icsk->icsk_af_ops = &ipv6_specific;
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001871 icsk->icsk_ca_ops = &tcp_init_congestion_ops;
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001872 icsk->icsk_sync_mss = tcp_sync_mss;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001873 sk->sk_write_space = sk_stream_write_space;
1874 sock_set_flag(sk, SOCK_USE_WRITE_QUEUE);
1875
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001876#ifdef CONFIG_TCP_MD5SIG
1877 tp->af_specific = &tcp_sock_ipv6_specific;
1878#endif
1879
William Allen Simpson435cf552009-12-02 18:17:05 +00001880 /* TCP Cookie Transactions */
1881 if (sysctl_tcp_cookie_size > 0) {
1882 /* Default, cookies without s_data_payload. */
1883 tp->cookie_values =
1884 kzalloc(sizeof(*tp->cookie_values),
1885 sk->sk_allocation);
1886 if (tp->cookie_values != NULL)
1887 kref_init(&tp->cookie_values->kref);
1888 }
1889 /* Presumed zeroed, in order of appearance:
1890 * cookie_in_always, cookie_out_never,
1891 * s_data_constant, s_data_in, s_data_out
1892 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001893 sk->sk_sndbuf = sysctl_tcp_wmem[1];
1894 sk->sk_rcvbuf = sysctl_tcp_rmem[1];
1895
Herbert Xueb4dea52008-12-29 23:04:08 -08001896 local_bh_disable();
Glauber Costad1a4c0b2011-12-11 21:47:04 +00001897 sock_update_memcg(sk);
Glauber Costa180d8cd2011-12-11 21:47:02 +00001898 sk_sockets_allocated_inc(sk);
Herbert Xueb4dea52008-12-29 23:04:08 -08001899 local_bh_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001900
1901 return 0;
1902}
1903
/* Tear down a TCPv6 socket: run the shared TCP teardown first, then the
 * IPv6-specific socket teardown.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
	tcp_v4_destroy_sock(sk);
	inet6_destroy_sock(sk);
}
1909
YOSHIFUJI Hideaki952a10b2007-04-21 20:13:44 +09001910#ifdef CONFIG_PROC_FS
Linus Torvalds1da177e2005-04-16 15:20:36 -07001911/* Proc filesystem TCPv6 sock list dumping. */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001912static void get_openreq6(struct seq_file *seq,
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001913 const struct sock *sk, struct request_sock *req, int i, int uid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001914{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001915 int ttd = req->expires - jiffies;
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001916 const struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1917 const struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001918
1919 if (ttd < 0)
1920 ttd = 0;
1921
Linus Torvalds1da177e2005-04-16 15:20:36 -07001922 seq_printf(seq,
1923 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Dan Rosenberg71338aa2011-05-23 12:17:35 +00001924 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001925 i,
1926 src->s6_addr32[0], src->s6_addr32[1],
1927 src->s6_addr32[2], src->s6_addr32[3],
KOVACS Krisztianfd507032008-10-19 23:35:58 -07001928 ntohs(inet_rsk(req)->loc_port),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001929 dest->s6_addr32[0], dest->s6_addr32[1],
1930 dest->s6_addr32[2], dest->s6_addr32[3],
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -07001931 ntohs(inet_rsk(req)->rmt_port),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001932 TCP_SYN_RECV,
1933 0,0, /* could print option size, but that is af dependent. */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001934 1, /* timers active (only the expire timer) */
1935 jiffies_to_clock_t(ttd),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001936 req->retrans,
1937 uid,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001938 0, /* non standard timer */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001939 0, /* open_requests have no inode */
1940 0, req);
1941}
1942
1943static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1944{
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001945 const struct in6_addr *dest, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001946 __u16 destp, srcp;
1947 int timer_active;
1948 unsigned long timer_expires;
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001949 const struct inet_sock *inet = inet_sk(sp);
1950 const struct tcp_sock *tp = tcp_sk(sp);
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001951 const struct inet_connection_sock *icsk = inet_csk(sp);
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001952 const struct ipv6_pinfo *np = inet6_sk(sp);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001953
1954 dest = &np->daddr;
1955 src = &np->rcv_saddr;
Eric Dumazetc720c7e2009-10-15 06:30:45 +00001956 destp = ntohs(inet->inet_dport);
1957 srcp = ntohs(inet->inet_sport);
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001958
1959 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001960 timer_active = 1;
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001961 timer_expires = icsk->icsk_timeout;
1962 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001963 timer_active = 4;
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001964 timer_expires = icsk->icsk_timeout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001965 } else if (timer_pending(&sp->sk_timer)) {
1966 timer_active = 2;
1967 timer_expires = sp->sk_timer.expires;
1968 } else {
1969 timer_active = 0;
1970 timer_expires = jiffies;
1971 }
1972
1973 seq_printf(seq,
1974 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Dan Rosenberg71338aa2011-05-23 12:17:35 +00001975 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %pK %lu %lu %u %u %d\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001976 i,
1977 src->s6_addr32[0], src->s6_addr32[1],
1978 src->s6_addr32[2], src->s6_addr32[3], srcp,
1979 dest->s6_addr32[0], dest->s6_addr32[1],
1980 dest->s6_addr32[2], dest->s6_addr32[3], destp,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001981 sp->sk_state,
Sridhar Samudrala47da8ee2006-06-27 13:29:00 -07001982 tp->write_seq-tp->snd_una,
1983 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001984 timer_active,
1985 jiffies_to_clock_t(timer_expires - jiffies),
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001986 icsk->icsk_retransmits,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001987 sock_i_uid(sp),
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001988 icsk->icsk_probes_out,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001989 sock_i_ino(sp),
1990 atomic_read(&sp->sk_refcnt), sp,
Stephen Hemminger7be87352008-06-27 20:00:19 -07001991 jiffies_to_clock_t(icsk->icsk_rto),
1992 jiffies_to_clock_t(icsk->icsk_ack.ato),
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001993 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
Ilpo Järvinen0b6a05c2009-09-15 01:30:10 -07001994 tp->snd_cwnd,
1995 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
Linus Torvalds1da177e2005-04-16 15:20:36 -07001996 );
1997}
1998
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001999static void get_timewait6_sock(struct seq_file *seq,
Arnaldo Carvalho de Melo8feaf0c2005-08-09 20:09:30 -07002000 struct inet_timewait_sock *tw, int i)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002001{
Eric Dumazetb71d1d42011-04-22 04:53:02 +00002002 const struct in6_addr *dest, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002003 __u16 destp, srcp;
Eric Dumazetcf533ea2011-10-21 05:22:42 -04002004 const struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002005 int ttd = tw->tw_ttd - jiffies;
2006
2007 if (ttd < 0)
2008 ttd = 0;
2009
Arnaldo Carvalho de Melo0fa1a532005-12-13 23:23:09 -08002010 dest = &tw6->tw_v6_daddr;
2011 src = &tw6->tw_v6_rcv_saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002012 destp = ntohs(tw->tw_dport);
2013 srcp = ntohs(tw->tw_sport);
2014
2015 seq_printf(seq,
2016 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Dan Rosenberg71338aa2011-05-23 12:17:35 +00002017 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07002018 i,
2019 src->s6_addr32[0], src->s6_addr32[1],
2020 src->s6_addr32[2], src->s6_addr32[3], srcp,
2021 dest->s6_addr32[0], dest->s6_addr32[1],
2022 dest->s6_addr32[2], dest->s6_addr32[3], destp,
2023 tw->tw_substate, 0, 0,
2024 3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
2025 atomic_read(&tw->tw_refcnt), tw);
2026}
2027
Linus Torvalds1da177e2005-04-16 15:20:36 -07002028static int tcp6_seq_show(struct seq_file *seq, void *v)
2029{
2030 struct tcp_iter_state *st;
2031
2032 if (v == SEQ_START_TOKEN) {
2033 seq_puts(seq,
2034 " sl "
2035 "local_address "
2036 "remote_address "
2037 "st tx_queue rx_queue tr tm->when retrnsmt"
2038 " uid timeout inode\n");
2039 goto out;
2040 }
2041 st = seq->private;
2042
2043 switch (st->state) {
2044 case TCP_SEQ_STATE_LISTENING:
2045 case TCP_SEQ_STATE_ESTABLISHED:
2046 get_tcp6_sock(seq, v, st->num);
2047 break;
2048 case TCP_SEQ_STATE_OPENREQ:
2049 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
2050 break;
2051 case TCP_SEQ_STATE_TIME_WAIT:
2052 get_timewait6_sock(seq, v, st->num);
2053 break;
2054 }
2055out:
2056 return 0;
2057}
2058
Arjan van de Ven73cb88e2011-10-30 06:46:30 +00002059static const struct file_operations tcp6_afinfo_seq_fops = {
2060 .owner = THIS_MODULE,
2061 .open = tcp_seq_open,
2062 .read = seq_read,
2063 .llseek = seq_lseek,
2064 .release = seq_release_net
2065};
2066
Linus Torvalds1da177e2005-04-16 15:20:36 -07002067static struct tcp_seq_afinfo tcp6_seq_afinfo = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002068 .name = "tcp6",
2069 .family = AF_INET6,
Arjan van de Ven73cb88e2011-10-30 06:46:30 +00002070 .seq_fops = &tcp6_afinfo_seq_fops,
Denis V. Lunev9427c4b2008-04-13 22:12:13 -07002071 .seq_ops = {
2072 .show = tcp6_seq_show,
2073 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07002074};
2075
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002076int __net_init tcp6_proc_init(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002077{
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07002078 return tcp_proc_register(net, &tcp6_seq_afinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002079}
2080
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07002081void tcp6_proc_exit(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002082{
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07002083 tcp_proc_unregister(net, &tcp6_seq_afinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002084}
2085#endif
2086
Eric Dumazet7d9577d2013-05-09 10:28:16 +00002087static void tcp_v6_clear_sk(struct sock *sk, int size)
2088{
2089 struct inet_sock *inet = inet_sk(sk);
2090
2091 /* we do not want to clear pinet6 field, because of RCU lookups */
2092 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
2093
2094 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
2095 memset(&inet->pinet6 + 1, 0, size);
2096}
2097
Linus Torvalds1da177e2005-04-16 15:20:36 -07002098struct proto tcpv6_prot = {
2099 .name = "TCPv6",
2100 .owner = THIS_MODULE,
2101 .close = tcp_close,
2102 .connect = tcp_v6_connect,
2103 .disconnect = tcp_disconnect,
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07002104 .accept = inet_csk_accept,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002105 .ioctl = tcp_ioctl,
2106 .init = tcp_v6_init_sock,
2107 .destroy = tcp_v6_destroy_sock,
2108 .shutdown = tcp_shutdown,
2109 .setsockopt = tcp_setsockopt,
2110 .getsockopt = tcp_getsockopt,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002111 .recvmsg = tcp_recvmsg,
Changli Gao7ba42912010-07-10 20:41:55 +00002112 .sendmsg = tcp_sendmsg,
2113 .sendpage = tcp_sendpage,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002114 .backlog_rcv = tcp_v6_do_rcv,
2115 .hash = tcp_v6_hash,
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08002116 .unhash = inet_unhash,
2117 .get_port = inet_csk_get_port,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002118 .enter_memory_pressure = tcp_enter_memory_pressure,
2119 .sockets_allocated = &tcp_sockets_allocated,
2120 .memory_allocated = &tcp_memory_allocated,
2121 .memory_pressure = &tcp_memory_pressure,
Arnaldo Carvalho de Melo0a5578c2005-08-09 20:11:41 -07002122 .orphan_count = &tcp_orphan_count,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002123 .sysctl_wmem = sysctl_tcp_wmem,
2124 .sysctl_rmem = sysctl_tcp_rmem,
2125 .max_header = MAX_TCP_HEADER,
2126 .obj_size = sizeof(struct tcp6_sock),
Eric Dumazet3ab5aee2008-11-16 19:40:17 -08002127 .slab_flags = SLAB_DESTROY_BY_RCU,
Arnaldo Carvalho de Melo6d6ee432005-12-13 23:25:19 -08002128 .twsk_prot = &tcp6_timewait_sock_ops,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -07002129 .rsk_prot = &tcp6_request_sock_ops,
Pavel Emelyanov39d8cda2008-03-22 16:50:58 -07002130 .h.hashinfo = &tcp_hashinfo,
Changli Gao7ba42912010-07-10 20:41:55 +00002131 .no_autobind = true,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08002132#ifdef CONFIG_COMPAT
2133 .compat_setsockopt = compat_tcp_setsockopt,
2134 .compat_getsockopt = compat_tcp_getsockopt,
2135#endif
Glauber Costad1a4c0b2011-12-11 21:47:04 +00002136#ifdef CONFIG_CGROUP_MEM_RES_CTLR_KMEM
2137 .proto_cgroup = tcp_proto_cgroup,
2138#endif
Eric Dumazet7d9577d2013-05-09 10:28:16 +00002139 .clear_sk = tcp_v6_clear_sk,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002140};
2141
Alexey Dobriyan41135cc2009-09-14 12:22:28 +00002142static const struct inet6_protocol tcpv6_protocol = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002143 .handler = tcp_v6_rcv,
2144 .err_handler = tcp_v6_err,
Herbert Xua430a432006-07-08 13:34:56 -07002145 .gso_send_check = tcp_v6_gso_send_check,
Herbert Xuadcfc7d2006-06-30 13:36:15 -07002146 .gso_segment = tcp_tso_segment,
Herbert Xu684f2172009-01-08 10:41:23 -08002147 .gro_receive = tcp6_gro_receive,
2148 .gro_complete = tcp6_gro_complete,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002149 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
2150};
2151
Linus Torvalds1da177e2005-04-16 15:20:36 -07002152static struct inet_protosw tcpv6_protosw = {
2153 .type = SOCK_STREAM,
2154 .protocol = IPPROTO_TCP,
2155 .prot = &tcpv6_prot,
2156 .ops = &inet6_stream_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002157 .no_check = 0,
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08002158 .flags = INET_PROTOSW_PERMANENT |
2159 INET_PROTOSW_ICSK,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002160};
2161
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002162static int __net_init tcpv6_net_init(struct net *net)
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002163{
Denis V. Lunev56772422008-04-03 14:28:30 -07002164 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2165 SOCK_RAW, IPPROTO_TCP, net);
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002166}
2167
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002168static void __net_exit tcpv6_net_exit(struct net *net)
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002169{
Denis V. Lunev56772422008-04-03 14:28:30 -07002170 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00002171}
2172
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00002173static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00002174{
2175 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002176}
2177
2178static struct pernet_operations tcpv6_net_ops = {
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00002179 .init = tcpv6_net_init,
2180 .exit = tcpv6_net_exit,
2181 .exit_batch = tcpv6_net_exit_batch,
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002182};
2183
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002184int __init tcpv6_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002185{
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002186 int ret;
David Woodhouseae0f7d52006-01-11 15:53:04 -08002187
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002188 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2189 if (ret)
2190 goto out;
2191
2192 /* register inet6 protocol */
2193 ret = inet6_register_protosw(&tcpv6_protosw);
2194 if (ret)
2195 goto out_tcpv6_protocol;
2196
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002197 ret = register_pernet_subsys(&tcpv6_net_ops);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002198 if (ret)
2199 goto out_tcpv6_protosw;
2200out:
2201 return ret;
2202
2203out_tcpv6_protocol:
2204 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2205out_tcpv6_protosw:
2206 inet6_unregister_protosw(&tcpv6_protosw);
2207 goto out;
2208}
2209
Daniel Lezcano09f77092007-12-13 05:34:58 -08002210void tcpv6_exit(void)
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002211{
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002212 unregister_pernet_subsys(&tcpv6_net_ops);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002213 inet6_unregister_protosw(&tcpv6_protosw);
2214 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002215}