| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 1 | /* | 
 | 2 |  * INET		An implementation of the TCP/IP protocol suite for the LINUX | 
 | 3 |  *		operating system.  INET is implemented using the BSD Socket | 
 | 4 |  *		interface as the means of communication with the user level. | 
 | 5 |  * | 
 | 6 |  *		Generic INET transport hashtables | 
 | 7 |  * | 
 | 8 |  * Authors:	Lotsa people, from code originally in tcp | 
 | 9 |  * | 
 | 10 |  *	This program is free software; you can redistribute it and/or | 
 | 11 |  *      modify it under the terms of the GNU General Public License | 
 | 12 |  *      as published by the Free Software Foundation; either version | 
 | 13 |  *      2 of the License, or (at your option) any later version. | 
 | 14 |  */ | 
 | 15 |  | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 16 | #include <linux/module.h> | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 17 | #include <linux/random.h> | 
| Arnaldo Carvalho de Melo | f3f05f7 | 2005-08-09 20:08:09 -0700 | [diff] [blame] | 18 | #include <linux/sched.h> | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 19 | #include <linux/slab.h> | 
| Arnaldo Carvalho de Melo | f3f05f7 | 2005-08-09 20:08:09 -0700 | [diff] [blame] | 20 | #include <linux/wait.h> | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 21 |  | 
| Arnaldo Carvalho de Melo | 463c84b | 2005-08-09 20:10:42 -0700 | [diff] [blame] | 22 | #include <net/inet_connection_sock.h> | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 23 | #include <net/inet_hashtables.h> | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 24 | #include <net/ip.h> | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 25 |  | 
 | 26 | /* | 
 | 27 |  * Allocate and initialize a new local port bind bucket. | 
 | 28 |  * The bindhash mutex for snum's hash chain must be held here. | 
 | 29 |  */ | 
| Christoph Lameter | e18b890 | 2006-12-06 20:33:20 -0800 | [diff] [blame] | 30 | struct inet_bind_bucket *inet_bind_bucket_create(struct kmem_cache *cachep, | 
| Pavel Emelyanov | 941b1d2 | 2008-01-31 05:05:50 -0800 | [diff] [blame] | 31 | 						 struct net *net, | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 32 | 						 struct inet_bind_hashbucket *head, | 
 | 33 | 						 const unsigned short snum) | 
 | 34 | { | 
| Christoph Lameter | 54e6ecb | 2006-12-06 20:33:16 -0800 | [diff] [blame] | 35 | 	struct inet_bind_bucket *tb = kmem_cache_alloc(cachep, GFP_ATOMIC); | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 36 |  | 
 | 37 | 	if (tb != NULL) { | 
| Eric Dumazet | 7a9546e | 2008-11-12 00:54:20 -0800 | [diff] [blame] | 38 | 		write_pnet(&tb->ib_net, hold_net(net)); | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 39 | 		tb->port      = snum; | 
 | 40 | 		tb->fastreuse = 0; | 
| Evgeniy Polyakov | a9d8f91 | 2009-01-19 16:46:02 -0800 | [diff] [blame] | 41 | 		tb->num_owners = 0; | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 42 | 		INIT_HLIST_HEAD(&tb->owners); | 
 | 43 | 		hlist_add_head(&tb->node, &head->chain); | 
 | 44 | 	} | 
 | 45 | 	return tb; | 
 | 46 | } | 
 | 47 |  | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 48 | /* | 
 | 49 |  * Caller must hold hashbucket lock for this tb with local BH disabled | 
 | 50 |  */ | 
| Christoph Lameter | e18b890 | 2006-12-06 20:33:20 -0800 | [diff] [blame] | 51 | void inet_bind_bucket_destroy(struct kmem_cache *cachep, struct inet_bind_bucket *tb) | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 52 | { | 
 | 53 | 	if (hlist_empty(&tb->owners)) { | 
 | 54 | 		__hlist_del(&tb->node); | 
| Eric Dumazet | 7a9546e | 2008-11-12 00:54:20 -0800 | [diff] [blame] | 55 | 		release_net(ib_net(tb)); | 
| Arnaldo Carvalho de Melo | 77d8bf9 | 2005-08-09 20:00:51 -0700 | [diff] [blame] | 56 | 		kmem_cache_free(cachep, tb); | 
 | 57 | 	} | 
 | 58 | } | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 59 |  | 
 | 60 | void inet_bind_hash(struct sock *sk, struct inet_bind_bucket *tb, | 
 | 61 | 		    const unsigned short snum) | 
 | 62 | { | 
| Evgeniy Polyakov | a9d8f91 | 2009-01-19 16:46:02 -0800 | [diff] [blame] | 63 | 	struct inet_hashinfo *hashinfo = sk->sk_prot->h.hashinfo; | 
 | 64 |  | 
| Eric Dumazet | 24dd1fa | 2009-02-01 12:31:33 -0800 | [diff] [blame] | 65 | 	atomic_inc(&hashinfo->bsockets); | 
| Evgeniy Polyakov | a9d8f91 | 2009-01-19 16:46:02 -0800 | [diff] [blame] | 66 |  | 
| Eric Dumazet | c720c7e | 2009-10-15 06:30:45 +0000 | [diff] [blame] | 67 | 	inet_sk(sk)->inet_num = snum; | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 68 | 	sk_add_bind_node(sk, &tb->owners); | 
| Evgeniy Polyakov | a9d8f91 | 2009-01-19 16:46:02 -0800 | [diff] [blame] | 69 | 	tb->num_owners++; | 
| Arnaldo Carvalho de Melo | 463c84b | 2005-08-09 20:10:42 -0700 | [diff] [blame] | 70 | 	inet_csk(sk)->icsk_bind_hash = tb; | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 71 | } | 
 | 72 |  | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 73 | /* | 
 | 74 |  * Get rid of any references to a local port held by the given sock. | 
 | 75 |  */ | 
| Arnaldo Carvalho de Melo | ab1e0a1 | 2008-02-03 04:06:04 -0800 | [diff] [blame] | 76 | static void __inet_put_port(struct sock *sk) | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 77 | { | 
| Pavel Emelyanov | 39d8cda | 2008-03-22 16:50:58 -0700 | [diff] [blame] | 78 | 	struct inet_hashinfo *hashinfo = sk->sk_prot->h.hashinfo; | 
| Eric Dumazet | c720c7e | 2009-10-15 06:30:45 +0000 | [diff] [blame] | 79 | 	const int bhash = inet_bhashfn(sock_net(sk), inet_sk(sk)->inet_num, | 
| Pavel Emelyanov | 7f635ab | 2008-06-16 17:12:49 -0700 | [diff] [blame] | 80 | 			hashinfo->bhash_size); | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 81 | 	struct inet_bind_hashbucket *head = &hashinfo->bhash[bhash]; | 
 | 82 | 	struct inet_bind_bucket *tb; | 
 | 83 |  | 
| Eric Dumazet | 24dd1fa | 2009-02-01 12:31:33 -0800 | [diff] [blame] | 84 | 	atomic_dec(&hashinfo->bsockets); | 
| Evgeniy Polyakov | a9d8f91 | 2009-01-19 16:46:02 -0800 | [diff] [blame] | 85 |  | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 86 | 	spin_lock(&head->lock); | 
| Arnaldo Carvalho de Melo | 463c84b | 2005-08-09 20:10:42 -0700 | [diff] [blame] | 87 | 	tb = inet_csk(sk)->icsk_bind_hash; | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 88 | 	__sk_del_bind_node(sk); | 
| Evgeniy Polyakov | a9d8f91 | 2009-01-19 16:46:02 -0800 | [diff] [blame] | 89 | 	tb->num_owners--; | 
| Arnaldo Carvalho de Melo | 463c84b | 2005-08-09 20:10:42 -0700 | [diff] [blame] | 90 | 	inet_csk(sk)->icsk_bind_hash = NULL; | 
| Eric Dumazet | c720c7e | 2009-10-15 06:30:45 +0000 | [diff] [blame] | 91 | 	inet_sk(sk)->inet_num = 0; | 
| Arnaldo Carvalho de Melo | 2d8c4ce | 2005-08-09 20:07:13 -0700 | [diff] [blame] | 92 | 	inet_bind_bucket_destroy(hashinfo->bind_bucket_cachep, tb); | 
 | 93 | 	spin_unlock(&head->lock); | 
 | 94 | } | 
 | 95 |  | 
/*
 * Release the local port held by @sk.
 *
 * Runs __inet_put_port() between local_bh_disable() and
 * local_bh_enable().
 */
void inet_put_port(struct sock *sk)
{
	local_bh_disable();
	__inet_put_port(sk);
	local_bh_enable();
}
EXPORT_SYMBOL(inet_put_port);
| Arnaldo Carvalho de Melo | f3f05f7 | 2005-08-09 20:08:09 -0700 | [diff] [blame] | 103 |  | 
| Balazs Scheidler | 093d282 | 2010-10-21 13:06:43 +0200 | [diff] [blame] | 104 | int __inet_inherit_port(struct sock *sk, struct sock *child) | 
| Pavel Emelyanov | 5308377 | 2008-04-17 23:18:15 -0700 | [diff] [blame] | 105 | { | 
 | 106 | 	struct inet_hashinfo *table = sk->sk_prot->h.hashinfo; | 
| Balazs Scheidler | 093d282 | 2010-10-21 13:06:43 +0200 | [diff] [blame] | 107 | 	unsigned short port = inet_sk(child)->inet_num; | 
 | 108 | 	const int bhash = inet_bhashfn(sock_net(sk), port, | 
| Pavel Emelyanov | 7f635ab | 2008-06-16 17:12:49 -0700 | [diff] [blame] | 109 | 			table->bhash_size); | 
| Pavel Emelyanov | 5308377 | 2008-04-17 23:18:15 -0700 | [diff] [blame] | 110 | 	struct inet_bind_hashbucket *head = &table->bhash[bhash]; | 
 | 111 | 	struct inet_bind_bucket *tb; | 
 | 112 |  | 
 | 113 | 	spin_lock(&head->lock); | 
 | 114 | 	tb = inet_csk(sk)->icsk_bind_hash; | 
| Balazs Scheidler | 093d282 | 2010-10-21 13:06:43 +0200 | [diff] [blame] | 115 | 	if (tb->port != port) { | 
 | 116 | 		/* NOTE: using tproxy and redirecting skbs to a proxy | 
 | 117 | 		 * on a different listener port breaks the assumption | 
 | 118 | 		 * that the listener socket's icsk_bind_hash is the same | 
 | 119 | 		 * as that of the child socket. We have to look up or | 
 | 120 | 		 * create a new bind bucket for the child here. */ | 
 | 121 | 		struct hlist_node *node; | 
 | 122 | 		inet_bind_bucket_for_each(tb, node, &head->chain) { | 
 | 123 | 			if (net_eq(ib_net(tb), sock_net(sk)) && | 
 | 124 | 			    tb->port == port) | 
 | 125 | 				break; | 
 | 126 | 		} | 
 | 127 | 		if (!node) { | 
 | 128 | 			tb = inet_bind_bucket_create(table->bind_bucket_cachep, | 
 | 129 | 						     sock_net(sk), head, port); | 
 | 130 | 			if (!tb) { | 
 | 131 | 				spin_unlock(&head->lock); | 
 | 132 | 				return -ENOMEM; | 
 | 133 | 			} | 
 | 134 | 		} | 
 | 135 | 	} | 
| Nagendra Tomar | b4ff3c9 | 2010-11-26 14:26:27 +0000 | [diff] [blame] | 136 | 	inet_bind_hash(child, tb, port); | 
| Pavel Emelyanov | 5308377 | 2008-04-17 23:18:15 -0700 | [diff] [blame] | 137 | 	spin_unlock(&head->lock); | 
| Balazs Scheidler | 093d282 | 2010-10-21 13:06:43 +0200 | [diff] [blame] | 138 |  | 
 | 139 | 	return 0; | 
| Pavel Emelyanov | 5308377 | 2008-04-17 23:18:15 -0700 | [diff] [blame] | 140 | } | 
| Pavel Emelyanov | 5308377 | 2008-04-17 23:18:15 -0700 | [diff] [blame] | 141 | EXPORT_SYMBOL_GPL(__inet_inherit_port); | 
 | 142 |  | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 143 | static inline int compute_score(struct sock *sk, struct net *net, | 
 | 144 | 				const unsigned short hnum, const __be32 daddr, | 
 | 145 | 				const int dif) | 
 | 146 | { | 
 | 147 | 	int score = -1; | 
 | 148 | 	struct inet_sock *inet = inet_sk(sk); | 
 | 149 |  | 
| Eric Dumazet | c720c7e | 2009-10-15 06:30:45 +0000 | [diff] [blame] | 150 | 	if (net_eq(sock_net(sk), net) && inet->inet_num == hnum && | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 151 | 			!ipv6_only_sock(sk)) { | 
| Eric Dumazet | c720c7e | 2009-10-15 06:30:45 +0000 | [diff] [blame] | 152 | 		__be32 rcv_saddr = inet->inet_rcv_saddr; | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 153 | 		score = sk->sk_family == PF_INET ? 1 : 0; | 
 | 154 | 		if (rcv_saddr) { | 
 | 155 | 			if (rcv_saddr != daddr) | 
 | 156 | 				return -1; | 
 | 157 | 			score += 2; | 
 | 158 | 		} | 
 | 159 | 		if (sk->sk_bound_dev_if) { | 
 | 160 | 			if (sk->sk_bound_dev_if != dif) | 
 | 161 | 				return -1; | 
 | 162 | 			score += 2; | 
 | 163 | 		} | 
 | 164 | 	} | 
 | 165 | 	return score; | 
 | 166 | } | 
 | 167 |  | 
/*
 * Don't inline this cruft. Here are some nice properties to exploit here. The
 * BSD API does not allow a listening sock to specify the remote port nor the
 * remote address for the connection. So always assume those are both
 * wildcarded during the search since they can never be otherwise.
 *
 * Walks the listening hash chain selected by inet_lhashfn(net, hnum) under
 * rcu_read_lock() and keeps the socket with the highest compute_score().
 * Only a strictly greater score replaces the current best, so on a tie the
 * socket met first in the chain wins.
 *
 * Returns the chosen socket with sk_refcnt incremented, or NULL when no
 * socket scored 0 or more, or when the reference could not be taken.
 */


struct sock *__inet_lookup_listener(struct net *net,
				    struct inet_hashinfo *hashinfo,
				    const __be32 daddr, const unsigned short hnum,
				    const int dif)
{
	struct sock *sk, *result;
	struct hlist_nulls_node *node;
	unsigned int hash = inet_lhashfn(net, hnum);
	struct inet_listen_hashbucket *ilb = &hashinfo->listening_hash[hash];
	int score, hiscore;

	rcu_read_lock();
begin:
	/* Every (re)start forgets the previous candidate. */
	result = NULL;
	hiscore = -1;
	sk_nulls_for_each_rcu(sk, node, &ilb->head) {
		score = compute_score(sk, net, hnum, daddr, dif);
		if (score > hiscore) {
			result = sk;
			hiscore = score;
		}
	}
	/*
	 * if the nulls value we got at the end of this lookup is
	 * not the expected one, we must restart lookup.
	 * We probably met an item that was moved to another chain.
	 */
	if (get_nulls_value(node) != hash + LISTENING_NULLS_BASE)
		goto begin;
	if (result) {
		/* A refcount of zero means we cannot take a reference: give up. */
		if (unlikely(!atomic_inc_not_zero(&result->sk_refcnt)))
			result = NULL;
		/*
		 * Re-score now that we hold a reference; if the socket no
		 * longer scores as well as it did during the walk, drop it
		 * and search again.
		 */
		else if (unlikely(compute_score(result, net, hnum, daddr,
				  dif) < hiscore)) {
			sock_put(result);
			goto begin;
		}
	}
	rcu_read_unlock();
	return result;
}
EXPORT_SYMBOL_GPL(__inet_lookup_listener);
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 218 |  | 
/*
 * Find the socket matching (@saddr, @sport, @daddr, @hnum, @dif) in @net.
 *
 * The bucket is chosen with inet_ehashfn(); its ->chain list is searched
 * first and its ->twchain list second, both under rcu_read_lock() only.
 *
 * Returns the matching socket with sk_refcnt incremented, or NULL when
 * nothing matched or the reference on a TIME_WAIT match could not be taken.
 */
struct sock * __inet_lookup_established(struct net *net,
				  struct inet_hashinfo *hashinfo,
				  const __be32 saddr, const __be16 sport,
				  const __be32 daddr, const u16 hnum,
				  const int dif)
{
	INET_ADDR_COOKIE(acookie, saddr, daddr)
	const __portpair ports = INET_COMBINED_PORTS(sport, hnum);
	struct sock *sk;
	const struct hlist_nulls_node *node;
	/* Optimize here for direct hit, only listening connections can
	 * have wildcards anyways.
	 */
	unsigned int hash = inet_ehashfn(net, daddr, hnum, saddr, sport);
	unsigned int slot = hash & hashinfo->ehash_mask;
	struct inet_ehash_bucket *head = &hashinfo->ehash[slot];

	rcu_read_lock();
begin:
	sk_nulls_for_each_rcu(sk, node, &head->chain) {
		if (INET_MATCH(sk, net, hash, acookie,
					saddr, daddr, ports, dif)) {
			/*
			 * Could not take a reference (refcount already zero):
			 * continue with the TIME_WAIT chain instead.
			 */
			if (unlikely(!atomic_inc_not_zero(&sk->sk_refcnt)))
				goto begintw;
			/*
			 * Match again now that a reference is held; on a
			 * mismatch drop it and restart the walk.
			 */
			if (unlikely(!INET_MATCH(sk, net, hash, acookie,
				saddr, daddr, ports, dif))) {
				sock_put(sk);
				goto begin;
			}
			goto out;
		}
	}
	/*
	 * if the nulls value we got at the end of this lookup is
	 * not the expected one, we must restart lookup.
	 * We probably met an item that was moved to another chain.
	 */
	if (get_nulls_value(node) != slot)
		goto begin;

begintw:
	/* Must check for a TIME_WAIT'er before going to listener hash. */
	sk_nulls_for_each_rcu(sk, node, &head->twchain) {
		if (INET_TW_MATCH(sk, net, hash, acookie,
					saddr, daddr, ports, dif)) {
			/* No reference obtainable: report "not found". */
			if (unlikely(!atomic_inc_not_zero(&sk->sk_refcnt))) {
				sk = NULL;
				goto out;
			}
			/* Same re-validation as for the established chain. */
			if (unlikely(!INET_TW_MATCH(sk, net, hash, acookie,
				 saddr, daddr, ports, dif))) {
				sock_put(sk);
				goto begintw;
			}
			goto out;
		}
	}
	/*
	 * if the nulls value we got at the end of this lookup is
	 * not the expected one, we must restart lookup.
	 * We probably met an item that was moved to another chain.
	 */
	if (get_nulls_value(node) != slot)
		goto begintw;
	sk = NULL;
out:
	rcu_read_unlock();
	return sk;
}
EXPORT_SYMBOL_GPL(__inet_lookup_established);
 | 289 |  | 
/*
 * Check that the connection identity @sk would have with local port @lport
 * is not already present in the established hash, and if it is free insert
 * @sk into the hash under that identity.
 *
 * A matching TIME-WAIT socket does not necessarily block the port:
 * twsk_unique() decides whether it may be taken over.  When it is, the
 * TIME-WAIT socket is unhashed here and either handed back through @twp
 * (if @twp is non-NULL) or descheduled and released.
 *
 * Returns 0 when @sk was hashed, -EADDRNOTAVAIL when the identity is taken.
 *
 * called with local bh disabled
 */
static int __inet_check_established(struct inet_timewait_death_row *death_row,
				    struct sock *sk, __u16 lport,
				    struct inet_timewait_sock **twp)
{
	struct inet_hashinfo *hinfo = death_row->hashinfo;
	struct inet_sock *inet = inet_sk(sk);
	/*
	 * daddr/saddr are filled the way __inet_lookup_established() receives
	 * them: daddr is this socket's receive address, saddr is its peer.
	 */
	__be32 daddr = inet->inet_rcv_saddr;
	__be32 saddr = inet->inet_daddr;
	int dif = sk->sk_bound_dev_if;
	INET_ADDR_COOKIE(acookie, saddr, daddr)
	const __portpair ports = INET_COMBINED_PORTS(inet->inet_dport, lport);
	struct net *net = sock_net(sk);
	unsigned int hash = inet_ehashfn(net, daddr, lport,
					 saddr, inet->inet_dport);
	struct inet_ehash_bucket *head = inet_ehash_bucket(hinfo, hash);
	spinlock_t *lock = inet_ehash_lockp(hinfo, hash);
	struct sock *sk2;
	const struct hlist_nulls_node *node;
	struct inet_timewait_sock *tw;
	int twrefcnt = 0;

	spin_lock(lock);

	/* Check TIME-WAIT sockets first. */
	sk_nulls_for_each(sk2, node, &head->twchain) {
		tw = inet_twsk(sk2);

		if (INET_TW_MATCH(sk2, net, hash, acookie,
					saddr, daddr, ports, dif)) {
			/* On "unique", tw stays set to the matched entry. */
			if (twsk_unique(sk, sk2, twp))
				goto unique;
			else
				goto not_unique;
		}
	}
	/* No TIME-WAIT match: nothing to recycle. */
	tw = NULL;

	/* And established part... */
	sk_nulls_for_each(sk2, node, &head->chain) {
		if (INET_MATCH(sk2, net, hash, acookie,
					saddr, daddr, ports, dif))
			goto not_unique;
	}

unique:
	/* Must record num and sport now. Otherwise we will see
	 * in hash table socket with a funny identity. */
	inet->inet_num = lport;
	inet->inet_sport = htons(lport);
	sk->sk_hash = hash;
	WARN_ON(!sk_unhashed(sk));
	__sk_nulls_add_node_rcu(sk, &head->chain);
	if (tw) {
		/* Take the recycled TIME-WAIT socket out of the hash. */
		twrefcnt = inet_twsk_unhash(tw);
		NET_INC_STATS_BH(net, LINUX_MIB_TIMEWAITRECYCLED);
	}
	spin_unlock(lock);
	/* Drop the reference only after the bucket lock has been released. */
	if (twrefcnt)
		inet_twsk_put(tw);
	sock_prot_inuse_add(sock_net(sk), sk->sk_prot, 1);

	if (twp) {
		/* Caller wants the TIME-WAIT socket (possibly NULL) back. */
		*twp = tw;
	} else if (tw) {
		/* Silly. Should hash-dance instead... */
		inet_twsk_deschedule(tw, death_row);

		inet_twsk_put(tw);
	}
	return 0;

not_unique:
	spin_unlock(lock);
	return -EADDRNOTAVAIL;
}
 | 366 |  | 
 | 367 | static inline u32 inet_sk_port_offset(const struct sock *sk) | 
 | 368 | { | 
 | 369 | 	const struct inet_sock *inet = inet_sk(sk); | 
| Eric Dumazet | c720c7e | 2009-10-15 06:30:45 +0000 | [diff] [blame] | 370 | 	return secure_ipv4_port_ephemeral(inet->inet_rcv_saddr, | 
 | 371 | 					  inet->inet_daddr, | 
 | 372 | 					  inet->inet_dport); | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 373 | } | 
 | 374 |  | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 375 | int __inet_hash_nolisten(struct sock *sk, struct inet_timewait_sock *tw) | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 376 | { | 
| Pavel Emelyanov | 39d8cda | 2008-03-22 16:50:58 -0700 | [diff] [blame] | 377 | 	struct inet_hashinfo *hashinfo = sk->sk_prot->h.hashinfo; | 
| Eric Dumazet | 3ab5aee | 2008-11-16 19:40:17 -0800 | [diff] [blame] | 378 | 	struct hlist_nulls_head *list; | 
| Eric Dumazet | 9db66bd | 2008-11-20 20:39:09 -0800 | [diff] [blame] | 379 | 	spinlock_t *lock; | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 380 | 	struct inet_ehash_bucket *head; | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 381 | 	int twrefcnt = 0; | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 382 |  | 
| Ilpo Järvinen | 547b792 | 2008-07-25 21:43:18 -0700 | [diff] [blame] | 383 | 	WARN_ON(!sk_unhashed(sk)); | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 384 |  | 
 | 385 | 	sk->sk_hash = inet_sk_ehashfn(sk); | 
 | 386 | 	head = inet_ehash_bucket(hashinfo, sk->sk_hash); | 
 | 387 | 	list = &head->chain; | 
 | 388 | 	lock = inet_ehash_lockp(hashinfo, sk->sk_hash); | 
 | 389 |  | 
| Eric Dumazet | 9db66bd | 2008-11-20 20:39:09 -0800 | [diff] [blame] | 390 | 	spin_lock(lock); | 
| Eric Dumazet | 3ab5aee | 2008-11-16 19:40:17 -0800 | [diff] [blame] | 391 | 	__sk_nulls_add_node_rcu(sk, list); | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 392 | 	if (tw) { | 
 | 393 | 		WARN_ON(sk->sk_hash != tw->tw_hash); | 
 | 394 | 		twrefcnt = inet_twsk_unhash(tw); | 
 | 395 | 	} | 
| Eric Dumazet | 9db66bd | 2008-11-20 20:39:09 -0800 | [diff] [blame] | 396 | 	spin_unlock(lock); | 
| Pavel Emelyanov | c29a0bc | 2008-03-31 19:41:46 -0700 | [diff] [blame] | 397 | 	sock_prot_inuse_add(sock_net(sk), sk->sk_prot, 1); | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 398 | 	return twrefcnt; | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 399 | } | 
 | 400 | EXPORT_SYMBOL_GPL(__inet_hash_nolisten); | 
 | 401 |  | 
| Arnaldo Carvalho de Melo | ab1e0a1 | 2008-02-03 04:06:04 -0800 | [diff] [blame] | 402 | static void __inet_hash(struct sock *sk) | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 403 | { | 
| Pavel Emelyanov | 39d8cda | 2008-03-22 16:50:58 -0700 | [diff] [blame] | 404 | 	struct inet_hashinfo *hashinfo = sk->sk_prot->h.hashinfo; | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 405 | 	struct inet_listen_hashbucket *ilb; | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 406 |  | 
 | 407 | 	if (sk->sk_state != TCP_LISTEN) { | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 408 | 		__inet_hash_nolisten(sk, NULL); | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 409 | 		return; | 
 | 410 | 	} | 
 | 411 |  | 
| Ilpo Järvinen | 547b792 | 2008-07-25 21:43:18 -0700 | [diff] [blame] | 412 | 	WARN_ON(!sk_unhashed(sk)); | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 413 | 	ilb = &hashinfo->listening_hash[inet_sk_listen_hashfn(sk)]; | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 414 |  | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 415 | 	spin_lock(&ilb->lock); | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 416 | 	__sk_nulls_add_node_rcu(sk, &ilb->head); | 
| Pavel Emelyanov | c29a0bc | 2008-03-31 19:41:46 -0700 | [diff] [blame] | 417 | 	sock_prot_inuse_add(sock_net(sk), sk->sk_prot, 1); | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 418 | 	spin_unlock(&ilb->lock); | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 419 | } | 
| Arnaldo Carvalho de Melo | ab1e0a1 | 2008-02-03 04:06:04 -0800 | [diff] [blame] | 420 |  | 
 | 421 | void inet_hash(struct sock *sk) | 
 | 422 | { | 
 | 423 | 	if (sk->sk_state != TCP_CLOSE) { | 
 | 424 | 		local_bh_disable(); | 
 | 425 | 		__inet_hash(sk); | 
 | 426 | 		local_bh_enable(); | 
 | 427 | 	} | 
 | 428 | } | 
 | 429 | EXPORT_SYMBOL_GPL(inet_hash); | 
 | 430 |  | 
 | 431 | void inet_unhash(struct sock *sk) | 
 | 432 | { | 
| Pavel Emelyanov | 39d8cda | 2008-03-22 16:50:58 -0700 | [diff] [blame] | 433 | 	struct inet_hashinfo *hashinfo = sk->sk_prot->h.hashinfo; | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 434 | 	spinlock_t *lock; | 
 | 435 | 	int done; | 
| Arnaldo Carvalho de Melo | ab1e0a1 | 2008-02-03 04:06:04 -0800 | [diff] [blame] | 436 |  | 
 | 437 | 	if (sk_unhashed(sk)) | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 438 | 		return; | 
| Arnaldo Carvalho de Melo | ab1e0a1 | 2008-02-03 04:06:04 -0800 | [diff] [blame] | 439 |  | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 440 | 	if (sk->sk_state == TCP_LISTEN) | 
 | 441 | 		lock = &hashinfo->listening_hash[inet_sk_listen_hashfn(sk)].lock; | 
 | 442 | 	else | 
 | 443 | 		lock = inet_ehash_lockp(hashinfo, sk->sk_hash); | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 444 |  | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 445 | 	spin_lock_bh(lock); | 
 | 446 | 	done =__sk_nulls_del_node_init_rcu(sk); | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 447 | 	if (done) | 
 | 448 | 		sock_prot_inuse_add(sock_net(sk), sk->sk_prot, -1); | 
| Eric Dumazet | 920de80 | 2008-11-24 00:09:29 -0800 | [diff] [blame] | 449 | 	spin_unlock_bh(lock); | 
| Arnaldo Carvalho de Melo | ab1e0a1 | 2008-02-03 04:06:04 -0800 | [diff] [blame] | 450 | } | 
 | 451 | EXPORT_SYMBOL_GPL(inet_unhash); | 
| Pavel Emelyanov | 152da81 | 2007-12-20 15:31:33 -0800 | [diff] [blame] | 452 |  | 
| Pavel Emelyanov | 5ee31fc | 2008-01-31 05:04:45 -0800 | [diff] [blame] | 453 | int __inet_hash_connect(struct inet_timewait_death_row *death_row, | 
| Pavel Emelyanov | 5d8c0aa | 2008-02-05 03:14:44 -0800 | [diff] [blame] | 454 | 		struct sock *sk, u32 port_offset, | 
| Pavel Emelyanov | 5ee31fc | 2008-01-31 05:04:45 -0800 | [diff] [blame] | 455 | 		int (*check_established)(struct inet_timewait_death_row *, | 
 | 456 | 			struct sock *, __u16, struct inet_timewait_sock **), | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 457 | 		int (*hash)(struct sock *sk, struct inet_timewait_sock *twp)) | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 458 | { | 
 | 459 | 	struct inet_hashinfo *hinfo = death_row->hashinfo; | 
| Eric Dumazet | c720c7e | 2009-10-15 06:30:45 +0000 | [diff] [blame] | 460 | 	const unsigned short snum = inet_sk(sk)->inet_num; | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 461 | 	struct inet_bind_hashbucket *head; | 
 | 462 | 	struct inet_bind_bucket *tb; | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 463 | 	int ret; | 
| YOSHIFUJI Hideaki | 3b1e0a6 | 2008-03-26 02:26:21 +0900 | [diff] [blame] | 464 | 	struct net *net = sock_net(sk); | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 465 | 	int twrefcnt = 1; | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 466 |  | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 467 | 	if (!snum) { | 
| Stephen Hemminger | 227b60f | 2007-10-10 17:30:46 -0700 | [diff] [blame] | 468 | 		int i, remaining, low, high, port; | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 469 | 		static u32 hint; | 
| Pavel Emelyanov | 5d8c0aa | 2008-02-05 03:14:44 -0800 | [diff] [blame] | 470 | 		u32 offset = hint + port_offset; | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 471 | 		struct hlist_node *node; | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 472 | 		struct inet_timewait_sock *tw = NULL; | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 473 |  | 
| Stephen Hemminger | 227b60f | 2007-10-10 17:30:46 -0700 | [diff] [blame] | 474 | 		inet_get_local_port_range(&low, &high); | 
| Anton Arapov | a25de53 | 2007-10-18 22:00:17 -0700 | [diff] [blame] | 475 | 		remaining = (high - low) + 1; | 
| Stephen Hemminger | 227b60f | 2007-10-10 17:30:46 -0700 | [diff] [blame] | 476 |  | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 477 | 		local_bh_disable(); | 
| Stephen Hemminger | 227b60f | 2007-10-10 17:30:46 -0700 | [diff] [blame] | 478 | 		for (i = 1; i <= remaining; i++) { | 
 | 479 | 			port = low + (i + offset) % remaining; | 
| Amerigo Wang | e3826f1 | 2010-05-05 00:27:06 +0000 | [diff] [blame] | 480 | 			if (inet_is_reserved_local_port(port)) | 
 | 481 | 				continue; | 
| Pavel Emelyanov | 7f635ab | 2008-06-16 17:12:49 -0700 | [diff] [blame] | 482 | 			head = &hinfo->bhash[inet_bhashfn(net, port, | 
 | 483 | 					hinfo->bhash_size)]; | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 484 | 			spin_lock(&head->lock); | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 485 |  | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 486 | 			/* Does not bother with rcv_saddr checks, | 
 | 487 | 			 * because the established check is already | 
 | 488 | 			 * unique enough. | 
 | 489 | 			 */ | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 490 | 			inet_bind_bucket_for_each(tb, node, &head->chain) { | 
| Octavian Purdila | 09ad9bc | 2009-11-25 15:14:13 -0800 | [diff] [blame] | 491 | 				if (net_eq(ib_net(tb), net) && | 
 | 492 | 				    tb->port == port) { | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 493 | 					if (tb->fastreuse >= 0) | 
 | 494 | 						goto next_port; | 
| Evgeniy Polyakov | a9d8f91 | 2009-01-19 16:46:02 -0800 | [diff] [blame] | 495 | 					WARN_ON(hlist_empty(&tb->owners)); | 
| Pavel Emelyanov | 5ee31fc | 2008-01-31 05:04:45 -0800 | [diff] [blame] | 496 | 					if (!check_established(death_row, sk, | 
 | 497 | 								port, &tw)) | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 498 | 						goto ok; | 
 | 499 | 					goto next_port; | 
 | 500 | 				} | 
 | 501 | 			} | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 502 |  | 
| Pavel Emelyanov | 941b1d2 | 2008-01-31 05:05:50 -0800 | [diff] [blame] | 503 | 			tb = inet_bind_bucket_create(hinfo->bind_bucket_cachep, | 
 | 504 | 					net, head, port); | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 505 | 			if (!tb) { | 
 | 506 | 				spin_unlock(&head->lock); | 
 | 507 | 				break; | 
 | 508 | 			} | 
 | 509 | 			tb->fastreuse = -1; | 
 | 510 | 			goto ok; | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 511 |  | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 512 | 		next_port: | 
 | 513 | 			spin_unlock(&head->lock); | 
 | 514 | 		} | 
 | 515 | 		local_bh_enable(); | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 516 |  | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 517 | 		return -EADDRNOTAVAIL; | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 518 |  | 
 | 519 | ok: | 
 | 520 | 		hint += i; | 
 | 521 |  | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 522 | 		/* Head lock still held and bh's disabled */ | 
 | 523 | 		inet_bind_hash(sk, tb, port); | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 524 | 		if (sk_unhashed(sk)) { | 
| Eric Dumazet | c720c7e | 2009-10-15 06:30:45 +0000 | [diff] [blame] | 525 | 			inet_sk(sk)->inet_sport = htons(port); | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 526 | 			twrefcnt += hash(sk, tw); | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 527 | 		} | 
| Eric Dumazet | 3cdaeda | 2009-12-04 03:47:42 +0000 | [diff] [blame] | 528 | 		if (tw) | 
 | 529 | 			twrefcnt += inet_twsk_bind_unhash(tw, hinfo); | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 530 | 		spin_unlock(&head->lock); | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 531 |  | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 532 | 		if (tw) { | 
 | 533 | 			inet_twsk_deschedule(tw, death_row); | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 534 | 			while (twrefcnt) { | 
 | 535 | 				twrefcnt--; | 
 | 536 | 				inet_twsk_put(tw); | 
 | 537 | 			} | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 538 | 		} | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 539 |  | 
 | 540 | 		ret = 0; | 
 | 541 | 		goto out; | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 542 | 	} | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 543 |  | 
| Pavel Emelyanov | 7f635ab | 2008-06-16 17:12:49 -0700 | [diff] [blame] | 544 | 	head = &hinfo->bhash[inet_bhashfn(net, snum, hinfo->bhash_size)]; | 
| YOSHIFUJI Hideaki | e905a9e | 2007-02-09 23:24:47 +0900 | [diff] [blame] | 545 | 	tb  = inet_csk(sk)->icsk_bind_hash; | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 546 | 	spin_lock_bh(&head->lock); | 
 | 547 | 	if (sk_head(&tb->owners) == sk && !sk->sk_bind_node.next) { | 
| Eric Dumazet | 9327f70 | 2009-12-04 03:46:54 +0000 | [diff] [blame] | 548 | 		hash(sk, NULL); | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 549 | 		spin_unlock_bh(&head->lock); | 
 | 550 | 		return 0; | 
 | 551 | 	} else { | 
 | 552 | 		spin_unlock(&head->lock); | 
 | 553 | 		/* No definite answer... Walk to established hash table */ | 
| Pavel Emelyanov | 5ee31fc | 2008-01-31 05:04:45 -0800 | [diff] [blame] | 554 | 		ret = check_established(death_row, sk, snum, NULL); | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 555 | out: | 
 | 556 | 		local_bh_enable(); | 
 | 557 | 		return ret; | 
 | 558 | 	} | 
 | 559 | } | 
| Pavel Emelyanov | 5ee31fc | 2008-01-31 05:04:45 -0800 | [diff] [blame] | 560 |  | 
 | 561 | /* | 
 | 562 |  * Bind a port for a connect operation and hash it. | 
 | 563 |  */ | 
 | 564 | int inet_hash_connect(struct inet_timewait_death_row *death_row, | 
 | 565 | 		      struct sock *sk) | 
 | 566 | { | 
| Pavel Emelyanov | 5d8c0aa | 2008-02-05 03:14:44 -0800 | [diff] [blame] | 567 | 	return __inet_hash_connect(death_row, sk, inet_sk_port_offset(sk), | 
| Pavel Emelyanov | 5ee31fc | 2008-01-31 05:04:45 -0800 | [diff] [blame] | 568 | 			__inet_check_established, __inet_hash_nolisten); | 
 | 569 | } | 
| Arnaldo Carvalho de Melo | a7f5e7f | 2005-12-13 23:25:31 -0800 | [diff] [blame] | 570 | EXPORT_SYMBOL_GPL(inet_hash_connect); | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 571 |  | 
 | 572 | void inet_hashinfo_init(struct inet_hashinfo *h) | 
 | 573 | { | 
 | 574 | 	int i; | 
 | 575 |  | 
| Eric Dumazet | 24dd1fa | 2009-02-01 12:31:33 -0800 | [diff] [blame] | 576 | 	atomic_set(&h->bsockets, 0); | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 577 | 	for (i = 0; i < INET_LHTABLE_SIZE; i++) { | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 578 | 		spin_lock_init(&h->listening_hash[i].lock); | 
| Eric Dumazet | c25eb3b | 2008-11-23 17:22:55 -0800 | [diff] [blame] | 579 | 		INIT_HLIST_NULLS_HEAD(&h->listening_hash[i].head, | 
 | 580 | 				      i + LISTENING_NULLS_BASE); | 
 | 581 | 		} | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 582 | } | 
| Eric Dumazet | 5caea4e | 2008-11-20 00:40:07 -0800 | [diff] [blame] | 583 | EXPORT_SYMBOL_GPL(inet_hashinfo_init); |