Commit 7ae7730f, authored by Patrick McHardy, committed by David S. Miller

[NETFILTER]: nf_conntrack: early_drop improvement

When the maximum number of conntrack entries is reached and a new
one needs to be allocated, conntrack tries to drop an unassured
connection from the same hash bucket the new conntrack would hash
to. Since with a properly sized hash the average number of entries
per bucket is 1, the chances of actually finding one are not very
good. This patch makes it walk the hash, starting at that bucket, until
either an unassured entry is found or at least 8 entries have been checked.

Based on patch by Vasily Averin <vvs@sw.ru>.
Signed-off-by: Patrick McHardy <kaber@trash.net>
Signed-off-by: David S. Miller <davem@davemloft.net>
parent ec59a111
...@@ -377,21 +377,30 @@ nf_conntrack_tuple_taken(const struct nf_conntrack_tuple *tuple, ...@@ -377,21 +377,30 @@ nf_conntrack_tuple_taken(const struct nf_conntrack_tuple *tuple,
} }
EXPORT_SYMBOL_GPL(nf_conntrack_tuple_taken); EXPORT_SYMBOL_GPL(nf_conntrack_tuple_taken);
#define NF_CT_EVICTION_RANGE 8
/* There's a small race here where we may free a just-assured /* There's a small race here where we may free a just-assured
connection. Too bad: we're in trouble anyway. */ connection. Too bad: we're in trouble anyway. */
static int early_drop(struct hlist_head *chain) static int early_drop(unsigned int hash)
{ {
/* Use oldest entry, which is roughly LRU */ /* Use oldest entry, which is roughly LRU */
struct nf_conntrack_tuple_hash *h; struct nf_conntrack_tuple_hash *h;
struct nf_conn *ct = NULL, *tmp; struct nf_conn *ct = NULL, *tmp;
struct hlist_node *n; struct hlist_node *n;
unsigned int i, cnt = 0;
int dropped = 0; int dropped = 0;
read_lock_bh(&nf_conntrack_lock); read_lock_bh(&nf_conntrack_lock);
hlist_for_each_entry(h, n, chain, hnode) { for (i = 0; i < nf_conntrack_htable_size; i++) {
tmp = nf_ct_tuplehash_to_ctrack(h); hlist_for_each_entry(h, n, &nf_conntrack_hash[hash], hnode) {
if (!test_bit(IPS_ASSURED_BIT, &tmp->status)) tmp = nf_ct_tuplehash_to_ctrack(h);
ct = tmp; if (!test_bit(IPS_ASSURED_BIT, &tmp->status))
ct = tmp;
cnt++;
}
if (ct || cnt >= NF_CT_EVICTION_RANGE)
break;
hash = (hash + 1) % nf_conntrack_htable_size;
} }
if (ct) if (ct)
atomic_inc(&ct->ct_general.use); atomic_inc(&ct->ct_general.use);
...@@ -425,8 +434,7 @@ struct nf_conn *nf_conntrack_alloc(const struct nf_conntrack_tuple *orig, ...@@ -425,8 +434,7 @@ struct nf_conn *nf_conntrack_alloc(const struct nf_conntrack_tuple *orig,
if (nf_conntrack_max if (nf_conntrack_max
&& atomic_read(&nf_conntrack_count) > nf_conntrack_max) { && atomic_read(&nf_conntrack_count) > nf_conntrack_max) {
unsigned int hash = hash_conntrack(orig); unsigned int hash = hash_conntrack(orig);
/* Try dropping from this hash chain. */ if (!early_drop(hash)) {
if (!early_drop(&nf_conntrack_hash[hash])) {
atomic_dec(&nf_conntrack_count); atomic_dec(&nf_conntrack_count);
if (net_ratelimit()) if (net_ratelimit())
printk(KERN_WARNING printk(KERN_WARNING
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment