net: Use a percpu_counter for sockets_allocated
Instead of using one atomic_t per protocol, use a percpu_counter
for "sockets_allocated", to reduce cache line contention on
heavy duty network servers.
Note : We revert commit (248969ae31
net: af_unix can make unix_nr_socks visbile in /proc),
since it is not anymore used after sock_prot_inuse_add() addition
Signed-off-by: Eric Dumazet <dada1@cosmosbay.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
This commit is contained in:
parent
c1b56878fb
commit
1748376b66
11 changed files with 29 additions and 16 deletions
|
@ -138,6 +138,7 @@ void sctp_write_space(struct sock *sk);
|
||||||
unsigned int sctp_poll(struct file *file, struct socket *sock,
|
unsigned int sctp_poll(struct file *file, struct socket *sock,
|
||||||
poll_table *wait);
|
poll_table *wait);
|
||||||
void sctp_sock_rfree(struct sk_buff *skb);
|
void sctp_sock_rfree(struct sk_buff *skb);
|
||||||
|
extern struct percpu_counter sctp_sockets_allocated;
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* sctp/primitive.c
|
* sctp/primitive.c
|
||||||
|
|
|
@ -649,7 +649,7 @@ struct proto {
|
||||||
/* Memory pressure */
|
/* Memory pressure */
|
||||||
void (*enter_memory_pressure)(struct sock *sk);
|
void (*enter_memory_pressure)(struct sock *sk);
|
||||||
atomic_t *memory_allocated; /* Current allocated memory. */
|
atomic_t *memory_allocated; /* Current allocated memory. */
|
||||||
atomic_t *sockets_allocated; /* Current number of sockets. */
|
struct percpu_counter *sockets_allocated; /* Current number of sockets. */
|
||||||
/*
|
/*
|
||||||
* Pressure flag: try to collapse.
|
* Pressure flag: try to collapse.
|
||||||
* Technical note: it is used by multiple contexts non atomically.
|
* Technical note: it is used by multiple contexts non atomically.
|
||||||
|
|
|
@ -238,7 +238,7 @@ extern int sysctl_tcp_slow_start_after_idle;
|
||||||
extern int sysctl_tcp_max_ssthresh;
|
extern int sysctl_tcp_max_ssthresh;
|
||||||
|
|
||||||
extern atomic_t tcp_memory_allocated;
|
extern atomic_t tcp_memory_allocated;
|
||||||
extern atomic_t tcp_sockets_allocated;
|
extern struct percpu_counter tcp_sockets_allocated;
|
||||||
extern int tcp_memory_pressure;
|
extern int tcp_memory_pressure;
|
||||||
|
|
||||||
/*
|
/*
|
||||||
|
|
|
@ -1071,7 +1071,7 @@ struct sock *sk_clone(const struct sock *sk, const gfp_t priority)
|
||||||
newsk->sk_sleep = NULL;
|
newsk->sk_sleep = NULL;
|
||||||
|
|
||||||
if (newsk->sk_prot->sockets_allocated)
|
if (newsk->sk_prot->sockets_allocated)
|
||||||
atomic_inc(newsk->sk_prot->sockets_allocated);
|
percpu_counter_inc(newsk->sk_prot->sockets_allocated);
|
||||||
}
|
}
|
||||||
out:
|
out:
|
||||||
return newsk;
|
return newsk;
|
||||||
|
@ -1463,8 +1463,12 @@ int __sk_mem_schedule(struct sock *sk, int size, int kind)
|
||||||
}
|
}
|
||||||
|
|
||||||
if (prot->memory_pressure) {
|
if (prot->memory_pressure) {
|
||||||
if (!*prot->memory_pressure ||
|
int alloc;
|
||||||
prot->sysctl_mem[2] > atomic_read(prot->sockets_allocated) *
|
|
||||||
|
if (!*prot->memory_pressure)
|
||||||
|
return 1;
|
||||||
|
alloc = percpu_counter_read_positive(prot->sockets_allocated);
|
||||||
|
if (prot->sysctl_mem[2] > alloc *
|
||||||
sk_mem_pages(sk->sk_wmem_queued +
|
sk_mem_pages(sk->sk_wmem_queued +
|
||||||
atomic_read(&sk->sk_rmem_alloc) +
|
atomic_read(&sk->sk_rmem_alloc) +
|
||||||
sk->sk_forward_alloc))
|
sk->sk_forward_alloc))
|
||||||
|
|
|
@ -55,7 +55,8 @@ static int sockstat_seq_show(struct seq_file *seq, void *v)
|
||||||
seq_printf(seq, "TCP: inuse %d orphan %d tw %d alloc %d mem %d\n",
|
seq_printf(seq, "TCP: inuse %d orphan %d tw %d alloc %d mem %d\n",
|
||||||
sock_prot_inuse_get(net, &tcp_prot),
|
sock_prot_inuse_get(net, &tcp_prot),
|
||||||
atomic_read(&tcp_orphan_count),
|
atomic_read(&tcp_orphan_count),
|
||||||
tcp_death_row.tw_count, atomic_read(&tcp_sockets_allocated),
|
tcp_death_row.tw_count,
|
||||||
|
(int)percpu_counter_sum_positive(&tcp_sockets_allocated),
|
||||||
atomic_read(&tcp_memory_allocated));
|
atomic_read(&tcp_memory_allocated));
|
||||||
seq_printf(seq, "UDP: inuse %d mem %d\n",
|
seq_printf(seq, "UDP: inuse %d mem %d\n",
|
||||||
sock_prot_inuse_get(net, &udp_prot),
|
sock_prot_inuse_get(net, &udp_prot),
|
||||||
|
|
|
@ -290,9 +290,12 @@ EXPORT_SYMBOL(sysctl_tcp_rmem);
|
||||||
EXPORT_SYMBOL(sysctl_tcp_wmem);
|
EXPORT_SYMBOL(sysctl_tcp_wmem);
|
||||||
|
|
||||||
atomic_t tcp_memory_allocated; /* Current allocated memory. */
|
atomic_t tcp_memory_allocated; /* Current allocated memory. */
|
||||||
atomic_t tcp_sockets_allocated; /* Current number of TCP sockets. */
|
|
||||||
|
|
||||||
EXPORT_SYMBOL(tcp_memory_allocated);
|
EXPORT_SYMBOL(tcp_memory_allocated);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Current number of TCP sockets.
|
||||||
|
*/
|
||||||
|
struct percpu_counter tcp_sockets_allocated;
|
||||||
EXPORT_SYMBOL(tcp_sockets_allocated);
|
EXPORT_SYMBOL(tcp_sockets_allocated);
|
||||||
|
|
||||||
/*
|
/*
|
||||||
|
@ -2685,6 +2688,7 @@ void __init tcp_init(void)
|
||||||
|
|
||||||
BUILD_BUG_ON(sizeof(struct tcp_skb_cb) > sizeof(skb->cb));
|
BUILD_BUG_ON(sizeof(struct tcp_skb_cb) > sizeof(skb->cb));
|
||||||
|
|
||||||
|
percpu_counter_init(&tcp_sockets_allocated, 0);
|
||||||
tcp_hashinfo.bind_bucket_cachep =
|
tcp_hashinfo.bind_bucket_cachep =
|
||||||
kmem_cache_create("tcp_bind_bucket",
|
kmem_cache_create("tcp_bind_bucket",
|
||||||
sizeof(struct inet_bind_bucket), 0,
|
sizeof(struct inet_bind_bucket), 0,
|
||||||
|
|
|
@ -1797,7 +1797,7 @@ static int tcp_v4_init_sock(struct sock *sk)
|
||||||
sk->sk_sndbuf = sysctl_tcp_wmem[1];
|
sk->sk_sndbuf = sysctl_tcp_wmem[1];
|
||||||
sk->sk_rcvbuf = sysctl_tcp_rmem[1];
|
sk->sk_rcvbuf = sysctl_tcp_rmem[1];
|
||||||
|
|
||||||
atomic_inc(&tcp_sockets_allocated);
|
percpu_counter_inc(&tcp_sockets_allocated);
|
||||||
|
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
@ -1845,7 +1845,7 @@ void tcp_v4_destroy_sock(struct sock *sk)
|
||||||
sk->sk_sndmsg_page = NULL;
|
sk->sk_sndmsg_page = NULL;
|
||||||
}
|
}
|
||||||
|
|
||||||
atomic_dec(&tcp_sockets_allocated);
|
percpu_counter_dec(&tcp_sockets_allocated);
|
||||||
}
|
}
|
||||||
|
|
||||||
EXPORT_SYMBOL(tcp_v4_destroy_sock);
|
EXPORT_SYMBOL(tcp_v4_destroy_sock);
|
||||||
|
|
|
@ -1830,7 +1830,7 @@ static int tcp_v6_init_sock(struct sock *sk)
|
||||||
sk->sk_sndbuf = sysctl_tcp_wmem[1];
|
sk->sk_sndbuf = sysctl_tcp_wmem[1];
|
||||||
sk->sk_rcvbuf = sysctl_tcp_rmem[1];
|
sk->sk_rcvbuf = sysctl_tcp_rmem[1];
|
||||||
|
|
||||||
atomic_inc(&tcp_sockets_allocated);
|
percpu_counter_inc(&tcp_sockets_allocated);
|
||||||
|
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
|
|
@ -102,6 +102,8 @@ struct sock *sctp_get_ctl_sock(void)
|
||||||
/* Set up the proc fs entry for the SCTP protocol. */
|
/* Set up the proc fs entry for the SCTP protocol. */
|
||||||
static __init int sctp_proc_init(void)
|
static __init int sctp_proc_init(void)
|
||||||
{
|
{
|
||||||
|
if (percpu_counter_init(&sctp_sockets_allocated, 0))
|
||||||
|
goto out_nomem;
|
||||||
#ifdef CONFIG_PROC_FS
|
#ifdef CONFIG_PROC_FS
|
||||||
if (!proc_net_sctp) {
|
if (!proc_net_sctp) {
|
||||||
struct proc_dir_entry *ent;
|
struct proc_dir_entry *ent;
|
||||||
|
@ -110,7 +112,7 @@ static __init int sctp_proc_init(void)
|
||||||
ent->owner = THIS_MODULE;
|
ent->owner = THIS_MODULE;
|
||||||
proc_net_sctp = ent;
|
proc_net_sctp = ent;
|
||||||
} else
|
} else
|
||||||
goto out_nomem;
|
goto out_free_percpu;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (sctp_snmp_proc_init())
|
if (sctp_snmp_proc_init())
|
||||||
|
@ -135,6 +137,8 @@ static __init int sctp_proc_init(void)
|
||||||
proc_net_sctp = NULL;
|
proc_net_sctp = NULL;
|
||||||
remove_proc_entry("sctp", init_net.proc_net);
|
remove_proc_entry("sctp", init_net.proc_net);
|
||||||
}
|
}
|
||||||
|
out_free_percpu:
|
||||||
|
percpu_counter_destroy(&sctp_sockets_allocated);
|
||||||
out_nomem:
|
out_nomem:
|
||||||
return -ENOMEM;
|
return -ENOMEM;
|
||||||
#else
|
#else
|
||||||
|
|
|
@ -114,7 +114,7 @@ extern int sysctl_sctp_wmem[3];
|
||||||
|
|
||||||
static int sctp_memory_pressure;
|
static int sctp_memory_pressure;
|
||||||
static atomic_t sctp_memory_allocated;
|
static atomic_t sctp_memory_allocated;
|
||||||
static atomic_t sctp_sockets_allocated;
|
struct percpu_counter sctp_sockets_allocated;
|
||||||
|
|
||||||
static void sctp_enter_memory_pressure(struct sock *sk)
|
static void sctp_enter_memory_pressure(struct sock *sk)
|
||||||
{
|
{
|
||||||
|
@ -3613,7 +3613,7 @@ SCTP_STATIC int sctp_init_sock(struct sock *sk)
|
||||||
sp->hmac = NULL;
|
sp->hmac = NULL;
|
||||||
|
|
||||||
SCTP_DBG_OBJCNT_INC(sock);
|
SCTP_DBG_OBJCNT_INC(sock);
|
||||||
atomic_inc(&sctp_sockets_allocated);
|
percpu_counter_inc(&sctp_sockets_allocated);
|
||||||
|
|
||||||
local_bh_disable();
|
local_bh_disable();
|
||||||
sock_prot_inuse_add(sock_net(sk), sk->sk_prot, 1);
|
sock_prot_inuse_add(sock_net(sk), sk->sk_prot, 1);
|
||||||
|
@ -3632,7 +3632,7 @@ SCTP_STATIC void sctp_destroy_sock(struct sock *sk)
|
||||||
/* Release our hold on the endpoint. */
|
/* Release our hold on the endpoint. */
|
||||||
ep = sctp_sk(sk)->ep;
|
ep = sctp_sk(sk)->ep;
|
||||||
sctp_endpoint_free(ep);
|
sctp_endpoint_free(ep);
|
||||||
atomic_dec(&sctp_sockets_allocated);
|
percpu_counter_dec(&sctp_sockets_allocated);
|
||||||
local_bh_disable();
|
local_bh_disable();
|
||||||
sock_prot_inuse_add(sock_net(sk), sk->sk_prot, -1);
|
sock_prot_inuse_add(sock_net(sk), sk->sk_prot, -1);
|
||||||
local_bh_enable();
|
local_bh_enable();
|
||||||
|
|
|
@ -571,7 +571,6 @@ static const struct proto_ops unix_seqpacket_ops = {
|
||||||
static struct proto unix_proto = {
|
static struct proto unix_proto = {
|
||||||
.name = "UNIX",
|
.name = "UNIX",
|
||||||
.owner = THIS_MODULE,
|
.owner = THIS_MODULE,
|
||||||
.sockets_allocated = &unix_nr_socks,
|
|
||||||
.obj_size = sizeof(struct unix_sock),
|
.obj_size = sizeof(struct unix_sock),
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue