nfsd: dynamically allocate DRC entries

The existing code keeps a fixed-size cache of 1024 entries. This is much
too small for a busy server, and wastes memory on an idle one.  This
patch changes the code to dynamically allocate and free these cache
entries.

A cap on the number of entries is retained, but it's much larger than
the existing value and now scales with the amount of low memory in the
machine.

Signed-off-by: Jeff Layton <jlayton@redhat.com>
Signed-off-by: J. Bruce Fields <bfields@redhat.com>
This commit is contained in:
Jeff Layton 2013-02-04 08:18:02 -05:00 committed by J. Bruce Fields
parent 0ee0bf7ee5
commit 0338dd1572

View file

@ -10,17 +10,13 @@
#include <linux/slab.h> #include <linux/slab.h>
#include <linux/sunrpc/clnt.h> #include <linux/sunrpc/clnt.h>
#include <linux/highmem.h>
#include "nfsd.h" #include "nfsd.h"
#include "cache.h" #include "cache.h"
/* Size of reply cache. Common values are: #define NFSDDBG_FACILITY NFSDDBG_REPCACHE
* 4.3BSD: 128
* 4.4BSD: 256
* Solaris2: 1024
* DEC Unix: 512-4096
*/
#define CACHESIZE 1024
#define HASHSIZE 64 #define HASHSIZE 64
static struct hlist_head * cache_hash; static struct hlist_head * cache_hash;
@ -28,6 +24,7 @@ static struct list_head lru_head;
static int cache_disabled = 1; static int cache_disabled = 1;
static struct kmem_cache *drc_slab; static struct kmem_cache *drc_slab;
static unsigned int num_drc_entries; static unsigned int num_drc_entries;
static unsigned int max_drc_entries;
/* /*
* Calculate the hash index from an XID. * Calculate the hash index from an XID.
@ -48,6 +45,34 @@ static int nfsd_cache_append(struct svc_rqst *rqstp, struct kvec *vec);
*/ */
static DEFINE_SPINLOCK(cache_lock); static DEFINE_SPINLOCK(cache_lock);
/*
 * Work out the upper bound on the number of DRC entries from the amount
 * of low memory in the machine (total RAM pages minus highmem pages).
 *
 * The bound is 16 * int_sqrt(low pages), shifted left by (PAGE_SHIFT - 10),
 * so it grows with the square root of low memory. Approximate results,
 * worked out for 4k pages:
 *
 *	 64MB:	  8192
 *	128MB:	 11585
 *	256MB:	 16384
 *	512MB:	 23170
 *	  1GB:	 32768
 *	  2GB:	 46340
 *	  4GB:	 65536
 *	  8GB:	 92681
 *	 16GB:	131072
 *
 * The result is clamped to a hard cap of 256k entries. In the worst case
 * each entry will be ~1k, so the figures above also give a rough maximum
 * for the amount of memory used, in k.
 */
static unsigned int
nfsd_cache_size_limit(void)
{
	const unsigned int hard_cap = 256 * 1024;
	unsigned long lowmem_pages = totalram_pages - totalhigh_pages;
	unsigned int scaled;

	/* Square-root scaling, then convert from pages to k-sized units. */
	scaled = (16 * int_sqrt(lowmem_pages)) << (PAGE_SHIFT - 10);

	return min_t(unsigned int, scaled, hard_cap);
}
static struct svc_cacherep * static struct svc_cacherep *
nfsd_reply_cache_alloc(void) nfsd_reply_cache_alloc(void)
{ {
@ -68,6 +93,7 @@ nfsd_reply_cache_free_locked(struct svc_cacherep *rp)
{ {
if (rp->c_type == RC_REPLBUFF) if (rp->c_type == RC_REPLBUFF)
kfree(rp->c_replvec.iov_base); kfree(rp->c_replvec.iov_base);
hlist_del(&rp->c_hash);
list_del(&rp->c_lru); list_del(&rp->c_lru);
--num_drc_entries; --num_drc_entries;
kmem_cache_free(drc_slab, rp); kmem_cache_free(drc_slab, rp);
@ -75,30 +101,18 @@ nfsd_reply_cache_free_locked(struct svc_cacherep *rp)
int nfsd_reply_cache_init(void) int nfsd_reply_cache_init(void)
{ {
int i;
struct svc_cacherep *rp;
drc_slab = kmem_cache_create("nfsd_drc", sizeof(struct svc_cacherep), drc_slab = kmem_cache_create("nfsd_drc", sizeof(struct svc_cacherep),
0, 0, NULL); 0, 0, NULL);
if (!drc_slab) if (!drc_slab)
goto out_nomem; goto out_nomem;
INIT_LIST_HEAD(&lru_head); cache_hash = kcalloc(HASHSIZE, sizeof(struct hlist_head), GFP_KERNEL);
i = CACHESIZE;
num_drc_entries = 0;
while (i) {
rp = nfsd_reply_cache_alloc();
if (!rp)
goto out_nomem;
++num_drc_entries;
list_add(&rp->c_lru, &lru_head);
i--;
}
cache_hash = kcalloc (HASHSIZE, sizeof(struct hlist_head), GFP_KERNEL);
if (!cache_hash) if (!cache_hash)
goto out_nomem; goto out_nomem;
INIT_LIST_HEAD(&lru_head);
max_drc_entries = nfsd_cache_size_limit();
num_drc_entries = 0;
cache_disabled = 0; cache_disabled = 0;
return 0; return 0;
out_nomem: out_nomem:
@ -191,7 +205,7 @@ nfsd_cache_search(struct svc_rqst *rqstp)
int int
nfsd_cache_lookup(struct svc_rqst *rqstp) nfsd_cache_lookup(struct svc_rqst *rqstp)
{ {
struct svc_cacherep *rp; struct svc_cacherep *rp, *found;
__be32 xid = rqstp->rq_xid; __be32 xid = rqstp->rq_xid;
u32 proto = rqstp->rq_prot, u32 proto = rqstp->rq_prot,
vers = rqstp->rq_vers, vers = rqstp->rq_vers,
@ -210,38 +224,48 @@ nfsd_cache_lookup(struct svc_rqst *rqstp)
rtn = RC_DOIT; rtn = RC_DOIT;
rp = nfsd_cache_search(rqstp); rp = nfsd_cache_search(rqstp);
if (rp) { if (rp)
nfsdstats.rchits++; goto found_entry;
/* Try to use the first entry on the LRU */
if (!list_empty(&lru_head)) {
rp = list_first_entry(&lru_head, struct svc_cacherep, c_lru);
if (nfsd_cache_entry_expired(rp) ||
num_drc_entries >= max_drc_entries)
goto setup_entry;
}
spin_unlock(&cache_lock);
rp = nfsd_reply_cache_alloc();
if (!rp) {
dprintk("nfsd: unable to allocate DRC entry!\n");
return RC_DOIT;
}
spin_lock(&cache_lock);
++num_drc_entries;
/*
* Must search again just in case someone inserted one
* after we dropped the lock above.
*/
found = nfsd_cache_search(rqstp);
if (found) {
nfsd_reply_cache_free_locked(rp);
rp = found;
goto found_entry; goto found_entry;
} }
/*
* We're keeping the one we just allocated. Are we now over the
* limit? Prune one off the tip of the LRU in trade for the one we
* just allocated if so.
*/
if (num_drc_entries >= max_drc_entries)
nfsd_reply_cache_free_locked(list_first_entry(&lru_head,
struct svc_cacherep, c_lru));
setup_entry:
nfsdstats.rcmisses++; nfsdstats.rcmisses++;
/* This loop shouldn't take more than a few iterations normally */
{
int safe = 0;
list_for_each_entry(rp, &lru_head, c_lru) {
if (rp->c_state != RC_INPROG)
break;
if (safe++ > CACHESIZE) {
printk("nfsd: loop in repcache LRU list\n");
cache_disabled = 1;
goto out;
}
}
}
/* All entries on the LRU are in-progress. This should not happen */
if (&rp->c_lru == &lru_head) {
static int complaints;
printk(KERN_WARNING "nfsd: all repcache entries locked!\n");
if (++complaints > 5) {
printk(KERN_WARNING "nfsd: disabling repcache.\n");
cache_disabled = 1;
}
goto out;
}
rqstp->rq_cacherep = rp; rqstp->rq_cacherep = rp;
rp->c_state = RC_INPROG; rp->c_state = RC_INPROG;
rp->c_xid = xid; rp->c_xid = xid;
@ -265,6 +289,7 @@ nfsd_cache_lookup(struct svc_rqst *rqstp)
return rtn; return rtn;
found_entry: found_entry:
nfsdstats.rchits++;
/* We found a matching entry which is either in progress or done. */ /* We found a matching entry which is either in progress or done. */
age = jiffies - rp->c_timestamp; age = jiffies - rp->c_timestamp;
lru_put_end(rp); lru_put_end(rp);
@ -295,7 +320,7 @@ nfsd_cache_lookup(struct svc_rqst *rqstp)
break; break;
default: default:
printk(KERN_WARNING "nfsd: bad repcache type %d\n", rp->c_type); printk(KERN_WARNING "nfsd: bad repcache type %d\n", rp->c_type);
rp->c_state = RC_UNUSED; nfsd_reply_cache_free_locked(rp);
} }
goto out; goto out;