Memory controller: cgroups setup
Setup the memory cgroup and add basic hooks and controls to integrate and work with the cgroup. Signed-off-by: Balbir Singh <balbir@linux.vnet.ibm.com> Cc: Pavel Emelianov <xemul@openvz.org> Cc: Paul Menage <menage@google.com> Cc: Peter Zijlstra <a.p.zijlstra@chello.nl> Cc: "Eric W. Biederman" <ebiederm@xmission.com> Cc: Nick Piggin <nickpiggin@yahoo.com.au> Cc: Kirill Korotaev <dev@sw.ru> Cc: Herbert Poetzl <herbert@13thfloor.at> Cc: David Rientjes <rientjes@google.com> Cc: Vaidyanathan Srinivasan <svaidy@linux.vnet.ibm.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
This commit is contained in:
parent
e552b66170
commit
8cdea7c054
5 changed files with 161 additions and 0 deletions
|
@ -37,3 +37,8 @@ SUBSYS(cpuacct)
|
||||||
|
|
||||||
/* */
|
/* */
|
||||||
|
|
||||||
|
#ifdef CONFIG_CGROUP_MEM_CONT
|
||||||
|
SUBSYS(mem_cgroup)
|
||||||
|
#endif
|
||||||
|
|
||||||
|
/* */
|
||||||
|
|
21
include/linux/memcontrol.h
Normal file
21
include/linux/memcontrol.h
Normal file
|
@ -0,0 +1,21 @@
|
||||||
|
/* memcontrol.h - Memory Controller
|
||||||
|
*
|
||||||
|
* Copyright IBM Corporation, 2007
|
||||||
|
* Author Balbir Singh <balbir@linux.vnet.ibm.com>
|
||||||
|
*
|
||||||
|
* This program is free software; you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation; either version 2 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#ifndef _LINUX_MEMCONTROL_H
|
||||||
|
#define _LINUX_MEMCONTROL_H
|
||||||
|
|
||||||
|
#endif /* _LINUX_MEMCONTROL_H */
|
||||||
|
|
|
@ -397,6 +397,13 @@ config SYSFS_DEPRECATED
|
||||||
If you are using a distro that was released in 2006 or later,
|
If you are using a distro that was released in 2006 or later,
|
||||||
it should be safe to say N here.
|
it should be safe to say N here.
|
||||||
|
|
||||||
|
config CGROUP_MEM_CONT
|
||||||
|
bool "Memory controller for cgroups"
|
||||||
|
depends on CGROUPS && RESOURCE_COUNTERS
|
||||||
|
help
|
||||||
|
Provides a memory controller that manages both page cache and
|
||||||
|
RSS memory.
|
||||||
|
|
||||||
config PROC_PID_CPUSET
|
config PROC_PID_CPUSET
|
||||||
bool "Include legacy /proc/<pid>/cpuset file"
|
bool "Include legacy /proc/<pid>/cpuset file"
|
||||||
depends on CPUSETS
|
depends on CPUSETS
|
||||||
|
|
|
@ -32,4 +32,5 @@ obj-$(CONFIG_FS_XIP) += filemap_xip.o
|
||||||
obj-$(CONFIG_MIGRATION) += migrate.o
|
obj-$(CONFIG_MIGRATION) += migrate.o
|
||||||
obj-$(CONFIG_SMP) += allocpercpu.o
|
obj-$(CONFIG_SMP) += allocpercpu.o
|
||||||
obj-$(CONFIG_QUICKLIST) += quicklist.o
|
obj-$(CONFIG_QUICKLIST) += quicklist.o
|
||||||
|
obj-$(CONFIG_CGROUP_MEM_CONT) += memcontrol.o
|
||||||
|
|
||||||
|
|
127
mm/memcontrol.c
Normal file
127
mm/memcontrol.c
Normal file
|
@ -0,0 +1,127 @@
|
||||||
|
/* memcontrol.c - Memory Controller
|
||||||
|
*
|
||||||
|
* Copyright IBM Corporation, 2007
|
||||||
|
* Author Balbir Singh <balbir@linux.vnet.ibm.com>
|
||||||
|
*
|
||||||
|
* This program is free software; you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation; either version 2 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include <linux/res_counter.h>
|
||||||
|
#include <linux/memcontrol.h>
|
||||||
|
#include <linux/cgroup.h>
|
||||||
|
|
||||||
|
struct cgroup_subsys mem_cgroup_subsys;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* The memory controller data structure. The memory controller controls both
|
||||||
|
* page cache and RSS per cgroup. We would eventually like to provide
|
||||||
|
* statistics based on the statistics developed by Rik Van Riel for clock-pro,
|
||||||
|
* to help the administrator determine what knobs to tune.
|
||||||
|
*
|
||||||
|
* TODO: Add a water mark for the memory controller. Reclaim will begin when
|
||||||
|
* we hit the water mark.
|
||||||
|
*/
|
||||||
|
struct mem_cgroup {
|
||||||
|
struct cgroup_subsys_state css;
|
||||||
|
/*
|
||||||
|
* the counter to account for memory usage
|
||||||
|
*/
|
||||||
|
struct res_counter res;
|
||||||
|
};
|
||||||
|
|
||||||
|
/*
|
||||||
|
* A page_cgroup page is associated with every page descriptor. The
|
||||||
|
* page_cgroup helps us identify information about the cgroup
|
||||||
|
*/
|
||||||
|
struct page_cgroup {
|
||||||
|
struct list_head lru; /* per cgroup LRU list */
|
||||||
|
struct page *page;
|
||||||
|
struct mem_cgroup *mem_cgroup;
|
||||||
|
};
|
||||||
|
|
||||||
|
|
||||||
|
static inline
|
||||||
|
struct mem_cgroup *mem_cgroup_from_cont(struct cgroup *cont)
|
||||||
|
{
|
||||||
|
return container_of(cgroup_subsys_state(cont,
|
||||||
|
mem_cgroup_subsys_id), struct mem_cgroup,
|
||||||
|
css);
|
||||||
|
}
|
||||||
|
|
||||||
|
static ssize_t mem_cgroup_read(struct cgroup *cont, struct cftype *cft,
|
||||||
|
struct file *file, char __user *userbuf, size_t nbytes,
|
||||||
|
loff_t *ppos)
|
||||||
|
{
|
||||||
|
return res_counter_read(&mem_cgroup_from_cont(cont)->res,
|
||||||
|
cft->private, userbuf, nbytes, ppos);
|
||||||
|
}
|
||||||
|
|
||||||
|
static ssize_t mem_cgroup_write(struct cgroup *cont, struct cftype *cft,
|
||||||
|
struct file *file, const char __user *userbuf,
|
||||||
|
size_t nbytes, loff_t *ppos)
|
||||||
|
{
|
||||||
|
return res_counter_write(&mem_cgroup_from_cont(cont)->res,
|
||||||
|
cft->private, userbuf, nbytes, ppos);
|
||||||
|
}
|
||||||
|
|
||||||
|
static struct cftype mem_cgroup_files[] = {
|
||||||
|
{
|
||||||
|
.name = "usage",
|
||||||
|
.private = RES_USAGE,
|
||||||
|
.read = mem_cgroup_read,
|
||||||
|
},
|
||||||
|
{
|
||||||
|
.name = "limit",
|
||||||
|
.private = RES_LIMIT,
|
||||||
|
.write = mem_cgroup_write,
|
||||||
|
.read = mem_cgroup_read,
|
||||||
|
},
|
||||||
|
{
|
||||||
|
.name = "failcnt",
|
||||||
|
.private = RES_FAILCNT,
|
||||||
|
.read = mem_cgroup_read,
|
||||||
|
},
|
||||||
|
};
|
||||||
|
|
||||||
|
static struct cgroup_subsys_state *
|
||||||
|
mem_cgroup_create(struct cgroup_subsys *ss, struct cgroup *cont)
|
||||||
|
{
|
||||||
|
struct mem_cgroup *mem;
|
||||||
|
|
||||||
|
mem = kzalloc(sizeof(struct mem_cgroup), GFP_KERNEL);
|
||||||
|
if (!mem)
|
||||||
|
return -ENOMEM;
|
||||||
|
|
||||||
|
res_counter_init(&mem->res);
|
||||||
|
return &mem->css;
|
||||||
|
}
|
||||||
|
|
||||||
|
static void mem_cgroup_destroy(struct cgroup_subsys *ss,
|
||||||
|
struct cgroup *cont)
|
||||||
|
{
|
||||||
|
kfree(mem_cgroup_from_cont(cont));
|
||||||
|
}
|
||||||
|
|
||||||
|
static int mem_cgroup_populate(struct cgroup_subsys *ss,
|
||||||
|
struct cgroup *cont)
|
||||||
|
{
|
||||||
|
return cgroup_add_files(cont, ss, mem_cgroup_files,
|
||||||
|
ARRAY_SIZE(mem_cgroup_files));
|
||||||
|
}
|
||||||
|
|
||||||
|
struct cgroup_subsys mem_cgroup_subsys = {
|
||||||
|
.name = "memory",
|
||||||
|
.subsys_id = mem_cgroup_subsys_id,
|
||||||
|
.create = mem_cgroup_create,
|
||||||
|
.destroy = mem_cgroup_destroy,
|
||||||
|
.populate = mem_cgroup_populate,
|
||||||
|
.early_init = 0,
|
||||||
|
};
|
Loading…
Reference in a new issue