From: Andrea Righi <arighi@develer.com>
To: Vivek Goyal <vgoyal@redhat.com>
Cc: Balbir Singh <balbir@linux.vnet.ibm.com>,
KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>,
Suleiman Souhlal <suleiman@google.com>,
Andrew Morton <akpm@linux-foundation.org>,
containers@lists.linux-foundation.org,
linux-kernel@vger.kernel.org
Subject: Re: [PATCH 1/2] memcg: dirty pages accounting and limiting infrastructure
Date: Tue, 23 Feb 2010 10:26:58 +0100 [thread overview]
Message-ID: <20100223092658.GA1882@linux> (raw)
In-Reply-To: <20100222155840.GC13823@redhat.com>
On Mon, Feb 22, 2010 at 10:58:40AM -0500, Vivek Goyal wrote:
> On Sun, Feb 21, 2010 at 04:18:44PM +0100, Andrea Righi wrote:
> > Infrastructure to account dirty pages per cgroup + add memory.dirty_bytes limit
> > in cgroupfs.
> >
> > Signed-off-by: Andrea Righi <arighi@develer.com>
> > ---
> > include/linux/memcontrol.h | 31 ++++++
> > mm/memcontrol.c | 218 +++++++++++++++++++++++++++++++++++++++++++-
> > 2 files changed, 248 insertions(+), 1 deletions(-)
> >
> > diff --git a/include/linux/memcontrol.h b/include/linux/memcontrol.h
> > index 1f9b119..ba3fe0d 100644
> > --- a/include/linux/memcontrol.h
> > +++ b/include/linux/memcontrol.h
> > @@ -25,6 +25,16 @@ struct page_cgroup;
> > struct page;
> > struct mm_struct;
> >
> > +/* Cgroup memory statistics items exported to the kernel */
> > +enum memcg_page_stat_item {
> > + MEMCG_NR_FREE_PAGES,
> > + MEMCG_NR_RECLAIMABLE_PAGES,
> > + MEMCG_NR_FILE_DIRTY,
> > + MEMCG_NR_WRITEBACK,
> > + MEMCG_NR_WRITEBACK_TEMP,
> > + MEMCG_NR_UNSTABLE_NFS,
> > +};
> > +
> > #ifdef CONFIG_CGROUP_MEM_RES_CTLR
> > /*
> > * All "charge" functions with gfp_mask should use GFP_KERNEL or
> > @@ -48,6 +58,8 @@ extern void mem_cgroup_cancel_charge_swapin(struct mem_cgroup *ptr);
> >
> > extern int mem_cgroup_cache_charge(struct page *page, struct mm_struct *mm,
> > gfp_t gfp_mask);
> > +extern void mem_cgroup_charge_dirty(struct page *page,
> > + enum zone_stat_item idx, int charge);
> > extern void mem_cgroup_add_lru_list(struct page *page, enum lru_list lru);
> > extern void mem_cgroup_del_lru_list(struct page *page, enum lru_list lru);
> > extern void mem_cgroup_rotate_lru_list(struct page *page, enum lru_list lru);
> > @@ -117,6 +129,10 @@ extern void mem_cgroup_print_oom_info(struct mem_cgroup *memcg,
> > extern int do_swap_account;
> > #endif
> >
> > +extern unsigned long mem_cgroup_dirty_bytes(void);
> > +
> > +extern u64 mem_cgroup_page_state(enum memcg_page_stat_item item);
> > +
> > static inline bool mem_cgroup_disabled(void)
> > {
> > if (mem_cgroup_subsys.disabled)
> > @@ -144,6 +160,11 @@ static inline int mem_cgroup_cache_charge(struct page *page,
> > return 0;
> > }
> >
> > +static inline void mem_cgroup_charge_dirty(struct page *page,
> > + enum zone_stat_item idx, int charge)
> > +{
> > +}
> > +
> > static inline int mem_cgroup_try_charge_swapin(struct mm_struct *mm,
> > struct page *page, gfp_t gfp_mask, struct mem_cgroup **ptr)
> > {
> > @@ -312,6 +333,16 @@ unsigned long mem_cgroup_soft_limit_reclaim(struct zone *zone, int order,
> > return 0;
> > }
> >
> > +static inline unsigned long mem_cgroup_dirty_bytes(void)
> > +{
> > + return vm_dirty_bytes;
> > +}
> > +
> > +static inline u64 mem_cgroup_page_state(enum memcg_page_stat_item item)
> > +{
> > + return 0;
> > +}
> > +
> > #endif /* CONFIG_CGROUP_MEM_CONT */
> >
> > #endif /* _LINUX_MEMCONTROL_H */
> > diff --git a/mm/memcontrol.c b/mm/memcontrol.c
> > index 954032b..288b9a4 100644
> > --- a/mm/memcontrol.c
> > +++ b/mm/memcontrol.c
> > @@ -64,13 +64,18 @@ enum mem_cgroup_stat_index {
> > /*
> > * For MEM_CONTAINER_TYPE_ALL, usage = pagecache + rss.
> > */
> > - MEM_CGROUP_STAT_CACHE, /* # of pages charged as cache */
> > + MEM_CGROUP_STAT_CACHE, /* # of pages charged as cache */
> > MEM_CGROUP_STAT_RSS, /* # of pages charged as anon rss */
> > MEM_CGROUP_STAT_FILE_MAPPED, /* # of pages charged as file rss */
> > MEM_CGROUP_STAT_PGPGIN_COUNT, /* # of pages paged in */
> > MEM_CGROUP_STAT_PGPGOUT_COUNT, /* # of pages paged out */
> > MEM_CGROUP_STAT_EVENTS, /* sum of pagein + pageout for internal use */
> > MEM_CGROUP_STAT_SWAPOUT, /* # of pages, swapped out */
> > + MEM_CGROUP_STAT_FILE_DIRTY, /* # of dirty pages in page cache */
> > + MEM_CGROUP_STAT_WRITEBACK, /* # of pages under writeback */
> > + MEM_CGROUP_STAT_WRITEBACK_TEMP, /* # of pages under writeback using
> > + temporary buffers */
> > + MEM_CGROUP_STAT_UNSTABLE_NFS, /* # of NFS unstable pages */
> >
> > MEM_CGROUP_STAT_NSTATS,
> > };
> > @@ -225,6 +230,9 @@ struct mem_cgroup {
> > /* set when res.limit == memsw.limit */
> > bool memsw_is_minimum;
> >
> > + /* control memory cgroup dirty pages */
> > + unsigned long dirty_bytes;
> > +
> > /*
> > * statistics. This must be placed at the end of memcg.
> > */
> > @@ -519,6 +527,67 @@ static void mem_cgroup_charge_statistics(struct mem_cgroup *mem,
> > put_cpu();
> > }
> >
> > +static struct mem_cgroup *get_mem_cgroup_from_page(struct page *page)
> > +{
> > + struct page_cgroup *pc;
> > + struct mem_cgroup *mem = NULL;
> > +
> > + pc = lookup_page_cgroup(page);
> > + if (unlikely(!pc))
> > + return NULL;
> > + lock_page_cgroup(pc);
> > + if (PageCgroupUsed(pc)) {
> > + mem = pc->mem_cgroup;
> > + if (mem)
> > + css_get(&mem->css);
> > + }
> > + unlock_page_cgroup(pc);
> > + return mem;
> > +}
> > +
> > +void mem_cgroup_charge_dirty(struct page *page,
> > + enum zone_stat_item idx, int charge)
> > +{
> > + struct mem_cgroup *mem;
> > + struct mem_cgroup_stat_cpu *cpustat;
> > + unsigned long flags;
> > + int cpu;
> > +
> > + if (mem_cgroup_disabled())
> > + return;
> > + /* Translate the zone_stat_item into a mem_cgroup_stat_index */
> > + switch (idx) {
> > + case NR_FILE_DIRTY:
> > + idx = MEM_CGROUP_STAT_FILE_DIRTY;
> > + break;
> > + case NR_WRITEBACK:
> > + idx = MEM_CGROUP_STAT_WRITEBACK;
> > + break;
> > + case NR_WRITEBACK_TEMP:
> > + idx = MEM_CGROUP_STAT_WRITEBACK_TEMP;
> > + break;
> > + case NR_UNSTABLE_NFS:
> > + idx = MEM_CGROUP_STAT_UNSTABLE_NFS;
> > + break;
> > + default:
> > + return;
> > + }
> > + /* Charge the memory cgroup statistics */
> > + mem = get_mem_cgroup_from_page(page);
> > + if (!mem) {
> > + mem = root_mem_cgroup;
> > + css_get(&mem->css);
> > + }
> > +
> > + local_irq_save(flags);
> > + cpu = get_cpu();
> > + cpustat = &mem->stat.cpustat[cpu];
> > + __mem_cgroup_stat_add_safe(cpustat, idx, charge);
> > + put_cpu();
> > + local_irq_restore(flags);
> > + css_put(&mem->css);
> > +}
> > +
>
> We seem to be doing the same operation that the existing
> "mem_cgroup_update_file_mapped" function does to update some stats. Can
> we just reuse that? We can probably create one core function which takes
> the index of the stat to update, and update_file_mapped and the other
> variants for memcg dirty ratio can make use of it.
>
> In fact, having a single function charge_dirty() account for WRITEBACK
> as well as other states like UNSTABLE_NFS is not very intuitive.
> Maybe we can have individual functions.
>
> mem_cgroup_update_dirty()
> mem_cgroup_update_writeback()
> mem_cgroup_update_unstable_nfs() etc.
Right. I like it. We can extend this function or provide separate
functions to account for each stat.
Thanks!
-Andrea
next prev parent reply other threads:[~2010-02-23 9:27 UTC|newest]
Thread overview: 104+ messages / expand[flat|nested] mbox.gz Atom feed top
2010-02-21 15:18 [RFC] [PATCH 0/2] memcg: per cgroup dirty limit Andrea Righi
2010-02-21 15:18 ` [PATCH 1/2] memcg: dirty pages accounting and limiting infrastructure Andrea Righi
2010-02-21 21:28 ` David Rientjes
2010-02-21 22:17 ` Andrea Righi
2010-02-22 18:07 ` Vivek Goyal
2010-02-22 18:07 ` Vivek Goyal
[not found] ` <20100222180732.GC3096-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-23 11:58 ` Andrea Righi
2010-02-23 11:58 ` Andrea Righi
2010-02-25 15:36 ` Minchan Kim
2010-02-26 0:23 ` KAMEZAWA Hiroyuki
[not found] ` <20100226092339.1f639cbf.kamezawa.hiroyu-+CUm20s59erQFUHtdCDX3A@public.gmane.org>
2010-02-26 4:50 ` Minchan Kim
2010-02-26 4:50 ` Minchan Kim
2010-02-26 5:01 ` KAMEZAWA Hiroyuki
[not found] ` <20100226140135.23c32a8d.kamezawa.hiroyu-+CUm20s59erQFUHtdCDX3A@public.gmane.org>
2010-02-26 5:53 ` Minchan Kim
2010-02-26 5:53 ` Minchan Kim
[not found] ` <28c262361002252153s587b70ecxf89eda9a642e527c-JsoAwUIsXosN+BqQ9rBEUg@public.gmane.org>
2010-02-26 6:15 ` KAMEZAWA Hiroyuki
2010-02-26 6:15 ` KAMEZAWA Hiroyuki
[not found] ` <20100226151506.c78b4312.kamezawa.hiroyu-+CUm20s59erQFUHtdCDX3A@public.gmane.org>
2010-02-26 6:35 ` Minchan Kim
2010-02-26 6:35 ` Minchan Kim
[not found] ` <28c262361002252050r29f54ea2u6c6e87f1f702d195-JsoAwUIsXosN+BqQ9rBEUg@public.gmane.org>
2010-02-26 5:01 ` KAMEZAWA Hiroyuki
[not found] ` <28c262361002250736k57543379j8291e0dfb8df194e-JsoAwUIsXosN+BqQ9rBEUg@public.gmane.org>
2010-02-26 0:23 ` KAMEZAWA Hiroyuki
2010-02-25 15:36 ` Minchan Kim
[not found] ` <1266765525-30890-2-git-send-email-arighi-vWjgImWzx8FBDgjK7y7TUQ@public.gmane.org>
2010-02-22 0:22 ` KAMEZAWA Hiroyuki
2010-02-22 15:58 ` Vivek Goyal
2010-02-22 16:14 ` Balbir Singh
2010-02-22 0:22 ` KAMEZAWA Hiroyuki
2010-02-22 18:00 ` Andrea Righi
2010-02-22 21:21 ` David Rientjes
2010-02-22 21:21 ` David Rientjes
[not found] ` <20100222092242.98df82e4.kamezawa.hiroyu-+CUm20s59erQFUHtdCDX3A@public.gmane.org>
2010-02-22 18:00 ` Andrea Righi
2010-02-22 19:31 ` Vivek Goyal
[not found] ` <20100222193113.GE3096-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-23 9:58 ` Andrea Righi
2010-02-23 9:58 ` Andrea Righi
2010-02-22 15:58 ` Vivek Goyal
2010-02-22 17:29 ` Balbir Singh
[not found] ` <20100222155840.GC13823-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-22 17:29 ` Balbir Singh
2010-02-23 9:26 ` Andrea Righi
2010-02-23 9:26 ` Andrea Righi [this message]
2010-02-22 16:14 ` Balbir Singh
[not found] ` <20100222161442.GE3063-SINUvgVNF2CyUtPGxGje5AC/G2K4zDHf@public.gmane.org>
2010-02-23 9:28 ` Andrea Righi
2010-02-23 9:28 ` Andrea Righi
2010-02-24 0:09 ` KAMEZAWA Hiroyuki
2010-02-24 0:09 ` KAMEZAWA Hiroyuki
2010-02-21 15:18 ` [PATCH 2/2] memcg: dirty pages instrumentation Andrea Righi
2010-02-21 21:38 ` David Rientjes
2010-02-21 22:33 ` Andrea Righi
[not found] ` <1266765525-30890-3-git-send-email-arighi-vWjgImWzx8FBDgjK7y7TUQ@public.gmane.org>
2010-02-22 0:32 ` KAMEZAWA Hiroyuki
2010-02-22 16:52 ` Vivek Goyal
2010-02-22 18:20 ` Peter Zijlstra
2010-02-23 21:29 ` Vivek Goyal
2010-02-22 0:32 ` KAMEZAWA Hiroyuki
2010-02-22 17:57 ` Andrea Righi
[not found] ` <20100222093221.eaaff1b4.kamezawa.hiroyu-+CUm20s59erQFUHtdCDX3A@public.gmane.org>
2010-02-22 17:57 ` Andrea Righi
2010-02-22 16:52 ` Vivek Goyal
2010-02-23 9:40 ` Andrea Righi
2010-02-23 9:45 ` Andrea Righi
2010-02-23 9:45 ` Andrea Righi
2010-02-23 19:56 ` Vivek Goyal
[not found] ` <20100223195606.GD11930-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-23 22:22 ` David Rientjes
2010-02-23 22:22 ` David Rientjes
2010-02-25 14:34 ` Andrea Righi
2010-02-26 0:14 ` KAMEZAWA Hiroyuki
2010-02-26 0:14 ` KAMEZAWA Hiroyuki
[not found] ` <alpine.DEB.2.00.1002231419450.8693-X6Q0R45D7oAcqpCFd4KODRPsWskHk0ljAL8bYrjMMd8@public.gmane.org>
2010-02-25 14:34 ` Andrea Righi
2010-02-23 19:56 ` Vivek Goyal
[not found] ` <20100222165215.GA3096-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-23 9:40 ` Andrea Righi
2010-02-22 18:20 ` Peter Zijlstra
2010-02-23 9:46 ` Andrea Righi
2010-02-23 9:46 ` Andrea Righi
2010-02-23 21:29 ` Vivek Goyal
2010-02-25 15:12 ` Andrea Righi
2010-02-26 21:48 ` Vivek Goyal
2010-02-26 22:21 ` Andrea Righi
2010-02-26 22:28 ` Vivek Goyal
2010-02-26 22:28 ` Vivek Goyal
[not found] ` <20100226214811.GB7498-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-26 22:21 ` Andrea Righi
2010-03-01 0:47 ` KAMEZAWA Hiroyuki
2010-03-01 0:47 ` KAMEZAWA Hiroyuki
2010-02-26 21:48 ` Vivek Goyal
[not found] ` <20100223212943.GF11930-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-25 15:12 ` Andrea Righi
[not found] ` <1266765525-30890-1-git-send-email-arighi-vWjgImWzx8FBDgjK7y7TUQ@public.gmane.org>
2010-02-21 23:48 ` [RFC] [PATCH 0/2] memcg: per cgroup dirty limit KAMEZAWA Hiroyuki
2010-02-21 23:48 ` KAMEZAWA Hiroyuki
2010-02-22 14:27 ` Vivek Goyal
2010-02-22 14:27 ` Vivek Goyal
2010-02-22 17:36 ` Balbir Singh
[not found] ` <20100222173640.GG3063-SINUvgVNF2CyUtPGxGje5AC/G2K4zDHf@public.gmane.org>
2010-02-22 17:58 ` Vivek Goyal
2010-02-22 17:58 ` Vivek Goyal
2010-02-23 0:07 ` KAMEZAWA Hiroyuki
2010-02-23 15:12 ` Vivek Goyal
2010-02-24 0:19 ` KAMEZAWA Hiroyuki
[not found] ` <20100223151201.GB11930-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-24 0:19 ` KAMEZAWA Hiroyuki
[not found] ` <20100223090704.839d8bef.kamezawa.hiroyu-+CUm20s59erQFUHtdCDX3A@public.gmane.org>
2010-02-23 15:12 ` Vivek Goyal
[not found] ` <20100222175833.GB3096-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-23 0:07 ` KAMEZAWA Hiroyuki
2010-02-22 18:12 ` Andrea Righi
2010-02-22 18:29 ` Vivek Goyal
2010-02-22 18:29 ` Vivek Goyal
2010-02-22 21:15 ` David Rientjes
[not found] ` <20100222182934.GD3096-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-22 21:15 ` David Rientjes
2010-02-23 9:55 ` Andrea Righi
2010-02-23 9:55 ` Andrea Righi
2010-02-23 20:01 ` Vivek Goyal
2010-02-23 20:01 ` Vivek Goyal
[not found] ` <20100222142744.GB13823-H+wXaHxf7aLQT0dZR+AlfA@public.gmane.org>
2010-02-22 17:36 ` Balbir Singh
2010-02-22 18:12 ` Andrea Righi
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20100223092658.GA1882@linux \
--to=arighi@develer.com \
--cc=akpm@linux-foundation.org \
--cc=balbir@linux.vnet.ibm.com \
--cc=containers@lists.linux-foundation.org \
--cc=kamezawa.hiroyu@jp.fujitsu.com \
--cc=linux-kernel@vger.kernel.org \
--cc=suleiman@google.com \
--cc=vgoyal@redhat.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.