From: Li Zhong <lizhongfs@gmail.com>
To: Glauber Costa <glommer@openvz.org>
Cc: akpm@linux-foundation.org, linux-fsdevel@vger.kernel.org,
mgorman@suse.de, david@fromorbit.com, linux-mm@kvack.org,
cgroups@vger.kernel.org, kamezawa.hiroyu@jp.fujitsu.com,
mhocko@suze.cz, hannes@cmpxchg.org, hughd@google.com,
gthelen@google.com, Dave Chinner <dchinner@redhat.com>
Subject: Re: [PATCH v11 25/25] list_lru: dynamically adjust node arrays
Date: Tue, 18 Jun 2013 17:42:01 +0800 [thread overview]
Message-ID: <1371548521.2984.6.camel@ThinkPad-T5421> (raw)
In-Reply-To: <1370550898-26711-26-git-send-email-glommer@openvz.org>
On Fri, 2013-06-07 at 00:34 +0400, Glauber Costa wrote:
> We currently use a compile-time constant to size the node array for the
> list_lru structure. Due to this, we don't need to allocate any memory at
> initialization time. But as a consequence, the structures that contain
> embedded list_lru lists can become way too big (the superblock for
> instance contains two of them).
>
> This patch aims at ameliorating this situation by dynamically allocating
> the node arrays with the firmware provided nr_node_ids.
>
> Signed-off-by: Glauber Costa <glommer@openvz.org>
> Cc: Dave Chinner <dchinner@redhat.com>
> Cc: Mel Gorman <mgorman@suse.de>
> ---
> fs/super.c | 11 +++++++++--
> fs/xfs/xfs_buf.c | 6 +++++-
> fs/xfs/xfs_qm.c | 10 ++++++++--
> include/linux/list_lru.h | 13 ++-----------
> mm/list_lru.c | 14 +++++++++++++-
> 5 files changed, 37 insertions(+), 17 deletions(-)
>
> diff --git a/fs/super.c b/fs/super.c
> index 85a6104..1b6ef7b 100644
> --- a/fs/super.c
> +++ b/fs/super.c
> @@ -199,8 +199,12 @@ static struct super_block *alloc_super(struct file_system_type *type, int flags)
> INIT_HLIST_NODE(&s->s_instances);
> INIT_HLIST_BL_HEAD(&s->s_anon);
> INIT_LIST_HEAD(&s->s_inodes);
> - list_lru_init(&s->s_dentry_lru);
> - list_lru_init(&s->s_inode_lru);
> +
> + if (list_lru_init(&s->s_dentry_lru))
> + goto err_out;
> + if (list_lru_init(&s->s_inode_lru))
> + goto err_out_dentry_lru;
> +
> INIT_LIST_HEAD(&s->s_mounts);
> init_rwsem(&s->s_umount);
> lockdep_set_class(&s->s_umount, &type->s_umount_key);
> @@ -240,6 +244,9 @@ static struct super_block *alloc_super(struct file_system_type *type, int flags)
> }
> out:
> return s;
> +
> +err_out_dentry_lru:
> + list_lru_destroy(&s->s_dentry_lru);
> err_out:
> security_sb_free(s);
> #ifdef CONFIG_SMP
It seems we also need to call list_lru_destroy() in destroy_super(),
as shown below:
-----------
diff --git a/fs/super.c b/fs/super.c
index b79e732..06ee3af 100644
--- a/fs/super.c
+++ b/fs/super.c
@@ -269,6 +269,8 @@ err_out:
*/
static inline void destroy_super(struct super_block *s)
{
+ list_lru_destroy(&s->s_inode_lru);
+ list_lru_destroy(&s->s_dentry_lru);
#ifdef CONFIG_SMP
free_percpu(s->s_files);
#endif
-----------
Thanks, Zhong
> diff --git a/fs/xfs/xfs_buf.c b/fs/xfs/xfs_buf.c
> index c3f8ea9..9c2b656 100644
> --- a/fs/xfs/xfs_buf.c
> +++ b/fs/xfs/xfs_buf.c
> @@ -1591,6 +1591,7 @@ xfs_free_buftarg(
> struct xfs_mount *mp,
> struct xfs_buftarg *btp)
> {
> + list_lru_destroy(&btp->bt_lru);
> unregister_shrinker(&btp->bt_shrinker);
>
> if (mp->m_flags & XFS_MOUNT_BARRIER)
> @@ -1665,9 +1666,12 @@ xfs_alloc_buftarg(
> if (!btp->bt_bdi)
> goto error;
>
> - list_lru_init(&btp->bt_lru);
> if (xfs_setsize_buftarg_early(btp, bdev))
> goto error;
> +
> + if (list_lru_init(&btp->bt_lru))
> + goto error;
> +
> btp->bt_shrinker.count_objects = xfs_buftarg_shrink_count;
> btp->bt_shrinker.scan_objects = xfs_buftarg_shrink_scan;
> btp->bt_shrinker.seeks = DEFAULT_SEEKS;
> diff --git a/fs/xfs/xfs_qm.c b/fs/xfs/xfs_qm.c
> index bd6c12a..b840000 100644
> --- a/fs/xfs/xfs_qm.c
> +++ b/fs/xfs/xfs_qm.c
> @@ -781,11 +781,18 @@ xfs_qm_init_quotainfo(
>
> qinf = mp->m_quotainfo = kmem_zalloc(sizeof(xfs_quotainfo_t), KM_SLEEP);
>
> + if ((error = list_lru_init(&qinf->qi_lru))) {
> + kmem_free(qinf);
> + mp->m_quotainfo = NULL;
> + return error;
> + }
> +
> /*
> * See if quotainodes are setup, and if not, allocate them,
> * and change the superblock accordingly.
> */
> if ((error = xfs_qm_init_quotainos(mp))) {
> + list_lru_destroy(&qinf->qi_lru);
> kmem_free(qinf);
> mp->m_quotainfo = NULL;
> return error;
> @@ -795,8 +802,6 @@ xfs_qm_init_quotainfo(
> INIT_RADIX_TREE(&qinf->qi_gquota_tree, GFP_NOFS);
> mutex_init(&qinf->qi_tree_lock);
>
> - list_lru_init(&qinf->qi_lru);
> -
> /* mutex used to serialize quotaoffs */
> mutex_init(&qinf->qi_quotaofflock);
>
> @@ -884,6 +889,7 @@ xfs_qm_destroy_quotainfo(
> qi = mp->m_quotainfo;
> ASSERT(qi != NULL);
>
> + list_lru_destroy(&qi->qi_lru);
> unregister_shrinker(&qi->qi_shrinker);
>
> if (qi->qi_uquotaip) {
> diff --git a/include/linux/list_lru.h b/include/linux/list_lru.h
> index 2fe13e1..ff57503 100644
> --- a/include/linux/list_lru.h
> +++ b/include/linux/list_lru.h
> @@ -27,20 +27,11 @@ struct list_lru_node {
> } ____cacheline_aligned_in_smp;
>
> struct list_lru {
> - /*
> - * Because we use a fixed-size array, this struct can be very big if
> - * MAX_NUMNODES is big. If this becomes a problem this is fixable by
> - * turning this into a pointer and dynamically allocating this to
> - * nr_node_ids. This quantity is firwmare-provided, and still would
> - * provide room for all nodes at the cost of a pointer lookup and an
> - * extra allocation. Because that allocation will most likely come from
> - * a different slab cache than the main structure holding this
> - * structure, we may very well fail.
> - */
> - struct list_lru_node node[MAX_NUMNODES];
> + struct list_lru_node *node;
> nodemask_t active_nodes;
> };
>
> +void list_lru_destroy(struct list_lru *lru);
> int list_lru_init(struct list_lru *lru);
>
> /**
> diff --git a/mm/list_lru.c b/mm/list_lru.c
> index 2822817..700d322 100644
> --- a/mm/list_lru.c
> +++ b/mm/list_lru.c
> @@ -8,6 +8,7 @@
> #include <linux/module.h>
> #include <linux/mm.h>
> #include <linux/list_lru.h>
> +#include <linux/slab.h>
>
> bool list_lru_add(struct list_lru *lru, struct list_head *item)
> {
> @@ -162,9 +163,14 @@ unsigned long list_lru_dispose_all(struct list_lru *lru,
> int list_lru_init(struct list_lru *lru)
> {
> int i;
> + size_t size = sizeof(*lru->node) * nr_node_ids;
> +
> + lru->node = kzalloc(size, GFP_KERNEL);
> + if (!lru->node)
> + return -ENOMEM;
>
> nodes_clear(lru->active_nodes);
> - for (i = 0; i < MAX_NUMNODES; i++) {
> + for (i = 0; i < nr_node_ids; i++) {
> spin_lock_init(&lru->node[i].lock);
> INIT_LIST_HEAD(&lru->node[i].list);
> lru->node[i].nr_items = 0;
> @@ -172,3 +178,9 @@ int list_lru_init(struct list_lru *lru)
> return 0;
> }
> EXPORT_SYMBOL_GPL(list_lru_init);
> +
> +void list_lru_destroy(struct list_lru *lru)
> +{
> + kfree(lru->node);
> +}
> +EXPORT_SYMBOL_GPL(list_lru_destroy);
--
To unsubscribe, send a message with 'unsubscribe linux-mm' in
the body to majordomo@kvack.org. For more info on Linux MM,
see: http://www.linux-mm.org/ .
Don't email: <a href=mailto:"dont@kvack.org"> email@kvack.org </a>
next prev parent reply other threads:[~2013-06-18 9:42 UTC|newest]
Thread overview: 41+ messages / expand[flat|nested] mbox.gz Atom feed top
2013-06-06 20:34 [PATCH v11 00/25] shrinkers rework: per-numa, generic lists, etc Glauber Costa
2013-06-06 20:34 ` [PATCH v11 02/25] super: fix calculation of shrinkable objects for small numbers Glauber Costa
[not found] ` <1370550898-26711-1-git-send-email-glommer-GEFAQzZX7r8dnm+yROfE0A@public.gmane.org>
2013-06-06 20:34 ` [PATCH v11 01/25] fs: bump inode and dentry counters to long Glauber Costa
2013-06-06 20:34 ` [PATCH v11 03/25] dcache: convert dentry_stat.nr_unused to per-cpu counters Glauber Costa
2013-06-06 20:34 ` [PATCH v11 04/25] dentry: move to per-sb LRU locks Glauber Costa
2013-06-06 20:34 ` [PATCH v11 05/25] dcache: remove dentries from LRU before putting on dispose list Glauber Costa
2013-06-06 20:34 ` [PATCH v11 06/25] mm: new shrinker API Glauber Costa
2013-06-06 20:34 ` [PATCH v11 07/25] shrinker: convert superblock shrinkers to new API Glauber Costa
2013-06-06 20:34 ` [PATCH v11 08/25] list: add a new LRU list type Glauber Costa
2013-06-06 20:34 ` [PATCH v11 09/25] inode: convert inode lru list to generic lru list code Glauber Costa
2013-06-06 20:34 ` [PATCH v11 10/25] dcache: convert to use new lru list infrastructure Glauber Costa
2013-06-06 20:34 ` [PATCH v11 11/25] list_lru: per-node " Glauber Costa
2013-06-06 20:34 ` [PATCH v11 12/25] list_lru: per-node API Glauber Costa
2013-06-06 20:34 ` [PATCH v11 13/25] shrinker: add node awareness Glauber Costa
2013-06-06 20:34 ` [PATCH v11 14/25] vmscan: per-node deferred work Glauber Costa
2013-06-06 20:34 ` [PATCH v11 15/25] fs: convert inode and dentry shrinking to be node aware Glauber Costa
2013-06-06 20:34 ` [PATCH v11 16/25] xfs: convert buftarg LRU to generic code Glauber Costa
2013-06-06 20:34 ` [PATCH v11 17/25] xfs: rework buffer dispose list tracking Glauber Costa
2013-06-06 20:34 ` [PATCH v11 18/25] xfs: convert dquot cache lru to list_lru Glauber Costa
2013-06-06 20:34 ` [PATCH v11 21/25] i915: bail out earlier when shrinker cannot acquire mutex Glauber Costa
2013-06-06 20:34 ` [PATCH v11 23/25] hugepage: convert huge zero page shrinker to new shrinker API Glauber Costa
2013-06-06 20:34 ` [PATCH v11 24/25] shrinker: Kill old ->shrink API Glauber Costa
2013-06-06 20:34 ` [PATCH v11 25/25] list_lru: dynamically adjust node arrays Glauber Costa
2013-06-18 9:42 ` Li Zhong [this message]
2013-06-19 7:31 ` Glauber Costa
2013-06-19 9:12 ` Li Zhong
2013-06-19 13:29 ` Glauber Costa
2013-06-19 17:14 ` Andrew Morton
2013-06-20 0:50 ` Li Zhong
2013-06-20 1:35 ` Li Zhong
2013-06-20 2:37 ` Dave Chinner
2013-06-06 21:15 ` [PATCH v11 00/25] shrinkers rework: per-numa, generic lists, etc Andrew Morton
2013-06-07 6:11 ` Glauber Costa
[not found] ` <51B1797D.3010209-bzQdu9zFT3WakBO8gow8eQ@public.gmane.org>
2013-06-07 7:08 ` Glauber Costa
2013-06-07 8:04 ` Glauber Costa
2013-06-06 20:34 ` [PATCH v11 19/25] fs: convert fs shrinkers to new scan/count API Glauber Costa
2013-06-06 20:34 ` [PATCH v11 20/25] drivers: convert shrinkers to new count/scan API Glauber Costa
2013-06-07 14:10 ` Konrad Rzeszutek Wilk
2013-06-09 12:02 ` Glauber Costa
2013-06-06 20:34 ` [PATCH v11 22/25] shrinker: convert remaining shrinkers to " Glauber Costa
2013-06-06 22:31 ` Andrew Morton
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=1371548521.2984.6.camel@ThinkPad-T5421 \
--to=lizhongfs@gmail.com \
--cc=akpm@linux-foundation.org \
--cc=cgroups@vger.kernel.org \
--cc=david@fromorbit.com \
--cc=dchinner@redhat.com \
--cc=glommer@openvz.org \
--cc=gthelen@google.com \
--cc=hannes@cmpxchg.org \
--cc=hughd@google.com \
--cc=kamezawa.hiroyu@jp.fujitsu.com \
--cc=linux-fsdevel@vger.kernel.org \
--cc=linux-mm@kvack.org \
--cc=mgorman@suse.de \
--cc=mhocko@suze.cz \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).