Re: [patch 3/3] mm: vmscan: clean up struct scan_control

linux-mm.kvack.org archive mirror
 help / color / mirror / Atom feed

From: Hugh Dickins <hughd@google.com>
To: Johannes Weiner <hannes@cmpxchg.org>
Cc: Andrew Morton <akpm@linux-foundation.org>,
	Mel Gorman <mgorman@suse.de>, Michal Hocko <mhocko@suse.cz>,
	Minchan Kim <minchan.kim@gmail.com>,
	Rik van Riel <riel@redhat.com>,
	linux-mm@kvack.org, linux-kernel@vger.kernel.org
Subject: Re: [patch 3/3] mm: vmscan: clean up struct scan_control
Date: Mon, 14 Jul 2014 12:46:21 -0700 (PDT)	[thread overview]
Message-ID: <alpine.LSU.2.11.1407141240200.17669@eggly.anvils> (raw)
In-Reply-To: <1405344049-19868-4-git-send-email-hannes@cmpxchg.org>

On Mon, 14 Jul 2014, Johannes Weiner wrote:

> Reorder the members by input and output, then turn the individual
> integers for may_writepage, may_unmap, may_swap, compaction_ready,
> hibernation_mode into flags that fit into a single integer.
> 
> Stack delta: +72/-296 -224                   old     new   delta
> kswapd                                       104     176     +72
> try_to_free_pages                             80      56     -24
> try_to_free_mem_cgroup_pages                  80      56     -24
> shrink_all_memory                             88      64     -24
> reclaim_clean_pages_from_list                168     144     -24
> mem_cgroup_shrink_node_zone                  104      80     -24
> __zone_reclaim                               176     152     -24
> balance_pgdat                                152       -    -152
> 
>    text    data     bss     dec     hex filename
>   38151    5641      16   43808    ab20 mm/vmscan.o.old
>   38047    5641      16   43704    aab8 mm/vmscan.o
> 
> Suggested-by: Mel Gorman <mgorman@suse.de>
> Signed-off-by: Johannes Weiner <hannes@cmpxchg.org>
> ---
>  mm/vmscan.c | 158 ++++++++++++++++++++++++++++++------------------------------
>  1 file changed, 78 insertions(+), 80 deletions(-)
> 
> diff --git a/mm/vmscan.c b/mm/vmscan.c
> index c28b8981e56a..73d8e69ff3eb 100644
> --- a/mm/vmscan.c
> +++ b/mm/vmscan.c
> @@ -58,36 +58,28 @@
>  #define CREATE_TRACE_POINTS
>  #include <trace/events/vmscan.h>
>  
> -struct scan_control {
> -	/* Incremented by the number of inactive pages that were scanned */
> -	unsigned long nr_scanned;
> -
> -	/* Number of pages freed so far during a call to shrink_zones() */
> -	unsigned long nr_reclaimed;
> -
> -	/* One of the zones is ready for compaction */
> -	int compaction_ready;
> +/* Scan control flags */
> +#define MAY_WRITEPAGE		0x1
> +#define MAY_UNMAP		0x2
> +#define MAY_SWAP		0x4
> +#define MAY_SKIP_CONGESTION	0x8
> +#define COMPACTION_READY	0x10
>  
> +struct scan_control {
>  	/* How many pages shrink_list() should reclaim */
>  	unsigned long nr_to_reclaim;
>  
> -	unsigned long hibernation_mode;
> -
>  	/* This context's GFP mask */
>  	gfp_t gfp_mask;
>  
> -	int may_writepage;
> -
> -	/* Can mapped pages be reclaimed? */
> -	int may_unmap;
> -
> -	/* Can pages be swapped as part of reclaim? */
> -	int may_swap;
> -
> +	/* Allocation order */
>  	int order;
>  
> -	/* Scan (total_size >> priority) pages at once */
> -	int priority;
> +	/*
> +	 * Nodemask of nodes allowed by the caller. If NULL, all nodes
> +	 * are scanned.
> +	 */
> +	nodemask_t	*nodemask;
>  
>  	/*
>  	 * The memory cgroup that hit its limit and as a result is the
> @@ -95,11 +87,17 @@ struct scan_control {
>  	 */
>  	struct mem_cgroup *target_mem_cgroup;
>  
> -	/*
> -	 * Nodemask of nodes allowed by the caller. If NULL, all nodes
> -	 * are scanned.
> -	 */
> -	nodemask_t	*nodemask;
> +	/* Scan (total_size >> priority) pages at once */
> +	int priority;
> +
> +	/* Scan control flags; see above */
> +	unsigned int flags;

This seems to result in a fair amount of unnecessary churn.
Why not just put may_writepage etc. into an unsigned int bitfield?
Then you get the saving without changing all the rest of the code.

Hugh

> +
> +	/* Incremented by the number of inactive pages that were scanned */
> +	unsigned long nr_scanned;
> +
> +	/* Number of pages freed so far during a call to shrink_zones() */
> +	unsigned long nr_reclaimed;
>  };
>  
>  #define lru_to_page(_head) (list_entry((_head)->prev, struct page, lru))
> @@ -840,7 +838,7 @@ static unsigned long shrink_page_list(struct list_head *page_list,
>  		if (unlikely(!page_evictable(page)))
>  			goto cull_mlocked;
>  
> -		if (!sc->may_unmap && page_mapped(page))
> +		if (!(sc->flags & MAY_UNMAP) && page_mapped(page))
>  			goto keep_locked;
>  
>  		/* Double the slab pressure for mapped and swapcache pages */
> @@ -1014,7 +1012,7 @@ static unsigned long shrink_page_list(struct list_head *page_list,
>  				goto keep_locked;
>  			if (!may_enter_fs)
>  				goto keep_locked;
> -			if (!sc->may_writepage)
> +			if (!(sc->flags & MAY_WRITEPAGE))
>  				goto keep_locked;
>  
>  			/* Page is dirty, try to write it out here */
> @@ -1146,7 +1144,7 @@ unsigned long reclaim_clean_pages_from_list(struct zone *zone,
>  	struct scan_control sc = {
>  		.gfp_mask = GFP_KERNEL,
>  		.priority = DEF_PRIORITY,
> -		.may_unmap = 1,
> +		.flags = MAY_UNMAP,
>  	};
>  	unsigned long ret, dummy1, dummy2, dummy3, dummy4, dummy5;
>  	struct page *page, *next;
> @@ -1489,9 +1487,9 @@ shrink_inactive_list(unsigned long nr_to_scan, struct lruvec *lruvec,
>  
>  	lru_add_drain();
>  
> -	if (!sc->may_unmap)
> +	if (!(sc->flags & MAY_UNMAP))
>  		isolate_mode |= ISOLATE_UNMAPPED;
> -	if (!sc->may_writepage)
> +	if (!(sc->flags & MAY_WRITEPAGE))
>  		isolate_mode |= ISOLATE_CLEAN;
>  
>  	spin_lock_irq(&zone->lru_lock);
> @@ -1593,7 +1591,7 @@ shrink_inactive_list(unsigned long nr_to_scan, struct lruvec *lruvec,
>  	 * is congested. Allow kswapd to continue until it starts encountering
>  	 * unqueued dirty pages or cycling through the LRU too quickly.
>  	 */
> -	if (!sc->hibernation_mode && !current_is_kswapd() &&
> +	if (!(sc->flags & MAY_SKIP_CONGESTION) && !current_is_kswapd() &&
>  	    current_may_throttle())
>  		wait_iff_congested(zone, BLK_RW_ASYNC, HZ/10);
>  
> @@ -1683,9 +1681,9 @@ static void shrink_active_list(unsigned long nr_to_scan,
>  
>  	lru_add_drain();
>  
> -	if (!sc->may_unmap)
> +	if (!(sc->flags & MAY_UNMAP))
>  		isolate_mode |= ISOLATE_UNMAPPED;
> -	if (!sc->may_writepage)
> +	if (!(sc->flags & MAY_WRITEPAGE))
>  		isolate_mode |= ISOLATE_CLEAN;
>  
>  	spin_lock_irq(&zone->lru_lock);
> @@ -1897,7 +1895,7 @@ static void get_scan_count(struct lruvec *lruvec, int swappiness,
>  		force_scan = true;
>  
>  	/* If we have no swap space, do not bother scanning anon pages. */
> -	if (!sc->may_swap || (get_nr_swap_pages() <= 0)) {
> +	if (!(sc->flags & MAY_SWAP) || (get_nr_swap_pages() <= 0)) {
>  		scan_balance = SCAN_FILE;
>  		goto out;
>  	}
> @@ -2406,7 +2404,7 @@ static bool shrink_zones(struct zonelist *zonelist, struct scan_control *sc)
>  			    sc->order > PAGE_ALLOC_COSTLY_ORDER &&
>  			    zonelist_zone_idx(z) <= requested_highidx &&
>  			    compaction_ready(zone, sc->order)) {
> -				sc->compaction_ready = true;
> +				sc->flags |= COMPACTION_READY;
>  				continue;
>  			}
>  
> @@ -2496,7 +2494,7 @@ static unsigned long do_try_to_free_pages(struct zonelist *zonelist,
>  		if (sc->nr_reclaimed >= sc->nr_to_reclaim)
>  			break;
>  
> -		if (sc->compaction_ready)
> +		if (sc->flags & COMPACTION_READY)
>  			break;
>  
>  		/*
> @@ -2504,7 +2502,7 @@ static unsigned long do_try_to_free_pages(struct zonelist *zonelist,
>  		 * writepage even in laptop mode.
>  		 */
>  		if (sc->priority < DEF_PRIORITY - 2)
> -			sc->may_writepage = 1;
> +			sc->flags |= MAY_WRITEPAGE;
>  
>  		/*
>  		 * Try to write back as many pages as we just scanned.  This
> @@ -2517,7 +2515,7 @@ static unsigned long do_try_to_free_pages(struct zonelist *zonelist,
>  		if (total_scanned > writeback_threshold) {
>  			wakeup_flusher_threads(laptop_mode ? 0 : total_scanned,
>  						WB_REASON_TRY_TO_FREE_PAGES);
> -			sc->may_writepage = 1;
> +			sc->flags |= MAY_WRITEPAGE;
>  		}
>  	} while (--sc->priority >= 0);
>  
> @@ -2527,7 +2525,7 @@ static unsigned long do_try_to_free_pages(struct zonelist *zonelist,
>  		return sc->nr_reclaimed;
>  
>  	/* Aborted reclaim to try compaction? don't OOM, then */
> -	if (sc->compaction_ready)
> +	if (sc->flags & COMPACTION_READY)
>  		return 1;
>  
>  	/* Any of the zones still reclaimable?  Don't OOM. */
> @@ -2668,17 +2666,17 @@ unsigned long try_to_free_pages(struct zonelist *zonelist, int order,
>  {
>  	unsigned long nr_reclaimed;
>  	struct scan_control sc = {
> -		.gfp_mask = (gfp_mask = memalloc_noio_flags(gfp_mask)),
> -		.may_writepage = !laptop_mode,
>  		.nr_to_reclaim = SWAP_CLUSTER_MAX,
> -		.may_unmap = 1,
> -		.may_swap = 1,
> +		.gfp_mask = (gfp_mask = memalloc_noio_flags(gfp_mask)),
>  		.order = order,
> -		.priority = DEF_PRIORITY,
> -		.target_mem_cgroup = NULL,
>  		.nodemask = nodemask,
> +		.priority = DEF_PRIORITY,
> +		.flags = MAY_UNMAP | MAY_SWAP,
>  	};
>  
> +	if (!laptop_mode)
> +		sc.flags |= MAY_WRITEPAGE;
> +
>  	/*
>  	 * Do not enter reclaim if fatal signal was delivered while throttled.
>  	 * 1 is returned so that the page allocator does not OOM kill at this
> @@ -2688,7 +2686,7 @@ unsigned long try_to_free_pages(struct zonelist *zonelist, int order,
>  		return 1;
>  
>  	trace_mm_vmscan_direct_reclaim_begin(order,
> -				sc.may_writepage,
> +				sc.flags & MAY_WRITEPAGE,
>  				gfp_mask);
>  
>  	nr_reclaimed = do_try_to_free_pages(zonelist, &sc);
> @@ -2706,23 +2704,22 @@ unsigned long mem_cgroup_shrink_node_zone(struct mem_cgroup *memcg,
>  						unsigned long *nr_scanned)
>  {
>  	struct scan_control sc = {
> -		.nr_scanned = 0,
>  		.nr_to_reclaim = SWAP_CLUSTER_MAX,
> -		.may_writepage = !laptop_mode,
> -		.may_unmap = 1,
> -		.may_swap = !noswap,
> -		.order = 0,
> -		.priority = 0,
> +		.gfp_mask = (gfp_mask & GFP_RECLAIM_MASK) |
> +		            (GFP_HIGHUSER_MOVABLE & ~GFP_RECLAIM_MASK),
>  		.target_mem_cgroup = memcg,
> +		.flags = MAY_UNMAP,
>  	};
>  	struct lruvec *lruvec = mem_cgroup_zone_lruvec(zone, memcg);
>  	int swappiness = mem_cgroup_swappiness(memcg);
>  
> -	sc.gfp_mask = (gfp_mask & GFP_RECLAIM_MASK) |
> -			(GFP_HIGHUSER_MOVABLE & ~GFP_RECLAIM_MASK);
> +	if (!laptop_mode)
> +		sc.flags |= MAY_WRITEPAGE;
> +	if (!noswap)
> +		sc.flags |= MAY_SWAP;
>  
>  	trace_mm_vmscan_memcg_softlimit_reclaim_begin(sc.order,
> -						      sc.may_writepage,
> +						      sc.flags & MAY_WRITEPAGE,
>  						      sc.gfp_mask);
>  
>  	/*
> @@ -2748,18 +2745,19 @@ unsigned long try_to_free_mem_cgroup_pages(struct mem_cgroup *memcg,
>  	unsigned long nr_reclaimed;
>  	int nid;
>  	struct scan_control sc = {
> -		.may_writepage = !laptop_mode,
> -		.may_unmap = 1,
> -		.may_swap = !noswap,
>  		.nr_to_reclaim = SWAP_CLUSTER_MAX,
> -		.order = 0,
> -		.priority = DEF_PRIORITY,
> -		.target_mem_cgroup = memcg,
> -		.nodemask = NULL, /* we don't care the placement */
>  		.gfp_mask = (gfp_mask & GFP_RECLAIM_MASK) |
> -				(GFP_HIGHUSER_MOVABLE & ~GFP_RECLAIM_MASK),
> +		            (GFP_HIGHUSER_MOVABLE & ~GFP_RECLAIM_MASK),
> +		.target_mem_cgroup = memcg,
> +		.priority = DEF_PRIORITY,
> +		.flags = MAY_UNMAP,
>  	};
>  
> +	if (!laptop_mode)
> +		sc.flags |= MAY_WRITEPAGE;
> +	if (!noswap)
> +		sc.flags |= MAY_SWAP;
> +
>  	/*
>  	 * Unlike direct reclaim via alloc_pages(), memcg's reclaim doesn't
>  	 * take care of from where we get pages. So the node where we start the
> @@ -2770,7 +2768,7 @@ unsigned long try_to_free_mem_cgroup_pages(struct mem_cgroup *memcg,
>  	zonelist = NODE_DATA(nid)->node_zonelists;
>  
>  	trace_mm_vmscan_memcg_reclaim_begin(0,
> -					    sc.may_writepage,
> +					    sc.flags & MAY_WRITEPAGE,
>  					    sc.gfp_mask);
>  
>  	nr_reclaimed = do_try_to_free_pages(zonelist, &sc);
> @@ -3015,15 +3013,15 @@ static unsigned long balance_pgdat(pg_data_t *pgdat, int order,
>  	unsigned long nr_soft_scanned;
>  	struct scan_control sc = {
>  		.gfp_mask = GFP_KERNEL,
> -		.priority = DEF_PRIORITY,
> -		.may_unmap = 1,
> -		.may_swap = 1,
> -		.may_writepage = !laptop_mode,
>  		.order = order,
> -		.target_mem_cgroup = NULL,
> +		.priority = DEF_PRIORITY,
> +		.flags = MAY_UNMAP | MAY_SWAP,
>  	};
>  	count_vm_event(PAGEOUTRUN);
>  
> +	if (!laptop_mode)
> +		sc.flags |= MAY_WRITEPAGE;
> +
>  	do {
>  		unsigned long lru_pages = 0;
>  		unsigned long nr_attempted = 0;
> @@ -3104,7 +3102,7 @@ static unsigned long balance_pgdat(pg_data_t *pgdat, int order,
>  		 * even in laptop mode.
>  		 */
>  		if (sc.priority < DEF_PRIORITY - 2)
> -			sc.may_writepage = 1;
> +			sc.flags |= MAY_WRITEPAGE;
>  
>  		/*
>  		 * Now scan the zone in the dma->highmem direction, stopping
> @@ -3401,14 +3399,11 @@ unsigned long shrink_all_memory(unsigned long nr_to_reclaim)
>  {
>  	struct reclaim_state reclaim_state;
>  	struct scan_control sc = {
> -		.gfp_mask = GFP_HIGHUSER_MOVABLE,
> -		.may_swap = 1,
> -		.may_unmap = 1,
> -		.may_writepage = 1,
>  		.nr_to_reclaim = nr_to_reclaim,
> -		.hibernation_mode = 1,
> -		.order = 0,
> +		.gfp_mask = GFP_HIGHUSER_MOVABLE,
>  		.priority = DEF_PRIORITY,
> +		.flags = MAY_WRITEPAGE | MAY_UNMAP | MAY_SWAP |
> +		         MAY_SKIP_CONGESTION,
>  	};
>  	struct zonelist *zonelist = node_zonelist(numa_node_id(), sc.gfp_mask);
>  	struct task_struct *p = current;
> @@ -3588,19 +3583,22 @@ static int __zone_reclaim(struct zone *zone, gfp_t gfp_mask, unsigned int order)
>  	struct task_struct *p = current;
>  	struct reclaim_state reclaim_state;
>  	struct scan_control sc = {
> -		.may_writepage = !!(zone_reclaim_mode & RECLAIM_WRITE),
> -		.may_unmap = !!(zone_reclaim_mode & RECLAIM_SWAP),
> -		.may_swap = 1,
>  		.nr_to_reclaim = max(nr_pages, SWAP_CLUSTER_MAX),
>  		.gfp_mask = (gfp_mask = memalloc_noio_flags(gfp_mask)),
>  		.order = order,
>  		.priority = ZONE_RECLAIM_PRIORITY,
> +		.flags = MAY_SWAP,
>  	};
>  	struct shrink_control shrink = {
>  		.gfp_mask = sc.gfp_mask,
>  	};
>  	unsigned long nr_slab_pages0, nr_slab_pages1;
>  
> +	if (zone_reclaim_mode & RECLAIM_WRITE)
> +		sc.flags |= MAY_WRITEPAGE;
> +	if (zone_reclaim_mode & RECLAIM_SWAP)
> +		sc.flags |= MAY_UNMAP;
> +
>  	cond_resched();
>  	/*
>  	 * We need to be able to allocate from the reserves for RECLAIM_SWAP
> -- 
> 2.0.0

--
To unsubscribe, send a message with 'unsubscribe linux-mm' in
the body to majordomo@kvack.org.  For more info on Linux MM,
see: http://www.linux-mm.org/ .
Don't email: <a href=mailto:"dont@kvack.org"> email@kvack.org </a>

next prev parent reply	other threads:[~2014-07-14 19:48 UTC|newest]

Thread overview: 15+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2014-07-14 13:20 [patch 0/3] mm: vmscan: followup fixes to cleanups in -mm Johannes Weiner
2014-07-14 13:20 ` [patch 1/3] mm: vmscan: rework compaction-ready signaling in direct reclaim fix Johannes Weiner
2014-07-14 14:09   ` Rik van Riel
2014-07-18 12:50   ` Mel Gorman
2014-07-14 13:20 ` [patch 2/3] mm: vmscan: remove all_unreclaimable() fix Johannes Weiner
2014-07-14 14:10   ` Rik van Riel
2014-07-16  9:40   ` Michal Hocko
2014-07-18 12:51   ` Mel Gorman
2014-07-14 13:20 ` [patch 3/3] mm: vmscan: clean up struct scan_control Johannes Weiner
2014-07-14 19:46   ` Hugh Dickins [this message]
2014-07-17 13:26     ` Johannes Weiner
2014-07-17 13:57       ` Michal Hocko
2014-07-17 23:00         ` Hugh Dickins
2014-07-18 12:53       ` Mel Gorman
2014-07-14 19:56   ` Andrew Morton

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=alpine.LSU.2.11.1407141240200.17669@eggly.anvils \
    --to=hughd@google.com \
    --cc=akpm@linux-foundation.org \
    --cc=hannes@cmpxchg.org \
    --cc=linux-kernel@vger.kernel.org \
    --cc=linux-mm@kvack.org \
    --cc=mgorman@suse.de \
    --cc=mhocko@suse.cz \
    --cc=minchan.kim@gmail.com \
    --cc=riel@redhat.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link

Be sure your reply has a Subject: header at the top and a blank line before the message body.

This is a public inbox; see the mirroring instructions
for how to clone and mirror all data and code used for this inbox,
as well as URLs for NNTP newsgroup(s).