linux-mm.kvack.org archive mirror
 help / color / mirror / Atom feed
From: Michal Hocko <mhocko@suse.cz>
To: Mel Gorman <mgorman@suse.de>
Cc: Andrew Morton <akpm@linux-foundation.org>,
	Jiri Slaby <jslaby@suse.cz>,
	Valdis Kletnieks <Valdis.Kletnieks@vt.edu>,
	Rik van Riel <riel@redhat.com>,
	Zlatko Calusic <zcalusic@bitsync.net>,
	Johannes Weiner <hannes@cmpxchg.org>,
	dormando <dormando@rydia.net>,
	Kamezawa Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>,
	Linux-MM <linux-mm@kvack.org>,
	LKML <linux-kernel@vger.kernel.org>
Subject: Re: [PATCH 9/9] mm: vmscan: Move logic from balance_pgdat() to kswapd_shrink_zone()
Date: Tue, 14 May 2013 14:23:25 +0200	[thread overview]
Message-ID: <20130514122325.GP5198@dhcp22.suse.cz> (raw)
In-Reply-To: <1368432760-21573-10-git-send-email-mgorman@suse.de>

On Mon 13-05-13 09:12:40, Mel Gorman wrote:
> balance_pgdat() is very long and some of the logic can and should
> be internal to kswapd_shrink_zone(). Move it so the flow of
> balance_pgdat() is marginally easier to follow.
> 
> Signed-off-by: Mel Gorman <mgorman@suse.de>
> Acked-by: Johannes Weiner <hannes@cmpxchg.org>

Looks good
Reviewed-by: Michal Hocko <mhocko@suse.cz>

> ---
>  mm/vmscan.c | 110 +++++++++++++++++++++++++++++-------------------------------
>  1 file changed, 54 insertions(+), 56 deletions(-)
> 
> diff --git a/mm/vmscan.c b/mm/vmscan.c
> index e65fe46..0ba9d3a 100644
> --- a/mm/vmscan.c
> +++ b/mm/vmscan.c
> @@ -2705,18 +2705,53 @@ static bool prepare_kswapd_sleep(pg_data_t *pgdat, int order, long remaining,
>   * This is used to determine if the scanning priority needs to be raised.
>   */
>  static bool kswapd_shrink_zone(struct zone *zone,
> +			       int classzone_idx,
>  			       struct scan_control *sc,
>  			       unsigned long lru_pages,
>  			       unsigned long *nr_attempted)
>  {
>  	unsigned long nr_slab;
> +	int testorder = sc->order;
> +	unsigned long balance_gap;
>  	struct reclaim_state *reclaim_state = current->reclaim_state;
>  	struct shrink_control shrink = {
>  		.gfp_mask = sc->gfp_mask,
>  	};
> +	bool lowmem_pressure;
>  
>  	/* Reclaim above the high watermark. */
>  	sc->nr_to_reclaim = max(SWAP_CLUSTER_MAX, high_wmark_pages(zone));
> +
> +	/*
> +	 * Kswapd reclaims only single pages with compaction enabled. Trying
> +	 * too hard to reclaim until contiguous free pages have become
> +	 * available can hurt performance by evicting too much useful data
> +	 * from memory. Do not reclaim more than needed for compaction.
> +	 */
> +	if (IS_ENABLED(CONFIG_COMPACTION) && sc->order &&
> +			compaction_suitable(zone, sc->order) !=
> +				COMPACT_SKIPPED)
> +		testorder = 0;
> +
> +	/*
> +	 * We put equal pressure on every zone, unless one zone has way too
> +	 * many pages free already. The "too many pages" is defined as the
> +	 * high wmark plus a "gap" where the gap is either the low
> +	 * watermark or 1% of the zone, whichever is smaller.
> +	 */
> +	balance_gap = min(low_wmark_pages(zone),
> +		(zone->managed_pages + KSWAPD_ZONE_BALANCE_GAP_RATIO-1) /
> +		KSWAPD_ZONE_BALANCE_GAP_RATIO);
> +
> +	/*
> +	 * If there is no low memory pressure and the zone is balanced then no
> +	 * reclaim is necessary
> +	 */
> +	lowmem_pressure = (buffer_heads_over_limit && is_highmem(zone));
> +	if (!lowmem_pressure && zone_balanced(zone, testorder,
> +						balance_gap, classzone_idx))
> +		return true;
> +
>  	shrink_zone(zone, sc);
>  
>  	reclaim_state->reclaimed_slab = 0;
> @@ -2731,6 +2766,18 @@ static bool kswapd_shrink_zone(struct zone *zone,
>  
>  	zone_clear_flag(zone, ZONE_WRITEBACK);
>  
> +	/*
> +	 * If a zone reaches its high watermark, consider it to be no longer
> +	 * congested. It's possible there are dirty pages backed by congested
> +	 * BDIs but as pressure is relieved, speculatively avoid congestion
> +	 * waits.
> +	 */
> +	if (!zone->all_unreclaimable &&
> +	    zone_balanced(zone, testorder, 0, classzone_idx)) {
> +		zone_clear_flag(zone, ZONE_CONGESTED);
> +		zone_clear_flag(zone, ZONE_TAIL_LRU_DIRTY);
> +	}
> +
>  	return sc->nr_scanned >= sc->nr_to_reclaim;
>  }
>  
> @@ -2866,8 +2913,6 @@ static unsigned long balance_pgdat(pg_data_t *pgdat, int order,
>  		 */
>  		for (i = 0; i <= end_zone; i++) {
>  			struct zone *zone = pgdat->node_zones + i;
> -			int testorder;
> -			unsigned long balance_gap;
>  
>  			if (!populated_zone(zone))
>  				continue;
> @@ -2888,61 +2933,14 @@ static unsigned long balance_pgdat(pg_data_t *pgdat, int order,
>  			sc.nr_reclaimed += nr_soft_reclaimed;
>  
>  			/*
> -			 * We put equal pressure on every zone, unless
> -			 * one zone has way too many pages free
> -			 * already. The "too many pages" is defined
> -			 * as the high wmark plus a "gap" where the
> -			 * gap is either the low watermark or 1%
> -			 * of the zone, whichever is smaller.
> -			 */
> -			balance_gap = min(low_wmark_pages(zone),
> -				(zone->managed_pages +
> -					KSWAPD_ZONE_BALANCE_GAP_RATIO-1) /
> -				KSWAPD_ZONE_BALANCE_GAP_RATIO);
> -			/*
> -			 * Kswapd reclaims only single pages with compaction
> -			 * enabled. Trying too hard to reclaim until contiguous
> -			 * free pages have become available can hurt performance
> -			 * by evicting too much useful data from memory.
> -			 * Do not reclaim more than needed for compaction.
> +			 * There should be no need to raise the scanning
> +			 * priority if enough pages are already being scanned
> +			 * that the high watermark would be met at 100%
> +			 * efficiency.
>  			 */
> -			testorder = order;
> -			if (IS_ENABLED(CONFIG_COMPACTION) && order &&
> -					compaction_suitable(zone, order) !=
> -						COMPACT_SKIPPED)
> -				testorder = 0;
> -
> -			if ((buffer_heads_over_limit && is_highmem_idx(i)) ||
> -			    !zone_balanced(zone, testorder,
> -					   balance_gap, end_zone)) {
> -				/*
> -				 * There should be no need to raise the
> -				 * scanning priority if enough pages are
> -				 * already being scanned that high
> -				 * watermark would be met at 100% efficiency.
> -				 */
> -				if (kswapd_shrink_zone(zone, &sc, lru_pages,
> -						       &nr_attempted))
> -					raise_priority = false;
> -			}
> -
> -			if (zone->all_unreclaimable) {
> -				if (end_zone && end_zone == i)
> -					end_zone--;
> -				continue;
> -			}
> -
> -			if (zone_balanced(zone, testorder, 0, end_zone))
> -				/*
> -				 * If a zone reaches its high watermark,
> -				 * consider it to be no longer congested. It's
> -				 * possible there are dirty pages backed by
> -				 * congested BDIs but as pressure is relieved,
> -				 * speculatively avoid congestion waits
> -				 * or writing pages from kswapd context.
> -				 */
> -				zone_clear_flag(zone, ZONE_CONGESTED);
> -				zone_clear_flag(zone, ZONE_TAIL_LRU_DIRTY);
> +			if (kswapd_shrink_zone(zone, end_zone, &sc,
> +					lru_pages, &nr_attempted))
> +				raise_priority = false;
>  		}
>  
>  		/*
> -- 
> 1.8.1.4
> 

-- 
Michal Hocko
SUSE Labs

--
To unsubscribe, send a message with 'unsubscribe linux-mm' in
the body to majordomo@kvack.org.  For more info on Linux MM,
see: http://www.linux-mm.org/ .
Don't email: <a href="mailto:dont@kvack.org"> email@kvack.org </a>

  reply	other threads:[~2013-05-14 12:23 UTC|newest]

Thread overview: 27+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2013-05-13  8:12 [PATCH 0/9] Reduce system disruption due to kswapd V4 Mel Gorman
2013-05-13  8:12 ` [PATCH 1/9] mm: vmscan: Limit the number of pages kswapd reclaims at each priority Mel Gorman
2013-05-13  8:12 ` [PATCH 2/9] mm: vmscan: Obey proportional scanning requirements for kswapd Mel Gorman
2013-05-14 10:21   ` Michal Hocko
2013-05-17  3:41   ` Kamezawa Hiroyuki
2013-05-13  8:12 ` [PATCH 3/9] mm: vmscan: Flatten kswapd priority loop Mel Gorman
2013-05-14 10:38   ` Michal Hocko
2013-05-13  8:12 ` [PATCH 4/9] mm: vmscan: Decide whether to compact the pgdat based on reclaim progress Mel Gorman
2013-05-14 10:51   ` Michal Hocko
2013-05-13  8:12 ` [PATCH 5/9] mm: vmscan: Do not allow kswapd to scan at maximum priority Mel Gorman
2013-05-13  8:12 ` [PATCH 6/9] mm: vmscan: Have kswapd writeback pages based on dirty pages encountered, not priority Mel Gorman
2013-05-14 11:25   ` Michal Hocko
2013-05-13  8:12 ` [PATCH 7/9] mm: vmscan: Block kswapd if it is encountering pages under writeback Mel Gorman
2013-05-14 21:06   ` Rik van Riel
2013-05-15 21:39   ` Andrew Morton
2013-05-16 13:07     ` Mel Gorman
2013-05-13  8:12 ` [PATCH 8/9] mm: vmscan: Check if kswapd should writepage once per pgdat scan Mel Gorman
2013-05-13  8:12 ` [PATCH 9/9] mm: vmscan: Move logic from balance_pgdat() to kswapd_shrink_zone() Mel Gorman
2013-05-14 12:23   ` Michal Hocko [this message]
2013-05-14 21:06   ` Rik van Riel
2013-05-15 20:37 ` [PATCH 0/9] Reduce system disruption due to kswapd V4 Andrew Morton
2013-05-16 10:33   ` Mel Gorman
2013-05-16 13:54     ` Michal Hocko
2013-05-16 14:11       ` Mel Gorman
2013-05-18 21:15   ` Zlatko Calusic
2013-05-21 23:13 ` Dave Chinner
2013-05-22  8:48   ` Mel Gorman

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=20130514122325.GP5198@dhcp22.suse.cz \
    --to=mhocko@suse.cz \
    --cc=Valdis.Kletnieks@vt.edu \
    --cc=akpm@linux-foundation.org \
    --cc=dormando@rydia.net \
    --cc=hannes@cmpxchg.org \
    --cc=jslaby@suse.cz \
    --cc=kamezawa.hiroyu@jp.fujitsu.com \
    --cc=linux-kernel@vger.kernel.org \
    --cc=linux-mm@kvack.org \
    --cc=mgorman@suse.de \
    --cc=riel@redhat.com \
    --cc=zcalusic@bitsync.net \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox