public inbox for linux-kernel@vger.kernel.org
 help / color / mirror / Atom feed
From: "Justin P. Mattock" <justinmattock@gmail.com>
To: Yinghai Lu <yinghai@kernel.org>
Cc: Ingo Molnar <mingo@elte.hu>, Thomas Gleixner <tglx@linutronix.de>,
	"H. Peter Anvin" <hpa@zytor.com>,
	Andrew Morton <akpm@linux-foundation.org>,
	Suresh Siddha <suresh.b.siddha@intel.com>,
	Christoph Lameter <cl@linux-foundation.org>,
	"linux-kernel@vger.kernel.org" <linux-kernel@vger.kernel.org>,
	Al Viro <viro@zeniv.linux.org.uk>,
	Rusty Russell <rusty@rustcorp.com.au>,
	Pekka Enberg <penberg@cs.helsinki.fi>
Subject: Re: [PATCH 2/3] x86: add numa_move_cpus_to_node
Date: Sat, 09 May 2009 00:05:24 -0700	[thread overview]
Message-ID: <1241852724.1876.5.camel@unix> (raw)
In-Reply-To: <4A052721.4010201@kernel.org>

On Fri, 2009-05-08 at 23:48 -0700, Yinghai Lu wrote:

> 
> when node only have hot add range and don't have other static range.

when the node only has "hot add range", then don't have other "static
ranges".

> that node will not be onlined, and cpus on that will be linked to nearby
> node with memory.
> then when that host add range is added later, we need to linked those cpus
Then
> back.
> 
> Signed-off-by: Yinghai Lu <yinghai@kernel.org>
> 
> ---
>  arch/x86/include/asm/numa_64.h |   10 ++++---
>  arch/x86/mm/init_64.c          |    3 ++
>  arch/x86/mm/numa_64.c          |   52 +++++++++++++++++++++++++++++++++++------
>  3 files changed, 54 insertions(+), 11 deletions(-)
> 
> Index: linux-2.6/arch/x86/include/asm/numa_64.h
> ===================================================================
> --- linux-2.6.orig/arch/x86/include/asm/numa_64.h
> +++ linux-2.6/arch/x86/include/asm/numa_64.h
> @@ -25,16 +25,18 @@ extern void setup_node_bootmem(int nodei
>  
>  #ifdef CONFIG_NUMA
>  extern void __init init_cpu_to_node(void);
> -extern void __cpuinit numa_set_node(int cpu, int node);
> -extern void __cpuinit numa_clear_node(int cpu);
> -extern void __cpuinit numa_add_cpu(int cpu);
> -extern void __cpuinit numa_remove_cpu(int cpu);
> +extern void numa_set_node(int cpu, int node);
> +extern void numa_clear_node(int cpu);
> +extern void numa_add_cpu(int cpu);
> +extern void numa_remove_cpu(int cpu);
> +extern void numa_move_cpus_to_node(int nid);
>  #else
>  static inline void init_cpu_to_node(void)		{ }
>  static inline void numa_set_node(int cpu, int node)	{ }
>  static inline void numa_clear_node(int cpu)		{ }
>  static inline void numa_add_cpu(int cpu, int node)	{ }
>  static inline void numa_remove_cpu(int cpu)		{ }
> +static inline void numa_move_cpus_to_node(int nid)	{ }
>  #endif
>  
>  #endif /* _ASM_X86_NUMA_64_H */
> Index: linux-2.6/arch/x86/mm/numa_64.c
> ===================================================================
> --- linux-2.6.orig/arch/x86/mm/numa_64.c
> +++ linux-2.6/arch/x86/mm/numa_64.c
> @@ -12,6 +12,7 @@
>  #include <linux/module.h>
>  #include <linux/nodemask.h>
>  #include <linux/sched.h>
> +#include <linux/node.h>
>  
>  #include <asm/e820.h>
>  #include <asm/proto.h>
> @@ -660,7 +661,7 @@ void __init init_cpu_to_node(void)
>  #endif
>  
> 
> -void __cpuinit numa_set_node(int cpu, int node)
> +void numa_set_node(int cpu, int node)
>  {
>  	int *cpu_to_node_map = early_per_cpu_ptr(x86_cpu_to_node_map);
>  
> @@ -683,19 +684,56 @@ void __cpuinit numa_set_node(int cpu, in
>  		per_cpu(node_number, cpu) = node;
>  }
>  
> -void __cpuinit numa_clear_node(int cpu)
> +void numa_clear_node(int cpu)
>  {
>  	numa_set_node(cpu, NUMA_NO_NODE);
>  }
>  
> +static int real_cpu_to_node(int cpu)
> +{
> +	int apicid, nodeid = -1;
> +
> +	/*
> +	 * when the node doesn't have memory before, cpu_to_node(cpu) is
> +	 * point to other node, but apicid_to_node still hold the real nodeid
> +	 */
> +	apicid = per_cpu(x86_cpu_to_apicid, cpu);
> +	if (apicid == BAD_APICID)
> +		return nodeid;
> +
> +	nodeid = apicid_to_node[apicid];
> +	return nodeid;
> +}
> +
> +void numa_move_cpus_to_node(int nid)
> +{
> +	int cpu;
> +
> +	for_each_present_cpu(cpu) {
> +		int nodeid;
> +
> +		nodeid = real_cpu_to_node(cpu);
> +		if (nodeid != nid)
> +			continue;
> +
> +		nodeid = cpu_to_node(cpu);
> +		if (nodeid != nid) {
> +			unregister_cpu_under_node(cpu, nodeid);
> +			numa_remove_cpu(cpu);
> +			numa_set_node(cpu, nid);
> +			numa_add_cpu(cpu);
> +		}
> +	}
> +}
> +
>  #ifndef CONFIG_DEBUG_PER_CPU_MAPS
>  
> -void __cpuinit numa_add_cpu(int cpu)
> +void numa_add_cpu(int cpu)
>  {
>  	cpumask_set_cpu(cpu, node_to_cpumask_map[early_cpu_to_node(cpu)]);
>  }
>  
> -void __cpuinit numa_remove_cpu(int cpu)
> +void numa_remove_cpu(int cpu)
>  {
>  	cpumask_clear_cpu(cpu, node_to_cpumask_map[early_cpu_to_node(cpu)]);
>  }
> @@ -705,7 +743,7 @@ void __cpuinit numa_remove_cpu(int cpu)
>  /*
>   * --------- debug versions of the numa functions ---------
>   */
> -static void __cpuinit numa_set_cpumask(int cpu, int enable)
> +static void numa_set_cpumask(int cpu, int enable)
>  {
>  	int node = early_cpu_to_node(cpu);
>  	struct cpumask *mask;
> @@ -728,12 +766,12 @@ static void __cpuinit numa_set_cpumask(i
>  		enable ? "numa_add_cpu" : "numa_remove_cpu", cpu, node, buf);
>  }
>  
> -void __cpuinit numa_add_cpu(int cpu)
> +void numa_add_cpu(int cpu)
>  {
>  	numa_set_cpumask(cpu, 1);
>  }
>  
> -void __cpuinit numa_remove_cpu(int cpu)
> +void numa_remove_cpu(int cpu)
>  {
>  	numa_set_cpumask(cpu, 0);
>  }
> Index: linux-2.6/arch/x86/mm/init_64.c
> ===================================================================
> --- linux-2.6.orig/arch/x86/mm/init_64.c
> +++ linux-2.6/arch/x86/mm/init_64.c
> @@ -631,6 +631,9 @@ int arch_add_memory(int nid, u64 start,
>  	ret = __add_pages(nid, zone, start_pfn, nr_pages);
>  	WARN_ON_ONCE(ret);
>  
> +	if (!ret)
> +		numa_move_cpus_to_node(nid);
> +
>  	return ret;
>  }
>  EXPORT_SYMBOL_GPL(arch_add_memory);
> --
> To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
> the body of a message to majordomo@vger.kernel.org
> More majordomo info at  http://vger.kernel.org/majordomo-info.html
> Please read the FAQ at  http://www.tux.org/lkml/

This way it sounds better(correct me if I'm wrong).

regards,

Justin P. Mattock


  reply	other threads:[~2009-05-09  7:05 UTC|newest]

Thread overview: 90+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2009-05-09  6:45 [PATCH 1/3] x86: remove MEMORY_HOTPLUG_RESERVE related code Yinghai Lu
2009-05-09  6:48 ` [PATCH 2/3] x86: add numa_move_cpus_to_node Yinghai Lu
2009-05-09  7:05   ` Justin P. Mattock [this message]
2009-05-12  1:27   ` Christoph Lameter
2009-05-11 21:53     ` Yinghai Lu
2009-05-12 20:59       ` Christoph Lameter
2009-05-12 17:16         ` Yinghai Lu
2009-05-12 21:21           ` Christoph Lameter
2009-05-13  5:39             ` Yinghai Lu
2009-05-14 19:34               ` Christoph Lameter
2009-05-14 20:58                 ` Yinghai Lu
2009-05-09  6:50 ` [PATCH 3/3] x86: fix node_possible_map logic -v2 Yinghai Lu
2009-05-11 17:53   ` Jack Steiner
2009-05-11 19:15     ` Yinghai Lu
2009-05-11 19:36       ` Yinghai Lu
2009-05-11 19:27     ` David Rientjes
2009-05-11 21:12       ` H. Peter Anvin
2009-05-11 21:26         ` Alan Cox
2009-05-11 22:25         ` David Rientjes
2009-05-12 15:06           ` Jack Steiner
2009-05-12 15:10             ` Yinghai Lu
2009-05-12 16:16               ` Jack Steiner
2009-05-12 16:40                 ` Yinghai Lu
2009-05-12 18:03                   ` Jack Steiner
2009-05-12 21:31                     ` Yinghai Lu
2009-05-12 21:58                       ` Jack Steiner
2009-05-12 23:13                         ` Yinghai Lu
2009-05-12 23:26                           ` Yinghai Lu
2009-05-12 15:43             ` Andi Kleen
2009-05-13  1:34             ` [PATCH] x86: fix system without memory on node0 Yinghai Lu
2009-05-13  8:00               ` Andi Kleen
2009-05-13 15:58                 ` Yinghai Lu
2009-05-13 13:35               ` Ingo Molnar
2009-05-13 16:52               ` Jack Steiner
2009-05-13 17:43                 ` Yinghai Lu
2009-05-13 18:08                 ` Yinghai Lu
2009-05-12  7:15         ` [PATCH 3/3] x86: fix node_possible_map logic -v2 Andi Kleen
2009-05-11 21:33       ` Jack Steiner
2009-05-11 22:56         ` David Rientjes
2009-05-11 23:00           ` Yinghai Lu
2009-05-12  7:09       ` Andi Kleen
2009-05-12  1:02 ` [PATCH 1/3] x86: remove MEMORY_HOTPLUG_RESERVE related code Christoph Lameter
2009-05-12 11:16 ` Mel Gorman
2009-05-13  5:29   ` Yinghai Lu
2009-05-13  9:55     ` Mel Gorman
2009-05-13  6:13   ` [PATCH] x86: remove MEMORY_HOTPLUG_RESERVE related code -v2 Yinghai Lu
2009-05-13 14:59     ` Mel Gorman
2009-05-14 16:38       ` [PATCH 1/5] " Yinghai Lu
2009-05-14 16:40         ` [PATCH 2/5] x86: add numa_move_cpus_to_node Yinghai Lu
2009-05-14 16:41         ` [PATCH 3/5] x86: fix node_possible_map logic -v2 Yinghai Lu
2009-05-18  7:40           ` [tip:x86/mm] x86, mm: Fix node_possible_map logic tip-bot for Yinghai Lu
2009-05-14 16:42         ` [PATCH 4/5] x86: fix system without memory on node0 -v2 Yinghai Lu
2009-05-18  7:40           ` [tip:x86/mm] x86: fix system without memory on node0 tip-bot for Yinghai Lu
2009-05-14 16:43         ` [PATCH 5/5] mm: clear N_HIGH_MEMORY map before se set it again -v2 Yinghai Lu
2009-05-14 16:54           ` Andrew Morton
2009-05-14 17:05             ` Yinghai Lu
2009-05-14 17:25               ` Andrew Morton
2009-05-14 17:34                 ` Yinghai Lu
2009-05-14 19:44                   ` Christoph Lameter
2009-06-04  5:16                   ` [RESEND PATCH] " Yinghai Lu
2009-06-04 16:38                     ` Christoph Lameter
2009-06-04 16:48                       ` Yinghai Lu
2009-06-04 17:11                         ` Christoph Lameter
2009-06-04 17:26                           ` [PATCH] mm: clear N_HIGH_MEMORY map before se set it again -v4 Yinghai Lu
2009-06-19  6:42                             ` Nathan Lynch
2009-06-19  8:18                               ` Yinghai Lu
2009-06-19  8:43                                 ` Nathan Lynch
2009-06-19 16:16                                   ` Yinghai Lu
2009-06-20 23:43                                   ` Yinghai Lu
2009-06-22  4:39                                     ` Nathan Lynch
2009-06-22 15:38                                       ` [PATCH] x86: only clear node_states for 64bit Yinghai Lu
2009-06-26 20:54                                         ` Andrew Morton
2009-06-26 21:09                                           ` Yinghai Lu
2009-06-27 17:17                                             ` Ingo Molnar
2009-06-27 20:40                                               ` Yinghai Lu
2009-06-29  7:39                                                 ` Yinghai Lu
2009-05-18  7:39         ` [tip:x86/mm] mm, x86: remove MEMORY_HOTPLUG_RESERVE related code tip-bot for Yinghai Lu
     [not found] ` <20090511095022.GA23121@elte.hu>
     [not found]   ` <20090511163158.c4e4d334.akpm@linux-foundation.org>
     [not found]     ` <20090512090704.GC18004@elte.hu>
     [not found]       ` <4A0A6700.3070100@kernel.org>
     [not found]         ` <20090513133635.GB7384@elte.hu>
     [not found]           ` <4A0AFA6E.5050200@kernel.org>
     [not found]             ` <20090515173521.GA29647@elte.hu>
2009-05-15 21:38               ` tip: patches in git for irq and numa Yinghai Lu
2009-05-18  7:29                 ` Ingo Molnar
2009-05-18 13:50                   ` Peter Zijlstra
2009-05-18 13:56                     ` Ingo Molnar
2009-05-18 15:03                     ` Yinghai Lu
2009-05-18 15:09                       ` Ingo Molnar
2009-05-18 15:11                       ` Peter Zijlstra
2009-05-18 17:23                         ` Yinghai Lu
2009-05-19  9:37                           ` Ingo Molnar
2009-05-19 10:31                             ` Peter Zijlstra
2009-05-19 12:26                               ` Ingo Molnar
2009-05-19  9:39                           ` [tip:irq/numa] x86, io-apic: Don't mark pin_programmed early tip-bot for Yinghai Lu
2009-05-19 12:30                           ` tip-bot for Yinghai Lu

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=1241852724.1876.5.camel@unix \
    --to=justinmattock@gmail.com \
    --cc=akpm@linux-foundation.org \
    --cc=cl@linux-foundation.org \
    --cc=hpa@zytor.com \
    --cc=linux-kernel@vger.kernel.org \
    --cc=mingo@elte.hu \
    --cc=penberg@cs.helsinki.fi \
    --cc=rusty@rustcorp.com.au \
    --cc=suresh.b.siddha@intel.com \
    --cc=tglx@linutronix.de \
    --cc=viro@zeniv.linux.org.uk \
    --cc=yinghai@kernel.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox