From: Oscar Salvador <osalvador@techadventures.net>
To: Pavel Tatashin <pasha.tatashin@oracle.com>
Cc: steven.sistare@oracle.com, daniel.m.jordan@oracle.com,
linux-kernel@vger.kernel.org, akpm@linux-foundation.org,
kirill.shutemov@linux.intel.com, mhocko@suse.com,
linux-mm@kvack.org, dan.j.williams@intel.com, jack@suse.cz,
jglisse@redhat.com, jrdr.linux@gmail.com, bhe@redhat.com,
gregkh@linuxfoundation.org, vbabka@suse.cz,
richard.weiyang@gmail.com, dave.hansen@intel.com,
rientjes@google.com, mingo@kernel.org
Subject: Re: [PATCH v1 2/2] mm/sparse: start using sparse_init_nid(), and remove old code
Date: Fri, 29 Jun 2018 16:40:59 +0200 [thread overview]
Message-ID: <20180629144059.GB23545@techadventures.net> (raw)
In-Reply-To: <20180628173010.23849-3-pasha.tatashin@oracle.com>
On Thu, Jun 28, 2018 at 01:30:10PM -0400, Pavel Tatashin wrote:
> Change sparse_init() to only find the pnum ranges that belong to a specific
> node and call sparse_init_nid() for that range from sparse_init().
>
> Delete all the code that became obsolete with this change.
>
> Signed-off-by: Pavel Tatashin <pasha.tatashin@oracle.com>
> ---
> include/linux/mm.h | 5 -
> mm/sparse-vmemmap.c | 39 --------
> mm/sparse.c | 223 ++++----------------------------------------
> 3 files changed, 16 insertions(+), 251 deletions(-)
>
> diff --git a/include/linux/mm.h b/include/linux/mm.h
> index ba200808dd5f..a25395071a13 100644
> --- a/include/linux/mm.h
> +++ b/include/linux/mm.h
> @@ -2646,11 +2646,6 @@ extern int randomize_va_space;
> const char * arch_vma_name(struct vm_area_struct *vma);
> void print_vma_addr(char *prefix, unsigned long rip);
>
> -void sparse_mem_maps_populate_node(struct page **map_map,
> - unsigned long pnum_begin,
> - unsigned long pnum_end,
> - unsigned long map_count,
> - int nodeid);
> struct page * sparse_populate_node(unsigned long pnum_begin,
> unsigned long pnum_end,
> unsigned long map_count,
> diff --git a/mm/sparse-vmemmap.c b/mm/sparse-vmemmap.c
> index 4655503bdc66..0adda7c32feb 100644
> --- a/mm/sparse-vmemmap.c
> +++ b/mm/sparse-vmemmap.c
> @@ -273,45 +273,6 @@ struct page * __meminit sparse_mem_map_populate(unsigned long pnum, int nid,
> return map;
> }
>
> -void __init sparse_mem_maps_populate_node(struct page **map_map,
> - unsigned long pnum_begin,
> - unsigned long pnum_end,
> - unsigned long map_count, int nodeid)
> -{
> - unsigned long pnum;
> - unsigned long size = sizeof(struct page) * PAGES_PER_SECTION;
> - void *vmemmap_buf_start;
> - int nr_consumed_maps = 0;
> -
> - size = ALIGN(size, PMD_SIZE);
> - vmemmap_buf_start = __earlyonly_bootmem_alloc(nodeid, size * map_count,
> - PMD_SIZE, __pa(MAX_DMA_ADDRESS));
> -
> - if (vmemmap_buf_start) {
> - vmemmap_buf = vmemmap_buf_start;
> - vmemmap_buf_end = vmemmap_buf_start + size * map_count;
> - }
> -
> - for (pnum = pnum_begin; pnum < pnum_end; pnum++) {
> - if (!present_section_nr(pnum))
> - continue;
> -
> - map_map[nr_consumed_maps] = sparse_mem_map_populate(pnum, nodeid, NULL);
> - if (map_map[nr_consumed_maps++])
> - continue;
> - pr_err("%s: sparsemem memory map backing failed some memory will not be available\n",
> - __func__);
> - }
> -
> - if (vmemmap_buf_start) {
> - /* need to free left buf */
> - memblock_free_early(__pa(vmemmap_buf),
> - vmemmap_buf_end - vmemmap_buf);
> - vmemmap_buf = NULL;
> - vmemmap_buf_end = NULL;
> - }
> -}
> -
> struct page * __init sparse_populate_node(unsigned long pnum_begin,
> unsigned long pnum_end,
> unsigned long map_count,
> diff --git a/mm/sparse.c b/mm/sparse.c
> index 60eaa2a4842a..ad2522e733bb 100644
> --- a/mm/sparse.c
> +++ b/mm/sparse.c
> @@ -200,12 +200,6 @@ static inline int next_present_section_nr(int section_nr)
> (section_nr <= __highest_present_section_nr)); \
> section_nr = next_present_section_nr(section_nr))
>
> -/*
> - * Record how many memory sections are marked as present
> - * during system bootup.
> - */
> -static int __initdata nr_present_sections;
> -
> /* Record a memory area against a node. */
> void __init memory_present(int nid, unsigned long start, unsigned long end)
> {
> @@ -235,7 +229,6 @@ void __init memory_present(int nid, unsigned long start, unsigned long end)
> ms->section_mem_map = sparse_encode_early_nid(nid) |
> SECTION_IS_ONLINE;
> section_mark_present(ms);
> - nr_present_sections++;
> }
> }
> }
> @@ -377,34 +370,6 @@ static void __init check_usemap_section_nr(int nid, unsigned long *usemap)
> }
> #endif /* CONFIG_MEMORY_HOTREMOVE */
>
> -static void __init sparse_early_usemaps_alloc_node(void *data,
> - unsigned long pnum_begin,
> - unsigned long pnum_end,
> - unsigned long usemap_count, int nodeid)
> -{
> - void *usemap;
> - unsigned long pnum;
> - unsigned long **usemap_map = (unsigned long **)data;
> - int size = usemap_size();
> - int nr_consumed_maps = 0;
> -
> - usemap = sparse_early_usemaps_alloc_pgdat_section(NODE_DATA(nodeid),
> - size * usemap_count);
> - if (!usemap) {
> - pr_warn("%s: allocation failed\n", __func__);
> - return;
> - }
> -
> - for (pnum = pnum_begin; pnum < pnum_end; pnum++) {
> - if (!present_section_nr(pnum))
> - continue;
> - usemap_map[nr_consumed_maps] = usemap;
> - usemap += size;
> - check_usemap_section_nr(nodeid, usemap_map[nr_consumed_maps]);
> - nr_consumed_maps++;
> - }
> -}
> -
> #ifndef CONFIG_SPARSEMEM_VMEMMAP
> struct page __init *sparse_mem_map_populate(unsigned long pnum, int nid,
> struct vmem_altmap *altmap)
> @@ -418,44 +383,6 @@ struct page __init *sparse_mem_map_populate(unsigned long pnum, int nid,
> BOOTMEM_ALLOC_ACCESSIBLE, nid);
> return map;
> }
> -void __init sparse_mem_maps_populate_node(struct page **map_map,
> - unsigned long pnum_begin,
> - unsigned long pnum_end,
> - unsigned long map_count, int nodeid)
> -{
> - void *map;
> - unsigned long pnum;
> - unsigned long size = sizeof(struct page) * PAGES_PER_SECTION;
> - int nr_consumed_maps;
> -
> - size = PAGE_ALIGN(size);
> - map = memblock_virt_alloc_try_nid_raw(size * map_count,
> - PAGE_SIZE, __pa(MAX_DMA_ADDRESS),
> - BOOTMEM_ALLOC_ACCESSIBLE, nodeid);
> - if (map) {
> - nr_consumed_maps = 0;
> - for (pnum = pnum_begin; pnum < pnum_end; pnum++) {
> - if (!present_section_nr(pnum))
> - continue;
> - map_map[nr_consumed_maps] = map;
> - map += size;
> - nr_consumed_maps++;
> - }
> - return;
> - }
> -
> - /* fallback */
> - nr_consumed_maps = 0;
> - for (pnum = pnum_begin; pnum < pnum_end; pnum++) {
> - if (!present_section_nr(pnum))
> - continue;
> - map_map[nr_consumed_maps] = sparse_mem_map_populate(pnum, nodeid, NULL);
> - if (map_map[nr_consumed_maps++])
> - continue;
> - pr_err("%s: sparsemem memory map backing failed some memory will not be available\n",
> - __func__);
> - }
> -}
>
> static unsigned long section_map_size(void)
> {
> @@ -495,73 +422,15 @@ struct page * __init sprase_populate_node_section(struct page *map_base,
> }
> #endif /* !CONFIG_SPARSEMEM_VMEMMAP */
>
> -static void __init sparse_early_mem_maps_alloc_node(void *data,
> - unsigned long pnum_begin,
> - unsigned long pnum_end,
> - unsigned long map_count, int nodeid)
> -{
> - struct page **map_map = (struct page **)data;
> - sparse_mem_maps_populate_node(map_map, pnum_begin, pnum_end,
> - map_count, nodeid);
> -}
> -
> void __weak __meminit vmemmap_populate_print_last(void)
> {
> }
>
> -/**
> - * alloc_usemap_and_memmap - memory alloction for pageblock flags and vmemmap
> - * @map: usemap_map for pageblock flags or mmap_map for vmemmap
> - * @unit_size: size of map unit
> - */
> -static void __init alloc_usemap_and_memmap(void (*alloc_func)
> - (void *, unsigned long, unsigned long,
> - unsigned long, int), void *data,
> - int data_unit_size)
> -{
> - unsigned long pnum;
> - unsigned long map_count;
> - int nodeid_begin = 0;
> - unsigned long pnum_begin = 0;
> -
> - for_each_present_section_nr(0, pnum) {
> - struct mem_section *ms;
> -
> - ms = __nr_to_section(pnum);
> - nodeid_begin = sparse_early_nid(ms);
> - pnum_begin = pnum;
> - break;
> - }
> - map_count = 1;
> - for_each_present_section_nr(pnum_begin + 1, pnum) {
> - struct mem_section *ms;
> - int nodeid;
> -
> - ms = __nr_to_section(pnum);
> - nodeid = sparse_early_nid(ms);
> - if (nodeid == nodeid_begin) {
> - map_count++;
> - continue;
> - }
> - /* ok, we need to take cake of from pnum_begin to pnum - 1*/
> - alloc_func(data, pnum_begin, pnum,
> - map_count, nodeid_begin);
> - /* new start, update count etc*/
> - nodeid_begin = nodeid;
> - pnum_begin = pnum;
> - data += map_count * data_unit_size;
> - map_count = 1;
> - }
> - /* ok, last chunk */
> - alloc_func(data, pnum_begin, __highest_present_section_nr+1,
> - map_count, nodeid_begin);
> -}
> -
> /*
> * Initialize sparse on a specific node. The node spans [pnum_begin, pnum_end)
> * And number of present sections in this node is map_count.
> */
> -void __init sparse_init_nid(int nid, unsigned long pnum_begin,
> +static void __init sparse_init_nid(int nid, unsigned long pnum_begin,
> unsigned long pnum_end,
> unsigned long map_count)
> {
> @@ -616,87 +485,27 @@ void __init sparse_init_nid(int nid, unsigned long pnum_begin,
> */
> void __init sparse_init(void)
> {
> - unsigned long pnum;
> - struct page *map;
> - struct page **map_map;
> - unsigned long *usemap;
> - unsigned long **usemap_map;
> - int size, size2;
> - int nr_consumed_maps = 0;
> + unsigned long pnum_begin, pnum_end, map_count;
> + int nid, nid_begin;
>
> - /* see include/linux/mmzone.h 'struct mem_section' definition */
> - BUILD_BUG_ON(!is_power_of_2(sizeof(struct mem_section)));
> -
> - /* Setup pageblock_order for HUGETLB_PAGE_SIZE_VARIABLE */
> - set_pageblock_order();
> -
> - /*
> - * map is using big page (aka 2M in x86 64 bit)
> - * usemap is less one page (aka 24 bytes)
> - * so alloc 2M (with 2M align) and 24 bytes in turn will
> - * make next 2M slip to one more 2M later.
> - * then in big system, the memory will have a lot of holes...
> - * here try to allocate 2M pages continuously.
> - *
> - * powerpc need to call sparse_init_one_section right after each
> - * sparse_early_mem_map_alloc, so allocate usemap_map at first.
> - */
> - size = sizeof(unsigned long *) * nr_present_sections;
> - usemap_map = memblock_virt_alloc(size, 0);
> - if (!usemap_map)
> - panic("can not allocate usemap_map\n");
> - alloc_usemap_and_memmap(sparse_early_usemaps_alloc_node,
> - (void *)usemap_map,
> - sizeof(usemap_map[0]));
> -
> - size2 = sizeof(struct page *) * nr_present_sections;
> - map_map = memblock_virt_alloc(size2, 0);
> - if (!map_map)
> - panic("can not allocate map_map\n");
> - alloc_usemap_and_memmap(sparse_early_mem_maps_alloc_node,
> - (void *)map_map,
> - sizeof(map_map[0]));
> -
> - /* The numner of present sections stored in nr_present_sections
> - * are kept the same since mem sections are marked as present in
> - * memory_present(). In this for loop, we need check which sections
> - * failed to allocate memmap or usemap, then clear its
> - * ->section_mem_map accordingly. During this process, we need
> - * increase 'nr_consumed_maps' whether its allocation of memmap
> - * or usemap failed or not, so that after we handle the i-th
> - * memory section, can get memmap and usemap of (i+1)-th section
> - * correctly. */
> - for_each_present_section_nr(0, pnum) {
> - struct mem_section *ms;
> -
> - if (nr_consumed_maps >= nr_present_sections) {
> - pr_err("nr_consumed_maps goes beyond nr_present_sections\n");
> - break;
> - }
> - ms = __nr_to_section(pnum);
> - usemap = usemap_map[nr_consumed_maps];
> - if (!usemap) {
> - ms->section_mem_map = 0;
> - nr_consumed_maps++;
> - continue;
> - }
> + for_each_present_section_nr(0, pnum_begin)
> + break;
Hi Pavel,
instead of this first for_each_present_section_nr() loop, what about writing a
static inline function that returns next_present_section_nr(-1)?
Something like:
static inline int first_present_section_nr(void)
{
	return next_present_section_nr(-1);
}
pnum_begin = first_present_section_nr();
I think it will generate the same code, but maybe it is more readable?
>
> - map = map_map[nr_consumed_maps];
> - if (!map) {
> - ms->section_mem_map = 0;
> - nr_consumed_maps++;
> + nid_begin = sparse_early_nid(__nr_to_section(pnum_begin));
> + map_count = 1;
> + for_each_present_section_nr(pnum_begin + 1, pnum_end) {
> + nid = sparse_early_nid(__nr_to_section(pnum_end));
> + if (nid == nid_begin) {
> + map_count++;
> continue;
> }
> -
> - sparse_init_one_section(__nr_to_section(pnum), pnum, map,
> - usemap);
> - nr_consumed_maps++;
> + sparse_init_nid(nid, pnum_begin, pnum_end, map_count);
> + nid_begin = nid;
> + pnum_begin = pnum_end;
> + map_count = 1;
> }
> -
> + sparse_init_nid(nid_begin, pnum_begin, pnum_end, map_count);
> vmemmap_populate_print_last();
> -
> - memblock_free_early(__pa(map_map), size2);
> - memblock_free_early(__pa(usemap_map), size);
> }
>
> #ifdef CONFIG_MEMORY_HOTPLUG
> --
> 2.18.0
>
--
Oscar Salvador
SUSE L3
next prev parent reply other threads:[~2018-06-29 14:41 UTC|newest]
Thread overview: 10+ messages / expand[flat|nested] mbox.gz Atom feed top
2018-06-28 17:30 [PATCH v1 0/2] sparse_init rewrite Pavel Tatashin
2018-06-28 17:30 ` [PATCH v1 1/2] mm/sparse: add sparse_init_nid() Pavel Tatashin
2018-06-29 10:04 ` Oscar Salvador
2018-06-29 10:44 ` Oscar Salvador
2018-06-29 11:56 ` Pavel Tatashin
2018-06-29 14:35 ` Oscar Salvador
2018-06-29 15:54 ` Pavel Tatashin
2018-06-28 17:30 ` [PATCH v1 2/2] mm/sparse: start using sparse_init_nid(), and remove old code Pavel Tatashin
2018-06-29 14:40 ` Oscar Salvador [this message]
2018-06-29 15:55 ` Pavel Tatashin
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20180629144059.GB23545@techadventures.net \
--to=osalvador@techadventures.net \
--cc=akpm@linux-foundation.org \
--cc=bhe@redhat.com \
--cc=dan.j.williams@intel.com \
--cc=daniel.m.jordan@oracle.com \
--cc=dave.hansen@intel.com \
--cc=gregkh@linuxfoundation.org \
--cc=jack@suse.cz \
--cc=jglisse@redhat.com \
--cc=jrdr.linux@gmail.com \
--cc=kirill.shutemov@linux.intel.com \
--cc=linux-kernel@vger.kernel.org \
--cc=linux-mm@kvack.org \
--cc=mhocko@suse.com \
--cc=mingo@kernel.org \
--cc=pasha.tatashin@oracle.com \
--cc=richard.weiyang@gmail.com \
--cc=rientjes@google.com \
--cc=steven.sistare@oracle.com \
--cc=vbabka@suse.cz \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.