Commit 4eb0716e authored by Alexandre Ghiti's avatar Alexandre Ghiti Committed by Linus Torvalds

hugetlb: allow to free gigantic pages regardless of the configuration

On systems without CONTIG_ALLOC activated but that support gigantic pages,
boottime reserved gigantic pages can not be freed at all.  This patch
simply enables the possibility to hand back those pages to memory
allocator.

Link: http://lkml.kernel.org/r/20190327063626.18421-5-alex@ghiti.frSigned-off-by: default avatarAlexandre Ghiti <alex@ghiti.fr>
Acked-by: David S. Miller <davem@davemloft.net> [sparc]
Reviewed-by: default avatarMike Kravetz <mike.kravetz@oracle.com>
Cc: Andy Lutomirsky <luto@kernel.org>
Cc: Aneesh Kumar K.V <aneesh.kumar@linux.ibm.com>
Cc: Benjamin Herrenschmidt <benh@kernel.crashing.org>
Cc: Borislav Petkov <bp@alien8.de>
Cc: Catalin Marinas <catalin.marinas@arm.com>
Cc: Dave Hansen <dave.hansen@linux.intel.com>
Cc: Heiko Carstens <heiko.carstens@de.ibm.com>
Cc: "H . Peter Anvin" <hpa@zytor.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Martin Schwidefsky <schwidefsky@de.ibm.com>
Cc: Michael Ellerman <mpe@ellerman.id.au>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Rich Felker <dalias@libc.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Vlastimil Babka <vbabka@suse.cz>
Cc: Will Deacon <will.deacon@arm.com>
Cc: Yoshinori Sato <ysato@users.sourceforge.jp>
Signed-off-by: default avatarAndrew Morton <akpm@linux-foundation.org>
Signed-off-by: default avatarLinus Torvalds <torvalds@linux-foundation.org>
parent 8df995f6
...@@ -19,7 +19,7 @@ config ARM64 ...@@ -19,7 +19,7 @@ config ARM64
select ARCH_HAS_FAST_MULTIPLIER select ARCH_HAS_FAST_MULTIPLIER
select ARCH_HAS_FORTIFY_SOURCE select ARCH_HAS_FORTIFY_SOURCE
select ARCH_HAS_GCOV_PROFILE_ALL select ARCH_HAS_GCOV_PROFILE_ALL
select ARCH_HAS_GIGANTIC_PAGE if CONTIG_ALLOC select ARCH_HAS_GIGANTIC_PAGE
select ARCH_HAS_KCOV select ARCH_HAS_KCOV
select ARCH_HAS_KEEPINITRD select ARCH_HAS_KEEPINITRD
select ARCH_HAS_MEMBARRIER_SYNC_CORE select ARCH_HAS_MEMBARRIER_SYNC_CORE
......
...@@ -70,8 +70,4 @@ extern void set_huge_swap_pte_at(struct mm_struct *mm, unsigned long addr, ...@@ -70,8 +70,4 @@ extern void set_huge_swap_pte_at(struct mm_struct *mm, unsigned long addr,
#include <asm-generic/hugetlb.h> #include <asm-generic/hugetlb.h>
#ifdef CONFIG_ARCH_HAS_GIGANTIC_PAGE
static inline bool gigantic_page_supported(void) { return true; }
#endif
#endif /* __ASM_HUGETLB_H */ #endif /* __ASM_HUGETLB_H */
...@@ -36,8 +36,8 @@ static inline int hstate_get_psize(struct hstate *hstate) ...@@ -36,8 +36,8 @@ static inline int hstate_get_psize(struct hstate *hstate)
} }
} }
#ifdef CONFIG_ARCH_HAS_GIGANTIC_PAGE #define __HAVE_ARCH_GIGANTIC_PAGE_RUNTIME_SUPPORTED
static inline bool gigantic_page_supported(void) static inline bool gigantic_page_runtime_supported(void)
{ {
/* /*
* We used gigantic page reservation with hypervisor assist in some case. * We used gigantic page reservation with hypervisor assist in some case.
...@@ -49,7 +49,6 @@ static inline bool gigantic_page_supported(void) ...@@ -49,7 +49,6 @@ static inline bool gigantic_page_supported(void)
return true; return true;
} }
#endif
/* hugepd entry valid bit */ /* hugepd entry valid bit */
#define HUGEPD_VAL_BITS (0x8000000000000000UL) #define HUGEPD_VAL_BITS (0x8000000000000000UL)
......
...@@ -331,7 +331,7 @@ config ARCH_ENABLE_SPLIT_PMD_PTLOCK ...@@ -331,7 +331,7 @@ config ARCH_ENABLE_SPLIT_PMD_PTLOCK
config PPC_RADIX_MMU config PPC_RADIX_MMU
bool "Radix MMU Support" bool "Radix MMU Support"
depends on PPC_BOOK3S_64 && HUGETLB_PAGE depends on PPC_BOOK3S_64 && HUGETLB_PAGE
select ARCH_HAS_GIGANTIC_PAGE if CONTIG_ALLOC select ARCH_HAS_GIGANTIC_PAGE
select PPC_HAVE_KUEP select PPC_HAVE_KUEP
select PPC_HAVE_KUAP select PPC_HAVE_KUAP
default y default y
......
...@@ -63,7 +63,7 @@ config S390 ...@@ -63,7 +63,7 @@ config S390
select ARCH_HAS_ELF_RANDOMIZE select ARCH_HAS_ELF_RANDOMIZE
select ARCH_HAS_FORTIFY_SOURCE select ARCH_HAS_FORTIFY_SOURCE
select ARCH_HAS_GCOV_PROFILE_ALL select ARCH_HAS_GCOV_PROFILE_ALL
select ARCH_HAS_GIGANTIC_PAGE if CONTIG_ALLOC select ARCH_HAS_GIGANTIC_PAGE
select ARCH_HAS_KCOV select ARCH_HAS_KCOV
select ARCH_HAS_PTE_SPECIAL select ARCH_HAS_PTE_SPECIAL
select ARCH_HAS_SET_MEMORY select ARCH_HAS_SET_MEMORY
......
...@@ -116,7 +116,9 @@ static inline pte_t huge_pte_modify(pte_t pte, pgprot_t newprot) ...@@ -116,7 +116,9 @@ static inline pte_t huge_pte_modify(pte_t pte, pgprot_t newprot)
return pte_modify(pte, newprot); return pte_modify(pte, newprot);
} }
#ifdef CONFIG_ARCH_HAS_GIGANTIC_PAGE static inline bool gigantic_page_runtime_supported(void)
static inline bool gigantic_page_supported(void) { return true; } {
#endif return true;
}
#endif /* _ASM_S390_HUGETLB_H */ #endif /* _ASM_S390_HUGETLB_H */
...@@ -53,7 +53,7 @@ config SUPERH ...@@ -53,7 +53,7 @@ config SUPERH
select HAVE_FUTEX_CMPXCHG if FUTEX select HAVE_FUTEX_CMPXCHG if FUTEX
select HAVE_NMI select HAVE_NMI
select NEED_SG_DMA_LENGTH select NEED_SG_DMA_LENGTH
select ARCH_HAS_GIGANTIC_PAGE if CONTIG_ALLOC select ARCH_HAS_GIGANTIC_PAGE
help help
The SuperH is a RISC processor targeted for use in embedded systems The SuperH is a RISC processor targeted for use in embedded systems
......
...@@ -92,7 +92,7 @@ config SPARC64 ...@@ -92,7 +92,7 @@ config SPARC64
select ARCH_CLOCKSOURCE_DATA select ARCH_CLOCKSOURCE_DATA
select ARCH_HAS_PTE_SPECIAL select ARCH_HAS_PTE_SPECIAL
select PCI_DOMAINS if PCI select PCI_DOMAINS if PCI
select ARCH_HAS_GIGANTIC_PAGE if CONTIG_ALLOC select ARCH_HAS_GIGANTIC_PAGE
config ARCH_DEFCONFIG config ARCH_DEFCONFIG
string string
......
...@@ -22,7 +22,7 @@ config X86_64 ...@@ -22,7 +22,7 @@ config X86_64
def_bool y def_bool y
depends on 64BIT depends on 64BIT
# Options that are inherently 64-bit kernel only: # Options that are inherently 64-bit kernel only:
select ARCH_HAS_GIGANTIC_PAGE if CONTIG_ALLOC select ARCH_HAS_GIGANTIC_PAGE
select ARCH_SUPPORTS_INT128 select ARCH_SUPPORTS_INT128
select ARCH_USE_CMPXCHG_LOCKREF select ARCH_USE_CMPXCHG_LOCKREF
select HAVE_ARCH_SOFT_DIRTY select HAVE_ARCH_SOFT_DIRTY
......
...@@ -17,8 +17,4 @@ static inline void arch_clear_hugepage_flags(struct page *page) ...@@ -17,8 +17,4 @@ static inline void arch_clear_hugepage_flags(struct page *page)
{ {
} }
#ifdef CONFIG_ARCH_HAS_GIGANTIC_PAGE
static inline bool gigantic_page_supported(void) { return true; }
#endif
#endif /* _ASM_X86_HUGETLB_H */ #endif /* _ASM_X86_HUGETLB_H */
...@@ -126,4 +126,11 @@ static inline pte_t huge_ptep_get(pte_t *ptep) ...@@ -126,4 +126,11 @@ static inline pte_t huge_ptep_get(pte_t *ptep)
} }
#endif #endif
#ifndef __HAVE_ARCH_GIGANTIC_PAGE_RUNTIME_SUPPORTED
static inline bool gigantic_page_runtime_supported(void)
{
return IS_ENABLED(CONFIG_ARCH_HAS_GIGANTIC_PAGE);
}
#endif /* __HAVE_ARCH_GIGANTIC_PAGE_RUNTIME_SUPPORTED */
#endif /* _ASM_GENERIC_HUGETLB_H */ #endif /* _ASM_GENERIC_HUGETLB_H */
...@@ -589,8 +589,8 @@ static inline bool pm_suspended_storage(void) ...@@ -589,8 +589,8 @@ static inline bool pm_suspended_storage(void)
/* The below functions must be run on a range from a single zone. */ /* The below functions must be run on a range from a single zone. */
extern int alloc_contig_range(unsigned long start, unsigned long end, extern int alloc_contig_range(unsigned long start, unsigned long end,
unsigned migratetype, gfp_t gfp_mask); unsigned migratetype, gfp_t gfp_mask);
extern void free_contig_range(unsigned long pfn, unsigned nr_pages);
#endif #endif
void free_contig_range(unsigned long pfn, unsigned int nr_pages);
#ifdef CONFIG_CMA #ifdef CONFIG_CMA
/* CMA stuff */ /* CMA stuff */
......
...@@ -1059,6 +1059,7 @@ static void free_gigantic_page(struct page *page, unsigned int order) ...@@ -1059,6 +1059,7 @@ static void free_gigantic_page(struct page *page, unsigned int order)
free_contig_range(page_to_pfn(page), 1 << order); free_contig_range(page_to_pfn(page), 1 << order);
} }
#ifdef CONFIG_CONTIG_ALLOC
static int __alloc_gigantic_page(unsigned long start_pfn, static int __alloc_gigantic_page(unsigned long start_pfn,
unsigned long nr_pages, gfp_t gfp_mask) unsigned long nr_pages, gfp_t gfp_mask)
{ {
...@@ -1143,11 +1144,20 @@ static struct page *alloc_gigantic_page(struct hstate *h, gfp_t gfp_mask, ...@@ -1143,11 +1144,20 @@ static struct page *alloc_gigantic_page(struct hstate *h, gfp_t gfp_mask,
static void prep_new_huge_page(struct hstate *h, struct page *page, int nid); static void prep_new_huge_page(struct hstate *h, struct page *page, int nid);
static void prep_compound_gigantic_page(struct page *page, unsigned int order); static void prep_compound_gigantic_page(struct page *page, unsigned int order);
#else /* !CONFIG_CONTIG_ALLOC */
static struct page *alloc_gigantic_page(struct hstate *h, gfp_t gfp_mask,
int nid, nodemask_t *nodemask)
{
return NULL;
}
#endif /* CONFIG_CONTIG_ALLOC */
#else /* !CONFIG_ARCH_HAS_GIGANTIC_PAGE */ #else /* !CONFIG_ARCH_HAS_GIGANTIC_PAGE */
static inline bool gigantic_page_supported(void) { return false; }
static struct page *alloc_gigantic_page(struct hstate *h, gfp_t gfp_mask, static struct page *alloc_gigantic_page(struct hstate *h, gfp_t gfp_mask,
int nid, nodemask_t *nodemask) { return NULL; } int nid, nodemask_t *nodemask)
{
return NULL;
}
static inline void free_gigantic_page(struct page *page, unsigned int order) { } static inline void free_gigantic_page(struct page *page, unsigned int order) { }
static inline void destroy_compound_gigantic_page(struct page *page, static inline void destroy_compound_gigantic_page(struct page *page,
unsigned int order) { } unsigned int order) { }
...@@ -1157,7 +1167,7 @@ static void update_and_free_page(struct hstate *h, struct page *page) ...@@ -1157,7 +1167,7 @@ static void update_and_free_page(struct hstate *h, struct page *page)
{ {
int i; int i;
if (hstate_is_gigantic(h) && !gigantic_page_supported()) if (hstate_is_gigantic(h) && !gigantic_page_runtime_supported())
return; return;
h->nr_huge_pages--; h->nr_huge_pages--;
...@@ -2278,13 +2288,27 @@ static int adjust_pool_surplus(struct hstate *h, nodemask_t *nodes_allowed, ...@@ -2278,13 +2288,27 @@ static int adjust_pool_surplus(struct hstate *h, nodemask_t *nodes_allowed,
} }
#define persistent_huge_pages(h) (h->nr_huge_pages - h->surplus_huge_pages) #define persistent_huge_pages(h) (h->nr_huge_pages - h->surplus_huge_pages)
static unsigned long set_max_huge_pages(struct hstate *h, unsigned long count, static int set_max_huge_pages(struct hstate *h, unsigned long count,
nodemask_t *nodes_allowed) nodemask_t *nodes_allowed)
{ {
unsigned long min_count, ret; unsigned long min_count, ret;
if (hstate_is_gigantic(h) && !gigantic_page_supported()) spin_lock(&hugetlb_lock);
return h->max_huge_pages;
/*
* Gigantic pages runtime allocation depend on the capability for large
* page range allocation.
* If the system does not provide this feature, return an error when
* the user tries to allocate gigantic pages but let the user free the
* boottime allocated gigantic pages.
*/
if (hstate_is_gigantic(h) && !IS_ENABLED(CONFIG_CONTIG_ALLOC)) {
if (count > persistent_huge_pages(h)) {
spin_unlock(&hugetlb_lock);
return -EINVAL;
}
/* Fall through to decrease pool */
}
/* /*
* Increase the pool size * Increase the pool size
...@@ -2297,7 +2321,6 @@ static unsigned long set_max_huge_pages(struct hstate *h, unsigned long count, ...@@ -2297,7 +2321,6 @@ static unsigned long set_max_huge_pages(struct hstate *h, unsigned long count,
* pool might be one hugepage larger than it needs to be, but * pool might be one hugepage larger than it needs to be, but
* within all the constraints specified by the sysctls. * within all the constraints specified by the sysctls.
*/ */
spin_lock(&hugetlb_lock);
while (h->surplus_huge_pages && count > persistent_huge_pages(h)) { while (h->surplus_huge_pages && count > persistent_huge_pages(h)) {
if (!adjust_pool_surplus(h, nodes_allowed, -1)) if (!adjust_pool_surplus(h, nodes_allowed, -1))
break; break;
...@@ -2352,9 +2375,10 @@ static unsigned long set_max_huge_pages(struct hstate *h, unsigned long count, ...@@ -2352,9 +2375,10 @@ static unsigned long set_max_huge_pages(struct hstate *h, unsigned long count,
break; break;
} }
out: out:
ret = persistent_huge_pages(h); h->max_huge_pages = persistent_huge_pages(h);
spin_unlock(&hugetlb_lock); spin_unlock(&hugetlb_lock);
return ret;
return 0;
} }
#define HSTATE_ATTR_RO(_name) \ #define HSTATE_ATTR_RO(_name) \
...@@ -2406,7 +2430,7 @@ static ssize_t __nr_hugepages_store_common(bool obey_mempolicy, ...@@ -2406,7 +2430,7 @@ static ssize_t __nr_hugepages_store_common(bool obey_mempolicy,
int err; int err;
NODEMASK_ALLOC(nodemask_t, nodes_allowed, GFP_KERNEL | __GFP_NORETRY); NODEMASK_ALLOC(nodemask_t, nodes_allowed, GFP_KERNEL | __GFP_NORETRY);
if (hstate_is_gigantic(h) && !gigantic_page_supported()) { if (hstate_is_gigantic(h) && !gigantic_page_runtime_supported()) {
err = -EINVAL; err = -EINVAL;
goto out; goto out;
} }
...@@ -2430,15 +2454,13 @@ static ssize_t __nr_hugepages_store_common(bool obey_mempolicy, ...@@ -2430,15 +2454,13 @@ static ssize_t __nr_hugepages_store_common(bool obey_mempolicy,
} else } else
nodes_allowed = &node_states[N_MEMORY]; nodes_allowed = &node_states[N_MEMORY];
h->max_huge_pages = set_max_huge_pages(h, count, nodes_allowed); err = set_max_huge_pages(h, count, nodes_allowed);
out:
if (nodes_allowed != &node_states[N_MEMORY]) if (nodes_allowed != &node_states[N_MEMORY])
NODEMASK_FREE(nodes_allowed); NODEMASK_FREE(nodes_allowed);
return len; return err ? err : len;
out:
NODEMASK_FREE(nodes_allowed);
return err;
} }
static ssize_t nr_hugepages_store_common(bool obey_mempolicy, static ssize_t nr_hugepages_store_common(bool obey_mempolicy,
......
...@@ -8346,8 +8346,9 @@ int alloc_contig_range(unsigned long start, unsigned long end, ...@@ -8346,8 +8346,9 @@ int alloc_contig_range(unsigned long start, unsigned long end,
pfn_max_align_up(end), migratetype); pfn_max_align_up(end), migratetype);
return ret; return ret;
} }
#endif /* CONFIG_CONTIG_ALLOC */
void free_contig_range(unsigned long pfn, unsigned nr_pages) void free_contig_range(unsigned long pfn, unsigned int nr_pages)
{ {
unsigned int count = 0; unsigned int count = 0;
...@@ -8359,7 +8360,6 @@ void free_contig_range(unsigned long pfn, unsigned nr_pages) ...@@ -8359,7 +8360,6 @@ void free_contig_range(unsigned long pfn, unsigned nr_pages)
} }
WARN(count != 0, "%d pages are still in use!\n", count); WARN(count != 0, "%d pages are still in use!\n", count);
} }
#endif
#ifdef CONFIG_MEMORY_HOTPLUG #ifdef CONFIG_MEMORY_HOTPLUG
/* /*
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment