Message ID | 524163CF.3010303@cn.fujitsu.com (mailing list archive) |
---|---|
State | Superseded, archived |
Headers | show |
On Tue, Sep 24, 2013 at 06:05:03PM +0800, Zhang Yanfei wrote: > +/* Allocation direction */ > +enum { > + MEMBLOCK_DIRECTION_TOP_DOWN, > + MEMBLOCK_DIRECTION_BOTTOM_UP, > + NR_MEMLBOCK_DIRECTIONS > +}; > + > struct memblock_region { > phys_addr_t base; > phys_addr_t size; > @@ -35,6 +42,7 @@ struct memblock_type { > }; > > struct memblock { > + int current_direction; /* current allocation direction */ Just use boolean bottom_up here too? No need for the constants. > @@ -20,6 +20,8 @@ > #include <linux/seq_file.h> > #include <linux/memblock.h> > > +#include <asm-generic/sections.h> > + Why is the above added by this patch? > /** > + * __memblock_find_range - find free area utility > + * @start: start of candidate range > + * @end: end of candidate range, can be %MEMBLOCK_ALLOC_{ANYWHERE|ACCESSIBLE} > + * @size: size of free area to find > + * @align: alignment of free area to find > + * @nid: nid of the free area to find, %MAX_NUMNODES for any node > + * > + * Utility called from memblock_find_in_range_node(), find free area bottom-up. > + * > + * RETURNS: > + * Found address on success, %0 on failure. I don't think we prefix numeric literals with %. ... > @@ -127,6 +162,10 @@ __memblock_find_range_rev(phys_addr_t start, phys_addr_t end, > * > * Find @size free area aligned to @align in the specified range and node. > * > + * When allocation direction is bottom-up, the @start should be greater > + * than the end of the kernel image. Otherwise, it will be trimmed. And also, > + * if bottom-up allocation failed, will try to allocate memory top-down. It'd be nice to explain that bottom-up allocation is limited to above kernel image and what it's used for here. > + * > * RETURNS: > * Found address on success, %0 on failure. > */ > @@ -134,6 +173,8 @@ phys_addr_t __init_memblock memblock_find_in_range_node(phys_addr_t start, > phys_addr_t end, phys_addr_t size, > phys_addr_t align, int nid) > { > + int ret; > + > /* pump up @end */ > if (end == MEMBLOCK_ALLOC_ACCESSIBLE) > end = memblock.current_limit; > @@ -142,6 +183,28 @@ phys_addr_t __init_memblock memblock_find_in_range_node(phys_addr_t start, > start = max_t(phys_addr_t, start, PAGE_SIZE); > end = max(start, end); > > + if (memblock_bottom_up()) { > + phys_addr_t bottom_up_start; > + > + /* make sure we will allocate above the kernel */ > + bottom_up_start = max_t(phys_addr_t, start, __pa_symbol(_end)); > + > + /* ok, try bottom-up allocation first */ > + ret = __memblock_find_range(bottom_up_start, end, > + size, align, nid); > + if (ret) > + return ret; > + > + /* > + * we always limit bottom-up allocation above the kernel, > + * but top-down allocation doesn't have the limit, so > + * retrying top-down allocation may succeed when bottom-up > + * allocation failed. > + */ > + pr_warn("memblock: Failed to allocate memory in bottom up " > + "direction. Now try top down direction.\n"); Maybe just print warning only on the first failure? Otherwise, looks good to me. Thanks.
Hello tejun, On 09/24/2013 08:17 PM, Tejun Heo wrote: > On Tue, Sep 24, 2013 at 06:05:03PM +0800, Zhang Yanfei wrote: >> +/* Allocation direction */ >> +enum { >> + MEMBLOCK_DIRECTION_TOP_DOWN, >> + MEMBLOCK_DIRECTION_BOTTOM_UP, >> + NR_MEMLBOCK_DIRECTIONS >> +}; >> + >> struct memblock_region { >> phys_addr_t base; >> phys_addr_t size; >> @@ -35,6 +42,7 @@ struct memblock_type { >> }; >> >> struct memblock { >> + int current_direction; /* current allocation direction */ > > Just use boolean bottom_up here too? No need for the constants. OKay. Will try this way. > >> @@ -20,6 +20,8 @@ >> #include <linux/seq_file.h> >> #include <linux/memblock.h> >> >> +#include <asm-generic/sections.h> >> + > > Why is the above added by this patch? Oh, we use _end in this file which is defined in that header file. > >> /** >> + * __memblock_find_range - find free area utility >> + * @start: start of candidate range >> + * @end: end of candidate range, can be %MEMBLOCK_ALLOC_{ANYWHERE|ACCESSIBLE} >> + * @size: size of free area to find >> + * @align: alignment of free area to find >> + * @nid: nid of the free area to find, %MAX_NUMNODES for any node >> + * >> + * Utility called from memblock_find_in_range_node(), find free area bottom-up. >> + * >> + * RETURNS: >> + * Found address on success, %0 on failure. > > I don't think we prefix numeric literals with %. OKay. Will remove % > > ... >> @@ -127,6 +162,10 @@ __memblock_find_range_rev(phys_addr_t start, phys_addr_t end, >> * >> * Find @size free area aligned to @align in the specified range and node. >> * >> + * When allocation direction is bottom-up, the @start should be greater >> + * than the end of the kernel image. Otherwise, it will be trimmed. And also, >> + * if bottom-up allocation failed, will try to allocate memory top-down. > > It'd be nice to explain that bottom-up allocation is limited to above > kernel image and what it's used for here. OK. Will add the comment. > >> + * >> * RETURNS: >> * Found address on success, %0 on failure. >> */ >> @@ -134,6 +173,8 @@ phys_addr_t __init_memblock memblock_find_in_range_node(phys_addr_t start, >> phys_addr_t end, phys_addr_t size, >> phys_addr_t align, int nid) >> { >> + int ret; >> + >> /* pump up @end */ >> if (end == MEMBLOCK_ALLOC_ACCESSIBLE) >> end = memblock.current_limit; >> @@ -142,6 +183,28 @@ phys_addr_t __init_memblock memblock_find_in_range_node(phys_addr_t start, >> start = max_t(phys_addr_t, start, PAGE_SIZE); >> end = max(start, end); >> >> + if (memblock_bottom_up()) { >> + phys_addr_t bottom_up_start; >> + >> + /* make sure we will allocate above the kernel */ >> + bottom_up_start = max_t(phys_addr_t, start, __pa_symbol(_end)); >> + >> + /* ok, try bottom-up allocation first */ >> + ret = __memblock_find_range(bottom_up_start, end, >> + size, align, nid); >> + if (ret) >> + return ret; >> + >> + /* >> + * we always limit bottom-up allocation above the kernel, >> + * but top-down allocation doesn't have the limit, so >> + * retrying top-down allocation may succeed when bottom-up >> + * allocation failed. >> + */ >> + pr_warn("memblock: Failed to allocate memory in bottom up " >> + "direction. Now try top down direction.\n"); > > Maybe just print warning only on the first failure? Hmmm... This message is for each memblock allocation, that said, if the allocation this time fails, it prints the message and we use so called top-down. But next time, we still use bottom up first again. Did you mean if we fail on one bottom-up allocation, then we never try bottom-up again and will always use top-down? Thanks. > > Otherwise, looks good to me. > > Thanks. >
On Tue, Sep 24, 2013 at 09:17:16PM +0800, Zhang Yanfei wrote: > > Maybe just print warning only on the first failure? > > Hmmm... This message is for each memblock allocation, that said, if the > allocation this time fails, it prints the message and we use so called top-down. > But next time, we still use bottom up first again. > > Did you mean if we fail on one bottom-up allocation, then we never try > bottom-up again and will always use top-down? Nope, it's just that it might end up printing something for each alloc which can end up flooding console / log. The first failure is the most interesting and pretty much defeats the purpose of the whole thing after all. If it's expected to fail very rarely, I'd just stick in WARN_ONCE() there as the stack trace would be interesting too. Thanks.
On 09/24/2013 09:23 PM, Tejun Heo wrote: > On Tue, Sep 24, 2013 at 09:17:16PM +0800, Zhang Yanfei wrote: >>> Maybe just print warning only on the first failure? >> >> Hmmm... This message is for each memblock allocation, that said, if the >> allocation this time fails, it prints the message and we use so called top-down. >> But next time, we still use bottom up first again. >> >> Did you mean if we fail on one bottom-up allocation, then we never try >> bottom-up again and will always use top-down? > > Nope, it's just that it might end up printing something for each alloc > which can end up flooding console / log. The first failure is the > most interesting and pretty much defeats the purpose of the whole > thing after all. If it's expected to fail very rarely, I'd just stick > in WARN_ONCE() there as the stack trace would be interesting too. > I see. I think it is rarely to fail. But here is case that it must fail in the current bottom-up implementation. For example, we allocate memory in reserve_real_mode() by calling this: memblock_find_in_range(0, 1<<20, size, PAGE_SIZE); Both the start and end is below the kernel, so trying bottom-up for this must fail. So I am now thinking that if we should take this as the special case for bottom-up. That said, if we limit start and end both below the kernel, we should allocate memory below the kernel instead of make it fail. The cases are also rare, in early boot time, only these two: |->early_reserve_e820_mpc_new() /* allocate memory under 1MB */ |->reserve_real_mode() /* allocate memory under 1MB */ How do you think?
Hello, On Tue, Sep 24, 2013 at 10:12:22PM +0800, Zhang Yanfei wrote: > I see. I think it is rarely to fail. But here is case that it must > fail in the current bottom-up implementation. For example, we allocate > memory in reserve_real_mode() by calling this: > memblock_find_in_range(0, 1<<20, size, PAGE_SIZE); > > Both the start and end is below the kernel, so trying bottom-up for > this must fail. So I am now thinking that if we should take this as > the special case for bottom-up. That said, if we limit start and end > both below the kernel, we should allocate memory below the kernel instead > of make it fail. The cases are also rare, in early boot time, only > these two: > > |->early_reserve_e820_mpc_new() /* allocate memory under 1MB */ > |->reserve_real_mode() /* allocate memory under 1MB */ > > How do you think? They need to be special cased regardless, right? It's wrong to print out warning messages for things which are expected to behave that way. Just skip bottom-up allocs if @end is under kernel image? Thanks.
On 09/24/2013 10:16 PM, Tejun Heo wrote: > Hello, > > On Tue, Sep 24, 2013 at 10:12:22PM +0800, Zhang Yanfei wrote: >> I see. I think it is rarely to fail. But here is case that it must >> fail in the current bottom-up implementation. For example, we allocate >> memory in reserve_real_mode() by calling this: >> memblock_find_in_range(0, 1<<20, size, PAGE_SIZE); >> >> Both the start and end is below the kernel, so trying bottom-up for >> this must fail. So I am now thinking that if we should take this as >> the special case for bottom-up. That said, if we limit start and end >> both below the kernel, we should allocate memory below the kernel instead >> of make it fail. The cases are also rare, in early boot time, only >> these two: >> >> |->early_reserve_e820_mpc_new() /* allocate memory under 1MB */ >> |->reserve_real_mode() /* allocate memory under 1MB */ >> >> How do you think? > > They need to be special cased regardless, right? It's wrong to print > out warning messages for things which are expected to behave that way. > Just skip bottom-up allocs if @end is under kernel image? > Good idea. Will do this way.
diff --git a/include/linux/memblock.h b/include/linux/memblock.h index 31e95ac..c14bca5 100644 --- a/include/linux/memblock.h +++ b/include/linux/memblock.h @@ -19,6 +19,13 @@ #define INIT_MEMBLOCK_REGIONS 128 +/* Allocation direction */ +enum { + MEMBLOCK_DIRECTION_TOP_DOWN, + MEMBLOCK_DIRECTION_BOTTOM_UP, + NR_MEMLBOCK_DIRECTIONS +}; + struct memblock_region { phys_addr_t base; phys_addr_t size; @@ -35,6 +42,7 @@ struct memblock_type { }; struct memblock { + int current_direction; /* current allocation direction */ phys_addr_t current_limit; struct memblock_type memory; struct memblock_type reserved; @@ -148,6 +156,24 @@ phys_addr_t memblock_alloc_try_nid(phys_addr_t size, phys_addr_t align, int nid) phys_addr_t memblock_alloc(phys_addr_t size, phys_addr_t align); +#ifdef CONFIG_MOVABLE_NODE +static inline void memblock_set_bottom_up(bool enable) +{ + if (enable) + memblock.current_direction = MEMBLOCK_DIRECTION_BOTTOM_UP; + else + memblock.current_direction = MEMBLOCK_DIRECTION_TOP_DOWN; +} + +static inline bool memblock_bottom_up(void) +{ + return memblock.current_direction == MEMBLOCK_DIRECTION_BOTTOM_UP; +} +#else +static inline void memblock_set_bottom_up(bool enable) {} +static inline bool memblock_bottom_up(void) { return false; } +#endif + /* Flags for memblock_alloc_base() amd __memblock_alloc_base() */ #define MEMBLOCK_ALLOC_ANYWHERE (~(phys_addr_t)0) #define MEMBLOCK_ALLOC_ACCESSIBLE 0 diff --git a/mm/memblock.c b/mm/memblock.c index 3d80c74..5859b8e 100644 --- a/mm/memblock.c +++ b/mm/memblock.c @@ -20,6 +20,8 @@ #include <linux/seq_file.h> #include <linux/memblock.h> +#include <asm-generic/sections.h> + static struct memblock_region memblock_memory_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock; static struct memblock_region memblock_reserved_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock; @@ -32,6 +34,7 @@ struct memblock memblock __initdata_memblock = { .reserved.cnt = 1, /* empty dummy entry */ .reserved.max = INIT_MEMBLOCK_REGIONS, + .current_direction = MEMBLOCK_DIRECTION_TOP_DOWN, .current_limit = MEMBLOCK_ALLOC_ANYWHERE, }; @@ -83,6 +86,38 @@ static long __init_memblock memblock_overlaps_region(struct memblock_type *type, } /** + * __memblock_find_range - find free area utility + * @start: start of candidate range + * @end: end of candidate range, can be %MEMBLOCK_ALLOC_{ANYWHERE|ACCESSIBLE} + * @size: size of free area to find + * @align: alignment of free area to find + * @nid: nid of the free area to find, %MAX_NUMNODES for any node + * + * Utility called from memblock_find_in_range_node(), find free area bottom-up. + * + * RETURNS: + * Found address on success, %0 on failure. + */ +static phys_addr_t __init_memblock +__memblock_find_range(phys_addr_t start, phys_addr_t end, phys_addr_t size, + phys_addr_t align, int nid) +{ + phys_addr_t this_start, this_end, cand; + u64 i; + + for_each_free_mem_range(i, nid, &this_start, &this_end, NULL) { + this_start = clamp(this_start, start, end); + this_end = clamp(this_end, start, end); + + cand = round_up(this_start, align); + if (cand < this_end && this_end - cand >= size) + return cand; + } + + return 0; +} + +/** * __memblock_find_range_rev - find free area utility, in reverse order * @start: start of candidate range * @end: end of candidate range, can be %MEMBLOCK_ALLOC_{ANYWHERE|ACCESSIBLE} @@ -127,6 +162,10 @@ __memblock_find_range_rev(phys_addr_t start, phys_addr_t end, * * Find @size free area aligned to @align in the specified range and node. * + * When allocation direction is bottom-up, the @start should be greater + * than the end of the kernel image. Otherwise, it will be trimmed. And also, + * if bottom-up allocation failed, will try to allocate memory top-down. + * * RETURNS: * Found address on success, %0 on failure. */ @@ -134,6 +173,8 @@ phys_addr_t __init_memblock memblock_find_in_range_node(phys_addr_t start, phys_addr_t end, phys_addr_t size, phys_addr_t align, int nid) { + int ret; + /* pump up @end */ if (end == MEMBLOCK_ALLOC_ACCESSIBLE) end = memblock.current_limit; @@ -142,6 +183,28 @@ phys_addr_t __init_memblock memblock_find_in_range_node(phys_addr_t start, start = max_t(phys_addr_t, start, PAGE_SIZE); end = max(start, end); + if (memblock_bottom_up()) { + phys_addr_t bottom_up_start; + + /* make sure we will allocate above the kernel */ + bottom_up_start = max_t(phys_addr_t, start, __pa_symbol(_end)); + + /* ok, try bottom-up allocation first */ + ret = __memblock_find_range(bottom_up_start, end, + size, align, nid); + if (ret) + return ret; + + /* + * we always limit bottom-up allocation above the kernel, + * but top-down allocation doesn't have the limit, so + * retrying top-down allocation may succeed when bottom-up + * allocation failed. + */ + pr_warn("memblock: Failed to allocate memory in bottom up " + "direction. Now try top down direction.\n"); + } + return __memblock_find_range_rev(start, end, size, align, nid); }