xref: /linux/mm/memblock.c (revision 7fb0bc3f06fdc3a35e41bcea7a15e53d2515362f)
195f72d1eSYinghai Lu /*
295f72d1eSYinghai Lu  * Procedures for maintaining information about logical memory blocks.
395f72d1eSYinghai Lu  *
495f72d1eSYinghai Lu  * Peter Bergner, IBM Corp.	June 2001.
595f72d1eSYinghai Lu  * Copyright (C) 2001 Peter Bergner.
695f72d1eSYinghai Lu  *
795f72d1eSYinghai Lu  *      This program is free software; you can redistribute it and/or
895f72d1eSYinghai Lu  *      modify it under the terms of the GNU General Public License
995f72d1eSYinghai Lu  *      as published by the Free Software Foundation; either version
1095f72d1eSYinghai Lu  *      2 of the License, or (at your option) any later version.
1195f72d1eSYinghai Lu  */
1295f72d1eSYinghai Lu 
1395f72d1eSYinghai Lu #include <linux/kernel.h>
14142b45a7SBenjamin Herrenschmidt #include <linux/slab.h>
1595f72d1eSYinghai Lu #include <linux/init.h>
1695f72d1eSYinghai Lu #include <linux/bitops.h>
17449e8df3SBenjamin Herrenschmidt #include <linux/poison.h>
18c196f76fSBenjamin Herrenschmidt #include <linux/pfn.h>
196d03b885SBenjamin Herrenschmidt #include <linux/debugfs.h>
206d03b885SBenjamin Herrenschmidt #include <linux/seq_file.h>
2195f72d1eSYinghai Lu #include <linux/memblock.h>
2295f72d1eSYinghai Lu 
23fe091c20STejun Heo static struct memblock_region memblock_memory_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock;
24fe091c20STejun Heo static struct memblock_region memblock_reserved_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock;
25fe091c20STejun Heo 
26fe091c20STejun Heo struct memblock memblock __initdata_memblock = {
27fe091c20STejun Heo 	.memory.regions		= memblock_memory_init_regions,
28fe091c20STejun Heo 	.memory.cnt		= 1,	/* empty dummy entry */
29fe091c20STejun Heo 	.memory.max		= INIT_MEMBLOCK_REGIONS,
30fe091c20STejun Heo 
31fe091c20STejun Heo 	.reserved.regions	= memblock_reserved_init_regions,
32fe091c20STejun Heo 	.reserved.cnt		= 1,	/* empty dummy entry */
33fe091c20STejun Heo 	.reserved.max		= INIT_MEMBLOCK_REGIONS,
34fe091c20STejun Heo 
35fe091c20STejun Heo 	.current_limit		= MEMBLOCK_ALLOC_ANYWHERE,
36fe091c20STejun Heo };
3795f72d1eSYinghai Lu 
3810d06439SYinghai Lu int memblock_debug __initdata_memblock;
391aadc056STejun Heo static int memblock_can_resize __initdata_memblock;
4095f72d1eSYinghai Lu 
41142b45a7SBenjamin Herrenschmidt /* inline so we don't get a warning when pr_debug is compiled out */
42142b45a7SBenjamin Herrenschmidt static inline const char *memblock_type_name(struct memblock_type *type)
43142b45a7SBenjamin Herrenschmidt {
44142b45a7SBenjamin Herrenschmidt 	if (type == &memblock.memory)
45142b45a7SBenjamin Herrenschmidt 		return "memory";
46142b45a7SBenjamin Herrenschmidt 	else if (type == &memblock.reserved)
47142b45a7SBenjamin Herrenschmidt 		return "reserved";
48142b45a7SBenjamin Herrenschmidt 	else
49142b45a7SBenjamin Herrenschmidt 		return "unknown";
50142b45a7SBenjamin Herrenschmidt }
51142b45a7SBenjamin Herrenschmidt 
52eb18f1b5STejun Heo /* adjust *@size so that (@base + *@size) doesn't overflow, return new size */
53eb18f1b5STejun Heo static inline phys_addr_t memblock_cap_size(phys_addr_t base, phys_addr_t *size)
54eb18f1b5STejun Heo {
55eb18f1b5STejun Heo 	return *size = min(*size, (phys_addr_t)ULLONG_MAX - base);
56eb18f1b5STejun Heo }
57eb18f1b5STejun Heo 
586ed311b2SBenjamin Herrenschmidt /*
596ed311b2SBenjamin Herrenschmidt  * Address comparison utilities
606ed311b2SBenjamin Herrenschmidt  */
6110d06439SYinghai Lu static unsigned long __init_memblock memblock_addrs_overlap(phys_addr_t base1, phys_addr_t size1,
622898cc4cSBenjamin Herrenschmidt 				       phys_addr_t base2, phys_addr_t size2)
6395f72d1eSYinghai Lu {
6495f72d1eSYinghai Lu 	return ((base1 < (base2 + size2)) && (base2 < (base1 + size1)));
6595f72d1eSYinghai Lu }
6695f72d1eSYinghai Lu 
672d7d3eb2SH Hartley Sweeten static long __init_memblock memblock_overlaps_region(struct memblock_type *type,
682d7d3eb2SH Hartley Sweeten 					phys_addr_t base, phys_addr_t size)
696ed311b2SBenjamin Herrenschmidt {
706ed311b2SBenjamin Herrenschmidt 	unsigned long i;
716ed311b2SBenjamin Herrenschmidt 
726ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
736ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnbase = type->regions[i].base;
746ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnsize = type->regions[i].size;
756ed311b2SBenjamin Herrenschmidt 		if (memblock_addrs_overlap(base, size, rgnbase, rgnsize))
766ed311b2SBenjamin Herrenschmidt 			break;
776ed311b2SBenjamin Herrenschmidt 	}
786ed311b2SBenjamin Herrenschmidt 
796ed311b2SBenjamin Herrenschmidt 	return (i < type->cnt) ? i : -1;
806ed311b2SBenjamin Herrenschmidt }
816ed311b2SBenjamin Herrenschmidt 
826ed311b2SBenjamin Herrenschmidt /*
836ed311b2SBenjamin Herrenschmidt  * Find, allocate, deallocate or reserve unreserved regions. All allocations
846ed311b2SBenjamin Herrenschmidt  * are top-down.
856ed311b2SBenjamin Herrenschmidt  */
866ed311b2SBenjamin Herrenschmidt 
87cd79481dSYinghai Lu static phys_addr_t __init_memblock memblock_find_region(phys_addr_t start, phys_addr_t end,
886ed311b2SBenjamin Herrenschmidt 					  phys_addr_t size, phys_addr_t align)
896ed311b2SBenjamin Herrenschmidt {
906ed311b2SBenjamin Herrenschmidt 	phys_addr_t base, res_base;
916ed311b2SBenjamin Herrenschmidt 	long j;
926ed311b2SBenjamin Herrenschmidt 
93f1af98c7SYinghai Lu 	/* In case, huge size is requested */
94f1af98c7SYinghai Lu 	if (end < size)
951f5026a7STejun Heo 		return 0;
96f1af98c7SYinghai Lu 
97348968ebSTejun Heo 	base = round_down(end - size, align);
98f1af98c7SYinghai Lu 
9925818f0fSBenjamin Herrenschmidt 	/* Prevent allocations returning 0 as it's also used to
10025818f0fSBenjamin Herrenschmidt 	 * indicate an allocation failure
10125818f0fSBenjamin Herrenschmidt 	 */
10225818f0fSBenjamin Herrenschmidt 	if (start == 0)
10325818f0fSBenjamin Herrenschmidt 		start = PAGE_SIZE;
10425818f0fSBenjamin Herrenschmidt 
1056ed311b2SBenjamin Herrenschmidt 	while (start <= base) {
1066ed311b2SBenjamin Herrenschmidt 		j = memblock_overlaps_region(&memblock.reserved, base, size);
1076ed311b2SBenjamin Herrenschmidt 		if (j < 0)
1086ed311b2SBenjamin Herrenschmidt 			return base;
1096ed311b2SBenjamin Herrenschmidt 		res_base = memblock.reserved.regions[j].base;
1106ed311b2SBenjamin Herrenschmidt 		if (res_base < size)
1116ed311b2SBenjamin Herrenschmidt 			break;
112348968ebSTejun Heo 		base = round_down(res_base - size, align);
1136ed311b2SBenjamin Herrenschmidt 	}
1146ed311b2SBenjamin Herrenschmidt 
1151f5026a7STejun Heo 	return 0;
1166ed311b2SBenjamin Herrenschmidt }
1176ed311b2SBenjamin Herrenschmidt 
118fc769a8eSTejun Heo /*
119fc769a8eSTejun Heo  * Find a free area with specified alignment in a specific range.
120fc769a8eSTejun Heo  */
121fc769a8eSTejun Heo phys_addr_t __init_memblock memblock_find_in_range(phys_addr_t start, phys_addr_t end,
122fc769a8eSTejun Heo 					phys_addr_t size, phys_addr_t align)
1236ed311b2SBenjamin Herrenschmidt {
1246ed311b2SBenjamin Herrenschmidt 	long i;
1256ed311b2SBenjamin Herrenschmidt 
1266ed311b2SBenjamin Herrenschmidt 	BUG_ON(0 == size);
1276ed311b2SBenjamin Herrenschmidt 
1286ed311b2SBenjamin Herrenschmidt 	/* Pump up max_addr */
129fef501d4SBenjamin Herrenschmidt 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
130fef501d4SBenjamin Herrenschmidt 		end = memblock.current_limit;
1316ed311b2SBenjamin Herrenschmidt 
1326ed311b2SBenjamin Herrenschmidt 	/* We do a top-down search, this tends to limit memory
1336ed311b2SBenjamin Herrenschmidt 	 * fragmentation by keeping early boot allocs near the
1346ed311b2SBenjamin Herrenschmidt 	 * top of memory
1356ed311b2SBenjamin Herrenschmidt 	 */
1366ed311b2SBenjamin Herrenschmidt 	for (i = memblock.memory.cnt - 1; i >= 0; i--) {
1376ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblockbase = memblock.memory.regions[i].base;
1386ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblocksize = memblock.memory.regions[i].size;
139fef501d4SBenjamin Herrenschmidt 		phys_addr_t bottom, top, found;
1406ed311b2SBenjamin Herrenschmidt 
1416ed311b2SBenjamin Herrenschmidt 		if (memblocksize < size)
1426ed311b2SBenjamin Herrenschmidt 			continue;
143fef501d4SBenjamin Herrenschmidt 		if ((memblockbase + memblocksize) <= start)
144fef501d4SBenjamin Herrenschmidt 			break;
145fef501d4SBenjamin Herrenschmidt 		bottom = max(memblockbase, start);
146fef501d4SBenjamin Herrenschmidt 		top = min(memblockbase + memblocksize, end);
147fef501d4SBenjamin Herrenschmidt 		if (bottom >= top)
148fef501d4SBenjamin Herrenschmidt 			continue;
149fef501d4SBenjamin Herrenschmidt 		found = memblock_find_region(bottom, top, size, align);
1501f5026a7STejun Heo 		if (found)
151fef501d4SBenjamin Herrenschmidt 			return found;
1526ed311b2SBenjamin Herrenschmidt 	}
1531f5026a7STejun Heo 	return 0;
1546ed311b2SBenjamin Herrenschmidt }
1556ed311b2SBenjamin Herrenschmidt 
1565303b68fSYinghai Lu /*
1577950c407SYinghai Lu  * Free memblock.reserved.regions
1587950c407SYinghai Lu  */
1597950c407SYinghai Lu int __init_memblock memblock_free_reserved_regions(void)
1607950c407SYinghai Lu {
1617950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1627950c407SYinghai Lu 		return 0;
1637950c407SYinghai Lu 
1647950c407SYinghai Lu 	return memblock_free(__pa(memblock.reserved.regions),
1657950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1667950c407SYinghai Lu }
1677950c407SYinghai Lu 
1687950c407SYinghai Lu /*
1697950c407SYinghai Lu  * Reserve memblock.reserved.regions
1707950c407SYinghai Lu  */
1717950c407SYinghai Lu int __init_memblock memblock_reserve_reserved_regions(void)
1727950c407SYinghai Lu {
1737950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1747950c407SYinghai Lu 		return 0;
1757950c407SYinghai Lu 
1767950c407SYinghai Lu 	return memblock_reserve(__pa(memblock.reserved.regions),
1777950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1787950c407SYinghai Lu }
1797950c407SYinghai Lu 
18010d06439SYinghai Lu static void __init_memblock memblock_remove_region(struct memblock_type *type, unsigned long r)
18195f72d1eSYinghai Lu {
1821440c4e2STejun Heo 	type->total_size -= type->regions[r].size;
1837c0caeb8STejun Heo 	memmove(&type->regions[r], &type->regions[r + 1],
1847c0caeb8STejun Heo 		(type->cnt - (r + 1)) * sizeof(type->regions[r]));
185e3239ff9SBenjamin Herrenschmidt 	type->cnt--;
18695f72d1eSYinghai Lu 
1878f7a6605SBenjamin Herrenschmidt 	/* Special case for empty arrays */
1888f7a6605SBenjamin Herrenschmidt 	if (type->cnt == 0) {
1891440c4e2STejun Heo 		WARN_ON(type->total_size != 0);
1908f7a6605SBenjamin Herrenschmidt 		type->cnt = 1;
1918f7a6605SBenjamin Herrenschmidt 		type->regions[0].base = 0;
1928f7a6605SBenjamin Herrenschmidt 		type->regions[0].size = 0;
1937c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
1948f7a6605SBenjamin Herrenschmidt 	}
19595f72d1eSYinghai Lu }
19695f72d1eSYinghai Lu 
19710d06439SYinghai Lu static int __init_memblock memblock_double_array(struct memblock_type *type)
198142b45a7SBenjamin Herrenschmidt {
199142b45a7SBenjamin Herrenschmidt 	struct memblock_region *new_array, *old_array;
200142b45a7SBenjamin Herrenschmidt 	phys_addr_t old_size, new_size, addr;
201142b45a7SBenjamin Herrenschmidt 	int use_slab = slab_is_available();
202142b45a7SBenjamin Herrenschmidt 
203142b45a7SBenjamin Herrenschmidt 	/* We don't allow resizing until we know about the reserved regions
204142b45a7SBenjamin Herrenschmidt 	 * of memory that aren't suitable for allocation
205142b45a7SBenjamin Herrenschmidt 	 */
206142b45a7SBenjamin Herrenschmidt 	if (!memblock_can_resize)
207142b45a7SBenjamin Herrenschmidt 		return -1;
208142b45a7SBenjamin Herrenschmidt 
209142b45a7SBenjamin Herrenschmidt 	/* Calculate new doubled size */
210142b45a7SBenjamin Herrenschmidt 	old_size = type->max * sizeof(struct memblock_region);
211142b45a7SBenjamin Herrenschmidt 	new_size = old_size << 1;
212142b45a7SBenjamin Herrenschmidt 
213142b45a7SBenjamin Herrenschmidt 	/* Try to find some space for it.
214142b45a7SBenjamin Herrenschmidt 	 *
215142b45a7SBenjamin Herrenschmidt 	 * WARNING: We assume that either slab_is_available() and we use it or
216142b45a7SBenjamin Herrenschmidt 	 * we use MEMBLOCK for allocations. That means that this is unsafe to use
217142b45a7SBenjamin Herrenschmidt 	 * when bootmem is currently active (unless bootmem itself is implemented
218142b45a7SBenjamin Herrenschmidt 	 * on top of MEMBLOCK which isn't the case yet)
219142b45a7SBenjamin Herrenschmidt 	 *
220142b45a7SBenjamin Herrenschmidt 	 * This should however not be an issue for now, as we currently only
221142b45a7SBenjamin Herrenschmidt 	 * call into MEMBLOCK while it's still active, or much later when slab is
222142b45a7SBenjamin Herrenschmidt 	 * active for memory hotplug operations
223142b45a7SBenjamin Herrenschmidt 	 */
224142b45a7SBenjamin Herrenschmidt 	if (use_slab) {
225142b45a7SBenjamin Herrenschmidt 		new_array = kmalloc(new_size, GFP_KERNEL);
2261f5026a7STejun Heo 		addr = new_array ? __pa(new_array) : 0;
227142b45a7SBenjamin Herrenschmidt 	} else
228fc769a8eSTejun Heo 		addr = memblock_find_in_range(0, MEMBLOCK_ALLOC_ACCESSIBLE, new_size, sizeof(phys_addr_t));
2291f5026a7STejun Heo 	if (!addr) {
230142b45a7SBenjamin Herrenschmidt 		pr_err("memblock: Failed to double %s array from %ld to %ld entries !\n",
231142b45a7SBenjamin Herrenschmidt 		       memblock_type_name(type), type->max, type->max * 2);
232142b45a7SBenjamin Herrenschmidt 		return -1;
233142b45a7SBenjamin Herrenschmidt 	}
234142b45a7SBenjamin Herrenschmidt 	new_array = __va(addr);
235142b45a7SBenjamin Herrenschmidt 
236ea9e4376SYinghai Lu 	memblock_dbg("memblock: %s array is doubled to %ld at [%#010llx-%#010llx]",
237ea9e4376SYinghai Lu 		 memblock_type_name(type), type->max * 2, (u64)addr, (u64)addr + new_size - 1);
238ea9e4376SYinghai Lu 
239142b45a7SBenjamin Herrenschmidt 	/* Found space, we now need to move the array over before
240142b45a7SBenjamin Herrenschmidt 	 * we add the reserved region since it may be our reserved
241142b45a7SBenjamin Herrenschmidt 	 * array itself that is full.
242142b45a7SBenjamin Herrenschmidt 	 */
243142b45a7SBenjamin Herrenschmidt 	memcpy(new_array, type->regions, old_size);
244142b45a7SBenjamin Herrenschmidt 	memset(new_array + type->max, 0, old_size);
245142b45a7SBenjamin Herrenschmidt 	old_array = type->regions;
246142b45a7SBenjamin Herrenschmidt 	type->regions = new_array;
247142b45a7SBenjamin Herrenschmidt 	type->max <<= 1;
248142b45a7SBenjamin Herrenschmidt 
249142b45a7SBenjamin Herrenschmidt 	/* If we use SLAB that's it, we are done */
250142b45a7SBenjamin Herrenschmidt 	if (use_slab)
251142b45a7SBenjamin Herrenschmidt 		return 0;
252142b45a7SBenjamin Herrenschmidt 
253142b45a7SBenjamin Herrenschmidt 	/* Add the new reserved region now. Should not fail ! */
2549c8c27e2STejun Heo 	BUG_ON(memblock_reserve(addr, new_size));
255142b45a7SBenjamin Herrenschmidt 
256142b45a7SBenjamin Herrenschmidt 	/* If the array wasn't our static init one, then free it. We only do
257142b45a7SBenjamin Herrenschmidt 	 * that before SLAB is available as later on, we don't know whether
258142b45a7SBenjamin Herrenschmidt 	 * to use kfree or free_bootmem_pages(). Shouldn't be a big deal
259142b45a7SBenjamin Herrenschmidt 	 * anyways
260142b45a7SBenjamin Herrenschmidt 	 */
261142b45a7SBenjamin Herrenschmidt 	if (old_array != memblock_memory_init_regions &&
262142b45a7SBenjamin Herrenschmidt 	    old_array != memblock_reserved_init_regions)
263142b45a7SBenjamin Herrenschmidt 		memblock_free(__pa(old_array), old_size);
264142b45a7SBenjamin Herrenschmidt 
265142b45a7SBenjamin Herrenschmidt 	return 0;
266142b45a7SBenjamin Herrenschmidt }
267142b45a7SBenjamin Herrenschmidt 
268784656f9STejun Heo /**
269784656f9STejun Heo  * memblock_merge_regions - merge neighboring compatible regions
270784656f9STejun Heo  * @type: memblock type to scan
271784656f9STejun Heo  *
272784656f9STejun Heo  * Scan @type and merge neighboring compatible regions.
273784656f9STejun Heo  */
274784656f9STejun Heo static void __init_memblock memblock_merge_regions(struct memblock_type *type)
275784656f9STejun Heo {
276784656f9STejun Heo 	int i = 0;
277784656f9STejun Heo 
278784656f9STejun Heo 	/* cnt never goes below 1 */
279784656f9STejun Heo 	while (i < type->cnt - 1) {
280784656f9STejun Heo 		struct memblock_region *this = &type->regions[i];
281784656f9STejun Heo 		struct memblock_region *next = &type->regions[i + 1];
282784656f9STejun Heo 
2837c0caeb8STejun Heo 		if (this->base + this->size != next->base ||
2847c0caeb8STejun Heo 		    memblock_get_region_node(this) !=
2857c0caeb8STejun Heo 		    memblock_get_region_node(next)) {
286784656f9STejun Heo 			BUG_ON(this->base + this->size > next->base);
287784656f9STejun Heo 			i++;
288784656f9STejun Heo 			continue;
289784656f9STejun Heo 		}
290784656f9STejun Heo 
291784656f9STejun Heo 		this->size += next->size;
292784656f9STejun Heo 		memmove(next, next + 1, (type->cnt - (i + 1)) * sizeof(*next));
293784656f9STejun Heo 		type->cnt--;
294784656f9STejun Heo 	}
295784656f9STejun Heo }
296784656f9STejun Heo 
297784656f9STejun Heo /**
298784656f9STejun Heo  * memblock_insert_region - insert new memblock region
299784656f9STejun Heo  * @type: memblock type to insert into
300784656f9STejun Heo  * @idx: index for the insertion point
301784656f9STejun Heo  * @base: base address of the new region
302784656f9STejun Heo  * @size: size of the new region
303784656f9STejun Heo  *
304784656f9STejun Heo  * Insert new memblock region [@base,@base+@size) into @type at @idx.
305784656f9STejun Heo  * @type must already have extra room to accomodate the new region.
306784656f9STejun Heo  */
307784656f9STejun Heo static void __init_memblock memblock_insert_region(struct memblock_type *type,
308784656f9STejun Heo 						   int idx, phys_addr_t base,
3097c0caeb8STejun Heo 						   phys_addr_t size, int nid)
310784656f9STejun Heo {
311784656f9STejun Heo 	struct memblock_region *rgn = &type->regions[idx];
312784656f9STejun Heo 
313784656f9STejun Heo 	BUG_ON(type->cnt >= type->max);
314784656f9STejun Heo 	memmove(rgn + 1, rgn, (type->cnt - idx) * sizeof(*rgn));
315784656f9STejun Heo 	rgn->base = base;
316784656f9STejun Heo 	rgn->size = size;
3177c0caeb8STejun Heo 	memblock_set_region_node(rgn, nid);
318784656f9STejun Heo 	type->cnt++;
3191440c4e2STejun Heo 	type->total_size += size;
320784656f9STejun Heo }
321784656f9STejun Heo 
322784656f9STejun Heo /**
323784656f9STejun Heo  * memblock_add_region - add new memblock region
324784656f9STejun Heo  * @type: memblock type to add new region into
325784656f9STejun Heo  * @base: base address of the new region
326784656f9STejun Heo  * @size: size of the new region
327*7fb0bc3fSTejun Heo  * @nid: nid of the new region
328784656f9STejun Heo  *
329784656f9STejun Heo  * Add new memblock region [@base,@base+@size) into @type.  The new region
330784656f9STejun Heo  * is allowed to overlap with existing ones - overlaps don't affect already
331784656f9STejun Heo  * existing regions.  @type is guaranteed to be minimal (all neighbouring
332784656f9STejun Heo  * compatible regions are merged) after the addition.
333784656f9STejun Heo  *
334784656f9STejun Heo  * RETURNS:
335784656f9STejun Heo  * 0 on success, -errno on failure.
336784656f9STejun Heo  */
337581adcbeSTejun Heo static int __init_memblock memblock_add_region(struct memblock_type *type,
338*7fb0bc3fSTejun Heo 				phys_addr_t base, phys_addr_t size, int nid)
33995f72d1eSYinghai Lu {
340784656f9STejun Heo 	bool insert = false;
341eb18f1b5STejun Heo 	phys_addr_t obase = base;
342eb18f1b5STejun Heo 	phys_addr_t end = base + memblock_cap_size(base, &size);
343784656f9STejun Heo 	int i, nr_new;
34495f72d1eSYinghai Lu 
345784656f9STejun Heo 	/* special case for empty array */
346784656f9STejun Heo 	if (type->regions[0].size == 0) {
3471440c4e2STejun Heo 		WARN_ON(type->cnt != 1 || type->total_size);
348784656f9STejun Heo 		type->regions[0].base = base;
349784656f9STejun Heo 		type->regions[0].size = size;
350*7fb0bc3fSTejun Heo 		memblock_set_region_node(&type->regions[0], nid);
3511440c4e2STejun Heo 		type->total_size = size;
352784656f9STejun Heo 		return 0;
353784656f9STejun Heo 	}
354784656f9STejun Heo repeat:
355784656f9STejun Heo 	/*
356784656f9STejun Heo 	 * The following is executed twice.  Once with %false @insert and
357784656f9STejun Heo 	 * then with %true.  The first counts the number of regions needed
358784656f9STejun Heo 	 * to accomodate the new area.  The second actually inserts them.
359784656f9STejun Heo 	 */
360784656f9STejun Heo 	base = obase;
361784656f9STejun Heo 	nr_new = 0;
362784656f9STejun Heo 
3638f7a6605SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
3648f7a6605SBenjamin Herrenschmidt 		struct memblock_region *rgn = &type->regions[i];
365784656f9STejun Heo 		phys_addr_t rbase = rgn->base;
366784656f9STejun Heo 		phys_addr_t rend = rbase + rgn->size;
3678f7a6605SBenjamin Herrenschmidt 
368784656f9STejun Heo 		if (rbase >= end)
3698f7a6605SBenjamin Herrenschmidt 			break;
370784656f9STejun Heo 		if (rend <= base)
371784656f9STejun Heo 			continue;
372784656f9STejun Heo 		/*
373784656f9STejun Heo 		 * @rgn overlaps.  If it separates the lower part of new
374784656f9STejun Heo 		 * area, insert that portion.
3758f7a6605SBenjamin Herrenschmidt 		 */
376784656f9STejun Heo 		if (rbase > base) {
377784656f9STejun Heo 			nr_new++;
378784656f9STejun Heo 			if (insert)
379784656f9STejun Heo 				memblock_insert_region(type, i++, base,
380*7fb0bc3fSTejun Heo 						       rbase - base, nid);
381784656f9STejun Heo 		}
382784656f9STejun Heo 		/* area below @rend is dealt with, forget about it */
383784656f9STejun Heo 		base = min(rend, end);
3848f7a6605SBenjamin Herrenschmidt 	}
3858f7a6605SBenjamin Herrenschmidt 
386784656f9STejun Heo 	/* insert the remaining portion */
387784656f9STejun Heo 	if (base < end) {
388784656f9STejun Heo 		nr_new++;
389784656f9STejun Heo 		if (insert)
390*7fb0bc3fSTejun Heo 			memblock_insert_region(type, i, base, end - base, nid);
3918f7a6605SBenjamin Herrenschmidt 	}
3928f7a6605SBenjamin Herrenschmidt 
393784656f9STejun Heo 	/*
394784656f9STejun Heo 	 * If this was the first round, resize array and repeat for actual
395784656f9STejun Heo 	 * insertions; otherwise, merge and return.
3968f7a6605SBenjamin Herrenschmidt 	 */
397784656f9STejun Heo 	if (!insert) {
398784656f9STejun Heo 		while (type->cnt + nr_new > type->max)
399784656f9STejun Heo 			if (memblock_double_array(type) < 0)
400784656f9STejun Heo 				return -ENOMEM;
401784656f9STejun Heo 		insert = true;
402784656f9STejun Heo 		goto repeat;
40395f72d1eSYinghai Lu 	} else {
404784656f9STejun Heo 		memblock_merge_regions(type);
40595f72d1eSYinghai Lu 		return 0;
40695f72d1eSYinghai Lu 	}
407784656f9STejun Heo }
40895f72d1eSYinghai Lu 
409*7fb0bc3fSTejun Heo int __init_memblock memblock_add_node(phys_addr_t base, phys_addr_t size,
410*7fb0bc3fSTejun Heo 				       int nid)
411*7fb0bc3fSTejun Heo {
412*7fb0bc3fSTejun Heo 	return memblock_add_region(&memblock.memory, base, size, nid);
413*7fb0bc3fSTejun Heo }
414*7fb0bc3fSTejun Heo 
415581adcbeSTejun Heo int __init_memblock memblock_add(phys_addr_t base, phys_addr_t size)
41695f72d1eSYinghai Lu {
417*7fb0bc3fSTejun Heo 	return memblock_add_region(&memblock.memory, base, size, MAX_NUMNODES);
41895f72d1eSYinghai Lu }
41995f72d1eSYinghai Lu 
4206a9ceb31STejun Heo /**
4216a9ceb31STejun Heo  * memblock_isolate_range - isolate given range into disjoint memblocks
4226a9ceb31STejun Heo  * @type: memblock type to isolate range for
4236a9ceb31STejun Heo  * @base: base of range to isolate
4246a9ceb31STejun Heo  * @size: size of range to isolate
4256a9ceb31STejun Heo  * @start_rgn: out parameter for the start of isolated region
4266a9ceb31STejun Heo  * @end_rgn: out parameter for the end of isolated region
4276a9ceb31STejun Heo  *
4286a9ceb31STejun Heo  * Walk @type and ensure that regions don't cross the boundaries defined by
4296a9ceb31STejun Heo  * [@base,@base+@size).  Crossing regions are split at the boundaries,
4306a9ceb31STejun Heo  * which may create at most two more regions.  The index of the first
4316a9ceb31STejun Heo  * region inside the range is returned in *@start_rgn and end in *@end_rgn.
4326a9ceb31STejun Heo  *
4336a9ceb31STejun Heo  * RETURNS:
4346a9ceb31STejun Heo  * 0 on success, -errno on failure.
4356a9ceb31STejun Heo  */
4366a9ceb31STejun Heo static int __init_memblock memblock_isolate_range(struct memblock_type *type,
4376a9ceb31STejun Heo 					phys_addr_t base, phys_addr_t size,
4386a9ceb31STejun Heo 					int *start_rgn, int *end_rgn)
4396a9ceb31STejun Heo {
440eb18f1b5STejun Heo 	phys_addr_t end = base + memblock_cap_size(base, &size);
4416a9ceb31STejun Heo 	int i;
4426a9ceb31STejun Heo 
4436a9ceb31STejun Heo 	*start_rgn = *end_rgn = 0;
4446a9ceb31STejun Heo 
4456a9ceb31STejun Heo 	/* we'll create at most two more regions */
4466a9ceb31STejun Heo 	while (type->cnt + 2 > type->max)
4476a9ceb31STejun Heo 		if (memblock_double_array(type) < 0)
4486a9ceb31STejun Heo 			return -ENOMEM;
4496a9ceb31STejun Heo 
4506a9ceb31STejun Heo 	for (i = 0; i < type->cnt; i++) {
4516a9ceb31STejun Heo 		struct memblock_region *rgn = &type->regions[i];
4526a9ceb31STejun Heo 		phys_addr_t rbase = rgn->base;
4536a9ceb31STejun Heo 		phys_addr_t rend = rbase + rgn->size;
4546a9ceb31STejun Heo 
4556a9ceb31STejun Heo 		if (rbase >= end)
4566a9ceb31STejun Heo 			break;
4576a9ceb31STejun Heo 		if (rend <= base)
4586a9ceb31STejun Heo 			continue;
4596a9ceb31STejun Heo 
4606a9ceb31STejun Heo 		if (rbase < base) {
4616a9ceb31STejun Heo 			/*
4626a9ceb31STejun Heo 			 * @rgn intersects from below.  Split and continue
4636a9ceb31STejun Heo 			 * to process the next region - the new top half.
4646a9ceb31STejun Heo 			 */
4656a9ceb31STejun Heo 			rgn->base = base;
4661440c4e2STejun Heo 			rgn->size -= base - rbase;
4671440c4e2STejun Heo 			type->total_size -= base - rbase;
4686a9ceb31STejun Heo 			memblock_insert_region(type, i, rbase, base - rbase,
46971936180STejun Heo 					       memblock_get_region_node(rgn));
4706a9ceb31STejun Heo 		} else if (rend > end) {
4716a9ceb31STejun Heo 			/*
4726a9ceb31STejun Heo 			 * @rgn intersects from above.  Split and redo the
4736a9ceb31STejun Heo 			 * current region - the new bottom half.
4746a9ceb31STejun Heo 			 */
4756a9ceb31STejun Heo 			rgn->base = end;
4761440c4e2STejun Heo 			rgn->size -= end - rbase;
4771440c4e2STejun Heo 			type->total_size -= end - rbase;
4786a9ceb31STejun Heo 			memblock_insert_region(type, i--, rbase, end - rbase,
47971936180STejun Heo 					       memblock_get_region_node(rgn));
4806a9ceb31STejun Heo 		} else {
4816a9ceb31STejun Heo 			/* @rgn is fully contained, record it */
4826a9ceb31STejun Heo 			if (!*end_rgn)
4836a9ceb31STejun Heo 				*start_rgn = i;
4846a9ceb31STejun Heo 			*end_rgn = i + 1;
4856a9ceb31STejun Heo 		}
4866a9ceb31STejun Heo 	}
4876a9ceb31STejun Heo 
4886a9ceb31STejun Heo 	return 0;
4896a9ceb31STejun Heo }
4906a9ceb31STejun Heo 
491581adcbeSTejun Heo static int __init_memblock __memblock_remove(struct memblock_type *type,
4928f7a6605SBenjamin Herrenschmidt 					     phys_addr_t base, phys_addr_t size)
49395f72d1eSYinghai Lu {
49471936180STejun Heo 	int start_rgn, end_rgn;
49571936180STejun Heo 	int i, ret;
49695f72d1eSYinghai Lu 
49771936180STejun Heo 	ret = memblock_isolate_range(type, base, size, &start_rgn, &end_rgn);
49871936180STejun Heo 	if (ret)
49971936180STejun Heo 		return ret;
50095f72d1eSYinghai Lu 
50171936180STejun Heo 	for (i = end_rgn - 1; i >= start_rgn; i--)
50271936180STejun Heo 		memblock_remove_region(type, i);
50395f72d1eSYinghai Lu 	return 0;
50495f72d1eSYinghai Lu }
50595f72d1eSYinghai Lu 
506581adcbeSTejun Heo int __init_memblock memblock_remove(phys_addr_t base, phys_addr_t size)
50795f72d1eSYinghai Lu {
50895f72d1eSYinghai Lu 	return __memblock_remove(&memblock.memory, base, size);
50995f72d1eSYinghai Lu }
51095f72d1eSYinghai Lu 
511581adcbeSTejun Heo int __init_memblock memblock_free(phys_addr_t base, phys_addr_t size)
51295f72d1eSYinghai Lu {
51324aa0788STejun Heo 	memblock_dbg("   memblock_free: [%#016llx-%#016llx] %pF\n",
514a150439cSH. Peter Anvin 		     (unsigned long long)base,
515a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
516a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
51724aa0788STejun Heo 
51895f72d1eSYinghai Lu 	return __memblock_remove(&memblock.reserved, base, size);
51995f72d1eSYinghai Lu }
52095f72d1eSYinghai Lu 
521581adcbeSTejun Heo int __init_memblock memblock_reserve(phys_addr_t base, phys_addr_t size)
52295f72d1eSYinghai Lu {
523e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *_rgn = &memblock.reserved;
52495f72d1eSYinghai Lu 
52524aa0788STejun Heo 	memblock_dbg("memblock_reserve: [%#016llx-%#016llx] %pF\n",
526a150439cSH. Peter Anvin 		     (unsigned long long)base,
527a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
528a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
52995f72d1eSYinghai Lu 	BUG_ON(0 == size);
53095f72d1eSYinghai Lu 
531*7fb0bc3fSTejun Heo 	return memblock_add_region(_rgn, base, size, MAX_NUMNODES);
53295f72d1eSYinghai Lu }
53395f72d1eSYinghai Lu 
53435fd0808STejun Heo /**
53535fd0808STejun Heo  * __next_free_mem_range - next function for for_each_free_mem_range()
53635fd0808STejun Heo  * @idx: pointer to u64 loop variable
53735fd0808STejun Heo  * @nid: nid: node selector, %MAX_NUMNODES for all nodes
53835fd0808STejun Heo  * @p_start: ptr to phys_addr_t for start address of the range, can be %NULL
53935fd0808STejun Heo  * @p_end: ptr to phys_addr_t for end address of the range, can be %NULL
54035fd0808STejun Heo  * @p_nid: ptr to int for nid of the range, can be %NULL
54135fd0808STejun Heo  *
54235fd0808STejun Heo  * Find the first free area from *@idx which matches @nid, fill the out
54335fd0808STejun Heo  * parameters, and update *@idx for the next iteration.  The lower 32bit of
54435fd0808STejun Heo  * *@idx contains index into memory region and the upper 32bit indexes the
54535fd0808STejun Heo  * areas before each reserved region.  For example, if reserved regions
54635fd0808STejun Heo  * look like the following,
54735fd0808STejun Heo  *
54835fd0808STejun Heo  *	0:[0-16), 1:[32-48), 2:[128-130)
54935fd0808STejun Heo  *
55035fd0808STejun Heo  * The upper 32bit indexes the following regions.
55135fd0808STejun Heo  *
55235fd0808STejun Heo  *	0:[0-0), 1:[16-32), 2:[48-128), 3:[130-MAX)
55335fd0808STejun Heo  *
55435fd0808STejun Heo  * As both region arrays are sorted, the function advances the two indices
55535fd0808STejun Heo  * in lockstep and returns each intersection.
55635fd0808STejun Heo  */
55735fd0808STejun Heo void __init_memblock __next_free_mem_range(u64 *idx, int nid,
55835fd0808STejun Heo 					   phys_addr_t *out_start,
55935fd0808STejun Heo 					   phys_addr_t *out_end, int *out_nid)
56035fd0808STejun Heo {
56135fd0808STejun Heo 	struct memblock_type *mem = &memblock.memory;
56235fd0808STejun Heo 	struct memblock_type *rsv = &memblock.reserved;
56335fd0808STejun Heo 	int mi = *idx & 0xffffffff;
56435fd0808STejun Heo 	int ri = *idx >> 32;
56535fd0808STejun Heo 
56635fd0808STejun Heo 	for ( ; mi < mem->cnt; mi++) {
56735fd0808STejun Heo 		struct memblock_region *m = &mem->regions[mi];
56835fd0808STejun Heo 		phys_addr_t m_start = m->base;
56935fd0808STejun Heo 		phys_addr_t m_end = m->base + m->size;
57035fd0808STejun Heo 
57135fd0808STejun Heo 		/* only memory regions are associated with nodes, check it */
57235fd0808STejun Heo 		if (nid != MAX_NUMNODES && nid != memblock_get_region_node(m))
57335fd0808STejun Heo 			continue;
57435fd0808STejun Heo 
57535fd0808STejun Heo 		/* scan areas before each reservation for intersection */
57635fd0808STejun Heo 		for ( ; ri < rsv->cnt + 1; ri++) {
57735fd0808STejun Heo 			struct memblock_region *r = &rsv->regions[ri];
57835fd0808STejun Heo 			phys_addr_t r_start = ri ? r[-1].base + r[-1].size : 0;
57935fd0808STejun Heo 			phys_addr_t r_end = ri < rsv->cnt ? r->base : ULLONG_MAX;
58035fd0808STejun Heo 
58135fd0808STejun Heo 			/* if ri advanced past mi, break out to advance mi */
58235fd0808STejun Heo 			if (r_start >= m_end)
58335fd0808STejun Heo 				break;
58435fd0808STejun Heo 			/* if the two regions intersect, we're done */
58535fd0808STejun Heo 			if (m_start < r_end) {
58635fd0808STejun Heo 				if (out_start)
58735fd0808STejun Heo 					*out_start = max(m_start, r_start);
58835fd0808STejun Heo 				if (out_end)
58935fd0808STejun Heo 					*out_end = min(m_end, r_end);
59035fd0808STejun Heo 				if (out_nid)
59135fd0808STejun Heo 					*out_nid = memblock_get_region_node(m);
59235fd0808STejun Heo 				/*
59335fd0808STejun Heo 				 * The region which ends first is advanced
59435fd0808STejun Heo 				 * for the next iteration.
59535fd0808STejun Heo 				 */
59635fd0808STejun Heo 				if (m_end <= r_end)
59735fd0808STejun Heo 					mi++;
59835fd0808STejun Heo 				else
59935fd0808STejun Heo 					ri++;
60035fd0808STejun Heo 				*idx = (u32)mi | (u64)ri << 32;
60135fd0808STejun Heo 				return;
60235fd0808STejun Heo 			}
60335fd0808STejun Heo 		}
60435fd0808STejun Heo 	}
60535fd0808STejun Heo 
60635fd0808STejun Heo 	/* signal end of iteration */
60735fd0808STejun Heo 	*idx = ULLONG_MAX;
60835fd0808STejun Heo }
60935fd0808STejun Heo 
6107c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
6117c0caeb8STejun Heo /*
6127c0caeb8STejun Heo  * Common iterator interface used to define for_each_mem_range().
6137c0caeb8STejun Heo  */
6147c0caeb8STejun Heo void __init_memblock __next_mem_pfn_range(int *idx, int nid,
6157c0caeb8STejun Heo 				unsigned long *out_start_pfn,
6167c0caeb8STejun Heo 				unsigned long *out_end_pfn, int *out_nid)
6177c0caeb8STejun Heo {
6187c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
6197c0caeb8STejun Heo 	struct memblock_region *r;
6207c0caeb8STejun Heo 
6217c0caeb8STejun Heo 	while (++*idx < type->cnt) {
6227c0caeb8STejun Heo 		r = &type->regions[*idx];
6237c0caeb8STejun Heo 
6247c0caeb8STejun Heo 		if (PFN_UP(r->base) >= PFN_DOWN(r->base + r->size))
6257c0caeb8STejun Heo 			continue;
6267c0caeb8STejun Heo 		if (nid == MAX_NUMNODES || nid == r->nid)
6277c0caeb8STejun Heo 			break;
6287c0caeb8STejun Heo 	}
6297c0caeb8STejun Heo 	if (*idx >= type->cnt) {
6307c0caeb8STejun Heo 		*idx = -1;
6317c0caeb8STejun Heo 		return;
6327c0caeb8STejun Heo 	}
6337c0caeb8STejun Heo 
6347c0caeb8STejun Heo 	if (out_start_pfn)
6357c0caeb8STejun Heo 		*out_start_pfn = PFN_UP(r->base);
6367c0caeb8STejun Heo 	if (out_end_pfn)
6377c0caeb8STejun Heo 		*out_end_pfn = PFN_DOWN(r->base + r->size);
6387c0caeb8STejun Heo 	if (out_nid)
6397c0caeb8STejun Heo 		*out_nid = r->nid;
6407c0caeb8STejun Heo }
6417c0caeb8STejun Heo 
6427c0caeb8STejun Heo /**
6437c0caeb8STejun Heo  * memblock_set_node - set node ID on memblock regions
6447c0caeb8STejun Heo  * @base: base of area to set node ID for
6457c0caeb8STejun Heo  * @size: size of area to set node ID for
6467c0caeb8STejun Heo  * @nid: node ID to set
6477c0caeb8STejun Heo  *
6487c0caeb8STejun Heo  * Set the nid of memblock memory regions in [@base,@base+@size) to @nid.
6497c0caeb8STejun Heo  * Regions which cross the area boundaries are split as necessary.
6507c0caeb8STejun Heo  *
6517c0caeb8STejun Heo  * RETURNS:
6527c0caeb8STejun Heo  * 0 on success, -errno on failure.
6537c0caeb8STejun Heo  */
6547c0caeb8STejun Heo int __init_memblock memblock_set_node(phys_addr_t base, phys_addr_t size,
6557c0caeb8STejun Heo 				      int nid)
6567c0caeb8STejun Heo {
6577c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
6586a9ceb31STejun Heo 	int start_rgn, end_rgn;
6596a9ceb31STejun Heo 	int i, ret;
6607c0caeb8STejun Heo 
6616a9ceb31STejun Heo 	ret = memblock_isolate_range(type, base, size, &start_rgn, &end_rgn);
6626a9ceb31STejun Heo 	if (ret)
6636a9ceb31STejun Heo 		return ret;
6647c0caeb8STejun Heo 
6656a9ceb31STejun Heo 	for (i = start_rgn; i < end_rgn; i++)
6666a9ceb31STejun Heo 		type->regions[i].nid = nid;
6677c0caeb8STejun Heo 
6687c0caeb8STejun Heo 	memblock_merge_regions(type);
6697c0caeb8STejun Heo 	return 0;
6707c0caeb8STejun Heo }
6717c0caeb8STejun Heo #endif /* CONFIG_HAVE_MEMBLOCK_NODE_MAP */
6727c0caeb8STejun Heo 
6736ed311b2SBenjamin Herrenschmidt phys_addr_t __init __memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
67495f72d1eSYinghai Lu {
6756ed311b2SBenjamin Herrenschmidt 	phys_addr_t found;
67695f72d1eSYinghai Lu 
6776ed311b2SBenjamin Herrenschmidt 	/* We align the size to limit fragmentation. Without this, a lot of
6786ed311b2SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
6796ed311b2SBenjamin Herrenschmidt 	 */
680348968ebSTejun Heo 	size = round_up(size, align);
6816ed311b2SBenjamin Herrenschmidt 
682fc769a8eSTejun Heo 	found = memblock_find_in_range(0, max_addr, size, align);
6839c8c27e2STejun Heo 	if (found && !memblock_reserve(found, size))
6846ed311b2SBenjamin Herrenschmidt 		return found;
6856ed311b2SBenjamin Herrenschmidt 
6866ed311b2SBenjamin Herrenschmidt 	return 0;
68795f72d1eSYinghai Lu }
68895f72d1eSYinghai Lu 
6896ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
69095f72d1eSYinghai Lu {
6916ed311b2SBenjamin Herrenschmidt 	phys_addr_t alloc;
6926ed311b2SBenjamin Herrenschmidt 
6936ed311b2SBenjamin Herrenschmidt 	alloc = __memblock_alloc_base(size, align, max_addr);
6946ed311b2SBenjamin Herrenschmidt 
6956ed311b2SBenjamin Herrenschmidt 	if (alloc == 0)
6966ed311b2SBenjamin Herrenschmidt 		panic("ERROR: Failed to allocate 0x%llx bytes below 0x%llx.\n",
6976ed311b2SBenjamin Herrenschmidt 		      (unsigned long long) size, (unsigned long long) max_addr);
6986ed311b2SBenjamin Herrenschmidt 
6996ed311b2SBenjamin Herrenschmidt 	return alloc;
70095f72d1eSYinghai Lu }
70195f72d1eSYinghai Lu 
7026ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc(phys_addr_t size, phys_addr_t align)
70395f72d1eSYinghai Lu {
7046ed311b2SBenjamin Herrenschmidt 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
70595f72d1eSYinghai Lu }
70695f72d1eSYinghai Lu 
70795f72d1eSYinghai Lu 
7086ed311b2SBenjamin Herrenschmidt /*
70934e18455STejun Heo  * Additional node-local top-down allocators.
710c196f76fSBenjamin Herrenschmidt  *
711c196f76fSBenjamin Herrenschmidt  * WARNING: Only available after early_node_map[] has been populated,
712c196f76fSBenjamin Herrenschmidt  * on some architectures, that is after all the calls to add_active_range()
713c196f76fSBenjamin Herrenschmidt  * have been done to populate it.
7146ed311b2SBenjamin Herrenschmidt  */
71595f72d1eSYinghai Lu 
71634e18455STejun Heo static phys_addr_t __init memblock_nid_range_rev(phys_addr_t start,
71734e18455STejun Heo 						 phys_addr_t end, int *nid)
718c3f72b57SBenjamin Herrenschmidt {
719c196f76fSBenjamin Herrenschmidt #ifdef CONFIG_ARCH_POPULATES_NODE_MAP
720c196f76fSBenjamin Herrenschmidt 	unsigned long start_pfn, end_pfn;
721c196f76fSBenjamin Herrenschmidt 	int i;
722c196f76fSBenjamin Herrenschmidt 
723b2fea988STejun Heo 	for_each_mem_pfn_range(i, MAX_NUMNODES, &start_pfn, &end_pfn, nid)
72434e18455STejun Heo 		if (end > PFN_PHYS(start_pfn) && end <= PFN_PHYS(end_pfn))
72534e18455STejun Heo 			return max(start, PFN_PHYS(start_pfn));
726c196f76fSBenjamin Herrenschmidt #endif
727c3f72b57SBenjamin Herrenschmidt 	*nid = 0;
72834e18455STejun Heo 	return start;
729c3f72b57SBenjamin Herrenschmidt }
730c3f72b57SBenjamin Herrenschmidt 
731e6498040STejun Heo phys_addr_t __init memblock_find_in_range_node(phys_addr_t start,
732e6498040STejun Heo 					       phys_addr_t end,
7332898cc4cSBenjamin Herrenschmidt 					       phys_addr_t size,
7342898cc4cSBenjamin Herrenschmidt 					       phys_addr_t align, int nid)
73595f72d1eSYinghai Lu {
736e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *mem = &memblock.memory;
73795f72d1eSYinghai Lu 	int i;
73895f72d1eSYinghai Lu 
73995f72d1eSYinghai Lu 	BUG_ON(0 == size);
74095f72d1eSYinghai Lu 
741e6498040STejun Heo 	/* Pump up max_addr */
742e6498040STejun Heo 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
743e6498040STejun Heo 		end = memblock.current_limit;
744e6498040STejun Heo 
745e6498040STejun Heo 	for (i = mem->cnt - 1; i >= 0; i--) {
746e6498040STejun Heo 		struct memblock_region *r = &mem->regions[i];
747e6498040STejun Heo 		phys_addr_t base = max(start, r->base);
748e6498040STejun Heo 		phys_addr_t top = min(end, r->base + r->size);
749e6498040STejun Heo 
750e6498040STejun Heo 		while (base < top) {
751e6498040STejun Heo 			phys_addr_t tbase, ret;
752e6498040STejun Heo 			int tnid;
753e6498040STejun Heo 
754e6498040STejun Heo 			tbase = memblock_nid_range_rev(base, top, &tnid);
755e6498040STejun Heo 			if (nid == MAX_NUMNODES || tnid == nid) {
756e6498040STejun Heo 				ret = memblock_find_region(tbase, top, size, align);
757e6498040STejun Heo 				if (ret)
758e6498040STejun Heo 					return ret;
759e6498040STejun Heo 			}
760e6498040STejun Heo 			top = tbase;
761e6498040STejun Heo 		}
762e6498040STejun Heo 	}
763e6498040STejun Heo 
764e6498040STejun Heo 	return 0;
765e6498040STejun Heo }
766e6498040STejun Heo 
767e6498040STejun Heo phys_addr_t __init memblock_alloc_nid(phys_addr_t size, phys_addr_t align, int nid)
768e6498040STejun Heo {
769e6498040STejun Heo 	phys_addr_t found;
770e6498040STejun Heo 
771e6498040STejun Heo 	/*
772e6498040STejun Heo 	 * We align the size to limit fragmentation. Without this, a lot of
7737f219c73SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
7747f219c73SBenjamin Herrenschmidt 	 */
775348968ebSTejun Heo 	size = round_up(size, align);
7767f219c73SBenjamin Herrenschmidt 
777e6498040STejun Heo 	found = memblock_find_in_range_node(0, MEMBLOCK_ALLOC_ACCESSIBLE,
77895f72d1eSYinghai Lu 					    size, align, nid);
7799c8c27e2STejun Heo 	if (found && !memblock_reserve(found, size))
780e6498040STejun Heo 		return found;
78195f72d1eSYinghai Lu 
7829d1e2492SBenjamin Herrenschmidt 	return 0;
7839d1e2492SBenjamin Herrenschmidt }
7849d1e2492SBenjamin Herrenschmidt 
7859d1e2492SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_try_nid(phys_addr_t size, phys_addr_t align, int nid)
7869d1e2492SBenjamin Herrenschmidt {
7879d1e2492SBenjamin Herrenschmidt 	phys_addr_t res = memblock_alloc_nid(size, align, nid);
7889d1e2492SBenjamin Herrenschmidt 
7899d1e2492SBenjamin Herrenschmidt 	if (res)
7909d1e2492SBenjamin Herrenschmidt 		return res;
79115fb0972STejun Heo 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
79295f72d1eSYinghai Lu }
79395f72d1eSYinghai Lu 
7949d1e2492SBenjamin Herrenschmidt 
7959d1e2492SBenjamin Herrenschmidt /*
7969d1e2492SBenjamin Herrenschmidt  * Remaining API functions
7979d1e2492SBenjamin Herrenschmidt  */
7989d1e2492SBenjamin Herrenschmidt 
7992898cc4cSBenjamin Herrenschmidt phys_addr_t __init memblock_phys_mem_size(void)
80095f72d1eSYinghai Lu {
8011440c4e2STejun Heo 	return memblock.memory.total_size;
80295f72d1eSYinghai Lu }
80395f72d1eSYinghai Lu 
8040a93ebefSSam Ravnborg /* lowest address */
8050a93ebefSSam Ravnborg phys_addr_t __init_memblock memblock_start_of_DRAM(void)
8060a93ebefSSam Ravnborg {
8070a93ebefSSam Ravnborg 	return memblock.memory.regions[0].base;
8080a93ebefSSam Ravnborg }
8090a93ebefSSam Ravnborg 
81010d06439SYinghai Lu phys_addr_t __init_memblock memblock_end_of_DRAM(void)
81195f72d1eSYinghai Lu {
81295f72d1eSYinghai Lu 	int idx = memblock.memory.cnt - 1;
81395f72d1eSYinghai Lu 
814e3239ff9SBenjamin Herrenschmidt 	return (memblock.memory.regions[idx].base + memblock.memory.regions[idx].size);
81595f72d1eSYinghai Lu }
81695f72d1eSYinghai Lu 
817c0ce8fefSTejun Heo void __init memblock_enforce_memory_limit(phys_addr_t limit)
81895f72d1eSYinghai Lu {
81995f72d1eSYinghai Lu 	unsigned long i;
820c0ce8fefSTejun Heo 	phys_addr_t max_addr = (phys_addr_t)ULLONG_MAX;
82195f72d1eSYinghai Lu 
822c0ce8fefSTejun Heo 	if (!limit)
82395f72d1eSYinghai Lu 		return;
82495f72d1eSYinghai Lu 
825c0ce8fefSTejun Heo 	/* find out max address */
82695f72d1eSYinghai Lu 	for (i = 0; i < memblock.memory.cnt; i++) {
827c0ce8fefSTejun Heo 		struct memblock_region *r = &memblock.memory.regions[i];
82895f72d1eSYinghai Lu 
829c0ce8fefSTejun Heo 		if (limit <= r->size) {
830c0ce8fefSTejun Heo 			max_addr = r->base + limit;
83195f72d1eSYinghai Lu 			break;
83295f72d1eSYinghai Lu 		}
833c0ce8fefSTejun Heo 		limit -= r->size;
83495f72d1eSYinghai Lu 	}
835c0ce8fefSTejun Heo 
836c0ce8fefSTejun Heo 	/* truncate both memory and reserved regions */
837c0ce8fefSTejun Heo 	__memblock_remove(&memblock.memory, max_addr, (phys_addr_t)ULLONG_MAX);
838c0ce8fefSTejun Heo 	__memblock_remove(&memblock.reserved, max_addr, (phys_addr_t)ULLONG_MAX);
83995f72d1eSYinghai Lu }
84095f72d1eSYinghai Lu 
841cd79481dSYinghai Lu static int __init_memblock memblock_search(struct memblock_type *type, phys_addr_t addr)
84272d4b0b4SBenjamin Herrenschmidt {
84372d4b0b4SBenjamin Herrenschmidt 	unsigned int left = 0, right = type->cnt;
84472d4b0b4SBenjamin Herrenschmidt 
84572d4b0b4SBenjamin Herrenschmidt 	do {
84672d4b0b4SBenjamin Herrenschmidt 		unsigned int mid = (right + left) / 2;
84772d4b0b4SBenjamin Herrenschmidt 
84872d4b0b4SBenjamin Herrenschmidt 		if (addr < type->regions[mid].base)
84972d4b0b4SBenjamin Herrenschmidt 			right = mid;
85072d4b0b4SBenjamin Herrenschmidt 		else if (addr >= (type->regions[mid].base +
85172d4b0b4SBenjamin Herrenschmidt 				  type->regions[mid].size))
85272d4b0b4SBenjamin Herrenschmidt 			left = mid + 1;
85372d4b0b4SBenjamin Herrenschmidt 		else
85472d4b0b4SBenjamin Herrenschmidt 			return mid;
85572d4b0b4SBenjamin Herrenschmidt 	} while (left < right);
85672d4b0b4SBenjamin Herrenschmidt 	return -1;
85772d4b0b4SBenjamin Herrenschmidt }
85872d4b0b4SBenjamin Herrenschmidt 
8592898cc4cSBenjamin Herrenschmidt int __init memblock_is_reserved(phys_addr_t addr)
86095f72d1eSYinghai Lu {
86172d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.reserved, addr) != -1;
86295f72d1eSYinghai Lu }
86372d4b0b4SBenjamin Herrenschmidt 
8643661ca66SYinghai Lu int __init_memblock memblock_is_memory(phys_addr_t addr)
86572d4b0b4SBenjamin Herrenschmidt {
86672d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.memory, addr) != -1;
86772d4b0b4SBenjamin Herrenschmidt }
86872d4b0b4SBenjamin Herrenschmidt 
8693661ca66SYinghai Lu int __init_memblock memblock_is_region_memory(phys_addr_t base, phys_addr_t size)
87072d4b0b4SBenjamin Herrenschmidt {
871abb65272STomi Valkeinen 	int idx = memblock_search(&memblock.memory, base);
872eb18f1b5STejun Heo 	phys_addr_t end = base + memblock_cap_size(base, &size);
87372d4b0b4SBenjamin Herrenschmidt 
87472d4b0b4SBenjamin Herrenschmidt 	if (idx == -1)
87595f72d1eSYinghai Lu 		return 0;
876abb65272STomi Valkeinen 	return memblock.memory.regions[idx].base <= base &&
877abb65272STomi Valkeinen 		(memblock.memory.regions[idx].base +
878eb18f1b5STejun Heo 		 memblock.memory.regions[idx].size) >= end;
87995f72d1eSYinghai Lu }
88095f72d1eSYinghai Lu 
88110d06439SYinghai Lu int __init_memblock memblock_is_region_reserved(phys_addr_t base, phys_addr_t size)
88295f72d1eSYinghai Lu {
883eb18f1b5STejun Heo 	memblock_cap_size(base, &size);
884f1c2c19cSBenjamin Herrenschmidt 	return memblock_overlaps_region(&memblock.reserved, base, size) >= 0;
88595f72d1eSYinghai Lu }
88695f72d1eSYinghai Lu 
887e63075a3SBenjamin Herrenschmidt 
8883661ca66SYinghai Lu void __init_memblock memblock_set_current_limit(phys_addr_t limit)
889e63075a3SBenjamin Herrenschmidt {
890e63075a3SBenjamin Herrenschmidt 	memblock.current_limit = limit;
891e63075a3SBenjamin Herrenschmidt }
892e63075a3SBenjamin Herrenschmidt 
8937c0caeb8STejun Heo static void __init_memblock memblock_dump(struct memblock_type *type, char *name)
8946ed311b2SBenjamin Herrenschmidt {
8956ed311b2SBenjamin Herrenschmidt 	unsigned long long base, size;
8966ed311b2SBenjamin Herrenschmidt 	int i;
8976ed311b2SBenjamin Herrenschmidt 
8987c0caeb8STejun Heo 	pr_info(" %s.cnt  = 0x%lx\n", name, type->cnt);
8996ed311b2SBenjamin Herrenschmidt 
9007c0caeb8STejun Heo 	for (i = 0; i < type->cnt; i++) {
9017c0caeb8STejun Heo 		struct memblock_region *rgn = &type->regions[i];
9027c0caeb8STejun Heo 		char nid_buf[32] = "";
9036ed311b2SBenjamin Herrenschmidt 
9047c0caeb8STejun Heo 		base = rgn->base;
9057c0caeb8STejun Heo 		size = rgn->size;
9067c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
9077c0caeb8STejun Heo 		if (memblock_get_region_node(rgn) != MAX_NUMNODES)
9087c0caeb8STejun Heo 			snprintf(nid_buf, sizeof(nid_buf), " on node %d",
9097c0caeb8STejun Heo 				 memblock_get_region_node(rgn));
9107c0caeb8STejun Heo #endif
9117c0caeb8STejun Heo 		pr_info(" %s[%#x]\t[%#016llx-%#016llx], %#llx bytes%s\n",
9127c0caeb8STejun Heo 			name, i, base, base + size - 1, size, nid_buf);
9136ed311b2SBenjamin Herrenschmidt 	}
9146ed311b2SBenjamin Herrenschmidt }
9156ed311b2SBenjamin Herrenschmidt 
9164ff7b82fSTejun Heo void __init_memblock __memblock_dump_all(void)
9176ed311b2SBenjamin Herrenschmidt {
9186ed311b2SBenjamin Herrenschmidt 	pr_info("MEMBLOCK configuration:\n");
9191440c4e2STejun Heo 	pr_info(" memory size = %#llx reserved size = %#llx\n",
9201440c4e2STejun Heo 		(unsigned long long)memblock.memory.total_size,
9211440c4e2STejun Heo 		(unsigned long long)memblock.reserved.total_size);
9226ed311b2SBenjamin Herrenschmidt 
9236ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.memory, "memory");
9246ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.reserved, "reserved");
9256ed311b2SBenjamin Herrenschmidt }
9266ed311b2SBenjamin Herrenschmidt 
9271aadc056STejun Heo void __init memblock_allow_resize(void)
9286ed311b2SBenjamin Herrenschmidt {
929142b45a7SBenjamin Herrenschmidt 	memblock_can_resize = 1;
9306ed311b2SBenjamin Herrenschmidt }
9316ed311b2SBenjamin Herrenschmidt 
9326ed311b2SBenjamin Herrenschmidt static int __init early_memblock(char *p)
9336ed311b2SBenjamin Herrenschmidt {
9346ed311b2SBenjamin Herrenschmidt 	if (p && strstr(p, "debug"))
9356ed311b2SBenjamin Herrenschmidt 		memblock_debug = 1;
9366ed311b2SBenjamin Herrenschmidt 	return 0;
9376ed311b2SBenjamin Herrenschmidt }
9386ed311b2SBenjamin Herrenschmidt early_param("memblock", early_memblock);
9396ed311b2SBenjamin Herrenschmidt 
940c378ddd5STejun Heo #if defined(CONFIG_DEBUG_FS) && !defined(CONFIG_ARCH_DISCARD_MEMBLOCK)
9416d03b885SBenjamin Herrenschmidt 
9426d03b885SBenjamin Herrenschmidt static int memblock_debug_show(struct seq_file *m, void *private)
9436d03b885SBenjamin Herrenschmidt {
9446d03b885SBenjamin Herrenschmidt 	struct memblock_type *type = m->private;
9456d03b885SBenjamin Herrenschmidt 	struct memblock_region *reg;
9466d03b885SBenjamin Herrenschmidt 	int i;
9476d03b885SBenjamin Herrenschmidt 
9486d03b885SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
9496d03b885SBenjamin Herrenschmidt 		reg = &type->regions[i];
9506d03b885SBenjamin Herrenschmidt 		seq_printf(m, "%4d: ", i);
9516d03b885SBenjamin Herrenschmidt 		if (sizeof(phys_addr_t) == 4)
9526d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%08lx..0x%08lx\n",
9536d03b885SBenjamin Herrenschmidt 				   (unsigned long)reg->base,
9546d03b885SBenjamin Herrenschmidt 				   (unsigned long)(reg->base + reg->size - 1));
9556d03b885SBenjamin Herrenschmidt 		else
9566d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%016llx..0x%016llx\n",
9576d03b885SBenjamin Herrenschmidt 				   (unsigned long long)reg->base,
9586d03b885SBenjamin Herrenschmidt 				   (unsigned long long)(reg->base + reg->size - 1));
9596d03b885SBenjamin Herrenschmidt 
9606d03b885SBenjamin Herrenschmidt 	}
9616d03b885SBenjamin Herrenschmidt 	return 0;
9626d03b885SBenjamin Herrenschmidt }
9636d03b885SBenjamin Herrenschmidt 
9646d03b885SBenjamin Herrenschmidt static int memblock_debug_open(struct inode *inode, struct file *file)
9656d03b885SBenjamin Herrenschmidt {
9666d03b885SBenjamin Herrenschmidt 	return single_open(file, memblock_debug_show, inode->i_private);
9676d03b885SBenjamin Herrenschmidt }
9686d03b885SBenjamin Herrenschmidt 
9696d03b885SBenjamin Herrenschmidt static const struct file_operations memblock_debug_fops = {
9706d03b885SBenjamin Herrenschmidt 	.open = memblock_debug_open,
9716d03b885SBenjamin Herrenschmidt 	.read = seq_read,
9726d03b885SBenjamin Herrenschmidt 	.llseek = seq_lseek,
9736d03b885SBenjamin Herrenschmidt 	.release = single_release,
9746d03b885SBenjamin Herrenschmidt };
9756d03b885SBenjamin Herrenschmidt 
9766d03b885SBenjamin Herrenschmidt static int __init memblock_init_debugfs(void)
9776d03b885SBenjamin Herrenschmidt {
9786d03b885SBenjamin Herrenschmidt 	struct dentry *root = debugfs_create_dir("memblock", NULL);
9796d03b885SBenjamin Herrenschmidt 	if (!root)
9806d03b885SBenjamin Herrenschmidt 		return -ENXIO;
9816d03b885SBenjamin Herrenschmidt 	debugfs_create_file("memory", S_IRUGO, root, &memblock.memory, &memblock_debug_fops);
9826d03b885SBenjamin Herrenschmidt 	debugfs_create_file("reserved", S_IRUGO, root, &memblock.reserved, &memblock_debug_fops);
9836d03b885SBenjamin Herrenschmidt 
9846d03b885SBenjamin Herrenschmidt 	return 0;
9856d03b885SBenjamin Herrenschmidt }
9866d03b885SBenjamin Herrenschmidt __initcall(memblock_init_debugfs);
9876d03b885SBenjamin Herrenschmidt 
9886d03b885SBenjamin Herrenschmidt #endif /* CONFIG_DEBUG_FS */
989