xref: /linux/mm/memblock.c (revision c0ce8fef55896a2813a3d94e1b2d0e6d7fab6228)
195f72d1eSYinghai Lu /*
295f72d1eSYinghai Lu  * Procedures for maintaining information about logical memory blocks.
395f72d1eSYinghai Lu  *
495f72d1eSYinghai Lu  * Peter Bergner, IBM Corp.	June 2001.
595f72d1eSYinghai Lu  * Copyright (C) 2001 Peter Bergner.
695f72d1eSYinghai Lu  *
795f72d1eSYinghai Lu  *      This program is free software; you can redistribute it and/or
895f72d1eSYinghai Lu  *      modify it under the terms of the GNU General Public License
995f72d1eSYinghai Lu  *      as published by the Free Software Foundation; either version
1095f72d1eSYinghai Lu  *      2 of the License, or (at your option) any later version.
1195f72d1eSYinghai Lu  */
1295f72d1eSYinghai Lu 
1395f72d1eSYinghai Lu #include <linux/kernel.h>
14142b45a7SBenjamin Herrenschmidt #include <linux/slab.h>
1595f72d1eSYinghai Lu #include <linux/init.h>
1695f72d1eSYinghai Lu #include <linux/bitops.h>
17449e8df3SBenjamin Herrenschmidt #include <linux/poison.h>
18c196f76fSBenjamin Herrenschmidt #include <linux/pfn.h>
196d03b885SBenjamin Herrenschmidt #include <linux/debugfs.h>
206d03b885SBenjamin Herrenschmidt #include <linux/seq_file.h>
2195f72d1eSYinghai Lu #include <linux/memblock.h>
2295f72d1eSYinghai Lu 
23fe091c20STejun Heo static struct memblock_region memblock_memory_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock;
24fe091c20STejun Heo static struct memblock_region memblock_reserved_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock;
25fe091c20STejun Heo 
26fe091c20STejun Heo struct memblock memblock __initdata_memblock = {
27fe091c20STejun Heo 	.memory.regions		= memblock_memory_init_regions,
28fe091c20STejun Heo 	.memory.cnt		= 1,	/* empty dummy entry */
29fe091c20STejun Heo 	.memory.max		= INIT_MEMBLOCK_REGIONS,
30fe091c20STejun Heo 
31fe091c20STejun Heo 	.reserved.regions	= memblock_reserved_init_regions,
32fe091c20STejun Heo 	.reserved.cnt		= 1,	/* empty dummy entry */
33fe091c20STejun Heo 	.reserved.max		= INIT_MEMBLOCK_REGIONS,
34fe091c20STejun Heo 
35fe091c20STejun Heo 	.current_limit		= MEMBLOCK_ALLOC_ANYWHERE,
36fe091c20STejun Heo };
3795f72d1eSYinghai Lu 
3810d06439SYinghai Lu int memblock_debug __initdata_memblock;
3910d06439SYinghai Lu int memblock_can_resize __initdata_memblock;
4095f72d1eSYinghai Lu 
41142b45a7SBenjamin Herrenschmidt /* inline so we don't get a warning when pr_debug is compiled out */
42142b45a7SBenjamin Herrenschmidt static inline const char *memblock_type_name(struct memblock_type *type)
43142b45a7SBenjamin Herrenschmidt {
44142b45a7SBenjamin Herrenschmidt 	if (type == &memblock.memory)
45142b45a7SBenjamin Herrenschmidt 		return "memory";
46142b45a7SBenjamin Herrenschmidt 	else if (type == &memblock.reserved)
47142b45a7SBenjamin Herrenschmidt 		return "reserved";
48142b45a7SBenjamin Herrenschmidt 	else
49142b45a7SBenjamin Herrenschmidt 		return "unknown";
50142b45a7SBenjamin Herrenschmidt }
51142b45a7SBenjamin Herrenschmidt 
52eb18f1b5STejun Heo /* adjust *@size so that (@base + *@size) doesn't overflow, return new size */
53eb18f1b5STejun Heo static inline phys_addr_t memblock_cap_size(phys_addr_t base, phys_addr_t *size)
54eb18f1b5STejun Heo {
55eb18f1b5STejun Heo 	return *size = min(*size, (phys_addr_t)ULLONG_MAX - base);
56eb18f1b5STejun Heo }
57eb18f1b5STejun Heo 
586ed311b2SBenjamin Herrenschmidt /*
596ed311b2SBenjamin Herrenschmidt  * Address comparison utilities
606ed311b2SBenjamin Herrenschmidt  */
6110d06439SYinghai Lu static unsigned long __init_memblock memblock_addrs_overlap(phys_addr_t base1, phys_addr_t size1,
622898cc4cSBenjamin Herrenschmidt 				       phys_addr_t base2, phys_addr_t size2)
6395f72d1eSYinghai Lu {
6495f72d1eSYinghai Lu 	return ((base1 < (base2 + size2)) && (base2 < (base1 + size1)));
6595f72d1eSYinghai Lu }
6695f72d1eSYinghai Lu 
672d7d3eb2SH Hartley Sweeten static long __init_memblock memblock_overlaps_region(struct memblock_type *type,
682d7d3eb2SH Hartley Sweeten 					phys_addr_t base, phys_addr_t size)
696ed311b2SBenjamin Herrenschmidt {
706ed311b2SBenjamin Herrenschmidt 	unsigned long i;
716ed311b2SBenjamin Herrenschmidt 
726ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
736ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnbase = type->regions[i].base;
746ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnsize = type->regions[i].size;
756ed311b2SBenjamin Herrenschmidt 		if (memblock_addrs_overlap(base, size, rgnbase, rgnsize))
766ed311b2SBenjamin Herrenschmidt 			break;
776ed311b2SBenjamin Herrenschmidt 	}
786ed311b2SBenjamin Herrenschmidt 
796ed311b2SBenjamin Herrenschmidt 	return (i < type->cnt) ? i : -1;
806ed311b2SBenjamin Herrenschmidt }
816ed311b2SBenjamin Herrenschmidt 
826ed311b2SBenjamin Herrenschmidt /*
836ed311b2SBenjamin Herrenschmidt  * Find, allocate, deallocate or reserve unreserved regions. All allocations
846ed311b2SBenjamin Herrenschmidt  * are top-down.
856ed311b2SBenjamin Herrenschmidt  */
866ed311b2SBenjamin Herrenschmidt 
87cd79481dSYinghai Lu static phys_addr_t __init_memblock memblock_find_region(phys_addr_t start, phys_addr_t end,
886ed311b2SBenjamin Herrenschmidt 					  phys_addr_t size, phys_addr_t align)
896ed311b2SBenjamin Herrenschmidt {
906ed311b2SBenjamin Herrenschmidt 	phys_addr_t base, res_base;
916ed311b2SBenjamin Herrenschmidt 	long j;
926ed311b2SBenjamin Herrenschmidt 
93f1af98c7SYinghai Lu 	/* In case, huge size is requested */
94f1af98c7SYinghai Lu 	if (end < size)
951f5026a7STejun Heo 		return 0;
96f1af98c7SYinghai Lu 
97348968ebSTejun Heo 	base = round_down(end - size, align);
98f1af98c7SYinghai Lu 
9925818f0fSBenjamin Herrenschmidt 	/* Prevent allocations returning 0 as it's also used to
10025818f0fSBenjamin Herrenschmidt 	 * indicate an allocation failure
10125818f0fSBenjamin Herrenschmidt 	 */
10225818f0fSBenjamin Herrenschmidt 	if (start == 0)
10325818f0fSBenjamin Herrenschmidt 		start = PAGE_SIZE;
10425818f0fSBenjamin Herrenschmidt 
1056ed311b2SBenjamin Herrenschmidt 	while (start <= base) {
1066ed311b2SBenjamin Herrenschmidt 		j = memblock_overlaps_region(&memblock.reserved, base, size);
1076ed311b2SBenjamin Herrenschmidt 		if (j < 0)
1086ed311b2SBenjamin Herrenschmidt 			return base;
1096ed311b2SBenjamin Herrenschmidt 		res_base = memblock.reserved.regions[j].base;
1106ed311b2SBenjamin Herrenschmidt 		if (res_base < size)
1116ed311b2SBenjamin Herrenschmidt 			break;
112348968ebSTejun Heo 		base = round_down(res_base - size, align);
1136ed311b2SBenjamin Herrenschmidt 	}
1146ed311b2SBenjamin Herrenschmidt 
1151f5026a7STejun Heo 	return 0;
1166ed311b2SBenjamin Herrenschmidt }
1176ed311b2SBenjamin Herrenschmidt 
118fc769a8eSTejun Heo /*
119fc769a8eSTejun Heo  * Find a free area with specified alignment in a specific range.
120fc769a8eSTejun Heo  */
121fc769a8eSTejun Heo phys_addr_t __init_memblock memblock_find_in_range(phys_addr_t start, phys_addr_t end,
122fc769a8eSTejun Heo 					phys_addr_t size, phys_addr_t align)
1236ed311b2SBenjamin Herrenschmidt {
1246ed311b2SBenjamin Herrenschmidt 	long i;
1256ed311b2SBenjamin Herrenschmidt 
1266ed311b2SBenjamin Herrenschmidt 	BUG_ON(0 == size);
1276ed311b2SBenjamin Herrenschmidt 
1286ed311b2SBenjamin Herrenschmidt 	/* Pump up max_addr */
129fef501d4SBenjamin Herrenschmidt 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
130fef501d4SBenjamin Herrenschmidt 		end = memblock.current_limit;
1316ed311b2SBenjamin Herrenschmidt 
1326ed311b2SBenjamin Herrenschmidt 	/* We do a top-down search, this tends to limit memory
1336ed311b2SBenjamin Herrenschmidt 	 * fragmentation by keeping early boot allocs near the
1346ed311b2SBenjamin Herrenschmidt 	 * top of memory
1356ed311b2SBenjamin Herrenschmidt 	 */
1366ed311b2SBenjamin Herrenschmidt 	for (i = memblock.memory.cnt - 1; i >= 0; i--) {
1376ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblockbase = memblock.memory.regions[i].base;
1386ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblocksize = memblock.memory.regions[i].size;
139fef501d4SBenjamin Herrenschmidt 		phys_addr_t bottom, top, found;
1406ed311b2SBenjamin Herrenschmidt 
1416ed311b2SBenjamin Herrenschmidt 		if (memblocksize < size)
1426ed311b2SBenjamin Herrenschmidt 			continue;
143fef501d4SBenjamin Herrenschmidt 		if ((memblockbase + memblocksize) <= start)
144fef501d4SBenjamin Herrenschmidt 			break;
145fef501d4SBenjamin Herrenschmidt 		bottom = max(memblockbase, start);
146fef501d4SBenjamin Herrenschmidt 		top = min(memblockbase + memblocksize, end);
147fef501d4SBenjamin Herrenschmidt 		if (bottom >= top)
148fef501d4SBenjamin Herrenschmidt 			continue;
149fef501d4SBenjamin Herrenschmidt 		found = memblock_find_region(bottom, top, size, align);
1501f5026a7STejun Heo 		if (found)
151fef501d4SBenjamin Herrenschmidt 			return found;
1526ed311b2SBenjamin Herrenschmidt 	}
1531f5026a7STejun Heo 	return 0;
1546ed311b2SBenjamin Herrenschmidt }
1556ed311b2SBenjamin Herrenschmidt 
1565303b68fSYinghai Lu /*
1577950c407SYinghai Lu  * Free memblock.reserved.regions
1587950c407SYinghai Lu  */
1597950c407SYinghai Lu int __init_memblock memblock_free_reserved_regions(void)
1607950c407SYinghai Lu {
1617950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1627950c407SYinghai Lu 		return 0;
1637950c407SYinghai Lu 
1647950c407SYinghai Lu 	return memblock_free(__pa(memblock.reserved.regions),
1657950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1667950c407SYinghai Lu }
1677950c407SYinghai Lu 
1687950c407SYinghai Lu /*
1697950c407SYinghai Lu  * Reserve memblock.reserved.regions
1707950c407SYinghai Lu  */
1717950c407SYinghai Lu int __init_memblock memblock_reserve_reserved_regions(void)
1727950c407SYinghai Lu {
1737950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1747950c407SYinghai Lu 		return 0;
1757950c407SYinghai Lu 
1767950c407SYinghai Lu 	return memblock_reserve(__pa(memblock.reserved.regions),
1777950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1787950c407SYinghai Lu }
1797950c407SYinghai Lu 
18010d06439SYinghai Lu static void __init_memblock memblock_remove_region(struct memblock_type *type, unsigned long r)
18195f72d1eSYinghai Lu {
1827c0caeb8STejun Heo 	memmove(&type->regions[r], &type->regions[r + 1],
1837c0caeb8STejun Heo 		(type->cnt - (r + 1)) * sizeof(type->regions[r]));
184e3239ff9SBenjamin Herrenschmidt 	type->cnt--;
18595f72d1eSYinghai Lu 
1868f7a6605SBenjamin Herrenschmidt 	/* Special case for empty arrays */
1878f7a6605SBenjamin Herrenschmidt 	if (type->cnt == 0) {
1888f7a6605SBenjamin Herrenschmidt 		type->cnt = 1;
1898f7a6605SBenjamin Herrenschmidt 		type->regions[0].base = 0;
1908f7a6605SBenjamin Herrenschmidt 		type->regions[0].size = 0;
1917c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
1928f7a6605SBenjamin Herrenschmidt 	}
19395f72d1eSYinghai Lu }
19495f72d1eSYinghai Lu 
19510d06439SYinghai Lu static int __init_memblock memblock_double_array(struct memblock_type *type)
196142b45a7SBenjamin Herrenschmidt {
197142b45a7SBenjamin Herrenschmidt 	struct memblock_region *new_array, *old_array;
198142b45a7SBenjamin Herrenschmidt 	phys_addr_t old_size, new_size, addr;
199142b45a7SBenjamin Herrenschmidt 	int use_slab = slab_is_available();
200142b45a7SBenjamin Herrenschmidt 
201142b45a7SBenjamin Herrenschmidt 	/* We don't allow resizing until we know about the reserved regions
202142b45a7SBenjamin Herrenschmidt 	 * of memory that aren't suitable for allocation
203142b45a7SBenjamin Herrenschmidt 	 */
204142b45a7SBenjamin Herrenschmidt 	if (!memblock_can_resize)
205142b45a7SBenjamin Herrenschmidt 		return -1;
206142b45a7SBenjamin Herrenschmidt 
207142b45a7SBenjamin Herrenschmidt 	/* Calculate new doubled size */
208142b45a7SBenjamin Herrenschmidt 	old_size = type->max * sizeof(struct memblock_region);
209142b45a7SBenjamin Herrenschmidt 	new_size = old_size << 1;
210142b45a7SBenjamin Herrenschmidt 
211142b45a7SBenjamin Herrenschmidt 	/* Try to find some space for it.
212142b45a7SBenjamin Herrenschmidt 	 *
213142b45a7SBenjamin Herrenschmidt 	 * WARNING: We assume that either slab_is_available() and we use it or
214142b45a7SBenjamin Herrenschmidt 	 * we use MEMBLOCK for allocations. That means that this is unsafe to use
215142b45a7SBenjamin Herrenschmidt 	 * when bootmem is currently active (unless bootmem itself is implemented
216142b45a7SBenjamin Herrenschmidt 	 * on top of MEMBLOCK which isn't the case yet)
217142b45a7SBenjamin Herrenschmidt 	 *
218142b45a7SBenjamin Herrenschmidt 	 * This should however not be an issue for now, as we currently only
219142b45a7SBenjamin Herrenschmidt 	 * call into MEMBLOCK while it's still active, or much later when slab is
220142b45a7SBenjamin Herrenschmidt 	 * active for memory hotplug operations
221142b45a7SBenjamin Herrenschmidt 	 */
222142b45a7SBenjamin Herrenschmidt 	if (use_slab) {
223142b45a7SBenjamin Herrenschmidt 		new_array = kmalloc(new_size, GFP_KERNEL);
2241f5026a7STejun Heo 		addr = new_array ? __pa(new_array) : 0;
225142b45a7SBenjamin Herrenschmidt 	} else
226fc769a8eSTejun Heo 		addr = memblock_find_in_range(0, MEMBLOCK_ALLOC_ACCESSIBLE, new_size, sizeof(phys_addr_t));
2271f5026a7STejun Heo 	if (!addr) {
228142b45a7SBenjamin Herrenschmidt 		pr_err("memblock: Failed to double %s array from %ld to %ld entries !\n",
229142b45a7SBenjamin Herrenschmidt 		       memblock_type_name(type), type->max, type->max * 2);
230142b45a7SBenjamin Herrenschmidt 		return -1;
231142b45a7SBenjamin Herrenschmidt 	}
232142b45a7SBenjamin Herrenschmidt 	new_array = __va(addr);
233142b45a7SBenjamin Herrenschmidt 
234ea9e4376SYinghai Lu 	memblock_dbg("memblock: %s array is doubled to %ld at [%#010llx-%#010llx]",
235ea9e4376SYinghai Lu 		 memblock_type_name(type), type->max * 2, (u64)addr, (u64)addr + new_size - 1);
236ea9e4376SYinghai Lu 
237142b45a7SBenjamin Herrenschmidt 	/* Found space, we now need to move the array over before
238142b45a7SBenjamin Herrenschmidt 	 * we add the reserved region since it may be our reserved
239142b45a7SBenjamin Herrenschmidt 	 * array itself that is full.
240142b45a7SBenjamin Herrenschmidt 	 */
241142b45a7SBenjamin Herrenschmidt 	memcpy(new_array, type->regions, old_size);
242142b45a7SBenjamin Herrenschmidt 	memset(new_array + type->max, 0, old_size);
243142b45a7SBenjamin Herrenschmidt 	old_array = type->regions;
244142b45a7SBenjamin Herrenschmidt 	type->regions = new_array;
245142b45a7SBenjamin Herrenschmidt 	type->max <<= 1;
246142b45a7SBenjamin Herrenschmidt 
247142b45a7SBenjamin Herrenschmidt 	/* If we use SLAB that's it, we are done */
248142b45a7SBenjamin Herrenschmidt 	if (use_slab)
249142b45a7SBenjamin Herrenschmidt 		return 0;
250142b45a7SBenjamin Herrenschmidt 
251142b45a7SBenjamin Herrenschmidt 	/* Add the new reserved region now. Should not fail ! */
2529c8c27e2STejun Heo 	BUG_ON(memblock_reserve(addr, new_size));
253142b45a7SBenjamin Herrenschmidt 
254142b45a7SBenjamin Herrenschmidt 	/* If the array wasn't our static init one, then free it. We only do
255142b45a7SBenjamin Herrenschmidt 	 * that before SLAB is available as later on, we don't know whether
256142b45a7SBenjamin Herrenschmidt 	 * to use kfree or free_bootmem_pages(). Shouldn't be a big deal
257142b45a7SBenjamin Herrenschmidt 	 * anyways
258142b45a7SBenjamin Herrenschmidt 	 */
259142b45a7SBenjamin Herrenschmidt 	if (old_array != memblock_memory_init_regions &&
260142b45a7SBenjamin Herrenschmidt 	    old_array != memblock_reserved_init_regions)
261142b45a7SBenjamin Herrenschmidt 		memblock_free(__pa(old_array), old_size);
262142b45a7SBenjamin Herrenschmidt 
263142b45a7SBenjamin Herrenschmidt 	return 0;
264142b45a7SBenjamin Herrenschmidt }
265142b45a7SBenjamin Herrenschmidt 
266784656f9STejun Heo /**
267784656f9STejun Heo  * memblock_merge_regions - merge neighboring compatible regions
268784656f9STejun Heo  * @type: memblock type to scan
269784656f9STejun Heo  *
270784656f9STejun Heo  * Scan @type and merge neighboring compatible regions.
271784656f9STejun Heo  */
272784656f9STejun Heo static void __init_memblock memblock_merge_regions(struct memblock_type *type)
273784656f9STejun Heo {
274784656f9STejun Heo 	int i = 0;
275784656f9STejun Heo 
276784656f9STejun Heo 	/* cnt never goes below 1 */
277784656f9STejun Heo 	while (i < type->cnt - 1) {
278784656f9STejun Heo 		struct memblock_region *this = &type->regions[i];
279784656f9STejun Heo 		struct memblock_region *next = &type->regions[i + 1];
280784656f9STejun Heo 
2817c0caeb8STejun Heo 		if (this->base + this->size != next->base ||
2827c0caeb8STejun Heo 		    memblock_get_region_node(this) !=
2837c0caeb8STejun Heo 		    memblock_get_region_node(next)) {
284784656f9STejun Heo 			BUG_ON(this->base + this->size > next->base);
285784656f9STejun Heo 			i++;
286784656f9STejun Heo 			continue;
287784656f9STejun Heo 		}
288784656f9STejun Heo 
289784656f9STejun Heo 		this->size += next->size;
290784656f9STejun Heo 		memmove(next, next + 1, (type->cnt - (i + 1)) * sizeof(*next));
291784656f9STejun Heo 		type->cnt--;
292784656f9STejun Heo 	}
293784656f9STejun Heo }
294784656f9STejun Heo 
295784656f9STejun Heo /**
296784656f9STejun Heo  * memblock_insert_region - insert new memblock region
297784656f9STejun Heo  * @type: memblock type to insert into
298784656f9STejun Heo  * @idx: index for the insertion point
299784656f9STejun Heo  * @base: base address of the new region
300784656f9STejun Heo  * @size: size of the new region
301784656f9STejun Heo  *
302784656f9STejun Heo  * Insert new memblock region [@base,@base+@size) into @type at @idx.
303784656f9STejun Heo  * @type must already have extra room to accomodate the new region.
304784656f9STejun Heo  */
305784656f9STejun Heo static void __init_memblock memblock_insert_region(struct memblock_type *type,
306784656f9STejun Heo 						   int idx, phys_addr_t base,
3077c0caeb8STejun Heo 						   phys_addr_t size, int nid)
308784656f9STejun Heo {
309784656f9STejun Heo 	struct memblock_region *rgn = &type->regions[idx];
310784656f9STejun Heo 
311784656f9STejun Heo 	BUG_ON(type->cnt >= type->max);
312784656f9STejun Heo 	memmove(rgn + 1, rgn, (type->cnt - idx) * sizeof(*rgn));
313784656f9STejun Heo 	rgn->base = base;
314784656f9STejun Heo 	rgn->size = size;
3157c0caeb8STejun Heo 	memblock_set_region_node(rgn, nid);
316784656f9STejun Heo 	type->cnt++;
317784656f9STejun Heo }
318784656f9STejun Heo 
319784656f9STejun Heo /**
320784656f9STejun Heo  * memblock_add_region - add new memblock region
321784656f9STejun Heo  * @type: memblock type to add new region into
322784656f9STejun Heo  * @base: base address of the new region
323784656f9STejun Heo  * @size: size of the new region
324784656f9STejun Heo  *
325784656f9STejun Heo  * Add new memblock region [@base,@base+@size) into @type.  The new region
326784656f9STejun Heo  * is allowed to overlap with existing ones - overlaps don't affect already
327784656f9STejun Heo  * existing regions.  @type is guaranteed to be minimal (all neighbouring
328784656f9STejun Heo  * compatible regions are merged) after the addition.
329784656f9STejun Heo  *
330784656f9STejun Heo  * RETURNS:
331784656f9STejun Heo  * 0 on success, -errno on failure.
332784656f9STejun Heo  */
333581adcbeSTejun Heo static int __init_memblock memblock_add_region(struct memblock_type *type,
3348f7a6605SBenjamin Herrenschmidt 					       phys_addr_t base, phys_addr_t size)
33595f72d1eSYinghai Lu {
336784656f9STejun Heo 	bool insert = false;
337eb18f1b5STejun Heo 	phys_addr_t obase = base;
338eb18f1b5STejun Heo 	phys_addr_t end = base + memblock_cap_size(base, &size);
339784656f9STejun Heo 	int i, nr_new;
34095f72d1eSYinghai Lu 
341784656f9STejun Heo 	/* special case for empty array */
342784656f9STejun Heo 	if (type->regions[0].size == 0) {
343784656f9STejun Heo 		WARN_ON(type->cnt != 1);
344784656f9STejun Heo 		type->regions[0].base = base;
345784656f9STejun Heo 		type->regions[0].size = size;
3467c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
347784656f9STejun Heo 		return 0;
348784656f9STejun Heo 	}
349784656f9STejun Heo repeat:
350784656f9STejun Heo 	/*
351784656f9STejun Heo 	 * The following is executed twice.  Once with %false @insert and
352784656f9STejun Heo 	 * then with %true.  The first counts the number of regions needed
353784656f9STejun Heo 	 * to accomodate the new area.  The second actually inserts them.
354784656f9STejun Heo 	 */
355784656f9STejun Heo 	base = obase;
356784656f9STejun Heo 	nr_new = 0;
357784656f9STejun Heo 
3588f7a6605SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
3598f7a6605SBenjamin Herrenschmidt 		struct memblock_region *rgn = &type->regions[i];
360784656f9STejun Heo 		phys_addr_t rbase = rgn->base;
361784656f9STejun Heo 		phys_addr_t rend = rbase + rgn->size;
3628f7a6605SBenjamin Herrenschmidt 
363784656f9STejun Heo 		if (rbase >= end)
3648f7a6605SBenjamin Herrenschmidt 			break;
365784656f9STejun Heo 		if (rend <= base)
366784656f9STejun Heo 			continue;
367784656f9STejun Heo 		/*
368784656f9STejun Heo 		 * @rgn overlaps.  If it separates the lower part of new
369784656f9STejun Heo 		 * area, insert that portion.
3708f7a6605SBenjamin Herrenschmidt 		 */
371784656f9STejun Heo 		if (rbase > base) {
372784656f9STejun Heo 			nr_new++;
373784656f9STejun Heo 			if (insert)
374784656f9STejun Heo 				memblock_insert_region(type, i++, base,
3757c0caeb8STejun Heo 						rbase - base, MAX_NUMNODES);
376784656f9STejun Heo 		}
377784656f9STejun Heo 		/* area below @rend is dealt with, forget about it */
378784656f9STejun Heo 		base = min(rend, end);
3798f7a6605SBenjamin Herrenschmidt 	}
3808f7a6605SBenjamin Herrenschmidt 
381784656f9STejun Heo 	/* insert the remaining portion */
382784656f9STejun Heo 	if (base < end) {
383784656f9STejun Heo 		nr_new++;
384784656f9STejun Heo 		if (insert)
3857c0caeb8STejun Heo 			memblock_insert_region(type, i, base, end - base,
3867c0caeb8STejun Heo 					       MAX_NUMNODES);
3878f7a6605SBenjamin Herrenschmidt 	}
3888f7a6605SBenjamin Herrenschmidt 
389784656f9STejun Heo 	/*
390784656f9STejun Heo 	 * If this was the first round, resize array and repeat for actual
391784656f9STejun Heo 	 * insertions; otherwise, merge and return.
3928f7a6605SBenjamin Herrenschmidt 	 */
393784656f9STejun Heo 	if (!insert) {
394784656f9STejun Heo 		while (type->cnt + nr_new > type->max)
395784656f9STejun Heo 			if (memblock_double_array(type) < 0)
396784656f9STejun Heo 				return -ENOMEM;
397784656f9STejun Heo 		insert = true;
398784656f9STejun Heo 		goto repeat;
39995f72d1eSYinghai Lu 	} else {
400784656f9STejun Heo 		memblock_merge_regions(type);
40195f72d1eSYinghai Lu 		return 0;
40295f72d1eSYinghai Lu 	}
403784656f9STejun Heo }
40495f72d1eSYinghai Lu 
405581adcbeSTejun Heo int __init_memblock memblock_add(phys_addr_t base, phys_addr_t size)
40695f72d1eSYinghai Lu {
407e3239ff9SBenjamin Herrenschmidt 	return memblock_add_region(&memblock.memory, base, size);
40895f72d1eSYinghai Lu }
40995f72d1eSYinghai Lu 
4106a9ceb31STejun Heo /**
4116a9ceb31STejun Heo  * memblock_isolate_range - isolate given range into disjoint memblocks
4126a9ceb31STejun Heo  * @type: memblock type to isolate range for
4136a9ceb31STejun Heo  * @base: base of range to isolate
4146a9ceb31STejun Heo  * @size: size of range to isolate
4156a9ceb31STejun Heo  * @start_rgn: out parameter for the start of isolated region
4166a9ceb31STejun Heo  * @end_rgn: out parameter for the end of isolated region
4176a9ceb31STejun Heo  *
4186a9ceb31STejun Heo  * Walk @type and ensure that regions don't cross the boundaries defined by
4196a9ceb31STejun Heo  * [@base,@base+@size).  Crossing regions are split at the boundaries,
4206a9ceb31STejun Heo  * which may create at most two more regions.  The index of the first
4216a9ceb31STejun Heo  * region inside the range is returned in *@start_rgn and end in *@end_rgn.
4226a9ceb31STejun Heo  *
4236a9ceb31STejun Heo  * RETURNS:
4246a9ceb31STejun Heo  * 0 on success, -errno on failure.
4256a9ceb31STejun Heo  */
4266a9ceb31STejun Heo static int __init_memblock memblock_isolate_range(struct memblock_type *type,
4276a9ceb31STejun Heo 					phys_addr_t base, phys_addr_t size,
4286a9ceb31STejun Heo 					int *start_rgn, int *end_rgn)
4296a9ceb31STejun Heo {
430eb18f1b5STejun Heo 	phys_addr_t end = base + memblock_cap_size(base, &size);
4316a9ceb31STejun Heo 	int i;
4326a9ceb31STejun Heo 
4336a9ceb31STejun Heo 	*start_rgn = *end_rgn = 0;
4346a9ceb31STejun Heo 
4356a9ceb31STejun Heo 	/* we'll create at most two more regions */
4366a9ceb31STejun Heo 	while (type->cnt + 2 > type->max)
4376a9ceb31STejun Heo 		if (memblock_double_array(type) < 0)
4386a9ceb31STejun Heo 			return -ENOMEM;
4396a9ceb31STejun Heo 
4406a9ceb31STejun Heo 	for (i = 0; i < type->cnt; i++) {
4416a9ceb31STejun Heo 		struct memblock_region *rgn = &type->regions[i];
4426a9ceb31STejun Heo 		phys_addr_t rbase = rgn->base;
4436a9ceb31STejun Heo 		phys_addr_t rend = rbase + rgn->size;
4446a9ceb31STejun Heo 
4456a9ceb31STejun Heo 		if (rbase >= end)
4466a9ceb31STejun Heo 			break;
4476a9ceb31STejun Heo 		if (rend <= base)
4486a9ceb31STejun Heo 			continue;
4496a9ceb31STejun Heo 
4506a9ceb31STejun Heo 		if (rbase < base) {
4516a9ceb31STejun Heo 			/*
4526a9ceb31STejun Heo 			 * @rgn intersects from below.  Split and continue
4536a9ceb31STejun Heo 			 * to process the next region - the new top half.
4546a9ceb31STejun Heo 			 */
4556a9ceb31STejun Heo 			rgn->base = base;
4566a9ceb31STejun Heo 			rgn->size = rend - rgn->base;
4576a9ceb31STejun Heo 			memblock_insert_region(type, i, rbase, base - rbase,
45871936180STejun Heo 					       memblock_get_region_node(rgn));
4596a9ceb31STejun Heo 		} else if (rend > end) {
4606a9ceb31STejun Heo 			/*
4616a9ceb31STejun Heo 			 * @rgn intersects from above.  Split and redo the
4626a9ceb31STejun Heo 			 * current region - the new bottom half.
4636a9ceb31STejun Heo 			 */
4646a9ceb31STejun Heo 			rgn->base = end;
4656a9ceb31STejun Heo 			rgn->size = rend - rgn->base;
4666a9ceb31STejun Heo 			memblock_insert_region(type, i--, rbase, end - rbase,
46771936180STejun Heo 					       memblock_get_region_node(rgn));
4686a9ceb31STejun Heo 		} else {
4696a9ceb31STejun Heo 			/* @rgn is fully contained, record it */
4706a9ceb31STejun Heo 			if (!*end_rgn)
4716a9ceb31STejun Heo 				*start_rgn = i;
4726a9ceb31STejun Heo 			*end_rgn = i + 1;
4736a9ceb31STejun Heo 		}
4746a9ceb31STejun Heo 	}
4756a9ceb31STejun Heo 
4766a9ceb31STejun Heo 	return 0;
4776a9ceb31STejun Heo }
4786a9ceb31STejun Heo 
479581adcbeSTejun Heo static int __init_memblock __memblock_remove(struct memblock_type *type,
4808f7a6605SBenjamin Herrenschmidt 					     phys_addr_t base, phys_addr_t size)
48195f72d1eSYinghai Lu {
48271936180STejun Heo 	int start_rgn, end_rgn;
48371936180STejun Heo 	int i, ret;
48495f72d1eSYinghai Lu 
48571936180STejun Heo 	ret = memblock_isolate_range(type, base, size, &start_rgn, &end_rgn);
48671936180STejun Heo 	if (ret)
48771936180STejun Heo 		return ret;
48895f72d1eSYinghai Lu 
48971936180STejun Heo 	for (i = end_rgn - 1; i >= start_rgn; i--)
49071936180STejun Heo 		memblock_remove_region(type, i);
49195f72d1eSYinghai Lu 	return 0;
49295f72d1eSYinghai Lu }
49395f72d1eSYinghai Lu 
494581adcbeSTejun Heo int __init_memblock memblock_remove(phys_addr_t base, phys_addr_t size)
49595f72d1eSYinghai Lu {
49695f72d1eSYinghai Lu 	return __memblock_remove(&memblock.memory, base, size);
49795f72d1eSYinghai Lu }
49895f72d1eSYinghai Lu 
499581adcbeSTejun Heo int __init_memblock memblock_free(phys_addr_t base, phys_addr_t size)
50095f72d1eSYinghai Lu {
50124aa0788STejun Heo 	memblock_dbg("   memblock_free: [%#016llx-%#016llx] %pF\n",
502a150439cSH. Peter Anvin 		     (unsigned long long)base,
503a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
504a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
50524aa0788STejun Heo 
50695f72d1eSYinghai Lu 	return __memblock_remove(&memblock.reserved, base, size);
50795f72d1eSYinghai Lu }
50895f72d1eSYinghai Lu 
509581adcbeSTejun Heo int __init_memblock memblock_reserve(phys_addr_t base, phys_addr_t size)
51095f72d1eSYinghai Lu {
511e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *_rgn = &memblock.reserved;
51295f72d1eSYinghai Lu 
51324aa0788STejun Heo 	memblock_dbg("memblock_reserve: [%#016llx-%#016llx] %pF\n",
514a150439cSH. Peter Anvin 		     (unsigned long long)base,
515a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
516a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
51795f72d1eSYinghai Lu 	BUG_ON(0 == size);
51895f72d1eSYinghai Lu 
51995f72d1eSYinghai Lu 	return memblock_add_region(_rgn, base, size);
52095f72d1eSYinghai Lu }
52195f72d1eSYinghai Lu 
52235fd0808STejun Heo /**
52335fd0808STejun Heo  * __next_free_mem_range - next function for for_each_free_mem_range()
52435fd0808STejun Heo  * @idx: pointer to u64 loop variable
52535fd0808STejun Heo  * @nid: nid: node selector, %MAX_NUMNODES for all nodes
52635fd0808STejun Heo  * @p_start: ptr to phys_addr_t for start address of the range, can be %NULL
52735fd0808STejun Heo  * @p_end: ptr to phys_addr_t for end address of the range, can be %NULL
52835fd0808STejun Heo  * @p_nid: ptr to int for nid of the range, can be %NULL
52935fd0808STejun Heo  *
53035fd0808STejun Heo  * Find the first free area from *@idx which matches @nid, fill the out
53135fd0808STejun Heo  * parameters, and update *@idx for the next iteration.  The lower 32bit of
53235fd0808STejun Heo  * *@idx contains index into memory region and the upper 32bit indexes the
53335fd0808STejun Heo  * areas before each reserved region.  For example, if reserved regions
53435fd0808STejun Heo  * look like the following,
53535fd0808STejun Heo  *
53635fd0808STejun Heo  *	0:[0-16), 1:[32-48), 2:[128-130)
53735fd0808STejun Heo  *
53835fd0808STejun Heo  * The upper 32bit indexes the following regions.
53935fd0808STejun Heo  *
54035fd0808STejun Heo  *	0:[0-0), 1:[16-32), 2:[48-128), 3:[130-MAX)
54135fd0808STejun Heo  *
54235fd0808STejun Heo  * As both region arrays are sorted, the function advances the two indices
54335fd0808STejun Heo  * in lockstep and returns each intersection.
54435fd0808STejun Heo  */
54535fd0808STejun Heo void __init_memblock __next_free_mem_range(u64 *idx, int nid,
54635fd0808STejun Heo 					   phys_addr_t *out_start,
54735fd0808STejun Heo 					   phys_addr_t *out_end, int *out_nid)
54835fd0808STejun Heo {
54935fd0808STejun Heo 	struct memblock_type *mem = &memblock.memory;
55035fd0808STejun Heo 	struct memblock_type *rsv = &memblock.reserved;
55135fd0808STejun Heo 	int mi = *idx & 0xffffffff;
55235fd0808STejun Heo 	int ri = *idx >> 32;
55335fd0808STejun Heo 
55435fd0808STejun Heo 	for ( ; mi < mem->cnt; mi++) {
55535fd0808STejun Heo 		struct memblock_region *m = &mem->regions[mi];
55635fd0808STejun Heo 		phys_addr_t m_start = m->base;
55735fd0808STejun Heo 		phys_addr_t m_end = m->base + m->size;
55835fd0808STejun Heo 
55935fd0808STejun Heo 		/* only memory regions are associated with nodes, check it */
56035fd0808STejun Heo 		if (nid != MAX_NUMNODES && nid != memblock_get_region_node(m))
56135fd0808STejun Heo 			continue;
56235fd0808STejun Heo 
56335fd0808STejun Heo 		/* scan areas before each reservation for intersection */
56435fd0808STejun Heo 		for ( ; ri < rsv->cnt + 1; ri++) {
56535fd0808STejun Heo 			struct memblock_region *r = &rsv->regions[ri];
56635fd0808STejun Heo 			phys_addr_t r_start = ri ? r[-1].base + r[-1].size : 0;
56735fd0808STejun Heo 			phys_addr_t r_end = ri < rsv->cnt ? r->base : ULLONG_MAX;
56835fd0808STejun Heo 
56935fd0808STejun Heo 			/* if ri advanced past mi, break out to advance mi */
57035fd0808STejun Heo 			if (r_start >= m_end)
57135fd0808STejun Heo 				break;
57235fd0808STejun Heo 			/* if the two regions intersect, we're done */
57335fd0808STejun Heo 			if (m_start < r_end) {
57435fd0808STejun Heo 				if (out_start)
57535fd0808STejun Heo 					*out_start = max(m_start, r_start);
57635fd0808STejun Heo 				if (out_end)
57735fd0808STejun Heo 					*out_end = min(m_end, r_end);
57835fd0808STejun Heo 				if (out_nid)
57935fd0808STejun Heo 					*out_nid = memblock_get_region_node(m);
58035fd0808STejun Heo 				/*
58135fd0808STejun Heo 				 * The region which ends first is advanced
58235fd0808STejun Heo 				 * for the next iteration.
58335fd0808STejun Heo 				 */
58435fd0808STejun Heo 				if (m_end <= r_end)
58535fd0808STejun Heo 					mi++;
58635fd0808STejun Heo 				else
58735fd0808STejun Heo 					ri++;
58835fd0808STejun Heo 				*idx = (u32)mi | (u64)ri << 32;
58935fd0808STejun Heo 				return;
59035fd0808STejun Heo 			}
59135fd0808STejun Heo 		}
59235fd0808STejun Heo 	}
59335fd0808STejun Heo 
59435fd0808STejun Heo 	/* signal end of iteration */
59535fd0808STejun Heo 	*idx = ULLONG_MAX;
59635fd0808STejun Heo }
59735fd0808STejun Heo 
5987c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
5997c0caeb8STejun Heo /*
6007c0caeb8STejun Heo  * Common iterator interface used to define for_each_mem_range().
6017c0caeb8STejun Heo  */
6027c0caeb8STejun Heo void __init_memblock __next_mem_pfn_range(int *idx, int nid,
6037c0caeb8STejun Heo 				unsigned long *out_start_pfn,
6047c0caeb8STejun Heo 				unsigned long *out_end_pfn, int *out_nid)
6057c0caeb8STejun Heo {
6067c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
6077c0caeb8STejun Heo 	struct memblock_region *r;
6087c0caeb8STejun Heo 
6097c0caeb8STejun Heo 	while (++*idx < type->cnt) {
6107c0caeb8STejun Heo 		r = &type->regions[*idx];
6117c0caeb8STejun Heo 
6127c0caeb8STejun Heo 		if (PFN_UP(r->base) >= PFN_DOWN(r->base + r->size))
6137c0caeb8STejun Heo 			continue;
6147c0caeb8STejun Heo 		if (nid == MAX_NUMNODES || nid == r->nid)
6157c0caeb8STejun Heo 			break;
6167c0caeb8STejun Heo 	}
6177c0caeb8STejun Heo 	if (*idx >= type->cnt) {
6187c0caeb8STejun Heo 		*idx = -1;
6197c0caeb8STejun Heo 		return;
6207c0caeb8STejun Heo 	}
6217c0caeb8STejun Heo 
6227c0caeb8STejun Heo 	if (out_start_pfn)
6237c0caeb8STejun Heo 		*out_start_pfn = PFN_UP(r->base);
6247c0caeb8STejun Heo 	if (out_end_pfn)
6257c0caeb8STejun Heo 		*out_end_pfn = PFN_DOWN(r->base + r->size);
6267c0caeb8STejun Heo 	if (out_nid)
6277c0caeb8STejun Heo 		*out_nid = r->nid;
6287c0caeb8STejun Heo }
6297c0caeb8STejun Heo 
6307c0caeb8STejun Heo /**
6317c0caeb8STejun Heo  * memblock_set_node - set node ID on memblock regions
6327c0caeb8STejun Heo  * @base: base of area to set node ID for
6337c0caeb8STejun Heo  * @size: size of area to set node ID for
6347c0caeb8STejun Heo  * @nid: node ID to set
6357c0caeb8STejun Heo  *
6367c0caeb8STejun Heo  * Set the nid of memblock memory regions in [@base,@base+@size) to @nid.
6377c0caeb8STejun Heo  * Regions which cross the area boundaries are split as necessary.
6387c0caeb8STejun Heo  *
6397c0caeb8STejun Heo  * RETURNS:
6407c0caeb8STejun Heo  * 0 on success, -errno on failure.
6417c0caeb8STejun Heo  */
6427c0caeb8STejun Heo int __init_memblock memblock_set_node(phys_addr_t base, phys_addr_t size,
6437c0caeb8STejun Heo 				      int nid)
6447c0caeb8STejun Heo {
6457c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
6466a9ceb31STejun Heo 	int start_rgn, end_rgn;
6476a9ceb31STejun Heo 	int i, ret;
6487c0caeb8STejun Heo 
6496a9ceb31STejun Heo 	ret = memblock_isolate_range(type, base, size, &start_rgn, &end_rgn);
6506a9ceb31STejun Heo 	if (ret)
6516a9ceb31STejun Heo 		return ret;
6527c0caeb8STejun Heo 
6536a9ceb31STejun Heo 	for (i = start_rgn; i < end_rgn; i++)
6546a9ceb31STejun Heo 		type->regions[i].nid = nid;
6557c0caeb8STejun Heo 
6567c0caeb8STejun Heo 	memblock_merge_regions(type);
6577c0caeb8STejun Heo 	return 0;
6587c0caeb8STejun Heo }
6597c0caeb8STejun Heo #endif /* CONFIG_HAVE_MEMBLOCK_NODE_MAP */
6607c0caeb8STejun Heo 
6616ed311b2SBenjamin Herrenschmidt phys_addr_t __init __memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
66295f72d1eSYinghai Lu {
6636ed311b2SBenjamin Herrenschmidt 	phys_addr_t found;
66495f72d1eSYinghai Lu 
6656ed311b2SBenjamin Herrenschmidt 	/* We align the size to limit fragmentation. Without this, a lot of
6666ed311b2SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
6676ed311b2SBenjamin Herrenschmidt 	 */
668348968ebSTejun Heo 	size = round_up(size, align);
6696ed311b2SBenjamin Herrenschmidt 
670fc769a8eSTejun Heo 	found = memblock_find_in_range(0, max_addr, size, align);
6719c8c27e2STejun Heo 	if (found && !memblock_reserve(found, size))
6726ed311b2SBenjamin Herrenschmidt 		return found;
6736ed311b2SBenjamin Herrenschmidt 
6746ed311b2SBenjamin Herrenschmidt 	return 0;
67595f72d1eSYinghai Lu }
67695f72d1eSYinghai Lu 
6776ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
67895f72d1eSYinghai Lu {
6796ed311b2SBenjamin Herrenschmidt 	phys_addr_t alloc;
6806ed311b2SBenjamin Herrenschmidt 
6816ed311b2SBenjamin Herrenschmidt 	alloc = __memblock_alloc_base(size, align, max_addr);
6826ed311b2SBenjamin Herrenschmidt 
6836ed311b2SBenjamin Herrenschmidt 	if (alloc == 0)
6846ed311b2SBenjamin Herrenschmidt 		panic("ERROR: Failed to allocate 0x%llx bytes below 0x%llx.\n",
6856ed311b2SBenjamin Herrenschmidt 		      (unsigned long long) size, (unsigned long long) max_addr);
6866ed311b2SBenjamin Herrenschmidt 
6876ed311b2SBenjamin Herrenschmidt 	return alloc;
68895f72d1eSYinghai Lu }
68995f72d1eSYinghai Lu 
6906ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc(phys_addr_t size, phys_addr_t align)
69195f72d1eSYinghai Lu {
6926ed311b2SBenjamin Herrenschmidt 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
69395f72d1eSYinghai Lu }
69495f72d1eSYinghai Lu 
69595f72d1eSYinghai Lu 
6966ed311b2SBenjamin Herrenschmidt /*
69734e18455STejun Heo  * Additional node-local top-down allocators.
698c196f76fSBenjamin Herrenschmidt  *
699c196f76fSBenjamin Herrenschmidt  * WARNING: Only available after early_node_map[] has been populated,
700c196f76fSBenjamin Herrenschmidt  * on some architectures, that is after all the calls to add_active_range()
701c196f76fSBenjamin Herrenschmidt  * have been done to populate it.
7026ed311b2SBenjamin Herrenschmidt  */
70395f72d1eSYinghai Lu 
70434e18455STejun Heo static phys_addr_t __init memblock_nid_range_rev(phys_addr_t start,
70534e18455STejun Heo 						 phys_addr_t end, int *nid)
706c3f72b57SBenjamin Herrenschmidt {
707c196f76fSBenjamin Herrenschmidt #ifdef CONFIG_ARCH_POPULATES_NODE_MAP
708c196f76fSBenjamin Herrenschmidt 	unsigned long start_pfn, end_pfn;
709c196f76fSBenjamin Herrenschmidt 	int i;
710c196f76fSBenjamin Herrenschmidt 
711b2fea988STejun Heo 	for_each_mem_pfn_range(i, MAX_NUMNODES, &start_pfn, &end_pfn, nid)
71234e18455STejun Heo 		if (end > PFN_PHYS(start_pfn) && end <= PFN_PHYS(end_pfn))
71334e18455STejun Heo 			return max(start, PFN_PHYS(start_pfn));
714c196f76fSBenjamin Herrenschmidt #endif
715c3f72b57SBenjamin Herrenschmidt 	*nid = 0;
71634e18455STejun Heo 	return start;
717c3f72b57SBenjamin Herrenschmidt }
718c3f72b57SBenjamin Herrenschmidt 
719e6498040STejun Heo phys_addr_t __init memblock_find_in_range_node(phys_addr_t start,
720e6498040STejun Heo 					       phys_addr_t end,
7212898cc4cSBenjamin Herrenschmidt 					       phys_addr_t size,
7222898cc4cSBenjamin Herrenschmidt 					       phys_addr_t align, int nid)
72395f72d1eSYinghai Lu {
724e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *mem = &memblock.memory;
72595f72d1eSYinghai Lu 	int i;
72695f72d1eSYinghai Lu 
72795f72d1eSYinghai Lu 	BUG_ON(0 == size);
72895f72d1eSYinghai Lu 
729e6498040STejun Heo 	/* Pump up max_addr */
730e6498040STejun Heo 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
731e6498040STejun Heo 		end = memblock.current_limit;
732e6498040STejun Heo 
733e6498040STejun Heo 	for (i = mem->cnt - 1; i >= 0; i--) {
734e6498040STejun Heo 		struct memblock_region *r = &mem->regions[i];
735e6498040STejun Heo 		phys_addr_t base = max(start, r->base);
736e6498040STejun Heo 		phys_addr_t top = min(end, r->base + r->size);
737e6498040STejun Heo 
738e6498040STejun Heo 		while (base < top) {
739e6498040STejun Heo 			phys_addr_t tbase, ret;
740e6498040STejun Heo 			int tnid;
741e6498040STejun Heo 
742e6498040STejun Heo 			tbase = memblock_nid_range_rev(base, top, &tnid);
743e6498040STejun Heo 			if (nid == MAX_NUMNODES || tnid == nid) {
744e6498040STejun Heo 				ret = memblock_find_region(tbase, top, size, align);
745e6498040STejun Heo 				if (ret)
746e6498040STejun Heo 					return ret;
747e6498040STejun Heo 			}
748e6498040STejun Heo 			top = tbase;
749e6498040STejun Heo 		}
750e6498040STejun Heo 	}
751e6498040STejun Heo 
752e6498040STejun Heo 	return 0;
753e6498040STejun Heo }
754e6498040STejun Heo 
755e6498040STejun Heo phys_addr_t __init memblock_alloc_nid(phys_addr_t size, phys_addr_t align, int nid)
756e6498040STejun Heo {
757e6498040STejun Heo 	phys_addr_t found;
758e6498040STejun Heo 
759e6498040STejun Heo 	/*
760e6498040STejun Heo 	 * We align the size to limit fragmentation. Without this, a lot of
7617f219c73SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
7627f219c73SBenjamin Herrenschmidt 	 */
763348968ebSTejun Heo 	size = round_up(size, align);
7647f219c73SBenjamin Herrenschmidt 
765e6498040STejun Heo 	found = memblock_find_in_range_node(0, MEMBLOCK_ALLOC_ACCESSIBLE,
76695f72d1eSYinghai Lu 					    size, align, nid);
7679c8c27e2STejun Heo 	if (found && !memblock_reserve(found, size))
768e6498040STejun Heo 		return found;
76995f72d1eSYinghai Lu 
7709d1e2492SBenjamin Herrenschmidt 	return 0;
7719d1e2492SBenjamin Herrenschmidt }
7729d1e2492SBenjamin Herrenschmidt 
7739d1e2492SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_try_nid(phys_addr_t size, phys_addr_t align, int nid)
7749d1e2492SBenjamin Herrenschmidt {
7759d1e2492SBenjamin Herrenschmidt 	phys_addr_t res = memblock_alloc_nid(size, align, nid);
7769d1e2492SBenjamin Herrenschmidt 
7779d1e2492SBenjamin Herrenschmidt 	if (res)
7789d1e2492SBenjamin Herrenschmidt 		return res;
77915fb0972STejun Heo 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
78095f72d1eSYinghai Lu }
78195f72d1eSYinghai Lu 
7829d1e2492SBenjamin Herrenschmidt 
7839d1e2492SBenjamin Herrenschmidt /*
7849d1e2492SBenjamin Herrenschmidt  * Remaining API functions
7859d1e2492SBenjamin Herrenschmidt  */
7869d1e2492SBenjamin Herrenschmidt 
78795f72d1eSYinghai Lu /* You must call memblock_analyze() before this. */
7882898cc4cSBenjamin Herrenschmidt phys_addr_t __init memblock_phys_mem_size(void)
78995f72d1eSYinghai Lu {
7904734b594SBenjamin Herrenschmidt 	return memblock.memory_size;
79195f72d1eSYinghai Lu }
79295f72d1eSYinghai Lu 
7930a93ebefSSam Ravnborg /* lowest address */
7940a93ebefSSam Ravnborg phys_addr_t __init_memblock memblock_start_of_DRAM(void)
7950a93ebefSSam Ravnborg {
7960a93ebefSSam Ravnborg 	return memblock.memory.regions[0].base;
7970a93ebefSSam Ravnborg }
7980a93ebefSSam Ravnborg 
79910d06439SYinghai Lu phys_addr_t __init_memblock memblock_end_of_DRAM(void)
80095f72d1eSYinghai Lu {
80195f72d1eSYinghai Lu 	int idx = memblock.memory.cnt - 1;
80295f72d1eSYinghai Lu 
803e3239ff9SBenjamin Herrenschmidt 	return (memblock.memory.regions[idx].base + memblock.memory.regions[idx].size);
80495f72d1eSYinghai Lu }
80595f72d1eSYinghai Lu 
80695f72d1eSYinghai Lu /* You must call memblock_analyze() after this. */
807*c0ce8fefSTejun Heo void __init memblock_enforce_memory_limit(phys_addr_t limit)
80895f72d1eSYinghai Lu {
80995f72d1eSYinghai Lu 	unsigned long i;
810*c0ce8fefSTejun Heo 	phys_addr_t max_addr = (phys_addr_t)ULLONG_MAX;
81195f72d1eSYinghai Lu 
812*c0ce8fefSTejun Heo 	if (!limit)
81395f72d1eSYinghai Lu 		return;
81495f72d1eSYinghai Lu 
815*c0ce8fefSTejun Heo 	/* find out max address */
81695f72d1eSYinghai Lu 	for (i = 0; i < memblock.memory.cnt; i++) {
817*c0ce8fefSTejun Heo 		struct memblock_region *r = &memblock.memory.regions[i];
81895f72d1eSYinghai Lu 
819*c0ce8fefSTejun Heo 		if (limit <= r->size) {
820*c0ce8fefSTejun Heo 			max_addr = r->base + limit;
82195f72d1eSYinghai Lu 			break;
82295f72d1eSYinghai Lu 		}
823*c0ce8fefSTejun Heo 		limit -= r->size;
82495f72d1eSYinghai Lu 	}
825*c0ce8fefSTejun Heo 
826*c0ce8fefSTejun Heo 	/* truncate both memory and reserved regions */
827*c0ce8fefSTejun Heo 	__memblock_remove(&memblock.memory, max_addr, (phys_addr_t)ULLONG_MAX);
828*c0ce8fefSTejun Heo 	__memblock_remove(&memblock.reserved, max_addr, (phys_addr_t)ULLONG_MAX);
82995f72d1eSYinghai Lu }
83095f72d1eSYinghai Lu 
831cd79481dSYinghai Lu static int __init_memblock memblock_search(struct memblock_type *type, phys_addr_t addr)
83272d4b0b4SBenjamin Herrenschmidt {
83372d4b0b4SBenjamin Herrenschmidt 	unsigned int left = 0, right = type->cnt;
83472d4b0b4SBenjamin Herrenschmidt 
83572d4b0b4SBenjamin Herrenschmidt 	do {
83672d4b0b4SBenjamin Herrenschmidt 		unsigned int mid = (right + left) / 2;
83772d4b0b4SBenjamin Herrenschmidt 
83872d4b0b4SBenjamin Herrenschmidt 		if (addr < type->regions[mid].base)
83972d4b0b4SBenjamin Herrenschmidt 			right = mid;
84072d4b0b4SBenjamin Herrenschmidt 		else if (addr >= (type->regions[mid].base +
84172d4b0b4SBenjamin Herrenschmidt 				  type->regions[mid].size))
84272d4b0b4SBenjamin Herrenschmidt 			left = mid + 1;
84372d4b0b4SBenjamin Herrenschmidt 		else
84472d4b0b4SBenjamin Herrenschmidt 			return mid;
84572d4b0b4SBenjamin Herrenschmidt 	} while (left < right);
84672d4b0b4SBenjamin Herrenschmidt 	return -1;
84772d4b0b4SBenjamin Herrenschmidt }
84872d4b0b4SBenjamin Herrenschmidt 
8492898cc4cSBenjamin Herrenschmidt int __init memblock_is_reserved(phys_addr_t addr)
85095f72d1eSYinghai Lu {
85172d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.reserved, addr) != -1;
85295f72d1eSYinghai Lu }
85372d4b0b4SBenjamin Herrenschmidt 
8543661ca66SYinghai Lu int __init_memblock memblock_is_memory(phys_addr_t addr)
85572d4b0b4SBenjamin Herrenschmidt {
85672d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.memory, addr) != -1;
85772d4b0b4SBenjamin Herrenschmidt }
85872d4b0b4SBenjamin Herrenschmidt 
8593661ca66SYinghai Lu int __init_memblock memblock_is_region_memory(phys_addr_t base, phys_addr_t size)
86072d4b0b4SBenjamin Herrenschmidt {
861abb65272STomi Valkeinen 	int idx = memblock_search(&memblock.memory, base);
862eb18f1b5STejun Heo 	phys_addr_t end = base + memblock_cap_size(base, &size);
86372d4b0b4SBenjamin Herrenschmidt 
86472d4b0b4SBenjamin Herrenschmidt 	if (idx == -1)
86595f72d1eSYinghai Lu 		return 0;
866abb65272STomi Valkeinen 	return memblock.memory.regions[idx].base <= base &&
867abb65272STomi Valkeinen 		(memblock.memory.regions[idx].base +
868eb18f1b5STejun Heo 		 memblock.memory.regions[idx].size) >= end;
86995f72d1eSYinghai Lu }
87095f72d1eSYinghai Lu 
87110d06439SYinghai Lu int __init_memblock memblock_is_region_reserved(phys_addr_t base, phys_addr_t size)
87295f72d1eSYinghai Lu {
873eb18f1b5STejun Heo 	memblock_cap_size(base, &size);
874f1c2c19cSBenjamin Herrenschmidt 	return memblock_overlaps_region(&memblock.reserved, base, size) >= 0;
87595f72d1eSYinghai Lu }
87695f72d1eSYinghai Lu 
877e63075a3SBenjamin Herrenschmidt 
8783661ca66SYinghai Lu void __init_memblock memblock_set_current_limit(phys_addr_t limit)
879e63075a3SBenjamin Herrenschmidt {
880e63075a3SBenjamin Herrenschmidt 	memblock.current_limit = limit;
881e63075a3SBenjamin Herrenschmidt }
882e63075a3SBenjamin Herrenschmidt 
8837c0caeb8STejun Heo static void __init_memblock memblock_dump(struct memblock_type *type, char *name)
8846ed311b2SBenjamin Herrenschmidt {
8856ed311b2SBenjamin Herrenschmidt 	unsigned long long base, size;
8866ed311b2SBenjamin Herrenschmidt 	int i;
8876ed311b2SBenjamin Herrenschmidt 
8887c0caeb8STejun Heo 	pr_info(" %s.cnt  = 0x%lx\n", name, type->cnt);
8896ed311b2SBenjamin Herrenschmidt 
8907c0caeb8STejun Heo 	for (i = 0; i < type->cnt; i++) {
8917c0caeb8STejun Heo 		struct memblock_region *rgn = &type->regions[i];
8927c0caeb8STejun Heo 		char nid_buf[32] = "";
8936ed311b2SBenjamin Herrenschmidt 
8947c0caeb8STejun Heo 		base = rgn->base;
8957c0caeb8STejun Heo 		size = rgn->size;
8967c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
8977c0caeb8STejun Heo 		if (memblock_get_region_node(rgn) != MAX_NUMNODES)
8987c0caeb8STejun Heo 			snprintf(nid_buf, sizeof(nid_buf), " on node %d",
8997c0caeb8STejun Heo 				 memblock_get_region_node(rgn));
9007c0caeb8STejun Heo #endif
9017c0caeb8STejun Heo 		pr_info(" %s[%#x]\t[%#016llx-%#016llx], %#llx bytes%s\n",
9027c0caeb8STejun Heo 			name, i, base, base + size - 1, size, nid_buf);
9036ed311b2SBenjamin Herrenschmidt 	}
9046ed311b2SBenjamin Herrenschmidt }
9056ed311b2SBenjamin Herrenschmidt 
9064ff7b82fSTejun Heo void __init_memblock __memblock_dump_all(void)
9076ed311b2SBenjamin Herrenschmidt {
9086ed311b2SBenjamin Herrenschmidt 	pr_info("MEMBLOCK configuration:\n");
9096ed311b2SBenjamin Herrenschmidt 	pr_info(" memory size = 0x%llx\n", (unsigned long long)memblock.memory_size);
9106ed311b2SBenjamin Herrenschmidt 
9116ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.memory, "memory");
9126ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.reserved, "reserved");
9136ed311b2SBenjamin Herrenschmidt }
9146ed311b2SBenjamin Herrenschmidt 
9156ed311b2SBenjamin Herrenschmidt void __init memblock_analyze(void)
9166ed311b2SBenjamin Herrenschmidt {
9176ed311b2SBenjamin Herrenschmidt 	int i;
9186ed311b2SBenjamin Herrenschmidt 
9196ed311b2SBenjamin Herrenschmidt 	memblock.memory_size = 0;
9206ed311b2SBenjamin Herrenschmidt 
9216ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < memblock.memory.cnt; i++)
9226ed311b2SBenjamin Herrenschmidt 		memblock.memory_size += memblock.memory.regions[i].size;
923142b45a7SBenjamin Herrenschmidt 
924142b45a7SBenjamin Herrenschmidt 	/* We allow resizing from there */
925142b45a7SBenjamin Herrenschmidt 	memblock_can_resize = 1;
9266ed311b2SBenjamin Herrenschmidt }
9276ed311b2SBenjamin Herrenschmidt 
9286ed311b2SBenjamin Herrenschmidt static int __init early_memblock(char *p)
9296ed311b2SBenjamin Herrenschmidt {
9306ed311b2SBenjamin Herrenschmidt 	if (p && strstr(p, "debug"))
9316ed311b2SBenjamin Herrenschmidt 		memblock_debug = 1;
9326ed311b2SBenjamin Herrenschmidt 	return 0;
9336ed311b2SBenjamin Herrenschmidt }
9346ed311b2SBenjamin Herrenschmidt early_param("memblock", early_memblock);
9356ed311b2SBenjamin Herrenschmidt 
936c378ddd5STejun Heo #if defined(CONFIG_DEBUG_FS) && !defined(CONFIG_ARCH_DISCARD_MEMBLOCK)
9376d03b885SBenjamin Herrenschmidt 
9386d03b885SBenjamin Herrenschmidt static int memblock_debug_show(struct seq_file *m, void *private)
9396d03b885SBenjamin Herrenschmidt {
9406d03b885SBenjamin Herrenschmidt 	struct memblock_type *type = m->private;
9416d03b885SBenjamin Herrenschmidt 	struct memblock_region *reg;
9426d03b885SBenjamin Herrenschmidt 	int i;
9436d03b885SBenjamin Herrenschmidt 
9446d03b885SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
9456d03b885SBenjamin Herrenschmidt 		reg = &type->regions[i];
9466d03b885SBenjamin Herrenschmidt 		seq_printf(m, "%4d: ", i);
9476d03b885SBenjamin Herrenschmidt 		if (sizeof(phys_addr_t) == 4)
9486d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%08lx..0x%08lx\n",
9496d03b885SBenjamin Herrenschmidt 				   (unsigned long)reg->base,
9506d03b885SBenjamin Herrenschmidt 				   (unsigned long)(reg->base + reg->size - 1));
9516d03b885SBenjamin Herrenschmidt 		else
9526d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%016llx..0x%016llx\n",
9536d03b885SBenjamin Herrenschmidt 				   (unsigned long long)reg->base,
9546d03b885SBenjamin Herrenschmidt 				   (unsigned long long)(reg->base + reg->size - 1));
9556d03b885SBenjamin Herrenschmidt 
9566d03b885SBenjamin Herrenschmidt 	}
9576d03b885SBenjamin Herrenschmidt 	return 0;
9586d03b885SBenjamin Herrenschmidt }
9596d03b885SBenjamin Herrenschmidt 
9606d03b885SBenjamin Herrenschmidt static int memblock_debug_open(struct inode *inode, struct file *file)
9616d03b885SBenjamin Herrenschmidt {
9626d03b885SBenjamin Herrenschmidt 	return single_open(file, memblock_debug_show, inode->i_private);
9636d03b885SBenjamin Herrenschmidt }
9646d03b885SBenjamin Herrenschmidt 
9656d03b885SBenjamin Herrenschmidt static const struct file_operations memblock_debug_fops = {
9666d03b885SBenjamin Herrenschmidt 	.open = memblock_debug_open,
9676d03b885SBenjamin Herrenschmidt 	.read = seq_read,
9686d03b885SBenjamin Herrenschmidt 	.llseek = seq_lseek,
9696d03b885SBenjamin Herrenschmidt 	.release = single_release,
9706d03b885SBenjamin Herrenschmidt };
9716d03b885SBenjamin Herrenschmidt 
9726d03b885SBenjamin Herrenschmidt static int __init memblock_init_debugfs(void)
9736d03b885SBenjamin Herrenschmidt {
9746d03b885SBenjamin Herrenschmidt 	struct dentry *root = debugfs_create_dir("memblock", NULL);
9756d03b885SBenjamin Herrenschmidt 	if (!root)
9766d03b885SBenjamin Herrenschmidt 		return -ENXIO;
9776d03b885SBenjamin Herrenschmidt 	debugfs_create_file("memory", S_IRUGO, root, &memblock.memory, &memblock_debug_fops);
9786d03b885SBenjamin Herrenschmidt 	debugfs_create_file("reserved", S_IRUGO, root, &memblock.reserved, &memblock_debug_fops);
9796d03b885SBenjamin Herrenschmidt 
9806d03b885SBenjamin Herrenschmidt 	return 0;
9816d03b885SBenjamin Herrenschmidt }
9826d03b885SBenjamin Herrenschmidt __initcall(memblock_init_debugfs);
9836d03b885SBenjamin Herrenschmidt 
9846d03b885SBenjamin Herrenschmidt #endif /* CONFIG_DEBUG_FS */
985