xref: /linux/mm/memblock.c (revision 6a9ceb31c06f1e8d50be79259756fda73234868d)
195f72d1eSYinghai Lu /*
295f72d1eSYinghai Lu  * Procedures for maintaining information about logical memory blocks.
395f72d1eSYinghai Lu  *
495f72d1eSYinghai Lu  * Peter Bergner, IBM Corp.	June 2001.
595f72d1eSYinghai Lu  * Copyright (C) 2001 Peter Bergner.
695f72d1eSYinghai Lu  *
795f72d1eSYinghai Lu  *      This program is free software; you can redistribute it and/or
895f72d1eSYinghai Lu  *      modify it under the terms of the GNU General Public License
995f72d1eSYinghai Lu  *      as published by the Free Software Foundation; either version
1095f72d1eSYinghai Lu  *      2 of the License, or (at your option) any later version.
1195f72d1eSYinghai Lu  */
1295f72d1eSYinghai Lu 
1395f72d1eSYinghai Lu #include <linux/kernel.h>
14142b45a7SBenjamin Herrenschmidt #include <linux/slab.h>
1595f72d1eSYinghai Lu #include <linux/init.h>
1695f72d1eSYinghai Lu #include <linux/bitops.h>
17449e8df3SBenjamin Herrenschmidt #include <linux/poison.h>
18c196f76fSBenjamin Herrenschmidt #include <linux/pfn.h>
196d03b885SBenjamin Herrenschmidt #include <linux/debugfs.h>
206d03b885SBenjamin Herrenschmidt #include <linux/seq_file.h>
2195f72d1eSYinghai Lu #include <linux/memblock.h>
2295f72d1eSYinghai Lu 
23fe091c20STejun Heo static struct memblock_region memblock_memory_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock;
24fe091c20STejun Heo static struct memblock_region memblock_reserved_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock;
25fe091c20STejun Heo 
26fe091c20STejun Heo struct memblock memblock __initdata_memblock = {
27fe091c20STejun Heo 	.memory.regions		= memblock_memory_init_regions,
28fe091c20STejun Heo 	.memory.cnt		= 1,	/* empty dummy entry */
29fe091c20STejun Heo 	.memory.max		= INIT_MEMBLOCK_REGIONS,
30fe091c20STejun Heo 
31fe091c20STejun Heo 	.reserved.regions	= memblock_reserved_init_regions,
32fe091c20STejun Heo 	.reserved.cnt		= 1,	/* empty dummy entry */
33fe091c20STejun Heo 	.reserved.max		= INIT_MEMBLOCK_REGIONS,
34fe091c20STejun Heo 
35fe091c20STejun Heo 	.current_limit		= MEMBLOCK_ALLOC_ANYWHERE,
36fe091c20STejun Heo };
3795f72d1eSYinghai Lu 
3810d06439SYinghai Lu int memblock_debug __initdata_memblock;
3910d06439SYinghai Lu int memblock_can_resize __initdata_memblock;
4095f72d1eSYinghai Lu 
41142b45a7SBenjamin Herrenschmidt /* inline so we don't get a warning when pr_debug is compiled out */
42142b45a7SBenjamin Herrenschmidt static inline const char *memblock_type_name(struct memblock_type *type)
43142b45a7SBenjamin Herrenschmidt {
44142b45a7SBenjamin Herrenschmidt 	if (type == &memblock.memory)
45142b45a7SBenjamin Herrenschmidt 		return "memory";
46142b45a7SBenjamin Herrenschmidt 	else if (type == &memblock.reserved)
47142b45a7SBenjamin Herrenschmidt 		return "reserved";
48142b45a7SBenjamin Herrenschmidt 	else
49142b45a7SBenjamin Herrenschmidt 		return "unknown";
50142b45a7SBenjamin Herrenschmidt }
51142b45a7SBenjamin Herrenschmidt 
526ed311b2SBenjamin Herrenschmidt /*
536ed311b2SBenjamin Herrenschmidt  * Address comparison utilities
546ed311b2SBenjamin Herrenschmidt  */
5510d06439SYinghai Lu static unsigned long __init_memblock memblock_addrs_overlap(phys_addr_t base1, phys_addr_t size1,
562898cc4cSBenjamin Herrenschmidt 				       phys_addr_t base2, phys_addr_t size2)
5795f72d1eSYinghai Lu {
5895f72d1eSYinghai Lu 	return ((base1 < (base2 + size2)) && (base2 < (base1 + size1)));
5995f72d1eSYinghai Lu }
6095f72d1eSYinghai Lu 
612d7d3eb2SH Hartley Sweeten static long __init_memblock memblock_overlaps_region(struct memblock_type *type,
622d7d3eb2SH Hartley Sweeten 					phys_addr_t base, phys_addr_t size)
636ed311b2SBenjamin Herrenschmidt {
646ed311b2SBenjamin Herrenschmidt 	unsigned long i;
656ed311b2SBenjamin Herrenschmidt 
666ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
676ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnbase = type->regions[i].base;
686ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnsize = type->regions[i].size;
696ed311b2SBenjamin Herrenschmidt 		if (memblock_addrs_overlap(base, size, rgnbase, rgnsize))
706ed311b2SBenjamin Herrenschmidt 			break;
716ed311b2SBenjamin Herrenschmidt 	}
726ed311b2SBenjamin Herrenschmidt 
736ed311b2SBenjamin Herrenschmidt 	return (i < type->cnt) ? i : -1;
746ed311b2SBenjamin Herrenschmidt }
756ed311b2SBenjamin Herrenschmidt 
766ed311b2SBenjamin Herrenschmidt /*
776ed311b2SBenjamin Herrenschmidt  * Find, allocate, deallocate or reserve unreserved regions. All allocations
786ed311b2SBenjamin Herrenschmidt  * are top-down.
796ed311b2SBenjamin Herrenschmidt  */
806ed311b2SBenjamin Herrenschmidt 
81cd79481dSYinghai Lu static phys_addr_t __init_memblock memblock_find_region(phys_addr_t start, phys_addr_t end,
826ed311b2SBenjamin Herrenschmidt 					  phys_addr_t size, phys_addr_t align)
836ed311b2SBenjamin Herrenschmidt {
846ed311b2SBenjamin Herrenschmidt 	phys_addr_t base, res_base;
856ed311b2SBenjamin Herrenschmidt 	long j;
866ed311b2SBenjamin Herrenschmidt 
87f1af98c7SYinghai Lu 	/* In case, huge size is requested */
88f1af98c7SYinghai Lu 	if (end < size)
891f5026a7STejun Heo 		return 0;
90f1af98c7SYinghai Lu 
91348968ebSTejun Heo 	base = round_down(end - size, align);
92f1af98c7SYinghai Lu 
9325818f0fSBenjamin Herrenschmidt 	/* Prevent allocations returning 0 as it's also used to
9425818f0fSBenjamin Herrenschmidt 	 * indicate an allocation failure
9525818f0fSBenjamin Herrenschmidt 	 */
9625818f0fSBenjamin Herrenschmidt 	if (start == 0)
9725818f0fSBenjamin Herrenschmidt 		start = PAGE_SIZE;
9825818f0fSBenjamin Herrenschmidt 
996ed311b2SBenjamin Herrenschmidt 	while (start <= base) {
1006ed311b2SBenjamin Herrenschmidt 		j = memblock_overlaps_region(&memblock.reserved, base, size);
1016ed311b2SBenjamin Herrenschmidt 		if (j < 0)
1026ed311b2SBenjamin Herrenschmidt 			return base;
1036ed311b2SBenjamin Herrenschmidt 		res_base = memblock.reserved.regions[j].base;
1046ed311b2SBenjamin Herrenschmidt 		if (res_base < size)
1056ed311b2SBenjamin Herrenschmidt 			break;
106348968ebSTejun Heo 		base = round_down(res_base - size, align);
1076ed311b2SBenjamin Herrenschmidt 	}
1086ed311b2SBenjamin Herrenschmidt 
1091f5026a7STejun Heo 	return 0;
1106ed311b2SBenjamin Herrenschmidt }
1116ed311b2SBenjamin Herrenschmidt 
112fc769a8eSTejun Heo /*
113fc769a8eSTejun Heo  * Find a free area with specified alignment in a specific range.
114fc769a8eSTejun Heo  */
115fc769a8eSTejun Heo phys_addr_t __init_memblock memblock_find_in_range(phys_addr_t start, phys_addr_t end,
116fc769a8eSTejun Heo 					phys_addr_t size, phys_addr_t align)
1176ed311b2SBenjamin Herrenschmidt {
1186ed311b2SBenjamin Herrenschmidt 	long i;
1196ed311b2SBenjamin Herrenschmidt 
1206ed311b2SBenjamin Herrenschmidt 	BUG_ON(0 == size);
1216ed311b2SBenjamin Herrenschmidt 
1226ed311b2SBenjamin Herrenschmidt 	/* Pump up max_addr */
123fef501d4SBenjamin Herrenschmidt 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
124fef501d4SBenjamin Herrenschmidt 		end = memblock.current_limit;
1256ed311b2SBenjamin Herrenschmidt 
1266ed311b2SBenjamin Herrenschmidt 	/* We do a top-down search, this tends to limit memory
1276ed311b2SBenjamin Herrenschmidt 	 * fragmentation by keeping early boot allocs near the
1286ed311b2SBenjamin Herrenschmidt 	 * top of memory
1296ed311b2SBenjamin Herrenschmidt 	 */
1306ed311b2SBenjamin Herrenschmidt 	for (i = memblock.memory.cnt - 1; i >= 0; i--) {
1316ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblockbase = memblock.memory.regions[i].base;
1326ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblocksize = memblock.memory.regions[i].size;
133fef501d4SBenjamin Herrenschmidt 		phys_addr_t bottom, top, found;
1346ed311b2SBenjamin Herrenschmidt 
1356ed311b2SBenjamin Herrenschmidt 		if (memblocksize < size)
1366ed311b2SBenjamin Herrenschmidt 			continue;
137fef501d4SBenjamin Herrenschmidt 		if ((memblockbase + memblocksize) <= start)
138fef501d4SBenjamin Herrenschmidt 			break;
139fef501d4SBenjamin Herrenschmidt 		bottom = max(memblockbase, start);
140fef501d4SBenjamin Herrenschmidt 		top = min(memblockbase + memblocksize, end);
141fef501d4SBenjamin Herrenschmidt 		if (bottom >= top)
142fef501d4SBenjamin Herrenschmidt 			continue;
143fef501d4SBenjamin Herrenschmidt 		found = memblock_find_region(bottom, top, size, align);
1441f5026a7STejun Heo 		if (found)
145fef501d4SBenjamin Herrenschmidt 			return found;
1466ed311b2SBenjamin Herrenschmidt 	}
1471f5026a7STejun Heo 	return 0;
1486ed311b2SBenjamin Herrenschmidt }
1496ed311b2SBenjamin Herrenschmidt 
1505303b68fSYinghai Lu /*
1517950c407SYinghai Lu  * Free memblock.reserved.regions
1527950c407SYinghai Lu  */
1537950c407SYinghai Lu int __init_memblock memblock_free_reserved_regions(void)
1547950c407SYinghai Lu {
1557950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1567950c407SYinghai Lu 		return 0;
1577950c407SYinghai Lu 
1587950c407SYinghai Lu 	return memblock_free(__pa(memblock.reserved.regions),
1597950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1607950c407SYinghai Lu }
1617950c407SYinghai Lu 
1627950c407SYinghai Lu /*
1637950c407SYinghai Lu  * Reserve memblock.reserved.regions
1647950c407SYinghai Lu  */
1657950c407SYinghai Lu int __init_memblock memblock_reserve_reserved_regions(void)
1667950c407SYinghai Lu {
1677950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1687950c407SYinghai Lu 		return 0;
1697950c407SYinghai Lu 
1707950c407SYinghai Lu 	return memblock_reserve(__pa(memblock.reserved.regions),
1717950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1727950c407SYinghai Lu }
1737950c407SYinghai Lu 
17410d06439SYinghai Lu static void __init_memblock memblock_remove_region(struct memblock_type *type, unsigned long r)
17595f72d1eSYinghai Lu {
1767c0caeb8STejun Heo 	memmove(&type->regions[r], &type->regions[r + 1],
1777c0caeb8STejun Heo 		(type->cnt - (r + 1)) * sizeof(type->regions[r]));
178e3239ff9SBenjamin Herrenschmidt 	type->cnt--;
17995f72d1eSYinghai Lu 
1808f7a6605SBenjamin Herrenschmidt 	/* Special case for empty arrays */
1818f7a6605SBenjamin Herrenschmidt 	if (type->cnt == 0) {
1828f7a6605SBenjamin Herrenschmidt 		type->cnt = 1;
1838f7a6605SBenjamin Herrenschmidt 		type->regions[0].base = 0;
1848f7a6605SBenjamin Herrenschmidt 		type->regions[0].size = 0;
1857c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
1868f7a6605SBenjamin Herrenschmidt 	}
18795f72d1eSYinghai Lu }
18895f72d1eSYinghai Lu 
18910d06439SYinghai Lu static int __init_memblock memblock_double_array(struct memblock_type *type)
190142b45a7SBenjamin Herrenschmidt {
191142b45a7SBenjamin Herrenschmidt 	struct memblock_region *new_array, *old_array;
192142b45a7SBenjamin Herrenschmidt 	phys_addr_t old_size, new_size, addr;
193142b45a7SBenjamin Herrenschmidt 	int use_slab = slab_is_available();
194142b45a7SBenjamin Herrenschmidt 
195142b45a7SBenjamin Herrenschmidt 	/* We don't allow resizing until we know about the reserved regions
196142b45a7SBenjamin Herrenschmidt 	 * of memory that aren't suitable for allocation
197142b45a7SBenjamin Herrenschmidt 	 */
198142b45a7SBenjamin Herrenschmidt 	if (!memblock_can_resize)
199142b45a7SBenjamin Herrenschmidt 		return -1;
200142b45a7SBenjamin Herrenschmidt 
201142b45a7SBenjamin Herrenschmidt 	/* Calculate new doubled size */
202142b45a7SBenjamin Herrenschmidt 	old_size = type->max * sizeof(struct memblock_region);
203142b45a7SBenjamin Herrenschmidt 	new_size = old_size << 1;
204142b45a7SBenjamin Herrenschmidt 
205142b45a7SBenjamin Herrenschmidt 	/* Try to find some space for it.
206142b45a7SBenjamin Herrenschmidt 	 *
207142b45a7SBenjamin Herrenschmidt 	 * WARNING: We assume that either slab_is_available() and we use it or
208142b45a7SBenjamin Herrenschmidt 	 * we use MEMBLOCK for allocations. That means that this is unsafe to use
209142b45a7SBenjamin Herrenschmidt 	 * when bootmem is currently active (unless bootmem itself is implemented
210142b45a7SBenjamin Herrenschmidt 	 * on top of MEMBLOCK which isn't the case yet)
211142b45a7SBenjamin Herrenschmidt 	 *
212142b45a7SBenjamin Herrenschmidt 	 * This should however not be an issue for now, as we currently only
213142b45a7SBenjamin Herrenschmidt 	 * call into MEMBLOCK while it's still active, or much later when slab is
214142b45a7SBenjamin Herrenschmidt 	 * active for memory hotplug operations
215142b45a7SBenjamin Herrenschmidt 	 */
216142b45a7SBenjamin Herrenschmidt 	if (use_slab) {
217142b45a7SBenjamin Herrenschmidt 		new_array = kmalloc(new_size, GFP_KERNEL);
2181f5026a7STejun Heo 		addr = new_array ? __pa(new_array) : 0;
219142b45a7SBenjamin Herrenschmidt 	} else
220fc769a8eSTejun Heo 		addr = memblock_find_in_range(0, MEMBLOCK_ALLOC_ACCESSIBLE, new_size, sizeof(phys_addr_t));
2211f5026a7STejun Heo 	if (!addr) {
222142b45a7SBenjamin Herrenschmidt 		pr_err("memblock: Failed to double %s array from %ld to %ld entries !\n",
223142b45a7SBenjamin Herrenschmidt 		       memblock_type_name(type), type->max, type->max * 2);
224142b45a7SBenjamin Herrenschmidt 		return -1;
225142b45a7SBenjamin Herrenschmidt 	}
226142b45a7SBenjamin Herrenschmidt 	new_array = __va(addr);
227142b45a7SBenjamin Herrenschmidt 
228ea9e4376SYinghai Lu 	memblock_dbg("memblock: %s array is doubled to %ld at [%#010llx-%#010llx]",
229ea9e4376SYinghai Lu 		 memblock_type_name(type), type->max * 2, (u64)addr, (u64)addr + new_size - 1);
230ea9e4376SYinghai Lu 
231142b45a7SBenjamin Herrenschmidt 	/* Found space, we now need to move the array over before
232142b45a7SBenjamin Herrenschmidt 	 * we add the reserved region since it may be our reserved
233142b45a7SBenjamin Herrenschmidt 	 * array itself that is full.
234142b45a7SBenjamin Herrenschmidt 	 */
235142b45a7SBenjamin Herrenschmidt 	memcpy(new_array, type->regions, old_size);
236142b45a7SBenjamin Herrenschmidt 	memset(new_array + type->max, 0, old_size);
237142b45a7SBenjamin Herrenschmidt 	old_array = type->regions;
238142b45a7SBenjamin Herrenschmidt 	type->regions = new_array;
239142b45a7SBenjamin Herrenschmidt 	type->max <<= 1;
240142b45a7SBenjamin Herrenschmidt 
241142b45a7SBenjamin Herrenschmidt 	/* If we use SLAB that's it, we are done */
242142b45a7SBenjamin Herrenschmidt 	if (use_slab)
243142b45a7SBenjamin Herrenschmidt 		return 0;
244142b45a7SBenjamin Herrenschmidt 
245142b45a7SBenjamin Herrenschmidt 	/* Add the new reserved region now. Should not fail ! */
2469c8c27e2STejun Heo 	BUG_ON(memblock_reserve(addr, new_size));
247142b45a7SBenjamin Herrenschmidt 
248142b45a7SBenjamin Herrenschmidt 	/* If the array wasn't our static init one, then free it. We only do
249142b45a7SBenjamin Herrenschmidt 	 * that before SLAB is available as later on, we don't know whether
250142b45a7SBenjamin Herrenschmidt 	 * to use kfree or free_bootmem_pages(). Shouldn't be a big deal
251142b45a7SBenjamin Herrenschmidt 	 * anyways
252142b45a7SBenjamin Herrenschmidt 	 */
253142b45a7SBenjamin Herrenschmidt 	if (old_array != memblock_memory_init_regions &&
254142b45a7SBenjamin Herrenschmidt 	    old_array != memblock_reserved_init_regions)
255142b45a7SBenjamin Herrenschmidt 		memblock_free(__pa(old_array), old_size);
256142b45a7SBenjamin Herrenschmidt 
257142b45a7SBenjamin Herrenschmidt 	return 0;
258142b45a7SBenjamin Herrenschmidt }
259142b45a7SBenjamin Herrenschmidt 
260784656f9STejun Heo /**
261784656f9STejun Heo  * memblock_merge_regions - merge neighboring compatible regions
262784656f9STejun Heo  * @type: memblock type to scan
263784656f9STejun Heo  *
264784656f9STejun Heo  * Scan @type and merge neighboring compatible regions.
265784656f9STejun Heo  */
266784656f9STejun Heo static void __init_memblock memblock_merge_regions(struct memblock_type *type)
267784656f9STejun Heo {
268784656f9STejun Heo 	int i = 0;
269784656f9STejun Heo 
270784656f9STejun Heo 	/* cnt never goes below 1 */
271784656f9STejun Heo 	while (i < type->cnt - 1) {
272784656f9STejun Heo 		struct memblock_region *this = &type->regions[i];
273784656f9STejun Heo 		struct memblock_region *next = &type->regions[i + 1];
274784656f9STejun Heo 
2757c0caeb8STejun Heo 		if (this->base + this->size != next->base ||
2767c0caeb8STejun Heo 		    memblock_get_region_node(this) !=
2777c0caeb8STejun Heo 		    memblock_get_region_node(next)) {
278784656f9STejun Heo 			BUG_ON(this->base + this->size > next->base);
279784656f9STejun Heo 			i++;
280784656f9STejun Heo 			continue;
281784656f9STejun Heo 		}
282784656f9STejun Heo 
283784656f9STejun Heo 		this->size += next->size;
284784656f9STejun Heo 		memmove(next, next + 1, (type->cnt - (i + 1)) * sizeof(*next));
285784656f9STejun Heo 		type->cnt--;
286784656f9STejun Heo 	}
287784656f9STejun Heo }
288784656f9STejun Heo 
289784656f9STejun Heo /**
290784656f9STejun Heo  * memblock_insert_region - insert new memblock region
291784656f9STejun Heo  * @type: memblock type to insert into
292784656f9STejun Heo  * @idx: index for the insertion point
293784656f9STejun Heo  * @base: base address of the new region
294784656f9STejun Heo  * @size: size of the new region
295784656f9STejun Heo  *
296784656f9STejun Heo  * Insert new memblock region [@base,@base+@size) into @type at @idx.
297784656f9STejun Heo  * @type must already have extra room to accomodate the new region.
298784656f9STejun Heo  */
299784656f9STejun Heo static void __init_memblock memblock_insert_region(struct memblock_type *type,
300784656f9STejun Heo 						   int idx, phys_addr_t base,
3017c0caeb8STejun Heo 						   phys_addr_t size, int nid)
302784656f9STejun Heo {
303784656f9STejun Heo 	struct memblock_region *rgn = &type->regions[idx];
304784656f9STejun Heo 
305784656f9STejun Heo 	BUG_ON(type->cnt >= type->max);
306784656f9STejun Heo 	memmove(rgn + 1, rgn, (type->cnt - idx) * sizeof(*rgn));
307784656f9STejun Heo 	rgn->base = base;
308784656f9STejun Heo 	rgn->size = size;
3097c0caeb8STejun Heo 	memblock_set_region_node(rgn, nid);
310784656f9STejun Heo 	type->cnt++;
311784656f9STejun Heo }
312784656f9STejun Heo 
313784656f9STejun Heo /**
314784656f9STejun Heo  * memblock_add_region - add new memblock region
315784656f9STejun Heo  * @type: memblock type to add new region into
316784656f9STejun Heo  * @base: base address of the new region
317784656f9STejun Heo  * @size: size of the new region
318784656f9STejun Heo  *
319784656f9STejun Heo  * Add new memblock region [@base,@base+@size) into @type.  The new region
320784656f9STejun Heo  * is allowed to overlap with existing ones - overlaps don't affect already
321784656f9STejun Heo  * existing regions.  @type is guaranteed to be minimal (all neighbouring
322784656f9STejun Heo  * compatible regions are merged) after the addition.
323784656f9STejun Heo  *
324784656f9STejun Heo  * RETURNS:
325784656f9STejun Heo  * 0 on success, -errno on failure.
326784656f9STejun Heo  */
327581adcbeSTejun Heo static int __init_memblock memblock_add_region(struct memblock_type *type,
3288f7a6605SBenjamin Herrenschmidt 					       phys_addr_t base, phys_addr_t size)
32995f72d1eSYinghai Lu {
330784656f9STejun Heo 	bool insert = false;
331784656f9STejun Heo 	phys_addr_t obase = base, end = base + size;
332784656f9STejun Heo 	int i, nr_new;
33395f72d1eSYinghai Lu 
334784656f9STejun Heo 	/* special case for empty array */
335784656f9STejun Heo 	if (type->regions[0].size == 0) {
336784656f9STejun Heo 		WARN_ON(type->cnt != 1);
337784656f9STejun Heo 		type->regions[0].base = base;
338784656f9STejun Heo 		type->regions[0].size = size;
3397c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
340784656f9STejun Heo 		return 0;
341784656f9STejun Heo 	}
342784656f9STejun Heo repeat:
343784656f9STejun Heo 	/*
344784656f9STejun Heo 	 * The following is executed twice.  Once with %false @insert and
345784656f9STejun Heo 	 * then with %true.  The first counts the number of regions needed
346784656f9STejun Heo 	 * to accomodate the new area.  The second actually inserts them.
347784656f9STejun Heo 	 */
348784656f9STejun Heo 	base = obase;
349784656f9STejun Heo 	nr_new = 0;
350784656f9STejun Heo 
3518f7a6605SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
3528f7a6605SBenjamin Herrenschmidt 		struct memblock_region *rgn = &type->regions[i];
353784656f9STejun Heo 		phys_addr_t rbase = rgn->base;
354784656f9STejun Heo 		phys_addr_t rend = rbase + rgn->size;
3558f7a6605SBenjamin Herrenschmidt 
356784656f9STejun Heo 		if (rbase >= end)
3578f7a6605SBenjamin Herrenschmidt 			break;
358784656f9STejun Heo 		if (rend <= base)
359784656f9STejun Heo 			continue;
360784656f9STejun Heo 		/*
361784656f9STejun Heo 		 * @rgn overlaps.  If it separates the lower part of new
362784656f9STejun Heo 		 * area, insert that portion.
3638f7a6605SBenjamin Herrenschmidt 		 */
364784656f9STejun Heo 		if (rbase > base) {
365784656f9STejun Heo 			nr_new++;
366784656f9STejun Heo 			if (insert)
367784656f9STejun Heo 				memblock_insert_region(type, i++, base,
3687c0caeb8STejun Heo 						rbase - base, MAX_NUMNODES);
369784656f9STejun Heo 		}
370784656f9STejun Heo 		/* area below @rend is dealt with, forget about it */
371784656f9STejun Heo 		base = min(rend, end);
3728f7a6605SBenjamin Herrenschmidt 	}
3738f7a6605SBenjamin Herrenschmidt 
374784656f9STejun Heo 	/* insert the remaining portion */
375784656f9STejun Heo 	if (base < end) {
376784656f9STejun Heo 		nr_new++;
377784656f9STejun Heo 		if (insert)
3787c0caeb8STejun Heo 			memblock_insert_region(type, i, base, end - base,
3797c0caeb8STejun Heo 					       MAX_NUMNODES);
3808f7a6605SBenjamin Herrenschmidt 	}
3818f7a6605SBenjamin Herrenschmidt 
382784656f9STejun Heo 	/*
383784656f9STejun Heo 	 * If this was the first round, resize array and repeat for actual
384784656f9STejun Heo 	 * insertions; otherwise, merge and return.
3858f7a6605SBenjamin Herrenschmidt 	 */
386784656f9STejun Heo 	if (!insert) {
387784656f9STejun Heo 		while (type->cnt + nr_new > type->max)
388784656f9STejun Heo 			if (memblock_double_array(type) < 0)
389784656f9STejun Heo 				return -ENOMEM;
390784656f9STejun Heo 		insert = true;
391784656f9STejun Heo 		goto repeat;
39295f72d1eSYinghai Lu 	} else {
393784656f9STejun Heo 		memblock_merge_regions(type);
39495f72d1eSYinghai Lu 		return 0;
39595f72d1eSYinghai Lu 	}
396784656f9STejun Heo }
39795f72d1eSYinghai Lu 
398581adcbeSTejun Heo int __init_memblock memblock_add(phys_addr_t base, phys_addr_t size)
39995f72d1eSYinghai Lu {
400e3239ff9SBenjamin Herrenschmidt 	return memblock_add_region(&memblock.memory, base, size);
40195f72d1eSYinghai Lu }
40295f72d1eSYinghai Lu 
#ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
/**
 * memblock_isolate_range - isolate given range into disjoint memblocks
 * @type: memblock type to isolate range for
 * @base: base of range to isolate
 * @size: size of range to isolate
 * @start_rgn: out parameter for the start of isolated region
 * @end_rgn: out parameter for the end of isolated region
 *
 * Walk @type and ensure that regions don't cross the boundaries defined by
 * [@base,@base+@size).  Crossing regions are split at the boundaries,
 * which may create at most two more regions.  The index of the first
 * region inside the range is returned in *@start_rgn and one past the last
 * in *@end_rgn.  Both are 0 when no region lies inside the range.
 *
 * RETURNS:
 * 0 on success, -ENOMEM if the region array could not be grown.
 */
static int __init_memblock memblock_isolate_range(struct memblock_type *type,
					phys_addr_t base, phys_addr_t size,
					int *start_rgn, int *end_rgn)
{
	const phys_addr_t end = base + size;
	int idx;

	*end_rgn = 0;
	*start_rgn = 0;

	/* we'll create at most two more regions */
	while (type->cnt + 2 > type->max) {
		if (memblock_double_array(type) < 0)
			return -ENOMEM;
	}

	for (idx = 0; idx < type->cnt; idx++) {
		struct memblock_region *rgn = &type->regions[idx];
		phys_addr_t rbase = rgn->base;
		phys_addr_t rend = rbase + rgn->size;

		if (rbase >= end)
			break;
		if (rend <= base)
			continue;

		if (rbase >= base && rend <= end) {
			/* @rgn is fully contained, record it */
			if (!*end_rgn)
				*start_rgn = idx;
			*end_rgn = idx + 1;
			continue;
		}

		if (rbase < base) {
			/*
			 * @rgn intersects from below.  Shrink it to the top
			 * half and insert the bottom half in front of it;
			 * the next iteration then processes the top half.
			 */
			rgn->base = base;
			rgn->size = rend - base;
			memblock_insert_region(type, idx, rbase, base - rbase,
					       rgn->nid);
			continue;
		}

		/*
		 * @rgn intersects from above.  Shrink it to the part beyond
		 * @end, insert the bottom half in front of it and redo the
		 * current index - the new bottom half.
		 */
		rgn->base = end;
		rgn->size = rend - end;
		memblock_insert_region(type, idx, rbase, end - rbase,
				       rgn->nid);
		idx--;
	}

	return 0;
}
#endif
473*6a9ceb31STejun Heo 
474581adcbeSTejun Heo static int __init_memblock __memblock_remove(struct memblock_type *type,
4758f7a6605SBenjamin Herrenschmidt 					     phys_addr_t base, phys_addr_t size)
47695f72d1eSYinghai Lu {
4772898cc4cSBenjamin Herrenschmidt 	phys_addr_t end = base + size;
47895f72d1eSYinghai Lu 	int i;
47995f72d1eSYinghai Lu 
4808f7a6605SBenjamin Herrenschmidt 	/* Walk through the array for collisions */
481e3239ff9SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
4828f7a6605SBenjamin Herrenschmidt 		struct memblock_region *rgn = &type->regions[i];
4838f7a6605SBenjamin Herrenschmidt 		phys_addr_t rend = rgn->base + rgn->size;
48495f72d1eSYinghai Lu 
4858f7a6605SBenjamin Herrenschmidt 		/* Nothing more to do, exit */
4868f7a6605SBenjamin Herrenschmidt 		if (rgn->base > end || rgn->size == 0)
4878f7a6605SBenjamin Herrenschmidt 			break;
4888f7a6605SBenjamin Herrenschmidt 
4898f7a6605SBenjamin Herrenschmidt 		/* If we fully enclose the block, drop it */
4908f7a6605SBenjamin Herrenschmidt 		if (base <= rgn->base && end >= rend) {
4918f7a6605SBenjamin Herrenschmidt 			memblock_remove_region(type, i--);
4928f7a6605SBenjamin Herrenschmidt 			continue;
4938f7a6605SBenjamin Herrenschmidt 		}
4948f7a6605SBenjamin Herrenschmidt 
4958f7a6605SBenjamin Herrenschmidt 		/* If we are fully enclosed within a block
4968f7a6605SBenjamin Herrenschmidt 		 * then we need to split it and we are done
4978f7a6605SBenjamin Herrenschmidt 		 */
4988f7a6605SBenjamin Herrenschmidt 		if (base > rgn->base && end < rend) {
4998f7a6605SBenjamin Herrenschmidt 			rgn->size = base - rgn->base;
5008f7a6605SBenjamin Herrenschmidt 			if (!memblock_add_region(type, end, rend - end))
5018f7a6605SBenjamin Herrenschmidt 				return 0;
5028f7a6605SBenjamin Herrenschmidt 			/* Failure to split is bad, we at least
5038f7a6605SBenjamin Herrenschmidt 			 * restore the block before erroring
5048f7a6605SBenjamin Herrenschmidt 			 */
5058f7a6605SBenjamin Herrenschmidt 			rgn->size = rend - rgn->base;
5068f7a6605SBenjamin Herrenschmidt 			WARN_ON(1);
5078f7a6605SBenjamin Herrenschmidt 			return -1;
5088f7a6605SBenjamin Herrenschmidt 		}
5098f7a6605SBenjamin Herrenschmidt 
5108f7a6605SBenjamin Herrenschmidt 		/* Check if we need to trim the bottom of a block */
5118f7a6605SBenjamin Herrenschmidt 		if (rgn->base < end && rend > end) {
5128f7a6605SBenjamin Herrenschmidt 			rgn->size -= end - rgn->base;
5138f7a6605SBenjamin Herrenschmidt 			rgn->base = end;
51495f72d1eSYinghai Lu 			break;
51595f72d1eSYinghai Lu 		}
51695f72d1eSYinghai Lu 
5178f7a6605SBenjamin Herrenschmidt 		/* And check if we need to trim the top of a block */
5188f7a6605SBenjamin Herrenschmidt 		if (base < rend)
5198f7a6605SBenjamin Herrenschmidt 			rgn->size -= rend - base;
52095f72d1eSYinghai Lu 
52195f72d1eSYinghai Lu 	}
52295f72d1eSYinghai Lu 	return 0;
52395f72d1eSYinghai Lu }
52495f72d1eSYinghai Lu 
525581adcbeSTejun Heo int __init_memblock memblock_remove(phys_addr_t base, phys_addr_t size)
52695f72d1eSYinghai Lu {
52795f72d1eSYinghai Lu 	return __memblock_remove(&memblock.memory, base, size);
52895f72d1eSYinghai Lu }
52995f72d1eSYinghai Lu 
530581adcbeSTejun Heo int __init_memblock memblock_free(phys_addr_t base, phys_addr_t size)
53195f72d1eSYinghai Lu {
53224aa0788STejun Heo 	memblock_dbg("   memblock_free: [%#016llx-%#016llx] %pF\n",
533a150439cSH. Peter Anvin 		     (unsigned long long)base,
534a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
535a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
53624aa0788STejun Heo 
53795f72d1eSYinghai Lu 	return __memblock_remove(&memblock.reserved, base, size);
53895f72d1eSYinghai Lu }
53995f72d1eSYinghai Lu 
540581adcbeSTejun Heo int __init_memblock memblock_reserve(phys_addr_t base, phys_addr_t size)
54195f72d1eSYinghai Lu {
542e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *_rgn = &memblock.reserved;
54395f72d1eSYinghai Lu 
54424aa0788STejun Heo 	memblock_dbg("memblock_reserve: [%#016llx-%#016llx] %pF\n",
545a150439cSH. Peter Anvin 		     (unsigned long long)base,
546a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
547a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
54895f72d1eSYinghai Lu 	BUG_ON(0 == size);
54995f72d1eSYinghai Lu 
55095f72d1eSYinghai Lu 	return memblock_add_region(_rgn, base, size);
55195f72d1eSYinghai Lu }
55295f72d1eSYinghai Lu 
55335fd0808STejun Heo /**
55435fd0808STejun Heo  * __next_free_mem_range - next function for for_each_free_mem_range()
55535fd0808STejun Heo  * @idx: pointer to u64 loop variable
55635fd0808STejun Heo  * @nid: nid: node selector, %MAX_NUMNODES for all nodes
55735fd0808STejun Heo  * @p_start: ptr to phys_addr_t for start address of the range, can be %NULL
55835fd0808STejun Heo  * @p_end: ptr to phys_addr_t for end address of the range, can be %NULL
55935fd0808STejun Heo  * @p_nid: ptr to int for nid of the range, can be %NULL
56035fd0808STejun Heo  *
56135fd0808STejun Heo  * Find the first free area from *@idx which matches @nid, fill the out
56235fd0808STejun Heo  * parameters, and update *@idx for the next iteration.  The lower 32bit of
56335fd0808STejun Heo  * *@idx contains index into memory region and the upper 32bit indexes the
56435fd0808STejun Heo  * areas before each reserved region.  For example, if reserved regions
56535fd0808STejun Heo  * look like the following,
56635fd0808STejun Heo  *
56735fd0808STejun Heo  *	0:[0-16), 1:[32-48), 2:[128-130)
56835fd0808STejun Heo  *
56935fd0808STejun Heo  * The upper 32bit indexes the following regions.
57035fd0808STejun Heo  *
57135fd0808STejun Heo  *	0:[0-0), 1:[16-32), 2:[48-128), 3:[130-MAX)
57235fd0808STejun Heo  *
57335fd0808STejun Heo  * As both region arrays are sorted, the function advances the two indices
57435fd0808STejun Heo  * in lockstep and returns each intersection.
57535fd0808STejun Heo  */
57635fd0808STejun Heo void __init_memblock __next_free_mem_range(u64 *idx, int nid,
57735fd0808STejun Heo 					   phys_addr_t *out_start,
57835fd0808STejun Heo 					   phys_addr_t *out_end, int *out_nid)
57935fd0808STejun Heo {
58035fd0808STejun Heo 	struct memblock_type *mem = &memblock.memory;
58135fd0808STejun Heo 	struct memblock_type *rsv = &memblock.reserved;
58235fd0808STejun Heo 	int mi = *idx & 0xffffffff;
58335fd0808STejun Heo 	int ri = *idx >> 32;
58435fd0808STejun Heo 
58535fd0808STejun Heo 	for ( ; mi < mem->cnt; mi++) {
58635fd0808STejun Heo 		struct memblock_region *m = &mem->regions[mi];
58735fd0808STejun Heo 		phys_addr_t m_start = m->base;
58835fd0808STejun Heo 		phys_addr_t m_end = m->base + m->size;
58935fd0808STejun Heo 
59035fd0808STejun Heo 		/* only memory regions are associated with nodes, check it */
59135fd0808STejun Heo 		if (nid != MAX_NUMNODES && nid != memblock_get_region_node(m))
59235fd0808STejun Heo 			continue;
59335fd0808STejun Heo 
59435fd0808STejun Heo 		/* scan areas before each reservation for intersection */
59535fd0808STejun Heo 		for ( ; ri < rsv->cnt + 1; ri++) {
59635fd0808STejun Heo 			struct memblock_region *r = &rsv->regions[ri];
59735fd0808STejun Heo 			phys_addr_t r_start = ri ? r[-1].base + r[-1].size : 0;
59835fd0808STejun Heo 			phys_addr_t r_end = ri < rsv->cnt ? r->base : ULLONG_MAX;
59935fd0808STejun Heo 
60035fd0808STejun Heo 			/* if ri advanced past mi, break out to advance mi */
60135fd0808STejun Heo 			if (r_start >= m_end)
60235fd0808STejun Heo 				break;
60335fd0808STejun Heo 			/* if the two regions intersect, we're done */
60435fd0808STejun Heo 			if (m_start < r_end) {
60535fd0808STejun Heo 				if (out_start)
60635fd0808STejun Heo 					*out_start = max(m_start, r_start);
60735fd0808STejun Heo 				if (out_end)
60835fd0808STejun Heo 					*out_end = min(m_end, r_end);
60935fd0808STejun Heo 				if (out_nid)
61035fd0808STejun Heo 					*out_nid = memblock_get_region_node(m);
61135fd0808STejun Heo 				/*
61235fd0808STejun Heo 				 * The region which ends first is advanced
61335fd0808STejun Heo 				 * for the next iteration.
61435fd0808STejun Heo 				 */
61535fd0808STejun Heo 				if (m_end <= r_end)
61635fd0808STejun Heo 					mi++;
61735fd0808STejun Heo 				else
61835fd0808STejun Heo 					ri++;
61935fd0808STejun Heo 				*idx = (u32)mi | (u64)ri << 32;
62035fd0808STejun Heo 				return;
62135fd0808STejun Heo 			}
62235fd0808STejun Heo 		}
62335fd0808STejun Heo 	}
62435fd0808STejun Heo 
62535fd0808STejun Heo 	/* signal end of iteration */
62635fd0808STejun Heo 	*idx = ULLONG_MAX;
62735fd0808STejun Heo }
62835fd0808STejun Heo 
6297c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
6307c0caeb8STejun Heo /*
6317c0caeb8STejun Heo  * Common iterator interface used to define for_each_mem_range().
6327c0caeb8STejun Heo  */
6337c0caeb8STejun Heo void __init_memblock __next_mem_pfn_range(int *idx, int nid,
6347c0caeb8STejun Heo 				unsigned long *out_start_pfn,
6357c0caeb8STejun Heo 				unsigned long *out_end_pfn, int *out_nid)
6367c0caeb8STejun Heo {
6377c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
6387c0caeb8STejun Heo 	struct memblock_region *r;
6397c0caeb8STejun Heo 
6407c0caeb8STejun Heo 	while (++*idx < type->cnt) {
6417c0caeb8STejun Heo 		r = &type->regions[*idx];
6427c0caeb8STejun Heo 
6437c0caeb8STejun Heo 		if (PFN_UP(r->base) >= PFN_DOWN(r->base + r->size))
6447c0caeb8STejun Heo 			continue;
6457c0caeb8STejun Heo 		if (nid == MAX_NUMNODES || nid == r->nid)
6467c0caeb8STejun Heo 			break;
6477c0caeb8STejun Heo 	}
6487c0caeb8STejun Heo 	if (*idx >= type->cnt) {
6497c0caeb8STejun Heo 		*idx = -1;
6507c0caeb8STejun Heo 		return;
6517c0caeb8STejun Heo 	}
6527c0caeb8STejun Heo 
6537c0caeb8STejun Heo 	if (out_start_pfn)
6547c0caeb8STejun Heo 		*out_start_pfn = PFN_UP(r->base);
6557c0caeb8STejun Heo 	if (out_end_pfn)
6567c0caeb8STejun Heo 		*out_end_pfn = PFN_DOWN(r->base + r->size);
6577c0caeb8STejun Heo 	if (out_nid)
6587c0caeb8STejun Heo 		*out_nid = r->nid;
6597c0caeb8STejun Heo }
6607c0caeb8STejun Heo 
6617c0caeb8STejun Heo /**
6627c0caeb8STejun Heo  * memblock_set_node - set node ID on memblock regions
6637c0caeb8STejun Heo  * @base: base of area to set node ID for
6647c0caeb8STejun Heo  * @size: size of area to set node ID for
6657c0caeb8STejun Heo  * @nid: node ID to set
6667c0caeb8STejun Heo  *
6677c0caeb8STejun Heo  * Set the nid of memblock memory regions in [@base,@base+@size) to @nid.
6687c0caeb8STejun Heo  * Regions which cross the area boundaries are split as necessary.
6697c0caeb8STejun Heo  *
6707c0caeb8STejun Heo  * RETURNS:
6717c0caeb8STejun Heo  * 0 on success, -errno on failure.
6727c0caeb8STejun Heo  */
6737c0caeb8STejun Heo int __init_memblock memblock_set_node(phys_addr_t base, phys_addr_t size,
6747c0caeb8STejun Heo 				      int nid)
6757c0caeb8STejun Heo {
6767c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
677*6a9ceb31STejun Heo 	int start_rgn, end_rgn;
678*6a9ceb31STejun Heo 	int i, ret;
6797c0caeb8STejun Heo 
680*6a9ceb31STejun Heo 	ret = memblock_isolate_range(type, base, size, &start_rgn, &end_rgn);
681*6a9ceb31STejun Heo 	if (ret)
682*6a9ceb31STejun Heo 		return ret;
6837c0caeb8STejun Heo 
684*6a9ceb31STejun Heo 	for (i = start_rgn; i < end_rgn; i++)
685*6a9ceb31STejun Heo 		type->regions[i].nid = nid;
6867c0caeb8STejun Heo 
6877c0caeb8STejun Heo 	memblock_merge_regions(type);
6887c0caeb8STejun Heo 	return 0;
6897c0caeb8STejun Heo }
6907c0caeb8STejun Heo #endif /* CONFIG_HAVE_MEMBLOCK_NODE_MAP */
6917c0caeb8STejun Heo 
6926ed311b2SBenjamin Herrenschmidt phys_addr_t __init __memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
69395f72d1eSYinghai Lu {
6946ed311b2SBenjamin Herrenschmidt 	phys_addr_t found;
69595f72d1eSYinghai Lu 
6966ed311b2SBenjamin Herrenschmidt 	/* We align the size to limit fragmentation. Without this, a lot of
6976ed311b2SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
6986ed311b2SBenjamin Herrenschmidt 	 */
699348968ebSTejun Heo 	size = round_up(size, align);
7006ed311b2SBenjamin Herrenschmidt 
701fc769a8eSTejun Heo 	found = memblock_find_in_range(0, max_addr, size, align);
7029c8c27e2STejun Heo 	if (found && !memblock_reserve(found, size))
7036ed311b2SBenjamin Herrenschmidt 		return found;
7046ed311b2SBenjamin Herrenschmidt 
7056ed311b2SBenjamin Herrenschmidt 	return 0;
70695f72d1eSYinghai Lu }
70795f72d1eSYinghai Lu 
7086ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
70995f72d1eSYinghai Lu {
7106ed311b2SBenjamin Herrenschmidt 	phys_addr_t alloc;
7116ed311b2SBenjamin Herrenschmidt 
7126ed311b2SBenjamin Herrenschmidt 	alloc = __memblock_alloc_base(size, align, max_addr);
7136ed311b2SBenjamin Herrenschmidt 
7146ed311b2SBenjamin Herrenschmidt 	if (alloc == 0)
7156ed311b2SBenjamin Herrenschmidt 		panic("ERROR: Failed to allocate 0x%llx bytes below 0x%llx.\n",
7166ed311b2SBenjamin Herrenschmidt 		      (unsigned long long) size, (unsigned long long) max_addr);
7176ed311b2SBenjamin Herrenschmidt 
7186ed311b2SBenjamin Herrenschmidt 	return alloc;
71995f72d1eSYinghai Lu }
72095f72d1eSYinghai Lu 
7216ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc(phys_addr_t size, phys_addr_t align)
72295f72d1eSYinghai Lu {
7236ed311b2SBenjamin Herrenschmidt 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
72495f72d1eSYinghai Lu }
72595f72d1eSYinghai Lu 
72695f72d1eSYinghai Lu 
7276ed311b2SBenjamin Herrenschmidt /*
72834e18455STejun Heo  * Additional node-local top-down allocators.
729c196f76fSBenjamin Herrenschmidt  *
730c196f76fSBenjamin Herrenschmidt  * WARNING: Only available after early_node_map[] has been populated,
731c196f76fSBenjamin Herrenschmidt  * on some architectures, that is after all the calls to add_active_range()
732c196f76fSBenjamin Herrenschmidt  * have been done to populate it.
7336ed311b2SBenjamin Herrenschmidt  */
73495f72d1eSYinghai Lu 
73534e18455STejun Heo static phys_addr_t __init memblock_nid_range_rev(phys_addr_t start,
73634e18455STejun Heo 						 phys_addr_t end, int *nid)
737c3f72b57SBenjamin Herrenschmidt {
738c196f76fSBenjamin Herrenschmidt #ifdef CONFIG_ARCH_POPULATES_NODE_MAP
739c196f76fSBenjamin Herrenschmidt 	unsigned long start_pfn, end_pfn;
740c196f76fSBenjamin Herrenschmidt 	int i;
741c196f76fSBenjamin Herrenschmidt 
742b2fea988STejun Heo 	for_each_mem_pfn_range(i, MAX_NUMNODES, &start_pfn, &end_pfn, nid)
74334e18455STejun Heo 		if (end > PFN_PHYS(start_pfn) && end <= PFN_PHYS(end_pfn))
74434e18455STejun Heo 			return max(start, PFN_PHYS(start_pfn));
745c196f76fSBenjamin Herrenschmidt #endif
746c3f72b57SBenjamin Herrenschmidt 	*nid = 0;
74734e18455STejun Heo 	return start;
748c3f72b57SBenjamin Herrenschmidt }
749c3f72b57SBenjamin Herrenschmidt 
750e6498040STejun Heo phys_addr_t __init memblock_find_in_range_node(phys_addr_t start,
751e6498040STejun Heo 					       phys_addr_t end,
7522898cc4cSBenjamin Herrenschmidt 					       phys_addr_t size,
7532898cc4cSBenjamin Herrenschmidt 					       phys_addr_t align, int nid)
75495f72d1eSYinghai Lu {
755e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *mem = &memblock.memory;
75695f72d1eSYinghai Lu 	int i;
75795f72d1eSYinghai Lu 
75895f72d1eSYinghai Lu 	BUG_ON(0 == size);
75995f72d1eSYinghai Lu 
760e6498040STejun Heo 	/* Pump up max_addr */
761e6498040STejun Heo 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
762e6498040STejun Heo 		end = memblock.current_limit;
763e6498040STejun Heo 
764e6498040STejun Heo 	for (i = mem->cnt - 1; i >= 0; i--) {
765e6498040STejun Heo 		struct memblock_region *r = &mem->regions[i];
766e6498040STejun Heo 		phys_addr_t base = max(start, r->base);
767e6498040STejun Heo 		phys_addr_t top = min(end, r->base + r->size);
768e6498040STejun Heo 
769e6498040STejun Heo 		while (base < top) {
770e6498040STejun Heo 			phys_addr_t tbase, ret;
771e6498040STejun Heo 			int tnid;
772e6498040STejun Heo 
773e6498040STejun Heo 			tbase = memblock_nid_range_rev(base, top, &tnid);
774e6498040STejun Heo 			if (nid == MAX_NUMNODES || tnid == nid) {
775e6498040STejun Heo 				ret = memblock_find_region(tbase, top, size, align);
776e6498040STejun Heo 				if (ret)
777e6498040STejun Heo 					return ret;
778e6498040STejun Heo 			}
779e6498040STejun Heo 			top = tbase;
780e6498040STejun Heo 		}
781e6498040STejun Heo 	}
782e6498040STejun Heo 
783e6498040STejun Heo 	return 0;
784e6498040STejun Heo }
785e6498040STejun Heo 
786e6498040STejun Heo phys_addr_t __init memblock_alloc_nid(phys_addr_t size, phys_addr_t align, int nid)
787e6498040STejun Heo {
788e6498040STejun Heo 	phys_addr_t found;
789e6498040STejun Heo 
790e6498040STejun Heo 	/*
791e6498040STejun Heo 	 * We align the size to limit fragmentation. Without this, a lot of
7927f219c73SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
7937f219c73SBenjamin Herrenschmidt 	 */
794348968ebSTejun Heo 	size = round_up(size, align);
7957f219c73SBenjamin Herrenschmidt 
796e6498040STejun Heo 	found = memblock_find_in_range_node(0, MEMBLOCK_ALLOC_ACCESSIBLE,
79795f72d1eSYinghai Lu 					    size, align, nid);
7989c8c27e2STejun Heo 	if (found && !memblock_reserve(found, size))
799e6498040STejun Heo 		return found;
80095f72d1eSYinghai Lu 
8019d1e2492SBenjamin Herrenschmidt 	return 0;
8029d1e2492SBenjamin Herrenschmidt }
8039d1e2492SBenjamin Herrenschmidt 
8049d1e2492SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_try_nid(phys_addr_t size, phys_addr_t align, int nid)
8059d1e2492SBenjamin Herrenschmidt {
8069d1e2492SBenjamin Herrenschmidt 	phys_addr_t res = memblock_alloc_nid(size, align, nid);
8079d1e2492SBenjamin Herrenschmidt 
8089d1e2492SBenjamin Herrenschmidt 	if (res)
8099d1e2492SBenjamin Herrenschmidt 		return res;
81015fb0972STejun Heo 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
81195f72d1eSYinghai Lu }
81295f72d1eSYinghai Lu 
8139d1e2492SBenjamin Herrenschmidt 
8149d1e2492SBenjamin Herrenschmidt /*
8159d1e2492SBenjamin Herrenschmidt  * Remaining API functions
8169d1e2492SBenjamin Herrenschmidt  */
8179d1e2492SBenjamin Herrenschmidt 
81895f72d1eSYinghai Lu /* You must call memblock_analyze() before this. */
8192898cc4cSBenjamin Herrenschmidt phys_addr_t __init memblock_phys_mem_size(void)
82095f72d1eSYinghai Lu {
8214734b594SBenjamin Herrenschmidt 	return memblock.memory_size;
82295f72d1eSYinghai Lu }
82395f72d1eSYinghai Lu 
8240a93ebefSSam Ravnborg /* lowest address */
8250a93ebefSSam Ravnborg phys_addr_t __init_memblock memblock_start_of_DRAM(void)
8260a93ebefSSam Ravnborg {
8270a93ebefSSam Ravnborg 	return memblock.memory.regions[0].base;
8280a93ebefSSam Ravnborg }
8290a93ebefSSam Ravnborg 
83010d06439SYinghai Lu phys_addr_t __init_memblock memblock_end_of_DRAM(void)
83195f72d1eSYinghai Lu {
83295f72d1eSYinghai Lu 	int idx = memblock.memory.cnt - 1;
83395f72d1eSYinghai Lu 
834e3239ff9SBenjamin Herrenschmidt 	return (memblock.memory.regions[idx].base + memblock.memory.regions[idx].size);
83595f72d1eSYinghai Lu }
83695f72d1eSYinghai Lu 
83795f72d1eSYinghai Lu /* You must call memblock_analyze() after this. */
8382898cc4cSBenjamin Herrenschmidt void __init memblock_enforce_memory_limit(phys_addr_t memory_limit)
83995f72d1eSYinghai Lu {
84095f72d1eSYinghai Lu 	unsigned long i;
8412898cc4cSBenjamin Herrenschmidt 	phys_addr_t limit;
842e3239ff9SBenjamin Herrenschmidt 	struct memblock_region *p;
84395f72d1eSYinghai Lu 
84495f72d1eSYinghai Lu 	if (!memory_limit)
84595f72d1eSYinghai Lu 		return;
84695f72d1eSYinghai Lu 
84795f72d1eSYinghai Lu 	/* Truncate the memblock regions to satisfy the memory limit. */
84895f72d1eSYinghai Lu 	limit = memory_limit;
84995f72d1eSYinghai Lu 	for (i = 0; i < memblock.memory.cnt; i++) {
850e3239ff9SBenjamin Herrenschmidt 		if (limit > memblock.memory.regions[i].size) {
851e3239ff9SBenjamin Herrenschmidt 			limit -= memblock.memory.regions[i].size;
85295f72d1eSYinghai Lu 			continue;
85395f72d1eSYinghai Lu 		}
85495f72d1eSYinghai Lu 
855e3239ff9SBenjamin Herrenschmidt 		memblock.memory.regions[i].size = limit;
85695f72d1eSYinghai Lu 		memblock.memory.cnt = i + 1;
85795f72d1eSYinghai Lu 		break;
85895f72d1eSYinghai Lu 	}
85995f72d1eSYinghai Lu 
86095f72d1eSYinghai Lu 	memory_limit = memblock_end_of_DRAM();
86195f72d1eSYinghai Lu 
86295f72d1eSYinghai Lu 	/* And truncate any reserves above the limit also. */
86395f72d1eSYinghai Lu 	for (i = 0; i < memblock.reserved.cnt; i++) {
864e3239ff9SBenjamin Herrenschmidt 		p = &memblock.reserved.regions[i];
86595f72d1eSYinghai Lu 
86695f72d1eSYinghai Lu 		if (p->base > memory_limit)
86795f72d1eSYinghai Lu 			p->size = 0;
86895f72d1eSYinghai Lu 		else if ((p->base + p->size) > memory_limit)
86995f72d1eSYinghai Lu 			p->size = memory_limit - p->base;
87095f72d1eSYinghai Lu 
87195f72d1eSYinghai Lu 		if (p->size == 0) {
87295f72d1eSYinghai Lu 			memblock_remove_region(&memblock.reserved, i);
87395f72d1eSYinghai Lu 			i--;
87495f72d1eSYinghai Lu 		}
87595f72d1eSYinghai Lu 	}
87695f72d1eSYinghai Lu }
87795f72d1eSYinghai Lu 
878cd79481dSYinghai Lu static int __init_memblock memblock_search(struct memblock_type *type, phys_addr_t addr)
87972d4b0b4SBenjamin Herrenschmidt {
88072d4b0b4SBenjamin Herrenschmidt 	unsigned int left = 0, right = type->cnt;
88172d4b0b4SBenjamin Herrenschmidt 
88272d4b0b4SBenjamin Herrenschmidt 	do {
88372d4b0b4SBenjamin Herrenschmidt 		unsigned int mid = (right + left) / 2;
88472d4b0b4SBenjamin Herrenschmidt 
88572d4b0b4SBenjamin Herrenschmidt 		if (addr < type->regions[mid].base)
88672d4b0b4SBenjamin Herrenschmidt 			right = mid;
88772d4b0b4SBenjamin Herrenschmidt 		else if (addr >= (type->regions[mid].base +
88872d4b0b4SBenjamin Herrenschmidt 				  type->regions[mid].size))
88972d4b0b4SBenjamin Herrenschmidt 			left = mid + 1;
89072d4b0b4SBenjamin Herrenschmidt 		else
89172d4b0b4SBenjamin Herrenschmidt 			return mid;
89272d4b0b4SBenjamin Herrenschmidt 	} while (left < right);
89372d4b0b4SBenjamin Herrenschmidt 	return -1;
89472d4b0b4SBenjamin Herrenschmidt }
89572d4b0b4SBenjamin Herrenschmidt 
8962898cc4cSBenjamin Herrenschmidt int __init memblock_is_reserved(phys_addr_t addr)
89795f72d1eSYinghai Lu {
89872d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.reserved, addr) != -1;
89995f72d1eSYinghai Lu }
90072d4b0b4SBenjamin Herrenschmidt 
9013661ca66SYinghai Lu int __init_memblock memblock_is_memory(phys_addr_t addr)
90272d4b0b4SBenjamin Herrenschmidt {
90372d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.memory, addr) != -1;
90472d4b0b4SBenjamin Herrenschmidt }
90572d4b0b4SBenjamin Herrenschmidt 
9063661ca66SYinghai Lu int __init_memblock memblock_is_region_memory(phys_addr_t base, phys_addr_t size)
90772d4b0b4SBenjamin Herrenschmidt {
908abb65272STomi Valkeinen 	int idx = memblock_search(&memblock.memory, base);
90972d4b0b4SBenjamin Herrenschmidt 
91072d4b0b4SBenjamin Herrenschmidt 	if (idx == -1)
91195f72d1eSYinghai Lu 		return 0;
912abb65272STomi Valkeinen 	return memblock.memory.regions[idx].base <= base &&
913abb65272STomi Valkeinen 		(memblock.memory.regions[idx].base +
914abb65272STomi Valkeinen 		 memblock.memory.regions[idx].size) >= (base + size);
91595f72d1eSYinghai Lu }
91695f72d1eSYinghai Lu 
91710d06439SYinghai Lu int __init_memblock memblock_is_region_reserved(phys_addr_t base, phys_addr_t size)
91895f72d1eSYinghai Lu {
919f1c2c19cSBenjamin Herrenschmidt 	return memblock_overlaps_region(&memblock.reserved, base, size) >= 0;
92095f72d1eSYinghai Lu }
92195f72d1eSYinghai Lu 
922e63075a3SBenjamin Herrenschmidt 
9233661ca66SYinghai Lu void __init_memblock memblock_set_current_limit(phys_addr_t limit)
924e63075a3SBenjamin Herrenschmidt {
925e63075a3SBenjamin Herrenschmidt 	memblock.current_limit = limit;
926e63075a3SBenjamin Herrenschmidt }
927e63075a3SBenjamin Herrenschmidt 
9287c0caeb8STejun Heo static void __init_memblock memblock_dump(struct memblock_type *type, char *name)
9296ed311b2SBenjamin Herrenschmidt {
9306ed311b2SBenjamin Herrenschmidt 	unsigned long long base, size;
9316ed311b2SBenjamin Herrenschmidt 	int i;
9326ed311b2SBenjamin Herrenschmidt 
9337c0caeb8STejun Heo 	pr_info(" %s.cnt  = 0x%lx\n", name, type->cnt);
9346ed311b2SBenjamin Herrenschmidt 
9357c0caeb8STejun Heo 	for (i = 0; i < type->cnt; i++) {
9367c0caeb8STejun Heo 		struct memblock_region *rgn = &type->regions[i];
9377c0caeb8STejun Heo 		char nid_buf[32] = "";
9386ed311b2SBenjamin Herrenschmidt 
9397c0caeb8STejun Heo 		base = rgn->base;
9407c0caeb8STejun Heo 		size = rgn->size;
9417c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
9427c0caeb8STejun Heo 		if (memblock_get_region_node(rgn) != MAX_NUMNODES)
9437c0caeb8STejun Heo 			snprintf(nid_buf, sizeof(nid_buf), " on node %d",
9447c0caeb8STejun Heo 				 memblock_get_region_node(rgn));
9457c0caeb8STejun Heo #endif
9467c0caeb8STejun Heo 		pr_info(" %s[%#x]\t[%#016llx-%#016llx], %#llx bytes%s\n",
9477c0caeb8STejun Heo 			name, i, base, base + size - 1, size, nid_buf);
9486ed311b2SBenjamin Herrenschmidt 	}
9496ed311b2SBenjamin Herrenschmidt }
9506ed311b2SBenjamin Herrenschmidt 
9514ff7b82fSTejun Heo void __init_memblock __memblock_dump_all(void)
9526ed311b2SBenjamin Herrenschmidt {
9536ed311b2SBenjamin Herrenschmidt 	pr_info("MEMBLOCK configuration:\n");
9546ed311b2SBenjamin Herrenschmidt 	pr_info(" memory size = 0x%llx\n", (unsigned long long)memblock.memory_size);
9556ed311b2SBenjamin Herrenschmidt 
9566ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.memory, "memory");
9576ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.reserved, "reserved");
9586ed311b2SBenjamin Herrenschmidt }
9596ed311b2SBenjamin Herrenschmidt 
9606ed311b2SBenjamin Herrenschmidt void __init memblock_analyze(void)
9616ed311b2SBenjamin Herrenschmidt {
9626ed311b2SBenjamin Herrenschmidt 	int i;
9636ed311b2SBenjamin Herrenschmidt 
9646ed311b2SBenjamin Herrenschmidt 	memblock.memory_size = 0;
9656ed311b2SBenjamin Herrenschmidt 
9666ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < memblock.memory.cnt; i++)
9676ed311b2SBenjamin Herrenschmidt 		memblock.memory_size += memblock.memory.regions[i].size;
968142b45a7SBenjamin Herrenschmidt 
969142b45a7SBenjamin Herrenschmidt 	/* We allow resizing from there */
970142b45a7SBenjamin Herrenschmidt 	memblock_can_resize = 1;
9716ed311b2SBenjamin Herrenschmidt }
9726ed311b2SBenjamin Herrenschmidt 
9736ed311b2SBenjamin Herrenschmidt static int __init early_memblock(char *p)
9746ed311b2SBenjamin Herrenschmidt {
9756ed311b2SBenjamin Herrenschmidt 	if (p && strstr(p, "debug"))
9766ed311b2SBenjamin Herrenschmidt 		memblock_debug = 1;
9776ed311b2SBenjamin Herrenschmidt 	return 0;
9786ed311b2SBenjamin Herrenschmidt }
9796ed311b2SBenjamin Herrenschmidt early_param("memblock", early_memblock);
9806ed311b2SBenjamin Herrenschmidt 
981c378ddd5STejun Heo #if defined(CONFIG_DEBUG_FS) && !defined(CONFIG_ARCH_DISCARD_MEMBLOCK)
9826d03b885SBenjamin Herrenschmidt 
9836d03b885SBenjamin Herrenschmidt static int memblock_debug_show(struct seq_file *m, void *private)
9846d03b885SBenjamin Herrenschmidt {
9856d03b885SBenjamin Herrenschmidt 	struct memblock_type *type = m->private;
9866d03b885SBenjamin Herrenschmidt 	struct memblock_region *reg;
9876d03b885SBenjamin Herrenschmidt 	int i;
9886d03b885SBenjamin Herrenschmidt 
9896d03b885SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
9906d03b885SBenjamin Herrenschmidt 		reg = &type->regions[i];
9916d03b885SBenjamin Herrenschmidt 		seq_printf(m, "%4d: ", i);
9926d03b885SBenjamin Herrenschmidt 		if (sizeof(phys_addr_t) == 4)
9936d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%08lx..0x%08lx\n",
9946d03b885SBenjamin Herrenschmidt 				   (unsigned long)reg->base,
9956d03b885SBenjamin Herrenschmidt 				   (unsigned long)(reg->base + reg->size - 1));
9966d03b885SBenjamin Herrenschmidt 		else
9976d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%016llx..0x%016llx\n",
9986d03b885SBenjamin Herrenschmidt 				   (unsigned long long)reg->base,
9996d03b885SBenjamin Herrenschmidt 				   (unsigned long long)(reg->base + reg->size - 1));
10006d03b885SBenjamin Herrenschmidt 
10016d03b885SBenjamin Herrenschmidt 	}
10026d03b885SBenjamin Herrenschmidt 	return 0;
10036d03b885SBenjamin Herrenschmidt }
10046d03b885SBenjamin Herrenschmidt 
10056d03b885SBenjamin Herrenschmidt static int memblock_debug_open(struct inode *inode, struct file *file)
10066d03b885SBenjamin Herrenschmidt {
10076d03b885SBenjamin Herrenschmidt 	return single_open(file, memblock_debug_show, inode->i_private);
10086d03b885SBenjamin Herrenschmidt }
10096d03b885SBenjamin Herrenschmidt 
10106d03b885SBenjamin Herrenschmidt static const struct file_operations memblock_debug_fops = {
10116d03b885SBenjamin Herrenschmidt 	.open = memblock_debug_open,
10126d03b885SBenjamin Herrenschmidt 	.read = seq_read,
10136d03b885SBenjamin Herrenschmidt 	.llseek = seq_lseek,
10146d03b885SBenjamin Herrenschmidt 	.release = single_release,
10156d03b885SBenjamin Herrenschmidt };
10166d03b885SBenjamin Herrenschmidt 
10176d03b885SBenjamin Herrenschmidt static int __init memblock_init_debugfs(void)
10186d03b885SBenjamin Herrenschmidt {
10196d03b885SBenjamin Herrenschmidt 	struct dentry *root = debugfs_create_dir("memblock", NULL);
10206d03b885SBenjamin Herrenschmidt 	if (!root)
10216d03b885SBenjamin Herrenschmidt 		return -ENXIO;
10226d03b885SBenjamin Herrenschmidt 	debugfs_create_file("memory", S_IRUGO, root, &memblock.memory, &memblock_debug_fops);
10236d03b885SBenjamin Herrenschmidt 	debugfs_create_file("reserved", S_IRUGO, root, &memblock.reserved, &memblock_debug_fops);
10246d03b885SBenjamin Herrenschmidt 
10256d03b885SBenjamin Herrenschmidt 	return 0;
10266d03b885SBenjamin Herrenschmidt }
10276d03b885SBenjamin Herrenschmidt __initcall(memblock_init_debugfs);
10286d03b885SBenjamin Herrenschmidt 
10296d03b885SBenjamin Herrenschmidt #endif /* CONFIG_DEBUG_FS */
1030