xref: /linux/mm/memblock.c (revision fe091c208a40299fba40e62292a610fb91e44b4e)
/*
 * Procedures for maintaining information about logical memory blocks.
 *
 * Peter Bergner, IBM Corp.	June 2001.
 * Copyright (C) 2001 Peter Bergner.
 *
 *      This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */
1295f72d1eSYinghai Lu 
1395f72d1eSYinghai Lu #include <linux/kernel.h>
14142b45a7SBenjamin Herrenschmidt #include <linux/slab.h>
1595f72d1eSYinghai Lu #include <linux/init.h>
1695f72d1eSYinghai Lu #include <linux/bitops.h>
17449e8df3SBenjamin Herrenschmidt #include <linux/poison.h>
18c196f76fSBenjamin Herrenschmidt #include <linux/pfn.h>
196d03b885SBenjamin Herrenschmidt #include <linux/debugfs.h>
206d03b885SBenjamin Herrenschmidt #include <linux/seq_file.h>
2195f72d1eSYinghai Lu #include <linux/memblock.h>
2295f72d1eSYinghai Lu 
23*fe091c20STejun Heo static struct memblock_region memblock_memory_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock;
24*fe091c20STejun Heo static struct memblock_region memblock_reserved_init_regions[INIT_MEMBLOCK_REGIONS] __initdata_memblock;
25*fe091c20STejun Heo 
26*fe091c20STejun Heo struct memblock memblock __initdata_memblock = {
27*fe091c20STejun Heo 	.memory.regions		= memblock_memory_init_regions,
28*fe091c20STejun Heo 	.memory.cnt		= 1,	/* empty dummy entry */
29*fe091c20STejun Heo 	.memory.max		= INIT_MEMBLOCK_REGIONS,
30*fe091c20STejun Heo 
31*fe091c20STejun Heo 	.reserved.regions	= memblock_reserved_init_regions,
32*fe091c20STejun Heo 	.reserved.cnt		= 1,	/* empty dummy entry */
33*fe091c20STejun Heo 	.reserved.max		= INIT_MEMBLOCK_REGIONS,
34*fe091c20STejun Heo 
35*fe091c20STejun Heo 	.current_limit		= MEMBLOCK_ALLOC_ANYWHERE,
36*fe091c20STejun Heo };
3795f72d1eSYinghai Lu 
3810d06439SYinghai Lu int memblock_debug __initdata_memblock;
3910d06439SYinghai Lu int memblock_can_resize __initdata_memblock;
4095f72d1eSYinghai Lu 
41142b45a7SBenjamin Herrenschmidt /* inline so we don't get a warning when pr_debug is compiled out */
42142b45a7SBenjamin Herrenschmidt static inline const char *memblock_type_name(struct memblock_type *type)
43142b45a7SBenjamin Herrenschmidt {
44142b45a7SBenjamin Herrenschmidt 	if (type == &memblock.memory)
45142b45a7SBenjamin Herrenschmidt 		return "memory";
46142b45a7SBenjamin Herrenschmidt 	else if (type == &memblock.reserved)
47142b45a7SBenjamin Herrenschmidt 		return "reserved";
48142b45a7SBenjamin Herrenschmidt 	else
49142b45a7SBenjamin Herrenschmidt 		return "unknown";
50142b45a7SBenjamin Herrenschmidt }
51142b45a7SBenjamin Herrenschmidt 
/*
 * Address comparison utilities
 */
5510d06439SYinghai Lu static unsigned long __init_memblock memblock_addrs_overlap(phys_addr_t base1, phys_addr_t size1,
562898cc4cSBenjamin Herrenschmidt 				       phys_addr_t base2, phys_addr_t size2)
5795f72d1eSYinghai Lu {
5895f72d1eSYinghai Lu 	return ((base1 < (base2 + size2)) && (base2 < (base1 + size1)));
5995f72d1eSYinghai Lu }
6095f72d1eSYinghai Lu 
612d7d3eb2SH Hartley Sweeten static long __init_memblock memblock_overlaps_region(struct memblock_type *type,
622d7d3eb2SH Hartley Sweeten 					phys_addr_t base, phys_addr_t size)
636ed311b2SBenjamin Herrenschmidt {
646ed311b2SBenjamin Herrenschmidt 	unsigned long i;
656ed311b2SBenjamin Herrenschmidt 
666ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
676ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnbase = type->regions[i].base;
686ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnsize = type->regions[i].size;
696ed311b2SBenjamin Herrenschmidt 		if (memblock_addrs_overlap(base, size, rgnbase, rgnsize))
706ed311b2SBenjamin Herrenschmidt 			break;
716ed311b2SBenjamin Herrenschmidt 	}
726ed311b2SBenjamin Herrenschmidt 
736ed311b2SBenjamin Herrenschmidt 	return (i < type->cnt) ? i : -1;
746ed311b2SBenjamin Herrenschmidt }
756ed311b2SBenjamin Herrenschmidt 
/*
 * Find, allocate, deallocate or reserve unreserved regions. All allocations
 * are top-down.
 */
806ed311b2SBenjamin Herrenschmidt 
81cd79481dSYinghai Lu static phys_addr_t __init_memblock memblock_find_region(phys_addr_t start, phys_addr_t end,
826ed311b2SBenjamin Herrenschmidt 					  phys_addr_t size, phys_addr_t align)
836ed311b2SBenjamin Herrenschmidt {
846ed311b2SBenjamin Herrenschmidt 	phys_addr_t base, res_base;
856ed311b2SBenjamin Herrenschmidt 	long j;
866ed311b2SBenjamin Herrenschmidt 
87f1af98c7SYinghai Lu 	/* In case, huge size is requested */
88f1af98c7SYinghai Lu 	if (end < size)
891f5026a7STejun Heo 		return 0;
90f1af98c7SYinghai Lu 
91348968ebSTejun Heo 	base = round_down(end - size, align);
92f1af98c7SYinghai Lu 
9325818f0fSBenjamin Herrenschmidt 	/* Prevent allocations returning 0 as it's also used to
9425818f0fSBenjamin Herrenschmidt 	 * indicate an allocation failure
9525818f0fSBenjamin Herrenschmidt 	 */
9625818f0fSBenjamin Herrenschmidt 	if (start == 0)
9725818f0fSBenjamin Herrenschmidt 		start = PAGE_SIZE;
9825818f0fSBenjamin Herrenschmidt 
996ed311b2SBenjamin Herrenschmidt 	while (start <= base) {
1006ed311b2SBenjamin Herrenschmidt 		j = memblock_overlaps_region(&memblock.reserved, base, size);
1016ed311b2SBenjamin Herrenschmidt 		if (j < 0)
1026ed311b2SBenjamin Herrenschmidt 			return base;
1036ed311b2SBenjamin Herrenschmidt 		res_base = memblock.reserved.regions[j].base;
1046ed311b2SBenjamin Herrenschmidt 		if (res_base < size)
1056ed311b2SBenjamin Herrenschmidt 			break;
106348968ebSTejun Heo 		base = round_down(res_base - size, align);
1076ed311b2SBenjamin Herrenschmidt 	}
1086ed311b2SBenjamin Herrenschmidt 
1091f5026a7STejun Heo 	return 0;
1106ed311b2SBenjamin Herrenschmidt }
1116ed311b2SBenjamin Herrenschmidt 
112fc769a8eSTejun Heo /*
113fc769a8eSTejun Heo  * Find a free area with specified alignment in a specific range.
114fc769a8eSTejun Heo  */
115fc769a8eSTejun Heo phys_addr_t __init_memblock memblock_find_in_range(phys_addr_t start, phys_addr_t end,
116fc769a8eSTejun Heo 					phys_addr_t size, phys_addr_t align)
1176ed311b2SBenjamin Herrenschmidt {
1186ed311b2SBenjamin Herrenschmidt 	long i;
1196ed311b2SBenjamin Herrenschmidt 
1206ed311b2SBenjamin Herrenschmidt 	BUG_ON(0 == size);
1216ed311b2SBenjamin Herrenschmidt 
1226ed311b2SBenjamin Herrenschmidt 	/* Pump up max_addr */
123fef501d4SBenjamin Herrenschmidt 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
124fef501d4SBenjamin Herrenschmidt 		end = memblock.current_limit;
1256ed311b2SBenjamin Herrenschmidt 
1266ed311b2SBenjamin Herrenschmidt 	/* We do a top-down search, this tends to limit memory
1276ed311b2SBenjamin Herrenschmidt 	 * fragmentation by keeping early boot allocs near the
1286ed311b2SBenjamin Herrenschmidt 	 * top of memory
1296ed311b2SBenjamin Herrenschmidt 	 */
1306ed311b2SBenjamin Herrenschmidt 	for (i = memblock.memory.cnt - 1; i >= 0; i--) {
1316ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblockbase = memblock.memory.regions[i].base;
1326ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblocksize = memblock.memory.regions[i].size;
133fef501d4SBenjamin Herrenschmidt 		phys_addr_t bottom, top, found;
1346ed311b2SBenjamin Herrenschmidt 
1356ed311b2SBenjamin Herrenschmidt 		if (memblocksize < size)
1366ed311b2SBenjamin Herrenschmidt 			continue;
137fef501d4SBenjamin Herrenschmidt 		if ((memblockbase + memblocksize) <= start)
138fef501d4SBenjamin Herrenschmidt 			break;
139fef501d4SBenjamin Herrenschmidt 		bottom = max(memblockbase, start);
140fef501d4SBenjamin Herrenschmidt 		top = min(memblockbase + memblocksize, end);
141fef501d4SBenjamin Herrenschmidt 		if (bottom >= top)
142fef501d4SBenjamin Herrenschmidt 			continue;
143fef501d4SBenjamin Herrenschmidt 		found = memblock_find_region(bottom, top, size, align);
1441f5026a7STejun Heo 		if (found)
145fef501d4SBenjamin Herrenschmidt 			return found;
1466ed311b2SBenjamin Herrenschmidt 	}
1471f5026a7STejun Heo 	return 0;
1486ed311b2SBenjamin Herrenschmidt }
1496ed311b2SBenjamin Herrenschmidt 
1505303b68fSYinghai Lu /*
1517950c407SYinghai Lu  * Free memblock.reserved.regions
1527950c407SYinghai Lu  */
1537950c407SYinghai Lu int __init_memblock memblock_free_reserved_regions(void)
1547950c407SYinghai Lu {
1557950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1567950c407SYinghai Lu 		return 0;
1577950c407SYinghai Lu 
1587950c407SYinghai Lu 	return memblock_free(__pa(memblock.reserved.regions),
1597950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1607950c407SYinghai Lu }
1617950c407SYinghai Lu 
1627950c407SYinghai Lu /*
1637950c407SYinghai Lu  * Reserve memblock.reserved.regions
1647950c407SYinghai Lu  */
1657950c407SYinghai Lu int __init_memblock memblock_reserve_reserved_regions(void)
1667950c407SYinghai Lu {
1677950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1687950c407SYinghai Lu 		return 0;
1697950c407SYinghai Lu 
1707950c407SYinghai Lu 	return memblock_reserve(__pa(memblock.reserved.regions),
1717950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1727950c407SYinghai Lu }
1737950c407SYinghai Lu 
17410d06439SYinghai Lu static void __init_memblock memblock_remove_region(struct memblock_type *type, unsigned long r)
17595f72d1eSYinghai Lu {
1767c0caeb8STejun Heo 	memmove(&type->regions[r], &type->regions[r + 1],
1777c0caeb8STejun Heo 		(type->cnt - (r + 1)) * sizeof(type->regions[r]));
178e3239ff9SBenjamin Herrenschmidt 	type->cnt--;
17995f72d1eSYinghai Lu 
1808f7a6605SBenjamin Herrenschmidt 	/* Special case for empty arrays */
1818f7a6605SBenjamin Herrenschmidt 	if (type->cnt == 0) {
1828f7a6605SBenjamin Herrenschmidt 		type->cnt = 1;
1838f7a6605SBenjamin Herrenschmidt 		type->regions[0].base = 0;
1848f7a6605SBenjamin Herrenschmidt 		type->regions[0].size = 0;
1857c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
1868f7a6605SBenjamin Herrenschmidt 	}
18795f72d1eSYinghai Lu }
18895f72d1eSYinghai Lu 
18910d06439SYinghai Lu static int __init_memblock memblock_double_array(struct memblock_type *type)
190142b45a7SBenjamin Herrenschmidt {
191142b45a7SBenjamin Herrenschmidt 	struct memblock_region *new_array, *old_array;
192142b45a7SBenjamin Herrenschmidt 	phys_addr_t old_size, new_size, addr;
193142b45a7SBenjamin Herrenschmidt 	int use_slab = slab_is_available();
194142b45a7SBenjamin Herrenschmidt 
195142b45a7SBenjamin Herrenschmidt 	/* We don't allow resizing until we know about the reserved regions
196142b45a7SBenjamin Herrenschmidt 	 * of memory that aren't suitable for allocation
197142b45a7SBenjamin Herrenschmidt 	 */
198142b45a7SBenjamin Herrenschmidt 	if (!memblock_can_resize)
199142b45a7SBenjamin Herrenschmidt 		return -1;
200142b45a7SBenjamin Herrenschmidt 
201142b45a7SBenjamin Herrenschmidt 	/* Calculate new doubled size */
202142b45a7SBenjamin Herrenschmidt 	old_size = type->max * sizeof(struct memblock_region);
203142b45a7SBenjamin Herrenschmidt 	new_size = old_size << 1;
204142b45a7SBenjamin Herrenschmidt 
205142b45a7SBenjamin Herrenschmidt 	/* Try to find some space for it.
206142b45a7SBenjamin Herrenschmidt 	 *
207142b45a7SBenjamin Herrenschmidt 	 * WARNING: We assume that either slab_is_available() and we use it or
208142b45a7SBenjamin Herrenschmidt 	 * we use MEMBLOCK for allocations. That means that this is unsafe to use
209142b45a7SBenjamin Herrenschmidt 	 * when bootmem is currently active (unless bootmem itself is implemented
210142b45a7SBenjamin Herrenschmidt 	 * on top of MEMBLOCK which isn't the case yet)
211142b45a7SBenjamin Herrenschmidt 	 *
212142b45a7SBenjamin Herrenschmidt 	 * This should however not be an issue for now, as we currently only
213142b45a7SBenjamin Herrenschmidt 	 * call into MEMBLOCK while it's still active, or much later when slab is
214142b45a7SBenjamin Herrenschmidt 	 * active for memory hotplug operations
215142b45a7SBenjamin Herrenschmidt 	 */
216142b45a7SBenjamin Herrenschmidt 	if (use_slab) {
217142b45a7SBenjamin Herrenschmidt 		new_array = kmalloc(new_size, GFP_KERNEL);
2181f5026a7STejun Heo 		addr = new_array ? __pa(new_array) : 0;
219142b45a7SBenjamin Herrenschmidt 	} else
220fc769a8eSTejun Heo 		addr = memblock_find_in_range(0, MEMBLOCK_ALLOC_ACCESSIBLE, new_size, sizeof(phys_addr_t));
2211f5026a7STejun Heo 	if (!addr) {
222142b45a7SBenjamin Herrenschmidt 		pr_err("memblock: Failed to double %s array from %ld to %ld entries !\n",
223142b45a7SBenjamin Herrenschmidt 		       memblock_type_name(type), type->max, type->max * 2);
224142b45a7SBenjamin Herrenschmidt 		return -1;
225142b45a7SBenjamin Herrenschmidt 	}
226142b45a7SBenjamin Herrenschmidt 	new_array = __va(addr);
227142b45a7SBenjamin Herrenschmidt 
228ea9e4376SYinghai Lu 	memblock_dbg("memblock: %s array is doubled to %ld at [%#010llx-%#010llx]",
229ea9e4376SYinghai Lu 		 memblock_type_name(type), type->max * 2, (u64)addr, (u64)addr + new_size - 1);
230ea9e4376SYinghai Lu 
231142b45a7SBenjamin Herrenschmidt 	/* Found space, we now need to move the array over before
232142b45a7SBenjamin Herrenschmidt 	 * we add the reserved region since it may be our reserved
233142b45a7SBenjamin Herrenschmidt 	 * array itself that is full.
234142b45a7SBenjamin Herrenschmidt 	 */
235142b45a7SBenjamin Herrenschmidt 	memcpy(new_array, type->regions, old_size);
236142b45a7SBenjamin Herrenschmidt 	memset(new_array + type->max, 0, old_size);
237142b45a7SBenjamin Herrenschmidt 	old_array = type->regions;
238142b45a7SBenjamin Herrenschmidt 	type->regions = new_array;
239142b45a7SBenjamin Herrenschmidt 	type->max <<= 1;
240142b45a7SBenjamin Herrenschmidt 
241142b45a7SBenjamin Herrenschmidt 	/* If we use SLAB that's it, we are done */
242142b45a7SBenjamin Herrenschmidt 	if (use_slab)
243142b45a7SBenjamin Herrenschmidt 		return 0;
244142b45a7SBenjamin Herrenschmidt 
245142b45a7SBenjamin Herrenschmidt 	/* Add the new reserved region now. Should not fail ! */
2469c8c27e2STejun Heo 	BUG_ON(memblock_reserve(addr, new_size));
247142b45a7SBenjamin Herrenschmidt 
248142b45a7SBenjamin Herrenschmidt 	/* If the array wasn't our static init one, then free it. We only do
249142b45a7SBenjamin Herrenschmidt 	 * that before SLAB is available as later on, we don't know whether
250142b45a7SBenjamin Herrenschmidt 	 * to use kfree or free_bootmem_pages(). Shouldn't be a big deal
251142b45a7SBenjamin Herrenschmidt 	 * anyways
252142b45a7SBenjamin Herrenschmidt 	 */
253142b45a7SBenjamin Herrenschmidt 	if (old_array != memblock_memory_init_regions &&
254142b45a7SBenjamin Herrenschmidt 	    old_array != memblock_reserved_init_regions)
255142b45a7SBenjamin Herrenschmidt 		memblock_free(__pa(old_array), old_size);
256142b45a7SBenjamin Herrenschmidt 
257142b45a7SBenjamin Herrenschmidt 	return 0;
258142b45a7SBenjamin Herrenschmidt }
259142b45a7SBenjamin Herrenschmidt 
260784656f9STejun Heo /**
261784656f9STejun Heo  * memblock_merge_regions - merge neighboring compatible regions
262784656f9STejun Heo  * @type: memblock type to scan
263784656f9STejun Heo  *
264784656f9STejun Heo  * Scan @type and merge neighboring compatible regions.
265784656f9STejun Heo  */
266784656f9STejun Heo static void __init_memblock memblock_merge_regions(struct memblock_type *type)
267784656f9STejun Heo {
268784656f9STejun Heo 	int i = 0;
269784656f9STejun Heo 
270784656f9STejun Heo 	/* cnt never goes below 1 */
271784656f9STejun Heo 	while (i < type->cnt - 1) {
272784656f9STejun Heo 		struct memblock_region *this = &type->regions[i];
273784656f9STejun Heo 		struct memblock_region *next = &type->regions[i + 1];
274784656f9STejun Heo 
2757c0caeb8STejun Heo 		if (this->base + this->size != next->base ||
2767c0caeb8STejun Heo 		    memblock_get_region_node(this) !=
2777c0caeb8STejun Heo 		    memblock_get_region_node(next)) {
278784656f9STejun Heo 			BUG_ON(this->base + this->size > next->base);
279784656f9STejun Heo 			i++;
280784656f9STejun Heo 			continue;
281784656f9STejun Heo 		}
282784656f9STejun Heo 
283784656f9STejun Heo 		this->size += next->size;
284784656f9STejun Heo 		memmove(next, next + 1, (type->cnt - (i + 1)) * sizeof(*next));
285784656f9STejun Heo 		type->cnt--;
286784656f9STejun Heo 	}
287784656f9STejun Heo }
288784656f9STejun Heo 
289784656f9STejun Heo /**
290784656f9STejun Heo  * memblock_insert_region - insert new memblock region
291784656f9STejun Heo  * @type: memblock type to insert into
292784656f9STejun Heo  * @idx: index for the insertion point
293784656f9STejun Heo  * @base: base address of the new region
294784656f9STejun Heo  * @size: size of the new region
295784656f9STejun Heo  *
296784656f9STejun Heo  * Insert new memblock region [@base,@base+@size) into @type at @idx.
297784656f9STejun Heo  * @type must already have extra room to accomodate the new region.
298784656f9STejun Heo  */
299784656f9STejun Heo static void __init_memblock memblock_insert_region(struct memblock_type *type,
300784656f9STejun Heo 						   int idx, phys_addr_t base,
3017c0caeb8STejun Heo 						   phys_addr_t size, int nid)
302784656f9STejun Heo {
303784656f9STejun Heo 	struct memblock_region *rgn = &type->regions[idx];
304784656f9STejun Heo 
305784656f9STejun Heo 	BUG_ON(type->cnt >= type->max);
306784656f9STejun Heo 	memmove(rgn + 1, rgn, (type->cnt - idx) * sizeof(*rgn));
307784656f9STejun Heo 	rgn->base = base;
308784656f9STejun Heo 	rgn->size = size;
3097c0caeb8STejun Heo 	memblock_set_region_node(rgn, nid);
310784656f9STejun Heo 	type->cnt++;
311784656f9STejun Heo }
312784656f9STejun Heo 
313784656f9STejun Heo /**
314784656f9STejun Heo  * memblock_add_region - add new memblock region
315784656f9STejun Heo  * @type: memblock type to add new region into
316784656f9STejun Heo  * @base: base address of the new region
317784656f9STejun Heo  * @size: size of the new region
318784656f9STejun Heo  *
319784656f9STejun Heo  * Add new memblock region [@base,@base+@size) into @type.  The new region
320784656f9STejun Heo  * is allowed to overlap with existing ones - overlaps don't affect already
321784656f9STejun Heo  * existing regions.  @type is guaranteed to be minimal (all neighbouring
322784656f9STejun Heo  * compatible regions are merged) after the addition.
323784656f9STejun Heo  *
324784656f9STejun Heo  * RETURNS:
325784656f9STejun Heo  * 0 on success, -errno on failure.
326784656f9STejun Heo  */
327581adcbeSTejun Heo static int __init_memblock memblock_add_region(struct memblock_type *type,
3288f7a6605SBenjamin Herrenschmidt 					       phys_addr_t base, phys_addr_t size)
32995f72d1eSYinghai Lu {
330784656f9STejun Heo 	bool insert = false;
331784656f9STejun Heo 	phys_addr_t obase = base, end = base + size;
332784656f9STejun Heo 	int i, nr_new;
33395f72d1eSYinghai Lu 
334784656f9STejun Heo 	/* special case for empty array */
335784656f9STejun Heo 	if (type->regions[0].size == 0) {
336784656f9STejun Heo 		WARN_ON(type->cnt != 1);
337784656f9STejun Heo 		type->regions[0].base = base;
338784656f9STejun Heo 		type->regions[0].size = size;
3397c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
340784656f9STejun Heo 		return 0;
341784656f9STejun Heo 	}
342784656f9STejun Heo repeat:
343784656f9STejun Heo 	/*
344784656f9STejun Heo 	 * The following is executed twice.  Once with %false @insert and
345784656f9STejun Heo 	 * then with %true.  The first counts the number of regions needed
346784656f9STejun Heo 	 * to accomodate the new area.  The second actually inserts them.
347784656f9STejun Heo 	 */
348784656f9STejun Heo 	base = obase;
349784656f9STejun Heo 	nr_new = 0;
350784656f9STejun Heo 
3518f7a6605SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
3528f7a6605SBenjamin Herrenschmidt 		struct memblock_region *rgn = &type->regions[i];
353784656f9STejun Heo 		phys_addr_t rbase = rgn->base;
354784656f9STejun Heo 		phys_addr_t rend = rbase + rgn->size;
3558f7a6605SBenjamin Herrenschmidt 
356784656f9STejun Heo 		if (rbase >= end)
3578f7a6605SBenjamin Herrenschmidt 			break;
358784656f9STejun Heo 		if (rend <= base)
359784656f9STejun Heo 			continue;
360784656f9STejun Heo 		/*
361784656f9STejun Heo 		 * @rgn overlaps.  If it separates the lower part of new
362784656f9STejun Heo 		 * area, insert that portion.
3638f7a6605SBenjamin Herrenschmidt 		 */
364784656f9STejun Heo 		if (rbase > base) {
365784656f9STejun Heo 			nr_new++;
366784656f9STejun Heo 			if (insert)
367784656f9STejun Heo 				memblock_insert_region(type, i++, base,
3687c0caeb8STejun Heo 						rbase - base, MAX_NUMNODES);
369784656f9STejun Heo 		}
370784656f9STejun Heo 		/* area below @rend is dealt with, forget about it */
371784656f9STejun Heo 		base = min(rend, end);
3728f7a6605SBenjamin Herrenschmidt 	}
3738f7a6605SBenjamin Herrenschmidt 
374784656f9STejun Heo 	/* insert the remaining portion */
375784656f9STejun Heo 	if (base < end) {
376784656f9STejun Heo 		nr_new++;
377784656f9STejun Heo 		if (insert)
3787c0caeb8STejun Heo 			memblock_insert_region(type, i, base, end - base,
3797c0caeb8STejun Heo 					       MAX_NUMNODES);
3808f7a6605SBenjamin Herrenschmidt 	}
3818f7a6605SBenjamin Herrenschmidt 
382784656f9STejun Heo 	/*
383784656f9STejun Heo 	 * If this was the first round, resize array and repeat for actual
384784656f9STejun Heo 	 * insertions; otherwise, merge and return.
3858f7a6605SBenjamin Herrenschmidt 	 */
386784656f9STejun Heo 	if (!insert) {
387784656f9STejun Heo 		while (type->cnt + nr_new > type->max)
388784656f9STejun Heo 			if (memblock_double_array(type) < 0)
389784656f9STejun Heo 				return -ENOMEM;
390784656f9STejun Heo 		insert = true;
391784656f9STejun Heo 		goto repeat;
39295f72d1eSYinghai Lu 	} else {
393784656f9STejun Heo 		memblock_merge_regions(type);
39495f72d1eSYinghai Lu 		return 0;
39595f72d1eSYinghai Lu 	}
396784656f9STejun Heo }
39795f72d1eSYinghai Lu 
398581adcbeSTejun Heo int __init_memblock memblock_add(phys_addr_t base, phys_addr_t size)
39995f72d1eSYinghai Lu {
400e3239ff9SBenjamin Herrenschmidt 	return memblock_add_region(&memblock.memory, base, size);
40195f72d1eSYinghai Lu }
40295f72d1eSYinghai Lu 
403581adcbeSTejun Heo static int __init_memblock __memblock_remove(struct memblock_type *type,
4048f7a6605SBenjamin Herrenschmidt 					     phys_addr_t base, phys_addr_t size)
40595f72d1eSYinghai Lu {
4062898cc4cSBenjamin Herrenschmidt 	phys_addr_t end = base + size;
40795f72d1eSYinghai Lu 	int i;
40895f72d1eSYinghai Lu 
4098f7a6605SBenjamin Herrenschmidt 	/* Walk through the array for collisions */
410e3239ff9SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
4118f7a6605SBenjamin Herrenschmidt 		struct memblock_region *rgn = &type->regions[i];
4128f7a6605SBenjamin Herrenschmidt 		phys_addr_t rend = rgn->base + rgn->size;
41395f72d1eSYinghai Lu 
4148f7a6605SBenjamin Herrenschmidt 		/* Nothing more to do, exit */
4158f7a6605SBenjamin Herrenschmidt 		if (rgn->base > end || rgn->size == 0)
4168f7a6605SBenjamin Herrenschmidt 			break;
4178f7a6605SBenjamin Herrenschmidt 
4188f7a6605SBenjamin Herrenschmidt 		/* If we fully enclose the block, drop it */
4198f7a6605SBenjamin Herrenschmidt 		if (base <= rgn->base && end >= rend) {
4208f7a6605SBenjamin Herrenschmidt 			memblock_remove_region(type, i--);
4218f7a6605SBenjamin Herrenschmidt 			continue;
4228f7a6605SBenjamin Herrenschmidt 		}
4238f7a6605SBenjamin Herrenschmidt 
4248f7a6605SBenjamin Herrenschmidt 		/* If we are fully enclosed within a block
4258f7a6605SBenjamin Herrenschmidt 		 * then we need to split it and we are done
4268f7a6605SBenjamin Herrenschmidt 		 */
4278f7a6605SBenjamin Herrenschmidt 		if (base > rgn->base && end < rend) {
4288f7a6605SBenjamin Herrenschmidt 			rgn->size = base - rgn->base;
4298f7a6605SBenjamin Herrenschmidt 			if (!memblock_add_region(type, end, rend - end))
4308f7a6605SBenjamin Herrenschmidt 				return 0;
4318f7a6605SBenjamin Herrenschmidt 			/* Failure to split is bad, we at least
4328f7a6605SBenjamin Herrenschmidt 			 * restore the block before erroring
4338f7a6605SBenjamin Herrenschmidt 			 */
4348f7a6605SBenjamin Herrenschmidt 			rgn->size = rend - rgn->base;
4358f7a6605SBenjamin Herrenschmidt 			WARN_ON(1);
4368f7a6605SBenjamin Herrenschmidt 			return -1;
4378f7a6605SBenjamin Herrenschmidt 		}
4388f7a6605SBenjamin Herrenschmidt 
4398f7a6605SBenjamin Herrenschmidt 		/* Check if we need to trim the bottom of a block */
4408f7a6605SBenjamin Herrenschmidt 		if (rgn->base < end && rend > end) {
4418f7a6605SBenjamin Herrenschmidt 			rgn->size -= end - rgn->base;
4428f7a6605SBenjamin Herrenschmidt 			rgn->base = end;
44395f72d1eSYinghai Lu 			break;
44495f72d1eSYinghai Lu 		}
44595f72d1eSYinghai Lu 
4468f7a6605SBenjamin Herrenschmidt 		/* And check if we need to trim the top of a block */
4478f7a6605SBenjamin Herrenschmidt 		if (base < rend)
4488f7a6605SBenjamin Herrenschmidt 			rgn->size -= rend - base;
44995f72d1eSYinghai Lu 
45095f72d1eSYinghai Lu 	}
45195f72d1eSYinghai Lu 	return 0;
45295f72d1eSYinghai Lu }
45395f72d1eSYinghai Lu 
454581adcbeSTejun Heo int __init_memblock memblock_remove(phys_addr_t base, phys_addr_t size)
45595f72d1eSYinghai Lu {
45695f72d1eSYinghai Lu 	return __memblock_remove(&memblock.memory, base, size);
45795f72d1eSYinghai Lu }
45895f72d1eSYinghai Lu 
459581adcbeSTejun Heo int __init_memblock memblock_free(phys_addr_t base, phys_addr_t size)
46095f72d1eSYinghai Lu {
46124aa0788STejun Heo 	memblock_dbg("   memblock_free: [%#016llx-%#016llx] %pF\n",
462a150439cSH. Peter Anvin 		     (unsigned long long)base,
463a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
464a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
46524aa0788STejun Heo 
46695f72d1eSYinghai Lu 	return __memblock_remove(&memblock.reserved, base, size);
46795f72d1eSYinghai Lu }
46895f72d1eSYinghai Lu 
469581adcbeSTejun Heo int __init_memblock memblock_reserve(phys_addr_t base, phys_addr_t size)
47095f72d1eSYinghai Lu {
471e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *_rgn = &memblock.reserved;
47295f72d1eSYinghai Lu 
47324aa0788STejun Heo 	memblock_dbg("memblock_reserve: [%#016llx-%#016llx] %pF\n",
474a150439cSH. Peter Anvin 		     (unsigned long long)base,
475a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
476a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
47795f72d1eSYinghai Lu 	BUG_ON(0 == size);
47895f72d1eSYinghai Lu 
47995f72d1eSYinghai Lu 	return memblock_add_region(_rgn, base, size);
48095f72d1eSYinghai Lu }
48195f72d1eSYinghai Lu 
48235fd0808STejun Heo /**
48335fd0808STejun Heo  * __next_free_mem_range - next function for for_each_free_mem_range()
48435fd0808STejun Heo  * @idx: pointer to u64 loop variable
48535fd0808STejun Heo  * @nid: nid: node selector, %MAX_NUMNODES for all nodes
48635fd0808STejun Heo  * @p_start: ptr to phys_addr_t for start address of the range, can be %NULL
48735fd0808STejun Heo  * @p_end: ptr to phys_addr_t for end address of the range, can be %NULL
48835fd0808STejun Heo  * @p_nid: ptr to int for nid of the range, can be %NULL
48935fd0808STejun Heo  *
49035fd0808STejun Heo  * Find the first free area from *@idx which matches @nid, fill the out
49135fd0808STejun Heo  * parameters, and update *@idx for the next iteration.  The lower 32bit of
49235fd0808STejun Heo  * *@idx contains index into memory region and the upper 32bit indexes the
49335fd0808STejun Heo  * areas before each reserved region.  For example, if reserved regions
49435fd0808STejun Heo  * look like the following,
49535fd0808STejun Heo  *
49635fd0808STejun Heo  *	0:[0-16), 1:[32-48), 2:[128-130)
49735fd0808STejun Heo  *
49835fd0808STejun Heo  * The upper 32bit indexes the following regions.
49935fd0808STejun Heo  *
50035fd0808STejun Heo  *	0:[0-0), 1:[16-32), 2:[48-128), 3:[130-MAX)
50135fd0808STejun Heo  *
50235fd0808STejun Heo  * As both region arrays are sorted, the function advances the two indices
50335fd0808STejun Heo  * in lockstep and returns each intersection.
50435fd0808STejun Heo  */
50535fd0808STejun Heo void __init_memblock __next_free_mem_range(u64 *idx, int nid,
50635fd0808STejun Heo 					   phys_addr_t *out_start,
50735fd0808STejun Heo 					   phys_addr_t *out_end, int *out_nid)
50835fd0808STejun Heo {
50935fd0808STejun Heo 	struct memblock_type *mem = &memblock.memory;
51035fd0808STejun Heo 	struct memblock_type *rsv = &memblock.reserved;
51135fd0808STejun Heo 	int mi = *idx & 0xffffffff;
51235fd0808STejun Heo 	int ri = *idx >> 32;
51335fd0808STejun Heo 
51435fd0808STejun Heo 	for ( ; mi < mem->cnt; mi++) {
51535fd0808STejun Heo 		struct memblock_region *m = &mem->regions[mi];
51635fd0808STejun Heo 		phys_addr_t m_start = m->base;
51735fd0808STejun Heo 		phys_addr_t m_end = m->base + m->size;
51835fd0808STejun Heo 
51935fd0808STejun Heo 		/* only memory regions are associated with nodes, check it */
52035fd0808STejun Heo 		if (nid != MAX_NUMNODES && nid != memblock_get_region_node(m))
52135fd0808STejun Heo 			continue;
52235fd0808STejun Heo 
52335fd0808STejun Heo 		/* scan areas before each reservation for intersection */
52435fd0808STejun Heo 		for ( ; ri < rsv->cnt + 1; ri++) {
52535fd0808STejun Heo 			struct memblock_region *r = &rsv->regions[ri];
52635fd0808STejun Heo 			phys_addr_t r_start = ri ? r[-1].base + r[-1].size : 0;
52735fd0808STejun Heo 			phys_addr_t r_end = ri < rsv->cnt ? r->base : ULLONG_MAX;
52835fd0808STejun Heo 
52935fd0808STejun Heo 			/* if ri advanced past mi, break out to advance mi */
53035fd0808STejun Heo 			if (r_start >= m_end)
53135fd0808STejun Heo 				break;
53235fd0808STejun Heo 			/* if the two regions intersect, we're done */
53335fd0808STejun Heo 			if (m_start < r_end) {
53435fd0808STejun Heo 				if (out_start)
53535fd0808STejun Heo 					*out_start = max(m_start, r_start);
53635fd0808STejun Heo 				if (out_end)
53735fd0808STejun Heo 					*out_end = min(m_end, r_end);
53835fd0808STejun Heo 				if (out_nid)
53935fd0808STejun Heo 					*out_nid = memblock_get_region_node(m);
54035fd0808STejun Heo 				/*
54135fd0808STejun Heo 				 * The region which ends first is advanced
54235fd0808STejun Heo 				 * for the next iteration.
54335fd0808STejun Heo 				 */
54435fd0808STejun Heo 				if (m_end <= r_end)
54535fd0808STejun Heo 					mi++;
54635fd0808STejun Heo 				else
54735fd0808STejun Heo 					ri++;
54835fd0808STejun Heo 				*idx = (u32)mi | (u64)ri << 32;
54935fd0808STejun Heo 				return;
55035fd0808STejun Heo 			}
55135fd0808STejun Heo 		}
55235fd0808STejun Heo 	}
55335fd0808STejun Heo 
55435fd0808STejun Heo 	/* signal end of iteration */
55535fd0808STejun Heo 	*idx = ULLONG_MAX;
55635fd0808STejun Heo }
55735fd0808STejun Heo 
5587c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
5597c0caeb8STejun Heo /*
5607c0caeb8STejun Heo  * Common iterator interface used to define for_each_mem_range().
5617c0caeb8STejun Heo  */
5627c0caeb8STejun Heo void __init_memblock __next_mem_pfn_range(int *idx, int nid,
5637c0caeb8STejun Heo 				unsigned long *out_start_pfn,
5647c0caeb8STejun Heo 				unsigned long *out_end_pfn, int *out_nid)
5657c0caeb8STejun Heo {
5667c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
5677c0caeb8STejun Heo 	struct memblock_region *r;
5687c0caeb8STejun Heo 
5697c0caeb8STejun Heo 	while (++*idx < type->cnt) {
5707c0caeb8STejun Heo 		r = &type->regions[*idx];
5717c0caeb8STejun Heo 
5727c0caeb8STejun Heo 		if (PFN_UP(r->base) >= PFN_DOWN(r->base + r->size))
5737c0caeb8STejun Heo 			continue;
5747c0caeb8STejun Heo 		if (nid == MAX_NUMNODES || nid == r->nid)
5757c0caeb8STejun Heo 			break;
5767c0caeb8STejun Heo 	}
5777c0caeb8STejun Heo 	if (*idx >= type->cnt) {
5787c0caeb8STejun Heo 		*idx = -1;
5797c0caeb8STejun Heo 		return;
5807c0caeb8STejun Heo 	}
5817c0caeb8STejun Heo 
5827c0caeb8STejun Heo 	if (out_start_pfn)
5837c0caeb8STejun Heo 		*out_start_pfn = PFN_UP(r->base);
5847c0caeb8STejun Heo 	if (out_end_pfn)
5857c0caeb8STejun Heo 		*out_end_pfn = PFN_DOWN(r->base + r->size);
5867c0caeb8STejun Heo 	if (out_nid)
5877c0caeb8STejun Heo 		*out_nid = r->nid;
5887c0caeb8STejun Heo }
5897c0caeb8STejun Heo 
5907c0caeb8STejun Heo /**
5917c0caeb8STejun Heo  * memblock_set_node - set node ID on memblock regions
5927c0caeb8STejun Heo  * @base: base of area to set node ID for
5937c0caeb8STejun Heo  * @size: size of area to set node ID for
5947c0caeb8STejun Heo  * @nid: node ID to set
5957c0caeb8STejun Heo  *
5967c0caeb8STejun Heo  * Set the nid of memblock memory regions in [@base,@base+@size) to @nid.
5977c0caeb8STejun Heo  * Regions which cross the area boundaries are split as necessary.
5987c0caeb8STejun Heo  *
5997c0caeb8STejun Heo  * RETURNS:
6007c0caeb8STejun Heo  * 0 on success, -errno on failure.
6017c0caeb8STejun Heo  */
6027c0caeb8STejun Heo int __init_memblock memblock_set_node(phys_addr_t base, phys_addr_t size,
6037c0caeb8STejun Heo 				      int nid)
6047c0caeb8STejun Heo {
6057c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
6067c0caeb8STejun Heo 	phys_addr_t end = base + size;
6077c0caeb8STejun Heo 	int i;
6087c0caeb8STejun Heo 
6097c0caeb8STejun Heo 	/* we'll create at most two more regions */
6107c0caeb8STejun Heo 	while (type->cnt + 2 > type->max)
6117c0caeb8STejun Heo 		if (memblock_double_array(type) < 0)
6127c0caeb8STejun Heo 			return -ENOMEM;
6137c0caeb8STejun Heo 
6147c0caeb8STejun Heo 	for (i = 0; i < type->cnt; i++) {
6157c0caeb8STejun Heo 		struct memblock_region *rgn = &type->regions[i];
6167c0caeb8STejun Heo 		phys_addr_t rbase = rgn->base;
6177c0caeb8STejun Heo 		phys_addr_t rend = rbase + rgn->size;
6187c0caeb8STejun Heo 
6197c0caeb8STejun Heo 		if (rbase >= end)
6207c0caeb8STejun Heo 			break;
6217c0caeb8STejun Heo 		if (rend <= base)
6227c0caeb8STejun Heo 			continue;
6237c0caeb8STejun Heo 
6247c0caeb8STejun Heo 		if (rbase < base) {
6257c0caeb8STejun Heo 			/*
6267c0caeb8STejun Heo 			 * @rgn intersects from below.  Split and continue
6277c0caeb8STejun Heo 			 * to process the next region - the new top half.
6287c0caeb8STejun Heo 			 */
6297c0caeb8STejun Heo 			rgn->base = base;
6307c0caeb8STejun Heo 			rgn->size = rend - rgn->base;
6317c0caeb8STejun Heo 			memblock_insert_region(type, i, rbase, base - rbase,
6327c0caeb8STejun Heo 					       rgn->nid);
6337c0caeb8STejun Heo 		} else if (rend > end) {
6347c0caeb8STejun Heo 			/*
6357c0caeb8STejun Heo 			 * @rgn intersects from above.  Split and redo the
6367c0caeb8STejun Heo 			 * current region - the new bottom half.
6377c0caeb8STejun Heo 			 */
6387c0caeb8STejun Heo 			rgn->base = end;
6397c0caeb8STejun Heo 			rgn->size = rend - rgn->base;
6407c0caeb8STejun Heo 			memblock_insert_region(type, i--, rbase, end - rbase,
6417c0caeb8STejun Heo 					       rgn->nid);
6427c0caeb8STejun Heo 		} else {
6437c0caeb8STejun Heo 			/* @rgn is fully contained, set ->nid */
6447c0caeb8STejun Heo 			rgn->nid = nid;
6457c0caeb8STejun Heo 		}
6467c0caeb8STejun Heo 	}
6477c0caeb8STejun Heo 
6487c0caeb8STejun Heo 	memblock_merge_regions(type);
6497c0caeb8STejun Heo 	return 0;
6507c0caeb8STejun Heo }
6517c0caeb8STejun Heo #endif /* CONFIG_HAVE_MEMBLOCK_NODE_MAP */
6527c0caeb8STejun Heo 
6536ed311b2SBenjamin Herrenschmidt phys_addr_t __init __memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
65495f72d1eSYinghai Lu {
6556ed311b2SBenjamin Herrenschmidt 	phys_addr_t found;
65695f72d1eSYinghai Lu 
6576ed311b2SBenjamin Herrenschmidt 	/* We align the size to limit fragmentation. Without this, a lot of
6586ed311b2SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
6596ed311b2SBenjamin Herrenschmidt 	 */
660348968ebSTejun Heo 	size = round_up(size, align);
6616ed311b2SBenjamin Herrenschmidt 
662fc769a8eSTejun Heo 	found = memblock_find_in_range(0, max_addr, size, align);
6639c8c27e2STejun Heo 	if (found && !memblock_reserve(found, size))
6646ed311b2SBenjamin Herrenschmidt 		return found;
6656ed311b2SBenjamin Herrenschmidt 
6666ed311b2SBenjamin Herrenschmidt 	return 0;
66795f72d1eSYinghai Lu }
66895f72d1eSYinghai Lu 
6696ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
67095f72d1eSYinghai Lu {
6716ed311b2SBenjamin Herrenschmidt 	phys_addr_t alloc;
6726ed311b2SBenjamin Herrenschmidt 
6736ed311b2SBenjamin Herrenschmidt 	alloc = __memblock_alloc_base(size, align, max_addr);
6746ed311b2SBenjamin Herrenschmidt 
6756ed311b2SBenjamin Herrenschmidt 	if (alloc == 0)
6766ed311b2SBenjamin Herrenschmidt 		panic("ERROR: Failed to allocate 0x%llx bytes below 0x%llx.\n",
6776ed311b2SBenjamin Herrenschmidt 		      (unsigned long long) size, (unsigned long long) max_addr);
6786ed311b2SBenjamin Herrenschmidt 
6796ed311b2SBenjamin Herrenschmidt 	return alloc;
68095f72d1eSYinghai Lu }
68195f72d1eSYinghai Lu 
6826ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc(phys_addr_t size, phys_addr_t align)
68395f72d1eSYinghai Lu {
6846ed311b2SBenjamin Herrenschmidt 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
68595f72d1eSYinghai Lu }
68695f72d1eSYinghai Lu 
68795f72d1eSYinghai Lu 
6886ed311b2SBenjamin Herrenschmidt /*
68934e18455STejun Heo  * Additional node-local top-down allocators.
690c196f76fSBenjamin Herrenschmidt  *
691c196f76fSBenjamin Herrenschmidt  * WARNING: Only available after early_node_map[] has been populated,
692c196f76fSBenjamin Herrenschmidt  * on some architectures, that is after all the calls to add_active_range()
693c196f76fSBenjamin Herrenschmidt  * have been done to populate it.
6946ed311b2SBenjamin Herrenschmidt  */
69595f72d1eSYinghai Lu 
69634e18455STejun Heo static phys_addr_t __init memblock_nid_range_rev(phys_addr_t start,
69734e18455STejun Heo 						 phys_addr_t end, int *nid)
698c3f72b57SBenjamin Herrenschmidt {
699c196f76fSBenjamin Herrenschmidt #ifdef CONFIG_ARCH_POPULATES_NODE_MAP
700c196f76fSBenjamin Herrenschmidt 	unsigned long start_pfn, end_pfn;
701c196f76fSBenjamin Herrenschmidt 	int i;
702c196f76fSBenjamin Herrenschmidt 
703b2fea988STejun Heo 	for_each_mem_pfn_range(i, MAX_NUMNODES, &start_pfn, &end_pfn, nid)
70434e18455STejun Heo 		if (end > PFN_PHYS(start_pfn) && end <= PFN_PHYS(end_pfn))
70534e18455STejun Heo 			return max(start, PFN_PHYS(start_pfn));
706c196f76fSBenjamin Herrenschmidt #endif
707c3f72b57SBenjamin Herrenschmidt 	*nid = 0;
70834e18455STejun Heo 	return start;
709c3f72b57SBenjamin Herrenschmidt }
710c3f72b57SBenjamin Herrenschmidt 
711e6498040STejun Heo phys_addr_t __init memblock_find_in_range_node(phys_addr_t start,
712e6498040STejun Heo 					       phys_addr_t end,
7132898cc4cSBenjamin Herrenschmidt 					       phys_addr_t size,
7142898cc4cSBenjamin Herrenschmidt 					       phys_addr_t align, int nid)
71595f72d1eSYinghai Lu {
716e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *mem = &memblock.memory;
71795f72d1eSYinghai Lu 	int i;
71895f72d1eSYinghai Lu 
71995f72d1eSYinghai Lu 	BUG_ON(0 == size);
72095f72d1eSYinghai Lu 
721e6498040STejun Heo 	/* Pump up max_addr */
722e6498040STejun Heo 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
723e6498040STejun Heo 		end = memblock.current_limit;
724e6498040STejun Heo 
725e6498040STejun Heo 	for (i = mem->cnt - 1; i >= 0; i--) {
726e6498040STejun Heo 		struct memblock_region *r = &mem->regions[i];
727e6498040STejun Heo 		phys_addr_t base = max(start, r->base);
728e6498040STejun Heo 		phys_addr_t top = min(end, r->base + r->size);
729e6498040STejun Heo 
730e6498040STejun Heo 		while (base < top) {
731e6498040STejun Heo 			phys_addr_t tbase, ret;
732e6498040STejun Heo 			int tnid;
733e6498040STejun Heo 
734e6498040STejun Heo 			tbase = memblock_nid_range_rev(base, top, &tnid);
735e6498040STejun Heo 			if (nid == MAX_NUMNODES || tnid == nid) {
736e6498040STejun Heo 				ret = memblock_find_region(tbase, top, size, align);
737e6498040STejun Heo 				if (ret)
738e6498040STejun Heo 					return ret;
739e6498040STejun Heo 			}
740e6498040STejun Heo 			top = tbase;
741e6498040STejun Heo 		}
742e6498040STejun Heo 	}
743e6498040STejun Heo 
744e6498040STejun Heo 	return 0;
745e6498040STejun Heo }
746e6498040STejun Heo 
747e6498040STejun Heo phys_addr_t __init memblock_alloc_nid(phys_addr_t size, phys_addr_t align, int nid)
748e6498040STejun Heo {
749e6498040STejun Heo 	phys_addr_t found;
750e6498040STejun Heo 
751e6498040STejun Heo 	/*
752e6498040STejun Heo 	 * We align the size to limit fragmentation. Without this, a lot of
7537f219c73SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
7547f219c73SBenjamin Herrenschmidt 	 */
755348968ebSTejun Heo 	size = round_up(size, align);
7567f219c73SBenjamin Herrenschmidt 
757e6498040STejun Heo 	found = memblock_find_in_range_node(0, MEMBLOCK_ALLOC_ACCESSIBLE,
75895f72d1eSYinghai Lu 					    size, align, nid);
7599c8c27e2STejun Heo 	if (found && !memblock_reserve(found, size))
760e6498040STejun Heo 		return found;
76195f72d1eSYinghai Lu 
7629d1e2492SBenjamin Herrenschmidt 	return 0;
7639d1e2492SBenjamin Herrenschmidt }
7649d1e2492SBenjamin Herrenschmidt 
7659d1e2492SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_try_nid(phys_addr_t size, phys_addr_t align, int nid)
7669d1e2492SBenjamin Herrenschmidt {
7679d1e2492SBenjamin Herrenschmidt 	phys_addr_t res = memblock_alloc_nid(size, align, nid);
7689d1e2492SBenjamin Herrenschmidt 
7699d1e2492SBenjamin Herrenschmidt 	if (res)
7709d1e2492SBenjamin Herrenschmidt 		return res;
77115fb0972STejun Heo 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
77295f72d1eSYinghai Lu }
77395f72d1eSYinghai Lu 
7749d1e2492SBenjamin Herrenschmidt 
7759d1e2492SBenjamin Herrenschmidt /*
7769d1e2492SBenjamin Herrenschmidt  * Remaining API functions
7779d1e2492SBenjamin Herrenschmidt  */
7789d1e2492SBenjamin Herrenschmidt 
77995f72d1eSYinghai Lu /* You must call memblock_analyze() before this. */
7802898cc4cSBenjamin Herrenschmidt phys_addr_t __init memblock_phys_mem_size(void)
78195f72d1eSYinghai Lu {
7824734b594SBenjamin Herrenschmidt 	return memblock.memory_size;
78395f72d1eSYinghai Lu }
78495f72d1eSYinghai Lu 
7850a93ebefSSam Ravnborg /* lowest address */
7860a93ebefSSam Ravnborg phys_addr_t __init_memblock memblock_start_of_DRAM(void)
7870a93ebefSSam Ravnborg {
7880a93ebefSSam Ravnborg 	return memblock.memory.regions[0].base;
7890a93ebefSSam Ravnborg }
7900a93ebefSSam Ravnborg 
79110d06439SYinghai Lu phys_addr_t __init_memblock memblock_end_of_DRAM(void)
79295f72d1eSYinghai Lu {
79395f72d1eSYinghai Lu 	int idx = memblock.memory.cnt - 1;
79495f72d1eSYinghai Lu 
795e3239ff9SBenjamin Herrenschmidt 	return (memblock.memory.regions[idx].base + memblock.memory.regions[idx].size);
79695f72d1eSYinghai Lu }
79795f72d1eSYinghai Lu 
79895f72d1eSYinghai Lu /* You must call memblock_analyze() after this. */
7992898cc4cSBenjamin Herrenschmidt void __init memblock_enforce_memory_limit(phys_addr_t memory_limit)
80095f72d1eSYinghai Lu {
80195f72d1eSYinghai Lu 	unsigned long i;
8022898cc4cSBenjamin Herrenschmidt 	phys_addr_t limit;
803e3239ff9SBenjamin Herrenschmidt 	struct memblock_region *p;
80495f72d1eSYinghai Lu 
80595f72d1eSYinghai Lu 	if (!memory_limit)
80695f72d1eSYinghai Lu 		return;
80795f72d1eSYinghai Lu 
80895f72d1eSYinghai Lu 	/* Truncate the memblock regions to satisfy the memory limit. */
80995f72d1eSYinghai Lu 	limit = memory_limit;
81095f72d1eSYinghai Lu 	for (i = 0; i < memblock.memory.cnt; i++) {
811e3239ff9SBenjamin Herrenschmidt 		if (limit > memblock.memory.regions[i].size) {
812e3239ff9SBenjamin Herrenschmidt 			limit -= memblock.memory.regions[i].size;
81395f72d1eSYinghai Lu 			continue;
81495f72d1eSYinghai Lu 		}
81595f72d1eSYinghai Lu 
816e3239ff9SBenjamin Herrenschmidt 		memblock.memory.regions[i].size = limit;
81795f72d1eSYinghai Lu 		memblock.memory.cnt = i + 1;
81895f72d1eSYinghai Lu 		break;
81995f72d1eSYinghai Lu 	}
82095f72d1eSYinghai Lu 
82195f72d1eSYinghai Lu 	memory_limit = memblock_end_of_DRAM();
82295f72d1eSYinghai Lu 
82395f72d1eSYinghai Lu 	/* And truncate any reserves above the limit also. */
82495f72d1eSYinghai Lu 	for (i = 0; i < memblock.reserved.cnt; i++) {
825e3239ff9SBenjamin Herrenschmidt 		p = &memblock.reserved.regions[i];
82695f72d1eSYinghai Lu 
82795f72d1eSYinghai Lu 		if (p->base > memory_limit)
82895f72d1eSYinghai Lu 			p->size = 0;
82995f72d1eSYinghai Lu 		else if ((p->base + p->size) > memory_limit)
83095f72d1eSYinghai Lu 			p->size = memory_limit - p->base;
83195f72d1eSYinghai Lu 
83295f72d1eSYinghai Lu 		if (p->size == 0) {
83395f72d1eSYinghai Lu 			memblock_remove_region(&memblock.reserved, i);
83495f72d1eSYinghai Lu 			i--;
83595f72d1eSYinghai Lu 		}
83695f72d1eSYinghai Lu 	}
83795f72d1eSYinghai Lu }
83895f72d1eSYinghai Lu 
839cd79481dSYinghai Lu static int __init_memblock memblock_search(struct memblock_type *type, phys_addr_t addr)
84072d4b0b4SBenjamin Herrenschmidt {
84172d4b0b4SBenjamin Herrenschmidt 	unsigned int left = 0, right = type->cnt;
84272d4b0b4SBenjamin Herrenschmidt 
84372d4b0b4SBenjamin Herrenschmidt 	do {
84472d4b0b4SBenjamin Herrenschmidt 		unsigned int mid = (right + left) / 2;
84572d4b0b4SBenjamin Herrenschmidt 
84672d4b0b4SBenjamin Herrenschmidt 		if (addr < type->regions[mid].base)
84772d4b0b4SBenjamin Herrenschmidt 			right = mid;
84872d4b0b4SBenjamin Herrenschmidt 		else if (addr >= (type->regions[mid].base +
84972d4b0b4SBenjamin Herrenschmidt 				  type->regions[mid].size))
85072d4b0b4SBenjamin Herrenschmidt 			left = mid + 1;
85172d4b0b4SBenjamin Herrenschmidt 		else
85272d4b0b4SBenjamin Herrenschmidt 			return mid;
85372d4b0b4SBenjamin Herrenschmidt 	} while (left < right);
85472d4b0b4SBenjamin Herrenschmidt 	return -1;
85572d4b0b4SBenjamin Herrenschmidt }
85672d4b0b4SBenjamin Herrenschmidt 
8572898cc4cSBenjamin Herrenschmidt int __init memblock_is_reserved(phys_addr_t addr)
85895f72d1eSYinghai Lu {
85972d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.reserved, addr) != -1;
86095f72d1eSYinghai Lu }
86172d4b0b4SBenjamin Herrenschmidt 
8623661ca66SYinghai Lu int __init_memblock memblock_is_memory(phys_addr_t addr)
86372d4b0b4SBenjamin Herrenschmidt {
86472d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.memory, addr) != -1;
86572d4b0b4SBenjamin Herrenschmidt }
86672d4b0b4SBenjamin Herrenschmidt 
8673661ca66SYinghai Lu int __init_memblock memblock_is_region_memory(phys_addr_t base, phys_addr_t size)
86872d4b0b4SBenjamin Herrenschmidt {
869abb65272STomi Valkeinen 	int idx = memblock_search(&memblock.memory, base);
87072d4b0b4SBenjamin Herrenschmidt 
87172d4b0b4SBenjamin Herrenschmidt 	if (idx == -1)
87295f72d1eSYinghai Lu 		return 0;
873abb65272STomi Valkeinen 	return memblock.memory.regions[idx].base <= base &&
874abb65272STomi Valkeinen 		(memblock.memory.regions[idx].base +
875abb65272STomi Valkeinen 		 memblock.memory.regions[idx].size) >= (base + size);
87695f72d1eSYinghai Lu }
87795f72d1eSYinghai Lu 
87810d06439SYinghai Lu int __init_memblock memblock_is_region_reserved(phys_addr_t base, phys_addr_t size)
87995f72d1eSYinghai Lu {
880f1c2c19cSBenjamin Herrenschmidt 	return memblock_overlaps_region(&memblock.reserved, base, size) >= 0;
88195f72d1eSYinghai Lu }
88295f72d1eSYinghai Lu 
883e63075a3SBenjamin Herrenschmidt 
8843661ca66SYinghai Lu void __init_memblock memblock_set_current_limit(phys_addr_t limit)
885e63075a3SBenjamin Herrenschmidt {
886e63075a3SBenjamin Herrenschmidt 	memblock.current_limit = limit;
887e63075a3SBenjamin Herrenschmidt }
888e63075a3SBenjamin Herrenschmidt 
8897c0caeb8STejun Heo static void __init_memblock memblock_dump(struct memblock_type *type, char *name)
8906ed311b2SBenjamin Herrenschmidt {
8916ed311b2SBenjamin Herrenschmidt 	unsigned long long base, size;
8926ed311b2SBenjamin Herrenschmidt 	int i;
8936ed311b2SBenjamin Herrenschmidt 
8947c0caeb8STejun Heo 	pr_info(" %s.cnt  = 0x%lx\n", name, type->cnt);
8956ed311b2SBenjamin Herrenschmidt 
8967c0caeb8STejun Heo 	for (i = 0; i < type->cnt; i++) {
8977c0caeb8STejun Heo 		struct memblock_region *rgn = &type->regions[i];
8987c0caeb8STejun Heo 		char nid_buf[32] = "";
8996ed311b2SBenjamin Herrenschmidt 
9007c0caeb8STejun Heo 		base = rgn->base;
9017c0caeb8STejun Heo 		size = rgn->size;
9027c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
9037c0caeb8STejun Heo 		if (memblock_get_region_node(rgn) != MAX_NUMNODES)
9047c0caeb8STejun Heo 			snprintf(nid_buf, sizeof(nid_buf), " on node %d",
9057c0caeb8STejun Heo 				 memblock_get_region_node(rgn));
9067c0caeb8STejun Heo #endif
9077c0caeb8STejun Heo 		pr_info(" %s[%#x]\t[%#016llx-%#016llx], %#llx bytes%s\n",
9087c0caeb8STejun Heo 			name, i, base, base + size - 1, size, nid_buf);
9096ed311b2SBenjamin Herrenschmidt 	}
9106ed311b2SBenjamin Herrenschmidt }
9116ed311b2SBenjamin Herrenschmidt 
9124ff7b82fSTejun Heo void __init_memblock __memblock_dump_all(void)
9136ed311b2SBenjamin Herrenschmidt {
9146ed311b2SBenjamin Herrenschmidt 	pr_info("MEMBLOCK configuration:\n");
9156ed311b2SBenjamin Herrenschmidt 	pr_info(" memory size = 0x%llx\n", (unsigned long long)memblock.memory_size);
9166ed311b2SBenjamin Herrenschmidt 
9176ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.memory, "memory");
9186ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.reserved, "reserved");
9196ed311b2SBenjamin Herrenschmidt }
9206ed311b2SBenjamin Herrenschmidt 
9216ed311b2SBenjamin Herrenschmidt void __init memblock_analyze(void)
9226ed311b2SBenjamin Herrenschmidt {
9236ed311b2SBenjamin Herrenschmidt 	int i;
9246ed311b2SBenjamin Herrenschmidt 
9256ed311b2SBenjamin Herrenschmidt 	memblock.memory_size = 0;
9266ed311b2SBenjamin Herrenschmidt 
9276ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < memblock.memory.cnt; i++)
9286ed311b2SBenjamin Herrenschmidt 		memblock.memory_size += memblock.memory.regions[i].size;
929142b45a7SBenjamin Herrenschmidt 
930142b45a7SBenjamin Herrenschmidt 	/* We allow resizing from there */
931142b45a7SBenjamin Herrenschmidt 	memblock_can_resize = 1;
9326ed311b2SBenjamin Herrenschmidt }
9336ed311b2SBenjamin Herrenschmidt 
9346ed311b2SBenjamin Herrenschmidt static int __init early_memblock(char *p)
9356ed311b2SBenjamin Herrenschmidt {
9366ed311b2SBenjamin Herrenschmidt 	if (p && strstr(p, "debug"))
9376ed311b2SBenjamin Herrenschmidt 		memblock_debug = 1;
9386ed311b2SBenjamin Herrenschmidt 	return 0;
9396ed311b2SBenjamin Herrenschmidt }
9406ed311b2SBenjamin Herrenschmidt early_param("memblock", early_memblock);
9416ed311b2SBenjamin Herrenschmidt 
942c378ddd5STejun Heo #if defined(CONFIG_DEBUG_FS) && !defined(CONFIG_ARCH_DISCARD_MEMBLOCK)
9436d03b885SBenjamin Herrenschmidt 
9446d03b885SBenjamin Herrenschmidt static int memblock_debug_show(struct seq_file *m, void *private)
9456d03b885SBenjamin Herrenschmidt {
9466d03b885SBenjamin Herrenschmidt 	struct memblock_type *type = m->private;
9476d03b885SBenjamin Herrenschmidt 	struct memblock_region *reg;
9486d03b885SBenjamin Herrenschmidt 	int i;
9496d03b885SBenjamin Herrenschmidt 
9506d03b885SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
9516d03b885SBenjamin Herrenschmidt 		reg = &type->regions[i];
9526d03b885SBenjamin Herrenschmidt 		seq_printf(m, "%4d: ", i);
9536d03b885SBenjamin Herrenschmidt 		if (sizeof(phys_addr_t) == 4)
9546d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%08lx..0x%08lx\n",
9556d03b885SBenjamin Herrenschmidt 				   (unsigned long)reg->base,
9566d03b885SBenjamin Herrenschmidt 				   (unsigned long)(reg->base + reg->size - 1));
9576d03b885SBenjamin Herrenschmidt 		else
9586d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%016llx..0x%016llx\n",
9596d03b885SBenjamin Herrenschmidt 				   (unsigned long long)reg->base,
9606d03b885SBenjamin Herrenschmidt 				   (unsigned long long)(reg->base + reg->size - 1));
9616d03b885SBenjamin Herrenschmidt 
9626d03b885SBenjamin Herrenschmidt 	}
9636d03b885SBenjamin Herrenschmidt 	return 0;
9646d03b885SBenjamin Herrenschmidt }
9656d03b885SBenjamin Herrenschmidt 
9666d03b885SBenjamin Herrenschmidt static int memblock_debug_open(struct inode *inode, struct file *file)
9676d03b885SBenjamin Herrenschmidt {
9686d03b885SBenjamin Herrenschmidt 	return single_open(file, memblock_debug_show, inode->i_private);
9696d03b885SBenjamin Herrenschmidt }
9706d03b885SBenjamin Herrenschmidt 
9716d03b885SBenjamin Herrenschmidt static const struct file_operations memblock_debug_fops = {
9726d03b885SBenjamin Herrenschmidt 	.open = memblock_debug_open,
9736d03b885SBenjamin Herrenschmidt 	.read = seq_read,
9746d03b885SBenjamin Herrenschmidt 	.llseek = seq_lseek,
9756d03b885SBenjamin Herrenschmidt 	.release = single_release,
9766d03b885SBenjamin Herrenschmidt };
9776d03b885SBenjamin Herrenschmidt 
9786d03b885SBenjamin Herrenschmidt static int __init memblock_init_debugfs(void)
9796d03b885SBenjamin Herrenschmidt {
9806d03b885SBenjamin Herrenschmidt 	struct dentry *root = debugfs_create_dir("memblock", NULL);
9816d03b885SBenjamin Herrenschmidt 	if (!root)
9826d03b885SBenjamin Herrenschmidt 		return -ENXIO;
9836d03b885SBenjamin Herrenschmidt 	debugfs_create_file("memory", S_IRUGO, root, &memblock.memory, &memblock_debug_fops);
9846d03b885SBenjamin Herrenschmidt 	debugfs_create_file("reserved", S_IRUGO, root, &memblock.reserved, &memblock_debug_fops);
9856d03b885SBenjamin Herrenschmidt 
9866d03b885SBenjamin Herrenschmidt 	return 0;
9876d03b885SBenjamin Herrenschmidt }
9886d03b885SBenjamin Herrenschmidt __initcall(memblock_init_debugfs);
9896d03b885SBenjamin Herrenschmidt 
9906d03b885SBenjamin Herrenschmidt #endif /* CONFIG_DEBUG_FS */
991