xref: /linux/mm/memblock.c (revision 581adcbe121872429de76ff9884762de71a76200)
195f72d1eSYinghai Lu /*
295f72d1eSYinghai Lu  * Procedures for maintaining information about logical memory blocks.
395f72d1eSYinghai Lu  *
495f72d1eSYinghai Lu  * Peter Bergner, IBM Corp.	June 2001.
595f72d1eSYinghai Lu  * Copyright (C) 2001 Peter Bergner.
695f72d1eSYinghai Lu  *
795f72d1eSYinghai Lu  *      This program is free software; you can redistribute it and/or
895f72d1eSYinghai Lu  *      modify it under the terms of the GNU General Public License
995f72d1eSYinghai Lu  *      as published by the Free Software Foundation; either version
1095f72d1eSYinghai Lu  *      2 of the License, or (at your option) any later version.
1195f72d1eSYinghai Lu  */
1295f72d1eSYinghai Lu 
1395f72d1eSYinghai Lu #include <linux/kernel.h>
14142b45a7SBenjamin Herrenschmidt #include <linux/slab.h>
1595f72d1eSYinghai Lu #include <linux/init.h>
1695f72d1eSYinghai Lu #include <linux/bitops.h>
17449e8df3SBenjamin Herrenschmidt #include <linux/poison.h>
18c196f76fSBenjamin Herrenschmidt #include <linux/pfn.h>
196d03b885SBenjamin Herrenschmidt #include <linux/debugfs.h>
206d03b885SBenjamin Herrenschmidt #include <linux/seq_file.h>
2195f72d1eSYinghai Lu #include <linux/memblock.h>
2295f72d1eSYinghai Lu 
2310d06439SYinghai Lu struct memblock memblock __initdata_memblock;
2495f72d1eSYinghai Lu 
2510d06439SYinghai Lu int memblock_debug __initdata_memblock;
2610d06439SYinghai Lu int memblock_can_resize __initdata_memblock;
2710d06439SYinghai Lu static struct memblock_region memblock_memory_init_regions[INIT_MEMBLOCK_REGIONS + 1] __initdata_memblock;
2810d06439SYinghai Lu static struct memblock_region memblock_reserved_init_regions[INIT_MEMBLOCK_REGIONS + 1] __initdata_memblock;
2995f72d1eSYinghai Lu 
30142b45a7SBenjamin Herrenschmidt /* inline so we don't get a warning when pr_debug is compiled out */
31142b45a7SBenjamin Herrenschmidt static inline const char *memblock_type_name(struct memblock_type *type)
32142b45a7SBenjamin Herrenschmidt {
33142b45a7SBenjamin Herrenschmidt 	if (type == &memblock.memory)
34142b45a7SBenjamin Herrenschmidt 		return "memory";
35142b45a7SBenjamin Herrenschmidt 	else if (type == &memblock.reserved)
36142b45a7SBenjamin Herrenschmidt 		return "reserved";
37142b45a7SBenjamin Herrenschmidt 	else
38142b45a7SBenjamin Herrenschmidt 		return "unknown";
39142b45a7SBenjamin Herrenschmidt }
40142b45a7SBenjamin Herrenschmidt 
416ed311b2SBenjamin Herrenschmidt /*
426ed311b2SBenjamin Herrenschmidt  * Address comparison utilities
436ed311b2SBenjamin Herrenschmidt  */
4410d06439SYinghai Lu static unsigned long __init_memblock memblock_addrs_overlap(phys_addr_t base1, phys_addr_t size1,
452898cc4cSBenjamin Herrenschmidt 				       phys_addr_t base2, phys_addr_t size2)
4695f72d1eSYinghai Lu {
4795f72d1eSYinghai Lu 	return ((base1 < (base2 + size2)) && (base2 < (base1 + size1)));
4895f72d1eSYinghai Lu }
4995f72d1eSYinghai Lu 
502d7d3eb2SH Hartley Sweeten static long __init_memblock memblock_overlaps_region(struct memblock_type *type,
512d7d3eb2SH Hartley Sweeten 					phys_addr_t base, phys_addr_t size)
526ed311b2SBenjamin Herrenschmidt {
536ed311b2SBenjamin Herrenschmidt 	unsigned long i;
546ed311b2SBenjamin Herrenschmidt 
556ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
566ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnbase = type->regions[i].base;
576ed311b2SBenjamin Herrenschmidt 		phys_addr_t rgnsize = type->regions[i].size;
586ed311b2SBenjamin Herrenschmidt 		if (memblock_addrs_overlap(base, size, rgnbase, rgnsize))
596ed311b2SBenjamin Herrenschmidt 			break;
606ed311b2SBenjamin Herrenschmidt 	}
616ed311b2SBenjamin Herrenschmidt 
626ed311b2SBenjamin Herrenschmidt 	return (i < type->cnt) ? i : -1;
636ed311b2SBenjamin Herrenschmidt }
646ed311b2SBenjamin Herrenschmidt 
656ed311b2SBenjamin Herrenschmidt /*
666ed311b2SBenjamin Herrenschmidt  * Find, allocate, deallocate or reserve unreserved regions. All allocations
676ed311b2SBenjamin Herrenschmidt  * are top-down.
686ed311b2SBenjamin Herrenschmidt  */
696ed311b2SBenjamin Herrenschmidt 
70cd79481dSYinghai Lu static phys_addr_t __init_memblock memblock_find_region(phys_addr_t start, phys_addr_t end,
716ed311b2SBenjamin Herrenschmidt 					  phys_addr_t size, phys_addr_t align)
726ed311b2SBenjamin Herrenschmidt {
736ed311b2SBenjamin Herrenschmidt 	phys_addr_t base, res_base;
746ed311b2SBenjamin Herrenschmidt 	long j;
756ed311b2SBenjamin Herrenschmidt 
76f1af98c7SYinghai Lu 	/* In case, huge size is requested */
77f1af98c7SYinghai Lu 	if (end < size)
781f5026a7STejun Heo 		return 0;
79f1af98c7SYinghai Lu 
80348968ebSTejun Heo 	base = round_down(end - size, align);
81f1af98c7SYinghai Lu 
8225818f0fSBenjamin Herrenschmidt 	/* Prevent allocations returning 0 as it's also used to
8325818f0fSBenjamin Herrenschmidt 	 * indicate an allocation failure
8425818f0fSBenjamin Herrenschmidt 	 */
8525818f0fSBenjamin Herrenschmidt 	if (start == 0)
8625818f0fSBenjamin Herrenschmidt 		start = PAGE_SIZE;
8725818f0fSBenjamin Herrenschmidt 
886ed311b2SBenjamin Herrenschmidt 	while (start <= base) {
896ed311b2SBenjamin Herrenschmidt 		j = memblock_overlaps_region(&memblock.reserved, base, size);
906ed311b2SBenjamin Herrenschmidt 		if (j < 0)
916ed311b2SBenjamin Herrenschmidt 			return base;
926ed311b2SBenjamin Herrenschmidt 		res_base = memblock.reserved.regions[j].base;
936ed311b2SBenjamin Herrenschmidt 		if (res_base < size)
946ed311b2SBenjamin Herrenschmidt 			break;
95348968ebSTejun Heo 		base = round_down(res_base - size, align);
966ed311b2SBenjamin Herrenschmidt 	}
976ed311b2SBenjamin Herrenschmidt 
981f5026a7STejun Heo 	return 0;
996ed311b2SBenjamin Herrenschmidt }
1006ed311b2SBenjamin Herrenschmidt 
101fc769a8eSTejun Heo /*
102fc769a8eSTejun Heo  * Find a free area with specified alignment in a specific range.
103fc769a8eSTejun Heo  */
104fc769a8eSTejun Heo phys_addr_t __init_memblock memblock_find_in_range(phys_addr_t start, phys_addr_t end,
105fc769a8eSTejun Heo 					phys_addr_t size, phys_addr_t align)
1066ed311b2SBenjamin Herrenschmidt {
1076ed311b2SBenjamin Herrenschmidt 	long i;
1086ed311b2SBenjamin Herrenschmidt 
1096ed311b2SBenjamin Herrenschmidt 	BUG_ON(0 == size);
1106ed311b2SBenjamin Herrenschmidt 
1116ed311b2SBenjamin Herrenschmidt 	/* Pump up max_addr */
112fef501d4SBenjamin Herrenschmidt 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
113fef501d4SBenjamin Herrenschmidt 		end = memblock.current_limit;
1146ed311b2SBenjamin Herrenschmidt 
1156ed311b2SBenjamin Herrenschmidt 	/* We do a top-down search, this tends to limit memory
1166ed311b2SBenjamin Herrenschmidt 	 * fragmentation by keeping early boot allocs near the
1176ed311b2SBenjamin Herrenschmidt 	 * top of memory
1186ed311b2SBenjamin Herrenschmidt 	 */
1196ed311b2SBenjamin Herrenschmidt 	for (i = memblock.memory.cnt - 1; i >= 0; i--) {
1206ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblockbase = memblock.memory.regions[i].base;
1216ed311b2SBenjamin Herrenschmidt 		phys_addr_t memblocksize = memblock.memory.regions[i].size;
122fef501d4SBenjamin Herrenschmidt 		phys_addr_t bottom, top, found;
1236ed311b2SBenjamin Herrenschmidt 
1246ed311b2SBenjamin Herrenschmidt 		if (memblocksize < size)
1256ed311b2SBenjamin Herrenschmidt 			continue;
126fef501d4SBenjamin Herrenschmidt 		if ((memblockbase + memblocksize) <= start)
127fef501d4SBenjamin Herrenschmidt 			break;
128fef501d4SBenjamin Herrenschmidt 		bottom = max(memblockbase, start);
129fef501d4SBenjamin Herrenschmidt 		top = min(memblockbase + memblocksize, end);
130fef501d4SBenjamin Herrenschmidt 		if (bottom >= top)
131fef501d4SBenjamin Herrenschmidt 			continue;
132fef501d4SBenjamin Herrenschmidt 		found = memblock_find_region(bottom, top, size, align);
1331f5026a7STejun Heo 		if (found)
134fef501d4SBenjamin Herrenschmidt 			return found;
1356ed311b2SBenjamin Herrenschmidt 	}
1361f5026a7STejun Heo 	return 0;
1376ed311b2SBenjamin Herrenschmidt }
1386ed311b2SBenjamin Herrenschmidt 
1395303b68fSYinghai Lu /*
1407950c407SYinghai Lu  * Free memblock.reserved.regions
1417950c407SYinghai Lu  */
1427950c407SYinghai Lu int __init_memblock memblock_free_reserved_regions(void)
1437950c407SYinghai Lu {
1447950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1457950c407SYinghai Lu 		return 0;
1467950c407SYinghai Lu 
1477950c407SYinghai Lu 	return memblock_free(__pa(memblock.reserved.regions),
1487950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1497950c407SYinghai Lu }
1507950c407SYinghai Lu 
1517950c407SYinghai Lu /*
1527950c407SYinghai Lu  * Reserve memblock.reserved.regions
1537950c407SYinghai Lu  */
1547950c407SYinghai Lu int __init_memblock memblock_reserve_reserved_regions(void)
1557950c407SYinghai Lu {
1567950c407SYinghai Lu 	if (memblock.reserved.regions == memblock_reserved_init_regions)
1577950c407SYinghai Lu 		return 0;
1587950c407SYinghai Lu 
1597950c407SYinghai Lu 	return memblock_reserve(__pa(memblock.reserved.regions),
1607950c407SYinghai Lu 		 sizeof(struct memblock_region) * memblock.reserved.max);
1617950c407SYinghai Lu }
1627950c407SYinghai Lu 
16310d06439SYinghai Lu static void __init_memblock memblock_remove_region(struct memblock_type *type, unsigned long r)
16495f72d1eSYinghai Lu {
1657c0caeb8STejun Heo 	memmove(&type->regions[r], &type->regions[r + 1],
1667c0caeb8STejun Heo 		(type->cnt - (r + 1)) * sizeof(type->regions[r]));
167e3239ff9SBenjamin Herrenschmidt 	type->cnt--;
16895f72d1eSYinghai Lu 
1698f7a6605SBenjamin Herrenschmidt 	/* Special case for empty arrays */
1708f7a6605SBenjamin Herrenschmidt 	if (type->cnt == 0) {
1718f7a6605SBenjamin Herrenschmidt 		type->cnt = 1;
1728f7a6605SBenjamin Herrenschmidt 		type->regions[0].base = 0;
1738f7a6605SBenjamin Herrenschmidt 		type->regions[0].size = 0;
1747c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
1758f7a6605SBenjamin Herrenschmidt 	}
17695f72d1eSYinghai Lu }
17795f72d1eSYinghai Lu 
178142b45a7SBenjamin Herrenschmidt /* Defined below but needed now */
179*581adcbeSTejun Heo static int memblock_add_region(struct memblock_type *type, phys_addr_t base, phys_addr_t size);
180142b45a7SBenjamin Herrenschmidt 
18110d06439SYinghai Lu static int __init_memblock memblock_double_array(struct memblock_type *type)
182142b45a7SBenjamin Herrenschmidt {
183142b45a7SBenjamin Herrenschmidt 	struct memblock_region *new_array, *old_array;
184142b45a7SBenjamin Herrenschmidt 	phys_addr_t old_size, new_size, addr;
185142b45a7SBenjamin Herrenschmidt 	int use_slab = slab_is_available();
186142b45a7SBenjamin Herrenschmidt 
187142b45a7SBenjamin Herrenschmidt 	/* We don't allow resizing until we know about the reserved regions
188142b45a7SBenjamin Herrenschmidt 	 * of memory that aren't suitable for allocation
189142b45a7SBenjamin Herrenschmidt 	 */
190142b45a7SBenjamin Herrenschmidt 	if (!memblock_can_resize)
191142b45a7SBenjamin Herrenschmidt 		return -1;
192142b45a7SBenjamin Herrenschmidt 
193142b45a7SBenjamin Herrenschmidt 	/* Calculate new doubled size */
194142b45a7SBenjamin Herrenschmidt 	old_size = type->max * sizeof(struct memblock_region);
195142b45a7SBenjamin Herrenschmidt 	new_size = old_size << 1;
196142b45a7SBenjamin Herrenschmidt 
197142b45a7SBenjamin Herrenschmidt 	/* Try to find some space for it.
198142b45a7SBenjamin Herrenschmidt 	 *
199142b45a7SBenjamin Herrenschmidt 	 * WARNING: We assume that either slab_is_available() and we use it or
200142b45a7SBenjamin Herrenschmidt 	 * we use MEMBLOCK for allocations. That means that this is unsafe to use
201142b45a7SBenjamin Herrenschmidt 	 * when bootmem is currently active (unless bootmem itself is implemented
202142b45a7SBenjamin Herrenschmidt 	 * on top of MEMBLOCK which isn't the case yet)
203142b45a7SBenjamin Herrenschmidt 	 *
204142b45a7SBenjamin Herrenschmidt 	 * This should however not be an issue for now, as we currently only
205142b45a7SBenjamin Herrenschmidt 	 * call into MEMBLOCK while it's still active, or much later when slab is
206142b45a7SBenjamin Herrenschmidt 	 * active for memory hotplug operations
207142b45a7SBenjamin Herrenschmidt 	 */
208142b45a7SBenjamin Herrenschmidt 	if (use_slab) {
209142b45a7SBenjamin Herrenschmidt 		new_array = kmalloc(new_size, GFP_KERNEL);
2101f5026a7STejun Heo 		addr = new_array ? __pa(new_array) : 0;
211142b45a7SBenjamin Herrenschmidt 	} else
212fc769a8eSTejun Heo 		addr = memblock_find_in_range(0, MEMBLOCK_ALLOC_ACCESSIBLE, new_size, sizeof(phys_addr_t));
2131f5026a7STejun Heo 	if (!addr) {
214142b45a7SBenjamin Herrenschmidt 		pr_err("memblock: Failed to double %s array from %ld to %ld entries !\n",
215142b45a7SBenjamin Herrenschmidt 		       memblock_type_name(type), type->max, type->max * 2);
216142b45a7SBenjamin Herrenschmidt 		return -1;
217142b45a7SBenjamin Herrenschmidt 	}
218142b45a7SBenjamin Herrenschmidt 	new_array = __va(addr);
219142b45a7SBenjamin Herrenschmidt 
220ea9e4376SYinghai Lu 	memblock_dbg("memblock: %s array is doubled to %ld at [%#010llx-%#010llx]",
221ea9e4376SYinghai Lu 		 memblock_type_name(type), type->max * 2, (u64)addr, (u64)addr + new_size - 1);
222ea9e4376SYinghai Lu 
223142b45a7SBenjamin Herrenschmidt 	/* Found space, we now need to move the array over before
224142b45a7SBenjamin Herrenschmidt 	 * we add the reserved region since it may be our reserved
225142b45a7SBenjamin Herrenschmidt 	 * array itself that is full.
226142b45a7SBenjamin Herrenschmidt 	 */
227142b45a7SBenjamin Herrenschmidt 	memcpy(new_array, type->regions, old_size);
228142b45a7SBenjamin Herrenschmidt 	memset(new_array + type->max, 0, old_size);
229142b45a7SBenjamin Herrenschmidt 	old_array = type->regions;
230142b45a7SBenjamin Herrenschmidt 	type->regions = new_array;
231142b45a7SBenjamin Herrenschmidt 	type->max <<= 1;
232142b45a7SBenjamin Herrenschmidt 
233142b45a7SBenjamin Herrenschmidt 	/* If we use SLAB that's it, we are done */
234142b45a7SBenjamin Herrenschmidt 	if (use_slab)
235142b45a7SBenjamin Herrenschmidt 		return 0;
236142b45a7SBenjamin Herrenschmidt 
237142b45a7SBenjamin Herrenschmidt 	/* Add the new reserved region now. Should not fail ! */
2388f7a6605SBenjamin Herrenschmidt 	BUG_ON(memblock_add_region(&memblock.reserved, addr, new_size));
239142b45a7SBenjamin Herrenschmidt 
240142b45a7SBenjamin Herrenschmidt 	/* If the array wasn't our static init one, then free it. We only do
241142b45a7SBenjamin Herrenschmidt 	 * that before SLAB is available as later on, we don't know whether
242142b45a7SBenjamin Herrenschmidt 	 * to use kfree or free_bootmem_pages(). Shouldn't be a big deal
243142b45a7SBenjamin Herrenschmidt 	 * anyways
244142b45a7SBenjamin Herrenschmidt 	 */
245142b45a7SBenjamin Herrenschmidt 	if (old_array != memblock_memory_init_regions &&
246142b45a7SBenjamin Herrenschmidt 	    old_array != memblock_reserved_init_regions)
247142b45a7SBenjamin Herrenschmidt 		memblock_free(__pa(old_array), old_size);
248142b45a7SBenjamin Herrenschmidt 
249142b45a7SBenjamin Herrenschmidt 	return 0;
250142b45a7SBenjamin Herrenschmidt }
251142b45a7SBenjamin Herrenschmidt 
252784656f9STejun Heo /**
253784656f9STejun Heo  * memblock_merge_regions - merge neighboring compatible regions
254784656f9STejun Heo  * @type: memblock type to scan
255784656f9STejun Heo  *
256784656f9STejun Heo  * Scan @type and merge neighboring compatible regions.
257784656f9STejun Heo  */
258784656f9STejun Heo static void __init_memblock memblock_merge_regions(struct memblock_type *type)
259784656f9STejun Heo {
260784656f9STejun Heo 	int i = 0;
261784656f9STejun Heo 
262784656f9STejun Heo 	/* cnt never goes below 1 */
263784656f9STejun Heo 	while (i < type->cnt - 1) {
264784656f9STejun Heo 		struct memblock_region *this = &type->regions[i];
265784656f9STejun Heo 		struct memblock_region *next = &type->regions[i + 1];
266784656f9STejun Heo 
2677c0caeb8STejun Heo 		if (this->base + this->size != next->base ||
2687c0caeb8STejun Heo 		    memblock_get_region_node(this) !=
2697c0caeb8STejun Heo 		    memblock_get_region_node(next)) {
270784656f9STejun Heo 			BUG_ON(this->base + this->size > next->base);
271784656f9STejun Heo 			i++;
272784656f9STejun Heo 			continue;
273784656f9STejun Heo 		}
274784656f9STejun Heo 
275784656f9STejun Heo 		this->size += next->size;
276784656f9STejun Heo 		memmove(next, next + 1, (type->cnt - (i + 1)) * sizeof(*next));
277784656f9STejun Heo 		type->cnt--;
278784656f9STejun Heo 	}
279784656f9STejun Heo }
280784656f9STejun Heo 
281784656f9STejun Heo /**
282784656f9STejun Heo  * memblock_insert_region - insert new memblock region
283784656f9STejun Heo  * @type: memblock type to insert into
284784656f9STejun Heo  * @idx: index for the insertion point
285784656f9STejun Heo  * @base: base address of the new region
286784656f9STejun Heo  * @size: size of the new region
287784656f9STejun Heo  *
288784656f9STejun Heo  * Insert new memblock region [@base,@base+@size) into @type at @idx.
289784656f9STejun Heo  * @type must already have extra room to accomodate the new region.
290784656f9STejun Heo  */
291784656f9STejun Heo static void __init_memblock memblock_insert_region(struct memblock_type *type,
292784656f9STejun Heo 						   int idx, phys_addr_t base,
2937c0caeb8STejun Heo 						   phys_addr_t size, int nid)
294784656f9STejun Heo {
295784656f9STejun Heo 	struct memblock_region *rgn = &type->regions[idx];
296784656f9STejun Heo 
297784656f9STejun Heo 	BUG_ON(type->cnt >= type->max);
298784656f9STejun Heo 	memmove(rgn + 1, rgn, (type->cnt - idx) * sizeof(*rgn));
299784656f9STejun Heo 	rgn->base = base;
300784656f9STejun Heo 	rgn->size = size;
3017c0caeb8STejun Heo 	memblock_set_region_node(rgn, nid);
302784656f9STejun Heo 	type->cnt++;
303784656f9STejun Heo }
304784656f9STejun Heo 
305784656f9STejun Heo /**
306784656f9STejun Heo  * memblock_add_region - add new memblock region
307784656f9STejun Heo  * @type: memblock type to add new region into
308784656f9STejun Heo  * @base: base address of the new region
309784656f9STejun Heo  * @size: size of the new region
310784656f9STejun Heo  *
311784656f9STejun Heo  * Add new memblock region [@base,@base+@size) into @type.  The new region
312784656f9STejun Heo  * is allowed to overlap with existing ones - overlaps don't affect already
313784656f9STejun Heo  * existing regions.  @type is guaranteed to be minimal (all neighbouring
314784656f9STejun Heo  * compatible regions are merged) after the addition.
315784656f9STejun Heo  *
316784656f9STejun Heo  * RETURNS:
317784656f9STejun Heo  * 0 on success, -errno on failure.
318784656f9STejun Heo  */
319*581adcbeSTejun Heo static int __init_memblock memblock_add_region(struct memblock_type *type,
3208f7a6605SBenjamin Herrenschmidt 					       phys_addr_t base, phys_addr_t size)
32195f72d1eSYinghai Lu {
322784656f9STejun Heo 	bool insert = false;
323784656f9STejun Heo 	phys_addr_t obase = base, end = base + size;
324784656f9STejun Heo 	int i, nr_new;
32595f72d1eSYinghai Lu 
326784656f9STejun Heo 	/* special case for empty array */
327784656f9STejun Heo 	if (type->regions[0].size == 0) {
328784656f9STejun Heo 		WARN_ON(type->cnt != 1);
329784656f9STejun Heo 		type->regions[0].base = base;
330784656f9STejun Heo 		type->regions[0].size = size;
3317c0caeb8STejun Heo 		memblock_set_region_node(&type->regions[0], MAX_NUMNODES);
332784656f9STejun Heo 		return 0;
333784656f9STejun Heo 	}
334784656f9STejun Heo repeat:
335784656f9STejun Heo 	/*
336784656f9STejun Heo 	 * The following is executed twice.  Once with %false @insert and
337784656f9STejun Heo 	 * then with %true.  The first counts the number of regions needed
338784656f9STejun Heo 	 * to accomodate the new area.  The second actually inserts them.
339784656f9STejun Heo 	 */
340784656f9STejun Heo 	base = obase;
341784656f9STejun Heo 	nr_new = 0;
342784656f9STejun Heo 
3438f7a6605SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
3448f7a6605SBenjamin Herrenschmidt 		struct memblock_region *rgn = &type->regions[i];
345784656f9STejun Heo 		phys_addr_t rbase = rgn->base;
346784656f9STejun Heo 		phys_addr_t rend = rbase + rgn->size;
3478f7a6605SBenjamin Herrenschmidt 
348784656f9STejun Heo 		if (rbase >= end)
3498f7a6605SBenjamin Herrenschmidt 			break;
350784656f9STejun Heo 		if (rend <= base)
351784656f9STejun Heo 			continue;
352784656f9STejun Heo 		/*
353784656f9STejun Heo 		 * @rgn overlaps.  If it separates the lower part of new
354784656f9STejun Heo 		 * area, insert that portion.
3558f7a6605SBenjamin Herrenschmidt 		 */
356784656f9STejun Heo 		if (rbase > base) {
357784656f9STejun Heo 			nr_new++;
358784656f9STejun Heo 			if (insert)
359784656f9STejun Heo 				memblock_insert_region(type, i++, base,
3607c0caeb8STejun Heo 						rbase - base, MAX_NUMNODES);
361784656f9STejun Heo 		}
362784656f9STejun Heo 		/* area below @rend is dealt with, forget about it */
363784656f9STejun Heo 		base = min(rend, end);
3648f7a6605SBenjamin Herrenschmidt 	}
3658f7a6605SBenjamin Herrenschmidt 
366784656f9STejun Heo 	/* insert the remaining portion */
367784656f9STejun Heo 	if (base < end) {
368784656f9STejun Heo 		nr_new++;
369784656f9STejun Heo 		if (insert)
3707c0caeb8STejun Heo 			memblock_insert_region(type, i, base, end - base,
3717c0caeb8STejun Heo 					       MAX_NUMNODES);
3728f7a6605SBenjamin Herrenschmidt 	}
3738f7a6605SBenjamin Herrenschmidt 
374784656f9STejun Heo 	/*
375784656f9STejun Heo 	 * If this was the first round, resize array and repeat for actual
376784656f9STejun Heo 	 * insertions; otherwise, merge and return.
3778f7a6605SBenjamin Herrenschmidt 	 */
378784656f9STejun Heo 	if (!insert) {
379784656f9STejun Heo 		while (type->cnt + nr_new > type->max)
380784656f9STejun Heo 			if (memblock_double_array(type) < 0)
381784656f9STejun Heo 				return -ENOMEM;
382784656f9STejun Heo 		insert = true;
383784656f9STejun Heo 		goto repeat;
38495f72d1eSYinghai Lu 	} else {
385784656f9STejun Heo 		memblock_merge_regions(type);
38695f72d1eSYinghai Lu 		return 0;
38795f72d1eSYinghai Lu 	}
388784656f9STejun Heo }
38995f72d1eSYinghai Lu 
390*581adcbeSTejun Heo int __init_memblock memblock_add(phys_addr_t base, phys_addr_t size)
39195f72d1eSYinghai Lu {
392e3239ff9SBenjamin Herrenschmidt 	return memblock_add_region(&memblock.memory, base, size);
39395f72d1eSYinghai Lu }
39495f72d1eSYinghai Lu 
395*581adcbeSTejun Heo static int __init_memblock __memblock_remove(struct memblock_type *type,
3968f7a6605SBenjamin Herrenschmidt 					     phys_addr_t base, phys_addr_t size)
39795f72d1eSYinghai Lu {
3982898cc4cSBenjamin Herrenschmidt 	phys_addr_t end = base + size;
39995f72d1eSYinghai Lu 	int i;
40095f72d1eSYinghai Lu 
4018f7a6605SBenjamin Herrenschmidt 	/* Walk through the array for collisions */
402e3239ff9SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
4038f7a6605SBenjamin Herrenschmidt 		struct memblock_region *rgn = &type->regions[i];
4048f7a6605SBenjamin Herrenschmidt 		phys_addr_t rend = rgn->base + rgn->size;
40595f72d1eSYinghai Lu 
4068f7a6605SBenjamin Herrenschmidt 		/* Nothing more to do, exit */
4078f7a6605SBenjamin Herrenschmidt 		if (rgn->base > end || rgn->size == 0)
4088f7a6605SBenjamin Herrenschmidt 			break;
4098f7a6605SBenjamin Herrenschmidt 
4108f7a6605SBenjamin Herrenschmidt 		/* If we fully enclose the block, drop it */
4118f7a6605SBenjamin Herrenschmidt 		if (base <= rgn->base && end >= rend) {
4128f7a6605SBenjamin Herrenschmidt 			memblock_remove_region(type, i--);
4138f7a6605SBenjamin Herrenschmidt 			continue;
4148f7a6605SBenjamin Herrenschmidt 		}
4158f7a6605SBenjamin Herrenschmidt 
4168f7a6605SBenjamin Herrenschmidt 		/* If we are fully enclosed within a block
4178f7a6605SBenjamin Herrenschmidt 		 * then we need to split it and we are done
4188f7a6605SBenjamin Herrenschmidt 		 */
4198f7a6605SBenjamin Herrenschmidt 		if (base > rgn->base && end < rend) {
4208f7a6605SBenjamin Herrenschmidt 			rgn->size = base - rgn->base;
4218f7a6605SBenjamin Herrenschmidt 			if (!memblock_add_region(type, end, rend - end))
4228f7a6605SBenjamin Herrenschmidt 				return 0;
4238f7a6605SBenjamin Herrenschmidt 			/* Failure to split is bad, we at least
4248f7a6605SBenjamin Herrenschmidt 			 * restore the block before erroring
4258f7a6605SBenjamin Herrenschmidt 			 */
4268f7a6605SBenjamin Herrenschmidt 			rgn->size = rend - rgn->base;
4278f7a6605SBenjamin Herrenschmidt 			WARN_ON(1);
4288f7a6605SBenjamin Herrenschmidt 			return -1;
4298f7a6605SBenjamin Herrenschmidt 		}
4308f7a6605SBenjamin Herrenschmidt 
4318f7a6605SBenjamin Herrenschmidt 		/* Check if we need to trim the bottom of a block */
4328f7a6605SBenjamin Herrenschmidt 		if (rgn->base < end && rend > end) {
4338f7a6605SBenjamin Herrenschmidt 			rgn->size -= end - rgn->base;
4348f7a6605SBenjamin Herrenschmidt 			rgn->base = end;
43595f72d1eSYinghai Lu 			break;
43695f72d1eSYinghai Lu 		}
43795f72d1eSYinghai Lu 
4388f7a6605SBenjamin Herrenschmidt 		/* And check if we need to trim the top of a block */
4398f7a6605SBenjamin Herrenschmidt 		if (base < rend)
4408f7a6605SBenjamin Herrenschmidt 			rgn->size -= rend - base;
44195f72d1eSYinghai Lu 
44295f72d1eSYinghai Lu 	}
44395f72d1eSYinghai Lu 	return 0;
44495f72d1eSYinghai Lu }
44595f72d1eSYinghai Lu 
446*581adcbeSTejun Heo int __init_memblock memblock_remove(phys_addr_t base, phys_addr_t size)
44795f72d1eSYinghai Lu {
44895f72d1eSYinghai Lu 	return __memblock_remove(&memblock.memory, base, size);
44995f72d1eSYinghai Lu }
45095f72d1eSYinghai Lu 
451*581adcbeSTejun Heo int __init_memblock memblock_free(phys_addr_t base, phys_addr_t size)
45295f72d1eSYinghai Lu {
45324aa0788STejun Heo 	memblock_dbg("   memblock_free: [%#016llx-%#016llx] %pF\n",
454a150439cSH. Peter Anvin 		     (unsigned long long)base,
455a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
456a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
45724aa0788STejun Heo 
45895f72d1eSYinghai Lu 	return __memblock_remove(&memblock.reserved, base, size);
45995f72d1eSYinghai Lu }
46095f72d1eSYinghai Lu 
461*581adcbeSTejun Heo int __init_memblock memblock_reserve(phys_addr_t base, phys_addr_t size)
46295f72d1eSYinghai Lu {
463e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *_rgn = &memblock.reserved;
46495f72d1eSYinghai Lu 
46524aa0788STejun Heo 	memblock_dbg("memblock_reserve: [%#016llx-%#016llx] %pF\n",
466a150439cSH. Peter Anvin 		     (unsigned long long)base,
467a150439cSH. Peter Anvin 		     (unsigned long long)base + size,
468a150439cSH. Peter Anvin 		     (void *)_RET_IP_);
46995f72d1eSYinghai Lu 	BUG_ON(0 == size);
47095f72d1eSYinghai Lu 
47195f72d1eSYinghai Lu 	return memblock_add_region(_rgn, base, size);
47295f72d1eSYinghai Lu }
47395f72d1eSYinghai Lu 
47435fd0808STejun Heo /**
47535fd0808STejun Heo  * __next_free_mem_range - next function for for_each_free_mem_range()
47635fd0808STejun Heo  * @idx: pointer to u64 loop variable
47735fd0808STejun Heo  * @nid: nid: node selector, %MAX_NUMNODES for all nodes
47835fd0808STejun Heo  * @p_start: ptr to phys_addr_t for start address of the range, can be %NULL
47935fd0808STejun Heo  * @p_end: ptr to phys_addr_t for end address of the range, can be %NULL
48035fd0808STejun Heo  * @p_nid: ptr to int for nid of the range, can be %NULL
48135fd0808STejun Heo  *
48235fd0808STejun Heo  * Find the first free area from *@idx which matches @nid, fill the out
48335fd0808STejun Heo  * parameters, and update *@idx for the next iteration.  The lower 32bit of
48435fd0808STejun Heo  * *@idx contains index into memory region and the upper 32bit indexes the
48535fd0808STejun Heo  * areas before each reserved region.  For example, if reserved regions
48635fd0808STejun Heo  * look like the following,
48735fd0808STejun Heo  *
48835fd0808STejun Heo  *	0:[0-16), 1:[32-48), 2:[128-130)
48935fd0808STejun Heo  *
49035fd0808STejun Heo  * The upper 32bit indexes the following regions.
49135fd0808STejun Heo  *
49235fd0808STejun Heo  *	0:[0-0), 1:[16-32), 2:[48-128), 3:[130-MAX)
49335fd0808STejun Heo  *
49435fd0808STejun Heo  * As both region arrays are sorted, the function advances the two indices
49535fd0808STejun Heo  * in lockstep and returns each intersection.
49635fd0808STejun Heo  */
49735fd0808STejun Heo void __init_memblock __next_free_mem_range(u64 *idx, int nid,
49835fd0808STejun Heo 					   phys_addr_t *out_start,
49935fd0808STejun Heo 					   phys_addr_t *out_end, int *out_nid)
50035fd0808STejun Heo {
50135fd0808STejun Heo 	struct memblock_type *mem = &memblock.memory;
50235fd0808STejun Heo 	struct memblock_type *rsv = &memblock.reserved;
50335fd0808STejun Heo 	int mi = *idx & 0xffffffff;
50435fd0808STejun Heo 	int ri = *idx >> 32;
50535fd0808STejun Heo 
50635fd0808STejun Heo 	for ( ; mi < mem->cnt; mi++) {
50735fd0808STejun Heo 		struct memblock_region *m = &mem->regions[mi];
50835fd0808STejun Heo 		phys_addr_t m_start = m->base;
50935fd0808STejun Heo 		phys_addr_t m_end = m->base + m->size;
51035fd0808STejun Heo 
51135fd0808STejun Heo 		/* only memory regions are associated with nodes, check it */
51235fd0808STejun Heo 		if (nid != MAX_NUMNODES && nid != memblock_get_region_node(m))
51335fd0808STejun Heo 			continue;
51435fd0808STejun Heo 
51535fd0808STejun Heo 		/* scan areas before each reservation for intersection */
51635fd0808STejun Heo 		for ( ; ri < rsv->cnt + 1; ri++) {
51735fd0808STejun Heo 			struct memblock_region *r = &rsv->regions[ri];
51835fd0808STejun Heo 			phys_addr_t r_start = ri ? r[-1].base + r[-1].size : 0;
51935fd0808STejun Heo 			phys_addr_t r_end = ri < rsv->cnt ? r->base : ULLONG_MAX;
52035fd0808STejun Heo 
52135fd0808STejun Heo 			/* if ri advanced past mi, break out to advance mi */
52235fd0808STejun Heo 			if (r_start >= m_end)
52335fd0808STejun Heo 				break;
52435fd0808STejun Heo 			/* if the two regions intersect, we're done */
52535fd0808STejun Heo 			if (m_start < r_end) {
52635fd0808STejun Heo 				if (out_start)
52735fd0808STejun Heo 					*out_start = max(m_start, r_start);
52835fd0808STejun Heo 				if (out_end)
52935fd0808STejun Heo 					*out_end = min(m_end, r_end);
53035fd0808STejun Heo 				if (out_nid)
53135fd0808STejun Heo 					*out_nid = memblock_get_region_node(m);
53235fd0808STejun Heo 				/*
53335fd0808STejun Heo 				 * The region which ends first is advanced
53435fd0808STejun Heo 				 * for the next iteration.
53535fd0808STejun Heo 				 */
53635fd0808STejun Heo 				if (m_end <= r_end)
53735fd0808STejun Heo 					mi++;
53835fd0808STejun Heo 				else
53935fd0808STejun Heo 					ri++;
54035fd0808STejun Heo 				*idx = (u32)mi | (u64)ri << 32;
54135fd0808STejun Heo 				return;
54235fd0808STejun Heo 			}
54335fd0808STejun Heo 		}
54435fd0808STejun Heo 	}
54535fd0808STejun Heo 
54635fd0808STejun Heo 	/* signal end of iteration */
54735fd0808STejun Heo 	*idx = ULLONG_MAX;
54835fd0808STejun Heo }
54935fd0808STejun Heo 
5507c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
5517c0caeb8STejun Heo /*
5527c0caeb8STejun Heo  * Common iterator interface used to define for_each_mem_range().
5537c0caeb8STejun Heo  */
5547c0caeb8STejun Heo void __init_memblock __next_mem_pfn_range(int *idx, int nid,
5557c0caeb8STejun Heo 				unsigned long *out_start_pfn,
5567c0caeb8STejun Heo 				unsigned long *out_end_pfn, int *out_nid)
5577c0caeb8STejun Heo {
5587c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
5597c0caeb8STejun Heo 	struct memblock_region *r;
5607c0caeb8STejun Heo 
5617c0caeb8STejun Heo 	while (++*idx < type->cnt) {
5627c0caeb8STejun Heo 		r = &type->regions[*idx];
5637c0caeb8STejun Heo 
5647c0caeb8STejun Heo 		if (PFN_UP(r->base) >= PFN_DOWN(r->base + r->size))
5657c0caeb8STejun Heo 			continue;
5667c0caeb8STejun Heo 		if (nid == MAX_NUMNODES || nid == r->nid)
5677c0caeb8STejun Heo 			break;
5687c0caeb8STejun Heo 	}
5697c0caeb8STejun Heo 	if (*idx >= type->cnt) {
5707c0caeb8STejun Heo 		*idx = -1;
5717c0caeb8STejun Heo 		return;
5727c0caeb8STejun Heo 	}
5737c0caeb8STejun Heo 
5747c0caeb8STejun Heo 	if (out_start_pfn)
5757c0caeb8STejun Heo 		*out_start_pfn = PFN_UP(r->base);
5767c0caeb8STejun Heo 	if (out_end_pfn)
5777c0caeb8STejun Heo 		*out_end_pfn = PFN_DOWN(r->base + r->size);
5787c0caeb8STejun Heo 	if (out_nid)
5797c0caeb8STejun Heo 		*out_nid = r->nid;
5807c0caeb8STejun Heo }
5817c0caeb8STejun Heo 
5827c0caeb8STejun Heo /**
5837c0caeb8STejun Heo  * memblock_set_node - set node ID on memblock regions
5847c0caeb8STejun Heo  * @base: base of area to set node ID for
5857c0caeb8STejun Heo  * @size: size of area to set node ID for
5867c0caeb8STejun Heo  * @nid: node ID to set
5877c0caeb8STejun Heo  *
5887c0caeb8STejun Heo  * Set the nid of memblock memory regions in [@base,@base+@size) to @nid.
5897c0caeb8STejun Heo  * Regions which cross the area boundaries are split as necessary.
5907c0caeb8STejun Heo  *
5917c0caeb8STejun Heo  * RETURNS:
5927c0caeb8STejun Heo  * 0 on success, -errno on failure.
5937c0caeb8STejun Heo  */
5947c0caeb8STejun Heo int __init_memblock memblock_set_node(phys_addr_t base, phys_addr_t size,
5957c0caeb8STejun Heo 				      int nid)
5967c0caeb8STejun Heo {
5977c0caeb8STejun Heo 	struct memblock_type *type = &memblock.memory;
5987c0caeb8STejun Heo 	phys_addr_t end = base + size;
5997c0caeb8STejun Heo 	int i;
6007c0caeb8STejun Heo 
6017c0caeb8STejun Heo 	/* we'll create at most two more regions */
6027c0caeb8STejun Heo 	while (type->cnt + 2 > type->max)
6037c0caeb8STejun Heo 		if (memblock_double_array(type) < 0)
6047c0caeb8STejun Heo 			return -ENOMEM;
6057c0caeb8STejun Heo 
6067c0caeb8STejun Heo 	for (i = 0; i < type->cnt; i++) {
6077c0caeb8STejun Heo 		struct memblock_region *rgn = &type->regions[i];
6087c0caeb8STejun Heo 		phys_addr_t rbase = rgn->base;
6097c0caeb8STejun Heo 		phys_addr_t rend = rbase + rgn->size;
6107c0caeb8STejun Heo 
6117c0caeb8STejun Heo 		if (rbase >= end)
6127c0caeb8STejun Heo 			break;
6137c0caeb8STejun Heo 		if (rend <= base)
6147c0caeb8STejun Heo 			continue;
6157c0caeb8STejun Heo 
6167c0caeb8STejun Heo 		if (rbase < base) {
6177c0caeb8STejun Heo 			/*
6187c0caeb8STejun Heo 			 * @rgn intersects from below.  Split and continue
6197c0caeb8STejun Heo 			 * to process the next region - the new top half.
6207c0caeb8STejun Heo 			 */
6217c0caeb8STejun Heo 			rgn->base = base;
6227c0caeb8STejun Heo 			rgn->size = rend - rgn->base;
6237c0caeb8STejun Heo 			memblock_insert_region(type, i, rbase, base - rbase,
6247c0caeb8STejun Heo 					       rgn->nid);
6257c0caeb8STejun Heo 		} else if (rend > end) {
6267c0caeb8STejun Heo 			/*
6277c0caeb8STejun Heo 			 * @rgn intersects from above.  Split and redo the
6287c0caeb8STejun Heo 			 * current region - the new bottom half.
6297c0caeb8STejun Heo 			 */
6307c0caeb8STejun Heo 			rgn->base = end;
6317c0caeb8STejun Heo 			rgn->size = rend - rgn->base;
6327c0caeb8STejun Heo 			memblock_insert_region(type, i--, rbase, end - rbase,
6337c0caeb8STejun Heo 					       rgn->nid);
6347c0caeb8STejun Heo 		} else {
6357c0caeb8STejun Heo 			/* @rgn is fully contained, set ->nid */
6367c0caeb8STejun Heo 			rgn->nid = nid;
6377c0caeb8STejun Heo 		}
6387c0caeb8STejun Heo 	}
6397c0caeb8STejun Heo 
6407c0caeb8STejun Heo 	memblock_merge_regions(type);
6417c0caeb8STejun Heo 	return 0;
6427c0caeb8STejun Heo }
6437c0caeb8STejun Heo #endif /* CONFIG_HAVE_MEMBLOCK_NODE_MAP */
6447c0caeb8STejun Heo 
6456ed311b2SBenjamin Herrenschmidt phys_addr_t __init __memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
64695f72d1eSYinghai Lu {
6476ed311b2SBenjamin Herrenschmidt 	phys_addr_t found;
64895f72d1eSYinghai Lu 
6496ed311b2SBenjamin Herrenschmidt 	/* We align the size to limit fragmentation. Without this, a lot of
6506ed311b2SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
6516ed311b2SBenjamin Herrenschmidt 	 */
652348968ebSTejun Heo 	size = round_up(size, align);
6536ed311b2SBenjamin Herrenschmidt 
654fc769a8eSTejun Heo 	found = memblock_find_in_range(0, max_addr, size, align);
6551f5026a7STejun Heo 	if (found && !memblock_add_region(&memblock.reserved, found, size))
6566ed311b2SBenjamin Herrenschmidt 		return found;
6576ed311b2SBenjamin Herrenschmidt 
6586ed311b2SBenjamin Herrenschmidt 	return 0;
65995f72d1eSYinghai Lu }
66095f72d1eSYinghai Lu 
6616ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_base(phys_addr_t size, phys_addr_t align, phys_addr_t max_addr)
66295f72d1eSYinghai Lu {
6636ed311b2SBenjamin Herrenschmidt 	phys_addr_t alloc;
6646ed311b2SBenjamin Herrenschmidt 
6656ed311b2SBenjamin Herrenschmidt 	alloc = __memblock_alloc_base(size, align, max_addr);
6666ed311b2SBenjamin Herrenschmidt 
6676ed311b2SBenjamin Herrenschmidt 	if (alloc == 0)
6686ed311b2SBenjamin Herrenschmidt 		panic("ERROR: Failed to allocate 0x%llx bytes below 0x%llx.\n",
6696ed311b2SBenjamin Herrenschmidt 		      (unsigned long long) size, (unsigned long long) max_addr);
6706ed311b2SBenjamin Herrenschmidt 
6716ed311b2SBenjamin Herrenschmidt 	return alloc;
67295f72d1eSYinghai Lu }
67395f72d1eSYinghai Lu 
6746ed311b2SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc(phys_addr_t size, phys_addr_t align)
67595f72d1eSYinghai Lu {
6766ed311b2SBenjamin Herrenschmidt 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
67795f72d1eSYinghai Lu }
67895f72d1eSYinghai Lu 
67995f72d1eSYinghai Lu 
6806ed311b2SBenjamin Herrenschmidt /*
68134e18455STejun Heo  * Additional node-local top-down allocators.
682c196f76fSBenjamin Herrenschmidt  *
683c196f76fSBenjamin Herrenschmidt  * WARNING: Only available after early_node_map[] has been populated,
684c196f76fSBenjamin Herrenschmidt  * on some architectures, that is after all the calls to add_active_range()
685c196f76fSBenjamin Herrenschmidt  * have been done to populate it.
6866ed311b2SBenjamin Herrenschmidt  */
68795f72d1eSYinghai Lu 
68834e18455STejun Heo static phys_addr_t __init memblock_nid_range_rev(phys_addr_t start,
68934e18455STejun Heo 						 phys_addr_t end, int *nid)
690c3f72b57SBenjamin Herrenschmidt {
691c196f76fSBenjamin Herrenschmidt #ifdef CONFIG_ARCH_POPULATES_NODE_MAP
692c196f76fSBenjamin Herrenschmidt 	unsigned long start_pfn, end_pfn;
693c196f76fSBenjamin Herrenschmidt 	int i;
694c196f76fSBenjamin Herrenschmidt 
695b2fea988STejun Heo 	for_each_mem_pfn_range(i, MAX_NUMNODES, &start_pfn, &end_pfn, nid)
69634e18455STejun Heo 		if (end > PFN_PHYS(start_pfn) && end <= PFN_PHYS(end_pfn))
69734e18455STejun Heo 			return max(start, PFN_PHYS(start_pfn));
698c196f76fSBenjamin Herrenschmidt #endif
699c3f72b57SBenjamin Herrenschmidt 	*nid = 0;
70034e18455STejun Heo 	return start;
701c3f72b57SBenjamin Herrenschmidt }
702c3f72b57SBenjamin Herrenschmidt 
703e6498040STejun Heo phys_addr_t __init memblock_find_in_range_node(phys_addr_t start,
704e6498040STejun Heo 					       phys_addr_t end,
7052898cc4cSBenjamin Herrenschmidt 					       phys_addr_t size,
7062898cc4cSBenjamin Herrenschmidt 					       phys_addr_t align, int nid)
70795f72d1eSYinghai Lu {
708e3239ff9SBenjamin Herrenschmidt 	struct memblock_type *mem = &memblock.memory;
70995f72d1eSYinghai Lu 	int i;
71095f72d1eSYinghai Lu 
71195f72d1eSYinghai Lu 	BUG_ON(0 == size);
71295f72d1eSYinghai Lu 
713e6498040STejun Heo 	/* Pump up max_addr */
714e6498040STejun Heo 	if (end == MEMBLOCK_ALLOC_ACCESSIBLE)
715e6498040STejun Heo 		end = memblock.current_limit;
716e6498040STejun Heo 
717e6498040STejun Heo 	for (i = mem->cnt - 1; i >= 0; i--) {
718e6498040STejun Heo 		struct memblock_region *r = &mem->regions[i];
719e6498040STejun Heo 		phys_addr_t base = max(start, r->base);
720e6498040STejun Heo 		phys_addr_t top = min(end, r->base + r->size);
721e6498040STejun Heo 
722e6498040STejun Heo 		while (base < top) {
723e6498040STejun Heo 			phys_addr_t tbase, ret;
724e6498040STejun Heo 			int tnid;
725e6498040STejun Heo 
726e6498040STejun Heo 			tbase = memblock_nid_range_rev(base, top, &tnid);
727e6498040STejun Heo 			if (nid == MAX_NUMNODES || tnid == nid) {
728e6498040STejun Heo 				ret = memblock_find_region(tbase, top, size, align);
729e6498040STejun Heo 				if (ret)
730e6498040STejun Heo 					return ret;
731e6498040STejun Heo 			}
732e6498040STejun Heo 			top = tbase;
733e6498040STejun Heo 		}
734e6498040STejun Heo 	}
735e6498040STejun Heo 
736e6498040STejun Heo 	return 0;
737e6498040STejun Heo }
738e6498040STejun Heo 
739e6498040STejun Heo phys_addr_t __init memblock_alloc_nid(phys_addr_t size, phys_addr_t align, int nid)
740e6498040STejun Heo {
741e6498040STejun Heo 	phys_addr_t found;
742e6498040STejun Heo 
743e6498040STejun Heo 	/*
744e6498040STejun Heo 	 * We align the size to limit fragmentation. Without this, a lot of
7457f219c73SBenjamin Herrenschmidt 	 * small allocs quickly eat up the whole reserve array on sparc
7467f219c73SBenjamin Herrenschmidt 	 */
747348968ebSTejun Heo 	size = round_up(size, align);
7487f219c73SBenjamin Herrenschmidt 
749e6498040STejun Heo 	found = memblock_find_in_range_node(0, MEMBLOCK_ALLOC_ACCESSIBLE,
75095f72d1eSYinghai Lu 					    size, align, nid);
751e6498040STejun Heo 	if (found && !memblock_add_region(&memblock.reserved, found, size))
752e6498040STejun Heo 		return found;
75395f72d1eSYinghai Lu 
7549d1e2492SBenjamin Herrenschmidt 	return 0;
7559d1e2492SBenjamin Herrenschmidt }
7569d1e2492SBenjamin Herrenschmidt 
7579d1e2492SBenjamin Herrenschmidt phys_addr_t __init memblock_alloc_try_nid(phys_addr_t size, phys_addr_t align, int nid)
7589d1e2492SBenjamin Herrenschmidt {
7599d1e2492SBenjamin Herrenschmidt 	phys_addr_t res = memblock_alloc_nid(size, align, nid);
7609d1e2492SBenjamin Herrenschmidt 
7619d1e2492SBenjamin Herrenschmidt 	if (res)
7629d1e2492SBenjamin Herrenschmidt 		return res;
76315fb0972STejun Heo 	return memblock_alloc_base(size, align, MEMBLOCK_ALLOC_ACCESSIBLE);
76495f72d1eSYinghai Lu }
76595f72d1eSYinghai Lu 
7669d1e2492SBenjamin Herrenschmidt 
7679d1e2492SBenjamin Herrenschmidt /*
7689d1e2492SBenjamin Herrenschmidt  * Remaining API functions
7699d1e2492SBenjamin Herrenschmidt  */
7709d1e2492SBenjamin Herrenschmidt 
77195f72d1eSYinghai Lu /* You must call memblock_analyze() before this. */
7722898cc4cSBenjamin Herrenschmidt phys_addr_t __init memblock_phys_mem_size(void)
77395f72d1eSYinghai Lu {
7744734b594SBenjamin Herrenschmidt 	return memblock.memory_size;
77595f72d1eSYinghai Lu }
77695f72d1eSYinghai Lu 
7770a93ebefSSam Ravnborg /* lowest address */
7780a93ebefSSam Ravnborg phys_addr_t __init_memblock memblock_start_of_DRAM(void)
7790a93ebefSSam Ravnborg {
7800a93ebefSSam Ravnborg 	return memblock.memory.regions[0].base;
7810a93ebefSSam Ravnborg }
7820a93ebefSSam Ravnborg 
78310d06439SYinghai Lu phys_addr_t __init_memblock memblock_end_of_DRAM(void)
78495f72d1eSYinghai Lu {
78595f72d1eSYinghai Lu 	int idx = memblock.memory.cnt - 1;
78695f72d1eSYinghai Lu 
787e3239ff9SBenjamin Herrenschmidt 	return (memblock.memory.regions[idx].base + memblock.memory.regions[idx].size);
78895f72d1eSYinghai Lu }
78995f72d1eSYinghai Lu 
79095f72d1eSYinghai Lu /* You must call memblock_analyze() after this. */
7912898cc4cSBenjamin Herrenschmidt void __init memblock_enforce_memory_limit(phys_addr_t memory_limit)
79295f72d1eSYinghai Lu {
79395f72d1eSYinghai Lu 	unsigned long i;
7942898cc4cSBenjamin Herrenschmidt 	phys_addr_t limit;
795e3239ff9SBenjamin Herrenschmidt 	struct memblock_region *p;
79695f72d1eSYinghai Lu 
79795f72d1eSYinghai Lu 	if (!memory_limit)
79895f72d1eSYinghai Lu 		return;
79995f72d1eSYinghai Lu 
80095f72d1eSYinghai Lu 	/* Truncate the memblock regions to satisfy the memory limit. */
80195f72d1eSYinghai Lu 	limit = memory_limit;
80295f72d1eSYinghai Lu 	for (i = 0; i < memblock.memory.cnt; i++) {
803e3239ff9SBenjamin Herrenschmidt 		if (limit > memblock.memory.regions[i].size) {
804e3239ff9SBenjamin Herrenschmidt 			limit -= memblock.memory.regions[i].size;
80595f72d1eSYinghai Lu 			continue;
80695f72d1eSYinghai Lu 		}
80795f72d1eSYinghai Lu 
808e3239ff9SBenjamin Herrenschmidt 		memblock.memory.regions[i].size = limit;
80995f72d1eSYinghai Lu 		memblock.memory.cnt = i + 1;
81095f72d1eSYinghai Lu 		break;
81195f72d1eSYinghai Lu 	}
81295f72d1eSYinghai Lu 
81395f72d1eSYinghai Lu 	memory_limit = memblock_end_of_DRAM();
81495f72d1eSYinghai Lu 
81595f72d1eSYinghai Lu 	/* And truncate any reserves above the limit also. */
81695f72d1eSYinghai Lu 	for (i = 0; i < memblock.reserved.cnt; i++) {
817e3239ff9SBenjamin Herrenschmidt 		p = &memblock.reserved.regions[i];
81895f72d1eSYinghai Lu 
81995f72d1eSYinghai Lu 		if (p->base > memory_limit)
82095f72d1eSYinghai Lu 			p->size = 0;
82195f72d1eSYinghai Lu 		else if ((p->base + p->size) > memory_limit)
82295f72d1eSYinghai Lu 			p->size = memory_limit - p->base;
82395f72d1eSYinghai Lu 
82495f72d1eSYinghai Lu 		if (p->size == 0) {
82595f72d1eSYinghai Lu 			memblock_remove_region(&memblock.reserved, i);
82695f72d1eSYinghai Lu 			i--;
82795f72d1eSYinghai Lu 		}
82895f72d1eSYinghai Lu 	}
82995f72d1eSYinghai Lu }
83095f72d1eSYinghai Lu 
831cd79481dSYinghai Lu static int __init_memblock memblock_search(struct memblock_type *type, phys_addr_t addr)
83272d4b0b4SBenjamin Herrenschmidt {
83372d4b0b4SBenjamin Herrenschmidt 	unsigned int left = 0, right = type->cnt;
83472d4b0b4SBenjamin Herrenschmidt 
83572d4b0b4SBenjamin Herrenschmidt 	do {
83672d4b0b4SBenjamin Herrenschmidt 		unsigned int mid = (right + left) / 2;
83772d4b0b4SBenjamin Herrenschmidt 
83872d4b0b4SBenjamin Herrenschmidt 		if (addr < type->regions[mid].base)
83972d4b0b4SBenjamin Herrenschmidt 			right = mid;
84072d4b0b4SBenjamin Herrenschmidt 		else if (addr >= (type->regions[mid].base +
84172d4b0b4SBenjamin Herrenschmidt 				  type->regions[mid].size))
84272d4b0b4SBenjamin Herrenschmidt 			left = mid + 1;
84372d4b0b4SBenjamin Herrenschmidt 		else
84472d4b0b4SBenjamin Herrenschmidt 			return mid;
84572d4b0b4SBenjamin Herrenschmidt 	} while (left < right);
84672d4b0b4SBenjamin Herrenschmidt 	return -1;
84772d4b0b4SBenjamin Herrenschmidt }
84872d4b0b4SBenjamin Herrenschmidt 
8492898cc4cSBenjamin Herrenschmidt int __init memblock_is_reserved(phys_addr_t addr)
85095f72d1eSYinghai Lu {
85172d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.reserved, addr) != -1;
85295f72d1eSYinghai Lu }
85372d4b0b4SBenjamin Herrenschmidt 
8543661ca66SYinghai Lu int __init_memblock memblock_is_memory(phys_addr_t addr)
85572d4b0b4SBenjamin Herrenschmidt {
85672d4b0b4SBenjamin Herrenschmidt 	return memblock_search(&memblock.memory, addr) != -1;
85772d4b0b4SBenjamin Herrenschmidt }
85872d4b0b4SBenjamin Herrenschmidt 
8593661ca66SYinghai Lu int __init_memblock memblock_is_region_memory(phys_addr_t base, phys_addr_t size)
86072d4b0b4SBenjamin Herrenschmidt {
861abb65272STomi Valkeinen 	int idx = memblock_search(&memblock.memory, base);
86272d4b0b4SBenjamin Herrenschmidt 
86372d4b0b4SBenjamin Herrenschmidt 	if (idx == -1)
86495f72d1eSYinghai Lu 		return 0;
865abb65272STomi Valkeinen 	return memblock.memory.regions[idx].base <= base &&
866abb65272STomi Valkeinen 		(memblock.memory.regions[idx].base +
867abb65272STomi Valkeinen 		 memblock.memory.regions[idx].size) >= (base + size);
86895f72d1eSYinghai Lu }
86995f72d1eSYinghai Lu 
87010d06439SYinghai Lu int __init_memblock memblock_is_region_reserved(phys_addr_t base, phys_addr_t size)
87195f72d1eSYinghai Lu {
872f1c2c19cSBenjamin Herrenschmidt 	return memblock_overlaps_region(&memblock.reserved, base, size) >= 0;
87395f72d1eSYinghai Lu }
87495f72d1eSYinghai Lu 
875e63075a3SBenjamin Herrenschmidt 
8763661ca66SYinghai Lu void __init_memblock memblock_set_current_limit(phys_addr_t limit)
877e63075a3SBenjamin Herrenschmidt {
878e63075a3SBenjamin Herrenschmidt 	memblock.current_limit = limit;
879e63075a3SBenjamin Herrenschmidt }
880e63075a3SBenjamin Herrenschmidt 
8817c0caeb8STejun Heo static void __init_memblock memblock_dump(struct memblock_type *type, char *name)
8826ed311b2SBenjamin Herrenschmidt {
8836ed311b2SBenjamin Herrenschmidt 	unsigned long long base, size;
8846ed311b2SBenjamin Herrenschmidt 	int i;
8856ed311b2SBenjamin Herrenschmidt 
8867c0caeb8STejun Heo 	pr_info(" %s.cnt  = 0x%lx\n", name, type->cnt);
8876ed311b2SBenjamin Herrenschmidt 
8887c0caeb8STejun Heo 	for (i = 0; i < type->cnt; i++) {
8897c0caeb8STejun Heo 		struct memblock_region *rgn = &type->regions[i];
8907c0caeb8STejun Heo 		char nid_buf[32] = "";
8916ed311b2SBenjamin Herrenschmidt 
8927c0caeb8STejun Heo 		base = rgn->base;
8937c0caeb8STejun Heo 		size = rgn->size;
8947c0caeb8STejun Heo #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP
8957c0caeb8STejun Heo 		if (memblock_get_region_node(rgn) != MAX_NUMNODES)
8967c0caeb8STejun Heo 			snprintf(nid_buf, sizeof(nid_buf), " on node %d",
8977c0caeb8STejun Heo 				 memblock_get_region_node(rgn));
8987c0caeb8STejun Heo #endif
8997c0caeb8STejun Heo 		pr_info(" %s[%#x]\t[%#016llx-%#016llx], %#llx bytes%s\n",
9007c0caeb8STejun Heo 			name, i, base, base + size - 1, size, nid_buf);
9016ed311b2SBenjamin Herrenschmidt 	}
9026ed311b2SBenjamin Herrenschmidt }
9036ed311b2SBenjamin Herrenschmidt 
90410d06439SYinghai Lu void __init_memblock memblock_dump_all(void)
9056ed311b2SBenjamin Herrenschmidt {
9066ed311b2SBenjamin Herrenschmidt 	if (!memblock_debug)
9076ed311b2SBenjamin Herrenschmidt 		return;
9086ed311b2SBenjamin Herrenschmidt 
9096ed311b2SBenjamin Herrenschmidt 	pr_info("MEMBLOCK configuration:\n");
9106ed311b2SBenjamin Herrenschmidt 	pr_info(" memory size = 0x%llx\n", (unsigned long long)memblock.memory_size);
9116ed311b2SBenjamin Herrenschmidt 
9126ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.memory, "memory");
9136ed311b2SBenjamin Herrenschmidt 	memblock_dump(&memblock.reserved, "reserved");
9146ed311b2SBenjamin Herrenschmidt }
9156ed311b2SBenjamin Herrenschmidt 
9166ed311b2SBenjamin Herrenschmidt void __init memblock_analyze(void)
9176ed311b2SBenjamin Herrenschmidt {
9186ed311b2SBenjamin Herrenschmidt 	int i;
9196ed311b2SBenjamin Herrenschmidt 
9206ed311b2SBenjamin Herrenschmidt 	/* Check marker in the unused last array entry */
9216ed311b2SBenjamin Herrenschmidt 	WARN_ON(memblock_memory_init_regions[INIT_MEMBLOCK_REGIONS].base
922c9d8c3d0SAndrew Morton 		!= MEMBLOCK_INACTIVE);
9236ed311b2SBenjamin Herrenschmidt 	WARN_ON(memblock_reserved_init_regions[INIT_MEMBLOCK_REGIONS].base
924c9d8c3d0SAndrew Morton 		!= MEMBLOCK_INACTIVE);
9256ed311b2SBenjamin Herrenschmidt 
9266ed311b2SBenjamin Herrenschmidt 	memblock.memory_size = 0;
9276ed311b2SBenjamin Herrenschmidt 
9286ed311b2SBenjamin Herrenschmidt 	for (i = 0; i < memblock.memory.cnt; i++)
9296ed311b2SBenjamin Herrenschmidt 		memblock.memory_size += memblock.memory.regions[i].size;
930142b45a7SBenjamin Herrenschmidt 
931142b45a7SBenjamin Herrenschmidt 	/* We allow resizing from there */
932142b45a7SBenjamin Herrenschmidt 	memblock_can_resize = 1;
9336ed311b2SBenjamin Herrenschmidt }
9346ed311b2SBenjamin Herrenschmidt 
9357590abe8SBenjamin Herrenschmidt void __init memblock_init(void)
9367590abe8SBenjamin Herrenschmidt {
937236260b9SJeremy Fitzhardinge 	static int init_done __initdata = 0;
938236260b9SJeremy Fitzhardinge 
939236260b9SJeremy Fitzhardinge 	if (init_done)
940236260b9SJeremy Fitzhardinge 		return;
941236260b9SJeremy Fitzhardinge 	init_done = 1;
942236260b9SJeremy Fitzhardinge 
9437590abe8SBenjamin Herrenschmidt 	/* Hookup the initial arrays */
9447590abe8SBenjamin Herrenschmidt 	memblock.memory.regions	= memblock_memory_init_regions;
9457590abe8SBenjamin Herrenschmidt 	memblock.memory.max		= INIT_MEMBLOCK_REGIONS;
9467590abe8SBenjamin Herrenschmidt 	memblock.reserved.regions	= memblock_reserved_init_regions;
9477590abe8SBenjamin Herrenschmidt 	memblock.reserved.max	= INIT_MEMBLOCK_REGIONS;
9487590abe8SBenjamin Herrenschmidt 
9497590abe8SBenjamin Herrenschmidt 	/* Write a marker in the unused last array entry */
950c9d8c3d0SAndrew Morton 	memblock.memory.regions[INIT_MEMBLOCK_REGIONS].base = MEMBLOCK_INACTIVE;
951c9d8c3d0SAndrew Morton 	memblock.reserved.regions[INIT_MEMBLOCK_REGIONS].base = MEMBLOCK_INACTIVE;
9527590abe8SBenjamin Herrenschmidt 
9537590abe8SBenjamin Herrenschmidt 	/* Create a dummy zero size MEMBLOCK which will get coalesced away later.
9547590abe8SBenjamin Herrenschmidt 	 * This simplifies the memblock_add() code below...
9557590abe8SBenjamin Herrenschmidt 	 */
9567590abe8SBenjamin Herrenschmidt 	memblock.memory.regions[0].base = 0;
9577590abe8SBenjamin Herrenschmidt 	memblock.memory.regions[0].size = 0;
9587c0caeb8STejun Heo 	memblock_set_region_node(&memblock.memory.regions[0], MAX_NUMNODES);
9597590abe8SBenjamin Herrenschmidt 	memblock.memory.cnt = 1;
9607590abe8SBenjamin Herrenschmidt 
9617590abe8SBenjamin Herrenschmidt 	/* Ditto. */
9627590abe8SBenjamin Herrenschmidt 	memblock.reserved.regions[0].base = 0;
9637590abe8SBenjamin Herrenschmidt 	memblock.reserved.regions[0].size = 0;
9647c0caeb8STejun Heo 	memblock_set_region_node(&memblock.reserved.regions[0], MAX_NUMNODES);
9657590abe8SBenjamin Herrenschmidt 	memblock.reserved.cnt = 1;
9667590abe8SBenjamin Herrenschmidt 
9677590abe8SBenjamin Herrenschmidt 	memblock.current_limit = MEMBLOCK_ALLOC_ANYWHERE;
9687590abe8SBenjamin Herrenschmidt }
9697590abe8SBenjamin Herrenschmidt 
9706ed311b2SBenjamin Herrenschmidt static int __init early_memblock(char *p)
9716ed311b2SBenjamin Herrenschmidt {
9726ed311b2SBenjamin Herrenschmidt 	if (p && strstr(p, "debug"))
9736ed311b2SBenjamin Herrenschmidt 		memblock_debug = 1;
9746ed311b2SBenjamin Herrenschmidt 	return 0;
9756ed311b2SBenjamin Herrenschmidt }
9766ed311b2SBenjamin Herrenschmidt early_param("memblock", early_memblock);
9776ed311b2SBenjamin Herrenschmidt 
978c378ddd5STejun Heo #if defined(CONFIG_DEBUG_FS) && !defined(CONFIG_ARCH_DISCARD_MEMBLOCK)
9796d03b885SBenjamin Herrenschmidt 
9806d03b885SBenjamin Herrenschmidt static int memblock_debug_show(struct seq_file *m, void *private)
9816d03b885SBenjamin Herrenschmidt {
9826d03b885SBenjamin Herrenschmidt 	struct memblock_type *type = m->private;
9836d03b885SBenjamin Herrenschmidt 	struct memblock_region *reg;
9846d03b885SBenjamin Herrenschmidt 	int i;
9856d03b885SBenjamin Herrenschmidt 
9866d03b885SBenjamin Herrenschmidt 	for (i = 0; i < type->cnt; i++) {
9876d03b885SBenjamin Herrenschmidt 		reg = &type->regions[i];
9886d03b885SBenjamin Herrenschmidt 		seq_printf(m, "%4d: ", i);
9896d03b885SBenjamin Herrenschmidt 		if (sizeof(phys_addr_t) == 4)
9906d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%08lx..0x%08lx\n",
9916d03b885SBenjamin Herrenschmidt 				   (unsigned long)reg->base,
9926d03b885SBenjamin Herrenschmidt 				   (unsigned long)(reg->base + reg->size - 1));
9936d03b885SBenjamin Herrenschmidt 		else
9946d03b885SBenjamin Herrenschmidt 			seq_printf(m, "0x%016llx..0x%016llx\n",
9956d03b885SBenjamin Herrenschmidt 				   (unsigned long long)reg->base,
9966d03b885SBenjamin Herrenschmidt 				   (unsigned long long)(reg->base + reg->size - 1));
9976d03b885SBenjamin Herrenschmidt 
9986d03b885SBenjamin Herrenschmidt 	}
9996d03b885SBenjamin Herrenschmidt 	return 0;
10006d03b885SBenjamin Herrenschmidt }
10016d03b885SBenjamin Herrenschmidt 
10026d03b885SBenjamin Herrenschmidt static int memblock_debug_open(struct inode *inode, struct file *file)
10036d03b885SBenjamin Herrenschmidt {
10046d03b885SBenjamin Herrenschmidt 	return single_open(file, memblock_debug_show, inode->i_private);
10056d03b885SBenjamin Herrenschmidt }
10066d03b885SBenjamin Herrenschmidt 
10076d03b885SBenjamin Herrenschmidt static const struct file_operations memblock_debug_fops = {
10086d03b885SBenjamin Herrenschmidt 	.open = memblock_debug_open,
10096d03b885SBenjamin Herrenschmidt 	.read = seq_read,
10106d03b885SBenjamin Herrenschmidt 	.llseek = seq_lseek,
10116d03b885SBenjamin Herrenschmidt 	.release = single_release,
10126d03b885SBenjamin Herrenschmidt };
10136d03b885SBenjamin Herrenschmidt 
10146d03b885SBenjamin Herrenschmidt static int __init memblock_init_debugfs(void)
10156d03b885SBenjamin Herrenschmidt {
10166d03b885SBenjamin Herrenschmidt 	struct dentry *root = debugfs_create_dir("memblock", NULL);
10176d03b885SBenjamin Herrenschmidt 	if (!root)
10186d03b885SBenjamin Herrenschmidt 		return -ENXIO;
10196d03b885SBenjamin Herrenschmidt 	debugfs_create_file("memory", S_IRUGO, root, &memblock.memory, &memblock_debug_fops);
10206d03b885SBenjamin Herrenschmidt 	debugfs_create_file("reserved", S_IRUGO, root, &memblock.reserved, &memblock_debug_fops);
10216d03b885SBenjamin Herrenschmidt 
10226d03b885SBenjamin Herrenschmidt 	return 0;
10236d03b885SBenjamin Herrenschmidt }
10246d03b885SBenjamin Herrenschmidt __initcall(memblock_init_debugfs);
10256d03b885SBenjamin Herrenschmidt 
10266d03b885SBenjamin Herrenschmidt #endif /* CONFIG_DEBUG_FS */
1027