xref: /linux/arch/x86/kernel/aperture_64.c (revision 24d9b70b8c679264756a6980e668b96b3f964826)
1250c2277SThomas Gleixner /*
2250c2277SThomas Gleixner  * Firmware replacement code.
3250c2277SThomas Gleixner  *
48caac563SPavel Machek  * Work around broken BIOSes that don't set an aperture, only set the
58caac563SPavel Machek  * aperture in the AGP bridge, or set too small aperture.
68caac563SPavel Machek  *
7250c2277SThomas Gleixner  * If all fails map the aperture over some low memory.  This is cheaper than
8250c2277SThomas Gleixner  * doing bounce buffering. The memory is lost. This is done at early boot
9250c2277SThomas Gleixner  * because only the bootmem allocator can allocate 32+MB.
10250c2277SThomas Gleixner  *
11250c2277SThomas Gleixner  * Copyright 2002 Andi Kleen, SuSE Labs.
12250c2277SThomas Gleixner  */
13250c2277SThomas Gleixner #include <linux/kernel.h>
14250c2277SThomas Gleixner #include <linux/types.h>
15250c2277SThomas Gleixner #include <linux/init.h>
16250c2277SThomas Gleixner #include <linux/bootmem.h>
17250c2277SThomas Gleixner #include <linux/mmzone.h>
18250c2277SThomas Gleixner #include <linux/pci_ids.h>
19250c2277SThomas Gleixner #include <linux/pci.h>
20250c2277SThomas Gleixner #include <linux/bitops.h>
21250c2277SThomas Gleixner #include <linux/ioport.h>
222050d45dSPavel Machek #include <linux/suspend.h>
23acde31dcSCatalin Marinas #include <linux/kmemleak.h>
24250c2277SThomas Gleixner #include <asm/e820.h>
25250c2277SThomas Gleixner #include <asm/io.h>
2646a7fa27SFUJITA Tomonori #include <asm/iommu.h>
27395624fcSJoerg Roedel #include <asm/gart.h>
28250c2277SThomas Gleixner #include <asm/pci-direct.h>
29250c2277SThomas Gleixner #include <asm/dma.h>
3023ac4ae8SAndreas Herrmann #include <asm/amd_nb.h>
31de957628SFUJITA Tomonori #include <asm/x86_init.h>
32250c2277SThomas Gleixner 
330440d4c0SJoerg Roedel int gart_iommu_aperture;
347de6a4cdSPavel Machek int gart_iommu_aperture_disabled __initdata;
357de6a4cdSPavel Machek int gart_iommu_aperture_allowed __initdata;
36250c2277SThomas Gleixner 
37250c2277SThomas Gleixner int fallback_aper_order __initdata = 1; /* 64MB */
387de6a4cdSPavel Machek int fallback_aper_force __initdata;
39250c2277SThomas Gleixner 
40250c2277SThomas Gleixner int fix_aperture __initdata = 1;
41250c2277SThomas Gleixner 
42250c2277SThomas Gleixner static struct resource gart_resource = {
43250c2277SThomas Gleixner 	.name	= "GART",
44250c2277SThomas Gleixner 	.flags	= IORESOURCE_MEM,
45250c2277SThomas Gleixner };
46250c2277SThomas Gleixner 
47250c2277SThomas Gleixner static void __init insert_aperture_resource(u32 aper_base, u32 aper_size)
48250c2277SThomas Gleixner {
49250c2277SThomas Gleixner 	gart_resource.start = aper_base;
50250c2277SThomas Gleixner 	gart_resource.end = aper_base + aper_size - 1;
51250c2277SThomas Gleixner 	insert_resource(&iomem_resource, &gart_resource);
52250c2277SThomas Gleixner }
53250c2277SThomas Gleixner 
54250c2277SThomas Gleixner /* This code runs before the PCI subsystem is initialized, so just
55250c2277SThomas Gleixner    access the northbridge directly. */
56250c2277SThomas Gleixner 
57250c2277SThomas Gleixner static u32 __init allocate_aperture(void)
58250c2277SThomas Gleixner {
59250c2277SThomas Gleixner 	u32 aper_size;
60250c2277SThomas Gleixner 	void *p;
61250c2277SThomas Gleixner 
627677b2efSYinghai Lu 	/* aper_size should <= 1G */
637677b2efSYinghai Lu 	if (fallback_aper_order > 5)
647677b2efSYinghai Lu 		fallback_aper_order = 5;
65250c2277SThomas Gleixner 	aper_size = (32 * 1024 * 1024) << fallback_aper_order;
66250c2277SThomas Gleixner 
67250c2277SThomas Gleixner 	/*
68c140df97SIngo Molnar 	 * Aperture has to be naturally aligned. This means a 2GB aperture
69c140df97SIngo Molnar 	 * won't have much chance of finding a place in the lower 4GB of
70c140df97SIngo Molnar 	 * memory. Unfortunately we cannot move it up because that would
71c140df97SIngo Molnar 	 * make the IOMMU useless.
72250c2277SThomas Gleixner 	 */
737677b2efSYinghai Lu 	/*
747677b2efSYinghai Lu 	 * using 512M as goal, in case kexec will load kernel_big
757677b2efSYinghai Lu 	 * that will do the on position decompress, and  could overlap with
767677b2efSYinghai Lu 	 * that positon with gart that is used.
777677b2efSYinghai Lu 	 * sequende:
787677b2efSYinghai Lu 	 * kernel_small
797677b2efSYinghai Lu 	 * ==> kexec (with kdump trigger path or previous doesn't shutdown gart)
807677b2efSYinghai Lu 	 * ==> kernel_small(gart area become e820_reserved)
817677b2efSYinghai Lu 	 * ==> kexec (with kdump trigger path or previous doesn't shutdown gart)
827677b2efSYinghai Lu 	 * ==> kerne_big (uncompressed size will be big than 64M or 128M)
837677b2efSYinghai Lu 	 * so don't use 512M below as gart iommu, leave the space for kernel
847677b2efSYinghai Lu 	 * code for safe
857677b2efSYinghai Lu 	 */
867677b2efSYinghai Lu 	p = __alloc_bootmem_nopanic(aper_size, aper_size, 512ULL<<20);
87acde31dcSCatalin Marinas 	/*
88acde31dcSCatalin Marinas 	 * Kmemleak should not scan this block as it may not be mapped via the
89acde31dcSCatalin Marinas 	 * kernel direct mapping.
90acde31dcSCatalin Marinas 	 */
91acde31dcSCatalin Marinas 	kmemleak_ignore(p);
92250c2277SThomas Gleixner 	if (!p || __pa(p)+aper_size > 0xffffffff) {
9331183ba8SIngo Molnar 		printk(KERN_ERR
9431183ba8SIngo Molnar 			"Cannot allocate aperture memory hole (%p,%uK)\n",
95250c2277SThomas Gleixner 				p, aper_size>>10);
96250c2277SThomas Gleixner 		if (p)
97250c2277SThomas Gleixner 			free_bootmem(__pa(p), aper_size);
98250c2277SThomas Gleixner 		return 0;
99250c2277SThomas Gleixner 	}
10031183ba8SIngo Molnar 	printk(KERN_INFO "Mapping aperture over %d KB of RAM @ %lx\n",
101250c2277SThomas Gleixner 			aper_size >> 10, __pa(p));
102250c2277SThomas Gleixner 	insert_aperture_resource((u32)__pa(p), aper_size);
1032050d45dSPavel Machek 	register_nosave_region((u32)__pa(p) >> PAGE_SHIFT,
1042050d45dSPavel Machek 				(u32)__pa(p+aper_size) >> PAGE_SHIFT);
105c140df97SIngo Molnar 
106250c2277SThomas Gleixner 	return (u32)__pa(p);
107250c2277SThomas Gleixner }
108250c2277SThomas Gleixner 
109250c2277SThomas Gleixner 
110250c2277SThomas Gleixner /* Find a PCI capability */
111dd564d0cSPavel Machek static u32 __init find_cap(int bus, int slot, int func, int cap)
112250c2277SThomas Gleixner {
113250c2277SThomas Gleixner 	int bytes;
114c140df97SIngo Molnar 	u8 pos;
115c140df97SIngo Molnar 
11655c0d721SYinghai Lu 	if (!(read_pci_config_16(bus, slot, func, PCI_STATUS) &
117c140df97SIngo Molnar 						PCI_STATUS_CAP_LIST))
118250c2277SThomas Gleixner 		return 0;
119c140df97SIngo Molnar 
12055c0d721SYinghai Lu 	pos = read_pci_config_byte(bus, slot, func, PCI_CAPABILITY_LIST);
121250c2277SThomas Gleixner 	for (bytes = 0; bytes < 48 && pos >= 0x40; bytes++) {
122250c2277SThomas Gleixner 		u8 id;
123c140df97SIngo Molnar 
124250c2277SThomas Gleixner 		pos &= ~3;
12555c0d721SYinghai Lu 		id = read_pci_config_byte(bus, slot, func, pos+PCI_CAP_LIST_ID);
126250c2277SThomas Gleixner 		if (id == 0xff)
127250c2277SThomas Gleixner 			break;
128250c2277SThomas Gleixner 		if (id == cap)
129250c2277SThomas Gleixner 			return pos;
13055c0d721SYinghai Lu 		pos = read_pci_config_byte(bus, slot, func,
131c140df97SIngo Molnar 						pos+PCI_CAP_LIST_NEXT);
132250c2277SThomas Gleixner 	}
133250c2277SThomas Gleixner 	return 0;
134250c2277SThomas Gleixner }
135250c2277SThomas Gleixner 
136250c2277SThomas Gleixner /* Read a standard AGPv3 bridge header */
137dd564d0cSPavel Machek static u32 __init read_agp(int bus, int slot, int func, int cap, u32 *order)
138250c2277SThomas Gleixner {
139250c2277SThomas Gleixner 	u32 apsize;
140250c2277SThomas Gleixner 	u32 apsizereg;
141250c2277SThomas Gleixner 	int nbits;
142250c2277SThomas Gleixner 	u32 aper_low, aper_hi;
143250c2277SThomas Gleixner 	u64 aper;
1441edc1ab3SYinghai Lu 	u32 old_order;
145250c2277SThomas Gleixner 
14655c0d721SYinghai Lu 	printk(KERN_INFO "AGP bridge at %02x:%02x:%02x\n", bus, slot, func);
14755c0d721SYinghai Lu 	apsizereg = read_pci_config_16(bus, slot, func, cap + 0x14);
148250c2277SThomas Gleixner 	if (apsizereg == 0xffffffff) {
14931183ba8SIngo Molnar 		printk(KERN_ERR "APSIZE in AGP bridge unreadable\n");
150250c2277SThomas Gleixner 		return 0;
151250c2277SThomas Gleixner 	}
152250c2277SThomas Gleixner 
1531edc1ab3SYinghai Lu 	/* old_order could be the value from NB gart setting */
1541edc1ab3SYinghai Lu 	old_order = *order;
1551edc1ab3SYinghai Lu 
156250c2277SThomas Gleixner 	apsize = apsizereg & 0xfff;
157250c2277SThomas Gleixner 	/* Some BIOS use weird encodings not in the AGPv3 table. */
158250c2277SThomas Gleixner 	if (apsize & 0xff)
159250c2277SThomas Gleixner 		apsize |= 0xf00;
160250c2277SThomas Gleixner 	nbits = hweight16(apsize);
161250c2277SThomas Gleixner 	*order = 7 - nbits;
162250c2277SThomas Gleixner 	if ((int)*order < 0) /* < 32MB */
163250c2277SThomas Gleixner 		*order = 0;
164250c2277SThomas Gleixner 
16555c0d721SYinghai Lu 	aper_low = read_pci_config(bus, slot, func, 0x10);
16655c0d721SYinghai Lu 	aper_hi = read_pci_config(bus, slot, func, 0x14);
167250c2277SThomas Gleixner 	aper = (aper_low & ~((1<<22)-1)) | ((u64)aper_hi << 32);
168250c2277SThomas Gleixner 
1691edc1ab3SYinghai Lu 	/*
1701edc1ab3SYinghai Lu 	 * On some sick chips, APSIZE is 0. It means it wants 4G
1711edc1ab3SYinghai Lu 	 * so let double check that order, and lets trust AMD NB settings:
1721edc1ab3SYinghai Lu 	 */
1738c9fd91aSYinghai Lu 	printk(KERN_INFO "Aperture from AGP @ %Lx old size %u MB\n",
1748c9fd91aSYinghai Lu 			aper, 32 << old_order);
1758c9fd91aSYinghai Lu 	if (aper + (32ULL<<(20 + *order)) > 0x100000000ULL) {
1761edc1ab3SYinghai Lu 		printk(KERN_INFO "Aperture size %u MB (APSIZE %x) is not right, using settings from NB\n",
1771edc1ab3SYinghai Lu 				32 << *order, apsizereg);
1781edc1ab3SYinghai Lu 		*order = old_order;
1791edc1ab3SYinghai Lu 	}
1801edc1ab3SYinghai Lu 
18131183ba8SIngo Molnar 	printk(KERN_INFO "Aperture from AGP @ %Lx size %u MB (APSIZE %x)\n",
182250c2277SThomas Gleixner 			aper, 32 << *order, apsizereg);
183250c2277SThomas Gleixner 
1848c9fd91aSYinghai Lu 	if (!aperture_valid(aper, (32*1024*1024) << *order, 32<<20))
185250c2277SThomas Gleixner 		return 0;
186250c2277SThomas Gleixner 	return (u32)aper;
187250c2277SThomas Gleixner }
188250c2277SThomas Gleixner 
189c140df97SIngo Molnar /*
190c140df97SIngo Molnar  * Look for an AGP bridge. Windows only expects the aperture in the
191c140df97SIngo Molnar  * AGP bridge and some BIOS forget to initialize the Northbridge too.
192c140df97SIngo Molnar  * Work around this here.
193c140df97SIngo Molnar  *
194c140df97SIngo Molnar  * Do an PCI bus scan by hand because we're running before the PCI
195c140df97SIngo Molnar  * subsystem.
196c140df97SIngo Molnar  *
197eec1d4faSHans Rosenfeld  * All AMD AGP bridges are AGPv3 compliant, so we can do this scan
198c140df97SIngo Molnar  * generically. It's probably overkill to always scan all slots because
199c140df97SIngo Molnar  * the AGP bridges should be always an own bus on the HT hierarchy,
200c140df97SIngo Molnar  * but do it here for future safety.
201c140df97SIngo Molnar  */
202dd564d0cSPavel Machek static u32 __init search_agp_bridge(u32 *order, int *valid_agp)
203250c2277SThomas Gleixner {
20455c0d721SYinghai Lu 	int bus, slot, func;
205250c2277SThomas Gleixner 
206250c2277SThomas Gleixner 	/* Poor man's PCI discovery */
20755c0d721SYinghai Lu 	for (bus = 0; bus < 256; bus++) {
208250c2277SThomas Gleixner 		for (slot = 0; slot < 32; slot++) {
209250c2277SThomas Gleixner 			for (func = 0; func < 8; func++) {
210250c2277SThomas Gleixner 				u32 class, cap;
211250c2277SThomas Gleixner 				u8 type;
21255c0d721SYinghai Lu 				class = read_pci_config(bus, slot, func,
213250c2277SThomas Gleixner 							PCI_CLASS_REVISION);
214250c2277SThomas Gleixner 				if (class == 0xffffffff)
215250c2277SThomas Gleixner 					break;
216250c2277SThomas Gleixner 
217250c2277SThomas Gleixner 				switch (class >> 16) {
218250c2277SThomas Gleixner 				case PCI_CLASS_BRIDGE_HOST:
219250c2277SThomas Gleixner 				case PCI_CLASS_BRIDGE_OTHER: /* needed? */
220250c2277SThomas Gleixner 					/* AGP bridge? */
22155c0d721SYinghai Lu 					cap = find_cap(bus, slot, func,
222c140df97SIngo Molnar 							PCI_CAP_ID_AGP);
223250c2277SThomas Gleixner 					if (!cap)
224250c2277SThomas Gleixner 						break;
225250c2277SThomas Gleixner 					*valid_agp = 1;
22655c0d721SYinghai Lu 					return read_agp(bus, slot, func, cap,
227c140df97SIngo Molnar 							order);
228250c2277SThomas Gleixner 				}
229250c2277SThomas Gleixner 
230250c2277SThomas Gleixner 				/* No multi-function device? */
23155c0d721SYinghai Lu 				type = read_pci_config_byte(bus, slot, func,
232250c2277SThomas Gleixner 							       PCI_HEADER_TYPE);
233250c2277SThomas Gleixner 				if (!(type & 0x80))
234250c2277SThomas Gleixner 					break;
235250c2277SThomas Gleixner 			}
236250c2277SThomas Gleixner 		}
237250c2277SThomas Gleixner 	}
23831183ba8SIngo Molnar 	printk(KERN_INFO "No AGP bridge found\n");
239c140df97SIngo Molnar 
240250c2277SThomas Gleixner 	return 0;
241250c2277SThomas Gleixner }
242250c2277SThomas Gleixner 
243aaf23042SYinghai Lu static int gart_fix_e820 __initdata = 1;
244aaf23042SYinghai Lu 
245aaf23042SYinghai Lu static int __init parse_gart_mem(char *p)
246aaf23042SYinghai Lu {
247aaf23042SYinghai Lu 	if (!p)
248aaf23042SYinghai Lu 		return -EINVAL;
249aaf23042SYinghai Lu 
250aaf23042SYinghai Lu 	if (!strncmp(p, "off", 3))
251aaf23042SYinghai Lu 		gart_fix_e820 = 0;
252aaf23042SYinghai Lu 	else if (!strncmp(p, "on", 2))
253aaf23042SYinghai Lu 		gart_fix_e820 = 1;
254aaf23042SYinghai Lu 
255aaf23042SYinghai Lu 	return 0;
256aaf23042SYinghai Lu }
257aaf23042SYinghai Lu early_param("gart_fix_e820", parse_gart_mem);
258aaf23042SYinghai Lu 
259aaf23042SYinghai Lu void __init early_gart_iommu_check(void)
260aaf23042SYinghai Lu {
261aaf23042SYinghai Lu 	/*
262aaf23042SYinghai Lu 	 * in case it is enabled before, esp for kexec/kdump,
263aaf23042SYinghai Lu 	 * previous kernel already enable that. memset called
264aaf23042SYinghai Lu 	 * by allocate_aperture/__alloc_bootmem_nopanic cause restart.
265aaf23042SYinghai Lu 	 * or second kernel have different position for GART hole. and new
266aaf23042SYinghai Lu 	 * kernel could use hole as RAM that is still used by GART set by
267aaf23042SYinghai Lu 	 * first kernel
268aaf23042SYinghai Lu 	 * or BIOS forget to put that in reserved.
269aaf23042SYinghai Lu 	 * try to update e820 to make that region as reserved.
270aaf23042SYinghai Lu 	 */
271fa10ba64SAndi Kleen 	u32 agp_aper_order = 0;
272f3eee542SYinghai Lu 	int i, fix, slot, valid_agp = 0;
273aaf23042SYinghai Lu 	u32 ctl;
274aaf23042SYinghai Lu 	u32 aper_size = 0, aper_order = 0, last_aper_order = 0;
275aaf23042SYinghai Lu 	u64 aper_base = 0, last_aper_base = 0;
276fa5b8a30SPavel Machek 	int aper_enabled = 0, last_aper_enabled = 0, last_valid = 0;
277aaf23042SYinghai Lu 
278aaf23042SYinghai Lu 	if (!early_pci_allowed())
279aaf23042SYinghai Lu 		return;
280aaf23042SYinghai Lu 
281fa5b8a30SPavel Machek 	/* This is mostly duplicate of iommu_hole_init */
282fa10ba64SAndi Kleen 	search_agp_bridge(&agp_aper_order, &valid_agp);
283f3eee542SYinghai Lu 
284aaf23042SYinghai Lu 	fix = 0;
285*24d9b70bSJan Beulich 	for (i = 0; amd_nb_bus_dev_ranges[i].dev_limit; i++) {
28655c0d721SYinghai Lu 		int bus;
28755c0d721SYinghai Lu 		int dev_base, dev_limit;
28855c0d721SYinghai Lu 
289*24d9b70bSJan Beulich 		bus = amd_nb_bus_dev_ranges[i].bus;
290*24d9b70bSJan Beulich 		dev_base = amd_nb_bus_dev_ranges[i].dev_base;
291*24d9b70bSJan Beulich 		dev_limit = amd_nb_bus_dev_ranges[i].dev_limit;
29255c0d721SYinghai Lu 
29355c0d721SYinghai Lu 		for (slot = dev_base; slot < dev_limit; slot++) {
294eec1d4faSHans Rosenfeld 			if (!early_is_amd_nb(read_pci_config(bus, slot, 3, 0x00)))
295aaf23042SYinghai Lu 				continue;
296aaf23042SYinghai Lu 
29755c0d721SYinghai Lu 			ctl = read_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL);
29857ab43e3SBorislav Petkov 			aper_enabled = ctl & GARTEN;
299aaf23042SYinghai Lu 			aper_order = (ctl >> 1) & 7;
300aaf23042SYinghai Lu 			aper_size = (32 * 1024 * 1024) << aper_order;
30155c0d721SYinghai Lu 			aper_base = read_pci_config(bus, slot, 3, AMD64_GARTAPERTUREBASE) & 0x7fff;
302aaf23042SYinghai Lu 			aper_base <<= 25;
303aaf23042SYinghai Lu 
304fa5b8a30SPavel Machek 			if (last_valid) {
305fa5b8a30SPavel Machek 				if ((aper_order != last_aper_order) ||
306fa5b8a30SPavel Machek 				    (aper_base != last_aper_base) ||
307fa5b8a30SPavel Machek 				    (aper_enabled != last_aper_enabled)) {
308aaf23042SYinghai Lu 					fix = 1;
309fa5b8a30SPavel Machek 					break;
310aaf23042SYinghai Lu 				}
31155c0d721SYinghai Lu 			}
312aaf23042SYinghai Lu 
313fa5b8a30SPavel Machek 			last_aper_order = aper_order;
314fa5b8a30SPavel Machek 			last_aper_base = aper_base;
315fa5b8a30SPavel Machek 			last_aper_enabled = aper_enabled;
316fa5b8a30SPavel Machek 			last_valid = 1;
317fa5b8a30SPavel Machek 		}
318fa5b8a30SPavel Machek 	}
319fa5b8a30SPavel Machek 
320aaf23042SYinghai Lu 	if (!fix && !aper_enabled)
321aaf23042SYinghai Lu 		return;
322aaf23042SYinghai Lu 
323aaf23042SYinghai Lu 	if (!aper_base || !aper_size || aper_base + aper_size > 0x100000000UL)
324aaf23042SYinghai Lu 		fix = 1;
325aaf23042SYinghai Lu 
326aaf23042SYinghai Lu 	if (gart_fix_e820 && !fix && aper_enabled) {
3270754557dSYinghai Lu 		if (e820_any_mapped(aper_base, aper_base + aper_size,
3280754557dSYinghai Lu 				    E820_RAM)) {
3290abbc78aSPavel Machek 			/* reserve it, so we can reuse it in second kernel */
330aaf23042SYinghai Lu 			printk(KERN_INFO "update e820 for GART\n");
331d0be6bdeSYinghai Lu 			e820_add_region(aper_base, aper_size, E820_RESERVED);
332aaf23042SYinghai Lu 			update_e820();
333aaf23042SYinghai Lu 		}
334aaf23042SYinghai Lu 	}
335aaf23042SYinghai Lu 
336f3eee542SYinghai Lu 	if (valid_agp)
3374f384f8bSPavel Machek 		return;
3384f384f8bSPavel Machek 
339f3eee542SYinghai Lu 	/* disable them all at first */
340*24d9b70bSJan Beulich 	for (i = 0; i < amd_nb_bus_dev_ranges[i].dev_limit; i++) {
34155c0d721SYinghai Lu 		int bus;
34255c0d721SYinghai Lu 		int dev_base, dev_limit;
34355c0d721SYinghai Lu 
344*24d9b70bSJan Beulich 		bus = amd_nb_bus_dev_ranges[i].bus;
345*24d9b70bSJan Beulich 		dev_base = amd_nb_bus_dev_ranges[i].dev_base;
346*24d9b70bSJan Beulich 		dev_limit = amd_nb_bus_dev_ranges[i].dev_limit;
34755c0d721SYinghai Lu 
34855c0d721SYinghai Lu 		for (slot = dev_base; slot < dev_limit; slot++) {
349eec1d4faSHans Rosenfeld 			if (!early_is_amd_nb(read_pci_config(bus, slot, 3, 0x00)))
350aaf23042SYinghai Lu 				continue;
351aaf23042SYinghai Lu 
35255c0d721SYinghai Lu 			ctl = read_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL);
35357ab43e3SBorislav Petkov 			ctl &= ~GARTEN;
35455c0d721SYinghai Lu 			write_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL, ctl);
35555c0d721SYinghai Lu 		}
356aaf23042SYinghai Lu 	}
357aaf23042SYinghai Lu 
358aaf23042SYinghai Lu }
359aaf23042SYinghai Lu 
3608c9fd91aSYinghai Lu static int __initdata printed_gart_size_msg;
3618c9fd91aSYinghai Lu 
362480125baSKonrad Rzeszutek Wilk int __init gart_iommu_hole_init(void)
363250c2277SThomas Gleixner {
3648c9fd91aSYinghai Lu 	u32 agp_aper_base = 0, agp_aper_order = 0;
365250c2277SThomas Gleixner 	u32 aper_size, aper_alloc = 0, aper_order = 0, last_aper_order = 0;
366250c2277SThomas Gleixner 	u64 aper_base, last_aper_base = 0;
36755c0d721SYinghai Lu 	int fix, slot, valid_agp = 0;
36855c0d721SYinghai Lu 	int i, node;
369250c2277SThomas Gleixner 
3700440d4c0SJoerg Roedel 	if (gart_iommu_aperture_disabled || !fix_aperture ||
3710440d4c0SJoerg Roedel 	    !early_pci_allowed())
372480125baSKonrad Rzeszutek Wilk 		return -ENODEV;
373250c2277SThomas Gleixner 
374250c2277SThomas Gleixner 	printk(KERN_INFO  "Checking aperture...\n");
375250c2277SThomas Gleixner 
3768c9fd91aSYinghai Lu 	if (!fallback_aper_force)
3778c9fd91aSYinghai Lu 		agp_aper_base = search_agp_bridge(&agp_aper_order, &valid_agp);
3788c9fd91aSYinghai Lu 
379250c2277SThomas Gleixner 	fix = 0;
38047db4c3eSYinghai Lu 	node = 0;
381*24d9b70bSJan Beulich 	for (i = 0; i < amd_nb_bus_dev_ranges[i].dev_limit; i++) {
38255c0d721SYinghai Lu 		int bus;
38355c0d721SYinghai Lu 		int dev_base, dev_limit;
3844b83873dSJoerg Roedel 		u32 ctl;
38555c0d721SYinghai Lu 
386*24d9b70bSJan Beulich 		bus = amd_nb_bus_dev_ranges[i].bus;
387*24d9b70bSJan Beulich 		dev_base = amd_nb_bus_dev_ranges[i].dev_base;
388*24d9b70bSJan Beulich 		dev_limit = amd_nb_bus_dev_ranges[i].dev_limit;
38955c0d721SYinghai Lu 
39055c0d721SYinghai Lu 		for (slot = dev_base; slot < dev_limit; slot++) {
391eec1d4faSHans Rosenfeld 			if (!early_is_amd_nb(read_pci_config(bus, slot, 3, 0x00)))
392250c2277SThomas Gleixner 				continue;
393250c2277SThomas Gleixner 
394250c2277SThomas Gleixner 			iommu_detected = 1;
3950440d4c0SJoerg Roedel 			gart_iommu_aperture = 1;
396de957628SFUJITA Tomonori 			x86_init.iommu.iommu_init = gart_iommu_init;
397250c2277SThomas Gleixner 
3984b83873dSJoerg Roedel 			ctl = read_pci_config(bus, slot, 3,
3994b83873dSJoerg Roedel 					      AMD64_GARTAPERTURECTL);
4004b83873dSJoerg Roedel 
4014b83873dSJoerg Roedel 			/*
4024b83873dSJoerg Roedel 			 * Before we do anything else disable the GART. It may
4034b83873dSJoerg Roedel 			 * still be enabled if we boot into a crash-kernel here.
4044b83873dSJoerg Roedel 			 * Reconfiguring the GART while it is enabled could have
4054b83873dSJoerg Roedel 			 * unknown side-effects.
4064b83873dSJoerg Roedel 			 */
4074b83873dSJoerg Roedel 			ctl &= ~GARTEN;
4084b83873dSJoerg Roedel 			write_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL, ctl);
4094b83873dSJoerg Roedel 
4104b83873dSJoerg Roedel 			aper_order = (ctl >> 1) & 7;
411250c2277SThomas Gleixner 			aper_size = (32 * 1024 * 1024) << aper_order;
41255c0d721SYinghai Lu 			aper_base = read_pci_config(bus, slot, 3, AMD64_GARTAPERTUREBASE) & 0x7fff;
413250c2277SThomas Gleixner 			aper_base <<= 25;
414250c2277SThomas Gleixner 
41547db4c3eSYinghai Lu 			printk(KERN_INFO "Node %d: aperture @ %Lx size %u MB\n",
41647db4c3eSYinghai Lu 					node, aper_base, aper_size >> 20);
41747db4c3eSYinghai Lu 			node++;
418250c2277SThomas Gleixner 
4198c9fd91aSYinghai Lu 			if (!aperture_valid(aper_base, aper_size, 64<<20)) {
4208c9fd91aSYinghai Lu 				if (valid_agp && agp_aper_base &&
4218c9fd91aSYinghai Lu 				    agp_aper_base == aper_base &&
4228c9fd91aSYinghai Lu 				    agp_aper_order == aper_order) {
4238c9fd91aSYinghai Lu 					/* the same between two setting from NB and agp */
424c987d12fSYinghai Lu 					if (!no_iommu &&
425c987d12fSYinghai Lu 					    max_pfn > MAX_DMA32_PFN &&
426c987d12fSYinghai Lu 					    !printed_gart_size_msg) {
4278c9fd91aSYinghai Lu 						printk(KERN_ERR "you are using iommu with agp, but GART size is less than 64M\n");
4288c9fd91aSYinghai Lu 						printk(KERN_ERR "please increase GART size in your BIOS setup\n");
4298c9fd91aSYinghai Lu 						printk(KERN_ERR "if BIOS doesn't have that option, contact your HW vendor!\n");
4308c9fd91aSYinghai Lu 						printed_gart_size_msg = 1;
4318c9fd91aSYinghai Lu 					}
4328c9fd91aSYinghai Lu 				} else {
433250c2277SThomas Gleixner 					fix = 1;
43455c0d721SYinghai Lu 					goto out;
435250c2277SThomas Gleixner 				}
4368c9fd91aSYinghai Lu 			}
437250c2277SThomas Gleixner 
438250c2277SThomas Gleixner 			if ((last_aper_order && aper_order != last_aper_order) ||
439250c2277SThomas Gleixner 			    (last_aper_base && aper_base != last_aper_base)) {
440250c2277SThomas Gleixner 				fix = 1;
44155c0d721SYinghai Lu 				goto out;
442250c2277SThomas Gleixner 			}
443250c2277SThomas Gleixner 			last_aper_order = aper_order;
444250c2277SThomas Gleixner 			last_aper_base = aper_base;
445250c2277SThomas Gleixner 		}
44655c0d721SYinghai Lu 	}
447250c2277SThomas Gleixner 
44855c0d721SYinghai Lu out:
449250c2277SThomas Gleixner 	if (!fix && !fallback_aper_force) {
450250c2277SThomas Gleixner 		if (last_aper_base) {
451250c2277SThomas Gleixner 			unsigned long n = (32 * 1024 * 1024) << last_aper_order;
452c140df97SIngo Molnar 
453250c2277SThomas Gleixner 			insert_aperture_resource((u32)last_aper_base, n);
454480125baSKonrad Rzeszutek Wilk 			return 1;
455250c2277SThomas Gleixner 		}
456480125baSKonrad Rzeszutek Wilk 		return 0;
457250c2277SThomas Gleixner 	}
458250c2277SThomas Gleixner 
4598c9fd91aSYinghai Lu 	if (!fallback_aper_force) {
4608c9fd91aSYinghai Lu 		aper_alloc = agp_aper_base;
4618c9fd91aSYinghai Lu 		aper_order = agp_aper_order;
4628c9fd91aSYinghai Lu 	}
463250c2277SThomas Gleixner 
464250c2277SThomas Gleixner 	if (aper_alloc) {
465250c2277SThomas Gleixner 		/* Got the aperture from the AGP bridge */
466c987d12fSYinghai Lu 	} else if ((!no_iommu && max_pfn > MAX_DMA32_PFN) ||
467250c2277SThomas Gleixner 		   force_iommu ||
468250c2277SThomas Gleixner 		   valid_agp ||
469250c2277SThomas Gleixner 		   fallback_aper_force) {
4709b156845SAdam Jackson 		printk(KERN_INFO
47131183ba8SIngo Molnar 			"Your BIOS doesn't leave a aperture memory hole\n");
4729b156845SAdam Jackson 		printk(KERN_INFO
47331183ba8SIngo Molnar 			"Please enable the IOMMU option in the BIOS setup\n");
4749b156845SAdam Jackson 		printk(KERN_INFO
47531183ba8SIngo Molnar 			"This costs you %d MB of RAM\n",
476250c2277SThomas Gleixner 				32 << fallback_aper_order);
477250c2277SThomas Gleixner 
478250c2277SThomas Gleixner 		aper_order = fallback_aper_order;
479250c2277SThomas Gleixner 		aper_alloc = allocate_aperture();
480250c2277SThomas Gleixner 		if (!aper_alloc) {
481c140df97SIngo Molnar 			/*
482c140df97SIngo Molnar 			 * Could disable AGP and IOMMU here, but it's
483c140df97SIngo Molnar 			 * probably not worth it. But the later users
484c140df97SIngo Molnar 			 * cannot deal with bad apertures and turning
485c140df97SIngo Molnar 			 * on the aperture over memory causes very
486c140df97SIngo Molnar 			 * strange problems, so it's better to panic
487c140df97SIngo Molnar 			 * early.
488c140df97SIngo Molnar 			 */
489250c2277SThomas Gleixner 			panic("Not enough memory for aperture");
490250c2277SThomas Gleixner 		}
491250c2277SThomas Gleixner 	} else {
492480125baSKonrad Rzeszutek Wilk 		return 0;
493250c2277SThomas Gleixner 	}
494250c2277SThomas Gleixner 
495250c2277SThomas Gleixner 	/* Fix up the north bridges */
496*24d9b70bSJan Beulich 	for (i = 0; i < amd_nb_bus_dev_ranges[i].dev_limit; i++) {
497260133abSBorislav Petkov 		int bus, dev_base, dev_limit;
498260133abSBorislav Petkov 
499260133abSBorislav Petkov 		/*
500260133abSBorislav Petkov 		 * Don't enable translation yet but enable GART IO and CPU
501260133abSBorislav Petkov 		 * accesses and set DISTLBWALKPRB since GART table memory is UC.
502260133abSBorislav Petkov 		 */
503260133abSBorislav Petkov 		u32 ctl = DISTLBWALKPRB | aper_order << 1;
50455c0d721SYinghai Lu 
505*24d9b70bSJan Beulich 		bus = amd_nb_bus_dev_ranges[i].bus;
506*24d9b70bSJan Beulich 		dev_base = amd_nb_bus_dev_ranges[i].dev_base;
507*24d9b70bSJan Beulich 		dev_limit = amd_nb_bus_dev_ranges[i].dev_limit;
50855c0d721SYinghai Lu 		for (slot = dev_base; slot < dev_limit; slot++) {
509eec1d4faSHans Rosenfeld 			if (!early_is_amd_nb(read_pci_config(bus, slot, 3, 0x00)))
510250c2277SThomas Gleixner 				continue;
511250c2277SThomas Gleixner 
512260133abSBorislav Petkov 			write_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL, ctl);
51355c0d721SYinghai Lu 			write_pci_config(bus, slot, 3, AMD64_GARTAPERTUREBASE, aper_alloc >> 25);
51455c0d721SYinghai Lu 		}
515250c2277SThomas Gleixner 	}
5166703f6d1SRafael J. Wysocki 
5176703f6d1SRafael J. Wysocki 	set_up_gart_resume(aper_order, aper_alloc);
518480125baSKonrad Rzeszutek Wilk 
519480125baSKonrad Rzeszutek Wilk 	return 1;
520250c2277SThomas Gleixner }
521