xref: /linux/arch/x86/kernel/aperture_64.c (revision c387aa3a1a910ce00b86f3a85082d24f144db256)
1250c2277SThomas Gleixner /*
2250c2277SThomas Gleixner  * Firmware replacement code.
3250c2277SThomas Gleixner  *
48caac563SPavel Machek  * Work around broken BIOSes that don't set an aperture, only set the
58caac563SPavel Machek  * aperture in the AGP bridge, or set too small aperture.
68caac563SPavel Machek  *
7250c2277SThomas Gleixner  * If all fails map the aperture over some low memory.  This is cheaper than
8250c2277SThomas Gleixner  * doing bounce buffering. The memory is lost. This is done at early boot
9250c2277SThomas Gleixner  * because only the bootmem allocator can allocate 32+MB.
10250c2277SThomas Gleixner  *
11250c2277SThomas Gleixner  * Copyright 2002 Andi Kleen, SuSE Labs.
12250c2277SThomas Gleixner  */
13250c2277SThomas Gleixner #include <linux/kernel.h>
14250c2277SThomas Gleixner #include <linux/types.h>
15250c2277SThomas Gleixner #include <linux/init.h>
1632e3f2b0SYinghai Lu #include <linux/memblock.h>
17250c2277SThomas Gleixner #include <linux/mmzone.h>
18250c2277SThomas Gleixner #include <linux/pci_ids.h>
19250c2277SThomas Gleixner #include <linux/pci.h>
20250c2277SThomas Gleixner #include <linux/bitops.h>
21250c2277SThomas Gleixner #include <linux/ioport.h>
222050d45dSPavel Machek #include <linux/suspend.h>
23acde31dcSCatalin Marinas #include <linux/kmemleak.h>
24250c2277SThomas Gleixner #include <asm/e820.h>
25250c2277SThomas Gleixner #include <asm/io.h>
2646a7fa27SFUJITA Tomonori #include <asm/iommu.h>
27395624fcSJoerg Roedel #include <asm/gart.h>
28250c2277SThomas Gleixner #include <asm/pci-direct.h>
29250c2277SThomas Gleixner #include <asm/dma.h>
3023ac4ae8SAndreas Herrmann #include <asm/amd_nb.h>
31de957628SFUJITA Tomonori #include <asm/x86_init.h>
32250c2277SThomas Gleixner 
33*c387aa3aSJoerg Roedel /*
34*c387aa3aSJoerg Roedel  * Using 512M as goal, in case kexec will load kernel_big
35*c387aa3aSJoerg Roedel  * that will do the on-position decompress, and could overlap with
36*c387aa3aSJoerg Roedel  * with the gart aperture that is used.
37*c387aa3aSJoerg Roedel  * Sequence:
38*c387aa3aSJoerg Roedel  * kernel_small
39*c387aa3aSJoerg Roedel  * ==> kexec (with kdump trigger path or gart still enabled)
40*c387aa3aSJoerg Roedel  * ==> kernel_small (gart area become e820_reserved)
41*c387aa3aSJoerg Roedel  * ==> kexec (with kdump trigger path or gart still enabled)
42*c387aa3aSJoerg Roedel  * ==> kerne_big (uncompressed size will be big than 64M or 128M)
43*c387aa3aSJoerg Roedel  * So don't use 512M below as gart iommu, leave the space for kernel
44*c387aa3aSJoerg Roedel  * code for safe.
45*c387aa3aSJoerg Roedel  */
46*c387aa3aSJoerg Roedel #define GART_MIN_ADDR	(512ULL << 20)
47*c387aa3aSJoerg Roedel #define GART_MAX_ADDR	(1ULL   << 32)
48*c387aa3aSJoerg Roedel 
490440d4c0SJoerg Roedel int gart_iommu_aperture;
507de6a4cdSPavel Machek int gart_iommu_aperture_disabled __initdata;
517de6a4cdSPavel Machek int gart_iommu_aperture_allowed __initdata;
52250c2277SThomas Gleixner 
53250c2277SThomas Gleixner int fallback_aper_order __initdata = 1; /* 64MB */
547de6a4cdSPavel Machek int fallback_aper_force __initdata;
55250c2277SThomas Gleixner 
56250c2277SThomas Gleixner int fix_aperture __initdata = 1;
57250c2277SThomas Gleixner 
58250c2277SThomas Gleixner static struct resource gart_resource = {
59250c2277SThomas Gleixner 	.name	= "GART",
60250c2277SThomas Gleixner 	.flags	= IORESOURCE_MEM,
61250c2277SThomas Gleixner };
62250c2277SThomas Gleixner 
63250c2277SThomas Gleixner static void __init insert_aperture_resource(u32 aper_base, u32 aper_size)
64250c2277SThomas Gleixner {
65250c2277SThomas Gleixner 	gart_resource.start = aper_base;
66250c2277SThomas Gleixner 	gart_resource.end = aper_base + aper_size - 1;
67250c2277SThomas Gleixner 	insert_resource(&iomem_resource, &gart_resource);
68250c2277SThomas Gleixner }
69250c2277SThomas Gleixner 
70250c2277SThomas Gleixner /* This code runs before the PCI subsystem is initialized, so just
71250c2277SThomas Gleixner    access the northbridge directly. */
72250c2277SThomas Gleixner 
73250c2277SThomas Gleixner static u32 __init allocate_aperture(void)
74250c2277SThomas Gleixner {
75250c2277SThomas Gleixner 	u32 aper_size;
7632e3f2b0SYinghai Lu 	unsigned long addr;
77250c2277SThomas Gleixner 
787677b2efSYinghai Lu 	/* aper_size should <= 1G */
797677b2efSYinghai Lu 	if (fallback_aper_order > 5)
807677b2efSYinghai Lu 		fallback_aper_order = 5;
81250c2277SThomas Gleixner 	aper_size = (32 * 1024 * 1024) << fallback_aper_order;
82250c2277SThomas Gleixner 
83250c2277SThomas Gleixner 	/*
84c140df97SIngo Molnar 	 * Aperture has to be naturally aligned. This means a 2GB aperture
85c140df97SIngo Molnar 	 * won't have much chance of finding a place in the lower 4GB of
86c140df97SIngo Molnar 	 * memory. Unfortunately we cannot move it up because that would
87c140df97SIngo Molnar 	 * make the IOMMU useless.
88250c2277SThomas Gleixner 	 */
89*c387aa3aSJoerg Roedel 	addr = memblock_find_in_range(GART_MIN_ADDR, GART_MAX_ADDR,
90*c387aa3aSJoerg Roedel 				      aper_size, aper_size);
91*c387aa3aSJoerg Roedel 	if (addr == MEMBLOCK_ERROR || addr + aper_size > GART_MAX_ADDR) {
9232e3f2b0SYinghai Lu 		printk(KERN_ERR
9332e3f2b0SYinghai Lu 			"Cannot allocate aperture memory hole (%lx,%uK)\n",
9432e3f2b0SYinghai Lu 				addr, aper_size>>10);
9532e3f2b0SYinghai Lu 		return 0;
9632e3f2b0SYinghai Lu 	}
9732e3f2b0SYinghai Lu 	memblock_x86_reserve_range(addr, addr + aper_size, "aperture64");
98acde31dcSCatalin Marinas 	/*
99acde31dcSCatalin Marinas 	 * Kmemleak should not scan this block as it may not be mapped via the
100acde31dcSCatalin Marinas 	 * kernel direct mapping.
101acde31dcSCatalin Marinas 	 */
10232e3f2b0SYinghai Lu 	kmemleak_ignore(phys_to_virt(addr));
10331183ba8SIngo Molnar 	printk(KERN_INFO "Mapping aperture over %d KB of RAM @ %lx\n",
10432e3f2b0SYinghai Lu 			aper_size >> 10, addr);
10532e3f2b0SYinghai Lu 	insert_aperture_resource((u32)addr, aper_size);
10632e3f2b0SYinghai Lu 	register_nosave_region(addr >> PAGE_SHIFT,
10732e3f2b0SYinghai Lu 			       (addr+aper_size) >> PAGE_SHIFT);
108c140df97SIngo Molnar 
10932e3f2b0SYinghai Lu 	return (u32)addr;
110250c2277SThomas Gleixner }
111250c2277SThomas Gleixner 
112250c2277SThomas Gleixner 
113250c2277SThomas Gleixner /* Find a PCI capability */
114dd564d0cSPavel Machek static u32 __init find_cap(int bus, int slot, int func, int cap)
115250c2277SThomas Gleixner {
116250c2277SThomas Gleixner 	int bytes;
117c140df97SIngo Molnar 	u8 pos;
118c140df97SIngo Molnar 
11955c0d721SYinghai Lu 	if (!(read_pci_config_16(bus, slot, func, PCI_STATUS) &
120c140df97SIngo Molnar 						PCI_STATUS_CAP_LIST))
121250c2277SThomas Gleixner 		return 0;
122c140df97SIngo Molnar 
12355c0d721SYinghai Lu 	pos = read_pci_config_byte(bus, slot, func, PCI_CAPABILITY_LIST);
124250c2277SThomas Gleixner 	for (bytes = 0; bytes < 48 && pos >= 0x40; bytes++) {
125250c2277SThomas Gleixner 		u8 id;
126c140df97SIngo Molnar 
127250c2277SThomas Gleixner 		pos &= ~3;
12855c0d721SYinghai Lu 		id = read_pci_config_byte(bus, slot, func, pos+PCI_CAP_LIST_ID);
129250c2277SThomas Gleixner 		if (id == 0xff)
130250c2277SThomas Gleixner 			break;
131250c2277SThomas Gleixner 		if (id == cap)
132250c2277SThomas Gleixner 			return pos;
13355c0d721SYinghai Lu 		pos = read_pci_config_byte(bus, slot, func,
134c140df97SIngo Molnar 						pos+PCI_CAP_LIST_NEXT);
135250c2277SThomas Gleixner 	}
136250c2277SThomas Gleixner 	return 0;
137250c2277SThomas Gleixner }
138250c2277SThomas Gleixner 
139250c2277SThomas Gleixner /* Read a standard AGPv3 bridge header */
140dd564d0cSPavel Machek static u32 __init read_agp(int bus, int slot, int func, int cap, u32 *order)
141250c2277SThomas Gleixner {
142250c2277SThomas Gleixner 	u32 apsize;
143250c2277SThomas Gleixner 	u32 apsizereg;
144250c2277SThomas Gleixner 	int nbits;
145250c2277SThomas Gleixner 	u32 aper_low, aper_hi;
146250c2277SThomas Gleixner 	u64 aper;
1471edc1ab3SYinghai Lu 	u32 old_order;
148250c2277SThomas Gleixner 
14955c0d721SYinghai Lu 	printk(KERN_INFO "AGP bridge at %02x:%02x:%02x\n", bus, slot, func);
15055c0d721SYinghai Lu 	apsizereg = read_pci_config_16(bus, slot, func, cap + 0x14);
151250c2277SThomas Gleixner 	if (apsizereg == 0xffffffff) {
15231183ba8SIngo Molnar 		printk(KERN_ERR "APSIZE in AGP bridge unreadable\n");
153250c2277SThomas Gleixner 		return 0;
154250c2277SThomas Gleixner 	}
155250c2277SThomas Gleixner 
1561edc1ab3SYinghai Lu 	/* old_order could be the value from NB gart setting */
1571edc1ab3SYinghai Lu 	old_order = *order;
1581edc1ab3SYinghai Lu 
159250c2277SThomas Gleixner 	apsize = apsizereg & 0xfff;
160250c2277SThomas Gleixner 	/* Some BIOS use weird encodings not in the AGPv3 table. */
161250c2277SThomas Gleixner 	if (apsize & 0xff)
162250c2277SThomas Gleixner 		apsize |= 0xf00;
163250c2277SThomas Gleixner 	nbits = hweight16(apsize);
164250c2277SThomas Gleixner 	*order = 7 - nbits;
165250c2277SThomas Gleixner 	if ((int)*order < 0) /* < 32MB */
166250c2277SThomas Gleixner 		*order = 0;
167250c2277SThomas Gleixner 
16855c0d721SYinghai Lu 	aper_low = read_pci_config(bus, slot, func, 0x10);
16955c0d721SYinghai Lu 	aper_hi = read_pci_config(bus, slot, func, 0x14);
170250c2277SThomas Gleixner 	aper = (aper_low & ~((1<<22)-1)) | ((u64)aper_hi << 32);
171250c2277SThomas Gleixner 
1721edc1ab3SYinghai Lu 	/*
1731edc1ab3SYinghai Lu 	 * On some sick chips, APSIZE is 0. It means it wants 4G
1741edc1ab3SYinghai Lu 	 * so let double check that order, and lets trust AMD NB settings:
1751edc1ab3SYinghai Lu 	 */
1768c9fd91aSYinghai Lu 	printk(KERN_INFO "Aperture from AGP @ %Lx old size %u MB\n",
1778c9fd91aSYinghai Lu 			aper, 32 << old_order);
1788c9fd91aSYinghai Lu 	if (aper + (32ULL<<(20 + *order)) > 0x100000000ULL) {
1791edc1ab3SYinghai Lu 		printk(KERN_INFO "Aperture size %u MB (APSIZE %x) is not right, using settings from NB\n",
1801edc1ab3SYinghai Lu 				32 << *order, apsizereg);
1811edc1ab3SYinghai Lu 		*order = old_order;
1821edc1ab3SYinghai Lu 	}
1831edc1ab3SYinghai Lu 
18431183ba8SIngo Molnar 	printk(KERN_INFO "Aperture from AGP @ %Lx size %u MB (APSIZE %x)\n",
185250c2277SThomas Gleixner 			aper, 32 << *order, apsizereg);
186250c2277SThomas Gleixner 
1878c9fd91aSYinghai Lu 	if (!aperture_valid(aper, (32*1024*1024) << *order, 32<<20))
188250c2277SThomas Gleixner 		return 0;
189250c2277SThomas Gleixner 	return (u32)aper;
190250c2277SThomas Gleixner }
191250c2277SThomas Gleixner 
192c140df97SIngo Molnar /*
193c140df97SIngo Molnar  * Look for an AGP bridge. Windows only expects the aperture in the
194c140df97SIngo Molnar  * AGP bridge and some BIOS forget to initialize the Northbridge too.
195c140df97SIngo Molnar  * Work around this here.
196c140df97SIngo Molnar  *
197c140df97SIngo Molnar  * Do an PCI bus scan by hand because we're running before the PCI
198c140df97SIngo Molnar  * subsystem.
199c140df97SIngo Molnar  *
200eec1d4faSHans Rosenfeld  * All AMD AGP bridges are AGPv3 compliant, so we can do this scan
201c140df97SIngo Molnar  * generically. It's probably overkill to always scan all slots because
202c140df97SIngo Molnar  * the AGP bridges should be always an own bus on the HT hierarchy,
203c140df97SIngo Molnar  * but do it here for future safety.
204c140df97SIngo Molnar  */
205dd564d0cSPavel Machek static u32 __init search_agp_bridge(u32 *order, int *valid_agp)
206250c2277SThomas Gleixner {
20755c0d721SYinghai Lu 	int bus, slot, func;
208250c2277SThomas Gleixner 
209250c2277SThomas Gleixner 	/* Poor man's PCI discovery */
21055c0d721SYinghai Lu 	for (bus = 0; bus < 256; bus++) {
211250c2277SThomas Gleixner 		for (slot = 0; slot < 32; slot++) {
212250c2277SThomas Gleixner 			for (func = 0; func < 8; func++) {
213250c2277SThomas Gleixner 				u32 class, cap;
214250c2277SThomas Gleixner 				u8 type;
21555c0d721SYinghai Lu 				class = read_pci_config(bus, slot, func,
216250c2277SThomas Gleixner 							PCI_CLASS_REVISION);
217250c2277SThomas Gleixner 				if (class == 0xffffffff)
218250c2277SThomas Gleixner 					break;
219250c2277SThomas Gleixner 
220250c2277SThomas Gleixner 				switch (class >> 16) {
221250c2277SThomas Gleixner 				case PCI_CLASS_BRIDGE_HOST:
222250c2277SThomas Gleixner 				case PCI_CLASS_BRIDGE_OTHER: /* needed? */
223250c2277SThomas Gleixner 					/* AGP bridge? */
22455c0d721SYinghai Lu 					cap = find_cap(bus, slot, func,
225c140df97SIngo Molnar 							PCI_CAP_ID_AGP);
226250c2277SThomas Gleixner 					if (!cap)
227250c2277SThomas Gleixner 						break;
228250c2277SThomas Gleixner 					*valid_agp = 1;
22955c0d721SYinghai Lu 					return read_agp(bus, slot, func, cap,
230c140df97SIngo Molnar 							order);
231250c2277SThomas Gleixner 				}
232250c2277SThomas Gleixner 
233250c2277SThomas Gleixner 				/* No multi-function device? */
23455c0d721SYinghai Lu 				type = read_pci_config_byte(bus, slot, func,
235250c2277SThomas Gleixner 							       PCI_HEADER_TYPE);
236250c2277SThomas Gleixner 				if (!(type & 0x80))
237250c2277SThomas Gleixner 					break;
238250c2277SThomas Gleixner 			}
239250c2277SThomas Gleixner 		}
240250c2277SThomas Gleixner 	}
24131183ba8SIngo Molnar 	printk(KERN_INFO "No AGP bridge found\n");
242c140df97SIngo Molnar 
243250c2277SThomas Gleixner 	return 0;
244250c2277SThomas Gleixner }
245250c2277SThomas Gleixner 
246aaf23042SYinghai Lu static int gart_fix_e820 __initdata = 1;
247aaf23042SYinghai Lu 
248aaf23042SYinghai Lu static int __init parse_gart_mem(char *p)
249aaf23042SYinghai Lu {
250aaf23042SYinghai Lu 	if (!p)
251aaf23042SYinghai Lu 		return -EINVAL;
252aaf23042SYinghai Lu 
253aaf23042SYinghai Lu 	if (!strncmp(p, "off", 3))
254aaf23042SYinghai Lu 		gart_fix_e820 = 0;
255aaf23042SYinghai Lu 	else if (!strncmp(p, "on", 2))
256aaf23042SYinghai Lu 		gart_fix_e820 = 1;
257aaf23042SYinghai Lu 
258aaf23042SYinghai Lu 	return 0;
259aaf23042SYinghai Lu }
260aaf23042SYinghai Lu early_param("gart_fix_e820", parse_gart_mem);
261aaf23042SYinghai Lu 
262aaf23042SYinghai Lu void __init early_gart_iommu_check(void)
263aaf23042SYinghai Lu {
264aaf23042SYinghai Lu 	/*
265aaf23042SYinghai Lu 	 * in case it is enabled before, esp for kexec/kdump,
266aaf23042SYinghai Lu 	 * previous kernel already enable that. memset called
267aaf23042SYinghai Lu 	 * by allocate_aperture/__alloc_bootmem_nopanic cause restart.
268aaf23042SYinghai Lu 	 * or second kernel have different position for GART hole. and new
269aaf23042SYinghai Lu 	 * kernel could use hole as RAM that is still used by GART set by
270aaf23042SYinghai Lu 	 * first kernel
271aaf23042SYinghai Lu 	 * or BIOS forget to put that in reserved.
272aaf23042SYinghai Lu 	 * try to update e820 to make that region as reserved.
273aaf23042SYinghai Lu 	 */
274fa10ba64SAndi Kleen 	u32 agp_aper_order = 0;
275f3eee542SYinghai Lu 	int i, fix, slot, valid_agp = 0;
276aaf23042SYinghai Lu 	u32 ctl;
277aaf23042SYinghai Lu 	u32 aper_size = 0, aper_order = 0, last_aper_order = 0;
278aaf23042SYinghai Lu 	u64 aper_base = 0, last_aper_base = 0;
279fa5b8a30SPavel Machek 	int aper_enabled = 0, last_aper_enabled = 0, last_valid = 0;
280aaf23042SYinghai Lu 
281aaf23042SYinghai Lu 	if (!early_pci_allowed())
282aaf23042SYinghai Lu 		return;
283aaf23042SYinghai Lu 
284fa5b8a30SPavel Machek 	/* This is mostly duplicate of iommu_hole_init */
285fa10ba64SAndi Kleen 	search_agp_bridge(&agp_aper_order, &valid_agp);
286f3eee542SYinghai Lu 
287aaf23042SYinghai Lu 	fix = 0;
28824d9b70bSJan Beulich 	for (i = 0; amd_nb_bus_dev_ranges[i].dev_limit; i++) {
28955c0d721SYinghai Lu 		int bus;
29055c0d721SYinghai Lu 		int dev_base, dev_limit;
29155c0d721SYinghai Lu 
29224d9b70bSJan Beulich 		bus = amd_nb_bus_dev_ranges[i].bus;
29324d9b70bSJan Beulich 		dev_base = amd_nb_bus_dev_ranges[i].dev_base;
29424d9b70bSJan Beulich 		dev_limit = amd_nb_bus_dev_ranges[i].dev_limit;
29555c0d721SYinghai Lu 
29655c0d721SYinghai Lu 		for (slot = dev_base; slot < dev_limit; slot++) {
297eec1d4faSHans Rosenfeld 			if (!early_is_amd_nb(read_pci_config(bus, slot, 3, 0x00)))
298aaf23042SYinghai Lu 				continue;
299aaf23042SYinghai Lu 
30055c0d721SYinghai Lu 			ctl = read_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL);
30157ab43e3SBorislav Petkov 			aper_enabled = ctl & GARTEN;
302aaf23042SYinghai Lu 			aper_order = (ctl >> 1) & 7;
303aaf23042SYinghai Lu 			aper_size = (32 * 1024 * 1024) << aper_order;
30455c0d721SYinghai Lu 			aper_base = read_pci_config(bus, slot, 3, AMD64_GARTAPERTUREBASE) & 0x7fff;
305aaf23042SYinghai Lu 			aper_base <<= 25;
306aaf23042SYinghai Lu 
307fa5b8a30SPavel Machek 			if (last_valid) {
308fa5b8a30SPavel Machek 				if ((aper_order != last_aper_order) ||
309fa5b8a30SPavel Machek 				    (aper_base != last_aper_base) ||
310fa5b8a30SPavel Machek 				    (aper_enabled != last_aper_enabled)) {
311aaf23042SYinghai Lu 					fix = 1;
312fa5b8a30SPavel Machek 					break;
313aaf23042SYinghai Lu 				}
31455c0d721SYinghai Lu 			}
315aaf23042SYinghai Lu 
316fa5b8a30SPavel Machek 			last_aper_order = aper_order;
317fa5b8a30SPavel Machek 			last_aper_base = aper_base;
318fa5b8a30SPavel Machek 			last_aper_enabled = aper_enabled;
319fa5b8a30SPavel Machek 			last_valid = 1;
320fa5b8a30SPavel Machek 		}
321fa5b8a30SPavel Machek 	}
322fa5b8a30SPavel Machek 
323aaf23042SYinghai Lu 	if (!fix && !aper_enabled)
324aaf23042SYinghai Lu 		return;
325aaf23042SYinghai Lu 
326aaf23042SYinghai Lu 	if (!aper_base || !aper_size || aper_base + aper_size > 0x100000000UL)
327aaf23042SYinghai Lu 		fix = 1;
328aaf23042SYinghai Lu 
329aaf23042SYinghai Lu 	if (gart_fix_e820 && !fix && aper_enabled) {
3300754557dSYinghai Lu 		if (e820_any_mapped(aper_base, aper_base + aper_size,
3310754557dSYinghai Lu 				    E820_RAM)) {
3320abbc78aSPavel Machek 			/* reserve it, so we can reuse it in second kernel */
333aaf23042SYinghai Lu 			printk(KERN_INFO "update e820 for GART\n");
334d0be6bdeSYinghai Lu 			e820_add_region(aper_base, aper_size, E820_RESERVED);
335aaf23042SYinghai Lu 			update_e820();
336aaf23042SYinghai Lu 		}
337aaf23042SYinghai Lu 	}
338aaf23042SYinghai Lu 
339f3eee542SYinghai Lu 	if (valid_agp)
3404f384f8bSPavel Machek 		return;
3414f384f8bSPavel Machek 
342f3eee542SYinghai Lu 	/* disable them all at first */
34324d9b70bSJan Beulich 	for (i = 0; i < amd_nb_bus_dev_ranges[i].dev_limit; i++) {
34455c0d721SYinghai Lu 		int bus;
34555c0d721SYinghai Lu 		int dev_base, dev_limit;
34655c0d721SYinghai Lu 
34724d9b70bSJan Beulich 		bus = amd_nb_bus_dev_ranges[i].bus;
34824d9b70bSJan Beulich 		dev_base = amd_nb_bus_dev_ranges[i].dev_base;
34924d9b70bSJan Beulich 		dev_limit = amd_nb_bus_dev_ranges[i].dev_limit;
35055c0d721SYinghai Lu 
35155c0d721SYinghai Lu 		for (slot = dev_base; slot < dev_limit; slot++) {
352eec1d4faSHans Rosenfeld 			if (!early_is_amd_nb(read_pci_config(bus, slot, 3, 0x00)))
353aaf23042SYinghai Lu 				continue;
354aaf23042SYinghai Lu 
35555c0d721SYinghai Lu 			ctl = read_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL);
35657ab43e3SBorislav Petkov 			ctl &= ~GARTEN;
35755c0d721SYinghai Lu 			write_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL, ctl);
35855c0d721SYinghai Lu 		}
359aaf23042SYinghai Lu 	}
360aaf23042SYinghai Lu 
361aaf23042SYinghai Lu }
362aaf23042SYinghai Lu 
3638c9fd91aSYinghai Lu static int __initdata printed_gart_size_msg;
3648c9fd91aSYinghai Lu 
365480125baSKonrad Rzeszutek Wilk int __init gart_iommu_hole_init(void)
366250c2277SThomas Gleixner {
3678c9fd91aSYinghai Lu 	u32 agp_aper_base = 0, agp_aper_order = 0;
368250c2277SThomas Gleixner 	u32 aper_size, aper_alloc = 0, aper_order = 0, last_aper_order = 0;
369250c2277SThomas Gleixner 	u64 aper_base, last_aper_base = 0;
37055c0d721SYinghai Lu 	int fix, slot, valid_agp = 0;
37155c0d721SYinghai Lu 	int i, node;
372250c2277SThomas Gleixner 
3730440d4c0SJoerg Roedel 	if (gart_iommu_aperture_disabled || !fix_aperture ||
3740440d4c0SJoerg Roedel 	    !early_pci_allowed())
375480125baSKonrad Rzeszutek Wilk 		return -ENODEV;
376250c2277SThomas Gleixner 
377250c2277SThomas Gleixner 	printk(KERN_INFO  "Checking aperture...\n");
378250c2277SThomas Gleixner 
3798c9fd91aSYinghai Lu 	if (!fallback_aper_force)
3808c9fd91aSYinghai Lu 		agp_aper_base = search_agp_bridge(&agp_aper_order, &valid_agp);
3818c9fd91aSYinghai Lu 
382250c2277SThomas Gleixner 	fix = 0;
38347db4c3eSYinghai Lu 	node = 0;
38424d9b70bSJan Beulich 	for (i = 0; i < amd_nb_bus_dev_ranges[i].dev_limit; i++) {
38555c0d721SYinghai Lu 		int bus;
38655c0d721SYinghai Lu 		int dev_base, dev_limit;
3874b83873dSJoerg Roedel 		u32 ctl;
38855c0d721SYinghai Lu 
38924d9b70bSJan Beulich 		bus = amd_nb_bus_dev_ranges[i].bus;
39024d9b70bSJan Beulich 		dev_base = amd_nb_bus_dev_ranges[i].dev_base;
39124d9b70bSJan Beulich 		dev_limit = amd_nb_bus_dev_ranges[i].dev_limit;
39255c0d721SYinghai Lu 
39355c0d721SYinghai Lu 		for (slot = dev_base; slot < dev_limit; slot++) {
394eec1d4faSHans Rosenfeld 			if (!early_is_amd_nb(read_pci_config(bus, slot, 3, 0x00)))
395250c2277SThomas Gleixner 				continue;
396250c2277SThomas Gleixner 
397250c2277SThomas Gleixner 			iommu_detected = 1;
3980440d4c0SJoerg Roedel 			gart_iommu_aperture = 1;
399de957628SFUJITA Tomonori 			x86_init.iommu.iommu_init = gart_iommu_init;
400250c2277SThomas Gleixner 
4014b83873dSJoerg Roedel 			ctl = read_pci_config(bus, slot, 3,
4024b83873dSJoerg Roedel 					      AMD64_GARTAPERTURECTL);
4034b83873dSJoerg Roedel 
4044b83873dSJoerg Roedel 			/*
4054b83873dSJoerg Roedel 			 * Before we do anything else disable the GART. It may
4064b83873dSJoerg Roedel 			 * still be enabled if we boot into a crash-kernel here.
4074b83873dSJoerg Roedel 			 * Reconfiguring the GART while it is enabled could have
4084b83873dSJoerg Roedel 			 * unknown side-effects.
4094b83873dSJoerg Roedel 			 */
4104b83873dSJoerg Roedel 			ctl &= ~GARTEN;
4114b83873dSJoerg Roedel 			write_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL, ctl);
4124b83873dSJoerg Roedel 
4134b83873dSJoerg Roedel 			aper_order = (ctl >> 1) & 7;
414250c2277SThomas Gleixner 			aper_size = (32 * 1024 * 1024) << aper_order;
41555c0d721SYinghai Lu 			aper_base = read_pci_config(bus, slot, 3, AMD64_GARTAPERTUREBASE) & 0x7fff;
416250c2277SThomas Gleixner 			aper_base <<= 25;
417250c2277SThomas Gleixner 
41847db4c3eSYinghai Lu 			printk(KERN_INFO "Node %d: aperture @ %Lx size %u MB\n",
41947db4c3eSYinghai Lu 					node, aper_base, aper_size >> 20);
42047db4c3eSYinghai Lu 			node++;
421250c2277SThomas Gleixner 
4228c9fd91aSYinghai Lu 			if (!aperture_valid(aper_base, aper_size, 64<<20)) {
4238c9fd91aSYinghai Lu 				if (valid_agp && agp_aper_base &&
4248c9fd91aSYinghai Lu 				    agp_aper_base == aper_base &&
4258c9fd91aSYinghai Lu 				    agp_aper_order == aper_order) {
4268c9fd91aSYinghai Lu 					/* the same between two setting from NB and agp */
427c987d12fSYinghai Lu 					if (!no_iommu &&
428c987d12fSYinghai Lu 					    max_pfn > MAX_DMA32_PFN &&
429c987d12fSYinghai Lu 					    !printed_gart_size_msg) {
4308c9fd91aSYinghai Lu 						printk(KERN_ERR "you are using iommu with agp, but GART size is less than 64M\n");
4318c9fd91aSYinghai Lu 						printk(KERN_ERR "please increase GART size in your BIOS setup\n");
4328c9fd91aSYinghai Lu 						printk(KERN_ERR "if BIOS doesn't have that option, contact your HW vendor!\n");
4338c9fd91aSYinghai Lu 						printed_gart_size_msg = 1;
4348c9fd91aSYinghai Lu 					}
4358c9fd91aSYinghai Lu 				} else {
436250c2277SThomas Gleixner 					fix = 1;
43755c0d721SYinghai Lu 					goto out;
438250c2277SThomas Gleixner 				}
4398c9fd91aSYinghai Lu 			}
440250c2277SThomas Gleixner 
441250c2277SThomas Gleixner 			if ((last_aper_order && aper_order != last_aper_order) ||
442250c2277SThomas Gleixner 			    (last_aper_base && aper_base != last_aper_base)) {
443250c2277SThomas Gleixner 				fix = 1;
44455c0d721SYinghai Lu 				goto out;
445250c2277SThomas Gleixner 			}
446250c2277SThomas Gleixner 			last_aper_order = aper_order;
447250c2277SThomas Gleixner 			last_aper_base = aper_base;
448250c2277SThomas Gleixner 		}
44955c0d721SYinghai Lu 	}
450250c2277SThomas Gleixner 
45155c0d721SYinghai Lu out:
452250c2277SThomas Gleixner 	if (!fix && !fallback_aper_force) {
453250c2277SThomas Gleixner 		if (last_aper_base) {
454250c2277SThomas Gleixner 			unsigned long n = (32 * 1024 * 1024) << last_aper_order;
455c140df97SIngo Molnar 
456250c2277SThomas Gleixner 			insert_aperture_resource((u32)last_aper_base, n);
457480125baSKonrad Rzeszutek Wilk 			return 1;
458250c2277SThomas Gleixner 		}
459480125baSKonrad Rzeszutek Wilk 		return 0;
460250c2277SThomas Gleixner 	}
461250c2277SThomas Gleixner 
4628c9fd91aSYinghai Lu 	if (!fallback_aper_force) {
4638c9fd91aSYinghai Lu 		aper_alloc = agp_aper_base;
4648c9fd91aSYinghai Lu 		aper_order = agp_aper_order;
4658c9fd91aSYinghai Lu 	}
466250c2277SThomas Gleixner 
467250c2277SThomas Gleixner 	if (aper_alloc) {
468250c2277SThomas Gleixner 		/* Got the aperture from the AGP bridge */
469c987d12fSYinghai Lu 	} else if ((!no_iommu && max_pfn > MAX_DMA32_PFN) ||
470250c2277SThomas Gleixner 		   force_iommu ||
471250c2277SThomas Gleixner 		   valid_agp ||
472250c2277SThomas Gleixner 		   fallback_aper_force) {
4739b156845SAdam Jackson 		printk(KERN_INFO
47431183ba8SIngo Molnar 			"Your BIOS doesn't leave a aperture memory hole\n");
4759b156845SAdam Jackson 		printk(KERN_INFO
47631183ba8SIngo Molnar 			"Please enable the IOMMU option in the BIOS setup\n");
4779b156845SAdam Jackson 		printk(KERN_INFO
47831183ba8SIngo Molnar 			"This costs you %d MB of RAM\n",
479250c2277SThomas Gleixner 				32 << fallback_aper_order);
480250c2277SThomas Gleixner 
481250c2277SThomas Gleixner 		aper_order = fallback_aper_order;
482250c2277SThomas Gleixner 		aper_alloc = allocate_aperture();
483250c2277SThomas Gleixner 		if (!aper_alloc) {
484c140df97SIngo Molnar 			/*
485c140df97SIngo Molnar 			 * Could disable AGP and IOMMU here, but it's
486c140df97SIngo Molnar 			 * probably not worth it. But the later users
487c140df97SIngo Molnar 			 * cannot deal with bad apertures and turning
488c140df97SIngo Molnar 			 * on the aperture over memory causes very
489c140df97SIngo Molnar 			 * strange problems, so it's better to panic
490c140df97SIngo Molnar 			 * early.
491c140df97SIngo Molnar 			 */
492250c2277SThomas Gleixner 			panic("Not enough memory for aperture");
493250c2277SThomas Gleixner 		}
494250c2277SThomas Gleixner 	} else {
495480125baSKonrad Rzeszutek Wilk 		return 0;
496250c2277SThomas Gleixner 	}
497250c2277SThomas Gleixner 
498250c2277SThomas Gleixner 	/* Fix up the north bridges */
49924d9b70bSJan Beulich 	for (i = 0; i < amd_nb_bus_dev_ranges[i].dev_limit; i++) {
500260133abSBorislav Petkov 		int bus, dev_base, dev_limit;
501260133abSBorislav Petkov 
502260133abSBorislav Petkov 		/*
503260133abSBorislav Petkov 		 * Don't enable translation yet but enable GART IO and CPU
504260133abSBorislav Petkov 		 * accesses and set DISTLBWALKPRB since GART table memory is UC.
505260133abSBorislav Petkov 		 */
506c34151a7SJoerg Roedel 		u32 ctl = aper_order << 1;
50755c0d721SYinghai Lu 
50824d9b70bSJan Beulich 		bus = amd_nb_bus_dev_ranges[i].bus;
50924d9b70bSJan Beulich 		dev_base = amd_nb_bus_dev_ranges[i].dev_base;
51024d9b70bSJan Beulich 		dev_limit = amd_nb_bus_dev_ranges[i].dev_limit;
51155c0d721SYinghai Lu 		for (slot = dev_base; slot < dev_limit; slot++) {
512eec1d4faSHans Rosenfeld 			if (!early_is_amd_nb(read_pci_config(bus, slot, 3, 0x00)))
513250c2277SThomas Gleixner 				continue;
514250c2277SThomas Gleixner 
515260133abSBorislav Petkov 			write_pci_config(bus, slot, 3, AMD64_GARTAPERTURECTL, ctl);
51655c0d721SYinghai Lu 			write_pci_config(bus, slot, 3, AMD64_GARTAPERTUREBASE, aper_alloc >> 25);
51755c0d721SYinghai Lu 		}
518250c2277SThomas Gleixner 	}
5196703f6d1SRafael J. Wysocki 
5206703f6d1SRafael J. Wysocki 	set_up_gart_resume(aper_order, aper_alloc);
521480125baSKonrad Rzeszutek Wilk 
522480125baSKonrad Rzeszutek Wilk 	return 1;
523250c2277SThomas Gleixner }
524