xref: /linux/arch/powerpc/platforms/pseries/lpar.c (revision 9ce7677cfd7cd871adb457c80bea3b581b839641)
1 /*
2  * pSeries_lpar.c
3  * Copyright (C) 2001 Todd Inglett, IBM Corporation
4  *
5  * pSeries LPAR support.
6  *
7  * This program is free software; you can redistribute it and/or modify
8  * it under the terms of the GNU General Public License as published by
9  * the Free Software Foundation; either version 2 of the License, or
10  * (at your option) any later version.
11  *
12  * This program is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15  * GNU General Public License for more details.
16  *
17  * You should have received a copy of the GNU General Public License
18  * along with this program; if not, write to the Free Software
19  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
20  */
21 
22 #undef DEBUG_LOW
23 
24 #include <linux/config.h>
25 #include <linux/kernel.h>
26 #include <linux/dma-mapping.h>
27 #include <asm/processor.h>
28 #include <asm/mmu.h>
29 #include <asm/page.h>
30 #include <asm/pgtable.h>
31 #include <asm/machdep.h>
32 #include <asm/abs_addr.h>
33 #include <asm/mmu_context.h>
34 #include <asm/iommu.h>
35 #include <asm/tlbflush.h>
36 #include <asm/tlb.h>
37 #include <asm/prom.h>
38 #include <asm/abs_addr.h>
39 #include <asm/cputable.h>
40 #include <asm/udbg.h>
41 #include <asm/smp.h>
42 
43 #include "plpar_wrappers.h"
44 
/*
 * Low-level tracing hook.  When DEBUG_LOW is defined, DBG_LOW() hands its
 * arguments to udbg_printf(); otherwise it expands to an empty statement.
 */
#ifndef DEBUG_LOW
#define DBG_LOW(fmt...) do { } while(0)
#else
#define DBG_LOW(fmt...) do { udbg_printf(fmt); } while(0)
#endif
50 
/* virtual terminal# for udbg */
int vtermno;

extern void pSeries_find_serial_port(void);

/* The exported hcall entry points live in pSeries_hvCall.S */
EXPORT_SYMBOL(plpar_hcall_norets);
EXPORT_SYMBOL(plpar_hcall);
EXPORT_SYMBOL(plpar_hcall_4out);
EXPORT_SYMBOL(plpar_hcall_8arg_2ret);
61 
62 #define __ALIGNED__ __attribute__((__aligned__(sizeof(long))))
63 static void udbg_hvsi_putc(unsigned char c)
64 {
65 	/* packet's seqno isn't used anyways */
66 	uint8_t packet[] __ALIGNED__ = { 0xff, 5, 0, 0, c };
67 	int rc;
68 
69 	if (c == '\n')
70 		udbg_hvsi_putc('\r');
71 
72 	do {
73 		rc = plpar_put_term_char(vtermno, sizeof(packet), packet);
74 	} while (rc == H_Busy);
75 }
76 
77 static long hvsi_udbg_buf_len;
78 static uint8_t hvsi_udbg_buf[256];
79 
80 static int udbg_hvsi_getc_poll(void)
81 {
82 	unsigned char ch;
83 	int rc, i;
84 
85 	if (hvsi_udbg_buf_len == 0) {
86 		rc = plpar_get_term_char(vtermno, &hvsi_udbg_buf_len, hvsi_udbg_buf);
87 		if (rc != H_Success || hvsi_udbg_buf[0] != 0xff) {
88 			/* bad read or non-data packet */
89 			hvsi_udbg_buf_len = 0;
90 		} else {
91 			/* remove the packet header */
92 			for (i = 4; i < hvsi_udbg_buf_len; i++)
93 				hvsi_udbg_buf[i-4] = hvsi_udbg_buf[i];
94 			hvsi_udbg_buf_len -= 4;
95 		}
96 	}
97 
98 	if (hvsi_udbg_buf_len <= 0 || hvsi_udbg_buf_len > 256) {
99 		/* no data ready */
100 		hvsi_udbg_buf_len = 0;
101 		return -1;
102 	}
103 
104 	ch = hvsi_udbg_buf[0];
105 	/* shift remaining data down */
106 	for (i = 1; i < hvsi_udbg_buf_len; i++) {
107 		hvsi_udbg_buf[i-1] = hvsi_udbg_buf[i];
108 	}
109 	hvsi_udbg_buf_len--;
110 
111 	return ch;
112 }
113 
/*
 * Blocking read of one character from the HVSI virtual terminal: keeps
 * calling udbg_hvsi_getc_poll() until it yields something other than -1,
 * busy-waiting between unsuccessful polls.
 */
static unsigned char udbg_hvsi_getc(void)
{
	int c;

	while ((c = udbg_hvsi_getc_poll()) == -1) {
		/* This shouldn't be needed...but... */
		volatile unsigned long spin;

		for (spin = 0; spin < 2000000; spin++)
			;
	}

	return c;
}
129 
130 static void udbg_putcLP(unsigned char c)
131 {
132 	char buf[16];
133 	unsigned long rc;
134 
135 	if (c == '\n')
136 		udbg_putcLP('\r');
137 
138 	buf[0] = c;
139 	do {
140 		rc = plpar_put_term_char(vtermno, 1, buf);
141 	} while(rc == H_Busy);
142 }
143 
144 /* Buffered chars getc */
145 static long inbuflen;
146 static long inbuf[2];	/* must be 2 longs */
147 
148 static int udbg_getc_pollLP(void)
149 {
150 	/* The interface is tricky because it may return up to 16 chars.
151 	 * We save them statically for future calls to udbg_getc().
152 	 */
153 	char ch, *buf = (char *)inbuf;
154 	int i;
155 	long rc;
156 	if (inbuflen == 0) {
157 		/* get some more chars. */
158 		inbuflen = 0;
159 		rc = plpar_get_term_char(vtermno, &inbuflen, buf);
160 		if (rc != H_Success)
161 			inbuflen = 0;	/* otherwise inbuflen is garbage */
162 	}
163 	if (inbuflen <= 0 || inbuflen > 16) {
164 		/* Catch error case as well as other oddities (corruption) */
165 		inbuflen = 0;
166 		return -1;
167 	}
168 	ch = buf[0];
169 	for (i = 1; i < inbuflen; i++)	/* shuffle them down. */
170 		buf[i-1] = buf[i];
171 	inbuflen--;
172 	return ch;
173 }
174 
/*
 * Blocking read of one character from the virtual terminal: keeps calling
 * udbg_getc_pollLP() until it yields something other than -1, busy-waiting
 * between unsuccessful polls.
 */
static unsigned char udbg_getcLP(void)
{
	int c;

	while ((c = udbg_getc_pollLP()) == -1) {
		/* This shouldn't be needed...but... */
		volatile unsigned long spin;

		for (spin = 0; spin < 2000000; spin++)
			;
	}

	return c;
}
190 
191 /* call this from early_init() for a working debug console on
192  * vterm capable LPAR machines
193  */
194 void udbg_init_debug_lpar(void)
195 {
196 	vtermno = 0;
197 	udbg_putc = udbg_putcLP;
198 	udbg_getc = udbg_getcLP;
199 	udbg_getc_poll = udbg_getc_pollLP;
200 }
201 
202 /* returns 0 if couldn't find or use /chosen/stdout as console */
203 int find_udbg_vterm(void)
204 {
205 	struct device_node *stdout_node;
206 	u32 *termno;
207 	char *name;
208 	int found = 0;
209 
210 	/* find the boot console from /chosen/stdout */
211 	if (!of_chosen)
212 		return 0;
213 	name = (char *)get_property(of_chosen, "linux,stdout-path", NULL);
214 	if (name == NULL)
215 		return 0;
216 	stdout_node = of_find_node_by_path(name);
217 	if (!stdout_node)
218 		return 0;
219 
220 	/* now we have the stdout node; figure out what type of device it is. */
221 	name = (char *)get_property(stdout_node, "name", NULL);
222 	if (!name) {
223 		printk(KERN_WARNING "stdout node missing 'name' property!\n");
224 		goto out;
225 	}
226 
227 	if (strncmp(name, "vty", 3) == 0) {
228 		if (device_is_compatible(stdout_node, "hvterm1")) {
229 			termno = (u32 *)get_property(stdout_node, "reg", NULL);
230 			if (termno) {
231 				vtermno = termno[0];
232 				udbg_putc = udbg_putcLP;
233 				udbg_getc = udbg_getcLP;
234 				udbg_getc_poll = udbg_getc_pollLP;
235 				found = 1;
236 			}
237 		} else if (device_is_compatible(stdout_node, "hvterm-protocol")) {
238 			termno = (u32 *)get_property(stdout_node, "reg", NULL);
239 			if (termno) {
240 				vtermno = termno[0];
241 				udbg_putc = udbg_hvsi_putc;
242 				udbg_getc = udbg_hvsi_getc;
243 				udbg_getc_poll = udbg_hvsi_getc_poll;
244 				found = 1;
245 			}
246 		}
247 	} else if (strncmp(name, "serial", 6)) {
248 		/* XXX fix ISA serial console */
249 		printk(KERN_WARNING "serial stdout on LPAR ('%s')! "
250 				"can't print udbg messages\n",
251 		       stdout_node->full_name);
252 	} else {
253 		printk(KERN_WARNING "don't know how to print to stdout '%s'\n",
254 		       stdout_node->full_name);
255 	}
256 
257 out:
258 	of_node_put(stdout_node);
259 	return found;
260 }
261 
262 void vpa_init(int cpu)
263 {
264 	int hwcpu = get_hard_smp_processor_id(cpu);
265 	unsigned long vpa = __pa(&paca[cpu].lppaca);
266 	long ret;
267 
268 	if (cpu_has_feature(CPU_FTR_ALTIVEC))
269 		paca[cpu].lppaca.vmxregs_in_use = 1;
270 
271 	ret = register_vpa(hwcpu, vpa);
272 
273 	if (ret)
274 		printk(KERN_ERR "WARNING: vpa_init: VPA registration for "
275 				"cpu %d (hw %d) of area %lx returns %ld\n",
276 				cpu, hwcpu, vpa, ret);
277 }
278 
279 long pSeries_lpar_hpte_insert(unsigned long hpte_group,
280  			      unsigned long va, unsigned long pa,
281  			      unsigned long rflags, unsigned long vflags,
282  			      int psize)
283 {
284 	unsigned long lpar_rc;
285 	unsigned long flags;
286 	unsigned long slot;
287 	unsigned long hpte_v, hpte_r;
288 	unsigned long dummy0, dummy1;
289 
290 	if (!(vflags & HPTE_V_BOLTED))
291 		DBG_LOW("hpte_insert(group=%lx, va=%016lx, pa=%016lx, "
292 			"rflags=%lx, vflags=%lx, psize=%d)\n",
293 		hpte_group, va, pa, rflags, vflags, psize);
294 
295  	hpte_v = hpte_encode_v(va, psize) | vflags | HPTE_V_VALID;
296 	hpte_r = hpte_encode_r(pa, psize) | rflags;
297 
298 	if (!(vflags & HPTE_V_BOLTED))
299 		DBG_LOW(" hpte_v=%016lx, hpte_r=%016lx\n", hpte_v, hpte_r);
300 
301 	/* Now fill in the actual HPTE */
302 	/* Set CEC cookie to 0         */
303 	/* Zero page = 0               */
304 	/* I-cache Invalidate = 0      */
305 	/* I-cache synchronize = 0     */
306 	/* Exact = 0                   */
307 	flags = 0;
308 
309 	/* Make pHyp happy */
310 	if (rflags & (_PAGE_GUARDED|_PAGE_NO_CACHE))
311 		hpte_r &= ~_PAGE_COHERENT;
312 
313 	lpar_rc = plpar_hcall(H_ENTER, flags, hpte_group, hpte_v,
314 			      hpte_r, &slot, &dummy0, &dummy1);
315 	if (unlikely(lpar_rc == H_PTEG_Full)) {
316 		if (!(vflags & HPTE_V_BOLTED))
317 			DBG_LOW(" full\n");
318 		return -1;
319 	}
320 
321 	/*
322 	 * Since we try and ioremap PHBs we don't own, the pte insert
323 	 * will fail. However we must catch the failure in hash_page
324 	 * or we will loop forever, so return -2 in this case.
325 	 */
326 	if (unlikely(lpar_rc != H_Success)) {
327 		if (!(vflags & HPTE_V_BOLTED))
328 			DBG_LOW(" lpar err %d\n", lpar_rc);
329 		return -2;
330 	}
331 	if (!(vflags & HPTE_V_BOLTED))
332 		DBG_LOW(" -> slot: %d\n", slot & 7);
333 
334 	/* Because of iSeries, we have to pass down the secondary
335 	 * bucket bit here as well
336 	 */
337 	return (slot & 7) | (!!(vflags & HPTE_V_SECONDARY) << 3);
338 }
339 
340 static DEFINE_SPINLOCK(pSeries_lpar_tlbie_lock);
341 
342 static long pSeries_lpar_hpte_remove(unsigned long hpte_group)
343 {
344 	unsigned long slot_offset;
345 	unsigned long lpar_rc;
346 	int i;
347 	unsigned long dummy1, dummy2;
348 
349 	/* pick a random slot to start at */
350 	slot_offset = mftb() & 0x7;
351 
352 	for (i = 0; i < HPTES_PER_GROUP; i++) {
353 
354 		/* don't remove a bolted entry */
355 		lpar_rc = plpar_pte_remove(H_ANDCOND, hpte_group + slot_offset,
356 					   (0x1UL << 4), &dummy1, &dummy2);
357 		if (lpar_rc == H_Success)
358 			return i;
359 		BUG_ON(lpar_rc != H_Not_Found);
360 
361 		slot_offset++;
362 		slot_offset &= 0x7;
363 	}
364 
365 	return -1;
366 }
367 
368 static void pSeries_lpar_hptab_clear(void)
369 {
370 	unsigned long size_bytes = 1UL << ppc64_pft_size;
371 	unsigned long hpte_count = size_bytes >> 4;
372 	unsigned long dummy1, dummy2;
373 	int i;
374 
375 	/* TODO: Use bulk call */
376 	for (i = 0; i < hpte_count; i++)
377 		plpar_pte_remove(0, i, 0, &dummy1, &dummy2);
378 }
379 
380 /*
381  * NOTE: for updatepp ops we are fortunate that the linux "newpp" bits and
382  * the low 3 bits of flags happen to line up.  So no transform is needed.
383  * We can probably optimize here and assume the high bits of newpp are
384  * already zero.  For now I am paranoid.
385  */
386 static long pSeries_lpar_hpte_updatepp(unsigned long slot,
387 				       unsigned long newpp,
388 				       unsigned long va,
389 				       int psize, int local)
390 {
391 	unsigned long lpar_rc;
392 	unsigned long flags = (newpp & 7) | H_AVPN;
393 	unsigned long want_v;
394 
395 	want_v = hpte_encode_v(va, psize);
396 
397 	DBG_LOW("    update: avpnv=%016lx, hash=%016lx, f=%x, psize: %d ... ",
398 		want_v & HPTE_V_AVPN, slot, flags, psize);
399 
400 	lpar_rc = plpar_pte_protect(flags, slot, want_v & HPTE_V_AVPN);
401 
402 	if (lpar_rc == H_Not_Found) {
403 		DBG_LOW("not found !\n");
404 		return -1;
405 	}
406 
407 	DBG_LOW("ok\n");
408 
409 	BUG_ON(lpar_rc != H_Success);
410 
411 	return 0;
412 }
413 
414 static unsigned long pSeries_lpar_hpte_getword0(unsigned long slot)
415 {
416 	unsigned long dword0;
417 	unsigned long lpar_rc;
418 	unsigned long dummy_word1;
419 	unsigned long flags;
420 
421 	/* Read 1 pte at a time                        */
422 	/* Do not need RPN to logical page translation */
423 	/* No cross CEC PFT access                     */
424 	flags = 0;
425 
426 	lpar_rc = plpar_pte_read(flags, slot, &dword0, &dummy_word1);
427 
428 	BUG_ON(lpar_rc != H_Success);
429 
430 	return dword0;
431 }
432 
433 static long pSeries_lpar_hpte_find(unsigned long va, int psize)
434 {
435 	unsigned long hash;
436 	unsigned long i, j;
437 	long slot;
438 	unsigned long want_v, hpte_v;
439 
440 	hash = hpt_hash(va, mmu_psize_defs[psize].shift);
441 	want_v = hpte_encode_v(va, psize);
442 
443 	for (j = 0; j < 2; j++) {
444 		slot = (hash & htab_hash_mask) * HPTES_PER_GROUP;
445 		for (i = 0; i < HPTES_PER_GROUP; i++) {
446 			hpte_v = pSeries_lpar_hpte_getword0(slot);
447 
448 			if (HPTE_V_COMPARE(hpte_v, want_v)
449 			    && (hpte_v & HPTE_V_VALID)
450 			    && (!!(hpte_v & HPTE_V_SECONDARY) == j)) {
451 				/* HPTE matches */
452 				if (j)
453 					slot = -slot;
454 				return slot;
455 			}
456 			++slot;
457 		}
458 		hash = ~hash;
459 	}
460 
461 	return -1;
462 }
463 
464 static void pSeries_lpar_hpte_updateboltedpp(unsigned long newpp,
465 					     unsigned long ea,
466 					     int psize)
467 {
468 	unsigned long lpar_rc, slot, vsid, va, flags;
469 
470 	vsid = get_kernel_vsid(ea);
471 	va = (vsid << 28) | (ea & 0x0fffffff);
472 
473 	slot = pSeries_lpar_hpte_find(va, psize);
474 	BUG_ON(slot == -1);
475 
476 	flags = newpp & 7;
477 	lpar_rc = plpar_pte_protect(flags, slot, 0);
478 
479 	BUG_ON(lpar_rc != H_Success);
480 }
481 
482 static void pSeries_lpar_hpte_invalidate(unsigned long slot, unsigned long va,
483 					 int psize, int local)
484 {
485 	unsigned long want_v;
486 	unsigned long lpar_rc;
487 	unsigned long dummy1, dummy2;
488 
489 	DBG_LOW("    inval : slot=%lx, va=%016lx, psize: %d, local: %d",
490 		slot, va, psize, local);
491 
492 	want_v = hpte_encode_v(va, psize);
493 	lpar_rc = plpar_pte_remove(H_AVPN, slot, want_v & HPTE_V_AVPN,
494 				   &dummy1, &dummy2);
495 	if (lpar_rc == H_Not_Found)
496 		return;
497 
498 	BUG_ON(lpar_rc != H_Success);
499 }
500 
501 /*
502  * Take a spinlock around flushes to avoid bouncing the hypervisor tlbie
503  * lock.
504  */
505 void pSeries_lpar_flush_hash_range(unsigned long number, int local)
506 {
507 	int i;
508 	unsigned long flags = 0;
509 	struct ppc64_tlb_batch *batch = &__get_cpu_var(ppc64_tlb_batch);
510 	int lock_tlbie = !cpu_has_feature(CPU_FTR_LOCKLESS_TLBIE);
511 
512 	if (lock_tlbie)
513 		spin_lock_irqsave(&pSeries_lpar_tlbie_lock, flags);
514 
515 	for (i = 0; i < number; i++)
516 		flush_hash_page(batch->vaddr[i], batch->pte[i],
517 				batch->psize, local);
518 
519 	if (lock_tlbie)
520 		spin_unlock_irqrestore(&pSeries_lpar_tlbie_lock, flags);
521 }
522 
523 void hpte_init_lpar(void)
524 {
525 	ppc_md.hpte_invalidate	= pSeries_lpar_hpte_invalidate;
526 	ppc_md.hpte_updatepp	= pSeries_lpar_hpte_updatepp;
527 	ppc_md.hpte_updateboltedpp = pSeries_lpar_hpte_updateboltedpp;
528 	ppc_md.hpte_insert	= pSeries_lpar_hpte_insert;
529 	ppc_md.hpte_remove	= pSeries_lpar_hpte_remove;
530 	ppc_md.flush_hash_range	= pSeries_lpar_flush_hash_range;
531 	ppc_md.hpte_clear_all   = pSeries_lpar_hptab_clear;
532 
533 	htab_finish_init();
534 }
535