xref: /linux/drivers/misc/cxl/guest.c (revision 0883c2c06fb5bcf5b9e008270827e63c09a88c1e)
1 /*
2  * Copyright 2015 IBM Corp.
3  *
4  * This program is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU General Public License
6  * as published by the Free Software Foundation; either version
7  * 2 of the License, or (at your option) any later version.
8  */
9 
10 #include <linux/spinlock.h>
11 #include <linux/uaccess.h>
12 #include <linux/delay.h>
13 
14 #include "cxl.h"
15 #include "hcalls.h"
16 #include "trace.h"
17 
18 #define CXL_ERROR_DETECTED_EVENT	1
19 #define CXL_SLOT_RESET_EVENT		2
20 #define CXL_RESUME_EVENT		3
21 
22 static void pci_error_handlers(struct cxl_afu *afu,
23 				int bus_error_event,
24 				pci_channel_state_t state)
25 {
26 	struct pci_dev *afu_dev;
27 
28 	if (afu->phb == NULL)
29 		return;
30 
31 	list_for_each_entry(afu_dev, &afu->phb->bus->devices, bus_list) {
32 		if (!afu_dev->driver)
33 			continue;
34 
35 		switch (bus_error_event) {
36 		case CXL_ERROR_DETECTED_EVENT:
37 			afu_dev->error_state = state;
38 
39 			if (afu_dev->driver->err_handler &&
40 			    afu_dev->driver->err_handler->error_detected)
41 				afu_dev->driver->err_handler->error_detected(afu_dev, state);
42 		break;
43 		case CXL_SLOT_RESET_EVENT:
44 			afu_dev->error_state = state;
45 
46 			if (afu_dev->driver->err_handler &&
47 			    afu_dev->driver->err_handler->slot_reset)
48 				afu_dev->driver->err_handler->slot_reset(afu_dev);
49 		break;
50 		case CXL_RESUME_EVENT:
51 			if (afu_dev->driver->err_handler &&
52 			    afu_dev->driver->err_handler->resume)
53 				afu_dev->driver->err_handler->resume(afu_dev);
54 		break;
55 		}
56 	}
57 }
58 
59 static irqreturn_t guest_handle_psl_slice_error(struct cxl_context *ctx, u64 dsisr,
60 					u64 errstat)
61 {
62 	pr_devel("in %s\n", __func__);
63 	dev_crit(&ctx->afu->dev, "PSL ERROR STATUS: 0x%.16llx\n", errstat);
64 
65 	return cxl_ops->ack_irq(ctx, 0, errstat);
66 }
67 
68 static ssize_t guest_collect_vpd(struct cxl *adapter, struct cxl_afu *afu,
69 			void *buf, size_t len)
70 {
71 	unsigned int entries, mod;
72 	unsigned long **vpd_buf = NULL;
73 	struct sg_list *le;
74 	int rc = 0, i, tocopy;
75 	u64 out = 0;
76 
77 	if (buf == NULL)
78 		return -EINVAL;
79 
80 	/* number of entries in the list */
81 	entries = len / SG_BUFFER_SIZE;
82 	mod = len % SG_BUFFER_SIZE;
83 	if (mod)
84 		entries++;
85 
86 	if (entries > SG_MAX_ENTRIES) {
87 		entries = SG_MAX_ENTRIES;
88 		len = SG_MAX_ENTRIES * SG_BUFFER_SIZE;
89 		mod = 0;
90 	}
91 
92 	vpd_buf = kzalloc(entries * sizeof(unsigned long *), GFP_KERNEL);
93 	if (!vpd_buf)
94 		return -ENOMEM;
95 
96 	le = (struct sg_list *)get_zeroed_page(GFP_KERNEL);
97 	if (!le) {
98 		rc = -ENOMEM;
99 		goto err1;
100 	}
101 
102 	for (i = 0; i < entries; i++) {
103 		vpd_buf[i] = (unsigned long *)get_zeroed_page(GFP_KERNEL);
104 		if (!vpd_buf[i]) {
105 			rc = -ENOMEM;
106 			goto err2;
107 		}
108 		le[i].phys_addr = cpu_to_be64(virt_to_phys(vpd_buf[i]));
109 		le[i].len = cpu_to_be64(SG_BUFFER_SIZE);
110 		if ((i == (entries - 1)) && mod)
111 			le[i].len = cpu_to_be64(mod);
112 	}
113 
114 	if (adapter)
115 		rc = cxl_h_collect_vpd_adapter(adapter->guest->handle,
116 					virt_to_phys(le), entries, &out);
117 	else
118 		rc = cxl_h_collect_vpd(afu->guest->handle, 0,
119 				virt_to_phys(le), entries, &out);
120 	pr_devel("length of available (entries: %i), vpd: %#llx\n",
121 		entries, out);
122 
123 	if (!rc) {
124 		/*
125 		 * hcall returns in 'out' the size of available VPDs.
126 		 * It fills the buffer with as much data as possible.
127 		 */
128 		if (out < len)
129 			len = out;
130 		rc = len;
131 		if (out) {
132 			for (i = 0; i < entries; i++) {
133 				if (len < SG_BUFFER_SIZE)
134 					tocopy = len;
135 				else
136 					tocopy = SG_BUFFER_SIZE;
137 				memcpy(buf, vpd_buf[i], tocopy);
138 				buf += tocopy;
139 				len -= tocopy;
140 			}
141 		}
142 	}
143 err2:
144 	for (i = 0; i < entries; i++) {
145 		if (vpd_buf[i])
146 			free_page((unsigned long) vpd_buf[i]);
147 	}
148 	free_page((unsigned long) le);
149 err1:
150 	kfree(vpd_buf);
151 	return rc;
152 }
153 
154 static int guest_get_irq_info(struct cxl_context *ctx, struct cxl_irq_info *info)
155 {
156 	return cxl_h_collect_int_info(ctx->afu->guest->handle, ctx->process_token, info);
157 }
158 
159 static irqreturn_t guest_psl_irq(int irq, void *data)
160 {
161 	struct cxl_context *ctx = data;
162 	struct cxl_irq_info irq_info;
163 	int rc;
164 
165 	pr_devel("%d: received PSL interrupt %i\n", ctx->pe, irq);
166 	rc = guest_get_irq_info(ctx, &irq_info);
167 	if (rc) {
168 		WARN(1, "Unable to get IRQ info: %i\n", rc);
169 		return IRQ_HANDLED;
170 	}
171 
172 	rc = cxl_irq(irq, ctx, &irq_info);
173 	return rc;
174 }
175 
176 static int afu_read_error_state(struct cxl_afu *afu, int *state_out)
177 {
178 	u64 state;
179 	int rc = 0;
180 
181 	if (!afu)
182 		return -EIO;
183 
184 	rc = cxl_h_read_error_state(afu->guest->handle, &state);
185 	if (!rc) {
186 		WARN_ON(state != H_STATE_NORMAL &&
187 			state != H_STATE_DISABLE &&
188 			state != H_STATE_TEMP_UNAVAILABLE &&
189 			state != H_STATE_PERM_UNAVAILABLE);
190 		*state_out = state & 0xffffffff;
191 	}
192 	return rc;
193 }
194 
195 static irqreturn_t guest_slice_irq_err(int irq, void *data)
196 {
197 	struct cxl_afu *afu = data;
198 	int rc;
199 	u64 serr;
200 
201 	WARN(irq, "CXL SLICE ERROR interrupt %i\n", irq);
202 	rc = cxl_h_get_fn_error_interrupt(afu->guest->handle, &serr);
203 	if (rc) {
204 		dev_crit(&afu->dev, "Couldn't read PSL_SERR_An: %d\n", rc);
205 		return IRQ_HANDLED;
206 	}
207 	dev_crit(&afu->dev, "PSL_SERR_An: 0x%.16llx\n", serr);
208 
209 	rc = cxl_h_ack_fn_error_interrupt(afu->guest->handle, serr);
210 	if (rc)
211 		dev_crit(&afu->dev, "Couldn't ack slice error interrupt: %d\n",
212 			rc);
213 
214 	return IRQ_HANDLED;
215 }
216 
217 
218 static int irq_alloc_range(struct cxl *adapter, int len, int *irq)
219 {
220 	int i, n;
221 	struct irq_avail *cur;
222 
223 	for (i = 0; i < adapter->guest->irq_nranges; i++) {
224 		cur = &adapter->guest->irq_avail[i];
225 		n = bitmap_find_next_zero_area(cur->bitmap, cur->range,
226 					0, len, 0);
227 		if (n < cur->range) {
228 			bitmap_set(cur->bitmap, n, len);
229 			*irq = cur->offset + n;
230 			pr_devel("guest: allocate IRQs %#x->%#x\n",
231 				*irq, *irq + len - 1);
232 
233 			return 0;
234 		}
235 	}
236 	return -ENOSPC;
237 }
238 
239 static int irq_free_range(struct cxl *adapter, int irq, int len)
240 {
241 	int i, n;
242 	struct irq_avail *cur;
243 
244 	if (len == 0)
245 		return -ENOENT;
246 
247 	for (i = 0; i < adapter->guest->irq_nranges; i++) {
248 		cur = &adapter->guest->irq_avail[i];
249 		if (irq >= cur->offset &&
250 			(irq + len) <= (cur->offset + cur->range)) {
251 			n = irq - cur->offset;
252 			bitmap_clear(cur->bitmap, n, len);
253 			pr_devel("guest: release IRQs %#x->%#x\n",
254 				irq, irq + len - 1);
255 			return 0;
256 		}
257 	}
258 	return -ENOENT;
259 }
260 
261 static int guest_reset(struct cxl *adapter)
262 {
263 	struct cxl_afu *afu = NULL;
264 	int i, rc;
265 
266 	pr_devel("Adapter reset request\n");
267 	for (i = 0; i < adapter->slices; i++) {
268 		if ((afu = adapter->afu[i])) {
269 			pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
270 					pci_channel_io_frozen);
271 			cxl_context_detach_all(afu);
272 		}
273 	}
274 
275 	rc = cxl_h_reset_adapter(adapter->guest->handle);
276 	for (i = 0; i < adapter->slices; i++) {
277 		if (!rc && (afu = adapter->afu[i])) {
278 			pci_error_handlers(afu, CXL_SLOT_RESET_EVENT,
279 					pci_channel_io_normal);
280 			pci_error_handlers(afu, CXL_RESUME_EVENT, 0);
281 		}
282 	}
283 	return rc;
284 }
285 
286 static int guest_alloc_one_irq(struct cxl *adapter)
287 {
288 	int irq;
289 
290 	spin_lock(&adapter->guest->irq_alloc_lock);
291 	if (irq_alloc_range(adapter, 1, &irq))
292 		irq = -ENOSPC;
293 	spin_unlock(&adapter->guest->irq_alloc_lock);
294 	return irq;
295 }
296 
297 static void guest_release_one_irq(struct cxl *adapter, int irq)
298 {
299 	spin_lock(&adapter->guest->irq_alloc_lock);
300 	irq_free_range(adapter, irq, 1);
301 	spin_unlock(&adapter->guest->irq_alloc_lock);
302 }
303 
304 static int guest_alloc_irq_ranges(struct cxl_irq_ranges *irqs,
305 				struct cxl *adapter, unsigned int num)
306 {
307 	int i, try, irq;
308 
309 	memset(irqs, 0, sizeof(struct cxl_irq_ranges));
310 
311 	spin_lock(&adapter->guest->irq_alloc_lock);
312 	for (i = 0; i < CXL_IRQ_RANGES && num; i++) {
313 		try = num;
314 		while (try) {
315 			if (irq_alloc_range(adapter, try, &irq) == 0)
316 				break;
317 			try /= 2;
318 		}
319 		if (!try)
320 			goto error;
321 		irqs->offset[i] = irq;
322 		irqs->range[i] = try;
323 		num -= try;
324 	}
325 	if (num)
326 		goto error;
327 	spin_unlock(&adapter->guest->irq_alloc_lock);
328 	return 0;
329 
330 error:
331 	for (i = 0; i < CXL_IRQ_RANGES; i++)
332 		irq_free_range(adapter, irqs->offset[i], irqs->range[i]);
333 	spin_unlock(&adapter->guest->irq_alloc_lock);
334 	return -ENOSPC;
335 }
336 
337 static void guest_release_irq_ranges(struct cxl_irq_ranges *irqs,
338 				struct cxl *adapter)
339 {
340 	int i;
341 
342 	spin_lock(&adapter->guest->irq_alloc_lock);
343 	for (i = 0; i < CXL_IRQ_RANGES; i++)
344 		irq_free_range(adapter, irqs->offset[i], irqs->range[i]);
345 	spin_unlock(&adapter->guest->irq_alloc_lock);
346 }
347 
348 static int guest_register_serr_irq(struct cxl_afu *afu)
349 {
350 	afu->err_irq_name = kasprintf(GFP_KERNEL, "cxl-%s-err",
351 				      dev_name(&afu->dev));
352 	if (!afu->err_irq_name)
353 		return -ENOMEM;
354 
355 	if (!(afu->serr_virq = cxl_map_irq(afu->adapter, afu->serr_hwirq,
356 				 guest_slice_irq_err, afu, afu->err_irq_name))) {
357 		kfree(afu->err_irq_name);
358 		afu->err_irq_name = NULL;
359 		return -ENOMEM;
360 	}
361 
362 	return 0;
363 }
364 
365 static void guest_release_serr_irq(struct cxl_afu *afu)
366 {
367 	cxl_unmap_irq(afu->serr_virq, afu);
368 	cxl_ops->release_one_irq(afu->adapter, afu->serr_hwirq);
369 	kfree(afu->err_irq_name);
370 }
371 
372 static int guest_ack_irq(struct cxl_context *ctx, u64 tfc, u64 psl_reset_mask)
373 {
374 	return cxl_h_control_faults(ctx->afu->guest->handle, ctx->process_token,
375 				tfc >> 32, (psl_reset_mask != 0));
376 }
377 
378 static void disable_afu_irqs(struct cxl_context *ctx)
379 {
380 	irq_hw_number_t hwirq;
381 	unsigned int virq;
382 	int r, i;
383 
384 	pr_devel("Disabling AFU(%d) interrupts\n", ctx->afu->slice);
385 	for (r = 0; r < CXL_IRQ_RANGES; r++) {
386 		hwirq = ctx->irqs.offset[r];
387 		for (i = 0; i < ctx->irqs.range[r]; hwirq++, i++) {
388 			virq = irq_find_mapping(NULL, hwirq);
389 			disable_irq(virq);
390 		}
391 	}
392 }
393 
394 static void enable_afu_irqs(struct cxl_context *ctx)
395 {
396 	irq_hw_number_t hwirq;
397 	unsigned int virq;
398 	int r, i;
399 
400 	pr_devel("Enabling AFU(%d) interrupts\n", ctx->afu->slice);
401 	for (r = 0; r < CXL_IRQ_RANGES; r++) {
402 		hwirq = ctx->irqs.offset[r];
403 		for (i = 0; i < ctx->irqs.range[r]; hwirq++, i++) {
404 			virq = irq_find_mapping(NULL, hwirq);
405 			enable_irq(virq);
406 		}
407 	}
408 }
409 
410 static int _guest_afu_cr_readXX(int sz, struct cxl_afu *afu, int cr_idx,
411 			u64 offset, u64 *val)
412 {
413 	unsigned long cr;
414 	char c;
415 	int rc = 0;
416 
417 	if (afu->crs_len < sz)
418 		return -ENOENT;
419 
420 	if (unlikely(offset >= afu->crs_len))
421 		return -ERANGE;
422 
423 	cr = get_zeroed_page(GFP_KERNEL);
424 	if (!cr)
425 		return -ENOMEM;
426 
427 	rc = cxl_h_get_config(afu->guest->handle, cr_idx, offset,
428 			virt_to_phys((void *)cr), sz);
429 	if (rc)
430 		goto err;
431 
432 	switch (sz) {
433 	case 1:
434 		c = *((char *) cr);
435 		*val = c;
436 		break;
437 	case 2:
438 		*val = in_le16((u16 *)cr);
439 		break;
440 	case 4:
441 		*val = in_le32((unsigned *)cr);
442 		break;
443 	case 8:
444 		*val = in_le64((u64 *)cr);
445 		break;
446 	default:
447 		WARN_ON(1);
448 	}
449 err:
450 	free_page(cr);
451 	return rc;
452 }
453 
454 static int guest_afu_cr_read32(struct cxl_afu *afu, int cr_idx, u64 offset,
455 			u32 *out)
456 {
457 	int rc;
458 	u64 val;
459 
460 	rc = _guest_afu_cr_readXX(4, afu, cr_idx, offset, &val);
461 	if (!rc)
462 		*out = (u32) val;
463 	return rc;
464 }
465 
466 static int guest_afu_cr_read16(struct cxl_afu *afu, int cr_idx, u64 offset,
467 			u16 *out)
468 {
469 	int rc;
470 	u64 val;
471 
472 	rc = _guest_afu_cr_readXX(2, afu, cr_idx, offset, &val);
473 	if (!rc)
474 		*out = (u16) val;
475 	return rc;
476 }
477 
478 static int guest_afu_cr_read8(struct cxl_afu *afu, int cr_idx, u64 offset,
479 			u8 *out)
480 {
481 	int rc;
482 	u64 val;
483 
484 	rc = _guest_afu_cr_readXX(1, afu, cr_idx, offset, &val);
485 	if (!rc)
486 		*out = (u8) val;
487 	return rc;
488 }
489 
490 static int guest_afu_cr_read64(struct cxl_afu *afu, int cr_idx, u64 offset,
491 			u64 *out)
492 {
493 	return _guest_afu_cr_readXX(8, afu, cr_idx, offset, out);
494 }
495 
496 static int guest_afu_cr_write32(struct cxl_afu *afu, int cr, u64 off, u32 in)
497 {
498 	/* config record is not writable from guest */
499 	return -EPERM;
500 }
501 
502 static int guest_afu_cr_write16(struct cxl_afu *afu, int cr, u64 off, u16 in)
503 {
504 	/* config record is not writable from guest */
505 	return -EPERM;
506 }
507 
508 static int guest_afu_cr_write8(struct cxl_afu *afu, int cr, u64 off, u8 in)
509 {
510 	/* config record is not writable from guest */
511 	return -EPERM;
512 }
513 
514 static int attach_afu_directed(struct cxl_context *ctx, u64 wed, u64 amr)
515 {
516 	struct cxl_process_element_hcall *elem;
517 	struct cxl *adapter = ctx->afu->adapter;
518 	const struct cred *cred;
519 	u32 pid, idx;
520 	int rc, r, i;
521 	u64 mmio_addr, mmio_size;
522 	__be64 flags = 0;
523 
524 	/* Must be 8 byte aligned and cannot cross a 4096 byte boundary */
525 	if (!(elem = (struct cxl_process_element_hcall *)
526 			get_zeroed_page(GFP_KERNEL)))
527 		return -ENOMEM;
528 
529 	elem->version = cpu_to_be64(CXL_PROCESS_ELEMENT_VERSION);
530 	if (ctx->kernel) {
531 		pid = 0;
532 		flags |= CXL_PE_TRANSLATION_ENABLED;
533 		flags |= CXL_PE_PRIVILEGED_PROCESS;
534 		if (mfmsr() & MSR_SF)
535 			flags |= CXL_PE_64_BIT;
536 	} else {
537 		pid = current->pid;
538 		flags |= CXL_PE_PROBLEM_STATE;
539 		flags |= CXL_PE_TRANSLATION_ENABLED;
540 		if (!test_tsk_thread_flag(current, TIF_32BIT))
541 			flags |= CXL_PE_64_BIT;
542 		cred = get_current_cred();
543 		if (uid_eq(cred->euid, GLOBAL_ROOT_UID))
544 			flags |= CXL_PE_PRIVILEGED_PROCESS;
545 		put_cred(cred);
546 	}
547 	elem->flags         = cpu_to_be64(flags);
548 	elem->common.tid    = cpu_to_be32(0); /* Unused */
549 	elem->common.pid    = cpu_to_be32(pid);
550 	elem->common.csrp   = cpu_to_be64(0); /* disable */
551 	elem->common.aurp0  = cpu_to_be64(0); /* disable */
552 	elem->common.aurp1  = cpu_to_be64(0); /* disable */
553 
554 	cxl_prefault(ctx, wed);
555 
556 	elem->common.sstp0  = cpu_to_be64(ctx->sstp0);
557 	elem->common.sstp1  = cpu_to_be64(ctx->sstp1);
558 
559 	/*
560 	 * Ensure we have at least one interrupt allocated to take faults for
561 	 * kernel contexts that may not have allocated any AFU IRQs at all:
562 	 */
563 	if (ctx->irqs.range[0] == 0) {
564 		rc = afu_register_irqs(ctx, 0);
565 		if (rc)
566 			goto out_free;
567 	}
568 
569 	for (r = 0; r < CXL_IRQ_RANGES; r++) {
570 		for (i = 0; i < ctx->irqs.range[r]; i++) {
571 			if (r == 0 && i == 0) {
572 				elem->pslVirtualIsn = cpu_to_be32(ctx->irqs.offset[0]);
573 			} else {
574 				idx = ctx->irqs.offset[r] + i - adapter->guest->irq_base_offset;
575 				elem->applicationVirtualIsnBitmap[idx / 8] |= 0x80 >> (idx % 8);
576 			}
577 		}
578 	}
579 	elem->common.amr = cpu_to_be64(amr);
580 	elem->common.wed = cpu_to_be64(wed);
581 
582 	disable_afu_irqs(ctx);
583 
584 	rc = cxl_h_attach_process(ctx->afu->guest->handle, elem,
585 				&ctx->process_token, &mmio_addr, &mmio_size);
586 	if (rc == H_SUCCESS) {
587 		if (ctx->master || !ctx->afu->pp_psa) {
588 			ctx->psn_phys = ctx->afu->psn_phys;
589 			ctx->psn_size = ctx->afu->adapter->ps_size;
590 		} else {
591 			ctx->psn_phys = mmio_addr;
592 			ctx->psn_size = mmio_size;
593 		}
594 		if (ctx->afu->pp_psa && mmio_size &&
595 			ctx->afu->pp_size == 0) {
596 			/*
597 			 * There's no property in the device tree to read the
598 			 * pp_size. We only find out at the 1st attach.
599 			 * Compared to bare-metal, it is too late and we
600 			 * should really lock here. However, on powerVM,
601 			 * pp_size is really only used to display in /sys.
602 			 * Being discussed with pHyp for their next release.
603 			 */
604 			ctx->afu->pp_size = mmio_size;
605 		}
606 		/* from PAPR: process element is bytes 4-7 of process token */
607 		ctx->external_pe = ctx->process_token & 0xFFFFFFFF;
608 		pr_devel("CXL pe=%i is known as %i for pHyp, mmio_size=%#llx",
609 			ctx->pe, ctx->external_pe, ctx->psn_size);
610 		ctx->pe_inserted = true;
611 		enable_afu_irqs(ctx);
612 	}
613 
614 out_free:
615 	free_page((u64)elem);
616 	return rc;
617 }
618 
619 static int guest_attach_process(struct cxl_context *ctx, bool kernel, u64 wed, u64 amr)
620 {
621 	pr_devel("in %s\n", __func__);
622 
623 	if (ctx->real_mode)
624 		return -EPERM;
625 
626 	ctx->kernel = kernel;
627 	if (ctx->afu->current_mode == CXL_MODE_DIRECTED)
628 		return attach_afu_directed(ctx, wed, amr);
629 
630 	/* dedicated mode not supported on FW840 */
631 
632 	return -EINVAL;
633 }
634 
635 static int detach_afu_directed(struct cxl_context *ctx)
636 {
637 	if (!ctx->pe_inserted)
638 		return 0;
639 	if (cxl_h_detach_process(ctx->afu->guest->handle, ctx->process_token))
640 		return -1;
641 	return 0;
642 }
643 
644 static int guest_detach_process(struct cxl_context *ctx)
645 {
646 	pr_devel("in %s\n", __func__);
647 	trace_cxl_detach(ctx);
648 
649 	if (!cxl_ops->link_ok(ctx->afu->adapter, ctx->afu))
650 		return -EIO;
651 
652 	if (ctx->afu->current_mode == CXL_MODE_DIRECTED)
653 		return detach_afu_directed(ctx);
654 
655 	return -EINVAL;
656 }
657 
658 static void guest_release_afu(struct device *dev)
659 {
660 	struct cxl_afu *afu = to_cxl_afu(dev);
661 
662 	pr_devel("%s\n", __func__);
663 
664 	idr_destroy(&afu->contexts_idr);
665 
666 	kfree(afu->guest);
667 	kfree(afu);
668 }
669 
670 ssize_t cxl_guest_read_afu_vpd(struct cxl_afu *afu, void *buf, size_t len)
671 {
672 	return guest_collect_vpd(NULL, afu, buf, len);
673 }
674 
675 #define ERR_BUFF_MAX_COPY_SIZE PAGE_SIZE
676 static ssize_t guest_afu_read_err_buffer(struct cxl_afu *afu, char *buf,
677 					loff_t off, size_t count)
678 {
679 	void *tbuf = NULL;
680 	int rc = 0;
681 
682 	tbuf = (void *) get_zeroed_page(GFP_KERNEL);
683 	if (!tbuf)
684 		return -ENOMEM;
685 
686 	rc = cxl_h_get_afu_err(afu->guest->handle,
687 			       off & 0x7,
688 			       virt_to_phys(tbuf),
689 			       count);
690 	if (rc)
691 		goto err;
692 
693 	if (count > ERR_BUFF_MAX_COPY_SIZE)
694 		count = ERR_BUFF_MAX_COPY_SIZE - (off & 0x7);
695 	memcpy(buf, tbuf, count);
696 err:
697 	free_page((u64)tbuf);
698 
699 	return rc;
700 }
701 
702 static int guest_afu_check_and_enable(struct cxl_afu *afu)
703 {
704 	return 0;
705 }
706 
707 static bool guest_support_attributes(const char *attr_name,
708 				     enum cxl_attrs type)
709 {
710 	switch (type) {
711 	case CXL_ADAPTER_ATTRS:
712 		if ((strcmp(attr_name, "base_image") == 0) ||
713 			(strcmp(attr_name, "load_image_on_perst") == 0) ||
714 			(strcmp(attr_name, "perst_reloads_same_image") == 0) ||
715 			(strcmp(attr_name, "image_loaded") == 0))
716 			return false;
717 		break;
718 	case CXL_AFU_MASTER_ATTRS:
719 		if ((strcmp(attr_name, "pp_mmio_off") == 0))
720 			return false;
721 		break;
722 	case CXL_AFU_ATTRS:
723 		break;
724 	default:
725 		break;
726 	}
727 
728 	return true;
729 }
730 
731 static int activate_afu_directed(struct cxl_afu *afu)
732 {
733 	int rc;
734 
735 	dev_info(&afu->dev, "Activating AFU(%d) directed mode\n", afu->slice);
736 
737 	afu->current_mode = CXL_MODE_DIRECTED;
738 
739 	afu->num_procs = afu->max_procs_virtualised;
740 
741 	if ((rc = cxl_chardev_m_afu_add(afu)))
742 		return rc;
743 
744 	if ((rc = cxl_sysfs_afu_m_add(afu)))
745 		goto err;
746 
747 	if ((rc = cxl_chardev_s_afu_add(afu)))
748 		goto err1;
749 
750 	return 0;
751 err1:
752 	cxl_sysfs_afu_m_remove(afu);
753 err:
754 	cxl_chardev_afu_remove(afu);
755 	return rc;
756 }
757 
758 static int guest_afu_activate_mode(struct cxl_afu *afu, int mode)
759 {
760 	if (!mode)
761 		return 0;
762 	if (!(mode & afu->modes_supported))
763 		return -EINVAL;
764 
765 	if (mode == CXL_MODE_DIRECTED)
766 		return activate_afu_directed(afu);
767 
768 	if (mode == CXL_MODE_DEDICATED)
769 		dev_err(&afu->dev, "Dedicated mode not supported\n");
770 
771 	return -EINVAL;
772 }
773 
774 static int deactivate_afu_directed(struct cxl_afu *afu)
775 {
776 	dev_info(&afu->dev, "Deactivating AFU(%d) directed mode\n", afu->slice);
777 
778 	afu->current_mode = 0;
779 	afu->num_procs = 0;
780 
781 	cxl_sysfs_afu_m_remove(afu);
782 	cxl_chardev_afu_remove(afu);
783 
784 	cxl_ops->afu_reset(afu);
785 
786 	return 0;
787 }
788 
789 static int guest_afu_deactivate_mode(struct cxl_afu *afu, int mode)
790 {
791 	if (!mode)
792 		return 0;
793 	if (!(mode & afu->modes_supported))
794 		return -EINVAL;
795 
796 	if (mode == CXL_MODE_DIRECTED)
797 		return deactivate_afu_directed(afu);
798 	return 0;
799 }
800 
801 static int guest_afu_reset(struct cxl_afu *afu)
802 {
803 	pr_devel("AFU(%d) reset request\n", afu->slice);
804 	return cxl_h_reset_afu(afu->guest->handle);
805 }
806 
807 static int guest_map_slice_regs(struct cxl_afu *afu)
808 {
809 	if (!(afu->p2n_mmio = ioremap(afu->guest->p2n_phys, afu->guest->p2n_size))) {
810 		dev_err(&afu->dev, "Error mapping AFU(%d) MMIO regions\n",
811 			afu->slice);
812 		return -ENOMEM;
813 	}
814 	return 0;
815 }
816 
817 static void guest_unmap_slice_regs(struct cxl_afu *afu)
818 {
819 	if (afu->p2n_mmio)
820 		iounmap(afu->p2n_mmio);
821 }
822 
823 static int afu_update_state(struct cxl_afu *afu)
824 {
825 	int rc, cur_state;
826 
827 	rc = afu_read_error_state(afu, &cur_state);
828 	if (rc)
829 		return rc;
830 
831 	if (afu->guest->previous_state == cur_state)
832 		return 0;
833 
834 	pr_devel("AFU(%d) update state to %#x\n", afu->slice, cur_state);
835 
836 	switch (cur_state) {
837 	case H_STATE_NORMAL:
838 		afu->guest->previous_state = cur_state;
839 		break;
840 
841 	case H_STATE_DISABLE:
842 		pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
843 				pci_channel_io_frozen);
844 
845 		cxl_context_detach_all(afu);
846 		if ((rc = cxl_ops->afu_reset(afu)))
847 			pr_devel("reset hcall failed %d\n", rc);
848 
849 		rc = afu_read_error_state(afu, &cur_state);
850 		if (!rc && cur_state == H_STATE_NORMAL) {
851 			pci_error_handlers(afu, CXL_SLOT_RESET_EVENT,
852 					pci_channel_io_normal);
853 			pci_error_handlers(afu, CXL_RESUME_EVENT, 0);
854 		}
855 		afu->guest->previous_state = 0;
856 		break;
857 
858 	case H_STATE_TEMP_UNAVAILABLE:
859 		afu->guest->previous_state = cur_state;
860 		break;
861 
862 	case H_STATE_PERM_UNAVAILABLE:
863 		dev_err(&afu->dev, "AFU is in permanent error state\n");
864 		pci_error_handlers(afu, CXL_ERROR_DETECTED_EVENT,
865 				pci_channel_io_perm_failure);
866 		afu->guest->previous_state = cur_state;
867 		break;
868 
869 	default:
870 		pr_err("Unexpected AFU(%d) error state: %#x\n",
871 		       afu->slice, cur_state);
872 		return -EINVAL;
873 	}
874 
875 	return rc;
876 }
877 
878 static void afu_handle_errstate(struct work_struct *work)
879 {
880 	struct cxl_afu_guest *afu_guest =
881 		container_of(to_delayed_work(work), struct cxl_afu_guest, work_err);
882 
883 	if (!afu_update_state(afu_guest->parent) &&
884 	    afu_guest->previous_state == H_STATE_PERM_UNAVAILABLE)
885 		return;
886 
887 	if (afu_guest->handle_err == true)
888 		schedule_delayed_work(&afu_guest->work_err,
889 				      msecs_to_jiffies(3000));
890 }
891 
892 static bool guest_link_ok(struct cxl *cxl, struct cxl_afu *afu)
893 {
894 	int state;
895 
896 	if (afu && (!afu_read_error_state(afu, &state))) {
897 		if (state == H_STATE_NORMAL)
898 			return true;
899 	}
900 
901 	return false;
902 }
903 
904 static int afu_properties_look_ok(struct cxl_afu *afu)
905 {
906 	if (afu->pp_irqs < 0) {
907 		dev_err(&afu->dev, "Unexpected per-process minimum interrupt value\n");
908 		return -EINVAL;
909 	}
910 
911 	if (afu->max_procs_virtualised < 1) {
912 		dev_err(&afu->dev, "Unexpected max number of processes virtualised value\n");
913 		return -EINVAL;
914 	}
915 
916 	if (afu->crs_len < 0) {
917 		dev_err(&afu->dev, "Unexpected configuration record size value\n");
918 		return -EINVAL;
919 	}
920 
921 	return 0;
922 }
923 
924 int cxl_guest_init_afu(struct cxl *adapter, int slice, struct device_node *afu_np)
925 {
926 	struct cxl_afu *afu;
927 	bool free = true;
928 	int rc;
929 
930 	pr_devel("in %s - AFU(%d)\n", __func__, slice);
931 	if (!(afu = cxl_alloc_afu(adapter, slice)))
932 		return -ENOMEM;
933 
934 	if (!(afu->guest = kzalloc(sizeof(struct cxl_afu_guest), GFP_KERNEL))) {
935 		kfree(afu);
936 		return -ENOMEM;
937 	}
938 
939 	if ((rc = dev_set_name(&afu->dev, "afu%i.%i",
940 					  adapter->adapter_num,
941 					  slice)))
942 		goto err1;
943 
944 	adapter->slices++;
945 
946 	if ((rc = cxl_of_read_afu_handle(afu, afu_np)))
947 		goto err1;
948 
949 	if ((rc = cxl_ops->afu_reset(afu)))
950 		goto err1;
951 
952 	if ((rc = cxl_of_read_afu_properties(afu, afu_np)))
953 		goto err1;
954 
955 	if ((rc = afu_properties_look_ok(afu)))
956 		goto err1;
957 
958 	if ((rc = guest_map_slice_regs(afu)))
959 		goto err1;
960 
961 	if ((rc = guest_register_serr_irq(afu)))
962 		goto err2;
963 
964 	/*
965 	 * After we call this function we must not free the afu directly, even
966 	 * if it returns an error!
967 	 */
968 	if ((rc = cxl_register_afu(afu)))
969 		goto err_put1;
970 
971 	if ((rc = cxl_sysfs_afu_add(afu)))
972 		goto err_put1;
973 
974 	/*
975 	 * pHyp doesn't expose the programming models supported by the
976 	 * AFU. pHyp currently only supports directed mode. If it adds
977 	 * dedicated mode later, this version of cxl has no way to
978 	 * detect it. So we'll initialize the driver, but the first
979 	 * attach will fail.
980 	 * Being discussed with pHyp to do better (likely new property)
981 	 */
982 	if (afu->max_procs_virtualised == 1)
983 		afu->modes_supported = CXL_MODE_DEDICATED;
984 	else
985 		afu->modes_supported = CXL_MODE_DIRECTED;
986 
987 	if ((rc = cxl_afu_select_best_mode(afu)))
988 		goto err_put2;
989 
990 	adapter->afu[afu->slice] = afu;
991 
992 	afu->enabled = true;
993 
994 	/*
995 	 * wake up the cpu periodically to check the state
996 	 * of the AFU using "afu" stored in the guest structure.
997 	 */
998 	afu->guest->parent = afu;
999 	afu->guest->handle_err = true;
1000 	INIT_DELAYED_WORK(&afu->guest->work_err, afu_handle_errstate);
1001 	schedule_delayed_work(&afu->guest->work_err, msecs_to_jiffies(1000));
1002 
1003 	if ((rc = cxl_pci_vphb_add(afu)))
1004 		dev_info(&afu->dev, "Can't register vPHB\n");
1005 
1006 	return 0;
1007 
1008 err_put2:
1009 	cxl_sysfs_afu_remove(afu);
1010 err_put1:
1011 	device_unregister(&afu->dev);
1012 	free = false;
1013 	guest_release_serr_irq(afu);
1014 err2:
1015 	guest_unmap_slice_regs(afu);
1016 err1:
1017 	if (free) {
1018 		kfree(afu->guest);
1019 		kfree(afu);
1020 	}
1021 	return rc;
1022 }
1023 
1024 void cxl_guest_remove_afu(struct cxl_afu *afu)
1025 {
1026 	pr_devel("in %s - AFU(%d)\n", __func__, afu->slice);
1027 
1028 	if (!afu)
1029 		return;
1030 
1031 	/* flush and stop pending job */
1032 	afu->guest->handle_err = false;
1033 	flush_delayed_work(&afu->guest->work_err);
1034 
1035 	cxl_pci_vphb_remove(afu);
1036 	cxl_sysfs_afu_remove(afu);
1037 
1038 	spin_lock(&afu->adapter->afu_list_lock);
1039 	afu->adapter->afu[afu->slice] = NULL;
1040 	spin_unlock(&afu->adapter->afu_list_lock);
1041 
1042 	cxl_context_detach_all(afu);
1043 	cxl_ops->afu_deactivate_mode(afu, afu->current_mode);
1044 	guest_release_serr_irq(afu);
1045 	guest_unmap_slice_regs(afu);
1046 
1047 	device_unregister(&afu->dev);
1048 }
1049 
1050 static void free_adapter(struct cxl *adapter)
1051 {
1052 	struct irq_avail *cur;
1053 	int i;
1054 
1055 	if (adapter->guest->irq_avail) {
1056 		for (i = 0; i < adapter->guest->irq_nranges; i++) {
1057 			cur = &adapter->guest->irq_avail[i];
1058 			kfree(cur->bitmap);
1059 		}
1060 		kfree(adapter->guest->irq_avail);
1061 	}
1062 	kfree(adapter->guest->status);
1063 	cxl_remove_adapter_nr(adapter);
1064 	kfree(adapter->guest);
1065 	kfree(adapter);
1066 }
1067 
1068 static int properties_look_ok(struct cxl *adapter)
1069 {
1070 	/* The absence of this property means that the operational
1071 	 * status is unknown or okay
1072 	 */
1073 	if (strlen(adapter->guest->status) &&
1074 	    strcmp(adapter->guest->status, "okay")) {
1075 		pr_err("ABORTING:Bad operational status of the device\n");
1076 		return -EINVAL;
1077 	}
1078 
1079 	return 0;
1080 }
1081 
1082 ssize_t cxl_guest_read_adapter_vpd(struct cxl *adapter, void *buf, size_t len)
1083 {
1084 	return guest_collect_vpd(adapter, NULL, buf, len);
1085 }
1086 
1087 void cxl_guest_remove_adapter(struct cxl *adapter)
1088 {
1089 	pr_devel("in %s\n", __func__);
1090 
1091 	cxl_sysfs_adapter_remove(adapter);
1092 
1093 	cxl_guest_remove_chardev(adapter);
1094 	device_unregister(&adapter->dev);
1095 }
1096 
1097 static void release_adapter(struct device *dev)
1098 {
1099 	free_adapter(to_cxl_adapter(dev));
1100 }
1101 
1102 struct cxl *cxl_guest_init_adapter(struct device_node *np, struct platform_device *pdev)
1103 {
1104 	struct cxl *adapter;
1105 	bool free = true;
1106 	int rc;
1107 
1108 	if (!(adapter = cxl_alloc_adapter()))
1109 		return ERR_PTR(-ENOMEM);
1110 
1111 	if (!(adapter->guest = kzalloc(sizeof(struct cxl_guest), GFP_KERNEL))) {
1112 		free_adapter(adapter);
1113 		return ERR_PTR(-ENOMEM);
1114 	}
1115 
1116 	adapter->slices = 0;
1117 	adapter->guest->pdev = pdev;
1118 	adapter->dev.parent = &pdev->dev;
1119 	adapter->dev.release = release_adapter;
1120 	dev_set_drvdata(&pdev->dev, adapter);
1121 
1122 	/*
1123 	 * Hypervisor controls PSL timebase initialization (p1 register).
1124 	 * On FW840, PSL is initialized.
1125 	 */
1126 	adapter->psl_timebase_synced = true;
1127 
1128 	if ((rc = cxl_of_read_adapter_handle(adapter, np)))
1129 		goto err1;
1130 
1131 	if ((rc = cxl_of_read_adapter_properties(adapter, np)))
1132 		goto err1;
1133 
1134 	if ((rc = properties_look_ok(adapter)))
1135 		goto err1;
1136 
1137 	if ((rc = cxl_guest_add_chardev(adapter)))
1138 		goto err1;
1139 
1140 	/*
1141 	 * After we call this function we must not free the adapter directly,
1142 	 * even if it returns an error!
1143 	 */
1144 	if ((rc = cxl_register_adapter(adapter)))
1145 		goto err_put1;
1146 
1147 	if ((rc = cxl_sysfs_adapter_add(adapter)))
1148 		goto err_put1;
1149 
1150 	return adapter;
1151 
1152 err_put1:
1153 	device_unregister(&adapter->dev);
1154 	free = false;
1155 	cxl_guest_remove_chardev(adapter);
1156 err1:
1157 	if (free)
1158 		free_adapter(adapter);
1159 	return ERR_PTR(rc);
1160 }
1161 
1162 void cxl_guest_reload_module(struct cxl *adapter)
1163 {
1164 	struct platform_device *pdev;
1165 
1166 	pdev = adapter->guest->pdev;
1167 	cxl_guest_remove_adapter(adapter);
1168 
1169 	cxl_of_probe(pdev);
1170 }
1171 
1172 const struct cxl_backend_ops cxl_guest_ops = {
1173 	.module = THIS_MODULE,
1174 	.adapter_reset = guest_reset,
1175 	.alloc_one_irq = guest_alloc_one_irq,
1176 	.release_one_irq = guest_release_one_irq,
1177 	.alloc_irq_ranges = guest_alloc_irq_ranges,
1178 	.release_irq_ranges = guest_release_irq_ranges,
1179 	.setup_irq = NULL,
1180 	.handle_psl_slice_error = guest_handle_psl_slice_error,
1181 	.psl_interrupt = guest_psl_irq,
1182 	.ack_irq = guest_ack_irq,
1183 	.attach_process = guest_attach_process,
1184 	.detach_process = guest_detach_process,
1185 	.update_ivtes = NULL,
1186 	.support_attributes = guest_support_attributes,
1187 	.link_ok = guest_link_ok,
1188 	.release_afu = guest_release_afu,
1189 	.afu_read_err_buffer = guest_afu_read_err_buffer,
1190 	.afu_check_and_enable = guest_afu_check_and_enable,
1191 	.afu_activate_mode = guest_afu_activate_mode,
1192 	.afu_deactivate_mode = guest_afu_deactivate_mode,
1193 	.afu_reset = guest_afu_reset,
1194 	.afu_cr_read8 = guest_afu_cr_read8,
1195 	.afu_cr_read16 = guest_afu_cr_read16,
1196 	.afu_cr_read32 = guest_afu_cr_read32,
1197 	.afu_cr_read64 = guest_afu_cr_read64,
1198 	.afu_cr_write8 = guest_afu_cr_write8,
1199 	.afu_cr_write16 = guest_afu_cr_write16,
1200 	.afu_cr_write32 = guest_afu_cr_write32,
1201 	.read_adapter_vpd = cxl_guest_read_adapter_vpd,
1202 };
1203