xref: /linux/drivers/gpu/drm/panfrost/panfrost_mmu.c (revision eb01fe7abbe2d0b38824d2a93fdb4cc3eaf2ccc1)
1 // SPDX-License-Identifier: GPL-2.0
2 /* Copyright 2019 Linaro, Ltd, Rob Herring <robh@kernel.org> */
3 
4 #include <drm/panfrost_drm.h>
5 
6 #include <linux/atomic.h>
7 #include <linux/bitfield.h>
8 #include <linux/delay.h>
9 #include <linux/dma-mapping.h>
10 #include <linux/interrupt.h>
11 #include <linux/io.h>
12 #include <linux/iopoll.h>
13 #include <linux/io-pgtable.h>
14 #include <linux/iommu.h>
15 #include <linux/platform_device.h>
16 #include <linux/pm_runtime.h>
17 #include <linux/shmem_fs.h>
18 #include <linux/sizes.h>
19 
20 #include "panfrost_device.h"
21 #include "panfrost_mmu.h"
22 #include "panfrost_gem.h"
23 #include "panfrost_features.h"
24 #include "panfrost_regs.h"
25 
/*
 * MMIO accessors for the MMU registers: 'reg' is added to dev->iomem to form
 * the address handed to writel()/readl(). The 'dev' and 'reg' arguments are
 * parenthesized so that compound expressions expand as the caller intends.
 */
#define mmu_write(dev, reg, data) writel(data, (dev)->iomem + (reg))
#define mmu_read(dev, reg) readl((dev)->iomem + (reg))
28 
29 static int wait_ready(struct panfrost_device *pfdev, u32 as_nr)
30 {
31 	int ret;
32 	u32 val;
33 
34 	/* Wait for the MMU status to indicate there is no active command, in
35 	 * case one is pending. */
36 	ret = readl_relaxed_poll_timeout_atomic(pfdev->iomem + AS_STATUS(as_nr),
37 		val, !(val & AS_STATUS_AS_ACTIVE), 10, 100000);
38 
39 	if (ret) {
40 		/* The GPU hung, let's trigger a reset */
41 		panfrost_device_schedule_reset(pfdev);
42 		dev_err(pfdev->dev, "AS_ACTIVE bit stuck\n");
43 	}
44 
45 	return ret;
46 }
47 
48 static int write_cmd(struct panfrost_device *pfdev, u32 as_nr, u32 cmd)
49 {
50 	int status;
51 
52 	/* write AS_COMMAND when MMU is ready to accept another command */
53 	status = wait_ready(pfdev, as_nr);
54 	if (!status)
55 		mmu_write(pfdev, AS_COMMAND(as_nr), cmd);
56 
57 	return status;
58 }
59 
60 static void lock_region(struct panfrost_device *pfdev, u32 as_nr,
61 			u64 region_start, u64 size)
62 {
63 	u8 region_width;
64 	u64 region;
65 	u64 region_end = region_start + size;
66 
67 	if (!size)
68 		return;
69 
70 	/*
71 	 * The locked region is a naturally aligned power of 2 block encoded as
72 	 * log2 minus(1).
73 	 * Calculate the desired start/end and look for the highest bit which
74 	 * differs. The smallest naturally aligned block must include this bit
75 	 * change, the desired region starts with this bit (and subsequent bits)
76 	 * zeroed and ends with the bit (and subsequent bits) set to one.
77 	 */
78 	region_width = max(fls64(region_start ^ (region_end - 1)),
79 			   const_ilog2(AS_LOCK_REGION_MIN_SIZE)) - 1;
80 
81 	/*
82 	 * Mask off the low bits of region_start (which would be ignored by
83 	 * the hardware anyway)
84 	 */
85 	region_start &= GENMASK_ULL(63, region_width);
86 
87 	region = region_width | region_start;
88 
89 	/* Lock the region that needs to be updated */
90 	mmu_write(pfdev, AS_LOCKADDR_LO(as_nr), lower_32_bits(region));
91 	mmu_write(pfdev, AS_LOCKADDR_HI(as_nr), upper_32_bits(region));
92 	write_cmd(pfdev, as_nr, AS_COMMAND_LOCK);
93 }
94 
95 
96 static int mmu_hw_do_operation_locked(struct panfrost_device *pfdev, int as_nr,
97 				      u64 iova, u64 size, u32 op)
98 {
99 	if (as_nr < 0)
100 		return 0;
101 
102 	if (op != AS_COMMAND_UNLOCK)
103 		lock_region(pfdev, as_nr, iova, size);
104 
105 	/* Run the MMU operation */
106 	write_cmd(pfdev, as_nr, op);
107 
108 	/* Wait for the flush to complete */
109 	return wait_ready(pfdev, as_nr);
110 }
111 
112 static int mmu_hw_do_operation(struct panfrost_device *pfdev,
113 			       struct panfrost_mmu *mmu,
114 			       u64 iova, u64 size, u32 op)
115 {
116 	int ret;
117 
118 	spin_lock(&pfdev->as_lock);
119 	ret = mmu_hw_do_operation_locked(pfdev, mmu->as, iova, size, op);
120 	spin_unlock(&pfdev->as_lock);
121 	return ret;
122 }
123 
124 static void panfrost_mmu_enable(struct panfrost_device *pfdev, struct panfrost_mmu *mmu)
125 {
126 	int as_nr = mmu->as;
127 	struct io_pgtable_cfg *cfg = &mmu->pgtbl_cfg;
128 	u64 transtab = cfg->arm_mali_lpae_cfg.transtab;
129 	u64 memattr = cfg->arm_mali_lpae_cfg.memattr;
130 
131 	mmu_hw_do_operation_locked(pfdev, as_nr, 0, ~0ULL, AS_COMMAND_FLUSH_MEM);
132 
133 	mmu_write(pfdev, AS_TRANSTAB_LO(as_nr), lower_32_bits(transtab));
134 	mmu_write(pfdev, AS_TRANSTAB_HI(as_nr), upper_32_bits(transtab));
135 
136 	/* Need to revisit mem attrs.
137 	 * NC is the default, Mali driver is inner WT.
138 	 */
139 	mmu_write(pfdev, AS_MEMATTR_LO(as_nr), lower_32_bits(memattr));
140 	mmu_write(pfdev, AS_MEMATTR_HI(as_nr), upper_32_bits(memattr));
141 
142 	write_cmd(pfdev, as_nr, AS_COMMAND_UPDATE);
143 }
144 
145 static void panfrost_mmu_disable(struct panfrost_device *pfdev, u32 as_nr)
146 {
147 	mmu_hw_do_operation_locked(pfdev, as_nr, 0, ~0ULL, AS_COMMAND_FLUSH_MEM);
148 
149 	mmu_write(pfdev, AS_TRANSTAB_LO(as_nr), 0);
150 	mmu_write(pfdev, AS_TRANSTAB_HI(as_nr), 0);
151 
152 	mmu_write(pfdev, AS_MEMATTR_LO(as_nr), 0);
153 	mmu_write(pfdev, AS_MEMATTR_HI(as_nr), 0);
154 
155 	write_cmd(pfdev, as_nr, AS_COMMAND_UPDATE);
156 }
157 
158 u32 panfrost_mmu_as_get(struct panfrost_device *pfdev, struct panfrost_mmu *mmu)
159 {
160 	int as;
161 
162 	spin_lock(&pfdev->as_lock);
163 
164 	as = mmu->as;
165 	if (as >= 0) {
166 		int en = atomic_inc_return(&mmu->as_count);
167 		u32 mask = BIT(as) | BIT(16 + as);
168 
169 		/*
170 		 * AS can be retained by active jobs or a perfcnt context,
171 		 * hence the '+ 1' here.
172 		 */
173 		WARN_ON(en >= (NUM_JOB_SLOTS + 1));
174 
175 		list_move(&mmu->list, &pfdev->as_lru_list);
176 
177 		if (pfdev->as_faulty_mask & mask) {
178 			/* Unhandled pagefault on this AS, the MMU was
179 			 * disabled. We need to re-enable the MMU after
180 			 * clearing+unmasking the AS interrupts.
181 			 */
182 			mmu_write(pfdev, MMU_INT_CLEAR, mask);
183 			mmu_write(pfdev, MMU_INT_MASK, ~pfdev->as_faulty_mask);
184 			pfdev->as_faulty_mask &= ~mask;
185 			panfrost_mmu_enable(pfdev, mmu);
186 		}
187 
188 		goto out;
189 	}
190 
191 	/* Check for a free AS */
192 	as = ffz(pfdev->as_alloc_mask);
193 	if (!(BIT(as) & pfdev->features.as_present)) {
194 		struct panfrost_mmu *lru_mmu;
195 
196 		list_for_each_entry_reverse(lru_mmu, &pfdev->as_lru_list, list) {
197 			if (!atomic_read(&lru_mmu->as_count))
198 				break;
199 		}
200 		WARN_ON(&lru_mmu->list == &pfdev->as_lru_list);
201 
202 		list_del_init(&lru_mmu->list);
203 		as = lru_mmu->as;
204 
205 		WARN_ON(as < 0);
206 		lru_mmu->as = -1;
207 	}
208 
209 	/* Assign the free or reclaimed AS to the FD */
210 	mmu->as = as;
211 	set_bit(as, &pfdev->as_alloc_mask);
212 	atomic_set(&mmu->as_count, 1);
213 	list_add(&mmu->list, &pfdev->as_lru_list);
214 
215 	dev_dbg(pfdev->dev, "Assigned AS%d to mmu %p, alloc_mask=%lx", as, mmu, pfdev->as_alloc_mask);
216 
217 	panfrost_mmu_enable(pfdev, mmu);
218 
219 out:
220 	spin_unlock(&pfdev->as_lock);
221 	return as;
222 }
223 
224 void panfrost_mmu_as_put(struct panfrost_device *pfdev, struct panfrost_mmu *mmu)
225 {
226 	atomic_dec(&mmu->as_count);
227 	WARN_ON(atomic_read(&mmu->as_count) < 0);
228 }
229 
230 void panfrost_mmu_reset(struct panfrost_device *pfdev)
231 {
232 	struct panfrost_mmu *mmu, *mmu_tmp;
233 
234 	clear_bit(PANFROST_COMP_BIT_MMU, pfdev->is_suspended);
235 
236 	spin_lock(&pfdev->as_lock);
237 
238 	pfdev->as_alloc_mask = 0;
239 	pfdev->as_faulty_mask = 0;
240 
241 	list_for_each_entry_safe(mmu, mmu_tmp, &pfdev->as_lru_list, list) {
242 		mmu->as = -1;
243 		atomic_set(&mmu->as_count, 0);
244 		list_del_init(&mmu->list);
245 	}
246 
247 	spin_unlock(&pfdev->as_lock);
248 
249 	mmu_write(pfdev, MMU_INT_CLEAR, ~0);
250 	mmu_write(pfdev, MMU_INT_MASK, ~0);
251 }
252 
253 static size_t get_pgsize(u64 addr, size_t size, size_t *count)
254 {
255 	/*
256 	 * io-pgtable only operates on multiple pages within a single table
257 	 * entry, so we need to split at boundaries of the table size, i.e.
258 	 * the next block size up. The distance from address A to the next
259 	 * boundary of block size B is logically B - A % B, but in unsigned
260 	 * two's complement where B is a power of two we get the equivalence
261 	 * B - A % B == (B - A) % B == (n * B - A) % B, and choose n = 0 :)
262 	 */
263 	size_t blk_offset = -addr % SZ_2M;
264 
265 	if (blk_offset || size < SZ_2M) {
266 		*count = min_not_zero(blk_offset, size) / SZ_4K;
267 		return SZ_4K;
268 	}
269 	blk_offset = -addr % SZ_1G ?: SZ_1G;
270 	*count = min(blk_offset, size) / SZ_2M;
271 	return SZ_2M;
272 }
273 
274 static void panfrost_mmu_flush_range(struct panfrost_device *pfdev,
275 				     struct panfrost_mmu *mmu,
276 				     u64 iova, u64 size)
277 {
278 	if (mmu->as < 0)
279 		return;
280 
281 	pm_runtime_get_noresume(pfdev->dev);
282 
283 	/* Flush the PTs only if we're already awake */
284 	if (pm_runtime_active(pfdev->dev))
285 		mmu_hw_do_operation(pfdev, mmu, iova, size, AS_COMMAND_FLUSH_PT);
286 
287 	pm_runtime_put_autosuspend(pfdev->dev);
288 }
289 
290 static int mmu_map_sg(struct panfrost_device *pfdev, struct panfrost_mmu *mmu,
291 		      u64 iova, int prot, struct sg_table *sgt)
292 {
293 	unsigned int count;
294 	struct scatterlist *sgl;
295 	struct io_pgtable_ops *ops = mmu->pgtbl_ops;
296 	u64 start_iova = iova;
297 
298 	for_each_sgtable_dma_sg(sgt, sgl, count) {
299 		unsigned long paddr = sg_dma_address(sgl);
300 		size_t len = sg_dma_len(sgl);
301 
302 		dev_dbg(pfdev->dev, "map: as=%d, iova=%llx, paddr=%lx, len=%zx", mmu->as, iova, paddr, len);
303 
304 		while (len) {
305 			size_t pgcount, mapped = 0;
306 			size_t pgsize = get_pgsize(iova | paddr, len, &pgcount);
307 
308 			ops->map_pages(ops, iova, paddr, pgsize, pgcount, prot,
309 				       GFP_KERNEL, &mapped);
310 			/* Don't get stuck if things have gone wrong */
311 			mapped = max(mapped, pgsize);
312 			iova += mapped;
313 			paddr += mapped;
314 			len -= mapped;
315 		}
316 	}
317 
318 	panfrost_mmu_flush_range(pfdev, mmu, start_iova, iova - start_iova);
319 
320 	return 0;
321 }
322 
323 int panfrost_mmu_map(struct panfrost_gem_mapping *mapping)
324 {
325 	struct panfrost_gem_object *bo = mapping->obj;
326 	struct drm_gem_shmem_object *shmem = &bo->base;
327 	struct drm_gem_object *obj = &shmem->base;
328 	struct panfrost_device *pfdev = to_panfrost_device(obj->dev);
329 	struct sg_table *sgt;
330 	int prot = IOMMU_READ | IOMMU_WRITE;
331 
332 	if (WARN_ON(mapping->active))
333 		return 0;
334 
335 	if (bo->noexec)
336 		prot |= IOMMU_NOEXEC;
337 
338 	sgt = drm_gem_shmem_get_pages_sgt(shmem);
339 	if (WARN_ON(IS_ERR(sgt)))
340 		return PTR_ERR(sgt);
341 
342 	mmu_map_sg(pfdev, mapping->mmu, mapping->mmnode.start << PAGE_SHIFT,
343 		   prot, sgt);
344 	mapping->active = true;
345 
346 	return 0;
347 }
348 
349 void panfrost_mmu_unmap(struct panfrost_gem_mapping *mapping)
350 {
351 	struct panfrost_gem_object *bo = mapping->obj;
352 	struct drm_gem_object *obj = &bo->base.base;
353 	struct panfrost_device *pfdev = to_panfrost_device(obj->dev);
354 	struct io_pgtable_ops *ops = mapping->mmu->pgtbl_ops;
355 	u64 iova = mapping->mmnode.start << PAGE_SHIFT;
356 	size_t len = mapping->mmnode.size << PAGE_SHIFT;
357 	size_t unmapped_len = 0;
358 
359 	if (WARN_ON(!mapping->active))
360 		return;
361 
362 	dev_dbg(pfdev->dev, "unmap: as=%d, iova=%llx, len=%zx",
363 		mapping->mmu->as, iova, len);
364 
365 	while (unmapped_len < len) {
366 		size_t unmapped_page, pgcount;
367 		size_t pgsize = get_pgsize(iova, len - unmapped_len, &pgcount);
368 
369 		if (bo->is_heap)
370 			pgcount = 1;
371 		if (!bo->is_heap || ops->iova_to_phys(ops, iova)) {
372 			unmapped_page = ops->unmap_pages(ops, iova, pgsize, pgcount, NULL);
373 			WARN_ON(unmapped_page != pgsize * pgcount);
374 		}
375 		iova += pgsize * pgcount;
376 		unmapped_len += pgsize * pgcount;
377 	}
378 
379 	panfrost_mmu_flush_range(pfdev, mapping->mmu,
380 				 mapping->mmnode.start << PAGE_SHIFT, len);
381 	mapping->active = false;
382 }
383 
/* io-pgtable .tlb_flush_all callback: intentionally does nothing. */
static void mmu_tlb_inv_context_s1(void *cookie)
{
}
386 
/*
 * TLB sync hook, currently a no-op.
 *
 * TODO: Wait 1000 GPU cycles for HW_ISSUE_6367/T60X (@cookie would be the
 * struct panfrost_mmu to act on).
 */
static void mmu_tlb_sync_context(void *cookie)
{
}
392 
393 static void mmu_tlb_flush_walk(unsigned long iova, size_t size, size_t granule,
394 			       void *cookie)
395 {
396 	mmu_tlb_sync_context(cookie);
397 }
398 
399 static const struct iommu_flush_ops mmu_tlb_ops = {
400 	.tlb_flush_all	= mmu_tlb_inv_context_s1,
401 	.tlb_flush_walk = mmu_tlb_flush_walk,
402 };
403 
404 static struct panfrost_gem_mapping *
405 addr_to_mapping(struct panfrost_device *pfdev, int as, u64 addr)
406 {
407 	struct panfrost_gem_mapping *mapping = NULL;
408 	struct drm_mm_node *node;
409 	u64 offset = addr >> PAGE_SHIFT;
410 	struct panfrost_mmu *mmu;
411 
412 	spin_lock(&pfdev->as_lock);
413 	list_for_each_entry(mmu, &pfdev->as_lru_list, list) {
414 		if (as == mmu->as)
415 			goto found_mmu;
416 	}
417 	goto out;
418 
419 found_mmu:
420 
421 	spin_lock(&mmu->mm_lock);
422 
423 	drm_mm_for_each_node(node, &mmu->mm) {
424 		if (offset >= node->start &&
425 		    offset < (node->start + node->size)) {
426 			mapping = drm_mm_node_to_panfrost_mapping(node);
427 
428 			kref_get(&mapping->refcount);
429 			break;
430 		}
431 	}
432 
433 	spin_unlock(&mmu->mm_lock);
434 out:
435 	spin_unlock(&pfdev->as_lock);
436 	return mapping;
437 }
438 
439 #define NUM_FAULT_PAGES (SZ_2M / PAGE_SIZE)
440 
441 static int panfrost_mmu_map_fault_addr(struct panfrost_device *pfdev, int as,
442 				       u64 addr)
443 {
444 	int ret, i;
445 	struct panfrost_gem_mapping *bomapping;
446 	struct panfrost_gem_object *bo;
447 	struct address_space *mapping;
448 	struct drm_gem_object *obj;
449 	pgoff_t page_offset;
450 	struct sg_table *sgt;
451 	struct page **pages;
452 
453 	bomapping = addr_to_mapping(pfdev, as, addr);
454 	if (!bomapping)
455 		return -ENOENT;
456 
457 	bo = bomapping->obj;
458 	if (!bo->is_heap) {
459 		dev_WARN(pfdev->dev, "matching BO is not heap type (GPU VA = %llx)",
460 			 bomapping->mmnode.start << PAGE_SHIFT);
461 		ret = -EINVAL;
462 		goto err_bo;
463 	}
464 	WARN_ON(bomapping->mmu->as != as);
465 
466 	/* Assume 2MB alignment and size multiple */
467 	addr &= ~((u64)SZ_2M - 1);
468 	page_offset = addr >> PAGE_SHIFT;
469 	page_offset -= bomapping->mmnode.start;
470 
471 	obj = &bo->base.base;
472 
473 	dma_resv_lock(obj->resv, NULL);
474 
475 	if (!bo->base.pages) {
476 		bo->sgts = kvmalloc_array(bo->base.base.size / SZ_2M,
477 				     sizeof(struct sg_table), GFP_KERNEL | __GFP_ZERO);
478 		if (!bo->sgts) {
479 			ret = -ENOMEM;
480 			goto err_unlock;
481 		}
482 
483 		pages = kvmalloc_array(bo->base.base.size >> PAGE_SHIFT,
484 				       sizeof(struct page *), GFP_KERNEL | __GFP_ZERO);
485 		if (!pages) {
486 			kvfree(bo->sgts);
487 			bo->sgts = NULL;
488 			ret = -ENOMEM;
489 			goto err_unlock;
490 		}
491 		bo->base.pages = pages;
492 		bo->base.pages_use_count = 1;
493 	} else {
494 		pages = bo->base.pages;
495 		if (pages[page_offset]) {
496 			/* Pages are already mapped, bail out. */
497 			goto out;
498 		}
499 	}
500 
501 	mapping = bo->base.base.filp->f_mapping;
502 	mapping_set_unevictable(mapping);
503 
504 	for (i = page_offset; i < page_offset + NUM_FAULT_PAGES; i++) {
505 		pages[i] = shmem_read_mapping_page(mapping, i);
506 		if (IS_ERR(pages[i])) {
507 			ret = PTR_ERR(pages[i]);
508 			pages[i] = NULL;
509 			goto err_pages;
510 		}
511 	}
512 
513 	sgt = &bo->sgts[page_offset / (SZ_2M / PAGE_SIZE)];
514 	ret = sg_alloc_table_from_pages(sgt, pages + page_offset,
515 					NUM_FAULT_PAGES, 0, SZ_2M, GFP_KERNEL);
516 	if (ret)
517 		goto err_pages;
518 
519 	ret = dma_map_sgtable(pfdev->dev, sgt, DMA_BIDIRECTIONAL, 0);
520 	if (ret)
521 		goto err_map;
522 
523 	mmu_map_sg(pfdev, bomapping->mmu, addr,
524 		   IOMMU_WRITE | IOMMU_READ | IOMMU_NOEXEC, sgt);
525 
526 	bomapping->active = true;
527 	bo->heap_rss_size += SZ_2M;
528 
529 	dev_dbg(pfdev->dev, "mapped page fault @ AS%d %llx", as, addr);
530 
531 out:
532 	dma_resv_unlock(obj->resv);
533 
534 	panfrost_gem_mapping_put(bomapping);
535 
536 	return 0;
537 
538 err_map:
539 	sg_free_table(sgt);
540 err_pages:
541 	drm_gem_shmem_put_pages(&bo->base);
542 err_unlock:
543 	dma_resv_unlock(obj->resv);
544 err_bo:
545 	panfrost_gem_mapping_put(bomapping);
546 	return ret;
547 }
548 
549 static void panfrost_mmu_release_ctx(struct kref *kref)
550 {
551 	struct panfrost_mmu *mmu = container_of(kref, struct panfrost_mmu,
552 						refcount);
553 	struct panfrost_device *pfdev = mmu->pfdev;
554 
555 	spin_lock(&pfdev->as_lock);
556 	if (mmu->as >= 0) {
557 		pm_runtime_get_noresume(pfdev->dev);
558 		if (pm_runtime_active(pfdev->dev))
559 			panfrost_mmu_disable(pfdev, mmu->as);
560 		pm_runtime_put_autosuspend(pfdev->dev);
561 
562 		clear_bit(mmu->as, &pfdev->as_alloc_mask);
563 		clear_bit(mmu->as, &pfdev->as_in_use_mask);
564 		list_del(&mmu->list);
565 	}
566 	spin_unlock(&pfdev->as_lock);
567 
568 	free_io_pgtable_ops(mmu->pgtbl_ops);
569 	drm_mm_takedown(&mmu->mm);
570 	kfree(mmu);
571 }
572 
573 void panfrost_mmu_ctx_put(struct panfrost_mmu *mmu)
574 {
575 	kref_put(&mmu->refcount, panfrost_mmu_release_ctx);
576 }
577 
578 struct panfrost_mmu *panfrost_mmu_ctx_get(struct panfrost_mmu *mmu)
579 {
580 	kref_get(&mmu->refcount);
581 
582 	return mmu;
583 }
584 
585 #define PFN_4G		(SZ_4G >> PAGE_SHIFT)
586 #define PFN_4G_MASK	(PFN_4G - 1)
587 #define PFN_16M		(SZ_16M >> PAGE_SHIFT)
588 
589 static void panfrost_drm_mm_color_adjust(const struct drm_mm_node *node,
590 					 unsigned long color,
591 					 u64 *start, u64 *end)
592 {
593 	/* Executable buffers can't start or end on a 4GB boundary */
594 	if (!(color & PANFROST_BO_NOEXEC)) {
595 		u64 next_seg;
596 
597 		if ((*start & PFN_4G_MASK) == 0)
598 			(*start)++;
599 
600 		if ((*end & PFN_4G_MASK) == 0)
601 			(*end)--;
602 
603 		next_seg = ALIGN(*start, PFN_4G);
604 		if (next_seg - *start <= PFN_16M)
605 			*start = next_seg + 1;
606 
607 		*end = min(*end, ALIGN(*start, PFN_4G) - 1);
608 	}
609 }
610 
611 struct panfrost_mmu *panfrost_mmu_ctx_create(struct panfrost_device *pfdev)
612 {
613 	struct panfrost_mmu *mmu;
614 
615 	mmu = kzalloc(sizeof(*mmu), GFP_KERNEL);
616 	if (!mmu)
617 		return ERR_PTR(-ENOMEM);
618 
619 	mmu->pfdev = pfdev;
620 	spin_lock_init(&mmu->mm_lock);
621 
622 	/* 4G enough for now. can be 48-bit */
623 	drm_mm_init(&mmu->mm, SZ_32M >> PAGE_SHIFT, (SZ_4G - SZ_32M) >> PAGE_SHIFT);
624 	mmu->mm.color_adjust = panfrost_drm_mm_color_adjust;
625 
626 	INIT_LIST_HEAD(&mmu->list);
627 	mmu->as = -1;
628 
629 	mmu->pgtbl_cfg = (struct io_pgtable_cfg) {
630 		.pgsize_bitmap	= SZ_4K | SZ_2M,
631 		.ias		= FIELD_GET(0xff, pfdev->features.mmu_features),
632 		.oas		= FIELD_GET(0xff00, pfdev->features.mmu_features),
633 		.coherent_walk	= pfdev->coherent,
634 		.tlb		= &mmu_tlb_ops,
635 		.iommu_dev	= pfdev->dev,
636 	};
637 
638 	mmu->pgtbl_ops = alloc_io_pgtable_ops(ARM_MALI_LPAE, &mmu->pgtbl_cfg,
639 					      mmu);
640 	if (!mmu->pgtbl_ops) {
641 		kfree(mmu);
642 		return ERR_PTR(-EINVAL);
643 	}
644 
645 	kref_init(&mmu->refcount);
646 
647 	return mmu;
648 }
649 
650 static const char *access_type_name(struct panfrost_device *pfdev,
651 		u32 fault_status)
652 {
653 	switch (fault_status & AS_FAULTSTATUS_ACCESS_TYPE_MASK) {
654 	case AS_FAULTSTATUS_ACCESS_TYPE_ATOMIC:
655 		if (panfrost_has_hw_feature(pfdev, HW_FEATURE_AARCH64_MMU))
656 			return "ATOMIC";
657 		else
658 			return "UNKNOWN";
659 	case AS_FAULTSTATUS_ACCESS_TYPE_READ:
660 		return "READ";
661 	case AS_FAULTSTATUS_ACCESS_TYPE_WRITE:
662 		return "WRITE";
663 	case AS_FAULTSTATUS_ACCESS_TYPE_EX:
664 		return "EXECUTE";
665 	default:
666 		WARN_ON(1);
667 		return NULL;
668 	}
669 }
670 
671 static irqreturn_t panfrost_mmu_irq_handler(int irq, void *data)
672 {
673 	struct panfrost_device *pfdev = data;
674 
675 	if (test_bit(PANFROST_COMP_BIT_MMU, pfdev->is_suspended))
676 		return IRQ_NONE;
677 
678 	if (!mmu_read(pfdev, MMU_INT_STAT))
679 		return IRQ_NONE;
680 
681 	mmu_write(pfdev, MMU_INT_MASK, 0);
682 	return IRQ_WAKE_THREAD;
683 }
684 
685 static irqreturn_t panfrost_mmu_irq_handler_thread(int irq, void *data)
686 {
687 	struct panfrost_device *pfdev = data;
688 	u32 status = mmu_read(pfdev, MMU_INT_RAWSTAT);
689 	int ret;
690 
691 	while (status) {
692 		u32 as = ffs(status | (status >> 16)) - 1;
693 		u32 mask = BIT(as) | BIT(as + 16);
694 		u64 addr;
695 		u32 fault_status;
696 		u32 exception_type;
697 		u32 access_type;
698 		u32 source_id;
699 
700 		fault_status = mmu_read(pfdev, AS_FAULTSTATUS(as));
701 		addr = mmu_read(pfdev, AS_FAULTADDRESS_LO(as));
702 		addr |= (u64)mmu_read(pfdev, AS_FAULTADDRESS_HI(as)) << 32;
703 
704 		/* decode the fault status */
705 		exception_type = fault_status & 0xFF;
706 		access_type = (fault_status >> 8) & 0x3;
707 		source_id = (fault_status >> 16);
708 
709 		mmu_write(pfdev, MMU_INT_CLEAR, mask);
710 
711 		/* Page fault only */
712 		ret = -1;
713 		if ((status & mask) == BIT(as) && (exception_type & 0xF8) == 0xC0)
714 			ret = panfrost_mmu_map_fault_addr(pfdev, as, addr);
715 
716 		if (ret) {
717 			/* terminal fault, print info about the fault */
718 			dev_err(pfdev->dev,
719 				"Unhandled Page fault in AS%d at VA 0x%016llX\n"
720 				"Reason: %s\n"
721 				"raw fault status: 0x%X\n"
722 				"decoded fault status: %s\n"
723 				"exception type 0x%X: %s\n"
724 				"access type 0x%X: %s\n"
725 				"source id 0x%X\n",
726 				as, addr,
727 				"TODO",
728 				fault_status,
729 				(fault_status & (1 << 10) ? "DECODER FAULT" : "SLAVE FAULT"),
730 				exception_type, panfrost_exception_name(exception_type),
731 				access_type, access_type_name(pfdev, fault_status),
732 				source_id);
733 
734 			spin_lock(&pfdev->as_lock);
735 			/* Ignore MMU interrupts on this AS until it's been
736 			 * re-enabled.
737 			 */
738 			pfdev->as_faulty_mask |= mask;
739 
740 			/* Disable the MMU to kill jobs on this AS. */
741 			panfrost_mmu_disable(pfdev, as);
742 			spin_unlock(&pfdev->as_lock);
743 		}
744 
745 		status &= ~mask;
746 
747 		/* If we received new MMU interrupts, process them before returning. */
748 		if (!status)
749 			status = mmu_read(pfdev, MMU_INT_RAWSTAT) & ~pfdev->as_faulty_mask;
750 	}
751 
752 	/* Enable interrupts only if we're not about to get suspended */
753 	if (!test_bit(PANFROST_COMP_BIT_MMU, pfdev->is_suspended)) {
754 		spin_lock(&pfdev->as_lock);
755 		mmu_write(pfdev, MMU_INT_MASK, ~pfdev->as_faulty_mask);
756 		spin_unlock(&pfdev->as_lock);
757 	}
758 
759 	return IRQ_HANDLED;
760 };
761 
762 int panfrost_mmu_init(struct panfrost_device *pfdev)
763 {
764 	int err;
765 
766 	pfdev->mmu_irq = platform_get_irq_byname(to_platform_device(pfdev->dev), "mmu");
767 	if (pfdev->mmu_irq < 0)
768 		return pfdev->mmu_irq;
769 
770 	err = devm_request_threaded_irq(pfdev->dev, pfdev->mmu_irq,
771 					panfrost_mmu_irq_handler,
772 					panfrost_mmu_irq_handler_thread,
773 					IRQF_SHARED, KBUILD_MODNAME "-mmu",
774 					pfdev);
775 
776 	if (err) {
777 		dev_err(pfdev->dev, "failed to request mmu irq");
778 		return err;
779 	}
780 
781 	return 0;
782 }
783 
784 void panfrost_mmu_fini(struct panfrost_device *pfdev)
785 {
786 	mmu_write(pfdev, MMU_INT_MASK, 0);
787 }
788 
789 void panfrost_mmu_suspend_irq(struct panfrost_device *pfdev)
790 {
791 	set_bit(PANFROST_COMP_BIT_MMU, pfdev->is_suspended);
792 
793 	mmu_write(pfdev, MMU_INT_MASK, 0);
794 	synchronize_irq(pfdev->mmu_irq);
795 }
796