1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3 * Copyright (C) 2011-2014 NVIDIA CORPORATION. All rights reserved.
4 */
5
6 #include <linux/bitops.h>
7 #include <linux/debugfs.h>
8 #include <linux/err.h>
9 #include <linux/iommu.h>
10 #include <linux/kernel.h>
11 #include <linux/of.h>
12 #include <linux/of_platform.h>
13 #include <linux/pci.h>
14 #include <linux/platform_device.h>
15 #include <linux/slab.h>
16 #include <linux/spinlock.h>
17 #include <linux/dma-mapping.h>
18
19 #include <soc/tegra/ahb.h>
20 #include <soc/tegra/mc.h>
21
22 #include "iommu-pages.h"
23
24 struct tegra_smmu_group {
25 struct list_head list;
26 struct tegra_smmu *smmu;
27 const struct tegra_smmu_group_soc *soc;
28 struct iommu_group *group;
29 unsigned int swgroup;
30 };
31
32 struct tegra_smmu {
33 void __iomem *regs;
34 struct device *dev;
35
36 struct tegra_mc *mc;
37 const struct tegra_smmu_soc *soc;
38
39 struct list_head groups;
40
41 unsigned long pfn_mask;
42 unsigned long tlb_mask;
43
44 unsigned long *asids;
45 struct mutex lock;
46
47 struct list_head list;
48
49 struct dentry *debugfs;
50
51 struct iommu_device iommu; /* IOMMU Core code handle */
52 };
53
54 struct tegra_smmu_as {
55 struct iommu_domain domain;
56 struct tegra_smmu *smmu;
57 unsigned int use_count;
58 spinlock_t lock;
59 u32 *count;
60 struct page **pts;
61 struct page *pd;
62 dma_addr_t pd_dma;
63 unsigned id;
64 u32 attr;
65 };
66
to_smmu_as(struct iommu_domain * dom)67 static struct tegra_smmu_as *to_smmu_as(struct iommu_domain *dom)
68 {
69 return container_of(dom, struct tegra_smmu_as, domain);
70 }
71
smmu_writel(struct tegra_smmu * smmu,u32 value,unsigned long offset)72 static inline void smmu_writel(struct tegra_smmu *smmu, u32 value,
73 unsigned long offset)
74 {
75 writel(value, smmu->regs + offset);
76 }
77
smmu_readl(struct tegra_smmu * smmu,unsigned long offset)78 static inline u32 smmu_readl(struct tegra_smmu *smmu, unsigned long offset)
79 {
80 return readl(smmu->regs + offset);
81 }
82
83 #define SMMU_CONFIG 0x010
84 #define SMMU_CONFIG_ENABLE (1 << 0)
85
86 #define SMMU_TLB_CONFIG 0x14
87 #define SMMU_TLB_CONFIG_HIT_UNDER_MISS (1 << 29)
88 #define SMMU_TLB_CONFIG_ROUND_ROBIN_ARBITRATION (1 << 28)
89 #define SMMU_TLB_CONFIG_ACTIVE_LINES(smmu) \
90 ((smmu)->soc->num_tlb_lines & (smmu)->tlb_mask)
91
92 #define SMMU_PTC_CONFIG 0x18
93 #define SMMU_PTC_CONFIG_ENABLE (1 << 29)
94 #define SMMU_PTC_CONFIG_REQ_LIMIT(x) (((x) & 0x0f) << 24)
95 #define SMMU_PTC_CONFIG_INDEX_MAP(x) ((x) & 0x3f)
96
97 #define SMMU_PTB_ASID 0x01c
98 #define SMMU_PTB_ASID_VALUE(x) ((x) & 0x7f)
99
100 #define SMMU_PTB_DATA 0x020
101 #define SMMU_PTB_DATA_VALUE(dma, attr) ((dma) >> 12 | (attr))
102
103 #define SMMU_MK_PDE(dma, attr) ((dma) >> SMMU_PTE_SHIFT | (attr))
104
105 #define SMMU_TLB_FLUSH 0x030
106 #define SMMU_TLB_FLUSH_VA_MATCH_ALL (0 << 0)
107 #define SMMU_TLB_FLUSH_VA_MATCH_SECTION (2 << 0)
108 #define SMMU_TLB_FLUSH_VA_MATCH_GROUP (3 << 0)
109 #define SMMU_TLB_FLUSH_VA_SECTION(addr) ((((addr) & 0xffc00000) >> 12) | \
110 SMMU_TLB_FLUSH_VA_MATCH_SECTION)
111 #define SMMU_TLB_FLUSH_VA_GROUP(addr) ((((addr) & 0xffffc000) >> 12) | \
112 SMMU_TLB_FLUSH_VA_MATCH_GROUP)
113 #define SMMU_TLB_FLUSH_ASID_MATCH (1 << 31)
114
115 #define SMMU_PTC_FLUSH 0x034
116 #define SMMU_PTC_FLUSH_TYPE_ALL (0 << 0)
117 #define SMMU_PTC_FLUSH_TYPE_ADR (1 << 0)
118
119 #define SMMU_PTC_FLUSH_HI 0x9b8
120 #define SMMU_PTC_FLUSH_HI_MASK 0x3
121
122 /* per-SWGROUP SMMU_*_ASID register */
123 #define SMMU_ASID_ENABLE (1 << 31)
124 #define SMMU_ASID_MASK 0x7f
125 #define SMMU_ASID_VALUE(x) ((x) & SMMU_ASID_MASK)
126
127 /* page table definitions */
128 #define SMMU_NUM_PDE 1024
129 #define SMMU_NUM_PTE 1024
130
131 #define SMMU_SIZE_PD (SMMU_NUM_PDE * 4)
132 #define SMMU_SIZE_PT (SMMU_NUM_PTE * 4)
133
134 #define SMMU_PDE_SHIFT 22
135 #define SMMU_PTE_SHIFT 12
136
137 #define SMMU_PAGE_MASK (~(SMMU_SIZE_PT-1))
138 #define SMMU_OFFSET_IN_PAGE(x) ((unsigned long)(x) & ~SMMU_PAGE_MASK)
139 #define SMMU_PFN_PHYS(x) ((phys_addr_t)(x) << SMMU_PTE_SHIFT)
140 #define SMMU_PHYS_PFN(x) ((unsigned long)((x) >> SMMU_PTE_SHIFT))
141
142 #define SMMU_PD_READABLE (1 << 31)
143 #define SMMU_PD_WRITABLE (1 << 30)
144 #define SMMU_PD_NONSECURE (1 << 29)
145
146 #define SMMU_PDE_READABLE (1 << 31)
147 #define SMMU_PDE_WRITABLE (1 << 30)
148 #define SMMU_PDE_NONSECURE (1 << 29)
149 #define SMMU_PDE_NEXT (1 << 28)
150
151 #define SMMU_PTE_READABLE (1 << 31)
152 #define SMMU_PTE_WRITABLE (1 << 30)
153 #define SMMU_PTE_NONSECURE (1 << 29)
154
155 #define SMMU_PDE_ATTR (SMMU_PDE_READABLE | SMMU_PDE_WRITABLE | \
156 SMMU_PDE_NONSECURE)
157
iova_pd_index(unsigned long iova)158 static unsigned int iova_pd_index(unsigned long iova)
159 {
160 return (iova >> SMMU_PDE_SHIFT) & (SMMU_NUM_PDE - 1);
161 }
162
iova_pt_index(unsigned long iova)163 static unsigned int iova_pt_index(unsigned long iova)
164 {
165 return (iova >> SMMU_PTE_SHIFT) & (SMMU_NUM_PTE - 1);
166 }
167
smmu_dma_addr_valid(struct tegra_smmu * smmu,dma_addr_t addr)168 static bool smmu_dma_addr_valid(struct tegra_smmu *smmu, dma_addr_t addr)
169 {
170 addr >>= 12;
171 return (addr & smmu->pfn_mask) == addr;
172 }
173
smmu_pde_to_dma(struct tegra_smmu * smmu,u32 pde)174 static dma_addr_t smmu_pde_to_dma(struct tegra_smmu *smmu, u32 pde)
175 {
176 return (dma_addr_t)(pde & smmu->pfn_mask) << 12;
177 }
178
smmu_flush_ptc_all(struct tegra_smmu * smmu)179 static void smmu_flush_ptc_all(struct tegra_smmu *smmu)
180 {
181 smmu_writel(smmu, SMMU_PTC_FLUSH_TYPE_ALL, SMMU_PTC_FLUSH);
182 }
183
smmu_flush_ptc(struct tegra_smmu * smmu,dma_addr_t dma,unsigned long offset)184 static inline void smmu_flush_ptc(struct tegra_smmu *smmu, dma_addr_t dma,
185 unsigned long offset)
186 {
187 u32 value;
188
189 offset &= ~(smmu->mc->soc->atom_size - 1);
190
191 if (smmu->mc->soc->num_address_bits > 32) {
192 #ifdef CONFIG_ARCH_DMA_ADDR_T_64BIT
193 value = (dma >> 32) & SMMU_PTC_FLUSH_HI_MASK;
194 #else
195 value = 0;
196 #endif
197 smmu_writel(smmu, value, SMMU_PTC_FLUSH_HI);
198 }
199
200 value = (dma + offset) | SMMU_PTC_FLUSH_TYPE_ADR;
201 smmu_writel(smmu, value, SMMU_PTC_FLUSH);
202 }
203
smmu_flush_tlb(struct tegra_smmu * smmu)204 static inline void smmu_flush_tlb(struct tegra_smmu *smmu)
205 {
206 smmu_writel(smmu, SMMU_TLB_FLUSH_VA_MATCH_ALL, SMMU_TLB_FLUSH);
207 }
208
smmu_flush_tlb_asid(struct tegra_smmu * smmu,unsigned long asid)209 static inline void smmu_flush_tlb_asid(struct tegra_smmu *smmu,
210 unsigned long asid)
211 {
212 u32 value;
213
214 if (smmu->soc->num_asids == 4)
215 value = (asid & 0x3) << 29;
216 else
217 value = (asid & 0x7f) << 24;
218
219 value |= SMMU_TLB_FLUSH_ASID_MATCH | SMMU_TLB_FLUSH_VA_MATCH_ALL;
220 smmu_writel(smmu, value, SMMU_TLB_FLUSH);
221 }
222
smmu_flush_tlb_section(struct tegra_smmu * smmu,unsigned long asid,unsigned long iova)223 static inline void smmu_flush_tlb_section(struct tegra_smmu *smmu,
224 unsigned long asid,
225 unsigned long iova)
226 {
227 u32 value;
228
229 if (smmu->soc->num_asids == 4)
230 value = (asid & 0x3) << 29;
231 else
232 value = (asid & 0x7f) << 24;
233
234 value |= SMMU_TLB_FLUSH_ASID_MATCH | SMMU_TLB_FLUSH_VA_SECTION(iova);
235 smmu_writel(smmu, value, SMMU_TLB_FLUSH);
236 }
237
smmu_flush_tlb_group(struct tegra_smmu * smmu,unsigned long asid,unsigned long iova)238 static inline void smmu_flush_tlb_group(struct tegra_smmu *smmu,
239 unsigned long asid,
240 unsigned long iova)
241 {
242 u32 value;
243
244 if (smmu->soc->num_asids == 4)
245 value = (asid & 0x3) << 29;
246 else
247 value = (asid & 0x7f) << 24;
248
249 value |= SMMU_TLB_FLUSH_ASID_MATCH | SMMU_TLB_FLUSH_VA_GROUP(iova);
250 smmu_writel(smmu, value, SMMU_TLB_FLUSH);
251 }
252
smmu_flush(struct tegra_smmu * smmu)253 static inline void smmu_flush(struct tegra_smmu *smmu)
254 {
255 smmu_readl(smmu, SMMU_PTB_ASID);
256 }
257
tegra_smmu_alloc_asid(struct tegra_smmu * smmu,unsigned int * idp)258 static int tegra_smmu_alloc_asid(struct tegra_smmu *smmu, unsigned int *idp)
259 {
260 unsigned long id;
261
262 id = find_first_zero_bit(smmu->asids, smmu->soc->num_asids);
263 if (id >= smmu->soc->num_asids)
264 return -ENOSPC;
265
266 set_bit(id, smmu->asids);
267 *idp = id;
268
269 return 0;
270 }
271
tegra_smmu_free_asid(struct tegra_smmu * smmu,unsigned int id)272 static void tegra_smmu_free_asid(struct tegra_smmu *smmu, unsigned int id)
273 {
274 clear_bit(id, smmu->asids);
275 }
276
tegra_smmu_domain_alloc_paging(struct device * dev)277 static struct iommu_domain *tegra_smmu_domain_alloc_paging(struct device *dev)
278 {
279 struct tegra_smmu_as *as;
280
281 as = kzalloc(sizeof(*as), GFP_KERNEL);
282 if (!as)
283 return NULL;
284
285 as->attr = SMMU_PD_READABLE | SMMU_PD_WRITABLE | SMMU_PD_NONSECURE;
286
287 as->pd = __iommu_alloc_pages(GFP_KERNEL | __GFP_DMA, 0);
288 if (!as->pd) {
289 kfree(as);
290 return NULL;
291 }
292
293 as->count = kcalloc(SMMU_NUM_PDE, sizeof(u32), GFP_KERNEL);
294 if (!as->count) {
295 __iommu_free_pages(as->pd, 0);
296 kfree(as);
297 return NULL;
298 }
299
300 as->pts = kcalloc(SMMU_NUM_PDE, sizeof(*as->pts), GFP_KERNEL);
301 if (!as->pts) {
302 kfree(as->count);
303 __iommu_free_pages(as->pd, 0);
304 kfree(as);
305 return NULL;
306 }
307
308 spin_lock_init(&as->lock);
309
310 /* setup aperture */
311 as->domain.geometry.aperture_start = 0;
312 as->domain.geometry.aperture_end = 0xffffffff;
313 as->domain.geometry.force_aperture = true;
314
315 return &as->domain;
316 }
317
tegra_smmu_domain_free(struct iommu_domain * domain)318 static void tegra_smmu_domain_free(struct iommu_domain *domain)
319 {
320 struct tegra_smmu_as *as = to_smmu_as(domain);
321
322 /* TODO: free page directory and page tables */
323
324 WARN_ON_ONCE(as->use_count);
325 kfree(as->count);
326 kfree(as->pts);
327 kfree(as);
328 }
329
330 static const struct tegra_smmu_swgroup *
tegra_smmu_find_swgroup(struct tegra_smmu * smmu,unsigned int swgroup)331 tegra_smmu_find_swgroup(struct tegra_smmu *smmu, unsigned int swgroup)
332 {
333 const struct tegra_smmu_swgroup *group = NULL;
334 unsigned int i;
335
336 for (i = 0; i < smmu->soc->num_swgroups; i++) {
337 if (smmu->soc->swgroups[i].swgroup == swgroup) {
338 group = &smmu->soc->swgroups[i];
339 break;
340 }
341 }
342
343 return group;
344 }
345
tegra_smmu_enable(struct tegra_smmu * smmu,unsigned int swgroup,unsigned int asid)346 static void tegra_smmu_enable(struct tegra_smmu *smmu, unsigned int swgroup,
347 unsigned int asid)
348 {
349 const struct tegra_smmu_swgroup *group;
350 unsigned int i;
351 u32 value;
352
353 group = tegra_smmu_find_swgroup(smmu, swgroup);
354 if (group) {
355 value = smmu_readl(smmu, group->reg);
356 value &= ~SMMU_ASID_MASK;
357 value |= SMMU_ASID_VALUE(asid);
358 value |= SMMU_ASID_ENABLE;
359 smmu_writel(smmu, value, group->reg);
360 } else {
361 pr_warn("%s group from swgroup %u not found\n", __func__,
362 swgroup);
363 /* No point moving ahead if group was not found */
364 return;
365 }
366
367 for (i = 0; i < smmu->soc->num_clients; i++) {
368 const struct tegra_mc_client *client = &smmu->soc->clients[i];
369
370 if (client->swgroup != swgroup)
371 continue;
372
373 value = smmu_readl(smmu, client->regs.smmu.reg);
374 value |= BIT(client->regs.smmu.bit);
375 smmu_writel(smmu, value, client->regs.smmu.reg);
376 }
377 }
378
tegra_smmu_disable(struct tegra_smmu * smmu,unsigned int swgroup,unsigned int asid)379 static void tegra_smmu_disable(struct tegra_smmu *smmu, unsigned int swgroup,
380 unsigned int asid)
381 {
382 const struct tegra_smmu_swgroup *group;
383 unsigned int i;
384 u32 value;
385
386 group = tegra_smmu_find_swgroup(smmu, swgroup);
387 if (group) {
388 value = smmu_readl(smmu, group->reg);
389 value &= ~SMMU_ASID_MASK;
390 value |= SMMU_ASID_VALUE(asid);
391 value &= ~SMMU_ASID_ENABLE;
392 smmu_writel(smmu, value, group->reg);
393 }
394
395 for (i = 0; i < smmu->soc->num_clients; i++) {
396 const struct tegra_mc_client *client = &smmu->soc->clients[i];
397
398 if (client->swgroup != swgroup)
399 continue;
400
401 value = smmu_readl(smmu, client->regs.smmu.reg);
402 value &= ~BIT(client->regs.smmu.bit);
403 smmu_writel(smmu, value, client->regs.smmu.reg);
404 }
405 }
406
tegra_smmu_as_prepare(struct tegra_smmu * smmu,struct tegra_smmu_as * as)407 static int tegra_smmu_as_prepare(struct tegra_smmu *smmu,
408 struct tegra_smmu_as *as)
409 {
410 u32 value;
411 int err = 0;
412
413 mutex_lock(&smmu->lock);
414
415 if (as->use_count > 0) {
416 as->use_count++;
417 goto unlock;
418 }
419
420 as->pd_dma = dma_map_page(smmu->dev, as->pd, 0, SMMU_SIZE_PD,
421 DMA_TO_DEVICE);
422 if (dma_mapping_error(smmu->dev, as->pd_dma)) {
423 err = -ENOMEM;
424 goto unlock;
425 }
426
427 /* We can't handle 64-bit DMA addresses */
428 if (!smmu_dma_addr_valid(smmu, as->pd_dma)) {
429 err = -ENOMEM;
430 goto err_unmap;
431 }
432
433 err = tegra_smmu_alloc_asid(smmu, &as->id);
434 if (err < 0)
435 goto err_unmap;
436
437 smmu_flush_ptc(smmu, as->pd_dma, 0);
438 smmu_flush_tlb_asid(smmu, as->id);
439
440 smmu_writel(smmu, as->id & 0x7f, SMMU_PTB_ASID);
441 value = SMMU_PTB_DATA_VALUE(as->pd_dma, as->attr);
442 smmu_writel(smmu, value, SMMU_PTB_DATA);
443 smmu_flush(smmu);
444
445 as->smmu = smmu;
446 as->use_count++;
447
448 mutex_unlock(&smmu->lock);
449
450 return 0;
451
452 err_unmap:
453 dma_unmap_page(smmu->dev, as->pd_dma, SMMU_SIZE_PD, DMA_TO_DEVICE);
454 unlock:
455 mutex_unlock(&smmu->lock);
456
457 return err;
458 }
459
tegra_smmu_as_unprepare(struct tegra_smmu * smmu,struct tegra_smmu_as * as)460 static void tegra_smmu_as_unprepare(struct tegra_smmu *smmu,
461 struct tegra_smmu_as *as)
462 {
463 mutex_lock(&smmu->lock);
464
465 if (--as->use_count > 0) {
466 mutex_unlock(&smmu->lock);
467 return;
468 }
469
470 tegra_smmu_free_asid(smmu, as->id);
471
472 dma_unmap_page(smmu->dev, as->pd_dma, SMMU_SIZE_PD, DMA_TO_DEVICE);
473
474 as->smmu = NULL;
475
476 mutex_unlock(&smmu->lock);
477 }
478
tegra_smmu_attach_dev(struct iommu_domain * domain,struct device * dev)479 static int tegra_smmu_attach_dev(struct iommu_domain *domain,
480 struct device *dev)
481 {
482 struct iommu_fwspec *fwspec = dev_iommu_fwspec_get(dev);
483 struct tegra_smmu *smmu = dev_iommu_priv_get(dev);
484 struct tegra_smmu_as *as = to_smmu_as(domain);
485 unsigned int index;
486 int err;
487
488 if (!fwspec)
489 return -ENOENT;
490
491 for (index = 0; index < fwspec->num_ids; index++) {
492 err = tegra_smmu_as_prepare(smmu, as);
493 if (err)
494 goto disable;
495
496 tegra_smmu_enable(smmu, fwspec->ids[index], as->id);
497 }
498
499 if (index == 0)
500 return -ENODEV;
501
502 return 0;
503
504 disable:
505 while (index--) {
506 tegra_smmu_disable(smmu, fwspec->ids[index], as->id);
507 tegra_smmu_as_unprepare(smmu, as);
508 }
509
510 return err;
511 }
512
tegra_smmu_identity_attach(struct iommu_domain * identity_domain,struct device * dev)513 static int tegra_smmu_identity_attach(struct iommu_domain *identity_domain,
514 struct device *dev)
515 {
516 struct iommu_domain *domain = iommu_get_domain_for_dev(dev);
517 struct iommu_fwspec *fwspec = dev_iommu_fwspec_get(dev);
518 struct tegra_smmu_as *as;
519 struct tegra_smmu *smmu;
520 unsigned int index;
521
522 if (!fwspec)
523 return -ENODEV;
524
525 if (domain == identity_domain || !domain)
526 return 0;
527
528 as = to_smmu_as(domain);
529 smmu = as->smmu;
530 for (index = 0; index < fwspec->num_ids; index++) {
531 tegra_smmu_disable(smmu, fwspec->ids[index], as->id);
532 tegra_smmu_as_unprepare(smmu, as);
533 }
534 return 0;
535 }
536
537 static struct iommu_domain_ops tegra_smmu_identity_ops = {
538 .attach_dev = tegra_smmu_identity_attach,
539 };
540
541 static struct iommu_domain tegra_smmu_identity_domain = {
542 .type = IOMMU_DOMAIN_IDENTITY,
543 .ops = &tegra_smmu_identity_ops,
544 };
545
tegra_smmu_set_pde(struct tegra_smmu_as * as,unsigned long iova,u32 value)546 static void tegra_smmu_set_pde(struct tegra_smmu_as *as, unsigned long iova,
547 u32 value)
548 {
549 unsigned int pd_index = iova_pd_index(iova);
550 struct tegra_smmu *smmu = as->smmu;
551 u32 *pd = page_address(as->pd);
552 unsigned long offset = pd_index * sizeof(*pd);
553
554 /* Set the page directory entry first */
555 pd[pd_index] = value;
556
557 /* The flush the page directory entry from caches */
558 dma_sync_single_range_for_device(smmu->dev, as->pd_dma, offset,
559 sizeof(*pd), DMA_TO_DEVICE);
560
561 /* And flush the iommu */
562 smmu_flush_ptc(smmu, as->pd_dma, offset);
563 smmu_flush_tlb_section(smmu, as->id, iova);
564 smmu_flush(smmu);
565 }
566
tegra_smmu_pte_offset(struct page * pt_page,unsigned long iova)567 static u32 *tegra_smmu_pte_offset(struct page *pt_page, unsigned long iova)
568 {
569 u32 *pt = page_address(pt_page);
570
571 return pt + iova_pt_index(iova);
572 }
573
tegra_smmu_pte_lookup(struct tegra_smmu_as * as,unsigned long iova,dma_addr_t * dmap)574 static u32 *tegra_smmu_pte_lookup(struct tegra_smmu_as *as, unsigned long iova,
575 dma_addr_t *dmap)
576 {
577 unsigned int pd_index = iova_pd_index(iova);
578 struct tegra_smmu *smmu = as->smmu;
579 struct page *pt_page;
580 u32 *pd;
581
582 pt_page = as->pts[pd_index];
583 if (!pt_page)
584 return NULL;
585
586 pd = page_address(as->pd);
587 *dmap = smmu_pde_to_dma(smmu, pd[pd_index]);
588
589 return tegra_smmu_pte_offset(pt_page, iova);
590 }
591
as_get_pte(struct tegra_smmu_as * as,dma_addr_t iova,dma_addr_t * dmap,struct page * page)592 static u32 *as_get_pte(struct tegra_smmu_as *as, dma_addr_t iova,
593 dma_addr_t *dmap, struct page *page)
594 {
595 unsigned int pde = iova_pd_index(iova);
596 struct tegra_smmu *smmu = as->smmu;
597
598 if (!as->pts[pde]) {
599 dma_addr_t dma;
600
601 dma = dma_map_page(smmu->dev, page, 0, SMMU_SIZE_PT,
602 DMA_TO_DEVICE);
603 if (dma_mapping_error(smmu->dev, dma)) {
604 __iommu_free_pages(page, 0);
605 return NULL;
606 }
607
608 if (!smmu_dma_addr_valid(smmu, dma)) {
609 dma_unmap_page(smmu->dev, dma, SMMU_SIZE_PT,
610 DMA_TO_DEVICE);
611 __iommu_free_pages(page, 0);
612 return NULL;
613 }
614
615 as->pts[pde] = page;
616
617 tegra_smmu_set_pde(as, iova, SMMU_MK_PDE(dma, SMMU_PDE_ATTR |
618 SMMU_PDE_NEXT));
619
620 *dmap = dma;
621 } else {
622 u32 *pd = page_address(as->pd);
623
624 *dmap = smmu_pde_to_dma(smmu, pd[pde]);
625 }
626
627 return tegra_smmu_pte_offset(as->pts[pde], iova);
628 }
629
tegra_smmu_pte_get_use(struct tegra_smmu_as * as,unsigned long iova)630 static void tegra_smmu_pte_get_use(struct tegra_smmu_as *as, unsigned long iova)
631 {
632 unsigned int pd_index = iova_pd_index(iova);
633
634 as->count[pd_index]++;
635 }
636
tegra_smmu_pte_put_use(struct tegra_smmu_as * as,unsigned long iova)637 static void tegra_smmu_pte_put_use(struct tegra_smmu_as *as, unsigned long iova)
638 {
639 unsigned int pde = iova_pd_index(iova);
640 struct page *page = as->pts[pde];
641
642 /*
643 * When no entries in this page table are used anymore, return the
644 * memory page to the system.
645 */
646 if (--as->count[pde] == 0) {
647 struct tegra_smmu *smmu = as->smmu;
648 u32 *pd = page_address(as->pd);
649 dma_addr_t pte_dma = smmu_pde_to_dma(smmu, pd[pde]);
650
651 tegra_smmu_set_pde(as, iova, 0);
652
653 dma_unmap_page(smmu->dev, pte_dma, SMMU_SIZE_PT, DMA_TO_DEVICE);
654 __iommu_free_pages(page, 0);
655 as->pts[pde] = NULL;
656 }
657 }
658
tegra_smmu_set_pte(struct tegra_smmu_as * as,unsigned long iova,u32 * pte,dma_addr_t pte_dma,u32 val)659 static void tegra_smmu_set_pte(struct tegra_smmu_as *as, unsigned long iova,
660 u32 *pte, dma_addr_t pte_dma, u32 val)
661 {
662 struct tegra_smmu *smmu = as->smmu;
663 unsigned long offset = SMMU_OFFSET_IN_PAGE(pte);
664
665 *pte = val;
666
667 dma_sync_single_range_for_device(smmu->dev, pte_dma, offset,
668 4, DMA_TO_DEVICE);
669 smmu_flush_ptc(smmu, pte_dma, offset);
670 smmu_flush_tlb_group(smmu, as->id, iova);
671 smmu_flush(smmu);
672 }
673
as_get_pde_page(struct tegra_smmu_as * as,unsigned long iova,gfp_t gfp,unsigned long * flags)674 static struct page *as_get_pde_page(struct tegra_smmu_as *as,
675 unsigned long iova, gfp_t gfp,
676 unsigned long *flags)
677 {
678 unsigned int pde = iova_pd_index(iova);
679 struct page *page = as->pts[pde];
680
681 /* at first check whether allocation needs to be done at all */
682 if (page)
683 return page;
684
685 /*
686 * In order to prevent exhaustion of the atomic memory pool, we
687 * allocate page in a sleeping context if GFP flags permit. Hence
688 * spinlock needs to be unlocked and re-locked after allocation.
689 */
690 if (gfpflags_allow_blocking(gfp))
691 spin_unlock_irqrestore(&as->lock, *flags);
692
693 page = __iommu_alloc_pages(gfp | __GFP_DMA, 0);
694
695 if (gfpflags_allow_blocking(gfp))
696 spin_lock_irqsave(&as->lock, *flags);
697
698 /*
699 * In a case of blocking allocation, a concurrent mapping may win
700 * the PDE allocation. In this case the allocated page isn't needed
701 * if allocation succeeded and the allocation failure isn't fatal.
702 */
703 if (as->pts[pde]) {
704 if (page)
705 __iommu_free_pages(page, 0);
706
707 page = as->pts[pde];
708 }
709
710 return page;
711 }
712
713 static int
__tegra_smmu_map(struct iommu_domain * domain,unsigned long iova,phys_addr_t paddr,size_t size,int prot,gfp_t gfp,unsigned long * flags)714 __tegra_smmu_map(struct iommu_domain *domain, unsigned long iova,
715 phys_addr_t paddr, size_t size, int prot, gfp_t gfp,
716 unsigned long *flags)
717 {
718 struct tegra_smmu_as *as = to_smmu_as(domain);
719 dma_addr_t pte_dma;
720 struct page *page;
721 u32 pte_attrs;
722 u32 *pte;
723
724 page = as_get_pde_page(as, iova, gfp, flags);
725 if (!page)
726 return -ENOMEM;
727
728 pte = as_get_pte(as, iova, &pte_dma, page);
729 if (!pte)
730 return -ENOMEM;
731
732 /* If we aren't overwriting a pre-existing entry, increment use */
733 if (*pte == 0)
734 tegra_smmu_pte_get_use(as, iova);
735
736 pte_attrs = SMMU_PTE_NONSECURE;
737
738 if (prot & IOMMU_READ)
739 pte_attrs |= SMMU_PTE_READABLE;
740
741 if (prot & IOMMU_WRITE)
742 pte_attrs |= SMMU_PTE_WRITABLE;
743
744 tegra_smmu_set_pte(as, iova, pte, pte_dma,
745 SMMU_PHYS_PFN(paddr) | pte_attrs);
746
747 return 0;
748 }
749
750 static size_t
__tegra_smmu_unmap(struct iommu_domain * domain,unsigned long iova,size_t size,struct iommu_iotlb_gather * gather)751 __tegra_smmu_unmap(struct iommu_domain *domain, unsigned long iova,
752 size_t size, struct iommu_iotlb_gather *gather)
753 {
754 struct tegra_smmu_as *as = to_smmu_as(domain);
755 dma_addr_t pte_dma;
756 u32 *pte;
757
758 pte = tegra_smmu_pte_lookup(as, iova, &pte_dma);
759 if (!pte || !*pte)
760 return 0;
761
762 tegra_smmu_set_pte(as, iova, pte, pte_dma, 0);
763 tegra_smmu_pte_put_use(as, iova);
764
765 return size;
766 }
767
tegra_smmu_map(struct iommu_domain * domain,unsigned long iova,phys_addr_t paddr,size_t size,size_t count,int prot,gfp_t gfp,size_t * mapped)768 static int tegra_smmu_map(struct iommu_domain *domain, unsigned long iova,
769 phys_addr_t paddr, size_t size, size_t count,
770 int prot, gfp_t gfp, size_t *mapped)
771 {
772 struct tegra_smmu_as *as = to_smmu_as(domain);
773 unsigned long flags;
774 int ret;
775
776 spin_lock_irqsave(&as->lock, flags);
777 ret = __tegra_smmu_map(domain, iova, paddr, size, prot, gfp, &flags);
778 spin_unlock_irqrestore(&as->lock, flags);
779
780 if (!ret)
781 *mapped = size;
782
783 return ret;
784 }
785
tegra_smmu_unmap(struct iommu_domain * domain,unsigned long iova,size_t size,size_t count,struct iommu_iotlb_gather * gather)786 static size_t tegra_smmu_unmap(struct iommu_domain *domain, unsigned long iova,
787 size_t size, size_t count, struct iommu_iotlb_gather *gather)
788 {
789 struct tegra_smmu_as *as = to_smmu_as(domain);
790 unsigned long flags;
791
792 spin_lock_irqsave(&as->lock, flags);
793 size = __tegra_smmu_unmap(domain, iova, size, gather);
794 spin_unlock_irqrestore(&as->lock, flags);
795
796 return size;
797 }
798
tegra_smmu_iova_to_phys(struct iommu_domain * domain,dma_addr_t iova)799 static phys_addr_t tegra_smmu_iova_to_phys(struct iommu_domain *domain,
800 dma_addr_t iova)
801 {
802 struct tegra_smmu_as *as = to_smmu_as(domain);
803 unsigned long pfn;
804 dma_addr_t pte_dma;
805 u32 *pte;
806
807 pte = tegra_smmu_pte_lookup(as, iova, &pte_dma);
808 if (!pte || !*pte)
809 return 0;
810
811 pfn = *pte & as->smmu->pfn_mask;
812
813 return SMMU_PFN_PHYS(pfn) + SMMU_OFFSET_IN_PAGE(iova);
814 }
815
tegra_smmu_find(struct device_node * np)816 static struct tegra_smmu *tegra_smmu_find(struct device_node *np)
817 {
818 struct platform_device *pdev;
819 struct tegra_mc *mc;
820
821 pdev = of_find_device_by_node(np);
822 if (!pdev)
823 return NULL;
824
825 mc = platform_get_drvdata(pdev);
826 if (!mc) {
827 put_device(&pdev->dev);
828 return NULL;
829 }
830
831 return mc->smmu;
832 }
833
tegra_smmu_configure(struct tegra_smmu * smmu,struct device * dev,const struct of_phandle_args * args)834 static int tegra_smmu_configure(struct tegra_smmu *smmu, struct device *dev,
835 const struct of_phandle_args *args)
836 {
837 const struct iommu_ops *ops = smmu->iommu.ops;
838 int err;
839
840 err = iommu_fwspec_init(dev, dev_fwnode(smmu->dev));
841 if (err < 0) {
842 dev_err(dev, "failed to initialize fwspec: %d\n", err);
843 return err;
844 }
845
846 err = ops->of_xlate(dev, args);
847 if (err < 0) {
848 dev_err(dev, "failed to parse SW group ID: %d\n", err);
849 iommu_fwspec_free(dev);
850 return err;
851 }
852
853 return 0;
854 }
855
tegra_smmu_probe_device(struct device * dev)856 static struct iommu_device *tegra_smmu_probe_device(struct device *dev)
857 {
858 struct device_node *np = dev->of_node;
859 struct tegra_smmu *smmu = NULL;
860 struct of_phandle_args args;
861 unsigned int index = 0;
862 int err;
863
864 while (of_parse_phandle_with_args(np, "iommus", "#iommu-cells", index,
865 &args) == 0) {
866 smmu = tegra_smmu_find(args.np);
867 if (smmu) {
868 err = tegra_smmu_configure(smmu, dev, &args);
869
870 if (err < 0) {
871 of_node_put(args.np);
872 return ERR_PTR(err);
873 }
874 }
875
876 of_node_put(args.np);
877 index++;
878 }
879
880 smmu = dev_iommu_priv_get(dev);
881 if (!smmu)
882 return ERR_PTR(-ENODEV);
883
884 return &smmu->iommu;
885 }
886
887 static const struct tegra_smmu_group_soc *
tegra_smmu_find_group(struct tegra_smmu * smmu,unsigned int swgroup)888 tegra_smmu_find_group(struct tegra_smmu *smmu, unsigned int swgroup)
889 {
890 unsigned int i, j;
891
892 for (i = 0; i < smmu->soc->num_groups; i++)
893 for (j = 0; j < smmu->soc->groups[i].num_swgroups; j++)
894 if (smmu->soc->groups[i].swgroups[j] == swgroup)
895 return &smmu->soc->groups[i];
896
897 return NULL;
898 }
899
tegra_smmu_group_release(void * iommu_data)900 static void tegra_smmu_group_release(void *iommu_data)
901 {
902 struct tegra_smmu_group *group = iommu_data;
903 struct tegra_smmu *smmu = group->smmu;
904
905 mutex_lock(&smmu->lock);
906 list_del(&group->list);
907 mutex_unlock(&smmu->lock);
908 }
909
tegra_smmu_device_group(struct device * dev)910 static struct iommu_group *tegra_smmu_device_group(struct device *dev)
911 {
912 struct iommu_fwspec *fwspec = dev_iommu_fwspec_get(dev);
913 struct tegra_smmu *smmu = dev_iommu_priv_get(dev);
914 const struct tegra_smmu_group_soc *soc;
915 unsigned int swgroup = fwspec->ids[0];
916 struct tegra_smmu_group *group;
917 struct iommu_group *grp;
918
919 /* Find group_soc associating with swgroup */
920 soc = tegra_smmu_find_group(smmu, swgroup);
921
922 mutex_lock(&smmu->lock);
923
924 /* Find existing iommu_group associating with swgroup or group_soc */
925 list_for_each_entry(group, &smmu->groups, list)
926 if ((group->swgroup == swgroup) || (soc && group->soc == soc)) {
927 grp = iommu_group_ref_get(group->group);
928 mutex_unlock(&smmu->lock);
929 return grp;
930 }
931
932 group = devm_kzalloc(smmu->dev, sizeof(*group), GFP_KERNEL);
933 if (!group) {
934 mutex_unlock(&smmu->lock);
935 return NULL;
936 }
937
938 INIT_LIST_HEAD(&group->list);
939 group->swgroup = swgroup;
940 group->smmu = smmu;
941 group->soc = soc;
942
943 if (dev_is_pci(dev))
944 group->group = pci_device_group(dev);
945 else
946 group->group = generic_device_group(dev);
947
948 if (IS_ERR(group->group)) {
949 devm_kfree(smmu->dev, group);
950 mutex_unlock(&smmu->lock);
951 return NULL;
952 }
953
954 iommu_group_set_iommudata(group->group, group, tegra_smmu_group_release);
955 if (soc)
956 iommu_group_set_name(group->group, soc->name);
957 list_add_tail(&group->list, &smmu->groups);
958 mutex_unlock(&smmu->lock);
959
960 return group->group;
961 }
962
tegra_smmu_of_xlate(struct device * dev,const struct of_phandle_args * args)963 static int tegra_smmu_of_xlate(struct device *dev,
964 const struct of_phandle_args *args)
965 {
966 struct platform_device *iommu_pdev = of_find_device_by_node(args->np);
967 struct tegra_mc *mc = platform_get_drvdata(iommu_pdev);
968 u32 id = args->args[0];
969
970 /*
971 * Note: we are here releasing the reference of &iommu_pdev->dev, which
972 * is mc->dev. Although some functions in tegra_smmu_ops may keep using
973 * its private data beyond this point, it's still safe to do so because
974 * the SMMU parent device is the same as the MC, so the reference count
975 * isn't strictly necessary.
976 */
977 put_device(&iommu_pdev->dev);
978
979 dev_iommu_priv_set(dev, mc->smmu);
980
981 return iommu_fwspec_add_ids(dev, &id, 1);
982 }
983
tegra_smmu_def_domain_type(struct device * dev)984 static int tegra_smmu_def_domain_type(struct device *dev)
985 {
986 /*
987 * FIXME: For now we want to run all translation in IDENTITY mode, due
988 * to some device quirks. Better would be to just quirk the troubled
989 * devices.
990 */
991 return IOMMU_DOMAIN_IDENTITY;
992 }
993
994 static const struct iommu_ops tegra_smmu_ops = {
995 .identity_domain = &tegra_smmu_identity_domain,
996 .def_domain_type = &tegra_smmu_def_domain_type,
997 .domain_alloc_paging = tegra_smmu_domain_alloc_paging,
998 .probe_device = tegra_smmu_probe_device,
999 .device_group = tegra_smmu_device_group,
1000 .of_xlate = tegra_smmu_of_xlate,
1001 .pgsize_bitmap = SZ_4K,
1002 .default_domain_ops = &(const struct iommu_domain_ops) {
1003 .attach_dev = tegra_smmu_attach_dev,
1004 .map_pages = tegra_smmu_map,
1005 .unmap_pages = tegra_smmu_unmap,
1006 .iova_to_phys = tegra_smmu_iova_to_phys,
1007 .free = tegra_smmu_domain_free,
1008 }
1009 };
1010
tegra_smmu_ahb_enable(void)1011 static void tegra_smmu_ahb_enable(void)
1012 {
1013 static const struct of_device_id ahb_match[] = {
1014 { .compatible = "nvidia,tegra30-ahb", },
1015 { }
1016 };
1017 struct device_node *ahb;
1018
1019 ahb = of_find_matching_node(NULL, ahb_match);
1020 if (ahb) {
1021 tegra_ahb_enable_smmu(ahb);
1022 of_node_put(ahb);
1023 }
1024 }
1025
tegra_smmu_swgroups_show(struct seq_file * s,void * data)1026 static int tegra_smmu_swgroups_show(struct seq_file *s, void *data)
1027 {
1028 struct tegra_smmu *smmu = s->private;
1029 unsigned int i;
1030 u32 value;
1031
1032 seq_printf(s, "swgroup enabled ASID\n");
1033 seq_printf(s, "------------------------\n");
1034
1035 for (i = 0; i < smmu->soc->num_swgroups; i++) {
1036 const struct tegra_smmu_swgroup *group = &smmu->soc->swgroups[i];
1037 const char *status;
1038 unsigned int asid;
1039
1040 value = smmu_readl(smmu, group->reg);
1041
1042 if (value & SMMU_ASID_ENABLE)
1043 status = "yes";
1044 else
1045 status = "no";
1046
1047 asid = value & SMMU_ASID_MASK;
1048
1049 seq_printf(s, "%-9s %-7s %#04x\n", group->name, status,
1050 asid);
1051 }
1052
1053 return 0;
1054 }
1055
1056 DEFINE_SHOW_ATTRIBUTE(tegra_smmu_swgroups);
1057
tegra_smmu_clients_show(struct seq_file * s,void * data)1058 static int tegra_smmu_clients_show(struct seq_file *s, void *data)
1059 {
1060 struct tegra_smmu *smmu = s->private;
1061 unsigned int i;
1062 u32 value;
1063
1064 seq_printf(s, "client enabled\n");
1065 seq_printf(s, "--------------------\n");
1066
1067 for (i = 0; i < smmu->soc->num_clients; i++) {
1068 const struct tegra_mc_client *client = &smmu->soc->clients[i];
1069 const char *status;
1070
1071 value = smmu_readl(smmu, client->regs.smmu.reg);
1072
1073 if (value & BIT(client->regs.smmu.bit))
1074 status = "yes";
1075 else
1076 status = "no";
1077
1078 seq_printf(s, "%-12s %s\n", client->name, status);
1079 }
1080
1081 return 0;
1082 }
1083
1084 DEFINE_SHOW_ATTRIBUTE(tegra_smmu_clients);
1085
tegra_smmu_debugfs_init(struct tegra_smmu * smmu)1086 static void tegra_smmu_debugfs_init(struct tegra_smmu *smmu)
1087 {
1088 smmu->debugfs = debugfs_create_dir("smmu", NULL);
1089
1090 debugfs_create_file("swgroups", S_IRUGO, smmu->debugfs, smmu,
1091 &tegra_smmu_swgroups_fops);
1092 debugfs_create_file("clients", S_IRUGO, smmu->debugfs, smmu,
1093 &tegra_smmu_clients_fops);
1094 }
1095
tegra_smmu_debugfs_exit(struct tegra_smmu * smmu)1096 static void tegra_smmu_debugfs_exit(struct tegra_smmu *smmu)
1097 {
1098 debugfs_remove_recursive(smmu->debugfs);
1099 }
1100
tegra_smmu_probe(struct device * dev,const struct tegra_smmu_soc * soc,struct tegra_mc * mc)1101 struct tegra_smmu *tegra_smmu_probe(struct device *dev,
1102 const struct tegra_smmu_soc *soc,
1103 struct tegra_mc *mc)
1104 {
1105 struct tegra_smmu *smmu;
1106 u32 value;
1107 int err;
1108
1109 smmu = devm_kzalloc(dev, sizeof(*smmu), GFP_KERNEL);
1110 if (!smmu)
1111 return ERR_PTR(-ENOMEM);
1112
1113 /*
1114 * This is a bit of a hack. Ideally we'd want to simply return this
1115 * value. However iommu_device_register() will attempt to add
1116 * all devices to the IOMMU before we get that far. In order
1117 * not to rely on global variables to track the IOMMU instance, we
1118 * set it here so that it can be looked up from the .probe_device()
1119 * callback via the IOMMU device's .drvdata field.
1120 */
1121 mc->smmu = smmu;
1122
1123 smmu->asids = devm_bitmap_zalloc(dev, soc->num_asids, GFP_KERNEL);
1124 if (!smmu->asids)
1125 return ERR_PTR(-ENOMEM);
1126
1127 INIT_LIST_HEAD(&smmu->groups);
1128 mutex_init(&smmu->lock);
1129
1130 smmu->regs = mc->regs;
1131 smmu->soc = soc;
1132 smmu->dev = dev;
1133 smmu->mc = mc;
1134
1135 smmu->pfn_mask =
1136 BIT_MASK(mc->soc->num_address_bits - SMMU_PTE_SHIFT) - 1;
1137 dev_dbg(dev, "address bits: %u, PFN mask: %#lx\n",
1138 mc->soc->num_address_bits, smmu->pfn_mask);
1139 smmu->tlb_mask = (1 << fls(smmu->soc->num_tlb_lines)) - 1;
1140 dev_dbg(dev, "TLB lines: %u, mask: %#lx\n", smmu->soc->num_tlb_lines,
1141 smmu->tlb_mask);
1142
1143 value = SMMU_PTC_CONFIG_ENABLE | SMMU_PTC_CONFIG_INDEX_MAP(0x3f);
1144
1145 if (soc->supports_request_limit)
1146 value |= SMMU_PTC_CONFIG_REQ_LIMIT(8);
1147
1148 smmu_writel(smmu, value, SMMU_PTC_CONFIG);
1149
1150 value = SMMU_TLB_CONFIG_HIT_UNDER_MISS |
1151 SMMU_TLB_CONFIG_ACTIVE_LINES(smmu);
1152
1153 if (soc->supports_round_robin_arbitration)
1154 value |= SMMU_TLB_CONFIG_ROUND_ROBIN_ARBITRATION;
1155
1156 smmu_writel(smmu, value, SMMU_TLB_CONFIG);
1157
1158 smmu_flush_ptc_all(smmu);
1159 smmu_flush_tlb(smmu);
1160 smmu_writel(smmu, SMMU_CONFIG_ENABLE, SMMU_CONFIG);
1161 smmu_flush(smmu);
1162
1163 tegra_smmu_ahb_enable();
1164
1165 err = iommu_device_sysfs_add(&smmu->iommu, dev, NULL, dev_name(dev));
1166 if (err)
1167 return ERR_PTR(err);
1168
1169 err = iommu_device_register(&smmu->iommu, &tegra_smmu_ops, dev);
1170 if (err) {
1171 iommu_device_sysfs_remove(&smmu->iommu);
1172 return ERR_PTR(err);
1173 }
1174
1175 if (IS_ENABLED(CONFIG_DEBUG_FS))
1176 tegra_smmu_debugfs_init(smmu);
1177
1178 return smmu;
1179 }
1180
tegra_smmu_remove(struct tegra_smmu * smmu)1181 void tegra_smmu_remove(struct tegra_smmu *smmu)
1182 {
1183 iommu_device_unregister(&smmu->iommu);
1184 iommu_device_sysfs_remove(&smmu->iommu);
1185
1186 if (IS_ENABLED(CONFIG_DEBUG_FS))
1187 tegra_smmu_debugfs_exit(smmu);
1188 }
1189