/*
 * IOMMU API for SMMU in Tegra30
 *
 * Copyright (c) 2011-2013, NVIDIA CORPORATION.  All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
 */
#define pr_fmt(fmt)	"%s(): " fmt, __func__

#include <linux/module.h>
#include <linux/platform_device.h>
#include <linux/spinlock.h>
#include <linux/slab.h>
#include <linux/vmalloc.h>
#include <linux/mm.h>
#include <linux/pagemap.h>
#include <linux/device.h>
#include <linux/sched.h>
#include <linux/iommu.h>
#include <linux/io.h>
#include <linux/of.h>
#include <linux/of_iommu.h>
#include <linux/debugfs.h>
#include <linux/seq_file.h>
#include <linux/tegra-ahb.h>

#include <asm/page.h>
#include <asm/cacheflush.h>
/* SMMU hardware client groups; the order matches the SMMU_*_ASID registers */
enum {
	HWGRP_AFI = 0, HWGRP_AVPC, HWGRP_DC,   HWGRP_DCB,
	HWGRP_EPP,     HWGRP_G2,   HWGRP_HC,   HWGRP_HDA,
	HWGRP_ISP,     HWGRP_MPE,  HWGRP_NV,   HWGRP_NV2,
	HWGRP_PPCS,    HWGRP_SATA, HWGRP_VDE,  HWGRP_VI,
	HWGRP_COUNT,
};

#define HWG_AFI		(1 << HWGRP_AFI)
#define HWG_AVPC	(1 << HWGRP_AVPC)
#define HWG_DC		(1 << HWGRP_DC)
#define HWG_DCB		(1 << HWGRP_DCB)
#define HWG_EPP		(1 << HWGRP_EPP)
#define HWG_G2		(1 << HWGRP_G2)
#define HWG_HC		(1 << HWGRP_HC)
#define HWG_HDA		(1 << HWGRP_HDA)
#define HWG_ISP		(1 << HWGRP_ISP)
#define HWG_MPE		(1 << HWGRP_MPE)
#define HWG_NV		(1 << HWGRP_NV)
#define HWG_NV2		(1 << HWGRP_NV2)
#define HWG_PPCS	(1 << HWGRP_PPCS)
#define HWG_SATA	(1 << HWGRP_SATA)
#define HWG_VDE		(1 << HWGRP_VDE)
#define HWG_VI		(1 << HWGRP_VI)
/* bitmap of the page sizes currently supported */
#define SMMU_IOMMU_PGSIZES	(SZ_4K)
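/*
 * Only 4KiB pages are advertised here, so the IOMMU core splits larger
 * iommu_map()/iommu_unmap() requests into page-sized calls into this
 * driver.
 */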
#define SMMU_CONFIG				0x10
#define SMMU_CONFIG_DISABLE			0
#define SMMU_CONFIG_ENABLE			1

/* REVISIT: To support multiple MCs */
enum {
	_MC = 0,
};

enum {
	_TLB = 0,
	_PTC,
};

#define SMMU_CACHE_CONFIG_BASE			0x14
#define __SMMU_CACHE_CONFIG(mc, cache)		(SMMU_CACHE_CONFIG_BASE + 4 * cache)
#define SMMU_CACHE_CONFIG(cache)		__SMMU_CACHE_CONFIG(_MC, cache)

#define SMMU_CACHE_CONFIG_STATS_SHIFT		31
#define SMMU_CACHE_CONFIG_STATS_ENABLE		(1 << SMMU_CACHE_CONFIG_STATS_SHIFT)
#define SMMU_CACHE_CONFIG_STATS_TEST_SHIFT	30
#define SMMU_CACHE_CONFIG_STATS_TEST		(1 << SMMU_CACHE_CONFIG_STATS_TEST_SHIFT)

#define SMMU_TLB_CONFIG_HIT_UNDER_MISS__ENABLE	(1 << 29)
#define SMMU_TLB_CONFIG_ACTIVE_LINES__VALUE	0x10
#define SMMU_TLB_CONFIG_RESET_VAL		0x20000010

#define SMMU_PTC_CONFIG_CACHE__ENABLE		(1 << 29)
#define SMMU_PTC_CONFIG_INDEX_MAP__PATTERN	0x3f
#define SMMU_PTC_CONFIG_RESET_VAL		0x2000003f
#define SMMU_PTB_ASID				0x1c
#define SMMU_PTB_ASID_CURRENT_SHIFT		0

#define SMMU_PTB_DATA				0x20
#define SMMU_PTB_DATA_RESET_VAL			0
#define SMMU_PTB_DATA_ASID_NONSECURE_SHIFT	29
#define SMMU_PTB_DATA_ASID_WRITABLE_SHIFT	30
#define SMMU_PTB_DATA_ASID_READABLE_SHIFT	31

#define SMMU_TLB_FLUSH				0x30
#define SMMU_TLB_FLUSH_VA_MATCH_ALL		0
#define SMMU_TLB_FLUSH_VA_MATCH_SECTION		2
#define SMMU_TLB_FLUSH_VA_MATCH_GROUP		3
#define SMMU_TLB_FLUSH_ASID_SHIFT		29
#define SMMU_TLB_FLUSH_ASID_MATCH_DISABLE	0
#define SMMU_TLB_FLUSH_ASID_MATCH_ENABLE	1
#define SMMU_TLB_FLUSH_ASID_MATCH_SHIFT		31

#define SMMU_PTC_FLUSH				0x34
#define SMMU_PTC_FLUSH_TYPE_ALL			0
#define SMMU_PTC_FLUSH_TYPE_ADR			1
#define SMMU_PTC_FLUSH_ADR_SHIFT		4

#define SMMU_ASID_SECURITY			0x38

#define SMMU_STATS_CACHE_COUNT_BASE		0x1f0

#define SMMU_STATS_CACHE_COUNT(mc, cache, hitmiss)		\
	(SMMU_STATS_CACHE_COUNT_BASE + 8 * cache + 4 * hitmiss)

#define SMMU_TRANSLATION_ENABLE_0		0x228
#define SMMU_TRANSLATION_ENABLE_1		0x22c
#define SMMU_TRANSLATION_ENABLE_2		0x230

#define SMMU_AFI_ASID	0x238   /* PCIE */
#define SMMU_AVPC_ASID	0x23c   /* AVP */
#define SMMU_DC_ASID	0x240   /* Display controller */
#define SMMU_DCB_ASID	0x244   /* Display controller B */
#define SMMU_EPP_ASID	0x248   /* Encoder pre-processor */
#define SMMU_G2_ASID	0x24c   /* 2D engine */
#define SMMU_HC_ASID	0x250   /* Host1x */
#define SMMU_HDA_ASID	0x254   /* High-def audio */
#define SMMU_ISP_ASID	0x258   /* Image signal processor */
#define SMMU_MPE_ASID	0x264   /* MPEG encoder */
#define SMMU_NV_ASID	0x268   /* (3D) */
#define SMMU_NV2_ASID	0x26c   /* (3D) */
#define SMMU_PPCS_ASID	0x270   /* AHB */
#define SMMU_SATA_ASID	0x278   /* SATA */
#define SMMU_VDE_ASID	0x27c   /* Video decoder */
#define SMMU_VI_ASID	0x280   /* Video input */
#define SMMU_PDE_NEXT_SHIFT		28

#define SMMU_TLB_FLUSH_VA_SECTION__MASK		0xffc00000
#define SMMU_TLB_FLUSH_VA_SECTION__SHIFT	12 /* right shift */
#define SMMU_TLB_FLUSH_VA_GROUP__MASK		0xffffc000
#define SMMU_TLB_FLUSH_VA_GROUP__SHIFT		12 /* right shift */
#define SMMU_TLB_FLUSH_VA(iova, which)	\
	((((iova) & SMMU_TLB_FLUSH_VA_##which##__MASK) >>	\
		SMMU_TLB_FLUSH_VA_##which##__SHIFT) |		\
	SMMU_TLB_FLUSH_VA_MATCH_##which)
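/*
 * For example, SMMU_TLB_FLUSH_VA(0x12345000, GROUP) expands to
 * ((0x12345000 & 0xffffc000) >> 12) | 3 == 0x12347: the VA match bits
 * combined with the GROUP match type, ready to be written to
 * SMMU_TLB_FLUSH.
 */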
#define SMMU_PTB_ASID_CUR(n)	\
	((n) << SMMU_PTB_ASID_CURRENT_SHIFT)
#define SMMU_TLB_FLUSH_ASID_MATCH__DISABLE		\
	(SMMU_TLB_FLUSH_ASID_MATCH_DISABLE <<		\
		SMMU_TLB_FLUSH_ASID_MATCH_SHIFT)
#define SMMU_TLB_FLUSH_ASID_MATCH__ENABLE		\
	(SMMU_TLB_FLUSH_ASID_MATCH_ENABLE <<		\
		SMMU_TLB_FLUSH_ASID_MATCH_SHIFT)
#define SMMU_PAGE_SHIFT	12
#define SMMU_PAGE_SIZE	(1 << SMMU_PAGE_SHIFT)
#define SMMU_PAGE_MASK	((1 << SMMU_PAGE_SHIFT) - 1)

#define SMMU_PDIR_COUNT	1024
#define SMMU_PDIR_SIZE	(sizeof(unsigned long) * SMMU_PDIR_COUNT)
#define SMMU_PTBL_COUNT	1024
#define SMMU_PTBL_SIZE	(sizeof(unsigned long) * SMMU_PTBL_COUNT)
#define SMMU_PDIR_SHIFT	12
#define SMMU_PDE_SHIFT	12
#define SMMU_PTE_SHIFT	12
#define SMMU_PFN_MASK	0x000fffff

#define SMMU_ADDR_TO_PFN(addr)	((addr) >> 12)
#define SMMU_ADDR_TO_PDN(addr)	((addr) >> 22)
#define SMMU_PDN_TO_ADDR(pdn)	((pdn) << 22)
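/*
 * Worked example: iova 0x12345000 yields SMMU_ADDR_TO_PDN(iova) == 0x48
 * (index into the 1024-entry page directory) and SMMU_ADDR_TO_PFN(iova)
 * == 0x12345, of which the low 10 bits (0x345) index the 1024-entry
 * page table.
 */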
#define _READABLE	(1 << SMMU_PTB_DATA_ASID_READABLE_SHIFT)
#define _WRITABLE	(1 << SMMU_PTB_DATA_ASID_WRITABLE_SHIFT)
#define _NONSECURE	(1 << SMMU_PTB_DATA_ASID_NONSECURE_SHIFT)
#define _PDE_NEXT	(1 << SMMU_PDE_NEXT_SHIFT)
#define _MASK_ATTR	(_READABLE | _WRITABLE | _NONSECURE)

#define _PDIR_ATTR	(_READABLE | _WRITABLE | _NONSECURE)

#define _PDE_ATTR	(_READABLE | _WRITABLE | _NONSECURE)
#define _PDE_ATTR_N	(_PDE_ATTR | _PDE_NEXT)
#define _PDE_VACANT(pdn)	(((pdn) << 10) | _PDE_ATTR)

#define _PTE_ATTR	(_READABLE | _WRITABLE | _NONSECURE)
#define _PTE_VACANT(addr)	(((addr) >> SMMU_PAGE_SHIFT) | _PTE_ATTR)

#define SMMU_MK_PDIR(page, attr)	\
	((page_to_phys(page) >> SMMU_PDIR_SHIFT) | (attr))
#define SMMU_MK_PDE(page, attr)		\
	(unsigned long)((page_to_phys(page) >> SMMU_PDE_SHIFT) | (attr))
#define SMMU_EX_PTBL_PAGE(pde)		\
	pfn_to_page((unsigned long)(pde) & SMMU_PFN_MASK)
#define SMMU_PFN_TO_PTE(pfn, attr)	(unsigned long)((pfn) | (attr))

#define SMMU_ASID_ENABLE(asid)	((asid) | (1 << 31))
#define SMMU_ASID_DISABLE	0
#define SMMU_ASID_ASID(n)	((n) & ~SMMU_ASID_ENABLE(0))
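/*
 * e.g. SMMU_ASID_ENABLE(1) == 0x80000001: the ASID in the low bits plus
 * the enable bit (31) set, as written to the per-client ASID registers.
 */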
#define NUM_SMMU_REG_BANKS	3

#define smmu_client_enable_hwgrp(c, m)	smmu_client_set_hwgrp(c, m, 1)
#define smmu_client_disable_hwgrp(c)	smmu_client_set_hwgrp(c, 0, 0)
#define __smmu_client_enable_hwgrp(c, m) __smmu_client_set_hwgrp(c, m, 1)
#define __smmu_client_disable_hwgrp(c)	__smmu_client_set_hwgrp(c, 0, 0)

#define HWGRP_INIT(client)	[HWGRP_##client] = SMMU_##client##_ASID

static const u32 smmu_hwgrp_asid_reg[] = {
	HWGRP_INIT(AFI),  HWGRP_INIT(AVPC), HWGRP_INIT(DC),  HWGRP_INIT(DCB),
	HWGRP_INIT(EPP),  HWGRP_INIT(G2),   HWGRP_INIT(HC),  HWGRP_INIT(HDA),
	HWGRP_INIT(ISP),  HWGRP_INIT(MPE),  HWGRP_INIT(NV),  HWGRP_INIT(NV2),
	HWGRP_INIT(PPCS), HWGRP_INIT(SATA), HWGRP_INIT(VDE), HWGRP_INIT(VI),
};
#define HWGRP_ASID_REG(x)	(smmu_hwgrp_asid_reg[x])
/*
 * Per client for address space
 */
struct smmu_client {
	struct device		*dev;
	struct list_head	list;
	struct smmu_as		*as;
	u32			hwgrp;
};

/*
 * Per address space
 */
struct smmu_as {
	struct smmu_device	*smmu;	/* back pointer to container */
	unsigned int		asid;
	spinlock_t		lock;	/* for pagetable */
	struct page		*pdir_page;
	unsigned long		pdir_attr;
	unsigned long		pde_attr;
	unsigned long		pte_attr;
	unsigned int		*pte_count;

	struct list_head	client;
	spinlock_t		client_lock; /* for client list */
};

struct smmu_debugfs_info {
	struct smmu_device *smmu;
	int mc;
	int cache;
};
/*
 * Per SMMU device - IOMMU device
 */
struct smmu_device {
	void __iomem	*regbase;	/* register offset base */
	void __iomem	**regs;		/* register block start address array */
	void __iomem	**rege;		/* register block end address array */
	int		nregs;		/* number of register blocks */

	unsigned long	iovmm_base;	/* remappable base address */
	unsigned long	page_count;	/* total remappable size */
	spinlock_t	lock;
	struct device	*dev;
	struct page	*avp_vector_page;	/* dummy page shared by all AS's */

	/*
	 * Register image savers for suspend/resume
	 */
	unsigned long translation_enable_0;
	unsigned long translation_enable_1;
	unsigned long translation_enable_2;
	unsigned long asid_security;

	struct dentry *debugfs_root;
	struct smmu_debugfs_info *debugfs_info;

	struct device_node *ahb;

	int		num_as;
	struct smmu_as	as[0];		/* Run-time allocated array */
};

static struct smmu_device *smmu_handle; /* unique for a system */
/*
 * SMMU register accessors
 */
static inline bool smmu_valid_reg(struct smmu_device *smmu,
				  void __iomem *addr)
{
	int i;

	for (i = 0; i < smmu->nregs; i++) {
		if (addr < smmu->regs[i])
			break;
		if (addr <= smmu->rege[i])
			return true;
	}
	return false;
}

static inline u32 smmu_read(struct smmu_device *smmu, size_t offs)
{
	void __iomem *addr = smmu->regbase + offs;

	BUG_ON(!smmu_valid_reg(smmu, addr));
	return readl(addr);
}

static inline void smmu_write(struct smmu_device *smmu, u32 val, size_t offs)
{
	void __iomem *addr = smmu->regbase + offs;

	BUG_ON(!smmu_valid_reg(smmu, addr));
	writel(val, addr);
}
#define VA_PAGE_TO_PA(va, page)	\
	(page_to_phys(page) + ((unsigned long)(va) & ~PAGE_MASK))

#define FLUSH_CPU_DCACHE(va, page, size)	\
	do {	\
		unsigned long _pa_ = VA_PAGE_TO_PA(va, page);		\
		__cpuc_flush_dcache_area((void *)(va), (size_t)(size));	\
		outer_flush_range(_pa_, _pa_+(size_t)(size));		\
	} while (0)
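/*
 * The SMMU walks page tables in physical memory, so CPU-side PTE/PDE
 * updates must be cleaned past both the inner (L1) and outer (L2) data
 * caches before the corresponding PTC/TLB entries are flushed.
 */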
/*
 * Any interaction between any block on PPSB and a block on APB or AHB
 * must have these read-back barriers to ensure the APB/AHB bus
 * transaction is complete before initiating activity on the PPSB
 * block.
 */
#define FLUSH_SMMU_REGS(smmu)	smmu_read(smmu, SMMU_CONFIG)

#define smmu_client_hwgrp(c)	(u32)((c)->dev->platform_data)
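/*
 * A client's dev->platform_data carries its HWG_* bitmask, e.g.
 * (HWG_DC | HWG_DCB) for a device behind both display controllers
 * (illustrative).
 */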
static int __smmu_client_set_hwgrp(struct smmu_client *c,
				   unsigned long map, int on)
{
	int i;
	struct smmu_as *as = c->as;
	u32 val, offs, mask = SMMU_ASID_ENABLE(as->asid);
	struct smmu_device *smmu = as->smmu;

	WARN_ON(!on && map);
	if (on && !map)
		return -EINVAL;
	if (!on)
		map = smmu_client_hwgrp(c);

	for_each_set_bit(i, &map, HWGRP_COUNT) {
		offs = HWGRP_ASID_REG(i);
		val = smmu_read(smmu, offs);
		if (on) {
			if (WARN_ON(val & mask))
				goto err_hw_busy;
			val |= mask;
		} else {
			WARN_ON((val & mask) == mask);
			val &= ~mask;
		}
		smmu_write(smmu, val, offs);
	}
	FLUSH_SMMU_REGS(smmu);
	c->hwgrp = map;
	return 0;

err_hw_busy:
	/* Undo the partial enable done above */
	for_each_set_bit(i, &map, HWGRP_COUNT) {
		offs = HWGRP_ASID_REG(i);
		val = smmu_read(smmu, offs);
		val &= ~mask;
		smmu_write(smmu, val, offs);
	}
	return -EBUSY;
}
static int smmu_client_set_hwgrp(struct smmu_client *c, u32 map, int on)
{
	u32 val;
	unsigned long flags;
	struct smmu_as *as = c->as;
	struct smmu_device *smmu = as->smmu;

	spin_lock_irqsave(&smmu->lock, flags);
	val = __smmu_client_set_hwgrp(c, map, on);
	spin_unlock_irqrestore(&smmu->lock, flags);
	return val;
}
/*
 * Flush all TLB entries and all PTC entries
 * Caller must lock smmu
 */
static void smmu_flush_regs(struct smmu_device *smmu, int enable)
{
	u32 val;

	smmu_write(smmu, SMMU_PTC_FLUSH_TYPE_ALL, SMMU_PTC_FLUSH);
	FLUSH_SMMU_REGS(smmu);
	val = SMMU_TLB_FLUSH_VA_MATCH_ALL |
		SMMU_TLB_FLUSH_ASID_MATCH__DISABLE;
	smmu_write(smmu, val, SMMU_TLB_FLUSH);

	if (enable)
		smmu_write(smmu, SMMU_CONFIG_ENABLE, SMMU_CONFIG);
	FLUSH_SMMU_REGS(smmu);
}
static int smmu_setup_regs(struct smmu_device *smmu)
{
	int i;
	u32 val;

	for (i = 0; i < smmu->num_as; i++) {
		struct smmu_as *as = &smmu->as[i];
		struct smmu_client *c;

		smmu_write(smmu, SMMU_PTB_ASID_CUR(as->asid), SMMU_PTB_ASID);
		val = as->pdir_page ?
			SMMU_MK_PDIR(as->pdir_page, as->pdir_attr) :
			SMMU_PTB_DATA_RESET_VAL;
		smmu_write(smmu, val, SMMU_PTB_DATA);

		list_for_each_entry(c, &as->client, list)
			__smmu_client_set_hwgrp(c, c->hwgrp, 1);
	}

	smmu_write(smmu, smmu->translation_enable_0, SMMU_TRANSLATION_ENABLE_0);
	smmu_write(smmu, smmu->translation_enable_1, SMMU_TRANSLATION_ENABLE_1);
	smmu_write(smmu, smmu->translation_enable_2, SMMU_TRANSLATION_ENABLE_2);
	smmu_write(smmu, smmu->asid_security, SMMU_ASID_SECURITY);
	smmu_write(smmu, SMMU_TLB_CONFIG_RESET_VAL, SMMU_CACHE_CONFIG(_TLB));
	smmu_write(smmu, SMMU_PTC_CONFIG_RESET_VAL, SMMU_CACHE_CONFIG(_PTC));

	smmu_flush_regs(smmu, 1);

	return tegra_ahb_enable_smmu(smmu->ahb);
}
static void flush_ptc_and_tlb(struct smmu_device *smmu,
			      struct smmu_as *as, dma_addr_t iova,
			      unsigned long *pte, struct page *page, int is_pde)
{
	u32 val;
	unsigned long tlb_flush_va = is_pde
		? SMMU_TLB_FLUSH_VA(iova, SECTION)
		: SMMU_TLB_FLUSH_VA(iova, GROUP);

	val = SMMU_PTC_FLUSH_TYPE_ADR | VA_PAGE_TO_PA(pte, page);
	smmu_write(smmu, val, SMMU_PTC_FLUSH);
	FLUSH_SMMU_REGS(smmu);
	val = tlb_flush_va |
		SMMU_TLB_FLUSH_ASID_MATCH__ENABLE |
		(as->asid << SMMU_TLB_FLUSH_ASID_SHIFT);
	smmu_write(smmu, val, SMMU_TLB_FLUSH);
	FLUSH_SMMU_REGS(smmu);
}
static void free_ptbl(struct smmu_as *as, dma_addr_t iova)
{
	unsigned long pdn = SMMU_ADDR_TO_PDN(iova);
	unsigned long *pdir = (unsigned long *)page_address(as->pdir_page);

	if (pdir[pdn] != _PDE_VACANT(pdn)) {
		dev_dbg(as->smmu->dev, "pdn: %lx\n", pdn);

		ClearPageReserved(SMMU_EX_PTBL_PAGE(pdir[pdn]));
		__free_page(SMMU_EX_PTBL_PAGE(pdir[pdn]));
		pdir[pdn] = _PDE_VACANT(pdn);
		FLUSH_CPU_DCACHE(&pdir[pdn], as->pdir_page, sizeof pdir[pdn]);
		flush_ptc_and_tlb(as->smmu, as, iova, &pdir[pdn],
				  as->pdir_page, 1);
	}
}
static void free_pdir(struct smmu_as *as)
{
	unsigned addr;
	int count;
	struct device *dev = as->smmu->dev;

	if (!as->pdir_page)
		return;

	addr = as->smmu->iovmm_base;
	count = as->smmu->page_count;
	while (count-- > 0) {
		free_ptbl(as, addr);
		addr += SMMU_PAGE_SIZE * SMMU_PTBL_COUNT;
	}
	ClearPageReserved(as->pdir_page);
	__free_page(as->pdir_page);
	as->pdir_page = NULL;
	devm_kfree(dev, as->pte_count);
	as->pte_count = NULL;
}
/*
 * Maps PTBL for given iova and returns the PTE address
 * Caller must unmap the mapped PTBL returned in *ptbl_page_p
 */
static unsigned long *locate_pte(struct smmu_as *as,
				 dma_addr_t iova, bool allocate,
				 struct page **ptbl_page_p,
				 unsigned int **count)
{
	unsigned long ptn = SMMU_ADDR_TO_PFN(iova);
	unsigned long pdn = SMMU_ADDR_TO_PDN(iova);
	unsigned long *pdir = page_address(as->pdir_page);
	unsigned long *ptbl;

	if (pdir[pdn] != _PDE_VACANT(pdn)) {
		/* Mapped entry table already exists */
		*ptbl_page_p = SMMU_EX_PTBL_PAGE(pdir[pdn]);
		ptbl = page_address(*ptbl_page_p);
	} else if (!allocate) {
		return NULL;
	} else {
		int pn;
		unsigned long addr = SMMU_PDN_TO_ADDR(pdn);

		/* Vacant - allocate a new page table */
		dev_dbg(as->smmu->dev, "New PTBL pdn: %lx\n", pdn);

		*ptbl_page_p = alloc_page(GFP_ATOMIC);
		if (!*ptbl_page_p) {
			dev_err(as->smmu->dev,
				"failed to allocate smmu_device page table\n");
			return NULL;
		}
		SetPageReserved(*ptbl_page_p);
		ptbl = (unsigned long *)page_address(*ptbl_page_p);
		for (pn = 0; pn < SMMU_PTBL_COUNT;
		     pn++, addr += SMMU_PAGE_SIZE) {
			ptbl[pn] = _PTE_VACANT(addr);
		}
		FLUSH_CPU_DCACHE(ptbl, *ptbl_page_p, SMMU_PTBL_SIZE);
		pdir[pdn] = SMMU_MK_PDE(*ptbl_page_p,
					as->pde_attr | _PDE_NEXT);
		FLUSH_CPU_DCACHE(&pdir[pdn], as->pdir_page, sizeof pdir[pdn]);
		flush_ptc_and_tlb(as->smmu, as, iova, &pdir[pdn],
				  as->pdir_page, 1);
	}
	*count = &as->pte_count[pdn];

	return &ptbl[ptn % SMMU_PTBL_COUNT];
}
#ifdef CONFIG_SMMU_SIG_DEBUG
static void put_signature(struct smmu_as *as,
			  dma_addr_t iova, unsigned long pfn)
{
	struct page *page;
	unsigned long *vaddr;

	page = pfn_to_page(pfn);
	vaddr = page_address(page);
	if (!vaddr)
		return;

	vaddr[0] = iova;
	vaddr[1] = pfn << PAGE_SHIFT;
	FLUSH_CPU_DCACHE(vaddr, page, sizeof(vaddr[0]) * 2);
}
#else
static inline void put_signature(struct smmu_as *as,
				 dma_addr_t iova, unsigned long pfn)
{
}
#endif
/*
 * Caller must not hold as->lock
 */
static int alloc_pdir(struct smmu_as *as)
{
	unsigned long *pdir, flags;
	int pdn, err = 0;
	u32 val;
	struct smmu_device *smmu = as->smmu;
	struct page *page;
	unsigned int *cnt;

	/*
	 * do the allocation, then grab as->lock
	 */
	cnt = devm_kzalloc(smmu->dev,
			   sizeof(cnt[0]) * SMMU_PDIR_COUNT,
			   GFP_KERNEL);
	page = alloc_page(GFP_KERNEL | __GFP_DMA);

	spin_lock_irqsave(&as->lock, flags);

	if (as->pdir_page) {
		/* We raced, free the redundant */
		err = -EAGAIN;
		goto err_out;
	}
	if (!page || !cnt) {
		dev_err(smmu->dev, "failed to allocate at %s\n", __func__);
		err = -ENOMEM;
		goto err_out;
	}

	as->pdir_page = page;
	as->pte_count = cnt;

	SetPageReserved(as->pdir_page);
	pdir = page_address(as->pdir_page);

	for (pdn = 0; pdn < SMMU_PDIR_COUNT; pdn++)
		pdir[pdn] = _PDE_VACANT(pdn);
	FLUSH_CPU_DCACHE(pdir, as->pdir_page, SMMU_PDIR_SIZE);
	val = SMMU_PTC_FLUSH_TYPE_ADR | VA_PAGE_TO_PA(pdir, as->pdir_page);
	smmu_write(smmu, val, SMMU_PTC_FLUSH);
	FLUSH_SMMU_REGS(as->smmu);
	val = SMMU_TLB_FLUSH_VA_MATCH_ALL |
		SMMU_TLB_FLUSH_ASID_MATCH__ENABLE |
		(as->asid << SMMU_TLB_FLUSH_ASID_SHIFT);
	smmu_write(smmu, val, SMMU_TLB_FLUSH);
	FLUSH_SMMU_REGS(as->smmu);

	spin_unlock_irqrestore(&as->lock, flags);
	return 0;

err_out:
	spin_unlock_irqrestore(&as->lock, flags);

	devm_kfree(smmu->dev, cnt);
	if (page)
		__free_page(page);
	return err;
}
static void __smmu_iommu_unmap(struct smmu_as *as, dma_addr_t iova)
{
	unsigned long *pte;
	struct page *page;
	unsigned int *count;

	pte = locate_pte(as, iova, false, &page, &count);
	if (WARN_ON(!pte))
		return;

	if (WARN_ON(*pte == _PTE_VACANT(iova)))
		return;

	*pte = _PTE_VACANT(iova);
	FLUSH_CPU_DCACHE(pte, page, sizeof(*pte));
	flush_ptc_and_tlb(as->smmu, as, iova, pte, page, 0);
	if (!--(*count))
		free_ptbl(as, iova);
}
static void __smmu_iommu_map_pfn(struct smmu_as *as, dma_addr_t iova,
				 unsigned long pfn)
{
	struct smmu_device *smmu = as->smmu;
	unsigned long *pte;
	unsigned int *count;
	struct page *page;

	pte = locate_pte(as, iova, true, &page, &count);
	if (WARN_ON(!pte))
		return;

	if (*pte == _PTE_VACANT(iova))
		(*count)++;
	*pte = SMMU_PFN_TO_PTE(pfn, as->pte_attr);
	if (unlikely((*pte == _PTE_VACANT(iova))))
		(*count)--;
	FLUSH_CPU_DCACHE(pte, page, sizeof(*pte));
	flush_ptc_and_tlb(smmu, as, iova, pte, page, 0);
	put_signature(as, iova, pfn);
}
static int smmu_iommu_map(struct iommu_domain *domain, unsigned long iova,
			  phys_addr_t pa, size_t bytes, int prot)
{
	struct smmu_as *as = domain->priv;
	unsigned long pfn = __phys_to_pfn(pa);
	unsigned long flags;

	dev_dbg(as->smmu->dev, "[%d] %08lx:%08x\n", as->asid, iova, (u32)pa);

	if (!pfn_valid(pfn))
		return -ENOMEM;

	spin_lock_irqsave(&as->lock, flags);
	__smmu_iommu_map_pfn(as, iova, pfn);
	spin_unlock_irqrestore(&as->lock, flags);
	return 0;
}
static size_t smmu_iommu_unmap(struct iommu_domain *domain, unsigned long iova,
			       size_t bytes)
{
	struct smmu_as *as = domain->priv;
	unsigned long flags;

	dev_dbg(as->smmu->dev, "[%d] %08lx\n", as->asid, iova);

	spin_lock_irqsave(&as->lock, flags);
	__smmu_iommu_unmap(as, iova);
	spin_unlock_irqrestore(&as->lock, flags);
	return SMMU_PAGE_SIZE;
}
static phys_addr_t smmu_iommu_iova_to_phys(struct iommu_domain *domain,
					   unsigned long iova)
{
	struct smmu_as *as = domain->priv;
	unsigned long *pte;
	unsigned int *count;
	struct page *page;
	unsigned long pfn;
	unsigned long flags;

	spin_lock_irqsave(&as->lock, flags);

	pte = locate_pte(as, iova, true, &page, &count);
	pfn = *pte & SMMU_PFN_MASK;
	WARN_ON(!pfn_valid(pfn));
	dev_dbg(as->smmu->dev,
		"iova:%08lx pfn:%08lx asid:%d\n", iova, pfn, as->asid);

	spin_unlock_irqrestore(&as->lock, flags);
	return PFN_PHYS(pfn);
}
static int smmu_iommu_domain_has_cap(struct iommu_domain *domain,
				     unsigned long cap)
{
	return 0;
}
static int smmu_iommu_attach_dev(struct iommu_domain *domain,
				 struct device *dev)
{
	struct smmu_as *as = domain->priv;
	struct smmu_device *smmu = as->smmu;
	struct smmu_client *client, *c;
	u32 map;
	int err;

	client = devm_kzalloc(smmu->dev, sizeof(*c), GFP_KERNEL);
	if (!client)
		return -ENOMEM;
	client->dev = dev;
	client->as = as;
	map = (unsigned long)dev->platform_data;
	if (!map)
		return -EINVAL;

	err = smmu_client_enable_hwgrp(client, map);
	if (err)
		goto err_hwgrp;

	spin_lock(&as->client_lock);
	list_for_each_entry(c, &as->client, list) {
		if (c->dev == dev) {
			dev_err(smmu->dev,
				"%s is already attached\n", dev_name(c->dev));
			err = -EINVAL;
			goto err_client;
		}
	}
	list_add(&client->list, &as->client);
	spin_unlock(&as->client_lock);

	/*
	 * Reserve "page zero" for AVP vectors using a common dummy
	 * page.
	 */
	if (map & HWG_AVPC) {
		struct page *page;

		page = as->smmu->avp_vector_page;
		__smmu_iommu_map_pfn(as, 0, page_to_pfn(page));

		pr_info("Reserve \"page zero\" for AVP vectors using a common dummy\n");
	}

	dev_dbg(smmu->dev, "%s is attached\n", dev_name(dev));
	return 0;

err_client:
	smmu_client_disable_hwgrp(client);
	spin_unlock(&as->client_lock);
err_hwgrp:
	devm_kfree(smmu->dev, client);
	return err;
}
static void smmu_iommu_detach_dev(struct iommu_domain *domain,
				  struct device *dev)
{
	struct smmu_as *as = domain->priv;
	struct smmu_device *smmu = as->smmu;
	struct smmu_client *c;

	spin_lock(&as->client_lock);

	list_for_each_entry(c, &as->client, list) {
		if (c->dev == dev) {
			smmu_client_disable_hwgrp(c);
			list_del(&c->list);
			c->as = NULL;
			dev_dbg(smmu->dev,
				"%s is detached\n", dev_name(c->dev));
			/* free only after the last use of c above */
			devm_kfree(smmu->dev, c);
			goto out;
		}
	}
	dev_err(smmu->dev, "Couldn't find %s\n", dev_name(dev));
out:
	spin_unlock(&as->client_lock);
}
static int smmu_iommu_domain_init(struct iommu_domain *domain)
{
	int i, err = -EAGAIN;
	unsigned long flags;
	struct smmu_as *as;
	struct smmu_device *smmu = smmu_handle;

	/* Look for a free AS with lock held */
	for (i = 0; i < smmu->num_as; i++) {
		as = &smmu->as[i];

		if (as->pdir_page)
			continue;

		err = alloc_pdir(as);
		if (!err)
			goto found;

		if (err != -EAGAIN)
			break;
	}
	if (i == smmu->num_as)
		dev_err(smmu->dev, "no free AS\n");
	return err;

found:
	spin_lock_irqsave(&smmu->lock, flags);

	/* Update PDIR register */
	smmu_write(smmu, SMMU_PTB_ASID_CUR(as->asid), SMMU_PTB_ASID);
	smmu_write(smmu,
		   SMMU_MK_PDIR(as->pdir_page, as->pdir_attr), SMMU_PTB_DATA);
	FLUSH_SMMU_REGS(smmu);

	spin_unlock_irqrestore(&smmu->lock, flags);

	domain->priv = as;

	domain->geometry.aperture_start = smmu->iovmm_base;
	domain->geometry.aperture_end   = smmu->iovmm_base +
		smmu->page_count * SMMU_PAGE_SIZE - 1;
	domain->geometry.force_aperture = true;

	dev_dbg(smmu->dev, "smmu_as@%p\n", as);

	return 0;
}
static void smmu_iommu_domain_destroy(struct iommu_domain *domain)
{
	struct smmu_as *as = domain->priv;
	struct smmu_device *smmu = as->smmu;
	unsigned long flags;

	spin_lock_irqsave(&as->lock, flags);

	if (as->pdir_page) {
		spin_lock(&smmu->lock);
		smmu_write(smmu, SMMU_PTB_ASID_CUR(as->asid), SMMU_PTB_ASID);
		smmu_write(smmu, SMMU_PTB_DATA_RESET_VAL, SMMU_PTB_DATA);
		FLUSH_SMMU_REGS(smmu);
		spin_unlock(&smmu->lock);

		free_pdir(as);
	}

	if (!list_empty(&as->client)) {
		struct smmu_client *c, *tmp;

		/* detach_dev deletes list entries; use the _safe iterator */
		list_for_each_entry_safe(c, tmp, &as->client, list)
			smmu_iommu_detach_dev(domain, c->dev);
	}

	spin_unlock_irqrestore(&as->lock, flags);

	domain->priv = NULL;
	dev_dbg(smmu->dev, "smmu_as@%p\n", as);
}
static struct iommu_ops smmu_iommu_ops = {
	.domain_init	= smmu_iommu_domain_init,
	.domain_destroy	= smmu_iommu_domain_destroy,
	.attach_dev	= smmu_iommu_attach_dev,
	.detach_dev	= smmu_iommu_detach_dev,
	.map		= smmu_iommu_map,
	.unmap		= smmu_iommu_unmap,
	.iova_to_phys	= smmu_iommu_iova_to_phys,
	.domain_has_cap	= smmu_iommu_domain_has_cap,
	.pgsize_bitmap	= SMMU_IOMMU_PGSIZES,
};
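/*
 * A client driver exercises these ops through the generic IOMMU API,
 * roughly (illustrative sketch):
 *
 *	struct iommu_domain *domain = iommu_domain_alloc(&platform_bus_type);
 *
 *	iommu_attach_device(domain, dev);
 *	iommu_map(domain, iova, pa, SZ_4K, IOMMU_READ | IOMMU_WRITE);
 */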
/* Should be in the order of enum */
static const char * const smmu_debugfs_mc[] = { "mc", };
static const char * const smmu_debugfs_cache[] = { "tlb", "ptc", };
static ssize_t smmu_debugfs_stats_write(struct file *file,
					const char __user *buffer,
					size_t count, loff_t *pos)
{
	struct smmu_debugfs_info *info;
	struct smmu_device *smmu;
	struct dentry *dent;
	int i;
	enum { _OFF = 0, _ON, _RESET, };
	const char * const command[] = {
		[_OFF]		= "off",
		[_ON]		= "on",
		[_RESET]	= "reset",
	};
	char str[] = "reset";
	u32 val;
	size_t offs;

	count = min_t(size_t, count, sizeof(str));
	if (copy_from_user(str, buffer, count))
		return -EINVAL;

	for (i = 0; i < ARRAY_SIZE(command); i++)
		if (strncmp(str, command[i],
			    strlen(command[i])) == 0)
			break;

	if (i == ARRAY_SIZE(command))
		return -EINVAL;

	dent = file->f_dentry;
	info = dent->d_inode->i_private;
	smmu = info->smmu;

	offs = SMMU_CACHE_CONFIG(info->cache);
	val = smmu_read(smmu, offs);
	switch (i) {
	case _OFF:
		val &= ~SMMU_CACHE_CONFIG_STATS_ENABLE;
		val &= ~SMMU_CACHE_CONFIG_STATS_TEST;
		smmu_write(smmu, val, offs);
		break;
	case _ON:
		val |= SMMU_CACHE_CONFIG_STATS_ENABLE;
		val &= ~SMMU_CACHE_CONFIG_STATS_TEST;
		smmu_write(smmu, val, offs);
		break;
	case _RESET:
		/* Pulse the TEST bit to reset the hit/miss counters */
		val |= SMMU_CACHE_CONFIG_STATS_TEST;
		smmu_write(smmu, val, offs);
		val &= ~SMMU_CACHE_CONFIG_STATS_TEST;
		smmu_write(smmu, val, offs);
		break;
	default:
		BUG();
		break;
	}

	dev_dbg(smmu->dev, "%s() %08x, %08x @%08x\n", __func__,
		val, smmu_read(smmu, offs), offs);

	return count;
}
static int smmu_debugfs_stats_show(struct seq_file *s, void *v)
{
	struct smmu_debugfs_info *info;
	struct smmu_device *smmu;
	struct dentry *dent;
	int i;
	const char * const stats[] = { "hit", "miss", };

	dent = d_find_alias(s->private);
	info = dent->d_inode->i_private;
	smmu = info->smmu;

	for (i = 0; i < ARRAY_SIZE(stats); i++) {
		u32 val;
		size_t offs;

		offs = SMMU_STATS_CACHE_COUNT(info->mc, info->cache, i);
		val = smmu_read(smmu, offs);
		seq_printf(s, "%s:%08x ", stats[i], val);

		dev_dbg(smmu->dev, "%s() %s %08x @%08x\n", __func__,
			stats[i], val, offs);
	}
	seq_printf(s, "\n");
	dput(dent);

	return 0;
}
static int smmu_debugfs_stats_open(struct inode *inode, struct file *file)
{
	return single_open(file, smmu_debugfs_stats_show, inode);
}

static const struct file_operations smmu_debugfs_stats_fops = {
	.open		= smmu_debugfs_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
	.write		= smmu_debugfs_stats_write,
};
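/*
 * The stats files appear under debugfs, e.g. (illustrative paths)
 * /sys/kernel/debug/<smmu-dev>/mc/{tlb,ptc}; writing "on", "off" or
 * "reset" controls the counters and reading prints "hit:... miss:...".
 */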
static void smmu_debugfs_delete(struct smmu_device *smmu)
{
	debugfs_remove_recursive(smmu->debugfs_root);
	kfree(smmu->debugfs_info);
}
static void smmu_debugfs_create(struct smmu_device *smmu)
{
	int i;
	size_t bytes;
	struct dentry *root;

	bytes = ARRAY_SIZE(smmu_debugfs_mc) * ARRAY_SIZE(smmu_debugfs_cache) *
		sizeof(*smmu->debugfs_info);
	smmu->debugfs_info = kmalloc(bytes, GFP_KERNEL);
	if (!smmu->debugfs_info)
		return;

	root = debugfs_create_dir(dev_name(smmu->dev), NULL);
	if (!root)
		goto err_out;
	smmu->debugfs_root = root;

	for (i = 0; i < ARRAY_SIZE(smmu_debugfs_mc); i++) {
		int j;
		struct dentry *mc;

		mc = debugfs_create_dir(smmu_debugfs_mc[i], root);
		if (!mc)
			goto err_out;

		for (j = 0; j < ARRAY_SIZE(smmu_debugfs_cache); j++) {
			struct dentry *cache;
			struct smmu_debugfs_info *info;

			info = smmu->debugfs_info;
			/* 2D [mc][cache] layout: stride is the cache count */
			info += i * ARRAY_SIZE(smmu_debugfs_cache) + j;
			info->smmu = smmu;
			info->mc = i;
			info->cache = j;

			cache = debugfs_create_file(smmu_debugfs_cache[j],
						    S_IWUGO | S_IRUGO, mc,
						    (void *)info,
						    &smmu_debugfs_stats_fops);
			if (!cache)
				goto err_out;
		}
	}

	return;

err_out:
	smmu_debugfs_delete(smmu);
}
static int tegra_smmu_suspend(struct device *dev)
{
	struct smmu_device *smmu = dev_get_drvdata(dev);

	smmu->translation_enable_0 = smmu_read(smmu, SMMU_TRANSLATION_ENABLE_0);
	smmu->translation_enable_1 = smmu_read(smmu, SMMU_TRANSLATION_ENABLE_1);
	smmu->translation_enable_2 = smmu_read(smmu, SMMU_TRANSLATION_ENABLE_2);
	smmu->asid_security = smmu_read(smmu, SMMU_ASID_SECURITY);
	return 0;
}
static int tegra_smmu_resume(struct device *dev)
{
	struct smmu_device *smmu = dev_get_drvdata(dev);
	unsigned long flags;
	int err;

	spin_lock_irqsave(&smmu->lock, flags);
	err = smmu_setup_regs(smmu);
	spin_unlock_irqrestore(&smmu->lock, flags);
	return err;
}
static int tegra_smmu_probe(struct platform_device *pdev)
{
	struct smmu_device *smmu;
	struct device *dev = &pdev->dev;
	int i, asids, err = 0;
	dma_addr_t uninitialized_var(base);
	size_t bytes, uninitialized_var(size);

	if (smmu_handle)
		return -EIO;

	BUILD_BUG_ON(PAGE_SHIFT != SMMU_PAGE_SHIFT);

	if (of_property_read_u32(dev->of_node, "nvidia,#asids", &asids))
		return -ENODEV;

	bytes = sizeof(*smmu) + asids * sizeof(*smmu->as);
	smmu = devm_kzalloc(dev, bytes, GFP_KERNEL);
	if (!smmu) {
		dev_err(dev, "failed to allocate smmu_device\n");
		return -ENOMEM;
	}

	smmu->nregs = pdev->num_resources;
	smmu->regs = devm_kzalloc(dev, 2 * smmu->nregs * sizeof(*smmu->regs),
				  GFP_KERNEL);
	smmu->rege = smmu->regs + smmu->nregs;
	if (!smmu->regs)
		return -ENOMEM;
	for (i = 0; i < smmu->nregs; i++) {
		struct resource *res;

		res = platform_get_resource(pdev, IORESOURCE_MEM, i);
		if (!res)
			return -ENODEV;
		smmu->regs[i] = devm_request_and_ioremap(&pdev->dev, res);
		if (!smmu->regs[i])
			return -EBUSY;
		smmu->rege[i] = smmu->regs[i] + resource_size(res) - 1;
	}
	/* Same as "mc" 1st register block start address */
	smmu->regbase = (void __iomem *)((u32)smmu->regs[0] & PAGE_MASK);

	err = of_get_dma_window(dev->of_node, NULL, 0, NULL, &base, &size);
	if (err)
		return -ENODEV;

	if (size & SMMU_PAGE_MASK)
		return -EINVAL;

	size >>= SMMU_PAGE_SHIFT;
	if (!size)
		return -EINVAL;

	smmu->ahb = of_parse_phandle(dev->of_node, "nvidia,ahb", 0);
	if (!smmu->ahb)
		return -ENODEV;

	smmu->dev = dev;
	smmu->num_as = asids;
	smmu->iovmm_base = base;
	smmu->page_count = size;

	smmu->translation_enable_0 = ~0;
	smmu->translation_enable_1 = ~0;
	smmu->translation_enable_2 = ~0;
	smmu->asid_security = 0;

	for (i = 0; i < smmu->num_as; i++) {
		struct smmu_as *as = &smmu->as[i];

		as->smmu = smmu;
		as->asid = i;
		as->pdir_attr = _PDIR_ATTR;
		as->pde_attr = _PDE_ATTR;
		as->pte_attr = _PTE_ATTR;

		spin_lock_init(&as->lock);
		spin_lock_init(&as->client_lock);
		INIT_LIST_HEAD(&as->client);
	}
	spin_lock_init(&smmu->lock);
	err = smmu_setup_regs(smmu);
	if (err)
		return err;
	platform_set_drvdata(pdev, smmu);

	smmu->avp_vector_page = alloc_page(GFP_KERNEL);
	if (!smmu->avp_vector_page)
		return -ENOMEM;

	smmu_debugfs_create(smmu);
	smmu_handle = smmu;
	bus_set_iommu(&platform_bus_type, &smmu_iommu_ops);
	return 0;
}
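/*
 * A matching device tree node looks roughly like (illustrative values):
 *
 *	smmu {
 *		compatible = "nvidia,tegra30-smmu";
 *		reg = <0x7000f010 0x02c>,
 *		      <0x7000f1f0 0x010>,
 *		      <0x7000f228 0x05c>;
 *		nvidia,#asids = <4>;
 *		dma-window = <0 0x40000000>;	// IOVA start & length
 *		nvidia,ahb = <&ahb>;
 *	};
 */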
static int tegra_smmu_remove(struct platform_device *pdev)
{
	struct smmu_device *smmu = platform_get_drvdata(pdev);
	int i;

	smmu_debugfs_delete(smmu);

	smmu_write(smmu, SMMU_CONFIG_DISABLE, SMMU_CONFIG);
	for (i = 0; i < smmu->num_as; i++)
		free_pdir(&smmu->as[i]);
	__free_page(smmu->avp_vector_page);
	smmu_handle = NULL;
	return 0;
}
const struct dev_pm_ops tegra_smmu_pm_ops = {
	.suspend	= tegra_smmu_suspend,
	.resume		= tegra_smmu_resume,
};
static struct of_device_id tegra_smmu_of_match[] = {
	{ .compatible = "nvidia,tegra30-smmu", },
	{ },
};
MODULE_DEVICE_TABLE(of, tegra_smmu_of_match);
static struct platform_driver tegra_smmu_driver = {
	.probe		= tegra_smmu_probe,
	.remove		= tegra_smmu_remove,
	.driver = {
		.owner	= THIS_MODULE,
		.name	= "tegra-smmu",
		.pm	= &tegra_smmu_pm_ops,
		.of_match_table = of_match_ptr(tegra_smmu_of_match),
	},
};
static int tegra_smmu_init(void)
{
	return platform_driver_register(&tegra_smmu_driver);
}

static void __exit tegra_smmu_exit(void)
{
	platform_driver_unregister(&tegra_smmu_driver);
}

subsys_initcall(tegra_smmu_init);
module_exit(tegra_smmu_exit);
MODULE_DESCRIPTION("IOMMU API for SMMU in Tegra30");
MODULE_AUTHOR("Hiroshi DOYU <hdoyu@nvidia.com>");
MODULE_ALIAS("platform:tegra-smmu");
MODULE_LICENSE("GPL v2");