1 /* Copyright (c) 2010-2011, Code Aurora Forum. All rights reserved.
3 * This program is free software; you can redistribute it and/or modify
4 * it under the terms of the GNU General Public License version 2 and
5 * only version 2 as published by the Free Software Foundation.
7 * This program is distributed in the hope that it will be useful,
8 * but WITHOUT ANY WARRANTY; without even the implied warranty of
9 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10 * GNU General Public License for more details.
12 * You should have received a copy of the GNU General Public License
13 * along with this program; if not, write to the Free Software
14 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
18 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19 #include <linux/kernel.h>
20 #include <linux/module.h>
21 #include <linux/platform_device.h>
22 #include <linux/errno.h>
24 #include <linux/interrupt.h>
25 #include <linux/list.h>
26 #include <linux/spinlock.h>
27 #include <linux/slab.h>
28 #include <linux/iommu.h>
29 #include <linux/clk.h>
31 #include <asm/cacheflush.h>
32 #include <asm/sizes.h>
34 #include "msm_iommu_hw-8xxx.h"
35 #include "msm_iommu.h"
37 #define MRC(reg, processor, op1, crn, crm, op2) \
38 __asm__ __volatile__ ( \
39 " mrc " #processor "," #op1 ", %0," #crn "," #crm "," #op2 "\n" \
42 #define RCP15_PRRR(reg) MRC(reg, p15, 0, c10, c2, 0)
43 #define RCP15_NMRR(reg) MRC(reg, p15, 0, c10, c2, 1)
45 /* bitmap of the page sizes currently supported */
46 #define MSM_IOMMU_PGSIZES (SZ_4K | SZ_64K | SZ_1M | SZ_16M)
48 static int msm_iommu_tex_class[4];
50 DEFINE_SPINLOCK(msm_iommu_lock);
53 unsigned long *pgtable;
54 struct list_head list_attached;
55 struct iommu_domain domain;
58 static struct msm_priv *to_msm_priv(struct iommu_domain *dom)
60 return container_of(dom, struct msm_priv, domain);
63 static int __enable_clocks(struct msm_iommu_drvdata *drvdata)
67 ret = clk_enable(drvdata->pclk);
72 ret = clk_enable(drvdata->clk);
74 clk_disable(drvdata->pclk);
80 static void __disable_clocks(struct msm_iommu_drvdata *drvdata)
82 clk_disable(drvdata->clk);
83 clk_disable(drvdata->pclk);
86 static int __flush_iotlb(struct iommu_domain *domain)
88 struct msm_priv *priv = to_msm_priv(domain);
89 struct msm_iommu_drvdata *iommu_drvdata;
90 struct msm_iommu_ctx_drvdata *ctx_drvdata;
92 #ifndef CONFIG_IOMMU_PGTABLES_L2
93 unsigned long *fl_table = priv->pgtable;
96 if (!list_empty(&priv->list_attached)) {
97 dmac_flush_range(fl_table, fl_table + SZ_16K);
99 for (i = 0; i < NUM_FL_PTE; i++)
100 if ((fl_table[i] & 0x03) == FL_TYPE_TABLE) {
101 void *sl_table = __va(fl_table[i] &
103 dmac_flush_range(sl_table, sl_table + SZ_4K);
108 list_for_each_entry(ctx_drvdata, &priv->list_attached, attached_elm) {
110 BUG_ON(!ctx_drvdata->pdev || !ctx_drvdata->pdev->dev.parent);
112 iommu_drvdata = dev_get_drvdata(ctx_drvdata->pdev->dev.parent);
113 BUG_ON(!iommu_drvdata);
115 ret = __enable_clocks(iommu_drvdata);
119 SET_CTX_TLBIALL(iommu_drvdata->base, ctx_drvdata->num, 0);
120 __disable_clocks(iommu_drvdata);
126 static void __reset_context(void __iomem *base, int ctx)
128 SET_BPRCOSH(base, ctx, 0);
129 SET_BPRCISH(base, ctx, 0);
130 SET_BPRCNSH(base, ctx, 0);
131 SET_BPSHCFG(base, ctx, 0);
132 SET_BPMTCFG(base, ctx, 0);
133 SET_ACTLR(base, ctx, 0);
134 SET_SCTLR(base, ctx, 0);
135 SET_FSRRESTORE(base, ctx, 0);
136 SET_TTBR0(base, ctx, 0);
137 SET_TTBR1(base, ctx, 0);
138 SET_TTBCR(base, ctx, 0);
139 SET_BFBCR(base, ctx, 0);
140 SET_PAR(base, ctx, 0);
141 SET_FAR(base, ctx, 0);
142 SET_CTX_TLBIALL(base, ctx, 0);
143 SET_TLBFLPTER(base, ctx, 0);
144 SET_TLBSLPTER(base, ctx, 0);
145 SET_TLBLKCR(base, ctx, 0);
146 SET_PRRR(base, ctx, 0);
147 SET_NMRR(base, ctx, 0);
150 static void __program_context(void __iomem *base, int ctx, phys_addr_t pgtable)
152 unsigned int prrr, nmrr;
153 __reset_context(base, ctx);
155 /* Set up HTW mode */
156 /* TLB miss configuration: perform HTW on miss */
157 SET_TLBMCFG(base, ctx, 0x3);
159 /* V2P configuration: HTW for access */
160 SET_V2PCFG(base, ctx, 0x3);
162 SET_TTBCR(base, ctx, 0);
163 SET_TTBR0_PA(base, ctx, (pgtable >> 14));
165 /* Invalidate the TLB for this context */
166 SET_CTX_TLBIALL(base, ctx, 0);
168 /* Set interrupt number to "secure" interrupt */
169 SET_IRPTNDX(base, ctx, 0);
171 /* Enable context fault interrupt */
172 SET_CFEIE(base, ctx, 1);
174 /* Stall access on a context fault and let the handler deal with it */
175 SET_CFCFG(base, ctx, 1);
177 /* Redirect all cacheable requests to L2 slave port. */
178 SET_RCISH(base, ctx, 1);
179 SET_RCOSH(base, ctx, 1);
180 SET_RCNSH(base, ctx, 1);
182 /* Turn on TEX Remap */
183 SET_TRE(base, ctx, 1);
185 /* Set TEX remap attributes */
188 SET_PRRR(base, ctx, prrr);
189 SET_NMRR(base, ctx, nmrr);
191 /* Turn on BFB prefetch */
192 SET_BFBDFE(base, ctx, 1);
194 #ifdef CONFIG_IOMMU_PGTABLES_L2
195 /* Configure page tables as inner-cacheable and shareable to reduce
196 * the TLB miss penalty.
198 SET_TTBR0_SH(base, ctx, 1);
199 SET_TTBR1_SH(base, ctx, 1);
201 SET_TTBR0_NOS(base, ctx, 1);
202 SET_TTBR1_NOS(base, ctx, 1);
204 SET_TTBR0_IRGNH(base, ctx, 0); /* WB, WA */
205 SET_TTBR0_IRGNL(base, ctx, 1);
207 SET_TTBR1_IRGNH(base, ctx, 0); /* WB, WA */
208 SET_TTBR1_IRGNL(base, ctx, 1);
210 SET_TTBR0_ORGN(base, ctx, 1); /* WB, WA */
211 SET_TTBR1_ORGN(base, ctx, 1); /* WB, WA */
218 static struct iommu_domain *msm_iommu_domain_alloc(unsigned type)
220 struct msm_priv *priv;
222 if (type != IOMMU_DOMAIN_UNMANAGED)
225 priv = kzalloc(sizeof(*priv), GFP_KERNEL);
229 INIT_LIST_HEAD(&priv->list_attached);
230 priv->pgtable = (unsigned long *)__get_free_pages(GFP_KERNEL,
236 memset(priv->pgtable, 0, SZ_16K);
238 priv->domain.geometry.aperture_start = 0;
239 priv->domain.geometry.aperture_end = (1ULL << 32) - 1;
240 priv->domain.geometry.force_aperture = true;
242 return &priv->domain;
249 static void msm_iommu_domain_free(struct iommu_domain *domain)
251 struct msm_priv *priv;
253 unsigned long *fl_table;
256 spin_lock_irqsave(&msm_iommu_lock, flags);
257 priv = to_msm_priv(domain);
259 fl_table = priv->pgtable;
261 for (i = 0; i < NUM_FL_PTE; i++)
262 if ((fl_table[i] & 0x03) == FL_TYPE_TABLE)
263 free_page((unsigned long) __va(((fl_table[i]) &
266 free_pages((unsigned long)priv->pgtable, get_order(SZ_16K));
267 priv->pgtable = NULL;
270 spin_unlock_irqrestore(&msm_iommu_lock, flags);
273 static int msm_iommu_attach_dev(struct iommu_domain *domain, struct device *dev)
275 struct msm_priv *priv;
276 struct msm_iommu_ctx_dev *ctx_dev;
277 struct msm_iommu_drvdata *iommu_drvdata;
278 struct msm_iommu_ctx_drvdata *ctx_drvdata;
279 struct msm_iommu_ctx_drvdata *tmp_drvdata;
283 spin_lock_irqsave(&msm_iommu_lock, flags);
285 priv = to_msm_priv(domain);
292 iommu_drvdata = dev_get_drvdata(dev->parent);
293 ctx_drvdata = dev_get_drvdata(dev);
294 ctx_dev = dev->platform_data;
296 if (!iommu_drvdata || !ctx_drvdata || !ctx_dev) {
301 if (!list_empty(&ctx_drvdata->attached_elm)) {
306 list_for_each_entry(tmp_drvdata, &priv->list_attached, attached_elm)
307 if (tmp_drvdata == ctx_drvdata) {
312 ret = __enable_clocks(iommu_drvdata);
316 __program_context(iommu_drvdata->base, ctx_dev->num,
317 __pa(priv->pgtable));
319 __disable_clocks(iommu_drvdata);
320 list_add(&(ctx_drvdata->attached_elm), &priv->list_attached);
321 ret = __flush_iotlb(domain);
324 spin_unlock_irqrestore(&msm_iommu_lock, flags);
328 static void msm_iommu_detach_dev(struct iommu_domain *domain,
331 struct msm_priv *priv;
332 struct msm_iommu_ctx_dev *ctx_dev;
333 struct msm_iommu_drvdata *iommu_drvdata;
334 struct msm_iommu_ctx_drvdata *ctx_drvdata;
338 spin_lock_irqsave(&msm_iommu_lock, flags);
339 priv = to_msm_priv(domain);
344 iommu_drvdata = dev_get_drvdata(dev->parent);
345 ctx_drvdata = dev_get_drvdata(dev);
346 ctx_dev = dev->platform_data;
348 if (!iommu_drvdata || !ctx_drvdata || !ctx_dev)
351 ret = __flush_iotlb(domain);
355 ret = __enable_clocks(iommu_drvdata);
359 __reset_context(iommu_drvdata->base, ctx_dev->num);
360 __disable_clocks(iommu_drvdata);
361 list_del_init(&ctx_drvdata->attached_elm);
364 spin_unlock_irqrestore(&msm_iommu_lock, flags);
367 static int msm_iommu_map(struct iommu_domain *domain, unsigned long va,
368 phys_addr_t pa, size_t len, int prot)
370 struct msm_priv *priv;
372 unsigned long *fl_table;
373 unsigned long *fl_pte;
374 unsigned long fl_offset;
375 unsigned long *sl_table;
376 unsigned long *sl_pte;
377 unsigned long sl_offset;
379 int ret = 0, tex, sh;
381 spin_lock_irqsave(&msm_iommu_lock, flags);
383 sh = (prot & MSM_IOMMU_ATTR_SH) ? 1 : 0;
384 tex = msm_iommu_tex_class[prot & MSM_IOMMU_CP_MASK];
386 if (tex < 0 || tex > NUM_TEX_CLASS - 1) {
391 priv = to_msm_priv(domain);
393 fl_table = priv->pgtable;
395 if (len != SZ_16M && len != SZ_1M &&
396 len != SZ_64K && len != SZ_4K) {
397 pr_debug("Bad size: %d\n", len);
403 pr_debug("Null page table\n");
408 if (len == SZ_16M || len == SZ_1M) {
409 pgprot = sh ? FL_SHARED : 0;
410 pgprot |= tex & 0x01 ? FL_BUFFERABLE : 0;
411 pgprot |= tex & 0x02 ? FL_CACHEABLE : 0;
412 pgprot |= tex & 0x04 ? FL_TEX0 : 0;
414 pgprot = sh ? SL_SHARED : 0;
415 pgprot |= tex & 0x01 ? SL_BUFFERABLE : 0;
416 pgprot |= tex & 0x02 ? SL_CACHEABLE : 0;
417 pgprot |= tex & 0x04 ? SL_TEX0 : 0;
420 fl_offset = FL_OFFSET(va); /* Upper 12 bits */
421 fl_pte = fl_table + fl_offset; /* int pointers, 4 bytes */
425 for (i = 0; i < 16; i++)
426 *(fl_pte+i) = (pa & 0xFF000000) | FL_SUPERSECTION |
427 FL_AP_READ | FL_AP_WRITE | FL_TYPE_SECT |
428 FL_SHARED | FL_NG | pgprot;
432 *fl_pte = (pa & 0xFFF00000) | FL_AP_READ | FL_AP_WRITE | FL_NG |
433 FL_TYPE_SECT | FL_SHARED | pgprot;
435 /* Need a 2nd level table */
436 if ((len == SZ_4K || len == SZ_64K) && (*fl_pte) == 0) {
438 sl = (unsigned long *) __get_free_pages(GFP_ATOMIC,
442 pr_debug("Could not allocate second level table\n");
447 memset(sl, 0, SZ_4K);
448 *fl_pte = ((((int)__pa(sl)) & FL_BASE_MASK) | FL_TYPE_TABLE);
451 sl_table = (unsigned long *) __va(((*fl_pte) & FL_BASE_MASK));
452 sl_offset = SL_OFFSET(va);
453 sl_pte = sl_table + sl_offset;
457 *sl_pte = (pa & SL_BASE_MASK_SMALL) | SL_AP0 | SL_AP1 | SL_NG |
458 SL_SHARED | SL_TYPE_SMALL | pgprot;
463 for (i = 0; i < 16; i++)
464 *(sl_pte+i) = (pa & SL_BASE_MASK_LARGE) | SL_AP0 |
465 SL_NG | SL_AP1 | SL_SHARED | SL_TYPE_LARGE | pgprot;
468 ret = __flush_iotlb(domain);
470 spin_unlock_irqrestore(&msm_iommu_lock, flags);
474 static size_t msm_iommu_unmap(struct iommu_domain *domain, unsigned long va,
477 struct msm_priv *priv;
479 unsigned long *fl_table;
480 unsigned long *fl_pte;
481 unsigned long fl_offset;
482 unsigned long *sl_table;
483 unsigned long *sl_pte;
484 unsigned long sl_offset;
487 spin_lock_irqsave(&msm_iommu_lock, flags);
489 priv = to_msm_priv(domain);
491 fl_table = priv->pgtable;
493 if (len != SZ_16M && len != SZ_1M &&
494 len != SZ_64K && len != SZ_4K) {
495 pr_debug("Bad length: %d\n", len);
500 pr_debug("Null page table\n");
504 fl_offset = FL_OFFSET(va); /* Upper 12 bits */
505 fl_pte = fl_table + fl_offset; /* int pointers, 4 bytes */
508 pr_debug("First level PTE is 0\n");
512 /* Unmap supersection */
514 for (i = 0; i < 16; i++)
520 sl_table = (unsigned long *) __va(((*fl_pte) & FL_BASE_MASK));
521 sl_offset = SL_OFFSET(va);
522 sl_pte = sl_table + sl_offset;
525 for (i = 0; i < 16; i++)
532 if (len == SZ_4K || len == SZ_64K) {
535 for (i = 0; i < NUM_SL_PTE; i++)
539 free_page((unsigned long)sl_table);
544 ret = __flush_iotlb(domain);
547 spin_unlock_irqrestore(&msm_iommu_lock, flags);
549 /* the IOMMU API requires us to return how many bytes were unmapped */
554 static phys_addr_t msm_iommu_iova_to_phys(struct iommu_domain *domain,
557 struct msm_priv *priv;
558 struct msm_iommu_drvdata *iommu_drvdata;
559 struct msm_iommu_ctx_drvdata *ctx_drvdata;
566 spin_lock_irqsave(&msm_iommu_lock, flags);
568 priv = to_msm_priv(domain);
569 if (list_empty(&priv->list_attached))
572 ctx_drvdata = list_entry(priv->list_attached.next,
573 struct msm_iommu_ctx_drvdata, attached_elm);
574 iommu_drvdata = dev_get_drvdata(ctx_drvdata->pdev->dev.parent);
576 base = iommu_drvdata->base;
577 ctx = ctx_drvdata->num;
579 ret = __enable_clocks(iommu_drvdata);
583 /* Invalidate context TLB */
584 SET_CTX_TLBIALL(base, ctx, 0);
585 SET_V2PPR(base, ctx, va & V2Pxx_VA);
587 par = GET_PAR(base, ctx);
589 /* We are dealing with a supersection */
590 if (GET_NOFAULT_SS(base, ctx))
591 ret = (par & 0xFF000000) | (va & 0x00FFFFFF);
592 else /* Upper 20 bits from PAR, lower 12 from VA */
593 ret = (par & 0xFFFFF000) | (va & 0x00000FFF);
595 if (GET_FAULT(base, ctx))
598 __disable_clocks(iommu_drvdata);
600 spin_unlock_irqrestore(&msm_iommu_lock, flags);
604 static bool msm_iommu_capable(enum iommu_cap cap)
609 static void print_ctx_regs(void __iomem *base, int ctx)
611 unsigned int fsr = GET_FSR(base, ctx);
612 pr_err("FAR = %08x PAR = %08x\n",
613 GET_FAR(base, ctx), GET_PAR(base, ctx));
614 pr_err("FSR = %08x [%s%s%s%s%s%s%s%s%s%s]\n", fsr,
615 (fsr & 0x02) ? "TF " : "",
616 (fsr & 0x04) ? "AFF " : "",
617 (fsr & 0x08) ? "APF " : "",
618 (fsr & 0x10) ? "TLBMF " : "",
619 (fsr & 0x20) ? "HTWDEEF " : "",
620 (fsr & 0x40) ? "HTWSEEF " : "",
621 (fsr & 0x80) ? "MHF " : "",
622 (fsr & 0x10000) ? "SL " : "",
623 (fsr & 0x40000000) ? "SS " : "",
624 (fsr & 0x80000000) ? "MULTI " : "");
626 pr_err("FSYNR0 = %08x FSYNR1 = %08x\n",
627 GET_FSYNR0(base, ctx), GET_FSYNR1(base, ctx));
628 pr_err("TTBR0 = %08x TTBR1 = %08x\n",
629 GET_TTBR0(base, ctx), GET_TTBR1(base, ctx));
630 pr_err("SCTLR = %08x ACTLR = %08x\n",
631 GET_SCTLR(base, ctx), GET_ACTLR(base, ctx));
632 pr_err("PRRR = %08x NMRR = %08x\n",
633 GET_PRRR(base, ctx), GET_NMRR(base, ctx));
636 irqreturn_t msm_iommu_fault_handler(int irq, void *dev_id)
638 struct msm_iommu_drvdata *drvdata = dev_id;
643 spin_lock(&msm_iommu_lock);
646 pr_err("Invalid device ID in context interrupt handler\n");
650 base = drvdata->base;
652 pr_err("Unexpected IOMMU page fault!\n");
653 pr_err("base = %08x\n", (unsigned int) base);
655 ret = __enable_clocks(drvdata);
659 for (i = 0; i < drvdata->ncb; i++) {
660 fsr = GET_FSR(base, i);
662 pr_err("Fault occurred in context %d.\n", i);
663 pr_err("Interesting registers:\n");
664 print_ctx_regs(base, i);
665 SET_FSR(base, i, 0x4000000F);
668 __disable_clocks(drvdata);
670 spin_unlock(&msm_iommu_lock);
674 static const struct iommu_ops msm_iommu_ops = {
675 .capable = msm_iommu_capable,
676 .domain_alloc = msm_iommu_domain_alloc,
677 .domain_free = msm_iommu_domain_free,
678 .attach_dev = msm_iommu_attach_dev,
679 .detach_dev = msm_iommu_detach_dev,
680 .map = msm_iommu_map,
681 .unmap = msm_iommu_unmap,
682 .map_sg = default_iommu_map_sg,
683 .iova_to_phys = msm_iommu_iova_to_phys,
684 .pgsize_bitmap = MSM_IOMMU_PGSIZES,
687 static int __init get_tex_class(int icp, int ocp, int mt, int nos)
690 unsigned int prrr = 0;
691 unsigned int nmrr = 0;
692 int c_icp, c_ocp, c_mt, c_nos;
697 for (i = 0; i < NUM_TEX_CLASS; i++) {
698 c_nos = PRRR_NOS(prrr, i);
699 c_mt = PRRR_MT(prrr, i);
700 c_icp = NMRR_ICP(nmrr, i);
701 c_ocp = NMRR_OCP(nmrr, i);
703 if (icp == c_icp && ocp == c_ocp && c_mt == mt && c_nos == nos)
710 static void __init setup_iommu_tex_classes(void)
712 msm_iommu_tex_class[MSM_IOMMU_ATTR_NONCACHED] =
713 get_tex_class(CP_NONCACHED, CP_NONCACHED, MT_NORMAL, 1);
715 msm_iommu_tex_class[MSM_IOMMU_ATTR_CACHED_WB_WA] =
716 get_tex_class(CP_WB_WA, CP_WB_WA, MT_NORMAL, 1);
718 msm_iommu_tex_class[MSM_IOMMU_ATTR_CACHED_WB_NWA] =
719 get_tex_class(CP_WB_NWA, CP_WB_NWA, MT_NORMAL, 1);
721 msm_iommu_tex_class[MSM_IOMMU_ATTR_CACHED_WT] =
722 get_tex_class(CP_WT, CP_WT, MT_NORMAL, 1);
725 static int __init msm_iommu_init(void)
727 setup_iommu_tex_classes();
728 bus_set_iommu(&platform_bus_type, &msm_iommu_ops);
732 subsys_initcall(msm_iommu_init);
734 MODULE_LICENSE("GPL v2");
735 MODULE_AUTHOR("Stepan Moskovchenko <stepanm@codeaurora.org>");