xref: /OK3568_Linux_fs/kernel/drivers/video/rockchip/mpp/mpp_iommu_av1d.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Compatible with the IOMMU of av1 decode
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Module Authors:	Yandong Lin <yandong.lin@rock-chips.com>
6*4882a593Smuzhiyun  *			Simon Xue <xxm@rock-chips.com>
7*4882a593Smuzhiyun  */
8*4882a593Smuzhiyun 
9*4882a593Smuzhiyun #include <linux/clk.h>
10*4882a593Smuzhiyun #include <linux/compiler.h>
11*4882a593Smuzhiyun #include <linux/delay.h>
12*4882a593Smuzhiyun #include <linux/device.h>
13*4882a593Smuzhiyun #include <linux/dma-iommu.h>
14*4882a593Smuzhiyun #include <linux/dma-mapping.h>
15*4882a593Smuzhiyun #include <linux/dma-map-ops.h>
16*4882a593Smuzhiyun #include <linux/errno.h>
17*4882a593Smuzhiyun #include <linux/interrupt.h>
18*4882a593Smuzhiyun #include <linux/io.h>
19*4882a593Smuzhiyun #include <linux/iommu.h>
20*4882a593Smuzhiyun #include <linux/iopoll.h>
21*4882a593Smuzhiyun #include <linux/list.h>
22*4882a593Smuzhiyun #include <linux/mm.h>
23*4882a593Smuzhiyun #include <linux/module.h>
24*4882a593Smuzhiyun #include <linux/init.h>
25*4882a593Smuzhiyun #include <linux/of.h>
26*4882a593Smuzhiyun #include <linux/of_iommu.h>
27*4882a593Smuzhiyun #include <linux/of_platform.h>
28*4882a593Smuzhiyun #include <linux/platform_device.h>
29*4882a593Smuzhiyun #include <linux/pm_runtime.h>
30*4882a593Smuzhiyun #include <linux/slab.h>
31*4882a593Smuzhiyun #include <linux/spinlock.h>
32*4882a593Smuzhiyun #include "mpp_debug.h"
33*4882a593Smuzhiyun #include "mpp_common.h"
34*4882a593Smuzhiyun #include "mpp_iommu.h"
35*4882a593Smuzhiyun 
36*4882a593Smuzhiyun struct av1_iommu_domain {
37*4882a593Smuzhiyun 	struct list_head iommus;
38*4882a593Smuzhiyun 	u32 *dt; /* page directory table */
39*4882a593Smuzhiyun 	dma_addr_t dt_dma;
40*4882a593Smuzhiyun 	spinlock_t iommus_lock; /* lock for iommus list */
41*4882a593Smuzhiyun 	spinlock_t dt_lock; /* lock for modifying page directory table */
42*4882a593Smuzhiyun 	struct iommu_domain domain;
43*4882a593Smuzhiyun 	/* for av1 iommu */
44*4882a593Smuzhiyun 	u64 *pta; /* page directory table */
45*4882a593Smuzhiyun 	dma_addr_t pta_dma;
46*4882a593Smuzhiyun };
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun struct av1_iommu {
49*4882a593Smuzhiyun 	struct device *dev;
50*4882a593Smuzhiyun 	void __iomem **bases;
51*4882a593Smuzhiyun 	int num_mmu;
52*4882a593Smuzhiyun 	int num_irq;
53*4882a593Smuzhiyun 	struct clk_bulk_data *clocks;
54*4882a593Smuzhiyun 	int num_clocks;
55*4882a593Smuzhiyun 	struct iommu_device iommu;
56*4882a593Smuzhiyun 	struct list_head node; /* entry in rk_iommu_domain.iommus */
57*4882a593Smuzhiyun 	struct iommu_domain *domain; /* domain to which iommu is attached */
58*4882a593Smuzhiyun 	struct iommu_group *group;
59*4882a593Smuzhiyun };
60*4882a593Smuzhiyun 
61*4882a593Smuzhiyun struct av1_iommudata {
62*4882a593Smuzhiyun 	struct device_link *link; /* runtime PM link from IOMMU to master */
63*4882a593Smuzhiyun 	struct av1_iommu *iommu;
64*4882a593Smuzhiyun 	bool defer_attach;
65*4882a593Smuzhiyun };
66*4882a593Smuzhiyun 
67*4882a593Smuzhiyun #define RK_IOMMU_AV1	0xa
68*4882a593Smuzhiyun #define NUM_DT_ENTRIES	1024
69*4882a593Smuzhiyun #define NUM_PT_ENTRIES	1024
70*4882a593Smuzhiyun 
71*4882a593Smuzhiyun #define SPAGE_ORDER	12
72*4882a593Smuzhiyun #define SPAGE_SIZE	(1 << SPAGE_ORDER)
73*4882a593Smuzhiyun 
74*4882a593Smuzhiyun /* av1 iommu regs address */
75*4882a593Smuzhiyun #define AV1_CLOCK_CTRL_BASE			0x0
76*4882a593Smuzhiyun #define AV1_IDLE_ST_BASE			0x4
77*4882a593Smuzhiyun #define AV1_MMU_CONFIG0_BASE			0x184
78*4882a593Smuzhiyun #define AV1_MMU_CONFIG1_BASE			0x1ac
79*4882a593Smuzhiyun #define AV1_MMU_AHB_EXCEPTION_BASE		0x380
80*4882a593Smuzhiyun #define AV1_MMU_AHB_STATUS_BASE			0x384
81*4882a593Smuzhiyun #define AV1_MMU_AHB_CONTROL_BASE		0x388
82*4882a593Smuzhiyun #define AV1_MMU_AHB_TBL_ARRAY_BASE_L_BASE	0x38C
83*4882a593Smuzhiyun #define AV1_MMU_AHB_TBL_ARRAY_BASE_H_BASE	0x390
84*4882a593Smuzhiyun #define AV1_MMU_AHB_CTX_PD_BASE			0x3b4
85*4882a593Smuzhiyun #define AV1_MMU_BUTT_BASE			0xffff
86*4882a593Smuzhiyun 
87*4882a593Smuzhiyun /* MMU register offsets */
88*4882a593Smuzhiyun #define AV1_MMU_FLUSH_BASE		0x184
89*4882a593Smuzhiyun #define AV1_MMU_BIT_FLUSH		BIT(4)
90*4882a593Smuzhiyun 
91*4882a593Smuzhiyun #define AV1_MMU_PAGE_FAULT_ADDR		0x380
92*4882a593Smuzhiyun #define AV1_MMU_STATUS_BASE		0x384	/* IRQ status */
93*4882a593Smuzhiyun 
94*4882a593Smuzhiyun #define AV1_MMU_EN_BASE			0x388
95*4882a593Smuzhiyun #define AV1_MMU_BIT_ENABLE		BIT(0)
96*4882a593Smuzhiyun 
97*4882a593Smuzhiyun #define AV1_MMU_OUT_OF_BOUND		BIT(28)
98*4882a593Smuzhiyun /* Irq mask */
99*4882a593Smuzhiyun #define AV1_MMU_IRQ_MASK		0x7
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun #define AV1_DTE_PT_ADDRESS_MASK		0xffffffc0
102*4882a593Smuzhiyun #define AV1_DTE_PT_VALID		BIT(0)
103*4882a593Smuzhiyun 
104*4882a593Smuzhiyun #define AV1_PAGE_DESC_LO_MASK		0xfffff000
105*4882a593Smuzhiyun #define AV1_PAGE_DESC_HI_MASK		GENMASK_ULL(39, 32)
106*4882a593Smuzhiyun #define AV1_PAGE_DESC_HI_SHIFT		(32-4)
107*4882a593Smuzhiyun 
108*4882a593Smuzhiyun #define AV1_IOMMU_PGSIZE_BITMAP 0x007ff000
109*4882a593Smuzhiyun 
av1_dte_pt_address(u32 dte)110*4882a593Smuzhiyun static inline phys_addr_t av1_dte_pt_address(u32 dte)
111*4882a593Smuzhiyun {
112*4882a593Smuzhiyun 	return (phys_addr_t)dte & AV1_DTE_PT_ADDRESS_MASK;
113*4882a593Smuzhiyun }
114*4882a593Smuzhiyun 
av1_mk_dte(dma_addr_t pt_dma)115*4882a593Smuzhiyun static inline u32 av1_mk_dte(dma_addr_t pt_dma)
116*4882a593Smuzhiyun {
117*4882a593Smuzhiyun 	return (pt_dma) | AV1_DTE_PT_VALID;
118*4882a593Smuzhiyun }
119*4882a593Smuzhiyun 
120*4882a593Smuzhiyun #define AV1_PTE_PAGE_ADDRESS_MASK	0xfffffff0
121*4882a593Smuzhiyun #define AV1_PTE_PAGE_WRITABLE		BIT(2)
122*4882a593Smuzhiyun #define AV1_PTE_PAGE_VALID		BIT(0)
123*4882a593Smuzhiyun 
124*4882a593Smuzhiyun static struct device *dma_dev;
125*4882a593Smuzhiyun 
av1_pte_page_address(u32 pte)126*4882a593Smuzhiyun static inline phys_addr_t av1_pte_page_address(u32 pte)
127*4882a593Smuzhiyun {
128*4882a593Smuzhiyun 	u64 pte_av1 = pte;
129*4882a593Smuzhiyun 
130*4882a593Smuzhiyun 	pte_av1 = ((pte_av1 & AV1_PAGE_DESC_HI_MASK) << AV1_PAGE_DESC_HI_SHIFT) |
131*4882a593Smuzhiyun 		  (pte_av1 & AV1_PAGE_DESC_LO_MASK);
132*4882a593Smuzhiyun 
133*4882a593Smuzhiyun 	return (phys_addr_t)pte_av1;
134*4882a593Smuzhiyun }
135*4882a593Smuzhiyun 
av1_mk_pte(phys_addr_t page,int prot)136*4882a593Smuzhiyun static u32 av1_mk_pte(phys_addr_t page, int prot)
137*4882a593Smuzhiyun {
138*4882a593Smuzhiyun 	u32 flags = 0;
139*4882a593Smuzhiyun 
140*4882a593Smuzhiyun 	flags |= (prot & IOMMU_WRITE) ? AV1_PTE_PAGE_WRITABLE : 0;
141*4882a593Smuzhiyun 	page = (page & AV1_PAGE_DESC_LO_MASK) |
142*4882a593Smuzhiyun 	       ((page & AV1_PAGE_DESC_HI_MASK) >> AV1_PAGE_DESC_HI_SHIFT);
143*4882a593Smuzhiyun 	page &= AV1_PTE_PAGE_ADDRESS_MASK;
144*4882a593Smuzhiyun 
145*4882a593Smuzhiyun 	return page | flags | AV1_PTE_PAGE_VALID;
146*4882a593Smuzhiyun }
147*4882a593Smuzhiyun 
148*4882a593Smuzhiyun #define AV1_DTE_PT_VALID	BIT(0)
149*4882a593Smuzhiyun 
av1_dte_is_pt_valid(u32 dte)150*4882a593Smuzhiyun static inline bool av1_dte_is_pt_valid(u32 dte)
151*4882a593Smuzhiyun {
152*4882a593Smuzhiyun 	return dte & AV1_DTE_PT_VALID;
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun 
av1_pte_is_page_valid(u32 pte)155*4882a593Smuzhiyun static inline bool av1_pte_is_page_valid(u32 pte)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun 	return pte & AV1_PTE_PAGE_VALID;
158*4882a593Smuzhiyun }
159*4882a593Smuzhiyun 
av1_mk_pte_invalid(u32 pte)160*4882a593Smuzhiyun static u32 av1_mk_pte_invalid(u32 pte)
161*4882a593Smuzhiyun {
162*4882a593Smuzhiyun 	return pte & ~AV1_PTE_PAGE_VALID;
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun #define AV1_MASTER_TLB_MASK	GENMASK_ULL(31, 10)
166*4882a593Smuzhiyun /* mode 0 : 4k */
167*4882a593Smuzhiyun #define AV1_PTA_4K_MODE	0
168*4882a593Smuzhiyun 
av1_iommu_from_dev(struct device * dev)169*4882a593Smuzhiyun static struct av1_iommu *av1_iommu_from_dev(struct device *dev)
170*4882a593Smuzhiyun {
171*4882a593Smuzhiyun 	struct av1_iommudata *data = dev_iommu_priv_get(dev);
172*4882a593Smuzhiyun 
173*4882a593Smuzhiyun 	return data ? data->iommu : NULL;
174*4882a593Smuzhiyun }
175*4882a593Smuzhiyun 
av1_mk_pta(dma_addr_t dt_dma)176*4882a593Smuzhiyun static u64 av1_mk_pta(dma_addr_t dt_dma)
177*4882a593Smuzhiyun {
178*4882a593Smuzhiyun 	u64 val = (dt_dma & AV1_MASTER_TLB_MASK) | AV1_PTA_4K_MODE;
179*4882a593Smuzhiyun 
180*4882a593Smuzhiyun 	return val;
181*4882a593Smuzhiyun }
182*4882a593Smuzhiyun 
to_av1_domain(struct iommu_domain * dom)183*4882a593Smuzhiyun static struct av1_iommu_domain *to_av1_domain(struct iommu_domain *dom)
184*4882a593Smuzhiyun {
185*4882a593Smuzhiyun 	return container_of(dom, struct av1_iommu_domain, domain);
186*4882a593Smuzhiyun }
187*4882a593Smuzhiyun 
av1_iommu_disable(struct av1_iommu * iommu)188*4882a593Smuzhiyun static void av1_iommu_disable(struct av1_iommu *iommu)
189*4882a593Smuzhiyun {
190*4882a593Smuzhiyun 	int i;
191*4882a593Smuzhiyun 
192*4882a593Smuzhiyun 	/* Ignore error while disabling, just keep going */
193*4882a593Smuzhiyun 	WARN_ON(clk_bulk_enable(iommu->num_clocks, iommu->clocks));
194*4882a593Smuzhiyun 	for (i = 0; i < iommu->num_mmu; i++)
195*4882a593Smuzhiyun 		writel(0, iommu->bases[i] + AV1_MMU_AHB_CONTROL_BASE);
196*4882a593Smuzhiyun 
197*4882a593Smuzhiyun 	clk_bulk_disable(iommu->num_clocks, iommu->clocks);
198*4882a593Smuzhiyun }
199*4882a593Smuzhiyun 
mpp_av1_iommu_disable(struct device * dev)200*4882a593Smuzhiyun int mpp_av1_iommu_disable(struct device *dev)
201*4882a593Smuzhiyun {
202*4882a593Smuzhiyun 	struct av1_iommu *iommu = av1_iommu_from_dev(dev);
203*4882a593Smuzhiyun 
204*4882a593Smuzhiyun 	if (!iommu->domain)
205*4882a593Smuzhiyun 		return 0;
206*4882a593Smuzhiyun 
207*4882a593Smuzhiyun 	av1_iommu_disable(iommu);
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun 	return 0;
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun 
av1_iommu_enable(struct av1_iommu * iommu)212*4882a593Smuzhiyun static int av1_iommu_enable(struct av1_iommu *iommu)
213*4882a593Smuzhiyun {
214*4882a593Smuzhiyun 	struct iommu_domain *domain = iommu->domain;
215*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain = to_av1_domain(domain);
216*4882a593Smuzhiyun 	int ret, i;
217*4882a593Smuzhiyun 
218*4882a593Smuzhiyun 	ret = clk_bulk_enable(iommu->num_clocks, iommu->clocks);
219*4882a593Smuzhiyun 	if (ret)
220*4882a593Smuzhiyun 		return ret;
221*4882a593Smuzhiyun 
222*4882a593Smuzhiyun 	for (i = 0; i < iommu->num_mmu; i++) {
223*4882a593Smuzhiyun 		u32 val = readl(iommu->bases[i] + AV1_MMU_AHB_CONTROL_BASE);
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun 		if (!(val & AV1_MMU_BIT_ENABLE)) {
226*4882a593Smuzhiyun 			writel(av1_domain->pta_dma,
227*4882a593Smuzhiyun 			       iommu->bases[i] + AV1_MMU_AHB_TBL_ARRAY_BASE_L_BASE);
228*4882a593Smuzhiyun 			writel(AV1_MMU_OUT_OF_BOUND, iommu->bases[i] + AV1_MMU_CONFIG1_BASE);
229*4882a593Smuzhiyun 			writel(AV1_MMU_BIT_ENABLE, iommu->bases[i] + AV1_MMU_AHB_EXCEPTION_BASE);
230*4882a593Smuzhiyun 			writel(AV1_MMU_BIT_ENABLE, iommu->bases[i] + AV1_MMU_AHB_CONTROL_BASE);
231*4882a593Smuzhiyun 		}
232*4882a593Smuzhiyun 	}
233*4882a593Smuzhiyun 	clk_bulk_disable(iommu->num_clocks, iommu->clocks);
234*4882a593Smuzhiyun 	return ret;
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun 
mpp_av1_iommu_enable(struct device * dev)237*4882a593Smuzhiyun int mpp_av1_iommu_enable(struct device *dev)
238*4882a593Smuzhiyun {
239*4882a593Smuzhiyun 	struct av1_iommu *iommu = av1_iommu_from_dev(dev);
240*4882a593Smuzhiyun 
241*4882a593Smuzhiyun 	if (!iommu->domain)
242*4882a593Smuzhiyun 		return 0;
243*4882a593Smuzhiyun 
244*4882a593Smuzhiyun 	return av1_iommu_enable(iommu);
245*4882a593Smuzhiyun }
246*4882a593Smuzhiyun 
av1_table_flush(struct av1_iommu_domain * dom,dma_addr_t dma,unsigned int count)247*4882a593Smuzhiyun static inline void av1_table_flush(struct av1_iommu_domain *dom, dma_addr_t dma,
248*4882a593Smuzhiyun 				  unsigned int count)
249*4882a593Smuzhiyun {
250*4882a593Smuzhiyun 	size_t size = count * sizeof(u32); /* count of u32 entry */
251*4882a593Smuzhiyun 
252*4882a593Smuzhiyun 	dma_sync_single_for_device(dma_dev, dma, size, DMA_TO_DEVICE);
253*4882a593Smuzhiyun }
254*4882a593Smuzhiyun 
255*4882a593Smuzhiyun #define AV1_IOVA_DTE_MASK	0xffc00000
256*4882a593Smuzhiyun #define AV1_IOVA_DTE_SHIFT	22
257*4882a593Smuzhiyun #define AV1_IOVA_PTE_MASK	0x003ff000
258*4882a593Smuzhiyun #define AV1_IOVA_PTE_SHIFT	12
259*4882a593Smuzhiyun #define AV1_IOVA_PAGE_MASK	0x00000fff
260*4882a593Smuzhiyun #define AV1_IOVA_PAGE_SHIFT	0
261*4882a593Smuzhiyun 
av1_iova_dte_index(dma_addr_t iova)262*4882a593Smuzhiyun static u32 av1_iova_dte_index(dma_addr_t iova)
263*4882a593Smuzhiyun {
264*4882a593Smuzhiyun 	return (u32)(iova & AV1_IOVA_DTE_MASK) >> AV1_IOVA_DTE_SHIFT;
265*4882a593Smuzhiyun }
266*4882a593Smuzhiyun 
av1_iova_pte_index(dma_addr_t iova)267*4882a593Smuzhiyun static u32 av1_iova_pte_index(dma_addr_t iova)
268*4882a593Smuzhiyun {
269*4882a593Smuzhiyun 	return (u32)(iova & AV1_IOVA_PTE_MASK) >> AV1_IOVA_PTE_SHIFT;
270*4882a593Smuzhiyun }
271*4882a593Smuzhiyun 
av1_iova_page_offset(dma_addr_t iova)272*4882a593Smuzhiyun static u32 av1_iova_page_offset(dma_addr_t iova)
273*4882a593Smuzhiyun {
274*4882a593Smuzhiyun 	return (u32)(iova & AV1_IOVA_PAGE_MASK) >> AV1_IOVA_PAGE_SHIFT;
275*4882a593Smuzhiyun }
276*4882a593Smuzhiyun 
av1_iommu_read(void __iomem * base,u32 offset)277*4882a593Smuzhiyun static u32 av1_iommu_read(void __iomem *base, u32 offset)
278*4882a593Smuzhiyun {
279*4882a593Smuzhiyun 	return readl(base + offset);
280*4882a593Smuzhiyun }
281*4882a593Smuzhiyun 
av1_iommu_write(void __iomem * base,u32 offset,u32 value)282*4882a593Smuzhiyun static void av1_iommu_write(void __iomem *base, u32 offset, u32 value)
283*4882a593Smuzhiyun {
284*4882a593Smuzhiyun 	writel(value, base + offset);
285*4882a593Smuzhiyun }
286*4882a593Smuzhiyun 
287*4882a593Smuzhiyun 
av1_iommu_flush_tlb_all(struct iommu_domain * domain)288*4882a593Smuzhiyun static void av1_iommu_flush_tlb_all(struct iommu_domain *domain)
289*4882a593Smuzhiyun {
290*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain = to_av1_domain(domain);
291*4882a593Smuzhiyun 	struct list_head *pos;
292*4882a593Smuzhiyun 	unsigned long flags;
293*4882a593Smuzhiyun 	int i;
294*4882a593Smuzhiyun 
295*4882a593Smuzhiyun 	spin_lock_irqsave(&av1_domain->iommus_lock, flags);
296*4882a593Smuzhiyun 	list_for_each(pos, &av1_domain->iommus) {
297*4882a593Smuzhiyun 		struct av1_iommu *iommu;
298*4882a593Smuzhiyun 		int ret;
299*4882a593Smuzhiyun 
300*4882a593Smuzhiyun 		iommu = list_entry(pos, struct av1_iommu, node);
301*4882a593Smuzhiyun 		ret = pm_runtime_get_if_in_use(iommu->dev);
302*4882a593Smuzhiyun 		if (WARN_ON_ONCE(ret < 0))
303*4882a593Smuzhiyun 			continue;
304*4882a593Smuzhiyun 		if (ret) {
305*4882a593Smuzhiyun 			WARN_ON(clk_bulk_enable(iommu->num_clocks, iommu->clocks));
306*4882a593Smuzhiyun 			for (i = 0; i < iommu->num_mmu; i++) {
307*4882a593Smuzhiyun 				writel(AV1_MMU_BIT_FLUSH,
308*4882a593Smuzhiyun 				       iommu->bases[i] + AV1_MMU_FLUSH_BASE);
309*4882a593Smuzhiyun 				writel(0, iommu->bases[i] + AV1_MMU_FLUSH_BASE);
310*4882a593Smuzhiyun 			}
311*4882a593Smuzhiyun 			clk_bulk_disable(iommu->num_clocks, iommu->clocks);
312*4882a593Smuzhiyun 			pm_runtime_put(iommu->dev);
313*4882a593Smuzhiyun 		}
314*4882a593Smuzhiyun 	}
315*4882a593Smuzhiyun 	spin_unlock_irqrestore(&av1_domain->iommus_lock, flags);
316*4882a593Smuzhiyun }
317*4882a593Smuzhiyun 
av1_iommu_irq(int irq,void * dev_id)318*4882a593Smuzhiyun static irqreturn_t av1_iommu_irq(int irq, void *dev_id)
319*4882a593Smuzhiyun {
320*4882a593Smuzhiyun 	struct av1_iommu *iommu = dev_id;
321*4882a593Smuzhiyun 	u32 int_status;
322*4882a593Smuzhiyun 	dma_addr_t iova;
323*4882a593Smuzhiyun 	irqreturn_t ret = IRQ_NONE;
324*4882a593Smuzhiyun 	int i, err;
325*4882a593Smuzhiyun 
326*4882a593Smuzhiyun 	err = pm_runtime_get_if_in_use(iommu->dev);
327*4882a593Smuzhiyun 	if (!err || WARN_ON_ONCE(err < 0))
328*4882a593Smuzhiyun 		return ret;
329*4882a593Smuzhiyun 
330*4882a593Smuzhiyun 	if (WARN_ON(clk_bulk_enable(iommu->num_clocks, iommu->clocks)))
331*4882a593Smuzhiyun 		goto out;
332*4882a593Smuzhiyun 
333*4882a593Smuzhiyun 	for (i = 0; i < iommu->num_mmu; i++) {
334*4882a593Smuzhiyun 		int_status = av1_iommu_read(iommu->bases[i], AV1_MMU_STATUS_BASE);
335*4882a593Smuzhiyun 		if (int_status & AV1_MMU_IRQ_MASK) {
336*4882a593Smuzhiyun 			dev_err(iommu->dev, "unexpected int_status=%08x\n", int_status);
337*4882a593Smuzhiyun 			iova = av1_iommu_read(iommu->bases[i], AV1_MMU_PAGE_FAULT_ADDR);
338*4882a593Smuzhiyun 
339*4882a593Smuzhiyun 			if (iommu->domain)
340*4882a593Smuzhiyun 				report_iommu_fault(iommu->domain, iommu->dev, iova, int_status);
341*4882a593Smuzhiyun 			else
342*4882a593Smuzhiyun 				dev_err(iommu->dev,
343*4882a593Smuzhiyun 					"Page fault while iommu not attached to domain?\n");
344*4882a593Smuzhiyun 		}
345*4882a593Smuzhiyun 		av1_iommu_write(iommu->bases[i], AV1_MMU_STATUS_BASE, 0);
346*4882a593Smuzhiyun 		ret = IRQ_HANDLED;
347*4882a593Smuzhiyun 	}
348*4882a593Smuzhiyun 
349*4882a593Smuzhiyun 	clk_bulk_disable(iommu->num_clocks, iommu->clocks);
350*4882a593Smuzhiyun 
351*4882a593Smuzhiyun out:
352*4882a593Smuzhiyun 	pm_runtime_put(iommu->dev);
353*4882a593Smuzhiyun 	return ret;
354*4882a593Smuzhiyun }
355*4882a593Smuzhiyun 
av1_iommu_is_attach_deferred(struct iommu_domain * domain,struct device * dev)356*4882a593Smuzhiyun static bool av1_iommu_is_attach_deferred(struct iommu_domain *domain,
357*4882a593Smuzhiyun 					struct device *dev)
358*4882a593Smuzhiyun {
359*4882a593Smuzhiyun 	struct av1_iommudata *data = dev_iommu_priv_get(dev);
360*4882a593Smuzhiyun 
361*4882a593Smuzhiyun 	return data->defer_attach;
362*4882a593Smuzhiyun }
363*4882a593Smuzhiyun 
av1_iommu_domain_alloc(unsigned type)364*4882a593Smuzhiyun static struct iommu_domain *av1_iommu_domain_alloc(unsigned type)
365*4882a593Smuzhiyun {
366*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain;
367*4882a593Smuzhiyun 
368*4882a593Smuzhiyun 	if (type != IOMMU_DOMAIN_UNMANAGED && type != IOMMU_DOMAIN_DMA)
369*4882a593Smuzhiyun 		return NULL;
370*4882a593Smuzhiyun 
371*4882a593Smuzhiyun 	if (!dma_dev)
372*4882a593Smuzhiyun 		return NULL;
373*4882a593Smuzhiyun 
374*4882a593Smuzhiyun 	av1_domain = kzalloc(sizeof(*av1_domain), GFP_KERNEL);
375*4882a593Smuzhiyun 	if (!av1_domain)
376*4882a593Smuzhiyun 		return NULL;
377*4882a593Smuzhiyun 
378*4882a593Smuzhiyun 	if (type == IOMMU_DOMAIN_DMA &&
379*4882a593Smuzhiyun 	    iommu_get_dma_cookie(&av1_domain->domain))
380*4882a593Smuzhiyun 		goto err_free_domain;
381*4882a593Smuzhiyun 
382*4882a593Smuzhiyun 	/*
383*4882a593Smuzhiyun 	 * av132xx iommus use a 2 level pagetable.
384*4882a593Smuzhiyun 	 * Each level1 (dt) and level2 (pt) table has 1024 4-byte entries.
385*4882a593Smuzhiyun 	 * Allocate one 4 KiB page for each table.
386*4882a593Smuzhiyun 	 */
387*4882a593Smuzhiyun 	av1_domain->dt = (u32 *)get_zeroed_page(GFP_KERNEL | GFP_DMA32);
388*4882a593Smuzhiyun 	if (!av1_domain->dt)
389*4882a593Smuzhiyun 		goto err_put_cookie;
390*4882a593Smuzhiyun 
391*4882a593Smuzhiyun 	av1_domain->dt_dma = dma_map_single(dma_dev, av1_domain->dt,
392*4882a593Smuzhiyun 					   SPAGE_SIZE, DMA_TO_DEVICE);
393*4882a593Smuzhiyun 	if (dma_mapping_error(dma_dev, av1_domain->dt_dma)) {
394*4882a593Smuzhiyun 		dev_err(dma_dev, "DMA map error for DT\n");
395*4882a593Smuzhiyun 		goto err_free_dt;
396*4882a593Smuzhiyun 	}
397*4882a593Smuzhiyun 
398*4882a593Smuzhiyun 	av1_domain->pta = (u64 *)get_zeroed_page(GFP_KERNEL | GFP_DMA32);
399*4882a593Smuzhiyun 	if (!av1_domain->pta)
400*4882a593Smuzhiyun 		goto err_unmap_dt;
401*4882a593Smuzhiyun 
402*4882a593Smuzhiyun 	av1_domain->pta_dma = dma_map_single(dma_dev, av1_domain->pta,
403*4882a593Smuzhiyun 					SPAGE_SIZE, DMA_TO_DEVICE);
404*4882a593Smuzhiyun 	if (dma_mapping_error(dma_dev, av1_domain->pta_dma)) {
405*4882a593Smuzhiyun 		dev_err(dma_dev, "DMA map error for PTA\n");
406*4882a593Smuzhiyun 		goto err_free_pta;
407*4882a593Smuzhiyun 	}
408*4882a593Smuzhiyun 	av1_domain->pta[0] = av1_mk_pta(av1_domain->dt_dma);
409*4882a593Smuzhiyun 
410*4882a593Smuzhiyun 	av1_table_flush(av1_domain, av1_domain->pta_dma, 1024);
411*4882a593Smuzhiyun 	av1_table_flush(av1_domain, av1_domain->dt_dma, NUM_DT_ENTRIES);
412*4882a593Smuzhiyun 
413*4882a593Smuzhiyun 	spin_lock_init(&av1_domain->iommus_lock);
414*4882a593Smuzhiyun 	spin_lock_init(&av1_domain->dt_lock);
415*4882a593Smuzhiyun 	INIT_LIST_HEAD(&av1_domain->iommus);
416*4882a593Smuzhiyun 
417*4882a593Smuzhiyun 	av1_domain->domain.geometry.aperture_start = 0;
418*4882a593Smuzhiyun 	av1_domain->domain.geometry.aperture_end   = DMA_BIT_MASK(32);
419*4882a593Smuzhiyun 	av1_domain->domain.geometry.force_aperture = true;
420*4882a593Smuzhiyun 
421*4882a593Smuzhiyun 	return &av1_domain->domain;
422*4882a593Smuzhiyun err_free_pta:
423*4882a593Smuzhiyun 	free_page((unsigned long)av1_domain->pta);
424*4882a593Smuzhiyun err_unmap_dt:
425*4882a593Smuzhiyun 	dma_unmap_single(dma_dev, av1_domain->dt_dma,
426*4882a593Smuzhiyun 			 SPAGE_SIZE, DMA_TO_DEVICE);
427*4882a593Smuzhiyun err_free_dt:
428*4882a593Smuzhiyun 	free_page((unsigned long)av1_domain->dt);
429*4882a593Smuzhiyun err_put_cookie:
430*4882a593Smuzhiyun 	if (type == IOMMU_DOMAIN_DMA)
431*4882a593Smuzhiyun 		iommu_put_dma_cookie(&av1_domain->domain);
432*4882a593Smuzhiyun err_free_domain:
433*4882a593Smuzhiyun 	kfree(av1_domain);
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun 	return NULL;
436*4882a593Smuzhiyun }
437*4882a593Smuzhiyun 
av1_iommu_iova_to_phys(struct iommu_domain * domain,dma_addr_t iova)438*4882a593Smuzhiyun static phys_addr_t av1_iommu_iova_to_phys(struct iommu_domain *domain,
439*4882a593Smuzhiyun 						   dma_addr_t iova)
440*4882a593Smuzhiyun {
441*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain = to_av1_domain(domain);
442*4882a593Smuzhiyun 	unsigned long flags;
443*4882a593Smuzhiyun 	phys_addr_t pt_phys, phys = 0;
444*4882a593Smuzhiyun 	u32 dte, pte;
445*4882a593Smuzhiyun 	u32 *page_table;
446*4882a593Smuzhiyun 
447*4882a593Smuzhiyun 	spin_lock_irqsave(&av1_domain->dt_lock, flags);
448*4882a593Smuzhiyun 
449*4882a593Smuzhiyun 	dte = av1_domain->dt[av1_iova_dte_index(iova)];
450*4882a593Smuzhiyun 	if (!av1_dte_is_pt_valid(dte))
451*4882a593Smuzhiyun 		goto out;
452*4882a593Smuzhiyun 
453*4882a593Smuzhiyun 	pt_phys = av1_dte_pt_address(dte);
454*4882a593Smuzhiyun 	page_table = (u32 *)phys_to_virt(pt_phys);
455*4882a593Smuzhiyun 	pte = page_table[av1_iova_pte_index(iova)];
456*4882a593Smuzhiyun 	if (!av1_pte_is_page_valid(pte))
457*4882a593Smuzhiyun 		goto out;
458*4882a593Smuzhiyun 
459*4882a593Smuzhiyun 	phys = av1_pte_page_address(pte) + av1_iova_page_offset(iova);
460*4882a593Smuzhiyun out:
461*4882a593Smuzhiyun 	spin_unlock_irqrestore(&av1_domain->dt_lock, flags);
462*4882a593Smuzhiyun 
463*4882a593Smuzhiyun 	return phys;
464*4882a593Smuzhiyun }
465*4882a593Smuzhiyun 
av1_dte_get_page_table(struct av1_iommu_domain * av1_domain,dma_addr_t iova)466*4882a593Smuzhiyun static u32 *av1_dte_get_page_table(struct av1_iommu_domain *av1_domain, dma_addr_t iova)
467*4882a593Smuzhiyun {
468*4882a593Smuzhiyun 	u32 *page_table, *dte_addr;
469*4882a593Smuzhiyun 	u32 dte_index, dte;
470*4882a593Smuzhiyun 	phys_addr_t pt_phys;
471*4882a593Smuzhiyun 	dma_addr_t pt_dma;
472*4882a593Smuzhiyun 
473*4882a593Smuzhiyun 	assert_spin_locked(&av1_domain->dt_lock);
474*4882a593Smuzhiyun 
475*4882a593Smuzhiyun 	dte_index = av1_iova_dte_index(iova);
476*4882a593Smuzhiyun 	dte_addr = &av1_domain->dt[dte_index];
477*4882a593Smuzhiyun 	dte = *dte_addr;
478*4882a593Smuzhiyun 	if (av1_dte_is_pt_valid(dte))
479*4882a593Smuzhiyun 		goto done;
480*4882a593Smuzhiyun 
481*4882a593Smuzhiyun 	page_table = (u32 *)get_zeroed_page(GFP_ATOMIC | GFP_DMA32);
482*4882a593Smuzhiyun 	if (!page_table)
483*4882a593Smuzhiyun 		return ERR_PTR(-ENOMEM);
484*4882a593Smuzhiyun 
485*4882a593Smuzhiyun 	pt_dma = dma_map_single(dma_dev, page_table, SPAGE_SIZE, DMA_TO_DEVICE);
486*4882a593Smuzhiyun 	if (dma_mapping_error(dma_dev, pt_dma)) {
487*4882a593Smuzhiyun 		dev_err(dma_dev, "DMA mapping error while allocating page table\n");
488*4882a593Smuzhiyun 		free_page((unsigned long)page_table);
489*4882a593Smuzhiyun 		return ERR_PTR(-ENOMEM);
490*4882a593Smuzhiyun 	}
491*4882a593Smuzhiyun 
492*4882a593Smuzhiyun 	dte = av1_mk_dte(pt_dma);
493*4882a593Smuzhiyun 	*dte_addr = dte;
494*4882a593Smuzhiyun 
495*4882a593Smuzhiyun 	av1_table_flush(av1_domain, pt_dma, NUM_PT_ENTRIES);
496*4882a593Smuzhiyun 	av1_table_flush(av1_domain,
497*4882a593Smuzhiyun 		       av1_domain->dt_dma + dte_index * sizeof(u32), 1);
498*4882a593Smuzhiyun done:
499*4882a593Smuzhiyun 	pt_phys = av1_dte_pt_address(dte);
500*4882a593Smuzhiyun 	return (u32 *)phys_to_virt(pt_phys);
501*4882a593Smuzhiyun }
502*4882a593Smuzhiyun 
av1_iommu_unmap_iova(struct av1_iommu_domain * av1_domain,u32 * pte_addr,dma_addr_t pte_dma,size_t size)503*4882a593Smuzhiyun static size_t av1_iommu_unmap_iova(struct av1_iommu_domain *av1_domain,
504*4882a593Smuzhiyun 				   u32 *pte_addr, dma_addr_t pte_dma,
505*4882a593Smuzhiyun 				   size_t size)
506*4882a593Smuzhiyun {
507*4882a593Smuzhiyun 	unsigned int pte_count;
508*4882a593Smuzhiyun 	unsigned int pte_total = size / SPAGE_SIZE;
509*4882a593Smuzhiyun 
510*4882a593Smuzhiyun 	assert_spin_locked(&av1_domain->dt_lock);
511*4882a593Smuzhiyun 
512*4882a593Smuzhiyun 	for (pte_count = 0; pte_count < pte_total; pte_count++) {
513*4882a593Smuzhiyun 		u32 pte = pte_addr[pte_count];
514*4882a593Smuzhiyun 
515*4882a593Smuzhiyun 		if (!av1_pte_is_page_valid(pte))
516*4882a593Smuzhiyun 			break;
517*4882a593Smuzhiyun 
518*4882a593Smuzhiyun 		pte_addr[pte_count] = av1_mk_pte_invalid(pte);
519*4882a593Smuzhiyun 	}
520*4882a593Smuzhiyun 
521*4882a593Smuzhiyun 	av1_table_flush(av1_domain, pte_dma, pte_count);
522*4882a593Smuzhiyun 
523*4882a593Smuzhiyun 	return pte_count * SPAGE_SIZE;
524*4882a593Smuzhiyun }
525*4882a593Smuzhiyun 
av1_iommu_map_iova(struct av1_iommu_domain * av1_domain,u32 * pte_addr,dma_addr_t pte_dma,dma_addr_t iova,phys_addr_t paddr,size_t size,int prot)526*4882a593Smuzhiyun static int av1_iommu_map_iova(struct av1_iommu_domain *av1_domain, u32 *pte_addr,
527*4882a593Smuzhiyun 			      dma_addr_t pte_dma, dma_addr_t iova,
528*4882a593Smuzhiyun 			      phys_addr_t paddr, size_t size, int prot)
529*4882a593Smuzhiyun {
530*4882a593Smuzhiyun 	unsigned int pte_count;
531*4882a593Smuzhiyun 	unsigned int pte_total = size / SPAGE_SIZE;
532*4882a593Smuzhiyun 	phys_addr_t page_phys;
533*4882a593Smuzhiyun 
534*4882a593Smuzhiyun 	assert_spin_locked(&av1_domain->dt_lock);
535*4882a593Smuzhiyun 
536*4882a593Smuzhiyun 	for (pte_count = 0; pte_count < pte_total; pte_count++) {
537*4882a593Smuzhiyun 		u32 pte = pte_addr[pte_count];
538*4882a593Smuzhiyun 
539*4882a593Smuzhiyun 		if (av1_pte_is_page_valid(pte))
540*4882a593Smuzhiyun 			goto unwind;
541*4882a593Smuzhiyun 
542*4882a593Smuzhiyun 		pte_addr[pte_count] = av1_mk_pte(paddr, prot);
543*4882a593Smuzhiyun 
544*4882a593Smuzhiyun 		paddr += SPAGE_SIZE;
545*4882a593Smuzhiyun 	}
546*4882a593Smuzhiyun 
547*4882a593Smuzhiyun 	av1_table_flush(av1_domain, pte_dma, pte_total);
548*4882a593Smuzhiyun 
549*4882a593Smuzhiyun 	return 0;
550*4882a593Smuzhiyun unwind:
551*4882a593Smuzhiyun 	/* Unmap the range of iovas that we just mapped */
552*4882a593Smuzhiyun 	av1_iommu_unmap_iova(av1_domain, pte_addr, pte_dma,
553*4882a593Smuzhiyun 			    pte_count * SPAGE_SIZE);
554*4882a593Smuzhiyun 
555*4882a593Smuzhiyun 	iova += pte_count * SPAGE_SIZE;
556*4882a593Smuzhiyun 	page_phys = av1_pte_page_address(pte_addr[pte_count]);
557*4882a593Smuzhiyun 	pr_err("iova: %pad already mapped to %pa cannot remap to phys: %pa prot: %#x\n",
558*4882a593Smuzhiyun 	       &iova, &page_phys, &paddr, prot);
559*4882a593Smuzhiyun 
560*4882a593Smuzhiyun 	return -EADDRINUSE;
561*4882a593Smuzhiyun }
562*4882a593Smuzhiyun 
av1_iommu_unmap(struct iommu_domain * domain,unsigned long _iova,size_t size,struct iommu_iotlb_gather * gather)563*4882a593Smuzhiyun static size_t av1_iommu_unmap(struct iommu_domain *domain, unsigned long _iova,
564*4882a593Smuzhiyun 			      size_t size, struct iommu_iotlb_gather *gather)
565*4882a593Smuzhiyun {
566*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain = to_av1_domain(domain);
567*4882a593Smuzhiyun 	unsigned long flags;
568*4882a593Smuzhiyun 	dma_addr_t pte_dma, iova = (dma_addr_t)_iova;
569*4882a593Smuzhiyun 	phys_addr_t pt_phys;
570*4882a593Smuzhiyun 	u32 dte;
571*4882a593Smuzhiyun 	u32 *pte_addr;
572*4882a593Smuzhiyun 	size_t unmap_size;
573*4882a593Smuzhiyun 
574*4882a593Smuzhiyun 	spin_lock_irqsave(&av1_domain->dt_lock, flags);
575*4882a593Smuzhiyun 
576*4882a593Smuzhiyun 	dte = av1_domain->dt[av1_iova_dte_index(iova)];
577*4882a593Smuzhiyun 	/* Just return 0 if iova is unmapped */
578*4882a593Smuzhiyun 	if (!av1_dte_is_pt_valid(dte)) {
579*4882a593Smuzhiyun 		spin_unlock_irqrestore(&av1_domain->dt_lock, flags);
580*4882a593Smuzhiyun 		return 0;
581*4882a593Smuzhiyun 	}
582*4882a593Smuzhiyun 
583*4882a593Smuzhiyun 	pt_phys = av1_dte_pt_address(dte);
584*4882a593Smuzhiyun 	pte_addr = (u32 *)phys_to_virt(pt_phys) + av1_iova_pte_index(iova);
585*4882a593Smuzhiyun 	pte_dma = pt_phys + av1_iova_pte_index(iova) * sizeof(u32);
586*4882a593Smuzhiyun 	unmap_size = av1_iommu_unmap_iova(av1_domain, pte_addr, pte_dma, size);
587*4882a593Smuzhiyun 
588*4882a593Smuzhiyun 	spin_unlock_irqrestore(&av1_domain->dt_lock, flags);
589*4882a593Smuzhiyun 
590*4882a593Smuzhiyun 	return unmap_size;
591*4882a593Smuzhiyun }
592*4882a593Smuzhiyun 
av1_iommu_map(struct iommu_domain * domain,unsigned long _iova,phys_addr_t paddr,size_t size,int prot,gfp_t gfp)593*4882a593Smuzhiyun static int av1_iommu_map(struct iommu_domain *domain, unsigned long _iova,
594*4882a593Smuzhiyun 			    phys_addr_t paddr, size_t size, int prot, gfp_t gfp)
595*4882a593Smuzhiyun {
596*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain = to_av1_domain(domain);
597*4882a593Smuzhiyun 	unsigned long flags;
598*4882a593Smuzhiyun 	dma_addr_t pte_dma, iova = (dma_addr_t)_iova;
599*4882a593Smuzhiyun 	u32 *page_table, *pte_addr;
600*4882a593Smuzhiyun 	u32 dte, pte_index;
601*4882a593Smuzhiyun 	int ret;
602*4882a593Smuzhiyun 
603*4882a593Smuzhiyun 	spin_lock_irqsave(&av1_domain->dt_lock, flags);
604*4882a593Smuzhiyun 
605*4882a593Smuzhiyun 	page_table = av1_dte_get_page_table(av1_domain, iova);
606*4882a593Smuzhiyun 	if (IS_ERR(page_table)) {
607*4882a593Smuzhiyun 		spin_unlock_irqrestore(&av1_domain->dt_lock, flags);
608*4882a593Smuzhiyun 		return PTR_ERR(page_table);
609*4882a593Smuzhiyun 	}
610*4882a593Smuzhiyun 
611*4882a593Smuzhiyun 	dte = av1_domain->dt[av1_iova_dte_index(iova)];
612*4882a593Smuzhiyun 	pte_index = av1_iova_pte_index(iova);
613*4882a593Smuzhiyun 	pte_addr = &page_table[pte_index];
614*4882a593Smuzhiyun 	pte_dma = av1_dte_pt_address(dte) + pte_index * sizeof(u32);
615*4882a593Smuzhiyun 	ret = av1_iommu_map_iova(av1_domain, pte_addr, pte_dma, iova,
616*4882a593Smuzhiyun 				   paddr, size, prot);
617*4882a593Smuzhiyun 
618*4882a593Smuzhiyun 	spin_unlock_irqrestore(&av1_domain->dt_lock, flags);
619*4882a593Smuzhiyun 
620*4882a593Smuzhiyun 	return ret;
621*4882a593Smuzhiyun }
622*4882a593Smuzhiyun 
av1_iommu_detach_device(struct iommu_domain * domain,struct device * dev)623*4882a593Smuzhiyun static void av1_iommu_detach_device(struct iommu_domain *domain,
624*4882a593Smuzhiyun 						  struct device *dev)
625*4882a593Smuzhiyun {
626*4882a593Smuzhiyun 	struct av1_iommu *iommu;
627*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain = to_av1_domain(domain);
628*4882a593Smuzhiyun 	unsigned long flags;
629*4882a593Smuzhiyun 	int ret;
630*4882a593Smuzhiyun 
631*4882a593Smuzhiyun 	/* Allow 'virtual devices' (eg drm) to detach from domain */
632*4882a593Smuzhiyun 	iommu = av1_iommu_from_dev(dev);
633*4882a593Smuzhiyun 	if (WARN_ON(!iommu))
634*4882a593Smuzhiyun 		return;
635*4882a593Smuzhiyun 
636*4882a593Smuzhiyun 	dev_dbg(dev, "Detaching from iommu domain\n");
637*4882a593Smuzhiyun 
638*4882a593Smuzhiyun 	if (!iommu->domain)
639*4882a593Smuzhiyun 		return;
640*4882a593Smuzhiyun 
641*4882a593Smuzhiyun 	spin_lock_irqsave(&av1_domain->iommus_lock, flags);
642*4882a593Smuzhiyun 	list_del_init(&iommu->node);
643*4882a593Smuzhiyun 	spin_unlock_irqrestore(&av1_domain->iommus_lock, flags);
644*4882a593Smuzhiyun 
645*4882a593Smuzhiyun 	ret = pm_runtime_get_if_in_use(iommu->dev);
646*4882a593Smuzhiyun 	WARN_ON_ONCE(ret < 0);
647*4882a593Smuzhiyun 	if (ret > 0) {
648*4882a593Smuzhiyun 		av1_iommu_disable(iommu);
649*4882a593Smuzhiyun 		pm_runtime_put(iommu->dev);
650*4882a593Smuzhiyun 	}
651*4882a593Smuzhiyun 	iommu->domain = NULL;
652*4882a593Smuzhiyun }
653*4882a593Smuzhiyun 
av1_iommu_attach_device(struct iommu_domain * domain,struct device * dev)654*4882a593Smuzhiyun static int av1_iommu_attach_device(struct iommu_domain *domain,
655*4882a593Smuzhiyun 						  struct device *dev)
656*4882a593Smuzhiyun {
657*4882a593Smuzhiyun 	struct av1_iommu *iommu;
658*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain = to_av1_domain(domain);
659*4882a593Smuzhiyun 	unsigned long flags;
660*4882a593Smuzhiyun 	int ret;
661*4882a593Smuzhiyun 
662*4882a593Smuzhiyun 	iommu = av1_iommu_from_dev(dev);
663*4882a593Smuzhiyun 	if (WARN_ON(!iommu))
664*4882a593Smuzhiyun 		return -ENODEV;
665*4882a593Smuzhiyun 
666*4882a593Smuzhiyun 	if (iommu->domain)
667*4882a593Smuzhiyun 		av1_iommu_detach_device(iommu->domain, dev);
668*4882a593Smuzhiyun 
669*4882a593Smuzhiyun 	iommu->domain = domain;
670*4882a593Smuzhiyun 
671*4882a593Smuzhiyun 	/* Attach NULL for disable iommu */
672*4882a593Smuzhiyun 	if (!domain)
673*4882a593Smuzhiyun 		return 0;
674*4882a593Smuzhiyun 
675*4882a593Smuzhiyun 	spin_lock_irqsave(&av1_domain->iommus_lock, flags);
676*4882a593Smuzhiyun 	list_add_tail(&iommu->node, &av1_domain->iommus);
677*4882a593Smuzhiyun 	spin_unlock_irqrestore(&av1_domain->iommus_lock, flags);
678*4882a593Smuzhiyun 
679*4882a593Smuzhiyun 	ret = pm_runtime_get_if_in_use(iommu->dev);
680*4882a593Smuzhiyun 	if (!ret || WARN_ON_ONCE(ret < 0))
681*4882a593Smuzhiyun 		return 0;
682*4882a593Smuzhiyun 
683*4882a593Smuzhiyun 	ret = av1_iommu_enable(iommu);
684*4882a593Smuzhiyun 	if (ret)
685*4882a593Smuzhiyun 		av1_iommu_detach_device(iommu->domain, dev);
686*4882a593Smuzhiyun 
687*4882a593Smuzhiyun 	pm_runtime_put(iommu->dev);
688*4882a593Smuzhiyun 
689*4882a593Smuzhiyun 	return ret;
690*4882a593Smuzhiyun }
691*4882a593Smuzhiyun 
av1_iommu_domain_free(struct iommu_domain * domain)692*4882a593Smuzhiyun static void av1_iommu_domain_free(struct iommu_domain *domain)
693*4882a593Smuzhiyun {
694*4882a593Smuzhiyun 	struct av1_iommu_domain *av1_domain = to_av1_domain(domain);
695*4882a593Smuzhiyun 	int i;
696*4882a593Smuzhiyun 
697*4882a593Smuzhiyun 	WARN_ON(!list_empty(&av1_domain->iommus));
698*4882a593Smuzhiyun 
699*4882a593Smuzhiyun 	for (i = 0; i < NUM_DT_ENTRIES; i++) {
700*4882a593Smuzhiyun 		u32 dte = av1_domain->dt[i];
701*4882a593Smuzhiyun 
702*4882a593Smuzhiyun 		if (av1_dte_is_pt_valid(dte)) {
703*4882a593Smuzhiyun 			phys_addr_t pt_phys = av1_dte_pt_address(dte);
704*4882a593Smuzhiyun 			u32 *page_table = phys_to_virt(pt_phys);
705*4882a593Smuzhiyun 
706*4882a593Smuzhiyun 			dma_unmap_single(dma_dev, pt_phys,
707*4882a593Smuzhiyun 					 SPAGE_SIZE, DMA_TO_DEVICE);
708*4882a593Smuzhiyun 			free_page((unsigned long)page_table);
709*4882a593Smuzhiyun 		}
710*4882a593Smuzhiyun 	}
711*4882a593Smuzhiyun 
712*4882a593Smuzhiyun 	dma_unmap_single(dma_dev, av1_domain->dt_dma,
713*4882a593Smuzhiyun 			 SPAGE_SIZE, DMA_TO_DEVICE);
714*4882a593Smuzhiyun 	free_page((unsigned long)av1_domain->dt);
715*4882a593Smuzhiyun 
716*4882a593Smuzhiyun 	dma_unmap_single(dma_dev, av1_domain->pta_dma,
717*4882a593Smuzhiyun 			 SPAGE_SIZE, DMA_TO_DEVICE);
718*4882a593Smuzhiyun 	free_page((unsigned long)av1_domain->pta);
719*4882a593Smuzhiyun 
720*4882a593Smuzhiyun 	if (domain->type == IOMMU_DOMAIN_DMA)
721*4882a593Smuzhiyun 		iommu_put_dma_cookie(&av1_domain->domain);
722*4882a593Smuzhiyun 	kfree(av1_domain);
723*4882a593Smuzhiyun }
724*4882a593Smuzhiyun 
av1_iommu_probe_device(struct device * dev)725*4882a593Smuzhiyun static struct iommu_device *av1_iommu_probe_device(struct device *dev)
726*4882a593Smuzhiyun {
727*4882a593Smuzhiyun 	struct av1_iommudata *data;
728*4882a593Smuzhiyun 	struct av1_iommu *iommu;
729*4882a593Smuzhiyun 
730*4882a593Smuzhiyun 	data = dev_iommu_priv_get(dev);
731*4882a593Smuzhiyun 	if (!data)
732*4882a593Smuzhiyun 		return ERR_PTR(-ENODEV);
733*4882a593Smuzhiyun 
734*4882a593Smuzhiyun 	iommu = av1_iommu_from_dev(dev);
735*4882a593Smuzhiyun 
736*4882a593Smuzhiyun 	pr_info("%s,%d, consumer : %s, supplier : %s\n",
737*4882a593Smuzhiyun 		__func__, __LINE__, dev_name(dev), dev_name(iommu->dev));
738*4882a593Smuzhiyun 
739*4882a593Smuzhiyun 	/*
740*4882a593Smuzhiyun 	 * link will free by platform_device_del(master) via
741*4882a593Smuzhiyun 	 * BUS_NOTIFY_REMOVED_DEVICE
742*4882a593Smuzhiyun 	 */
743*4882a593Smuzhiyun 	data->link = device_link_add(dev, iommu->dev,
744*4882a593Smuzhiyun 				     DL_FLAG_STATELESS | DL_FLAG_PM_RUNTIME);
745*4882a593Smuzhiyun 
746*4882a593Smuzhiyun 	/* set max segment size for dev, needed for single chunk map */
747*4882a593Smuzhiyun 	if (!dev->dma_parms)
748*4882a593Smuzhiyun 		dev->dma_parms = kzalloc(sizeof(*dev->dma_parms), GFP_KERNEL);
749*4882a593Smuzhiyun 	if (!dev->dma_parms)
750*4882a593Smuzhiyun 		return ERR_PTR(-ENOMEM);
751*4882a593Smuzhiyun 
752*4882a593Smuzhiyun 	dma_set_max_seg_size(dev, DMA_BIT_MASK(32));
753*4882a593Smuzhiyun 
754*4882a593Smuzhiyun 	return &iommu->iommu;
755*4882a593Smuzhiyun }
756*4882a593Smuzhiyun 
av1_iommu_release_device(struct device * dev)757*4882a593Smuzhiyun static void av1_iommu_release_device(struct device *dev)
758*4882a593Smuzhiyun {
759*4882a593Smuzhiyun 	const struct iommu_ops *ops = dev->bus->iommu_ops;
760*4882a593Smuzhiyun 
761*4882a593Smuzhiyun 	/* hack for rmmod */
762*4882a593Smuzhiyun 	__module_get(ops->owner);
763*4882a593Smuzhiyun }
764*4882a593Smuzhiyun 
av1_iommu_device_group(struct device * dev)765*4882a593Smuzhiyun static struct iommu_group *av1_iommu_device_group(struct device *dev)
766*4882a593Smuzhiyun {
767*4882a593Smuzhiyun 	struct av1_iommu *iommu;
768*4882a593Smuzhiyun 
769*4882a593Smuzhiyun 	iommu = av1_iommu_from_dev(dev);
770*4882a593Smuzhiyun 
771*4882a593Smuzhiyun 	return iommu_group_ref_get(iommu->group);
772*4882a593Smuzhiyun }
773*4882a593Smuzhiyun 
av1_iommu_of_xlate(struct device * dev,struct of_phandle_args * args)774*4882a593Smuzhiyun static int av1_iommu_of_xlate(struct device *dev,
775*4882a593Smuzhiyun 			     struct of_phandle_args *args)
776*4882a593Smuzhiyun {
777*4882a593Smuzhiyun 	struct platform_device *iommu_dev;
778*4882a593Smuzhiyun 	struct av1_iommudata *data;
779*4882a593Smuzhiyun 
780*4882a593Smuzhiyun 	data = devm_kzalloc(dma_dev, sizeof(*data), GFP_KERNEL);
781*4882a593Smuzhiyun 	if (!data)
782*4882a593Smuzhiyun 		return -ENOMEM;
783*4882a593Smuzhiyun 
784*4882a593Smuzhiyun 	dev_info(dev, "%s,%d\n", __func__, __LINE__);
785*4882a593Smuzhiyun 	iommu_dev = of_find_device_by_node(args->np);
786*4882a593Smuzhiyun 
787*4882a593Smuzhiyun 	data->iommu = platform_get_drvdata(iommu_dev);
788*4882a593Smuzhiyun 
789*4882a593Smuzhiyun 	dev_iommu_priv_set(dev, data);
790*4882a593Smuzhiyun 
791*4882a593Smuzhiyun 	platform_device_put(iommu_dev);
792*4882a593Smuzhiyun 
793*4882a593Smuzhiyun 	return 0;
794*4882a593Smuzhiyun }
795*4882a593Smuzhiyun 
av1_iommu_probe_finalize(struct device * dev)796*4882a593Smuzhiyun static void av1_iommu_probe_finalize(struct device *dev)
797*4882a593Smuzhiyun {
798*4882a593Smuzhiyun 	const struct iommu_ops *ops = dev->bus->iommu_ops;
799*4882a593Smuzhiyun 
800*4882a593Smuzhiyun 	/* hack for rmmod */
801*4882a593Smuzhiyun 	module_put(ops->owner);
802*4882a593Smuzhiyun }
803*4882a593Smuzhiyun 
804*4882a593Smuzhiyun static struct iommu_ops av1_iommu_ops = {
805*4882a593Smuzhiyun 	.domain_alloc = av1_iommu_domain_alloc,
806*4882a593Smuzhiyun 	.domain_free = av1_iommu_domain_free,
807*4882a593Smuzhiyun 	.attach_dev = av1_iommu_attach_device,
808*4882a593Smuzhiyun 	.detach_dev = av1_iommu_detach_device,
809*4882a593Smuzhiyun 	.map = av1_iommu_map,
810*4882a593Smuzhiyun 	.unmap = av1_iommu_unmap,
811*4882a593Smuzhiyun 	.flush_iotlb_all = av1_iommu_flush_tlb_all,
812*4882a593Smuzhiyun 	.probe_device = av1_iommu_probe_device,
813*4882a593Smuzhiyun 	.release_device = av1_iommu_release_device,
814*4882a593Smuzhiyun 	.iova_to_phys = av1_iommu_iova_to_phys,
815*4882a593Smuzhiyun 	.is_attach_deferred = av1_iommu_is_attach_deferred,
816*4882a593Smuzhiyun 	.device_group = av1_iommu_device_group,
817*4882a593Smuzhiyun 	.pgsize_bitmap = AV1_IOMMU_PGSIZE_BITMAP,
818*4882a593Smuzhiyun 	.of_xlate = av1_iommu_of_xlate,
819*4882a593Smuzhiyun 	.probe_finalize = av1_iommu_probe_finalize,
820*4882a593Smuzhiyun };
821*4882a593Smuzhiyun 
822*4882a593Smuzhiyun static const struct of_device_id av1_iommu_dt_ids[] = {
823*4882a593Smuzhiyun 	{
824*4882a593Smuzhiyun 		.compatible = "rockchip,iommu-av1",
825*4882a593Smuzhiyun 	},
826*4882a593Smuzhiyun 	{ /* sentinel */ }
827*4882a593Smuzhiyun };
828*4882a593Smuzhiyun 
av1_iommu_probe(struct platform_device * pdev)829*4882a593Smuzhiyun static int av1_iommu_probe(struct platform_device *pdev)
830*4882a593Smuzhiyun {
831*4882a593Smuzhiyun 	struct device *dev = &pdev->dev;
832*4882a593Smuzhiyun 	struct av1_iommu *iommu;
833*4882a593Smuzhiyun 	struct resource *res;
834*4882a593Smuzhiyun 	int num_res = pdev->num_resources;
835*4882a593Smuzhiyun 	int err, i;
836*4882a593Smuzhiyun 	const struct of_device_id *match;
837*4882a593Smuzhiyun 
838*4882a593Smuzhiyun 	iommu = devm_kzalloc(dev, sizeof(*iommu), GFP_KERNEL);
839*4882a593Smuzhiyun 	if (!iommu)
840*4882a593Smuzhiyun 		return -ENOMEM;
841*4882a593Smuzhiyun 
842*4882a593Smuzhiyun 	match = of_match_device(av1_iommu_dt_ids, dev);
843*4882a593Smuzhiyun 	if (!match)
844*4882a593Smuzhiyun 		return -EINVAL;
845*4882a593Smuzhiyun 
846*4882a593Smuzhiyun 	platform_set_drvdata(pdev, iommu);
847*4882a593Smuzhiyun 	iommu->dev = dev;
848*4882a593Smuzhiyun 	iommu->num_mmu = 0;
849*4882a593Smuzhiyun 
850*4882a593Smuzhiyun 	iommu->bases = devm_kcalloc(dev, num_res, sizeof(*iommu->bases),
851*4882a593Smuzhiyun 				    GFP_KERNEL);
852*4882a593Smuzhiyun 	if (!iommu->bases)
853*4882a593Smuzhiyun 		return -ENOMEM;
854*4882a593Smuzhiyun 
855*4882a593Smuzhiyun 	for (i = 0; i < num_res; i++) {
856*4882a593Smuzhiyun 		res = platform_get_resource(pdev, IORESOURCE_MEM, i);
857*4882a593Smuzhiyun 		if (!res)
858*4882a593Smuzhiyun 			continue;
859*4882a593Smuzhiyun 		iommu->bases[i] = devm_ioremap_resource(&pdev->dev, res);
860*4882a593Smuzhiyun 		if (IS_ERR(iommu->bases[i]))
861*4882a593Smuzhiyun 			continue;
862*4882a593Smuzhiyun 		iommu->num_mmu++;
863*4882a593Smuzhiyun 	}
864*4882a593Smuzhiyun 	if (iommu->num_mmu == 0)
865*4882a593Smuzhiyun 		return PTR_ERR(iommu->bases[0]);
866*4882a593Smuzhiyun 
867*4882a593Smuzhiyun 	iommu->num_irq = platform_irq_count(pdev);
868*4882a593Smuzhiyun 	if (iommu->num_irq < 0)
869*4882a593Smuzhiyun 		return iommu->num_irq;
870*4882a593Smuzhiyun 
871*4882a593Smuzhiyun 	err = devm_clk_bulk_get_all(dev, &iommu->clocks);
872*4882a593Smuzhiyun 	if (err >= 0)
873*4882a593Smuzhiyun 		iommu->num_clocks = err;
874*4882a593Smuzhiyun 	else if (err == -ENOENT)
875*4882a593Smuzhiyun 		iommu->num_clocks = 0;
876*4882a593Smuzhiyun 	else
877*4882a593Smuzhiyun 		return err;
878*4882a593Smuzhiyun 
879*4882a593Smuzhiyun 	err = clk_bulk_prepare(iommu->num_clocks, iommu->clocks);
880*4882a593Smuzhiyun 	if (err)
881*4882a593Smuzhiyun 		return err;
882*4882a593Smuzhiyun 
883*4882a593Smuzhiyun 	iommu->group = iommu_group_alloc();
884*4882a593Smuzhiyun 	if (IS_ERR(iommu->group)) {
885*4882a593Smuzhiyun 		err = PTR_ERR(iommu->group);
886*4882a593Smuzhiyun 		goto err_unprepare_clocks;
887*4882a593Smuzhiyun 	}
888*4882a593Smuzhiyun 
889*4882a593Smuzhiyun 	err = iommu_device_sysfs_add(&iommu->iommu, dev, NULL, dev_name(dev));
890*4882a593Smuzhiyun 	if (err)
891*4882a593Smuzhiyun 		goto err_put_group;
892*4882a593Smuzhiyun 
893*4882a593Smuzhiyun 	iommu_device_set_ops(&iommu->iommu, &av1_iommu_ops);
894*4882a593Smuzhiyun 	iommu_device_set_fwnode(&iommu->iommu, &dev->of_node->fwnode);
895*4882a593Smuzhiyun 
896*4882a593Smuzhiyun 	err = iommu_device_register(&iommu->iommu);
897*4882a593Smuzhiyun 	if (err)
898*4882a593Smuzhiyun 		goto err_remove_sysfs;
899*4882a593Smuzhiyun 
900*4882a593Smuzhiyun 	if (!dma_dev)
901*4882a593Smuzhiyun 		dma_dev = &pdev->dev;
902*4882a593Smuzhiyun 
903*4882a593Smuzhiyun 	bus_set_iommu(&av1dec_bus, &av1_iommu_ops);
904*4882a593Smuzhiyun 
905*4882a593Smuzhiyun 	pm_runtime_enable(dev);
906*4882a593Smuzhiyun 
907*4882a593Smuzhiyun 	for (i = 0; i < iommu->num_irq; i++) {
908*4882a593Smuzhiyun 		int irq = platform_get_irq(pdev, i);
909*4882a593Smuzhiyun 
910*4882a593Smuzhiyun 		if (irq < 0) {
911*4882a593Smuzhiyun 			err = -ENODEV;
912*4882a593Smuzhiyun 			goto err_diable_runtime;
913*4882a593Smuzhiyun 		}
914*4882a593Smuzhiyun 
915*4882a593Smuzhiyun 		err = devm_request_irq(iommu->dev, irq, av1_iommu_irq,
916*4882a593Smuzhiyun 				       IRQF_SHARED, dev_name(dev), iommu);
917*4882a593Smuzhiyun 		if (err)
918*4882a593Smuzhiyun 			goto err_diable_runtime;
919*4882a593Smuzhiyun 
920*4882a593Smuzhiyun 	}
921*4882a593Smuzhiyun 
922*4882a593Smuzhiyun 	return 0;
923*4882a593Smuzhiyun err_diable_runtime:
924*4882a593Smuzhiyun 	pm_runtime_disable(dev);
925*4882a593Smuzhiyun 	iommu_device_unregister(&iommu->iommu);
926*4882a593Smuzhiyun err_remove_sysfs:
927*4882a593Smuzhiyun 	iommu_device_sysfs_remove(&iommu->iommu);
928*4882a593Smuzhiyun err_put_group:
929*4882a593Smuzhiyun 	iommu_group_put(iommu->group);
930*4882a593Smuzhiyun err_unprepare_clocks:
931*4882a593Smuzhiyun 	clk_bulk_unprepare(iommu->num_clocks, iommu->clocks);
932*4882a593Smuzhiyun 	return err;
933*4882a593Smuzhiyun }
934*4882a593Smuzhiyun 
av1_iommu_remove(struct platform_device * pdev)935*4882a593Smuzhiyun static int av1_iommu_remove(struct platform_device *pdev)
936*4882a593Smuzhiyun {
937*4882a593Smuzhiyun 	struct device *dev = &pdev->dev;
938*4882a593Smuzhiyun 	struct av1_iommu *iommu = platform_get_drvdata(pdev);
939*4882a593Smuzhiyun 
940*4882a593Smuzhiyun 	iommu_device_unregister(&iommu->iommu);
941*4882a593Smuzhiyun 	iommu_device_sysfs_remove(&iommu->iommu);
942*4882a593Smuzhiyun 	pm_runtime_disable(dev);
943*4882a593Smuzhiyun 	return 0;
944*4882a593Smuzhiyun }
945*4882a593Smuzhiyun 
av1_iommu_shutdown(struct platform_device * pdev)946*4882a593Smuzhiyun static void av1_iommu_shutdown(struct platform_device *pdev)
947*4882a593Smuzhiyun {
948*4882a593Smuzhiyun 	struct av1_iommu *iommu = platform_get_drvdata(pdev);
949*4882a593Smuzhiyun 	int i;
950*4882a593Smuzhiyun 
951*4882a593Smuzhiyun 	for (i = 0; i < iommu->num_irq; i++) {
952*4882a593Smuzhiyun 		int irq = platform_get_irq(pdev, i);
953*4882a593Smuzhiyun 
954*4882a593Smuzhiyun 		devm_free_irq(iommu->dev, irq, iommu);
955*4882a593Smuzhiyun 	}
956*4882a593Smuzhiyun 
957*4882a593Smuzhiyun 	pm_runtime_force_suspend(&pdev->dev);
958*4882a593Smuzhiyun }
959*4882a593Smuzhiyun 
av1_iommu_suspend(struct device * dev)960*4882a593Smuzhiyun static int __maybe_unused av1_iommu_suspend(struct device *dev)
961*4882a593Smuzhiyun {
962*4882a593Smuzhiyun 	struct av1_iommu *iommu = dev_get_drvdata(dev);
963*4882a593Smuzhiyun 
964*4882a593Smuzhiyun 	if (!iommu->domain)
965*4882a593Smuzhiyun 		return 0;
966*4882a593Smuzhiyun 
967*4882a593Smuzhiyun 	av1_iommu_disable(iommu);
968*4882a593Smuzhiyun 	return 0;
969*4882a593Smuzhiyun }
970*4882a593Smuzhiyun 
av1_iommu_resume(struct device * dev)971*4882a593Smuzhiyun static int __maybe_unused av1_iommu_resume(struct device *dev)
972*4882a593Smuzhiyun {
973*4882a593Smuzhiyun 	struct av1_iommu *iommu = dev_get_drvdata(dev);
974*4882a593Smuzhiyun 
975*4882a593Smuzhiyun 	if (!iommu->domain)
976*4882a593Smuzhiyun 		return 0;
977*4882a593Smuzhiyun 
978*4882a593Smuzhiyun 	return av1_iommu_enable(iommu);
979*4882a593Smuzhiyun }
980*4882a593Smuzhiyun 
981*4882a593Smuzhiyun static const struct dev_pm_ops av1_iommu_pm_ops = {
982*4882a593Smuzhiyun 	SET_RUNTIME_PM_OPS(av1_iommu_suspend, av1_iommu_resume, NULL)
983*4882a593Smuzhiyun 	SET_SYSTEM_SLEEP_PM_OPS(pm_runtime_force_suspend,
984*4882a593Smuzhiyun 				pm_runtime_force_resume)
985*4882a593Smuzhiyun };
986*4882a593Smuzhiyun 
987*4882a593Smuzhiyun struct platform_driver rockchip_av1_iommu_driver = {
988*4882a593Smuzhiyun 	.probe = av1_iommu_probe,
989*4882a593Smuzhiyun 	.remove = av1_iommu_remove,
990*4882a593Smuzhiyun 	.shutdown = av1_iommu_shutdown,
991*4882a593Smuzhiyun 	.driver = {
992*4882a593Smuzhiyun 		   .name = "av1_iommu",
993*4882a593Smuzhiyun 		   .of_match_table = av1_iommu_dt_ids,
994*4882a593Smuzhiyun 		   .pm = &av1_iommu_pm_ops,
995*4882a593Smuzhiyun 		   .suppress_bind_attrs = true,
996*4882a593Smuzhiyun 	},
997*4882a593Smuzhiyun };
998