xref: /OK3568_Linux_fs/kernel/drivers/dma/mv_xor_v2.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Copyright (C) 2015-2016 Marvell International Ltd.
4*4882a593Smuzhiyun 
5*4882a593Smuzhiyun  */
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun #include <linux/clk.h>
8*4882a593Smuzhiyun #include <linux/dma-mapping.h>
9*4882a593Smuzhiyun #include <linux/interrupt.h>
10*4882a593Smuzhiyun #include <linux/io.h>
11*4882a593Smuzhiyun #include <linux/module.h>
12*4882a593Smuzhiyun #include <linux/msi.h>
13*4882a593Smuzhiyun #include <linux/of.h>
14*4882a593Smuzhiyun #include <linux/of_irq.h>
15*4882a593Smuzhiyun #include <linux/platform_device.h>
16*4882a593Smuzhiyun #include <linux/spinlock.h>
17*4882a593Smuzhiyun 
18*4882a593Smuzhiyun #include "dmaengine.h"
19*4882a593Smuzhiyun 
20*4882a593Smuzhiyun /* DMA Engine Registers */
21*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_BALR_OFF			0x000
22*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_BAHR_OFF			0x004
23*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_SIZE_OFF			0x008
24*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_DONE_OFF			0x00C
25*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_DONE_PENDING_MASK		0x7FFF
26*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_DONE_PENDING_SHIFT		0
27*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_DONE_READ_PTR_MASK		0x1FFF
28*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_DONE_READ_PTR_SHIFT	16
29*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_ARATTR_OFF			0x010
30*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_ATTR_CACHE_MASK		0x3F3F
31*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_ATTR_OUTER_SHAREABLE	0x202
32*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_ATTR_CACHEABLE		0x3C3C
33*4882a593Smuzhiyun #define MV_XOR_V2_DMA_IMSG_CDAT_OFF			0x014
34*4882a593Smuzhiyun #define MV_XOR_V2_DMA_IMSG_THRD_OFF			0x018
35*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_IMSG_THRD_MASK			0x7FFF
36*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_IMSG_TIMER_EN			BIT(18)
37*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_AWATTR_OFF			0x01C
38*4882a593Smuzhiyun   /* Same flags as MV_XOR_V2_DMA_DESQ_ARATTR_OFF */
39*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_ALLOC_OFF			0x04C
40*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_ALLOC_WRPTR_MASK		0xFFFF
41*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_ALLOC_WRPTR_SHIFT		16
42*4882a593Smuzhiyun #define MV_XOR_V2_DMA_IMSG_BALR_OFF			0x050
43*4882a593Smuzhiyun #define MV_XOR_V2_DMA_IMSG_BAHR_OFF			0x054
44*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_CTRL_OFF			0x100
45*4882a593Smuzhiyun #define	  MV_XOR_V2_DMA_DESQ_CTRL_32B			1
46*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_DESQ_CTRL_128B			7
47*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_STOP_OFF			0x800
48*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_DEALLOC_OFF			0x804
49*4882a593Smuzhiyun #define MV_XOR_V2_DMA_DESQ_ADD_OFF			0x808
50*4882a593Smuzhiyun #define MV_XOR_V2_DMA_IMSG_TMOT				0x810
51*4882a593Smuzhiyun #define   MV_XOR_V2_DMA_IMSG_TIMER_THRD_MASK		0x1FFF
52*4882a593Smuzhiyun 
53*4882a593Smuzhiyun /* XOR Global registers */
54*4882a593Smuzhiyun #define MV_XOR_V2_GLOB_BW_CTRL				0x4
55*4882a593Smuzhiyun #define   MV_XOR_V2_GLOB_BW_CTRL_NUM_OSTD_RD_SHIFT	0
56*4882a593Smuzhiyun #define   MV_XOR_V2_GLOB_BW_CTRL_NUM_OSTD_RD_VAL	64
57*4882a593Smuzhiyun #define   MV_XOR_V2_GLOB_BW_CTRL_NUM_OSTD_WR_SHIFT	8
58*4882a593Smuzhiyun #define   MV_XOR_V2_GLOB_BW_CTRL_NUM_OSTD_WR_VAL	8
59*4882a593Smuzhiyun #define   MV_XOR_V2_GLOB_BW_CTRL_RD_BURST_LEN_SHIFT	12
60*4882a593Smuzhiyun #define   MV_XOR_V2_GLOB_BW_CTRL_RD_BURST_LEN_VAL	4
61*4882a593Smuzhiyun #define   MV_XOR_V2_GLOB_BW_CTRL_WR_BURST_LEN_SHIFT	16
62*4882a593Smuzhiyun #define	  MV_XOR_V2_GLOB_BW_CTRL_WR_BURST_LEN_VAL	4
63*4882a593Smuzhiyun #define MV_XOR_V2_GLOB_PAUSE				0x014
64*4882a593Smuzhiyun #define   MV_XOR_V2_GLOB_PAUSE_AXI_TIME_DIS_VAL		0x8
65*4882a593Smuzhiyun #define MV_XOR_V2_GLOB_SYS_INT_CAUSE			0x200
66*4882a593Smuzhiyun #define MV_XOR_V2_GLOB_SYS_INT_MASK			0x204
67*4882a593Smuzhiyun #define MV_XOR_V2_GLOB_MEM_INT_CAUSE			0x220
68*4882a593Smuzhiyun #define MV_XOR_V2_GLOB_MEM_INT_MASK			0x224
69*4882a593Smuzhiyun 
70*4882a593Smuzhiyun #define MV_XOR_V2_MIN_DESC_SIZE				32
71*4882a593Smuzhiyun #define MV_XOR_V2_EXT_DESC_SIZE				128
72*4882a593Smuzhiyun 
73*4882a593Smuzhiyun #define MV_XOR_V2_DESC_RESERVED_SIZE			12
74*4882a593Smuzhiyun #define MV_XOR_V2_DESC_BUFF_D_ADDR_SIZE			12
75*4882a593Smuzhiyun 
76*4882a593Smuzhiyun #define MV_XOR_V2_CMD_LINE_NUM_MAX_D_BUF		8
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun /*
79*4882a593Smuzhiyun  * Descriptors queue size. With 32 bytes descriptors, up to 2^14
80*4882a593Smuzhiyun  * descriptors are allowed, with 128 bytes descriptors, up to 2^12
81*4882a593Smuzhiyun  * descriptors are allowed. This driver uses 128 bytes descriptors,
82*4882a593Smuzhiyun  * but experimentation has shown that a set of 1024 descriptors is
83*4882a593Smuzhiyun  * sufficient to reach a good level of performance.
84*4882a593Smuzhiyun  */
85*4882a593Smuzhiyun #define MV_XOR_V2_DESC_NUM				1024
86*4882a593Smuzhiyun 
87*4882a593Smuzhiyun /*
88*4882a593Smuzhiyun  * Threshold values for descriptors and timeout, determined by
89*4882a593Smuzhiyun  * experimentation as giving a good level of performance.
90*4882a593Smuzhiyun  */
91*4882a593Smuzhiyun #define MV_XOR_V2_DONE_IMSG_THRD  0x14
92*4882a593Smuzhiyun #define MV_XOR_V2_TIMER_THRD      0xB0
93*4882a593Smuzhiyun 
94*4882a593Smuzhiyun /**
95*4882a593Smuzhiyun  * struct mv_xor_v2_descriptor - DMA HW descriptor
96*4882a593Smuzhiyun  * @desc_id: used by S/W and is not affected by H/W.
97*4882a593Smuzhiyun  * @flags: error and status flags
98*4882a593Smuzhiyun  * @crc32_result: CRC32 calculation result
99*4882a593Smuzhiyun  * @desc_ctrl: operation mode and control flags
100*4882a593Smuzhiyun  * @buff_size: amount of bytes to be processed
101*4882a593Smuzhiyun  * @fill_pattern_src_addr: Fill-Pattern or Source-Address and
102*4882a593Smuzhiyun  * AW-Attributes
103*4882a593Smuzhiyun  * @data_buff_addr: Source (and might be RAID6 destination)
104*4882a593Smuzhiyun  * addresses of data buffers in RAID5 and RAID6
105*4882a593Smuzhiyun  * @reserved: reserved
106*4882a593Smuzhiyun  */
107*4882a593Smuzhiyun struct mv_xor_v2_descriptor {
108*4882a593Smuzhiyun 	u16 desc_id;
109*4882a593Smuzhiyun 	u16 flags;
110*4882a593Smuzhiyun 	u32 crc32_result;
111*4882a593Smuzhiyun 	u32 desc_ctrl;
112*4882a593Smuzhiyun 
113*4882a593Smuzhiyun 	/* Definitions for desc_ctrl */
114*4882a593Smuzhiyun #define DESC_NUM_ACTIVE_D_BUF_SHIFT	22
115*4882a593Smuzhiyun #define DESC_OP_MODE_SHIFT		28
116*4882a593Smuzhiyun #define DESC_OP_MODE_NOP		0	/* Idle operation */
117*4882a593Smuzhiyun #define DESC_OP_MODE_MEMCPY		1	/* Pure-DMA operation */
118*4882a593Smuzhiyun #define DESC_OP_MODE_MEMSET		2	/* Mem-Fill operation */
119*4882a593Smuzhiyun #define DESC_OP_MODE_MEMINIT		3	/* Mem-Init operation */
120*4882a593Smuzhiyun #define DESC_OP_MODE_MEM_COMPARE	4	/* Mem-Compare operation */
121*4882a593Smuzhiyun #define DESC_OP_MODE_CRC32		5	/* CRC32 calculation */
122*4882a593Smuzhiyun #define DESC_OP_MODE_XOR		6	/* RAID5 (XOR) operation */
123*4882a593Smuzhiyun #define DESC_OP_MODE_RAID6		7	/* RAID6 P&Q-generation */
124*4882a593Smuzhiyun #define DESC_OP_MODE_RAID6_REC		8	/* RAID6 Recovery */
125*4882a593Smuzhiyun #define DESC_Q_BUFFER_ENABLE		BIT(16)
126*4882a593Smuzhiyun #define DESC_P_BUFFER_ENABLE		BIT(17)
127*4882a593Smuzhiyun #define DESC_IOD			BIT(27)
128*4882a593Smuzhiyun 
129*4882a593Smuzhiyun 	u32 buff_size;
130*4882a593Smuzhiyun 	u32 fill_pattern_src_addr[4];
131*4882a593Smuzhiyun 	u32 data_buff_addr[MV_XOR_V2_DESC_BUFF_D_ADDR_SIZE];
132*4882a593Smuzhiyun 	u32 reserved[MV_XOR_V2_DESC_RESERVED_SIZE];
133*4882a593Smuzhiyun };
134*4882a593Smuzhiyun 
135*4882a593Smuzhiyun /**
136*4882a593Smuzhiyun  * struct mv_xor_v2_device - implements a xor device
137*4882a593Smuzhiyun  * @lock: lock for the engine
138*4882a593Smuzhiyun  * @clk: reference to the 'core' clock
139*4882a593Smuzhiyun  * @reg_clk: reference to the 'reg' clock
140*4882a593Smuzhiyun  * @dma_base: memory mapped DMA register base
141*4882a593Smuzhiyun  * @glob_base: memory mapped global register base
142*4882a593Smuzhiyun  * @irq_tasklet: tasklet used for IRQ handling call-backs
143*4882a593Smuzhiyun  * @free_sw_desc: linked list of free SW descriptors
144*4882a593Smuzhiyun  * @dmadev: dma device
145*4882a593Smuzhiyun  * @dmachan: dma channel
146*4882a593Smuzhiyun  * @hw_desq: HW descriptors queue
147*4882a593Smuzhiyun  * @hw_desq_virt: virtual address of DESCQ
148*4882a593Smuzhiyun  * @sw_desq: SW descriptors queue
149*4882a593Smuzhiyun  * @desc_size: HW descriptor size
150*4882a593Smuzhiyun  * @npendings: number of pending descriptors (for which tx_submit has
151*4882a593Smuzhiyun  * @hw_queue_idx: HW queue index
152*4882a593Smuzhiyun  * @msi_desc: local interrupt descriptor information
153*4882a593Smuzhiyun  * been called, but not yet issue_pending)
154*4882a593Smuzhiyun  */
155*4882a593Smuzhiyun struct mv_xor_v2_device {
156*4882a593Smuzhiyun 	spinlock_t lock;
157*4882a593Smuzhiyun 	void __iomem *dma_base;
158*4882a593Smuzhiyun 	void __iomem *glob_base;
159*4882a593Smuzhiyun 	struct clk *clk;
160*4882a593Smuzhiyun 	struct clk *reg_clk;
161*4882a593Smuzhiyun 	struct tasklet_struct irq_tasklet;
162*4882a593Smuzhiyun 	struct list_head free_sw_desc;
163*4882a593Smuzhiyun 	struct dma_device dmadev;
164*4882a593Smuzhiyun 	struct dma_chan	dmachan;
165*4882a593Smuzhiyun 	dma_addr_t hw_desq;
166*4882a593Smuzhiyun 	struct mv_xor_v2_descriptor *hw_desq_virt;
167*4882a593Smuzhiyun 	struct mv_xor_v2_sw_desc *sw_desq;
168*4882a593Smuzhiyun 	int desc_size;
169*4882a593Smuzhiyun 	unsigned int npendings;
170*4882a593Smuzhiyun 	unsigned int hw_queue_idx;
171*4882a593Smuzhiyun 	struct msi_desc *msi_desc;
172*4882a593Smuzhiyun };
173*4882a593Smuzhiyun 
174*4882a593Smuzhiyun /**
175*4882a593Smuzhiyun  * struct mv_xor_v2_sw_desc - implements a xor SW descriptor
176*4882a593Smuzhiyun  * @idx: descriptor index
177*4882a593Smuzhiyun  * @async_tx: support for the async_tx api
178*4882a593Smuzhiyun  * @hw_desc: assosiated HW descriptor
179*4882a593Smuzhiyun  * @free_list: node of the free SW descriprots list
180*4882a593Smuzhiyun */
181*4882a593Smuzhiyun struct mv_xor_v2_sw_desc {
182*4882a593Smuzhiyun 	int idx;
183*4882a593Smuzhiyun 	struct dma_async_tx_descriptor async_tx;
184*4882a593Smuzhiyun 	struct mv_xor_v2_descriptor hw_desc;
185*4882a593Smuzhiyun 	struct list_head free_list;
186*4882a593Smuzhiyun };
187*4882a593Smuzhiyun 
188*4882a593Smuzhiyun /*
189*4882a593Smuzhiyun  * Fill the data buffers to a HW descriptor
190*4882a593Smuzhiyun  */
mv_xor_v2_set_data_buffers(struct mv_xor_v2_device * xor_dev,struct mv_xor_v2_descriptor * desc,dma_addr_t src,int index)191*4882a593Smuzhiyun static void mv_xor_v2_set_data_buffers(struct mv_xor_v2_device *xor_dev,
192*4882a593Smuzhiyun 					struct mv_xor_v2_descriptor *desc,
193*4882a593Smuzhiyun 					dma_addr_t src, int index)
194*4882a593Smuzhiyun {
195*4882a593Smuzhiyun 	int arr_index = ((index >> 1) * 3);
196*4882a593Smuzhiyun 
197*4882a593Smuzhiyun 	/*
198*4882a593Smuzhiyun 	 * Fill the buffer's addresses to the descriptor.
199*4882a593Smuzhiyun 	 *
200*4882a593Smuzhiyun 	 * The format of the buffers address for 2 sequential buffers
201*4882a593Smuzhiyun 	 * X and X + 1:
202*4882a593Smuzhiyun 	 *
203*4882a593Smuzhiyun 	 *  First word:  Buffer-DX-Address-Low[31:0]
204*4882a593Smuzhiyun 	 *  Second word: Buffer-DX+1-Address-Low[31:0]
205*4882a593Smuzhiyun 	 *  Third word:  DX+1-Buffer-Address-High[47:32] [31:16]
206*4882a593Smuzhiyun 	 *		 DX-Buffer-Address-High[47:32] [15:0]
207*4882a593Smuzhiyun 	 */
208*4882a593Smuzhiyun 	if ((index & 0x1) == 0) {
209*4882a593Smuzhiyun 		desc->data_buff_addr[arr_index] = lower_32_bits(src);
210*4882a593Smuzhiyun 
211*4882a593Smuzhiyun 		desc->data_buff_addr[arr_index + 2] &= ~0xFFFF;
212*4882a593Smuzhiyun 		desc->data_buff_addr[arr_index + 2] |=
213*4882a593Smuzhiyun 			upper_32_bits(src) & 0xFFFF;
214*4882a593Smuzhiyun 	} else {
215*4882a593Smuzhiyun 		desc->data_buff_addr[arr_index + 1] =
216*4882a593Smuzhiyun 			lower_32_bits(src);
217*4882a593Smuzhiyun 
218*4882a593Smuzhiyun 		desc->data_buff_addr[arr_index + 2] &= ~0xFFFF0000;
219*4882a593Smuzhiyun 		desc->data_buff_addr[arr_index + 2] |=
220*4882a593Smuzhiyun 			(upper_32_bits(src) & 0xFFFF) << 16;
221*4882a593Smuzhiyun 	}
222*4882a593Smuzhiyun }
223*4882a593Smuzhiyun 
224*4882a593Smuzhiyun /*
225*4882a593Smuzhiyun  * notify the engine of new descriptors, and update the available index.
226*4882a593Smuzhiyun  */
mv_xor_v2_add_desc_to_desq(struct mv_xor_v2_device * xor_dev,int num_of_desc)227*4882a593Smuzhiyun static void mv_xor_v2_add_desc_to_desq(struct mv_xor_v2_device *xor_dev,
228*4882a593Smuzhiyun 				       int num_of_desc)
229*4882a593Smuzhiyun {
230*4882a593Smuzhiyun 	/* write the number of new descriptors in the DESQ. */
231*4882a593Smuzhiyun 	writel(num_of_desc, xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_ADD_OFF);
232*4882a593Smuzhiyun }
233*4882a593Smuzhiyun 
234*4882a593Smuzhiyun /*
235*4882a593Smuzhiyun  * free HW descriptors
236*4882a593Smuzhiyun  */
mv_xor_v2_free_desc_from_desq(struct mv_xor_v2_device * xor_dev,int num_of_desc)237*4882a593Smuzhiyun static void mv_xor_v2_free_desc_from_desq(struct mv_xor_v2_device *xor_dev,
238*4882a593Smuzhiyun 					  int num_of_desc)
239*4882a593Smuzhiyun {
240*4882a593Smuzhiyun 	/* write the number of new descriptors in the DESQ. */
241*4882a593Smuzhiyun 	writel(num_of_desc, xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_DEALLOC_OFF);
242*4882a593Smuzhiyun }
243*4882a593Smuzhiyun 
244*4882a593Smuzhiyun /*
245*4882a593Smuzhiyun  * Set descriptor size
246*4882a593Smuzhiyun  * Return the HW descriptor size in bytes
247*4882a593Smuzhiyun  */
mv_xor_v2_set_desc_size(struct mv_xor_v2_device * xor_dev)248*4882a593Smuzhiyun static int mv_xor_v2_set_desc_size(struct mv_xor_v2_device *xor_dev)
249*4882a593Smuzhiyun {
250*4882a593Smuzhiyun 	writel(MV_XOR_V2_DMA_DESQ_CTRL_128B,
251*4882a593Smuzhiyun 	       xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_CTRL_OFF);
252*4882a593Smuzhiyun 
253*4882a593Smuzhiyun 	return MV_XOR_V2_EXT_DESC_SIZE;
254*4882a593Smuzhiyun }
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun /*
257*4882a593Smuzhiyun  * Set the IMSG threshold
258*4882a593Smuzhiyun  */
259*4882a593Smuzhiyun static inline
mv_xor_v2_enable_imsg_thrd(struct mv_xor_v2_device * xor_dev)260*4882a593Smuzhiyun void mv_xor_v2_enable_imsg_thrd(struct mv_xor_v2_device *xor_dev)
261*4882a593Smuzhiyun {
262*4882a593Smuzhiyun 	u32 reg;
263*4882a593Smuzhiyun 
264*4882a593Smuzhiyun 	/* Configure threshold of number of descriptors, and enable timer */
265*4882a593Smuzhiyun 	reg = readl(xor_dev->dma_base + MV_XOR_V2_DMA_IMSG_THRD_OFF);
266*4882a593Smuzhiyun 	reg &= ~MV_XOR_V2_DMA_IMSG_THRD_MASK;
267*4882a593Smuzhiyun 	reg |= MV_XOR_V2_DONE_IMSG_THRD;
268*4882a593Smuzhiyun 	reg |= MV_XOR_V2_DMA_IMSG_TIMER_EN;
269*4882a593Smuzhiyun 	writel(reg, xor_dev->dma_base + MV_XOR_V2_DMA_IMSG_THRD_OFF);
270*4882a593Smuzhiyun 
271*4882a593Smuzhiyun 	/* Configure Timer Threshold */
272*4882a593Smuzhiyun 	reg = readl(xor_dev->dma_base + MV_XOR_V2_DMA_IMSG_TMOT);
273*4882a593Smuzhiyun 	reg &= ~MV_XOR_V2_DMA_IMSG_TIMER_THRD_MASK;
274*4882a593Smuzhiyun 	reg |= MV_XOR_V2_TIMER_THRD;
275*4882a593Smuzhiyun 	writel(reg, xor_dev->dma_base + MV_XOR_V2_DMA_IMSG_TMOT);
276*4882a593Smuzhiyun }
277*4882a593Smuzhiyun 
mv_xor_v2_interrupt_handler(int irq,void * data)278*4882a593Smuzhiyun static irqreturn_t mv_xor_v2_interrupt_handler(int irq, void *data)
279*4882a593Smuzhiyun {
280*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev = data;
281*4882a593Smuzhiyun 	unsigned int ndescs;
282*4882a593Smuzhiyun 	u32 reg;
283*4882a593Smuzhiyun 
284*4882a593Smuzhiyun 	reg = readl(xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_DONE_OFF);
285*4882a593Smuzhiyun 
286*4882a593Smuzhiyun 	ndescs = ((reg >> MV_XOR_V2_DMA_DESQ_DONE_PENDING_SHIFT) &
287*4882a593Smuzhiyun 		  MV_XOR_V2_DMA_DESQ_DONE_PENDING_MASK);
288*4882a593Smuzhiyun 
289*4882a593Smuzhiyun 	/* No descriptors to process */
290*4882a593Smuzhiyun 	if (!ndescs)
291*4882a593Smuzhiyun 		return IRQ_NONE;
292*4882a593Smuzhiyun 
293*4882a593Smuzhiyun 	/* schedule a tasklet to handle descriptors callbacks */
294*4882a593Smuzhiyun 	tasklet_schedule(&xor_dev->irq_tasklet);
295*4882a593Smuzhiyun 
296*4882a593Smuzhiyun 	return IRQ_HANDLED;
297*4882a593Smuzhiyun }
298*4882a593Smuzhiyun 
299*4882a593Smuzhiyun /*
300*4882a593Smuzhiyun  * submit a descriptor to the DMA engine
301*4882a593Smuzhiyun  */
302*4882a593Smuzhiyun static dma_cookie_t
mv_xor_v2_tx_submit(struct dma_async_tx_descriptor * tx)303*4882a593Smuzhiyun mv_xor_v2_tx_submit(struct dma_async_tx_descriptor *tx)
304*4882a593Smuzhiyun {
305*4882a593Smuzhiyun 	void *dest_hw_desc;
306*4882a593Smuzhiyun 	dma_cookie_t cookie;
307*4882a593Smuzhiyun 	struct mv_xor_v2_sw_desc *sw_desc =
308*4882a593Smuzhiyun 		container_of(tx, struct mv_xor_v2_sw_desc, async_tx);
309*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev =
310*4882a593Smuzhiyun 		container_of(tx->chan, struct mv_xor_v2_device, dmachan);
311*4882a593Smuzhiyun 
312*4882a593Smuzhiyun 	dev_dbg(xor_dev->dmadev.dev,
313*4882a593Smuzhiyun 		"%s sw_desc %p: async_tx %p\n",
314*4882a593Smuzhiyun 		__func__, sw_desc, &sw_desc->async_tx);
315*4882a593Smuzhiyun 
316*4882a593Smuzhiyun 	/* assign coookie */
317*4882a593Smuzhiyun 	spin_lock_bh(&xor_dev->lock);
318*4882a593Smuzhiyun 	cookie = dma_cookie_assign(tx);
319*4882a593Smuzhiyun 
320*4882a593Smuzhiyun 	/* copy the HW descriptor from the SW descriptor to the DESQ */
321*4882a593Smuzhiyun 	dest_hw_desc = xor_dev->hw_desq_virt + xor_dev->hw_queue_idx;
322*4882a593Smuzhiyun 
323*4882a593Smuzhiyun 	memcpy(dest_hw_desc, &sw_desc->hw_desc, xor_dev->desc_size);
324*4882a593Smuzhiyun 
325*4882a593Smuzhiyun 	xor_dev->npendings++;
326*4882a593Smuzhiyun 	xor_dev->hw_queue_idx++;
327*4882a593Smuzhiyun 	if (xor_dev->hw_queue_idx >= MV_XOR_V2_DESC_NUM)
328*4882a593Smuzhiyun 		xor_dev->hw_queue_idx = 0;
329*4882a593Smuzhiyun 
330*4882a593Smuzhiyun 	spin_unlock_bh(&xor_dev->lock);
331*4882a593Smuzhiyun 
332*4882a593Smuzhiyun 	return cookie;
333*4882a593Smuzhiyun }
334*4882a593Smuzhiyun 
335*4882a593Smuzhiyun /*
336*4882a593Smuzhiyun  * Prepare a SW descriptor
337*4882a593Smuzhiyun  */
338*4882a593Smuzhiyun static struct mv_xor_v2_sw_desc	*
mv_xor_v2_prep_sw_desc(struct mv_xor_v2_device * xor_dev)339*4882a593Smuzhiyun mv_xor_v2_prep_sw_desc(struct mv_xor_v2_device *xor_dev)
340*4882a593Smuzhiyun {
341*4882a593Smuzhiyun 	struct mv_xor_v2_sw_desc *sw_desc;
342*4882a593Smuzhiyun 	bool found = false;
343*4882a593Smuzhiyun 
344*4882a593Smuzhiyun 	/* Lock the channel */
345*4882a593Smuzhiyun 	spin_lock_bh(&xor_dev->lock);
346*4882a593Smuzhiyun 
347*4882a593Smuzhiyun 	if (list_empty(&xor_dev->free_sw_desc)) {
348*4882a593Smuzhiyun 		spin_unlock_bh(&xor_dev->lock);
349*4882a593Smuzhiyun 		/* schedule tasklet to free some descriptors */
350*4882a593Smuzhiyun 		tasklet_schedule(&xor_dev->irq_tasklet);
351*4882a593Smuzhiyun 		return NULL;
352*4882a593Smuzhiyun 	}
353*4882a593Smuzhiyun 
354*4882a593Smuzhiyun 	list_for_each_entry(sw_desc, &xor_dev->free_sw_desc, free_list) {
355*4882a593Smuzhiyun 		if (async_tx_test_ack(&sw_desc->async_tx)) {
356*4882a593Smuzhiyun 			found = true;
357*4882a593Smuzhiyun 			break;
358*4882a593Smuzhiyun 		}
359*4882a593Smuzhiyun 	}
360*4882a593Smuzhiyun 
361*4882a593Smuzhiyun 	if (!found) {
362*4882a593Smuzhiyun 		spin_unlock_bh(&xor_dev->lock);
363*4882a593Smuzhiyun 		return NULL;
364*4882a593Smuzhiyun 	}
365*4882a593Smuzhiyun 
366*4882a593Smuzhiyun 	list_del(&sw_desc->free_list);
367*4882a593Smuzhiyun 
368*4882a593Smuzhiyun 	/* Release the channel */
369*4882a593Smuzhiyun 	spin_unlock_bh(&xor_dev->lock);
370*4882a593Smuzhiyun 
371*4882a593Smuzhiyun 	return sw_desc;
372*4882a593Smuzhiyun }
373*4882a593Smuzhiyun 
374*4882a593Smuzhiyun /*
375*4882a593Smuzhiyun  * Prepare a HW descriptor for a memcpy operation
376*4882a593Smuzhiyun  */
377*4882a593Smuzhiyun static struct dma_async_tx_descriptor *
mv_xor_v2_prep_dma_memcpy(struct dma_chan * chan,dma_addr_t dest,dma_addr_t src,size_t len,unsigned long flags)378*4882a593Smuzhiyun mv_xor_v2_prep_dma_memcpy(struct dma_chan *chan, dma_addr_t dest,
379*4882a593Smuzhiyun 			  dma_addr_t src, size_t len, unsigned long flags)
380*4882a593Smuzhiyun {
381*4882a593Smuzhiyun 	struct mv_xor_v2_sw_desc *sw_desc;
382*4882a593Smuzhiyun 	struct mv_xor_v2_descriptor *hw_descriptor;
383*4882a593Smuzhiyun 	struct mv_xor_v2_device	*xor_dev;
384*4882a593Smuzhiyun 
385*4882a593Smuzhiyun 	xor_dev = container_of(chan, struct mv_xor_v2_device, dmachan);
386*4882a593Smuzhiyun 
387*4882a593Smuzhiyun 	dev_dbg(xor_dev->dmadev.dev,
388*4882a593Smuzhiyun 		"%s len: %zu src %pad dest %pad flags: %ld\n",
389*4882a593Smuzhiyun 		__func__, len, &src, &dest, flags);
390*4882a593Smuzhiyun 
391*4882a593Smuzhiyun 	sw_desc = mv_xor_v2_prep_sw_desc(xor_dev);
392*4882a593Smuzhiyun 	if (!sw_desc)
393*4882a593Smuzhiyun 		return NULL;
394*4882a593Smuzhiyun 
395*4882a593Smuzhiyun 	sw_desc->async_tx.flags = flags;
396*4882a593Smuzhiyun 
397*4882a593Smuzhiyun 	/* set the HW descriptor */
398*4882a593Smuzhiyun 	hw_descriptor = &sw_desc->hw_desc;
399*4882a593Smuzhiyun 
400*4882a593Smuzhiyun 	/* save the SW descriptor ID to restore when operation is done */
401*4882a593Smuzhiyun 	hw_descriptor->desc_id = sw_desc->idx;
402*4882a593Smuzhiyun 
403*4882a593Smuzhiyun 	/* Set the MEMCPY control word */
404*4882a593Smuzhiyun 	hw_descriptor->desc_ctrl =
405*4882a593Smuzhiyun 		DESC_OP_MODE_MEMCPY << DESC_OP_MODE_SHIFT;
406*4882a593Smuzhiyun 
407*4882a593Smuzhiyun 	if (flags & DMA_PREP_INTERRUPT)
408*4882a593Smuzhiyun 		hw_descriptor->desc_ctrl |= DESC_IOD;
409*4882a593Smuzhiyun 
410*4882a593Smuzhiyun 	/* Set source address */
411*4882a593Smuzhiyun 	hw_descriptor->fill_pattern_src_addr[0] = lower_32_bits(src);
412*4882a593Smuzhiyun 	hw_descriptor->fill_pattern_src_addr[1] =
413*4882a593Smuzhiyun 		upper_32_bits(src) & 0xFFFF;
414*4882a593Smuzhiyun 
415*4882a593Smuzhiyun 	/* Set Destination address */
416*4882a593Smuzhiyun 	hw_descriptor->fill_pattern_src_addr[2] = lower_32_bits(dest);
417*4882a593Smuzhiyun 	hw_descriptor->fill_pattern_src_addr[3] =
418*4882a593Smuzhiyun 		upper_32_bits(dest) & 0xFFFF;
419*4882a593Smuzhiyun 
420*4882a593Smuzhiyun 	/* Set buffers size */
421*4882a593Smuzhiyun 	hw_descriptor->buff_size = len;
422*4882a593Smuzhiyun 
423*4882a593Smuzhiyun 	/* return the async tx descriptor */
424*4882a593Smuzhiyun 	return &sw_desc->async_tx;
425*4882a593Smuzhiyun }
426*4882a593Smuzhiyun 
427*4882a593Smuzhiyun /*
428*4882a593Smuzhiyun  * Prepare a HW descriptor for a XOR operation
429*4882a593Smuzhiyun  */
430*4882a593Smuzhiyun static struct dma_async_tx_descriptor *
mv_xor_v2_prep_dma_xor(struct dma_chan * chan,dma_addr_t dest,dma_addr_t * src,unsigned int src_cnt,size_t len,unsigned long flags)431*4882a593Smuzhiyun mv_xor_v2_prep_dma_xor(struct dma_chan *chan, dma_addr_t dest, dma_addr_t *src,
432*4882a593Smuzhiyun 		       unsigned int src_cnt, size_t len, unsigned long flags)
433*4882a593Smuzhiyun {
434*4882a593Smuzhiyun 	struct mv_xor_v2_sw_desc *sw_desc;
435*4882a593Smuzhiyun 	struct mv_xor_v2_descriptor *hw_descriptor;
436*4882a593Smuzhiyun 	struct mv_xor_v2_device	*xor_dev =
437*4882a593Smuzhiyun 		container_of(chan, struct mv_xor_v2_device, dmachan);
438*4882a593Smuzhiyun 	int i;
439*4882a593Smuzhiyun 
440*4882a593Smuzhiyun 	if (src_cnt > MV_XOR_V2_CMD_LINE_NUM_MAX_D_BUF || src_cnt < 1)
441*4882a593Smuzhiyun 		return NULL;
442*4882a593Smuzhiyun 
443*4882a593Smuzhiyun 	dev_dbg(xor_dev->dmadev.dev,
444*4882a593Smuzhiyun 		"%s src_cnt: %d len: %zu dest %pad flags: %ld\n",
445*4882a593Smuzhiyun 		__func__, src_cnt, len, &dest, flags);
446*4882a593Smuzhiyun 
447*4882a593Smuzhiyun 	sw_desc = mv_xor_v2_prep_sw_desc(xor_dev);
448*4882a593Smuzhiyun 	if (!sw_desc)
449*4882a593Smuzhiyun 		return NULL;
450*4882a593Smuzhiyun 
451*4882a593Smuzhiyun 	sw_desc->async_tx.flags = flags;
452*4882a593Smuzhiyun 
453*4882a593Smuzhiyun 	/* set the HW descriptor */
454*4882a593Smuzhiyun 	hw_descriptor = &sw_desc->hw_desc;
455*4882a593Smuzhiyun 
456*4882a593Smuzhiyun 	/* save the SW descriptor ID to restore when operation is done */
457*4882a593Smuzhiyun 	hw_descriptor->desc_id = sw_desc->idx;
458*4882a593Smuzhiyun 
459*4882a593Smuzhiyun 	/* Set the XOR control word */
460*4882a593Smuzhiyun 	hw_descriptor->desc_ctrl =
461*4882a593Smuzhiyun 		DESC_OP_MODE_XOR << DESC_OP_MODE_SHIFT;
462*4882a593Smuzhiyun 	hw_descriptor->desc_ctrl |= DESC_P_BUFFER_ENABLE;
463*4882a593Smuzhiyun 
464*4882a593Smuzhiyun 	if (flags & DMA_PREP_INTERRUPT)
465*4882a593Smuzhiyun 		hw_descriptor->desc_ctrl |= DESC_IOD;
466*4882a593Smuzhiyun 
467*4882a593Smuzhiyun 	/* Set the data buffers */
468*4882a593Smuzhiyun 	for (i = 0; i < src_cnt; i++)
469*4882a593Smuzhiyun 		mv_xor_v2_set_data_buffers(xor_dev, hw_descriptor, src[i], i);
470*4882a593Smuzhiyun 
471*4882a593Smuzhiyun 	hw_descriptor->desc_ctrl |=
472*4882a593Smuzhiyun 		src_cnt << DESC_NUM_ACTIVE_D_BUF_SHIFT;
473*4882a593Smuzhiyun 
474*4882a593Smuzhiyun 	/* Set Destination address */
475*4882a593Smuzhiyun 	hw_descriptor->fill_pattern_src_addr[2] = lower_32_bits(dest);
476*4882a593Smuzhiyun 	hw_descriptor->fill_pattern_src_addr[3] =
477*4882a593Smuzhiyun 		upper_32_bits(dest) & 0xFFFF;
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun 	/* Set buffers size */
480*4882a593Smuzhiyun 	hw_descriptor->buff_size = len;
481*4882a593Smuzhiyun 
482*4882a593Smuzhiyun 	/* return the async tx descriptor */
483*4882a593Smuzhiyun 	return &sw_desc->async_tx;
484*4882a593Smuzhiyun }
485*4882a593Smuzhiyun 
486*4882a593Smuzhiyun /*
487*4882a593Smuzhiyun  * Prepare a HW descriptor for interrupt operation.
488*4882a593Smuzhiyun  */
489*4882a593Smuzhiyun static struct dma_async_tx_descriptor *
mv_xor_v2_prep_dma_interrupt(struct dma_chan * chan,unsigned long flags)490*4882a593Smuzhiyun mv_xor_v2_prep_dma_interrupt(struct dma_chan *chan, unsigned long flags)
491*4882a593Smuzhiyun {
492*4882a593Smuzhiyun 	struct mv_xor_v2_sw_desc *sw_desc;
493*4882a593Smuzhiyun 	struct mv_xor_v2_descriptor *hw_descriptor;
494*4882a593Smuzhiyun 	struct mv_xor_v2_device	*xor_dev =
495*4882a593Smuzhiyun 		container_of(chan, struct mv_xor_v2_device, dmachan);
496*4882a593Smuzhiyun 
497*4882a593Smuzhiyun 	sw_desc = mv_xor_v2_prep_sw_desc(xor_dev);
498*4882a593Smuzhiyun 	if (!sw_desc)
499*4882a593Smuzhiyun 		return NULL;
500*4882a593Smuzhiyun 
501*4882a593Smuzhiyun 	/* set the HW descriptor */
502*4882a593Smuzhiyun 	hw_descriptor = &sw_desc->hw_desc;
503*4882a593Smuzhiyun 
504*4882a593Smuzhiyun 	/* save the SW descriptor ID to restore when operation is done */
505*4882a593Smuzhiyun 	hw_descriptor->desc_id = sw_desc->idx;
506*4882a593Smuzhiyun 
507*4882a593Smuzhiyun 	/* Set the INTERRUPT control word */
508*4882a593Smuzhiyun 	hw_descriptor->desc_ctrl =
509*4882a593Smuzhiyun 		DESC_OP_MODE_NOP << DESC_OP_MODE_SHIFT;
510*4882a593Smuzhiyun 	hw_descriptor->desc_ctrl |= DESC_IOD;
511*4882a593Smuzhiyun 
512*4882a593Smuzhiyun 	/* return the async tx descriptor */
513*4882a593Smuzhiyun 	return &sw_desc->async_tx;
514*4882a593Smuzhiyun }
515*4882a593Smuzhiyun 
516*4882a593Smuzhiyun /*
517*4882a593Smuzhiyun  * push pending transactions to hardware
518*4882a593Smuzhiyun  */
mv_xor_v2_issue_pending(struct dma_chan * chan)519*4882a593Smuzhiyun static void mv_xor_v2_issue_pending(struct dma_chan *chan)
520*4882a593Smuzhiyun {
521*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev =
522*4882a593Smuzhiyun 		container_of(chan, struct mv_xor_v2_device, dmachan);
523*4882a593Smuzhiyun 
524*4882a593Smuzhiyun 	spin_lock_bh(&xor_dev->lock);
525*4882a593Smuzhiyun 
526*4882a593Smuzhiyun 	/*
527*4882a593Smuzhiyun 	 * update the engine with the number of descriptors to
528*4882a593Smuzhiyun 	 * process
529*4882a593Smuzhiyun 	 */
530*4882a593Smuzhiyun 	mv_xor_v2_add_desc_to_desq(xor_dev, xor_dev->npendings);
531*4882a593Smuzhiyun 	xor_dev->npendings = 0;
532*4882a593Smuzhiyun 
533*4882a593Smuzhiyun 	spin_unlock_bh(&xor_dev->lock);
534*4882a593Smuzhiyun }
535*4882a593Smuzhiyun 
536*4882a593Smuzhiyun static inline
mv_xor_v2_get_pending_params(struct mv_xor_v2_device * xor_dev,int * pending_ptr)537*4882a593Smuzhiyun int mv_xor_v2_get_pending_params(struct mv_xor_v2_device *xor_dev,
538*4882a593Smuzhiyun 				 int *pending_ptr)
539*4882a593Smuzhiyun {
540*4882a593Smuzhiyun 	u32 reg;
541*4882a593Smuzhiyun 
542*4882a593Smuzhiyun 	reg = readl(xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_DONE_OFF);
543*4882a593Smuzhiyun 
544*4882a593Smuzhiyun 	/* get the next pending descriptor index */
545*4882a593Smuzhiyun 	*pending_ptr = ((reg >> MV_XOR_V2_DMA_DESQ_DONE_READ_PTR_SHIFT) &
546*4882a593Smuzhiyun 			MV_XOR_V2_DMA_DESQ_DONE_READ_PTR_MASK);
547*4882a593Smuzhiyun 
548*4882a593Smuzhiyun 	/* get the number of descriptors pending handle */
549*4882a593Smuzhiyun 	return ((reg >> MV_XOR_V2_DMA_DESQ_DONE_PENDING_SHIFT) &
550*4882a593Smuzhiyun 		MV_XOR_V2_DMA_DESQ_DONE_PENDING_MASK);
551*4882a593Smuzhiyun }
552*4882a593Smuzhiyun 
553*4882a593Smuzhiyun /*
554*4882a593Smuzhiyun  * handle the descriptors after HW process
555*4882a593Smuzhiyun  */
mv_xor_v2_tasklet(struct tasklet_struct * t)556*4882a593Smuzhiyun static void mv_xor_v2_tasklet(struct tasklet_struct *t)
557*4882a593Smuzhiyun {
558*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev = from_tasklet(xor_dev, t,
559*4882a593Smuzhiyun 							irq_tasklet);
560*4882a593Smuzhiyun 	int pending_ptr, num_of_pending, i;
561*4882a593Smuzhiyun 	struct mv_xor_v2_sw_desc *next_pending_sw_desc = NULL;
562*4882a593Smuzhiyun 
563*4882a593Smuzhiyun 	dev_dbg(xor_dev->dmadev.dev, "%s %d\n", __func__, __LINE__);
564*4882a593Smuzhiyun 
565*4882a593Smuzhiyun 	/* get the pending descriptors parameters */
566*4882a593Smuzhiyun 	num_of_pending = mv_xor_v2_get_pending_params(xor_dev, &pending_ptr);
567*4882a593Smuzhiyun 
568*4882a593Smuzhiyun 	/* loop over free descriptors */
569*4882a593Smuzhiyun 	for (i = 0; i < num_of_pending; i++) {
570*4882a593Smuzhiyun 		struct mv_xor_v2_descriptor *next_pending_hw_desc =
571*4882a593Smuzhiyun 			xor_dev->hw_desq_virt + pending_ptr;
572*4882a593Smuzhiyun 
573*4882a593Smuzhiyun 		/* get the SW descriptor related to the HW descriptor */
574*4882a593Smuzhiyun 		next_pending_sw_desc =
575*4882a593Smuzhiyun 			&xor_dev->sw_desq[next_pending_hw_desc->desc_id];
576*4882a593Smuzhiyun 
577*4882a593Smuzhiyun 		/* call the callback */
578*4882a593Smuzhiyun 		if (next_pending_sw_desc->async_tx.cookie > 0) {
579*4882a593Smuzhiyun 			/*
580*4882a593Smuzhiyun 			 * update the channel's completed cookie - no
581*4882a593Smuzhiyun 			 * lock is required the IMSG threshold provide
582*4882a593Smuzhiyun 			 * the locking
583*4882a593Smuzhiyun 			 */
584*4882a593Smuzhiyun 			dma_cookie_complete(&next_pending_sw_desc->async_tx);
585*4882a593Smuzhiyun 
586*4882a593Smuzhiyun 			dma_descriptor_unmap(&next_pending_sw_desc->async_tx);
587*4882a593Smuzhiyun 			dmaengine_desc_get_callback_invoke(
588*4882a593Smuzhiyun 					&next_pending_sw_desc->async_tx, NULL);
589*4882a593Smuzhiyun 		}
590*4882a593Smuzhiyun 
591*4882a593Smuzhiyun 		dma_run_dependencies(&next_pending_sw_desc->async_tx);
592*4882a593Smuzhiyun 
593*4882a593Smuzhiyun 		/* Lock the channel */
594*4882a593Smuzhiyun 		spin_lock_bh(&xor_dev->lock);
595*4882a593Smuzhiyun 
596*4882a593Smuzhiyun 		/* add the SW descriptor to the free descriptors list */
597*4882a593Smuzhiyun 		list_add(&next_pending_sw_desc->free_list,
598*4882a593Smuzhiyun 			 &xor_dev->free_sw_desc);
599*4882a593Smuzhiyun 
600*4882a593Smuzhiyun 		/* Release the channel */
601*4882a593Smuzhiyun 		spin_unlock_bh(&xor_dev->lock);
602*4882a593Smuzhiyun 
603*4882a593Smuzhiyun 		/* increment the next descriptor */
604*4882a593Smuzhiyun 		pending_ptr++;
605*4882a593Smuzhiyun 		if (pending_ptr >= MV_XOR_V2_DESC_NUM)
606*4882a593Smuzhiyun 			pending_ptr = 0;
607*4882a593Smuzhiyun 	}
608*4882a593Smuzhiyun 
609*4882a593Smuzhiyun 	if (num_of_pending != 0) {
610*4882a593Smuzhiyun 		/* free the descriptores */
611*4882a593Smuzhiyun 		mv_xor_v2_free_desc_from_desq(xor_dev, num_of_pending);
612*4882a593Smuzhiyun 	}
613*4882a593Smuzhiyun }
614*4882a593Smuzhiyun 
615*4882a593Smuzhiyun /*
616*4882a593Smuzhiyun  *	Set DMA Interrupt-message (IMSG) parameters
617*4882a593Smuzhiyun  */
mv_xor_v2_set_msi_msg(struct msi_desc * desc,struct msi_msg * msg)618*4882a593Smuzhiyun static void mv_xor_v2_set_msi_msg(struct msi_desc *desc, struct msi_msg *msg)
619*4882a593Smuzhiyun {
620*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev = dev_get_drvdata(desc->dev);
621*4882a593Smuzhiyun 
622*4882a593Smuzhiyun 	writel(msg->address_lo,
623*4882a593Smuzhiyun 	       xor_dev->dma_base + MV_XOR_V2_DMA_IMSG_BALR_OFF);
624*4882a593Smuzhiyun 	writel(msg->address_hi & 0xFFFF,
625*4882a593Smuzhiyun 	       xor_dev->dma_base + MV_XOR_V2_DMA_IMSG_BAHR_OFF);
626*4882a593Smuzhiyun 	writel(msg->data,
627*4882a593Smuzhiyun 	       xor_dev->dma_base + MV_XOR_V2_DMA_IMSG_CDAT_OFF);
628*4882a593Smuzhiyun }
629*4882a593Smuzhiyun 
mv_xor_v2_descq_init(struct mv_xor_v2_device * xor_dev)630*4882a593Smuzhiyun static int mv_xor_v2_descq_init(struct mv_xor_v2_device *xor_dev)
631*4882a593Smuzhiyun {
632*4882a593Smuzhiyun 	u32 reg;
633*4882a593Smuzhiyun 
634*4882a593Smuzhiyun 	/* write the DESQ size to the DMA engine */
635*4882a593Smuzhiyun 	writel(MV_XOR_V2_DESC_NUM,
636*4882a593Smuzhiyun 	       xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_SIZE_OFF);
637*4882a593Smuzhiyun 
638*4882a593Smuzhiyun 	/* write the DESQ address to the DMA enngine*/
639*4882a593Smuzhiyun 	writel(lower_32_bits(xor_dev->hw_desq),
640*4882a593Smuzhiyun 	       xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_BALR_OFF);
641*4882a593Smuzhiyun 	writel(upper_32_bits(xor_dev->hw_desq),
642*4882a593Smuzhiyun 	       xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_BAHR_OFF);
643*4882a593Smuzhiyun 
644*4882a593Smuzhiyun 	/*
645*4882a593Smuzhiyun 	 * This is a temporary solution, until we activate the
646*4882a593Smuzhiyun 	 * SMMU. Set the attributes for reading & writing data buffers
647*4882a593Smuzhiyun 	 * & descriptors to:
648*4882a593Smuzhiyun 	 *
649*4882a593Smuzhiyun 	 *  - OuterShareable - Snoops will be performed on CPU caches
650*4882a593Smuzhiyun 	 *  - Enable cacheable - Bufferable, Modifiable, Other Allocate
651*4882a593Smuzhiyun 	 *    and Allocate
652*4882a593Smuzhiyun 	 */
653*4882a593Smuzhiyun 	reg = readl(xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_ARATTR_OFF);
654*4882a593Smuzhiyun 	reg &= ~MV_XOR_V2_DMA_DESQ_ATTR_CACHE_MASK;
655*4882a593Smuzhiyun 	reg |= MV_XOR_V2_DMA_DESQ_ATTR_OUTER_SHAREABLE |
656*4882a593Smuzhiyun 		MV_XOR_V2_DMA_DESQ_ATTR_CACHEABLE;
657*4882a593Smuzhiyun 	writel(reg, xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_ARATTR_OFF);
658*4882a593Smuzhiyun 
659*4882a593Smuzhiyun 	reg = readl(xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_AWATTR_OFF);
660*4882a593Smuzhiyun 	reg &= ~MV_XOR_V2_DMA_DESQ_ATTR_CACHE_MASK;
661*4882a593Smuzhiyun 	reg |= MV_XOR_V2_DMA_DESQ_ATTR_OUTER_SHAREABLE |
662*4882a593Smuzhiyun 		MV_XOR_V2_DMA_DESQ_ATTR_CACHEABLE;
663*4882a593Smuzhiyun 	writel(reg, xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_AWATTR_OFF);
664*4882a593Smuzhiyun 
665*4882a593Smuzhiyun 	/* BW CTRL - set values to optimize the XOR performance:
666*4882a593Smuzhiyun 	 *
667*4882a593Smuzhiyun 	 *  - Set WrBurstLen & RdBurstLen - the unit will issue
668*4882a593Smuzhiyun 	 *    maximum of 256B write/read transactions.
669*4882a593Smuzhiyun 	 * -  Limit the number of outstanding write & read data
670*4882a593Smuzhiyun 	 *    (OBB/IBB) requests to the maximal value.
671*4882a593Smuzhiyun 	*/
672*4882a593Smuzhiyun 	reg = ((MV_XOR_V2_GLOB_BW_CTRL_NUM_OSTD_RD_VAL <<
673*4882a593Smuzhiyun 		MV_XOR_V2_GLOB_BW_CTRL_NUM_OSTD_RD_SHIFT) |
674*4882a593Smuzhiyun 	       (MV_XOR_V2_GLOB_BW_CTRL_NUM_OSTD_WR_VAL  <<
675*4882a593Smuzhiyun 		MV_XOR_V2_GLOB_BW_CTRL_NUM_OSTD_WR_SHIFT) |
676*4882a593Smuzhiyun 	       (MV_XOR_V2_GLOB_BW_CTRL_RD_BURST_LEN_VAL <<
677*4882a593Smuzhiyun 		MV_XOR_V2_GLOB_BW_CTRL_RD_BURST_LEN_SHIFT) |
678*4882a593Smuzhiyun 	       (MV_XOR_V2_GLOB_BW_CTRL_WR_BURST_LEN_VAL <<
679*4882a593Smuzhiyun 		MV_XOR_V2_GLOB_BW_CTRL_WR_BURST_LEN_SHIFT));
680*4882a593Smuzhiyun 	writel(reg, xor_dev->glob_base + MV_XOR_V2_GLOB_BW_CTRL);
681*4882a593Smuzhiyun 
682*4882a593Smuzhiyun 	/* Disable the AXI timer feature */
683*4882a593Smuzhiyun 	reg = readl(xor_dev->glob_base + MV_XOR_V2_GLOB_PAUSE);
684*4882a593Smuzhiyun 	reg |= MV_XOR_V2_GLOB_PAUSE_AXI_TIME_DIS_VAL;
685*4882a593Smuzhiyun 	writel(reg, xor_dev->glob_base + MV_XOR_V2_GLOB_PAUSE);
686*4882a593Smuzhiyun 
687*4882a593Smuzhiyun 	/* enable the DMA engine */
688*4882a593Smuzhiyun 	writel(0, xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_STOP_OFF);
689*4882a593Smuzhiyun 
690*4882a593Smuzhiyun 	return 0;
691*4882a593Smuzhiyun }
692*4882a593Smuzhiyun 
mv_xor_v2_suspend(struct platform_device * dev,pm_message_t state)693*4882a593Smuzhiyun static int mv_xor_v2_suspend(struct platform_device *dev, pm_message_t state)
694*4882a593Smuzhiyun {
695*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev = platform_get_drvdata(dev);
696*4882a593Smuzhiyun 
697*4882a593Smuzhiyun 	/* Set this bit to disable to stop the XOR unit. */
698*4882a593Smuzhiyun 	writel(0x1, xor_dev->dma_base + MV_XOR_V2_DMA_DESQ_STOP_OFF);
699*4882a593Smuzhiyun 
700*4882a593Smuzhiyun 	return 0;
701*4882a593Smuzhiyun }
702*4882a593Smuzhiyun 
mv_xor_v2_resume(struct platform_device * dev)703*4882a593Smuzhiyun static int mv_xor_v2_resume(struct platform_device *dev)
704*4882a593Smuzhiyun {
705*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev = platform_get_drvdata(dev);
706*4882a593Smuzhiyun 
707*4882a593Smuzhiyun 	mv_xor_v2_set_desc_size(xor_dev);
708*4882a593Smuzhiyun 	mv_xor_v2_enable_imsg_thrd(xor_dev);
709*4882a593Smuzhiyun 	mv_xor_v2_descq_init(xor_dev);
710*4882a593Smuzhiyun 
711*4882a593Smuzhiyun 	return 0;
712*4882a593Smuzhiyun }
713*4882a593Smuzhiyun 
mv_xor_v2_probe(struct platform_device * pdev)714*4882a593Smuzhiyun static int mv_xor_v2_probe(struct platform_device *pdev)
715*4882a593Smuzhiyun {
716*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev;
717*4882a593Smuzhiyun 	struct resource *res;
718*4882a593Smuzhiyun 	int i, ret = 0;
719*4882a593Smuzhiyun 	struct dma_device *dma_dev;
720*4882a593Smuzhiyun 	struct mv_xor_v2_sw_desc *sw_desc;
721*4882a593Smuzhiyun 	struct msi_desc *msi_desc;
722*4882a593Smuzhiyun 
723*4882a593Smuzhiyun 	BUILD_BUG_ON(sizeof(struct mv_xor_v2_descriptor) !=
724*4882a593Smuzhiyun 		     MV_XOR_V2_EXT_DESC_SIZE);
725*4882a593Smuzhiyun 
726*4882a593Smuzhiyun 	xor_dev = devm_kzalloc(&pdev->dev, sizeof(*xor_dev), GFP_KERNEL);
727*4882a593Smuzhiyun 	if (!xor_dev)
728*4882a593Smuzhiyun 		return -ENOMEM;
729*4882a593Smuzhiyun 
730*4882a593Smuzhiyun 	res = platform_get_resource(pdev, IORESOURCE_MEM, 0);
731*4882a593Smuzhiyun 	xor_dev->dma_base = devm_ioremap_resource(&pdev->dev, res);
732*4882a593Smuzhiyun 	if (IS_ERR(xor_dev->dma_base))
733*4882a593Smuzhiyun 		return PTR_ERR(xor_dev->dma_base);
734*4882a593Smuzhiyun 
735*4882a593Smuzhiyun 	res = platform_get_resource(pdev, IORESOURCE_MEM, 1);
736*4882a593Smuzhiyun 	xor_dev->glob_base = devm_ioremap_resource(&pdev->dev, res);
737*4882a593Smuzhiyun 	if (IS_ERR(xor_dev->glob_base))
738*4882a593Smuzhiyun 		return PTR_ERR(xor_dev->glob_base);
739*4882a593Smuzhiyun 
740*4882a593Smuzhiyun 	platform_set_drvdata(pdev, xor_dev);
741*4882a593Smuzhiyun 
742*4882a593Smuzhiyun 	ret = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(40));
743*4882a593Smuzhiyun 	if (ret)
744*4882a593Smuzhiyun 		return ret;
745*4882a593Smuzhiyun 
746*4882a593Smuzhiyun 	xor_dev->reg_clk = devm_clk_get(&pdev->dev, "reg");
747*4882a593Smuzhiyun 	if (PTR_ERR(xor_dev->reg_clk) != -ENOENT) {
748*4882a593Smuzhiyun 		if (!IS_ERR(xor_dev->reg_clk)) {
749*4882a593Smuzhiyun 			ret = clk_prepare_enable(xor_dev->reg_clk);
750*4882a593Smuzhiyun 			if (ret)
751*4882a593Smuzhiyun 				return ret;
752*4882a593Smuzhiyun 		} else {
753*4882a593Smuzhiyun 			return PTR_ERR(xor_dev->reg_clk);
754*4882a593Smuzhiyun 		}
755*4882a593Smuzhiyun 	}
756*4882a593Smuzhiyun 
757*4882a593Smuzhiyun 	xor_dev->clk = devm_clk_get(&pdev->dev, NULL);
758*4882a593Smuzhiyun 	if (PTR_ERR(xor_dev->clk) == -EPROBE_DEFER) {
759*4882a593Smuzhiyun 		ret = EPROBE_DEFER;
760*4882a593Smuzhiyun 		goto disable_reg_clk;
761*4882a593Smuzhiyun 	}
762*4882a593Smuzhiyun 	if (!IS_ERR(xor_dev->clk)) {
763*4882a593Smuzhiyun 		ret = clk_prepare_enable(xor_dev->clk);
764*4882a593Smuzhiyun 		if (ret)
765*4882a593Smuzhiyun 			goto disable_reg_clk;
766*4882a593Smuzhiyun 	}
767*4882a593Smuzhiyun 
768*4882a593Smuzhiyun 	ret = platform_msi_domain_alloc_irqs(&pdev->dev, 1,
769*4882a593Smuzhiyun 					     mv_xor_v2_set_msi_msg);
770*4882a593Smuzhiyun 	if (ret)
771*4882a593Smuzhiyun 		goto disable_clk;
772*4882a593Smuzhiyun 
773*4882a593Smuzhiyun 	msi_desc = first_msi_entry(&pdev->dev);
774*4882a593Smuzhiyun 	if (!msi_desc) {
775*4882a593Smuzhiyun 		ret = -ENODEV;
776*4882a593Smuzhiyun 		goto free_msi_irqs;
777*4882a593Smuzhiyun 	}
778*4882a593Smuzhiyun 	xor_dev->msi_desc = msi_desc;
779*4882a593Smuzhiyun 
780*4882a593Smuzhiyun 	ret = devm_request_irq(&pdev->dev, msi_desc->irq,
781*4882a593Smuzhiyun 			       mv_xor_v2_interrupt_handler, 0,
782*4882a593Smuzhiyun 			       dev_name(&pdev->dev), xor_dev);
783*4882a593Smuzhiyun 	if (ret)
784*4882a593Smuzhiyun 		goto free_msi_irqs;
785*4882a593Smuzhiyun 
786*4882a593Smuzhiyun 	tasklet_setup(&xor_dev->irq_tasklet, mv_xor_v2_tasklet);
787*4882a593Smuzhiyun 
788*4882a593Smuzhiyun 	xor_dev->desc_size = mv_xor_v2_set_desc_size(xor_dev);
789*4882a593Smuzhiyun 
790*4882a593Smuzhiyun 	dma_cookie_init(&xor_dev->dmachan);
791*4882a593Smuzhiyun 
792*4882a593Smuzhiyun 	/*
793*4882a593Smuzhiyun 	 * allocate coherent memory for hardware descriptors
794*4882a593Smuzhiyun 	 * note: writecombine gives slightly better performance, but
795*4882a593Smuzhiyun 	 * requires that we explicitly flush the writes
796*4882a593Smuzhiyun 	 */
797*4882a593Smuzhiyun 	xor_dev->hw_desq_virt =
798*4882a593Smuzhiyun 		dma_alloc_coherent(&pdev->dev,
799*4882a593Smuzhiyun 				   xor_dev->desc_size * MV_XOR_V2_DESC_NUM,
800*4882a593Smuzhiyun 				   &xor_dev->hw_desq, GFP_KERNEL);
801*4882a593Smuzhiyun 	if (!xor_dev->hw_desq_virt) {
802*4882a593Smuzhiyun 		ret = -ENOMEM;
803*4882a593Smuzhiyun 		goto free_msi_irqs;
804*4882a593Smuzhiyun 	}
805*4882a593Smuzhiyun 
806*4882a593Smuzhiyun 	/* alloc memory for the SW descriptors */
807*4882a593Smuzhiyun 	xor_dev->sw_desq = devm_kcalloc(&pdev->dev,
808*4882a593Smuzhiyun 					MV_XOR_V2_DESC_NUM, sizeof(*sw_desc),
809*4882a593Smuzhiyun 					GFP_KERNEL);
810*4882a593Smuzhiyun 	if (!xor_dev->sw_desq) {
811*4882a593Smuzhiyun 		ret = -ENOMEM;
812*4882a593Smuzhiyun 		goto free_hw_desq;
813*4882a593Smuzhiyun 	}
814*4882a593Smuzhiyun 
815*4882a593Smuzhiyun 	spin_lock_init(&xor_dev->lock);
816*4882a593Smuzhiyun 
817*4882a593Smuzhiyun 	/* init the free SW descriptors list */
818*4882a593Smuzhiyun 	INIT_LIST_HEAD(&xor_dev->free_sw_desc);
819*4882a593Smuzhiyun 
820*4882a593Smuzhiyun 	/* add all SW descriptors to the free list */
821*4882a593Smuzhiyun 	for (i = 0; i < MV_XOR_V2_DESC_NUM; i++) {
822*4882a593Smuzhiyun 		struct mv_xor_v2_sw_desc *sw_desc =
823*4882a593Smuzhiyun 			xor_dev->sw_desq + i;
824*4882a593Smuzhiyun 		sw_desc->idx = i;
825*4882a593Smuzhiyun 		dma_async_tx_descriptor_init(&sw_desc->async_tx,
826*4882a593Smuzhiyun 					     &xor_dev->dmachan);
827*4882a593Smuzhiyun 		sw_desc->async_tx.tx_submit = mv_xor_v2_tx_submit;
828*4882a593Smuzhiyun 		async_tx_ack(&sw_desc->async_tx);
829*4882a593Smuzhiyun 
830*4882a593Smuzhiyun 		list_add(&sw_desc->free_list,
831*4882a593Smuzhiyun 			 &xor_dev->free_sw_desc);
832*4882a593Smuzhiyun 	}
833*4882a593Smuzhiyun 
834*4882a593Smuzhiyun 	dma_dev = &xor_dev->dmadev;
835*4882a593Smuzhiyun 
836*4882a593Smuzhiyun 	/* set DMA capabilities */
837*4882a593Smuzhiyun 	dma_cap_zero(dma_dev->cap_mask);
838*4882a593Smuzhiyun 	dma_cap_set(DMA_MEMCPY, dma_dev->cap_mask);
839*4882a593Smuzhiyun 	dma_cap_set(DMA_XOR, dma_dev->cap_mask);
840*4882a593Smuzhiyun 	dma_cap_set(DMA_INTERRUPT, dma_dev->cap_mask);
841*4882a593Smuzhiyun 
842*4882a593Smuzhiyun 	/* init dma link list */
843*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dma_dev->channels);
844*4882a593Smuzhiyun 
845*4882a593Smuzhiyun 	/* set base routines */
846*4882a593Smuzhiyun 	dma_dev->device_tx_status = dma_cookie_status;
847*4882a593Smuzhiyun 	dma_dev->device_issue_pending = mv_xor_v2_issue_pending;
848*4882a593Smuzhiyun 	dma_dev->dev = &pdev->dev;
849*4882a593Smuzhiyun 
850*4882a593Smuzhiyun 	dma_dev->device_prep_dma_memcpy = mv_xor_v2_prep_dma_memcpy;
851*4882a593Smuzhiyun 	dma_dev->device_prep_dma_interrupt = mv_xor_v2_prep_dma_interrupt;
852*4882a593Smuzhiyun 	dma_dev->max_xor = 8;
853*4882a593Smuzhiyun 	dma_dev->device_prep_dma_xor = mv_xor_v2_prep_dma_xor;
854*4882a593Smuzhiyun 
855*4882a593Smuzhiyun 	xor_dev->dmachan.device = dma_dev;
856*4882a593Smuzhiyun 
857*4882a593Smuzhiyun 	list_add_tail(&xor_dev->dmachan.device_node,
858*4882a593Smuzhiyun 		      &dma_dev->channels);
859*4882a593Smuzhiyun 
860*4882a593Smuzhiyun 	mv_xor_v2_enable_imsg_thrd(xor_dev);
861*4882a593Smuzhiyun 
862*4882a593Smuzhiyun 	mv_xor_v2_descq_init(xor_dev);
863*4882a593Smuzhiyun 
864*4882a593Smuzhiyun 	ret = dma_async_device_register(dma_dev);
865*4882a593Smuzhiyun 	if (ret)
866*4882a593Smuzhiyun 		goto free_hw_desq;
867*4882a593Smuzhiyun 
868*4882a593Smuzhiyun 	dev_notice(&pdev->dev, "Marvell Version 2 XOR driver\n");
869*4882a593Smuzhiyun 
870*4882a593Smuzhiyun 	return 0;
871*4882a593Smuzhiyun 
872*4882a593Smuzhiyun free_hw_desq:
873*4882a593Smuzhiyun 	dma_free_coherent(&pdev->dev,
874*4882a593Smuzhiyun 			  xor_dev->desc_size * MV_XOR_V2_DESC_NUM,
875*4882a593Smuzhiyun 			  xor_dev->hw_desq_virt, xor_dev->hw_desq);
876*4882a593Smuzhiyun free_msi_irqs:
877*4882a593Smuzhiyun 	platform_msi_domain_free_irqs(&pdev->dev);
878*4882a593Smuzhiyun disable_clk:
879*4882a593Smuzhiyun 	clk_disable_unprepare(xor_dev->clk);
880*4882a593Smuzhiyun disable_reg_clk:
881*4882a593Smuzhiyun 	clk_disable_unprepare(xor_dev->reg_clk);
882*4882a593Smuzhiyun 	return ret;
883*4882a593Smuzhiyun }
884*4882a593Smuzhiyun 
mv_xor_v2_remove(struct platform_device * pdev)885*4882a593Smuzhiyun static int mv_xor_v2_remove(struct platform_device *pdev)
886*4882a593Smuzhiyun {
887*4882a593Smuzhiyun 	struct mv_xor_v2_device *xor_dev = platform_get_drvdata(pdev);
888*4882a593Smuzhiyun 
889*4882a593Smuzhiyun 	dma_async_device_unregister(&xor_dev->dmadev);
890*4882a593Smuzhiyun 
891*4882a593Smuzhiyun 	dma_free_coherent(&pdev->dev,
892*4882a593Smuzhiyun 			  xor_dev->desc_size * MV_XOR_V2_DESC_NUM,
893*4882a593Smuzhiyun 			  xor_dev->hw_desq_virt, xor_dev->hw_desq);
894*4882a593Smuzhiyun 
895*4882a593Smuzhiyun 	devm_free_irq(&pdev->dev, xor_dev->msi_desc->irq, xor_dev);
896*4882a593Smuzhiyun 
897*4882a593Smuzhiyun 	platform_msi_domain_free_irqs(&pdev->dev);
898*4882a593Smuzhiyun 
899*4882a593Smuzhiyun 	tasklet_kill(&xor_dev->irq_tasklet);
900*4882a593Smuzhiyun 
901*4882a593Smuzhiyun 	clk_disable_unprepare(xor_dev->clk);
902*4882a593Smuzhiyun 	clk_disable_unprepare(xor_dev->reg_clk);
903*4882a593Smuzhiyun 
904*4882a593Smuzhiyun 	return 0;
905*4882a593Smuzhiyun }
906*4882a593Smuzhiyun 
907*4882a593Smuzhiyun #ifdef CONFIG_OF
908*4882a593Smuzhiyun static const struct of_device_id mv_xor_v2_dt_ids[] = {
909*4882a593Smuzhiyun 	{ .compatible = "marvell,xor-v2", },
910*4882a593Smuzhiyun 	{},
911*4882a593Smuzhiyun };
912*4882a593Smuzhiyun MODULE_DEVICE_TABLE(of, mv_xor_v2_dt_ids);
913*4882a593Smuzhiyun #endif
914*4882a593Smuzhiyun 
915*4882a593Smuzhiyun static struct platform_driver mv_xor_v2_driver = {
916*4882a593Smuzhiyun 	.probe		= mv_xor_v2_probe,
917*4882a593Smuzhiyun 	.suspend	= mv_xor_v2_suspend,
918*4882a593Smuzhiyun 	.resume		= mv_xor_v2_resume,
919*4882a593Smuzhiyun 	.remove		= mv_xor_v2_remove,
920*4882a593Smuzhiyun 	.driver		= {
921*4882a593Smuzhiyun 		.name	= "mv_xor_v2",
922*4882a593Smuzhiyun 		.of_match_table = of_match_ptr(mv_xor_v2_dt_ids),
923*4882a593Smuzhiyun 	},
924*4882a593Smuzhiyun };
925*4882a593Smuzhiyun 
926*4882a593Smuzhiyun module_platform_driver(mv_xor_v2_driver);
927*4882a593Smuzhiyun 
928*4882a593Smuzhiyun MODULE_DESCRIPTION("DMA engine driver for Marvell's Version 2 of XOR engine");
929*4882a593Smuzhiyun MODULE_LICENSE("GPL");
930