1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * mtu3_qmu.c - Queue Management Unit driver for device controller
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright (C) 2016 MediaTek Inc.
6*4882a593Smuzhiyun *
7*4882a593Smuzhiyun * Author: Chunfeng Yun <chunfeng.yun@mediatek.com>
8*4882a593Smuzhiyun */
9*4882a593Smuzhiyun
10*4882a593Smuzhiyun /*
11*4882a593Smuzhiyun * Queue Management Unit (QMU) is designed to unload SW effort
12*4882a593Smuzhiyun * to serve DMA interrupts.
13*4882a593Smuzhiyun * By preparing General Purpose Descriptor (GPD) and Buffer Descriptor (BD),
14*4882a593Smuzhiyun * SW links data buffers and triggers QMU to send / receive data to
15*4882a593Smuzhiyun * host / from device at a time.
16*4882a593Smuzhiyun * And now only GPD is supported.
17*4882a593Smuzhiyun *
18*4882a593Smuzhiyun * For more detailed information, please refer to QMU Programming Guide
19*4882a593Smuzhiyun */
20*4882a593Smuzhiyun
21*4882a593Smuzhiyun #include <linux/dmapool.h>
22*4882a593Smuzhiyun #include <linux/iopoll.h>
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun #include "mtu3.h"
25*4882a593Smuzhiyun #include "mtu3_trace.h"
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun #define QMU_CHECKSUM_LEN 16
28*4882a593Smuzhiyun
29*4882a593Smuzhiyun #define GPD_FLAGS_HWO BIT(0)
30*4882a593Smuzhiyun #define GPD_FLAGS_BDP BIT(1)
31*4882a593Smuzhiyun #define GPD_FLAGS_BPS BIT(2)
32*4882a593Smuzhiyun #define GPD_FLAGS_ZLP BIT(6)
33*4882a593Smuzhiyun #define GPD_FLAGS_IOC BIT(7)
34*4882a593Smuzhiyun #define GET_GPD_HWO(gpd) (le32_to_cpu((gpd)->dw0_info) & GPD_FLAGS_HWO)
35*4882a593Smuzhiyun
36*4882a593Smuzhiyun #define GPD_RX_BUF_LEN_OG(x) (((x) & 0xffff) << 16)
37*4882a593Smuzhiyun #define GPD_RX_BUF_LEN_EL(x) (((x) & 0xfffff) << 12)
38*4882a593Smuzhiyun #define GPD_RX_BUF_LEN(mtu, x) \
39*4882a593Smuzhiyun ({ \
40*4882a593Smuzhiyun typeof(x) x_ = (x); \
41*4882a593Smuzhiyun ((mtu)->gen2cp) ? GPD_RX_BUF_LEN_EL(x_) : GPD_RX_BUF_LEN_OG(x_); \
42*4882a593Smuzhiyun })
43*4882a593Smuzhiyun
44*4882a593Smuzhiyun #define GPD_DATA_LEN_OG(x) ((x) & 0xffff)
45*4882a593Smuzhiyun #define GPD_DATA_LEN_EL(x) ((x) & 0xfffff)
46*4882a593Smuzhiyun #define GPD_DATA_LEN(mtu, x) \
47*4882a593Smuzhiyun ({ \
48*4882a593Smuzhiyun typeof(x) x_ = (x); \
49*4882a593Smuzhiyun ((mtu)->gen2cp) ? GPD_DATA_LEN_EL(x_) : GPD_DATA_LEN_OG(x_); \
50*4882a593Smuzhiyun })
51*4882a593Smuzhiyun
52*4882a593Smuzhiyun #define GPD_EXT_FLAG_ZLP BIT(29)
53*4882a593Smuzhiyun #define GPD_EXT_NGP_OG(x) (((x) & 0xf) << 20)
54*4882a593Smuzhiyun #define GPD_EXT_BUF_OG(x) (((x) & 0xf) << 16)
55*4882a593Smuzhiyun #define GPD_EXT_NGP_EL(x) (((x) & 0xf) << 28)
56*4882a593Smuzhiyun #define GPD_EXT_BUF_EL(x) (((x) & 0xf) << 24)
57*4882a593Smuzhiyun #define GPD_EXT_NGP(mtu, x) \
58*4882a593Smuzhiyun ({ \
59*4882a593Smuzhiyun typeof(x) x_ = (x); \
60*4882a593Smuzhiyun ((mtu)->gen2cp) ? GPD_EXT_NGP_EL(x_) : GPD_EXT_NGP_OG(x_); \
61*4882a593Smuzhiyun })
62*4882a593Smuzhiyun
63*4882a593Smuzhiyun #define GPD_EXT_BUF(mtu, x) \
64*4882a593Smuzhiyun ({ \
65*4882a593Smuzhiyun typeof(x) x_ = (x); \
66*4882a593Smuzhiyun ((mtu)->gen2cp) ? GPD_EXT_BUF_EL(x_) : GPD_EXT_BUF_OG(x_); \
67*4882a593Smuzhiyun })
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun #define HILO_GEN64(hi, lo) (((u64)(hi) << 32) + (lo))
70*4882a593Smuzhiyun #define HILO_DMA(hi, lo) \
71*4882a593Smuzhiyun ((dma_addr_t)HILO_GEN64((le32_to_cpu(hi)), (le32_to_cpu(lo))))
72*4882a593Smuzhiyun
read_txq_cur_addr(void __iomem * mbase,u8 epnum)73*4882a593Smuzhiyun static dma_addr_t read_txq_cur_addr(void __iomem *mbase, u8 epnum)
74*4882a593Smuzhiyun {
75*4882a593Smuzhiyun u32 txcpr;
76*4882a593Smuzhiyun u32 txhiar;
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun txcpr = mtu3_readl(mbase, USB_QMU_TQCPR(epnum));
79*4882a593Smuzhiyun txhiar = mtu3_readl(mbase, USB_QMU_TQHIAR(epnum));
80*4882a593Smuzhiyun
81*4882a593Smuzhiyun return HILO_DMA(QMU_CUR_GPD_ADDR_HI(txhiar), txcpr);
82*4882a593Smuzhiyun }
83*4882a593Smuzhiyun
read_rxq_cur_addr(void __iomem * mbase,u8 epnum)84*4882a593Smuzhiyun static dma_addr_t read_rxq_cur_addr(void __iomem *mbase, u8 epnum)
85*4882a593Smuzhiyun {
86*4882a593Smuzhiyun u32 rxcpr;
87*4882a593Smuzhiyun u32 rxhiar;
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun rxcpr = mtu3_readl(mbase, USB_QMU_RQCPR(epnum));
90*4882a593Smuzhiyun rxhiar = mtu3_readl(mbase, USB_QMU_RQHIAR(epnum));
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun return HILO_DMA(QMU_CUR_GPD_ADDR_HI(rxhiar), rxcpr);
93*4882a593Smuzhiyun }
94*4882a593Smuzhiyun
write_txq_start_addr(void __iomem * mbase,u8 epnum,dma_addr_t dma)95*4882a593Smuzhiyun static void write_txq_start_addr(void __iomem *mbase, u8 epnum, dma_addr_t dma)
96*4882a593Smuzhiyun {
97*4882a593Smuzhiyun u32 tqhiar;
98*4882a593Smuzhiyun
99*4882a593Smuzhiyun mtu3_writel(mbase, USB_QMU_TQSAR(epnum),
100*4882a593Smuzhiyun cpu_to_le32(lower_32_bits(dma)));
101*4882a593Smuzhiyun tqhiar = mtu3_readl(mbase, USB_QMU_TQHIAR(epnum));
102*4882a593Smuzhiyun tqhiar &= ~QMU_START_ADDR_HI_MSK;
103*4882a593Smuzhiyun tqhiar |= QMU_START_ADDR_HI(upper_32_bits(dma));
104*4882a593Smuzhiyun mtu3_writel(mbase, USB_QMU_TQHIAR(epnum), tqhiar);
105*4882a593Smuzhiyun }
106*4882a593Smuzhiyun
write_rxq_start_addr(void __iomem * mbase,u8 epnum,dma_addr_t dma)107*4882a593Smuzhiyun static void write_rxq_start_addr(void __iomem *mbase, u8 epnum, dma_addr_t dma)
108*4882a593Smuzhiyun {
109*4882a593Smuzhiyun u32 rqhiar;
110*4882a593Smuzhiyun
111*4882a593Smuzhiyun mtu3_writel(mbase, USB_QMU_RQSAR(epnum),
112*4882a593Smuzhiyun cpu_to_le32(lower_32_bits(dma)));
113*4882a593Smuzhiyun rqhiar = mtu3_readl(mbase, USB_QMU_RQHIAR(epnum));
114*4882a593Smuzhiyun rqhiar &= ~QMU_START_ADDR_HI_MSK;
115*4882a593Smuzhiyun rqhiar |= QMU_START_ADDR_HI(upper_32_bits(dma));
116*4882a593Smuzhiyun mtu3_writel(mbase, USB_QMU_RQHIAR(epnum), rqhiar);
117*4882a593Smuzhiyun }
118*4882a593Smuzhiyun
gpd_dma_to_virt(struct mtu3_gpd_ring * ring,dma_addr_t dma_addr)119*4882a593Smuzhiyun static struct qmu_gpd *gpd_dma_to_virt(struct mtu3_gpd_ring *ring,
120*4882a593Smuzhiyun dma_addr_t dma_addr)
121*4882a593Smuzhiyun {
122*4882a593Smuzhiyun dma_addr_t dma_base = ring->dma;
123*4882a593Smuzhiyun struct qmu_gpd *gpd_head = ring->start;
124*4882a593Smuzhiyun u32 offset = (dma_addr - dma_base) / sizeof(*gpd_head);
125*4882a593Smuzhiyun
126*4882a593Smuzhiyun if (offset >= MAX_GPD_NUM)
127*4882a593Smuzhiyun return NULL;
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun return gpd_head + offset;
130*4882a593Smuzhiyun }
131*4882a593Smuzhiyun
gpd_virt_to_dma(struct mtu3_gpd_ring * ring,struct qmu_gpd * gpd)132*4882a593Smuzhiyun static dma_addr_t gpd_virt_to_dma(struct mtu3_gpd_ring *ring,
133*4882a593Smuzhiyun struct qmu_gpd *gpd)
134*4882a593Smuzhiyun {
135*4882a593Smuzhiyun dma_addr_t dma_base = ring->dma;
136*4882a593Smuzhiyun struct qmu_gpd *gpd_head = ring->start;
137*4882a593Smuzhiyun u32 offset;
138*4882a593Smuzhiyun
139*4882a593Smuzhiyun offset = gpd - gpd_head;
140*4882a593Smuzhiyun if (offset >= MAX_GPD_NUM)
141*4882a593Smuzhiyun return 0;
142*4882a593Smuzhiyun
143*4882a593Smuzhiyun return dma_base + (offset * sizeof(*gpd));
144*4882a593Smuzhiyun }
145*4882a593Smuzhiyun
gpd_ring_init(struct mtu3_gpd_ring * ring,struct qmu_gpd * gpd)146*4882a593Smuzhiyun static void gpd_ring_init(struct mtu3_gpd_ring *ring, struct qmu_gpd *gpd)
147*4882a593Smuzhiyun {
148*4882a593Smuzhiyun ring->start = gpd;
149*4882a593Smuzhiyun ring->enqueue = gpd;
150*4882a593Smuzhiyun ring->dequeue = gpd;
151*4882a593Smuzhiyun ring->end = gpd + MAX_GPD_NUM - 1;
152*4882a593Smuzhiyun }
153*4882a593Smuzhiyun
reset_gpd_list(struct mtu3_ep * mep)154*4882a593Smuzhiyun static void reset_gpd_list(struct mtu3_ep *mep)
155*4882a593Smuzhiyun {
156*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
157*4882a593Smuzhiyun struct qmu_gpd *gpd = ring->start;
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun if (gpd) {
160*4882a593Smuzhiyun gpd->dw0_info &= cpu_to_le32(~GPD_FLAGS_HWO);
161*4882a593Smuzhiyun gpd_ring_init(ring, gpd);
162*4882a593Smuzhiyun }
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun
mtu3_gpd_ring_alloc(struct mtu3_ep * mep)165*4882a593Smuzhiyun int mtu3_gpd_ring_alloc(struct mtu3_ep *mep)
166*4882a593Smuzhiyun {
167*4882a593Smuzhiyun struct qmu_gpd *gpd;
168*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun /* software own all gpds as default */
171*4882a593Smuzhiyun gpd = dma_pool_zalloc(mep->mtu->qmu_gpd_pool, GFP_ATOMIC, &ring->dma);
172*4882a593Smuzhiyun if (gpd == NULL)
173*4882a593Smuzhiyun return -ENOMEM;
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun gpd_ring_init(ring, gpd);
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun return 0;
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun
mtu3_gpd_ring_free(struct mtu3_ep * mep)180*4882a593Smuzhiyun void mtu3_gpd_ring_free(struct mtu3_ep *mep)
181*4882a593Smuzhiyun {
182*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
183*4882a593Smuzhiyun
184*4882a593Smuzhiyun dma_pool_free(mep->mtu->qmu_gpd_pool,
185*4882a593Smuzhiyun ring->start, ring->dma);
186*4882a593Smuzhiyun memset(ring, 0, sizeof(*ring));
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun
mtu3_qmu_resume(struct mtu3_ep * mep)189*4882a593Smuzhiyun void mtu3_qmu_resume(struct mtu3_ep *mep)
190*4882a593Smuzhiyun {
191*4882a593Smuzhiyun struct mtu3 *mtu = mep->mtu;
192*4882a593Smuzhiyun void __iomem *mbase = mtu->mac_base;
193*4882a593Smuzhiyun int epnum = mep->epnum;
194*4882a593Smuzhiyun u32 offset;
195*4882a593Smuzhiyun
196*4882a593Smuzhiyun offset = mep->is_in ? USB_QMU_TQCSR(epnum) : USB_QMU_RQCSR(epnum);
197*4882a593Smuzhiyun
198*4882a593Smuzhiyun mtu3_writel(mbase, offset, QMU_Q_RESUME);
199*4882a593Smuzhiyun if (!(mtu3_readl(mbase, offset) & QMU_Q_ACTIVE))
200*4882a593Smuzhiyun mtu3_writel(mbase, offset, QMU_Q_RESUME);
201*4882a593Smuzhiyun }
202*4882a593Smuzhiyun
advance_enq_gpd(struct mtu3_gpd_ring * ring)203*4882a593Smuzhiyun static struct qmu_gpd *advance_enq_gpd(struct mtu3_gpd_ring *ring)
204*4882a593Smuzhiyun {
205*4882a593Smuzhiyun if (ring->enqueue < ring->end)
206*4882a593Smuzhiyun ring->enqueue++;
207*4882a593Smuzhiyun else
208*4882a593Smuzhiyun ring->enqueue = ring->start;
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun return ring->enqueue;
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun
advance_deq_gpd(struct mtu3_gpd_ring * ring)213*4882a593Smuzhiyun static struct qmu_gpd *advance_deq_gpd(struct mtu3_gpd_ring *ring)
214*4882a593Smuzhiyun {
215*4882a593Smuzhiyun if (ring->dequeue < ring->end)
216*4882a593Smuzhiyun ring->dequeue++;
217*4882a593Smuzhiyun else
218*4882a593Smuzhiyun ring->dequeue = ring->start;
219*4882a593Smuzhiyun
220*4882a593Smuzhiyun return ring->dequeue;
221*4882a593Smuzhiyun }
222*4882a593Smuzhiyun
223*4882a593Smuzhiyun /* check if a ring is emtpy */
gpd_ring_empty(struct mtu3_gpd_ring * ring)224*4882a593Smuzhiyun static int gpd_ring_empty(struct mtu3_gpd_ring *ring)
225*4882a593Smuzhiyun {
226*4882a593Smuzhiyun struct qmu_gpd *enq = ring->enqueue;
227*4882a593Smuzhiyun struct qmu_gpd *next;
228*4882a593Smuzhiyun
229*4882a593Smuzhiyun if (ring->enqueue < ring->end)
230*4882a593Smuzhiyun next = enq + 1;
231*4882a593Smuzhiyun else
232*4882a593Smuzhiyun next = ring->start;
233*4882a593Smuzhiyun
234*4882a593Smuzhiyun /* one gpd is reserved to simplify gpd preparation */
235*4882a593Smuzhiyun return next == ring->dequeue;
236*4882a593Smuzhiyun }
237*4882a593Smuzhiyun
mtu3_prepare_transfer(struct mtu3_ep * mep)238*4882a593Smuzhiyun int mtu3_prepare_transfer(struct mtu3_ep *mep)
239*4882a593Smuzhiyun {
240*4882a593Smuzhiyun return gpd_ring_empty(&mep->gpd_ring);
241*4882a593Smuzhiyun }
242*4882a593Smuzhiyun
mtu3_prepare_tx_gpd(struct mtu3_ep * mep,struct mtu3_request * mreq)243*4882a593Smuzhiyun static int mtu3_prepare_tx_gpd(struct mtu3_ep *mep, struct mtu3_request *mreq)
244*4882a593Smuzhiyun {
245*4882a593Smuzhiyun struct qmu_gpd *enq;
246*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
247*4882a593Smuzhiyun struct qmu_gpd *gpd = ring->enqueue;
248*4882a593Smuzhiyun struct usb_request *req = &mreq->request;
249*4882a593Smuzhiyun struct mtu3 *mtu = mep->mtu;
250*4882a593Smuzhiyun dma_addr_t enq_dma;
251*4882a593Smuzhiyun u32 ext_addr;
252*4882a593Smuzhiyun
253*4882a593Smuzhiyun gpd->dw0_info = 0; /* SW own it */
254*4882a593Smuzhiyun gpd->buffer = cpu_to_le32(lower_32_bits(req->dma));
255*4882a593Smuzhiyun ext_addr = GPD_EXT_BUF(mtu, upper_32_bits(req->dma));
256*4882a593Smuzhiyun gpd->dw3_info = cpu_to_le32(GPD_DATA_LEN(mtu, req->length));
257*4882a593Smuzhiyun
258*4882a593Smuzhiyun /* get the next GPD */
259*4882a593Smuzhiyun enq = advance_enq_gpd(ring);
260*4882a593Smuzhiyun enq_dma = gpd_virt_to_dma(ring, enq);
261*4882a593Smuzhiyun dev_dbg(mep->mtu->dev, "TX-EP%d queue gpd=%p, enq=%p, qdma=%pad\n",
262*4882a593Smuzhiyun mep->epnum, gpd, enq, &enq_dma);
263*4882a593Smuzhiyun
264*4882a593Smuzhiyun enq->dw0_info &= cpu_to_le32(~GPD_FLAGS_HWO);
265*4882a593Smuzhiyun gpd->next_gpd = cpu_to_le32(lower_32_bits(enq_dma));
266*4882a593Smuzhiyun ext_addr |= GPD_EXT_NGP(mtu, upper_32_bits(enq_dma));
267*4882a593Smuzhiyun gpd->dw0_info = cpu_to_le32(ext_addr);
268*4882a593Smuzhiyun
269*4882a593Smuzhiyun if (req->zero) {
270*4882a593Smuzhiyun if (mtu->gen2cp)
271*4882a593Smuzhiyun gpd->dw0_info |= cpu_to_le32(GPD_FLAGS_ZLP);
272*4882a593Smuzhiyun else
273*4882a593Smuzhiyun gpd->dw3_info |= cpu_to_le32(GPD_EXT_FLAG_ZLP);
274*4882a593Smuzhiyun }
275*4882a593Smuzhiyun
276*4882a593Smuzhiyun /* prevent reorder, make sure GPD's HWO is set last */
277*4882a593Smuzhiyun mb();
278*4882a593Smuzhiyun gpd->dw0_info |= cpu_to_le32(GPD_FLAGS_IOC | GPD_FLAGS_HWO);
279*4882a593Smuzhiyun
280*4882a593Smuzhiyun mreq->gpd = gpd;
281*4882a593Smuzhiyun trace_mtu3_prepare_gpd(mep, gpd);
282*4882a593Smuzhiyun
283*4882a593Smuzhiyun return 0;
284*4882a593Smuzhiyun }
285*4882a593Smuzhiyun
mtu3_prepare_rx_gpd(struct mtu3_ep * mep,struct mtu3_request * mreq)286*4882a593Smuzhiyun static int mtu3_prepare_rx_gpd(struct mtu3_ep *mep, struct mtu3_request *mreq)
287*4882a593Smuzhiyun {
288*4882a593Smuzhiyun struct qmu_gpd *enq;
289*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
290*4882a593Smuzhiyun struct qmu_gpd *gpd = ring->enqueue;
291*4882a593Smuzhiyun struct usb_request *req = &mreq->request;
292*4882a593Smuzhiyun struct mtu3 *mtu = mep->mtu;
293*4882a593Smuzhiyun dma_addr_t enq_dma;
294*4882a593Smuzhiyun u32 ext_addr;
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun gpd->dw0_info = 0; /* SW own it */
297*4882a593Smuzhiyun gpd->buffer = cpu_to_le32(lower_32_bits(req->dma));
298*4882a593Smuzhiyun ext_addr = GPD_EXT_BUF(mtu, upper_32_bits(req->dma));
299*4882a593Smuzhiyun gpd->dw0_info = cpu_to_le32(GPD_RX_BUF_LEN(mtu, req->length));
300*4882a593Smuzhiyun
301*4882a593Smuzhiyun /* get the next GPD */
302*4882a593Smuzhiyun enq = advance_enq_gpd(ring);
303*4882a593Smuzhiyun enq_dma = gpd_virt_to_dma(ring, enq);
304*4882a593Smuzhiyun dev_dbg(mep->mtu->dev, "RX-EP%d queue gpd=%p, enq=%p, qdma=%pad\n",
305*4882a593Smuzhiyun mep->epnum, gpd, enq, &enq_dma);
306*4882a593Smuzhiyun
307*4882a593Smuzhiyun enq->dw0_info &= cpu_to_le32(~GPD_FLAGS_HWO);
308*4882a593Smuzhiyun gpd->next_gpd = cpu_to_le32(lower_32_bits(enq_dma));
309*4882a593Smuzhiyun ext_addr |= GPD_EXT_NGP(mtu, upper_32_bits(enq_dma));
310*4882a593Smuzhiyun gpd->dw3_info = cpu_to_le32(ext_addr);
311*4882a593Smuzhiyun /* prevent reorder, make sure GPD's HWO is set last */
312*4882a593Smuzhiyun mb();
313*4882a593Smuzhiyun gpd->dw0_info |= cpu_to_le32(GPD_FLAGS_IOC | GPD_FLAGS_HWO);
314*4882a593Smuzhiyun
315*4882a593Smuzhiyun mreq->gpd = gpd;
316*4882a593Smuzhiyun trace_mtu3_prepare_gpd(mep, gpd);
317*4882a593Smuzhiyun
318*4882a593Smuzhiyun return 0;
319*4882a593Smuzhiyun }
320*4882a593Smuzhiyun
mtu3_insert_gpd(struct mtu3_ep * mep,struct mtu3_request * mreq)321*4882a593Smuzhiyun void mtu3_insert_gpd(struct mtu3_ep *mep, struct mtu3_request *mreq)
322*4882a593Smuzhiyun {
323*4882a593Smuzhiyun
324*4882a593Smuzhiyun if (mep->is_in)
325*4882a593Smuzhiyun mtu3_prepare_tx_gpd(mep, mreq);
326*4882a593Smuzhiyun else
327*4882a593Smuzhiyun mtu3_prepare_rx_gpd(mep, mreq);
328*4882a593Smuzhiyun }
329*4882a593Smuzhiyun
mtu3_qmu_start(struct mtu3_ep * mep)330*4882a593Smuzhiyun int mtu3_qmu_start(struct mtu3_ep *mep)
331*4882a593Smuzhiyun {
332*4882a593Smuzhiyun struct mtu3 *mtu = mep->mtu;
333*4882a593Smuzhiyun void __iomem *mbase = mtu->mac_base;
334*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
335*4882a593Smuzhiyun u8 epnum = mep->epnum;
336*4882a593Smuzhiyun
337*4882a593Smuzhiyun if (mep->is_in) {
338*4882a593Smuzhiyun /* set QMU start address */
339*4882a593Smuzhiyun write_txq_start_addr(mbase, epnum, ring->dma);
340*4882a593Smuzhiyun mtu3_setbits(mbase, MU3D_EP_TXCR0(epnum), TX_DMAREQEN);
341*4882a593Smuzhiyun /* send zero length packet according to ZLP flag in GPD */
342*4882a593Smuzhiyun mtu3_setbits(mbase, U3D_QCR1, QMU_TX_ZLP(epnum));
343*4882a593Smuzhiyun mtu3_writel(mbase, U3D_TQERRIESR0,
344*4882a593Smuzhiyun QMU_TX_LEN_ERR(epnum) | QMU_TX_CS_ERR(epnum));
345*4882a593Smuzhiyun
346*4882a593Smuzhiyun if (mtu3_readl(mbase, USB_QMU_TQCSR(epnum)) & QMU_Q_ACTIVE) {
347*4882a593Smuzhiyun dev_warn(mtu->dev, "Tx %d Active Now!\n", epnum);
348*4882a593Smuzhiyun return 0;
349*4882a593Smuzhiyun }
350*4882a593Smuzhiyun mtu3_writel(mbase, USB_QMU_TQCSR(epnum), QMU_Q_START);
351*4882a593Smuzhiyun
352*4882a593Smuzhiyun } else {
353*4882a593Smuzhiyun write_rxq_start_addr(mbase, epnum, ring->dma);
354*4882a593Smuzhiyun mtu3_setbits(mbase, MU3D_EP_RXCR0(epnum), RX_DMAREQEN);
355*4882a593Smuzhiyun /* don't expect ZLP */
356*4882a593Smuzhiyun mtu3_clrbits(mbase, U3D_QCR3, QMU_RX_ZLP(epnum));
357*4882a593Smuzhiyun /* move to next GPD when receive ZLP */
358*4882a593Smuzhiyun mtu3_setbits(mbase, U3D_QCR3, QMU_RX_COZ(epnum));
359*4882a593Smuzhiyun mtu3_writel(mbase, U3D_RQERRIESR0,
360*4882a593Smuzhiyun QMU_RX_LEN_ERR(epnum) | QMU_RX_CS_ERR(epnum));
361*4882a593Smuzhiyun mtu3_writel(mbase, U3D_RQERRIESR1, QMU_RX_ZLP_ERR(epnum));
362*4882a593Smuzhiyun
363*4882a593Smuzhiyun if (mtu3_readl(mbase, USB_QMU_RQCSR(epnum)) & QMU_Q_ACTIVE) {
364*4882a593Smuzhiyun dev_warn(mtu->dev, "Rx %d Active Now!\n", epnum);
365*4882a593Smuzhiyun return 0;
366*4882a593Smuzhiyun }
367*4882a593Smuzhiyun mtu3_writel(mbase, USB_QMU_RQCSR(epnum), QMU_Q_START);
368*4882a593Smuzhiyun }
369*4882a593Smuzhiyun
370*4882a593Smuzhiyun return 0;
371*4882a593Smuzhiyun }
372*4882a593Smuzhiyun
373*4882a593Smuzhiyun /* may called in atomic context */
mtu3_qmu_stop(struct mtu3_ep * mep)374*4882a593Smuzhiyun void mtu3_qmu_stop(struct mtu3_ep *mep)
375*4882a593Smuzhiyun {
376*4882a593Smuzhiyun struct mtu3 *mtu = mep->mtu;
377*4882a593Smuzhiyun void __iomem *mbase = mtu->mac_base;
378*4882a593Smuzhiyun int epnum = mep->epnum;
379*4882a593Smuzhiyun u32 value = 0;
380*4882a593Smuzhiyun u32 qcsr;
381*4882a593Smuzhiyun int ret;
382*4882a593Smuzhiyun
383*4882a593Smuzhiyun qcsr = mep->is_in ? USB_QMU_TQCSR(epnum) : USB_QMU_RQCSR(epnum);
384*4882a593Smuzhiyun
385*4882a593Smuzhiyun if (!(mtu3_readl(mbase, qcsr) & QMU_Q_ACTIVE)) {
386*4882a593Smuzhiyun dev_dbg(mtu->dev, "%s's qmu is inactive now!\n", mep->name);
387*4882a593Smuzhiyun return;
388*4882a593Smuzhiyun }
389*4882a593Smuzhiyun mtu3_writel(mbase, qcsr, QMU_Q_STOP);
390*4882a593Smuzhiyun
391*4882a593Smuzhiyun ret = readl_poll_timeout_atomic(mbase + qcsr, value,
392*4882a593Smuzhiyun !(value & QMU_Q_ACTIVE), 1, 1000);
393*4882a593Smuzhiyun if (ret) {
394*4882a593Smuzhiyun dev_err(mtu->dev, "stop %s's qmu failed\n", mep->name);
395*4882a593Smuzhiyun return;
396*4882a593Smuzhiyun }
397*4882a593Smuzhiyun
398*4882a593Smuzhiyun dev_dbg(mtu->dev, "%s's qmu stop now!\n", mep->name);
399*4882a593Smuzhiyun }
400*4882a593Smuzhiyun
mtu3_qmu_flush(struct mtu3_ep * mep)401*4882a593Smuzhiyun void mtu3_qmu_flush(struct mtu3_ep *mep)
402*4882a593Smuzhiyun {
403*4882a593Smuzhiyun
404*4882a593Smuzhiyun dev_dbg(mep->mtu->dev, "%s flush QMU %s\n", __func__,
405*4882a593Smuzhiyun ((mep->is_in) ? "TX" : "RX"));
406*4882a593Smuzhiyun
407*4882a593Smuzhiyun /*Stop QMU */
408*4882a593Smuzhiyun mtu3_qmu_stop(mep);
409*4882a593Smuzhiyun reset_gpd_list(mep);
410*4882a593Smuzhiyun }
411*4882a593Smuzhiyun
412*4882a593Smuzhiyun /*
413*4882a593Smuzhiyun * QMU can't transfer zero length packet directly (a hardware limit
414*4882a593Smuzhiyun * on old SoCs), so when needs to send ZLP, we intentionally trigger
415*4882a593Smuzhiyun * a length error interrupt, and in the ISR sends a ZLP by BMU.
416*4882a593Smuzhiyun */
qmu_tx_zlp_error_handler(struct mtu3 * mtu,u8 epnum)417*4882a593Smuzhiyun static void qmu_tx_zlp_error_handler(struct mtu3 *mtu, u8 epnum)
418*4882a593Smuzhiyun {
419*4882a593Smuzhiyun struct mtu3_ep *mep = mtu->in_eps + epnum;
420*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
421*4882a593Smuzhiyun void __iomem *mbase = mtu->mac_base;
422*4882a593Smuzhiyun struct qmu_gpd *gpd_current = NULL;
423*4882a593Smuzhiyun struct mtu3_request *mreq;
424*4882a593Smuzhiyun dma_addr_t cur_gpd_dma;
425*4882a593Smuzhiyun u32 txcsr = 0;
426*4882a593Smuzhiyun int ret;
427*4882a593Smuzhiyun
428*4882a593Smuzhiyun mreq = next_request(mep);
429*4882a593Smuzhiyun if (mreq && mreq->request.length != 0)
430*4882a593Smuzhiyun return;
431*4882a593Smuzhiyun
432*4882a593Smuzhiyun cur_gpd_dma = read_txq_cur_addr(mbase, epnum);
433*4882a593Smuzhiyun gpd_current = gpd_dma_to_virt(ring, cur_gpd_dma);
434*4882a593Smuzhiyun
435*4882a593Smuzhiyun if (GPD_DATA_LEN(mtu, le32_to_cpu(gpd_current->dw3_info)) != 0) {
436*4882a593Smuzhiyun dev_err(mtu->dev, "TX EP%d buffer length error(!=0)\n", epnum);
437*4882a593Smuzhiyun return;
438*4882a593Smuzhiyun }
439*4882a593Smuzhiyun
440*4882a593Smuzhiyun dev_dbg(mtu->dev, "%s send ZLP for req=%p\n", __func__, mreq);
441*4882a593Smuzhiyun trace_mtu3_zlp_exp_gpd(mep, gpd_current);
442*4882a593Smuzhiyun
443*4882a593Smuzhiyun mtu3_clrbits(mbase, MU3D_EP_TXCR0(mep->epnum), TX_DMAREQEN);
444*4882a593Smuzhiyun
445*4882a593Smuzhiyun ret = readl_poll_timeout_atomic(mbase + MU3D_EP_TXCR0(mep->epnum),
446*4882a593Smuzhiyun txcsr, !(txcsr & TX_FIFOFULL), 1, 1000);
447*4882a593Smuzhiyun if (ret) {
448*4882a593Smuzhiyun dev_err(mtu->dev, "%s wait for fifo empty fail\n", __func__);
449*4882a593Smuzhiyun return;
450*4882a593Smuzhiyun }
451*4882a593Smuzhiyun mtu3_setbits(mbase, MU3D_EP_TXCR0(mep->epnum), TX_TXPKTRDY);
452*4882a593Smuzhiyun /* prevent reorder, make sure GPD's HWO is set last */
453*4882a593Smuzhiyun mb();
454*4882a593Smuzhiyun /* by pass the current GDP */
455*4882a593Smuzhiyun gpd_current->dw0_info |= cpu_to_le32(GPD_FLAGS_BPS | GPD_FLAGS_HWO);
456*4882a593Smuzhiyun
457*4882a593Smuzhiyun /*enable DMAREQEN, switch back to QMU mode */
458*4882a593Smuzhiyun mtu3_setbits(mbase, MU3D_EP_TXCR0(mep->epnum), TX_DMAREQEN);
459*4882a593Smuzhiyun mtu3_qmu_resume(mep);
460*4882a593Smuzhiyun }
461*4882a593Smuzhiyun
462*4882a593Smuzhiyun /*
463*4882a593Smuzhiyun * NOTE: request list maybe is already empty as following case:
464*4882a593Smuzhiyun * queue_tx --> qmu_interrupt(clear interrupt pending, schedule tasklet)-->
465*4882a593Smuzhiyun * queue_tx --> process_tasklet(meanwhile, the second one is transferred,
466*4882a593Smuzhiyun * tasklet process both of them)-->qmu_interrupt for second one.
467*4882a593Smuzhiyun * To avoid upper case, put qmu_done_tx in ISR directly to process it.
468*4882a593Smuzhiyun */
qmu_done_tx(struct mtu3 * mtu,u8 epnum)469*4882a593Smuzhiyun static void qmu_done_tx(struct mtu3 *mtu, u8 epnum)
470*4882a593Smuzhiyun {
471*4882a593Smuzhiyun struct mtu3_ep *mep = mtu->in_eps + epnum;
472*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
473*4882a593Smuzhiyun void __iomem *mbase = mtu->mac_base;
474*4882a593Smuzhiyun struct qmu_gpd *gpd = ring->dequeue;
475*4882a593Smuzhiyun struct qmu_gpd *gpd_current = NULL;
476*4882a593Smuzhiyun struct usb_request *request = NULL;
477*4882a593Smuzhiyun struct mtu3_request *mreq;
478*4882a593Smuzhiyun dma_addr_t cur_gpd_dma;
479*4882a593Smuzhiyun
480*4882a593Smuzhiyun /*transfer phy address got from QMU register to virtual address */
481*4882a593Smuzhiyun cur_gpd_dma = read_txq_cur_addr(mbase, epnum);
482*4882a593Smuzhiyun gpd_current = gpd_dma_to_virt(ring, cur_gpd_dma);
483*4882a593Smuzhiyun
484*4882a593Smuzhiyun dev_dbg(mtu->dev, "%s EP%d, last=%p, current=%p, enq=%p\n",
485*4882a593Smuzhiyun __func__, epnum, gpd, gpd_current, ring->enqueue);
486*4882a593Smuzhiyun
487*4882a593Smuzhiyun while (gpd != gpd_current && !GET_GPD_HWO(gpd)) {
488*4882a593Smuzhiyun
489*4882a593Smuzhiyun mreq = next_request(mep);
490*4882a593Smuzhiyun
491*4882a593Smuzhiyun if (mreq == NULL || mreq->gpd != gpd) {
492*4882a593Smuzhiyun dev_err(mtu->dev, "no correct TX req is found\n");
493*4882a593Smuzhiyun break;
494*4882a593Smuzhiyun }
495*4882a593Smuzhiyun
496*4882a593Smuzhiyun request = &mreq->request;
497*4882a593Smuzhiyun request->actual = GPD_DATA_LEN(mtu, le32_to_cpu(gpd->dw3_info));
498*4882a593Smuzhiyun trace_mtu3_complete_gpd(mep, gpd);
499*4882a593Smuzhiyun mtu3_req_complete(mep, request, 0);
500*4882a593Smuzhiyun
501*4882a593Smuzhiyun gpd = advance_deq_gpd(ring);
502*4882a593Smuzhiyun }
503*4882a593Smuzhiyun
504*4882a593Smuzhiyun dev_dbg(mtu->dev, "%s EP%d, deq=%p, enq=%p, complete\n",
505*4882a593Smuzhiyun __func__, epnum, ring->dequeue, ring->enqueue);
506*4882a593Smuzhiyun
507*4882a593Smuzhiyun }
508*4882a593Smuzhiyun
qmu_done_rx(struct mtu3 * mtu,u8 epnum)509*4882a593Smuzhiyun static void qmu_done_rx(struct mtu3 *mtu, u8 epnum)
510*4882a593Smuzhiyun {
511*4882a593Smuzhiyun struct mtu3_ep *mep = mtu->out_eps + epnum;
512*4882a593Smuzhiyun struct mtu3_gpd_ring *ring = &mep->gpd_ring;
513*4882a593Smuzhiyun void __iomem *mbase = mtu->mac_base;
514*4882a593Smuzhiyun struct qmu_gpd *gpd = ring->dequeue;
515*4882a593Smuzhiyun struct qmu_gpd *gpd_current = NULL;
516*4882a593Smuzhiyun struct usb_request *req = NULL;
517*4882a593Smuzhiyun struct mtu3_request *mreq;
518*4882a593Smuzhiyun dma_addr_t cur_gpd_dma;
519*4882a593Smuzhiyun
520*4882a593Smuzhiyun cur_gpd_dma = read_rxq_cur_addr(mbase, epnum);
521*4882a593Smuzhiyun gpd_current = gpd_dma_to_virt(ring, cur_gpd_dma);
522*4882a593Smuzhiyun
523*4882a593Smuzhiyun dev_dbg(mtu->dev, "%s EP%d, last=%p, current=%p, enq=%p\n",
524*4882a593Smuzhiyun __func__, epnum, gpd, gpd_current, ring->enqueue);
525*4882a593Smuzhiyun
526*4882a593Smuzhiyun while (gpd != gpd_current && !GET_GPD_HWO(gpd)) {
527*4882a593Smuzhiyun
528*4882a593Smuzhiyun mreq = next_request(mep);
529*4882a593Smuzhiyun
530*4882a593Smuzhiyun if (mreq == NULL || mreq->gpd != gpd) {
531*4882a593Smuzhiyun dev_err(mtu->dev, "no correct RX req is found\n");
532*4882a593Smuzhiyun break;
533*4882a593Smuzhiyun }
534*4882a593Smuzhiyun req = &mreq->request;
535*4882a593Smuzhiyun
536*4882a593Smuzhiyun req->actual = GPD_DATA_LEN(mtu, le32_to_cpu(gpd->dw3_info));
537*4882a593Smuzhiyun trace_mtu3_complete_gpd(mep, gpd);
538*4882a593Smuzhiyun mtu3_req_complete(mep, req, 0);
539*4882a593Smuzhiyun
540*4882a593Smuzhiyun gpd = advance_deq_gpd(ring);
541*4882a593Smuzhiyun }
542*4882a593Smuzhiyun
543*4882a593Smuzhiyun dev_dbg(mtu->dev, "%s EP%d, deq=%p, enq=%p, complete\n",
544*4882a593Smuzhiyun __func__, epnum, ring->dequeue, ring->enqueue);
545*4882a593Smuzhiyun }
546*4882a593Smuzhiyun
qmu_done_isr(struct mtu3 * mtu,u32 done_status)547*4882a593Smuzhiyun static void qmu_done_isr(struct mtu3 *mtu, u32 done_status)
548*4882a593Smuzhiyun {
549*4882a593Smuzhiyun int i;
550*4882a593Smuzhiyun
551*4882a593Smuzhiyun for (i = 1; i < mtu->num_eps; i++) {
552*4882a593Smuzhiyun if (done_status & QMU_RX_DONE_INT(i))
553*4882a593Smuzhiyun qmu_done_rx(mtu, i);
554*4882a593Smuzhiyun if (done_status & QMU_TX_DONE_INT(i))
555*4882a593Smuzhiyun qmu_done_tx(mtu, i);
556*4882a593Smuzhiyun }
557*4882a593Smuzhiyun }
558*4882a593Smuzhiyun
qmu_exception_isr(struct mtu3 * mtu,u32 qmu_status)559*4882a593Smuzhiyun static void qmu_exception_isr(struct mtu3 *mtu, u32 qmu_status)
560*4882a593Smuzhiyun {
561*4882a593Smuzhiyun void __iomem *mbase = mtu->mac_base;
562*4882a593Smuzhiyun u32 errval;
563*4882a593Smuzhiyun int i;
564*4882a593Smuzhiyun
565*4882a593Smuzhiyun if ((qmu_status & RXQ_CSERR_INT) || (qmu_status & RXQ_LENERR_INT)) {
566*4882a593Smuzhiyun errval = mtu3_readl(mbase, U3D_RQERRIR0);
567*4882a593Smuzhiyun for (i = 1; i < mtu->num_eps; i++) {
568*4882a593Smuzhiyun if (errval & QMU_RX_CS_ERR(i))
569*4882a593Smuzhiyun dev_err(mtu->dev, "Rx %d CS error!\n", i);
570*4882a593Smuzhiyun
571*4882a593Smuzhiyun if (errval & QMU_RX_LEN_ERR(i))
572*4882a593Smuzhiyun dev_err(mtu->dev, "RX %d Length error\n", i);
573*4882a593Smuzhiyun }
574*4882a593Smuzhiyun mtu3_writel(mbase, U3D_RQERRIR0, errval);
575*4882a593Smuzhiyun }
576*4882a593Smuzhiyun
577*4882a593Smuzhiyun if (qmu_status & RXQ_ZLPERR_INT) {
578*4882a593Smuzhiyun errval = mtu3_readl(mbase, U3D_RQERRIR1);
579*4882a593Smuzhiyun for (i = 1; i < mtu->num_eps; i++) {
580*4882a593Smuzhiyun if (errval & QMU_RX_ZLP_ERR(i))
581*4882a593Smuzhiyun dev_dbg(mtu->dev, "RX EP%d Recv ZLP\n", i);
582*4882a593Smuzhiyun }
583*4882a593Smuzhiyun mtu3_writel(mbase, U3D_RQERRIR1, errval);
584*4882a593Smuzhiyun }
585*4882a593Smuzhiyun
586*4882a593Smuzhiyun if ((qmu_status & TXQ_CSERR_INT) || (qmu_status & TXQ_LENERR_INT)) {
587*4882a593Smuzhiyun errval = mtu3_readl(mbase, U3D_TQERRIR0);
588*4882a593Smuzhiyun for (i = 1; i < mtu->num_eps; i++) {
589*4882a593Smuzhiyun if (errval & QMU_TX_CS_ERR(i))
590*4882a593Smuzhiyun dev_err(mtu->dev, "Tx %d checksum error!\n", i);
591*4882a593Smuzhiyun
592*4882a593Smuzhiyun if (errval & QMU_TX_LEN_ERR(i))
593*4882a593Smuzhiyun qmu_tx_zlp_error_handler(mtu, i);
594*4882a593Smuzhiyun }
595*4882a593Smuzhiyun mtu3_writel(mbase, U3D_TQERRIR0, errval);
596*4882a593Smuzhiyun }
597*4882a593Smuzhiyun }
598*4882a593Smuzhiyun
mtu3_qmu_isr(struct mtu3 * mtu)599*4882a593Smuzhiyun irqreturn_t mtu3_qmu_isr(struct mtu3 *mtu)
600*4882a593Smuzhiyun {
601*4882a593Smuzhiyun void __iomem *mbase = mtu->mac_base;
602*4882a593Smuzhiyun u32 qmu_status;
603*4882a593Smuzhiyun u32 qmu_done_status;
604*4882a593Smuzhiyun
605*4882a593Smuzhiyun /* U3D_QISAR1 is read update */
606*4882a593Smuzhiyun qmu_status = mtu3_readl(mbase, U3D_QISAR1);
607*4882a593Smuzhiyun qmu_status &= mtu3_readl(mbase, U3D_QIER1);
608*4882a593Smuzhiyun
609*4882a593Smuzhiyun qmu_done_status = mtu3_readl(mbase, U3D_QISAR0);
610*4882a593Smuzhiyun qmu_done_status &= mtu3_readl(mbase, U3D_QIER0);
611*4882a593Smuzhiyun mtu3_writel(mbase, U3D_QISAR0, qmu_done_status); /* W1C */
612*4882a593Smuzhiyun dev_dbg(mtu->dev, "=== QMUdone[tx=%x, rx=%x] QMUexp[%x] ===\n",
613*4882a593Smuzhiyun (qmu_done_status & 0xFFFF), qmu_done_status >> 16,
614*4882a593Smuzhiyun qmu_status);
615*4882a593Smuzhiyun trace_mtu3_qmu_isr(qmu_done_status, qmu_status);
616*4882a593Smuzhiyun
617*4882a593Smuzhiyun if (qmu_done_status)
618*4882a593Smuzhiyun qmu_done_isr(mtu, qmu_done_status);
619*4882a593Smuzhiyun
620*4882a593Smuzhiyun if (qmu_status)
621*4882a593Smuzhiyun qmu_exception_isr(mtu, qmu_status);
622*4882a593Smuzhiyun
623*4882a593Smuzhiyun return IRQ_HANDLED;
624*4882a593Smuzhiyun }
625*4882a593Smuzhiyun
mtu3_qmu_init(struct mtu3 * mtu)626*4882a593Smuzhiyun int mtu3_qmu_init(struct mtu3 *mtu)
627*4882a593Smuzhiyun {
628*4882a593Smuzhiyun
629*4882a593Smuzhiyun compiletime_assert(QMU_GPD_SIZE == 16, "QMU_GPD size SHOULD be 16B");
630*4882a593Smuzhiyun
631*4882a593Smuzhiyun mtu->qmu_gpd_pool = dma_pool_create("QMU_GPD", mtu->dev,
632*4882a593Smuzhiyun QMU_GPD_RING_SIZE, QMU_GPD_SIZE, 0);
633*4882a593Smuzhiyun
634*4882a593Smuzhiyun if (!mtu->qmu_gpd_pool)
635*4882a593Smuzhiyun return -ENOMEM;
636*4882a593Smuzhiyun
637*4882a593Smuzhiyun return 0;
638*4882a593Smuzhiyun }
639*4882a593Smuzhiyun
mtu3_qmu_exit(struct mtu3 * mtu)640*4882a593Smuzhiyun void mtu3_qmu_exit(struct mtu3 *mtu)
641*4882a593Smuzhiyun {
642*4882a593Smuzhiyun dma_pool_destroy(mtu->qmu_gpd_pool);
643*4882a593Smuzhiyun }
644