// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2015 Cavium, Inc.
 */

#include <linux/pci.h>
#include <linux/netdevice.h>
#include <linux/ip.h>
#include <linux/etherdevice.h>
#include <linux/iommu.h>
#include <net/ip.h>
#include <net/tso.h>

#include "nic_reg.h"
#include "nic.h"
#include "q_struct.h"
#include "nicvf_queues.h"

static inline void nicvf_sq_add_gather_subdesc(struct snd_queue *sq, int qentry,
                                               int size, u64 data);

static void nicvf_get_page(struct nicvf *nic)
{
        if (!nic->rb_pageref || !nic->rb_page)
                return;

        page_ref_add(nic->rb_page, nic->rb_pageref);
        nic->rb_pageref = 0;
}

/* Poll a register for a specific value */
static int nicvf_poll_reg(struct nicvf *nic, int qidx,
                          u64 reg, int bit_pos, int bits, int val)
{
        u64 bit_mask;
        u64 reg_val;
        int timeout = 10;

        bit_mask = (1ULL << bits) - 1;
        bit_mask = (bit_mask << bit_pos);

        while (timeout) {
                reg_val = nicvf_queue_reg_read(nic, reg, qidx);
                if (((reg_val & bit_mask) >> bit_pos) == val)
                        return 0;
                usleep_range(1000, 2000);
                timeout--;
        }
        netdev_err(nic->netdev, "Poll on reg 0x%llx failed\n", reg);
        return 1;
}
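
/* Worked example of the mask arithmetic above, for illustration only
 * (values taken from the RBDR FIFO-state polls later in this file):
 * with bit_pos = 62 and bits = 2,
 *
 *   bit_mask = ((1ULL << 2) - 1) << 62 = 0xC000000000000000
 *
 * so a register value of 0x8000000000000000 yields
 * (reg_val & bit_mask) >> 62 = 0x2, which is compared against 'val'.
 */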

/* Allocate memory for a queue's descriptors */
static int nicvf_alloc_q_desc_mem(struct nicvf *nic, struct q_desc_mem *dmem,
                                  int q_len, int desc_size, int align_bytes)
{
        dmem->q_len = q_len;
        dmem->size = (desc_size * q_len) + align_bytes;
        /* Save address, need it while freeing */
        dmem->unalign_base = dma_alloc_coherent(&nic->pdev->dev, dmem->size,
                                                &dmem->dma, GFP_KERNEL);
        if (!dmem->unalign_base)
                return -ENOMEM;

        /* Align memory address for 'align_bytes' */
        dmem->phys_base = NICVF_ALIGNED_ADDR((u64)dmem->dma, align_bytes);
        dmem->base = dmem->unalign_base + (dmem->phys_base - dmem->dma);
        return 0;
}
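
/* Illustration of the alignment fix-up above (numbers are hypothetical):
 * if dma_alloc_coherent() returns dma = 0x10a0 and align_bytes = 128,
 * NICVF_ALIGNED_ADDR() rounds up to phys_base = 0x1100, and 'base' is
 * the CPU pointer advanced by the same 0x60-byte offset, keeping the CPU
 * and DMA views of the descriptor memory in sync.
 */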

/* Free queue's descriptor memory */
static void nicvf_free_q_desc_mem(struct nicvf *nic, struct q_desc_mem *dmem)
{
        if (!dmem)
                return;

        dma_free_coherent(&nic->pdev->dev, dmem->size,
                          dmem->unalign_base, dmem->dma);
        dmem->unalign_base = NULL;
        dmem->base = NULL;
}

#define XDP_PAGE_REFCNT_REFILL 256

/* Allocate a new page or recycle one if possible.
 *
 * We cannot optimize DMA mapping here, since
 * 1. There is only one RBDR ring for 8 Rx queues.
 * 2. CQE_RX gives the address of the buffer into which the packet has
 *    been DMA'ed, not an index into the RBDR ring, so saved mapping info
 *    can't be reused.
 * 3. There are multiple receive buffers per page.
 */
static inline struct pgcache *nicvf_alloc_page(struct nicvf *nic,
                                               struct rbdr *rbdr, gfp_t gfp)
{
        int ref_count;
        struct page *page = NULL;
        struct pgcache *pgcache, *next;

        /* Check if page is already allocated */
        pgcache = &rbdr->pgcache[rbdr->pgidx];
        page = pgcache->page;
        /* Check if page can be recycled */
        if (page) {
                ref_count = page_ref_count(page);
                /* This page can be recycled if internal ref_count and page's
                 * ref_count are equal, indicating that the page has been used
                 * once for packet reception. For non-XDP mode, internal
                 * ref_count is always '1'.
                 */
                if (rbdr->is_xdp) {
                        if (ref_count == pgcache->ref_count)
                                pgcache->ref_count--;
                        else
                                page = NULL;
                } else if (ref_count != 1) {
                        page = NULL;
                }
        }

        if (!page) {
                page = alloc_pages(gfp | __GFP_COMP | __GFP_NOWARN, 0);
                if (!page)
                        return NULL;

                this_cpu_inc(nic->pnicvf->drv_stats->page_alloc);

                /* Check for space */
                if (rbdr->pgalloc >= rbdr->pgcnt) {
                        /* Page can still be used */
                        nic->rb_page = page;
                        return NULL;
                }

                /* Save the page in page cache */
                pgcache->page = page;
                pgcache->dma_addr = 0;
                pgcache->ref_count = 0;
                rbdr->pgalloc++;
        }

        /* Take additional page references for recycling */
        if (rbdr->is_xdp) {
                /* Since there is a single RBDR (i.e. a single core doing
                 * page recycling) per 8 Rx queues, atomically adjusting
                 * page references is the biggest bottleneck in XDP mode,
                 * so take a bunch of references at a time.
                 *
                 * As a result, the internal ref_count below stays one
                 * less than the page's true refcount.
                 */
                if (!pgcache->ref_count) {
                        pgcache->ref_count = XDP_PAGE_REFCNT_REFILL;
                        page_ref_add(page, XDP_PAGE_REFCNT_REFILL);
                }
        } else {
                /* In the non-XDP case, a single 64K page is divided across
                 * multiple receive buffers, so the cost of recycling is low
                 * anyway, and one extra reference is enough.
                 */
                page_ref_add(page, 1);
        }

        rbdr->pgidx++;
        rbdr->pgidx &= (rbdr->pgcnt - 1);

        /* Prefetch refcount of next page in page cache */
        next = &rbdr->pgcache[rbdr->pgidx];
        page = next->page;
        if (page)
                prefetch(&page->_refcount);

        return pgcache;
}
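
/* Refcount bookkeeping sketch for the XDP recycling path above (numbers
 * are illustrative): a freshly allocated page starts with refcount 1;
 * the refill bumps it by XDP_PAGE_REFCNT_REFILL (256) and records
 * ref_count = 256 in the pgcache, i.e. the cached counter stays one
 * below the page's true refcount. A page is recycled only while the two
 * match, and each recycle decrements just the cached counter, so the
 * fast path avoids touching the atomic page refcount.
 */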

/* Allocate buffer for packet reception */
static inline int nicvf_alloc_rcv_buffer(struct nicvf *nic, struct rbdr *rbdr,
                                         gfp_t gfp, u32 buf_len, u64 *rbuf)
{
        struct pgcache *pgcache = NULL;

        /* Check if the request can be accommodated in the previously
         * allocated page. In XDP mode only one buffer per page is permitted.
         */
        if (!rbdr->is_xdp && nic->rb_page &&
            ((nic->rb_page_offset + buf_len) <= PAGE_SIZE)) {
                nic->rb_pageref++;
                goto ret;
        }

        nicvf_get_page(nic);
        nic->rb_page = NULL;

        /* Get new page, either recycled or new one */
        pgcache = nicvf_alloc_page(nic, rbdr, gfp);
        if (!pgcache && !nic->rb_page) {
                this_cpu_inc(nic->pnicvf->drv_stats->rcv_buffer_alloc_failures);
                return -ENOMEM;
        }

        nic->rb_page_offset = 0;

        /* Reserve space for header modifications by BPF program */
        if (rbdr->is_xdp)
                buf_len += XDP_PACKET_HEADROOM;

        /* Check if it's recycled */
        if (pgcache)
                nic->rb_page = pgcache->page;
ret:
        if (rbdr->is_xdp && pgcache && pgcache->dma_addr) {
                *rbuf = pgcache->dma_addr;
        } else {
                /* HW will ensure data coherency, CPU sync not required */
                *rbuf = (u64)dma_map_page_attrs(&nic->pdev->dev, nic->rb_page,
                                                nic->rb_page_offset, buf_len,
                                                DMA_FROM_DEVICE,
                                                DMA_ATTR_SKIP_CPU_SYNC);
                if (dma_mapping_error(&nic->pdev->dev, (dma_addr_t)*rbuf)) {
                        if (!nic->rb_page_offset)
                                __free_pages(nic->rb_page, 0);
                        nic->rb_page = NULL;
                        return -ENOMEM;
                }
                if (pgcache)
                        pgcache->dma_addr = *rbuf + XDP_PACKET_HEADROOM;
                nic->rb_page_offset += buf_len;
        }

        return 0;
}
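
/* Buffer packing sketch for the non-XDP path above: with 64K pages and
 * buf_len = RCV_FRAG_LEN, successive calls keep advancing rb_page_offset
 * within the same page and only bump the local rb_pageref counter;
 * nicvf_get_page() later folds the accumulated references into the page
 * refcount with a single page_ref_add(), amortizing the atomic op.
 */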

/* Build skb around receive buffer */
static struct sk_buff *nicvf_rb_ptr_to_skb(struct nicvf *nic,
                                           u64 rb_ptr, int len)
{
        void *data;
        struct sk_buff *skb;

        data = phys_to_virt(rb_ptr);

        /* Now build an skb to give to stack */
        skb = build_skb(data, RCV_FRAG_LEN);
        if (!skb) {
                put_page(virt_to_page(data));
                return NULL;
        }

        prefetch(skb->data);
        return skb;
}

/* Allocate RBDR ring and populate receive buffers */
static int nicvf_init_rbdr(struct nicvf *nic, struct rbdr *rbdr,
                           int ring_len, int buf_size)
{
        int idx;
        u64 rbuf;
        struct rbdr_entry_t *desc;
        int err;

        err = nicvf_alloc_q_desc_mem(nic, &rbdr->dmem, ring_len,
                                     sizeof(struct rbdr_entry_t),
                                     NICVF_RCV_BUF_ALIGN_BYTES);
        if (err)
                return err;

        rbdr->desc = rbdr->dmem.base;
        /* Buffer size has to be in multiples of 128 bytes */
        rbdr->dma_size = buf_size;
        rbdr->enable = true;
        rbdr->thresh = RBDR_THRESH;
        rbdr->head = 0;
        rbdr->tail = 0;

        /* Initialize page recycling state.
         *
         * A single buffer per page can't be used, especially with 64K
         * pages: on embedded platforms (i.e. 81xx/83xx) available memory
         * itself is low, and with a minimum RBDR ring size of 8K that
         * would take away lots of memory.
         *
         * For XDP, however, it has to be a single buffer per page.
         */
        if (!nic->pnicvf->xdp_prog) {
                rbdr->pgcnt = ring_len / (PAGE_SIZE / buf_size);
                rbdr->is_xdp = false;
        } else {
                rbdr->pgcnt = ring_len;
                rbdr->is_xdp = true;
        }
        rbdr->pgcnt = roundup_pow_of_two(rbdr->pgcnt);
        rbdr->pgcache = kcalloc(rbdr->pgcnt, sizeof(*rbdr->pgcache),
                                GFP_KERNEL);
        if (!rbdr->pgcache)
                return -ENOMEM;
        rbdr->pgidx = 0;
        rbdr->pgalloc = 0;

        nic->rb_page = NULL;
        for (idx = 0; idx < ring_len; idx++) {
                err = nicvf_alloc_rcv_buffer(nic, rbdr, GFP_KERNEL,
                                             RCV_FRAG_LEN, &rbuf);
                if (err) {
                        /* To free already allocated and mapped ones */
                        rbdr->tail = idx - 1;
                        return err;
                }

                desc = GET_RBDR_DESC(rbdr, idx);
                desc->buf_addr = rbuf & ~(NICVF_RCV_BUF_ALIGN_BYTES - 1);
        }

        nicvf_get_page(nic);

        return 0;
}
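
/* Sizing example for the page cache above (illustrative numbers): with
 * 64K pages and 2K receive buffers, a non-XDP ring of ring_len = 8192
 * spans 8192 / (65536 / 2048) = 256 pages; the count is then rounded up
 * to a power of two so the pgidx wrap can use a simple AND mask. In XDP
 * mode the cache instead holds one page per descriptor.
 */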

/* Free RBDR ring and its receive buffers */
static void nicvf_free_rbdr(struct nicvf *nic, struct rbdr *rbdr)
{
        int head, tail;
        u64 buf_addr, phys_addr;
        struct pgcache *pgcache;
        struct rbdr_entry_t *desc;

        if (!rbdr)
                return;

        rbdr->enable = false;
        if (!rbdr->dmem.base)
                return;

        head = rbdr->head;
        tail = rbdr->tail;

        /* Release page references */
        while (head != tail) {
                desc = GET_RBDR_DESC(rbdr, head);
                buf_addr = desc->buf_addr;
                phys_addr = nicvf_iova_to_phys(nic, buf_addr);
                dma_unmap_page_attrs(&nic->pdev->dev, buf_addr, RCV_FRAG_LEN,
                                     DMA_FROM_DEVICE, DMA_ATTR_SKIP_CPU_SYNC);
                if (phys_addr)
                        put_page(virt_to_page(phys_to_virt(phys_addr)));
                head++;
                head &= (rbdr->dmem.q_len - 1);
        }
        /* Release buffer of tail desc */
        desc = GET_RBDR_DESC(rbdr, tail);
        buf_addr = desc->buf_addr;
        phys_addr = nicvf_iova_to_phys(nic, buf_addr);
        dma_unmap_page_attrs(&nic->pdev->dev, buf_addr, RCV_FRAG_LEN,
                             DMA_FROM_DEVICE, DMA_ATTR_SKIP_CPU_SYNC);
        if (phys_addr)
                put_page(virt_to_page(phys_to_virt(phys_addr)));

        /* Sync page cache info */
        smp_rmb();

        /* Release additional page references held for recycling */
        head = 0;
        while (head < rbdr->pgcnt) {
                pgcache = &rbdr->pgcache[head];
                if (pgcache->page && page_ref_count(pgcache->page) != 0) {
                        if (rbdr->is_xdp) {
                                page_ref_sub(pgcache->page,
                                             pgcache->ref_count - 1);
                        }
                        put_page(pgcache->page);
                }
                head++;
        }

        /* Free RBDR ring */
        nicvf_free_q_desc_mem(nic, &rbdr->dmem);
}

/* Refill receive buffer descriptors with new buffers */
static void nicvf_refill_rbdr(struct nicvf *nic, gfp_t gfp)
{
        struct queue_set *qs = nic->qs;
        int rbdr_idx = qs->rbdr_cnt;
        int tail, qcount;
        int refill_rb_cnt;
        struct rbdr *rbdr;
        struct rbdr_entry_t *desc;
        u64 rbuf;
        int new_rb = 0;

refill:
        if (!rbdr_idx)
                return;
        rbdr_idx--;
        rbdr = &qs->rbdr[rbdr_idx];
        /* Check if it's enabled */
        if (!rbdr->enable)
                goto next_rbdr;

        /* Get the number of descriptors to be refilled */
        qcount = nicvf_queue_reg_read(nic, NIC_QSET_RBDR_0_1_STATUS0, rbdr_idx);
        qcount &= 0x7FFFF;
        /* The doorbell can be rung with at most ring size minus 1 */
        if (qcount >= (qs->rbdr_len - 1))
                goto next_rbdr;
        else
                refill_rb_cnt = qs->rbdr_len - qcount - 1;

        /* Sync page cache info */
        smp_rmb();

        /* Start filling descs from tail */
        tail = nicvf_queue_reg_read(nic, NIC_QSET_RBDR_0_1_TAIL, rbdr_idx) >> 3;
        while (refill_rb_cnt) {
                tail++;
                tail &= (rbdr->dmem.q_len - 1);

                if (nicvf_alloc_rcv_buffer(nic, rbdr, gfp, RCV_FRAG_LEN, &rbuf))
                        break;

                desc = GET_RBDR_DESC(rbdr, tail);
                desc->buf_addr = rbuf & ~(NICVF_RCV_BUF_ALIGN_BYTES - 1);
                refill_rb_cnt--;
                new_rb++;
        }

        nicvf_get_page(nic);

        /* Make sure all memory stores are done before ringing doorbell */
        smp_wmb();

        /* Check if buffer allocation failed */
        if (refill_rb_cnt)
                nic->rb_alloc_fail = true;
        else
                nic->rb_alloc_fail = false;

        /* Notify HW */
        nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_DOOR,
                              rbdr_idx, new_rb);
next_rbdr:
        /* Re-enable RBDR interrupts only if buffer allocation succeeded */
        if (!nic->rb_alloc_fail && rbdr->enable &&
            netif_running(nic->pnicvf->netdev))
                nicvf_enable_intr(nic, NICVF_INTR_RBDR, rbdr_idx);

        if (rbdr_idx)
                goto refill;
}
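
/* Doorbell arithmetic sketch for the refill above (illustrative
 * numbers): with rbdr_len = 8192 and STATUS0 reporting qcount = 8000
 * valid descriptors, refill_rb_cnt = 8192 - 8000 - 1 = 191 buffers are
 * posted and that count is written to the DOOR register, always leaving
 * one slot free per the ring-size-minus-1 doorbell limit noted above.
 */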

/* Alloc rcv buffers in non-atomic mode for better success */
void nicvf_rbdr_work(struct work_struct *work)
{
        struct nicvf *nic = container_of(work, struct nicvf, rbdr_work.work);

        nicvf_refill_rbdr(nic, GFP_KERNEL);
        if (nic->rb_alloc_fail)
                schedule_delayed_work(&nic->rbdr_work, msecs_to_jiffies(10));
        else
                nic->rb_work_scheduled = false;
}

/* In Softirq context, alloc rcv buffers in atomic mode */
void nicvf_rbdr_task(struct tasklet_struct *t)
{
        struct nicvf *nic = from_tasklet(nic, t, rbdr_task);

        nicvf_refill_rbdr(nic, GFP_ATOMIC);
        if (nic->rb_alloc_fail) {
                nic->rb_work_scheduled = true;
                schedule_delayed_work(&nic->rbdr_work, msecs_to_jiffies(10));
        }
}

/* Initialize completion queue */
static int nicvf_init_cmp_queue(struct nicvf *nic,
                                struct cmp_queue *cq, int q_len)
{
        int err;

        err = nicvf_alloc_q_desc_mem(nic, &cq->dmem, q_len, CMP_QUEUE_DESC_SIZE,
                                     NICVF_CQ_BASE_ALIGN_BYTES);
        if (err)
                return err;

        cq->desc = cq->dmem.base;
        cq->thresh = pass1_silicon(nic->pdev) ? 0 : CMP_QUEUE_CQE_THRESH;
        nic->cq_coalesce_usecs = (CMP_QUEUE_TIMER_THRESH * 0.05) - 1;

        return 0;
}

static void nicvf_free_cmp_queue(struct nicvf *nic, struct cmp_queue *cq)
{
        if (!cq)
                return;
        if (!cq->dmem.base)
                return;

        nicvf_free_q_desc_mem(nic, &cq->dmem);
}

/* Initialize transmit queue */
static int nicvf_init_snd_queue(struct nicvf *nic,
                                struct snd_queue *sq, int q_len, int qidx)
{
        int err;

        err = nicvf_alloc_q_desc_mem(nic, &sq->dmem, q_len, SND_QUEUE_DESC_SIZE,
                                     NICVF_SQ_BASE_ALIGN_BYTES);
        if (err)
                return err;

        sq->desc = sq->dmem.base;
        sq->skbuff = kcalloc(q_len, sizeof(u64), GFP_KERNEL);
        if (!sq->skbuff)
                return -ENOMEM;

        sq->head = 0;
        sq->tail = 0;
        sq->thresh = SND_QUEUE_THRESH;

        /* Check if this SQ is a XDP TX queue */
        if (nic->sqs_mode)
                qidx += ((nic->sqs_id + 1) * MAX_SND_QUEUES_PER_QS);
        if (qidx < nic->pnicvf->xdp_tx_queues) {
                /* Alloc memory to save page pointers for XDP_TX */
                sq->xdp_page = kcalloc(q_len, sizeof(u64), GFP_KERNEL);
                if (!sq->xdp_page)
                        return -ENOMEM;
                sq->xdp_desc_cnt = 0;
                sq->xdp_free_cnt = q_len - 1;
                sq->is_xdp = true;
        } else {
                sq->xdp_page = NULL;
                sq->xdp_desc_cnt = 0;
                sq->xdp_free_cnt = 0;
                sq->is_xdp = false;

                atomic_set(&sq->free_cnt, q_len - 1);

                /* Preallocate memory for TSO segment's header */
                sq->tso_hdrs = dma_alloc_coherent(&nic->pdev->dev,
                                                  q_len * TSO_HEADER_SIZE,
                                                  &sq->tso_hdrs_phys,
                                                  GFP_KERNEL);
                if (!sq->tso_hdrs)
                        return -ENOMEM;
        }

        return 0;
}

void nicvf_unmap_sndq_buffers(struct nicvf *nic, struct snd_queue *sq,
                              int hdr_sqe, u8 subdesc_cnt)
{
        u8 idx;
        struct sq_gather_subdesc *gather;

        /* Unmap DMA mapped skb data buffers */
        for (idx = 0; idx < subdesc_cnt; idx++) {
                hdr_sqe++;
                hdr_sqe &= (sq->dmem.q_len - 1);
                gather = (struct sq_gather_subdesc *)GET_SQ_DESC(sq, hdr_sqe);
                /* HW will ensure data coherency, CPU sync not required */
                dma_unmap_page_attrs(&nic->pdev->dev, gather->addr,
                                     gather->size, DMA_TO_DEVICE,
                                     DMA_ATTR_SKIP_CPU_SYNC);
        }
}

static void nicvf_free_snd_queue(struct nicvf *nic, struct snd_queue *sq)
{
        struct sk_buff *skb;
        struct page *page;
        struct sq_hdr_subdesc *hdr;
        struct sq_hdr_subdesc *tso_sqe;

        if (!sq)
                return;
        if (!sq->dmem.base)
                return;

        if (sq->tso_hdrs) {
                dma_free_coherent(&nic->pdev->dev,
                                  sq->dmem.q_len * TSO_HEADER_SIZE,
                                  sq->tso_hdrs, sq->tso_hdrs_phys);
                sq->tso_hdrs = NULL;
        }

        /* Free pending skbs in the queue */
        smp_rmb();
        while (sq->head != sq->tail) {
                skb = (struct sk_buff *)sq->skbuff[sq->head];
                if (!skb || !sq->xdp_page)
                        goto next;

                page = (struct page *)sq->xdp_page[sq->head];
                if (!page)
                        goto next;
                else
                        put_page(page);

                hdr = (struct sq_hdr_subdesc *)GET_SQ_DESC(sq, sq->head);
                /* Check for dummy descriptor used for HW TSO offload on 88xx */
                if (hdr->dont_send) {
                        /* Get actual TSO descriptors and unmap them */
                        tso_sqe =
                         (struct sq_hdr_subdesc *)GET_SQ_DESC(sq, hdr->rsvd2);
                        nicvf_unmap_sndq_buffers(nic, sq, hdr->rsvd2,
                                                 tso_sqe->subdesc_cnt);
                } else {
                        nicvf_unmap_sndq_buffers(nic, sq, sq->head,
                                                 hdr->subdesc_cnt);
                }
                if (skb)
                        dev_kfree_skb_any(skb);
next:
                sq->head++;
                sq->head &= (sq->dmem.q_len - 1);
        }
        kfree(sq->skbuff);
        kfree(sq->xdp_page);
        nicvf_free_q_desc_mem(nic, &sq->dmem);
}

static void nicvf_reclaim_snd_queue(struct nicvf *nic,
                                    struct queue_set *qs, int qidx)
{
        /* Disable send queue */
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_CFG, qidx, 0);
        /* Check if SQ is stopped */
        if (nicvf_poll_reg(nic, qidx, NIC_QSET_SQ_0_7_STATUS, 21, 1, 0x01))
                return;
        /* Reset send queue */
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_CFG, qidx, NICVF_SQ_RESET);
}

static void nicvf_reclaim_rcv_queue(struct nicvf *nic,
                                    struct queue_set *qs, int qidx)
{
        union nic_mbx mbx = {};

        /* Make sure all packets in the pipeline are written back into mem */
        mbx.msg.msg = NIC_MBOX_MSG_RQ_SW_SYNC;
        nicvf_send_msg_to_pf(nic, &mbx);
}

static void nicvf_reclaim_cmp_queue(struct nicvf *nic,
                                    struct queue_set *qs, int qidx)
{
        /* Disable timer threshold (doesn't get reset upon CQ reset) */
        nicvf_queue_reg_write(nic, NIC_QSET_CQ_0_7_CFG2, qidx, 0);
        /* Disable completion queue */
        nicvf_queue_reg_write(nic, NIC_QSET_CQ_0_7_CFG, qidx, 0);
        /* Reset completion queue */
        nicvf_queue_reg_write(nic, NIC_QSET_CQ_0_7_CFG, qidx, NICVF_CQ_RESET);
}

static void nicvf_reclaim_rbdr(struct nicvf *nic,
                               struct rbdr *rbdr, int qidx)
{
        u64 tmp, fifo_state;
        int timeout = 10;

        /* Save head and tail pointers for freeing up buffers */
        rbdr->head = nicvf_queue_reg_read(nic,
                                          NIC_QSET_RBDR_0_1_HEAD,
                                          qidx) >> 3;
        rbdr->tail = nicvf_queue_reg_read(nic,
                                          NIC_QSET_RBDR_0_1_TAIL,
                                          qidx) >> 3;

        /* If RBDR FIFO is in 'FAIL' state then do a reset first
         * before reclaiming.
         */
        fifo_state = nicvf_queue_reg_read(nic, NIC_QSET_RBDR_0_1_STATUS0, qidx);
        if (((fifo_state >> 62) & 0x03) == 0x3)
                nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_CFG,
                                      qidx, NICVF_RBDR_RESET);

        /* Disable RBDR */
        nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_CFG, qidx, 0);
        if (nicvf_poll_reg(nic, qidx, NIC_QSET_RBDR_0_1_STATUS0, 62, 2, 0x00))
                return;
        while (1) {
                tmp = nicvf_queue_reg_read(nic,
                                           NIC_QSET_RBDR_0_1_PREFETCH_STATUS,
                                           qidx);
                if ((tmp & 0xFFFFFFFF) == ((tmp >> 32) & 0xFFFFFFFF))
                        break;
                usleep_range(1000, 2000);
                timeout--;
                if (!timeout) {
                        netdev_err(nic->netdev,
                                   "Failed polling on prefetch status\n");
                        return;
                }
        }
        nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_CFG,
                              qidx, NICVF_RBDR_RESET);

        if (nicvf_poll_reg(nic, qidx, NIC_QSET_RBDR_0_1_STATUS0, 62, 2, 0x02))
                return;
        nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_CFG, qidx, 0x00);
        if (nicvf_poll_reg(nic, qidx, NIC_QSET_RBDR_0_1_STATUS0, 62, 2, 0x00))
                return;
}
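
/* Note on the prefetch-status poll above: the register packs two 32-bit
 * counts, and the loop waits until the halves match (i.e. no prefetched
 * descriptors remain in flight) before asserting RBDR reset. This
 * reading is inferred from the code, not from the hardware manual.
 */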

void nicvf_config_vlan_stripping(struct nicvf *nic, netdev_features_t features)
{
        u64 rq_cfg;
        int sqs;

        rq_cfg = nicvf_queue_reg_read(nic, NIC_QSET_RQ_GEN_CFG, 0);

        /* Enable first VLAN stripping */
        if (features & NETIF_F_HW_VLAN_CTAG_RX)
                rq_cfg |= (1ULL << 25);
        else
                rq_cfg &= ~(1ULL << 25);
        nicvf_queue_reg_write(nic, NIC_QSET_RQ_GEN_CFG, 0, rq_cfg);

        /* Configure Secondary Qsets, if any */
        for (sqs = 0; sqs < nic->sqs_count; sqs++)
                if (nic->snicvf[sqs])
                        nicvf_queue_reg_write(nic->snicvf[sqs],
                                              NIC_QSET_RQ_GEN_CFG, 0, rq_cfg);
}

static void nicvf_reset_rcv_queue_stats(struct nicvf *nic)
{
        union nic_mbx mbx = {};

        /* Reset all RQ/SQ and VF stats */
        mbx.reset_stat.msg = NIC_MBOX_MSG_RESET_STAT_COUNTER;
        mbx.reset_stat.rx_stat_mask = 0x3FFF;
        mbx.reset_stat.tx_stat_mask = 0x1F;
        mbx.reset_stat.rq_stat_mask = 0xFFFF;
        mbx.reset_stat.sq_stat_mask = 0xFFFF;
        nicvf_send_msg_to_pf(nic, &mbx);
}

/* Configures receive queue */
static void nicvf_rcv_queue_config(struct nicvf *nic, struct queue_set *qs,
                                   int qidx, bool enable)
{
        union nic_mbx mbx = {};
        struct rcv_queue *rq;
        struct rq_cfg rq_cfg;

        rq = &qs->rq[qidx];
        rq->enable = enable;

        /* Disable receive queue */
        nicvf_queue_reg_write(nic, NIC_QSET_RQ_0_7_CFG, qidx, 0);

        if (!rq->enable) {
                nicvf_reclaim_rcv_queue(nic, qs, qidx);
                xdp_rxq_info_unreg(&rq->xdp_rxq);
                return;
        }

        rq->cq_qs = qs->vnic_id;
        rq->cq_idx = qidx;
        rq->start_rbdr_qs = qs->vnic_id;
        rq->start_qs_rbdr_idx = qs->rbdr_cnt - 1;
        rq->cont_rbdr_qs = qs->vnic_id;
        rq->cont_qs_rbdr_idx = qs->rbdr_cnt - 1;
        /* All writes of RBDR data are to be loaded into L2 cache as well */
        rq->caching = 1;

        /* The driver has no proper error path for a failed XDP RX-queue
         * info registration.
         */
        WARN_ON(xdp_rxq_info_reg(&rq->xdp_rxq, nic->netdev, qidx) < 0);

        /* Send a mailbox msg to PF to config RQ */
        mbx.rq.msg = NIC_MBOX_MSG_RQ_CFG;
        mbx.rq.qs_num = qs->vnic_id;
        mbx.rq.rq_num = qidx;
        mbx.rq.cfg = ((u64)rq->caching << 26) | (rq->cq_qs << 19) |
                     (rq->cq_idx << 16) | (rq->cont_rbdr_qs << 9) |
                     (rq->cont_qs_rbdr_idx << 8) |
                     (rq->start_rbdr_qs << 1) | (rq->start_qs_rbdr_idx);
        nicvf_send_msg_to_pf(nic, &mbx);

        mbx.rq.msg = NIC_MBOX_MSG_RQ_BP_CFG;
        mbx.rq.cfg = BIT_ULL(63) | BIT_ULL(62) |
                     (RQ_PASS_RBDR_LVL << 16) | (RQ_PASS_CQ_LVL << 8) |
                     (qs->vnic_id << 0);
        nicvf_send_msg_to_pf(nic, &mbx);

        /* RQ drop config
         * Enable CQ drop to reserve sufficient CQEs for all tx packets
         */
        mbx.rq.msg = NIC_MBOX_MSG_RQ_DROP_CFG;
        mbx.rq.cfg = BIT_ULL(63) | BIT_ULL(62) |
                     (RQ_PASS_RBDR_LVL << 40) | (RQ_DROP_RBDR_LVL << 32) |
                     (RQ_PASS_CQ_LVL << 16) | (RQ_DROP_CQ_LVL << 8);
        nicvf_send_msg_to_pf(nic, &mbx);

        if (!nic->sqs_mode && (qidx == 0)) {
                /* Enable checking L3/L4 length and TCP/UDP checksums.
                 * Also allow IPv6 pkts with zero UDP checksum.
                 */
                nicvf_queue_reg_write(nic, NIC_QSET_RQ_GEN_CFG, 0,
                                      (BIT(24) | BIT(23) | BIT(21) | BIT(20)));
                nicvf_config_vlan_stripping(nic, nic->netdev->features);
        }

        /* Enable Receive queue */
        memset(&rq_cfg, 0, sizeof(struct rq_cfg));
        rq_cfg.ena = 1;
        rq_cfg.tcp_ena = 0;
        nicvf_queue_reg_write(nic, NIC_QSET_RQ_0_7_CFG, qidx, *(u64 *)&rq_cfg);
}

/* Configures completion queue */
void nicvf_cmp_queue_config(struct nicvf *nic, struct queue_set *qs,
                            int qidx, bool enable)
{
        struct cmp_queue *cq;
        struct cq_cfg cq_cfg;

        cq = &qs->cq[qidx];
        cq->enable = enable;

        if (!cq->enable) {
                nicvf_reclaim_cmp_queue(nic, qs, qidx);
                return;
        }

        /* Reset completion queue */
        nicvf_queue_reg_write(nic, NIC_QSET_CQ_0_7_CFG, qidx, NICVF_CQ_RESET);

        if (!cq->enable)
                return;

        spin_lock_init(&cq->lock);
        /* Set completion queue base address */
        nicvf_queue_reg_write(nic, NIC_QSET_CQ_0_7_BASE,
                              qidx, (u64)(cq->dmem.phys_base));

        /* Enable Completion queue */
        memset(&cq_cfg, 0, sizeof(struct cq_cfg));
        cq_cfg.ena = 1;
        cq_cfg.reset = 0;
        cq_cfg.caching = 0;
        cq_cfg.qsize = ilog2(qs->cq_len >> 10);
        cq_cfg.avg_con = 0;
        nicvf_queue_reg_write(nic, NIC_QSET_CQ_0_7_CFG, qidx, *(u64 *)&cq_cfg);

        /* Set threshold value for interrupt generation */
        nicvf_queue_reg_write(nic, NIC_QSET_CQ_0_7_THRESH, qidx, cq->thresh);
        nicvf_queue_reg_write(nic, NIC_QSET_CQ_0_7_CFG2,
                              qidx, CMP_QUEUE_TIMER_THRESH);
}
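
/* The 'qsize' field above encodes the ring length as a power of two in
 * units of 1K entries; e.g. (illustration) cq_len = 4096 gives
 * ilog2(4096 >> 10) = ilog2(4) = 2. nicvf_snd_queue_config() below uses
 * the same encoding for the send queue.
 */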

/* Configures transmit queue */
static void nicvf_snd_queue_config(struct nicvf *nic, struct queue_set *qs,
                                   int qidx, bool enable)
{
        union nic_mbx mbx = {};
        struct snd_queue *sq;
        struct sq_cfg sq_cfg;

        sq = &qs->sq[qidx];
        sq->enable = enable;

        if (!sq->enable) {
                nicvf_reclaim_snd_queue(nic, qs, qidx);
                return;
        }

        /* Reset send queue */
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_CFG, qidx, NICVF_SQ_RESET);

        sq->cq_qs = qs->vnic_id;
        sq->cq_idx = qidx;

        /* Send a mailbox msg to PF to config SQ */
        mbx.sq.msg = NIC_MBOX_MSG_SQ_CFG;
        mbx.sq.qs_num = qs->vnic_id;
        mbx.sq.sq_num = qidx;
        mbx.sq.sqs_mode = nic->sqs_mode;
        mbx.sq.cfg = (sq->cq_qs << 3) | sq->cq_idx;
        nicvf_send_msg_to_pf(nic, &mbx);

        /* Set queue base address */
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_BASE,
                              qidx, (u64)(sq->dmem.phys_base));

        /* Enable send queue & set queue size */
        memset(&sq_cfg, 0, sizeof(struct sq_cfg));
        sq_cfg.ena = 1;
        sq_cfg.reset = 0;
        sq_cfg.ldwb = 0;
        sq_cfg.qsize = ilog2(qs->sq_len >> 10);
        sq_cfg.tstmp_bgx_intf = 0;
        /* CQ's level at which HW will stop processing SQEs to avoid
         * transmitting a pkt with no space in CQ to post CQE_TX.
         */
        sq_cfg.cq_limit = (CMP_QUEUE_PIPELINE_RSVD * 256) / qs->cq_len;
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_CFG, qidx, *(u64 *)&sq_cfg);

        /* Set threshold value for interrupt generation */
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_THRESH, qidx, sq->thresh);

        /* Set queue:cpu affinity for better load distribution */
        if (cpu_online(qidx)) {
                cpumask_set_cpu(qidx, &sq->affinity_mask);
                netif_set_xps_queue(nic->netdev,
                                    &sq->affinity_mask, qidx);
        }
}

/* Configures receive buffer descriptor ring */
static void nicvf_rbdr_config(struct nicvf *nic, struct queue_set *qs,
                              int qidx, bool enable)
{
        struct rbdr *rbdr;
        struct rbdr_cfg rbdr_cfg;

        rbdr = &qs->rbdr[qidx];
        nicvf_reclaim_rbdr(nic, rbdr, qidx);
        if (!enable)
                return;

        /* Set descriptor base address */
        nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_BASE,
                              qidx, (u64)(rbdr->dmem.phys_base));

        /* Enable RBDR & set queue size */
        /* Buffer size should be in multiples of 128 bytes */
        memset(&rbdr_cfg, 0, sizeof(struct rbdr_cfg));
        rbdr_cfg.ena = 1;
        rbdr_cfg.reset = 0;
        rbdr_cfg.ldwb = 0;
        rbdr_cfg.qsize = RBDR_SIZE;
        rbdr_cfg.avg_con = 0;
        rbdr_cfg.lines = rbdr->dma_size / 128;
        nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_CFG,
                              qidx, *(u64 *)&rbdr_cfg);

        /* Notify HW */
        nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_DOOR,
                              qidx, qs->rbdr_len - 1);

        /* Set threshold value for interrupt generation */
        nicvf_queue_reg_write(nic, NIC_QSET_RBDR_0_1_THRESH,
                              qidx, rbdr->thresh - 1);
}

/* Requests PF to assign and enable Qset */
void nicvf_qset_config(struct nicvf *nic, bool enable)
{
        union nic_mbx mbx = {};
        struct queue_set *qs = nic->qs;
        struct qs_cfg *qs_cfg;

        if (!qs) {
                netdev_warn(nic->netdev,
                            "Qset is still not allocated, don't init queues\n");
                return;
        }

        qs->enable = enable;
        qs->vnic_id = nic->vf_id;

        /* Send a mailbox msg to PF to config Qset */
        mbx.qs.msg = NIC_MBOX_MSG_QS_CFG;
        mbx.qs.num = qs->vnic_id;
        mbx.qs.sqs_count = nic->sqs_count;

        mbx.qs.cfg = 0;
        qs_cfg = (struct qs_cfg *)&mbx.qs.cfg;
        if (qs->enable) {
                qs_cfg->ena = 1;
#ifdef __BIG_ENDIAN
                qs_cfg->be = 1;
#endif
                qs_cfg->vnic = qs->vnic_id;
                /* Enable Tx timestamping capability */
                if (nic->ptp_clock)
                        qs_cfg->send_tstmp_ena = 1;
        }
        nicvf_send_msg_to_pf(nic, &mbx);
}

static void nicvf_free_resources(struct nicvf *nic)
{
        int qidx;
        struct queue_set *qs = nic->qs;

        /* Free receive buffer descriptor ring */
        for (qidx = 0; qidx < qs->rbdr_cnt; qidx++)
                nicvf_free_rbdr(nic, &qs->rbdr[qidx]);

        /* Free completion queue */
        for (qidx = 0; qidx < qs->cq_cnt; qidx++)
                nicvf_free_cmp_queue(nic, &qs->cq[qidx]);

        /* Free send queue */
        for (qidx = 0; qidx < qs->sq_cnt; qidx++)
                nicvf_free_snd_queue(nic, &qs->sq[qidx]);
}

static int nicvf_alloc_resources(struct nicvf *nic)
{
        int qidx;
        struct queue_set *qs = nic->qs;

        /* Alloc receive buffer descriptor ring */
        for (qidx = 0; qidx < qs->rbdr_cnt; qidx++) {
                if (nicvf_init_rbdr(nic, &qs->rbdr[qidx], qs->rbdr_len,
                                    DMA_BUFFER_LEN))
                        goto alloc_fail;
        }

        /* Alloc send queue */
        for (qidx = 0; qidx < qs->sq_cnt; qidx++) {
                if (nicvf_init_snd_queue(nic, &qs->sq[qidx], qs->sq_len, qidx))
                        goto alloc_fail;
        }

        /* Alloc completion queue */
        for (qidx = 0; qidx < qs->cq_cnt; qidx++) {
                if (nicvf_init_cmp_queue(nic, &qs->cq[qidx], qs->cq_len))
                        goto alloc_fail;
        }

        return 0;
alloc_fail:
        nicvf_free_resources(nic);
        return -ENOMEM;
}

int nicvf_set_qset_resources(struct nicvf *nic)
{
        struct queue_set *qs;

        qs = devm_kzalloc(&nic->pdev->dev, sizeof(*qs), GFP_KERNEL);
        if (!qs)
                return -ENOMEM;
        nic->qs = qs;

        /* Set count of each queue */
        qs->rbdr_cnt = DEFAULT_RBDR_CNT;
        qs->rq_cnt = min_t(u8, MAX_RCV_QUEUES_PER_QS, num_online_cpus());
        qs->sq_cnt = min_t(u8, MAX_SND_QUEUES_PER_QS, num_online_cpus());
        qs->cq_cnt = max_t(u8, qs->rq_cnt, qs->sq_cnt);

        /* Set queue lengths */
        qs->rbdr_len = RCV_BUF_COUNT;
        qs->sq_len = SND_QUEUE_LEN;
        qs->cq_len = CMP_QUEUE_LEN;

        nic->rx_queues = qs->rq_cnt;
        nic->tx_queues = qs->sq_cnt;
        nic->xdp_tx_queues = 0;

        return 0;
}

int nicvf_config_data_transfer(struct nicvf *nic, bool enable)
{
        bool disable = false;
        struct queue_set *qs = nic->qs;
        struct queue_set *pqs = nic->pnicvf->qs;
        int qidx;

        if (!qs)
                return 0;

        /* Take primary VF's queue lengths.
         * This is needed to take queue lengths set from ethtool
         * into consideration.
         */
        if (nic->sqs_mode && pqs) {
                qs->cq_len = pqs->cq_len;
                qs->sq_len = pqs->sq_len;
        }

        if (enable) {
                if (nicvf_alloc_resources(nic))
                        return -ENOMEM;

                for (qidx = 0; qidx < qs->sq_cnt; qidx++)
                        nicvf_snd_queue_config(nic, qs, qidx, enable);
                for (qidx = 0; qidx < qs->cq_cnt; qidx++)
                        nicvf_cmp_queue_config(nic, qs, qidx, enable);
                for (qidx = 0; qidx < qs->rbdr_cnt; qidx++)
                        nicvf_rbdr_config(nic, qs, qidx, enable);
                for (qidx = 0; qidx < qs->rq_cnt; qidx++)
                        nicvf_rcv_queue_config(nic, qs, qidx, enable);
        } else {
                for (qidx = 0; qidx < qs->rq_cnt; qidx++)
                        nicvf_rcv_queue_config(nic, qs, qidx, disable);
                for (qidx = 0; qidx < qs->rbdr_cnt; qidx++)
                        nicvf_rbdr_config(nic, qs, qidx, disable);
                for (qidx = 0; qidx < qs->sq_cnt; qidx++)
                        nicvf_snd_queue_config(nic, qs, qidx, disable);
                for (qidx = 0; qidx < qs->cq_cnt; qidx++)
                        nicvf_cmp_queue_config(nic, qs, qidx, disable);

                nicvf_free_resources(nic);
        }

        /* Reset RXQ's stats.
         * SQ's stats will get reset automatically once SQ is reset.
         */
        nicvf_reset_rcv_queue_stats(nic);

        return 0;
}

/* Get a free descriptor from the SQ;
 * returns the descriptor number (index of the reserved slot)
 */
static inline int nicvf_get_sq_desc(struct snd_queue *sq, int desc_cnt)
{
        int qentry;

        qentry = sq->tail;
        if (!sq->is_xdp)
                atomic_sub(desc_cnt, &sq->free_cnt);
        else
                sq->xdp_free_cnt -= desc_cnt;
        sq->tail += desc_cnt;
        sq->tail &= (sq->dmem.q_len - 1);

        return qentry;
}
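
/* The tail update above relies on q_len being a power of two, so the
 * ring wraps with a plain AND instead of a conditional; e.g.
 * (illustration) q_len = 1024, tail = 1022, desc_cnt = 4 gives
 * (1022 + 4) & 1023 = 2.
 */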

/* Rollback to previous tail pointer when descriptors not used */
static inline void nicvf_rollback_sq_desc(struct snd_queue *sq,
                                          int qentry, int desc_cnt)
{
        sq->tail = qentry;
        atomic_add(desc_cnt, &sq->free_cnt);
}

/* Free descriptor back to SQ for future use */
void nicvf_put_sq_desc(struct snd_queue *sq, int desc_cnt)
{
        if (!sq->is_xdp)
                atomic_add(desc_cnt, &sq->free_cnt);
        else
                sq->xdp_free_cnt += desc_cnt;
        sq->head += desc_cnt;
        sq->head &= (sq->dmem.q_len - 1);
}

static inline int nicvf_get_nxt_sqentry(struct snd_queue *sq, int qentry)
{
        qentry++;
        qentry &= (sq->dmem.q_len - 1);
        return qentry;
}

void nicvf_sq_enable(struct nicvf *nic, struct snd_queue *sq, int qidx)
{
        u64 sq_cfg;

        sq_cfg = nicvf_queue_reg_read(nic, NIC_QSET_SQ_0_7_CFG, qidx);
        sq_cfg |= NICVF_SQ_EN;
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_CFG, qidx, sq_cfg);
        /* Ring doorbell so that H/W restarts processing SQEs */
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_DOOR, qidx, 0);
}

void nicvf_sq_disable(struct nicvf *nic, int qidx)
{
        u64 sq_cfg;

        sq_cfg = nicvf_queue_reg_read(nic, NIC_QSET_SQ_0_7_CFG, qidx);
        sq_cfg &= ~NICVF_SQ_EN;
        nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_CFG, qidx, sq_cfg);
}
1178*4882a593Smuzhiyun
nicvf_sq_free_used_descs(struct net_device * netdev,struct snd_queue * sq,int qidx)1179*4882a593Smuzhiyun void nicvf_sq_free_used_descs(struct net_device *netdev, struct snd_queue *sq,
1180*4882a593Smuzhiyun int qidx)
1181*4882a593Smuzhiyun {
1182*4882a593Smuzhiyun u64 head;
1183*4882a593Smuzhiyun struct sk_buff *skb;
1184*4882a593Smuzhiyun struct nicvf *nic = netdev_priv(netdev);
1185*4882a593Smuzhiyun struct sq_hdr_subdesc *hdr;
1186*4882a593Smuzhiyun
1187*4882a593Smuzhiyun head = nicvf_queue_reg_read(nic, NIC_QSET_SQ_0_7_HEAD, qidx) >> 4;
1188*4882a593Smuzhiyun while (sq->head != head) {
1189*4882a593Smuzhiyun hdr = (struct sq_hdr_subdesc *)GET_SQ_DESC(sq, sq->head);
1190*4882a593Smuzhiyun if (hdr->subdesc_type != SQ_DESC_TYPE_HEADER) {
1191*4882a593Smuzhiyun nicvf_put_sq_desc(sq, 1);
1192*4882a593Smuzhiyun continue;
1193*4882a593Smuzhiyun }
1194*4882a593Smuzhiyun skb = (struct sk_buff *)sq->skbuff[sq->head];
1195*4882a593Smuzhiyun if (skb)
1196*4882a593Smuzhiyun dev_kfree_skb_any(skb);
1197*4882a593Smuzhiyun atomic64_add(1, (atomic64_t *)&netdev->stats.tx_packets);
1198*4882a593Smuzhiyun atomic64_add(hdr->tot_len,
1199*4882a593Smuzhiyun (atomic64_t *)&netdev->stats.tx_bytes);
1200*4882a593Smuzhiyun nicvf_put_sq_desc(sq, hdr->subdesc_cnt + 1);
1201*4882a593Smuzhiyun }
1202*4882a593Smuzhiyun }
1203*4882a593Smuzhiyun
1204*4882a593Smuzhiyun /* XDP Transmit APIs */
nicvf_xdp_sq_doorbell(struct nicvf * nic,struct snd_queue * sq,int sq_num)1205*4882a593Smuzhiyun void nicvf_xdp_sq_doorbell(struct nicvf *nic,
1206*4882a593Smuzhiyun struct snd_queue *sq, int sq_num)
1207*4882a593Smuzhiyun {
1208*4882a593Smuzhiyun if (!sq->xdp_desc_cnt)
1209*4882a593Smuzhiyun return;
1210*4882a593Smuzhiyun
1211*4882a593Smuzhiyun /* make sure all memory stores are done before ringing doorbell */
1212*4882a593Smuzhiyun wmb();
1213*4882a593Smuzhiyun
	/* Inform HW to xmit the queued XDP frames */
	nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_DOOR,
			      sq_num, sq->xdp_desc_cnt);
	sq->xdp_desc_cnt = 0;
}

static inline void
nicvf_xdp_sq_add_hdr_subdesc(struct snd_queue *sq, int qentry,
			     int subdesc_cnt, u64 data, int len)
{
	struct sq_hdr_subdesc *hdr;

	hdr = (struct sq_hdr_subdesc *)GET_SQ_DESC(sq, qentry);
	memset(hdr, 0, SND_QUEUE_DESC_SIZE);
	hdr->subdesc_type = SQ_DESC_TYPE_HEADER;
	hdr->subdesc_cnt = subdesc_cnt;
	hdr->tot_len = len;
	hdr->post_cqe = 1;
	sq->xdp_page[qentry] = (u64)virt_to_page((void *)data);
}

int nicvf_xdp_sq_append_pkt(struct nicvf *nic, struct snd_queue *sq,
			    u64 bufaddr, u64 dma_addr, u16 len)
{
	int subdesc_cnt = MIN_SQ_DESC_PER_PKT_XMIT;
	int qentry;

	if (subdesc_cnt > sq->xdp_free_cnt)
		return 0;

	qentry = nicvf_get_sq_desc(sq, subdesc_cnt);

	nicvf_xdp_sq_add_hdr_subdesc(sq, qentry, subdesc_cnt - 1, bufaddr, len);

	qentry = nicvf_get_nxt_sqentry(sq, qentry);
	nicvf_sq_add_gather_subdesc(sq, qentry, len, dma_addr);

	sq->xdp_desc_cnt += subdesc_cnt;

	return 1;
}
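
/* Usage sketch (illustrative, not driver code): an XDP_TX caller with
 * hypothetical 'bufaddr', 'dma_addr' and 'len' in hand appends frames
 * and rings the doorbell once per batch:
 *
 *	if (nicvf_xdp_sq_append_pkt(nic, sq, bufaddr, dma_addr, len))
 *		nicvf_xdp_sq_doorbell(nic, sq, sq_num);
 */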

/* Calculate the number of SQ subdescriptors needed to transmit all
 * segments of this TSO packet.
 * Taken from 'Tilera network driver' with a minor modification.
 */
static int nicvf_tso_count_subdescs(struct sk_buff *skb)
{
	struct skb_shared_info *sh = skb_shinfo(skb);
	unsigned int sh_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
	unsigned int data_len = skb->len - sh_len;
	unsigned int p_len = sh->gso_size;
	long f_id = -1;	/* id of the current fragment */
	long f_size = skb_headlen(skb) - sh_len;  /* current fragment size */
	long f_used = 0;  /* bytes used from the current fragment */
	long n;  /* size of the current piece of payload */
	int num_edescs = 0;
	int segment;

	for (segment = 0; segment < sh->gso_segs; segment++) {
		unsigned int p_used = 0;

		/* One edesc for header and for each piece of the payload. */
		for (num_edescs++; p_used < p_len; num_edescs++) {
			/* Advance as needed. */
			while (f_used >= f_size) {
				f_id++;
				f_size = skb_frag_size(&sh->frags[f_id]);
				f_used = 0;
			}

			/* Use bytes from the current fragment. */
			n = p_len - p_used;
			if (n > f_size - f_used)
				n = f_size - f_used;
			f_used += n;
			p_used += n;
		}

		/* The last segment may be less than gso_size. */
		data_len -= p_len;
		if (data_len < p_len)
			p_len = data_len;
	}

	/* '+ gso_segs' for the SQ_HDR_SUBDESC of each segment */
	return num_edescs + sh->gso_segs;
}
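
/* Worked example (hypothetical skb): for 3 segments whose payload each
 * fits in one fragment, the loop counts one edesc for the header copy
 * plus one per payload piece per segment (num_edescs = 6), and
 * '+ gso_segs' adds the SQ_HDR_SUBDESC of each segment, returning 9.
 */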

#define POST_CQE_DESC_COUNT 2

/* Get the number of SQ descriptors needed to xmit this skb */
static int nicvf_sq_subdesc_required(struct nicvf *nic, struct sk_buff *skb)
{
	int subdesc_cnt = MIN_SQ_DESC_PER_PKT_XMIT;

	if (skb_shinfo(skb)->gso_size && !nic->hw_tso) {
		subdesc_cnt = nicvf_tso_count_subdescs(skb);
		return subdesc_cnt;
	}

	/* Dummy descriptors to get TSO pkt completion notification */
	if (nic->t88 && nic->hw_tso && skb_shinfo(skb)->gso_size)
		subdesc_cnt += POST_CQE_DESC_COUNT;

	if (skb_shinfo(skb)->nr_frags)
		subdesc_cnt += skb_shinfo(skb)->nr_frags;

	return subdesc_cnt;
}
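
/* Example counts (hypothetical skbs): a linear non-TSO skb needs the
 * MIN_SQ_DESC_PER_PKT_XMIT minimum; each page fragment adds one more;
 * and on 88xx with HW TSO a TSO skb needs POST_CQE_DESC_COUNT extra
 * dummy descriptors for the completion notification.
 */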

/* Add SQ HEADER subdescriptor.
 * First subdescriptor for every send descriptor.
 */
static inline void
nicvf_sq_add_hdr_subdesc(struct nicvf *nic, struct snd_queue *sq, int qentry,
			 int subdesc_cnt, struct sk_buff *skb, int len)
{
	int proto;
	struct sq_hdr_subdesc *hdr;
	union {
		struct iphdr *v4;
		struct ipv6hdr *v6;
		unsigned char *hdr;
	} ip;

	ip.hdr = skb_network_header(skb);
	hdr = (struct sq_hdr_subdesc *)GET_SQ_DESC(sq, qentry);
	memset(hdr, 0, SND_QUEUE_DESC_SIZE);
	hdr->subdesc_type = SQ_DESC_TYPE_HEADER;

	if (nic->t88 && nic->hw_tso && skb_shinfo(skb)->gso_size) {
		/* post_cqe = 0, to avoid HW posting a CQE for every TSO
		 * segment transmitted on 88xx.
		 */
		hdr->subdesc_cnt = subdesc_cnt - POST_CQE_DESC_COUNT;
	} else {
		sq->skbuff[qentry] = (u64)skb;
		/* Enable notification via CQE after processing SQE */
		hdr->post_cqe = 1;
		/* Number of subdescriptors following this one */
		hdr->subdesc_cnt = subdesc_cnt;
	}
	hdr->tot_len = len;

	/* Offload checksum calculation to HW */
	if (skb->ip_summed == CHECKSUM_PARTIAL) {
		if (ip.v4->version == 4)
			hdr->csum_l3 = 1;	/* Enable IP csum calculation */
		hdr->l3_offset = skb_network_offset(skb);
		hdr->l4_offset = skb_transport_offset(skb);

		proto = (ip.v4->version == 4) ? ip.v4->protocol :
			ip.v6->nexthdr;

		switch (proto) {
		case IPPROTO_TCP:
			hdr->csum_l4 = SEND_L4_CSUM_TCP;
			break;
		case IPPROTO_UDP:
			hdr->csum_l4 = SEND_L4_CSUM_UDP;
			break;
		case IPPROTO_SCTP:
			hdr->csum_l4 = SEND_L4_CSUM_SCTP;
			break;
		}
	}

	if (nic->hw_tso && skb_shinfo(skb)->gso_size) {
		hdr->tso = 1;
		hdr->tso_start = skb_transport_offset(skb) + tcp_hdrlen(skb);
		hdr->tso_max_paysize = skb_shinfo(skb)->gso_size;
		/* For non-tunneled pkts, point this to L2 ethertype */
		hdr->inner_l3_offset = skb_network_offset(skb) - 2;
		this_cpu_inc(nic->pnicvf->drv_stats->tx_tso);
	}

	/* Check if timestamp is requested */
	if (!(skb_shinfo(skb)->tx_flags & SKBTX_HW_TSTAMP)) {
		skb_tx_timestamp(skb);
		return;
	}

	/* Tx timestamping not supported along with TSO, so ignore request */
	if (skb_shinfo(skb)->gso_size)
		return;

	/* HW supports only a single outstanding packet to timestamp */
	if (!atomic_add_unless(&nic->pnicvf->tx_ptp_skbs, 1, 1))
		return;

	/* Mark the SKB for later reference */
	skb_shinfo(skb)->tx_flags |= SKBTX_IN_PROGRESS;

	/* Finally enable timestamp generation.
	 * Since 'post_cqe' is also set, two CQEs will be posted
	 * for this packet, i.e. CQE_TYPE_SEND and CQE_TYPE_SEND_PTP.
	 */
	hdr->tstmp = 1;
}

/* SQ GATHER subdescriptor
 * Must follow HDR descriptor
 */
static inline void nicvf_sq_add_gather_subdesc(struct snd_queue *sq, int qentry,
					       int size, u64 data)
{
	struct sq_gather_subdesc *gather;

	qentry &= (sq->dmem.q_len - 1);
	gather = (struct sq_gather_subdesc *)GET_SQ_DESC(sq, qentry);

	memset(gather, 0, SND_QUEUE_DESC_SIZE);
	gather->subdesc_type = SQ_DESC_TYPE_GATHER;
	gather->ld_type = NIC_SEND_LD_TYPE_E_LDD;
	gather->size = size;
	gather->addr = data;
}

/* Add HDR + IMMEDIATE subdescriptors right after descriptors of a TSO
 * packet so that a CQE is posted as a notification for transmission of
 * the TSO packet.
 */
static inline void nicvf_sq_add_cqe_subdesc(struct snd_queue *sq, int qentry,
					    int tso_sqe, struct sk_buff *skb)
{
	struct sq_imm_subdesc *imm;
	struct sq_hdr_subdesc *hdr;

	sq->skbuff[qentry] = (u64)skb;

	hdr = (struct sq_hdr_subdesc *)GET_SQ_DESC(sq, qentry);
	memset(hdr, 0, SND_QUEUE_DESC_SIZE);
	hdr->subdesc_type = SQ_DESC_TYPE_HEADER;
	/* Enable notification via CQE after processing SQE */
	hdr->post_cqe = 1;
	/* There is no packet to transmit here */
	hdr->dont_send = 1;
	hdr->subdesc_cnt = POST_CQE_DESC_COUNT - 1;
	hdr->tot_len = 1;
	/* Actual TSO header SQE index, needed for cleanup */
	hdr->rsvd2 = tso_sqe;

	qentry = nicvf_get_nxt_sqentry(sq, qentry);
	imm = (struct sq_imm_subdesc *)GET_SQ_DESC(sq, qentry);
	memset(imm, 0, SND_QUEUE_DESC_SIZE);
	imm->subdesc_type = SQ_DESC_TYPE_IMMEDIATE;
	imm->len = 1;
}
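
/* The pair built above is exactly POST_CQE_DESC_COUNT descriptors: a
 * HEADER with dont_send = 1 and post_cqe = 1, followed by a dummy
 * IMMEDIATE subdescriptor, with the real TSO header's SQE index kept
 * in rsvd2 so cleanup can locate the descriptor chain it refers to.
 */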

static inline void nicvf_sq_doorbell(struct nicvf *nic, struct sk_buff *skb,
				     int sq_num, int desc_cnt)
{
	struct netdev_queue *txq;

	txq = netdev_get_tx_queue(nic->pnicvf->netdev,
				  skb_get_queue_mapping(skb));

	netdev_tx_sent_queue(txq, skb->len);

	/* make sure all memory stores are done before ringing doorbell */
	smp_wmb();

	/* Inform HW to xmit the queued descriptors */
	nicvf_queue_reg_write(nic, NIC_QSET_SQ_0_7_DOOR,
			      sq_num, desc_cnt);
}

/* Segment a TSO packet into 'gso_size' segments and append
 * them to SQ for transfer
 */
static int nicvf_sq_append_tso(struct nicvf *nic, struct snd_queue *sq,
			       int sq_num, int qentry, struct sk_buff *skb)
{
	struct tso_t tso;
	int seg_subdescs = 0, desc_cnt = 0;
	int seg_len, total_len, data_left;
	int hdr_qentry = qentry;
	int hdr_len;

	hdr_len = tso_start(skb, &tso);

	total_len = skb->len - hdr_len;
	while (total_len > 0) {
		char *hdr;

		/* Save Qentry for adding HDR_SUBDESC at the end */
		hdr_qentry = qentry;

		data_left = min_t(int, skb_shinfo(skb)->gso_size, total_len);
		total_len -= data_left;

		/* Add segment's header */
		qentry = nicvf_get_nxt_sqentry(sq, qentry);
		hdr = sq->tso_hdrs + qentry * TSO_HEADER_SIZE;
		tso_build_hdr(skb, hdr, &tso, data_left, total_len == 0);
		nicvf_sq_add_gather_subdesc(sq, qentry, hdr_len,
					    sq->tso_hdrs_phys +
					    qentry * TSO_HEADER_SIZE);
		/* HDR_SUBDESC + GATHER */
		seg_subdescs = 2;
		seg_len = hdr_len;

		/* Add segment's payload fragments */
		while (data_left > 0) {
			int size;

			size = min_t(int, tso.size, data_left);

			qentry = nicvf_get_nxt_sqentry(sq, qentry);
			nicvf_sq_add_gather_subdesc(sq, qentry, size,
						    virt_to_phys(tso.data));
			seg_subdescs++;
			seg_len += size;

			data_left -= size;
			tso_build_data(skb, &tso, size);
		}
		nicvf_sq_add_hdr_subdesc(nic, sq, hdr_qentry,
					 seg_subdescs - 1, skb, seg_len);
		sq->skbuff[hdr_qentry] = (u64)NULL;
		qentry = nicvf_get_nxt_sqentry(sq, qentry);

		desc_cnt += seg_subdescs;
	}
	/* Save SKB in the last segment for freeing */
	sq->skbuff[hdr_qentry] = (u64)skb;

	nicvf_sq_doorbell(nic, skb, sq_num, desc_cnt);

	this_cpu_inc(nic->pnicvf->drv_stats->tx_tso);
	return 1;
}
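
/* Per-segment descriptor layout produced by the loop above (software
 * TSO):
 *
 *	HDR_SUBDESC               (written last, at hdr_qentry)
 *	GATHER -> tso_hdrs slot   (headers rebuilt for this segment)
 *	GATHER -> payload piece   (one per fragment piece consumed)
 *
 * Only the last segment's HDR slot keeps the skb pointer, so the skb
 * is freed exactly once, when the final segment completes.
 */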

/* Append an skb to a SQ for packet transfer. */
int nicvf_sq_append_skb(struct nicvf *nic, struct snd_queue *sq,
			struct sk_buff *skb, u8 sq_num)
{
	int i, size;
	int subdesc_cnt, hdr_sqe = 0;
	int qentry;
	u64 dma_addr;

	subdesc_cnt = nicvf_sq_subdesc_required(nic, skb);
	if (subdesc_cnt > atomic_read(&sq->free_cnt))
		goto append_fail;

	qentry = nicvf_get_sq_desc(sq, subdesc_cnt);

	/* Check if it's a TSO packet */
	if (skb_shinfo(skb)->gso_size && !nic->hw_tso)
		return nicvf_sq_append_tso(nic, sq, sq_num, qentry, skb);

	/* Add SQ header subdesc */
	nicvf_sq_add_hdr_subdesc(nic, sq, qentry, subdesc_cnt - 1,
				 skb, skb->len);
	hdr_sqe = qentry;

	/* Add SQ gather subdescs */
	qentry = nicvf_get_nxt_sqentry(sq, qentry);
	size = skb_is_nonlinear(skb) ? skb_headlen(skb) : skb->len;
	/* HW will ensure data coherency, CPU sync not required */
	dma_addr = dma_map_page_attrs(&nic->pdev->dev, virt_to_page(skb->data),
				      offset_in_page(skb->data), size,
				      DMA_TO_DEVICE, DMA_ATTR_SKIP_CPU_SYNC);
	if (dma_mapping_error(&nic->pdev->dev, dma_addr)) {
		nicvf_rollback_sq_desc(sq, qentry, subdesc_cnt);
		return 0;
	}

	nicvf_sq_add_gather_subdesc(sq, qentry, size, dma_addr);

	/* Check for scattered buffer */
	if (!skb_is_nonlinear(skb))
		goto doorbell;

	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
		const skb_frag_t *frag = &skb_shinfo(skb)->frags[i];

		qentry = nicvf_get_nxt_sqentry(sq, qentry);
		size = skb_frag_size(frag);
		dma_addr = dma_map_page_attrs(&nic->pdev->dev,
					      skb_frag_page(frag),
					      skb_frag_off(frag), size,
					      DMA_TO_DEVICE,
					      DMA_ATTR_SKIP_CPU_SYNC);
		if (dma_mapping_error(&nic->pdev->dev, dma_addr)) {
			/* Free the entire chain of buffers mapped so far:
			 * 'i' frags plus the skb->data buffer mapped above.
			 */
			nicvf_unmap_sndq_buffers(nic, sq, hdr_sqe, i);
			nicvf_rollback_sq_desc(sq, qentry, subdesc_cnt);
			return 0;
		}
		nicvf_sq_add_gather_subdesc(sq, qentry, size, dma_addr);
	}

doorbell:
	if (nic->t88 && skb_shinfo(skb)->gso_size) {
		qentry = nicvf_get_nxt_sqentry(sq, qentry);
		nicvf_sq_add_cqe_subdesc(sq, qentry, hdr_sqe, skb);
	}

	nicvf_sq_doorbell(nic, skb, sq_num, subdesc_cnt);

	return 1;

append_fail:
	/* Use original PCI dev for debug log */
	nic = nic->pnicvf;
	netdev_dbg(nic->netdev, "Not enough SQ descriptors to xmit pkt\n");
	return 0;
}
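
/* Usage sketch (illustrative, not driver code): the xmit path checks
 * the return value and stops the queue when 0 is returned, e.g. with
 * a hypothetical 'txq' in hand:
 *
 *	if (!nicvf_sq_append_skb(nic, sq, skb, sq_num))
 *		netif_tx_stop_queue(txq);
 *
 * A return of 0 means either too few free descriptors or a DMA
 * mapping failure; in the latter case the reserved slots are released
 * again via nicvf_rollback_sq_desc().
 */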

static inline unsigned frag_num(unsigned i)
{
#ifdef __BIG_ENDIAN
	return (i & ~3) + 3 - (i & 3);
#else
	return i;
#endif
}
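
/* Worked example: on a big-endian kernel frag_num() swaps each group
 * of four indices, so 0,1,2,3 map to 3,2,1,0 and 4,5,6,7 map to
 * 7,6,5,4, compensating for the little-endian layout of the u16
 * rb_lens[] words inside the CQE.
 */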

static void nicvf_unmap_rcv_buffer(struct nicvf *nic, u64 dma_addr,
				   u64 buf_addr, bool xdp)
{
	struct page *page = NULL;
	int len = RCV_FRAG_LEN;

	if (xdp) {
		page = virt_to_page(phys_to_virt(buf_addr));
		/* Check if it's a recycled page; if so, skip the DMA
		 * unmapping.
		 *
		 * A recycled page holds an extra reference.
		 */
		if (page_ref_count(page) != 1)
			return;

		len += XDP_PACKET_HEADROOM;
		/* Receive buffers in XDP mode are mapped from page start */
		dma_addr &= PAGE_MASK;
	}
	dma_unmap_page_attrs(&nic->pdev->dev, dma_addr, len,
			     DMA_FROM_DEVICE, DMA_ATTR_SKIP_CPU_SYNC);
}

/* Returns SKB for a received packet */
struct sk_buff *nicvf_get_rcv_skb(struct nicvf *nic,
				  struct cqe_rx_t *cqe_rx, bool xdp)
{
	int frag;
	int payload_len = 0;
	struct sk_buff *skb = NULL;
	struct page *page;
	int offset;
	u16 *rb_lens = NULL;
	u64 *rb_ptrs = NULL;
	u64 phys_addr;

	rb_lens = (void *)cqe_rx + (3 * sizeof(u64));
	/* Except on 88xx pass1, all chips append CQE_RX2_S to CQE_RX at
	 * word6, so the buffer pointers move up by one word.
	 *
	 * Reuse the existing 'hw_tso' flag, which is set on all chips
	 * except 88xx pass1, instead of taking an additional cache line
	 * access (or miss) to read the PCI dev's revision.
	 */
	if (!nic->hw_tso)
		rb_ptrs = (void *)cqe_rx + (6 * sizeof(u64));
	else
		rb_ptrs = (void *)cqe_rx + (7 * sizeof(u64));

	for (frag = 0; frag < cqe_rx->rb_cnt; frag++) {
		payload_len = rb_lens[frag_num(frag)];
		phys_addr = nicvf_iova_to_phys(nic, *rb_ptrs);
		if (!phys_addr) {
			if (skb)
				dev_kfree_skb_any(skb);
			return NULL;
		}

		if (!frag) {
			/* First fragment */
			nicvf_unmap_rcv_buffer(nic,
					       *rb_ptrs - cqe_rx->align_pad,
					       phys_addr, xdp);
			skb = nicvf_rb_ptr_to_skb(nic,
						  phys_addr - cqe_rx->align_pad,
						  payload_len);
			if (!skb)
				return NULL;
			skb_reserve(skb, cqe_rx->align_pad);
			skb_put(skb, payload_len);
		} else {
			/* Add fragments */
			nicvf_unmap_rcv_buffer(nic, *rb_ptrs, phys_addr, xdp);
			page = virt_to_page(phys_to_virt(phys_addr));
			offset = phys_to_virt(phys_addr) - page_address(page);
			skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags, page,
					offset, payload_len, RCV_FRAG_LEN);
		}
		/* Next buffer pointer */
		rb_ptrs++;
	}
	return skb;
}

static u64 nicvf_int_type_to_mask(int int_type, int q_idx)
{
	u64 reg_val;

	switch (int_type) {
	case NICVF_INTR_CQ:
		reg_val = ((1ULL << q_idx) << NICVF_INTR_CQ_SHIFT);
		break;
	case NICVF_INTR_SQ:
		reg_val = ((1ULL << q_idx) << NICVF_INTR_SQ_SHIFT);
		break;
	case NICVF_INTR_RBDR:
		reg_val = ((1ULL << q_idx) << NICVF_INTR_RBDR_SHIFT);
		break;
	case NICVF_INTR_PKT_DROP:
		reg_val = (1ULL << NICVF_INTR_PKT_DROP_SHIFT);
		break;
	case NICVF_INTR_TCP_TIMER:
		reg_val = (1ULL << NICVF_INTR_TCP_TIMER_SHIFT);
		break;
	case NICVF_INTR_MBOX:
		reg_val = (1ULL << NICVF_INTR_MBOX_SHIFT);
		break;
	case NICVF_INTR_QS_ERR:
		reg_val = (1ULL << NICVF_INTR_QS_ERR_SHIFT);
		break;
	default:
		reg_val = 0;
	}

	return reg_val;
}
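
/* Example: nicvf_int_type_to_mask(NICVF_INTR_CQ, 2) yields
 * 1ULL << (NICVF_INTR_CQ_SHIFT + 2), the per-queue bit for completion
 * queue 2 in the NIC_VF_ENA_W1S/W1C interrupt registers used below.
 */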

/* Enable interrupt */
void nicvf_enable_intr(struct nicvf *nic, int int_type, int q_idx)
{
	u64 mask = nicvf_int_type_to_mask(int_type, q_idx);

	if (!mask) {
		netdev_dbg(nic->netdev,
			   "Failed to enable interrupt: unknown type\n");
		return;
	}
	nicvf_reg_write(nic, NIC_VF_ENA_W1S,
			nicvf_reg_read(nic, NIC_VF_ENA_W1S) | mask);
}

/* Disable interrupt */
void nicvf_disable_intr(struct nicvf *nic, int int_type, int q_idx)
{
	u64 mask = nicvf_int_type_to_mask(int_type, q_idx);

	if (!mask) {
		netdev_dbg(nic->netdev,
			   "Failed to disable interrupt: unknown type\n");
		return;
	}

	nicvf_reg_write(nic, NIC_VF_ENA_W1C, mask);
}

/* Clear interrupt */
void nicvf_clear_intr(struct nicvf *nic, int int_type, int q_idx)
{
	u64 mask = nicvf_int_type_to_mask(int_type, q_idx);

	if (!mask) {
		netdev_dbg(nic->netdev,
			   "Failed to clear interrupt: unknown type\n");
		return;
	}

	nicvf_reg_write(nic, NIC_VF_INT, mask);
}

/* Check if interrupt is enabled */
int nicvf_is_intr_enabled(struct nicvf *nic, int int_type, int q_idx)
{
	u64 mask = nicvf_int_type_to_mask(int_type, q_idx);
	/* If the interrupt type is unknown, treat it as disabled. */
	if (!mask) {
		netdev_dbg(nic->netdev,
			   "Failed to check interrupt enable: unknown type\n");
		return 0;
	}

	return mask & nicvf_reg_read(nic, NIC_VF_ENA_W1S);
}

void nicvf_update_rq_stats(struct nicvf *nic, int rq_idx)
{
	struct rcv_queue *rq;

#define GET_RQ_STATS(reg) \
	nicvf_reg_read(nic, NIC_QSET_RQ_0_7_STAT_0_1 |\
			    (rq_idx << NIC_Q_NUM_SHIFT) | (reg << 3))

	rq = &nic->qs->rq[rq_idx];
	rq->stats.bytes = GET_RQ_STATS(RQ_SQ_STATS_OCTS);
	rq->stats.pkts = GET_RQ_STATS(RQ_SQ_STATS_PKTS);
}
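
/* The GET_RQ_STATS() macro above (and GET_SQ_STATS() below) composes
 * the register address as
 *
 *	base | (queue_index << NIC_Q_NUM_SHIFT) | (stat_index << 3)
 *
 * i.e. consecutive 8-byte stat registers per queue, where
 * RQ_SQ_STATS_OCTS and RQ_SQ_STATS_PKTS select the octet and packet
 * counters.
 */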

void nicvf_update_sq_stats(struct nicvf *nic, int sq_idx)
{
	struct snd_queue *sq;

#define GET_SQ_STATS(reg) \
	nicvf_reg_read(nic, NIC_QSET_SQ_0_7_STAT_0_1 |\
			    (sq_idx << NIC_Q_NUM_SHIFT) | (reg << 3))

	sq = &nic->qs->sq[sq_idx];
	sq->stats.bytes = GET_SQ_STATS(RQ_SQ_STATS_OCTS);
	sq->stats.pkts = GET_SQ_STATS(RQ_SQ_STATS_PKTS);
}

/* Check for errors in the receive completion queue entry */
int nicvf_check_cqe_rx_errs(struct nicvf *nic, struct cqe_rx_t *cqe_rx)
{
	netif_err(nic, rx_err, nic->netdev,
		  "RX error CQE err_level 0x%x err_opcode 0x%x\n",
		  cqe_rx->err_level, cqe_rx->err_opcode);

	switch (cqe_rx->err_opcode) {
	case CQ_RX_ERROP_RE_PARTIAL:
		this_cpu_inc(nic->drv_stats->rx_bgx_truncated_pkts);
		break;
	case CQ_RX_ERROP_RE_JABBER:
		this_cpu_inc(nic->drv_stats->rx_jabber_errs);
		break;
	case CQ_RX_ERROP_RE_FCS:
		this_cpu_inc(nic->drv_stats->rx_fcs_errs);
		break;
	case CQ_RX_ERROP_RE_RX_CTL:
		this_cpu_inc(nic->drv_stats->rx_bgx_errs);
		break;
	case CQ_RX_ERROP_PREL2_ERR:
		this_cpu_inc(nic->drv_stats->rx_prel2_errs);
		break;
	case CQ_RX_ERROP_L2_MAL:
		this_cpu_inc(nic->drv_stats->rx_l2_hdr_malformed);
		break;
	case CQ_RX_ERROP_L2_OVERSIZE:
		this_cpu_inc(nic->drv_stats->rx_oversize);
		break;
	case CQ_RX_ERROP_L2_UNDERSIZE:
		this_cpu_inc(nic->drv_stats->rx_undersize);
		break;
	case CQ_RX_ERROP_L2_LENMISM:
		this_cpu_inc(nic->drv_stats->rx_l2_len_mismatch);
		break;
	case CQ_RX_ERROP_L2_PCLP:
		this_cpu_inc(nic->drv_stats->rx_l2_pclp);
		break;
	case CQ_RX_ERROP_IP_NOT:
		this_cpu_inc(nic->drv_stats->rx_ip_ver_errs);
		break;
	case CQ_RX_ERROP_IP_CSUM_ERR:
		this_cpu_inc(nic->drv_stats->rx_ip_csum_errs);
		break;
	case CQ_RX_ERROP_IP_MAL:
		this_cpu_inc(nic->drv_stats->rx_ip_hdr_malformed);
		break;
	case CQ_RX_ERROP_IP_MALD:
		this_cpu_inc(nic->drv_stats->rx_ip_payload_malformed);
		break;
	case CQ_RX_ERROP_IP_HOP:
		this_cpu_inc(nic->drv_stats->rx_ip_ttl_errs);
		break;
	case CQ_RX_ERROP_L3_PCLP:
		this_cpu_inc(nic->drv_stats->rx_l3_pclp);
		break;
	case CQ_RX_ERROP_L4_MAL:
		this_cpu_inc(nic->drv_stats->rx_l4_malformed);
		break;
	case CQ_RX_ERROP_L4_CHK:
		this_cpu_inc(nic->drv_stats->rx_l4_csum_errs);
		break;
	case CQ_RX_ERROP_UDP_LEN:
		this_cpu_inc(nic->drv_stats->rx_udp_len_errs);
		break;
	case CQ_RX_ERROP_L4_PORT:
		this_cpu_inc(nic->drv_stats->rx_l4_port_errs);
		break;
	case CQ_RX_ERROP_TCP_FLAG:
		this_cpu_inc(nic->drv_stats->rx_tcp_flag_errs);
		break;
	case CQ_RX_ERROP_TCP_OFFSET:
		this_cpu_inc(nic->drv_stats->rx_tcp_offset_errs);
		break;
	case CQ_RX_ERROP_L4_PCLP:
		this_cpu_inc(nic->drv_stats->rx_l4_pclp);
		break;
	case CQ_RX_ERROP_RBDR_TRUNC:
		this_cpu_inc(nic->drv_stats->rx_truncated_pkts);
		break;
	}

	return 1;
}

/* Check for errors in the send completion queue entry */
int nicvf_check_cqe_tx_errs(struct nicvf *nic, struct cqe_send_t *cqe_tx)
{
	switch (cqe_tx->send_status) {
	case CQ_TX_ERROP_DESC_FAULT:
		this_cpu_inc(nic->drv_stats->tx_desc_fault);
		break;
	case CQ_TX_ERROP_HDR_CONS_ERR:
		this_cpu_inc(nic->drv_stats->tx_hdr_cons_err);
		break;
	case CQ_TX_ERROP_SUBDC_ERR:
		this_cpu_inc(nic->drv_stats->tx_subdesc_err);
		break;
	case CQ_TX_ERROP_MAX_SIZE_VIOL:
		this_cpu_inc(nic->drv_stats->tx_max_size_exceeded);
		break;
	case CQ_TX_ERROP_IMM_SIZE_OFLOW:
		this_cpu_inc(nic->drv_stats->tx_imm_size_oflow);
		break;
	case CQ_TX_ERROP_DATA_SEQUENCE_ERR:
		this_cpu_inc(nic->drv_stats->tx_data_seq_err);
		break;
	case CQ_TX_ERROP_MEM_SEQUENCE_ERR:
		this_cpu_inc(nic->drv_stats->tx_mem_seq_err);
		break;
	case CQ_TX_ERROP_LOCK_VIOL:
		this_cpu_inc(nic->drv_stats->tx_lock_viol);
		break;
	case CQ_TX_ERROP_DATA_FAULT:
		this_cpu_inc(nic->drv_stats->tx_data_fault);
		break;
	case CQ_TX_ERROP_TSTMP_CONFLICT:
		this_cpu_inc(nic->drv_stats->tx_tstmp_conflict);
		break;
	case CQ_TX_ERROP_TSTMP_TIMEOUT:
		this_cpu_inc(nic->drv_stats->tx_tstmp_timeout);
		break;
	case CQ_TX_ERROP_MEM_FAULT:
		this_cpu_inc(nic->drv_stats->tx_mem_fault);
		break;
	case CQ_TX_ERROP_CK_OVERLAP:
		this_cpu_inc(nic->drv_stats->tx_csum_overlap);
		break;
	case CQ_TX_ERROP_CK_OFLOW:
		this_cpu_inc(nic->drv_stats->tx_csum_overflow);
		break;
	}

	return 1;
}