1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Copyright(c) 2017 - 2020 Intel Corporation.
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * This file is provided under a dual BSD/GPLv2 license. When using or
5*4882a593Smuzhiyun * redistributing this file, you may do so under either license.
6*4882a593Smuzhiyun *
7*4882a593Smuzhiyun * GPL LICENSE SUMMARY
8*4882a593Smuzhiyun *
9*4882a593Smuzhiyun * This program is free software; you can redistribute it and/or modify
10*4882a593Smuzhiyun * it under the terms of version 2 of the GNU General Public License as
11*4882a593Smuzhiyun * published by the Free Software Foundation.
12*4882a593Smuzhiyun *
13*4882a593Smuzhiyun * This program is distributed in the hope that it will be useful, but
14*4882a593Smuzhiyun * WITHOUT ANY WARRANTY; without even the implied warranty of
15*4882a593Smuzhiyun * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16*4882a593Smuzhiyun * General Public License for more details.
17*4882a593Smuzhiyun *
18*4882a593Smuzhiyun * BSD LICENSE
19*4882a593Smuzhiyun *
20*4882a593Smuzhiyun * Redistribution and use in source and binary forms, with or without
21*4882a593Smuzhiyun * modification, are permitted provided that the following conditions
22*4882a593Smuzhiyun * are met:
23*4882a593Smuzhiyun *
24*4882a593Smuzhiyun * - Redistributions of source code must retain the above copyright
25*4882a593Smuzhiyun * notice, this list of conditions and the following disclaimer.
26*4882a593Smuzhiyun * - Redistributions in binary form must reproduce the above copyright
27*4882a593Smuzhiyun * notice, this list of conditions and the following disclaimer in
28*4882a593Smuzhiyun * the documentation and/or other materials provided with the
29*4882a593Smuzhiyun * distribution.
30*4882a593Smuzhiyun * - Neither the name of Intel Corporation nor the names of its
31*4882a593Smuzhiyun * contributors may be used to endorse or promote products derived
32*4882a593Smuzhiyun * from this software without specific prior written permission.
33*4882a593Smuzhiyun *
34*4882a593Smuzhiyun * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
35*4882a593Smuzhiyun * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
36*4882a593Smuzhiyun * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
37*4882a593Smuzhiyun * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
38*4882a593Smuzhiyun * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
39*4882a593Smuzhiyun * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
40*4882a593Smuzhiyun * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
41*4882a593Smuzhiyun * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
42*4882a593Smuzhiyun * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
43*4882a593Smuzhiyun * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
44*4882a593Smuzhiyun * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
45*4882a593Smuzhiyun *
46*4882a593Smuzhiyun */
47*4882a593Smuzhiyun
48*4882a593Smuzhiyun /*
49*4882a593Smuzhiyun * This file contains HFI1 support for VNIC functionality
50*4882a593Smuzhiyun */
51*4882a593Smuzhiyun
52*4882a593Smuzhiyun #include <linux/io.h>
53*4882a593Smuzhiyun #include <linux/if_vlan.h>
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun #include "vnic.h"
56*4882a593Smuzhiyun #include "netdev.h"
57*4882a593Smuzhiyun
/* Transmit watchdog timeout in milliseconds; converted to jiffies for netdev->watchdog_timeo. */
58*4882a593Smuzhiyun #define HFI_TX_TIMEOUT_MS 1000
59*4882a593Smuzhiyun
/* NOTE(review): not referenced in the visible part of this file; presumably a receive queue depth - confirm. */
60*4882a593Smuzhiyun #define HFI1_VNIC_RCV_Q_SIZE 1024
61*4882a593Smuzhiyun
/* Bit number in vinfo->flags that is set while the vport is up. */
62*4882a593Smuzhiyun #define HFI1_VNIC_UP 0
63*4882a593Smuzhiyun
/* Held around the rx_nohandler increment on the fallback vport in hfi1_vnic_bypass_rcv(). */
64*4882a593Smuzhiyun static DEFINE_SPINLOCK(vport_cntr_lock);
65*4882a593Smuzhiyun
/*
 * SUM_GRP_COUNTERS - add one group of per-queue counters to a running total
 * @stats:  pointer to the destination statistics structure
 * @qstats: pointer to the per-queue source statistics structure
 * @x_grp:  name of the counter-group member to sum (tx_grp or rx_grp)
 *
 * Walks the counters of the group as u64 values, from ->unicast up to and
 * including ->s_1519_max, adding each source counter to the matching
 * destination counter. This assumes every member between those two fields
 * is a u64 and that they are laid out back to back.
 *
 * The pointer arguments are parenthesised so that expressions such as
 * &local_struct expand correctly.
 */
#define SUM_GRP_COUNTERS(stats, qstats, x_grp) do {			\
		u64 *src64, *dst64;					\
		for (src64 = &(qstats)->x_grp.unicast,			\
		     dst64 = &(stats)->x_grp.unicast;			\
		     dst64 <= &(stats)->x_grp.s_1519_max;) {		\
			*dst64++ += *src64++;				\
		}							\
	} while (0)
74*4882a593Smuzhiyun
/* Only the low 8 bits of a value are kept when building a VNIC id. */
75*4882a593Smuzhiyun #define VNIC_MASK (0xFF)
/* Id passed to the hfi1_netdev_*_data() calls in this file: bit 24 set, ORed with the masked value. */
76*4882a593Smuzhiyun #define VNIC_ID(val) ((1ull << 24) | ((val) & VNIC_MASK))
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun /* hfi1_vnic_update_stats - update statistics */
hfi1_vnic_update_stats(struct hfi1_vnic_vport_info * vinfo,struct opa_vnic_stats * stats)79*4882a593Smuzhiyun static void hfi1_vnic_update_stats(struct hfi1_vnic_vport_info *vinfo,
80*4882a593Smuzhiyun struct opa_vnic_stats *stats)
81*4882a593Smuzhiyun {
82*4882a593Smuzhiyun struct net_device *netdev = vinfo->netdev;
83*4882a593Smuzhiyun u8 i;
84*4882a593Smuzhiyun
85*4882a593Smuzhiyun /* add tx counters on different queues */
86*4882a593Smuzhiyun for (i = 0; i < vinfo->num_tx_q; i++) {
87*4882a593Smuzhiyun struct opa_vnic_stats *qstats = &vinfo->stats[i];
88*4882a593Smuzhiyun struct rtnl_link_stats64 *qnstats = &vinfo->stats[i].netstats;
89*4882a593Smuzhiyun
90*4882a593Smuzhiyun stats->netstats.tx_fifo_errors += qnstats->tx_fifo_errors;
91*4882a593Smuzhiyun stats->netstats.tx_carrier_errors += qnstats->tx_carrier_errors;
92*4882a593Smuzhiyun stats->tx_drop_state += qstats->tx_drop_state;
93*4882a593Smuzhiyun stats->tx_dlid_zero += qstats->tx_dlid_zero;
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun SUM_GRP_COUNTERS(stats, qstats, tx_grp);
96*4882a593Smuzhiyun stats->netstats.tx_packets += qnstats->tx_packets;
97*4882a593Smuzhiyun stats->netstats.tx_bytes += qnstats->tx_bytes;
98*4882a593Smuzhiyun }
99*4882a593Smuzhiyun
100*4882a593Smuzhiyun /* add rx counters on different queues */
101*4882a593Smuzhiyun for (i = 0; i < vinfo->num_rx_q; i++) {
102*4882a593Smuzhiyun struct opa_vnic_stats *qstats = &vinfo->stats[i];
103*4882a593Smuzhiyun struct rtnl_link_stats64 *qnstats = &vinfo->stats[i].netstats;
104*4882a593Smuzhiyun
105*4882a593Smuzhiyun stats->netstats.rx_fifo_errors += qnstats->rx_fifo_errors;
106*4882a593Smuzhiyun stats->netstats.rx_nohandler += qnstats->rx_nohandler;
107*4882a593Smuzhiyun stats->rx_drop_state += qstats->rx_drop_state;
108*4882a593Smuzhiyun stats->rx_oversize += qstats->rx_oversize;
109*4882a593Smuzhiyun stats->rx_runt += qstats->rx_runt;
110*4882a593Smuzhiyun
111*4882a593Smuzhiyun SUM_GRP_COUNTERS(stats, qstats, rx_grp);
112*4882a593Smuzhiyun stats->netstats.rx_packets += qnstats->rx_packets;
113*4882a593Smuzhiyun stats->netstats.rx_bytes += qnstats->rx_bytes;
114*4882a593Smuzhiyun }
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun stats->netstats.tx_errors = stats->netstats.tx_fifo_errors +
117*4882a593Smuzhiyun stats->netstats.tx_carrier_errors +
118*4882a593Smuzhiyun stats->tx_drop_state + stats->tx_dlid_zero;
119*4882a593Smuzhiyun stats->netstats.tx_dropped = stats->netstats.tx_errors;
120*4882a593Smuzhiyun
121*4882a593Smuzhiyun stats->netstats.rx_errors = stats->netstats.rx_fifo_errors +
122*4882a593Smuzhiyun stats->netstats.rx_nohandler +
123*4882a593Smuzhiyun stats->rx_drop_state + stats->rx_oversize +
124*4882a593Smuzhiyun stats->rx_runt;
125*4882a593Smuzhiyun stats->netstats.rx_dropped = stats->netstats.rx_errors;
126*4882a593Smuzhiyun
127*4882a593Smuzhiyun netdev->stats.tx_packets = stats->netstats.tx_packets;
128*4882a593Smuzhiyun netdev->stats.tx_bytes = stats->netstats.tx_bytes;
129*4882a593Smuzhiyun netdev->stats.tx_fifo_errors = stats->netstats.tx_fifo_errors;
130*4882a593Smuzhiyun netdev->stats.tx_carrier_errors = stats->netstats.tx_carrier_errors;
131*4882a593Smuzhiyun netdev->stats.tx_errors = stats->netstats.tx_errors;
132*4882a593Smuzhiyun netdev->stats.tx_dropped = stats->netstats.tx_dropped;
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun netdev->stats.rx_packets = stats->netstats.rx_packets;
135*4882a593Smuzhiyun netdev->stats.rx_bytes = stats->netstats.rx_bytes;
136*4882a593Smuzhiyun netdev->stats.rx_fifo_errors = stats->netstats.rx_fifo_errors;
137*4882a593Smuzhiyun netdev->stats.multicast = stats->rx_grp.mcastbcast;
138*4882a593Smuzhiyun netdev->stats.rx_length_errors = stats->rx_oversize + stats->rx_runt;
139*4882a593Smuzhiyun netdev->stats.rx_errors = stats->netstats.rx_errors;
140*4882a593Smuzhiyun netdev->stats.rx_dropped = stats->netstats.rx_dropped;
141*4882a593Smuzhiyun }
142*4882a593Smuzhiyun
143*4882a593Smuzhiyun /* update_len_counters - update pkt's len histogram counters */
update_len_counters(struct opa_vnic_grp_stats * grp,int len)144*4882a593Smuzhiyun static inline void update_len_counters(struct opa_vnic_grp_stats *grp,
145*4882a593Smuzhiyun int len)
146*4882a593Smuzhiyun {
147*4882a593Smuzhiyun /* account for 4 byte FCS */
148*4882a593Smuzhiyun if (len >= 1515)
149*4882a593Smuzhiyun grp->s_1519_max++;
150*4882a593Smuzhiyun else if (len >= 1020)
151*4882a593Smuzhiyun grp->s_1024_1518++;
152*4882a593Smuzhiyun else if (len >= 508)
153*4882a593Smuzhiyun grp->s_512_1023++;
154*4882a593Smuzhiyun else if (len >= 252)
155*4882a593Smuzhiyun grp->s_256_511++;
156*4882a593Smuzhiyun else if (len >= 124)
157*4882a593Smuzhiyun grp->s_128_255++;
158*4882a593Smuzhiyun else if (len >= 61)
159*4882a593Smuzhiyun grp->s_65_127++;
160*4882a593Smuzhiyun else
161*4882a593Smuzhiyun grp->s_64++;
162*4882a593Smuzhiyun }
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun /* hfi1_vnic_update_tx_counters - update transmit counters */
hfi1_vnic_update_tx_counters(struct hfi1_vnic_vport_info * vinfo,u8 q_idx,struct sk_buff * skb,int err)165*4882a593Smuzhiyun static void hfi1_vnic_update_tx_counters(struct hfi1_vnic_vport_info *vinfo,
166*4882a593Smuzhiyun u8 q_idx, struct sk_buff *skb, int err)
167*4882a593Smuzhiyun {
168*4882a593Smuzhiyun struct ethhdr *mac_hdr = (struct ethhdr *)skb_mac_header(skb);
169*4882a593Smuzhiyun struct opa_vnic_stats *stats = &vinfo->stats[q_idx];
170*4882a593Smuzhiyun struct opa_vnic_grp_stats *tx_grp = &stats->tx_grp;
171*4882a593Smuzhiyun u16 vlan_tci;
172*4882a593Smuzhiyun
173*4882a593Smuzhiyun stats->netstats.tx_packets++;
174*4882a593Smuzhiyun stats->netstats.tx_bytes += skb->len + ETH_FCS_LEN;
175*4882a593Smuzhiyun
176*4882a593Smuzhiyun update_len_counters(tx_grp, skb->len);
177*4882a593Smuzhiyun
178*4882a593Smuzhiyun /* rest of the counts are for good packets only */
179*4882a593Smuzhiyun if (unlikely(err))
180*4882a593Smuzhiyun return;
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun if (is_multicast_ether_addr(mac_hdr->h_dest))
183*4882a593Smuzhiyun tx_grp->mcastbcast++;
184*4882a593Smuzhiyun else
185*4882a593Smuzhiyun tx_grp->unicast++;
186*4882a593Smuzhiyun
187*4882a593Smuzhiyun if (!__vlan_get_tag(skb, &vlan_tci))
188*4882a593Smuzhiyun tx_grp->vlan++;
189*4882a593Smuzhiyun else
190*4882a593Smuzhiyun tx_grp->untagged++;
191*4882a593Smuzhiyun }
192*4882a593Smuzhiyun
193*4882a593Smuzhiyun /* hfi1_vnic_update_rx_counters - update receive counters */
hfi1_vnic_update_rx_counters(struct hfi1_vnic_vport_info * vinfo,u8 q_idx,struct sk_buff * skb,int err)194*4882a593Smuzhiyun static void hfi1_vnic_update_rx_counters(struct hfi1_vnic_vport_info *vinfo,
195*4882a593Smuzhiyun u8 q_idx, struct sk_buff *skb, int err)
196*4882a593Smuzhiyun {
197*4882a593Smuzhiyun struct ethhdr *mac_hdr = (struct ethhdr *)skb->data;
198*4882a593Smuzhiyun struct opa_vnic_stats *stats = &vinfo->stats[q_idx];
199*4882a593Smuzhiyun struct opa_vnic_grp_stats *rx_grp = &stats->rx_grp;
200*4882a593Smuzhiyun u16 vlan_tci;
201*4882a593Smuzhiyun
202*4882a593Smuzhiyun stats->netstats.rx_packets++;
203*4882a593Smuzhiyun stats->netstats.rx_bytes += skb->len + ETH_FCS_LEN;
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun update_len_counters(rx_grp, skb->len);
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun /* rest of the counts are for good packets only */
208*4882a593Smuzhiyun if (unlikely(err))
209*4882a593Smuzhiyun return;
210*4882a593Smuzhiyun
211*4882a593Smuzhiyun if (is_multicast_ether_addr(mac_hdr->h_dest))
212*4882a593Smuzhiyun rx_grp->mcastbcast++;
213*4882a593Smuzhiyun else
214*4882a593Smuzhiyun rx_grp->unicast++;
215*4882a593Smuzhiyun
216*4882a593Smuzhiyun if (!__vlan_get_tag(skb, &vlan_tci))
217*4882a593Smuzhiyun rx_grp->vlan++;
218*4882a593Smuzhiyun else
219*4882a593Smuzhiyun rx_grp->untagged++;
220*4882a593Smuzhiyun }
221*4882a593Smuzhiyun
/*
 * hfi1_vnic_get_stats64 - ndo_get_stats64 callback for a VNIC net_device
 * @netdev: device whose statistics are requested
 * @stats:  output buffer; it is handed on as a struct opa_vnic_stats
 *
 * This callback is overloaded for the opa_vnic specific implementation.
 * NOTE(review): the cast means the caller presumably passes storage large
 * enough for a struct opa_vnic_stats - confirm against the caller.
 */
static void hfi1_vnic_get_stats64(struct net_device *netdev,
				  struct rtnl_link_stats64 *stats)
{
	struct hfi1_vnic_vport_info *vport = opa_vnic_dev_priv(netdev);
	struct opa_vnic_stats *full_stats = (struct opa_vnic_stats *)stats;

	hfi1_vnic_update_stats(vport, full_stats);
}
231*4882a593Smuzhiyun
create_bypass_pbc(u32 vl,u32 dw_len)232*4882a593Smuzhiyun static u64 create_bypass_pbc(u32 vl, u32 dw_len)
233*4882a593Smuzhiyun {
234*4882a593Smuzhiyun u64 pbc;
235*4882a593Smuzhiyun
236*4882a593Smuzhiyun pbc = ((u64)PBC_IHCRC_NONE << PBC_INSERT_HCRC_SHIFT)
237*4882a593Smuzhiyun | PBC_INSERT_BYPASS_ICRC | PBC_CREDIT_RETURN
238*4882a593Smuzhiyun | PBC_PACKET_BYPASS
239*4882a593Smuzhiyun | ((vl & PBC_VL_MASK) << PBC_VL_SHIFT)
240*4882a593Smuzhiyun | (dw_len & PBC_LENGTH_DWS_MASK) << PBC_LENGTH_DWS_SHIFT;
241*4882a593Smuzhiyun
242*4882a593Smuzhiyun return pbc;
243*4882a593Smuzhiyun }
244*4882a593Smuzhiyun
245*4882a593Smuzhiyun /* hfi1_vnic_maybe_stop_tx - stop tx queue if required */
hfi1_vnic_maybe_stop_tx(struct hfi1_vnic_vport_info * vinfo,u8 q_idx)246*4882a593Smuzhiyun static void hfi1_vnic_maybe_stop_tx(struct hfi1_vnic_vport_info *vinfo,
247*4882a593Smuzhiyun u8 q_idx)
248*4882a593Smuzhiyun {
249*4882a593Smuzhiyun netif_stop_subqueue(vinfo->netdev, q_idx);
250*4882a593Smuzhiyun if (!hfi1_vnic_sdma_write_avail(vinfo, q_idx))
251*4882a593Smuzhiyun return;
252*4882a593Smuzhiyun
253*4882a593Smuzhiyun netif_start_subqueue(vinfo->netdev, q_idx);
254*4882a593Smuzhiyun }
255*4882a593Smuzhiyun
hfi1_netdev_start_xmit(struct sk_buff * skb,struct net_device * netdev)256*4882a593Smuzhiyun static netdev_tx_t hfi1_netdev_start_xmit(struct sk_buff *skb,
257*4882a593Smuzhiyun struct net_device *netdev)
258*4882a593Smuzhiyun {
259*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
260*4882a593Smuzhiyun u8 pad_len, q_idx = skb->queue_mapping;
261*4882a593Smuzhiyun struct hfi1_devdata *dd = vinfo->dd;
262*4882a593Smuzhiyun struct opa_vnic_skb_mdata *mdata;
263*4882a593Smuzhiyun u32 pkt_len, total_len;
264*4882a593Smuzhiyun int err = -EINVAL;
265*4882a593Smuzhiyun u64 pbc;
266*4882a593Smuzhiyun
267*4882a593Smuzhiyun v_dbg("xmit: queue %d skb len %d\n", q_idx, skb->len);
268*4882a593Smuzhiyun if (unlikely(!netif_oper_up(netdev))) {
269*4882a593Smuzhiyun vinfo->stats[q_idx].tx_drop_state++;
270*4882a593Smuzhiyun goto tx_finish;
271*4882a593Smuzhiyun }
272*4882a593Smuzhiyun
273*4882a593Smuzhiyun /* take out meta data */
274*4882a593Smuzhiyun mdata = (struct opa_vnic_skb_mdata *)skb->data;
275*4882a593Smuzhiyun skb_pull(skb, sizeof(*mdata));
276*4882a593Smuzhiyun if (unlikely(mdata->flags & OPA_VNIC_SKB_MDATA_ENCAP_ERR)) {
277*4882a593Smuzhiyun vinfo->stats[q_idx].tx_dlid_zero++;
278*4882a593Smuzhiyun goto tx_finish;
279*4882a593Smuzhiyun }
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun /* add tail padding (for 8 bytes size alignment) and icrc */
282*4882a593Smuzhiyun pad_len = -(skb->len + OPA_VNIC_ICRC_TAIL_LEN) & 0x7;
283*4882a593Smuzhiyun pad_len += OPA_VNIC_ICRC_TAIL_LEN;
284*4882a593Smuzhiyun
285*4882a593Smuzhiyun /*
286*4882a593Smuzhiyun * pkt_len is how much data we have to write, includes header and data.
287*4882a593Smuzhiyun * total_len is length of the packet in Dwords plus the PBC should not
288*4882a593Smuzhiyun * include the CRC.
289*4882a593Smuzhiyun */
290*4882a593Smuzhiyun pkt_len = (skb->len + pad_len) >> 2;
291*4882a593Smuzhiyun total_len = pkt_len + 2; /* PBC + packet */
292*4882a593Smuzhiyun
293*4882a593Smuzhiyun pbc = create_bypass_pbc(mdata->vl, total_len);
294*4882a593Smuzhiyun
295*4882a593Smuzhiyun skb_get(skb);
296*4882a593Smuzhiyun v_dbg("pbc 0x%016llX len %d pad_len %d\n", pbc, skb->len, pad_len);
297*4882a593Smuzhiyun err = dd->process_vnic_dma_send(dd, q_idx, vinfo, skb, pbc, pad_len);
298*4882a593Smuzhiyun if (unlikely(err)) {
299*4882a593Smuzhiyun if (err == -ENOMEM)
300*4882a593Smuzhiyun vinfo->stats[q_idx].netstats.tx_fifo_errors++;
301*4882a593Smuzhiyun else if (err != -EBUSY)
302*4882a593Smuzhiyun vinfo->stats[q_idx].netstats.tx_carrier_errors++;
303*4882a593Smuzhiyun }
304*4882a593Smuzhiyun /* remove the header before updating tx counters */
305*4882a593Smuzhiyun skb_pull(skb, OPA_VNIC_HDR_LEN);
306*4882a593Smuzhiyun
307*4882a593Smuzhiyun if (unlikely(err == -EBUSY)) {
308*4882a593Smuzhiyun hfi1_vnic_maybe_stop_tx(vinfo, q_idx);
309*4882a593Smuzhiyun dev_kfree_skb_any(skb);
310*4882a593Smuzhiyun return NETDEV_TX_BUSY;
311*4882a593Smuzhiyun }
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun tx_finish:
314*4882a593Smuzhiyun /* update tx counters */
315*4882a593Smuzhiyun hfi1_vnic_update_tx_counters(vinfo, q_idx, skb, err);
316*4882a593Smuzhiyun dev_kfree_skb_any(skb);
317*4882a593Smuzhiyun return NETDEV_TX_OK;
318*4882a593Smuzhiyun }
319*4882a593Smuzhiyun
hfi1_vnic_select_queue(struct net_device * netdev,struct sk_buff * skb,struct net_device * sb_dev)320*4882a593Smuzhiyun static u16 hfi1_vnic_select_queue(struct net_device *netdev,
321*4882a593Smuzhiyun struct sk_buff *skb,
322*4882a593Smuzhiyun struct net_device *sb_dev)
323*4882a593Smuzhiyun {
324*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
325*4882a593Smuzhiyun struct opa_vnic_skb_mdata *mdata;
326*4882a593Smuzhiyun struct sdma_engine *sde;
327*4882a593Smuzhiyun
328*4882a593Smuzhiyun mdata = (struct opa_vnic_skb_mdata *)skb->data;
329*4882a593Smuzhiyun sde = sdma_select_engine_vl(vinfo->dd, mdata->entropy, mdata->vl);
330*4882a593Smuzhiyun return sde->this_idx;
331*4882a593Smuzhiyun }
332*4882a593Smuzhiyun
333*4882a593Smuzhiyun /* hfi1_vnic_decap_skb - strip OPA header from the skb (ethernet) packet */
hfi1_vnic_decap_skb(struct hfi1_vnic_rx_queue * rxq,struct sk_buff * skb)334*4882a593Smuzhiyun static inline int hfi1_vnic_decap_skb(struct hfi1_vnic_rx_queue *rxq,
335*4882a593Smuzhiyun struct sk_buff *skb)
336*4882a593Smuzhiyun {
337*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo = rxq->vinfo;
338*4882a593Smuzhiyun int max_len = vinfo->netdev->mtu + VLAN_ETH_HLEN;
339*4882a593Smuzhiyun int rc = -EFAULT;
340*4882a593Smuzhiyun
341*4882a593Smuzhiyun skb_pull(skb, OPA_VNIC_HDR_LEN);
342*4882a593Smuzhiyun
343*4882a593Smuzhiyun /* Validate Packet length */
344*4882a593Smuzhiyun if (unlikely(skb->len > max_len))
345*4882a593Smuzhiyun vinfo->stats[rxq->idx].rx_oversize++;
346*4882a593Smuzhiyun else if (unlikely(skb->len < ETH_ZLEN))
347*4882a593Smuzhiyun vinfo->stats[rxq->idx].rx_runt++;
348*4882a593Smuzhiyun else
349*4882a593Smuzhiyun rc = 0;
350*4882a593Smuzhiyun return rc;
351*4882a593Smuzhiyun }
352*4882a593Smuzhiyun
/*
 * get_vnic_port - look up the vport registered for a virtual ethernet switch
 * @dd:      device data
 * @vesw_id: virtual ethernet switch id
 *
 * Return: whatever hfi1_netdev_get_data() returns for VNIC_ID(@vesw_id);
 * callers in this file treat NULL as "no such vport".
 */
static struct hfi1_vnic_vport_info *get_vnic_port(struct hfi1_devdata *dd,
						  int vesw_id)
{
	return hfi1_netdev_get_data(dd, (int)VNIC_ID(vesw_id));
}
360*4882a593Smuzhiyun
get_first_vnic_port(struct hfi1_devdata * dd)361*4882a593Smuzhiyun static struct hfi1_vnic_vport_info *get_first_vnic_port(struct hfi1_devdata *dd)
362*4882a593Smuzhiyun {
363*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo;
364*4882a593Smuzhiyun int next_id = VNIC_ID(0);
365*4882a593Smuzhiyun
366*4882a593Smuzhiyun vinfo = hfi1_netdev_get_first_data(dd, &next_id);
367*4882a593Smuzhiyun
368*4882a593Smuzhiyun if (next_id > VNIC_ID(VNIC_MASK))
369*4882a593Smuzhiyun return NULL;
370*4882a593Smuzhiyun
371*4882a593Smuzhiyun return vinfo;
372*4882a593Smuzhiyun }
373*4882a593Smuzhiyun
hfi1_vnic_bypass_rcv(struct hfi1_packet * packet)374*4882a593Smuzhiyun void hfi1_vnic_bypass_rcv(struct hfi1_packet *packet)
375*4882a593Smuzhiyun {
376*4882a593Smuzhiyun struct hfi1_devdata *dd = packet->rcd->dd;
377*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo = NULL;
378*4882a593Smuzhiyun struct hfi1_vnic_rx_queue *rxq;
379*4882a593Smuzhiyun struct sk_buff *skb;
380*4882a593Smuzhiyun int l4_type, vesw_id = -1, rc;
381*4882a593Smuzhiyun u8 q_idx;
382*4882a593Smuzhiyun unsigned char *pad_info;
383*4882a593Smuzhiyun
384*4882a593Smuzhiyun l4_type = hfi1_16B_get_l4(packet->ebuf);
385*4882a593Smuzhiyun if (likely(l4_type == OPA_16B_L4_ETHR)) {
386*4882a593Smuzhiyun vesw_id = HFI1_VNIC_GET_VESWID(packet->ebuf);
387*4882a593Smuzhiyun vinfo = get_vnic_port(dd, vesw_id);
388*4882a593Smuzhiyun
389*4882a593Smuzhiyun /*
390*4882a593Smuzhiyun * In case of invalid vesw id, count the error on
391*4882a593Smuzhiyun * the first available vport.
392*4882a593Smuzhiyun */
393*4882a593Smuzhiyun if (unlikely(!vinfo)) {
394*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo_tmp;
395*4882a593Smuzhiyun
396*4882a593Smuzhiyun vinfo_tmp = get_first_vnic_port(dd);
397*4882a593Smuzhiyun if (vinfo_tmp) {
398*4882a593Smuzhiyun spin_lock(&vport_cntr_lock);
399*4882a593Smuzhiyun vinfo_tmp->stats[0].netstats.rx_nohandler++;
400*4882a593Smuzhiyun spin_unlock(&vport_cntr_lock);
401*4882a593Smuzhiyun }
402*4882a593Smuzhiyun }
403*4882a593Smuzhiyun }
404*4882a593Smuzhiyun
405*4882a593Smuzhiyun if (unlikely(!vinfo)) {
406*4882a593Smuzhiyun dd_dev_warn(dd, "vnic rcv err: l4 %d vesw id %d ctx %d\n",
407*4882a593Smuzhiyun l4_type, vesw_id, packet->rcd->ctxt);
408*4882a593Smuzhiyun return;
409*4882a593Smuzhiyun }
410*4882a593Smuzhiyun
411*4882a593Smuzhiyun q_idx = packet->rcd->vnic_q_idx;
412*4882a593Smuzhiyun rxq = &vinfo->rxq[q_idx];
413*4882a593Smuzhiyun if (unlikely(!netif_oper_up(vinfo->netdev))) {
414*4882a593Smuzhiyun vinfo->stats[q_idx].rx_drop_state++;
415*4882a593Smuzhiyun return;
416*4882a593Smuzhiyun }
417*4882a593Smuzhiyun
418*4882a593Smuzhiyun skb = netdev_alloc_skb(vinfo->netdev, packet->tlen);
419*4882a593Smuzhiyun if (unlikely(!skb)) {
420*4882a593Smuzhiyun vinfo->stats[q_idx].netstats.rx_fifo_errors++;
421*4882a593Smuzhiyun return;
422*4882a593Smuzhiyun }
423*4882a593Smuzhiyun
424*4882a593Smuzhiyun memcpy(skb->data, packet->ebuf, packet->tlen);
425*4882a593Smuzhiyun skb_put(skb, packet->tlen);
426*4882a593Smuzhiyun
427*4882a593Smuzhiyun pad_info = skb->data + skb->len - 1;
428*4882a593Smuzhiyun skb_trim(skb, (skb->len - OPA_VNIC_ICRC_TAIL_LEN -
429*4882a593Smuzhiyun ((*pad_info) & 0x7)));
430*4882a593Smuzhiyun
431*4882a593Smuzhiyun rc = hfi1_vnic_decap_skb(rxq, skb);
432*4882a593Smuzhiyun
433*4882a593Smuzhiyun /* update rx counters */
434*4882a593Smuzhiyun hfi1_vnic_update_rx_counters(vinfo, rxq->idx, skb, rc);
435*4882a593Smuzhiyun if (unlikely(rc)) {
436*4882a593Smuzhiyun dev_kfree_skb_any(skb);
437*4882a593Smuzhiyun return;
438*4882a593Smuzhiyun }
439*4882a593Smuzhiyun
440*4882a593Smuzhiyun skb_checksum_none_assert(skb);
441*4882a593Smuzhiyun skb->protocol = eth_type_trans(skb, rxq->netdev);
442*4882a593Smuzhiyun
443*4882a593Smuzhiyun napi_gro_receive(&rxq->napi, skb);
444*4882a593Smuzhiyun }
445*4882a593Smuzhiyun
hfi1_vnic_up(struct hfi1_vnic_vport_info * vinfo)446*4882a593Smuzhiyun static int hfi1_vnic_up(struct hfi1_vnic_vport_info *vinfo)
447*4882a593Smuzhiyun {
448*4882a593Smuzhiyun struct hfi1_devdata *dd = vinfo->dd;
449*4882a593Smuzhiyun struct net_device *netdev = vinfo->netdev;
450*4882a593Smuzhiyun int rc;
451*4882a593Smuzhiyun
452*4882a593Smuzhiyun /* ensure virtual eth switch id is valid */
453*4882a593Smuzhiyun if (!vinfo->vesw_id)
454*4882a593Smuzhiyun return -EINVAL;
455*4882a593Smuzhiyun
456*4882a593Smuzhiyun rc = hfi1_netdev_add_data(dd, VNIC_ID(vinfo->vesw_id), vinfo);
457*4882a593Smuzhiyun if (rc < 0)
458*4882a593Smuzhiyun return rc;
459*4882a593Smuzhiyun
460*4882a593Smuzhiyun rc = hfi1_netdev_rx_init(dd);
461*4882a593Smuzhiyun if (rc)
462*4882a593Smuzhiyun goto err_remove;
463*4882a593Smuzhiyun
464*4882a593Smuzhiyun netif_carrier_on(netdev);
465*4882a593Smuzhiyun netif_tx_start_all_queues(netdev);
466*4882a593Smuzhiyun set_bit(HFI1_VNIC_UP, &vinfo->flags);
467*4882a593Smuzhiyun
468*4882a593Smuzhiyun return 0;
469*4882a593Smuzhiyun
470*4882a593Smuzhiyun err_remove:
471*4882a593Smuzhiyun hfi1_netdev_remove_data(dd, VNIC_ID(vinfo->vesw_id));
472*4882a593Smuzhiyun return rc;
473*4882a593Smuzhiyun }
474*4882a593Smuzhiyun
hfi1_vnic_down(struct hfi1_vnic_vport_info * vinfo)475*4882a593Smuzhiyun static void hfi1_vnic_down(struct hfi1_vnic_vport_info *vinfo)
476*4882a593Smuzhiyun {
477*4882a593Smuzhiyun struct hfi1_devdata *dd = vinfo->dd;
478*4882a593Smuzhiyun
479*4882a593Smuzhiyun clear_bit(HFI1_VNIC_UP, &vinfo->flags);
480*4882a593Smuzhiyun netif_carrier_off(vinfo->netdev);
481*4882a593Smuzhiyun netif_tx_disable(vinfo->netdev);
482*4882a593Smuzhiyun hfi1_netdev_remove_data(dd, VNIC_ID(vinfo->vesw_id));
483*4882a593Smuzhiyun
484*4882a593Smuzhiyun hfi1_netdev_rx_destroy(dd);
485*4882a593Smuzhiyun }
486*4882a593Smuzhiyun
hfi1_netdev_open(struct net_device * netdev)487*4882a593Smuzhiyun static int hfi1_netdev_open(struct net_device *netdev)
488*4882a593Smuzhiyun {
489*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
490*4882a593Smuzhiyun int rc;
491*4882a593Smuzhiyun
492*4882a593Smuzhiyun mutex_lock(&vinfo->lock);
493*4882a593Smuzhiyun rc = hfi1_vnic_up(vinfo);
494*4882a593Smuzhiyun mutex_unlock(&vinfo->lock);
495*4882a593Smuzhiyun return rc;
496*4882a593Smuzhiyun }
497*4882a593Smuzhiyun
hfi1_netdev_close(struct net_device * netdev)498*4882a593Smuzhiyun static int hfi1_netdev_close(struct net_device *netdev)
499*4882a593Smuzhiyun {
500*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
501*4882a593Smuzhiyun
502*4882a593Smuzhiyun mutex_lock(&vinfo->lock);
503*4882a593Smuzhiyun if (test_bit(HFI1_VNIC_UP, &vinfo->flags))
504*4882a593Smuzhiyun hfi1_vnic_down(vinfo);
505*4882a593Smuzhiyun mutex_unlock(&vinfo->lock);
506*4882a593Smuzhiyun return 0;
507*4882a593Smuzhiyun }
508*4882a593Smuzhiyun
hfi1_vnic_init(struct hfi1_vnic_vport_info * vinfo)509*4882a593Smuzhiyun static int hfi1_vnic_init(struct hfi1_vnic_vport_info *vinfo)
510*4882a593Smuzhiyun {
511*4882a593Smuzhiyun struct hfi1_devdata *dd = vinfo->dd;
512*4882a593Smuzhiyun int rc = 0;
513*4882a593Smuzhiyun
514*4882a593Smuzhiyun mutex_lock(&hfi1_mutex);
515*4882a593Smuzhiyun if (!dd->vnic_num_vports) {
516*4882a593Smuzhiyun rc = hfi1_vnic_txreq_init(dd);
517*4882a593Smuzhiyun if (rc)
518*4882a593Smuzhiyun goto txreq_fail;
519*4882a593Smuzhiyun }
520*4882a593Smuzhiyun
521*4882a593Smuzhiyun rc = hfi1_netdev_rx_init(dd);
522*4882a593Smuzhiyun if (rc) {
523*4882a593Smuzhiyun dd_dev_err(dd, "Unable to initialize netdev contexts\n");
524*4882a593Smuzhiyun goto alloc_fail;
525*4882a593Smuzhiyun }
526*4882a593Smuzhiyun
527*4882a593Smuzhiyun hfi1_init_vnic_rsm(dd);
528*4882a593Smuzhiyun
529*4882a593Smuzhiyun dd->vnic_num_vports++;
530*4882a593Smuzhiyun hfi1_vnic_sdma_init(vinfo);
531*4882a593Smuzhiyun
532*4882a593Smuzhiyun alloc_fail:
533*4882a593Smuzhiyun if (!dd->vnic_num_vports)
534*4882a593Smuzhiyun hfi1_vnic_txreq_deinit(dd);
535*4882a593Smuzhiyun txreq_fail:
536*4882a593Smuzhiyun mutex_unlock(&hfi1_mutex);
537*4882a593Smuzhiyun return rc;
538*4882a593Smuzhiyun }
539*4882a593Smuzhiyun
hfi1_vnic_deinit(struct hfi1_vnic_vport_info * vinfo)540*4882a593Smuzhiyun static void hfi1_vnic_deinit(struct hfi1_vnic_vport_info *vinfo)
541*4882a593Smuzhiyun {
542*4882a593Smuzhiyun struct hfi1_devdata *dd = vinfo->dd;
543*4882a593Smuzhiyun
544*4882a593Smuzhiyun mutex_lock(&hfi1_mutex);
545*4882a593Smuzhiyun if (--dd->vnic_num_vports == 0) {
546*4882a593Smuzhiyun hfi1_deinit_vnic_rsm(dd);
547*4882a593Smuzhiyun hfi1_vnic_txreq_deinit(dd);
548*4882a593Smuzhiyun }
549*4882a593Smuzhiyun mutex_unlock(&hfi1_mutex);
550*4882a593Smuzhiyun hfi1_netdev_rx_destroy(dd);
551*4882a593Smuzhiyun }
552*4882a593Smuzhiyun
hfi1_vnic_set_vesw_id(struct net_device * netdev,int id)553*4882a593Smuzhiyun static void hfi1_vnic_set_vesw_id(struct net_device *netdev, int id)
554*4882a593Smuzhiyun {
555*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
556*4882a593Smuzhiyun bool reopen = false;
557*4882a593Smuzhiyun
558*4882a593Smuzhiyun /*
559*4882a593Smuzhiyun * If vesw_id is being changed, and if the vnic port is up,
560*4882a593Smuzhiyun * reset the vnic port to ensure new vesw_id gets picked up
561*4882a593Smuzhiyun */
562*4882a593Smuzhiyun if (id != vinfo->vesw_id) {
563*4882a593Smuzhiyun mutex_lock(&vinfo->lock);
564*4882a593Smuzhiyun if (test_bit(HFI1_VNIC_UP, &vinfo->flags)) {
565*4882a593Smuzhiyun hfi1_vnic_down(vinfo);
566*4882a593Smuzhiyun reopen = true;
567*4882a593Smuzhiyun }
568*4882a593Smuzhiyun
569*4882a593Smuzhiyun vinfo->vesw_id = id;
570*4882a593Smuzhiyun if (reopen)
571*4882a593Smuzhiyun hfi1_vnic_up(vinfo);
572*4882a593Smuzhiyun
573*4882a593Smuzhiyun mutex_unlock(&vinfo->lock);
574*4882a593Smuzhiyun }
575*4882a593Smuzhiyun }
576*4882a593Smuzhiyun
577*4882a593Smuzhiyun /* netdev ops */
578*4882a593Smuzhiyun static const struct net_device_ops hfi1_netdev_ops = {
579*4882a593Smuzhiyun .ndo_open = hfi1_netdev_open,
580*4882a593Smuzhiyun .ndo_stop = hfi1_netdev_close,
581*4882a593Smuzhiyun .ndo_start_xmit = hfi1_netdev_start_xmit,
582*4882a593Smuzhiyun .ndo_select_queue = hfi1_vnic_select_queue,
583*4882a593Smuzhiyun .ndo_get_stats64 = hfi1_vnic_get_stats64,
584*4882a593Smuzhiyun };
585*4882a593Smuzhiyun
hfi1_vnic_free_rn(struct net_device * netdev)586*4882a593Smuzhiyun static void hfi1_vnic_free_rn(struct net_device *netdev)
587*4882a593Smuzhiyun {
588*4882a593Smuzhiyun struct hfi1_vnic_vport_info *vinfo = opa_vnic_dev_priv(netdev);
589*4882a593Smuzhiyun
590*4882a593Smuzhiyun hfi1_vnic_deinit(vinfo);
591*4882a593Smuzhiyun mutex_destroy(&vinfo->lock);
592*4882a593Smuzhiyun free_netdev(netdev);
593*4882a593Smuzhiyun }
594*4882a593Smuzhiyun
/*
 * hfi1_vnic_alloc_rn - allocate and initialise a VNIC rdma net_device
 * @device:           IB device the netdev belongs to
 * @port_num:         port number, 1 .. dd->num_pports
 * @type:             must be RDMA_NETDEV_OPA_VNIC
 * @name:             netdev name, passed to alloc_netdev_mqs()
 * @name_assign_type: passed to alloc_netdev_mqs()
 * @setup:            netdev setup callback, passed to alloc_netdev_mqs()
 *
 * The netdev is allocated with one tx queue per SDMA engine and one rx
 * queue per netdev context. Its private area holds a struct
 * opa_vnic_rdma_netdev followed by the hfi1 vport info.
 *
 * Return: the new net_device, or an ERR_PTR(): -ENOMEM when the device has
 * no netdev contexts or the allocation fails, -EINVAL for a bad port
 * number, -EOPNOTSUPP for any other netdev type, or the error returned by
 * hfi1_vnic_init().
 */
struct net_device *hfi1_vnic_alloc_rn(struct ib_device *device,
				      u8 port_num,
				      enum rdma_netdev_t type,
				      const char *name,
				      unsigned char name_assign_type,
				      void (*setup)(struct net_device *))
{
	struct hfi1_devdata *dd = dd_from_ibdev(device);
	struct hfi1_vnic_vport_info *vinfo;
	struct net_device *netdev;
	struct rdma_netdev *rn;
	int q, priv_size, ret;

	if (!dd->num_netdev_contexts)
		return ERR_PTR(-ENOMEM);

	if (!port_num || (port_num > dd->num_pports))
		return ERR_PTR(-EINVAL);

	if (type != RDMA_NETDEV_OPA_VNIC)
		return ERR_PTR(-EOPNOTSUPP);

	priv_size = sizeof(struct opa_vnic_rdma_netdev) + sizeof(*vinfo);
	netdev = alloc_netdev_mqs(priv_size, name, name_assign_type, setup,
				  chip_sdma_engines(dd),
				  dd->num_netdev_contexts);
	if (!netdev)
		return ERR_PTR(-ENOMEM);

	/* rdma_netdev hooks */
	rn = netdev_priv(netdev);
	rn->free_rdma_netdev = hfi1_vnic_free_rn;
	rn->set_id = hfi1_vnic_set_vesw_id;

	/* vport bookkeeping */
	vinfo = opa_vnic_dev_priv(netdev);
	vinfo->dd = dd;
	vinfo->num_tx_q = chip_sdma_engines(dd);
	vinfo->num_rx_q = dd->num_netdev_contexts;
	vinfo->netdev = netdev;

	/* net_device configuration */
	netdev->features = NETIF_F_HIGHDMA | NETIF_F_SG;
	netdev->hw_features = netdev->features;
	netdev->vlan_features = netdev->features;
	netdev->watchdog_timeo = msecs_to_jiffies(HFI_TX_TIMEOUT_MS);
	netdev->netdev_ops = &hfi1_netdev_ops;
	mutex_init(&vinfo->lock);

	for (q = 0; q < vinfo->num_rx_q; q++) {
		struct hfi1_vnic_rx_queue *queue = &vinfo->rxq[q];

		queue->idx = q;
		queue->vinfo = vinfo;
		queue->netdev = netdev;
	}

	ret = hfi1_vnic_init(vinfo);
	if (ret) {
		mutex_destroy(&vinfo->lock);
		free_netdev(netdev);
		return ERR_PTR(ret);
	}

	return netdev;
}
658