xref: /OK3568_Linux_fs/kernel/drivers/infiniband/ulp/ipoib/ipoib_verbs.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Copyright (c) 2004, 2005 Topspin Communications.  All rights reserved.
3*4882a593Smuzhiyun  * Copyright (c) 2005 Mellanox Technologies. All rights reserved.
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * This software is available to you under a choice of one of two
6*4882a593Smuzhiyun  * licenses.  You may choose to be licensed under the terms of the GNU
7*4882a593Smuzhiyun  * General Public License (GPL) Version 2, available from the file
8*4882a593Smuzhiyun  * COPYING in the main directory of this source tree, or the
9*4882a593Smuzhiyun  * OpenIB.org BSD license below:
10*4882a593Smuzhiyun  *
11*4882a593Smuzhiyun  *     Redistribution and use in source and binary forms, with or
12*4882a593Smuzhiyun  *     without modification, are permitted provided that the following
13*4882a593Smuzhiyun  *     conditions are met:
14*4882a593Smuzhiyun  *
15*4882a593Smuzhiyun  *      - Redistributions of source code must retain the above
16*4882a593Smuzhiyun  *        copyright notice, this list of conditions and the following
17*4882a593Smuzhiyun  *        disclaimer.
18*4882a593Smuzhiyun  *
19*4882a593Smuzhiyun  *      - Redistributions in binary form must reproduce the above
20*4882a593Smuzhiyun  *        copyright notice, this list of conditions and the following
21*4882a593Smuzhiyun  *        disclaimer in the documentation and/or other materials
22*4882a593Smuzhiyun  *        provided with the distribution.
23*4882a593Smuzhiyun  *
24*4882a593Smuzhiyun  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25*4882a593Smuzhiyun  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26*4882a593Smuzhiyun  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27*4882a593Smuzhiyun  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28*4882a593Smuzhiyun  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29*4882a593Smuzhiyun  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30*4882a593Smuzhiyun  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31*4882a593Smuzhiyun  * SOFTWARE.
32*4882a593Smuzhiyun  */
33*4882a593Smuzhiyun 
34*4882a593Smuzhiyun #include <linux/slab.h>
35*4882a593Smuzhiyun 
36*4882a593Smuzhiyun #include "ipoib.h"
37*4882a593Smuzhiyun 
/*
 * Attach the device's QP to the multicast group identified by @mgid/@mlid.
 *
 * The IPOIB_PKEY_ASSIGNED flag is refreshed first: it is set when
 * ib_find_pkey() succeeds for priv->pkey on priv->port and cleared
 * otherwise.  When @set_qkey is non-zero the QP's Q_Key is changed to
 * @qkey before attaching.  @hca is not used by this function.
 *
 * Returns 0 on success, -ENXIO if the P_Key lookup fails, -ENOMEM if the
 * temporary QP attribute cannot be allocated, or the error returned by
 * ib_modify_qp() / ib_attach_mcast().
 */
int ipoib_mcast_attach(struct net_device *dev, struct ib_device *hca,
		       union ib_gid *mgid, u16 mlid, int set_qkey, u32 qkey)
{
	struct ipoib_dev_priv *priv = ipoib_priv(dev);
	struct ib_qp_attr *attr = NULL;
	u16 found_index;	/* required by ib_find_pkey(); value unused here */
	int rc;

	rc = ib_find_pkey(priv->ca, priv->port, priv->pkey, &found_index);
	if (rc) {
		clear_bit(IPOIB_PKEY_ASSIGNED, &priv->flags);
		rc = -ENXIO;
		goto free_attr;
	}
	set_bit(IPOIB_PKEY_ASSIGNED, &priv->flags);

	if (set_qkey) {
		attr = kmalloc(sizeof(*attr), GFP_KERNEL);
		if (!attr) {
			rc = -ENOMEM;
			goto free_attr;
		}

		/* Only the Q_Key is passed: the mask below selects nothing else. */
		attr->qkey = qkey;
		rc = ib_modify_qp(priv->qp, attr, IB_QP_QKEY);
		if (rc) {
			ipoib_warn(priv, "failed to modify QP, ret = %d\n", rc);
			goto free_attr;
		}
	}

	/* Join the QP to the multicast group. */
	rc = ib_attach_mcast(priv->qp, mgid, mlid);
	if (rc)
		ipoib_warn(priv, "failed to attach to multicast group, ret = %d\n", rc);

free_attr:
	/* attr is still NULL on the paths that never allocated it. */
	kfree(attr);
	return rc;
}
77*4882a593Smuzhiyun 
/*
 * Detach the device's QP from the multicast group identified by
 * @mgid/@mlid.  @hca is not used by this function.
 *
 * Returns whatever ib_detach_mcast() returns.
 */
int ipoib_mcast_detach(struct net_device *dev, struct ib_device *hca,
		       union ib_gid *mgid, u16 mlid)
{
	struct ipoib_dev_priv *priv = ipoib_priv(dev);

	return ib_detach_mcast(priv->qp, mgid, mlid);
}
88*4882a593Smuzhiyun 
ipoib_init_qp(struct net_device * dev)89*4882a593Smuzhiyun int ipoib_init_qp(struct net_device *dev)
90*4882a593Smuzhiyun {
91*4882a593Smuzhiyun 	struct ipoib_dev_priv *priv = ipoib_priv(dev);
92*4882a593Smuzhiyun 	int ret;
93*4882a593Smuzhiyun 	struct ib_qp_attr qp_attr;
94*4882a593Smuzhiyun 	int attr_mask;
95*4882a593Smuzhiyun 
96*4882a593Smuzhiyun 	if (!test_bit(IPOIB_PKEY_ASSIGNED, &priv->flags))
97*4882a593Smuzhiyun 		return -1;
98*4882a593Smuzhiyun 
99*4882a593Smuzhiyun 	qp_attr.qp_state = IB_QPS_INIT;
100*4882a593Smuzhiyun 	qp_attr.qkey = 0;
101*4882a593Smuzhiyun 	qp_attr.port_num = priv->port;
102*4882a593Smuzhiyun 	qp_attr.pkey_index = priv->pkey_index;
103*4882a593Smuzhiyun 	attr_mask =
104*4882a593Smuzhiyun 	    IB_QP_QKEY |
105*4882a593Smuzhiyun 	    IB_QP_PORT |
106*4882a593Smuzhiyun 	    IB_QP_PKEY_INDEX |
107*4882a593Smuzhiyun 	    IB_QP_STATE;
108*4882a593Smuzhiyun 	ret = ib_modify_qp(priv->qp, &qp_attr, attr_mask);
109*4882a593Smuzhiyun 	if (ret) {
110*4882a593Smuzhiyun 		ipoib_warn(priv, "failed to modify QP to init, ret = %d\n", ret);
111*4882a593Smuzhiyun 		goto out_fail;
112*4882a593Smuzhiyun 	}
113*4882a593Smuzhiyun 
114*4882a593Smuzhiyun 	qp_attr.qp_state = IB_QPS_RTR;
115*4882a593Smuzhiyun 	/* Can't set this in a INIT->RTR transition */
116*4882a593Smuzhiyun 	attr_mask &= ~IB_QP_PORT;
117*4882a593Smuzhiyun 	ret = ib_modify_qp(priv->qp, &qp_attr, attr_mask);
118*4882a593Smuzhiyun 	if (ret) {
119*4882a593Smuzhiyun 		ipoib_warn(priv, "failed to modify QP to RTR, ret = %d\n", ret);
120*4882a593Smuzhiyun 		goto out_fail;
121*4882a593Smuzhiyun 	}
122*4882a593Smuzhiyun 
123*4882a593Smuzhiyun 	qp_attr.qp_state = IB_QPS_RTS;
124*4882a593Smuzhiyun 	qp_attr.sq_psn = 0;
125*4882a593Smuzhiyun 	attr_mask |= IB_QP_SQ_PSN;
126*4882a593Smuzhiyun 	attr_mask &= ~IB_QP_PKEY_INDEX;
127*4882a593Smuzhiyun 	ret = ib_modify_qp(priv->qp, &qp_attr, attr_mask);
128*4882a593Smuzhiyun 	if (ret) {
129*4882a593Smuzhiyun 		ipoib_warn(priv, "failed to modify QP to RTS, ret = %d\n", ret);
130*4882a593Smuzhiyun 		goto out_fail;
131*4882a593Smuzhiyun 	}
132*4882a593Smuzhiyun 
133*4882a593Smuzhiyun 	return 0;
134*4882a593Smuzhiyun 
135*4882a593Smuzhiyun out_fail:
136*4882a593Smuzhiyun 	qp_attr.qp_state = IB_QPS_RESET;
137*4882a593Smuzhiyun 	if (ib_modify_qp(priv->qp, &qp_attr, IB_QP_STATE))
138*4882a593Smuzhiyun 		ipoib_warn(priv, "Failed to modify QP to RESET state\n");
139*4882a593Smuzhiyun 
140*4882a593Smuzhiyun 	return ret;
141*4882a593Smuzhiyun }
142*4882a593Smuzhiyun 
ipoib_transport_dev_init(struct net_device * dev,struct ib_device * ca)143*4882a593Smuzhiyun int ipoib_transport_dev_init(struct net_device *dev, struct ib_device *ca)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun 	struct ipoib_dev_priv *priv = ipoib_priv(dev);
146*4882a593Smuzhiyun 	struct ib_qp_init_attr init_attr = {
147*4882a593Smuzhiyun 		.cap = {
148*4882a593Smuzhiyun 			.max_send_wr  = ipoib_sendq_size,
149*4882a593Smuzhiyun 			.max_recv_wr  = ipoib_recvq_size,
150*4882a593Smuzhiyun 			.max_send_sge = min_t(u32, priv->ca->attrs.max_send_sge,
151*4882a593Smuzhiyun 					      MAX_SKB_FRAGS + 1),
152*4882a593Smuzhiyun 			.max_recv_sge = IPOIB_UD_RX_SG
153*4882a593Smuzhiyun 		},
154*4882a593Smuzhiyun 		.sq_sig_type = IB_SIGNAL_ALL_WR,
155*4882a593Smuzhiyun 		.qp_type     = IB_QPT_UD
156*4882a593Smuzhiyun 	};
157*4882a593Smuzhiyun 	struct ib_cq_init_attr cq_attr = {};
158*4882a593Smuzhiyun 
159*4882a593Smuzhiyun 	int ret, size, req_vec;
160*4882a593Smuzhiyun 	int i;
161*4882a593Smuzhiyun 
162*4882a593Smuzhiyun 	size = ipoib_recvq_size + 1;
163*4882a593Smuzhiyun 	ret = ipoib_cm_dev_init(dev);
164*4882a593Smuzhiyun 	if (!ret) {
165*4882a593Smuzhiyun 		size += ipoib_sendq_size;
166*4882a593Smuzhiyun 		if (ipoib_cm_has_srq(dev))
167*4882a593Smuzhiyun 			size += ipoib_recvq_size + 1; /* 1 extra for rx_drain_qp */
168*4882a593Smuzhiyun 		else
169*4882a593Smuzhiyun 			size += ipoib_recvq_size * ipoib_max_conn_qp;
170*4882a593Smuzhiyun 	} else
171*4882a593Smuzhiyun 		if (ret != -EOPNOTSUPP)
172*4882a593Smuzhiyun 			return ret;
173*4882a593Smuzhiyun 
174*4882a593Smuzhiyun 	req_vec = (priv->port - 1) * 2;
175*4882a593Smuzhiyun 
176*4882a593Smuzhiyun 	cq_attr.cqe = size;
177*4882a593Smuzhiyun 	cq_attr.comp_vector = req_vec % priv->ca->num_comp_vectors;
178*4882a593Smuzhiyun 	priv->recv_cq = ib_create_cq(priv->ca, ipoib_ib_rx_completion, NULL,
179*4882a593Smuzhiyun 				     priv, &cq_attr);
180*4882a593Smuzhiyun 	if (IS_ERR(priv->recv_cq)) {
181*4882a593Smuzhiyun 		pr_warn("%s: failed to create receive CQ\n", ca->name);
182*4882a593Smuzhiyun 		goto out_cm_dev_cleanup;
183*4882a593Smuzhiyun 	}
184*4882a593Smuzhiyun 
185*4882a593Smuzhiyun 	cq_attr.cqe = ipoib_sendq_size;
186*4882a593Smuzhiyun 	cq_attr.comp_vector = (req_vec + 1) % priv->ca->num_comp_vectors;
187*4882a593Smuzhiyun 	priv->send_cq = ib_create_cq(priv->ca, ipoib_ib_tx_completion, NULL,
188*4882a593Smuzhiyun 				     priv, &cq_attr);
189*4882a593Smuzhiyun 	if (IS_ERR(priv->send_cq)) {
190*4882a593Smuzhiyun 		pr_warn("%s: failed to create send CQ\n", ca->name);
191*4882a593Smuzhiyun 		goto out_free_recv_cq;
192*4882a593Smuzhiyun 	}
193*4882a593Smuzhiyun 
194*4882a593Smuzhiyun 	if (ib_req_notify_cq(priv->recv_cq, IB_CQ_NEXT_COMP))
195*4882a593Smuzhiyun 		goto out_free_send_cq;
196*4882a593Smuzhiyun 
197*4882a593Smuzhiyun 	init_attr.send_cq = priv->send_cq;
198*4882a593Smuzhiyun 	init_attr.recv_cq = priv->recv_cq;
199*4882a593Smuzhiyun 
200*4882a593Smuzhiyun 	if (priv->hca_caps & IB_DEVICE_UD_TSO)
201*4882a593Smuzhiyun 		init_attr.create_flags |= IB_QP_CREATE_IPOIB_UD_LSO;
202*4882a593Smuzhiyun 
203*4882a593Smuzhiyun 	if (priv->hca_caps & IB_DEVICE_BLOCK_MULTICAST_LOOPBACK)
204*4882a593Smuzhiyun 		init_attr.create_flags |= IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK;
205*4882a593Smuzhiyun 
206*4882a593Smuzhiyun 	if (priv->hca_caps & IB_DEVICE_MANAGED_FLOW_STEERING)
207*4882a593Smuzhiyun 		init_attr.create_flags |= IB_QP_CREATE_NETIF_QP;
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun 	if (priv->hca_caps & IB_DEVICE_RDMA_NETDEV_OPA)
210*4882a593Smuzhiyun 		init_attr.create_flags |= IB_QP_CREATE_NETDEV_USE;
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun 	priv->qp = ib_create_qp(priv->pd, &init_attr);
213*4882a593Smuzhiyun 	if (IS_ERR(priv->qp)) {
214*4882a593Smuzhiyun 		pr_warn("%s: failed to create QP\n", ca->name);
215*4882a593Smuzhiyun 		goto out_free_send_cq;
216*4882a593Smuzhiyun 	}
217*4882a593Smuzhiyun 
218*4882a593Smuzhiyun 	if (ib_req_notify_cq(priv->send_cq, IB_CQ_NEXT_COMP))
219*4882a593Smuzhiyun 		goto out_free_send_cq;
220*4882a593Smuzhiyun 
221*4882a593Smuzhiyun 	for (i = 0; i < MAX_SKB_FRAGS + 1; ++i)
222*4882a593Smuzhiyun 		priv->tx_sge[i].lkey = priv->pd->local_dma_lkey;
223*4882a593Smuzhiyun 
224*4882a593Smuzhiyun 	priv->tx_wr.wr.opcode		= IB_WR_SEND;
225*4882a593Smuzhiyun 	priv->tx_wr.wr.sg_list		= priv->tx_sge;
226*4882a593Smuzhiyun 	priv->tx_wr.wr.send_flags	= IB_SEND_SIGNALED;
227*4882a593Smuzhiyun 
228*4882a593Smuzhiyun 	priv->rx_sge[0].lkey = priv->pd->local_dma_lkey;
229*4882a593Smuzhiyun 
230*4882a593Smuzhiyun 	priv->rx_sge[0].length = IPOIB_UD_BUF_SIZE(priv->max_ib_mtu);
231*4882a593Smuzhiyun 	priv->rx_wr.num_sge = 1;
232*4882a593Smuzhiyun 
233*4882a593Smuzhiyun 	priv->rx_wr.next = NULL;
234*4882a593Smuzhiyun 	priv->rx_wr.sg_list = priv->rx_sge;
235*4882a593Smuzhiyun 
236*4882a593Smuzhiyun 	if (init_attr.cap.max_send_sge > 1)
237*4882a593Smuzhiyun 		dev->features |= NETIF_F_SG;
238*4882a593Smuzhiyun 
239*4882a593Smuzhiyun 	priv->max_send_sge = init_attr.cap.max_send_sge;
240*4882a593Smuzhiyun 
241*4882a593Smuzhiyun 	return 0;
242*4882a593Smuzhiyun 
243*4882a593Smuzhiyun out_free_send_cq:
244*4882a593Smuzhiyun 	ib_destroy_cq(priv->send_cq);
245*4882a593Smuzhiyun 
246*4882a593Smuzhiyun out_free_recv_cq:
247*4882a593Smuzhiyun 	ib_destroy_cq(priv->recv_cq);
248*4882a593Smuzhiyun 
249*4882a593Smuzhiyun out_cm_dev_cleanup:
250*4882a593Smuzhiyun 	ipoib_cm_dev_cleanup(dev);
251*4882a593Smuzhiyun 
252*4882a593Smuzhiyun 	return -ENODEV;
253*4882a593Smuzhiyun }
254*4882a593Smuzhiyun 
ipoib_transport_dev_cleanup(struct net_device * dev)255*4882a593Smuzhiyun void ipoib_transport_dev_cleanup(struct net_device *dev)
256*4882a593Smuzhiyun {
257*4882a593Smuzhiyun 	struct ipoib_dev_priv *priv = ipoib_priv(dev);
258*4882a593Smuzhiyun 
259*4882a593Smuzhiyun 	if (priv->qp) {
260*4882a593Smuzhiyun 		if (ib_destroy_qp(priv->qp))
261*4882a593Smuzhiyun 			ipoib_warn(priv, "ib_qp_destroy failed\n");
262*4882a593Smuzhiyun 
263*4882a593Smuzhiyun 		priv->qp = NULL;
264*4882a593Smuzhiyun 	}
265*4882a593Smuzhiyun 
266*4882a593Smuzhiyun 	ib_destroy_cq(priv->send_cq);
267*4882a593Smuzhiyun 	ib_destroy_cq(priv->recv_cq);
268*4882a593Smuzhiyun }
269*4882a593Smuzhiyun 
ipoib_event(struct ib_event_handler * handler,struct ib_event * record)270*4882a593Smuzhiyun void ipoib_event(struct ib_event_handler *handler,
271*4882a593Smuzhiyun 		 struct ib_event *record)
272*4882a593Smuzhiyun {
273*4882a593Smuzhiyun 	struct ipoib_dev_priv *priv =
274*4882a593Smuzhiyun 		container_of(handler, struct ipoib_dev_priv, event_handler);
275*4882a593Smuzhiyun 
276*4882a593Smuzhiyun 	if (record->element.port_num != priv->port)
277*4882a593Smuzhiyun 		return;
278*4882a593Smuzhiyun 
279*4882a593Smuzhiyun 	ipoib_dbg(priv, "Event %d on device %s port %d\n", record->event,
280*4882a593Smuzhiyun 		  dev_name(&record->device->dev), record->element.port_num);
281*4882a593Smuzhiyun 
282*4882a593Smuzhiyun 	if (record->event == IB_EVENT_CLIENT_REREGISTER) {
283*4882a593Smuzhiyun 		queue_work(ipoib_workqueue, &priv->flush_light);
284*4882a593Smuzhiyun 	} else if (record->event == IB_EVENT_PORT_ERR ||
285*4882a593Smuzhiyun 		   record->event == IB_EVENT_PORT_ACTIVE ||
286*4882a593Smuzhiyun 		   record->event == IB_EVENT_LID_CHANGE) {
287*4882a593Smuzhiyun 		queue_work(ipoib_workqueue, &priv->flush_normal);
288*4882a593Smuzhiyun 	} else if (record->event == IB_EVENT_PKEY_CHANGE) {
289*4882a593Smuzhiyun 		queue_work(ipoib_workqueue, &priv->flush_heavy);
290*4882a593Smuzhiyun 	} else if (record->event == IB_EVENT_GID_CHANGE &&
291*4882a593Smuzhiyun 		   !test_bit(IPOIB_FLAG_DEV_ADDR_SET, &priv->flags)) {
292*4882a593Smuzhiyun 		queue_work(ipoib_workqueue, &priv->flush_light);
293*4882a593Smuzhiyun 	}
294*4882a593Smuzhiyun }
295