xref: /OK3568_Linux_fs/kernel/drivers/infiniband/hw/qib/qib_verbs.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Copyright (c) 2012 - 2018 Intel Corporation.  All rights reserved.
3*4882a593Smuzhiyun  * Copyright (c) 2006 - 2012 QLogic Corporation. All rights reserved.
4*4882a593Smuzhiyun  * Copyright (c) 2005, 2006 PathScale, Inc. All rights reserved.
5*4882a593Smuzhiyun  *
6*4882a593Smuzhiyun  * This software is available to you under a choice of one of two
7*4882a593Smuzhiyun  * licenses.  You may choose to be licensed under the terms of the GNU
8*4882a593Smuzhiyun  * General Public License (GPL) Version 2, available from the file
9*4882a593Smuzhiyun  * COPYING in the main directory of this source tree, or the
10*4882a593Smuzhiyun  * OpenIB.org BSD license below:
11*4882a593Smuzhiyun  *
12*4882a593Smuzhiyun  *     Redistribution and use in source and binary forms, with or
13*4882a593Smuzhiyun  *     without modification, are permitted provided that the following
14*4882a593Smuzhiyun  *     conditions are met:
15*4882a593Smuzhiyun  *
16*4882a593Smuzhiyun  *      - Redistributions of source code must retain the above
17*4882a593Smuzhiyun  *        copyright notice, this list of conditions and the following
18*4882a593Smuzhiyun  *        disclaimer.
19*4882a593Smuzhiyun  *
20*4882a593Smuzhiyun  *      - Redistributions in binary form must reproduce the above
21*4882a593Smuzhiyun  *        copyright notice, this list of conditions and the following
22*4882a593Smuzhiyun  *        disclaimer in the documentation and/or other materials
23*4882a593Smuzhiyun  *        provided with the distribution.
24*4882a593Smuzhiyun  *
25*4882a593Smuzhiyun  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
26*4882a593Smuzhiyun  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
27*4882a593Smuzhiyun  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
28*4882a593Smuzhiyun  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
29*4882a593Smuzhiyun  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
30*4882a593Smuzhiyun  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
31*4882a593Smuzhiyun  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
32*4882a593Smuzhiyun  * SOFTWARE.
33*4882a593Smuzhiyun  */
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun #include <rdma/ib_mad.h>
36*4882a593Smuzhiyun #include <rdma/ib_user_verbs.h>
37*4882a593Smuzhiyun #include <linux/io.h>
38*4882a593Smuzhiyun #include <linux/module.h>
39*4882a593Smuzhiyun #include <linux/utsname.h>
40*4882a593Smuzhiyun #include <linux/rculist.h>
41*4882a593Smuzhiyun #include <linux/mm.h>
42*4882a593Smuzhiyun #include <linux/vmalloc.h>
43*4882a593Smuzhiyun #include <rdma/rdma_vt.h>
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun #include "qib.h"
46*4882a593Smuzhiyun #include "qib_common.h"
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun static unsigned int ib_qib_qp_table_size = 256;
49*4882a593Smuzhiyun module_param_named(qp_table_size, ib_qib_qp_table_size, uint, S_IRUGO);
50*4882a593Smuzhiyun MODULE_PARM_DESC(qp_table_size, "QP table size");
51*4882a593Smuzhiyun 
52*4882a593Smuzhiyun static unsigned int qib_lkey_table_size = 16;
53*4882a593Smuzhiyun module_param_named(lkey_table_size, qib_lkey_table_size, uint,
54*4882a593Smuzhiyun 		   S_IRUGO);
55*4882a593Smuzhiyun MODULE_PARM_DESC(lkey_table_size,
56*4882a593Smuzhiyun 		 "LKEY table size in bits (2^n, 1 <= n <= 23)");
57*4882a593Smuzhiyun 
58*4882a593Smuzhiyun static unsigned int ib_qib_max_pds = 0xFFFF;
59*4882a593Smuzhiyun module_param_named(max_pds, ib_qib_max_pds, uint, S_IRUGO);
60*4882a593Smuzhiyun MODULE_PARM_DESC(max_pds,
61*4882a593Smuzhiyun 		 "Maximum number of protection domains to support");
62*4882a593Smuzhiyun 
63*4882a593Smuzhiyun static unsigned int ib_qib_max_ahs = 0xFFFF;
64*4882a593Smuzhiyun module_param_named(max_ahs, ib_qib_max_ahs, uint, S_IRUGO);
65*4882a593Smuzhiyun MODULE_PARM_DESC(max_ahs, "Maximum number of address handles to support");
66*4882a593Smuzhiyun 
67*4882a593Smuzhiyun unsigned int ib_qib_max_cqes = 0x2FFFF;
68*4882a593Smuzhiyun module_param_named(max_cqes, ib_qib_max_cqes, uint, S_IRUGO);
69*4882a593Smuzhiyun MODULE_PARM_DESC(max_cqes,
70*4882a593Smuzhiyun 		 "Maximum number of completion queue entries to support");
71*4882a593Smuzhiyun 
72*4882a593Smuzhiyun unsigned int ib_qib_max_cqs = 0x1FFFF;
73*4882a593Smuzhiyun module_param_named(max_cqs, ib_qib_max_cqs, uint, S_IRUGO);
74*4882a593Smuzhiyun MODULE_PARM_DESC(max_cqs, "Maximum number of completion queues to support");
75*4882a593Smuzhiyun 
76*4882a593Smuzhiyun unsigned int ib_qib_max_qp_wrs = 0x3FFF;
77*4882a593Smuzhiyun module_param_named(max_qp_wrs, ib_qib_max_qp_wrs, uint, S_IRUGO);
78*4882a593Smuzhiyun MODULE_PARM_DESC(max_qp_wrs, "Maximum number of QP WRs to support");
79*4882a593Smuzhiyun 
80*4882a593Smuzhiyun unsigned int ib_qib_max_qps = 16384;
81*4882a593Smuzhiyun module_param_named(max_qps, ib_qib_max_qps, uint, S_IRUGO);
82*4882a593Smuzhiyun MODULE_PARM_DESC(max_qps, "Maximum number of QPs to support");
83*4882a593Smuzhiyun 
84*4882a593Smuzhiyun unsigned int ib_qib_max_sges = 0x60;
85*4882a593Smuzhiyun module_param_named(max_sges, ib_qib_max_sges, uint, S_IRUGO);
86*4882a593Smuzhiyun MODULE_PARM_DESC(max_sges, "Maximum number of SGEs to support");
87*4882a593Smuzhiyun 
88*4882a593Smuzhiyun unsigned int ib_qib_max_mcast_grps = 16384;
89*4882a593Smuzhiyun module_param_named(max_mcast_grps, ib_qib_max_mcast_grps, uint, S_IRUGO);
90*4882a593Smuzhiyun MODULE_PARM_DESC(max_mcast_grps,
91*4882a593Smuzhiyun 		 "Maximum number of multicast groups to support");
92*4882a593Smuzhiyun 
93*4882a593Smuzhiyun unsigned int ib_qib_max_mcast_qp_attached = 16;
94*4882a593Smuzhiyun module_param_named(max_mcast_qp_attached, ib_qib_max_mcast_qp_attached,
95*4882a593Smuzhiyun 		   uint, S_IRUGO);
96*4882a593Smuzhiyun MODULE_PARM_DESC(max_mcast_qp_attached,
97*4882a593Smuzhiyun 		 "Maximum number of attached QPs to support");
98*4882a593Smuzhiyun 
99*4882a593Smuzhiyun unsigned int ib_qib_max_srqs = 1024;
100*4882a593Smuzhiyun module_param_named(max_srqs, ib_qib_max_srqs, uint, S_IRUGO);
101*4882a593Smuzhiyun MODULE_PARM_DESC(max_srqs, "Maximum number of SRQs to support");
102*4882a593Smuzhiyun 
103*4882a593Smuzhiyun unsigned int ib_qib_max_srq_sges = 128;
104*4882a593Smuzhiyun module_param_named(max_srq_sges, ib_qib_max_srq_sges, uint, S_IRUGO);
105*4882a593Smuzhiyun MODULE_PARM_DESC(max_srq_sges, "Maximum number of SRQ SGEs to support");
106*4882a593Smuzhiyun 
107*4882a593Smuzhiyun unsigned int ib_qib_max_srq_wrs = 0x1FFFF;
108*4882a593Smuzhiyun module_param_named(max_srq_wrs, ib_qib_max_srq_wrs, uint, S_IRUGO);
109*4882a593Smuzhiyun MODULE_PARM_DESC(max_srq_wrs, "Maximum number of SRQ WRs support");
110*4882a593Smuzhiyun 
111*4882a593Smuzhiyun static unsigned int ib_qib_disable_sma;
112*4882a593Smuzhiyun module_param_named(disable_sma, ib_qib_disable_sma, uint, S_IWUSR | S_IRUGO);
113*4882a593Smuzhiyun MODULE_PARM_DESC(disable_sma, "Disable the SMA");
114*4882a593Smuzhiyun 
115*4882a593Smuzhiyun /*
116*4882a593Smuzhiyun  * Translate ib_wr_opcode into ib_wc_opcode.
117*4882a593Smuzhiyun  */
118*4882a593Smuzhiyun const enum ib_wc_opcode ib_qib_wc_opcode[] = {
119*4882a593Smuzhiyun 	[IB_WR_RDMA_WRITE] = IB_WC_RDMA_WRITE,
120*4882a593Smuzhiyun 	[IB_WR_RDMA_WRITE_WITH_IMM] = IB_WC_RDMA_WRITE,
121*4882a593Smuzhiyun 	[IB_WR_SEND] = IB_WC_SEND,
122*4882a593Smuzhiyun 	[IB_WR_SEND_WITH_IMM] = IB_WC_SEND,
123*4882a593Smuzhiyun 	[IB_WR_RDMA_READ] = IB_WC_RDMA_READ,
124*4882a593Smuzhiyun 	[IB_WR_ATOMIC_CMP_AND_SWP] = IB_WC_COMP_SWAP,
125*4882a593Smuzhiyun 	[IB_WR_ATOMIC_FETCH_AND_ADD] = IB_WC_FETCH_ADD
126*4882a593Smuzhiyun };
127*4882a593Smuzhiyun 
128*4882a593Smuzhiyun /*
129*4882a593Smuzhiyun  * System image GUID.
130*4882a593Smuzhiyun  */
131*4882a593Smuzhiyun __be64 ib_qib_sys_image_guid;
132*4882a593Smuzhiyun 
133*4882a593Smuzhiyun /*
134*4882a593Smuzhiyun  * Count the number of DMA descriptors needed to send length bytes of data.
135*4882a593Smuzhiyun  * Don't modify the qib_sge_state to get the count.
136*4882a593Smuzhiyun  * Return zero if any of the segments is not aligned.
137*4882a593Smuzhiyun  */
qib_count_sge(struct rvt_sge_state * ss,u32 length)138*4882a593Smuzhiyun static u32 qib_count_sge(struct rvt_sge_state *ss, u32 length)
139*4882a593Smuzhiyun {
140*4882a593Smuzhiyun 	struct rvt_sge *sg_list = ss->sg_list;
141*4882a593Smuzhiyun 	struct rvt_sge sge = ss->sge;
142*4882a593Smuzhiyun 	u8 num_sge = ss->num_sge;
143*4882a593Smuzhiyun 	u32 ndesc = 1;  /* count the header */
144*4882a593Smuzhiyun 
145*4882a593Smuzhiyun 	while (length) {
146*4882a593Smuzhiyun 		u32 len = rvt_get_sge_length(&sge, length);
147*4882a593Smuzhiyun 
148*4882a593Smuzhiyun 		if (((long) sge.vaddr & (sizeof(u32) - 1)) ||
149*4882a593Smuzhiyun 		    (len != length && (len & (sizeof(u32) - 1)))) {
150*4882a593Smuzhiyun 			ndesc = 0;
151*4882a593Smuzhiyun 			break;
152*4882a593Smuzhiyun 		}
153*4882a593Smuzhiyun 		ndesc++;
154*4882a593Smuzhiyun 		sge.vaddr += len;
155*4882a593Smuzhiyun 		sge.length -= len;
156*4882a593Smuzhiyun 		sge.sge_length -= len;
157*4882a593Smuzhiyun 		if (sge.sge_length == 0) {
158*4882a593Smuzhiyun 			if (--num_sge)
159*4882a593Smuzhiyun 				sge = *sg_list++;
160*4882a593Smuzhiyun 		} else if (sge.length == 0 && sge.mr->lkey) {
161*4882a593Smuzhiyun 			if (++sge.n >= RVT_SEGSZ) {
162*4882a593Smuzhiyun 				if (++sge.m >= sge.mr->mapsz)
163*4882a593Smuzhiyun 					break;
164*4882a593Smuzhiyun 				sge.n = 0;
165*4882a593Smuzhiyun 			}
166*4882a593Smuzhiyun 			sge.vaddr =
167*4882a593Smuzhiyun 				sge.mr->map[sge.m]->segs[sge.n].vaddr;
168*4882a593Smuzhiyun 			sge.length =
169*4882a593Smuzhiyun 				sge.mr->map[sge.m]->segs[sge.n].length;
170*4882a593Smuzhiyun 		}
171*4882a593Smuzhiyun 		length -= len;
172*4882a593Smuzhiyun 	}
173*4882a593Smuzhiyun 	return ndesc;
174*4882a593Smuzhiyun }
175*4882a593Smuzhiyun 
176*4882a593Smuzhiyun /*
177*4882a593Smuzhiyun  * Copy from the SGEs to the data buffer.
178*4882a593Smuzhiyun  */
qib_copy_from_sge(void * data,struct rvt_sge_state * ss,u32 length)179*4882a593Smuzhiyun static void qib_copy_from_sge(void *data, struct rvt_sge_state *ss, u32 length)
180*4882a593Smuzhiyun {
181*4882a593Smuzhiyun 	struct rvt_sge *sge = &ss->sge;
182*4882a593Smuzhiyun 
183*4882a593Smuzhiyun 	while (length) {
184*4882a593Smuzhiyun 		u32 len = rvt_get_sge_length(sge, length);
185*4882a593Smuzhiyun 
186*4882a593Smuzhiyun 		memcpy(data, sge->vaddr, len);
187*4882a593Smuzhiyun 		sge->vaddr += len;
188*4882a593Smuzhiyun 		sge->length -= len;
189*4882a593Smuzhiyun 		sge->sge_length -= len;
190*4882a593Smuzhiyun 		if (sge->sge_length == 0) {
191*4882a593Smuzhiyun 			if (--ss->num_sge)
192*4882a593Smuzhiyun 				*sge = *ss->sg_list++;
193*4882a593Smuzhiyun 		} else if (sge->length == 0 && sge->mr->lkey) {
194*4882a593Smuzhiyun 			if (++sge->n >= RVT_SEGSZ) {
195*4882a593Smuzhiyun 				if (++sge->m >= sge->mr->mapsz)
196*4882a593Smuzhiyun 					break;
197*4882a593Smuzhiyun 				sge->n = 0;
198*4882a593Smuzhiyun 			}
199*4882a593Smuzhiyun 			sge->vaddr =
200*4882a593Smuzhiyun 				sge->mr->map[sge->m]->segs[sge->n].vaddr;
201*4882a593Smuzhiyun 			sge->length =
202*4882a593Smuzhiyun 				sge->mr->map[sge->m]->segs[sge->n].length;
203*4882a593Smuzhiyun 		}
204*4882a593Smuzhiyun 		data += len;
205*4882a593Smuzhiyun 		length -= len;
206*4882a593Smuzhiyun 	}
207*4882a593Smuzhiyun }
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun /**
210*4882a593Smuzhiyun  * qib_qp_rcv - processing an incoming packet on a QP
211*4882a593Smuzhiyun  * @rcd: the context pointer
212*4882a593Smuzhiyun  * @hdr: the packet header
213*4882a593Smuzhiyun  * @has_grh: true if the packet has a GRH
214*4882a593Smuzhiyun  * @data: the packet data
215*4882a593Smuzhiyun  * @tlen: the packet length
216*4882a593Smuzhiyun  * @qp: the QP the packet came on
217*4882a593Smuzhiyun  *
218*4882a593Smuzhiyun  * This is called from qib_ib_rcv() to process an incoming packet
219*4882a593Smuzhiyun  * for the given QP.
220*4882a593Smuzhiyun  * Called at interrupt level.
221*4882a593Smuzhiyun  */
qib_qp_rcv(struct qib_ctxtdata * rcd,struct ib_header * hdr,int has_grh,void * data,u32 tlen,struct rvt_qp * qp)222*4882a593Smuzhiyun static void qib_qp_rcv(struct qib_ctxtdata *rcd, struct ib_header *hdr,
223*4882a593Smuzhiyun 		       int has_grh, void *data, u32 tlen, struct rvt_qp *qp)
224*4882a593Smuzhiyun {
225*4882a593Smuzhiyun 	struct qib_ibport *ibp = &rcd->ppd->ibport_data;
226*4882a593Smuzhiyun 
227*4882a593Smuzhiyun 	spin_lock(&qp->r_lock);
228*4882a593Smuzhiyun 
229*4882a593Smuzhiyun 	/* Check for valid receive state. */
230*4882a593Smuzhiyun 	if (!(ib_rvt_state_ops[qp->state] & RVT_PROCESS_RECV_OK)) {
231*4882a593Smuzhiyun 		ibp->rvp.n_pkt_drops++;
232*4882a593Smuzhiyun 		goto unlock;
233*4882a593Smuzhiyun 	}
234*4882a593Smuzhiyun 
235*4882a593Smuzhiyun 	switch (qp->ibqp.qp_type) {
236*4882a593Smuzhiyun 	case IB_QPT_SMI:
237*4882a593Smuzhiyun 	case IB_QPT_GSI:
238*4882a593Smuzhiyun 		if (ib_qib_disable_sma)
239*4882a593Smuzhiyun 			break;
240*4882a593Smuzhiyun 		fallthrough;
241*4882a593Smuzhiyun 	case IB_QPT_UD:
242*4882a593Smuzhiyun 		qib_ud_rcv(ibp, hdr, has_grh, data, tlen, qp);
243*4882a593Smuzhiyun 		break;
244*4882a593Smuzhiyun 
245*4882a593Smuzhiyun 	case IB_QPT_RC:
246*4882a593Smuzhiyun 		qib_rc_rcv(rcd, hdr, has_grh, data, tlen, qp);
247*4882a593Smuzhiyun 		break;
248*4882a593Smuzhiyun 
249*4882a593Smuzhiyun 	case IB_QPT_UC:
250*4882a593Smuzhiyun 		qib_uc_rcv(ibp, hdr, has_grh, data, tlen, qp);
251*4882a593Smuzhiyun 		break;
252*4882a593Smuzhiyun 
253*4882a593Smuzhiyun 	default:
254*4882a593Smuzhiyun 		break;
255*4882a593Smuzhiyun 	}
256*4882a593Smuzhiyun 
257*4882a593Smuzhiyun unlock:
258*4882a593Smuzhiyun 	spin_unlock(&qp->r_lock);
259*4882a593Smuzhiyun }
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun /**
262*4882a593Smuzhiyun  * qib_ib_rcv - process an incoming packet
263*4882a593Smuzhiyun  * @rcd: the context pointer
264*4882a593Smuzhiyun  * @rhdr: the header of the packet
265*4882a593Smuzhiyun  * @data: the packet payload
266*4882a593Smuzhiyun  * @tlen: the packet length
267*4882a593Smuzhiyun  *
268*4882a593Smuzhiyun  * This is called from qib_kreceive() to process an incoming packet at
269*4882a593Smuzhiyun  * interrupt level. Tlen is the length of the header + data + CRC in bytes.
270*4882a593Smuzhiyun  */
qib_ib_rcv(struct qib_ctxtdata * rcd,void * rhdr,void * data,u32 tlen)271*4882a593Smuzhiyun void qib_ib_rcv(struct qib_ctxtdata *rcd, void *rhdr, void *data, u32 tlen)
272*4882a593Smuzhiyun {
273*4882a593Smuzhiyun 	struct qib_pportdata *ppd = rcd->ppd;
274*4882a593Smuzhiyun 	struct qib_ibport *ibp = &ppd->ibport_data;
275*4882a593Smuzhiyun 	struct ib_header *hdr = rhdr;
276*4882a593Smuzhiyun 	struct qib_devdata *dd = ppd->dd;
277*4882a593Smuzhiyun 	struct rvt_dev_info *rdi = &dd->verbs_dev.rdi;
278*4882a593Smuzhiyun 	struct ib_other_headers *ohdr;
279*4882a593Smuzhiyun 	struct rvt_qp *qp;
280*4882a593Smuzhiyun 	u32 qp_num;
281*4882a593Smuzhiyun 	int lnh;
282*4882a593Smuzhiyun 	u8 opcode;
283*4882a593Smuzhiyun 	u16 lid;
284*4882a593Smuzhiyun 
285*4882a593Smuzhiyun 	/* 24 == LRH+BTH+CRC */
286*4882a593Smuzhiyun 	if (unlikely(tlen < 24))
287*4882a593Smuzhiyun 		goto drop;
288*4882a593Smuzhiyun 
289*4882a593Smuzhiyun 	/* Check for a valid destination LID (see ch. 7.11.1). */
290*4882a593Smuzhiyun 	lid = be16_to_cpu(hdr->lrh[1]);
291*4882a593Smuzhiyun 	if (lid < be16_to_cpu(IB_MULTICAST_LID_BASE)) {
292*4882a593Smuzhiyun 		lid &= ~((1 << ppd->lmc) - 1);
293*4882a593Smuzhiyun 		if (unlikely(lid != ppd->lid))
294*4882a593Smuzhiyun 			goto drop;
295*4882a593Smuzhiyun 	}
296*4882a593Smuzhiyun 
297*4882a593Smuzhiyun 	/* Check for GRH */
298*4882a593Smuzhiyun 	lnh = be16_to_cpu(hdr->lrh[0]) & 3;
299*4882a593Smuzhiyun 	if (lnh == QIB_LRH_BTH)
300*4882a593Smuzhiyun 		ohdr = &hdr->u.oth;
301*4882a593Smuzhiyun 	else if (lnh == QIB_LRH_GRH) {
302*4882a593Smuzhiyun 		u32 vtf;
303*4882a593Smuzhiyun 
304*4882a593Smuzhiyun 		ohdr = &hdr->u.l.oth;
305*4882a593Smuzhiyun 		if (hdr->u.l.grh.next_hdr != IB_GRH_NEXT_HDR)
306*4882a593Smuzhiyun 			goto drop;
307*4882a593Smuzhiyun 		vtf = be32_to_cpu(hdr->u.l.grh.version_tclass_flow);
308*4882a593Smuzhiyun 		if ((vtf >> IB_GRH_VERSION_SHIFT) != IB_GRH_VERSION)
309*4882a593Smuzhiyun 			goto drop;
310*4882a593Smuzhiyun 	} else
311*4882a593Smuzhiyun 		goto drop;
312*4882a593Smuzhiyun 
313*4882a593Smuzhiyun 	opcode = (be32_to_cpu(ohdr->bth[0]) >> 24) & 0x7f;
314*4882a593Smuzhiyun #ifdef CONFIG_DEBUG_FS
315*4882a593Smuzhiyun 	rcd->opstats->stats[opcode].n_bytes += tlen;
316*4882a593Smuzhiyun 	rcd->opstats->stats[opcode].n_packets++;
317*4882a593Smuzhiyun #endif
318*4882a593Smuzhiyun 
319*4882a593Smuzhiyun 	/* Get the destination QP number. */
320*4882a593Smuzhiyun 	qp_num = be32_to_cpu(ohdr->bth[1]) & RVT_QPN_MASK;
321*4882a593Smuzhiyun 	if (qp_num == QIB_MULTICAST_QPN) {
322*4882a593Smuzhiyun 		struct rvt_mcast *mcast;
323*4882a593Smuzhiyun 		struct rvt_mcast_qp *p;
324*4882a593Smuzhiyun 
325*4882a593Smuzhiyun 		if (lnh != QIB_LRH_GRH)
326*4882a593Smuzhiyun 			goto drop;
327*4882a593Smuzhiyun 		mcast = rvt_mcast_find(&ibp->rvp, &hdr->u.l.grh.dgid, lid);
328*4882a593Smuzhiyun 		if (mcast == NULL)
329*4882a593Smuzhiyun 			goto drop;
330*4882a593Smuzhiyun 		this_cpu_inc(ibp->pmastats->n_multicast_rcv);
331*4882a593Smuzhiyun 		rcu_read_lock();
332*4882a593Smuzhiyun 		list_for_each_entry_rcu(p, &mcast->qp_list, list)
333*4882a593Smuzhiyun 			qib_qp_rcv(rcd, hdr, 1, data, tlen, p->qp);
334*4882a593Smuzhiyun 		rcu_read_unlock();
335*4882a593Smuzhiyun 		/*
336*4882a593Smuzhiyun 		 * Notify rvt_multicast_detach() if it is waiting for us
337*4882a593Smuzhiyun 		 * to finish.
338*4882a593Smuzhiyun 		 */
339*4882a593Smuzhiyun 		if (atomic_dec_return(&mcast->refcount) <= 1)
340*4882a593Smuzhiyun 			wake_up(&mcast->wait);
341*4882a593Smuzhiyun 	} else {
342*4882a593Smuzhiyun 		rcu_read_lock();
343*4882a593Smuzhiyun 		qp = rvt_lookup_qpn(rdi, &ibp->rvp, qp_num);
344*4882a593Smuzhiyun 		if (!qp) {
345*4882a593Smuzhiyun 			rcu_read_unlock();
346*4882a593Smuzhiyun 			goto drop;
347*4882a593Smuzhiyun 		}
348*4882a593Smuzhiyun 		this_cpu_inc(ibp->pmastats->n_unicast_rcv);
349*4882a593Smuzhiyun 		qib_qp_rcv(rcd, hdr, lnh == QIB_LRH_GRH, data, tlen, qp);
350*4882a593Smuzhiyun 		rcu_read_unlock();
351*4882a593Smuzhiyun 	}
352*4882a593Smuzhiyun 	return;
353*4882a593Smuzhiyun 
354*4882a593Smuzhiyun drop:
355*4882a593Smuzhiyun 	ibp->rvp.n_pkt_drops++;
356*4882a593Smuzhiyun }
357*4882a593Smuzhiyun 
358*4882a593Smuzhiyun /*
359*4882a593Smuzhiyun  * This is called from a timer to check for QPs
360*4882a593Smuzhiyun  * which need kernel memory in order to send a packet.
361*4882a593Smuzhiyun  */
mem_timer(struct timer_list * t)362*4882a593Smuzhiyun static void mem_timer(struct timer_list *t)
363*4882a593Smuzhiyun {
364*4882a593Smuzhiyun 	struct qib_ibdev *dev = from_timer(dev, t, mem_timer);
365*4882a593Smuzhiyun 	struct list_head *list = &dev->memwait;
366*4882a593Smuzhiyun 	struct rvt_qp *qp = NULL;
367*4882a593Smuzhiyun 	struct qib_qp_priv *priv = NULL;
368*4882a593Smuzhiyun 	unsigned long flags;
369*4882a593Smuzhiyun 
370*4882a593Smuzhiyun 	spin_lock_irqsave(&dev->rdi.pending_lock, flags);
371*4882a593Smuzhiyun 	if (!list_empty(list)) {
372*4882a593Smuzhiyun 		priv = list_entry(list->next, struct qib_qp_priv, iowait);
373*4882a593Smuzhiyun 		qp = priv->owner;
374*4882a593Smuzhiyun 		list_del_init(&priv->iowait);
375*4882a593Smuzhiyun 		rvt_get_qp(qp);
376*4882a593Smuzhiyun 		if (!list_empty(list))
377*4882a593Smuzhiyun 			mod_timer(&dev->mem_timer, jiffies + 1);
378*4882a593Smuzhiyun 	}
379*4882a593Smuzhiyun 	spin_unlock_irqrestore(&dev->rdi.pending_lock, flags);
380*4882a593Smuzhiyun 
381*4882a593Smuzhiyun 	if (qp) {
382*4882a593Smuzhiyun 		spin_lock_irqsave(&qp->s_lock, flags);
383*4882a593Smuzhiyun 		if (qp->s_flags & RVT_S_WAIT_KMEM) {
384*4882a593Smuzhiyun 			qp->s_flags &= ~RVT_S_WAIT_KMEM;
385*4882a593Smuzhiyun 			qib_schedule_send(qp);
386*4882a593Smuzhiyun 		}
387*4882a593Smuzhiyun 		spin_unlock_irqrestore(&qp->s_lock, flags);
388*4882a593Smuzhiyun 		rvt_put_qp(qp);
389*4882a593Smuzhiyun 	}
390*4882a593Smuzhiyun }
391*4882a593Smuzhiyun 
392*4882a593Smuzhiyun #ifdef __LITTLE_ENDIAN
get_upper_bits(u32 data,u32 shift)393*4882a593Smuzhiyun static inline u32 get_upper_bits(u32 data, u32 shift)
394*4882a593Smuzhiyun {
395*4882a593Smuzhiyun 	return data >> shift;
396*4882a593Smuzhiyun }
397*4882a593Smuzhiyun 
set_upper_bits(u32 data,u32 shift)398*4882a593Smuzhiyun static inline u32 set_upper_bits(u32 data, u32 shift)
399*4882a593Smuzhiyun {
400*4882a593Smuzhiyun 	return data << shift;
401*4882a593Smuzhiyun }
402*4882a593Smuzhiyun 
clear_upper_bytes(u32 data,u32 n,u32 off)403*4882a593Smuzhiyun static inline u32 clear_upper_bytes(u32 data, u32 n, u32 off)
404*4882a593Smuzhiyun {
405*4882a593Smuzhiyun 	data <<= ((sizeof(u32) - n) * BITS_PER_BYTE);
406*4882a593Smuzhiyun 	data >>= ((sizeof(u32) - n - off) * BITS_PER_BYTE);
407*4882a593Smuzhiyun 	return data;
408*4882a593Smuzhiyun }
409*4882a593Smuzhiyun #else
get_upper_bits(u32 data,u32 shift)410*4882a593Smuzhiyun static inline u32 get_upper_bits(u32 data, u32 shift)
411*4882a593Smuzhiyun {
412*4882a593Smuzhiyun 	return data << shift;
413*4882a593Smuzhiyun }
414*4882a593Smuzhiyun 
set_upper_bits(u32 data,u32 shift)415*4882a593Smuzhiyun static inline u32 set_upper_bits(u32 data, u32 shift)
416*4882a593Smuzhiyun {
417*4882a593Smuzhiyun 	return data >> shift;
418*4882a593Smuzhiyun }
419*4882a593Smuzhiyun 
clear_upper_bytes(u32 data,u32 n,u32 off)420*4882a593Smuzhiyun static inline u32 clear_upper_bytes(u32 data, u32 n, u32 off)
421*4882a593Smuzhiyun {
422*4882a593Smuzhiyun 	data >>= ((sizeof(u32) - n) * BITS_PER_BYTE);
423*4882a593Smuzhiyun 	data <<= ((sizeof(u32) - n - off) * BITS_PER_BYTE);
424*4882a593Smuzhiyun 	return data;
425*4882a593Smuzhiyun }
426*4882a593Smuzhiyun #endif
427*4882a593Smuzhiyun 
copy_io(u32 __iomem * piobuf,struct rvt_sge_state * ss,u32 length,unsigned flush_wc)428*4882a593Smuzhiyun static void copy_io(u32 __iomem *piobuf, struct rvt_sge_state *ss,
429*4882a593Smuzhiyun 		    u32 length, unsigned flush_wc)
430*4882a593Smuzhiyun {
431*4882a593Smuzhiyun 	u32 extra = 0;
432*4882a593Smuzhiyun 	u32 data = 0;
433*4882a593Smuzhiyun 	u32 last;
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun 	while (1) {
436*4882a593Smuzhiyun 		u32 len = rvt_get_sge_length(&ss->sge, length);
437*4882a593Smuzhiyun 		u32 off;
438*4882a593Smuzhiyun 
439*4882a593Smuzhiyun 		/* If the source address is not aligned, try to align it. */
440*4882a593Smuzhiyun 		off = (unsigned long)ss->sge.vaddr & (sizeof(u32) - 1);
441*4882a593Smuzhiyun 		if (off) {
442*4882a593Smuzhiyun 			u32 *addr = (u32 *)((unsigned long)ss->sge.vaddr &
443*4882a593Smuzhiyun 					    ~(sizeof(u32) - 1));
444*4882a593Smuzhiyun 			u32 v = get_upper_bits(*addr, off * BITS_PER_BYTE);
445*4882a593Smuzhiyun 			u32 y;
446*4882a593Smuzhiyun 
447*4882a593Smuzhiyun 			y = sizeof(u32) - off;
448*4882a593Smuzhiyun 			if (len > y)
449*4882a593Smuzhiyun 				len = y;
450*4882a593Smuzhiyun 			if (len + extra >= sizeof(u32)) {
451*4882a593Smuzhiyun 				data |= set_upper_bits(v, extra *
452*4882a593Smuzhiyun 						       BITS_PER_BYTE);
453*4882a593Smuzhiyun 				len = sizeof(u32) - extra;
454*4882a593Smuzhiyun 				if (len == length) {
455*4882a593Smuzhiyun 					last = data;
456*4882a593Smuzhiyun 					break;
457*4882a593Smuzhiyun 				}
458*4882a593Smuzhiyun 				__raw_writel(data, piobuf);
459*4882a593Smuzhiyun 				piobuf++;
460*4882a593Smuzhiyun 				extra = 0;
461*4882a593Smuzhiyun 				data = 0;
462*4882a593Smuzhiyun 			} else {
463*4882a593Smuzhiyun 				/* Clear unused upper bytes */
464*4882a593Smuzhiyun 				data |= clear_upper_bytes(v, len, extra);
465*4882a593Smuzhiyun 				if (len == length) {
466*4882a593Smuzhiyun 					last = data;
467*4882a593Smuzhiyun 					break;
468*4882a593Smuzhiyun 				}
469*4882a593Smuzhiyun 				extra += len;
470*4882a593Smuzhiyun 			}
471*4882a593Smuzhiyun 		} else if (extra) {
472*4882a593Smuzhiyun 			/* Source address is aligned. */
473*4882a593Smuzhiyun 			u32 *addr = (u32 *) ss->sge.vaddr;
474*4882a593Smuzhiyun 			int shift = extra * BITS_PER_BYTE;
475*4882a593Smuzhiyun 			int ushift = 32 - shift;
476*4882a593Smuzhiyun 			u32 l = len;
477*4882a593Smuzhiyun 
478*4882a593Smuzhiyun 			while (l >= sizeof(u32)) {
479*4882a593Smuzhiyun 				u32 v = *addr;
480*4882a593Smuzhiyun 
481*4882a593Smuzhiyun 				data |= set_upper_bits(v, shift);
482*4882a593Smuzhiyun 				__raw_writel(data, piobuf);
483*4882a593Smuzhiyun 				data = get_upper_bits(v, ushift);
484*4882a593Smuzhiyun 				piobuf++;
485*4882a593Smuzhiyun 				addr++;
486*4882a593Smuzhiyun 				l -= sizeof(u32);
487*4882a593Smuzhiyun 			}
488*4882a593Smuzhiyun 			/*
489*4882a593Smuzhiyun 			 * We still have 'extra' number of bytes leftover.
490*4882a593Smuzhiyun 			 */
491*4882a593Smuzhiyun 			if (l) {
492*4882a593Smuzhiyun 				u32 v = *addr;
493*4882a593Smuzhiyun 
494*4882a593Smuzhiyun 				if (l + extra >= sizeof(u32)) {
495*4882a593Smuzhiyun 					data |= set_upper_bits(v, shift);
496*4882a593Smuzhiyun 					len -= l + extra - sizeof(u32);
497*4882a593Smuzhiyun 					if (len == length) {
498*4882a593Smuzhiyun 						last = data;
499*4882a593Smuzhiyun 						break;
500*4882a593Smuzhiyun 					}
501*4882a593Smuzhiyun 					__raw_writel(data, piobuf);
502*4882a593Smuzhiyun 					piobuf++;
503*4882a593Smuzhiyun 					extra = 0;
504*4882a593Smuzhiyun 					data = 0;
505*4882a593Smuzhiyun 				} else {
506*4882a593Smuzhiyun 					/* Clear unused upper bytes */
507*4882a593Smuzhiyun 					data |= clear_upper_bytes(v, l, extra);
508*4882a593Smuzhiyun 					if (len == length) {
509*4882a593Smuzhiyun 						last = data;
510*4882a593Smuzhiyun 						break;
511*4882a593Smuzhiyun 					}
512*4882a593Smuzhiyun 					extra += l;
513*4882a593Smuzhiyun 				}
514*4882a593Smuzhiyun 			} else if (len == length) {
515*4882a593Smuzhiyun 				last = data;
516*4882a593Smuzhiyun 				break;
517*4882a593Smuzhiyun 			}
518*4882a593Smuzhiyun 		} else if (len == length) {
519*4882a593Smuzhiyun 			u32 w;
520*4882a593Smuzhiyun 
521*4882a593Smuzhiyun 			/*
522*4882a593Smuzhiyun 			 * Need to round up for the last dword in the
523*4882a593Smuzhiyun 			 * packet.
524*4882a593Smuzhiyun 			 */
525*4882a593Smuzhiyun 			w = (len + 3) >> 2;
526*4882a593Smuzhiyun 			qib_pio_copy(piobuf, ss->sge.vaddr, w - 1);
527*4882a593Smuzhiyun 			piobuf += w - 1;
528*4882a593Smuzhiyun 			last = ((u32 *) ss->sge.vaddr)[w - 1];
529*4882a593Smuzhiyun 			break;
530*4882a593Smuzhiyun 		} else {
531*4882a593Smuzhiyun 			u32 w = len >> 2;
532*4882a593Smuzhiyun 
533*4882a593Smuzhiyun 			qib_pio_copy(piobuf, ss->sge.vaddr, w);
534*4882a593Smuzhiyun 			piobuf += w;
535*4882a593Smuzhiyun 
536*4882a593Smuzhiyun 			extra = len & (sizeof(u32) - 1);
537*4882a593Smuzhiyun 			if (extra) {
538*4882a593Smuzhiyun 				u32 v = ((u32 *) ss->sge.vaddr)[w];
539*4882a593Smuzhiyun 
540*4882a593Smuzhiyun 				/* Clear unused upper bytes */
541*4882a593Smuzhiyun 				data = clear_upper_bytes(v, extra, 0);
542*4882a593Smuzhiyun 			}
543*4882a593Smuzhiyun 		}
544*4882a593Smuzhiyun 		rvt_update_sge(ss, len, false);
545*4882a593Smuzhiyun 		length -= len;
546*4882a593Smuzhiyun 	}
547*4882a593Smuzhiyun 	/* Update address before sending packet. */
548*4882a593Smuzhiyun 	rvt_update_sge(ss, length, false);
549*4882a593Smuzhiyun 	if (flush_wc) {
550*4882a593Smuzhiyun 		/* must flush early everything before trigger word */
551*4882a593Smuzhiyun 		qib_flush_wc();
552*4882a593Smuzhiyun 		__raw_writel(last, piobuf);
553*4882a593Smuzhiyun 		/* be sure trigger word is written */
554*4882a593Smuzhiyun 		qib_flush_wc();
555*4882a593Smuzhiyun 	} else
556*4882a593Smuzhiyun 		__raw_writel(last, piobuf);
557*4882a593Smuzhiyun }
558*4882a593Smuzhiyun 
__get_txreq(struct qib_ibdev * dev,struct rvt_qp * qp)559*4882a593Smuzhiyun static noinline struct qib_verbs_txreq *__get_txreq(struct qib_ibdev *dev,
560*4882a593Smuzhiyun 					   struct rvt_qp *qp)
561*4882a593Smuzhiyun {
562*4882a593Smuzhiyun 	struct qib_qp_priv *priv = qp->priv;
563*4882a593Smuzhiyun 	struct qib_verbs_txreq *tx;
564*4882a593Smuzhiyun 	unsigned long flags;
565*4882a593Smuzhiyun 
566*4882a593Smuzhiyun 	spin_lock_irqsave(&qp->s_lock, flags);
567*4882a593Smuzhiyun 	spin_lock(&dev->rdi.pending_lock);
568*4882a593Smuzhiyun 
569*4882a593Smuzhiyun 	if (!list_empty(&dev->txreq_free)) {
570*4882a593Smuzhiyun 		struct list_head *l = dev->txreq_free.next;
571*4882a593Smuzhiyun 
572*4882a593Smuzhiyun 		list_del(l);
573*4882a593Smuzhiyun 		spin_unlock(&dev->rdi.pending_lock);
574*4882a593Smuzhiyun 		spin_unlock_irqrestore(&qp->s_lock, flags);
575*4882a593Smuzhiyun 		tx = list_entry(l, struct qib_verbs_txreq, txreq.list);
576*4882a593Smuzhiyun 	} else {
577*4882a593Smuzhiyun 		if (ib_rvt_state_ops[qp->state] & RVT_PROCESS_RECV_OK &&
578*4882a593Smuzhiyun 		    list_empty(&priv->iowait)) {
579*4882a593Smuzhiyun 			dev->n_txwait++;
580*4882a593Smuzhiyun 			qp->s_flags |= RVT_S_WAIT_TX;
581*4882a593Smuzhiyun 			list_add_tail(&priv->iowait, &dev->txwait);
582*4882a593Smuzhiyun 		}
583*4882a593Smuzhiyun 		qp->s_flags &= ~RVT_S_BUSY;
584*4882a593Smuzhiyun 		spin_unlock(&dev->rdi.pending_lock);
585*4882a593Smuzhiyun 		spin_unlock_irqrestore(&qp->s_lock, flags);
586*4882a593Smuzhiyun 		tx = ERR_PTR(-EBUSY);
587*4882a593Smuzhiyun 	}
588*4882a593Smuzhiyun 	return tx;
589*4882a593Smuzhiyun }
590*4882a593Smuzhiyun 
get_txreq(struct qib_ibdev * dev,struct rvt_qp * qp)591*4882a593Smuzhiyun static inline struct qib_verbs_txreq *get_txreq(struct qib_ibdev *dev,
592*4882a593Smuzhiyun 					 struct rvt_qp *qp)
593*4882a593Smuzhiyun {
594*4882a593Smuzhiyun 	struct qib_verbs_txreq *tx;
595*4882a593Smuzhiyun 	unsigned long flags;
596*4882a593Smuzhiyun 
597*4882a593Smuzhiyun 	spin_lock_irqsave(&dev->rdi.pending_lock, flags);
598*4882a593Smuzhiyun 	/* assume the list non empty */
599*4882a593Smuzhiyun 	if (likely(!list_empty(&dev->txreq_free))) {
600*4882a593Smuzhiyun 		struct list_head *l = dev->txreq_free.next;
601*4882a593Smuzhiyun 
602*4882a593Smuzhiyun 		list_del(l);
603*4882a593Smuzhiyun 		spin_unlock_irqrestore(&dev->rdi.pending_lock, flags);
604*4882a593Smuzhiyun 		tx = list_entry(l, struct qib_verbs_txreq, txreq.list);
605*4882a593Smuzhiyun 	} else {
606*4882a593Smuzhiyun 		/* call slow path to get the extra lock */
607*4882a593Smuzhiyun 		spin_unlock_irqrestore(&dev->rdi.pending_lock, flags);
608*4882a593Smuzhiyun 		tx =  __get_txreq(dev, qp);
609*4882a593Smuzhiyun 	}
610*4882a593Smuzhiyun 	return tx;
611*4882a593Smuzhiyun }
612*4882a593Smuzhiyun 
qib_put_txreq(struct qib_verbs_txreq * tx)613*4882a593Smuzhiyun void qib_put_txreq(struct qib_verbs_txreq *tx)
614*4882a593Smuzhiyun {
615*4882a593Smuzhiyun 	struct qib_ibdev *dev;
616*4882a593Smuzhiyun 	struct rvt_qp *qp;
617*4882a593Smuzhiyun 	struct qib_qp_priv *priv;
618*4882a593Smuzhiyun 	unsigned long flags;
619*4882a593Smuzhiyun 
620*4882a593Smuzhiyun 	qp = tx->qp;
621*4882a593Smuzhiyun 	dev = to_idev(qp->ibqp.device);
622*4882a593Smuzhiyun 
623*4882a593Smuzhiyun 	if (tx->mr) {
624*4882a593Smuzhiyun 		rvt_put_mr(tx->mr);
625*4882a593Smuzhiyun 		tx->mr = NULL;
626*4882a593Smuzhiyun 	}
627*4882a593Smuzhiyun 	if (tx->txreq.flags & QIB_SDMA_TXREQ_F_FREEBUF) {
628*4882a593Smuzhiyun 		tx->txreq.flags &= ~QIB_SDMA_TXREQ_F_FREEBUF;
629*4882a593Smuzhiyun 		dma_unmap_single(&dd_from_dev(dev)->pcidev->dev,
630*4882a593Smuzhiyun 				 tx->txreq.addr, tx->hdr_dwords << 2,
631*4882a593Smuzhiyun 				 DMA_TO_DEVICE);
632*4882a593Smuzhiyun 		kfree(tx->align_buf);
633*4882a593Smuzhiyun 	}
634*4882a593Smuzhiyun 
635*4882a593Smuzhiyun 	spin_lock_irqsave(&dev->rdi.pending_lock, flags);
636*4882a593Smuzhiyun 
637*4882a593Smuzhiyun 	/* Put struct back on free list */
638*4882a593Smuzhiyun 	list_add(&tx->txreq.list, &dev->txreq_free);
639*4882a593Smuzhiyun 
640*4882a593Smuzhiyun 	if (!list_empty(&dev->txwait)) {
641*4882a593Smuzhiyun 		/* Wake up first QP wanting a free struct */
642*4882a593Smuzhiyun 		priv = list_entry(dev->txwait.next, struct qib_qp_priv,
643*4882a593Smuzhiyun 				  iowait);
644*4882a593Smuzhiyun 		qp = priv->owner;
645*4882a593Smuzhiyun 		list_del_init(&priv->iowait);
646*4882a593Smuzhiyun 		rvt_get_qp(qp);
647*4882a593Smuzhiyun 		spin_unlock_irqrestore(&dev->rdi.pending_lock, flags);
648*4882a593Smuzhiyun 
649*4882a593Smuzhiyun 		spin_lock_irqsave(&qp->s_lock, flags);
650*4882a593Smuzhiyun 		if (qp->s_flags & RVT_S_WAIT_TX) {
651*4882a593Smuzhiyun 			qp->s_flags &= ~RVT_S_WAIT_TX;
652*4882a593Smuzhiyun 			qib_schedule_send(qp);
653*4882a593Smuzhiyun 		}
654*4882a593Smuzhiyun 		spin_unlock_irqrestore(&qp->s_lock, flags);
655*4882a593Smuzhiyun 
656*4882a593Smuzhiyun 		rvt_put_qp(qp);
657*4882a593Smuzhiyun 	} else
658*4882a593Smuzhiyun 		spin_unlock_irqrestore(&dev->rdi.pending_lock, flags);
659*4882a593Smuzhiyun }
660*4882a593Smuzhiyun 
661*4882a593Smuzhiyun /*
662*4882a593Smuzhiyun  * This is called when there are send DMA descriptors that might be
663*4882a593Smuzhiyun  * available.
664*4882a593Smuzhiyun  *
665*4882a593Smuzhiyun  * This is called with ppd->sdma_lock held.
666*4882a593Smuzhiyun  */
qib_verbs_sdma_desc_avail(struct qib_pportdata * ppd,unsigned avail)667*4882a593Smuzhiyun void qib_verbs_sdma_desc_avail(struct qib_pportdata *ppd, unsigned avail)
668*4882a593Smuzhiyun {
669*4882a593Smuzhiyun 	struct rvt_qp *qp;
670*4882a593Smuzhiyun 	struct qib_qp_priv *qpp, *nqpp;
671*4882a593Smuzhiyun 	struct rvt_qp *qps[20];
672*4882a593Smuzhiyun 	struct qib_ibdev *dev;
673*4882a593Smuzhiyun 	unsigned i, n;
674*4882a593Smuzhiyun 
675*4882a593Smuzhiyun 	n = 0;
676*4882a593Smuzhiyun 	dev = &ppd->dd->verbs_dev;
677*4882a593Smuzhiyun 	spin_lock(&dev->rdi.pending_lock);
678*4882a593Smuzhiyun 
679*4882a593Smuzhiyun 	/* Search wait list for first QP wanting DMA descriptors. */
680*4882a593Smuzhiyun 	list_for_each_entry_safe(qpp, nqpp, &dev->dmawait, iowait) {
681*4882a593Smuzhiyun 		qp = qpp->owner;
682*4882a593Smuzhiyun 		if (qp->port_num != ppd->port)
683*4882a593Smuzhiyun 			continue;
684*4882a593Smuzhiyun 		if (n == ARRAY_SIZE(qps))
685*4882a593Smuzhiyun 			break;
686*4882a593Smuzhiyun 		if (qpp->s_tx->txreq.sg_count > avail)
687*4882a593Smuzhiyun 			break;
688*4882a593Smuzhiyun 		avail -= qpp->s_tx->txreq.sg_count;
689*4882a593Smuzhiyun 		list_del_init(&qpp->iowait);
690*4882a593Smuzhiyun 		rvt_get_qp(qp);
691*4882a593Smuzhiyun 		qps[n++] = qp;
692*4882a593Smuzhiyun 	}
693*4882a593Smuzhiyun 
694*4882a593Smuzhiyun 	spin_unlock(&dev->rdi.pending_lock);
695*4882a593Smuzhiyun 
696*4882a593Smuzhiyun 	for (i = 0; i < n; i++) {
697*4882a593Smuzhiyun 		qp = qps[i];
698*4882a593Smuzhiyun 		spin_lock(&qp->s_lock);
699*4882a593Smuzhiyun 		if (qp->s_flags & RVT_S_WAIT_DMA_DESC) {
700*4882a593Smuzhiyun 			qp->s_flags &= ~RVT_S_WAIT_DMA_DESC;
701*4882a593Smuzhiyun 			qib_schedule_send(qp);
702*4882a593Smuzhiyun 		}
703*4882a593Smuzhiyun 		spin_unlock(&qp->s_lock);
704*4882a593Smuzhiyun 		rvt_put_qp(qp);
705*4882a593Smuzhiyun 	}
706*4882a593Smuzhiyun }
707*4882a593Smuzhiyun 
708*4882a593Smuzhiyun /*
709*4882a593Smuzhiyun  * This is called with ppd->sdma_lock held.
710*4882a593Smuzhiyun  */
sdma_complete(struct qib_sdma_txreq * cookie,int status)711*4882a593Smuzhiyun static void sdma_complete(struct qib_sdma_txreq *cookie, int status)
712*4882a593Smuzhiyun {
713*4882a593Smuzhiyun 	struct qib_verbs_txreq *tx =
714*4882a593Smuzhiyun 		container_of(cookie, struct qib_verbs_txreq, txreq);
715*4882a593Smuzhiyun 	struct rvt_qp *qp = tx->qp;
716*4882a593Smuzhiyun 	struct qib_qp_priv *priv = qp->priv;
717*4882a593Smuzhiyun 
718*4882a593Smuzhiyun 	spin_lock(&qp->s_lock);
719*4882a593Smuzhiyun 	if (tx->wqe)
720*4882a593Smuzhiyun 		rvt_send_complete(qp, tx->wqe, IB_WC_SUCCESS);
721*4882a593Smuzhiyun 	else if (qp->ibqp.qp_type == IB_QPT_RC) {
722*4882a593Smuzhiyun 		struct ib_header *hdr;
723*4882a593Smuzhiyun 
724*4882a593Smuzhiyun 		if (tx->txreq.flags & QIB_SDMA_TXREQ_F_FREEBUF)
725*4882a593Smuzhiyun 			hdr = &tx->align_buf->hdr;
726*4882a593Smuzhiyun 		else {
727*4882a593Smuzhiyun 			struct qib_ibdev *dev = to_idev(qp->ibqp.device);
728*4882a593Smuzhiyun 
729*4882a593Smuzhiyun 			hdr = &dev->pio_hdrs[tx->hdr_inx].hdr;
730*4882a593Smuzhiyun 		}
731*4882a593Smuzhiyun 		qib_rc_send_complete(qp, hdr);
732*4882a593Smuzhiyun 	}
733*4882a593Smuzhiyun 	if (atomic_dec_and_test(&priv->s_dma_busy)) {
734*4882a593Smuzhiyun 		if (qp->state == IB_QPS_RESET)
735*4882a593Smuzhiyun 			wake_up(&priv->wait_dma);
736*4882a593Smuzhiyun 		else if (qp->s_flags & RVT_S_WAIT_DMA) {
737*4882a593Smuzhiyun 			qp->s_flags &= ~RVT_S_WAIT_DMA;
738*4882a593Smuzhiyun 			qib_schedule_send(qp);
739*4882a593Smuzhiyun 		}
740*4882a593Smuzhiyun 	}
741*4882a593Smuzhiyun 	spin_unlock(&qp->s_lock);
742*4882a593Smuzhiyun 
743*4882a593Smuzhiyun 	qib_put_txreq(tx);
744*4882a593Smuzhiyun }
745*4882a593Smuzhiyun 
wait_kmem(struct qib_ibdev * dev,struct rvt_qp * qp)746*4882a593Smuzhiyun static int wait_kmem(struct qib_ibdev *dev, struct rvt_qp *qp)
747*4882a593Smuzhiyun {
748*4882a593Smuzhiyun 	struct qib_qp_priv *priv = qp->priv;
749*4882a593Smuzhiyun 	unsigned long flags;
750*4882a593Smuzhiyun 	int ret = 0;
751*4882a593Smuzhiyun 
752*4882a593Smuzhiyun 	spin_lock_irqsave(&qp->s_lock, flags);
753*4882a593Smuzhiyun 	if (ib_rvt_state_ops[qp->state] & RVT_PROCESS_RECV_OK) {
754*4882a593Smuzhiyun 		spin_lock(&dev->rdi.pending_lock);
755*4882a593Smuzhiyun 		if (list_empty(&priv->iowait)) {
756*4882a593Smuzhiyun 			if (list_empty(&dev->memwait))
757*4882a593Smuzhiyun 				mod_timer(&dev->mem_timer, jiffies + 1);
758*4882a593Smuzhiyun 			qp->s_flags |= RVT_S_WAIT_KMEM;
759*4882a593Smuzhiyun 			list_add_tail(&priv->iowait, &dev->memwait);
760*4882a593Smuzhiyun 		}
761*4882a593Smuzhiyun 		spin_unlock(&dev->rdi.pending_lock);
762*4882a593Smuzhiyun 		qp->s_flags &= ~RVT_S_BUSY;
763*4882a593Smuzhiyun 		ret = -EBUSY;
764*4882a593Smuzhiyun 	}
765*4882a593Smuzhiyun 	spin_unlock_irqrestore(&qp->s_lock, flags);
766*4882a593Smuzhiyun 
767*4882a593Smuzhiyun 	return ret;
768*4882a593Smuzhiyun }
769*4882a593Smuzhiyun 
qib_verbs_send_dma(struct rvt_qp * qp,struct ib_header * hdr,u32 hdrwords,struct rvt_sge_state * ss,u32 len,u32 plen,u32 dwords)770*4882a593Smuzhiyun static int qib_verbs_send_dma(struct rvt_qp *qp, struct ib_header *hdr,
771*4882a593Smuzhiyun 			      u32 hdrwords, struct rvt_sge_state *ss, u32 len,
772*4882a593Smuzhiyun 			      u32 plen, u32 dwords)
773*4882a593Smuzhiyun {
774*4882a593Smuzhiyun 	struct qib_qp_priv *priv = qp->priv;
775*4882a593Smuzhiyun 	struct qib_ibdev *dev = to_idev(qp->ibqp.device);
776*4882a593Smuzhiyun 	struct qib_devdata *dd = dd_from_dev(dev);
777*4882a593Smuzhiyun 	struct qib_ibport *ibp = to_iport(qp->ibqp.device, qp->port_num);
778*4882a593Smuzhiyun 	struct qib_pportdata *ppd = ppd_from_ibp(ibp);
779*4882a593Smuzhiyun 	struct qib_verbs_txreq *tx;
780*4882a593Smuzhiyun 	struct qib_pio_header *phdr;
781*4882a593Smuzhiyun 	u32 control;
782*4882a593Smuzhiyun 	u32 ndesc;
783*4882a593Smuzhiyun 	int ret;
784*4882a593Smuzhiyun 
785*4882a593Smuzhiyun 	tx = priv->s_tx;
786*4882a593Smuzhiyun 	if (tx) {
787*4882a593Smuzhiyun 		priv->s_tx = NULL;
788*4882a593Smuzhiyun 		/* resend previously constructed packet */
789*4882a593Smuzhiyun 		ret = qib_sdma_verbs_send(ppd, tx->ss, tx->dwords, tx);
790*4882a593Smuzhiyun 		goto bail;
791*4882a593Smuzhiyun 	}
792*4882a593Smuzhiyun 
793*4882a593Smuzhiyun 	tx = get_txreq(dev, qp);
794*4882a593Smuzhiyun 	if (IS_ERR(tx))
795*4882a593Smuzhiyun 		goto bail_tx;
796*4882a593Smuzhiyun 
797*4882a593Smuzhiyun 	control = dd->f_setpbc_control(ppd, plen, qp->s_srate,
798*4882a593Smuzhiyun 				       be16_to_cpu(hdr->lrh[0]) >> 12);
799*4882a593Smuzhiyun 	tx->qp = qp;
800*4882a593Smuzhiyun 	tx->wqe = qp->s_wqe;
801*4882a593Smuzhiyun 	tx->mr = qp->s_rdma_mr;
802*4882a593Smuzhiyun 	if (qp->s_rdma_mr)
803*4882a593Smuzhiyun 		qp->s_rdma_mr = NULL;
804*4882a593Smuzhiyun 	tx->txreq.callback = sdma_complete;
805*4882a593Smuzhiyun 	if (dd->flags & QIB_HAS_SDMA_TIMEOUT)
806*4882a593Smuzhiyun 		tx->txreq.flags = QIB_SDMA_TXREQ_F_HEADTOHOST;
807*4882a593Smuzhiyun 	else
808*4882a593Smuzhiyun 		tx->txreq.flags = QIB_SDMA_TXREQ_F_INTREQ;
809*4882a593Smuzhiyun 	if (plen + 1 > dd->piosize2kmax_dwords)
810*4882a593Smuzhiyun 		tx->txreq.flags |= QIB_SDMA_TXREQ_F_USELARGEBUF;
811*4882a593Smuzhiyun 
812*4882a593Smuzhiyun 	if (len) {
813*4882a593Smuzhiyun 		/*
814*4882a593Smuzhiyun 		 * Don't try to DMA if it takes more descriptors than
815*4882a593Smuzhiyun 		 * the queue holds.
816*4882a593Smuzhiyun 		 */
817*4882a593Smuzhiyun 		ndesc = qib_count_sge(ss, len);
818*4882a593Smuzhiyun 		if (ndesc >= ppd->sdma_descq_cnt)
819*4882a593Smuzhiyun 			ndesc = 0;
820*4882a593Smuzhiyun 	} else
821*4882a593Smuzhiyun 		ndesc = 1;
822*4882a593Smuzhiyun 	if (ndesc) {
823*4882a593Smuzhiyun 		phdr = &dev->pio_hdrs[tx->hdr_inx];
824*4882a593Smuzhiyun 		phdr->pbc[0] = cpu_to_le32(plen);
825*4882a593Smuzhiyun 		phdr->pbc[1] = cpu_to_le32(control);
826*4882a593Smuzhiyun 		memcpy(&phdr->hdr, hdr, hdrwords << 2);
827*4882a593Smuzhiyun 		tx->txreq.flags |= QIB_SDMA_TXREQ_F_FREEDESC;
828*4882a593Smuzhiyun 		tx->txreq.sg_count = ndesc;
829*4882a593Smuzhiyun 		tx->txreq.addr = dev->pio_hdrs_phys +
830*4882a593Smuzhiyun 			tx->hdr_inx * sizeof(struct qib_pio_header);
831*4882a593Smuzhiyun 		tx->hdr_dwords = hdrwords + 2; /* add PBC length */
832*4882a593Smuzhiyun 		ret = qib_sdma_verbs_send(ppd, ss, dwords, tx);
833*4882a593Smuzhiyun 		goto bail;
834*4882a593Smuzhiyun 	}
835*4882a593Smuzhiyun 
836*4882a593Smuzhiyun 	/* Allocate a buffer and copy the header and payload to it. */
837*4882a593Smuzhiyun 	tx->hdr_dwords = plen + 1;
838*4882a593Smuzhiyun 	phdr = kmalloc(tx->hdr_dwords << 2, GFP_ATOMIC);
839*4882a593Smuzhiyun 	if (!phdr)
840*4882a593Smuzhiyun 		goto err_tx;
841*4882a593Smuzhiyun 	phdr->pbc[0] = cpu_to_le32(plen);
842*4882a593Smuzhiyun 	phdr->pbc[1] = cpu_to_le32(control);
843*4882a593Smuzhiyun 	memcpy(&phdr->hdr, hdr, hdrwords << 2);
844*4882a593Smuzhiyun 	qib_copy_from_sge((u32 *) &phdr->hdr + hdrwords, ss, len);
845*4882a593Smuzhiyun 
846*4882a593Smuzhiyun 	tx->txreq.addr = dma_map_single(&dd->pcidev->dev, phdr,
847*4882a593Smuzhiyun 					tx->hdr_dwords << 2, DMA_TO_DEVICE);
848*4882a593Smuzhiyun 	if (dma_mapping_error(&dd->pcidev->dev, tx->txreq.addr))
849*4882a593Smuzhiyun 		goto map_err;
850*4882a593Smuzhiyun 	tx->align_buf = phdr;
851*4882a593Smuzhiyun 	tx->txreq.flags |= QIB_SDMA_TXREQ_F_FREEBUF;
852*4882a593Smuzhiyun 	tx->txreq.sg_count = 1;
853*4882a593Smuzhiyun 	ret = qib_sdma_verbs_send(ppd, NULL, 0, tx);
854*4882a593Smuzhiyun 	goto unaligned;
855*4882a593Smuzhiyun 
856*4882a593Smuzhiyun map_err:
857*4882a593Smuzhiyun 	kfree(phdr);
858*4882a593Smuzhiyun err_tx:
859*4882a593Smuzhiyun 	qib_put_txreq(tx);
860*4882a593Smuzhiyun 	ret = wait_kmem(dev, qp);
861*4882a593Smuzhiyun unaligned:
862*4882a593Smuzhiyun 	ibp->rvp.n_unaligned++;
863*4882a593Smuzhiyun bail:
864*4882a593Smuzhiyun 	return ret;
865*4882a593Smuzhiyun bail_tx:
866*4882a593Smuzhiyun 	ret = PTR_ERR(tx);
867*4882a593Smuzhiyun 	goto bail;
868*4882a593Smuzhiyun }
869*4882a593Smuzhiyun 
870*4882a593Smuzhiyun /*
871*4882a593Smuzhiyun  * If we are now in the error state, return zero to flush the
872*4882a593Smuzhiyun  * send work request.
873*4882a593Smuzhiyun  */
no_bufs_available(struct rvt_qp * qp)874*4882a593Smuzhiyun static int no_bufs_available(struct rvt_qp *qp)
875*4882a593Smuzhiyun {
876*4882a593Smuzhiyun 	struct qib_qp_priv *priv = qp->priv;
877*4882a593Smuzhiyun 	struct qib_ibdev *dev = to_idev(qp->ibqp.device);
878*4882a593Smuzhiyun 	struct qib_devdata *dd;
879*4882a593Smuzhiyun 	unsigned long flags;
880*4882a593Smuzhiyun 	int ret = 0;
881*4882a593Smuzhiyun 
882*4882a593Smuzhiyun 	/*
883*4882a593Smuzhiyun 	 * Note that as soon as want_buffer() is called and
884*4882a593Smuzhiyun 	 * possibly before it returns, qib_ib_piobufavail()
885*4882a593Smuzhiyun 	 * could be called. Therefore, put QP on the I/O wait list before
886*4882a593Smuzhiyun 	 * enabling the PIO avail interrupt.
887*4882a593Smuzhiyun 	 */
888*4882a593Smuzhiyun 	spin_lock_irqsave(&qp->s_lock, flags);
889*4882a593Smuzhiyun 	if (ib_rvt_state_ops[qp->state] & RVT_PROCESS_RECV_OK) {
890*4882a593Smuzhiyun 		spin_lock(&dev->rdi.pending_lock);
891*4882a593Smuzhiyun 		if (list_empty(&priv->iowait)) {
892*4882a593Smuzhiyun 			dev->n_piowait++;
893*4882a593Smuzhiyun 			qp->s_flags |= RVT_S_WAIT_PIO;
894*4882a593Smuzhiyun 			list_add_tail(&priv->iowait, &dev->piowait);
895*4882a593Smuzhiyun 			dd = dd_from_dev(dev);
896*4882a593Smuzhiyun 			dd->f_wantpiobuf_intr(dd, 1);
897*4882a593Smuzhiyun 		}
898*4882a593Smuzhiyun 		spin_unlock(&dev->rdi.pending_lock);
899*4882a593Smuzhiyun 		qp->s_flags &= ~RVT_S_BUSY;
900*4882a593Smuzhiyun 		ret = -EBUSY;
901*4882a593Smuzhiyun 	}
902*4882a593Smuzhiyun 	spin_unlock_irqrestore(&qp->s_lock, flags);
903*4882a593Smuzhiyun 	return ret;
904*4882a593Smuzhiyun }
905*4882a593Smuzhiyun 
qib_verbs_send_pio(struct rvt_qp * qp,struct ib_header * ibhdr,u32 hdrwords,struct rvt_sge_state * ss,u32 len,u32 plen,u32 dwords)906*4882a593Smuzhiyun static int qib_verbs_send_pio(struct rvt_qp *qp, struct ib_header *ibhdr,
907*4882a593Smuzhiyun 			      u32 hdrwords, struct rvt_sge_state *ss, u32 len,
908*4882a593Smuzhiyun 			      u32 plen, u32 dwords)
909*4882a593Smuzhiyun {
910*4882a593Smuzhiyun 	struct qib_devdata *dd = dd_from_ibdev(qp->ibqp.device);
911*4882a593Smuzhiyun 	struct qib_pportdata *ppd = dd->pport + qp->port_num - 1;
912*4882a593Smuzhiyun 	u32 *hdr = (u32 *) ibhdr;
913*4882a593Smuzhiyun 	u32 __iomem *piobuf_orig;
914*4882a593Smuzhiyun 	u32 __iomem *piobuf;
915*4882a593Smuzhiyun 	u64 pbc;
916*4882a593Smuzhiyun 	unsigned long flags;
917*4882a593Smuzhiyun 	unsigned flush_wc;
918*4882a593Smuzhiyun 	u32 control;
919*4882a593Smuzhiyun 	u32 pbufn;
920*4882a593Smuzhiyun 
921*4882a593Smuzhiyun 	control = dd->f_setpbc_control(ppd, plen, qp->s_srate,
922*4882a593Smuzhiyun 		be16_to_cpu(ibhdr->lrh[0]) >> 12);
923*4882a593Smuzhiyun 	pbc = ((u64) control << 32) | plen;
924*4882a593Smuzhiyun 	piobuf = dd->f_getsendbuf(ppd, pbc, &pbufn);
925*4882a593Smuzhiyun 	if (unlikely(piobuf == NULL))
926*4882a593Smuzhiyun 		return no_bufs_available(qp);
927*4882a593Smuzhiyun 
928*4882a593Smuzhiyun 	/*
929*4882a593Smuzhiyun 	 * Write the pbc.
930*4882a593Smuzhiyun 	 * We have to flush after the PBC for correctness on some cpus
931*4882a593Smuzhiyun 	 * or WC buffer can be written out of order.
932*4882a593Smuzhiyun 	 */
933*4882a593Smuzhiyun 	writeq(pbc, piobuf);
934*4882a593Smuzhiyun 	piobuf_orig = piobuf;
935*4882a593Smuzhiyun 	piobuf += 2;
936*4882a593Smuzhiyun 
937*4882a593Smuzhiyun 	flush_wc = dd->flags & QIB_PIO_FLUSH_WC;
938*4882a593Smuzhiyun 	if (len == 0) {
939*4882a593Smuzhiyun 		/*
940*4882a593Smuzhiyun 		 * If there is just the header portion, must flush before
941*4882a593Smuzhiyun 		 * writing last word of header for correctness, and after
942*4882a593Smuzhiyun 		 * the last header word (trigger word).
943*4882a593Smuzhiyun 		 */
944*4882a593Smuzhiyun 		if (flush_wc) {
945*4882a593Smuzhiyun 			qib_flush_wc();
946*4882a593Smuzhiyun 			qib_pio_copy(piobuf, hdr, hdrwords - 1);
947*4882a593Smuzhiyun 			qib_flush_wc();
948*4882a593Smuzhiyun 			__raw_writel(hdr[hdrwords - 1], piobuf + hdrwords - 1);
949*4882a593Smuzhiyun 			qib_flush_wc();
950*4882a593Smuzhiyun 		} else
951*4882a593Smuzhiyun 			qib_pio_copy(piobuf, hdr, hdrwords);
952*4882a593Smuzhiyun 		goto done;
953*4882a593Smuzhiyun 	}
954*4882a593Smuzhiyun 
955*4882a593Smuzhiyun 	if (flush_wc)
956*4882a593Smuzhiyun 		qib_flush_wc();
957*4882a593Smuzhiyun 	qib_pio_copy(piobuf, hdr, hdrwords);
958*4882a593Smuzhiyun 	piobuf += hdrwords;
959*4882a593Smuzhiyun 
960*4882a593Smuzhiyun 	/* The common case is aligned and contained in one segment. */
961*4882a593Smuzhiyun 	if (likely(ss->num_sge == 1 && len <= ss->sge.length &&
962*4882a593Smuzhiyun 		   !((unsigned long)ss->sge.vaddr & (sizeof(u32) - 1)))) {
963*4882a593Smuzhiyun 		u32 *addr = (u32 *) ss->sge.vaddr;
964*4882a593Smuzhiyun 
965*4882a593Smuzhiyun 		/* Update address before sending packet. */
966*4882a593Smuzhiyun 		rvt_update_sge(ss, len, false);
967*4882a593Smuzhiyun 		if (flush_wc) {
968*4882a593Smuzhiyun 			qib_pio_copy(piobuf, addr, dwords - 1);
969*4882a593Smuzhiyun 			/* must flush early everything before trigger word */
970*4882a593Smuzhiyun 			qib_flush_wc();
971*4882a593Smuzhiyun 			__raw_writel(addr[dwords - 1], piobuf + dwords - 1);
972*4882a593Smuzhiyun 			/* be sure trigger word is written */
973*4882a593Smuzhiyun 			qib_flush_wc();
974*4882a593Smuzhiyun 		} else
975*4882a593Smuzhiyun 			qib_pio_copy(piobuf, addr, dwords);
976*4882a593Smuzhiyun 		goto done;
977*4882a593Smuzhiyun 	}
978*4882a593Smuzhiyun 	copy_io(piobuf, ss, len, flush_wc);
979*4882a593Smuzhiyun done:
980*4882a593Smuzhiyun 	if (dd->flags & QIB_USE_SPCL_TRIG) {
981*4882a593Smuzhiyun 		u32 spcl_off = (pbufn >= dd->piobcnt2k) ? 2047 : 1023;
982*4882a593Smuzhiyun 
983*4882a593Smuzhiyun 		qib_flush_wc();
984*4882a593Smuzhiyun 		__raw_writel(0xaebecede, piobuf_orig + spcl_off);
985*4882a593Smuzhiyun 	}
986*4882a593Smuzhiyun 	qib_sendbuf_done(dd, pbufn);
987*4882a593Smuzhiyun 	if (qp->s_rdma_mr) {
988*4882a593Smuzhiyun 		rvt_put_mr(qp->s_rdma_mr);
989*4882a593Smuzhiyun 		qp->s_rdma_mr = NULL;
990*4882a593Smuzhiyun 	}
991*4882a593Smuzhiyun 	if (qp->s_wqe) {
992*4882a593Smuzhiyun 		spin_lock_irqsave(&qp->s_lock, flags);
993*4882a593Smuzhiyun 		rvt_send_complete(qp, qp->s_wqe, IB_WC_SUCCESS);
994*4882a593Smuzhiyun 		spin_unlock_irqrestore(&qp->s_lock, flags);
995*4882a593Smuzhiyun 	} else if (qp->ibqp.qp_type == IB_QPT_RC) {
996*4882a593Smuzhiyun 		spin_lock_irqsave(&qp->s_lock, flags);
997*4882a593Smuzhiyun 		qib_rc_send_complete(qp, ibhdr);
998*4882a593Smuzhiyun 		spin_unlock_irqrestore(&qp->s_lock, flags);
999*4882a593Smuzhiyun 	}
1000*4882a593Smuzhiyun 	return 0;
1001*4882a593Smuzhiyun }
1002*4882a593Smuzhiyun 
1003*4882a593Smuzhiyun /**
1004*4882a593Smuzhiyun  * qib_verbs_send - send a packet
1005*4882a593Smuzhiyun  * @qp: the QP to send on
1006*4882a593Smuzhiyun  * @hdr: the packet header
1007*4882a593Smuzhiyun  * @hdrwords: the number of 32-bit words in the header
1008*4882a593Smuzhiyun  * @ss: the SGE to send
1009*4882a593Smuzhiyun  * @len: the length of the packet in bytes
1010*4882a593Smuzhiyun  *
1011*4882a593Smuzhiyun  * Return zero if packet is sent or queued OK.
1012*4882a593Smuzhiyun  * Return non-zero and clear qp->s_flags RVT_S_BUSY otherwise.
1013*4882a593Smuzhiyun  */
qib_verbs_send(struct rvt_qp * qp,struct ib_header * hdr,u32 hdrwords,struct rvt_sge_state * ss,u32 len)1014*4882a593Smuzhiyun int qib_verbs_send(struct rvt_qp *qp, struct ib_header *hdr,
1015*4882a593Smuzhiyun 		   u32 hdrwords, struct rvt_sge_state *ss, u32 len)
1016*4882a593Smuzhiyun {
1017*4882a593Smuzhiyun 	struct qib_devdata *dd = dd_from_ibdev(qp->ibqp.device);
1018*4882a593Smuzhiyun 	u32 plen;
1019*4882a593Smuzhiyun 	int ret;
1020*4882a593Smuzhiyun 	u32 dwords = (len + 3) >> 2;
1021*4882a593Smuzhiyun 
1022*4882a593Smuzhiyun 	/*
1023*4882a593Smuzhiyun 	 * Calculate the send buffer trigger address.
1024*4882a593Smuzhiyun 	 * The +1 counts for the pbc control dword following the pbc length.
1025*4882a593Smuzhiyun 	 */
1026*4882a593Smuzhiyun 	plen = hdrwords + dwords + 1;
1027*4882a593Smuzhiyun 
1028*4882a593Smuzhiyun 	/*
1029*4882a593Smuzhiyun 	 * VL15 packets (IB_QPT_SMI) will always use PIO, so we
1030*4882a593Smuzhiyun 	 * can defer SDMA restart until link goes ACTIVE without
1031*4882a593Smuzhiyun 	 * worrying about just how we got there.
1032*4882a593Smuzhiyun 	 */
1033*4882a593Smuzhiyun 	if (qp->ibqp.qp_type == IB_QPT_SMI ||
1034*4882a593Smuzhiyun 	    !(dd->flags & QIB_HAS_SEND_DMA))
1035*4882a593Smuzhiyun 		ret = qib_verbs_send_pio(qp, hdr, hdrwords, ss, len,
1036*4882a593Smuzhiyun 					 plen, dwords);
1037*4882a593Smuzhiyun 	else
1038*4882a593Smuzhiyun 		ret = qib_verbs_send_dma(qp, hdr, hdrwords, ss, len,
1039*4882a593Smuzhiyun 					 plen, dwords);
1040*4882a593Smuzhiyun 
1041*4882a593Smuzhiyun 	return ret;
1042*4882a593Smuzhiyun }
1043*4882a593Smuzhiyun 
qib_snapshot_counters(struct qib_pportdata * ppd,u64 * swords,u64 * rwords,u64 * spkts,u64 * rpkts,u64 * xmit_wait)1044*4882a593Smuzhiyun int qib_snapshot_counters(struct qib_pportdata *ppd, u64 *swords,
1045*4882a593Smuzhiyun 			  u64 *rwords, u64 *spkts, u64 *rpkts,
1046*4882a593Smuzhiyun 			  u64 *xmit_wait)
1047*4882a593Smuzhiyun {
1048*4882a593Smuzhiyun 	int ret;
1049*4882a593Smuzhiyun 	struct qib_devdata *dd = ppd->dd;
1050*4882a593Smuzhiyun 
1051*4882a593Smuzhiyun 	if (!(dd->flags & QIB_PRESENT)) {
1052*4882a593Smuzhiyun 		/* no hardware, freeze, etc. */
1053*4882a593Smuzhiyun 		ret = -EINVAL;
1054*4882a593Smuzhiyun 		goto bail;
1055*4882a593Smuzhiyun 	}
1056*4882a593Smuzhiyun 	*swords = dd->f_portcntr(ppd, QIBPORTCNTR_WORDSEND);
1057*4882a593Smuzhiyun 	*rwords = dd->f_portcntr(ppd, QIBPORTCNTR_WORDRCV);
1058*4882a593Smuzhiyun 	*spkts = dd->f_portcntr(ppd, QIBPORTCNTR_PKTSEND);
1059*4882a593Smuzhiyun 	*rpkts = dd->f_portcntr(ppd, QIBPORTCNTR_PKTRCV);
1060*4882a593Smuzhiyun 	*xmit_wait = dd->f_portcntr(ppd, QIBPORTCNTR_SENDSTALL);
1061*4882a593Smuzhiyun 
1062*4882a593Smuzhiyun 	ret = 0;
1063*4882a593Smuzhiyun 
1064*4882a593Smuzhiyun bail:
1065*4882a593Smuzhiyun 	return ret;
1066*4882a593Smuzhiyun }
1067*4882a593Smuzhiyun 
1068*4882a593Smuzhiyun /**
1069*4882a593Smuzhiyun  * qib_get_counters - get various chip counters
1070*4882a593Smuzhiyun  * @dd: the qlogic_ib device
1071*4882a593Smuzhiyun  * @cntrs: counters are placed here
1072*4882a593Smuzhiyun  *
1073*4882a593Smuzhiyun  * Return the counters needed by recv_pma_get_portcounters().
1074*4882a593Smuzhiyun  */
qib_get_counters(struct qib_pportdata * ppd,struct qib_verbs_counters * cntrs)1075*4882a593Smuzhiyun int qib_get_counters(struct qib_pportdata *ppd,
1076*4882a593Smuzhiyun 		     struct qib_verbs_counters *cntrs)
1077*4882a593Smuzhiyun {
1078*4882a593Smuzhiyun 	int ret;
1079*4882a593Smuzhiyun 
1080*4882a593Smuzhiyun 	if (!(ppd->dd->flags & QIB_PRESENT)) {
1081*4882a593Smuzhiyun 		/* no hardware, freeze, etc. */
1082*4882a593Smuzhiyun 		ret = -EINVAL;
1083*4882a593Smuzhiyun 		goto bail;
1084*4882a593Smuzhiyun 	}
1085*4882a593Smuzhiyun 	cntrs->symbol_error_counter =
1086*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_IBSYMBOLERR);
1087*4882a593Smuzhiyun 	cntrs->link_error_recovery_counter =
1088*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_IBLINKERRRECOV);
1089*4882a593Smuzhiyun 	/*
1090*4882a593Smuzhiyun 	 * The link downed counter counts when the other side downs the
1091*4882a593Smuzhiyun 	 * connection.  We add in the number of times we downed the link
1092*4882a593Smuzhiyun 	 * due to local link integrity errors to compensate.
1093*4882a593Smuzhiyun 	 */
1094*4882a593Smuzhiyun 	cntrs->link_downed_counter =
1095*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_IBLINKDOWN);
1096*4882a593Smuzhiyun 	cntrs->port_rcv_errors =
1097*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_RXDROPPKT) +
1098*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_RCVOVFL) +
1099*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_ERR_RLEN) +
1100*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_INVALIDRLEN) +
1101*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_ERRLINK) +
1102*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_ERRICRC) +
1103*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_ERRVCRC) +
1104*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_ERRLPCRC) +
1105*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_BADFORMAT);
1106*4882a593Smuzhiyun 	cntrs->port_rcv_errors +=
1107*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_RXLOCALPHYERR);
1108*4882a593Smuzhiyun 	cntrs->port_rcv_errors +=
1109*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_RXVLERR);
1110*4882a593Smuzhiyun 	cntrs->port_rcv_remphys_errors =
1111*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_RCVEBP);
1112*4882a593Smuzhiyun 	cntrs->port_xmit_discards =
1113*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_UNSUPVL);
1114*4882a593Smuzhiyun 	cntrs->port_xmit_data = ppd->dd->f_portcntr(ppd,
1115*4882a593Smuzhiyun 			QIBPORTCNTR_WORDSEND);
1116*4882a593Smuzhiyun 	cntrs->port_rcv_data = ppd->dd->f_portcntr(ppd,
1117*4882a593Smuzhiyun 			QIBPORTCNTR_WORDRCV);
1118*4882a593Smuzhiyun 	cntrs->port_xmit_packets = ppd->dd->f_portcntr(ppd,
1119*4882a593Smuzhiyun 			QIBPORTCNTR_PKTSEND);
1120*4882a593Smuzhiyun 	cntrs->port_rcv_packets = ppd->dd->f_portcntr(ppd,
1121*4882a593Smuzhiyun 			QIBPORTCNTR_PKTRCV);
1122*4882a593Smuzhiyun 	cntrs->local_link_integrity_errors =
1123*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_LLI);
1124*4882a593Smuzhiyun 	cntrs->excessive_buffer_overrun_errors =
1125*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_EXCESSBUFOVFL);
1126*4882a593Smuzhiyun 	cntrs->vl15_dropped =
1127*4882a593Smuzhiyun 		ppd->dd->f_portcntr(ppd, QIBPORTCNTR_VL15PKTDROP);
1128*4882a593Smuzhiyun 
1129*4882a593Smuzhiyun 	ret = 0;
1130*4882a593Smuzhiyun 
1131*4882a593Smuzhiyun bail:
1132*4882a593Smuzhiyun 	return ret;
1133*4882a593Smuzhiyun }
1134*4882a593Smuzhiyun 
1135*4882a593Smuzhiyun /**
1136*4882a593Smuzhiyun  * qib_ib_piobufavail - callback when a PIO buffer is available
1137*4882a593Smuzhiyun  * @dd: the device pointer
1138*4882a593Smuzhiyun  *
1139*4882a593Smuzhiyun  * This is called from qib_intr() at interrupt level when a PIO buffer is
1140*4882a593Smuzhiyun  * available after qib_verbs_send() returned an error that no buffers were
1141*4882a593Smuzhiyun  * available. Disable the interrupt if there are no more QPs waiting.
1142*4882a593Smuzhiyun  */
qib_ib_piobufavail(struct qib_devdata * dd)1143*4882a593Smuzhiyun void qib_ib_piobufavail(struct qib_devdata *dd)
1144*4882a593Smuzhiyun {
1145*4882a593Smuzhiyun 	struct qib_ibdev *dev = &dd->verbs_dev;
1146*4882a593Smuzhiyun 	struct list_head *list;
1147*4882a593Smuzhiyun 	struct rvt_qp *qps[5];
1148*4882a593Smuzhiyun 	struct rvt_qp *qp;
1149*4882a593Smuzhiyun 	unsigned long flags;
1150*4882a593Smuzhiyun 	unsigned i, n;
1151*4882a593Smuzhiyun 	struct qib_qp_priv *priv;
1152*4882a593Smuzhiyun 
1153*4882a593Smuzhiyun 	list = &dev->piowait;
1154*4882a593Smuzhiyun 	n = 0;
1155*4882a593Smuzhiyun 
1156*4882a593Smuzhiyun 	/*
1157*4882a593Smuzhiyun 	 * Note: checking that the piowait list is empty and clearing
1158*4882a593Smuzhiyun 	 * the buffer available interrupt needs to be atomic or we
1159*4882a593Smuzhiyun 	 * could end up with QPs on the wait list with the interrupt
1160*4882a593Smuzhiyun 	 * disabled.
1161*4882a593Smuzhiyun 	 */
1162*4882a593Smuzhiyun 	spin_lock_irqsave(&dev->rdi.pending_lock, flags);
1163*4882a593Smuzhiyun 	while (!list_empty(list)) {
1164*4882a593Smuzhiyun 		if (n == ARRAY_SIZE(qps))
1165*4882a593Smuzhiyun 			goto full;
1166*4882a593Smuzhiyun 		priv = list_entry(list->next, struct qib_qp_priv, iowait);
1167*4882a593Smuzhiyun 		qp = priv->owner;
1168*4882a593Smuzhiyun 		list_del_init(&priv->iowait);
1169*4882a593Smuzhiyun 		rvt_get_qp(qp);
1170*4882a593Smuzhiyun 		qps[n++] = qp;
1171*4882a593Smuzhiyun 	}
1172*4882a593Smuzhiyun 	dd->f_wantpiobuf_intr(dd, 0);
1173*4882a593Smuzhiyun full:
1174*4882a593Smuzhiyun 	spin_unlock_irqrestore(&dev->rdi.pending_lock, flags);
1175*4882a593Smuzhiyun 
1176*4882a593Smuzhiyun 	for (i = 0; i < n; i++) {
1177*4882a593Smuzhiyun 		qp = qps[i];
1178*4882a593Smuzhiyun 
1179*4882a593Smuzhiyun 		spin_lock_irqsave(&qp->s_lock, flags);
1180*4882a593Smuzhiyun 		if (qp->s_flags & RVT_S_WAIT_PIO) {
1181*4882a593Smuzhiyun 			qp->s_flags &= ~RVT_S_WAIT_PIO;
1182*4882a593Smuzhiyun 			qib_schedule_send(qp);
1183*4882a593Smuzhiyun 		}
1184*4882a593Smuzhiyun 		spin_unlock_irqrestore(&qp->s_lock, flags);
1185*4882a593Smuzhiyun 
1186*4882a593Smuzhiyun 		/* Notify qib_destroy_qp() if it is waiting. */
1187*4882a593Smuzhiyun 		rvt_put_qp(qp);
1188*4882a593Smuzhiyun 	}
1189*4882a593Smuzhiyun }
1190*4882a593Smuzhiyun 
qib_query_port(struct rvt_dev_info * rdi,u8 port_num,struct ib_port_attr * props)1191*4882a593Smuzhiyun static int qib_query_port(struct rvt_dev_info *rdi, u8 port_num,
1192*4882a593Smuzhiyun 			  struct ib_port_attr *props)
1193*4882a593Smuzhiyun {
1194*4882a593Smuzhiyun 	struct qib_ibdev *ibdev = container_of(rdi, struct qib_ibdev, rdi);
1195*4882a593Smuzhiyun 	struct qib_devdata *dd = dd_from_dev(ibdev);
1196*4882a593Smuzhiyun 	struct qib_pportdata *ppd = &dd->pport[port_num - 1];
1197*4882a593Smuzhiyun 	enum ib_mtu mtu;
1198*4882a593Smuzhiyun 	u16 lid = ppd->lid;
1199*4882a593Smuzhiyun 
1200*4882a593Smuzhiyun 	/* props being zeroed by the caller, avoid zeroing it here */
1201*4882a593Smuzhiyun 	props->lid = lid ? lid : be16_to_cpu(IB_LID_PERMISSIVE);
1202*4882a593Smuzhiyun 	props->lmc = ppd->lmc;
1203*4882a593Smuzhiyun 	props->state = dd->f_iblink_state(ppd->lastibcstat);
1204*4882a593Smuzhiyun 	props->phys_state = dd->f_ibphys_portstate(ppd->lastibcstat);
1205*4882a593Smuzhiyun 	props->gid_tbl_len = QIB_GUIDS_PER_PORT;
1206*4882a593Smuzhiyun 	props->active_width = ppd->link_width_active;
1207*4882a593Smuzhiyun 	/* See rate_show() */
1208*4882a593Smuzhiyun 	props->active_speed = ppd->link_speed_active;
1209*4882a593Smuzhiyun 	props->max_vl_num = qib_num_vls(ppd->vls_supported);
1210*4882a593Smuzhiyun 
1211*4882a593Smuzhiyun 	props->max_mtu = qib_ibmtu ? qib_ibmtu : IB_MTU_4096;
1212*4882a593Smuzhiyun 	switch (ppd->ibmtu) {
1213*4882a593Smuzhiyun 	case 4096:
1214*4882a593Smuzhiyun 		mtu = IB_MTU_4096;
1215*4882a593Smuzhiyun 		break;
1216*4882a593Smuzhiyun 	case 2048:
1217*4882a593Smuzhiyun 		mtu = IB_MTU_2048;
1218*4882a593Smuzhiyun 		break;
1219*4882a593Smuzhiyun 	case 1024:
1220*4882a593Smuzhiyun 		mtu = IB_MTU_1024;
1221*4882a593Smuzhiyun 		break;
1222*4882a593Smuzhiyun 	case 512:
1223*4882a593Smuzhiyun 		mtu = IB_MTU_512;
1224*4882a593Smuzhiyun 		break;
1225*4882a593Smuzhiyun 	case 256:
1226*4882a593Smuzhiyun 		mtu = IB_MTU_256;
1227*4882a593Smuzhiyun 		break;
1228*4882a593Smuzhiyun 	default:
1229*4882a593Smuzhiyun 		mtu = IB_MTU_2048;
1230*4882a593Smuzhiyun 	}
1231*4882a593Smuzhiyun 	props->active_mtu = mtu;
1232*4882a593Smuzhiyun 
1233*4882a593Smuzhiyun 	return 0;
1234*4882a593Smuzhiyun }
1235*4882a593Smuzhiyun 
qib_modify_device(struct ib_device * device,int device_modify_mask,struct ib_device_modify * device_modify)1236*4882a593Smuzhiyun static int qib_modify_device(struct ib_device *device,
1237*4882a593Smuzhiyun 			     int device_modify_mask,
1238*4882a593Smuzhiyun 			     struct ib_device_modify *device_modify)
1239*4882a593Smuzhiyun {
1240*4882a593Smuzhiyun 	struct qib_devdata *dd = dd_from_ibdev(device);
1241*4882a593Smuzhiyun 	unsigned i;
1242*4882a593Smuzhiyun 	int ret;
1243*4882a593Smuzhiyun 
1244*4882a593Smuzhiyun 	if (device_modify_mask & ~(IB_DEVICE_MODIFY_SYS_IMAGE_GUID |
1245*4882a593Smuzhiyun 				   IB_DEVICE_MODIFY_NODE_DESC)) {
1246*4882a593Smuzhiyun 		ret = -EOPNOTSUPP;
1247*4882a593Smuzhiyun 		goto bail;
1248*4882a593Smuzhiyun 	}
1249*4882a593Smuzhiyun 
1250*4882a593Smuzhiyun 	if (device_modify_mask & IB_DEVICE_MODIFY_NODE_DESC) {
1251*4882a593Smuzhiyun 		memcpy(device->node_desc, device_modify->node_desc,
1252*4882a593Smuzhiyun 		       IB_DEVICE_NODE_DESC_MAX);
1253*4882a593Smuzhiyun 		for (i = 0; i < dd->num_pports; i++) {
1254*4882a593Smuzhiyun 			struct qib_ibport *ibp = &dd->pport[i].ibport_data;
1255*4882a593Smuzhiyun 
1256*4882a593Smuzhiyun 			qib_node_desc_chg(ibp);
1257*4882a593Smuzhiyun 		}
1258*4882a593Smuzhiyun 	}
1259*4882a593Smuzhiyun 
1260*4882a593Smuzhiyun 	if (device_modify_mask & IB_DEVICE_MODIFY_SYS_IMAGE_GUID) {
1261*4882a593Smuzhiyun 		ib_qib_sys_image_guid =
1262*4882a593Smuzhiyun 			cpu_to_be64(device_modify->sys_image_guid);
1263*4882a593Smuzhiyun 		for (i = 0; i < dd->num_pports; i++) {
1264*4882a593Smuzhiyun 			struct qib_ibport *ibp = &dd->pport[i].ibport_data;
1265*4882a593Smuzhiyun 
1266*4882a593Smuzhiyun 			qib_sys_guid_chg(ibp);
1267*4882a593Smuzhiyun 		}
1268*4882a593Smuzhiyun 	}
1269*4882a593Smuzhiyun 
1270*4882a593Smuzhiyun 	ret = 0;
1271*4882a593Smuzhiyun 
1272*4882a593Smuzhiyun bail:
1273*4882a593Smuzhiyun 	return ret;
1274*4882a593Smuzhiyun }
1275*4882a593Smuzhiyun 
qib_shut_down_port(struct rvt_dev_info * rdi,u8 port_num)1276*4882a593Smuzhiyun static int qib_shut_down_port(struct rvt_dev_info *rdi, u8 port_num)
1277*4882a593Smuzhiyun {
1278*4882a593Smuzhiyun 	struct qib_ibdev *ibdev = container_of(rdi, struct qib_ibdev, rdi);
1279*4882a593Smuzhiyun 	struct qib_devdata *dd = dd_from_dev(ibdev);
1280*4882a593Smuzhiyun 	struct qib_pportdata *ppd = &dd->pport[port_num - 1];
1281*4882a593Smuzhiyun 
1282*4882a593Smuzhiyun 	qib_set_linkstate(ppd, QIB_IB_LINKDOWN);
1283*4882a593Smuzhiyun 
1284*4882a593Smuzhiyun 	return 0;
1285*4882a593Smuzhiyun }
1286*4882a593Smuzhiyun 
qib_get_guid_be(struct rvt_dev_info * rdi,struct rvt_ibport * rvp,int guid_index,__be64 * guid)1287*4882a593Smuzhiyun static int qib_get_guid_be(struct rvt_dev_info *rdi, struct rvt_ibport *rvp,
1288*4882a593Smuzhiyun 			   int guid_index, __be64 *guid)
1289*4882a593Smuzhiyun {
1290*4882a593Smuzhiyun 	struct qib_ibport *ibp = container_of(rvp, struct qib_ibport, rvp);
1291*4882a593Smuzhiyun 	struct qib_pportdata *ppd = ppd_from_ibp(ibp);
1292*4882a593Smuzhiyun 
1293*4882a593Smuzhiyun 	if (guid_index == 0)
1294*4882a593Smuzhiyun 		*guid = ppd->guid;
1295*4882a593Smuzhiyun 	else if (guid_index < QIB_GUIDS_PER_PORT)
1296*4882a593Smuzhiyun 		*guid = ibp->guids[guid_index - 1];
1297*4882a593Smuzhiyun 	else
1298*4882a593Smuzhiyun 		return -EINVAL;
1299*4882a593Smuzhiyun 
1300*4882a593Smuzhiyun 	return 0;
1301*4882a593Smuzhiyun }
1302*4882a593Smuzhiyun 
qib_check_ah(struct ib_device * ibdev,struct rdma_ah_attr * ah_attr)1303*4882a593Smuzhiyun int qib_check_ah(struct ib_device *ibdev, struct rdma_ah_attr *ah_attr)
1304*4882a593Smuzhiyun {
1305*4882a593Smuzhiyun 	if (rdma_ah_get_sl(ah_attr) > 15)
1306*4882a593Smuzhiyun 		return -EINVAL;
1307*4882a593Smuzhiyun 
1308*4882a593Smuzhiyun 	if (rdma_ah_get_dlid(ah_attr) == 0)
1309*4882a593Smuzhiyun 		return -EINVAL;
1310*4882a593Smuzhiyun 	if (rdma_ah_get_dlid(ah_attr) >=
1311*4882a593Smuzhiyun 		be16_to_cpu(IB_MULTICAST_LID_BASE) &&
1312*4882a593Smuzhiyun 	    rdma_ah_get_dlid(ah_attr) !=
1313*4882a593Smuzhiyun 		be16_to_cpu(IB_LID_PERMISSIVE) &&
1314*4882a593Smuzhiyun 	    !(rdma_ah_get_ah_flags(ah_attr) & IB_AH_GRH))
1315*4882a593Smuzhiyun 		return -EINVAL;
1316*4882a593Smuzhiyun 
1317*4882a593Smuzhiyun 	return 0;
1318*4882a593Smuzhiyun }
1319*4882a593Smuzhiyun 
qib_notify_new_ah(struct ib_device * ibdev,struct rdma_ah_attr * ah_attr,struct rvt_ah * ah)1320*4882a593Smuzhiyun static void qib_notify_new_ah(struct ib_device *ibdev,
1321*4882a593Smuzhiyun 			      struct rdma_ah_attr *ah_attr,
1322*4882a593Smuzhiyun 			      struct rvt_ah *ah)
1323*4882a593Smuzhiyun {
1324*4882a593Smuzhiyun 	struct qib_ibport *ibp;
1325*4882a593Smuzhiyun 	struct qib_pportdata *ppd;
1326*4882a593Smuzhiyun 
1327*4882a593Smuzhiyun 	/*
1328*4882a593Smuzhiyun 	 * Do not trust reading anything from rvt_ah at this point as it is not
1329*4882a593Smuzhiyun 	 * done being setup. We can however modify things which we need to set.
1330*4882a593Smuzhiyun 	 */
1331*4882a593Smuzhiyun 
1332*4882a593Smuzhiyun 	ibp = to_iport(ibdev, rdma_ah_get_port_num(ah_attr));
1333*4882a593Smuzhiyun 	ppd = ppd_from_ibp(ibp);
1334*4882a593Smuzhiyun 	ah->vl = ibp->sl_to_vl[rdma_ah_get_sl(&ah->attr)];
1335*4882a593Smuzhiyun 	ah->log_pmtu = ilog2(ppd->ibmtu);
1336*4882a593Smuzhiyun }
1337*4882a593Smuzhiyun 
qib_create_qp0_ah(struct qib_ibport * ibp,u16 dlid)1338*4882a593Smuzhiyun struct ib_ah *qib_create_qp0_ah(struct qib_ibport *ibp, u16 dlid)
1339*4882a593Smuzhiyun {
1340*4882a593Smuzhiyun 	struct rdma_ah_attr attr;
1341*4882a593Smuzhiyun 	struct ib_ah *ah = ERR_PTR(-EINVAL);
1342*4882a593Smuzhiyun 	struct rvt_qp *qp0;
1343*4882a593Smuzhiyun 	struct qib_pportdata *ppd = ppd_from_ibp(ibp);
1344*4882a593Smuzhiyun 	struct qib_devdata *dd = dd_from_ppd(ppd);
1345*4882a593Smuzhiyun 	u8 port_num = ppd->port;
1346*4882a593Smuzhiyun 
1347*4882a593Smuzhiyun 	memset(&attr, 0, sizeof(attr));
1348*4882a593Smuzhiyun 	attr.type = rdma_ah_find_type(&dd->verbs_dev.rdi.ibdev, port_num);
1349*4882a593Smuzhiyun 	rdma_ah_set_dlid(&attr, dlid);
1350*4882a593Smuzhiyun 	rdma_ah_set_port_num(&attr, port_num);
1351*4882a593Smuzhiyun 	rcu_read_lock();
1352*4882a593Smuzhiyun 	qp0 = rcu_dereference(ibp->rvp.qp[0]);
1353*4882a593Smuzhiyun 	if (qp0)
1354*4882a593Smuzhiyun 		ah = rdma_create_ah(qp0->ibqp.pd, &attr, 0);
1355*4882a593Smuzhiyun 	rcu_read_unlock();
1356*4882a593Smuzhiyun 	return ah;
1357*4882a593Smuzhiyun }
1358*4882a593Smuzhiyun 
1359*4882a593Smuzhiyun /**
1360*4882a593Smuzhiyun  * qib_get_npkeys - return the size of the PKEY table for context 0
1361*4882a593Smuzhiyun  * @dd: the qlogic_ib device
1362*4882a593Smuzhiyun  */
qib_get_npkeys(struct qib_devdata * dd)1363*4882a593Smuzhiyun unsigned qib_get_npkeys(struct qib_devdata *dd)
1364*4882a593Smuzhiyun {
1365*4882a593Smuzhiyun 	return ARRAY_SIZE(dd->rcd[0]->pkeys);
1366*4882a593Smuzhiyun }
1367*4882a593Smuzhiyun 
1368*4882a593Smuzhiyun /*
1369*4882a593Smuzhiyun  * Return the indexed PKEY from the port PKEY table.
1370*4882a593Smuzhiyun  * No need to validate rcd[ctxt]; the port is setup if we are here.
1371*4882a593Smuzhiyun  */
qib_get_pkey(struct qib_ibport * ibp,unsigned index)1372*4882a593Smuzhiyun unsigned qib_get_pkey(struct qib_ibport *ibp, unsigned index)
1373*4882a593Smuzhiyun {
1374*4882a593Smuzhiyun 	struct qib_pportdata *ppd = ppd_from_ibp(ibp);
1375*4882a593Smuzhiyun 	struct qib_devdata *dd = ppd->dd;
1376*4882a593Smuzhiyun 	unsigned ctxt = ppd->hw_pidx;
1377*4882a593Smuzhiyun 	unsigned ret;
1378*4882a593Smuzhiyun 
1379*4882a593Smuzhiyun 	/* dd->rcd null if mini_init or some init failures */
1380*4882a593Smuzhiyun 	if (!dd->rcd || index >= ARRAY_SIZE(dd->rcd[ctxt]->pkeys))
1381*4882a593Smuzhiyun 		ret = 0;
1382*4882a593Smuzhiyun 	else
1383*4882a593Smuzhiyun 		ret = dd->rcd[ctxt]->pkeys[index];
1384*4882a593Smuzhiyun 
1385*4882a593Smuzhiyun 	return ret;
1386*4882a593Smuzhiyun }
1387*4882a593Smuzhiyun 
init_ibport(struct qib_pportdata * ppd)1388*4882a593Smuzhiyun static void init_ibport(struct qib_pportdata *ppd)
1389*4882a593Smuzhiyun {
1390*4882a593Smuzhiyun 	struct qib_verbs_counters cntrs;
1391*4882a593Smuzhiyun 	struct qib_ibport *ibp = &ppd->ibport_data;
1392*4882a593Smuzhiyun 
1393*4882a593Smuzhiyun 	spin_lock_init(&ibp->rvp.lock);
1394*4882a593Smuzhiyun 	/* Set the prefix to the default value (see ch. 4.1.1) */
1395*4882a593Smuzhiyun 	ibp->rvp.gid_prefix = IB_DEFAULT_GID_PREFIX;
1396*4882a593Smuzhiyun 	ibp->rvp.sm_lid = be16_to_cpu(IB_LID_PERMISSIVE);
1397*4882a593Smuzhiyun 	ibp->rvp.port_cap_flags = IB_PORT_SYS_IMAGE_GUID_SUP |
1398*4882a593Smuzhiyun 		IB_PORT_CLIENT_REG_SUP | IB_PORT_SL_MAP_SUP |
1399*4882a593Smuzhiyun 		IB_PORT_TRAP_SUP | IB_PORT_AUTO_MIGR_SUP |
1400*4882a593Smuzhiyun 		IB_PORT_DR_NOTICE_SUP | IB_PORT_CAP_MASK_NOTICE_SUP |
1401*4882a593Smuzhiyun 		IB_PORT_OTHER_LOCAL_CHANGES_SUP;
1402*4882a593Smuzhiyun 	if (ppd->dd->flags & QIB_HAS_LINK_LATENCY)
1403*4882a593Smuzhiyun 		ibp->rvp.port_cap_flags |= IB_PORT_LINK_LATENCY_SUP;
1404*4882a593Smuzhiyun 	ibp->rvp.pma_counter_select[0] = IB_PMA_PORT_XMIT_DATA;
1405*4882a593Smuzhiyun 	ibp->rvp.pma_counter_select[1] = IB_PMA_PORT_RCV_DATA;
1406*4882a593Smuzhiyun 	ibp->rvp.pma_counter_select[2] = IB_PMA_PORT_XMIT_PKTS;
1407*4882a593Smuzhiyun 	ibp->rvp.pma_counter_select[3] = IB_PMA_PORT_RCV_PKTS;
1408*4882a593Smuzhiyun 	ibp->rvp.pma_counter_select[4] = IB_PMA_PORT_XMIT_WAIT;
1409*4882a593Smuzhiyun 
1410*4882a593Smuzhiyun 	/* Snapshot current HW counters to "clear" them. */
1411*4882a593Smuzhiyun 	qib_get_counters(ppd, &cntrs);
1412*4882a593Smuzhiyun 	ibp->z_symbol_error_counter = cntrs.symbol_error_counter;
1413*4882a593Smuzhiyun 	ibp->z_link_error_recovery_counter =
1414*4882a593Smuzhiyun 		cntrs.link_error_recovery_counter;
1415*4882a593Smuzhiyun 	ibp->z_link_downed_counter = cntrs.link_downed_counter;
1416*4882a593Smuzhiyun 	ibp->z_port_rcv_errors = cntrs.port_rcv_errors;
1417*4882a593Smuzhiyun 	ibp->z_port_rcv_remphys_errors = cntrs.port_rcv_remphys_errors;
1418*4882a593Smuzhiyun 	ibp->z_port_xmit_discards = cntrs.port_xmit_discards;
1419*4882a593Smuzhiyun 	ibp->z_port_xmit_data = cntrs.port_xmit_data;
1420*4882a593Smuzhiyun 	ibp->z_port_rcv_data = cntrs.port_rcv_data;
1421*4882a593Smuzhiyun 	ibp->z_port_xmit_packets = cntrs.port_xmit_packets;
1422*4882a593Smuzhiyun 	ibp->z_port_rcv_packets = cntrs.port_rcv_packets;
1423*4882a593Smuzhiyun 	ibp->z_local_link_integrity_errors =
1424*4882a593Smuzhiyun 		cntrs.local_link_integrity_errors;
1425*4882a593Smuzhiyun 	ibp->z_excessive_buffer_overrun_errors =
1426*4882a593Smuzhiyun 		cntrs.excessive_buffer_overrun_errors;
1427*4882a593Smuzhiyun 	ibp->z_vl15_dropped = cntrs.vl15_dropped;
1428*4882a593Smuzhiyun 	RCU_INIT_POINTER(ibp->rvp.qp[0], NULL);
1429*4882a593Smuzhiyun 	RCU_INIT_POINTER(ibp->rvp.qp[1], NULL);
1430*4882a593Smuzhiyun }
1431*4882a593Smuzhiyun 
1432*4882a593Smuzhiyun /**
1433*4882a593Smuzhiyun  * qib_fill_device_attr - Fill in rvt dev info device attributes.
1434*4882a593Smuzhiyun  * @dd: the device data structure
1435*4882a593Smuzhiyun  */
qib_fill_device_attr(struct qib_devdata * dd)1436*4882a593Smuzhiyun static void qib_fill_device_attr(struct qib_devdata *dd)
1437*4882a593Smuzhiyun {
1438*4882a593Smuzhiyun 	struct rvt_dev_info *rdi = &dd->verbs_dev.rdi;
1439*4882a593Smuzhiyun 
1440*4882a593Smuzhiyun 	memset(&rdi->dparms.props, 0, sizeof(rdi->dparms.props));
1441*4882a593Smuzhiyun 
1442*4882a593Smuzhiyun 	rdi->dparms.props.max_pd = ib_qib_max_pds;
1443*4882a593Smuzhiyun 	rdi->dparms.props.max_ah = ib_qib_max_ahs;
1444*4882a593Smuzhiyun 	rdi->dparms.props.device_cap_flags = IB_DEVICE_BAD_PKEY_CNTR |
1445*4882a593Smuzhiyun 		IB_DEVICE_BAD_QKEY_CNTR | IB_DEVICE_SHUTDOWN_PORT |
1446*4882a593Smuzhiyun 		IB_DEVICE_SYS_IMAGE_GUID | IB_DEVICE_RC_RNR_NAK_GEN |
1447*4882a593Smuzhiyun 		IB_DEVICE_PORT_ACTIVE_EVENT | IB_DEVICE_SRQ_RESIZE;
1448*4882a593Smuzhiyun 	rdi->dparms.props.page_size_cap = PAGE_SIZE;
1449*4882a593Smuzhiyun 	rdi->dparms.props.vendor_id =
1450*4882a593Smuzhiyun 		QIB_SRC_OUI_1 << 16 | QIB_SRC_OUI_2 << 8 | QIB_SRC_OUI_3;
1451*4882a593Smuzhiyun 	rdi->dparms.props.vendor_part_id = dd->deviceid;
1452*4882a593Smuzhiyun 	rdi->dparms.props.hw_ver = dd->minrev;
1453*4882a593Smuzhiyun 	rdi->dparms.props.sys_image_guid = ib_qib_sys_image_guid;
1454*4882a593Smuzhiyun 	rdi->dparms.props.max_mr_size = ~0ULL;
1455*4882a593Smuzhiyun 	rdi->dparms.props.max_qp = ib_qib_max_qps;
1456*4882a593Smuzhiyun 	rdi->dparms.props.max_qp_wr = ib_qib_max_qp_wrs;
1457*4882a593Smuzhiyun 	rdi->dparms.props.max_send_sge = ib_qib_max_sges;
1458*4882a593Smuzhiyun 	rdi->dparms.props.max_recv_sge = ib_qib_max_sges;
1459*4882a593Smuzhiyun 	rdi->dparms.props.max_sge_rd = ib_qib_max_sges;
1460*4882a593Smuzhiyun 	rdi->dparms.props.max_cq = ib_qib_max_cqs;
1461*4882a593Smuzhiyun 	rdi->dparms.props.max_cqe = ib_qib_max_cqes;
1462*4882a593Smuzhiyun 	rdi->dparms.props.max_ah = ib_qib_max_ahs;
1463*4882a593Smuzhiyun 	rdi->dparms.props.max_qp_rd_atom = QIB_MAX_RDMA_ATOMIC;
1464*4882a593Smuzhiyun 	rdi->dparms.props.max_qp_init_rd_atom = 255;
1465*4882a593Smuzhiyun 	rdi->dparms.props.max_srq = ib_qib_max_srqs;
1466*4882a593Smuzhiyun 	rdi->dparms.props.max_srq_wr = ib_qib_max_srq_wrs;
1467*4882a593Smuzhiyun 	rdi->dparms.props.max_srq_sge = ib_qib_max_srq_sges;
1468*4882a593Smuzhiyun 	rdi->dparms.props.atomic_cap = IB_ATOMIC_GLOB;
1469*4882a593Smuzhiyun 	rdi->dparms.props.max_pkeys = qib_get_npkeys(dd);
1470*4882a593Smuzhiyun 	rdi->dparms.props.max_mcast_grp = ib_qib_max_mcast_grps;
1471*4882a593Smuzhiyun 	rdi->dparms.props.max_mcast_qp_attach = ib_qib_max_mcast_qp_attached;
1472*4882a593Smuzhiyun 	rdi->dparms.props.max_total_mcast_qp_attach =
1473*4882a593Smuzhiyun 					rdi->dparms.props.max_mcast_qp_attach *
1474*4882a593Smuzhiyun 					rdi->dparms.props.max_mcast_grp;
1475*4882a593Smuzhiyun 	/* post send table */
1476*4882a593Smuzhiyun 	dd->verbs_dev.rdi.post_parms = qib_post_parms;
1477*4882a593Smuzhiyun 
1478*4882a593Smuzhiyun 	/* opcode translation table */
1479*4882a593Smuzhiyun 	dd->verbs_dev.rdi.wc_opcode = ib_qib_wc_opcode;
1480*4882a593Smuzhiyun }
1481*4882a593Smuzhiyun 
1482*4882a593Smuzhiyun static const struct ib_device_ops qib_dev_ops = {
1483*4882a593Smuzhiyun 	.owner = THIS_MODULE,
1484*4882a593Smuzhiyun 	.driver_id = RDMA_DRIVER_QIB,
1485*4882a593Smuzhiyun 
1486*4882a593Smuzhiyun 	.init_port = qib_create_port_files,
1487*4882a593Smuzhiyun 	.modify_device = qib_modify_device,
1488*4882a593Smuzhiyun 	.process_mad = qib_process_mad,
1489*4882a593Smuzhiyun };
1490*4882a593Smuzhiyun 
1491*4882a593Smuzhiyun /**
1492*4882a593Smuzhiyun  * qib_register_ib_device - register our device with the infiniband core
1493*4882a593Smuzhiyun  * @dd: the device data structure
1494*4882a593Smuzhiyun  * Return the allocated qib_ibdev pointer or NULL on error.
1495*4882a593Smuzhiyun  */
qib_register_ib_device(struct qib_devdata * dd)1496*4882a593Smuzhiyun int qib_register_ib_device(struct qib_devdata *dd)
1497*4882a593Smuzhiyun {
1498*4882a593Smuzhiyun 	struct qib_ibdev *dev = &dd->verbs_dev;
1499*4882a593Smuzhiyun 	struct ib_device *ibdev = &dev->rdi.ibdev;
1500*4882a593Smuzhiyun 	struct qib_pportdata *ppd = dd->pport;
1501*4882a593Smuzhiyun 	unsigned i, ctxt;
1502*4882a593Smuzhiyun 	int ret;
1503*4882a593Smuzhiyun 
1504*4882a593Smuzhiyun 	for (i = 0; i < dd->num_pports; i++)
1505*4882a593Smuzhiyun 		init_ibport(ppd + i);
1506*4882a593Smuzhiyun 
1507*4882a593Smuzhiyun 	/* Only need to initialize non-zero fields. */
1508*4882a593Smuzhiyun 	timer_setup(&dev->mem_timer, mem_timer, 0);
1509*4882a593Smuzhiyun 
1510*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dev->piowait);
1511*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dev->dmawait);
1512*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dev->txwait);
1513*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dev->memwait);
1514*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dev->txreq_free);
1515*4882a593Smuzhiyun 
1516*4882a593Smuzhiyun 	if (ppd->sdma_descq_cnt) {
1517*4882a593Smuzhiyun 		dev->pio_hdrs = dma_alloc_coherent(&dd->pcidev->dev,
1518*4882a593Smuzhiyun 						ppd->sdma_descq_cnt *
1519*4882a593Smuzhiyun 						sizeof(struct qib_pio_header),
1520*4882a593Smuzhiyun 						&dev->pio_hdrs_phys,
1521*4882a593Smuzhiyun 						GFP_KERNEL);
1522*4882a593Smuzhiyun 		if (!dev->pio_hdrs) {
1523*4882a593Smuzhiyun 			ret = -ENOMEM;
1524*4882a593Smuzhiyun 			goto err_hdrs;
1525*4882a593Smuzhiyun 		}
1526*4882a593Smuzhiyun 	}
1527*4882a593Smuzhiyun 
1528*4882a593Smuzhiyun 	for (i = 0; i < ppd->sdma_descq_cnt; i++) {
1529*4882a593Smuzhiyun 		struct qib_verbs_txreq *tx;
1530*4882a593Smuzhiyun 
1531*4882a593Smuzhiyun 		tx = kzalloc(sizeof(*tx), GFP_KERNEL);
1532*4882a593Smuzhiyun 		if (!tx) {
1533*4882a593Smuzhiyun 			ret = -ENOMEM;
1534*4882a593Smuzhiyun 			goto err_tx;
1535*4882a593Smuzhiyun 		}
1536*4882a593Smuzhiyun 		tx->hdr_inx = i;
1537*4882a593Smuzhiyun 		list_add(&tx->txreq.list, &dev->txreq_free);
1538*4882a593Smuzhiyun 	}
1539*4882a593Smuzhiyun 
1540*4882a593Smuzhiyun 	/*
1541*4882a593Smuzhiyun 	 * The system image GUID is supposed to be the same for all
1542*4882a593Smuzhiyun 	 * IB HCAs in a single system but since there can be other
1543*4882a593Smuzhiyun 	 * device types in the system, we can't be sure this is unique.
1544*4882a593Smuzhiyun 	 */
1545*4882a593Smuzhiyun 	if (!ib_qib_sys_image_guid)
1546*4882a593Smuzhiyun 		ib_qib_sys_image_guid = ppd->guid;
1547*4882a593Smuzhiyun 
1548*4882a593Smuzhiyun 	ibdev->node_guid = ppd->guid;
1549*4882a593Smuzhiyun 	ibdev->phys_port_cnt = dd->num_pports;
1550*4882a593Smuzhiyun 	ibdev->dev.parent = &dd->pcidev->dev;
1551*4882a593Smuzhiyun 
1552*4882a593Smuzhiyun 	snprintf(ibdev->node_desc, sizeof(ibdev->node_desc),
1553*4882a593Smuzhiyun 		 "Intel Infiniband HCA %s", init_utsname()->nodename);
1554*4882a593Smuzhiyun 
1555*4882a593Smuzhiyun 	/*
1556*4882a593Smuzhiyun 	 * Fill in rvt info object.
1557*4882a593Smuzhiyun 	 */
1558*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.get_pci_dev = qib_get_pci_dev;
1559*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.check_ah = qib_check_ah;
1560*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.setup_wqe = qib_check_send_wqe;
1561*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.notify_new_ah = qib_notify_new_ah;
1562*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.alloc_qpn = qib_alloc_qpn;
1563*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.qp_priv_alloc = qib_qp_priv_alloc;
1564*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.qp_priv_free = qib_qp_priv_free;
1565*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.free_all_qps = qib_free_all_qps;
1566*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.notify_qp_reset = qib_notify_qp_reset;
1567*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.do_send = qib_do_send;
1568*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.schedule_send = qib_schedule_send;
1569*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.quiesce_qp = qib_quiesce_qp;
1570*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.stop_send_queue = qib_stop_send_queue;
1571*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.flush_qp_waiters = qib_flush_qp_waiters;
1572*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.notify_error_qp = qib_notify_error_qp;
1573*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.notify_restart_rc = qib_restart_rc;
1574*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.mtu_to_path_mtu = qib_mtu_to_path_mtu;
1575*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.mtu_from_qp = qib_mtu_from_qp;
1576*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.get_pmtu_from_attr = qib_get_pmtu_from_attr;
1577*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.schedule_send_no_lock = _qib_schedule_send;
1578*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.query_port_state = qib_query_port;
1579*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.shut_down_port = qib_shut_down_port;
1580*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.cap_mask_chg = qib_cap_mask_chg;
1581*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.notify_create_mad_agent =
1582*4882a593Smuzhiyun 						qib_notify_create_mad_agent;
1583*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.notify_free_mad_agent =
1584*4882a593Smuzhiyun 						qib_notify_free_mad_agent;
1585*4882a593Smuzhiyun 
1586*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.max_rdma_atomic = QIB_MAX_RDMA_ATOMIC;
1587*4882a593Smuzhiyun 	dd->verbs_dev.rdi.driver_f.get_guid_be = qib_get_guid_be;
1588*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.lkey_table_size = qib_lkey_table_size;
1589*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.qp_table_size = ib_qib_qp_table_size;
1590*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.qpn_start = 1;
1591*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.qpn_res_start = QIB_KD_QP;
1592*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.qpn_res_end = QIB_KD_QP; /* Reserve one QP */
1593*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.qpn_inc = 1;
1594*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.qos_shift = 1;
1595*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.psn_mask = QIB_PSN_MASK;
1596*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.psn_shift = QIB_PSN_SHIFT;
1597*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.psn_modify_mask = QIB_PSN_MASK;
1598*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.nports = dd->num_pports;
1599*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.npkeys = qib_get_npkeys(dd);
1600*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.node = dd->assigned_node_id;
1601*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.core_cap_flags = RDMA_CORE_PORT_IBA_IB;
1602*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.max_mad_size = IB_MGMT_MAD_SIZE;
1603*4882a593Smuzhiyun 	dd->verbs_dev.rdi.dparms.sge_copy_mode = RVT_SGE_COPY_MEMCPY;
1604*4882a593Smuzhiyun 
1605*4882a593Smuzhiyun 	qib_fill_device_attr(dd);
1606*4882a593Smuzhiyun 
1607*4882a593Smuzhiyun 	ppd = dd->pport;
1608*4882a593Smuzhiyun 	for (i = 0; i < dd->num_pports; i++, ppd++) {
1609*4882a593Smuzhiyun 		ctxt = ppd->hw_pidx;
1610*4882a593Smuzhiyun 		rvt_init_port(&dd->verbs_dev.rdi,
1611*4882a593Smuzhiyun 			      &ppd->ibport_data.rvp,
1612*4882a593Smuzhiyun 			      i,
1613*4882a593Smuzhiyun 			      dd->rcd[ctxt]->pkeys);
1614*4882a593Smuzhiyun 	}
1615*4882a593Smuzhiyun 	rdma_set_device_sysfs_group(&dd->verbs_dev.rdi.ibdev, &qib_attr_group);
1616*4882a593Smuzhiyun 
1617*4882a593Smuzhiyun 	ib_set_device_ops(ibdev, &qib_dev_ops);
1618*4882a593Smuzhiyun 	ret = rvt_register_device(&dd->verbs_dev.rdi);
1619*4882a593Smuzhiyun 	if (ret)
1620*4882a593Smuzhiyun 		goto err_tx;
1621*4882a593Smuzhiyun 
1622*4882a593Smuzhiyun 	return ret;
1623*4882a593Smuzhiyun 
1624*4882a593Smuzhiyun err_tx:
1625*4882a593Smuzhiyun 	while (!list_empty(&dev->txreq_free)) {
1626*4882a593Smuzhiyun 		struct list_head *l = dev->txreq_free.next;
1627*4882a593Smuzhiyun 		struct qib_verbs_txreq *tx;
1628*4882a593Smuzhiyun 
1629*4882a593Smuzhiyun 		list_del(l);
1630*4882a593Smuzhiyun 		tx = list_entry(l, struct qib_verbs_txreq, txreq.list);
1631*4882a593Smuzhiyun 		kfree(tx);
1632*4882a593Smuzhiyun 	}
1633*4882a593Smuzhiyun 	if (ppd->sdma_descq_cnt)
1634*4882a593Smuzhiyun 		dma_free_coherent(&dd->pcidev->dev,
1635*4882a593Smuzhiyun 				  ppd->sdma_descq_cnt *
1636*4882a593Smuzhiyun 					sizeof(struct qib_pio_header),
1637*4882a593Smuzhiyun 				  dev->pio_hdrs, dev->pio_hdrs_phys);
1638*4882a593Smuzhiyun err_hdrs:
1639*4882a593Smuzhiyun 	qib_dev_err(dd, "cannot register verbs: %d!\n", -ret);
1640*4882a593Smuzhiyun 	return ret;
1641*4882a593Smuzhiyun }
1642*4882a593Smuzhiyun 
qib_unregister_ib_device(struct qib_devdata * dd)1643*4882a593Smuzhiyun void qib_unregister_ib_device(struct qib_devdata *dd)
1644*4882a593Smuzhiyun {
1645*4882a593Smuzhiyun 	struct qib_ibdev *dev = &dd->verbs_dev;
1646*4882a593Smuzhiyun 
1647*4882a593Smuzhiyun 	qib_verbs_unregister_sysfs(dd);
1648*4882a593Smuzhiyun 
1649*4882a593Smuzhiyun 	rvt_unregister_device(&dd->verbs_dev.rdi);
1650*4882a593Smuzhiyun 
1651*4882a593Smuzhiyun 	if (!list_empty(&dev->piowait))
1652*4882a593Smuzhiyun 		qib_dev_err(dd, "piowait list not empty!\n");
1653*4882a593Smuzhiyun 	if (!list_empty(&dev->dmawait))
1654*4882a593Smuzhiyun 		qib_dev_err(dd, "dmawait list not empty!\n");
1655*4882a593Smuzhiyun 	if (!list_empty(&dev->txwait))
1656*4882a593Smuzhiyun 		qib_dev_err(dd, "txwait list not empty!\n");
1657*4882a593Smuzhiyun 	if (!list_empty(&dev->memwait))
1658*4882a593Smuzhiyun 		qib_dev_err(dd, "memwait list not empty!\n");
1659*4882a593Smuzhiyun 
1660*4882a593Smuzhiyun 	del_timer_sync(&dev->mem_timer);
1661*4882a593Smuzhiyun 	while (!list_empty(&dev->txreq_free)) {
1662*4882a593Smuzhiyun 		struct list_head *l = dev->txreq_free.next;
1663*4882a593Smuzhiyun 		struct qib_verbs_txreq *tx;
1664*4882a593Smuzhiyun 
1665*4882a593Smuzhiyun 		list_del(l);
1666*4882a593Smuzhiyun 		tx = list_entry(l, struct qib_verbs_txreq, txreq.list);
1667*4882a593Smuzhiyun 		kfree(tx);
1668*4882a593Smuzhiyun 	}
1669*4882a593Smuzhiyun 	if (dd->pport->sdma_descq_cnt)
1670*4882a593Smuzhiyun 		dma_free_coherent(&dd->pcidev->dev,
1671*4882a593Smuzhiyun 				  dd->pport->sdma_descq_cnt *
1672*4882a593Smuzhiyun 					sizeof(struct qib_pio_header),
1673*4882a593Smuzhiyun 				  dev->pio_hdrs, dev->pio_hdrs_phys);
1674*4882a593Smuzhiyun }
1675*4882a593Smuzhiyun 
1676*4882a593Smuzhiyun /**
1677*4882a593Smuzhiyun  * _qib_schedule_send - schedule progress
1678*4882a593Smuzhiyun  * @qp - the qp
1679*4882a593Smuzhiyun  *
1680*4882a593Smuzhiyun  * This schedules progress w/o regard to the s_flags.
1681*4882a593Smuzhiyun  *
1682*4882a593Smuzhiyun  * It is only used in post send, which doesn't hold
1683*4882a593Smuzhiyun  * the s_lock.
1684*4882a593Smuzhiyun  */
_qib_schedule_send(struct rvt_qp * qp)1685*4882a593Smuzhiyun bool _qib_schedule_send(struct rvt_qp *qp)
1686*4882a593Smuzhiyun {
1687*4882a593Smuzhiyun 	struct qib_ibport *ibp =
1688*4882a593Smuzhiyun 		to_iport(qp->ibqp.device, qp->port_num);
1689*4882a593Smuzhiyun 	struct qib_pportdata *ppd = ppd_from_ibp(ibp);
1690*4882a593Smuzhiyun 	struct qib_qp_priv *priv = qp->priv;
1691*4882a593Smuzhiyun 
1692*4882a593Smuzhiyun 	return queue_work(ppd->qib_wq, &priv->s_work);
1693*4882a593Smuzhiyun }
1694*4882a593Smuzhiyun 
1695*4882a593Smuzhiyun /**
1696*4882a593Smuzhiyun  * qib_schedule_send - schedule progress
1697*4882a593Smuzhiyun  * @qp - the qp
1698*4882a593Smuzhiyun  *
1699*4882a593Smuzhiyun  * This schedules qp progress.  The s_lock
1700*4882a593Smuzhiyun  * should be held.
1701*4882a593Smuzhiyun  */
qib_schedule_send(struct rvt_qp * qp)1702*4882a593Smuzhiyun bool qib_schedule_send(struct rvt_qp *qp)
1703*4882a593Smuzhiyun {
1704*4882a593Smuzhiyun 	if (qib_send_ok(qp))
1705*4882a593Smuzhiyun 		return _qib_schedule_send(qp);
1706*4882a593Smuzhiyun 	return false;
1707*4882a593Smuzhiyun }
1708