xref: /OK3568_Linux_fs/kernel/drivers/infiniband/hw/mlx4/ah.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Copyright (c) 2007 Cisco Systems, Inc. All rights reserved.
3*4882a593Smuzhiyun  *
4*4882a593Smuzhiyun  * This software is available to you under a choice of one of two
5*4882a593Smuzhiyun  * licenses.  You may choose to be licensed under the terms of the GNU
6*4882a593Smuzhiyun  * General Public License (GPL) Version 2, available from the file
7*4882a593Smuzhiyun  * COPYING in the main directory of this source tree, or the
8*4882a593Smuzhiyun  * OpenIB.org BSD license below:
9*4882a593Smuzhiyun  *
10*4882a593Smuzhiyun  *     Redistribution and use in source and binary forms, with or
11*4882a593Smuzhiyun  *     without modification, are permitted provided that the following
12*4882a593Smuzhiyun  *     conditions are met:
13*4882a593Smuzhiyun  *
14*4882a593Smuzhiyun  *      - Redistributions of source code must retain the above
15*4882a593Smuzhiyun  *        copyright notice, this list of conditions and the following
16*4882a593Smuzhiyun  *        disclaimer.
17*4882a593Smuzhiyun  *
18*4882a593Smuzhiyun  *      - Redistributions in binary form must reproduce the above
19*4882a593Smuzhiyun  *        copyright notice, this list of conditions and the following
20*4882a593Smuzhiyun  *        disclaimer in the documentation and/or other materials
21*4882a593Smuzhiyun  *        provided with the distribution.
22*4882a593Smuzhiyun  *
23*4882a593Smuzhiyun  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24*4882a593Smuzhiyun  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25*4882a593Smuzhiyun  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26*4882a593Smuzhiyun  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27*4882a593Smuzhiyun  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28*4882a593Smuzhiyun  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29*4882a593Smuzhiyun  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30*4882a593Smuzhiyun  * SOFTWARE.
31*4882a593Smuzhiyun  */
32*4882a593Smuzhiyun 
33*4882a593Smuzhiyun #include <rdma/ib_addr.h>
34*4882a593Smuzhiyun #include <rdma/ib_cache.h>
35*4882a593Smuzhiyun 
36*4882a593Smuzhiyun #include <linux/slab.h>
37*4882a593Smuzhiyun #include <linux/inet.h>
38*4882a593Smuzhiyun #include <linux/string.h>
39*4882a593Smuzhiyun #include <linux/mlx4/driver.h>
40*4882a593Smuzhiyun 
41*4882a593Smuzhiyun #include "mlx4_ib.h"
42*4882a593Smuzhiyun 
create_ib_ah(struct ib_ah * ib_ah,struct rdma_ah_attr * ah_attr)43*4882a593Smuzhiyun static void create_ib_ah(struct ib_ah *ib_ah, struct rdma_ah_attr *ah_attr)
44*4882a593Smuzhiyun {
45*4882a593Smuzhiyun 	struct mlx4_ib_ah *ah = to_mah(ib_ah);
46*4882a593Smuzhiyun 	struct mlx4_dev *dev = to_mdev(ib_ah->device)->dev;
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun 	ah->av.ib.port_pd = cpu_to_be32(to_mpd(ib_ah->pd)->pdn |
49*4882a593Smuzhiyun 			    (rdma_ah_get_port_num(ah_attr) << 24));
50*4882a593Smuzhiyun 	ah->av.ib.g_slid  = rdma_ah_get_path_bits(ah_attr);
51*4882a593Smuzhiyun 	ah->av.ib.sl_tclass_flowlabel =
52*4882a593Smuzhiyun 			cpu_to_be32(rdma_ah_get_sl(ah_attr) << 28);
53*4882a593Smuzhiyun 	if (rdma_ah_get_ah_flags(ah_attr) & IB_AH_GRH) {
54*4882a593Smuzhiyun 		const struct ib_global_route *grh = rdma_ah_read_grh(ah_attr);
55*4882a593Smuzhiyun 
56*4882a593Smuzhiyun 		ah->av.ib.g_slid   |= 0x80;
57*4882a593Smuzhiyun 		ah->av.ib.gid_index = grh->sgid_index;
58*4882a593Smuzhiyun 		ah->av.ib.hop_limit = grh->hop_limit;
59*4882a593Smuzhiyun 		ah->av.ib.sl_tclass_flowlabel |=
60*4882a593Smuzhiyun 			cpu_to_be32((grh->traffic_class << 20) |
61*4882a593Smuzhiyun 				    grh->flow_label);
62*4882a593Smuzhiyun 		memcpy(ah->av.ib.dgid, grh->dgid.raw, 16);
63*4882a593Smuzhiyun 	}
64*4882a593Smuzhiyun 
65*4882a593Smuzhiyun 	ah->av.ib.dlid = cpu_to_be16(rdma_ah_get_dlid(ah_attr));
66*4882a593Smuzhiyun 	if (rdma_ah_get_static_rate(ah_attr)) {
67*4882a593Smuzhiyun 		u8 static_rate = rdma_ah_get_static_rate(ah_attr) +
68*4882a593Smuzhiyun 					MLX4_STAT_RATE_OFFSET;
69*4882a593Smuzhiyun 
70*4882a593Smuzhiyun 		while (static_rate > IB_RATE_2_5_GBPS + MLX4_STAT_RATE_OFFSET &&
71*4882a593Smuzhiyun 		       !(1 << static_rate & dev->caps.stat_rate_support))
72*4882a593Smuzhiyun 			--static_rate;
73*4882a593Smuzhiyun 		ah->av.ib.stat_rate = static_rate;
74*4882a593Smuzhiyun 	}
75*4882a593Smuzhiyun }
76*4882a593Smuzhiyun 
create_iboe_ah(struct ib_ah * ib_ah,struct rdma_ah_attr * ah_attr)77*4882a593Smuzhiyun static int create_iboe_ah(struct ib_ah *ib_ah, struct rdma_ah_attr *ah_attr)
78*4882a593Smuzhiyun {
79*4882a593Smuzhiyun 	struct mlx4_ib_dev *ibdev = to_mdev(ib_ah->device);
80*4882a593Smuzhiyun 	struct mlx4_ib_ah *ah = to_mah(ib_ah);
81*4882a593Smuzhiyun 	const struct ib_gid_attr *gid_attr;
82*4882a593Smuzhiyun 	struct mlx4_dev *dev = ibdev->dev;
83*4882a593Smuzhiyun 	int is_mcast = 0;
84*4882a593Smuzhiyun 	struct in6_addr in6;
85*4882a593Smuzhiyun 	u16 vlan_tag = 0xffff;
86*4882a593Smuzhiyun 	const struct ib_global_route *grh = rdma_ah_read_grh(ah_attr);
87*4882a593Smuzhiyun 	int ret;
88*4882a593Smuzhiyun 
89*4882a593Smuzhiyun 	memcpy(&in6, grh->dgid.raw, sizeof(in6));
90*4882a593Smuzhiyun 	if (rdma_is_multicast_addr(&in6))
91*4882a593Smuzhiyun 		is_mcast = 1;
92*4882a593Smuzhiyun 
93*4882a593Smuzhiyun 	memcpy(ah->av.eth.mac, ah_attr->roce.dmac, ETH_ALEN);
94*4882a593Smuzhiyun 	eth_zero_addr(ah->av.eth.s_mac);
95*4882a593Smuzhiyun 
96*4882a593Smuzhiyun 	/*
97*4882a593Smuzhiyun 	 * If sgid_attr is NULL we are being called by mlx4_ib_create_ah_slave
98*4882a593Smuzhiyun 	 * and we are directly creating an AV for a slave's gid_index.
99*4882a593Smuzhiyun 	 */
100*4882a593Smuzhiyun 	gid_attr = ah_attr->grh.sgid_attr;
101*4882a593Smuzhiyun 	if (gid_attr) {
102*4882a593Smuzhiyun 		ret = rdma_read_gid_l2_fields(gid_attr, &vlan_tag,
103*4882a593Smuzhiyun 					      &ah->av.eth.s_mac[0]);
104*4882a593Smuzhiyun 		if (ret)
105*4882a593Smuzhiyun 			return ret;
106*4882a593Smuzhiyun 
107*4882a593Smuzhiyun 		ret = mlx4_ib_gid_index_to_real_index(ibdev, gid_attr);
108*4882a593Smuzhiyun 		if (ret < 0)
109*4882a593Smuzhiyun 			return ret;
110*4882a593Smuzhiyun 		ah->av.eth.gid_index = ret;
111*4882a593Smuzhiyun 	} else {
112*4882a593Smuzhiyun 		/* mlx4_ib_create_ah_slave fills in the s_mac and the vlan */
113*4882a593Smuzhiyun 		ah->av.eth.gid_index = ah_attr->grh.sgid_index;
114*4882a593Smuzhiyun 	}
115*4882a593Smuzhiyun 
116*4882a593Smuzhiyun 	if (vlan_tag < 0x1000)
117*4882a593Smuzhiyun 		vlan_tag |= (rdma_ah_get_sl(ah_attr) & 7) << 13;
118*4882a593Smuzhiyun 	ah->av.eth.port_pd = cpu_to_be32(to_mpd(ib_ah->pd)->pdn |
119*4882a593Smuzhiyun 					 (rdma_ah_get_port_num(ah_attr) << 24));
120*4882a593Smuzhiyun 	ah->av.eth.vlan = cpu_to_be16(vlan_tag);
121*4882a593Smuzhiyun 	ah->av.eth.hop_limit = grh->hop_limit;
122*4882a593Smuzhiyun 	if (rdma_ah_get_static_rate(ah_attr)) {
123*4882a593Smuzhiyun 		ah->av.eth.stat_rate = rdma_ah_get_static_rate(ah_attr) +
124*4882a593Smuzhiyun 					MLX4_STAT_RATE_OFFSET;
125*4882a593Smuzhiyun 		while (ah->av.eth.stat_rate > IB_RATE_2_5_GBPS + MLX4_STAT_RATE_OFFSET &&
126*4882a593Smuzhiyun 		       !(1 << ah->av.eth.stat_rate & dev->caps.stat_rate_support))
127*4882a593Smuzhiyun 			--ah->av.eth.stat_rate;
128*4882a593Smuzhiyun 	}
129*4882a593Smuzhiyun 	ah->av.eth.sl_tclass_flowlabel |=
130*4882a593Smuzhiyun 			cpu_to_be32((grh->traffic_class << 20) |
131*4882a593Smuzhiyun 				    grh->flow_label);
132*4882a593Smuzhiyun 	/*
133*4882a593Smuzhiyun 	 * HW requires multicast LID so we just choose one.
134*4882a593Smuzhiyun 	 */
135*4882a593Smuzhiyun 	if (is_mcast)
136*4882a593Smuzhiyun 		ah->av.ib.dlid = cpu_to_be16(0xc000);
137*4882a593Smuzhiyun 
138*4882a593Smuzhiyun 	memcpy(ah->av.eth.dgid, grh->dgid.raw, 16);
139*4882a593Smuzhiyun 	ah->av.eth.sl_tclass_flowlabel |= cpu_to_be32(rdma_ah_get_sl(ah_attr)
140*4882a593Smuzhiyun 						      << 29);
141*4882a593Smuzhiyun 	return 0;
142*4882a593Smuzhiyun }
143*4882a593Smuzhiyun 
mlx4_ib_create_ah(struct ib_ah * ib_ah,struct rdma_ah_init_attr * init_attr,struct ib_udata * udata)144*4882a593Smuzhiyun int mlx4_ib_create_ah(struct ib_ah *ib_ah, struct rdma_ah_init_attr *init_attr,
145*4882a593Smuzhiyun 		      struct ib_udata *udata)
146*4882a593Smuzhiyun {
147*4882a593Smuzhiyun 	struct rdma_ah_attr *ah_attr = init_attr->ah_attr;
148*4882a593Smuzhiyun 
149*4882a593Smuzhiyun 	if (ah_attr->type == RDMA_AH_ATTR_TYPE_ROCE) {
150*4882a593Smuzhiyun 		if (!(rdma_ah_get_ah_flags(ah_attr) & IB_AH_GRH))
151*4882a593Smuzhiyun 			return -EINVAL;
152*4882a593Smuzhiyun 		/*
153*4882a593Smuzhiyun 		 * TBD: need to handle the case when we get
154*4882a593Smuzhiyun 		 * called in an atomic context and there we
155*4882a593Smuzhiyun 		 * might sleep.  We don't expect this
156*4882a593Smuzhiyun 		 * currently since we're working with link
157*4882a593Smuzhiyun 		 * local addresses which we can translate
158*4882a593Smuzhiyun 		 * without going to sleep.
159*4882a593Smuzhiyun 		 */
160*4882a593Smuzhiyun 		return create_iboe_ah(ib_ah, ah_attr);
161*4882a593Smuzhiyun 	}
162*4882a593Smuzhiyun 
163*4882a593Smuzhiyun 	create_ib_ah(ib_ah, ah_attr);
164*4882a593Smuzhiyun 	return 0;
165*4882a593Smuzhiyun }
166*4882a593Smuzhiyun 
/*
 * mlx4_ib_create_ah_slave - build an AH on behalf of a slave.
 * @ah:               address handle to fill in
 * @ah_attr:          attributes to start from; not modified (a copy is used)
 * @slave_sgid_index: source GID index placed into the copied attributes
 * @s_mac:            source MAC copied into the AV for RoCE attributes
 * @vlan_tag:         VLAN tag stored into the AV
 *
 * Runs mlx4_ib_create_ah() on a copy of @ah_attr whose sgid_attr is cleared
 * and whose sgid_index is @slave_sgid_index, then patches the resulting AV.
 * Returns 0 on success or the error from mlx4_ib_create_ah().
 */
int mlx4_ib_create_ah_slave(struct ib_ah *ah, struct rdma_ah_attr *ah_attr,
			    int slave_sgid_index, u8 *s_mac, u16 vlan_tag)
{
	struct rdma_ah_attr attr_copy = *ah_attr;
	struct rdma_ah_init_attr init_attr = { .ah_attr = &attr_copy };
	struct mlx4_ib_ah *slave_ah = to_mah(ah);
	u16 vlan = vlan_tag;
	int err;

	/* No GID attribute: the AV is created directly from the index. */
	attr_copy.grh.sgid_attr = NULL;
	attr_copy.grh.sgid_index = slave_sgid_index;

	err = mlx4_ib_create_ah(ah, &init_attr, NULL);
	if (err)
		return err;

	ah->type = ah_attr->type;

	/* get rid of force-loopback bit */
	slave_ah->av.ib.port_pd &= cpu_to_be32(0x7FFFFFFF);

	if (ah_attr->type == RDMA_AH_ATTR_TYPE_ROCE)
		memcpy(slave_ah->av.eth.s_mac, s_mac, 6);

	/* Tags below 0x1000 get the low three SL bits in bits 13-15. */
	if (vlan < 0x1000)
		vlan |= (rdma_ah_get_sl(ah_attr) & 7) << 13;
	slave_ah->av.eth.vlan = cpu_to_be16(vlan);

	return 0;
}
196*4882a593Smuzhiyun 
mlx4_ib_query_ah(struct ib_ah * ibah,struct rdma_ah_attr * ah_attr)197*4882a593Smuzhiyun int mlx4_ib_query_ah(struct ib_ah *ibah, struct rdma_ah_attr *ah_attr)
198*4882a593Smuzhiyun {
199*4882a593Smuzhiyun 	struct mlx4_ib_ah *ah = to_mah(ibah);
200*4882a593Smuzhiyun 	int port_num = be32_to_cpu(ah->av.ib.port_pd) >> 24;
201*4882a593Smuzhiyun 
202*4882a593Smuzhiyun 	memset(ah_attr, 0, sizeof *ah_attr);
203*4882a593Smuzhiyun 	ah_attr->type = ibah->type;
204*4882a593Smuzhiyun 
205*4882a593Smuzhiyun 	if (ah_attr->type == RDMA_AH_ATTR_TYPE_ROCE) {
206*4882a593Smuzhiyun 		rdma_ah_set_dlid(ah_attr, 0);
207*4882a593Smuzhiyun 		rdma_ah_set_sl(ah_attr,
208*4882a593Smuzhiyun 			       be32_to_cpu(ah->av.eth.sl_tclass_flowlabel)
209*4882a593Smuzhiyun 			       >> 29);
210*4882a593Smuzhiyun 	} else {
211*4882a593Smuzhiyun 		rdma_ah_set_dlid(ah_attr, be16_to_cpu(ah->av.ib.dlid));
212*4882a593Smuzhiyun 		rdma_ah_set_sl(ah_attr,
213*4882a593Smuzhiyun 			       be32_to_cpu(ah->av.ib.sl_tclass_flowlabel)
214*4882a593Smuzhiyun 			       >> 28);
215*4882a593Smuzhiyun 	}
216*4882a593Smuzhiyun 
217*4882a593Smuzhiyun 	rdma_ah_set_port_num(ah_attr, port_num);
218*4882a593Smuzhiyun 	if (ah->av.ib.stat_rate)
219*4882a593Smuzhiyun 		rdma_ah_set_static_rate(ah_attr,
220*4882a593Smuzhiyun 					ah->av.ib.stat_rate -
221*4882a593Smuzhiyun 					MLX4_STAT_RATE_OFFSET);
222*4882a593Smuzhiyun 	rdma_ah_set_path_bits(ah_attr, ah->av.ib.g_slid & 0x7F);
223*4882a593Smuzhiyun 	if (mlx4_ib_ah_grh_present(ah)) {
224*4882a593Smuzhiyun 		u32 tc_fl = be32_to_cpu(ah->av.ib.sl_tclass_flowlabel);
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun 		rdma_ah_set_grh(ah_attr, NULL,
227*4882a593Smuzhiyun 				tc_fl & 0xfffff, ah->av.ib.gid_index,
228*4882a593Smuzhiyun 				ah->av.ib.hop_limit,
229*4882a593Smuzhiyun 				tc_fl >> 20);
230*4882a593Smuzhiyun 		rdma_ah_set_dgid_raw(ah_attr, ah->av.ib.dgid);
231*4882a593Smuzhiyun 	}
232*4882a593Smuzhiyun 
233*4882a593Smuzhiyun 	return 0;
234*4882a593Smuzhiyun }
235