1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright (c) 2005 Voltaire Inc. All rights reserved.
4*4882a593Smuzhiyun * Copyright (c) 2002-2005, Network Appliance, Inc. All rights reserved.
5*4882a593Smuzhiyun * Copyright (c) 1999-2019, Mellanox Technologies, Inc. All rights reserved.
6*4882a593Smuzhiyun * Copyright (c) 2005-2006 Intel Corporation. All rights reserved.
7*4882a593Smuzhiyun */
8*4882a593Smuzhiyun
9*4882a593Smuzhiyun #include <linux/completion.h>
10*4882a593Smuzhiyun #include <linux/in.h>
11*4882a593Smuzhiyun #include <linux/in6.h>
12*4882a593Smuzhiyun #include <linux/mutex.h>
13*4882a593Smuzhiyun #include <linux/random.h>
14*4882a593Smuzhiyun #include <linux/igmp.h>
15*4882a593Smuzhiyun #include <linux/xarray.h>
16*4882a593Smuzhiyun #include <linux/inetdevice.h>
17*4882a593Smuzhiyun #include <linux/slab.h>
18*4882a593Smuzhiyun #include <linux/module.h>
19*4882a593Smuzhiyun #include <net/route.h>
20*4882a593Smuzhiyun
21*4882a593Smuzhiyun #include <net/net_namespace.h>
22*4882a593Smuzhiyun #include <net/netns/generic.h>
23*4882a593Smuzhiyun #include <net/tcp.h>
24*4882a593Smuzhiyun #include <net/ipv6.h>
25*4882a593Smuzhiyun #include <net/ip_fib.h>
26*4882a593Smuzhiyun #include <net/ip6_route.h>
27*4882a593Smuzhiyun
28*4882a593Smuzhiyun #include <rdma/rdma_cm.h>
29*4882a593Smuzhiyun #include <rdma/rdma_cm_ib.h>
30*4882a593Smuzhiyun #include <rdma/rdma_netlink.h>
31*4882a593Smuzhiyun #include <rdma/ib.h>
32*4882a593Smuzhiyun #include <rdma/ib_cache.h>
33*4882a593Smuzhiyun #include <rdma/ib_cm.h>
34*4882a593Smuzhiyun #include <rdma/ib_sa.h>
35*4882a593Smuzhiyun #include <rdma/iw_cm.h>
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun #include "core_priv.h"
38*4882a593Smuzhiyun #include "cma_priv.h"
39*4882a593Smuzhiyun #include "cma_trace.h"
40*4882a593Smuzhiyun
41*4882a593Smuzhiyun MODULE_AUTHOR("Sean Hefty");
42*4882a593Smuzhiyun MODULE_DESCRIPTION("Generic RDMA CM Agent");
43*4882a593Smuzhiyun MODULE_LICENSE("Dual BSD/GPL");
44*4882a593Smuzhiyun
45*4882a593Smuzhiyun #define CMA_CM_RESPONSE_TIMEOUT 20
46*4882a593Smuzhiyun #define CMA_QUERY_CLASSPORT_INFO_TIMEOUT 3000
47*4882a593Smuzhiyun #define CMA_MAX_CM_RETRIES 15
48*4882a593Smuzhiyun #define CMA_CM_MRA_SETTING (IB_CM_MRA_FLAG_DELAY | 24)
49*4882a593Smuzhiyun #define CMA_IBOE_PACKET_LIFETIME 18
50*4882a593Smuzhiyun #define CMA_PREFERRED_ROCE_GID_TYPE IB_GID_TYPE_ROCE_UDP_ENCAP
51*4882a593Smuzhiyun
52*4882a593Smuzhiyun static const char * const cma_events[] = {
53*4882a593Smuzhiyun [RDMA_CM_EVENT_ADDR_RESOLVED] = "address resolved",
54*4882a593Smuzhiyun [RDMA_CM_EVENT_ADDR_ERROR] = "address error",
55*4882a593Smuzhiyun [RDMA_CM_EVENT_ROUTE_RESOLVED] = "route resolved ",
56*4882a593Smuzhiyun [RDMA_CM_EVENT_ROUTE_ERROR] = "route error",
57*4882a593Smuzhiyun [RDMA_CM_EVENT_CONNECT_REQUEST] = "connect request",
58*4882a593Smuzhiyun [RDMA_CM_EVENT_CONNECT_RESPONSE] = "connect response",
59*4882a593Smuzhiyun [RDMA_CM_EVENT_CONNECT_ERROR] = "connect error",
60*4882a593Smuzhiyun [RDMA_CM_EVENT_UNREACHABLE] = "unreachable",
61*4882a593Smuzhiyun [RDMA_CM_EVENT_REJECTED] = "rejected",
62*4882a593Smuzhiyun [RDMA_CM_EVENT_ESTABLISHED] = "established",
63*4882a593Smuzhiyun [RDMA_CM_EVENT_DISCONNECTED] = "disconnected",
64*4882a593Smuzhiyun [RDMA_CM_EVENT_DEVICE_REMOVAL] = "device removal",
65*4882a593Smuzhiyun [RDMA_CM_EVENT_MULTICAST_JOIN] = "multicast join",
66*4882a593Smuzhiyun [RDMA_CM_EVENT_MULTICAST_ERROR] = "multicast error",
67*4882a593Smuzhiyun [RDMA_CM_EVENT_ADDR_CHANGE] = "address change",
68*4882a593Smuzhiyun [RDMA_CM_EVENT_TIMEWAIT_EXIT] = "timewait exit",
69*4882a593Smuzhiyun };
70*4882a593Smuzhiyun
/* Forward declaration; the definition is not in this part of the file. */
static void cma_iboe_set_mgid(struct sockaddr *addr,
			      union ib_gid *mgid,
			      enum ib_gid_type gid_type);
73*4882a593Smuzhiyun
rdma_event_msg(enum rdma_cm_event_type event)74*4882a593Smuzhiyun const char *__attribute_const__ rdma_event_msg(enum rdma_cm_event_type event)
75*4882a593Smuzhiyun {
76*4882a593Smuzhiyun size_t index = event;
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun return (index < ARRAY_SIZE(cma_events) && cma_events[index]) ?
79*4882a593Smuzhiyun cma_events[index] : "unrecognized event";
80*4882a593Smuzhiyun }
81*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_event_msg);
82*4882a593Smuzhiyun
rdma_reject_msg(struct rdma_cm_id * id,int reason)83*4882a593Smuzhiyun const char *__attribute_const__ rdma_reject_msg(struct rdma_cm_id *id,
84*4882a593Smuzhiyun int reason)
85*4882a593Smuzhiyun {
86*4882a593Smuzhiyun if (rdma_ib_or_roce(id->device, id->port_num))
87*4882a593Smuzhiyun return ibcm_reject_msg(reason);
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun if (rdma_protocol_iwarp(id->device, id->port_num))
90*4882a593Smuzhiyun return iwcm_reject_msg(reason);
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun WARN_ON_ONCE(1);
93*4882a593Smuzhiyun return "unrecognized transport";
94*4882a593Smuzhiyun }
95*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_reject_msg);
96*4882a593Smuzhiyun
/**
 * rdma_is_consumer_reject - return true if the consumer rejected the connect
 *                           request.
 * @id:		Communication identifier that received the REJECT event.
 * @reason:	Value returned in the REJECT event status field.
 *
 * On IB/RoCE ports a consumer reject is IB_CM_REJ_CONSUMER_DEFINED; on iWARP
 * ports it is -ECONNREFUSED.  Any other transport warns once and is treated
 * as "not a consumer reject".
 */
static bool rdma_is_consumer_reject(struct rdma_cm_id *id, int reason)
{
	bool by_consumer;

	if (rdma_ib_or_roce(id->device, id->port_num)) {
		by_consumer = (reason == IB_CM_REJ_CONSUMER_DEFINED);
	} else if (rdma_protocol_iwarp(id->device, id->port_num)) {
		by_consumer = (reason == -ECONNREFUSED);
	} else {
		WARN_ON_ONCE(1);
		by_consumer = false;
	}

	return by_consumer;
}
114*4882a593Smuzhiyun
/**
 * rdma_consumer_reject_data - fetch the private data of a consumer reject
 * @id:		cm id that received the event
 * @ev:		the event; @ev->status is interpreted as the reject reason
 * @data_len:	output, set to the private data length or to 0
 *
 * Returns @ev's connection private data when the reject was issued by the
 * consumer (see rdma_is_consumer_reject()); otherwise returns NULL and
 * stores 0 in @data_len.
 */
const void *rdma_consumer_reject_data(struct rdma_cm_id *id,
				      struct rdma_cm_event *ev, u8 *data_len)
{
	if (!rdma_is_consumer_reject(id, ev->status)) {
		*data_len = 0;
		return NULL;
	}

	*data_len = ev->param.conn.private_data_len;
	return ev->param.conn.private_data;
}
EXPORT_SYMBOL(rdma_consumer_reject_data);
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun /**
132*4882a593Smuzhiyun * rdma_iw_cm_id() - return the iw_cm_id pointer for this cm_id.
133*4882a593Smuzhiyun * @id: Communication Identifier
134*4882a593Smuzhiyun */
rdma_iw_cm_id(struct rdma_cm_id * id)135*4882a593Smuzhiyun struct iw_cm_id *rdma_iw_cm_id(struct rdma_cm_id *id)
136*4882a593Smuzhiyun {
137*4882a593Smuzhiyun struct rdma_id_private *id_priv;
138*4882a593Smuzhiyun
139*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
140*4882a593Smuzhiyun if (id->device->node_type == RDMA_NODE_RNIC)
141*4882a593Smuzhiyun return id_priv->cm_id.iw;
142*4882a593Smuzhiyun return NULL;
143*4882a593Smuzhiyun }
144*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_iw_cm_id);
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun /**
147*4882a593Smuzhiyun * rdma_res_to_id() - return the rdma_cm_id pointer for this restrack.
148*4882a593Smuzhiyun * @res: rdma resource tracking entry pointer
149*4882a593Smuzhiyun */
rdma_res_to_id(struct rdma_restrack_entry * res)150*4882a593Smuzhiyun struct rdma_cm_id *rdma_res_to_id(struct rdma_restrack_entry *res)
151*4882a593Smuzhiyun {
152*4882a593Smuzhiyun struct rdma_id_private *id_priv =
153*4882a593Smuzhiyun container_of(res, struct rdma_id_private, res);
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun return &id_priv->id;
156*4882a593Smuzhiyun }
157*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_res_to_id);
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun static int cma_add_one(struct ib_device *device);
160*4882a593Smuzhiyun static void cma_remove_one(struct ib_device *device, void *client_data);
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun static struct ib_client cma_client = {
163*4882a593Smuzhiyun .name = "cma",
164*4882a593Smuzhiyun .add = cma_add_one,
165*4882a593Smuzhiyun .remove = cma_remove_one
166*4882a593Smuzhiyun };
167*4882a593Smuzhiyun
168*4882a593Smuzhiyun static struct ib_sa_client sa_client;
169*4882a593Smuzhiyun static LIST_HEAD(dev_list);
170*4882a593Smuzhiyun static LIST_HEAD(listen_any_list);
171*4882a593Smuzhiyun static DEFINE_MUTEX(lock);
172*4882a593Smuzhiyun static struct workqueue_struct *cma_wq;
173*4882a593Smuzhiyun static unsigned int cma_pernet_id;
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun struct cma_pernet {
176*4882a593Smuzhiyun struct xarray tcp_ps;
177*4882a593Smuzhiyun struct xarray udp_ps;
178*4882a593Smuzhiyun struct xarray ipoib_ps;
179*4882a593Smuzhiyun struct xarray ib_ps;
180*4882a593Smuzhiyun };
181*4882a593Smuzhiyun
cma_pernet(struct net * net)182*4882a593Smuzhiyun static struct cma_pernet *cma_pernet(struct net *net)
183*4882a593Smuzhiyun {
184*4882a593Smuzhiyun return net_generic(net, cma_pernet_id);
185*4882a593Smuzhiyun }
186*4882a593Smuzhiyun
187*4882a593Smuzhiyun static
cma_pernet_xa(struct net * net,enum rdma_ucm_port_space ps)188*4882a593Smuzhiyun struct xarray *cma_pernet_xa(struct net *net, enum rdma_ucm_port_space ps)
189*4882a593Smuzhiyun {
190*4882a593Smuzhiyun struct cma_pernet *pernet = cma_pernet(net);
191*4882a593Smuzhiyun
192*4882a593Smuzhiyun switch (ps) {
193*4882a593Smuzhiyun case RDMA_PS_TCP:
194*4882a593Smuzhiyun return &pernet->tcp_ps;
195*4882a593Smuzhiyun case RDMA_PS_UDP:
196*4882a593Smuzhiyun return &pernet->udp_ps;
197*4882a593Smuzhiyun case RDMA_PS_IPOIB:
198*4882a593Smuzhiyun return &pernet->ipoib_ps;
199*4882a593Smuzhiyun case RDMA_PS_IB:
200*4882a593Smuzhiyun return &pernet->ib_ps;
201*4882a593Smuzhiyun default:
202*4882a593Smuzhiyun return NULL;
203*4882a593Smuzhiyun }
204*4882a593Smuzhiyun }
205*4882a593Smuzhiyun
206*4882a593Smuzhiyun struct cma_device {
207*4882a593Smuzhiyun struct list_head list;
208*4882a593Smuzhiyun struct ib_device *device;
209*4882a593Smuzhiyun struct completion comp;
210*4882a593Smuzhiyun refcount_t refcount;
211*4882a593Smuzhiyun struct list_head id_list;
212*4882a593Smuzhiyun enum ib_gid_type *default_gid_type;
213*4882a593Smuzhiyun u8 *default_roce_tos;
214*4882a593Smuzhiyun };
215*4882a593Smuzhiyun
216*4882a593Smuzhiyun struct rdma_bind_list {
217*4882a593Smuzhiyun enum rdma_ucm_port_space ps;
218*4882a593Smuzhiyun struct hlist_head owners;
219*4882a593Smuzhiyun unsigned short port;
220*4882a593Smuzhiyun };
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun struct class_port_info_context {
223*4882a593Smuzhiyun struct ib_class_port_info *class_port_info;
224*4882a593Smuzhiyun struct ib_device *device;
225*4882a593Smuzhiyun struct completion done;
226*4882a593Smuzhiyun struct ib_sa_query *sa_query;
227*4882a593Smuzhiyun u8 port_num;
228*4882a593Smuzhiyun };
229*4882a593Smuzhiyun
cma_ps_alloc(struct net * net,enum rdma_ucm_port_space ps,struct rdma_bind_list * bind_list,int snum)230*4882a593Smuzhiyun static int cma_ps_alloc(struct net *net, enum rdma_ucm_port_space ps,
231*4882a593Smuzhiyun struct rdma_bind_list *bind_list, int snum)
232*4882a593Smuzhiyun {
233*4882a593Smuzhiyun struct xarray *xa = cma_pernet_xa(net, ps);
234*4882a593Smuzhiyun
235*4882a593Smuzhiyun return xa_insert(xa, snum, bind_list, GFP_KERNEL);
236*4882a593Smuzhiyun }
237*4882a593Smuzhiyun
/* Return the entry stored at index @snum of the (@net, @ps) table. */
static struct rdma_bind_list *cma_ps_find(struct net *net,
					  enum rdma_ucm_port_space ps,
					  int snum)
{
	return xa_load(cma_pernet_xa(net, ps), snum);
}
245*4882a593Smuzhiyun
/* Erase index @snum from the (@net, @ps) port-space table. */
static void cma_ps_remove(struct net *net, enum rdma_ucm_port_space ps,
			  int snum)
{
	xa_erase(cma_pernet_xa(net, ps), snum);
}
253*4882a593Smuzhiyun
/* Option identifiers.  NOTE(review): users are not visible here. */
enum {
	CMA_OPTION_AFONLY,
};
257*4882a593Smuzhiyun
cma_dev_get(struct cma_device * cma_dev)258*4882a593Smuzhiyun void cma_dev_get(struct cma_device *cma_dev)
259*4882a593Smuzhiyun {
260*4882a593Smuzhiyun refcount_inc(&cma_dev->refcount);
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun
cma_dev_put(struct cma_device * cma_dev)263*4882a593Smuzhiyun void cma_dev_put(struct cma_device *cma_dev)
264*4882a593Smuzhiyun {
265*4882a593Smuzhiyun if (refcount_dec_and_test(&cma_dev->refcount))
266*4882a593Smuzhiyun complete(&cma_dev->comp);
267*4882a593Smuzhiyun }
268*4882a593Smuzhiyun
/*
 * Find the first registered cma device whose ib_device is accepted by
 * @filter(device, @cookie).  The walk runs under the global lock.
 *
 * Returns the match with an extra reference held (release it with
 * cma_dev_put()), or NULL if no device matched.
 */
struct cma_device *cma_enum_devices_by_ibdev(cma_device_filter filter,
					     void *cookie)
{
	struct cma_device *match = NULL;
	struct cma_device *cur;

	mutex_lock(&lock);
	list_for_each_entry(cur, &dev_list, list) {
		if (!filter(cur->device, cookie))
			continue;

		cma_dev_get(cur);
		match = cur;
		break;
	}
	mutex_unlock(&lock);

	return match;
}
288*4882a593Smuzhiyun
cma_get_default_gid_type(struct cma_device * cma_dev,unsigned int port)289*4882a593Smuzhiyun int cma_get_default_gid_type(struct cma_device *cma_dev,
290*4882a593Smuzhiyun unsigned int port)
291*4882a593Smuzhiyun {
292*4882a593Smuzhiyun if (!rdma_is_port_valid(cma_dev->device, port))
293*4882a593Smuzhiyun return -EINVAL;
294*4882a593Smuzhiyun
295*4882a593Smuzhiyun return cma_dev->default_gid_type[port - rdma_start_port(cma_dev->device)];
296*4882a593Smuzhiyun }
297*4882a593Smuzhiyun
cma_set_default_gid_type(struct cma_device * cma_dev,unsigned int port,enum ib_gid_type default_gid_type)298*4882a593Smuzhiyun int cma_set_default_gid_type(struct cma_device *cma_dev,
299*4882a593Smuzhiyun unsigned int port,
300*4882a593Smuzhiyun enum ib_gid_type default_gid_type)
301*4882a593Smuzhiyun {
302*4882a593Smuzhiyun unsigned long supported_gids;
303*4882a593Smuzhiyun
304*4882a593Smuzhiyun if (!rdma_is_port_valid(cma_dev->device, port))
305*4882a593Smuzhiyun return -EINVAL;
306*4882a593Smuzhiyun
307*4882a593Smuzhiyun if (default_gid_type == IB_GID_TYPE_IB &&
308*4882a593Smuzhiyun rdma_protocol_roce_eth_encap(cma_dev->device, port))
309*4882a593Smuzhiyun default_gid_type = IB_GID_TYPE_ROCE;
310*4882a593Smuzhiyun
311*4882a593Smuzhiyun supported_gids = roce_gid_type_mask_support(cma_dev->device, port);
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun if (!(supported_gids & 1 << default_gid_type))
314*4882a593Smuzhiyun return -EINVAL;
315*4882a593Smuzhiyun
316*4882a593Smuzhiyun cma_dev->default_gid_type[port - rdma_start_port(cma_dev->device)] =
317*4882a593Smuzhiyun default_gid_type;
318*4882a593Smuzhiyun
319*4882a593Smuzhiyun return 0;
320*4882a593Smuzhiyun }
321*4882a593Smuzhiyun
cma_get_default_roce_tos(struct cma_device * cma_dev,unsigned int port)322*4882a593Smuzhiyun int cma_get_default_roce_tos(struct cma_device *cma_dev, unsigned int port)
323*4882a593Smuzhiyun {
324*4882a593Smuzhiyun if (!rdma_is_port_valid(cma_dev->device, port))
325*4882a593Smuzhiyun return -EINVAL;
326*4882a593Smuzhiyun
327*4882a593Smuzhiyun return cma_dev->default_roce_tos[port - rdma_start_port(cma_dev->device)];
328*4882a593Smuzhiyun }
329*4882a593Smuzhiyun
/*
 * Store @default_roce_tos as the default RoCE ToS for @port of @cma_dev.
 * Returns 0 on success, or -EINVAL if @port is not a valid port.
 */
int cma_set_default_roce_tos(struct cma_device *cma_dev, unsigned int port,
			     u8 default_roce_tos)
{
	unsigned int idx;

	if (!rdma_is_port_valid(cma_dev->device, port))
		return -EINVAL;

	idx = port - rdma_start_port(cma_dev->device);
	cma_dev->default_roce_tos[idx] = default_roce_tos;

	return 0;
}
cma_get_ib_dev(struct cma_device * cma_dev)341*4882a593Smuzhiyun struct ib_device *cma_get_ib_dev(struct cma_device *cma_dev)
342*4882a593Smuzhiyun {
343*4882a593Smuzhiyun return cma_dev->device;
344*4882a593Smuzhiyun }
345*4882a593Smuzhiyun
/*
 * Device removal can occur at any time, so we need extra handling to
 * serialize notifying the user of device removal with other callbacks.
 * We do this by disabling removal notification while a callback is in
 * progress, and reporting it after the callback completes.
 */
352*4882a593Smuzhiyun
353*4882a593Smuzhiyun struct cma_multicast {
354*4882a593Smuzhiyun struct rdma_id_private *id_priv;
355*4882a593Smuzhiyun union {
356*4882a593Smuzhiyun struct ib_sa_multicast *sa_mc;
357*4882a593Smuzhiyun struct {
358*4882a593Smuzhiyun struct work_struct work;
359*4882a593Smuzhiyun struct rdma_cm_event event;
360*4882a593Smuzhiyun } iboe_join;
361*4882a593Smuzhiyun };
362*4882a593Smuzhiyun struct list_head list;
363*4882a593Smuzhiyun void *context;
364*4882a593Smuzhiyun struct sockaddr_storage addr;
365*4882a593Smuzhiyun u8 join_state;
366*4882a593Smuzhiyun };
367*4882a593Smuzhiyun
368*4882a593Smuzhiyun struct cma_work {
369*4882a593Smuzhiyun struct work_struct work;
370*4882a593Smuzhiyun struct rdma_id_private *id;
371*4882a593Smuzhiyun enum rdma_cm_state old_state;
372*4882a593Smuzhiyun enum rdma_cm_state new_state;
373*4882a593Smuzhiyun struct rdma_cm_event event;
374*4882a593Smuzhiyun };
375*4882a593Smuzhiyun
376*4882a593Smuzhiyun union cma_ip_addr {
377*4882a593Smuzhiyun struct in6_addr ip6;
378*4882a593Smuzhiyun struct {
379*4882a593Smuzhiyun __be32 pad[3];
380*4882a593Smuzhiyun __be32 addr;
381*4882a593Smuzhiyun } ip4;
382*4882a593Smuzhiyun };
383*4882a593Smuzhiyun
384*4882a593Smuzhiyun struct cma_hdr {
385*4882a593Smuzhiyun u8 cma_version;
386*4882a593Smuzhiyun u8 ip_version; /* IP version: 7:4 */
387*4882a593Smuzhiyun __be16 port;
388*4882a593Smuzhiyun union cma_ip_addr src_addr;
389*4882a593Smuzhiyun union cma_ip_addr dst_addr;
390*4882a593Smuzhiyun };
391*4882a593Smuzhiyun
392*4882a593Smuzhiyun #define CMA_VERSION 0x00
393*4882a593Smuzhiyun
394*4882a593Smuzhiyun struct cma_req_info {
395*4882a593Smuzhiyun struct sockaddr_storage listen_addr_storage;
396*4882a593Smuzhiyun struct sockaddr_storage src_addr_storage;
397*4882a593Smuzhiyun struct ib_device *device;
398*4882a593Smuzhiyun union ib_gid local_gid;
399*4882a593Smuzhiyun __be64 service_id;
400*4882a593Smuzhiyun int port;
401*4882a593Smuzhiyun bool has_gid;
402*4882a593Smuzhiyun u16 pkey;
403*4882a593Smuzhiyun };
404*4882a593Smuzhiyun
cma_comp_exch(struct rdma_id_private * id_priv,enum rdma_cm_state comp,enum rdma_cm_state exch)405*4882a593Smuzhiyun static int cma_comp_exch(struct rdma_id_private *id_priv,
406*4882a593Smuzhiyun enum rdma_cm_state comp, enum rdma_cm_state exch)
407*4882a593Smuzhiyun {
408*4882a593Smuzhiyun unsigned long flags;
409*4882a593Smuzhiyun int ret;
410*4882a593Smuzhiyun
411*4882a593Smuzhiyun /*
412*4882a593Smuzhiyun * The FSM uses a funny double locking where state is protected by both
413*4882a593Smuzhiyun * the handler_mutex and the spinlock. State is not allowed to change
414*4882a593Smuzhiyun * to/from a handler_mutex protected value without also holding
415*4882a593Smuzhiyun * handler_mutex.
416*4882a593Smuzhiyun */
417*4882a593Smuzhiyun if (comp == RDMA_CM_CONNECT || exch == RDMA_CM_CONNECT)
418*4882a593Smuzhiyun lockdep_assert_held(&id_priv->handler_mutex);
419*4882a593Smuzhiyun
420*4882a593Smuzhiyun spin_lock_irqsave(&id_priv->lock, flags);
421*4882a593Smuzhiyun if ((ret = (id_priv->state == comp)))
422*4882a593Smuzhiyun id_priv->state = exch;
423*4882a593Smuzhiyun spin_unlock_irqrestore(&id_priv->lock, flags);
424*4882a593Smuzhiyun return ret;
425*4882a593Smuzhiyun }
426*4882a593Smuzhiyun
cma_get_ip_ver(const struct cma_hdr * hdr)427*4882a593Smuzhiyun static inline u8 cma_get_ip_ver(const struct cma_hdr *hdr)
428*4882a593Smuzhiyun {
429*4882a593Smuzhiyun return hdr->ip_version >> 4;
430*4882a593Smuzhiyun }
431*4882a593Smuzhiyun
/*
 * Store @ip_ver in the upper nibble of @hdr->ip_version, leaving the lower
 * nibble untouched.
 */
static inline void cma_set_ip_ver(struct cma_hdr *hdr, u8 ip_ver)
{
	u8 low_nibble = hdr->ip_version & 0xF;

	hdr->ip_version = (ip_ver << 4) | low_nibble;
}
436*4882a593Smuzhiyun
/*
 * Join (@join true) or leave the IPv4 multicast group whose address is held
 * in bytes 12..15 of @mgid, on the in_device of @ndev.  Runs under the RTNL
 * lock.
 *
 * Returns 0 when @ndev has an in_device, -ENODEV when @ndev is NULL or has
 * none.
 */
static int cma_igmp_send(struct net_device *ndev, union ib_gid *mgid, bool join)
{
	struct in_device *in_dev;
	__be32 group;

	if (!ndev)
		return -ENODEV;

	rtnl_lock();
	in_dev = __in_dev_get_rtnl(ndev);
	if (in_dev) {
		group = *(__be32 *)(mgid->raw + 12);
		if (join)
			ip_mc_inc_group(in_dev, group);
		else
			ip_mc_dec_group(in_dev, group);
	}
	rtnl_unlock();

	return in_dev ? 0 : -ENODEV;
}
456*4882a593Smuzhiyun
_cma_attach_to_dev(struct rdma_id_private * id_priv,struct cma_device * cma_dev)457*4882a593Smuzhiyun static void _cma_attach_to_dev(struct rdma_id_private *id_priv,
458*4882a593Smuzhiyun struct cma_device *cma_dev)
459*4882a593Smuzhiyun {
460*4882a593Smuzhiyun cma_dev_get(cma_dev);
461*4882a593Smuzhiyun id_priv->cma_dev = cma_dev;
462*4882a593Smuzhiyun id_priv->id.device = cma_dev->device;
463*4882a593Smuzhiyun id_priv->id.route.addr.dev_addr.transport =
464*4882a593Smuzhiyun rdma_node_get_transport(cma_dev->device->node_type);
465*4882a593Smuzhiyun list_add_tail(&id_priv->list, &cma_dev->id_list);
466*4882a593Smuzhiyun
467*4882a593Smuzhiyun trace_cm_id_attach(id_priv, cma_dev->device);
468*4882a593Smuzhiyun }
469*4882a593Smuzhiyun
cma_attach_to_dev(struct rdma_id_private * id_priv,struct cma_device * cma_dev)470*4882a593Smuzhiyun static void cma_attach_to_dev(struct rdma_id_private *id_priv,
471*4882a593Smuzhiyun struct cma_device *cma_dev)
472*4882a593Smuzhiyun {
473*4882a593Smuzhiyun _cma_attach_to_dev(id_priv, cma_dev);
474*4882a593Smuzhiyun id_priv->gid_type =
475*4882a593Smuzhiyun cma_dev->default_gid_type[id_priv->id.port_num -
476*4882a593Smuzhiyun rdma_start_port(cma_dev->device)];
477*4882a593Smuzhiyun }
478*4882a593Smuzhiyun
cma_release_dev(struct rdma_id_private * id_priv)479*4882a593Smuzhiyun static void cma_release_dev(struct rdma_id_private *id_priv)
480*4882a593Smuzhiyun {
481*4882a593Smuzhiyun mutex_lock(&lock);
482*4882a593Smuzhiyun list_del(&id_priv->list);
483*4882a593Smuzhiyun cma_dev_put(id_priv->cma_dev);
484*4882a593Smuzhiyun id_priv->cma_dev = NULL;
485*4882a593Smuzhiyun id_priv->id.device = NULL;
486*4882a593Smuzhiyun if (id_priv->id.route.addr.dev_addr.sgid_attr) {
487*4882a593Smuzhiyun rdma_put_gid_attr(id_priv->id.route.addr.dev_addr.sgid_attr);
488*4882a593Smuzhiyun id_priv->id.route.addr.dev_addr.sgid_attr = NULL;
489*4882a593Smuzhiyun }
490*4882a593Smuzhiyun mutex_unlock(&lock);
491*4882a593Smuzhiyun }
492*4882a593Smuzhiyun
cma_src_addr(struct rdma_id_private * id_priv)493*4882a593Smuzhiyun static inline struct sockaddr *cma_src_addr(struct rdma_id_private *id_priv)
494*4882a593Smuzhiyun {
495*4882a593Smuzhiyun return (struct sockaddr *) &id_priv->id.route.addr.src_addr;
496*4882a593Smuzhiyun }
497*4882a593Smuzhiyun
cma_dst_addr(struct rdma_id_private * id_priv)498*4882a593Smuzhiyun static inline struct sockaddr *cma_dst_addr(struct rdma_id_private *id_priv)
499*4882a593Smuzhiyun {
500*4882a593Smuzhiyun return (struct sockaddr *) &id_priv->id.route.addr.dst_addr;
501*4882a593Smuzhiyun }
502*4882a593Smuzhiyun
cma_family(struct rdma_id_private * id_priv)503*4882a593Smuzhiyun static inline unsigned short cma_family(struct rdma_id_private *id_priv)
504*4882a593Smuzhiyun {
505*4882a593Smuzhiyun return id_priv->id.route.addr.src_addr.ss_family;
506*4882a593Smuzhiyun }
507*4882a593Smuzhiyun
/*
 * Establish the QKey of @id_priv.
 *
 * - If a QKey is already set, a non-zero @qkey must match it (-EINVAL
 *   otherwise); nothing is changed.
 * - Otherwise a non-zero @qkey is stored as is.
 * - Otherwise a default is chosen from the port space: RDMA_UDP_QKEY for
 *   RDMA_PS_UDP and RDMA_PS_IB; for RDMA_PS_IPOIB the QKey of the multicast
 *   member record looked up for the device address' MGID.  Other port
 *   spaces leave the QKey unset.
 *
 * Returns 0 on success, -EINVAL on mismatch, or the error returned by
 * ib_sa_get_mcmember_rec().
 */
static int cma_set_qkey(struct rdma_id_private *id_priv, u32 qkey)
{
	struct ib_sa_mcmember_rec rec;
	int ret = 0;

	if (id_priv->qkey)
		return (qkey && id_priv->qkey != qkey) ? -EINVAL : 0;

	if (qkey) {
		id_priv->qkey = qkey;
		return 0;
	}

	switch (id_priv->id.ps) {
	case RDMA_PS_UDP:
	case RDMA_PS_IB:
		id_priv->qkey = RDMA_UDP_QKEY;
		break;
	case RDMA_PS_IPOIB:
		ib_addr_get_mgid(&id_priv->id.route.addr.dev_addr, &rec.mgid);
		ret = ib_sa_get_mcmember_rec(id_priv->id.device,
					     id_priv->id.port_num, &rec.mgid,
					     &rec);
		if (ret)
			break;
		id_priv->qkey = be32_to_cpu(rec.qkey);
		break;
	default:
		break;
	}

	return ret;
}
542*4882a593Smuzhiyun
cma_translate_ib(struct sockaddr_ib * sib,struct rdma_dev_addr * dev_addr)543*4882a593Smuzhiyun static void cma_translate_ib(struct sockaddr_ib *sib, struct rdma_dev_addr *dev_addr)
544*4882a593Smuzhiyun {
545*4882a593Smuzhiyun dev_addr->dev_type = ARPHRD_INFINIBAND;
546*4882a593Smuzhiyun rdma_addr_set_sgid(dev_addr, (union ib_gid *) &sib->sib_addr);
547*4882a593Smuzhiyun ib_addr_set_pkey(dev_addr, ntohs(sib->sib_pkey));
548*4882a593Smuzhiyun }
549*4882a593Smuzhiyun
cma_translate_addr(struct sockaddr * addr,struct rdma_dev_addr * dev_addr)550*4882a593Smuzhiyun static int cma_translate_addr(struct sockaddr *addr, struct rdma_dev_addr *dev_addr)
551*4882a593Smuzhiyun {
552*4882a593Smuzhiyun int ret;
553*4882a593Smuzhiyun
554*4882a593Smuzhiyun if (addr->sa_family != AF_IB) {
555*4882a593Smuzhiyun ret = rdma_translate_ip(addr, dev_addr);
556*4882a593Smuzhiyun } else {
557*4882a593Smuzhiyun cma_translate_ib((struct sockaddr_ib *) addr, dev_addr);
558*4882a593Smuzhiyun ret = 0;
559*4882a593Smuzhiyun }
560*4882a593Smuzhiyun
561*4882a593Smuzhiyun return ret;
562*4882a593Smuzhiyun }
563*4882a593Smuzhiyun
564*4882a593Smuzhiyun static const struct ib_gid_attr *
cma_validate_port(struct ib_device * device,u8 port,enum ib_gid_type gid_type,union ib_gid * gid,struct rdma_id_private * id_priv)565*4882a593Smuzhiyun cma_validate_port(struct ib_device *device, u8 port,
566*4882a593Smuzhiyun enum ib_gid_type gid_type,
567*4882a593Smuzhiyun union ib_gid *gid,
568*4882a593Smuzhiyun struct rdma_id_private *id_priv)
569*4882a593Smuzhiyun {
570*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
571*4882a593Smuzhiyun int bound_if_index = dev_addr->bound_dev_if;
572*4882a593Smuzhiyun const struct ib_gid_attr *sgid_attr;
573*4882a593Smuzhiyun int dev_type = dev_addr->dev_type;
574*4882a593Smuzhiyun struct net_device *ndev = NULL;
575*4882a593Smuzhiyun
576*4882a593Smuzhiyun if (!rdma_dev_access_netns(device, id_priv->id.route.addr.dev_addr.net))
577*4882a593Smuzhiyun return ERR_PTR(-ENODEV);
578*4882a593Smuzhiyun
579*4882a593Smuzhiyun if ((dev_type == ARPHRD_INFINIBAND) && !rdma_protocol_ib(device, port))
580*4882a593Smuzhiyun return ERR_PTR(-ENODEV);
581*4882a593Smuzhiyun
582*4882a593Smuzhiyun if ((dev_type != ARPHRD_INFINIBAND) && rdma_protocol_ib(device, port))
583*4882a593Smuzhiyun return ERR_PTR(-ENODEV);
584*4882a593Smuzhiyun
585*4882a593Smuzhiyun if (dev_type == ARPHRD_ETHER && rdma_protocol_roce(device, port)) {
586*4882a593Smuzhiyun ndev = dev_get_by_index(dev_addr->net, bound_if_index);
587*4882a593Smuzhiyun if (!ndev)
588*4882a593Smuzhiyun return ERR_PTR(-ENODEV);
589*4882a593Smuzhiyun } else {
590*4882a593Smuzhiyun gid_type = IB_GID_TYPE_IB;
591*4882a593Smuzhiyun }
592*4882a593Smuzhiyun
593*4882a593Smuzhiyun sgid_attr = rdma_find_gid_by_port(device, gid, gid_type, port, ndev);
594*4882a593Smuzhiyun if (ndev)
595*4882a593Smuzhiyun dev_put(ndev);
596*4882a593Smuzhiyun return sgid_attr;
597*4882a593Smuzhiyun }
598*4882a593Smuzhiyun
cma_bind_sgid_attr(struct rdma_id_private * id_priv,const struct ib_gid_attr * sgid_attr)599*4882a593Smuzhiyun static void cma_bind_sgid_attr(struct rdma_id_private *id_priv,
600*4882a593Smuzhiyun const struct ib_gid_attr *sgid_attr)
601*4882a593Smuzhiyun {
602*4882a593Smuzhiyun WARN_ON(id_priv->id.route.addr.dev_addr.sgid_attr);
603*4882a593Smuzhiyun id_priv->id.route.addr.dev_addr.sgid_attr = sgid_attr;
604*4882a593Smuzhiyun }
605*4882a593Smuzhiyun
606*4882a593Smuzhiyun /**
607*4882a593Smuzhiyun * cma_acquire_dev_by_src_ip - Acquire cma device, port, gid attribute
608*4882a593Smuzhiyun * based on source ip address.
609*4882a593Smuzhiyun * @id_priv: cm_id which should be bound to cma device
610*4882a593Smuzhiyun *
611*4882a593Smuzhiyun * cma_acquire_dev_by_src_ip() binds cm id to cma device, port and GID attribute
612*4882a593Smuzhiyun * based on source IP address. It returns 0 on success or error code otherwise.
613*4882a593Smuzhiyun * It is applicable to active and passive side cm_id.
614*4882a593Smuzhiyun */
cma_acquire_dev_by_src_ip(struct rdma_id_private * id_priv)615*4882a593Smuzhiyun static int cma_acquire_dev_by_src_ip(struct rdma_id_private *id_priv)
616*4882a593Smuzhiyun {
617*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
618*4882a593Smuzhiyun const struct ib_gid_attr *sgid_attr;
619*4882a593Smuzhiyun union ib_gid gid, iboe_gid, *gidp;
620*4882a593Smuzhiyun struct cma_device *cma_dev;
621*4882a593Smuzhiyun enum ib_gid_type gid_type;
622*4882a593Smuzhiyun int ret = -ENODEV;
623*4882a593Smuzhiyun unsigned int port;
624*4882a593Smuzhiyun
625*4882a593Smuzhiyun if (dev_addr->dev_type != ARPHRD_INFINIBAND &&
626*4882a593Smuzhiyun id_priv->id.ps == RDMA_PS_IPOIB)
627*4882a593Smuzhiyun return -EINVAL;
628*4882a593Smuzhiyun
629*4882a593Smuzhiyun rdma_ip2gid((struct sockaddr *)&id_priv->id.route.addr.src_addr,
630*4882a593Smuzhiyun &iboe_gid);
631*4882a593Smuzhiyun
632*4882a593Smuzhiyun memcpy(&gid, dev_addr->src_dev_addr +
633*4882a593Smuzhiyun rdma_addr_gid_offset(dev_addr), sizeof(gid));
634*4882a593Smuzhiyun
635*4882a593Smuzhiyun mutex_lock(&lock);
636*4882a593Smuzhiyun list_for_each_entry(cma_dev, &dev_list, list) {
637*4882a593Smuzhiyun rdma_for_each_port (cma_dev->device, port) {
638*4882a593Smuzhiyun gidp = rdma_protocol_roce(cma_dev->device, port) ?
639*4882a593Smuzhiyun &iboe_gid : &gid;
640*4882a593Smuzhiyun gid_type = cma_dev->default_gid_type[port - 1];
641*4882a593Smuzhiyun sgid_attr = cma_validate_port(cma_dev->device, port,
642*4882a593Smuzhiyun gid_type, gidp, id_priv);
643*4882a593Smuzhiyun if (!IS_ERR(sgid_attr)) {
644*4882a593Smuzhiyun id_priv->id.port_num = port;
645*4882a593Smuzhiyun cma_bind_sgid_attr(id_priv, sgid_attr);
646*4882a593Smuzhiyun cma_attach_to_dev(id_priv, cma_dev);
647*4882a593Smuzhiyun ret = 0;
648*4882a593Smuzhiyun goto out;
649*4882a593Smuzhiyun }
650*4882a593Smuzhiyun }
651*4882a593Smuzhiyun }
652*4882a593Smuzhiyun out:
653*4882a593Smuzhiyun mutex_unlock(&lock);
654*4882a593Smuzhiyun return ret;
655*4882a593Smuzhiyun }
656*4882a593Smuzhiyun
657*4882a593Smuzhiyun /**
658*4882a593Smuzhiyun * cma_ib_acquire_dev - Acquire cma device, port and SGID attribute
659*4882a593Smuzhiyun * @id_priv: cm id to bind to cma device
660*4882a593Smuzhiyun * @listen_id_priv: listener cm id to match against
661*4882a593Smuzhiyun * @req: Pointer to req structure containaining incoming
662*4882a593Smuzhiyun * request information
663*4882a593Smuzhiyun * cma_ib_acquire_dev() acquires cma device, port and SGID attribute when
664*4882a593Smuzhiyun * rdma device matches for listen_id and incoming request. It also verifies
665*4882a593Smuzhiyun * that a GID table entry is present for the source address.
666*4882a593Smuzhiyun * Returns 0 on success, or returns error code otherwise.
667*4882a593Smuzhiyun */
cma_ib_acquire_dev(struct rdma_id_private * id_priv,const struct rdma_id_private * listen_id_priv,struct cma_req_info * req)668*4882a593Smuzhiyun static int cma_ib_acquire_dev(struct rdma_id_private *id_priv,
669*4882a593Smuzhiyun const struct rdma_id_private *listen_id_priv,
670*4882a593Smuzhiyun struct cma_req_info *req)
671*4882a593Smuzhiyun {
672*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
673*4882a593Smuzhiyun const struct ib_gid_attr *sgid_attr;
674*4882a593Smuzhiyun enum ib_gid_type gid_type;
675*4882a593Smuzhiyun union ib_gid gid;
676*4882a593Smuzhiyun
677*4882a593Smuzhiyun if (dev_addr->dev_type != ARPHRD_INFINIBAND &&
678*4882a593Smuzhiyun id_priv->id.ps == RDMA_PS_IPOIB)
679*4882a593Smuzhiyun return -EINVAL;
680*4882a593Smuzhiyun
681*4882a593Smuzhiyun if (rdma_protocol_roce(req->device, req->port))
682*4882a593Smuzhiyun rdma_ip2gid((struct sockaddr *)&id_priv->id.route.addr.src_addr,
683*4882a593Smuzhiyun &gid);
684*4882a593Smuzhiyun else
685*4882a593Smuzhiyun memcpy(&gid, dev_addr->src_dev_addr +
686*4882a593Smuzhiyun rdma_addr_gid_offset(dev_addr), sizeof(gid));
687*4882a593Smuzhiyun
688*4882a593Smuzhiyun gid_type = listen_id_priv->cma_dev->default_gid_type[req->port - 1];
689*4882a593Smuzhiyun sgid_attr = cma_validate_port(req->device, req->port,
690*4882a593Smuzhiyun gid_type, &gid, id_priv);
691*4882a593Smuzhiyun if (IS_ERR(sgid_attr))
692*4882a593Smuzhiyun return PTR_ERR(sgid_attr);
693*4882a593Smuzhiyun
694*4882a593Smuzhiyun id_priv->id.port_num = req->port;
695*4882a593Smuzhiyun cma_bind_sgid_attr(id_priv, sgid_attr);
696*4882a593Smuzhiyun /* Need to acquire lock to protect against reader
697*4882a593Smuzhiyun * of cma_dev->id_list such as cma_netdev_callback() and
698*4882a593Smuzhiyun * cma_process_remove().
699*4882a593Smuzhiyun */
700*4882a593Smuzhiyun mutex_lock(&lock);
701*4882a593Smuzhiyun cma_attach_to_dev(id_priv, listen_id_priv->cma_dev);
702*4882a593Smuzhiyun mutex_unlock(&lock);
703*4882a593Smuzhiyun rdma_restrack_add(&id_priv->res);
704*4882a593Smuzhiyun return 0;
705*4882a593Smuzhiyun }
706*4882a593Smuzhiyun
cma_iw_acquire_dev(struct rdma_id_private * id_priv,const struct rdma_id_private * listen_id_priv)707*4882a593Smuzhiyun static int cma_iw_acquire_dev(struct rdma_id_private *id_priv,
708*4882a593Smuzhiyun const struct rdma_id_private *listen_id_priv)
709*4882a593Smuzhiyun {
710*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
711*4882a593Smuzhiyun const struct ib_gid_attr *sgid_attr;
712*4882a593Smuzhiyun struct cma_device *cma_dev;
713*4882a593Smuzhiyun enum ib_gid_type gid_type;
714*4882a593Smuzhiyun int ret = -ENODEV;
715*4882a593Smuzhiyun unsigned int port;
716*4882a593Smuzhiyun union ib_gid gid;
717*4882a593Smuzhiyun
718*4882a593Smuzhiyun if (dev_addr->dev_type != ARPHRD_INFINIBAND &&
719*4882a593Smuzhiyun id_priv->id.ps == RDMA_PS_IPOIB)
720*4882a593Smuzhiyun return -EINVAL;
721*4882a593Smuzhiyun
722*4882a593Smuzhiyun memcpy(&gid, dev_addr->src_dev_addr +
723*4882a593Smuzhiyun rdma_addr_gid_offset(dev_addr), sizeof(gid));
724*4882a593Smuzhiyun
725*4882a593Smuzhiyun mutex_lock(&lock);
726*4882a593Smuzhiyun
727*4882a593Smuzhiyun cma_dev = listen_id_priv->cma_dev;
728*4882a593Smuzhiyun port = listen_id_priv->id.port_num;
729*4882a593Smuzhiyun gid_type = listen_id_priv->gid_type;
730*4882a593Smuzhiyun sgid_attr = cma_validate_port(cma_dev->device, port,
731*4882a593Smuzhiyun gid_type, &gid, id_priv);
732*4882a593Smuzhiyun if (!IS_ERR(sgid_attr)) {
733*4882a593Smuzhiyun id_priv->id.port_num = port;
734*4882a593Smuzhiyun cma_bind_sgid_attr(id_priv, sgid_attr);
735*4882a593Smuzhiyun ret = 0;
736*4882a593Smuzhiyun goto out;
737*4882a593Smuzhiyun }
738*4882a593Smuzhiyun
739*4882a593Smuzhiyun list_for_each_entry(cma_dev, &dev_list, list) {
740*4882a593Smuzhiyun rdma_for_each_port (cma_dev->device, port) {
741*4882a593Smuzhiyun if (listen_id_priv->cma_dev == cma_dev &&
742*4882a593Smuzhiyun listen_id_priv->id.port_num == port)
743*4882a593Smuzhiyun continue;
744*4882a593Smuzhiyun
745*4882a593Smuzhiyun gid_type = cma_dev->default_gid_type[port - 1];
746*4882a593Smuzhiyun sgid_attr = cma_validate_port(cma_dev->device, port,
747*4882a593Smuzhiyun gid_type, &gid, id_priv);
748*4882a593Smuzhiyun if (!IS_ERR(sgid_attr)) {
749*4882a593Smuzhiyun id_priv->id.port_num = port;
750*4882a593Smuzhiyun cma_bind_sgid_attr(id_priv, sgid_attr);
751*4882a593Smuzhiyun ret = 0;
752*4882a593Smuzhiyun goto out;
753*4882a593Smuzhiyun }
754*4882a593Smuzhiyun }
755*4882a593Smuzhiyun }
756*4882a593Smuzhiyun
757*4882a593Smuzhiyun out:
758*4882a593Smuzhiyun if (!ret) {
759*4882a593Smuzhiyun cma_attach_to_dev(id_priv, cma_dev);
760*4882a593Smuzhiyun rdma_restrack_add(&id_priv->res);
761*4882a593Smuzhiyun }
762*4882a593Smuzhiyun
763*4882a593Smuzhiyun mutex_unlock(&lock);
764*4882a593Smuzhiyun return ret;
765*4882a593Smuzhiyun }
766*4882a593Smuzhiyun
767*4882a593Smuzhiyun /*
768*4882a593Smuzhiyun * Select the source IB device and address to reach the destination IB address.
769*4882a593Smuzhiyun */
cma_resolve_ib_dev(struct rdma_id_private * id_priv)770*4882a593Smuzhiyun static int cma_resolve_ib_dev(struct rdma_id_private *id_priv)
771*4882a593Smuzhiyun {
772*4882a593Smuzhiyun struct cma_device *cma_dev, *cur_dev;
773*4882a593Smuzhiyun struct sockaddr_ib *addr;
774*4882a593Smuzhiyun union ib_gid gid, sgid, *dgid;
775*4882a593Smuzhiyun unsigned int p;
776*4882a593Smuzhiyun u16 pkey, index;
777*4882a593Smuzhiyun enum ib_port_state port_state;
778*4882a593Smuzhiyun int ret;
779*4882a593Smuzhiyun int i;
780*4882a593Smuzhiyun
781*4882a593Smuzhiyun cma_dev = NULL;
782*4882a593Smuzhiyun addr = (struct sockaddr_ib *) cma_dst_addr(id_priv);
783*4882a593Smuzhiyun dgid = (union ib_gid *) &addr->sib_addr;
784*4882a593Smuzhiyun pkey = ntohs(addr->sib_pkey);
785*4882a593Smuzhiyun
786*4882a593Smuzhiyun mutex_lock(&lock);
787*4882a593Smuzhiyun list_for_each_entry(cur_dev, &dev_list, list) {
788*4882a593Smuzhiyun rdma_for_each_port (cur_dev->device, p) {
789*4882a593Smuzhiyun if (!rdma_cap_af_ib(cur_dev->device, p))
790*4882a593Smuzhiyun continue;
791*4882a593Smuzhiyun
792*4882a593Smuzhiyun if (ib_find_cached_pkey(cur_dev->device, p, pkey, &index))
793*4882a593Smuzhiyun continue;
794*4882a593Smuzhiyun
795*4882a593Smuzhiyun if (ib_get_cached_port_state(cur_dev->device, p, &port_state))
796*4882a593Smuzhiyun continue;
797*4882a593Smuzhiyun
798*4882a593Smuzhiyun for (i = 0; i < cur_dev->device->port_data[p].immutable.gid_tbl_len;
799*4882a593Smuzhiyun ++i) {
800*4882a593Smuzhiyun ret = rdma_query_gid(cur_dev->device, p, i,
801*4882a593Smuzhiyun &gid);
802*4882a593Smuzhiyun if (ret)
803*4882a593Smuzhiyun continue;
804*4882a593Smuzhiyun
805*4882a593Smuzhiyun if (!memcmp(&gid, dgid, sizeof(gid))) {
806*4882a593Smuzhiyun cma_dev = cur_dev;
807*4882a593Smuzhiyun sgid = gid;
808*4882a593Smuzhiyun id_priv->id.port_num = p;
809*4882a593Smuzhiyun goto found;
810*4882a593Smuzhiyun }
811*4882a593Smuzhiyun
812*4882a593Smuzhiyun if (!cma_dev && (gid.global.subnet_prefix ==
813*4882a593Smuzhiyun dgid->global.subnet_prefix) &&
814*4882a593Smuzhiyun port_state == IB_PORT_ACTIVE) {
815*4882a593Smuzhiyun cma_dev = cur_dev;
816*4882a593Smuzhiyun sgid = gid;
817*4882a593Smuzhiyun id_priv->id.port_num = p;
818*4882a593Smuzhiyun goto found;
819*4882a593Smuzhiyun }
820*4882a593Smuzhiyun }
821*4882a593Smuzhiyun }
822*4882a593Smuzhiyun }
823*4882a593Smuzhiyun mutex_unlock(&lock);
824*4882a593Smuzhiyun return -ENODEV;
825*4882a593Smuzhiyun
826*4882a593Smuzhiyun found:
827*4882a593Smuzhiyun cma_attach_to_dev(id_priv, cma_dev);
828*4882a593Smuzhiyun rdma_restrack_add(&id_priv->res);
829*4882a593Smuzhiyun mutex_unlock(&lock);
830*4882a593Smuzhiyun addr = (struct sockaddr_ib *)cma_src_addr(id_priv);
831*4882a593Smuzhiyun memcpy(&addr->sib_addr, &sgid, sizeof(sgid));
832*4882a593Smuzhiyun cma_translate_ib(addr, &id_priv->id.route.addr.dev_addr);
833*4882a593Smuzhiyun return 0;
834*4882a593Smuzhiyun }
835*4882a593Smuzhiyun
cma_id_get(struct rdma_id_private * id_priv)836*4882a593Smuzhiyun static void cma_id_get(struct rdma_id_private *id_priv)
837*4882a593Smuzhiyun {
838*4882a593Smuzhiyun refcount_inc(&id_priv->refcount);
839*4882a593Smuzhiyun }
840*4882a593Smuzhiyun
cma_id_put(struct rdma_id_private * id_priv)841*4882a593Smuzhiyun static void cma_id_put(struct rdma_id_private *id_priv)
842*4882a593Smuzhiyun {
843*4882a593Smuzhiyun if (refcount_dec_and_test(&id_priv->refcount))
844*4882a593Smuzhiyun complete(&id_priv->comp);
845*4882a593Smuzhiyun }
846*4882a593Smuzhiyun
847*4882a593Smuzhiyun static struct rdma_id_private *
__rdma_create_id(struct net * net,rdma_cm_event_handler event_handler,void * context,enum rdma_ucm_port_space ps,enum ib_qp_type qp_type,const struct rdma_id_private * parent)848*4882a593Smuzhiyun __rdma_create_id(struct net *net, rdma_cm_event_handler event_handler,
849*4882a593Smuzhiyun void *context, enum rdma_ucm_port_space ps,
850*4882a593Smuzhiyun enum ib_qp_type qp_type, const struct rdma_id_private *parent)
851*4882a593Smuzhiyun {
852*4882a593Smuzhiyun struct rdma_id_private *id_priv;
853*4882a593Smuzhiyun
854*4882a593Smuzhiyun id_priv = kzalloc(sizeof *id_priv, GFP_KERNEL);
855*4882a593Smuzhiyun if (!id_priv)
856*4882a593Smuzhiyun return ERR_PTR(-ENOMEM);
857*4882a593Smuzhiyun
858*4882a593Smuzhiyun id_priv->state = RDMA_CM_IDLE;
859*4882a593Smuzhiyun id_priv->id.context = context;
860*4882a593Smuzhiyun id_priv->id.event_handler = event_handler;
861*4882a593Smuzhiyun id_priv->id.ps = ps;
862*4882a593Smuzhiyun id_priv->id.qp_type = qp_type;
863*4882a593Smuzhiyun id_priv->tos_set = false;
864*4882a593Smuzhiyun id_priv->timeout_set = false;
865*4882a593Smuzhiyun id_priv->gid_type = IB_GID_TYPE_IB;
866*4882a593Smuzhiyun spin_lock_init(&id_priv->lock);
867*4882a593Smuzhiyun mutex_init(&id_priv->qp_mutex);
868*4882a593Smuzhiyun init_completion(&id_priv->comp);
869*4882a593Smuzhiyun refcount_set(&id_priv->refcount, 1);
870*4882a593Smuzhiyun mutex_init(&id_priv->handler_mutex);
871*4882a593Smuzhiyun INIT_LIST_HEAD(&id_priv->listen_list);
872*4882a593Smuzhiyun INIT_LIST_HEAD(&id_priv->mc_list);
873*4882a593Smuzhiyun get_random_bytes(&id_priv->seq_num, sizeof id_priv->seq_num);
874*4882a593Smuzhiyun id_priv->id.route.addr.dev_addr.net = get_net(net);
875*4882a593Smuzhiyun id_priv->seq_num &= 0x00ffffff;
876*4882a593Smuzhiyun
877*4882a593Smuzhiyun rdma_restrack_new(&id_priv->res, RDMA_RESTRACK_CM_ID);
878*4882a593Smuzhiyun if (parent)
879*4882a593Smuzhiyun rdma_restrack_parent_name(&id_priv->res, &parent->res);
880*4882a593Smuzhiyun
881*4882a593Smuzhiyun return id_priv;
882*4882a593Smuzhiyun }
883*4882a593Smuzhiyun
884*4882a593Smuzhiyun struct rdma_cm_id *
__rdma_create_kernel_id(struct net * net,rdma_cm_event_handler event_handler,void * context,enum rdma_ucm_port_space ps,enum ib_qp_type qp_type,const char * caller)885*4882a593Smuzhiyun __rdma_create_kernel_id(struct net *net, rdma_cm_event_handler event_handler,
886*4882a593Smuzhiyun void *context, enum rdma_ucm_port_space ps,
887*4882a593Smuzhiyun enum ib_qp_type qp_type, const char *caller)
888*4882a593Smuzhiyun {
889*4882a593Smuzhiyun struct rdma_id_private *ret;
890*4882a593Smuzhiyun
891*4882a593Smuzhiyun ret = __rdma_create_id(net, event_handler, context, ps, qp_type, NULL);
892*4882a593Smuzhiyun if (IS_ERR(ret))
893*4882a593Smuzhiyun return ERR_CAST(ret);
894*4882a593Smuzhiyun
895*4882a593Smuzhiyun rdma_restrack_set_name(&ret->res, caller);
896*4882a593Smuzhiyun return &ret->id;
897*4882a593Smuzhiyun }
898*4882a593Smuzhiyun EXPORT_SYMBOL(__rdma_create_kernel_id);
899*4882a593Smuzhiyun
/*
 * Create a cm id in the network namespace of the current task, with no
 * parent, and pass a NULL name to rdma_restrack_set_name().
 * Returns the embedded rdma_cm_id, or the ERR_PTR from __rdma_create_id().
 */
struct rdma_cm_id *rdma_create_user_id(rdma_cm_event_handler event_handler,
				       void *context,
				       enum rdma_ucm_port_space ps,
				       enum ib_qp_type qp_type)
{
	struct net *net = current->nsproxy->net_ns;
	struct rdma_id_private *id_priv;

	id_priv = __rdma_create_id(net, event_handler, context, ps, qp_type,
				   NULL);
	if (IS_ERR(id_priv))
		return ERR_CAST(id_priv);

	rdma_restrack_set_name(&id_priv->res, NULL);
	return &id_priv->id;
}
EXPORT_SYMBOL(rdma_create_user_id);
916*4882a593Smuzhiyun
cma_init_ud_qp(struct rdma_id_private * id_priv,struct ib_qp * qp)917*4882a593Smuzhiyun static int cma_init_ud_qp(struct rdma_id_private *id_priv, struct ib_qp *qp)
918*4882a593Smuzhiyun {
919*4882a593Smuzhiyun struct ib_qp_attr qp_attr;
920*4882a593Smuzhiyun int qp_attr_mask, ret;
921*4882a593Smuzhiyun
922*4882a593Smuzhiyun qp_attr.qp_state = IB_QPS_INIT;
923*4882a593Smuzhiyun ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
924*4882a593Smuzhiyun if (ret)
925*4882a593Smuzhiyun return ret;
926*4882a593Smuzhiyun
927*4882a593Smuzhiyun ret = ib_modify_qp(qp, &qp_attr, qp_attr_mask);
928*4882a593Smuzhiyun if (ret)
929*4882a593Smuzhiyun return ret;
930*4882a593Smuzhiyun
931*4882a593Smuzhiyun qp_attr.qp_state = IB_QPS_RTR;
932*4882a593Smuzhiyun ret = ib_modify_qp(qp, &qp_attr, IB_QP_STATE);
933*4882a593Smuzhiyun if (ret)
934*4882a593Smuzhiyun return ret;
935*4882a593Smuzhiyun
936*4882a593Smuzhiyun qp_attr.qp_state = IB_QPS_RTS;
937*4882a593Smuzhiyun qp_attr.sq_psn = 0;
938*4882a593Smuzhiyun ret = ib_modify_qp(qp, &qp_attr, IB_QP_STATE | IB_QP_SQ_PSN);
939*4882a593Smuzhiyun
940*4882a593Smuzhiyun return ret;
941*4882a593Smuzhiyun }
942*4882a593Smuzhiyun
cma_init_conn_qp(struct rdma_id_private * id_priv,struct ib_qp * qp)943*4882a593Smuzhiyun static int cma_init_conn_qp(struct rdma_id_private *id_priv, struct ib_qp *qp)
944*4882a593Smuzhiyun {
945*4882a593Smuzhiyun struct ib_qp_attr qp_attr;
946*4882a593Smuzhiyun int qp_attr_mask, ret;
947*4882a593Smuzhiyun
948*4882a593Smuzhiyun qp_attr.qp_state = IB_QPS_INIT;
949*4882a593Smuzhiyun ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
950*4882a593Smuzhiyun if (ret)
951*4882a593Smuzhiyun return ret;
952*4882a593Smuzhiyun
953*4882a593Smuzhiyun return ib_modify_qp(qp, &qp_attr, qp_attr_mask);
954*4882a593Smuzhiyun }
955*4882a593Smuzhiyun
rdma_create_qp(struct rdma_cm_id * id,struct ib_pd * pd,struct ib_qp_init_attr * qp_init_attr)956*4882a593Smuzhiyun int rdma_create_qp(struct rdma_cm_id *id, struct ib_pd *pd,
957*4882a593Smuzhiyun struct ib_qp_init_attr *qp_init_attr)
958*4882a593Smuzhiyun {
959*4882a593Smuzhiyun struct rdma_id_private *id_priv;
960*4882a593Smuzhiyun struct ib_qp *qp;
961*4882a593Smuzhiyun int ret;
962*4882a593Smuzhiyun
963*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
964*4882a593Smuzhiyun if (id->device != pd->device) {
965*4882a593Smuzhiyun ret = -EINVAL;
966*4882a593Smuzhiyun goto out_err;
967*4882a593Smuzhiyun }
968*4882a593Smuzhiyun
969*4882a593Smuzhiyun qp_init_attr->port_num = id->port_num;
970*4882a593Smuzhiyun qp = ib_create_qp(pd, qp_init_attr);
971*4882a593Smuzhiyun if (IS_ERR(qp)) {
972*4882a593Smuzhiyun ret = PTR_ERR(qp);
973*4882a593Smuzhiyun goto out_err;
974*4882a593Smuzhiyun }
975*4882a593Smuzhiyun
976*4882a593Smuzhiyun if (id->qp_type == IB_QPT_UD)
977*4882a593Smuzhiyun ret = cma_init_ud_qp(id_priv, qp);
978*4882a593Smuzhiyun else
979*4882a593Smuzhiyun ret = cma_init_conn_qp(id_priv, qp);
980*4882a593Smuzhiyun if (ret)
981*4882a593Smuzhiyun goto out_destroy;
982*4882a593Smuzhiyun
983*4882a593Smuzhiyun id->qp = qp;
984*4882a593Smuzhiyun id_priv->qp_num = qp->qp_num;
985*4882a593Smuzhiyun id_priv->srq = (qp->srq != NULL);
986*4882a593Smuzhiyun trace_cm_qp_create(id_priv, pd, qp_init_attr, 0);
987*4882a593Smuzhiyun return 0;
988*4882a593Smuzhiyun out_destroy:
989*4882a593Smuzhiyun ib_destroy_qp(qp);
990*4882a593Smuzhiyun out_err:
991*4882a593Smuzhiyun trace_cm_qp_create(id_priv, pd, qp_init_attr, ret);
992*4882a593Smuzhiyun return ret;
993*4882a593Smuzhiyun }
994*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_create_qp);
995*4882a593Smuzhiyun
rdma_destroy_qp(struct rdma_cm_id * id)996*4882a593Smuzhiyun void rdma_destroy_qp(struct rdma_cm_id *id)
997*4882a593Smuzhiyun {
998*4882a593Smuzhiyun struct rdma_id_private *id_priv;
999*4882a593Smuzhiyun
1000*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
1001*4882a593Smuzhiyun trace_cm_qp_destroy(id_priv);
1002*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
1003*4882a593Smuzhiyun ib_destroy_qp(id_priv->id.qp);
1004*4882a593Smuzhiyun id_priv->id.qp = NULL;
1005*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
1006*4882a593Smuzhiyun }
1007*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_destroy_qp);
1008*4882a593Smuzhiyun
cma_modify_qp_rtr(struct rdma_id_private * id_priv,struct rdma_conn_param * conn_param)1009*4882a593Smuzhiyun static int cma_modify_qp_rtr(struct rdma_id_private *id_priv,
1010*4882a593Smuzhiyun struct rdma_conn_param *conn_param)
1011*4882a593Smuzhiyun {
1012*4882a593Smuzhiyun struct ib_qp_attr qp_attr;
1013*4882a593Smuzhiyun int qp_attr_mask, ret;
1014*4882a593Smuzhiyun
1015*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
1016*4882a593Smuzhiyun if (!id_priv->id.qp) {
1017*4882a593Smuzhiyun ret = 0;
1018*4882a593Smuzhiyun goto out;
1019*4882a593Smuzhiyun }
1020*4882a593Smuzhiyun
1021*4882a593Smuzhiyun /* Need to update QP attributes from default values. */
1022*4882a593Smuzhiyun qp_attr.qp_state = IB_QPS_INIT;
1023*4882a593Smuzhiyun ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
1024*4882a593Smuzhiyun if (ret)
1025*4882a593Smuzhiyun goto out;
1026*4882a593Smuzhiyun
1027*4882a593Smuzhiyun ret = ib_modify_qp(id_priv->id.qp, &qp_attr, qp_attr_mask);
1028*4882a593Smuzhiyun if (ret)
1029*4882a593Smuzhiyun goto out;
1030*4882a593Smuzhiyun
1031*4882a593Smuzhiyun qp_attr.qp_state = IB_QPS_RTR;
1032*4882a593Smuzhiyun ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
1033*4882a593Smuzhiyun if (ret)
1034*4882a593Smuzhiyun goto out;
1035*4882a593Smuzhiyun
1036*4882a593Smuzhiyun BUG_ON(id_priv->cma_dev->device != id_priv->id.device);
1037*4882a593Smuzhiyun
1038*4882a593Smuzhiyun if (conn_param)
1039*4882a593Smuzhiyun qp_attr.max_dest_rd_atomic = conn_param->responder_resources;
1040*4882a593Smuzhiyun ret = ib_modify_qp(id_priv->id.qp, &qp_attr, qp_attr_mask);
1041*4882a593Smuzhiyun out:
1042*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
1043*4882a593Smuzhiyun return ret;
1044*4882a593Smuzhiyun }
1045*4882a593Smuzhiyun
cma_modify_qp_rts(struct rdma_id_private * id_priv,struct rdma_conn_param * conn_param)1046*4882a593Smuzhiyun static int cma_modify_qp_rts(struct rdma_id_private *id_priv,
1047*4882a593Smuzhiyun struct rdma_conn_param *conn_param)
1048*4882a593Smuzhiyun {
1049*4882a593Smuzhiyun struct ib_qp_attr qp_attr;
1050*4882a593Smuzhiyun int qp_attr_mask, ret;
1051*4882a593Smuzhiyun
1052*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
1053*4882a593Smuzhiyun if (!id_priv->id.qp) {
1054*4882a593Smuzhiyun ret = 0;
1055*4882a593Smuzhiyun goto out;
1056*4882a593Smuzhiyun }
1057*4882a593Smuzhiyun
1058*4882a593Smuzhiyun qp_attr.qp_state = IB_QPS_RTS;
1059*4882a593Smuzhiyun ret = rdma_init_qp_attr(&id_priv->id, &qp_attr, &qp_attr_mask);
1060*4882a593Smuzhiyun if (ret)
1061*4882a593Smuzhiyun goto out;
1062*4882a593Smuzhiyun
1063*4882a593Smuzhiyun if (conn_param)
1064*4882a593Smuzhiyun qp_attr.max_rd_atomic = conn_param->initiator_depth;
1065*4882a593Smuzhiyun ret = ib_modify_qp(id_priv->id.qp, &qp_attr, qp_attr_mask);
1066*4882a593Smuzhiyun out:
1067*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
1068*4882a593Smuzhiyun return ret;
1069*4882a593Smuzhiyun }
1070*4882a593Smuzhiyun
cma_modify_qp_err(struct rdma_id_private * id_priv)1071*4882a593Smuzhiyun static int cma_modify_qp_err(struct rdma_id_private *id_priv)
1072*4882a593Smuzhiyun {
1073*4882a593Smuzhiyun struct ib_qp_attr qp_attr;
1074*4882a593Smuzhiyun int ret;
1075*4882a593Smuzhiyun
1076*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
1077*4882a593Smuzhiyun if (!id_priv->id.qp) {
1078*4882a593Smuzhiyun ret = 0;
1079*4882a593Smuzhiyun goto out;
1080*4882a593Smuzhiyun }
1081*4882a593Smuzhiyun
1082*4882a593Smuzhiyun qp_attr.qp_state = IB_QPS_ERR;
1083*4882a593Smuzhiyun ret = ib_modify_qp(id_priv->id.qp, &qp_attr, IB_QP_STATE);
1084*4882a593Smuzhiyun out:
1085*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
1086*4882a593Smuzhiyun return ret;
1087*4882a593Smuzhiyun }
1088*4882a593Smuzhiyun
cma_ib_init_qp_attr(struct rdma_id_private * id_priv,struct ib_qp_attr * qp_attr,int * qp_attr_mask)1089*4882a593Smuzhiyun static int cma_ib_init_qp_attr(struct rdma_id_private *id_priv,
1090*4882a593Smuzhiyun struct ib_qp_attr *qp_attr, int *qp_attr_mask)
1091*4882a593Smuzhiyun {
1092*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
1093*4882a593Smuzhiyun int ret;
1094*4882a593Smuzhiyun u16 pkey;
1095*4882a593Smuzhiyun
1096*4882a593Smuzhiyun if (rdma_cap_eth_ah(id_priv->id.device, id_priv->id.port_num))
1097*4882a593Smuzhiyun pkey = 0xffff;
1098*4882a593Smuzhiyun else
1099*4882a593Smuzhiyun pkey = ib_addr_get_pkey(dev_addr);
1100*4882a593Smuzhiyun
1101*4882a593Smuzhiyun ret = ib_find_cached_pkey(id_priv->id.device, id_priv->id.port_num,
1102*4882a593Smuzhiyun pkey, &qp_attr->pkey_index);
1103*4882a593Smuzhiyun if (ret)
1104*4882a593Smuzhiyun return ret;
1105*4882a593Smuzhiyun
1106*4882a593Smuzhiyun qp_attr->port_num = id_priv->id.port_num;
1107*4882a593Smuzhiyun *qp_attr_mask = IB_QP_STATE | IB_QP_PKEY_INDEX | IB_QP_PORT;
1108*4882a593Smuzhiyun
1109*4882a593Smuzhiyun if (id_priv->id.qp_type == IB_QPT_UD) {
1110*4882a593Smuzhiyun ret = cma_set_qkey(id_priv, 0);
1111*4882a593Smuzhiyun if (ret)
1112*4882a593Smuzhiyun return ret;
1113*4882a593Smuzhiyun
1114*4882a593Smuzhiyun qp_attr->qkey = id_priv->qkey;
1115*4882a593Smuzhiyun *qp_attr_mask |= IB_QP_QKEY;
1116*4882a593Smuzhiyun } else {
1117*4882a593Smuzhiyun qp_attr->qp_access_flags = 0;
1118*4882a593Smuzhiyun *qp_attr_mask |= IB_QP_ACCESS_FLAGS;
1119*4882a593Smuzhiyun }
1120*4882a593Smuzhiyun return 0;
1121*4882a593Smuzhiyun }
1122*4882a593Smuzhiyun
rdma_init_qp_attr(struct rdma_cm_id * id,struct ib_qp_attr * qp_attr,int * qp_attr_mask)1123*4882a593Smuzhiyun int rdma_init_qp_attr(struct rdma_cm_id *id, struct ib_qp_attr *qp_attr,
1124*4882a593Smuzhiyun int *qp_attr_mask)
1125*4882a593Smuzhiyun {
1126*4882a593Smuzhiyun struct rdma_id_private *id_priv;
1127*4882a593Smuzhiyun int ret = 0;
1128*4882a593Smuzhiyun
1129*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
1130*4882a593Smuzhiyun if (rdma_cap_ib_cm(id->device, id->port_num)) {
1131*4882a593Smuzhiyun if (!id_priv->cm_id.ib || (id_priv->id.qp_type == IB_QPT_UD))
1132*4882a593Smuzhiyun ret = cma_ib_init_qp_attr(id_priv, qp_attr, qp_attr_mask);
1133*4882a593Smuzhiyun else
1134*4882a593Smuzhiyun ret = ib_cm_init_qp_attr(id_priv->cm_id.ib, qp_attr,
1135*4882a593Smuzhiyun qp_attr_mask);
1136*4882a593Smuzhiyun
1137*4882a593Smuzhiyun if (qp_attr->qp_state == IB_QPS_RTR)
1138*4882a593Smuzhiyun qp_attr->rq_psn = id_priv->seq_num;
1139*4882a593Smuzhiyun } else if (rdma_cap_iw_cm(id->device, id->port_num)) {
1140*4882a593Smuzhiyun if (!id_priv->cm_id.iw) {
1141*4882a593Smuzhiyun qp_attr->qp_access_flags = 0;
1142*4882a593Smuzhiyun *qp_attr_mask = IB_QP_STATE | IB_QP_ACCESS_FLAGS;
1143*4882a593Smuzhiyun } else
1144*4882a593Smuzhiyun ret = iw_cm_init_qp_attr(id_priv->cm_id.iw, qp_attr,
1145*4882a593Smuzhiyun qp_attr_mask);
1146*4882a593Smuzhiyun qp_attr->port_num = id_priv->id.port_num;
1147*4882a593Smuzhiyun *qp_attr_mask |= IB_QP_PORT;
1148*4882a593Smuzhiyun } else
1149*4882a593Smuzhiyun ret = -ENOSYS;
1150*4882a593Smuzhiyun
1151*4882a593Smuzhiyun if ((*qp_attr_mask & IB_QP_TIMEOUT) && id_priv->timeout_set)
1152*4882a593Smuzhiyun qp_attr->timeout = id_priv->timeout;
1153*4882a593Smuzhiyun
1154*4882a593Smuzhiyun return ret;
1155*4882a593Smuzhiyun }
1156*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_init_qp_attr);
1157*4882a593Smuzhiyun
cma_zero_addr(const struct sockaddr * addr)1158*4882a593Smuzhiyun static inline bool cma_zero_addr(const struct sockaddr *addr)
1159*4882a593Smuzhiyun {
1160*4882a593Smuzhiyun switch (addr->sa_family) {
1161*4882a593Smuzhiyun case AF_INET:
1162*4882a593Smuzhiyun return ipv4_is_zeronet(((struct sockaddr_in *)addr)->sin_addr.s_addr);
1163*4882a593Smuzhiyun case AF_INET6:
1164*4882a593Smuzhiyun return ipv6_addr_any(&((struct sockaddr_in6 *)addr)->sin6_addr);
1165*4882a593Smuzhiyun case AF_IB:
1166*4882a593Smuzhiyun return ib_addr_any(&((struct sockaddr_ib *)addr)->sib_addr);
1167*4882a593Smuzhiyun default:
1168*4882a593Smuzhiyun return false;
1169*4882a593Smuzhiyun }
1170*4882a593Smuzhiyun }
1171*4882a593Smuzhiyun
cma_loopback_addr(const struct sockaddr * addr)1172*4882a593Smuzhiyun static inline bool cma_loopback_addr(const struct sockaddr *addr)
1173*4882a593Smuzhiyun {
1174*4882a593Smuzhiyun switch (addr->sa_family) {
1175*4882a593Smuzhiyun case AF_INET:
1176*4882a593Smuzhiyun return ipv4_is_loopback(
1177*4882a593Smuzhiyun ((struct sockaddr_in *)addr)->sin_addr.s_addr);
1178*4882a593Smuzhiyun case AF_INET6:
1179*4882a593Smuzhiyun return ipv6_addr_loopback(
1180*4882a593Smuzhiyun &((struct sockaddr_in6 *)addr)->sin6_addr);
1181*4882a593Smuzhiyun case AF_IB:
1182*4882a593Smuzhiyun return ib_addr_loopback(
1183*4882a593Smuzhiyun &((struct sockaddr_ib *)addr)->sib_addr);
1184*4882a593Smuzhiyun default:
1185*4882a593Smuzhiyun return false;
1186*4882a593Smuzhiyun }
1187*4882a593Smuzhiyun }
1188*4882a593Smuzhiyun
cma_any_addr(const struct sockaddr * addr)1189*4882a593Smuzhiyun static inline bool cma_any_addr(const struct sockaddr *addr)
1190*4882a593Smuzhiyun {
1191*4882a593Smuzhiyun return cma_zero_addr(addr) || cma_loopback_addr(addr);
1192*4882a593Smuzhiyun }
1193*4882a593Smuzhiyun
cma_addr_cmp(const struct sockaddr * src,const struct sockaddr * dst)1194*4882a593Smuzhiyun static int cma_addr_cmp(const struct sockaddr *src, const struct sockaddr *dst)
1195*4882a593Smuzhiyun {
1196*4882a593Smuzhiyun if (src->sa_family != dst->sa_family)
1197*4882a593Smuzhiyun return -1;
1198*4882a593Smuzhiyun
1199*4882a593Smuzhiyun switch (src->sa_family) {
1200*4882a593Smuzhiyun case AF_INET:
1201*4882a593Smuzhiyun return ((struct sockaddr_in *)src)->sin_addr.s_addr !=
1202*4882a593Smuzhiyun ((struct sockaddr_in *)dst)->sin_addr.s_addr;
1203*4882a593Smuzhiyun case AF_INET6: {
1204*4882a593Smuzhiyun struct sockaddr_in6 *src_addr6 = (struct sockaddr_in6 *)src;
1205*4882a593Smuzhiyun struct sockaddr_in6 *dst_addr6 = (struct sockaddr_in6 *)dst;
1206*4882a593Smuzhiyun bool link_local;
1207*4882a593Smuzhiyun
1208*4882a593Smuzhiyun if (ipv6_addr_cmp(&src_addr6->sin6_addr,
1209*4882a593Smuzhiyun &dst_addr6->sin6_addr))
1210*4882a593Smuzhiyun return 1;
1211*4882a593Smuzhiyun link_local = ipv6_addr_type(&dst_addr6->sin6_addr) &
1212*4882a593Smuzhiyun IPV6_ADDR_LINKLOCAL;
1213*4882a593Smuzhiyun /* Link local must match their scope_ids */
1214*4882a593Smuzhiyun return link_local ? (src_addr6->sin6_scope_id !=
1215*4882a593Smuzhiyun dst_addr6->sin6_scope_id) :
1216*4882a593Smuzhiyun 0;
1217*4882a593Smuzhiyun }
1218*4882a593Smuzhiyun
1219*4882a593Smuzhiyun default:
1220*4882a593Smuzhiyun return ib_addr_cmp(&((struct sockaddr_ib *) src)->sib_addr,
1221*4882a593Smuzhiyun &((struct sockaddr_ib *) dst)->sib_addr);
1222*4882a593Smuzhiyun }
1223*4882a593Smuzhiyun }
1224*4882a593Smuzhiyun
cma_port(const struct sockaddr * addr)1225*4882a593Smuzhiyun static __be16 cma_port(const struct sockaddr *addr)
1226*4882a593Smuzhiyun {
1227*4882a593Smuzhiyun struct sockaddr_ib *sib;
1228*4882a593Smuzhiyun
1229*4882a593Smuzhiyun switch (addr->sa_family) {
1230*4882a593Smuzhiyun case AF_INET:
1231*4882a593Smuzhiyun return ((struct sockaddr_in *) addr)->sin_port;
1232*4882a593Smuzhiyun case AF_INET6:
1233*4882a593Smuzhiyun return ((struct sockaddr_in6 *) addr)->sin6_port;
1234*4882a593Smuzhiyun case AF_IB:
1235*4882a593Smuzhiyun sib = (struct sockaddr_ib *) addr;
1236*4882a593Smuzhiyun return htons((u16) (be64_to_cpu(sib->sib_sid) &
1237*4882a593Smuzhiyun be64_to_cpu(sib->sib_sid_mask)));
1238*4882a593Smuzhiyun default:
1239*4882a593Smuzhiyun return 0;
1240*4882a593Smuzhiyun }
1241*4882a593Smuzhiyun }
1242*4882a593Smuzhiyun
/* Return non-zero when cma_port() reports port 0 for @addr. */
static inline int cma_any_port(const struct sockaddr *addr)
{
	return cma_port(addr) == 0;
}
1247*4882a593Smuzhiyun
cma_save_ib_info(struct sockaddr * src_addr,struct sockaddr * dst_addr,const struct rdma_cm_id * listen_id,const struct sa_path_rec * path)1248*4882a593Smuzhiyun static void cma_save_ib_info(struct sockaddr *src_addr,
1249*4882a593Smuzhiyun struct sockaddr *dst_addr,
1250*4882a593Smuzhiyun const struct rdma_cm_id *listen_id,
1251*4882a593Smuzhiyun const struct sa_path_rec *path)
1252*4882a593Smuzhiyun {
1253*4882a593Smuzhiyun struct sockaddr_ib *listen_ib, *ib;
1254*4882a593Smuzhiyun
1255*4882a593Smuzhiyun listen_ib = (struct sockaddr_ib *) &listen_id->route.addr.src_addr;
1256*4882a593Smuzhiyun if (src_addr) {
1257*4882a593Smuzhiyun ib = (struct sockaddr_ib *)src_addr;
1258*4882a593Smuzhiyun ib->sib_family = AF_IB;
1259*4882a593Smuzhiyun if (path) {
1260*4882a593Smuzhiyun ib->sib_pkey = path->pkey;
1261*4882a593Smuzhiyun ib->sib_flowinfo = path->flow_label;
1262*4882a593Smuzhiyun memcpy(&ib->sib_addr, &path->sgid, 16);
1263*4882a593Smuzhiyun ib->sib_sid = path->service_id;
1264*4882a593Smuzhiyun ib->sib_scope_id = 0;
1265*4882a593Smuzhiyun } else {
1266*4882a593Smuzhiyun ib->sib_pkey = listen_ib->sib_pkey;
1267*4882a593Smuzhiyun ib->sib_flowinfo = listen_ib->sib_flowinfo;
1268*4882a593Smuzhiyun ib->sib_addr = listen_ib->sib_addr;
1269*4882a593Smuzhiyun ib->sib_sid = listen_ib->sib_sid;
1270*4882a593Smuzhiyun ib->sib_scope_id = listen_ib->sib_scope_id;
1271*4882a593Smuzhiyun }
1272*4882a593Smuzhiyun ib->sib_sid_mask = cpu_to_be64(0xffffffffffffffffULL);
1273*4882a593Smuzhiyun }
1274*4882a593Smuzhiyun if (dst_addr) {
1275*4882a593Smuzhiyun ib = (struct sockaddr_ib *)dst_addr;
1276*4882a593Smuzhiyun ib->sib_family = AF_IB;
1277*4882a593Smuzhiyun if (path) {
1278*4882a593Smuzhiyun ib->sib_pkey = path->pkey;
1279*4882a593Smuzhiyun ib->sib_flowinfo = path->flow_label;
1280*4882a593Smuzhiyun memcpy(&ib->sib_addr, &path->dgid, 16);
1281*4882a593Smuzhiyun }
1282*4882a593Smuzhiyun }
1283*4882a593Smuzhiyun }
1284*4882a593Smuzhiyun
/*
 * Fill IPv4 addresses from a CMA header. Either output may be NULL.
 *
 * The local (@src_addr) side is the header's destination address paired
 * with @local_port; the remote (@dst_addr) side is the header's source
 * address paired with the header's port.
 */
static void cma_save_ip4_info(struct sockaddr_in *src_addr,
			      struct sockaddr_in *dst_addr,
			      struct cma_hdr *hdr,
			      __be16 local_port)
{
	if (src_addr) {
		*src_addr = (struct sockaddr_in) {
			.sin_family = AF_INET,
			.sin_port = local_port,
			.sin_addr.s_addr = hdr->dst_addr.ip4.addr,
		};
	}

	if (dst_addr) {
		*dst_addr = (struct sockaddr_in) {
			.sin_family = AF_INET,
			.sin_port = hdr->port,
			.sin_addr.s_addr = hdr->src_addr.ip4.addr,
		};
	}
}
1306*4882a593Smuzhiyun
/*
 * Fill in IPv6 socket addresses from a CMA header.
 *
 * Mirrors the IPv4 variant: the local (source) address comes from
 * hdr->dst_addr with @local_port, the remote (destination) address comes
 * from hdr->src_addr with hdr->port.  Either output pointer may be NULL.
 * Fields not set explicitly (flow info, scope id) are zeroed.
 */
static void cma_save_ip6_info(struct sockaddr_in6 *src_addr,
			      struct sockaddr_in6 *dst_addr,
			      struct cma_hdr *hdr,
			      __be16 local_port)
{
	if (src_addr) {
		memset(src_addr, 0, sizeof(*src_addr));
		src_addr->sin6_family = AF_INET6;
		src_addr->sin6_port = local_port;
		src_addr->sin6_addr = hdr->dst_addr.ip6;
	}

	if (dst_addr) {
		memset(dst_addr, 0, sizeof(*dst_addr));
		dst_addr->sin6_family = AF_INET6;
		dst_addr->sin6_port = hdr->port;
		dst_addr->sin6_addr = hdr->src_addr.ip6;
	}
}
1328*4882a593Smuzhiyun
cma_port_from_service_id(__be64 service_id)1329*4882a593Smuzhiyun static u16 cma_port_from_service_id(__be64 service_id)
1330*4882a593Smuzhiyun {
1331*4882a593Smuzhiyun return (u16)be64_to_cpu(service_id);
1332*4882a593Smuzhiyun }
1333*4882a593Smuzhiyun
/*
 * Decode the CMA header carried in the event's private data into IP socket
 * addresses.
 *
 * Returns 0 on success, -EINVAL if the header's CMA version does not match
 * CMA_VERSION, or -EAFNOSUPPORT if the header's IP version is neither 4
 * nor 6.  The local port is derived from @service_id.
 */
static int cma_save_ip_info(struct sockaddr *src_addr,
			    struct sockaddr *dst_addr,
			    const struct ib_cm_event *ib_event,
			    __be64 service_id)
{
	struct cma_hdr *hdr = ib_event->private_data;
	__be16 local_port;
	int ip_ver;

	if (hdr->cma_version != CMA_VERSION)
		return -EINVAL;

	local_port = htons(cma_port_from_service_id(service_id));
	ip_ver = cma_get_ip_ver(hdr);

	if (ip_ver == 4) {
		cma_save_ip4_info((struct sockaddr_in *)src_addr,
				  (struct sockaddr_in *)dst_addr,
				  hdr, local_port);
		return 0;
	}

	if (ip_ver == 6) {
		cma_save_ip6_info((struct sockaddr_in6 *)src_addr,
				  (struct sockaddr_in6 *)dst_addr,
				  hdr, local_port);
		return 0;
	}

	return -EAFNOSUPPORT;
}
1363*4882a593Smuzhiyun
/*
 * Save source/destination addresses for an incoming request.
 *
 * For AF_IB the addresses are built by cma_save_ib_info(): from the primary
 * path for a REQ, or with no path for a SIDR REQ; other events leave the
 * addresses untouched.  AF_IB always returns 0.  Every other family is
 * handled by cma_save_ip_info() and its result is returned.
 */
static int cma_save_net_info(struct sockaddr *src_addr,
			     struct sockaddr *dst_addr,
			     const struct rdma_cm_id *listen_id,
			     const struct ib_cm_event *ib_event,
			     sa_family_t sa_family, __be64 service_id)
{
	if (sa_family != AF_IB)
		return cma_save_ip_info(src_addr, dst_addr, ib_event,
					service_id);

	switch (ib_event->event) {
	case IB_CM_REQ_RECEIVED:
		cma_save_ib_info(src_addr, dst_addr, listen_id,
				 ib_event->param.req_rcvd.primary_path);
		break;
	case IB_CM_SIDR_REQ_RECEIVED:
		cma_save_ib_info(src_addr, dst_addr, listen_id, NULL);
		break;
	default:
		break;
	}

	return 0;
}
1381*4882a593Smuzhiyun
cma_save_req_info(const struct ib_cm_event * ib_event,struct cma_req_info * req)1382*4882a593Smuzhiyun static int cma_save_req_info(const struct ib_cm_event *ib_event,
1383*4882a593Smuzhiyun struct cma_req_info *req)
1384*4882a593Smuzhiyun {
1385*4882a593Smuzhiyun const struct ib_cm_req_event_param *req_param =
1386*4882a593Smuzhiyun &ib_event->param.req_rcvd;
1387*4882a593Smuzhiyun const struct ib_cm_sidr_req_event_param *sidr_param =
1388*4882a593Smuzhiyun &ib_event->param.sidr_req_rcvd;
1389*4882a593Smuzhiyun
1390*4882a593Smuzhiyun switch (ib_event->event) {
1391*4882a593Smuzhiyun case IB_CM_REQ_RECEIVED:
1392*4882a593Smuzhiyun req->device = req_param->listen_id->device;
1393*4882a593Smuzhiyun req->port = req_param->port;
1394*4882a593Smuzhiyun memcpy(&req->local_gid, &req_param->primary_path->sgid,
1395*4882a593Smuzhiyun sizeof(req->local_gid));
1396*4882a593Smuzhiyun req->has_gid = true;
1397*4882a593Smuzhiyun req->service_id = req_param->primary_path->service_id;
1398*4882a593Smuzhiyun req->pkey = be16_to_cpu(req_param->primary_path->pkey);
1399*4882a593Smuzhiyun if (req->pkey != req_param->bth_pkey)
1400*4882a593Smuzhiyun pr_warn_ratelimited("RDMA CMA: got different BTH P_Key (0x%x) and primary path P_Key (0x%x)\n"
1401*4882a593Smuzhiyun "RDMA CMA: in the future this may cause the request to be dropped\n",
1402*4882a593Smuzhiyun req_param->bth_pkey, req->pkey);
1403*4882a593Smuzhiyun break;
1404*4882a593Smuzhiyun case IB_CM_SIDR_REQ_RECEIVED:
1405*4882a593Smuzhiyun req->device = sidr_param->listen_id->device;
1406*4882a593Smuzhiyun req->port = sidr_param->port;
1407*4882a593Smuzhiyun req->has_gid = false;
1408*4882a593Smuzhiyun req->service_id = sidr_param->service_id;
1409*4882a593Smuzhiyun req->pkey = sidr_param->pkey;
1410*4882a593Smuzhiyun if (req->pkey != sidr_param->bth_pkey)
1411*4882a593Smuzhiyun pr_warn_ratelimited("RDMA CMA: got different BTH P_Key (0x%x) and SIDR request payload P_Key (0x%x)\n"
1412*4882a593Smuzhiyun "RDMA CMA: in the future this may cause the request to be dropped\n",
1413*4882a593Smuzhiyun sidr_param->bth_pkey, req->pkey);
1414*4882a593Smuzhiyun break;
1415*4882a593Smuzhiyun default:
1416*4882a593Smuzhiyun return -EINVAL;
1417*4882a593Smuzhiyun }
1418*4882a593Smuzhiyun
1419*4882a593Smuzhiyun return 0;
1420*4882a593Smuzhiyun }
1421*4882a593Smuzhiyun
validate_ipv4_net_dev(struct net_device * net_dev,const struct sockaddr_in * dst_addr,const struct sockaddr_in * src_addr)1422*4882a593Smuzhiyun static bool validate_ipv4_net_dev(struct net_device *net_dev,
1423*4882a593Smuzhiyun const struct sockaddr_in *dst_addr,
1424*4882a593Smuzhiyun const struct sockaddr_in *src_addr)
1425*4882a593Smuzhiyun {
1426*4882a593Smuzhiyun __be32 daddr = dst_addr->sin_addr.s_addr,
1427*4882a593Smuzhiyun saddr = src_addr->sin_addr.s_addr;
1428*4882a593Smuzhiyun struct fib_result res;
1429*4882a593Smuzhiyun struct flowi4 fl4;
1430*4882a593Smuzhiyun int err;
1431*4882a593Smuzhiyun bool ret;
1432*4882a593Smuzhiyun
1433*4882a593Smuzhiyun if (ipv4_is_multicast(saddr) || ipv4_is_lbcast(saddr) ||
1434*4882a593Smuzhiyun ipv4_is_lbcast(daddr) || ipv4_is_zeronet(saddr) ||
1435*4882a593Smuzhiyun ipv4_is_zeronet(daddr) || ipv4_is_loopback(daddr) ||
1436*4882a593Smuzhiyun ipv4_is_loopback(saddr))
1437*4882a593Smuzhiyun return false;
1438*4882a593Smuzhiyun
1439*4882a593Smuzhiyun memset(&fl4, 0, sizeof(fl4));
1440*4882a593Smuzhiyun fl4.flowi4_oif = net_dev->ifindex;
1441*4882a593Smuzhiyun fl4.daddr = daddr;
1442*4882a593Smuzhiyun fl4.saddr = saddr;
1443*4882a593Smuzhiyun
1444*4882a593Smuzhiyun rcu_read_lock();
1445*4882a593Smuzhiyun err = fib_lookup(dev_net(net_dev), &fl4, &res, 0);
1446*4882a593Smuzhiyun ret = err == 0 && FIB_RES_DEV(res) == net_dev;
1447*4882a593Smuzhiyun rcu_read_unlock();
1448*4882a593Smuzhiyun
1449*4882a593Smuzhiyun return ret;
1450*4882a593Smuzhiyun }
1451*4882a593Smuzhiyun
validate_ipv6_net_dev(struct net_device * net_dev,const struct sockaddr_in6 * dst_addr,const struct sockaddr_in6 * src_addr)1452*4882a593Smuzhiyun static bool validate_ipv6_net_dev(struct net_device *net_dev,
1453*4882a593Smuzhiyun const struct sockaddr_in6 *dst_addr,
1454*4882a593Smuzhiyun const struct sockaddr_in6 *src_addr)
1455*4882a593Smuzhiyun {
1456*4882a593Smuzhiyun #if IS_ENABLED(CONFIG_IPV6)
1457*4882a593Smuzhiyun const int strict = ipv6_addr_type(&dst_addr->sin6_addr) &
1458*4882a593Smuzhiyun IPV6_ADDR_LINKLOCAL;
1459*4882a593Smuzhiyun struct rt6_info *rt = rt6_lookup(dev_net(net_dev), &dst_addr->sin6_addr,
1460*4882a593Smuzhiyun &src_addr->sin6_addr, net_dev->ifindex,
1461*4882a593Smuzhiyun NULL, strict);
1462*4882a593Smuzhiyun bool ret;
1463*4882a593Smuzhiyun
1464*4882a593Smuzhiyun if (!rt)
1465*4882a593Smuzhiyun return false;
1466*4882a593Smuzhiyun
1467*4882a593Smuzhiyun ret = rt->rt6i_idev->dev == net_dev;
1468*4882a593Smuzhiyun ip6_rt_put(rt);
1469*4882a593Smuzhiyun
1470*4882a593Smuzhiyun return ret;
1471*4882a593Smuzhiyun #else
1472*4882a593Smuzhiyun return false;
1473*4882a593Smuzhiyun #endif
1474*4882a593Smuzhiyun }
1475*4882a593Smuzhiyun
validate_net_dev(struct net_device * net_dev,const struct sockaddr * daddr,const struct sockaddr * saddr)1476*4882a593Smuzhiyun static bool validate_net_dev(struct net_device *net_dev,
1477*4882a593Smuzhiyun const struct sockaddr *daddr,
1478*4882a593Smuzhiyun const struct sockaddr *saddr)
1479*4882a593Smuzhiyun {
1480*4882a593Smuzhiyun const struct sockaddr_in *daddr4 = (const struct sockaddr_in *)daddr;
1481*4882a593Smuzhiyun const struct sockaddr_in *saddr4 = (const struct sockaddr_in *)saddr;
1482*4882a593Smuzhiyun const struct sockaddr_in6 *daddr6 = (const struct sockaddr_in6 *)daddr;
1483*4882a593Smuzhiyun const struct sockaddr_in6 *saddr6 = (const struct sockaddr_in6 *)saddr;
1484*4882a593Smuzhiyun
1485*4882a593Smuzhiyun switch (daddr->sa_family) {
1486*4882a593Smuzhiyun case AF_INET:
1487*4882a593Smuzhiyun return saddr->sa_family == AF_INET &&
1488*4882a593Smuzhiyun validate_ipv4_net_dev(net_dev, daddr4, saddr4);
1489*4882a593Smuzhiyun
1490*4882a593Smuzhiyun case AF_INET6:
1491*4882a593Smuzhiyun return saddr->sa_family == AF_INET6 &&
1492*4882a593Smuzhiyun validate_ipv6_net_dev(net_dev, daddr6, saddr6);
1493*4882a593Smuzhiyun
1494*4882a593Smuzhiyun default:
1495*4882a593Smuzhiyun return false;
1496*4882a593Smuzhiyun }
1497*4882a593Smuzhiyun }
1498*4882a593Smuzhiyun
1499*4882a593Smuzhiyun static struct net_device *
roce_get_net_dev_by_cm_event(const struct ib_cm_event * ib_event)1500*4882a593Smuzhiyun roce_get_net_dev_by_cm_event(const struct ib_cm_event *ib_event)
1501*4882a593Smuzhiyun {
1502*4882a593Smuzhiyun const struct ib_gid_attr *sgid_attr = NULL;
1503*4882a593Smuzhiyun struct net_device *ndev;
1504*4882a593Smuzhiyun
1505*4882a593Smuzhiyun if (ib_event->event == IB_CM_REQ_RECEIVED)
1506*4882a593Smuzhiyun sgid_attr = ib_event->param.req_rcvd.ppath_sgid_attr;
1507*4882a593Smuzhiyun else if (ib_event->event == IB_CM_SIDR_REQ_RECEIVED)
1508*4882a593Smuzhiyun sgid_attr = ib_event->param.sidr_req_rcvd.sgid_attr;
1509*4882a593Smuzhiyun
1510*4882a593Smuzhiyun if (!sgid_attr)
1511*4882a593Smuzhiyun return NULL;
1512*4882a593Smuzhiyun
1513*4882a593Smuzhiyun rcu_read_lock();
1514*4882a593Smuzhiyun ndev = rdma_read_gid_attr_ndev_rcu(sgid_attr);
1515*4882a593Smuzhiyun if (IS_ERR(ndev))
1516*4882a593Smuzhiyun ndev = NULL;
1517*4882a593Smuzhiyun else
1518*4882a593Smuzhiyun dev_hold(ndev);
1519*4882a593Smuzhiyun rcu_read_unlock();
1520*4882a593Smuzhiyun return ndev;
1521*4882a593Smuzhiyun }
1522*4882a593Smuzhiyun
cma_get_net_dev(const struct ib_cm_event * ib_event,struct cma_req_info * req)1523*4882a593Smuzhiyun static struct net_device *cma_get_net_dev(const struct ib_cm_event *ib_event,
1524*4882a593Smuzhiyun struct cma_req_info *req)
1525*4882a593Smuzhiyun {
1526*4882a593Smuzhiyun struct sockaddr *listen_addr =
1527*4882a593Smuzhiyun (struct sockaddr *)&req->listen_addr_storage;
1528*4882a593Smuzhiyun struct sockaddr *src_addr = (struct sockaddr *)&req->src_addr_storage;
1529*4882a593Smuzhiyun struct net_device *net_dev;
1530*4882a593Smuzhiyun const union ib_gid *gid = req->has_gid ? &req->local_gid : NULL;
1531*4882a593Smuzhiyun int err;
1532*4882a593Smuzhiyun
1533*4882a593Smuzhiyun err = cma_save_ip_info(listen_addr, src_addr, ib_event,
1534*4882a593Smuzhiyun req->service_id);
1535*4882a593Smuzhiyun if (err)
1536*4882a593Smuzhiyun return ERR_PTR(err);
1537*4882a593Smuzhiyun
1538*4882a593Smuzhiyun if (rdma_protocol_roce(req->device, req->port))
1539*4882a593Smuzhiyun net_dev = roce_get_net_dev_by_cm_event(ib_event);
1540*4882a593Smuzhiyun else
1541*4882a593Smuzhiyun net_dev = ib_get_net_dev_by_params(req->device, req->port,
1542*4882a593Smuzhiyun req->pkey,
1543*4882a593Smuzhiyun gid, listen_addr);
1544*4882a593Smuzhiyun if (!net_dev)
1545*4882a593Smuzhiyun return ERR_PTR(-ENODEV);
1546*4882a593Smuzhiyun
1547*4882a593Smuzhiyun return net_dev;
1548*4882a593Smuzhiyun }
1549*4882a593Smuzhiyun
/* Return bits 16..31 of the host-order service ID as the port space. */
static enum rdma_ucm_port_space rdma_ps_from_service_id(__be64 service_id)
{
	u64 sid = be64_to_cpu(service_id);

	return (sid >> 16) & 0xffff;
}
1554*4882a593Smuzhiyun
cma_match_private_data(struct rdma_id_private * id_priv,const struct cma_hdr * hdr)1555*4882a593Smuzhiyun static bool cma_match_private_data(struct rdma_id_private *id_priv,
1556*4882a593Smuzhiyun const struct cma_hdr *hdr)
1557*4882a593Smuzhiyun {
1558*4882a593Smuzhiyun struct sockaddr *addr = cma_src_addr(id_priv);
1559*4882a593Smuzhiyun __be32 ip4_addr;
1560*4882a593Smuzhiyun struct in6_addr ip6_addr;
1561*4882a593Smuzhiyun
1562*4882a593Smuzhiyun if (cma_any_addr(addr) && !id_priv->afonly)
1563*4882a593Smuzhiyun return true;
1564*4882a593Smuzhiyun
1565*4882a593Smuzhiyun switch (addr->sa_family) {
1566*4882a593Smuzhiyun case AF_INET:
1567*4882a593Smuzhiyun ip4_addr = ((struct sockaddr_in *)addr)->sin_addr.s_addr;
1568*4882a593Smuzhiyun if (cma_get_ip_ver(hdr) != 4)
1569*4882a593Smuzhiyun return false;
1570*4882a593Smuzhiyun if (!cma_any_addr(addr) &&
1571*4882a593Smuzhiyun hdr->dst_addr.ip4.addr != ip4_addr)
1572*4882a593Smuzhiyun return false;
1573*4882a593Smuzhiyun break;
1574*4882a593Smuzhiyun case AF_INET6:
1575*4882a593Smuzhiyun ip6_addr = ((struct sockaddr_in6 *)addr)->sin6_addr;
1576*4882a593Smuzhiyun if (cma_get_ip_ver(hdr) != 6)
1577*4882a593Smuzhiyun return false;
1578*4882a593Smuzhiyun if (!cma_any_addr(addr) &&
1579*4882a593Smuzhiyun memcmp(&hdr->dst_addr.ip6, &ip6_addr, sizeof(ip6_addr)))
1580*4882a593Smuzhiyun return false;
1581*4882a593Smuzhiyun break;
1582*4882a593Smuzhiyun case AF_IB:
1583*4882a593Smuzhiyun return true;
1584*4882a593Smuzhiyun default:
1585*4882a593Smuzhiyun return false;
1586*4882a593Smuzhiyun }
1587*4882a593Smuzhiyun
1588*4882a593Smuzhiyun return true;
1589*4882a593Smuzhiyun }
1590*4882a593Smuzhiyun
cma_protocol_roce(const struct rdma_cm_id * id)1591*4882a593Smuzhiyun static bool cma_protocol_roce(const struct rdma_cm_id *id)
1592*4882a593Smuzhiyun {
1593*4882a593Smuzhiyun struct ib_device *device = id->device;
1594*4882a593Smuzhiyun const int port_num = id->port_num ?: rdma_start_port(device);
1595*4882a593Smuzhiyun
1596*4882a593Smuzhiyun return rdma_protocol_roce(device, port_num);
1597*4882a593Smuzhiyun }
1598*4882a593Smuzhiyun
cma_is_req_ipv6_ll(const struct cma_req_info * req)1599*4882a593Smuzhiyun static bool cma_is_req_ipv6_ll(const struct cma_req_info *req)
1600*4882a593Smuzhiyun {
1601*4882a593Smuzhiyun const struct sockaddr *daddr =
1602*4882a593Smuzhiyun (const struct sockaddr *)&req->listen_addr_storage;
1603*4882a593Smuzhiyun const struct sockaddr_in6 *daddr6 = (const struct sockaddr_in6 *)daddr;
1604*4882a593Smuzhiyun
1605*4882a593Smuzhiyun /* Returns true if the req is for IPv6 link local */
1606*4882a593Smuzhiyun return (daddr->sa_family == AF_INET6 &&
1607*4882a593Smuzhiyun (ipv6_addr_type(&daddr6->sin6_addr) & IPV6_ADDR_LINKLOCAL));
1608*4882a593Smuzhiyun }
1609*4882a593Smuzhiyun
cma_match_net_dev(const struct rdma_cm_id * id,const struct net_device * net_dev,const struct cma_req_info * req)1610*4882a593Smuzhiyun static bool cma_match_net_dev(const struct rdma_cm_id *id,
1611*4882a593Smuzhiyun const struct net_device *net_dev,
1612*4882a593Smuzhiyun const struct cma_req_info *req)
1613*4882a593Smuzhiyun {
1614*4882a593Smuzhiyun const struct rdma_addr *addr = &id->route.addr;
1615*4882a593Smuzhiyun
1616*4882a593Smuzhiyun if (!net_dev)
1617*4882a593Smuzhiyun /* This request is an AF_IB request */
1618*4882a593Smuzhiyun return (!id->port_num || id->port_num == req->port) &&
1619*4882a593Smuzhiyun (addr->src_addr.ss_family == AF_IB);
1620*4882a593Smuzhiyun
1621*4882a593Smuzhiyun /*
1622*4882a593Smuzhiyun * If the request is not for IPv6 link local, allow matching
1623*4882a593Smuzhiyun * request to any netdevice of the one or multiport rdma device.
1624*4882a593Smuzhiyun */
1625*4882a593Smuzhiyun if (!cma_is_req_ipv6_ll(req))
1626*4882a593Smuzhiyun return true;
1627*4882a593Smuzhiyun /*
1628*4882a593Smuzhiyun * Net namespaces must match, and if the listner is listening
1629*4882a593Smuzhiyun * on a specific netdevice than netdevice must match as well.
1630*4882a593Smuzhiyun */
1631*4882a593Smuzhiyun if (net_eq(dev_net(net_dev), addr->dev_addr.net) &&
1632*4882a593Smuzhiyun (!!addr->dev_addr.bound_dev_if ==
1633*4882a593Smuzhiyun (addr->dev_addr.bound_dev_if == net_dev->ifindex)))
1634*4882a593Smuzhiyun return true;
1635*4882a593Smuzhiyun else
1636*4882a593Smuzhiyun return false;
1637*4882a593Smuzhiyun }
1638*4882a593Smuzhiyun
cma_find_listener(const struct rdma_bind_list * bind_list,const struct ib_cm_id * cm_id,const struct ib_cm_event * ib_event,const struct cma_req_info * req,const struct net_device * net_dev)1639*4882a593Smuzhiyun static struct rdma_id_private *cma_find_listener(
1640*4882a593Smuzhiyun const struct rdma_bind_list *bind_list,
1641*4882a593Smuzhiyun const struct ib_cm_id *cm_id,
1642*4882a593Smuzhiyun const struct ib_cm_event *ib_event,
1643*4882a593Smuzhiyun const struct cma_req_info *req,
1644*4882a593Smuzhiyun const struct net_device *net_dev)
1645*4882a593Smuzhiyun {
1646*4882a593Smuzhiyun struct rdma_id_private *id_priv, *id_priv_dev;
1647*4882a593Smuzhiyun
1648*4882a593Smuzhiyun lockdep_assert_held(&lock);
1649*4882a593Smuzhiyun
1650*4882a593Smuzhiyun if (!bind_list)
1651*4882a593Smuzhiyun return ERR_PTR(-EINVAL);
1652*4882a593Smuzhiyun
1653*4882a593Smuzhiyun hlist_for_each_entry(id_priv, &bind_list->owners, node) {
1654*4882a593Smuzhiyun if (cma_match_private_data(id_priv, ib_event->private_data)) {
1655*4882a593Smuzhiyun if (id_priv->id.device == cm_id->device &&
1656*4882a593Smuzhiyun cma_match_net_dev(&id_priv->id, net_dev, req))
1657*4882a593Smuzhiyun return id_priv;
1658*4882a593Smuzhiyun list_for_each_entry(id_priv_dev,
1659*4882a593Smuzhiyun &id_priv->listen_list,
1660*4882a593Smuzhiyun listen_list) {
1661*4882a593Smuzhiyun if (id_priv_dev->id.device == cm_id->device &&
1662*4882a593Smuzhiyun cma_match_net_dev(&id_priv_dev->id,
1663*4882a593Smuzhiyun net_dev, req))
1664*4882a593Smuzhiyun return id_priv_dev;
1665*4882a593Smuzhiyun }
1666*4882a593Smuzhiyun }
1667*4882a593Smuzhiyun }
1668*4882a593Smuzhiyun
1669*4882a593Smuzhiyun return ERR_PTR(-EINVAL);
1670*4882a593Smuzhiyun }
1671*4882a593Smuzhiyun
1672*4882a593Smuzhiyun static struct rdma_id_private *
cma_ib_id_from_event(struct ib_cm_id * cm_id,const struct ib_cm_event * ib_event,struct cma_req_info * req,struct net_device ** net_dev)1673*4882a593Smuzhiyun cma_ib_id_from_event(struct ib_cm_id *cm_id,
1674*4882a593Smuzhiyun const struct ib_cm_event *ib_event,
1675*4882a593Smuzhiyun struct cma_req_info *req,
1676*4882a593Smuzhiyun struct net_device **net_dev)
1677*4882a593Smuzhiyun {
1678*4882a593Smuzhiyun struct rdma_bind_list *bind_list;
1679*4882a593Smuzhiyun struct rdma_id_private *id_priv;
1680*4882a593Smuzhiyun int err;
1681*4882a593Smuzhiyun
1682*4882a593Smuzhiyun err = cma_save_req_info(ib_event, req);
1683*4882a593Smuzhiyun if (err)
1684*4882a593Smuzhiyun return ERR_PTR(err);
1685*4882a593Smuzhiyun
1686*4882a593Smuzhiyun *net_dev = cma_get_net_dev(ib_event, req);
1687*4882a593Smuzhiyun if (IS_ERR(*net_dev)) {
1688*4882a593Smuzhiyun if (PTR_ERR(*net_dev) == -EAFNOSUPPORT) {
1689*4882a593Smuzhiyun /* Assuming the protocol is AF_IB */
1690*4882a593Smuzhiyun *net_dev = NULL;
1691*4882a593Smuzhiyun } else {
1692*4882a593Smuzhiyun return ERR_CAST(*net_dev);
1693*4882a593Smuzhiyun }
1694*4882a593Smuzhiyun }
1695*4882a593Smuzhiyun
1696*4882a593Smuzhiyun mutex_lock(&lock);
1697*4882a593Smuzhiyun /*
1698*4882a593Smuzhiyun * Net namespace might be getting deleted while route lookup,
1699*4882a593Smuzhiyun * cm_id lookup is in progress. Therefore, perform netdevice
1700*4882a593Smuzhiyun * validation, cm_id lookup under rcu lock.
1701*4882a593Smuzhiyun * RCU lock along with netdevice state check, synchronizes with
1702*4882a593Smuzhiyun * netdevice migrating to different net namespace and also avoids
1703*4882a593Smuzhiyun * case where net namespace doesn't get deleted while lookup is in
1704*4882a593Smuzhiyun * progress.
1705*4882a593Smuzhiyun * If the device state is not IFF_UP, its properties such as ifindex
1706*4882a593Smuzhiyun * and nd_net cannot be trusted to remain valid without rcu lock.
1707*4882a593Smuzhiyun * net/core/dev.c change_net_namespace() ensures to synchronize with
1708*4882a593Smuzhiyun * ongoing operations on net device after device is closed using
1709*4882a593Smuzhiyun * synchronize_net().
1710*4882a593Smuzhiyun */
1711*4882a593Smuzhiyun rcu_read_lock();
1712*4882a593Smuzhiyun if (*net_dev) {
1713*4882a593Smuzhiyun /*
1714*4882a593Smuzhiyun * If netdevice is down, it is likely that it is administratively
1715*4882a593Smuzhiyun * down or it might be migrating to different namespace.
1716*4882a593Smuzhiyun * In that case avoid further processing, as the net namespace
1717*4882a593Smuzhiyun * or ifindex may change.
1718*4882a593Smuzhiyun */
1719*4882a593Smuzhiyun if (((*net_dev)->flags & IFF_UP) == 0) {
1720*4882a593Smuzhiyun id_priv = ERR_PTR(-EHOSTUNREACH);
1721*4882a593Smuzhiyun goto err;
1722*4882a593Smuzhiyun }
1723*4882a593Smuzhiyun
1724*4882a593Smuzhiyun if (!validate_net_dev(*net_dev,
1725*4882a593Smuzhiyun (struct sockaddr *)&req->src_addr_storage,
1726*4882a593Smuzhiyun (struct sockaddr *)&req->listen_addr_storage)) {
1727*4882a593Smuzhiyun id_priv = ERR_PTR(-EHOSTUNREACH);
1728*4882a593Smuzhiyun goto err;
1729*4882a593Smuzhiyun }
1730*4882a593Smuzhiyun }
1731*4882a593Smuzhiyun
1732*4882a593Smuzhiyun bind_list = cma_ps_find(*net_dev ? dev_net(*net_dev) : &init_net,
1733*4882a593Smuzhiyun rdma_ps_from_service_id(req->service_id),
1734*4882a593Smuzhiyun cma_port_from_service_id(req->service_id));
1735*4882a593Smuzhiyun id_priv = cma_find_listener(bind_list, cm_id, ib_event, req, *net_dev);
1736*4882a593Smuzhiyun err:
1737*4882a593Smuzhiyun rcu_read_unlock();
1738*4882a593Smuzhiyun mutex_unlock(&lock);
1739*4882a593Smuzhiyun if (IS_ERR(id_priv) && *net_dev) {
1740*4882a593Smuzhiyun dev_put(*net_dev);
1741*4882a593Smuzhiyun *net_dev = NULL;
1742*4882a593Smuzhiyun }
1743*4882a593Smuzhiyun return id_priv;
1744*4882a593Smuzhiyun }
1745*4882a593Smuzhiyun
cma_user_data_offset(struct rdma_id_private * id_priv)1746*4882a593Smuzhiyun static inline u8 cma_user_data_offset(struct rdma_id_private *id_priv)
1747*4882a593Smuzhiyun {
1748*4882a593Smuzhiyun return cma_family(id_priv) == AF_IB ? 0 : sizeof(struct cma_hdr);
1749*4882a593Smuzhiyun }
1750*4882a593Smuzhiyun
cma_cancel_route(struct rdma_id_private * id_priv)1751*4882a593Smuzhiyun static void cma_cancel_route(struct rdma_id_private *id_priv)
1752*4882a593Smuzhiyun {
1753*4882a593Smuzhiyun if (rdma_cap_ib_sa(id_priv->id.device, id_priv->id.port_num)) {
1754*4882a593Smuzhiyun if (id_priv->query)
1755*4882a593Smuzhiyun ib_sa_cancel_query(id_priv->query_id, id_priv->query);
1756*4882a593Smuzhiyun }
1757*4882a593Smuzhiyun }
1758*4882a593Smuzhiyun
_cma_cancel_listens(struct rdma_id_private * id_priv)1759*4882a593Smuzhiyun static void _cma_cancel_listens(struct rdma_id_private *id_priv)
1760*4882a593Smuzhiyun {
1761*4882a593Smuzhiyun struct rdma_id_private *dev_id_priv;
1762*4882a593Smuzhiyun
1763*4882a593Smuzhiyun lockdep_assert_held(&lock);
1764*4882a593Smuzhiyun
1765*4882a593Smuzhiyun /*
1766*4882a593Smuzhiyun * Remove from listen_any_list to prevent added devices from spawning
1767*4882a593Smuzhiyun * additional listen requests.
1768*4882a593Smuzhiyun */
1769*4882a593Smuzhiyun list_del(&id_priv->list);
1770*4882a593Smuzhiyun
1771*4882a593Smuzhiyun while (!list_empty(&id_priv->listen_list)) {
1772*4882a593Smuzhiyun dev_id_priv = list_entry(id_priv->listen_list.next,
1773*4882a593Smuzhiyun struct rdma_id_private, listen_list);
1774*4882a593Smuzhiyun /* sync with device removal to avoid duplicate destruction */
1775*4882a593Smuzhiyun list_del_init(&dev_id_priv->list);
1776*4882a593Smuzhiyun list_del(&dev_id_priv->listen_list);
1777*4882a593Smuzhiyun mutex_unlock(&lock);
1778*4882a593Smuzhiyun
1779*4882a593Smuzhiyun rdma_destroy_id(&dev_id_priv->id);
1780*4882a593Smuzhiyun mutex_lock(&lock);
1781*4882a593Smuzhiyun }
1782*4882a593Smuzhiyun }
1783*4882a593Smuzhiyun
cma_cancel_listens(struct rdma_id_private * id_priv)1784*4882a593Smuzhiyun static void cma_cancel_listens(struct rdma_id_private *id_priv)
1785*4882a593Smuzhiyun {
1786*4882a593Smuzhiyun mutex_lock(&lock);
1787*4882a593Smuzhiyun _cma_cancel_listens(id_priv);
1788*4882a593Smuzhiyun mutex_unlock(&lock);
1789*4882a593Smuzhiyun }
1790*4882a593Smuzhiyun
cma_cancel_operation(struct rdma_id_private * id_priv,enum rdma_cm_state state)1791*4882a593Smuzhiyun static void cma_cancel_operation(struct rdma_id_private *id_priv,
1792*4882a593Smuzhiyun enum rdma_cm_state state)
1793*4882a593Smuzhiyun {
1794*4882a593Smuzhiyun switch (state) {
1795*4882a593Smuzhiyun case RDMA_CM_ADDR_QUERY:
1796*4882a593Smuzhiyun rdma_addr_cancel(&id_priv->id.route.addr.dev_addr);
1797*4882a593Smuzhiyun break;
1798*4882a593Smuzhiyun case RDMA_CM_ROUTE_QUERY:
1799*4882a593Smuzhiyun cma_cancel_route(id_priv);
1800*4882a593Smuzhiyun break;
1801*4882a593Smuzhiyun case RDMA_CM_LISTEN:
1802*4882a593Smuzhiyun if (cma_any_addr(cma_src_addr(id_priv)) && !id_priv->cma_dev)
1803*4882a593Smuzhiyun cma_cancel_listens(id_priv);
1804*4882a593Smuzhiyun break;
1805*4882a593Smuzhiyun default:
1806*4882a593Smuzhiyun break;
1807*4882a593Smuzhiyun }
1808*4882a593Smuzhiyun }
1809*4882a593Smuzhiyun
cma_release_port(struct rdma_id_private * id_priv)1810*4882a593Smuzhiyun static void cma_release_port(struct rdma_id_private *id_priv)
1811*4882a593Smuzhiyun {
1812*4882a593Smuzhiyun struct rdma_bind_list *bind_list = id_priv->bind_list;
1813*4882a593Smuzhiyun struct net *net = id_priv->id.route.addr.dev_addr.net;
1814*4882a593Smuzhiyun
1815*4882a593Smuzhiyun if (!bind_list)
1816*4882a593Smuzhiyun return;
1817*4882a593Smuzhiyun
1818*4882a593Smuzhiyun mutex_lock(&lock);
1819*4882a593Smuzhiyun hlist_del(&id_priv->node);
1820*4882a593Smuzhiyun if (hlist_empty(&bind_list->owners)) {
1821*4882a593Smuzhiyun cma_ps_remove(net, bind_list->ps, bind_list->port);
1822*4882a593Smuzhiyun kfree(bind_list);
1823*4882a593Smuzhiyun }
1824*4882a593Smuzhiyun mutex_unlock(&lock);
1825*4882a593Smuzhiyun }
1826*4882a593Smuzhiyun
destroy_mc(struct rdma_id_private * id_priv,struct cma_multicast * mc)1827*4882a593Smuzhiyun static void destroy_mc(struct rdma_id_private *id_priv,
1828*4882a593Smuzhiyun struct cma_multicast *mc)
1829*4882a593Smuzhiyun {
1830*4882a593Smuzhiyun bool send_only = mc->join_state == BIT(SENDONLY_FULLMEMBER_JOIN);
1831*4882a593Smuzhiyun
1832*4882a593Smuzhiyun if (rdma_cap_ib_mcast(id_priv->id.device, id_priv->id.port_num))
1833*4882a593Smuzhiyun ib_sa_free_multicast(mc->sa_mc);
1834*4882a593Smuzhiyun
1835*4882a593Smuzhiyun if (rdma_protocol_roce(id_priv->id.device, id_priv->id.port_num)) {
1836*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr =
1837*4882a593Smuzhiyun &id_priv->id.route.addr.dev_addr;
1838*4882a593Smuzhiyun struct net_device *ndev = NULL;
1839*4882a593Smuzhiyun
1840*4882a593Smuzhiyun if (dev_addr->bound_dev_if)
1841*4882a593Smuzhiyun ndev = dev_get_by_index(dev_addr->net,
1842*4882a593Smuzhiyun dev_addr->bound_dev_if);
1843*4882a593Smuzhiyun if (ndev && !send_only) {
1844*4882a593Smuzhiyun enum ib_gid_type gid_type;
1845*4882a593Smuzhiyun union ib_gid mgid;
1846*4882a593Smuzhiyun
1847*4882a593Smuzhiyun gid_type = id_priv->cma_dev->default_gid_type
1848*4882a593Smuzhiyun [id_priv->id.port_num -
1849*4882a593Smuzhiyun rdma_start_port(
1850*4882a593Smuzhiyun id_priv->cma_dev->device)];
1851*4882a593Smuzhiyun cma_iboe_set_mgid((struct sockaddr *)&mc->addr, &mgid,
1852*4882a593Smuzhiyun gid_type);
1853*4882a593Smuzhiyun cma_igmp_send(ndev, &mgid, false);
1854*4882a593Smuzhiyun }
1855*4882a593Smuzhiyun dev_put(ndev);
1856*4882a593Smuzhiyun
1857*4882a593Smuzhiyun cancel_work_sync(&mc->iboe_join.work);
1858*4882a593Smuzhiyun }
1859*4882a593Smuzhiyun kfree(mc);
1860*4882a593Smuzhiyun }
1861*4882a593Smuzhiyun
cma_leave_mc_groups(struct rdma_id_private * id_priv)1862*4882a593Smuzhiyun static void cma_leave_mc_groups(struct rdma_id_private *id_priv)
1863*4882a593Smuzhiyun {
1864*4882a593Smuzhiyun struct cma_multicast *mc;
1865*4882a593Smuzhiyun
1866*4882a593Smuzhiyun while (!list_empty(&id_priv->mc_list)) {
1867*4882a593Smuzhiyun mc = list_first_entry(&id_priv->mc_list, struct cma_multicast,
1868*4882a593Smuzhiyun list);
1869*4882a593Smuzhiyun list_del(&mc->list);
1870*4882a593Smuzhiyun destroy_mc(id_priv, mc);
1871*4882a593Smuzhiyun }
1872*4882a593Smuzhiyun }
1873*4882a593Smuzhiyun
_destroy_id(struct rdma_id_private * id_priv,enum rdma_cm_state state)1874*4882a593Smuzhiyun static void _destroy_id(struct rdma_id_private *id_priv,
1875*4882a593Smuzhiyun enum rdma_cm_state state)
1876*4882a593Smuzhiyun {
1877*4882a593Smuzhiyun cma_cancel_operation(id_priv, state);
1878*4882a593Smuzhiyun
1879*4882a593Smuzhiyun rdma_restrack_del(&id_priv->res);
1880*4882a593Smuzhiyun if (id_priv->cma_dev) {
1881*4882a593Smuzhiyun if (rdma_cap_ib_cm(id_priv->id.device, 1)) {
1882*4882a593Smuzhiyun if (id_priv->cm_id.ib)
1883*4882a593Smuzhiyun ib_destroy_cm_id(id_priv->cm_id.ib);
1884*4882a593Smuzhiyun } else if (rdma_cap_iw_cm(id_priv->id.device, 1)) {
1885*4882a593Smuzhiyun if (id_priv->cm_id.iw)
1886*4882a593Smuzhiyun iw_destroy_cm_id(id_priv->cm_id.iw);
1887*4882a593Smuzhiyun }
1888*4882a593Smuzhiyun cma_leave_mc_groups(id_priv);
1889*4882a593Smuzhiyun cma_release_dev(id_priv);
1890*4882a593Smuzhiyun }
1891*4882a593Smuzhiyun
1892*4882a593Smuzhiyun cma_release_port(id_priv);
1893*4882a593Smuzhiyun cma_id_put(id_priv);
1894*4882a593Smuzhiyun wait_for_completion(&id_priv->comp);
1895*4882a593Smuzhiyun
1896*4882a593Smuzhiyun if (id_priv->internal_id)
1897*4882a593Smuzhiyun cma_id_put(id_priv->id.context);
1898*4882a593Smuzhiyun
1899*4882a593Smuzhiyun kfree(id_priv->id.route.path_rec);
1900*4882a593Smuzhiyun
1901*4882a593Smuzhiyun put_net(id_priv->id.route.addr.dev_addr.net);
1902*4882a593Smuzhiyun kfree(id_priv);
1903*4882a593Smuzhiyun }
1904*4882a593Smuzhiyun
1905*4882a593Smuzhiyun /*
1906*4882a593Smuzhiyun * destroy an ID from within the handler_mutex. This ensures that no other
1907*4882a593Smuzhiyun * handlers can start running concurrently.
1908*4882a593Smuzhiyun */
destroy_id_handler_unlock(struct rdma_id_private * id_priv)1909*4882a593Smuzhiyun static void destroy_id_handler_unlock(struct rdma_id_private *id_priv)
1910*4882a593Smuzhiyun __releases(&idprv->handler_mutex)
1911*4882a593Smuzhiyun {
1912*4882a593Smuzhiyun enum rdma_cm_state state;
1913*4882a593Smuzhiyun unsigned long flags;
1914*4882a593Smuzhiyun
1915*4882a593Smuzhiyun trace_cm_id_destroy(id_priv);
1916*4882a593Smuzhiyun
1917*4882a593Smuzhiyun /*
1918*4882a593Smuzhiyun * Setting the state to destroyed under the handler mutex provides a
1919*4882a593Smuzhiyun * fence against calling handler callbacks. If this is invoked due to
1920*4882a593Smuzhiyun * the failure of a handler callback then it guarentees that no future
1921*4882a593Smuzhiyun * handlers will be called.
1922*4882a593Smuzhiyun */
1923*4882a593Smuzhiyun lockdep_assert_held(&id_priv->handler_mutex);
1924*4882a593Smuzhiyun spin_lock_irqsave(&id_priv->lock, flags);
1925*4882a593Smuzhiyun state = id_priv->state;
1926*4882a593Smuzhiyun id_priv->state = RDMA_CM_DESTROYING;
1927*4882a593Smuzhiyun spin_unlock_irqrestore(&id_priv->lock, flags);
1928*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
1929*4882a593Smuzhiyun _destroy_id(id_priv, state);
1930*4882a593Smuzhiyun }
1931*4882a593Smuzhiyun
rdma_destroy_id(struct rdma_cm_id * id)1932*4882a593Smuzhiyun void rdma_destroy_id(struct rdma_cm_id *id)
1933*4882a593Smuzhiyun {
1934*4882a593Smuzhiyun struct rdma_id_private *id_priv =
1935*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
1936*4882a593Smuzhiyun
1937*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
1938*4882a593Smuzhiyun destroy_id_handler_unlock(id_priv);
1939*4882a593Smuzhiyun }
1940*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_destroy_id);
1941*4882a593Smuzhiyun
cma_rep_recv(struct rdma_id_private * id_priv)1942*4882a593Smuzhiyun static int cma_rep_recv(struct rdma_id_private *id_priv)
1943*4882a593Smuzhiyun {
1944*4882a593Smuzhiyun int ret;
1945*4882a593Smuzhiyun
1946*4882a593Smuzhiyun ret = cma_modify_qp_rtr(id_priv, NULL);
1947*4882a593Smuzhiyun if (ret)
1948*4882a593Smuzhiyun goto reject;
1949*4882a593Smuzhiyun
1950*4882a593Smuzhiyun ret = cma_modify_qp_rts(id_priv, NULL);
1951*4882a593Smuzhiyun if (ret)
1952*4882a593Smuzhiyun goto reject;
1953*4882a593Smuzhiyun
1954*4882a593Smuzhiyun trace_cm_send_rtu(id_priv);
1955*4882a593Smuzhiyun ret = ib_send_cm_rtu(id_priv->cm_id.ib, NULL, 0);
1956*4882a593Smuzhiyun if (ret)
1957*4882a593Smuzhiyun goto reject;
1958*4882a593Smuzhiyun
1959*4882a593Smuzhiyun return 0;
1960*4882a593Smuzhiyun reject:
1961*4882a593Smuzhiyun pr_debug_ratelimited("RDMA CM: CONNECT_ERROR: failed to handle reply. status %d\n", ret);
1962*4882a593Smuzhiyun cma_modify_qp_err(id_priv);
1963*4882a593Smuzhiyun trace_cm_send_rej(id_priv);
1964*4882a593Smuzhiyun ib_send_cm_rej(id_priv->cm_id.ib, IB_CM_REJ_CONSUMER_DEFINED,
1965*4882a593Smuzhiyun NULL, 0, NULL, 0);
1966*4882a593Smuzhiyun return ret;
1967*4882a593Smuzhiyun }
1968*4882a593Smuzhiyun
cma_set_rep_event_data(struct rdma_cm_event * event,const struct ib_cm_rep_event_param * rep_data,void * private_data)1969*4882a593Smuzhiyun static void cma_set_rep_event_data(struct rdma_cm_event *event,
1970*4882a593Smuzhiyun const struct ib_cm_rep_event_param *rep_data,
1971*4882a593Smuzhiyun void *private_data)
1972*4882a593Smuzhiyun {
1973*4882a593Smuzhiyun event->param.conn.private_data = private_data;
1974*4882a593Smuzhiyun event->param.conn.private_data_len = IB_CM_REP_PRIVATE_DATA_SIZE;
1975*4882a593Smuzhiyun event->param.conn.responder_resources = rep_data->responder_resources;
1976*4882a593Smuzhiyun event->param.conn.initiator_depth = rep_data->initiator_depth;
1977*4882a593Smuzhiyun event->param.conn.flow_control = rep_data->flow_control;
1978*4882a593Smuzhiyun event->param.conn.rnr_retry_count = rep_data->rnr_retry_count;
1979*4882a593Smuzhiyun event->param.conn.srq = rep_data->srq;
1980*4882a593Smuzhiyun event->param.conn.qp_num = rep_data->remote_qpn;
1981*4882a593Smuzhiyun
1982*4882a593Smuzhiyun event->ece.vendor_id = rep_data->ece.vendor_id;
1983*4882a593Smuzhiyun event->ece.attr_mod = rep_data->ece.attr_mod;
1984*4882a593Smuzhiyun }
1985*4882a593Smuzhiyun
cma_cm_event_handler(struct rdma_id_private * id_priv,struct rdma_cm_event * event)1986*4882a593Smuzhiyun static int cma_cm_event_handler(struct rdma_id_private *id_priv,
1987*4882a593Smuzhiyun struct rdma_cm_event *event)
1988*4882a593Smuzhiyun {
1989*4882a593Smuzhiyun int ret;
1990*4882a593Smuzhiyun
1991*4882a593Smuzhiyun lockdep_assert_held(&id_priv->handler_mutex);
1992*4882a593Smuzhiyun
1993*4882a593Smuzhiyun trace_cm_event_handler(id_priv, event);
1994*4882a593Smuzhiyun ret = id_priv->id.event_handler(&id_priv->id, event);
1995*4882a593Smuzhiyun trace_cm_event_done(id_priv, event, ret);
1996*4882a593Smuzhiyun return ret;
1997*4882a593Smuzhiyun }
1998*4882a593Smuzhiyun
cma_ib_handler(struct ib_cm_id * cm_id,const struct ib_cm_event * ib_event)1999*4882a593Smuzhiyun static int cma_ib_handler(struct ib_cm_id *cm_id,
2000*4882a593Smuzhiyun const struct ib_cm_event *ib_event)
2001*4882a593Smuzhiyun {
2002*4882a593Smuzhiyun struct rdma_id_private *id_priv = cm_id->context;
2003*4882a593Smuzhiyun struct rdma_cm_event event = {};
2004*4882a593Smuzhiyun enum rdma_cm_state state;
2005*4882a593Smuzhiyun int ret;
2006*4882a593Smuzhiyun
2007*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
2008*4882a593Smuzhiyun state = READ_ONCE(id_priv->state);
2009*4882a593Smuzhiyun if ((ib_event->event != IB_CM_TIMEWAIT_EXIT &&
2010*4882a593Smuzhiyun state != RDMA_CM_CONNECT) ||
2011*4882a593Smuzhiyun (ib_event->event == IB_CM_TIMEWAIT_EXIT &&
2012*4882a593Smuzhiyun state != RDMA_CM_DISCONNECT))
2013*4882a593Smuzhiyun goto out;
2014*4882a593Smuzhiyun
2015*4882a593Smuzhiyun switch (ib_event->event) {
2016*4882a593Smuzhiyun case IB_CM_REQ_ERROR:
2017*4882a593Smuzhiyun case IB_CM_REP_ERROR:
2018*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_UNREACHABLE;
2019*4882a593Smuzhiyun event.status = -ETIMEDOUT;
2020*4882a593Smuzhiyun break;
2021*4882a593Smuzhiyun case IB_CM_REP_RECEIVED:
2022*4882a593Smuzhiyun if (state == RDMA_CM_CONNECT &&
2023*4882a593Smuzhiyun (id_priv->id.qp_type != IB_QPT_UD)) {
2024*4882a593Smuzhiyun trace_cm_send_mra(id_priv);
2025*4882a593Smuzhiyun ib_send_cm_mra(cm_id, CMA_CM_MRA_SETTING, NULL, 0);
2026*4882a593Smuzhiyun }
2027*4882a593Smuzhiyun if (id_priv->id.qp) {
2028*4882a593Smuzhiyun event.status = cma_rep_recv(id_priv);
2029*4882a593Smuzhiyun event.event = event.status ? RDMA_CM_EVENT_CONNECT_ERROR :
2030*4882a593Smuzhiyun RDMA_CM_EVENT_ESTABLISHED;
2031*4882a593Smuzhiyun } else {
2032*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_CONNECT_RESPONSE;
2033*4882a593Smuzhiyun }
2034*4882a593Smuzhiyun cma_set_rep_event_data(&event, &ib_event->param.rep_rcvd,
2035*4882a593Smuzhiyun ib_event->private_data);
2036*4882a593Smuzhiyun break;
2037*4882a593Smuzhiyun case IB_CM_RTU_RECEIVED:
2038*4882a593Smuzhiyun case IB_CM_USER_ESTABLISHED:
2039*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_ESTABLISHED;
2040*4882a593Smuzhiyun break;
2041*4882a593Smuzhiyun case IB_CM_DREQ_ERROR:
2042*4882a593Smuzhiyun event.status = -ETIMEDOUT;
2043*4882a593Smuzhiyun fallthrough;
2044*4882a593Smuzhiyun case IB_CM_DREQ_RECEIVED:
2045*4882a593Smuzhiyun case IB_CM_DREP_RECEIVED:
2046*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_CONNECT,
2047*4882a593Smuzhiyun RDMA_CM_DISCONNECT))
2048*4882a593Smuzhiyun goto out;
2049*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_DISCONNECTED;
2050*4882a593Smuzhiyun break;
2051*4882a593Smuzhiyun case IB_CM_TIMEWAIT_EXIT:
2052*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_TIMEWAIT_EXIT;
2053*4882a593Smuzhiyun break;
2054*4882a593Smuzhiyun case IB_CM_MRA_RECEIVED:
2055*4882a593Smuzhiyun /* ignore event */
2056*4882a593Smuzhiyun goto out;
2057*4882a593Smuzhiyun case IB_CM_REJ_RECEIVED:
2058*4882a593Smuzhiyun pr_debug_ratelimited("RDMA CM: REJECTED: %s\n", rdma_reject_msg(&id_priv->id,
2059*4882a593Smuzhiyun ib_event->param.rej_rcvd.reason));
2060*4882a593Smuzhiyun cma_modify_qp_err(id_priv);
2061*4882a593Smuzhiyun event.status = ib_event->param.rej_rcvd.reason;
2062*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_REJECTED;
2063*4882a593Smuzhiyun event.param.conn.private_data = ib_event->private_data;
2064*4882a593Smuzhiyun event.param.conn.private_data_len = IB_CM_REJ_PRIVATE_DATA_SIZE;
2065*4882a593Smuzhiyun break;
2066*4882a593Smuzhiyun default:
2067*4882a593Smuzhiyun pr_err("RDMA CMA: unexpected IB CM event: %d\n",
2068*4882a593Smuzhiyun ib_event->event);
2069*4882a593Smuzhiyun goto out;
2070*4882a593Smuzhiyun }
2071*4882a593Smuzhiyun
2072*4882a593Smuzhiyun ret = cma_cm_event_handler(id_priv, &event);
2073*4882a593Smuzhiyun if (ret) {
2074*4882a593Smuzhiyun /* Destroy the CM ID by returning a non-zero value. */
2075*4882a593Smuzhiyun id_priv->cm_id.ib = NULL;
2076*4882a593Smuzhiyun destroy_id_handler_unlock(id_priv);
2077*4882a593Smuzhiyun return ret;
2078*4882a593Smuzhiyun }
2079*4882a593Smuzhiyun out:
2080*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
2081*4882a593Smuzhiyun return 0;
2082*4882a593Smuzhiyun }
2083*4882a593Smuzhiyun
2084*4882a593Smuzhiyun static struct rdma_id_private *
cma_ib_new_conn_id(const struct rdma_cm_id * listen_id,const struct ib_cm_event * ib_event,struct net_device * net_dev)2085*4882a593Smuzhiyun cma_ib_new_conn_id(const struct rdma_cm_id *listen_id,
2086*4882a593Smuzhiyun const struct ib_cm_event *ib_event,
2087*4882a593Smuzhiyun struct net_device *net_dev)
2088*4882a593Smuzhiyun {
2089*4882a593Smuzhiyun struct rdma_id_private *listen_id_priv;
2090*4882a593Smuzhiyun struct rdma_id_private *id_priv;
2091*4882a593Smuzhiyun struct rdma_cm_id *id;
2092*4882a593Smuzhiyun struct rdma_route *rt;
2093*4882a593Smuzhiyun const sa_family_t ss_family = listen_id->route.addr.src_addr.ss_family;
2094*4882a593Smuzhiyun struct sa_path_rec *path = ib_event->param.req_rcvd.primary_path;
2095*4882a593Smuzhiyun const __be64 service_id =
2096*4882a593Smuzhiyun ib_event->param.req_rcvd.primary_path->service_id;
2097*4882a593Smuzhiyun int ret;
2098*4882a593Smuzhiyun
2099*4882a593Smuzhiyun listen_id_priv = container_of(listen_id, struct rdma_id_private, id);
2100*4882a593Smuzhiyun id_priv = __rdma_create_id(listen_id->route.addr.dev_addr.net,
2101*4882a593Smuzhiyun listen_id->event_handler, listen_id->context,
2102*4882a593Smuzhiyun listen_id->ps,
2103*4882a593Smuzhiyun ib_event->param.req_rcvd.qp_type,
2104*4882a593Smuzhiyun listen_id_priv);
2105*4882a593Smuzhiyun if (IS_ERR(id_priv))
2106*4882a593Smuzhiyun return NULL;
2107*4882a593Smuzhiyun
2108*4882a593Smuzhiyun id = &id_priv->id;
2109*4882a593Smuzhiyun if (cma_save_net_info((struct sockaddr *)&id->route.addr.src_addr,
2110*4882a593Smuzhiyun (struct sockaddr *)&id->route.addr.dst_addr,
2111*4882a593Smuzhiyun listen_id, ib_event, ss_family, service_id))
2112*4882a593Smuzhiyun goto err;
2113*4882a593Smuzhiyun
2114*4882a593Smuzhiyun rt = &id->route;
2115*4882a593Smuzhiyun rt->num_paths = ib_event->param.req_rcvd.alternate_path ? 2 : 1;
2116*4882a593Smuzhiyun rt->path_rec = kmalloc_array(rt->num_paths, sizeof(*rt->path_rec),
2117*4882a593Smuzhiyun GFP_KERNEL);
2118*4882a593Smuzhiyun if (!rt->path_rec)
2119*4882a593Smuzhiyun goto err;
2120*4882a593Smuzhiyun
2121*4882a593Smuzhiyun rt->path_rec[0] = *path;
2122*4882a593Smuzhiyun if (rt->num_paths == 2)
2123*4882a593Smuzhiyun rt->path_rec[1] = *ib_event->param.req_rcvd.alternate_path;
2124*4882a593Smuzhiyun
2125*4882a593Smuzhiyun if (net_dev) {
2126*4882a593Smuzhiyun rdma_copy_src_l2_addr(&rt->addr.dev_addr, net_dev);
2127*4882a593Smuzhiyun } else {
2128*4882a593Smuzhiyun if (!cma_protocol_roce(listen_id) &&
2129*4882a593Smuzhiyun cma_any_addr(cma_src_addr(id_priv))) {
2130*4882a593Smuzhiyun rt->addr.dev_addr.dev_type = ARPHRD_INFINIBAND;
2131*4882a593Smuzhiyun rdma_addr_set_sgid(&rt->addr.dev_addr, &rt->path_rec[0].sgid);
2132*4882a593Smuzhiyun ib_addr_set_pkey(&rt->addr.dev_addr, be16_to_cpu(rt->path_rec[0].pkey));
2133*4882a593Smuzhiyun } else if (!cma_any_addr(cma_src_addr(id_priv))) {
2134*4882a593Smuzhiyun ret = cma_translate_addr(cma_src_addr(id_priv), &rt->addr.dev_addr);
2135*4882a593Smuzhiyun if (ret)
2136*4882a593Smuzhiyun goto err;
2137*4882a593Smuzhiyun }
2138*4882a593Smuzhiyun }
2139*4882a593Smuzhiyun rdma_addr_set_dgid(&rt->addr.dev_addr, &rt->path_rec[0].dgid);
2140*4882a593Smuzhiyun
2141*4882a593Smuzhiyun id_priv->state = RDMA_CM_CONNECT;
2142*4882a593Smuzhiyun return id_priv;
2143*4882a593Smuzhiyun
2144*4882a593Smuzhiyun err:
2145*4882a593Smuzhiyun rdma_destroy_id(id);
2146*4882a593Smuzhiyun return NULL;
2147*4882a593Smuzhiyun }
2148*4882a593Smuzhiyun
2149*4882a593Smuzhiyun static struct rdma_id_private *
cma_ib_new_udp_id(const struct rdma_cm_id * listen_id,const struct ib_cm_event * ib_event,struct net_device * net_dev)2150*4882a593Smuzhiyun cma_ib_new_udp_id(const struct rdma_cm_id *listen_id,
2151*4882a593Smuzhiyun const struct ib_cm_event *ib_event,
2152*4882a593Smuzhiyun struct net_device *net_dev)
2153*4882a593Smuzhiyun {
2154*4882a593Smuzhiyun const struct rdma_id_private *listen_id_priv;
2155*4882a593Smuzhiyun struct rdma_id_private *id_priv;
2156*4882a593Smuzhiyun struct rdma_cm_id *id;
2157*4882a593Smuzhiyun const sa_family_t ss_family = listen_id->route.addr.src_addr.ss_family;
2158*4882a593Smuzhiyun struct net *net = listen_id->route.addr.dev_addr.net;
2159*4882a593Smuzhiyun int ret;
2160*4882a593Smuzhiyun
2161*4882a593Smuzhiyun listen_id_priv = container_of(listen_id, struct rdma_id_private, id);
2162*4882a593Smuzhiyun id_priv = __rdma_create_id(net, listen_id->event_handler,
2163*4882a593Smuzhiyun listen_id->context, listen_id->ps, IB_QPT_UD,
2164*4882a593Smuzhiyun listen_id_priv);
2165*4882a593Smuzhiyun if (IS_ERR(id_priv))
2166*4882a593Smuzhiyun return NULL;
2167*4882a593Smuzhiyun
2168*4882a593Smuzhiyun id = &id_priv->id;
2169*4882a593Smuzhiyun if (cma_save_net_info((struct sockaddr *)&id->route.addr.src_addr,
2170*4882a593Smuzhiyun (struct sockaddr *)&id->route.addr.dst_addr,
2171*4882a593Smuzhiyun listen_id, ib_event, ss_family,
2172*4882a593Smuzhiyun ib_event->param.sidr_req_rcvd.service_id))
2173*4882a593Smuzhiyun goto err;
2174*4882a593Smuzhiyun
2175*4882a593Smuzhiyun if (net_dev) {
2176*4882a593Smuzhiyun rdma_copy_src_l2_addr(&id->route.addr.dev_addr, net_dev);
2177*4882a593Smuzhiyun } else {
2178*4882a593Smuzhiyun if (!cma_any_addr(cma_src_addr(id_priv))) {
2179*4882a593Smuzhiyun ret = cma_translate_addr(cma_src_addr(id_priv),
2180*4882a593Smuzhiyun &id->route.addr.dev_addr);
2181*4882a593Smuzhiyun if (ret)
2182*4882a593Smuzhiyun goto err;
2183*4882a593Smuzhiyun }
2184*4882a593Smuzhiyun }
2185*4882a593Smuzhiyun
2186*4882a593Smuzhiyun id_priv->state = RDMA_CM_CONNECT;
2187*4882a593Smuzhiyun return id_priv;
2188*4882a593Smuzhiyun err:
2189*4882a593Smuzhiyun rdma_destroy_id(id);
2190*4882a593Smuzhiyun return NULL;
2191*4882a593Smuzhiyun }
2192*4882a593Smuzhiyun
cma_set_req_event_data(struct rdma_cm_event * event,const struct ib_cm_req_event_param * req_data,void * private_data,int offset)2193*4882a593Smuzhiyun static void cma_set_req_event_data(struct rdma_cm_event *event,
2194*4882a593Smuzhiyun const struct ib_cm_req_event_param *req_data,
2195*4882a593Smuzhiyun void *private_data, int offset)
2196*4882a593Smuzhiyun {
2197*4882a593Smuzhiyun event->param.conn.private_data = private_data + offset;
2198*4882a593Smuzhiyun event->param.conn.private_data_len = IB_CM_REQ_PRIVATE_DATA_SIZE - offset;
2199*4882a593Smuzhiyun event->param.conn.responder_resources = req_data->responder_resources;
2200*4882a593Smuzhiyun event->param.conn.initiator_depth = req_data->initiator_depth;
2201*4882a593Smuzhiyun event->param.conn.flow_control = req_data->flow_control;
2202*4882a593Smuzhiyun event->param.conn.retry_count = req_data->retry_count;
2203*4882a593Smuzhiyun event->param.conn.rnr_retry_count = req_data->rnr_retry_count;
2204*4882a593Smuzhiyun event->param.conn.srq = req_data->srq;
2205*4882a593Smuzhiyun event->param.conn.qp_num = req_data->remote_qpn;
2206*4882a593Smuzhiyun
2207*4882a593Smuzhiyun event->ece.vendor_id = req_data->ece.vendor_id;
2208*4882a593Smuzhiyun event->ece.attr_mod = req_data->ece.attr_mod;
2209*4882a593Smuzhiyun }
2210*4882a593Smuzhiyun
cma_ib_check_req_qp_type(const struct rdma_cm_id * id,const struct ib_cm_event * ib_event)2211*4882a593Smuzhiyun static int cma_ib_check_req_qp_type(const struct rdma_cm_id *id,
2212*4882a593Smuzhiyun const struct ib_cm_event *ib_event)
2213*4882a593Smuzhiyun {
2214*4882a593Smuzhiyun return (((ib_event->event == IB_CM_REQ_RECEIVED) &&
2215*4882a593Smuzhiyun (ib_event->param.req_rcvd.qp_type == id->qp_type)) ||
2216*4882a593Smuzhiyun ((ib_event->event == IB_CM_SIDR_REQ_RECEIVED) &&
2217*4882a593Smuzhiyun (id->qp_type == IB_QPT_UD)) ||
2218*4882a593Smuzhiyun (!id->qp_type));
2219*4882a593Smuzhiyun }
2220*4882a593Smuzhiyun
cma_ib_req_handler(struct ib_cm_id * cm_id,const struct ib_cm_event * ib_event)2221*4882a593Smuzhiyun static int cma_ib_req_handler(struct ib_cm_id *cm_id,
2222*4882a593Smuzhiyun const struct ib_cm_event *ib_event)
2223*4882a593Smuzhiyun {
2224*4882a593Smuzhiyun struct rdma_id_private *listen_id, *conn_id = NULL;
2225*4882a593Smuzhiyun struct rdma_cm_event event = {};
2226*4882a593Smuzhiyun struct cma_req_info req = {};
2227*4882a593Smuzhiyun struct net_device *net_dev;
2228*4882a593Smuzhiyun u8 offset;
2229*4882a593Smuzhiyun int ret;
2230*4882a593Smuzhiyun
2231*4882a593Smuzhiyun listen_id = cma_ib_id_from_event(cm_id, ib_event, &req, &net_dev);
2232*4882a593Smuzhiyun if (IS_ERR(listen_id))
2233*4882a593Smuzhiyun return PTR_ERR(listen_id);
2234*4882a593Smuzhiyun
2235*4882a593Smuzhiyun trace_cm_req_handler(listen_id, ib_event->event);
2236*4882a593Smuzhiyun if (!cma_ib_check_req_qp_type(&listen_id->id, ib_event)) {
2237*4882a593Smuzhiyun ret = -EINVAL;
2238*4882a593Smuzhiyun goto net_dev_put;
2239*4882a593Smuzhiyun }
2240*4882a593Smuzhiyun
2241*4882a593Smuzhiyun mutex_lock(&listen_id->handler_mutex);
2242*4882a593Smuzhiyun if (READ_ONCE(listen_id->state) != RDMA_CM_LISTEN) {
2243*4882a593Smuzhiyun ret = -ECONNABORTED;
2244*4882a593Smuzhiyun goto err_unlock;
2245*4882a593Smuzhiyun }
2246*4882a593Smuzhiyun
2247*4882a593Smuzhiyun offset = cma_user_data_offset(listen_id);
2248*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_CONNECT_REQUEST;
2249*4882a593Smuzhiyun if (ib_event->event == IB_CM_SIDR_REQ_RECEIVED) {
2250*4882a593Smuzhiyun conn_id = cma_ib_new_udp_id(&listen_id->id, ib_event, net_dev);
2251*4882a593Smuzhiyun event.param.ud.private_data = ib_event->private_data + offset;
2252*4882a593Smuzhiyun event.param.ud.private_data_len =
2253*4882a593Smuzhiyun IB_CM_SIDR_REQ_PRIVATE_DATA_SIZE - offset;
2254*4882a593Smuzhiyun } else {
2255*4882a593Smuzhiyun conn_id = cma_ib_new_conn_id(&listen_id->id, ib_event, net_dev);
2256*4882a593Smuzhiyun cma_set_req_event_data(&event, &ib_event->param.req_rcvd,
2257*4882a593Smuzhiyun ib_event->private_data, offset);
2258*4882a593Smuzhiyun }
2259*4882a593Smuzhiyun if (!conn_id) {
2260*4882a593Smuzhiyun ret = -ENOMEM;
2261*4882a593Smuzhiyun goto err_unlock;
2262*4882a593Smuzhiyun }
2263*4882a593Smuzhiyun
2264*4882a593Smuzhiyun mutex_lock_nested(&conn_id->handler_mutex, SINGLE_DEPTH_NESTING);
2265*4882a593Smuzhiyun ret = cma_ib_acquire_dev(conn_id, listen_id, &req);
2266*4882a593Smuzhiyun if (ret) {
2267*4882a593Smuzhiyun destroy_id_handler_unlock(conn_id);
2268*4882a593Smuzhiyun goto err_unlock;
2269*4882a593Smuzhiyun }
2270*4882a593Smuzhiyun
2271*4882a593Smuzhiyun conn_id->cm_id.ib = cm_id;
2272*4882a593Smuzhiyun cm_id->context = conn_id;
2273*4882a593Smuzhiyun cm_id->cm_handler = cma_ib_handler;
2274*4882a593Smuzhiyun
2275*4882a593Smuzhiyun ret = cma_cm_event_handler(conn_id, &event);
2276*4882a593Smuzhiyun if (ret) {
2277*4882a593Smuzhiyun /* Destroy the CM ID by returning a non-zero value. */
2278*4882a593Smuzhiyun conn_id->cm_id.ib = NULL;
2279*4882a593Smuzhiyun mutex_unlock(&listen_id->handler_mutex);
2280*4882a593Smuzhiyun destroy_id_handler_unlock(conn_id);
2281*4882a593Smuzhiyun goto net_dev_put;
2282*4882a593Smuzhiyun }
2283*4882a593Smuzhiyun
2284*4882a593Smuzhiyun if (READ_ONCE(conn_id->state) == RDMA_CM_CONNECT &&
2285*4882a593Smuzhiyun conn_id->id.qp_type != IB_QPT_UD) {
2286*4882a593Smuzhiyun trace_cm_send_mra(cm_id->context);
2287*4882a593Smuzhiyun ib_send_cm_mra(cm_id, CMA_CM_MRA_SETTING, NULL, 0);
2288*4882a593Smuzhiyun }
2289*4882a593Smuzhiyun mutex_unlock(&conn_id->handler_mutex);
2290*4882a593Smuzhiyun
2291*4882a593Smuzhiyun err_unlock:
2292*4882a593Smuzhiyun mutex_unlock(&listen_id->handler_mutex);
2293*4882a593Smuzhiyun
2294*4882a593Smuzhiyun net_dev_put:
2295*4882a593Smuzhiyun if (net_dev)
2296*4882a593Smuzhiyun dev_put(net_dev);
2297*4882a593Smuzhiyun
2298*4882a593Smuzhiyun return ret;
2299*4882a593Smuzhiyun }
2300*4882a593Smuzhiyun
rdma_get_service_id(struct rdma_cm_id * id,struct sockaddr * addr)2301*4882a593Smuzhiyun __be64 rdma_get_service_id(struct rdma_cm_id *id, struct sockaddr *addr)
2302*4882a593Smuzhiyun {
2303*4882a593Smuzhiyun if (addr->sa_family == AF_IB)
2304*4882a593Smuzhiyun return ((struct sockaddr_ib *) addr)->sib_sid;
2305*4882a593Smuzhiyun
2306*4882a593Smuzhiyun return cpu_to_be64(((u64)id->ps << 16) + be16_to_cpu(cma_port(addr)));
2307*4882a593Smuzhiyun }
2308*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_get_service_id);
2309*4882a593Smuzhiyun
rdma_read_gids(struct rdma_cm_id * cm_id,union ib_gid * sgid,union ib_gid * dgid)2310*4882a593Smuzhiyun void rdma_read_gids(struct rdma_cm_id *cm_id, union ib_gid *sgid,
2311*4882a593Smuzhiyun union ib_gid *dgid)
2312*4882a593Smuzhiyun {
2313*4882a593Smuzhiyun struct rdma_addr *addr = &cm_id->route.addr;
2314*4882a593Smuzhiyun
2315*4882a593Smuzhiyun if (!cm_id->device) {
2316*4882a593Smuzhiyun if (sgid)
2317*4882a593Smuzhiyun memset(sgid, 0, sizeof(*sgid));
2318*4882a593Smuzhiyun if (dgid)
2319*4882a593Smuzhiyun memset(dgid, 0, sizeof(*dgid));
2320*4882a593Smuzhiyun return;
2321*4882a593Smuzhiyun }
2322*4882a593Smuzhiyun
2323*4882a593Smuzhiyun if (rdma_protocol_roce(cm_id->device, cm_id->port_num)) {
2324*4882a593Smuzhiyun if (sgid)
2325*4882a593Smuzhiyun rdma_ip2gid((struct sockaddr *)&addr->src_addr, sgid);
2326*4882a593Smuzhiyun if (dgid)
2327*4882a593Smuzhiyun rdma_ip2gid((struct sockaddr *)&addr->dst_addr, dgid);
2328*4882a593Smuzhiyun } else {
2329*4882a593Smuzhiyun if (sgid)
2330*4882a593Smuzhiyun rdma_addr_get_sgid(&addr->dev_addr, sgid);
2331*4882a593Smuzhiyun if (dgid)
2332*4882a593Smuzhiyun rdma_addr_get_dgid(&addr->dev_addr, dgid);
2333*4882a593Smuzhiyun }
2334*4882a593Smuzhiyun }
2335*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_read_gids);
2336*4882a593Smuzhiyun
/*
 * iWARP CM callback for a connecting/connected ID.
 *
 * Translates CLOSE, CONNECT_REPLY and ESTABLISHED events into RDMA CM events
 * and delivers them under the ID's handler_mutex. Events received while the
 * ID is not in RDMA_CM_CONNECT, and any other event types, are ignored.
 *
 * Returns 0 normally. If the event handler returns non-zero, the ID is
 * destroyed and that value is returned.
 */
static int cma_iw_handler(struct iw_cm_id *iw_id, struct iw_cm_event *iw_event)
{
	struct sockaddr *laddr = (struct sockaddr *)&iw_event->local_addr;
	struct sockaddr *raddr = (struct sockaddr *)&iw_event->remote_addr;
	struct rdma_id_private *id_priv = iw_id->context;
	struct rdma_cm_event event = {};
	int rc = 0;

	mutex_lock(&id_priv->handler_mutex);
	if (READ_ONCE(id_priv->state) != RDMA_CM_CONNECT)
		goto out;

	switch (iw_event->event) {
	case IW_CM_EVENT_CLOSE:
		event.event = RDMA_CM_EVENT_DISCONNECTED;
		break;
	case IW_CM_EVENT_CONNECT_REPLY:
		/* Record the addresses reported with the reply. */
		memcpy(cma_src_addr(id_priv), laddr,
		       rdma_addr_size(laddr));
		memcpy(cma_dst_addr(id_priv), raddr,
		       rdma_addr_size(raddr));

		/* Map the reply status onto an RDMA CM event type. */
		switch (iw_event->status) {
		case 0:
			event.event = RDMA_CM_EVENT_ESTABLISHED;
			event.param.conn.initiator_depth = iw_event->ird;
			event.param.conn.responder_resources = iw_event->ord;
			break;
		case -ECONNRESET:
		case -ECONNREFUSED:
			event.event = RDMA_CM_EVENT_REJECTED;
			break;
		case -ETIMEDOUT:
			event.event = RDMA_CM_EVENT_UNREACHABLE;
			break;
		default:
			event.event = RDMA_CM_EVENT_CONNECT_ERROR;
			break;
		}
		break;
	case IW_CM_EVENT_ESTABLISHED:
		event.event = RDMA_CM_EVENT_ESTABLISHED;
		event.param.conn.initiator_depth = iw_event->ird;
		event.param.conn.responder_resources = iw_event->ord;
		break;
	default:
		goto out;
	}

	event.status = iw_event->status;
	event.param.conn.private_data = iw_event->private_data;
	event.param.conn.private_data_len = iw_event->private_data_len;

	rc = cma_cm_event_handler(id_priv, &event);
	if (rc) {
		/*
		 * Destroy the CM ID by returning a non-zero value. Clear
		 * cm_id.iw first so _destroy_id() does not call
		 * iw_destroy_cm_id() on it.
		 */
		id_priv->cm_id.iw = NULL;
		destroy_id_handler_unlock(id_priv);
		return rc;
	}

out:
	mutex_unlock(&id_priv->handler_mutex);
	return rc;
}
2400*4882a593Smuzhiyun
iw_conn_req_handler(struct iw_cm_id * cm_id,struct iw_cm_event * iw_event)2401*4882a593Smuzhiyun static int iw_conn_req_handler(struct iw_cm_id *cm_id,
2402*4882a593Smuzhiyun struct iw_cm_event *iw_event)
2403*4882a593Smuzhiyun {
2404*4882a593Smuzhiyun struct rdma_id_private *listen_id, *conn_id;
2405*4882a593Smuzhiyun struct rdma_cm_event event = {};
2406*4882a593Smuzhiyun int ret = -ECONNABORTED;
2407*4882a593Smuzhiyun struct sockaddr *laddr = (struct sockaddr *)&iw_event->local_addr;
2408*4882a593Smuzhiyun struct sockaddr *raddr = (struct sockaddr *)&iw_event->remote_addr;
2409*4882a593Smuzhiyun
2410*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_CONNECT_REQUEST;
2411*4882a593Smuzhiyun event.param.conn.private_data = iw_event->private_data;
2412*4882a593Smuzhiyun event.param.conn.private_data_len = iw_event->private_data_len;
2413*4882a593Smuzhiyun event.param.conn.initiator_depth = iw_event->ird;
2414*4882a593Smuzhiyun event.param.conn.responder_resources = iw_event->ord;
2415*4882a593Smuzhiyun
2416*4882a593Smuzhiyun listen_id = cm_id->context;
2417*4882a593Smuzhiyun
2418*4882a593Smuzhiyun mutex_lock(&listen_id->handler_mutex);
2419*4882a593Smuzhiyun if (READ_ONCE(listen_id->state) != RDMA_CM_LISTEN)
2420*4882a593Smuzhiyun goto out;
2421*4882a593Smuzhiyun
2422*4882a593Smuzhiyun /* Create a new RDMA id for the new IW CM ID */
2423*4882a593Smuzhiyun conn_id = __rdma_create_id(listen_id->id.route.addr.dev_addr.net,
2424*4882a593Smuzhiyun listen_id->id.event_handler,
2425*4882a593Smuzhiyun listen_id->id.context, RDMA_PS_TCP,
2426*4882a593Smuzhiyun IB_QPT_RC, listen_id);
2427*4882a593Smuzhiyun if (IS_ERR(conn_id)) {
2428*4882a593Smuzhiyun ret = -ENOMEM;
2429*4882a593Smuzhiyun goto out;
2430*4882a593Smuzhiyun }
2431*4882a593Smuzhiyun mutex_lock_nested(&conn_id->handler_mutex, SINGLE_DEPTH_NESTING);
2432*4882a593Smuzhiyun conn_id->state = RDMA_CM_CONNECT;
2433*4882a593Smuzhiyun
2434*4882a593Smuzhiyun ret = rdma_translate_ip(laddr, &conn_id->id.route.addr.dev_addr);
2435*4882a593Smuzhiyun if (ret) {
2436*4882a593Smuzhiyun mutex_unlock(&listen_id->handler_mutex);
2437*4882a593Smuzhiyun destroy_id_handler_unlock(conn_id);
2438*4882a593Smuzhiyun return ret;
2439*4882a593Smuzhiyun }
2440*4882a593Smuzhiyun
2441*4882a593Smuzhiyun ret = cma_iw_acquire_dev(conn_id, listen_id);
2442*4882a593Smuzhiyun if (ret) {
2443*4882a593Smuzhiyun mutex_unlock(&listen_id->handler_mutex);
2444*4882a593Smuzhiyun destroy_id_handler_unlock(conn_id);
2445*4882a593Smuzhiyun return ret;
2446*4882a593Smuzhiyun }
2447*4882a593Smuzhiyun
2448*4882a593Smuzhiyun conn_id->cm_id.iw = cm_id;
2449*4882a593Smuzhiyun cm_id->context = conn_id;
2450*4882a593Smuzhiyun cm_id->cm_handler = cma_iw_handler;
2451*4882a593Smuzhiyun
2452*4882a593Smuzhiyun memcpy(cma_src_addr(conn_id), laddr, rdma_addr_size(laddr));
2453*4882a593Smuzhiyun memcpy(cma_dst_addr(conn_id), raddr, rdma_addr_size(raddr));
2454*4882a593Smuzhiyun
2455*4882a593Smuzhiyun ret = cma_cm_event_handler(conn_id, &event);
2456*4882a593Smuzhiyun if (ret) {
2457*4882a593Smuzhiyun /* User wants to destroy the CM ID */
2458*4882a593Smuzhiyun conn_id->cm_id.iw = NULL;
2459*4882a593Smuzhiyun mutex_unlock(&listen_id->handler_mutex);
2460*4882a593Smuzhiyun destroy_id_handler_unlock(conn_id);
2461*4882a593Smuzhiyun return ret;
2462*4882a593Smuzhiyun }
2463*4882a593Smuzhiyun
2464*4882a593Smuzhiyun mutex_unlock(&conn_id->handler_mutex);
2465*4882a593Smuzhiyun
2466*4882a593Smuzhiyun out:
2467*4882a593Smuzhiyun mutex_unlock(&listen_id->handler_mutex);
2468*4882a593Smuzhiyun return ret;
2469*4882a593Smuzhiyun }
2470*4882a593Smuzhiyun
cma_ib_listen(struct rdma_id_private * id_priv)2471*4882a593Smuzhiyun static int cma_ib_listen(struct rdma_id_private *id_priv)
2472*4882a593Smuzhiyun {
2473*4882a593Smuzhiyun struct sockaddr *addr;
2474*4882a593Smuzhiyun struct ib_cm_id *id;
2475*4882a593Smuzhiyun __be64 svc_id;
2476*4882a593Smuzhiyun
2477*4882a593Smuzhiyun addr = cma_src_addr(id_priv);
2478*4882a593Smuzhiyun svc_id = rdma_get_service_id(&id_priv->id, addr);
2479*4882a593Smuzhiyun id = ib_cm_insert_listen(id_priv->id.device,
2480*4882a593Smuzhiyun cma_ib_req_handler, svc_id);
2481*4882a593Smuzhiyun if (IS_ERR(id))
2482*4882a593Smuzhiyun return PTR_ERR(id);
2483*4882a593Smuzhiyun id_priv->cm_id.ib = id;
2484*4882a593Smuzhiyun
2485*4882a593Smuzhiyun return 0;
2486*4882a593Smuzhiyun }
2487*4882a593Smuzhiyun
cma_iw_listen(struct rdma_id_private * id_priv,int backlog)2488*4882a593Smuzhiyun static int cma_iw_listen(struct rdma_id_private *id_priv, int backlog)
2489*4882a593Smuzhiyun {
2490*4882a593Smuzhiyun int ret;
2491*4882a593Smuzhiyun struct iw_cm_id *id;
2492*4882a593Smuzhiyun
2493*4882a593Smuzhiyun id = iw_create_cm_id(id_priv->id.device,
2494*4882a593Smuzhiyun iw_conn_req_handler,
2495*4882a593Smuzhiyun id_priv);
2496*4882a593Smuzhiyun if (IS_ERR(id))
2497*4882a593Smuzhiyun return PTR_ERR(id);
2498*4882a593Smuzhiyun
2499*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
2500*4882a593Smuzhiyun id->tos = id_priv->tos;
2501*4882a593Smuzhiyun id->tos_set = id_priv->tos_set;
2502*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
2503*4882a593Smuzhiyun id_priv->cm_id.iw = id;
2504*4882a593Smuzhiyun
2505*4882a593Smuzhiyun memcpy(&id_priv->cm_id.iw->local_addr, cma_src_addr(id_priv),
2506*4882a593Smuzhiyun rdma_addr_size(cma_src_addr(id_priv)));
2507*4882a593Smuzhiyun
2508*4882a593Smuzhiyun ret = iw_cm_listen(id_priv->cm_id.iw, backlog);
2509*4882a593Smuzhiyun
2510*4882a593Smuzhiyun if (ret) {
2511*4882a593Smuzhiyun iw_destroy_cm_id(id_priv->cm_id.iw);
2512*4882a593Smuzhiyun id_priv->cm_id.iw = NULL;
2513*4882a593Smuzhiyun }
2514*4882a593Smuzhiyun
2515*4882a593Smuzhiyun return ret;
2516*4882a593Smuzhiyun }
2517*4882a593Smuzhiyun
cma_listen_handler(struct rdma_cm_id * id,struct rdma_cm_event * event)2518*4882a593Smuzhiyun static int cma_listen_handler(struct rdma_cm_id *id,
2519*4882a593Smuzhiyun struct rdma_cm_event *event)
2520*4882a593Smuzhiyun {
2521*4882a593Smuzhiyun struct rdma_id_private *id_priv = id->context;
2522*4882a593Smuzhiyun
2523*4882a593Smuzhiyun /* Listening IDs are always destroyed on removal */
2524*4882a593Smuzhiyun if (event->event == RDMA_CM_EVENT_DEVICE_REMOVAL)
2525*4882a593Smuzhiyun return -1;
2526*4882a593Smuzhiyun
2527*4882a593Smuzhiyun id->context = id_priv->id.context;
2528*4882a593Smuzhiyun id->event_handler = id_priv->id.event_handler;
2529*4882a593Smuzhiyun trace_cm_event_handler(id_priv, event);
2530*4882a593Smuzhiyun return id_priv->id.event_handler(id, event);
2531*4882a593Smuzhiyun }
2532*4882a593Smuzhiyun
cma_listen_on_dev(struct rdma_id_private * id_priv,struct cma_device * cma_dev,struct rdma_id_private ** to_destroy)2533*4882a593Smuzhiyun static int cma_listen_on_dev(struct rdma_id_private *id_priv,
2534*4882a593Smuzhiyun struct cma_device *cma_dev,
2535*4882a593Smuzhiyun struct rdma_id_private **to_destroy)
2536*4882a593Smuzhiyun {
2537*4882a593Smuzhiyun struct rdma_id_private *dev_id_priv;
2538*4882a593Smuzhiyun struct net *net = id_priv->id.route.addr.dev_addr.net;
2539*4882a593Smuzhiyun int ret;
2540*4882a593Smuzhiyun
2541*4882a593Smuzhiyun lockdep_assert_held(&lock);
2542*4882a593Smuzhiyun
2543*4882a593Smuzhiyun *to_destroy = NULL;
2544*4882a593Smuzhiyun if (cma_family(id_priv) == AF_IB && !rdma_cap_ib_cm(cma_dev->device, 1))
2545*4882a593Smuzhiyun return 0;
2546*4882a593Smuzhiyun
2547*4882a593Smuzhiyun dev_id_priv =
2548*4882a593Smuzhiyun __rdma_create_id(net, cma_listen_handler, id_priv,
2549*4882a593Smuzhiyun id_priv->id.ps, id_priv->id.qp_type, id_priv);
2550*4882a593Smuzhiyun if (IS_ERR(dev_id_priv))
2551*4882a593Smuzhiyun return PTR_ERR(dev_id_priv);
2552*4882a593Smuzhiyun
2553*4882a593Smuzhiyun dev_id_priv->state = RDMA_CM_ADDR_BOUND;
2554*4882a593Smuzhiyun memcpy(cma_src_addr(dev_id_priv), cma_src_addr(id_priv),
2555*4882a593Smuzhiyun rdma_addr_size(cma_src_addr(id_priv)));
2556*4882a593Smuzhiyun
2557*4882a593Smuzhiyun _cma_attach_to_dev(dev_id_priv, cma_dev);
2558*4882a593Smuzhiyun rdma_restrack_add(&dev_id_priv->res);
2559*4882a593Smuzhiyun cma_id_get(id_priv);
2560*4882a593Smuzhiyun dev_id_priv->internal_id = 1;
2561*4882a593Smuzhiyun dev_id_priv->afonly = id_priv->afonly;
2562*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
2563*4882a593Smuzhiyun dev_id_priv->tos_set = id_priv->tos_set;
2564*4882a593Smuzhiyun dev_id_priv->tos = id_priv->tos;
2565*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
2566*4882a593Smuzhiyun
2567*4882a593Smuzhiyun ret = rdma_listen(&dev_id_priv->id, id_priv->backlog);
2568*4882a593Smuzhiyun if (ret)
2569*4882a593Smuzhiyun goto err_listen;
2570*4882a593Smuzhiyun list_add_tail(&dev_id_priv->listen_list, &id_priv->listen_list);
2571*4882a593Smuzhiyun return 0;
2572*4882a593Smuzhiyun err_listen:
2573*4882a593Smuzhiyun /* Caller must destroy this after releasing lock */
2574*4882a593Smuzhiyun *to_destroy = dev_id_priv;
2575*4882a593Smuzhiyun dev_warn(&cma_dev->device->dev, "RDMA CMA: %s, error %d\n", __func__, ret);
2576*4882a593Smuzhiyun return ret;
2577*4882a593Smuzhiyun }
2578*4882a593Smuzhiyun
cma_listen_on_all(struct rdma_id_private * id_priv)2579*4882a593Smuzhiyun static int cma_listen_on_all(struct rdma_id_private *id_priv)
2580*4882a593Smuzhiyun {
2581*4882a593Smuzhiyun struct rdma_id_private *to_destroy;
2582*4882a593Smuzhiyun struct cma_device *cma_dev;
2583*4882a593Smuzhiyun int ret;
2584*4882a593Smuzhiyun
2585*4882a593Smuzhiyun mutex_lock(&lock);
2586*4882a593Smuzhiyun list_add_tail(&id_priv->list, &listen_any_list);
2587*4882a593Smuzhiyun list_for_each_entry(cma_dev, &dev_list, list) {
2588*4882a593Smuzhiyun ret = cma_listen_on_dev(id_priv, cma_dev, &to_destroy);
2589*4882a593Smuzhiyun if (ret) {
2590*4882a593Smuzhiyun /* Prevent racing with cma_process_remove() */
2591*4882a593Smuzhiyun if (to_destroy)
2592*4882a593Smuzhiyun list_del_init(&to_destroy->list);
2593*4882a593Smuzhiyun goto err_listen;
2594*4882a593Smuzhiyun }
2595*4882a593Smuzhiyun }
2596*4882a593Smuzhiyun mutex_unlock(&lock);
2597*4882a593Smuzhiyun return 0;
2598*4882a593Smuzhiyun
2599*4882a593Smuzhiyun err_listen:
2600*4882a593Smuzhiyun _cma_cancel_listens(id_priv);
2601*4882a593Smuzhiyun mutex_unlock(&lock);
2602*4882a593Smuzhiyun if (to_destroy)
2603*4882a593Smuzhiyun rdma_destroy_id(&to_destroy->id);
2604*4882a593Smuzhiyun return ret;
2605*4882a593Smuzhiyun }
2606*4882a593Smuzhiyun
rdma_set_service_type(struct rdma_cm_id * id,int tos)2607*4882a593Smuzhiyun void rdma_set_service_type(struct rdma_cm_id *id, int tos)
2608*4882a593Smuzhiyun {
2609*4882a593Smuzhiyun struct rdma_id_private *id_priv;
2610*4882a593Smuzhiyun
2611*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
2612*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
2613*4882a593Smuzhiyun id_priv->tos = (u8) tos;
2614*4882a593Smuzhiyun id_priv->tos_set = true;
2615*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
2616*4882a593Smuzhiyun }
2617*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_set_service_type);
2618*4882a593Smuzhiyun
2619*4882a593Smuzhiyun /**
2620*4882a593Smuzhiyun * rdma_set_ack_timeout() - Set the ack timeout of QP associated
2621*4882a593Smuzhiyun * with a connection identifier.
2622*4882a593Smuzhiyun * @id: Communication identifier to associated with service type.
2623*4882a593Smuzhiyun * @timeout: Ack timeout to set a QP, expressed as 4.096 * 2^(timeout) usec.
2624*4882a593Smuzhiyun *
2625*4882a593Smuzhiyun * This function should be called before rdma_connect() on active side,
2626*4882a593Smuzhiyun * and on passive side before rdma_accept(). It is applicable to primary
2627*4882a593Smuzhiyun * path only. The timeout will affect the local side of the QP, it is not
2628*4882a593Smuzhiyun * negotiated with remote side and zero disables the timer. In case it is
2629*4882a593Smuzhiyun * set before rdma_resolve_route, the value will also be used to determine
2630*4882a593Smuzhiyun * PacketLifeTime for RoCE.
2631*4882a593Smuzhiyun *
2632*4882a593Smuzhiyun * Return: 0 for success
2633*4882a593Smuzhiyun */
rdma_set_ack_timeout(struct rdma_cm_id * id,u8 timeout)2634*4882a593Smuzhiyun int rdma_set_ack_timeout(struct rdma_cm_id *id, u8 timeout)
2635*4882a593Smuzhiyun {
2636*4882a593Smuzhiyun struct rdma_id_private *id_priv;
2637*4882a593Smuzhiyun
2638*4882a593Smuzhiyun if (id->qp_type != IB_QPT_RC && id->qp_type != IB_QPT_XRC_INI)
2639*4882a593Smuzhiyun return -EINVAL;
2640*4882a593Smuzhiyun
2641*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
2642*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
2643*4882a593Smuzhiyun id_priv->timeout = timeout;
2644*4882a593Smuzhiyun id_priv->timeout_set = true;
2645*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
2646*4882a593Smuzhiyun
2647*4882a593Smuzhiyun return 0;
2648*4882a593Smuzhiyun }
2649*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_set_ack_timeout);
2650*4882a593Smuzhiyun
cma_query_handler(int status,struct sa_path_rec * path_rec,void * context)2651*4882a593Smuzhiyun static void cma_query_handler(int status, struct sa_path_rec *path_rec,
2652*4882a593Smuzhiyun void *context)
2653*4882a593Smuzhiyun {
2654*4882a593Smuzhiyun struct cma_work *work = context;
2655*4882a593Smuzhiyun struct rdma_route *route;
2656*4882a593Smuzhiyun
2657*4882a593Smuzhiyun route = &work->id->id.route;
2658*4882a593Smuzhiyun
2659*4882a593Smuzhiyun if (!status) {
2660*4882a593Smuzhiyun route->num_paths = 1;
2661*4882a593Smuzhiyun *route->path_rec = *path_rec;
2662*4882a593Smuzhiyun } else {
2663*4882a593Smuzhiyun work->old_state = RDMA_CM_ROUTE_QUERY;
2664*4882a593Smuzhiyun work->new_state = RDMA_CM_ADDR_RESOLVED;
2665*4882a593Smuzhiyun work->event.event = RDMA_CM_EVENT_ROUTE_ERROR;
2666*4882a593Smuzhiyun work->event.status = status;
2667*4882a593Smuzhiyun pr_debug_ratelimited("RDMA CM: ROUTE_ERROR: failed to query path. status %d\n",
2668*4882a593Smuzhiyun status);
2669*4882a593Smuzhiyun }
2670*4882a593Smuzhiyun
2671*4882a593Smuzhiyun queue_work(cma_wq, &work->work);
2672*4882a593Smuzhiyun }
2673*4882a593Smuzhiyun
cma_query_ib_route(struct rdma_id_private * id_priv,unsigned long timeout_ms,struct cma_work * work)2674*4882a593Smuzhiyun static int cma_query_ib_route(struct rdma_id_private *id_priv,
2675*4882a593Smuzhiyun unsigned long timeout_ms, struct cma_work *work)
2676*4882a593Smuzhiyun {
2677*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
2678*4882a593Smuzhiyun struct sa_path_rec path_rec;
2679*4882a593Smuzhiyun ib_sa_comp_mask comp_mask;
2680*4882a593Smuzhiyun struct sockaddr_in6 *sin6;
2681*4882a593Smuzhiyun struct sockaddr_ib *sib;
2682*4882a593Smuzhiyun
2683*4882a593Smuzhiyun memset(&path_rec, 0, sizeof path_rec);
2684*4882a593Smuzhiyun
2685*4882a593Smuzhiyun if (rdma_cap_opa_ah(id_priv->id.device, id_priv->id.port_num))
2686*4882a593Smuzhiyun path_rec.rec_type = SA_PATH_REC_TYPE_OPA;
2687*4882a593Smuzhiyun else
2688*4882a593Smuzhiyun path_rec.rec_type = SA_PATH_REC_TYPE_IB;
2689*4882a593Smuzhiyun rdma_addr_get_sgid(dev_addr, &path_rec.sgid);
2690*4882a593Smuzhiyun rdma_addr_get_dgid(dev_addr, &path_rec.dgid);
2691*4882a593Smuzhiyun path_rec.pkey = cpu_to_be16(ib_addr_get_pkey(dev_addr));
2692*4882a593Smuzhiyun path_rec.numb_path = 1;
2693*4882a593Smuzhiyun path_rec.reversible = 1;
2694*4882a593Smuzhiyun path_rec.service_id = rdma_get_service_id(&id_priv->id,
2695*4882a593Smuzhiyun cma_dst_addr(id_priv));
2696*4882a593Smuzhiyun
2697*4882a593Smuzhiyun comp_mask = IB_SA_PATH_REC_DGID | IB_SA_PATH_REC_SGID |
2698*4882a593Smuzhiyun IB_SA_PATH_REC_PKEY | IB_SA_PATH_REC_NUMB_PATH |
2699*4882a593Smuzhiyun IB_SA_PATH_REC_REVERSIBLE | IB_SA_PATH_REC_SERVICE_ID;
2700*4882a593Smuzhiyun
2701*4882a593Smuzhiyun switch (cma_family(id_priv)) {
2702*4882a593Smuzhiyun case AF_INET:
2703*4882a593Smuzhiyun path_rec.qos_class = cpu_to_be16((u16) id_priv->tos);
2704*4882a593Smuzhiyun comp_mask |= IB_SA_PATH_REC_QOS_CLASS;
2705*4882a593Smuzhiyun break;
2706*4882a593Smuzhiyun case AF_INET6:
2707*4882a593Smuzhiyun sin6 = (struct sockaddr_in6 *) cma_src_addr(id_priv);
2708*4882a593Smuzhiyun path_rec.traffic_class = (u8) (be32_to_cpu(sin6->sin6_flowinfo) >> 20);
2709*4882a593Smuzhiyun comp_mask |= IB_SA_PATH_REC_TRAFFIC_CLASS;
2710*4882a593Smuzhiyun break;
2711*4882a593Smuzhiyun case AF_IB:
2712*4882a593Smuzhiyun sib = (struct sockaddr_ib *) cma_src_addr(id_priv);
2713*4882a593Smuzhiyun path_rec.traffic_class = (u8) (be32_to_cpu(sib->sib_flowinfo) >> 20);
2714*4882a593Smuzhiyun comp_mask |= IB_SA_PATH_REC_TRAFFIC_CLASS;
2715*4882a593Smuzhiyun break;
2716*4882a593Smuzhiyun }
2717*4882a593Smuzhiyun
2718*4882a593Smuzhiyun id_priv->query_id = ib_sa_path_rec_get(&sa_client, id_priv->id.device,
2719*4882a593Smuzhiyun id_priv->id.port_num, &path_rec,
2720*4882a593Smuzhiyun comp_mask, timeout_ms,
2721*4882a593Smuzhiyun GFP_KERNEL, cma_query_handler,
2722*4882a593Smuzhiyun work, &id_priv->query);
2723*4882a593Smuzhiyun
2724*4882a593Smuzhiyun return (id_priv->query_id < 0) ? id_priv->query_id : 0;
2725*4882a593Smuzhiyun }
2726*4882a593Smuzhiyun
cma_iboe_join_work_handler(struct work_struct * work)2727*4882a593Smuzhiyun static void cma_iboe_join_work_handler(struct work_struct *work)
2728*4882a593Smuzhiyun {
2729*4882a593Smuzhiyun struct cma_multicast *mc =
2730*4882a593Smuzhiyun container_of(work, struct cma_multicast, iboe_join.work);
2731*4882a593Smuzhiyun struct rdma_cm_event *event = &mc->iboe_join.event;
2732*4882a593Smuzhiyun struct rdma_id_private *id_priv = mc->id_priv;
2733*4882a593Smuzhiyun int ret;
2734*4882a593Smuzhiyun
2735*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
2736*4882a593Smuzhiyun if (READ_ONCE(id_priv->state) == RDMA_CM_DESTROYING ||
2737*4882a593Smuzhiyun READ_ONCE(id_priv->state) == RDMA_CM_DEVICE_REMOVAL)
2738*4882a593Smuzhiyun goto out_unlock;
2739*4882a593Smuzhiyun
2740*4882a593Smuzhiyun ret = cma_cm_event_handler(id_priv, event);
2741*4882a593Smuzhiyun WARN_ON(ret);
2742*4882a593Smuzhiyun
2743*4882a593Smuzhiyun out_unlock:
2744*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
2745*4882a593Smuzhiyun if (event->event == RDMA_CM_EVENT_MULTICAST_JOIN)
2746*4882a593Smuzhiyun rdma_destroy_ah_attr(&event->param.ud.ah_attr);
2747*4882a593Smuzhiyun }
2748*4882a593Smuzhiyun
cma_work_handler(struct work_struct * _work)2749*4882a593Smuzhiyun static void cma_work_handler(struct work_struct *_work)
2750*4882a593Smuzhiyun {
2751*4882a593Smuzhiyun struct cma_work *work = container_of(_work, struct cma_work, work);
2752*4882a593Smuzhiyun struct rdma_id_private *id_priv = work->id;
2753*4882a593Smuzhiyun
2754*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
2755*4882a593Smuzhiyun if (READ_ONCE(id_priv->state) == RDMA_CM_DESTROYING ||
2756*4882a593Smuzhiyun READ_ONCE(id_priv->state) == RDMA_CM_DEVICE_REMOVAL)
2757*4882a593Smuzhiyun goto out_unlock;
2758*4882a593Smuzhiyun if (work->old_state != 0 || work->new_state != 0) {
2759*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, work->old_state, work->new_state))
2760*4882a593Smuzhiyun goto out_unlock;
2761*4882a593Smuzhiyun }
2762*4882a593Smuzhiyun
2763*4882a593Smuzhiyun if (cma_cm_event_handler(id_priv, &work->event)) {
2764*4882a593Smuzhiyun cma_id_put(id_priv);
2765*4882a593Smuzhiyun destroy_id_handler_unlock(id_priv);
2766*4882a593Smuzhiyun goto out_free;
2767*4882a593Smuzhiyun }
2768*4882a593Smuzhiyun
2769*4882a593Smuzhiyun out_unlock:
2770*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
2771*4882a593Smuzhiyun cma_id_put(id_priv);
2772*4882a593Smuzhiyun out_free:
2773*4882a593Smuzhiyun if (work->event.event == RDMA_CM_EVENT_MULTICAST_JOIN)
2774*4882a593Smuzhiyun rdma_destroy_ah_attr(&work->event.param.ud.ah_attr);
2775*4882a593Smuzhiyun kfree(work);
2776*4882a593Smuzhiyun }
2777*4882a593Smuzhiyun
cma_init_resolve_route_work(struct cma_work * work,struct rdma_id_private * id_priv)2778*4882a593Smuzhiyun static void cma_init_resolve_route_work(struct cma_work *work,
2779*4882a593Smuzhiyun struct rdma_id_private *id_priv)
2780*4882a593Smuzhiyun {
2781*4882a593Smuzhiyun work->id = id_priv;
2782*4882a593Smuzhiyun INIT_WORK(&work->work, cma_work_handler);
2783*4882a593Smuzhiyun work->old_state = RDMA_CM_ROUTE_QUERY;
2784*4882a593Smuzhiyun work->new_state = RDMA_CM_ROUTE_RESOLVED;
2785*4882a593Smuzhiyun work->event.event = RDMA_CM_EVENT_ROUTE_RESOLVED;
2786*4882a593Smuzhiyun }
2787*4882a593Smuzhiyun
enqueue_resolve_addr_work(struct cma_work * work,struct rdma_id_private * id_priv)2788*4882a593Smuzhiyun static void enqueue_resolve_addr_work(struct cma_work *work,
2789*4882a593Smuzhiyun struct rdma_id_private *id_priv)
2790*4882a593Smuzhiyun {
2791*4882a593Smuzhiyun /* Balances with cma_id_put() in cma_work_handler */
2792*4882a593Smuzhiyun cma_id_get(id_priv);
2793*4882a593Smuzhiyun
2794*4882a593Smuzhiyun work->id = id_priv;
2795*4882a593Smuzhiyun INIT_WORK(&work->work, cma_work_handler);
2796*4882a593Smuzhiyun work->old_state = RDMA_CM_ADDR_QUERY;
2797*4882a593Smuzhiyun work->new_state = RDMA_CM_ADDR_RESOLVED;
2798*4882a593Smuzhiyun work->event.event = RDMA_CM_EVENT_ADDR_RESOLVED;
2799*4882a593Smuzhiyun
2800*4882a593Smuzhiyun queue_work(cma_wq, &work->work);
2801*4882a593Smuzhiyun }
2802*4882a593Smuzhiyun
cma_resolve_ib_route(struct rdma_id_private * id_priv,unsigned long timeout_ms)2803*4882a593Smuzhiyun static int cma_resolve_ib_route(struct rdma_id_private *id_priv,
2804*4882a593Smuzhiyun unsigned long timeout_ms)
2805*4882a593Smuzhiyun {
2806*4882a593Smuzhiyun struct rdma_route *route = &id_priv->id.route;
2807*4882a593Smuzhiyun struct cma_work *work;
2808*4882a593Smuzhiyun int ret;
2809*4882a593Smuzhiyun
2810*4882a593Smuzhiyun work = kzalloc(sizeof *work, GFP_KERNEL);
2811*4882a593Smuzhiyun if (!work)
2812*4882a593Smuzhiyun return -ENOMEM;
2813*4882a593Smuzhiyun
2814*4882a593Smuzhiyun cma_init_resolve_route_work(work, id_priv);
2815*4882a593Smuzhiyun
2816*4882a593Smuzhiyun if (!route->path_rec)
2817*4882a593Smuzhiyun route->path_rec = kmalloc(sizeof *route->path_rec, GFP_KERNEL);
2818*4882a593Smuzhiyun if (!route->path_rec) {
2819*4882a593Smuzhiyun ret = -ENOMEM;
2820*4882a593Smuzhiyun goto err1;
2821*4882a593Smuzhiyun }
2822*4882a593Smuzhiyun
2823*4882a593Smuzhiyun ret = cma_query_ib_route(id_priv, timeout_ms, work);
2824*4882a593Smuzhiyun if (ret)
2825*4882a593Smuzhiyun goto err2;
2826*4882a593Smuzhiyun
2827*4882a593Smuzhiyun return 0;
2828*4882a593Smuzhiyun err2:
2829*4882a593Smuzhiyun kfree(route->path_rec);
2830*4882a593Smuzhiyun route->path_rec = NULL;
2831*4882a593Smuzhiyun err1:
2832*4882a593Smuzhiyun kfree(work);
2833*4882a593Smuzhiyun return ret;
2834*4882a593Smuzhiyun }
2835*4882a593Smuzhiyun
cma_route_gid_type(enum rdma_network_type network_type,unsigned long supported_gids,enum ib_gid_type default_gid)2836*4882a593Smuzhiyun static enum ib_gid_type cma_route_gid_type(enum rdma_network_type network_type,
2837*4882a593Smuzhiyun unsigned long supported_gids,
2838*4882a593Smuzhiyun enum ib_gid_type default_gid)
2839*4882a593Smuzhiyun {
2840*4882a593Smuzhiyun if ((network_type == RDMA_NETWORK_IPV4 ||
2841*4882a593Smuzhiyun network_type == RDMA_NETWORK_IPV6) &&
2842*4882a593Smuzhiyun test_bit(IB_GID_TYPE_ROCE_UDP_ENCAP, &supported_gids))
2843*4882a593Smuzhiyun return IB_GID_TYPE_ROCE_UDP_ENCAP;
2844*4882a593Smuzhiyun
2845*4882a593Smuzhiyun return default_gid;
2846*4882a593Smuzhiyun }
2847*4882a593Smuzhiyun
2848*4882a593Smuzhiyun /*
2849*4882a593Smuzhiyun * cma_iboe_set_path_rec_l2_fields() is helper function which sets
2850*4882a593Smuzhiyun * path record type based on GID type.
2851*4882a593Smuzhiyun * It also sets up other L2 fields which includes destination mac address
2852*4882a593Smuzhiyun * netdev ifindex, of the path record.
2853*4882a593Smuzhiyun * It returns the netdev of the bound interface for this path record entry.
2854*4882a593Smuzhiyun */
2855*4882a593Smuzhiyun static struct net_device *
cma_iboe_set_path_rec_l2_fields(struct rdma_id_private * id_priv)2856*4882a593Smuzhiyun cma_iboe_set_path_rec_l2_fields(struct rdma_id_private *id_priv)
2857*4882a593Smuzhiyun {
2858*4882a593Smuzhiyun struct rdma_route *route = &id_priv->id.route;
2859*4882a593Smuzhiyun enum ib_gid_type gid_type = IB_GID_TYPE_ROCE;
2860*4882a593Smuzhiyun struct rdma_addr *addr = &route->addr;
2861*4882a593Smuzhiyun unsigned long supported_gids;
2862*4882a593Smuzhiyun struct net_device *ndev;
2863*4882a593Smuzhiyun
2864*4882a593Smuzhiyun if (!addr->dev_addr.bound_dev_if)
2865*4882a593Smuzhiyun return NULL;
2866*4882a593Smuzhiyun
2867*4882a593Smuzhiyun ndev = dev_get_by_index(addr->dev_addr.net,
2868*4882a593Smuzhiyun addr->dev_addr.bound_dev_if);
2869*4882a593Smuzhiyun if (!ndev)
2870*4882a593Smuzhiyun return NULL;
2871*4882a593Smuzhiyun
2872*4882a593Smuzhiyun supported_gids = roce_gid_type_mask_support(id_priv->id.device,
2873*4882a593Smuzhiyun id_priv->id.port_num);
2874*4882a593Smuzhiyun gid_type = cma_route_gid_type(addr->dev_addr.network,
2875*4882a593Smuzhiyun supported_gids,
2876*4882a593Smuzhiyun id_priv->gid_type);
2877*4882a593Smuzhiyun /* Use the hint from IP Stack to select GID Type */
2878*4882a593Smuzhiyun if (gid_type < ib_network_to_gid_type(addr->dev_addr.network))
2879*4882a593Smuzhiyun gid_type = ib_network_to_gid_type(addr->dev_addr.network);
2880*4882a593Smuzhiyun route->path_rec->rec_type = sa_conv_gid_to_pathrec_type(gid_type);
2881*4882a593Smuzhiyun
2882*4882a593Smuzhiyun route->path_rec->roce.route_resolved = true;
2883*4882a593Smuzhiyun sa_path_set_dmac(route->path_rec, addr->dev_addr.dst_dev_addr);
2884*4882a593Smuzhiyun return ndev;
2885*4882a593Smuzhiyun }
2886*4882a593Smuzhiyun
rdma_set_ib_path(struct rdma_cm_id * id,struct sa_path_rec * path_rec)2887*4882a593Smuzhiyun int rdma_set_ib_path(struct rdma_cm_id *id,
2888*4882a593Smuzhiyun struct sa_path_rec *path_rec)
2889*4882a593Smuzhiyun {
2890*4882a593Smuzhiyun struct rdma_id_private *id_priv;
2891*4882a593Smuzhiyun struct net_device *ndev;
2892*4882a593Smuzhiyun int ret;
2893*4882a593Smuzhiyun
2894*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
2895*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_RESOLVED,
2896*4882a593Smuzhiyun RDMA_CM_ROUTE_RESOLVED))
2897*4882a593Smuzhiyun return -EINVAL;
2898*4882a593Smuzhiyun
2899*4882a593Smuzhiyun id->route.path_rec = kmemdup(path_rec, sizeof(*path_rec),
2900*4882a593Smuzhiyun GFP_KERNEL);
2901*4882a593Smuzhiyun if (!id->route.path_rec) {
2902*4882a593Smuzhiyun ret = -ENOMEM;
2903*4882a593Smuzhiyun goto err;
2904*4882a593Smuzhiyun }
2905*4882a593Smuzhiyun
2906*4882a593Smuzhiyun if (rdma_protocol_roce(id->device, id->port_num)) {
2907*4882a593Smuzhiyun ndev = cma_iboe_set_path_rec_l2_fields(id_priv);
2908*4882a593Smuzhiyun if (!ndev) {
2909*4882a593Smuzhiyun ret = -ENODEV;
2910*4882a593Smuzhiyun goto err_free;
2911*4882a593Smuzhiyun }
2912*4882a593Smuzhiyun dev_put(ndev);
2913*4882a593Smuzhiyun }
2914*4882a593Smuzhiyun
2915*4882a593Smuzhiyun id->route.num_paths = 1;
2916*4882a593Smuzhiyun return 0;
2917*4882a593Smuzhiyun
2918*4882a593Smuzhiyun err_free:
2919*4882a593Smuzhiyun kfree(id->route.path_rec);
2920*4882a593Smuzhiyun id->route.path_rec = NULL;
2921*4882a593Smuzhiyun err:
2922*4882a593Smuzhiyun cma_comp_exch(id_priv, RDMA_CM_ROUTE_RESOLVED, RDMA_CM_ADDR_RESOLVED);
2923*4882a593Smuzhiyun return ret;
2924*4882a593Smuzhiyun }
2925*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_set_ib_path);
2926*4882a593Smuzhiyun
cma_resolve_iw_route(struct rdma_id_private * id_priv)2927*4882a593Smuzhiyun static int cma_resolve_iw_route(struct rdma_id_private *id_priv)
2928*4882a593Smuzhiyun {
2929*4882a593Smuzhiyun struct cma_work *work;
2930*4882a593Smuzhiyun
2931*4882a593Smuzhiyun work = kzalloc(sizeof *work, GFP_KERNEL);
2932*4882a593Smuzhiyun if (!work)
2933*4882a593Smuzhiyun return -ENOMEM;
2934*4882a593Smuzhiyun
2935*4882a593Smuzhiyun cma_init_resolve_route_work(work, id_priv);
2936*4882a593Smuzhiyun queue_work(cma_wq, &work->work);
2937*4882a593Smuzhiyun return 0;
2938*4882a593Smuzhiyun }
2939*4882a593Smuzhiyun
get_vlan_ndev_tc(struct net_device * vlan_ndev,int prio)2940*4882a593Smuzhiyun static int get_vlan_ndev_tc(struct net_device *vlan_ndev, int prio)
2941*4882a593Smuzhiyun {
2942*4882a593Smuzhiyun struct net_device *dev;
2943*4882a593Smuzhiyun
2944*4882a593Smuzhiyun dev = vlan_dev_real_dev(vlan_ndev);
2945*4882a593Smuzhiyun if (dev->num_tc)
2946*4882a593Smuzhiyun return netdev_get_prio_tc_map(dev, prio);
2947*4882a593Smuzhiyun
2948*4882a593Smuzhiyun return (vlan_dev_get_egress_qos_mask(vlan_ndev, prio) &
2949*4882a593Smuzhiyun VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
2950*4882a593Smuzhiyun }
2951*4882a593Smuzhiyun
/*
 * Request/result pair handed to get_lower_vlan_dev_tc() through
 * netdev_nested_priv::data while walking the lower devices of a netdev.
 */
struct iboe_prio_tc_map {
	int input_prio;		/* in: priority to translate */
	int output_tc;		/* out: traffic class chosen by the callback */
	bool found;		/* out: set once the callback has run */
};
2957*4882a593Smuzhiyun
get_lower_vlan_dev_tc(struct net_device * dev,struct netdev_nested_priv * priv)2958*4882a593Smuzhiyun static int get_lower_vlan_dev_tc(struct net_device *dev,
2959*4882a593Smuzhiyun struct netdev_nested_priv *priv)
2960*4882a593Smuzhiyun {
2961*4882a593Smuzhiyun struct iboe_prio_tc_map *map = (struct iboe_prio_tc_map *)priv->data;
2962*4882a593Smuzhiyun
2963*4882a593Smuzhiyun if (is_vlan_dev(dev))
2964*4882a593Smuzhiyun map->output_tc = get_vlan_ndev_tc(dev, map->input_prio);
2965*4882a593Smuzhiyun else if (dev->num_tc)
2966*4882a593Smuzhiyun map->output_tc = netdev_get_prio_tc_map(dev, map->input_prio);
2967*4882a593Smuzhiyun else
2968*4882a593Smuzhiyun map->output_tc = 0;
2969*4882a593Smuzhiyun /* We are interested only in first level VLAN device, so always
2970*4882a593Smuzhiyun * return 1 to stop iterating over next level devices.
2971*4882a593Smuzhiyun */
2972*4882a593Smuzhiyun map->found = true;
2973*4882a593Smuzhiyun return 1;
2974*4882a593Smuzhiyun }
2975*4882a593Smuzhiyun
iboe_tos_to_sl(struct net_device * ndev,int tos)2976*4882a593Smuzhiyun static int iboe_tos_to_sl(struct net_device *ndev, int tos)
2977*4882a593Smuzhiyun {
2978*4882a593Smuzhiyun struct iboe_prio_tc_map prio_tc_map = {};
2979*4882a593Smuzhiyun int prio = rt_tos2priority(tos);
2980*4882a593Smuzhiyun struct netdev_nested_priv priv;
2981*4882a593Smuzhiyun
2982*4882a593Smuzhiyun /* If VLAN device, get it directly from the VLAN netdev */
2983*4882a593Smuzhiyun if (is_vlan_dev(ndev))
2984*4882a593Smuzhiyun return get_vlan_ndev_tc(ndev, prio);
2985*4882a593Smuzhiyun
2986*4882a593Smuzhiyun prio_tc_map.input_prio = prio;
2987*4882a593Smuzhiyun priv.data = (void *)&prio_tc_map;
2988*4882a593Smuzhiyun rcu_read_lock();
2989*4882a593Smuzhiyun netdev_walk_all_lower_dev_rcu(ndev,
2990*4882a593Smuzhiyun get_lower_vlan_dev_tc,
2991*4882a593Smuzhiyun &priv);
2992*4882a593Smuzhiyun rcu_read_unlock();
2993*4882a593Smuzhiyun /* If map is found from lower device, use it; Otherwise
2994*4882a593Smuzhiyun * continue with the current netdevice to get priority to tc map.
2995*4882a593Smuzhiyun */
2996*4882a593Smuzhiyun if (prio_tc_map.found)
2997*4882a593Smuzhiyun return prio_tc_map.output_tc;
2998*4882a593Smuzhiyun else if (ndev->num_tc)
2999*4882a593Smuzhiyun return netdev_get_prio_tc_map(ndev, prio);
3000*4882a593Smuzhiyun else
3001*4882a593Smuzhiyun return 0;
3002*4882a593Smuzhiyun }
3003*4882a593Smuzhiyun
cma_get_roce_udp_flow_label(struct rdma_id_private * id_priv)3004*4882a593Smuzhiyun static __be32 cma_get_roce_udp_flow_label(struct rdma_id_private *id_priv)
3005*4882a593Smuzhiyun {
3006*4882a593Smuzhiyun struct sockaddr_in6 *addr6;
3007*4882a593Smuzhiyun u16 dport, sport;
3008*4882a593Smuzhiyun u32 hash, fl;
3009*4882a593Smuzhiyun
3010*4882a593Smuzhiyun addr6 = (struct sockaddr_in6 *)cma_src_addr(id_priv);
3011*4882a593Smuzhiyun fl = be32_to_cpu(addr6->sin6_flowinfo) & IB_GRH_FLOWLABEL_MASK;
3012*4882a593Smuzhiyun if ((cma_family(id_priv) != AF_INET6) || !fl) {
3013*4882a593Smuzhiyun dport = be16_to_cpu(cma_port(cma_dst_addr(id_priv)));
3014*4882a593Smuzhiyun sport = be16_to_cpu(cma_port(cma_src_addr(id_priv)));
3015*4882a593Smuzhiyun hash = (u32)sport * 31 + dport;
3016*4882a593Smuzhiyun fl = hash & IB_GRH_FLOWLABEL_MASK;
3017*4882a593Smuzhiyun }
3018*4882a593Smuzhiyun
3019*4882a593Smuzhiyun return cpu_to_be32(fl);
3020*4882a593Smuzhiyun }
3021*4882a593Smuzhiyun
cma_resolve_iboe_route(struct rdma_id_private * id_priv)3022*4882a593Smuzhiyun static int cma_resolve_iboe_route(struct rdma_id_private *id_priv)
3023*4882a593Smuzhiyun {
3024*4882a593Smuzhiyun struct rdma_route *route = &id_priv->id.route;
3025*4882a593Smuzhiyun struct rdma_addr *addr = &route->addr;
3026*4882a593Smuzhiyun struct cma_work *work;
3027*4882a593Smuzhiyun int ret;
3028*4882a593Smuzhiyun struct net_device *ndev;
3029*4882a593Smuzhiyun
3030*4882a593Smuzhiyun u8 default_roce_tos = id_priv->cma_dev->default_roce_tos[id_priv->id.port_num -
3031*4882a593Smuzhiyun rdma_start_port(id_priv->cma_dev->device)];
3032*4882a593Smuzhiyun u8 tos;
3033*4882a593Smuzhiyun
3034*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
3035*4882a593Smuzhiyun tos = id_priv->tos_set ? id_priv->tos : default_roce_tos;
3036*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
3037*4882a593Smuzhiyun
3038*4882a593Smuzhiyun work = kzalloc(sizeof *work, GFP_KERNEL);
3039*4882a593Smuzhiyun if (!work)
3040*4882a593Smuzhiyun return -ENOMEM;
3041*4882a593Smuzhiyun
3042*4882a593Smuzhiyun route->path_rec = kzalloc(sizeof *route->path_rec, GFP_KERNEL);
3043*4882a593Smuzhiyun if (!route->path_rec) {
3044*4882a593Smuzhiyun ret = -ENOMEM;
3045*4882a593Smuzhiyun goto err1;
3046*4882a593Smuzhiyun }
3047*4882a593Smuzhiyun
3048*4882a593Smuzhiyun route->num_paths = 1;
3049*4882a593Smuzhiyun
3050*4882a593Smuzhiyun ndev = cma_iboe_set_path_rec_l2_fields(id_priv);
3051*4882a593Smuzhiyun if (!ndev) {
3052*4882a593Smuzhiyun ret = -ENODEV;
3053*4882a593Smuzhiyun goto err2;
3054*4882a593Smuzhiyun }
3055*4882a593Smuzhiyun
3056*4882a593Smuzhiyun rdma_ip2gid((struct sockaddr *)&id_priv->id.route.addr.src_addr,
3057*4882a593Smuzhiyun &route->path_rec->sgid);
3058*4882a593Smuzhiyun rdma_ip2gid((struct sockaddr *)&id_priv->id.route.addr.dst_addr,
3059*4882a593Smuzhiyun &route->path_rec->dgid);
3060*4882a593Smuzhiyun
3061*4882a593Smuzhiyun if (((struct sockaddr *)&id_priv->id.route.addr.dst_addr)->sa_family != AF_IB)
3062*4882a593Smuzhiyun /* TODO: get the hoplimit from the inet/inet6 device */
3063*4882a593Smuzhiyun route->path_rec->hop_limit = addr->dev_addr.hoplimit;
3064*4882a593Smuzhiyun else
3065*4882a593Smuzhiyun route->path_rec->hop_limit = 1;
3066*4882a593Smuzhiyun route->path_rec->reversible = 1;
3067*4882a593Smuzhiyun route->path_rec->pkey = cpu_to_be16(0xffff);
3068*4882a593Smuzhiyun route->path_rec->mtu_selector = IB_SA_EQ;
3069*4882a593Smuzhiyun route->path_rec->sl = iboe_tos_to_sl(ndev, tos);
3070*4882a593Smuzhiyun route->path_rec->traffic_class = tos;
3071*4882a593Smuzhiyun route->path_rec->mtu = iboe_get_mtu(ndev->mtu);
3072*4882a593Smuzhiyun route->path_rec->rate_selector = IB_SA_EQ;
3073*4882a593Smuzhiyun route->path_rec->rate = iboe_get_rate(ndev);
3074*4882a593Smuzhiyun dev_put(ndev);
3075*4882a593Smuzhiyun route->path_rec->packet_life_time_selector = IB_SA_EQ;
3076*4882a593Smuzhiyun /* In case ACK timeout is set, use this value to calculate
3077*4882a593Smuzhiyun * PacketLifeTime. As per IBTA 12.7.34,
3078*4882a593Smuzhiyun * local ACK timeout = (2 * PacketLifeTime + Local CA’s ACK delay).
3079*4882a593Smuzhiyun * Assuming a negligible local ACK delay, we can use
3080*4882a593Smuzhiyun * PacketLifeTime = local ACK timeout/2
3081*4882a593Smuzhiyun * as a reasonable approximation for RoCE networks.
3082*4882a593Smuzhiyun */
3083*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
3084*4882a593Smuzhiyun if (id_priv->timeout_set && id_priv->timeout)
3085*4882a593Smuzhiyun route->path_rec->packet_life_time = id_priv->timeout - 1;
3086*4882a593Smuzhiyun else
3087*4882a593Smuzhiyun route->path_rec->packet_life_time = CMA_IBOE_PACKET_LIFETIME;
3088*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
3089*4882a593Smuzhiyun
3090*4882a593Smuzhiyun if (!route->path_rec->mtu) {
3091*4882a593Smuzhiyun ret = -EINVAL;
3092*4882a593Smuzhiyun goto err2;
3093*4882a593Smuzhiyun }
3094*4882a593Smuzhiyun
3095*4882a593Smuzhiyun if (rdma_protocol_roce_udp_encap(id_priv->id.device,
3096*4882a593Smuzhiyun id_priv->id.port_num))
3097*4882a593Smuzhiyun route->path_rec->flow_label =
3098*4882a593Smuzhiyun cma_get_roce_udp_flow_label(id_priv);
3099*4882a593Smuzhiyun
3100*4882a593Smuzhiyun cma_init_resolve_route_work(work, id_priv);
3101*4882a593Smuzhiyun queue_work(cma_wq, &work->work);
3102*4882a593Smuzhiyun
3103*4882a593Smuzhiyun return 0;
3104*4882a593Smuzhiyun
3105*4882a593Smuzhiyun err2:
3106*4882a593Smuzhiyun kfree(route->path_rec);
3107*4882a593Smuzhiyun route->path_rec = NULL;
3108*4882a593Smuzhiyun route->num_paths = 0;
3109*4882a593Smuzhiyun err1:
3110*4882a593Smuzhiyun kfree(work);
3111*4882a593Smuzhiyun return ret;
3112*4882a593Smuzhiyun }
3113*4882a593Smuzhiyun
rdma_resolve_route(struct rdma_cm_id * id,unsigned long timeout_ms)3114*4882a593Smuzhiyun int rdma_resolve_route(struct rdma_cm_id *id, unsigned long timeout_ms)
3115*4882a593Smuzhiyun {
3116*4882a593Smuzhiyun struct rdma_id_private *id_priv;
3117*4882a593Smuzhiyun int ret;
3118*4882a593Smuzhiyun
3119*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
3120*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_RESOLVED, RDMA_CM_ROUTE_QUERY))
3121*4882a593Smuzhiyun return -EINVAL;
3122*4882a593Smuzhiyun
3123*4882a593Smuzhiyun cma_id_get(id_priv);
3124*4882a593Smuzhiyun if (rdma_cap_ib_sa(id->device, id->port_num))
3125*4882a593Smuzhiyun ret = cma_resolve_ib_route(id_priv, timeout_ms);
3126*4882a593Smuzhiyun else if (rdma_protocol_roce(id->device, id->port_num))
3127*4882a593Smuzhiyun ret = cma_resolve_iboe_route(id_priv);
3128*4882a593Smuzhiyun else if (rdma_protocol_iwarp(id->device, id->port_num))
3129*4882a593Smuzhiyun ret = cma_resolve_iw_route(id_priv);
3130*4882a593Smuzhiyun else
3131*4882a593Smuzhiyun ret = -ENOSYS;
3132*4882a593Smuzhiyun
3133*4882a593Smuzhiyun if (ret)
3134*4882a593Smuzhiyun goto err;
3135*4882a593Smuzhiyun
3136*4882a593Smuzhiyun return 0;
3137*4882a593Smuzhiyun err:
3138*4882a593Smuzhiyun cma_comp_exch(id_priv, RDMA_CM_ROUTE_QUERY, RDMA_CM_ADDR_RESOLVED);
3139*4882a593Smuzhiyun cma_id_put(id_priv);
3140*4882a593Smuzhiyun return ret;
3141*4882a593Smuzhiyun }
3142*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_resolve_route);
3143*4882a593Smuzhiyun
cma_set_loopback(struct sockaddr * addr)3144*4882a593Smuzhiyun static void cma_set_loopback(struct sockaddr *addr)
3145*4882a593Smuzhiyun {
3146*4882a593Smuzhiyun switch (addr->sa_family) {
3147*4882a593Smuzhiyun case AF_INET:
3148*4882a593Smuzhiyun ((struct sockaddr_in *) addr)->sin_addr.s_addr = htonl(INADDR_LOOPBACK);
3149*4882a593Smuzhiyun break;
3150*4882a593Smuzhiyun case AF_INET6:
3151*4882a593Smuzhiyun ipv6_addr_set(&((struct sockaddr_in6 *) addr)->sin6_addr,
3152*4882a593Smuzhiyun 0, 0, 0, htonl(1));
3153*4882a593Smuzhiyun break;
3154*4882a593Smuzhiyun default:
3155*4882a593Smuzhiyun ib_addr_set(&((struct sockaddr_ib *) addr)->sib_addr,
3156*4882a593Smuzhiyun 0, 0, 0, htonl(1));
3157*4882a593Smuzhiyun break;
3158*4882a593Smuzhiyun }
3159*4882a593Smuzhiyun }
3160*4882a593Smuzhiyun
cma_bind_loopback(struct rdma_id_private * id_priv)3161*4882a593Smuzhiyun static int cma_bind_loopback(struct rdma_id_private *id_priv)
3162*4882a593Smuzhiyun {
3163*4882a593Smuzhiyun struct cma_device *cma_dev, *cur_dev;
3164*4882a593Smuzhiyun union ib_gid gid;
3165*4882a593Smuzhiyun enum ib_port_state port_state;
3166*4882a593Smuzhiyun unsigned int p;
3167*4882a593Smuzhiyun u16 pkey;
3168*4882a593Smuzhiyun int ret;
3169*4882a593Smuzhiyun
3170*4882a593Smuzhiyun cma_dev = NULL;
3171*4882a593Smuzhiyun mutex_lock(&lock);
3172*4882a593Smuzhiyun list_for_each_entry(cur_dev, &dev_list, list) {
3173*4882a593Smuzhiyun if (cma_family(id_priv) == AF_IB &&
3174*4882a593Smuzhiyun !rdma_cap_ib_cm(cur_dev->device, 1))
3175*4882a593Smuzhiyun continue;
3176*4882a593Smuzhiyun
3177*4882a593Smuzhiyun if (!cma_dev)
3178*4882a593Smuzhiyun cma_dev = cur_dev;
3179*4882a593Smuzhiyun
3180*4882a593Smuzhiyun rdma_for_each_port (cur_dev->device, p) {
3181*4882a593Smuzhiyun if (!ib_get_cached_port_state(cur_dev->device, p, &port_state) &&
3182*4882a593Smuzhiyun port_state == IB_PORT_ACTIVE) {
3183*4882a593Smuzhiyun cma_dev = cur_dev;
3184*4882a593Smuzhiyun goto port_found;
3185*4882a593Smuzhiyun }
3186*4882a593Smuzhiyun }
3187*4882a593Smuzhiyun }
3188*4882a593Smuzhiyun
3189*4882a593Smuzhiyun if (!cma_dev) {
3190*4882a593Smuzhiyun ret = -ENODEV;
3191*4882a593Smuzhiyun goto out;
3192*4882a593Smuzhiyun }
3193*4882a593Smuzhiyun
3194*4882a593Smuzhiyun p = 1;
3195*4882a593Smuzhiyun
3196*4882a593Smuzhiyun port_found:
3197*4882a593Smuzhiyun ret = rdma_query_gid(cma_dev->device, p, 0, &gid);
3198*4882a593Smuzhiyun if (ret)
3199*4882a593Smuzhiyun goto out;
3200*4882a593Smuzhiyun
3201*4882a593Smuzhiyun ret = ib_get_cached_pkey(cma_dev->device, p, 0, &pkey);
3202*4882a593Smuzhiyun if (ret)
3203*4882a593Smuzhiyun goto out;
3204*4882a593Smuzhiyun
3205*4882a593Smuzhiyun id_priv->id.route.addr.dev_addr.dev_type =
3206*4882a593Smuzhiyun (rdma_protocol_ib(cma_dev->device, p)) ?
3207*4882a593Smuzhiyun ARPHRD_INFINIBAND : ARPHRD_ETHER;
3208*4882a593Smuzhiyun
3209*4882a593Smuzhiyun rdma_addr_set_sgid(&id_priv->id.route.addr.dev_addr, &gid);
3210*4882a593Smuzhiyun ib_addr_set_pkey(&id_priv->id.route.addr.dev_addr, pkey);
3211*4882a593Smuzhiyun id_priv->id.port_num = p;
3212*4882a593Smuzhiyun cma_attach_to_dev(id_priv, cma_dev);
3213*4882a593Smuzhiyun rdma_restrack_add(&id_priv->res);
3214*4882a593Smuzhiyun cma_set_loopback(cma_src_addr(id_priv));
3215*4882a593Smuzhiyun out:
3216*4882a593Smuzhiyun mutex_unlock(&lock);
3217*4882a593Smuzhiyun return ret;
3218*4882a593Smuzhiyun }
3219*4882a593Smuzhiyun
addr_handler(int status,struct sockaddr * src_addr,struct rdma_dev_addr * dev_addr,void * context)3220*4882a593Smuzhiyun static void addr_handler(int status, struct sockaddr *src_addr,
3221*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr, void *context)
3222*4882a593Smuzhiyun {
3223*4882a593Smuzhiyun struct rdma_id_private *id_priv = context;
3224*4882a593Smuzhiyun struct rdma_cm_event event = {};
3225*4882a593Smuzhiyun struct sockaddr *addr;
3226*4882a593Smuzhiyun struct sockaddr_storage old_addr;
3227*4882a593Smuzhiyun
3228*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
3229*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_QUERY,
3230*4882a593Smuzhiyun RDMA_CM_ADDR_RESOLVED))
3231*4882a593Smuzhiyun goto out;
3232*4882a593Smuzhiyun
3233*4882a593Smuzhiyun /*
3234*4882a593Smuzhiyun * Store the previous src address, so that if we fail to acquire
3235*4882a593Smuzhiyun * matching rdma device, old address can be restored back, which helps
3236*4882a593Smuzhiyun * to cancel the cma listen operation correctly.
3237*4882a593Smuzhiyun */
3238*4882a593Smuzhiyun addr = cma_src_addr(id_priv);
3239*4882a593Smuzhiyun memcpy(&old_addr, addr, rdma_addr_size(addr));
3240*4882a593Smuzhiyun memcpy(addr, src_addr, rdma_addr_size(src_addr));
3241*4882a593Smuzhiyun if (!status && !id_priv->cma_dev) {
3242*4882a593Smuzhiyun status = cma_acquire_dev_by_src_ip(id_priv);
3243*4882a593Smuzhiyun if (status)
3244*4882a593Smuzhiyun pr_debug_ratelimited("RDMA CM: ADDR_ERROR: failed to acquire device. status %d\n",
3245*4882a593Smuzhiyun status);
3246*4882a593Smuzhiyun rdma_restrack_add(&id_priv->res);
3247*4882a593Smuzhiyun } else if (status) {
3248*4882a593Smuzhiyun pr_debug_ratelimited("RDMA CM: ADDR_ERROR: failed to resolve IP. status %d\n", status);
3249*4882a593Smuzhiyun }
3250*4882a593Smuzhiyun
3251*4882a593Smuzhiyun if (status) {
3252*4882a593Smuzhiyun memcpy(addr, &old_addr,
3253*4882a593Smuzhiyun rdma_addr_size((struct sockaddr *)&old_addr));
3254*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_RESOLVED,
3255*4882a593Smuzhiyun RDMA_CM_ADDR_BOUND))
3256*4882a593Smuzhiyun goto out;
3257*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_ADDR_ERROR;
3258*4882a593Smuzhiyun event.status = status;
3259*4882a593Smuzhiyun } else
3260*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_ADDR_RESOLVED;
3261*4882a593Smuzhiyun
3262*4882a593Smuzhiyun if (cma_cm_event_handler(id_priv, &event)) {
3263*4882a593Smuzhiyun destroy_id_handler_unlock(id_priv);
3264*4882a593Smuzhiyun return;
3265*4882a593Smuzhiyun }
3266*4882a593Smuzhiyun out:
3267*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
3268*4882a593Smuzhiyun }
3269*4882a593Smuzhiyun
cma_resolve_loopback(struct rdma_id_private * id_priv)3270*4882a593Smuzhiyun static int cma_resolve_loopback(struct rdma_id_private *id_priv)
3271*4882a593Smuzhiyun {
3272*4882a593Smuzhiyun struct cma_work *work;
3273*4882a593Smuzhiyun union ib_gid gid;
3274*4882a593Smuzhiyun int ret;
3275*4882a593Smuzhiyun
3276*4882a593Smuzhiyun work = kzalloc(sizeof *work, GFP_KERNEL);
3277*4882a593Smuzhiyun if (!work)
3278*4882a593Smuzhiyun return -ENOMEM;
3279*4882a593Smuzhiyun
3280*4882a593Smuzhiyun if (!id_priv->cma_dev) {
3281*4882a593Smuzhiyun ret = cma_bind_loopback(id_priv);
3282*4882a593Smuzhiyun if (ret)
3283*4882a593Smuzhiyun goto err;
3284*4882a593Smuzhiyun }
3285*4882a593Smuzhiyun
3286*4882a593Smuzhiyun rdma_addr_get_sgid(&id_priv->id.route.addr.dev_addr, &gid);
3287*4882a593Smuzhiyun rdma_addr_set_dgid(&id_priv->id.route.addr.dev_addr, &gid);
3288*4882a593Smuzhiyun
3289*4882a593Smuzhiyun enqueue_resolve_addr_work(work, id_priv);
3290*4882a593Smuzhiyun return 0;
3291*4882a593Smuzhiyun err:
3292*4882a593Smuzhiyun kfree(work);
3293*4882a593Smuzhiyun return ret;
3294*4882a593Smuzhiyun }
3295*4882a593Smuzhiyun
cma_resolve_ib_addr(struct rdma_id_private * id_priv)3296*4882a593Smuzhiyun static int cma_resolve_ib_addr(struct rdma_id_private *id_priv)
3297*4882a593Smuzhiyun {
3298*4882a593Smuzhiyun struct cma_work *work;
3299*4882a593Smuzhiyun int ret;
3300*4882a593Smuzhiyun
3301*4882a593Smuzhiyun work = kzalloc(sizeof *work, GFP_KERNEL);
3302*4882a593Smuzhiyun if (!work)
3303*4882a593Smuzhiyun return -ENOMEM;
3304*4882a593Smuzhiyun
3305*4882a593Smuzhiyun if (!id_priv->cma_dev) {
3306*4882a593Smuzhiyun ret = cma_resolve_ib_dev(id_priv);
3307*4882a593Smuzhiyun if (ret)
3308*4882a593Smuzhiyun goto err;
3309*4882a593Smuzhiyun }
3310*4882a593Smuzhiyun
3311*4882a593Smuzhiyun rdma_addr_set_dgid(&id_priv->id.route.addr.dev_addr, (union ib_gid *)
3312*4882a593Smuzhiyun &(((struct sockaddr_ib *) &id_priv->id.route.addr.dst_addr)->sib_addr));
3313*4882a593Smuzhiyun
3314*4882a593Smuzhiyun enqueue_resolve_addr_work(work, id_priv);
3315*4882a593Smuzhiyun return 0;
3316*4882a593Smuzhiyun err:
3317*4882a593Smuzhiyun kfree(work);
3318*4882a593Smuzhiyun return ret;
3319*4882a593Smuzhiyun }
3320*4882a593Smuzhiyun
cma_bind_addr(struct rdma_cm_id * id,struct sockaddr * src_addr,const struct sockaddr * dst_addr)3321*4882a593Smuzhiyun static int cma_bind_addr(struct rdma_cm_id *id, struct sockaddr *src_addr,
3322*4882a593Smuzhiyun const struct sockaddr *dst_addr)
3323*4882a593Smuzhiyun {
3324*4882a593Smuzhiyun struct sockaddr_storage zero_sock = {};
3325*4882a593Smuzhiyun
3326*4882a593Smuzhiyun if (src_addr && src_addr->sa_family)
3327*4882a593Smuzhiyun return rdma_bind_addr(id, src_addr);
3328*4882a593Smuzhiyun
3329*4882a593Smuzhiyun /*
3330*4882a593Smuzhiyun * When the src_addr is not specified, automatically supply an any addr
3331*4882a593Smuzhiyun */
3332*4882a593Smuzhiyun zero_sock.ss_family = dst_addr->sa_family;
3333*4882a593Smuzhiyun if (IS_ENABLED(CONFIG_IPV6) && dst_addr->sa_family == AF_INET6) {
3334*4882a593Smuzhiyun struct sockaddr_in6 *src_addr6 =
3335*4882a593Smuzhiyun (struct sockaddr_in6 *)&zero_sock;
3336*4882a593Smuzhiyun struct sockaddr_in6 *dst_addr6 =
3337*4882a593Smuzhiyun (struct sockaddr_in6 *)dst_addr;
3338*4882a593Smuzhiyun
3339*4882a593Smuzhiyun src_addr6->sin6_scope_id = dst_addr6->sin6_scope_id;
3340*4882a593Smuzhiyun if (ipv6_addr_type(&dst_addr6->sin6_addr) & IPV6_ADDR_LINKLOCAL)
3341*4882a593Smuzhiyun id->route.addr.dev_addr.bound_dev_if =
3342*4882a593Smuzhiyun dst_addr6->sin6_scope_id;
3343*4882a593Smuzhiyun } else if (dst_addr->sa_family == AF_IB) {
3344*4882a593Smuzhiyun ((struct sockaddr_ib *)&zero_sock)->sib_pkey =
3345*4882a593Smuzhiyun ((struct sockaddr_ib *)dst_addr)->sib_pkey;
3346*4882a593Smuzhiyun }
3347*4882a593Smuzhiyun return rdma_bind_addr(id, (struct sockaddr *)&zero_sock);
3348*4882a593Smuzhiyun }
3349*4882a593Smuzhiyun
3350*4882a593Smuzhiyun /*
3351*4882a593Smuzhiyun * If required, resolve the source address for bind and leave the id_priv in
3352*4882a593Smuzhiyun * state RDMA_CM_ADDR_BOUND. This oddly uses the state to determine the prior
3353*4882a593Smuzhiyun * calls made by ULP, a previously bound ID will not be re-bound and src_addr is
3354*4882a593Smuzhiyun * ignored.
3355*4882a593Smuzhiyun */
resolve_prepare_src(struct rdma_id_private * id_priv,struct sockaddr * src_addr,const struct sockaddr * dst_addr)3356*4882a593Smuzhiyun static int resolve_prepare_src(struct rdma_id_private *id_priv,
3357*4882a593Smuzhiyun struct sockaddr *src_addr,
3358*4882a593Smuzhiyun const struct sockaddr *dst_addr)
3359*4882a593Smuzhiyun {
3360*4882a593Smuzhiyun int ret;
3361*4882a593Smuzhiyun
3362*4882a593Smuzhiyun memcpy(cma_dst_addr(id_priv), dst_addr, rdma_addr_size(dst_addr));
3363*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_BOUND, RDMA_CM_ADDR_QUERY)) {
3364*4882a593Smuzhiyun /* For a well behaved ULP state will be RDMA_CM_IDLE */
3365*4882a593Smuzhiyun ret = cma_bind_addr(&id_priv->id, src_addr, dst_addr);
3366*4882a593Smuzhiyun if (ret)
3367*4882a593Smuzhiyun goto err_dst;
3368*4882a593Smuzhiyun if (WARN_ON(!cma_comp_exch(id_priv, RDMA_CM_ADDR_BOUND,
3369*4882a593Smuzhiyun RDMA_CM_ADDR_QUERY))) {
3370*4882a593Smuzhiyun ret = -EINVAL;
3371*4882a593Smuzhiyun goto err_dst;
3372*4882a593Smuzhiyun }
3373*4882a593Smuzhiyun }
3374*4882a593Smuzhiyun
3375*4882a593Smuzhiyun if (cma_family(id_priv) != dst_addr->sa_family) {
3376*4882a593Smuzhiyun ret = -EINVAL;
3377*4882a593Smuzhiyun goto err_state;
3378*4882a593Smuzhiyun }
3379*4882a593Smuzhiyun return 0;
3380*4882a593Smuzhiyun
3381*4882a593Smuzhiyun err_state:
3382*4882a593Smuzhiyun cma_comp_exch(id_priv, RDMA_CM_ADDR_QUERY, RDMA_CM_ADDR_BOUND);
3383*4882a593Smuzhiyun err_dst:
3384*4882a593Smuzhiyun memset(cma_dst_addr(id_priv), 0, rdma_addr_size(dst_addr));
3385*4882a593Smuzhiyun return ret;
3386*4882a593Smuzhiyun }
3387*4882a593Smuzhiyun
rdma_resolve_addr(struct rdma_cm_id * id,struct sockaddr * src_addr,const struct sockaddr * dst_addr,unsigned long timeout_ms)3388*4882a593Smuzhiyun int rdma_resolve_addr(struct rdma_cm_id *id, struct sockaddr *src_addr,
3389*4882a593Smuzhiyun const struct sockaddr *dst_addr, unsigned long timeout_ms)
3390*4882a593Smuzhiyun {
3391*4882a593Smuzhiyun struct rdma_id_private *id_priv =
3392*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
3393*4882a593Smuzhiyun int ret;
3394*4882a593Smuzhiyun
3395*4882a593Smuzhiyun ret = resolve_prepare_src(id_priv, src_addr, dst_addr);
3396*4882a593Smuzhiyun if (ret)
3397*4882a593Smuzhiyun return ret;
3398*4882a593Smuzhiyun
3399*4882a593Smuzhiyun if (cma_any_addr(dst_addr)) {
3400*4882a593Smuzhiyun ret = cma_resolve_loopback(id_priv);
3401*4882a593Smuzhiyun } else {
3402*4882a593Smuzhiyun if (dst_addr->sa_family == AF_IB) {
3403*4882a593Smuzhiyun ret = cma_resolve_ib_addr(id_priv);
3404*4882a593Smuzhiyun } else {
3405*4882a593Smuzhiyun ret = rdma_resolve_ip(cma_src_addr(id_priv), dst_addr,
3406*4882a593Smuzhiyun &id->route.addr.dev_addr,
3407*4882a593Smuzhiyun timeout_ms, addr_handler,
3408*4882a593Smuzhiyun false, id_priv);
3409*4882a593Smuzhiyun }
3410*4882a593Smuzhiyun }
3411*4882a593Smuzhiyun if (ret)
3412*4882a593Smuzhiyun goto err;
3413*4882a593Smuzhiyun
3414*4882a593Smuzhiyun return 0;
3415*4882a593Smuzhiyun err:
3416*4882a593Smuzhiyun cma_comp_exch(id_priv, RDMA_CM_ADDR_QUERY, RDMA_CM_ADDR_BOUND);
3417*4882a593Smuzhiyun return ret;
3418*4882a593Smuzhiyun }
3419*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_resolve_addr);
3420*4882a593Smuzhiyun
rdma_set_reuseaddr(struct rdma_cm_id * id,int reuse)3421*4882a593Smuzhiyun int rdma_set_reuseaddr(struct rdma_cm_id *id, int reuse)
3422*4882a593Smuzhiyun {
3423*4882a593Smuzhiyun struct rdma_id_private *id_priv;
3424*4882a593Smuzhiyun unsigned long flags;
3425*4882a593Smuzhiyun int ret;
3426*4882a593Smuzhiyun
3427*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
3428*4882a593Smuzhiyun spin_lock_irqsave(&id_priv->lock, flags);
3429*4882a593Smuzhiyun if ((reuse && id_priv->state != RDMA_CM_LISTEN) ||
3430*4882a593Smuzhiyun id_priv->state == RDMA_CM_IDLE) {
3431*4882a593Smuzhiyun id_priv->reuseaddr = reuse;
3432*4882a593Smuzhiyun ret = 0;
3433*4882a593Smuzhiyun } else {
3434*4882a593Smuzhiyun ret = -EINVAL;
3435*4882a593Smuzhiyun }
3436*4882a593Smuzhiyun spin_unlock_irqrestore(&id_priv->lock, flags);
3437*4882a593Smuzhiyun return ret;
3438*4882a593Smuzhiyun }
3439*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_set_reuseaddr);
3440*4882a593Smuzhiyun
rdma_set_afonly(struct rdma_cm_id * id,int afonly)3441*4882a593Smuzhiyun int rdma_set_afonly(struct rdma_cm_id *id, int afonly)
3442*4882a593Smuzhiyun {
3443*4882a593Smuzhiyun struct rdma_id_private *id_priv;
3444*4882a593Smuzhiyun unsigned long flags;
3445*4882a593Smuzhiyun int ret;
3446*4882a593Smuzhiyun
3447*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
3448*4882a593Smuzhiyun spin_lock_irqsave(&id_priv->lock, flags);
3449*4882a593Smuzhiyun if (id_priv->state == RDMA_CM_IDLE || id_priv->state == RDMA_CM_ADDR_BOUND) {
3450*4882a593Smuzhiyun id_priv->options |= (1 << CMA_OPTION_AFONLY);
3451*4882a593Smuzhiyun id_priv->afonly = afonly;
3452*4882a593Smuzhiyun ret = 0;
3453*4882a593Smuzhiyun } else {
3454*4882a593Smuzhiyun ret = -EINVAL;
3455*4882a593Smuzhiyun }
3456*4882a593Smuzhiyun spin_unlock_irqrestore(&id_priv->lock, flags);
3457*4882a593Smuzhiyun return ret;
3458*4882a593Smuzhiyun }
3459*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_set_afonly);
3460*4882a593Smuzhiyun
cma_bind_port(struct rdma_bind_list * bind_list,struct rdma_id_private * id_priv)3461*4882a593Smuzhiyun static void cma_bind_port(struct rdma_bind_list *bind_list,
3462*4882a593Smuzhiyun struct rdma_id_private *id_priv)
3463*4882a593Smuzhiyun {
3464*4882a593Smuzhiyun struct sockaddr *addr;
3465*4882a593Smuzhiyun struct sockaddr_ib *sib;
3466*4882a593Smuzhiyun u64 sid, mask;
3467*4882a593Smuzhiyun __be16 port;
3468*4882a593Smuzhiyun
3469*4882a593Smuzhiyun lockdep_assert_held(&lock);
3470*4882a593Smuzhiyun
3471*4882a593Smuzhiyun addr = cma_src_addr(id_priv);
3472*4882a593Smuzhiyun port = htons(bind_list->port);
3473*4882a593Smuzhiyun
3474*4882a593Smuzhiyun switch (addr->sa_family) {
3475*4882a593Smuzhiyun case AF_INET:
3476*4882a593Smuzhiyun ((struct sockaddr_in *) addr)->sin_port = port;
3477*4882a593Smuzhiyun break;
3478*4882a593Smuzhiyun case AF_INET6:
3479*4882a593Smuzhiyun ((struct sockaddr_in6 *) addr)->sin6_port = port;
3480*4882a593Smuzhiyun break;
3481*4882a593Smuzhiyun case AF_IB:
3482*4882a593Smuzhiyun sib = (struct sockaddr_ib *) addr;
3483*4882a593Smuzhiyun sid = be64_to_cpu(sib->sib_sid);
3484*4882a593Smuzhiyun mask = be64_to_cpu(sib->sib_sid_mask);
3485*4882a593Smuzhiyun sib->sib_sid = cpu_to_be64((sid & mask) | (u64) ntohs(port));
3486*4882a593Smuzhiyun sib->sib_sid_mask = cpu_to_be64(~0ULL);
3487*4882a593Smuzhiyun break;
3488*4882a593Smuzhiyun }
3489*4882a593Smuzhiyun id_priv->bind_list = bind_list;
3490*4882a593Smuzhiyun hlist_add_head(&id_priv->node, &bind_list->owners);
3491*4882a593Smuzhiyun }
3492*4882a593Smuzhiyun
cma_alloc_port(enum rdma_ucm_port_space ps,struct rdma_id_private * id_priv,unsigned short snum)3493*4882a593Smuzhiyun static int cma_alloc_port(enum rdma_ucm_port_space ps,
3494*4882a593Smuzhiyun struct rdma_id_private *id_priv, unsigned short snum)
3495*4882a593Smuzhiyun {
3496*4882a593Smuzhiyun struct rdma_bind_list *bind_list;
3497*4882a593Smuzhiyun int ret;
3498*4882a593Smuzhiyun
3499*4882a593Smuzhiyun lockdep_assert_held(&lock);
3500*4882a593Smuzhiyun
3501*4882a593Smuzhiyun bind_list = kzalloc(sizeof *bind_list, GFP_KERNEL);
3502*4882a593Smuzhiyun if (!bind_list)
3503*4882a593Smuzhiyun return -ENOMEM;
3504*4882a593Smuzhiyun
3505*4882a593Smuzhiyun ret = cma_ps_alloc(id_priv->id.route.addr.dev_addr.net, ps, bind_list,
3506*4882a593Smuzhiyun snum);
3507*4882a593Smuzhiyun if (ret < 0)
3508*4882a593Smuzhiyun goto err;
3509*4882a593Smuzhiyun
3510*4882a593Smuzhiyun bind_list->ps = ps;
3511*4882a593Smuzhiyun bind_list->port = snum;
3512*4882a593Smuzhiyun cma_bind_port(bind_list, id_priv);
3513*4882a593Smuzhiyun return 0;
3514*4882a593Smuzhiyun err:
3515*4882a593Smuzhiyun kfree(bind_list);
3516*4882a593Smuzhiyun return ret == -ENOSPC ? -EADDRNOTAVAIL : ret;
3517*4882a593Smuzhiyun }
3518*4882a593Smuzhiyun
cma_port_is_unique(struct rdma_bind_list * bind_list,struct rdma_id_private * id_priv)3519*4882a593Smuzhiyun static int cma_port_is_unique(struct rdma_bind_list *bind_list,
3520*4882a593Smuzhiyun struct rdma_id_private *id_priv)
3521*4882a593Smuzhiyun {
3522*4882a593Smuzhiyun struct rdma_id_private *cur_id;
3523*4882a593Smuzhiyun struct sockaddr *daddr = cma_dst_addr(id_priv);
3524*4882a593Smuzhiyun struct sockaddr *saddr = cma_src_addr(id_priv);
3525*4882a593Smuzhiyun __be16 dport = cma_port(daddr);
3526*4882a593Smuzhiyun
3527*4882a593Smuzhiyun lockdep_assert_held(&lock);
3528*4882a593Smuzhiyun
3529*4882a593Smuzhiyun hlist_for_each_entry(cur_id, &bind_list->owners, node) {
3530*4882a593Smuzhiyun struct sockaddr *cur_daddr = cma_dst_addr(cur_id);
3531*4882a593Smuzhiyun struct sockaddr *cur_saddr = cma_src_addr(cur_id);
3532*4882a593Smuzhiyun __be16 cur_dport = cma_port(cur_daddr);
3533*4882a593Smuzhiyun
3534*4882a593Smuzhiyun if (id_priv == cur_id)
3535*4882a593Smuzhiyun continue;
3536*4882a593Smuzhiyun
3537*4882a593Smuzhiyun /* different dest port -> unique */
3538*4882a593Smuzhiyun if (!cma_any_port(daddr) &&
3539*4882a593Smuzhiyun !cma_any_port(cur_daddr) &&
3540*4882a593Smuzhiyun (dport != cur_dport))
3541*4882a593Smuzhiyun continue;
3542*4882a593Smuzhiyun
3543*4882a593Smuzhiyun /* different src address -> unique */
3544*4882a593Smuzhiyun if (!cma_any_addr(saddr) &&
3545*4882a593Smuzhiyun !cma_any_addr(cur_saddr) &&
3546*4882a593Smuzhiyun cma_addr_cmp(saddr, cur_saddr))
3547*4882a593Smuzhiyun continue;
3548*4882a593Smuzhiyun
3549*4882a593Smuzhiyun /* different dst address -> unique */
3550*4882a593Smuzhiyun if (!cma_any_addr(daddr) &&
3551*4882a593Smuzhiyun !cma_any_addr(cur_daddr) &&
3552*4882a593Smuzhiyun cma_addr_cmp(daddr, cur_daddr))
3553*4882a593Smuzhiyun continue;
3554*4882a593Smuzhiyun
3555*4882a593Smuzhiyun return -EADDRNOTAVAIL;
3556*4882a593Smuzhiyun }
3557*4882a593Smuzhiyun return 0;
3558*4882a593Smuzhiyun }
3559*4882a593Smuzhiyun
cma_alloc_any_port(enum rdma_ucm_port_space ps,struct rdma_id_private * id_priv)3560*4882a593Smuzhiyun static int cma_alloc_any_port(enum rdma_ucm_port_space ps,
3561*4882a593Smuzhiyun struct rdma_id_private *id_priv)
3562*4882a593Smuzhiyun {
3563*4882a593Smuzhiyun static unsigned int last_used_port;
3564*4882a593Smuzhiyun int low, high, remaining;
3565*4882a593Smuzhiyun unsigned int rover;
3566*4882a593Smuzhiyun struct net *net = id_priv->id.route.addr.dev_addr.net;
3567*4882a593Smuzhiyun
3568*4882a593Smuzhiyun lockdep_assert_held(&lock);
3569*4882a593Smuzhiyun
3570*4882a593Smuzhiyun inet_get_local_port_range(net, &low, &high);
3571*4882a593Smuzhiyun remaining = (high - low) + 1;
3572*4882a593Smuzhiyun rover = prandom_u32() % remaining + low;
3573*4882a593Smuzhiyun retry:
3574*4882a593Smuzhiyun if (last_used_port != rover) {
3575*4882a593Smuzhiyun struct rdma_bind_list *bind_list;
3576*4882a593Smuzhiyun int ret;
3577*4882a593Smuzhiyun
3578*4882a593Smuzhiyun bind_list = cma_ps_find(net, ps, (unsigned short)rover);
3579*4882a593Smuzhiyun
3580*4882a593Smuzhiyun if (!bind_list) {
3581*4882a593Smuzhiyun ret = cma_alloc_port(ps, id_priv, rover);
3582*4882a593Smuzhiyun } else {
3583*4882a593Smuzhiyun ret = cma_port_is_unique(bind_list, id_priv);
3584*4882a593Smuzhiyun if (!ret)
3585*4882a593Smuzhiyun cma_bind_port(bind_list, id_priv);
3586*4882a593Smuzhiyun }
3587*4882a593Smuzhiyun /*
3588*4882a593Smuzhiyun * Remember previously used port number in order to avoid
3589*4882a593Smuzhiyun * re-using same port immediately after it is closed.
3590*4882a593Smuzhiyun */
3591*4882a593Smuzhiyun if (!ret)
3592*4882a593Smuzhiyun last_used_port = rover;
3593*4882a593Smuzhiyun if (ret != -EADDRNOTAVAIL)
3594*4882a593Smuzhiyun return ret;
3595*4882a593Smuzhiyun }
3596*4882a593Smuzhiyun if (--remaining) {
3597*4882a593Smuzhiyun rover++;
3598*4882a593Smuzhiyun if ((rover < low) || (rover > high))
3599*4882a593Smuzhiyun rover = low;
3600*4882a593Smuzhiyun goto retry;
3601*4882a593Smuzhiyun }
3602*4882a593Smuzhiyun return -EADDRNOTAVAIL;
3603*4882a593Smuzhiyun }
3604*4882a593Smuzhiyun
3605*4882a593Smuzhiyun /*
3606*4882a593Smuzhiyun * Check that the requested port is available. This is called when trying to
3607*4882a593Smuzhiyun * bind to a specific port, or when trying to listen on a bound port. In
3608*4882a593Smuzhiyun * the latter case, the provided id_priv may already be on the bind_list, but
3609*4882a593Smuzhiyun * we still need to check that it's okay to start listening.
3610*4882a593Smuzhiyun */
cma_check_port(struct rdma_bind_list * bind_list,struct rdma_id_private * id_priv,uint8_t reuseaddr)3611*4882a593Smuzhiyun static int cma_check_port(struct rdma_bind_list *bind_list,
3612*4882a593Smuzhiyun struct rdma_id_private *id_priv, uint8_t reuseaddr)
3613*4882a593Smuzhiyun {
3614*4882a593Smuzhiyun struct rdma_id_private *cur_id;
3615*4882a593Smuzhiyun struct sockaddr *addr, *cur_addr;
3616*4882a593Smuzhiyun
3617*4882a593Smuzhiyun lockdep_assert_held(&lock);
3618*4882a593Smuzhiyun
3619*4882a593Smuzhiyun addr = cma_src_addr(id_priv);
3620*4882a593Smuzhiyun hlist_for_each_entry(cur_id, &bind_list->owners, node) {
3621*4882a593Smuzhiyun if (id_priv == cur_id)
3622*4882a593Smuzhiyun continue;
3623*4882a593Smuzhiyun
3624*4882a593Smuzhiyun if (reuseaddr && cur_id->reuseaddr)
3625*4882a593Smuzhiyun continue;
3626*4882a593Smuzhiyun
3627*4882a593Smuzhiyun cur_addr = cma_src_addr(cur_id);
3628*4882a593Smuzhiyun if (id_priv->afonly && cur_id->afonly &&
3629*4882a593Smuzhiyun (addr->sa_family != cur_addr->sa_family))
3630*4882a593Smuzhiyun continue;
3631*4882a593Smuzhiyun
3632*4882a593Smuzhiyun if (cma_any_addr(addr) || cma_any_addr(cur_addr))
3633*4882a593Smuzhiyun return -EADDRNOTAVAIL;
3634*4882a593Smuzhiyun
3635*4882a593Smuzhiyun if (!cma_addr_cmp(addr, cur_addr))
3636*4882a593Smuzhiyun return -EADDRINUSE;
3637*4882a593Smuzhiyun }
3638*4882a593Smuzhiyun return 0;
3639*4882a593Smuzhiyun }
3640*4882a593Smuzhiyun
cma_use_port(enum rdma_ucm_port_space ps,struct rdma_id_private * id_priv)3641*4882a593Smuzhiyun static int cma_use_port(enum rdma_ucm_port_space ps,
3642*4882a593Smuzhiyun struct rdma_id_private *id_priv)
3643*4882a593Smuzhiyun {
3644*4882a593Smuzhiyun struct rdma_bind_list *bind_list;
3645*4882a593Smuzhiyun unsigned short snum;
3646*4882a593Smuzhiyun int ret;
3647*4882a593Smuzhiyun
3648*4882a593Smuzhiyun lockdep_assert_held(&lock);
3649*4882a593Smuzhiyun
3650*4882a593Smuzhiyun snum = ntohs(cma_port(cma_src_addr(id_priv)));
3651*4882a593Smuzhiyun if (snum < PROT_SOCK && !capable(CAP_NET_BIND_SERVICE))
3652*4882a593Smuzhiyun return -EACCES;
3653*4882a593Smuzhiyun
3654*4882a593Smuzhiyun bind_list = cma_ps_find(id_priv->id.route.addr.dev_addr.net, ps, snum);
3655*4882a593Smuzhiyun if (!bind_list) {
3656*4882a593Smuzhiyun ret = cma_alloc_port(ps, id_priv, snum);
3657*4882a593Smuzhiyun } else {
3658*4882a593Smuzhiyun ret = cma_check_port(bind_list, id_priv, id_priv->reuseaddr);
3659*4882a593Smuzhiyun if (!ret)
3660*4882a593Smuzhiyun cma_bind_port(bind_list, id_priv);
3661*4882a593Smuzhiyun }
3662*4882a593Smuzhiyun return ret;
3663*4882a593Smuzhiyun }
3664*4882a593Smuzhiyun
3665*4882a593Smuzhiyun static enum rdma_ucm_port_space
cma_select_inet_ps(struct rdma_id_private * id_priv)3666*4882a593Smuzhiyun cma_select_inet_ps(struct rdma_id_private *id_priv)
3667*4882a593Smuzhiyun {
3668*4882a593Smuzhiyun switch (id_priv->id.ps) {
3669*4882a593Smuzhiyun case RDMA_PS_TCP:
3670*4882a593Smuzhiyun case RDMA_PS_UDP:
3671*4882a593Smuzhiyun case RDMA_PS_IPOIB:
3672*4882a593Smuzhiyun case RDMA_PS_IB:
3673*4882a593Smuzhiyun return id_priv->id.ps;
3674*4882a593Smuzhiyun default:
3675*4882a593Smuzhiyun
3676*4882a593Smuzhiyun return 0;
3677*4882a593Smuzhiyun }
3678*4882a593Smuzhiyun }
3679*4882a593Smuzhiyun
3680*4882a593Smuzhiyun static enum rdma_ucm_port_space
cma_select_ib_ps(struct rdma_id_private * id_priv)3681*4882a593Smuzhiyun cma_select_ib_ps(struct rdma_id_private *id_priv)
3682*4882a593Smuzhiyun {
3683*4882a593Smuzhiyun enum rdma_ucm_port_space ps = 0;
3684*4882a593Smuzhiyun struct sockaddr_ib *sib;
3685*4882a593Smuzhiyun u64 sid_ps, mask, sid;
3686*4882a593Smuzhiyun
3687*4882a593Smuzhiyun sib = (struct sockaddr_ib *) cma_src_addr(id_priv);
3688*4882a593Smuzhiyun mask = be64_to_cpu(sib->sib_sid_mask) & RDMA_IB_IP_PS_MASK;
3689*4882a593Smuzhiyun sid = be64_to_cpu(sib->sib_sid) & mask;
3690*4882a593Smuzhiyun
3691*4882a593Smuzhiyun if ((id_priv->id.ps == RDMA_PS_IB) && (sid == (RDMA_IB_IP_PS_IB & mask))) {
3692*4882a593Smuzhiyun sid_ps = RDMA_IB_IP_PS_IB;
3693*4882a593Smuzhiyun ps = RDMA_PS_IB;
3694*4882a593Smuzhiyun } else if (((id_priv->id.ps == RDMA_PS_IB) || (id_priv->id.ps == RDMA_PS_TCP)) &&
3695*4882a593Smuzhiyun (sid == (RDMA_IB_IP_PS_TCP & mask))) {
3696*4882a593Smuzhiyun sid_ps = RDMA_IB_IP_PS_TCP;
3697*4882a593Smuzhiyun ps = RDMA_PS_TCP;
3698*4882a593Smuzhiyun } else if (((id_priv->id.ps == RDMA_PS_IB) || (id_priv->id.ps == RDMA_PS_UDP)) &&
3699*4882a593Smuzhiyun (sid == (RDMA_IB_IP_PS_UDP & mask))) {
3700*4882a593Smuzhiyun sid_ps = RDMA_IB_IP_PS_UDP;
3701*4882a593Smuzhiyun ps = RDMA_PS_UDP;
3702*4882a593Smuzhiyun }
3703*4882a593Smuzhiyun
3704*4882a593Smuzhiyun if (ps) {
3705*4882a593Smuzhiyun sib->sib_sid = cpu_to_be64(sid_ps | ntohs(cma_port((struct sockaddr *) sib)));
3706*4882a593Smuzhiyun sib->sib_sid_mask = cpu_to_be64(RDMA_IB_IP_PS_MASK |
3707*4882a593Smuzhiyun be64_to_cpu(sib->sib_sid_mask));
3708*4882a593Smuzhiyun }
3709*4882a593Smuzhiyun return ps;
3710*4882a593Smuzhiyun }
3711*4882a593Smuzhiyun
cma_get_port(struct rdma_id_private * id_priv)3712*4882a593Smuzhiyun static int cma_get_port(struct rdma_id_private *id_priv)
3713*4882a593Smuzhiyun {
3714*4882a593Smuzhiyun enum rdma_ucm_port_space ps;
3715*4882a593Smuzhiyun int ret;
3716*4882a593Smuzhiyun
3717*4882a593Smuzhiyun if (cma_family(id_priv) != AF_IB)
3718*4882a593Smuzhiyun ps = cma_select_inet_ps(id_priv);
3719*4882a593Smuzhiyun else
3720*4882a593Smuzhiyun ps = cma_select_ib_ps(id_priv);
3721*4882a593Smuzhiyun if (!ps)
3722*4882a593Smuzhiyun return -EPROTONOSUPPORT;
3723*4882a593Smuzhiyun
3724*4882a593Smuzhiyun mutex_lock(&lock);
3725*4882a593Smuzhiyun if (cma_any_port(cma_src_addr(id_priv)))
3726*4882a593Smuzhiyun ret = cma_alloc_any_port(ps, id_priv);
3727*4882a593Smuzhiyun else
3728*4882a593Smuzhiyun ret = cma_use_port(ps, id_priv);
3729*4882a593Smuzhiyun mutex_unlock(&lock);
3730*4882a593Smuzhiyun
3731*4882a593Smuzhiyun return ret;
3732*4882a593Smuzhiyun }
3733*4882a593Smuzhiyun
cma_check_linklocal(struct rdma_dev_addr * dev_addr,struct sockaddr * addr)3734*4882a593Smuzhiyun static int cma_check_linklocal(struct rdma_dev_addr *dev_addr,
3735*4882a593Smuzhiyun struct sockaddr *addr)
3736*4882a593Smuzhiyun {
3737*4882a593Smuzhiyun #if IS_ENABLED(CONFIG_IPV6)
3738*4882a593Smuzhiyun struct sockaddr_in6 *sin6;
3739*4882a593Smuzhiyun
3740*4882a593Smuzhiyun if (addr->sa_family != AF_INET6)
3741*4882a593Smuzhiyun return 0;
3742*4882a593Smuzhiyun
3743*4882a593Smuzhiyun sin6 = (struct sockaddr_in6 *) addr;
3744*4882a593Smuzhiyun
3745*4882a593Smuzhiyun if (!(ipv6_addr_type(&sin6->sin6_addr) & IPV6_ADDR_LINKLOCAL))
3746*4882a593Smuzhiyun return 0;
3747*4882a593Smuzhiyun
3748*4882a593Smuzhiyun if (!sin6->sin6_scope_id)
3749*4882a593Smuzhiyun return -EINVAL;
3750*4882a593Smuzhiyun
3751*4882a593Smuzhiyun dev_addr->bound_dev_if = sin6->sin6_scope_id;
3752*4882a593Smuzhiyun #endif
3753*4882a593Smuzhiyun return 0;
3754*4882a593Smuzhiyun }
3755*4882a593Smuzhiyun
rdma_listen(struct rdma_cm_id * id,int backlog)3756*4882a593Smuzhiyun int rdma_listen(struct rdma_cm_id *id, int backlog)
3757*4882a593Smuzhiyun {
3758*4882a593Smuzhiyun struct rdma_id_private *id_priv =
3759*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
3760*4882a593Smuzhiyun int ret;
3761*4882a593Smuzhiyun
3762*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_ADDR_BOUND, RDMA_CM_LISTEN)) {
3763*4882a593Smuzhiyun struct sockaddr_in any_in = {
3764*4882a593Smuzhiyun .sin_family = AF_INET,
3765*4882a593Smuzhiyun .sin_addr.s_addr = htonl(INADDR_ANY),
3766*4882a593Smuzhiyun };
3767*4882a593Smuzhiyun
3768*4882a593Smuzhiyun /* For a well behaved ULP state will be RDMA_CM_IDLE */
3769*4882a593Smuzhiyun ret = rdma_bind_addr(id, (struct sockaddr *)&any_in);
3770*4882a593Smuzhiyun if (ret)
3771*4882a593Smuzhiyun return ret;
3772*4882a593Smuzhiyun if (WARN_ON(!cma_comp_exch(id_priv, RDMA_CM_ADDR_BOUND,
3773*4882a593Smuzhiyun RDMA_CM_LISTEN)))
3774*4882a593Smuzhiyun return -EINVAL;
3775*4882a593Smuzhiyun }
3776*4882a593Smuzhiyun
3777*4882a593Smuzhiyun /*
3778*4882a593Smuzhiyun * Once the ID reaches RDMA_CM_LISTEN it is not allowed to be reusable
3779*4882a593Smuzhiyun * any more, and has to be unique in the bind list.
3780*4882a593Smuzhiyun */
3781*4882a593Smuzhiyun if (id_priv->reuseaddr) {
3782*4882a593Smuzhiyun mutex_lock(&lock);
3783*4882a593Smuzhiyun ret = cma_check_port(id_priv->bind_list, id_priv, 0);
3784*4882a593Smuzhiyun if (!ret)
3785*4882a593Smuzhiyun id_priv->reuseaddr = 0;
3786*4882a593Smuzhiyun mutex_unlock(&lock);
3787*4882a593Smuzhiyun if (ret)
3788*4882a593Smuzhiyun goto err;
3789*4882a593Smuzhiyun }
3790*4882a593Smuzhiyun
3791*4882a593Smuzhiyun id_priv->backlog = backlog;
3792*4882a593Smuzhiyun if (id_priv->cma_dev) {
3793*4882a593Smuzhiyun if (rdma_cap_ib_cm(id->device, 1)) {
3794*4882a593Smuzhiyun ret = cma_ib_listen(id_priv);
3795*4882a593Smuzhiyun if (ret)
3796*4882a593Smuzhiyun goto err;
3797*4882a593Smuzhiyun } else if (rdma_cap_iw_cm(id->device, 1)) {
3798*4882a593Smuzhiyun ret = cma_iw_listen(id_priv, backlog);
3799*4882a593Smuzhiyun if (ret)
3800*4882a593Smuzhiyun goto err;
3801*4882a593Smuzhiyun } else {
3802*4882a593Smuzhiyun ret = -ENOSYS;
3803*4882a593Smuzhiyun goto err;
3804*4882a593Smuzhiyun }
3805*4882a593Smuzhiyun } else {
3806*4882a593Smuzhiyun ret = cma_listen_on_all(id_priv);
3807*4882a593Smuzhiyun if (ret)
3808*4882a593Smuzhiyun goto err;
3809*4882a593Smuzhiyun }
3810*4882a593Smuzhiyun
3811*4882a593Smuzhiyun return 0;
3812*4882a593Smuzhiyun err:
3813*4882a593Smuzhiyun id_priv->backlog = 0;
3814*4882a593Smuzhiyun /*
3815*4882a593Smuzhiyun * All the failure paths that lead here will not allow the req_handler's
3816*4882a593Smuzhiyun * to have run.
3817*4882a593Smuzhiyun */
3818*4882a593Smuzhiyun cma_comp_exch(id_priv, RDMA_CM_LISTEN, RDMA_CM_ADDR_BOUND);
3819*4882a593Smuzhiyun return ret;
3820*4882a593Smuzhiyun }
3821*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_listen);
3822*4882a593Smuzhiyun
rdma_bind_addr(struct rdma_cm_id * id,struct sockaddr * addr)3823*4882a593Smuzhiyun int rdma_bind_addr(struct rdma_cm_id *id, struct sockaddr *addr)
3824*4882a593Smuzhiyun {
3825*4882a593Smuzhiyun struct rdma_id_private *id_priv;
3826*4882a593Smuzhiyun int ret;
3827*4882a593Smuzhiyun struct sockaddr *daddr;
3828*4882a593Smuzhiyun
3829*4882a593Smuzhiyun if (addr->sa_family != AF_INET && addr->sa_family != AF_INET6 &&
3830*4882a593Smuzhiyun addr->sa_family != AF_IB)
3831*4882a593Smuzhiyun return -EAFNOSUPPORT;
3832*4882a593Smuzhiyun
3833*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
3834*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_IDLE, RDMA_CM_ADDR_BOUND))
3835*4882a593Smuzhiyun return -EINVAL;
3836*4882a593Smuzhiyun
3837*4882a593Smuzhiyun ret = cma_check_linklocal(&id->route.addr.dev_addr, addr);
3838*4882a593Smuzhiyun if (ret)
3839*4882a593Smuzhiyun goto err1;
3840*4882a593Smuzhiyun
3841*4882a593Smuzhiyun memcpy(cma_src_addr(id_priv), addr, rdma_addr_size(addr));
3842*4882a593Smuzhiyun if (!cma_any_addr(addr)) {
3843*4882a593Smuzhiyun ret = cma_translate_addr(addr, &id->route.addr.dev_addr);
3844*4882a593Smuzhiyun if (ret)
3845*4882a593Smuzhiyun goto err1;
3846*4882a593Smuzhiyun
3847*4882a593Smuzhiyun ret = cma_acquire_dev_by_src_ip(id_priv);
3848*4882a593Smuzhiyun if (ret)
3849*4882a593Smuzhiyun goto err1;
3850*4882a593Smuzhiyun }
3851*4882a593Smuzhiyun
3852*4882a593Smuzhiyun if (!(id_priv->options & (1 << CMA_OPTION_AFONLY))) {
3853*4882a593Smuzhiyun if (addr->sa_family == AF_INET)
3854*4882a593Smuzhiyun id_priv->afonly = 1;
3855*4882a593Smuzhiyun #if IS_ENABLED(CONFIG_IPV6)
3856*4882a593Smuzhiyun else if (addr->sa_family == AF_INET6) {
3857*4882a593Smuzhiyun struct net *net = id_priv->id.route.addr.dev_addr.net;
3858*4882a593Smuzhiyun
3859*4882a593Smuzhiyun id_priv->afonly = net->ipv6.sysctl.bindv6only;
3860*4882a593Smuzhiyun }
3861*4882a593Smuzhiyun #endif
3862*4882a593Smuzhiyun }
3863*4882a593Smuzhiyun daddr = cma_dst_addr(id_priv);
3864*4882a593Smuzhiyun daddr->sa_family = addr->sa_family;
3865*4882a593Smuzhiyun
3866*4882a593Smuzhiyun ret = cma_get_port(id_priv);
3867*4882a593Smuzhiyun if (ret)
3868*4882a593Smuzhiyun goto err2;
3869*4882a593Smuzhiyun
3870*4882a593Smuzhiyun if (!cma_any_addr(addr))
3871*4882a593Smuzhiyun rdma_restrack_add(&id_priv->res);
3872*4882a593Smuzhiyun return 0;
3873*4882a593Smuzhiyun err2:
3874*4882a593Smuzhiyun if (id_priv->cma_dev)
3875*4882a593Smuzhiyun cma_release_dev(id_priv);
3876*4882a593Smuzhiyun err1:
3877*4882a593Smuzhiyun cma_comp_exch(id_priv, RDMA_CM_ADDR_BOUND, RDMA_CM_IDLE);
3878*4882a593Smuzhiyun return ret;
3879*4882a593Smuzhiyun }
3880*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_bind_addr);
3881*4882a593Smuzhiyun
cma_format_hdr(void * hdr,struct rdma_id_private * id_priv)3882*4882a593Smuzhiyun static int cma_format_hdr(void *hdr, struct rdma_id_private *id_priv)
3883*4882a593Smuzhiyun {
3884*4882a593Smuzhiyun struct cma_hdr *cma_hdr;
3885*4882a593Smuzhiyun
3886*4882a593Smuzhiyun cma_hdr = hdr;
3887*4882a593Smuzhiyun cma_hdr->cma_version = CMA_VERSION;
3888*4882a593Smuzhiyun if (cma_family(id_priv) == AF_INET) {
3889*4882a593Smuzhiyun struct sockaddr_in *src4, *dst4;
3890*4882a593Smuzhiyun
3891*4882a593Smuzhiyun src4 = (struct sockaddr_in *) cma_src_addr(id_priv);
3892*4882a593Smuzhiyun dst4 = (struct sockaddr_in *) cma_dst_addr(id_priv);
3893*4882a593Smuzhiyun
3894*4882a593Smuzhiyun cma_set_ip_ver(cma_hdr, 4);
3895*4882a593Smuzhiyun cma_hdr->src_addr.ip4.addr = src4->sin_addr.s_addr;
3896*4882a593Smuzhiyun cma_hdr->dst_addr.ip4.addr = dst4->sin_addr.s_addr;
3897*4882a593Smuzhiyun cma_hdr->port = src4->sin_port;
3898*4882a593Smuzhiyun } else if (cma_family(id_priv) == AF_INET6) {
3899*4882a593Smuzhiyun struct sockaddr_in6 *src6, *dst6;
3900*4882a593Smuzhiyun
3901*4882a593Smuzhiyun src6 = (struct sockaddr_in6 *) cma_src_addr(id_priv);
3902*4882a593Smuzhiyun dst6 = (struct sockaddr_in6 *) cma_dst_addr(id_priv);
3903*4882a593Smuzhiyun
3904*4882a593Smuzhiyun cma_set_ip_ver(cma_hdr, 6);
3905*4882a593Smuzhiyun cma_hdr->src_addr.ip6 = src6->sin6_addr;
3906*4882a593Smuzhiyun cma_hdr->dst_addr.ip6 = dst6->sin6_addr;
3907*4882a593Smuzhiyun cma_hdr->port = src6->sin6_port;
3908*4882a593Smuzhiyun }
3909*4882a593Smuzhiyun return 0;
3910*4882a593Smuzhiyun }
3911*4882a593Smuzhiyun
cma_sidr_rep_handler(struct ib_cm_id * cm_id,const struct ib_cm_event * ib_event)3912*4882a593Smuzhiyun static int cma_sidr_rep_handler(struct ib_cm_id *cm_id,
3913*4882a593Smuzhiyun const struct ib_cm_event *ib_event)
3914*4882a593Smuzhiyun {
3915*4882a593Smuzhiyun struct rdma_id_private *id_priv = cm_id->context;
3916*4882a593Smuzhiyun struct rdma_cm_event event = {};
3917*4882a593Smuzhiyun const struct ib_cm_sidr_rep_event_param *rep =
3918*4882a593Smuzhiyun &ib_event->param.sidr_rep_rcvd;
3919*4882a593Smuzhiyun int ret;
3920*4882a593Smuzhiyun
3921*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
3922*4882a593Smuzhiyun if (READ_ONCE(id_priv->state) != RDMA_CM_CONNECT)
3923*4882a593Smuzhiyun goto out;
3924*4882a593Smuzhiyun
3925*4882a593Smuzhiyun switch (ib_event->event) {
3926*4882a593Smuzhiyun case IB_CM_SIDR_REQ_ERROR:
3927*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_UNREACHABLE;
3928*4882a593Smuzhiyun event.status = -ETIMEDOUT;
3929*4882a593Smuzhiyun break;
3930*4882a593Smuzhiyun case IB_CM_SIDR_REP_RECEIVED:
3931*4882a593Smuzhiyun event.param.ud.private_data = ib_event->private_data;
3932*4882a593Smuzhiyun event.param.ud.private_data_len = IB_CM_SIDR_REP_PRIVATE_DATA_SIZE;
3933*4882a593Smuzhiyun if (rep->status != IB_SIDR_SUCCESS) {
3934*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_UNREACHABLE;
3935*4882a593Smuzhiyun event.status = ib_event->param.sidr_rep_rcvd.status;
3936*4882a593Smuzhiyun pr_debug_ratelimited("RDMA CM: UNREACHABLE: bad SIDR reply. status %d\n",
3937*4882a593Smuzhiyun event.status);
3938*4882a593Smuzhiyun break;
3939*4882a593Smuzhiyun }
3940*4882a593Smuzhiyun ret = cma_set_qkey(id_priv, rep->qkey);
3941*4882a593Smuzhiyun if (ret) {
3942*4882a593Smuzhiyun pr_debug_ratelimited("RDMA CM: ADDR_ERROR: failed to set qkey. status %d\n", ret);
3943*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_ADDR_ERROR;
3944*4882a593Smuzhiyun event.status = ret;
3945*4882a593Smuzhiyun break;
3946*4882a593Smuzhiyun }
3947*4882a593Smuzhiyun ib_init_ah_attr_from_path(id_priv->id.device,
3948*4882a593Smuzhiyun id_priv->id.port_num,
3949*4882a593Smuzhiyun id_priv->id.route.path_rec,
3950*4882a593Smuzhiyun &event.param.ud.ah_attr,
3951*4882a593Smuzhiyun rep->sgid_attr);
3952*4882a593Smuzhiyun event.param.ud.qp_num = rep->qpn;
3953*4882a593Smuzhiyun event.param.ud.qkey = rep->qkey;
3954*4882a593Smuzhiyun event.event = RDMA_CM_EVENT_ESTABLISHED;
3955*4882a593Smuzhiyun event.status = 0;
3956*4882a593Smuzhiyun break;
3957*4882a593Smuzhiyun default:
3958*4882a593Smuzhiyun pr_err("RDMA CMA: unexpected IB CM event: %d\n",
3959*4882a593Smuzhiyun ib_event->event);
3960*4882a593Smuzhiyun goto out;
3961*4882a593Smuzhiyun }
3962*4882a593Smuzhiyun
3963*4882a593Smuzhiyun ret = cma_cm_event_handler(id_priv, &event);
3964*4882a593Smuzhiyun
3965*4882a593Smuzhiyun rdma_destroy_ah_attr(&event.param.ud.ah_attr);
3966*4882a593Smuzhiyun if (ret) {
3967*4882a593Smuzhiyun /* Destroy the CM ID by returning a non-zero value. */
3968*4882a593Smuzhiyun id_priv->cm_id.ib = NULL;
3969*4882a593Smuzhiyun destroy_id_handler_unlock(id_priv);
3970*4882a593Smuzhiyun return ret;
3971*4882a593Smuzhiyun }
3972*4882a593Smuzhiyun out:
3973*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
3974*4882a593Smuzhiyun return 0;
3975*4882a593Smuzhiyun }
3976*4882a593Smuzhiyun
cma_resolve_ib_udp(struct rdma_id_private * id_priv,struct rdma_conn_param * conn_param)3977*4882a593Smuzhiyun static int cma_resolve_ib_udp(struct rdma_id_private *id_priv,
3978*4882a593Smuzhiyun struct rdma_conn_param *conn_param)
3979*4882a593Smuzhiyun {
3980*4882a593Smuzhiyun struct ib_cm_sidr_req_param req;
3981*4882a593Smuzhiyun struct ib_cm_id *id;
3982*4882a593Smuzhiyun void *private_data;
3983*4882a593Smuzhiyun u8 offset;
3984*4882a593Smuzhiyun int ret;
3985*4882a593Smuzhiyun
3986*4882a593Smuzhiyun memset(&req, 0, sizeof req);
3987*4882a593Smuzhiyun offset = cma_user_data_offset(id_priv);
3988*4882a593Smuzhiyun req.private_data_len = offset + conn_param->private_data_len;
3989*4882a593Smuzhiyun if (req.private_data_len < conn_param->private_data_len)
3990*4882a593Smuzhiyun return -EINVAL;
3991*4882a593Smuzhiyun
3992*4882a593Smuzhiyun if (req.private_data_len) {
3993*4882a593Smuzhiyun private_data = kzalloc(req.private_data_len, GFP_ATOMIC);
3994*4882a593Smuzhiyun if (!private_data)
3995*4882a593Smuzhiyun return -ENOMEM;
3996*4882a593Smuzhiyun } else {
3997*4882a593Smuzhiyun private_data = NULL;
3998*4882a593Smuzhiyun }
3999*4882a593Smuzhiyun
4000*4882a593Smuzhiyun if (conn_param->private_data && conn_param->private_data_len)
4001*4882a593Smuzhiyun memcpy(private_data + offset, conn_param->private_data,
4002*4882a593Smuzhiyun conn_param->private_data_len);
4003*4882a593Smuzhiyun
4004*4882a593Smuzhiyun if (private_data) {
4005*4882a593Smuzhiyun ret = cma_format_hdr(private_data, id_priv);
4006*4882a593Smuzhiyun if (ret)
4007*4882a593Smuzhiyun goto out;
4008*4882a593Smuzhiyun req.private_data = private_data;
4009*4882a593Smuzhiyun }
4010*4882a593Smuzhiyun
4011*4882a593Smuzhiyun id = ib_create_cm_id(id_priv->id.device, cma_sidr_rep_handler,
4012*4882a593Smuzhiyun id_priv);
4013*4882a593Smuzhiyun if (IS_ERR(id)) {
4014*4882a593Smuzhiyun ret = PTR_ERR(id);
4015*4882a593Smuzhiyun goto out;
4016*4882a593Smuzhiyun }
4017*4882a593Smuzhiyun id_priv->cm_id.ib = id;
4018*4882a593Smuzhiyun
4019*4882a593Smuzhiyun req.path = id_priv->id.route.path_rec;
4020*4882a593Smuzhiyun req.sgid_attr = id_priv->id.route.addr.dev_addr.sgid_attr;
4021*4882a593Smuzhiyun req.service_id = rdma_get_service_id(&id_priv->id, cma_dst_addr(id_priv));
4022*4882a593Smuzhiyun req.timeout_ms = 1 << (CMA_CM_RESPONSE_TIMEOUT - 8);
4023*4882a593Smuzhiyun req.max_cm_retries = CMA_MAX_CM_RETRIES;
4024*4882a593Smuzhiyun
4025*4882a593Smuzhiyun trace_cm_send_sidr_req(id_priv);
4026*4882a593Smuzhiyun ret = ib_send_cm_sidr_req(id_priv->cm_id.ib, &req);
4027*4882a593Smuzhiyun if (ret) {
4028*4882a593Smuzhiyun ib_destroy_cm_id(id_priv->cm_id.ib);
4029*4882a593Smuzhiyun id_priv->cm_id.ib = NULL;
4030*4882a593Smuzhiyun }
4031*4882a593Smuzhiyun out:
4032*4882a593Smuzhiyun kfree(private_data);
4033*4882a593Smuzhiyun return ret;
4034*4882a593Smuzhiyun }
4035*4882a593Smuzhiyun
cma_connect_ib(struct rdma_id_private * id_priv,struct rdma_conn_param * conn_param)4036*4882a593Smuzhiyun static int cma_connect_ib(struct rdma_id_private *id_priv,
4037*4882a593Smuzhiyun struct rdma_conn_param *conn_param)
4038*4882a593Smuzhiyun {
4039*4882a593Smuzhiyun struct ib_cm_req_param req;
4040*4882a593Smuzhiyun struct rdma_route *route;
4041*4882a593Smuzhiyun void *private_data;
4042*4882a593Smuzhiyun struct ib_cm_id *id;
4043*4882a593Smuzhiyun u8 offset;
4044*4882a593Smuzhiyun int ret;
4045*4882a593Smuzhiyun
4046*4882a593Smuzhiyun memset(&req, 0, sizeof req);
4047*4882a593Smuzhiyun offset = cma_user_data_offset(id_priv);
4048*4882a593Smuzhiyun req.private_data_len = offset + conn_param->private_data_len;
4049*4882a593Smuzhiyun if (req.private_data_len < conn_param->private_data_len)
4050*4882a593Smuzhiyun return -EINVAL;
4051*4882a593Smuzhiyun
4052*4882a593Smuzhiyun if (req.private_data_len) {
4053*4882a593Smuzhiyun private_data = kzalloc(req.private_data_len, GFP_ATOMIC);
4054*4882a593Smuzhiyun if (!private_data)
4055*4882a593Smuzhiyun return -ENOMEM;
4056*4882a593Smuzhiyun } else {
4057*4882a593Smuzhiyun private_data = NULL;
4058*4882a593Smuzhiyun }
4059*4882a593Smuzhiyun
4060*4882a593Smuzhiyun if (conn_param->private_data && conn_param->private_data_len)
4061*4882a593Smuzhiyun memcpy(private_data + offset, conn_param->private_data,
4062*4882a593Smuzhiyun conn_param->private_data_len);
4063*4882a593Smuzhiyun
4064*4882a593Smuzhiyun id = ib_create_cm_id(id_priv->id.device, cma_ib_handler, id_priv);
4065*4882a593Smuzhiyun if (IS_ERR(id)) {
4066*4882a593Smuzhiyun ret = PTR_ERR(id);
4067*4882a593Smuzhiyun goto out;
4068*4882a593Smuzhiyun }
4069*4882a593Smuzhiyun id_priv->cm_id.ib = id;
4070*4882a593Smuzhiyun
4071*4882a593Smuzhiyun route = &id_priv->id.route;
4072*4882a593Smuzhiyun if (private_data) {
4073*4882a593Smuzhiyun ret = cma_format_hdr(private_data, id_priv);
4074*4882a593Smuzhiyun if (ret)
4075*4882a593Smuzhiyun goto out;
4076*4882a593Smuzhiyun req.private_data = private_data;
4077*4882a593Smuzhiyun }
4078*4882a593Smuzhiyun
4079*4882a593Smuzhiyun req.primary_path = &route->path_rec[0];
4080*4882a593Smuzhiyun if (route->num_paths == 2)
4081*4882a593Smuzhiyun req.alternate_path = &route->path_rec[1];
4082*4882a593Smuzhiyun
4083*4882a593Smuzhiyun req.ppath_sgid_attr = id_priv->id.route.addr.dev_addr.sgid_attr;
4084*4882a593Smuzhiyun /* Alternate path SGID attribute currently unsupported */
4085*4882a593Smuzhiyun req.service_id = rdma_get_service_id(&id_priv->id, cma_dst_addr(id_priv));
4086*4882a593Smuzhiyun req.qp_num = id_priv->qp_num;
4087*4882a593Smuzhiyun req.qp_type = id_priv->id.qp_type;
4088*4882a593Smuzhiyun req.starting_psn = id_priv->seq_num;
4089*4882a593Smuzhiyun req.responder_resources = conn_param->responder_resources;
4090*4882a593Smuzhiyun req.initiator_depth = conn_param->initiator_depth;
4091*4882a593Smuzhiyun req.flow_control = conn_param->flow_control;
4092*4882a593Smuzhiyun req.retry_count = min_t(u8, 7, conn_param->retry_count);
4093*4882a593Smuzhiyun req.rnr_retry_count = min_t(u8, 7, conn_param->rnr_retry_count);
4094*4882a593Smuzhiyun req.remote_cm_response_timeout = CMA_CM_RESPONSE_TIMEOUT;
4095*4882a593Smuzhiyun req.local_cm_response_timeout = CMA_CM_RESPONSE_TIMEOUT;
4096*4882a593Smuzhiyun req.max_cm_retries = CMA_MAX_CM_RETRIES;
4097*4882a593Smuzhiyun req.srq = id_priv->srq ? 1 : 0;
4098*4882a593Smuzhiyun req.ece.vendor_id = id_priv->ece.vendor_id;
4099*4882a593Smuzhiyun req.ece.attr_mod = id_priv->ece.attr_mod;
4100*4882a593Smuzhiyun
4101*4882a593Smuzhiyun trace_cm_send_req(id_priv);
4102*4882a593Smuzhiyun ret = ib_send_cm_req(id_priv->cm_id.ib, &req);
4103*4882a593Smuzhiyun out:
4104*4882a593Smuzhiyun if (ret && !IS_ERR(id)) {
4105*4882a593Smuzhiyun ib_destroy_cm_id(id);
4106*4882a593Smuzhiyun id_priv->cm_id.ib = NULL;
4107*4882a593Smuzhiyun }
4108*4882a593Smuzhiyun
4109*4882a593Smuzhiyun kfree(private_data);
4110*4882a593Smuzhiyun return ret;
4111*4882a593Smuzhiyun }
4112*4882a593Smuzhiyun
cma_connect_iw(struct rdma_id_private * id_priv,struct rdma_conn_param * conn_param)4113*4882a593Smuzhiyun static int cma_connect_iw(struct rdma_id_private *id_priv,
4114*4882a593Smuzhiyun struct rdma_conn_param *conn_param)
4115*4882a593Smuzhiyun {
4116*4882a593Smuzhiyun struct iw_cm_id *cm_id;
4117*4882a593Smuzhiyun int ret;
4118*4882a593Smuzhiyun struct iw_cm_conn_param iw_param;
4119*4882a593Smuzhiyun
4120*4882a593Smuzhiyun cm_id = iw_create_cm_id(id_priv->id.device, cma_iw_handler, id_priv);
4121*4882a593Smuzhiyun if (IS_ERR(cm_id))
4122*4882a593Smuzhiyun return PTR_ERR(cm_id);
4123*4882a593Smuzhiyun
4124*4882a593Smuzhiyun mutex_lock(&id_priv->qp_mutex);
4125*4882a593Smuzhiyun cm_id->tos = id_priv->tos;
4126*4882a593Smuzhiyun cm_id->tos_set = id_priv->tos_set;
4127*4882a593Smuzhiyun mutex_unlock(&id_priv->qp_mutex);
4128*4882a593Smuzhiyun
4129*4882a593Smuzhiyun id_priv->cm_id.iw = cm_id;
4130*4882a593Smuzhiyun
4131*4882a593Smuzhiyun memcpy(&cm_id->local_addr, cma_src_addr(id_priv),
4132*4882a593Smuzhiyun rdma_addr_size(cma_src_addr(id_priv)));
4133*4882a593Smuzhiyun memcpy(&cm_id->remote_addr, cma_dst_addr(id_priv),
4134*4882a593Smuzhiyun rdma_addr_size(cma_dst_addr(id_priv)));
4135*4882a593Smuzhiyun
4136*4882a593Smuzhiyun ret = cma_modify_qp_rtr(id_priv, conn_param);
4137*4882a593Smuzhiyun if (ret)
4138*4882a593Smuzhiyun goto out;
4139*4882a593Smuzhiyun
4140*4882a593Smuzhiyun if (conn_param) {
4141*4882a593Smuzhiyun iw_param.ord = conn_param->initiator_depth;
4142*4882a593Smuzhiyun iw_param.ird = conn_param->responder_resources;
4143*4882a593Smuzhiyun iw_param.private_data = conn_param->private_data;
4144*4882a593Smuzhiyun iw_param.private_data_len = conn_param->private_data_len;
4145*4882a593Smuzhiyun iw_param.qpn = id_priv->id.qp ? id_priv->qp_num : conn_param->qp_num;
4146*4882a593Smuzhiyun } else {
4147*4882a593Smuzhiyun memset(&iw_param, 0, sizeof iw_param);
4148*4882a593Smuzhiyun iw_param.qpn = id_priv->qp_num;
4149*4882a593Smuzhiyun }
4150*4882a593Smuzhiyun ret = iw_cm_connect(cm_id, &iw_param);
4151*4882a593Smuzhiyun out:
4152*4882a593Smuzhiyun if (ret) {
4153*4882a593Smuzhiyun iw_destroy_cm_id(cm_id);
4154*4882a593Smuzhiyun id_priv->cm_id.iw = NULL;
4155*4882a593Smuzhiyun }
4156*4882a593Smuzhiyun return ret;
4157*4882a593Smuzhiyun }
4158*4882a593Smuzhiyun
4159*4882a593Smuzhiyun /**
4160*4882a593Smuzhiyun * rdma_connect_locked - Initiate an active connection request.
4161*4882a593Smuzhiyun * @id: Connection identifier to connect.
4162*4882a593Smuzhiyun * @conn_param: Connection information used for connected QPs.
4163*4882a593Smuzhiyun *
4164*4882a593Smuzhiyun * Same as rdma_connect() but can only be called from the
4165*4882a593Smuzhiyun * RDMA_CM_EVENT_ROUTE_RESOLVED handler callback.
4166*4882a593Smuzhiyun */
rdma_connect_locked(struct rdma_cm_id * id,struct rdma_conn_param * conn_param)4167*4882a593Smuzhiyun int rdma_connect_locked(struct rdma_cm_id *id,
4168*4882a593Smuzhiyun struct rdma_conn_param *conn_param)
4169*4882a593Smuzhiyun {
4170*4882a593Smuzhiyun struct rdma_id_private *id_priv =
4171*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
4172*4882a593Smuzhiyun int ret;
4173*4882a593Smuzhiyun
4174*4882a593Smuzhiyun if (!cma_comp_exch(id_priv, RDMA_CM_ROUTE_RESOLVED, RDMA_CM_CONNECT))
4175*4882a593Smuzhiyun return -EINVAL;
4176*4882a593Smuzhiyun
4177*4882a593Smuzhiyun if (!id->qp) {
4178*4882a593Smuzhiyun id_priv->qp_num = conn_param->qp_num;
4179*4882a593Smuzhiyun id_priv->srq = conn_param->srq;
4180*4882a593Smuzhiyun }
4181*4882a593Smuzhiyun
4182*4882a593Smuzhiyun if (rdma_cap_ib_cm(id->device, id->port_num)) {
4183*4882a593Smuzhiyun if (id->qp_type == IB_QPT_UD)
4184*4882a593Smuzhiyun ret = cma_resolve_ib_udp(id_priv, conn_param);
4185*4882a593Smuzhiyun else
4186*4882a593Smuzhiyun ret = cma_connect_ib(id_priv, conn_param);
4187*4882a593Smuzhiyun } else if (rdma_cap_iw_cm(id->device, id->port_num))
4188*4882a593Smuzhiyun ret = cma_connect_iw(id_priv, conn_param);
4189*4882a593Smuzhiyun else
4190*4882a593Smuzhiyun ret = -ENOSYS;
4191*4882a593Smuzhiyun if (ret)
4192*4882a593Smuzhiyun goto err_state;
4193*4882a593Smuzhiyun return 0;
4194*4882a593Smuzhiyun err_state:
4195*4882a593Smuzhiyun cma_comp_exch(id_priv, RDMA_CM_CONNECT, RDMA_CM_ROUTE_RESOLVED);
4196*4882a593Smuzhiyun return ret;
4197*4882a593Smuzhiyun }
4198*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_connect_locked);
4199*4882a593Smuzhiyun
4200*4882a593Smuzhiyun /**
4201*4882a593Smuzhiyun * rdma_connect - Initiate an active connection request.
4202*4882a593Smuzhiyun * @id: Connection identifier to connect.
4203*4882a593Smuzhiyun * @conn_param: Connection information used for connected QPs.
4204*4882a593Smuzhiyun *
4205*4882a593Smuzhiyun * Users must have resolved a route for the rdma_cm_id to connect with by having
4206*4882a593Smuzhiyun * called rdma_resolve_route before calling this routine.
4207*4882a593Smuzhiyun *
4208*4882a593Smuzhiyun * This call will either connect to a remote QP or obtain remote QP information
4209*4882a593Smuzhiyun * for unconnected rdma_cm_id's. The actual operation is based on the
4210*4882a593Smuzhiyun * rdma_cm_id's port space.
4211*4882a593Smuzhiyun */
rdma_connect(struct rdma_cm_id * id,struct rdma_conn_param * conn_param)4212*4882a593Smuzhiyun int rdma_connect(struct rdma_cm_id *id, struct rdma_conn_param *conn_param)
4213*4882a593Smuzhiyun {
4214*4882a593Smuzhiyun struct rdma_id_private *id_priv =
4215*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
4216*4882a593Smuzhiyun int ret;
4217*4882a593Smuzhiyun
4218*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
4219*4882a593Smuzhiyun ret = rdma_connect_locked(id, conn_param);
4220*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
4221*4882a593Smuzhiyun return ret;
4222*4882a593Smuzhiyun }
4223*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_connect);
4224*4882a593Smuzhiyun
4225*4882a593Smuzhiyun /**
4226*4882a593Smuzhiyun * rdma_connect_ece - Initiate an active connection request with ECE data.
4227*4882a593Smuzhiyun * @id: Connection identifier to connect.
4228*4882a593Smuzhiyun * @conn_param: Connection information used for connected QPs.
4229*4882a593Smuzhiyun * @ece: ECE parameters
4230*4882a593Smuzhiyun *
4231*4882a593Smuzhiyun * See rdma_connect() explanation.
4232*4882a593Smuzhiyun */
rdma_connect_ece(struct rdma_cm_id * id,struct rdma_conn_param * conn_param,struct rdma_ucm_ece * ece)4233*4882a593Smuzhiyun int rdma_connect_ece(struct rdma_cm_id *id, struct rdma_conn_param *conn_param,
4234*4882a593Smuzhiyun struct rdma_ucm_ece *ece)
4235*4882a593Smuzhiyun {
4236*4882a593Smuzhiyun struct rdma_id_private *id_priv =
4237*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
4238*4882a593Smuzhiyun
4239*4882a593Smuzhiyun id_priv->ece.vendor_id = ece->vendor_id;
4240*4882a593Smuzhiyun id_priv->ece.attr_mod = ece->attr_mod;
4241*4882a593Smuzhiyun
4242*4882a593Smuzhiyun return rdma_connect(id, conn_param);
4243*4882a593Smuzhiyun }
4244*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_connect_ece);
4245*4882a593Smuzhiyun
cma_accept_ib(struct rdma_id_private * id_priv,struct rdma_conn_param * conn_param)4246*4882a593Smuzhiyun static int cma_accept_ib(struct rdma_id_private *id_priv,
4247*4882a593Smuzhiyun struct rdma_conn_param *conn_param)
4248*4882a593Smuzhiyun {
4249*4882a593Smuzhiyun struct ib_cm_rep_param rep;
4250*4882a593Smuzhiyun int ret;
4251*4882a593Smuzhiyun
4252*4882a593Smuzhiyun ret = cma_modify_qp_rtr(id_priv, conn_param);
4253*4882a593Smuzhiyun if (ret)
4254*4882a593Smuzhiyun goto out;
4255*4882a593Smuzhiyun
4256*4882a593Smuzhiyun ret = cma_modify_qp_rts(id_priv, conn_param);
4257*4882a593Smuzhiyun if (ret)
4258*4882a593Smuzhiyun goto out;
4259*4882a593Smuzhiyun
4260*4882a593Smuzhiyun memset(&rep, 0, sizeof rep);
4261*4882a593Smuzhiyun rep.qp_num = id_priv->qp_num;
4262*4882a593Smuzhiyun rep.starting_psn = id_priv->seq_num;
4263*4882a593Smuzhiyun rep.private_data = conn_param->private_data;
4264*4882a593Smuzhiyun rep.private_data_len = conn_param->private_data_len;
4265*4882a593Smuzhiyun rep.responder_resources = conn_param->responder_resources;
4266*4882a593Smuzhiyun rep.initiator_depth = conn_param->initiator_depth;
4267*4882a593Smuzhiyun rep.failover_accepted = 0;
4268*4882a593Smuzhiyun rep.flow_control = conn_param->flow_control;
4269*4882a593Smuzhiyun rep.rnr_retry_count = min_t(u8, 7, conn_param->rnr_retry_count);
4270*4882a593Smuzhiyun rep.srq = id_priv->srq ? 1 : 0;
4271*4882a593Smuzhiyun rep.ece.vendor_id = id_priv->ece.vendor_id;
4272*4882a593Smuzhiyun rep.ece.attr_mod = id_priv->ece.attr_mod;
4273*4882a593Smuzhiyun
4274*4882a593Smuzhiyun trace_cm_send_rep(id_priv);
4275*4882a593Smuzhiyun ret = ib_send_cm_rep(id_priv->cm_id.ib, &rep);
4276*4882a593Smuzhiyun out:
4277*4882a593Smuzhiyun return ret;
4278*4882a593Smuzhiyun }
4279*4882a593Smuzhiyun
cma_accept_iw(struct rdma_id_private * id_priv,struct rdma_conn_param * conn_param)4280*4882a593Smuzhiyun static int cma_accept_iw(struct rdma_id_private *id_priv,
4281*4882a593Smuzhiyun struct rdma_conn_param *conn_param)
4282*4882a593Smuzhiyun {
4283*4882a593Smuzhiyun struct iw_cm_conn_param iw_param;
4284*4882a593Smuzhiyun int ret;
4285*4882a593Smuzhiyun
4286*4882a593Smuzhiyun if (!conn_param)
4287*4882a593Smuzhiyun return -EINVAL;
4288*4882a593Smuzhiyun
4289*4882a593Smuzhiyun ret = cma_modify_qp_rtr(id_priv, conn_param);
4290*4882a593Smuzhiyun if (ret)
4291*4882a593Smuzhiyun return ret;
4292*4882a593Smuzhiyun
4293*4882a593Smuzhiyun iw_param.ord = conn_param->initiator_depth;
4294*4882a593Smuzhiyun iw_param.ird = conn_param->responder_resources;
4295*4882a593Smuzhiyun iw_param.private_data = conn_param->private_data;
4296*4882a593Smuzhiyun iw_param.private_data_len = conn_param->private_data_len;
4297*4882a593Smuzhiyun if (id_priv->id.qp) {
4298*4882a593Smuzhiyun iw_param.qpn = id_priv->qp_num;
4299*4882a593Smuzhiyun } else
4300*4882a593Smuzhiyun iw_param.qpn = conn_param->qp_num;
4301*4882a593Smuzhiyun
4302*4882a593Smuzhiyun return iw_cm_accept(id_priv->cm_id.iw, &iw_param);
4303*4882a593Smuzhiyun }
4304*4882a593Smuzhiyun
/*
 * Send a SIDR reply with the given @status and private data.
 *
 * Only for IB_SIDR_SUCCESS is the qkey set on the id (via cma_set_qkey())
 * and the QP number, qkey and ECE data included in the reply.  Returns 0,
 * the cma_set_qkey() error, or the ib_send_cm_sidr_rep() result.
 */
static int cma_send_sidr_rep(struct rdma_id_private *id_priv,
			     enum ib_cm_sidr_status status, u32 qkey,
			     const void *private_data, int private_data_len)
{
	struct ib_cm_sidr_rep_param rep;

	memset(&rep, 0, sizeof(rep));
	rep.status = status;
	rep.private_data = private_data;
	rep.private_data_len = private_data_len;

	if (status == IB_SIDR_SUCCESS) {
		int ret = cma_set_qkey(id_priv, qkey);

		if (ret)
			return ret;

		rep.qp_num = id_priv->qp_num;
		rep.qkey = id_priv->qkey;
		rep.ece.vendor_id = id_priv->ece.vendor_id;
		rep.ece.attr_mod = id_priv->ece.attr_mod;
	}

	trace_cm_send_sidr_rep(id_priv);
	return ib_send_cm_sidr_rep(id_priv->cm_id.ib, &rep);
}
4331*4882a593Smuzhiyun
4332*4882a593Smuzhiyun /**
4333*4882a593Smuzhiyun * rdma_accept - Called to accept a connection request or response.
4334*4882a593Smuzhiyun * @id: Connection identifier associated with the request.
4335*4882a593Smuzhiyun * @conn_param: Information needed to establish the connection. This must be
4336*4882a593Smuzhiyun * provided if accepting a connection request. If accepting a connection
4337*4882a593Smuzhiyun * response, this parameter must be NULL.
4338*4882a593Smuzhiyun *
4339*4882a593Smuzhiyun * Typically, this routine is only called by the listener to accept a connection
4340*4882a593Smuzhiyun * request. It must also be called on the active side of a connection if the
4341*4882a593Smuzhiyun * user is performing their own QP transitions.
4342*4882a593Smuzhiyun *
4343*4882a593Smuzhiyun * In the case of error, a reject message is sent to the remote side and the
4344*4882a593Smuzhiyun * state of the qp associated with the id is modified to error, such that any
4345*4882a593Smuzhiyun * previously posted receive buffers would be flushed.
4346*4882a593Smuzhiyun *
4347*4882a593Smuzhiyun * This function is for use by kernel ULPs and must be called from under the
4348*4882a593Smuzhiyun * handler callback.
4349*4882a593Smuzhiyun */
rdma_accept(struct rdma_cm_id * id,struct rdma_conn_param * conn_param)4350*4882a593Smuzhiyun int rdma_accept(struct rdma_cm_id *id, struct rdma_conn_param *conn_param)
4351*4882a593Smuzhiyun {
4352*4882a593Smuzhiyun struct rdma_id_private *id_priv =
4353*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
4354*4882a593Smuzhiyun int ret;
4355*4882a593Smuzhiyun
4356*4882a593Smuzhiyun lockdep_assert_held(&id_priv->handler_mutex);
4357*4882a593Smuzhiyun
4358*4882a593Smuzhiyun if (READ_ONCE(id_priv->state) != RDMA_CM_CONNECT)
4359*4882a593Smuzhiyun return -EINVAL;
4360*4882a593Smuzhiyun
4361*4882a593Smuzhiyun if (!id->qp && conn_param) {
4362*4882a593Smuzhiyun id_priv->qp_num = conn_param->qp_num;
4363*4882a593Smuzhiyun id_priv->srq = conn_param->srq;
4364*4882a593Smuzhiyun }
4365*4882a593Smuzhiyun
4366*4882a593Smuzhiyun if (rdma_cap_ib_cm(id->device, id->port_num)) {
4367*4882a593Smuzhiyun if (id->qp_type == IB_QPT_UD) {
4368*4882a593Smuzhiyun if (conn_param)
4369*4882a593Smuzhiyun ret = cma_send_sidr_rep(id_priv, IB_SIDR_SUCCESS,
4370*4882a593Smuzhiyun conn_param->qkey,
4371*4882a593Smuzhiyun conn_param->private_data,
4372*4882a593Smuzhiyun conn_param->private_data_len);
4373*4882a593Smuzhiyun else
4374*4882a593Smuzhiyun ret = cma_send_sidr_rep(id_priv, IB_SIDR_SUCCESS,
4375*4882a593Smuzhiyun 0, NULL, 0);
4376*4882a593Smuzhiyun } else {
4377*4882a593Smuzhiyun if (conn_param)
4378*4882a593Smuzhiyun ret = cma_accept_ib(id_priv, conn_param);
4379*4882a593Smuzhiyun else
4380*4882a593Smuzhiyun ret = cma_rep_recv(id_priv);
4381*4882a593Smuzhiyun }
4382*4882a593Smuzhiyun } else if (rdma_cap_iw_cm(id->device, id->port_num))
4383*4882a593Smuzhiyun ret = cma_accept_iw(id_priv, conn_param);
4384*4882a593Smuzhiyun else
4385*4882a593Smuzhiyun ret = -ENOSYS;
4386*4882a593Smuzhiyun
4387*4882a593Smuzhiyun if (ret)
4388*4882a593Smuzhiyun goto reject;
4389*4882a593Smuzhiyun
4390*4882a593Smuzhiyun return 0;
4391*4882a593Smuzhiyun reject:
4392*4882a593Smuzhiyun cma_modify_qp_err(id_priv);
4393*4882a593Smuzhiyun rdma_reject(id, NULL, 0, IB_CM_REJ_CONSUMER_DEFINED);
4394*4882a593Smuzhiyun return ret;
4395*4882a593Smuzhiyun }
4396*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_accept);
4397*4882a593Smuzhiyun
rdma_accept_ece(struct rdma_cm_id * id,struct rdma_conn_param * conn_param,struct rdma_ucm_ece * ece)4398*4882a593Smuzhiyun int rdma_accept_ece(struct rdma_cm_id *id, struct rdma_conn_param *conn_param,
4399*4882a593Smuzhiyun struct rdma_ucm_ece *ece)
4400*4882a593Smuzhiyun {
4401*4882a593Smuzhiyun struct rdma_id_private *id_priv =
4402*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
4403*4882a593Smuzhiyun
4404*4882a593Smuzhiyun id_priv->ece.vendor_id = ece->vendor_id;
4405*4882a593Smuzhiyun id_priv->ece.attr_mod = ece->attr_mod;
4406*4882a593Smuzhiyun
4407*4882a593Smuzhiyun return rdma_accept(id, conn_param);
4408*4882a593Smuzhiyun }
4409*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_accept_ece);
4410*4882a593Smuzhiyun
rdma_lock_handler(struct rdma_cm_id * id)4411*4882a593Smuzhiyun void rdma_lock_handler(struct rdma_cm_id *id)
4412*4882a593Smuzhiyun {
4413*4882a593Smuzhiyun struct rdma_id_private *id_priv =
4414*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
4415*4882a593Smuzhiyun
4416*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
4417*4882a593Smuzhiyun }
4418*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_lock_handler);
4419*4882a593Smuzhiyun
rdma_unlock_handler(struct rdma_cm_id * id)4420*4882a593Smuzhiyun void rdma_unlock_handler(struct rdma_cm_id *id)
4421*4882a593Smuzhiyun {
4422*4882a593Smuzhiyun struct rdma_id_private *id_priv =
4423*4882a593Smuzhiyun container_of(id, struct rdma_id_private, id);
4424*4882a593Smuzhiyun
4425*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
4426*4882a593Smuzhiyun }
4427*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_unlock_handler);
4428*4882a593Smuzhiyun
rdma_notify(struct rdma_cm_id * id,enum ib_event_type event)4429*4882a593Smuzhiyun int rdma_notify(struct rdma_cm_id *id, enum ib_event_type event)
4430*4882a593Smuzhiyun {
4431*4882a593Smuzhiyun struct rdma_id_private *id_priv;
4432*4882a593Smuzhiyun int ret;
4433*4882a593Smuzhiyun
4434*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
4435*4882a593Smuzhiyun if (!id_priv->cm_id.ib)
4436*4882a593Smuzhiyun return -EINVAL;
4437*4882a593Smuzhiyun
4438*4882a593Smuzhiyun switch (id->device->node_type) {
4439*4882a593Smuzhiyun case RDMA_NODE_IB_CA:
4440*4882a593Smuzhiyun ret = ib_cm_notify(id_priv->cm_id.ib, event);
4441*4882a593Smuzhiyun break;
4442*4882a593Smuzhiyun default:
4443*4882a593Smuzhiyun ret = 0;
4444*4882a593Smuzhiyun break;
4445*4882a593Smuzhiyun }
4446*4882a593Smuzhiyun return ret;
4447*4882a593Smuzhiyun }
4448*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_notify);
4449*4882a593Smuzhiyun
/*
 * Reject a connection or service-ID resolution request on @id.
 *
 * Returns -EINVAL when the private id has no cm_id.ib set, -ENOSYS when
 * the port supports neither the IB CM nor the iWARP CM, and otherwise the
 * result of the transport-specific reject call.
 */
int rdma_reject(struct rdma_cm_id *id, const void *private_data,
		u8 private_data_len, u8 reason)
{
	struct rdma_id_private *priv =
		container_of(id, struct rdma_id_private, id);

	if (!priv->cm_id.ib)
		return -EINVAL;

	if (rdma_cap_ib_cm(id->device, id->port_num)) {
		/* UD QPs answer with a SIDR reply instead of a REJ. */
		if (id->qp_type == IB_QPT_UD)
			return cma_send_sidr_rep(priv, IB_SIDR_REJECT, 0,
						 private_data,
						 private_data_len);

		trace_cm_send_rej(priv);
		return ib_send_cm_rej(priv->cm_id.ib, reason, NULL, 0,
				      private_data, private_data_len);
	}

	if (rdma_cap_iw_cm(id->device, id->port_num))
		return iw_cm_reject(priv->cm_id.iw, private_data,
				    private_data_len);

	return -ENOSYS;
}
EXPORT_SYMBOL(rdma_reject);
4478*4882a593Smuzhiyun
rdma_disconnect(struct rdma_cm_id * id)4479*4882a593Smuzhiyun int rdma_disconnect(struct rdma_cm_id *id)
4480*4882a593Smuzhiyun {
4481*4882a593Smuzhiyun struct rdma_id_private *id_priv;
4482*4882a593Smuzhiyun int ret;
4483*4882a593Smuzhiyun
4484*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
4485*4882a593Smuzhiyun if (!id_priv->cm_id.ib)
4486*4882a593Smuzhiyun return -EINVAL;
4487*4882a593Smuzhiyun
4488*4882a593Smuzhiyun if (rdma_cap_ib_cm(id->device, id->port_num)) {
4489*4882a593Smuzhiyun ret = cma_modify_qp_err(id_priv);
4490*4882a593Smuzhiyun if (ret)
4491*4882a593Smuzhiyun goto out;
4492*4882a593Smuzhiyun /* Initiate or respond to a disconnect. */
4493*4882a593Smuzhiyun trace_cm_disconnect(id_priv);
4494*4882a593Smuzhiyun if (ib_send_cm_dreq(id_priv->cm_id.ib, NULL, 0)) {
4495*4882a593Smuzhiyun if (!ib_send_cm_drep(id_priv->cm_id.ib, NULL, 0))
4496*4882a593Smuzhiyun trace_cm_sent_drep(id_priv);
4497*4882a593Smuzhiyun } else {
4498*4882a593Smuzhiyun trace_cm_sent_dreq(id_priv);
4499*4882a593Smuzhiyun }
4500*4882a593Smuzhiyun } else if (rdma_cap_iw_cm(id->device, id->port_num)) {
4501*4882a593Smuzhiyun ret = iw_cm_disconnect(id_priv->cm_id.iw, 0);
4502*4882a593Smuzhiyun } else
4503*4882a593Smuzhiyun ret = -EINVAL;
4504*4882a593Smuzhiyun
4505*4882a593Smuzhiyun out:
4506*4882a593Smuzhiyun return ret;
4507*4882a593Smuzhiyun }
4508*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_disconnect);
4509*4882a593Smuzhiyun
cma_make_mc_event(int status,struct rdma_id_private * id_priv,struct ib_sa_multicast * multicast,struct rdma_cm_event * event,struct cma_multicast * mc)4510*4882a593Smuzhiyun static void cma_make_mc_event(int status, struct rdma_id_private *id_priv,
4511*4882a593Smuzhiyun struct ib_sa_multicast *multicast,
4512*4882a593Smuzhiyun struct rdma_cm_event *event,
4513*4882a593Smuzhiyun struct cma_multicast *mc)
4514*4882a593Smuzhiyun {
4515*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr;
4516*4882a593Smuzhiyun enum ib_gid_type gid_type;
4517*4882a593Smuzhiyun struct net_device *ndev;
4518*4882a593Smuzhiyun
4519*4882a593Smuzhiyun if (!status)
4520*4882a593Smuzhiyun status = cma_set_qkey(id_priv, be32_to_cpu(multicast->rec.qkey));
4521*4882a593Smuzhiyun else
4522*4882a593Smuzhiyun pr_debug_ratelimited("RDMA CM: MULTICAST_ERROR: failed to join multicast. status %d\n",
4523*4882a593Smuzhiyun status);
4524*4882a593Smuzhiyun
4525*4882a593Smuzhiyun event->status = status;
4526*4882a593Smuzhiyun event->param.ud.private_data = mc->context;
4527*4882a593Smuzhiyun if (status) {
4528*4882a593Smuzhiyun event->event = RDMA_CM_EVENT_MULTICAST_ERROR;
4529*4882a593Smuzhiyun return;
4530*4882a593Smuzhiyun }
4531*4882a593Smuzhiyun
4532*4882a593Smuzhiyun dev_addr = &id_priv->id.route.addr.dev_addr;
4533*4882a593Smuzhiyun ndev = dev_get_by_index(dev_addr->net, dev_addr->bound_dev_if);
4534*4882a593Smuzhiyun gid_type =
4535*4882a593Smuzhiyun id_priv->cma_dev
4536*4882a593Smuzhiyun ->default_gid_type[id_priv->id.port_num -
4537*4882a593Smuzhiyun rdma_start_port(
4538*4882a593Smuzhiyun id_priv->cma_dev->device)];
4539*4882a593Smuzhiyun
4540*4882a593Smuzhiyun event->event = RDMA_CM_EVENT_MULTICAST_JOIN;
4541*4882a593Smuzhiyun if (ib_init_ah_from_mcmember(id_priv->id.device, id_priv->id.port_num,
4542*4882a593Smuzhiyun &multicast->rec, ndev, gid_type,
4543*4882a593Smuzhiyun &event->param.ud.ah_attr)) {
4544*4882a593Smuzhiyun event->event = RDMA_CM_EVENT_MULTICAST_ERROR;
4545*4882a593Smuzhiyun goto out;
4546*4882a593Smuzhiyun }
4547*4882a593Smuzhiyun
4548*4882a593Smuzhiyun event->param.ud.qp_num = 0xFFFFFF;
4549*4882a593Smuzhiyun event->param.ud.qkey = be32_to_cpu(multicast->rec.qkey);
4550*4882a593Smuzhiyun
4551*4882a593Smuzhiyun out:
4552*4882a593Smuzhiyun if (ndev)
4553*4882a593Smuzhiyun dev_put(ndev);
4554*4882a593Smuzhiyun }
4555*4882a593Smuzhiyun
cma_ib_mc_handler(int status,struct ib_sa_multicast * multicast)4556*4882a593Smuzhiyun static int cma_ib_mc_handler(int status, struct ib_sa_multicast *multicast)
4557*4882a593Smuzhiyun {
4558*4882a593Smuzhiyun struct cma_multicast *mc = multicast->context;
4559*4882a593Smuzhiyun struct rdma_id_private *id_priv = mc->id_priv;
4560*4882a593Smuzhiyun struct rdma_cm_event event = {};
4561*4882a593Smuzhiyun int ret = 0;
4562*4882a593Smuzhiyun
4563*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
4564*4882a593Smuzhiyun if (READ_ONCE(id_priv->state) == RDMA_CM_DEVICE_REMOVAL ||
4565*4882a593Smuzhiyun READ_ONCE(id_priv->state) == RDMA_CM_DESTROYING)
4566*4882a593Smuzhiyun goto out;
4567*4882a593Smuzhiyun
4568*4882a593Smuzhiyun cma_make_mc_event(status, id_priv, multicast, &event, mc);
4569*4882a593Smuzhiyun ret = cma_cm_event_handler(id_priv, &event);
4570*4882a593Smuzhiyun rdma_destroy_ah_attr(&event.param.ud.ah_attr);
4571*4882a593Smuzhiyun WARN_ON(ret);
4572*4882a593Smuzhiyun
4573*4882a593Smuzhiyun out:
4574*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
4575*4882a593Smuzhiyun return 0;
4576*4882a593Smuzhiyun }
4577*4882a593Smuzhiyun
cma_set_mgid(struct rdma_id_private * id_priv,struct sockaddr * addr,union ib_gid * mgid)4578*4882a593Smuzhiyun static void cma_set_mgid(struct rdma_id_private *id_priv,
4579*4882a593Smuzhiyun struct sockaddr *addr, union ib_gid *mgid)
4580*4882a593Smuzhiyun {
4581*4882a593Smuzhiyun unsigned char mc_map[MAX_ADDR_LEN];
4582*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
4583*4882a593Smuzhiyun struct sockaddr_in *sin = (struct sockaddr_in *) addr;
4584*4882a593Smuzhiyun struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *) addr;
4585*4882a593Smuzhiyun
4586*4882a593Smuzhiyun if (cma_any_addr(addr)) {
4587*4882a593Smuzhiyun memset(mgid, 0, sizeof *mgid);
4588*4882a593Smuzhiyun } else if ((addr->sa_family == AF_INET6) &&
4589*4882a593Smuzhiyun ((be32_to_cpu(sin6->sin6_addr.s6_addr32[0]) & 0xFFF0FFFF) ==
4590*4882a593Smuzhiyun 0xFF10A01B)) {
4591*4882a593Smuzhiyun /* IPv6 address is an SA assigned MGID. */
4592*4882a593Smuzhiyun memcpy(mgid, &sin6->sin6_addr, sizeof *mgid);
4593*4882a593Smuzhiyun } else if (addr->sa_family == AF_IB) {
4594*4882a593Smuzhiyun memcpy(mgid, &((struct sockaddr_ib *) addr)->sib_addr, sizeof *mgid);
4595*4882a593Smuzhiyun } else if (addr->sa_family == AF_INET6) {
4596*4882a593Smuzhiyun ipv6_ib_mc_map(&sin6->sin6_addr, dev_addr->broadcast, mc_map);
4597*4882a593Smuzhiyun if (id_priv->id.ps == RDMA_PS_UDP)
4598*4882a593Smuzhiyun mc_map[7] = 0x01; /* Use RDMA CM signature */
4599*4882a593Smuzhiyun *mgid = *(union ib_gid *) (mc_map + 4);
4600*4882a593Smuzhiyun } else {
4601*4882a593Smuzhiyun ip_ib_mc_map(sin->sin_addr.s_addr, dev_addr->broadcast, mc_map);
4602*4882a593Smuzhiyun if (id_priv->id.ps == RDMA_PS_UDP)
4603*4882a593Smuzhiyun mc_map[7] = 0x01; /* Use RDMA CM signature */
4604*4882a593Smuzhiyun *mgid = *(union ib_gid *) (mc_map + 4);
4605*4882a593Smuzhiyun }
4606*4882a593Smuzhiyun }
4607*4882a593Smuzhiyun
cma_join_ib_multicast(struct rdma_id_private * id_priv,struct cma_multicast * mc)4608*4882a593Smuzhiyun static int cma_join_ib_multicast(struct rdma_id_private *id_priv,
4609*4882a593Smuzhiyun struct cma_multicast *mc)
4610*4882a593Smuzhiyun {
4611*4882a593Smuzhiyun struct ib_sa_mcmember_rec rec;
4612*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
4613*4882a593Smuzhiyun ib_sa_comp_mask comp_mask;
4614*4882a593Smuzhiyun int ret;
4615*4882a593Smuzhiyun
4616*4882a593Smuzhiyun ib_addr_get_mgid(dev_addr, &rec.mgid);
4617*4882a593Smuzhiyun ret = ib_sa_get_mcmember_rec(id_priv->id.device, id_priv->id.port_num,
4618*4882a593Smuzhiyun &rec.mgid, &rec);
4619*4882a593Smuzhiyun if (ret)
4620*4882a593Smuzhiyun return ret;
4621*4882a593Smuzhiyun
4622*4882a593Smuzhiyun ret = cma_set_qkey(id_priv, 0);
4623*4882a593Smuzhiyun if (ret)
4624*4882a593Smuzhiyun return ret;
4625*4882a593Smuzhiyun
4626*4882a593Smuzhiyun cma_set_mgid(id_priv, (struct sockaddr *) &mc->addr, &rec.mgid);
4627*4882a593Smuzhiyun rec.qkey = cpu_to_be32(id_priv->qkey);
4628*4882a593Smuzhiyun rdma_addr_get_sgid(dev_addr, &rec.port_gid);
4629*4882a593Smuzhiyun rec.pkey = cpu_to_be16(ib_addr_get_pkey(dev_addr));
4630*4882a593Smuzhiyun rec.join_state = mc->join_state;
4631*4882a593Smuzhiyun
4632*4882a593Smuzhiyun if ((rec.join_state == BIT(SENDONLY_FULLMEMBER_JOIN)) &&
4633*4882a593Smuzhiyun (!ib_sa_sendonly_fullmem_support(&sa_client,
4634*4882a593Smuzhiyun id_priv->id.device,
4635*4882a593Smuzhiyun id_priv->id.port_num))) {
4636*4882a593Smuzhiyun dev_warn(
4637*4882a593Smuzhiyun &id_priv->id.device->dev,
4638*4882a593Smuzhiyun "RDMA CM: port %u Unable to multicast join: SM doesn't support Send Only Full Member option\n",
4639*4882a593Smuzhiyun id_priv->id.port_num);
4640*4882a593Smuzhiyun return -EOPNOTSUPP;
4641*4882a593Smuzhiyun }
4642*4882a593Smuzhiyun
4643*4882a593Smuzhiyun comp_mask = IB_SA_MCMEMBER_REC_MGID | IB_SA_MCMEMBER_REC_PORT_GID |
4644*4882a593Smuzhiyun IB_SA_MCMEMBER_REC_PKEY | IB_SA_MCMEMBER_REC_JOIN_STATE |
4645*4882a593Smuzhiyun IB_SA_MCMEMBER_REC_QKEY | IB_SA_MCMEMBER_REC_SL |
4646*4882a593Smuzhiyun IB_SA_MCMEMBER_REC_FLOW_LABEL |
4647*4882a593Smuzhiyun IB_SA_MCMEMBER_REC_TRAFFIC_CLASS;
4648*4882a593Smuzhiyun
4649*4882a593Smuzhiyun if (id_priv->id.ps == RDMA_PS_IPOIB)
4650*4882a593Smuzhiyun comp_mask |= IB_SA_MCMEMBER_REC_RATE |
4651*4882a593Smuzhiyun IB_SA_MCMEMBER_REC_RATE_SELECTOR |
4652*4882a593Smuzhiyun IB_SA_MCMEMBER_REC_MTU_SELECTOR |
4653*4882a593Smuzhiyun IB_SA_MCMEMBER_REC_MTU |
4654*4882a593Smuzhiyun IB_SA_MCMEMBER_REC_HOP_LIMIT;
4655*4882a593Smuzhiyun
4656*4882a593Smuzhiyun mc->sa_mc = ib_sa_join_multicast(&sa_client, id_priv->id.device,
4657*4882a593Smuzhiyun id_priv->id.port_num, &rec, comp_mask,
4658*4882a593Smuzhiyun GFP_KERNEL, cma_ib_mc_handler, mc);
4659*4882a593Smuzhiyun return PTR_ERR_OR_ZERO(mc->sa_mc);
4660*4882a593Smuzhiyun }
4661*4882a593Smuzhiyun
cma_iboe_set_mgid(struct sockaddr * addr,union ib_gid * mgid,enum ib_gid_type gid_type)4662*4882a593Smuzhiyun static void cma_iboe_set_mgid(struct sockaddr *addr, union ib_gid *mgid,
4663*4882a593Smuzhiyun enum ib_gid_type gid_type)
4664*4882a593Smuzhiyun {
4665*4882a593Smuzhiyun struct sockaddr_in *sin = (struct sockaddr_in *)addr;
4666*4882a593Smuzhiyun struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)addr;
4667*4882a593Smuzhiyun
4668*4882a593Smuzhiyun if (cma_any_addr(addr)) {
4669*4882a593Smuzhiyun memset(mgid, 0, sizeof *mgid);
4670*4882a593Smuzhiyun } else if (addr->sa_family == AF_INET6) {
4671*4882a593Smuzhiyun memcpy(mgid, &sin6->sin6_addr, sizeof *mgid);
4672*4882a593Smuzhiyun } else {
4673*4882a593Smuzhiyun mgid->raw[0] =
4674*4882a593Smuzhiyun (gid_type == IB_GID_TYPE_ROCE_UDP_ENCAP) ? 0 : 0xff;
4675*4882a593Smuzhiyun mgid->raw[1] =
4676*4882a593Smuzhiyun (gid_type == IB_GID_TYPE_ROCE_UDP_ENCAP) ? 0 : 0x0e;
4677*4882a593Smuzhiyun mgid->raw[2] = 0;
4678*4882a593Smuzhiyun mgid->raw[3] = 0;
4679*4882a593Smuzhiyun mgid->raw[4] = 0;
4680*4882a593Smuzhiyun mgid->raw[5] = 0;
4681*4882a593Smuzhiyun mgid->raw[6] = 0;
4682*4882a593Smuzhiyun mgid->raw[7] = 0;
4683*4882a593Smuzhiyun mgid->raw[8] = 0;
4684*4882a593Smuzhiyun mgid->raw[9] = 0;
4685*4882a593Smuzhiyun mgid->raw[10] = 0xff;
4686*4882a593Smuzhiyun mgid->raw[11] = 0xff;
4687*4882a593Smuzhiyun *(__be32 *)(&mgid->raw[12]) = sin->sin_addr.s_addr;
4688*4882a593Smuzhiyun }
4689*4882a593Smuzhiyun }
4690*4882a593Smuzhiyun
cma_iboe_join_multicast(struct rdma_id_private * id_priv,struct cma_multicast * mc)4691*4882a593Smuzhiyun static int cma_iboe_join_multicast(struct rdma_id_private *id_priv,
4692*4882a593Smuzhiyun struct cma_multicast *mc)
4693*4882a593Smuzhiyun {
4694*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr = &id_priv->id.route.addr.dev_addr;
4695*4882a593Smuzhiyun int err = 0;
4696*4882a593Smuzhiyun struct sockaddr *addr = (struct sockaddr *)&mc->addr;
4697*4882a593Smuzhiyun struct net_device *ndev = NULL;
4698*4882a593Smuzhiyun struct ib_sa_multicast ib;
4699*4882a593Smuzhiyun enum ib_gid_type gid_type;
4700*4882a593Smuzhiyun bool send_only;
4701*4882a593Smuzhiyun
4702*4882a593Smuzhiyun send_only = mc->join_state == BIT(SENDONLY_FULLMEMBER_JOIN);
4703*4882a593Smuzhiyun
4704*4882a593Smuzhiyun if (cma_zero_addr(addr))
4705*4882a593Smuzhiyun return -EINVAL;
4706*4882a593Smuzhiyun
4707*4882a593Smuzhiyun gid_type = id_priv->cma_dev->default_gid_type[id_priv->id.port_num -
4708*4882a593Smuzhiyun rdma_start_port(id_priv->cma_dev->device)];
4709*4882a593Smuzhiyun cma_iboe_set_mgid(addr, &ib.rec.mgid, gid_type);
4710*4882a593Smuzhiyun
4711*4882a593Smuzhiyun ib.rec.pkey = cpu_to_be16(0xffff);
4712*4882a593Smuzhiyun if (id_priv->id.ps == RDMA_PS_UDP)
4713*4882a593Smuzhiyun ib.rec.qkey = cpu_to_be32(RDMA_UDP_QKEY);
4714*4882a593Smuzhiyun
4715*4882a593Smuzhiyun if (dev_addr->bound_dev_if)
4716*4882a593Smuzhiyun ndev = dev_get_by_index(dev_addr->net, dev_addr->bound_dev_if);
4717*4882a593Smuzhiyun if (!ndev)
4718*4882a593Smuzhiyun return -ENODEV;
4719*4882a593Smuzhiyun
4720*4882a593Smuzhiyun ib.rec.rate = iboe_get_rate(ndev);
4721*4882a593Smuzhiyun ib.rec.hop_limit = 1;
4722*4882a593Smuzhiyun ib.rec.mtu = iboe_get_mtu(ndev->mtu);
4723*4882a593Smuzhiyun
4724*4882a593Smuzhiyun if (addr->sa_family == AF_INET) {
4725*4882a593Smuzhiyun if (gid_type == IB_GID_TYPE_ROCE_UDP_ENCAP) {
4726*4882a593Smuzhiyun ib.rec.hop_limit = IPV6_DEFAULT_HOPLIMIT;
4727*4882a593Smuzhiyun if (!send_only) {
4728*4882a593Smuzhiyun err = cma_igmp_send(ndev, &ib.rec.mgid,
4729*4882a593Smuzhiyun true);
4730*4882a593Smuzhiyun }
4731*4882a593Smuzhiyun }
4732*4882a593Smuzhiyun } else {
4733*4882a593Smuzhiyun if (gid_type == IB_GID_TYPE_ROCE_UDP_ENCAP)
4734*4882a593Smuzhiyun err = -ENOTSUPP;
4735*4882a593Smuzhiyun }
4736*4882a593Smuzhiyun dev_put(ndev);
4737*4882a593Smuzhiyun if (err || !ib.rec.mtu)
4738*4882a593Smuzhiyun return err ?: -EINVAL;
4739*4882a593Smuzhiyun
4740*4882a593Smuzhiyun rdma_ip2gid((struct sockaddr *)&id_priv->id.route.addr.src_addr,
4741*4882a593Smuzhiyun &ib.rec.port_gid);
4742*4882a593Smuzhiyun INIT_WORK(&mc->iboe_join.work, cma_iboe_join_work_handler);
4743*4882a593Smuzhiyun cma_make_mc_event(0, id_priv, &ib, &mc->iboe_join.event, mc);
4744*4882a593Smuzhiyun queue_work(cma_wq, &mc->iboe_join.work);
4745*4882a593Smuzhiyun return 0;
4746*4882a593Smuzhiyun }
4747*4882a593Smuzhiyun
/*
 * Join the multicast group @addr on behalf of @id.
 *
 * A cma_multicast tracking object is allocated, filled in with @addr,
 * @context and @join_state, and handed to the RoCE or IB join routine
 * depending on the port. On success the object is linked onto the id's
 * mc_list and 0 is returned.
 *
 * Returns -EINVAL when @id has a kernel QP (with a WARN), has no device,
 * or is in neither the RDMA_CM_ADDR_BOUND nor the RDMA_CM_ADDR_RESOLVED
 * state; -ENOMEM on allocation failure; -ENOSYS when the port is neither
 * RoCE nor IB-multicast capable; otherwise the error from the join
 * routine.
 */
int rdma_join_multicast(struct rdma_cm_id *id, struct sockaddr *addr,
			u8 join_state, void *context)
{
	struct rdma_id_private *id_priv =
		container_of(id, struct rdma_id_private, id);
	struct cma_multicast *mc;
	int ret;

	/* Not supported for kernel QPs */
	if (WARN_ON(id->qp))
		return -EINVAL;

	/* ULP is calling this wrong. */
	if (!id->device)
		return -EINVAL;
	if (READ_ONCE(id_priv->state) != RDMA_CM_ADDR_BOUND &&
	    READ_ONCE(id_priv->state) != RDMA_CM_ADDR_RESOLVED)
		return -EINVAL;

	mc = kzalloc(sizeof(*mc), GFP_KERNEL);
	if (!mc)
		return -ENOMEM;

	memcpy(&mc->addr, addr, rdma_addr_size(addr));
	mc->context = context;
	mc->id_priv = id_priv;
	mc->join_state = join_state;

	if (rdma_protocol_roce(id->device, id->port_num))
		ret = cma_iboe_join_multicast(id_priv, mc);
	else if (rdma_cap_ib_mcast(id->device, id->port_num))
		ret = cma_join_ib_multicast(id_priv, mc);
	else
		ret = -ENOSYS;

	if (ret) {
		kfree(mc);
		return ret;
	}

	spin_lock(&id_priv->lock);
	list_add(&mc->list, &id_priv->mc_list);
	spin_unlock(&id_priv->lock);

	return 0;
}
EXPORT_SYMBOL(rdma_join_multicast);
4797*4882a593Smuzhiyun
rdma_leave_multicast(struct rdma_cm_id * id,struct sockaddr * addr)4798*4882a593Smuzhiyun void rdma_leave_multicast(struct rdma_cm_id *id, struct sockaddr *addr)
4799*4882a593Smuzhiyun {
4800*4882a593Smuzhiyun struct rdma_id_private *id_priv;
4801*4882a593Smuzhiyun struct cma_multicast *mc;
4802*4882a593Smuzhiyun
4803*4882a593Smuzhiyun id_priv = container_of(id, struct rdma_id_private, id);
4804*4882a593Smuzhiyun spin_lock_irq(&id_priv->lock);
4805*4882a593Smuzhiyun list_for_each_entry(mc, &id_priv->mc_list, list) {
4806*4882a593Smuzhiyun if (memcmp(&mc->addr, addr, rdma_addr_size(addr)) != 0)
4807*4882a593Smuzhiyun continue;
4808*4882a593Smuzhiyun list_del(&mc->list);
4809*4882a593Smuzhiyun spin_unlock_irq(&id_priv->lock);
4810*4882a593Smuzhiyun
4811*4882a593Smuzhiyun WARN_ON(id_priv->cma_dev->device != id->device);
4812*4882a593Smuzhiyun destroy_mc(id_priv, mc);
4813*4882a593Smuzhiyun return;
4814*4882a593Smuzhiyun }
4815*4882a593Smuzhiyun spin_unlock_irq(&id_priv->lock);
4816*4882a593Smuzhiyun }
4817*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_leave_multicast);
4818*4882a593Smuzhiyun
cma_netdev_change(struct net_device * ndev,struct rdma_id_private * id_priv)4819*4882a593Smuzhiyun static int cma_netdev_change(struct net_device *ndev, struct rdma_id_private *id_priv)
4820*4882a593Smuzhiyun {
4821*4882a593Smuzhiyun struct rdma_dev_addr *dev_addr;
4822*4882a593Smuzhiyun struct cma_work *work;
4823*4882a593Smuzhiyun
4824*4882a593Smuzhiyun dev_addr = &id_priv->id.route.addr.dev_addr;
4825*4882a593Smuzhiyun
4826*4882a593Smuzhiyun if ((dev_addr->bound_dev_if == ndev->ifindex) &&
4827*4882a593Smuzhiyun (net_eq(dev_net(ndev), dev_addr->net)) &&
4828*4882a593Smuzhiyun memcmp(dev_addr->src_dev_addr, ndev->dev_addr, ndev->addr_len)) {
4829*4882a593Smuzhiyun pr_info("RDMA CM addr change for ndev %s used by id %p\n",
4830*4882a593Smuzhiyun ndev->name, &id_priv->id);
4831*4882a593Smuzhiyun work = kzalloc(sizeof *work, GFP_KERNEL);
4832*4882a593Smuzhiyun if (!work)
4833*4882a593Smuzhiyun return -ENOMEM;
4834*4882a593Smuzhiyun
4835*4882a593Smuzhiyun INIT_WORK(&work->work, cma_work_handler);
4836*4882a593Smuzhiyun work->id = id_priv;
4837*4882a593Smuzhiyun work->event.event = RDMA_CM_EVENT_ADDR_CHANGE;
4838*4882a593Smuzhiyun cma_id_get(id_priv);
4839*4882a593Smuzhiyun queue_work(cma_wq, &work->work);
4840*4882a593Smuzhiyun }
4841*4882a593Smuzhiyun
4842*4882a593Smuzhiyun return 0;
4843*4882a593Smuzhiyun }
4844*4882a593Smuzhiyun
cma_netdev_callback(struct notifier_block * self,unsigned long event,void * ptr)4845*4882a593Smuzhiyun static int cma_netdev_callback(struct notifier_block *self, unsigned long event,
4846*4882a593Smuzhiyun void *ptr)
4847*4882a593Smuzhiyun {
4848*4882a593Smuzhiyun struct net_device *ndev = netdev_notifier_info_to_dev(ptr);
4849*4882a593Smuzhiyun struct cma_device *cma_dev;
4850*4882a593Smuzhiyun struct rdma_id_private *id_priv;
4851*4882a593Smuzhiyun int ret = NOTIFY_DONE;
4852*4882a593Smuzhiyun
4853*4882a593Smuzhiyun if (event != NETDEV_BONDING_FAILOVER)
4854*4882a593Smuzhiyun return NOTIFY_DONE;
4855*4882a593Smuzhiyun
4856*4882a593Smuzhiyun if (!netif_is_bond_master(ndev))
4857*4882a593Smuzhiyun return NOTIFY_DONE;
4858*4882a593Smuzhiyun
4859*4882a593Smuzhiyun mutex_lock(&lock);
4860*4882a593Smuzhiyun list_for_each_entry(cma_dev, &dev_list, list)
4861*4882a593Smuzhiyun list_for_each_entry(id_priv, &cma_dev->id_list, list) {
4862*4882a593Smuzhiyun ret = cma_netdev_change(ndev, id_priv);
4863*4882a593Smuzhiyun if (ret)
4864*4882a593Smuzhiyun goto out;
4865*4882a593Smuzhiyun }
4866*4882a593Smuzhiyun
4867*4882a593Smuzhiyun out:
4868*4882a593Smuzhiyun mutex_unlock(&lock);
4869*4882a593Smuzhiyun return ret;
4870*4882a593Smuzhiyun }
4871*4882a593Smuzhiyun
4872*4882a593Smuzhiyun static struct notifier_block cma_nb = {
4873*4882a593Smuzhiyun .notifier_call = cma_netdev_callback
4874*4882a593Smuzhiyun };
4875*4882a593Smuzhiyun
cma_send_device_removal_put(struct rdma_id_private * id_priv)4876*4882a593Smuzhiyun static void cma_send_device_removal_put(struct rdma_id_private *id_priv)
4877*4882a593Smuzhiyun {
4878*4882a593Smuzhiyun struct rdma_cm_event event = { .event = RDMA_CM_EVENT_DEVICE_REMOVAL };
4879*4882a593Smuzhiyun enum rdma_cm_state state;
4880*4882a593Smuzhiyun unsigned long flags;
4881*4882a593Smuzhiyun
4882*4882a593Smuzhiyun mutex_lock(&id_priv->handler_mutex);
4883*4882a593Smuzhiyun /* Record that we want to remove the device */
4884*4882a593Smuzhiyun spin_lock_irqsave(&id_priv->lock, flags);
4885*4882a593Smuzhiyun state = id_priv->state;
4886*4882a593Smuzhiyun if (state == RDMA_CM_DESTROYING || state == RDMA_CM_DEVICE_REMOVAL) {
4887*4882a593Smuzhiyun spin_unlock_irqrestore(&id_priv->lock, flags);
4888*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
4889*4882a593Smuzhiyun cma_id_put(id_priv);
4890*4882a593Smuzhiyun return;
4891*4882a593Smuzhiyun }
4892*4882a593Smuzhiyun id_priv->state = RDMA_CM_DEVICE_REMOVAL;
4893*4882a593Smuzhiyun spin_unlock_irqrestore(&id_priv->lock, flags);
4894*4882a593Smuzhiyun
4895*4882a593Smuzhiyun if (cma_cm_event_handler(id_priv, &event)) {
4896*4882a593Smuzhiyun /*
4897*4882a593Smuzhiyun * At this point the ULP promises it won't call
4898*4882a593Smuzhiyun * rdma_destroy_id() concurrently
4899*4882a593Smuzhiyun */
4900*4882a593Smuzhiyun cma_id_put(id_priv);
4901*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
4902*4882a593Smuzhiyun trace_cm_id_destroy(id_priv);
4903*4882a593Smuzhiyun _destroy_id(id_priv, state);
4904*4882a593Smuzhiyun return;
4905*4882a593Smuzhiyun }
4906*4882a593Smuzhiyun mutex_unlock(&id_priv->handler_mutex);
4907*4882a593Smuzhiyun
4908*4882a593Smuzhiyun /*
4909*4882a593Smuzhiyun * If this races with destroy then the thread that first assigns state
4910*4882a593Smuzhiyun * to a destroying does the cancel.
4911*4882a593Smuzhiyun */
4912*4882a593Smuzhiyun cma_cancel_operation(id_priv, state);
4913*4882a593Smuzhiyun cma_id_put(id_priv);
4914*4882a593Smuzhiyun }
4915*4882a593Smuzhiyun
cma_process_remove(struct cma_device * cma_dev)4916*4882a593Smuzhiyun static void cma_process_remove(struct cma_device *cma_dev)
4917*4882a593Smuzhiyun {
4918*4882a593Smuzhiyun mutex_lock(&lock);
4919*4882a593Smuzhiyun while (!list_empty(&cma_dev->id_list)) {
4920*4882a593Smuzhiyun struct rdma_id_private *id_priv = list_first_entry(
4921*4882a593Smuzhiyun &cma_dev->id_list, struct rdma_id_private, list);
4922*4882a593Smuzhiyun
4923*4882a593Smuzhiyun list_del(&id_priv->listen_list);
4924*4882a593Smuzhiyun list_del_init(&id_priv->list);
4925*4882a593Smuzhiyun cma_id_get(id_priv);
4926*4882a593Smuzhiyun mutex_unlock(&lock);
4927*4882a593Smuzhiyun
4928*4882a593Smuzhiyun cma_send_device_removal_put(id_priv);
4929*4882a593Smuzhiyun
4930*4882a593Smuzhiyun mutex_lock(&lock);
4931*4882a593Smuzhiyun }
4932*4882a593Smuzhiyun mutex_unlock(&lock);
4933*4882a593Smuzhiyun
4934*4882a593Smuzhiyun cma_dev_put(cma_dev);
4935*4882a593Smuzhiyun wait_for_completion(&cma_dev->comp);
4936*4882a593Smuzhiyun }
4937*4882a593Smuzhiyun
cma_add_one(struct ib_device * device)4938*4882a593Smuzhiyun static int cma_add_one(struct ib_device *device)
4939*4882a593Smuzhiyun {
4940*4882a593Smuzhiyun struct rdma_id_private *to_destroy;
4941*4882a593Smuzhiyun struct cma_device *cma_dev;
4942*4882a593Smuzhiyun struct rdma_id_private *id_priv;
4943*4882a593Smuzhiyun unsigned int i;
4944*4882a593Smuzhiyun unsigned long supported_gids = 0;
4945*4882a593Smuzhiyun int ret;
4946*4882a593Smuzhiyun
4947*4882a593Smuzhiyun cma_dev = kmalloc(sizeof(*cma_dev), GFP_KERNEL);
4948*4882a593Smuzhiyun if (!cma_dev)
4949*4882a593Smuzhiyun return -ENOMEM;
4950*4882a593Smuzhiyun
4951*4882a593Smuzhiyun cma_dev->device = device;
4952*4882a593Smuzhiyun cma_dev->default_gid_type = kcalloc(device->phys_port_cnt,
4953*4882a593Smuzhiyun sizeof(*cma_dev->default_gid_type),
4954*4882a593Smuzhiyun GFP_KERNEL);
4955*4882a593Smuzhiyun if (!cma_dev->default_gid_type) {
4956*4882a593Smuzhiyun ret = -ENOMEM;
4957*4882a593Smuzhiyun goto free_cma_dev;
4958*4882a593Smuzhiyun }
4959*4882a593Smuzhiyun
4960*4882a593Smuzhiyun cma_dev->default_roce_tos = kcalloc(device->phys_port_cnt,
4961*4882a593Smuzhiyun sizeof(*cma_dev->default_roce_tos),
4962*4882a593Smuzhiyun GFP_KERNEL);
4963*4882a593Smuzhiyun if (!cma_dev->default_roce_tos) {
4964*4882a593Smuzhiyun ret = -ENOMEM;
4965*4882a593Smuzhiyun goto free_gid_type;
4966*4882a593Smuzhiyun }
4967*4882a593Smuzhiyun
4968*4882a593Smuzhiyun rdma_for_each_port (device, i) {
4969*4882a593Smuzhiyun supported_gids = roce_gid_type_mask_support(device, i);
4970*4882a593Smuzhiyun WARN_ON(!supported_gids);
4971*4882a593Smuzhiyun if (supported_gids & (1 << CMA_PREFERRED_ROCE_GID_TYPE))
4972*4882a593Smuzhiyun cma_dev->default_gid_type[i - rdma_start_port(device)] =
4973*4882a593Smuzhiyun CMA_PREFERRED_ROCE_GID_TYPE;
4974*4882a593Smuzhiyun else
4975*4882a593Smuzhiyun cma_dev->default_gid_type[i - rdma_start_port(device)] =
4976*4882a593Smuzhiyun find_first_bit(&supported_gids, BITS_PER_LONG);
4977*4882a593Smuzhiyun cma_dev->default_roce_tos[i - rdma_start_port(device)] = 0;
4978*4882a593Smuzhiyun }
4979*4882a593Smuzhiyun
4980*4882a593Smuzhiyun init_completion(&cma_dev->comp);
4981*4882a593Smuzhiyun refcount_set(&cma_dev->refcount, 1);
4982*4882a593Smuzhiyun INIT_LIST_HEAD(&cma_dev->id_list);
4983*4882a593Smuzhiyun ib_set_client_data(device, &cma_client, cma_dev);
4984*4882a593Smuzhiyun
4985*4882a593Smuzhiyun mutex_lock(&lock);
4986*4882a593Smuzhiyun list_add_tail(&cma_dev->list, &dev_list);
4987*4882a593Smuzhiyun list_for_each_entry(id_priv, &listen_any_list, list) {
4988*4882a593Smuzhiyun ret = cma_listen_on_dev(id_priv, cma_dev, &to_destroy);
4989*4882a593Smuzhiyun if (ret)
4990*4882a593Smuzhiyun goto free_listen;
4991*4882a593Smuzhiyun }
4992*4882a593Smuzhiyun mutex_unlock(&lock);
4993*4882a593Smuzhiyun
4994*4882a593Smuzhiyun trace_cm_add_one(device);
4995*4882a593Smuzhiyun return 0;
4996*4882a593Smuzhiyun
4997*4882a593Smuzhiyun free_listen:
4998*4882a593Smuzhiyun list_del(&cma_dev->list);
4999*4882a593Smuzhiyun mutex_unlock(&lock);
5000*4882a593Smuzhiyun
5001*4882a593Smuzhiyun /* cma_process_remove() will delete to_destroy */
5002*4882a593Smuzhiyun cma_process_remove(cma_dev);
5003*4882a593Smuzhiyun kfree(cma_dev->default_roce_tos);
5004*4882a593Smuzhiyun free_gid_type:
5005*4882a593Smuzhiyun kfree(cma_dev->default_gid_type);
5006*4882a593Smuzhiyun
5007*4882a593Smuzhiyun free_cma_dev:
5008*4882a593Smuzhiyun kfree(cma_dev);
5009*4882a593Smuzhiyun return ret;
5010*4882a593Smuzhiyun }
5011*4882a593Smuzhiyun
cma_remove_one(struct ib_device * device,void * client_data)5012*4882a593Smuzhiyun static void cma_remove_one(struct ib_device *device, void *client_data)
5013*4882a593Smuzhiyun {
5014*4882a593Smuzhiyun struct cma_device *cma_dev = client_data;
5015*4882a593Smuzhiyun
5016*4882a593Smuzhiyun trace_cm_remove_one(device);
5017*4882a593Smuzhiyun
5018*4882a593Smuzhiyun mutex_lock(&lock);
5019*4882a593Smuzhiyun list_del(&cma_dev->list);
5020*4882a593Smuzhiyun mutex_unlock(&lock);
5021*4882a593Smuzhiyun
5022*4882a593Smuzhiyun cma_process_remove(cma_dev);
5023*4882a593Smuzhiyun kfree(cma_dev->default_roce_tos);
5024*4882a593Smuzhiyun kfree(cma_dev->default_gid_type);
5025*4882a593Smuzhiyun kfree(cma_dev);
5026*4882a593Smuzhiyun }
5027*4882a593Smuzhiyun
cma_init_net(struct net * net)5028*4882a593Smuzhiyun static int cma_init_net(struct net *net)
5029*4882a593Smuzhiyun {
5030*4882a593Smuzhiyun struct cma_pernet *pernet = cma_pernet(net);
5031*4882a593Smuzhiyun
5032*4882a593Smuzhiyun xa_init(&pernet->tcp_ps);
5033*4882a593Smuzhiyun xa_init(&pernet->udp_ps);
5034*4882a593Smuzhiyun xa_init(&pernet->ipoib_ps);
5035*4882a593Smuzhiyun xa_init(&pernet->ib_ps);
5036*4882a593Smuzhiyun
5037*4882a593Smuzhiyun return 0;
5038*4882a593Smuzhiyun }
5039*4882a593Smuzhiyun
cma_exit_net(struct net * net)5040*4882a593Smuzhiyun static void cma_exit_net(struct net *net)
5041*4882a593Smuzhiyun {
5042*4882a593Smuzhiyun struct cma_pernet *pernet = cma_pernet(net);
5043*4882a593Smuzhiyun
5044*4882a593Smuzhiyun WARN_ON(!xa_empty(&pernet->tcp_ps));
5045*4882a593Smuzhiyun WARN_ON(!xa_empty(&pernet->udp_ps));
5046*4882a593Smuzhiyun WARN_ON(!xa_empty(&pernet->ipoib_ps));
5047*4882a593Smuzhiyun WARN_ON(!xa_empty(&pernet->ib_ps));
5048*4882a593Smuzhiyun }
5049*4882a593Smuzhiyun
5050*4882a593Smuzhiyun static struct pernet_operations cma_pernet_operations = {
5051*4882a593Smuzhiyun .init = cma_init_net,
5052*4882a593Smuzhiyun .exit = cma_exit_net,
5053*4882a593Smuzhiyun .id = &cma_pernet_id,
5054*4882a593Smuzhiyun .size = sizeof(struct cma_pernet),
5055*4882a593Smuzhiyun };
5056*4882a593Smuzhiyun
cma_init(void)5057*4882a593Smuzhiyun static int __init cma_init(void)
5058*4882a593Smuzhiyun {
5059*4882a593Smuzhiyun int ret;
5060*4882a593Smuzhiyun
5061*4882a593Smuzhiyun /*
5062*4882a593Smuzhiyun * There is a rare lock ordering dependency in cma_netdev_callback()
5063*4882a593Smuzhiyun * that only happens when bonding is enabled. Teach lockdep that rtnl
5064*4882a593Smuzhiyun * must never be nested under lock so it can find these without having
5065*4882a593Smuzhiyun * to test with bonding.
5066*4882a593Smuzhiyun */
5067*4882a593Smuzhiyun if (IS_ENABLED(CONFIG_LOCKDEP)) {
5068*4882a593Smuzhiyun rtnl_lock();
5069*4882a593Smuzhiyun mutex_lock(&lock);
5070*4882a593Smuzhiyun mutex_unlock(&lock);
5071*4882a593Smuzhiyun rtnl_unlock();
5072*4882a593Smuzhiyun }
5073*4882a593Smuzhiyun
5074*4882a593Smuzhiyun cma_wq = alloc_ordered_workqueue("rdma_cm", WQ_MEM_RECLAIM);
5075*4882a593Smuzhiyun if (!cma_wq)
5076*4882a593Smuzhiyun return -ENOMEM;
5077*4882a593Smuzhiyun
5078*4882a593Smuzhiyun ret = register_pernet_subsys(&cma_pernet_operations);
5079*4882a593Smuzhiyun if (ret)
5080*4882a593Smuzhiyun goto err_wq;
5081*4882a593Smuzhiyun
5082*4882a593Smuzhiyun ib_sa_register_client(&sa_client);
5083*4882a593Smuzhiyun register_netdevice_notifier(&cma_nb);
5084*4882a593Smuzhiyun
5085*4882a593Smuzhiyun ret = ib_register_client(&cma_client);
5086*4882a593Smuzhiyun if (ret)
5087*4882a593Smuzhiyun goto err;
5088*4882a593Smuzhiyun
5089*4882a593Smuzhiyun ret = cma_configfs_init();
5090*4882a593Smuzhiyun if (ret)
5091*4882a593Smuzhiyun goto err_ib;
5092*4882a593Smuzhiyun
5093*4882a593Smuzhiyun return 0;
5094*4882a593Smuzhiyun
5095*4882a593Smuzhiyun err_ib:
5096*4882a593Smuzhiyun ib_unregister_client(&cma_client);
5097*4882a593Smuzhiyun err:
5098*4882a593Smuzhiyun unregister_netdevice_notifier(&cma_nb);
5099*4882a593Smuzhiyun ib_sa_unregister_client(&sa_client);
5100*4882a593Smuzhiyun unregister_pernet_subsys(&cma_pernet_operations);
5101*4882a593Smuzhiyun err_wq:
5102*4882a593Smuzhiyun destroy_workqueue(cma_wq);
5103*4882a593Smuzhiyun return ret;
5104*4882a593Smuzhiyun }
5105*4882a593Smuzhiyun
cma_cleanup(void)5106*4882a593Smuzhiyun static void __exit cma_cleanup(void)
5107*4882a593Smuzhiyun {
5108*4882a593Smuzhiyun cma_configfs_exit();
5109*4882a593Smuzhiyun ib_unregister_client(&cma_client);
5110*4882a593Smuzhiyun unregister_netdevice_notifier(&cma_nb);
5111*4882a593Smuzhiyun ib_sa_unregister_client(&sa_client);
5112*4882a593Smuzhiyun unregister_pernet_subsys(&cma_pernet_operations);
5113*4882a593Smuzhiyun destroy_workqueue(cma_wq);
5114*4882a593Smuzhiyun }
5115*4882a593Smuzhiyun
/* Hook cma_init()/cma_cleanup() up as the module's load and unload handlers. */
module_init(cma_init);
module_exit(cma_cleanup);
5118