xref: /OK3568_Linux_fs/kernel/net/smc/smc_pnet.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  *  Shared Memory Communications over RDMA (SMC-R) and RoCE
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  *  Generic netlink support functions to configure an SMC-R PNET table
6*4882a593Smuzhiyun  *
7*4882a593Smuzhiyun  *  Copyright IBM Corp. 2016
8*4882a593Smuzhiyun  *
9*4882a593Smuzhiyun  *  Author(s):  Thomas Richter <tmricht@linux.vnet.ibm.com>
10*4882a593Smuzhiyun  */
11*4882a593Smuzhiyun 
12*4882a593Smuzhiyun #include <linux/module.h>
13*4882a593Smuzhiyun #include <linux/list.h>
14*4882a593Smuzhiyun #include <linux/ctype.h>
15*4882a593Smuzhiyun #include <linux/mutex.h>
16*4882a593Smuzhiyun #include <net/netlink.h>
17*4882a593Smuzhiyun #include <net/genetlink.h>
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #include <uapi/linux/if.h>
20*4882a593Smuzhiyun #include <uapi/linux/smc.h>
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun #include <rdma/ib_verbs.h>
23*4882a593Smuzhiyun 
24*4882a593Smuzhiyun #include <net/netns/generic.h>
25*4882a593Smuzhiyun #include "smc_netns.h"
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun #include "smc_pnet.h"
28*4882a593Smuzhiyun #include "smc_ib.h"
29*4882a593Smuzhiyun #include "smc_ism.h"
30*4882a593Smuzhiyun #include "smc_core.h"
31*4882a593Smuzhiyun 
32*4882a593Smuzhiyun static struct net_device *__pnet_find_base_ndev(struct net_device *ndev);
33*4882a593Smuzhiyun static struct net_device *pnet_find_base_ndev(struct net_device *ndev);
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun static const struct nla_policy smc_pnet_policy[SMC_PNETID_MAX + 1] = {
36*4882a593Smuzhiyun 	[SMC_PNETID_NAME] = {
37*4882a593Smuzhiyun 		.type = NLA_NUL_STRING,
38*4882a593Smuzhiyun 		.len = SMC_MAX_PNETID_LEN
39*4882a593Smuzhiyun 	},
40*4882a593Smuzhiyun 	[SMC_PNETID_ETHNAME] = {
41*4882a593Smuzhiyun 		.type = NLA_NUL_STRING,
42*4882a593Smuzhiyun 		.len = IFNAMSIZ - 1
43*4882a593Smuzhiyun 	},
44*4882a593Smuzhiyun 	[SMC_PNETID_IBNAME] = {
45*4882a593Smuzhiyun 		.type = NLA_NUL_STRING,
46*4882a593Smuzhiyun 		.len = IB_DEVICE_NAME_MAX - 1
47*4882a593Smuzhiyun 	},
48*4882a593Smuzhiyun 	[SMC_PNETID_IBPORT] = { .type = NLA_U8 }
49*4882a593Smuzhiyun };
50*4882a593Smuzhiyun 
51*4882a593Smuzhiyun static struct genl_family smc_pnet_nl_family;
52*4882a593Smuzhiyun 
/* Discriminator for the union inside struct smc_pnetentry. */
enum smc_pnet_nametype {
	SMC_PNET_ETH = 1,	/* entry names a net device */
	SMC_PNET_IB  = 2,	/* entry names an ib (or smcd) device */
};
57*4882a593Smuzhiyun 
58*4882a593Smuzhiyun /* pnet entry stored in pnet table */
59*4882a593Smuzhiyun struct smc_pnetentry {
60*4882a593Smuzhiyun 	struct list_head list;
61*4882a593Smuzhiyun 	char pnet_name[SMC_MAX_PNETID_LEN + 1];
62*4882a593Smuzhiyun 	enum smc_pnet_nametype type;
63*4882a593Smuzhiyun 	union {
64*4882a593Smuzhiyun 		struct {
65*4882a593Smuzhiyun 			char eth_name[IFNAMSIZ + 1];
66*4882a593Smuzhiyun 			struct net_device *ndev;
67*4882a593Smuzhiyun 		};
68*4882a593Smuzhiyun 		struct {
69*4882a593Smuzhiyun 			char ib_name[IB_DEVICE_NAME_MAX + 1];
70*4882a593Smuzhiyun 			u8 ib_port;
71*4882a593Smuzhiyun 		};
72*4882a593Smuzhiyun 	};
73*4882a593Smuzhiyun };
74*4882a593Smuzhiyun 
75*4882a593Smuzhiyun /* Check if the pnetid is set */
smc_pnet_is_pnetid_set(u8 * pnetid)76*4882a593Smuzhiyun bool smc_pnet_is_pnetid_set(u8 *pnetid)
77*4882a593Smuzhiyun {
78*4882a593Smuzhiyun 	if (pnetid[0] == 0 || pnetid[0] == _S)
79*4882a593Smuzhiyun 		return false;
80*4882a593Smuzhiyun 	return true;
81*4882a593Smuzhiyun }
82*4882a593Smuzhiyun 
83*4882a593Smuzhiyun /* Check if two given pnetids match */
smc_pnet_match(u8 * pnetid1,u8 * pnetid2)84*4882a593Smuzhiyun static bool smc_pnet_match(u8 *pnetid1, u8 *pnetid2)
85*4882a593Smuzhiyun {
86*4882a593Smuzhiyun 	int i;
87*4882a593Smuzhiyun 
88*4882a593Smuzhiyun 	for (i = 0; i < SMC_MAX_PNETID_LEN; i++) {
89*4882a593Smuzhiyun 		if ((pnetid1[i] == 0 || pnetid1[i] == _S) &&
90*4882a593Smuzhiyun 		    (pnetid2[i] == 0 || pnetid2[i] == _S))
91*4882a593Smuzhiyun 			break;
92*4882a593Smuzhiyun 		if (pnetid1[i] != pnetid2[i])
93*4882a593Smuzhiyun 			return false;
94*4882a593Smuzhiyun 	}
95*4882a593Smuzhiyun 	return true;
96*4882a593Smuzhiyun }
97*4882a593Smuzhiyun 
98*4882a593Smuzhiyun /* Remove a pnetid from the pnet table.
99*4882a593Smuzhiyun  */
smc_pnet_remove_by_pnetid(struct net * net,char * pnet_name)100*4882a593Smuzhiyun static int smc_pnet_remove_by_pnetid(struct net *net, char *pnet_name)
101*4882a593Smuzhiyun {
102*4882a593Smuzhiyun 	struct smc_pnetentry *pnetelem, *tmp_pe;
103*4882a593Smuzhiyun 	struct smc_pnettable *pnettable;
104*4882a593Smuzhiyun 	struct smc_ib_device *ibdev;
105*4882a593Smuzhiyun 	struct smcd_dev *smcd_dev;
106*4882a593Smuzhiyun 	struct smc_net *sn;
107*4882a593Smuzhiyun 	int rc = -ENOENT;
108*4882a593Smuzhiyun 	int ibport;
109*4882a593Smuzhiyun 
110*4882a593Smuzhiyun 	/* get pnettable for namespace */
111*4882a593Smuzhiyun 	sn = net_generic(net, smc_net_id);
112*4882a593Smuzhiyun 	pnettable = &sn->pnettable;
113*4882a593Smuzhiyun 
114*4882a593Smuzhiyun 	/* remove table entry */
115*4882a593Smuzhiyun 	mutex_lock(&pnettable->lock);
116*4882a593Smuzhiyun 	list_for_each_entry_safe(pnetelem, tmp_pe, &pnettable->pnetlist,
117*4882a593Smuzhiyun 				 list) {
118*4882a593Smuzhiyun 		if (!pnet_name ||
119*4882a593Smuzhiyun 		    smc_pnet_match(pnetelem->pnet_name, pnet_name)) {
120*4882a593Smuzhiyun 			list_del(&pnetelem->list);
121*4882a593Smuzhiyun 			if (pnetelem->type == SMC_PNET_ETH && pnetelem->ndev) {
122*4882a593Smuzhiyun 				dev_put(pnetelem->ndev);
123*4882a593Smuzhiyun 				pr_warn_ratelimited("smc: net device %s "
124*4882a593Smuzhiyun 						    "erased user defined "
125*4882a593Smuzhiyun 						    "pnetid %.16s\n",
126*4882a593Smuzhiyun 						    pnetelem->eth_name,
127*4882a593Smuzhiyun 						    pnetelem->pnet_name);
128*4882a593Smuzhiyun 			}
129*4882a593Smuzhiyun 			kfree(pnetelem);
130*4882a593Smuzhiyun 			rc = 0;
131*4882a593Smuzhiyun 		}
132*4882a593Smuzhiyun 	}
133*4882a593Smuzhiyun 	mutex_unlock(&pnettable->lock);
134*4882a593Smuzhiyun 
135*4882a593Smuzhiyun 	/* if this is not the initial namespace, stop here */
136*4882a593Smuzhiyun 	if (net != &init_net)
137*4882a593Smuzhiyun 		return rc;
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun 	/* remove ib devices */
140*4882a593Smuzhiyun 	mutex_lock(&smc_ib_devices.mutex);
141*4882a593Smuzhiyun 	list_for_each_entry(ibdev, &smc_ib_devices.list, list) {
142*4882a593Smuzhiyun 		for (ibport = 0; ibport < SMC_MAX_PORTS; ibport++) {
143*4882a593Smuzhiyun 			if (ibdev->pnetid_by_user[ibport] &&
144*4882a593Smuzhiyun 			    (!pnet_name ||
145*4882a593Smuzhiyun 			     smc_pnet_match(pnet_name,
146*4882a593Smuzhiyun 					    ibdev->pnetid[ibport]))) {
147*4882a593Smuzhiyun 				pr_warn_ratelimited("smc: ib device %s ibport "
148*4882a593Smuzhiyun 						    "%d erased user defined "
149*4882a593Smuzhiyun 						    "pnetid %.16s\n",
150*4882a593Smuzhiyun 						    ibdev->ibdev->name,
151*4882a593Smuzhiyun 						    ibport + 1,
152*4882a593Smuzhiyun 						    ibdev->pnetid[ibport]);
153*4882a593Smuzhiyun 				memset(ibdev->pnetid[ibport], 0,
154*4882a593Smuzhiyun 				       SMC_MAX_PNETID_LEN);
155*4882a593Smuzhiyun 				ibdev->pnetid_by_user[ibport] = false;
156*4882a593Smuzhiyun 				rc = 0;
157*4882a593Smuzhiyun 			}
158*4882a593Smuzhiyun 		}
159*4882a593Smuzhiyun 	}
160*4882a593Smuzhiyun 	mutex_unlock(&smc_ib_devices.mutex);
161*4882a593Smuzhiyun 	/* remove smcd devices */
162*4882a593Smuzhiyun 	mutex_lock(&smcd_dev_list.mutex);
163*4882a593Smuzhiyun 	list_for_each_entry(smcd_dev, &smcd_dev_list.list, list) {
164*4882a593Smuzhiyun 		if (smcd_dev->pnetid_by_user &&
165*4882a593Smuzhiyun 		    (!pnet_name ||
166*4882a593Smuzhiyun 		     smc_pnet_match(pnet_name, smcd_dev->pnetid))) {
167*4882a593Smuzhiyun 			pr_warn_ratelimited("smc: smcd device %s "
168*4882a593Smuzhiyun 					    "erased user defined pnetid "
169*4882a593Smuzhiyun 					    "%.16s\n", dev_name(&smcd_dev->dev),
170*4882a593Smuzhiyun 					    smcd_dev->pnetid);
171*4882a593Smuzhiyun 			memset(smcd_dev->pnetid, 0, SMC_MAX_PNETID_LEN);
172*4882a593Smuzhiyun 			smcd_dev->pnetid_by_user = false;
173*4882a593Smuzhiyun 			rc = 0;
174*4882a593Smuzhiyun 		}
175*4882a593Smuzhiyun 	}
176*4882a593Smuzhiyun 	mutex_unlock(&smcd_dev_list.mutex);
177*4882a593Smuzhiyun 	return rc;
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun 
180*4882a593Smuzhiyun /* Add the reference to a given network device to the pnet table.
181*4882a593Smuzhiyun  */
smc_pnet_add_by_ndev(struct net_device * ndev)182*4882a593Smuzhiyun static int smc_pnet_add_by_ndev(struct net_device *ndev)
183*4882a593Smuzhiyun {
184*4882a593Smuzhiyun 	struct smc_pnetentry *pnetelem, *tmp_pe;
185*4882a593Smuzhiyun 	struct smc_pnettable *pnettable;
186*4882a593Smuzhiyun 	struct net *net = dev_net(ndev);
187*4882a593Smuzhiyun 	struct smc_net *sn;
188*4882a593Smuzhiyun 	int rc = -ENOENT;
189*4882a593Smuzhiyun 
190*4882a593Smuzhiyun 	/* get pnettable for namespace */
191*4882a593Smuzhiyun 	sn = net_generic(net, smc_net_id);
192*4882a593Smuzhiyun 	pnettable = &sn->pnettable;
193*4882a593Smuzhiyun 
194*4882a593Smuzhiyun 	mutex_lock(&pnettable->lock);
195*4882a593Smuzhiyun 	list_for_each_entry_safe(pnetelem, tmp_pe, &pnettable->pnetlist, list) {
196*4882a593Smuzhiyun 		if (pnetelem->type == SMC_PNET_ETH && !pnetelem->ndev &&
197*4882a593Smuzhiyun 		    !strncmp(pnetelem->eth_name, ndev->name, IFNAMSIZ)) {
198*4882a593Smuzhiyun 			dev_hold(ndev);
199*4882a593Smuzhiyun 			pnetelem->ndev = ndev;
200*4882a593Smuzhiyun 			rc = 0;
201*4882a593Smuzhiyun 			pr_warn_ratelimited("smc: adding net device %s with "
202*4882a593Smuzhiyun 					    "user defined pnetid %.16s\n",
203*4882a593Smuzhiyun 					    pnetelem->eth_name,
204*4882a593Smuzhiyun 					    pnetelem->pnet_name);
205*4882a593Smuzhiyun 			break;
206*4882a593Smuzhiyun 		}
207*4882a593Smuzhiyun 	}
208*4882a593Smuzhiyun 	mutex_unlock(&pnettable->lock);
209*4882a593Smuzhiyun 	return rc;
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun /* Remove the reference to a given network device from the pnet table.
213*4882a593Smuzhiyun  */
smc_pnet_remove_by_ndev(struct net_device * ndev)214*4882a593Smuzhiyun static int smc_pnet_remove_by_ndev(struct net_device *ndev)
215*4882a593Smuzhiyun {
216*4882a593Smuzhiyun 	struct smc_pnetentry *pnetelem, *tmp_pe;
217*4882a593Smuzhiyun 	struct smc_pnettable *pnettable;
218*4882a593Smuzhiyun 	struct net *net = dev_net(ndev);
219*4882a593Smuzhiyun 	struct smc_net *sn;
220*4882a593Smuzhiyun 	int rc = -ENOENT;
221*4882a593Smuzhiyun 
222*4882a593Smuzhiyun 	/* get pnettable for namespace */
223*4882a593Smuzhiyun 	sn = net_generic(net, smc_net_id);
224*4882a593Smuzhiyun 	pnettable = &sn->pnettable;
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun 	mutex_lock(&pnettable->lock);
227*4882a593Smuzhiyun 	list_for_each_entry_safe(pnetelem, tmp_pe, &pnettable->pnetlist, list) {
228*4882a593Smuzhiyun 		if (pnetelem->type == SMC_PNET_ETH && pnetelem->ndev == ndev) {
229*4882a593Smuzhiyun 			dev_put(pnetelem->ndev);
230*4882a593Smuzhiyun 			pnetelem->ndev = NULL;
231*4882a593Smuzhiyun 			rc = 0;
232*4882a593Smuzhiyun 			pr_warn_ratelimited("smc: removing net device %s with "
233*4882a593Smuzhiyun 					    "user defined pnetid %.16s\n",
234*4882a593Smuzhiyun 					    pnetelem->eth_name,
235*4882a593Smuzhiyun 					    pnetelem->pnet_name);
236*4882a593Smuzhiyun 			break;
237*4882a593Smuzhiyun 		}
238*4882a593Smuzhiyun 	}
239*4882a593Smuzhiyun 	mutex_unlock(&pnettable->lock);
240*4882a593Smuzhiyun 	return rc;
241*4882a593Smuzhiyun }
242*4882a593Smuzhiyun 
243*4882a593Smuzhiyun /* Apply pnetid to ib device when no pnetid is set.
244*4882a593Smuzhiyun  */
smc_pnet_apply_ib(struct smc_ib_device * ib_dev,u8 ib_port,char * pnet_name)245*4882a593Smuzhiyun static bool smc_pnet_apply_ib(struct smc_ib_device *ib_dev, u8 ib_port,
246*4882a593Smuzhiyun 			      char *pnet_name)
247*4882a593Smuzhiyun {
248*4882a593Smuzhiyun 	bool applied = false;
249*4882a593Smuzhiyun 
250*4882a593Smuzhiyun 	mutex_lock(&smc_ib_devices.mutex);
251*4882a593Smuzhiyun 	if (!smc_pnet_is_pnetid_set(ib_dev->pnetid[ib_port - 1])) {
252*4882a593Smuzhiyun 		memcpy(ib_dev->pnetid[ib_port - 1], pnet_name,
253*4882a593Smuzhiyun 		       SMC_MAX_PNETID_LEN);
254*4882a593Smuzhiyun 		ib_dev->pnetid_by_user[ib_port - 1] = true;
255*4882a593Smuzhiyun 		applied = true;
256*4882a593Smuzhiyun 	}
257*4882a593Smuzhiyun 	mutex_unlock(&smc_ib_devices.mutex);
258*4882a593Smuzhiyun 	return applied;
259*4882a593Smuzhiyun }
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun /* Apply pnetid to smcd device when no pnetid is set.
262*4882a593Smuzhiyun  */
smc_pnet_apply_smcd(struct smcd_dev * smcd_dev,char * pnet_name)263*4882a593Smuzhiyun static bool smc_pnet_apply_smcd(struct smcd_dev *smcd_dev, char *pnet_name)
264*4882a593Smuzhiyun {
265*4882a593Smuzhiyun 	bool applied = false;
266*4882a593Smuzhiyun 
267*4882a593Smuzhiyun 	mutex_lock(&smcd_dev_list.mutex);
268*4882a593Smuzhiyun 	if (!smc_pnet_is_pnetid_set(smcd_dev->pnetid)) {
269*4882a593Smuzhiyun 		memcpy(smcd_dev->pnetid, pnet_name, SMC_MAX_PNETID_LEN);
270*4882a593Smuzhiyun 		smcd_dev->pnetid_by_user = true;
271*4882a593Smuzhiyun 		applied = true;
272*4882a593Smuzhiyun 	}
273*4882a593Smuzhiyun 	mutex_unlock(&smcd_dev_list.mutex);
274*4882a593Smuzhiyun 	return applied;
275*4882a593Smuzhiyun }
276*4882a593Smuzhiyun 
277*4882a593Smuzhiyun /* The limit for pnetid is 16 characters.
278*4882a593Smuzhiyun  * Valid characters should be (single-byte character set) a-z, A-Z, 0-9.
279*4882a593Smuzhiyun  * Lower case letters are converted to upper case.
280*4882a593Smuzhiyun  * Interior blanks should not be used.
281*4882a593Smuzhiyun  */
smc_pnetid_valid(const char * pnet_name,char * pnetid)282*4882a593Smuzhiyun static bool smc_pnetid_valid(const char *pnet_name, char *pnetid)
283*4882a593Smuzhiyun {
284*4882a593Smuzhiyun 	char *bf = skip_spaces(pnet_name);
285*4882a593Smuzhiyun 	size_t len = strlen(bf);
286*4882a593Smuzhiyun 	char *end = bf + len;
287*4882a593Smuzhiyun 
288*4882a593Smuzhiyun 	if (!len)
289*4882a593Smuzhiyun 		return false;
290*4882a593Smuzhiyun 	while (--end >= bf && isspace(*end))
291*4882a593Smuzhiyun 		;
292*4882a593Smuzhiyun 	if (end - bf >= SMC_MAX_PNETID_LEN)
293*4882a593Smuzhiyun 		return false;
294*4882a593Smuzhiyun 	while (bf <= end) {
295*4882a593Smuzhiyun 		if (!isalnum(*bf))
296*4882a593Smuzhiyun 			return false;
297*4882a593Smuzhiyun 		*pnetid++ = islower(*bf) ? toupper(*bf) : *bf;
298*4882a593Smuzhiyun 		bf++;
299*4882a593Smuzhiyun 	}
300*4882a593Smuzhiyun 	*pnetid = '\0';
301*4882a593Smuzhiyun 	return true;
302*4882a593Smuzhiyun }
303*4882a593Smuzhiyun 
304*4882a593Smuzhiyun /* Find an infiniband device by a given name. The device might not exist. */
smc_pnet_find_ib(char * ib_name)305*4882a593Smuzhiyun static struct smc_ib_device *smc_pnet_find_ib(char *ib_name)
306*4882a593Smuzhiyun {
307*4882a593Smuzhiyun 	struct smc_ib_device *ibdev;
308*4882a593Smuzhiyun 
309*4882a593Smuzhiyun 	mutex_lock(&smc_ib_devices.mutex);
310*4882a593Smuzhiyun 	list_for_each_entry(ibdev, &smc_ib_devices.list, list) {
311*4882a593Smuzhiyun 		if (!strncmp(ibdev->ibdev->name, ib_name,
312*4882a593Smuzhiyun 			     sizeof(ibdev->ibdev->name)) ||
313*4882a593Smuzhiyun 		    (ibdev->ibdev->dev.parent &&
314*4882a593Smuzhiyun 		     !strncmp(dev_name(ibdev->ibdev->dev.parent), ib_name,
315*4882a593Smuzhiyun 			     IB_DEVICE_NAME_MAX - 1))) {
316*4882a593Smuzhiyun 			goto out;
317*4882a593Smuzhiyun 		}
318*4882a593Smuzhiyun 	}
319*4882a593Smuzhiyun 	ibdev = NULL;
320*4882a593Smuzhiyun out:
321*4882a593Smuzhiyun 	mutex_unlock(&smc_ib_devices.mutex);
322*4882a593Smuzhiyun 	return ibdev;
323*4882a593Smuzhiyun }
324*4882a593Smuzhiyun 
325*4882a593Smuzhiyun /* Find an smcd device by a given name. The device might not exist. */
smc_pnet_find_smcd(char * smcd_name)326*4882a593Smuzhiyun static struct smcd_dev *smc_pnet_find_smcd(char *smcd_name)
327*4882a593Smuzhiyun {
328*4882a593Smuzhiyun 	struct smcd_dev *smcd_dev;
329*4882a593Smuzhiyun 
330*4882a593Smuzhiyun 	mutex_lock(&smcd_dev_list.mutex);
331*4882a593Smuzhiyun 	list_for_each_entry(smcd_dev, &smcd_dev_list.list, list) {
332*4882a593Smuzhiyun 		if (!strncmp(dev_name(&smcd_dev->dev), smcd_name,
333*4882a593Smuzhiyun 			     IB_DEVICE_NAME_MAX - 1))
334*4882a593Smuzhiyun 			goto out;
335*4882a593Smuzhiyun 	}
336*4882a593Smuzhiyun 	smcd_dev = NULL;
337*4882a593Smuzhiyun out:
338*4882a593Smuzhiyun 	mutex_unlock(&smcd_dev_list.mutex);
339*4882a593Smuzhiyun 	return smcd_dev;
340*4882a593Smuzhiyun }
341*4882a593Smuzhiyun 
smc_pnet_add_eth(struct smc_pnettable * pnettable,struct net * net,char * eth_name,char * pnet_name)342*4882a593Smuzhiyun static int smc_pnet_add_eth(struct smc_pnettable *pnettable, struct net *net,
343*4882a593Smuzhiyun 			    char *eth_name, char *pnet_name)
344*4882a593Smuzhiyun {
345*4882a593Smuzhiyun 	struct smc_pnetentry *tmp_pe, *new_pe;
346*4882a593Smuzhiyun 	struct net_device *ndev, *base_ndev;
347*4882a593Smuzhiyun 	u8 ndev_pnetid[SMC_MAX_PNETID_LEN];
348*4882a593Smuzhiyun 	bool new_netdev;
349*4882a593Smuzhiyun 	int rc;
350*4882a593Smuzhiyun 
351*4882a593Smuzhiyun 	/* check if (base) netdev already has a pnetid. If there is one, we do
352*4882a593Smuzhiyun 	 * not want to add a pnet table entry
353*4882a593Smuzhiyun 	 */
354*4882a593Smuzhiyun 	rc = -EEXIST;
355*4882a593Smuzhiyun 	ndev = dev_get_by_name(net, eth_name);	/* dev_hold() */
356*4882a593Smuzhiyun 	if (ndev) {
357*4882a593Smuzhiyun 		base_ndev = pnet_find_base_ndev(ndev);
358*4882a593Smuzhiyun 		if (!smc_pnetid_by_dev_port(base_ndev->dev.parent,
359*4882a593Smuzhiyun 					    base_ndev->dev_port, ndev_pnetid))
360*4882a593Smuzhiyun 			goto out_put;
361*4882a593Smuzhiyun 	}
362*4882a593Smuzhiyun 
363*4882a593Smuzhiyun 	/* add a new netdev entry to the pnet table if there isn't one */
364*4882a593Smuzhiyun 	rc = -ENOMEM;
365*4882a593Smuzhiyun 	new_pe = kzalloc(sizeof(*new_pe), GFP_KERNEL);
366*4882a593Smuzhiyun 	if (!new_pe)
367*4882a593Smuzhiyun 		goto out_put;
368*4882a593Smuzhiyun 	new_pe->type = SMC_PNET_ETH;
369*4882a593Smuzhiyun 	memcpy(new_pe->pnet_name, pnet_name, SMC_MAX_PNETID_LEN);
370*4882a593Smuzhiyun 	strncpy(new_pe->eth_name, eth_name, IFNAMSIZ);
371*4882a593Smuzhiyun 	new_pe->ndev = ndev;
372*4882a593Smuzhiyun 
373*4882a593Smuzhiyun 	rc = -EEXIST;
374*4882a593Smuzhiyun 	new_netdev = true;
375*4882a593Smuzhiyun 	mutex_lock(&pnettable->lock);
376*4882a593Smuzhiyun 	list_for_each_entry(tmp_pe, &pnettable->pnetlist, list) {
377*4882a593Smuzhiyun 		if (tmp_pe->type == SMC_PNET_ETH &&
378*4882a593Smuzhiyun 		    !strncmp(tmp_pe->eth_name, eth_name, IFNAMSIZ)) {
379*4882a593Smuzhiyun 			new_netdev = false;
380*4882a593Smuzhiyun 			break;
381*4882a593Smuzhiyun 		}
382*4882a593Smuzhiyun 	}
383*4882a593Smuzhiyun 	if (new_netdev) {
384*4882a593Smuzhiyun 		list_add_tail(&new_pe->list, &pnettable->pnetlist);
385*4882a593Smuzhiyun 		mutex_unlock(&pnettable->lock);
386*4882a593Smuzhiyun 	} else {
387*4882a593Smuzhiyun 		mutex_unlock(&pnettable->lock);
388*4882a593Smuzhiyun 		kfree(new_pe);
389*4882a593Smuzhiyun 		goto out_put;
390*4882a593Smuzhiyun 	}
391*4882a593Smuzhiyun 	if (ndev)
392*4882a593Smuzhiyun 		pr_warn_ratelimited("smc: net device %s "
393*4882a593Smuzhiyun 				    "applied user defined pnetid %.16s\n",
394*4882a593Smuzhiyun 				    new_pe->eth_name, new_pe->pnet_name);
395*4882a593Smuzhiyun 	return 0;
396*4882a593Smuzhiyun 
397*4882a593Smuzhiyun out_put:
398*4882a593Smuzhiyun 	if (ndev)
399*4882a593Smuzhiyun 		dev_put(ndev);
400*4882a593Smuzhiyun 	return rc;
401*4882a593Smuzhiyun }
402*4882a593Smuzhiyun 
/* Add an IB entry (@ib_name, @ib_port -> @pnet_name) to @pnettable.
 *
 * The pnetid is first applied to an ib device and an smcd device found
 * under @ib_name. If such a device exists but already has a pnetid, no
 * table entry is added.
 *
 * Returns 0 on success, -EEXIST if applying failed or the table already
 * holds an IB entry with the same name, -ENOMEM if the entry cannot be
 * allocated.
 */
static int smc_pnet_add_ib(struct smc_pnettable *pnettable, char *ib_name,
			   u8 ib_port, char *pnet_name)
{
	struct smc_pnetentry *pe, *new_pe;
	struct smc_ib_device *ib_dev;
	struct smcd_dev *smcd;
	bool ib_ok = true;	/* stays true if no ib device is found */
	bool smcd_ok = true;	/* stays true if no smcd device is found */
	bool duplicate = false;

	/* try to apply the pnetid to devices that are present */
	ib_dev = smc_pnet_find_ib(ib_name);
	if (ib_dev) {
		ib_ok = smc_pnet_apply_ib(ib_dev, ib_port, pnet_name);
		if (ib_ok)
			pr_warn_ratelimited("smc: ib device %s ibport %d applied user defined pnetid %.16s\n",
					    ib_dev->ibdev->name, ib_port,
					    ib_dev->pnetid[ib_port - 1]);
	}
	smcd = smc_pnet_find_smcd(ib_name);
	if (smcd) {
		smcd_ok = smc_pnet_apply_smcd(smcd, pnet_name);
		if (smcd_ok)
			pr_warn_ratelimited("smc: smcd device %s applied user defined pnetid %.16s\n",
					    dev_name(&smcd->dev), smcd->pnetid);
	}

	/* a device that already carries a pnetid does not get a table entry */
	if (!ib_ok || !smcd_ok)
		return -EEXIST;

	new_pe = kzalloc(sizeof(*new_pe), GFP_KERNEL);
	if (!new_pe)
		return -ENOMEM;
	new_pe->type = SMC_PNET_IB;
	memcpy(new_pe->pnet_name, pnet_name, SMC_MAX_PNETID_LEN);
	strncpy(new_pe->ib_name, ib_name, IB_DEVICE_NAME_MAX);
	new_pe->ib_port = ib_port;

	/* only one IB entry per device name */
	mutex_lock(&pnettable->lock);
	list_for_each_entry(pe, &pnettable->pnetlist, list) {
		if (pe->type != SMC_PNET_IB)
			continue;
		if (!strncmp(pe->ib_name, ib_name, IB_DEVICE_NAME_MAX)) {
			duplicate = true;
			break;
		}
	}
	if (!duplicate)
		list_add_tail(&new_pe->list, &pnettable->pnetlist);
	mutex_unlock(&pnettable->lock);

	if (duplicate) {
		kfree(new_pe);
		return -EEXIST;
	}
	return 0;
}
466*4882a593Smuzhiyun 
467*4882a593Smuzhiyun /* Append a pnetid to the end of the pnet table if not already on this list.
468*4882a593Smuzhiyun  */
smc_pnet_enter(struct net * net,struct nlattr * tb[])469*4882a593Smuzhiyun static int smc_pnet_enter(struct net *net, struct nlattr *tb[])
470*4882a593Smuzhiyun {
471*4882a593Smuzhiyun 	char pnet_name[SMC_MAX_PNETID_LEN + 1];
472*4882a593Smuzhiyun 	struct smc_pnettable *pnettable;
473*4882a593Smuzhiyun 	bool new_netdev = false;
474*4882a593Smuzhiyun 	bool new_ibdev = false;
475*4882a593Smuzhiyun 	struct smc_net *sn;
476*4882a593Smuzhiyun 	u8 ibport = 1;
477*4882a593Smuzhiyun 	char *string;
478*4882a593Smuzhiyun 	int rc;
479*4882a593Smuzhiyun 
480*4882a593Smuzhiyun 	/* get pnettable for namespace */
481*4882a593Smuzhiyun 	sn = net_generic(net, smc_net_id);
482*4882a593Smuzhiyun 	pnettable = &sn->pnettable;
483*4882a593Smuzhiyun 
484*4882a593Smuzhiyun 	rc = -EINVAL;
485*4882a593Smuzhiyun 	if (!tb[SMC_PNETID_NAME])
486*4882a593Smuzhiyun 		goto error;
487*4882a593Smuzhiyun 	string = (char *)nla_data(tb[SMC_PNETID_NAME]);
488*4882a593Smuzhiyun 	if (!smc_pnetid_valid(string, pnet_name))
489*4882a593Smuzhiyun 		goto error;
490*4882a593Smuzhiyun 
491*4882a593Smuzhiyun 	if (tb[SMC_PNETID_ETHNAME]) {
492*4882a593Smuzhiyun 		string = (char *)nla_data(tb[SMC_PNETID_ETHNAME]);
493*4882a593Smuzhiyun 		rc = smc_pnet_add_eth(pnettable, net, string, pnet_name);
494*4882a593Smuzhiyun 		if (!rc)
495*4882a593Smuzhiyun 			new_netdev = true;
496*4882a593Smuzhiyun 		else if (rc != -EEXIST)
497*4882a593Smuzhiyun 			goto error;
498*4882a593Smuzhiyun 	}
499*4882a593Smuzhiyun 
500*4882a593Smuzhiyun 	/* if this is not the initial namespace, stop here */
501*4882a593Smuzhiyun 	if (net != &init_net)
502*4882a593Smuzhiyun 		return new_netdev ? 0 : -EEXIST;
503*4882a593Smuzhiyun 
504*4882a593Smuzhiyun 	rc = -EINVAL;
505*4882a593Smuzhiyun 	if (tb[SMC_PNETID_IBNAME]) {
506*4882a593Smuzhiyun 		string = (char *)nla_data(tb[SMC_PNETID_IBNAME]);
507*4882a593Smuzhiyun 		string = strim(string);
508*4882a593Smuzhiyun 		if (tb[SMC_PNETID_IBPORT]) {
509*4882a593Smuzhiyun 			ibport = nla_get_u8(tb[SMC_PNETID_IBPORT]);
510*4882a593Smuzhiyun 			if (ibport < 1 || ibport > SMC_MAX_PORTS)
511*4882a593Smuzhiyun 				goto error;
512*4882a593Smuzhiyun 		}
513*4882a593Smuzhiyun 		rc = smc_pnet_add_ib(pnettable, string, ibport, pnet_name);
514*4882a593Smuzhiyun 		if (!rc)
515*4882a593Smuzhiyun 			new_ibdev = true;
516*4882a593Smuzhiyun 		else if (rc != -EEXIST)
517*4882a593Smuzhiyun 			goto error;
518*4882a593Smuzhiyun 	}
519*4882a593Smuzhiyun 	return (new_netdev || new_ibdev) ? 0 : -EEXIST;
520*4882a593Smuzhiyun 
521*4882a593Smuzhiyun error:
522*4882a593Smuzhiyun 	return rc;
523*4882a593Smuzhiyun }
524*4882a593Smuzhiyun 
525*4882a593Smuzhiyun /* Convert an smc_pnetentry to a netlink attribute sequence */
smc_pnet_set_nla(struct sk_buff * msg,struct smc_pnetentry * pnetelem)526*4882a593Smuzhiyun static int smc_pnet_set_nla(struct sk_buff *msg,
527*4882a593Smuzhiyun 			    struct smc_pnetentry *pnetelem)
528*4882a593Smuzhiyun {
529*4882a593Smuzhiyun 	if (nla_put_string(msg, SMC_PNETID_NAME, pnetelem->pnet_name))
530*4882a593Smuzhiyun 		return -1;
531*4882a593Smuzhiyun 	if (pnetelem->type == SMC_PNET_ETH) {
532*4882a593Smuzhiyun 		if (nla_put_string(msg, SMC_PNETID_ETHNAME,
533*4882a593Smuzhiyun 				   pnetelem->eth_name))
534*4882a593Smuzhiyun 			return -1;
535*4882a593Smuzhiyun 	} else {
536*4882a593Smuzhiyun 		if (nla_put_string(msg, SMC_PNETID_ETHNAME, "n/a"))
537*4882a593Smuzhiyun 			return -1;
538*4882a593Smuzhiyun 	}
539*4882a593Smuzhiyun 	if (pnetelem->type == SMC_PNET_IB) {
540*4882a593Smuzhiyun 		if (nla_put_string(msg, SMC_PNETID_IBNAME, pnetelem->ib_name) ||
541*4882a593Smuzhiyun 		    nla_put_u8(msg, SMC_PNETID_IBPORT, pnetelem->ib_port))
542*4882a593Smuzhiyun 			return -1;
543*4882a593Smuzhiyun 	} else {
544*4882a593Smuzhiyun 		if (nla_put_string(msg, SMC_PNETID_IBNAME, "n/a") ||
545*4882a593Smuzhiyun 		    nla_put_u8(msg, SMC_PNETID_IBPORT, 0xff))
546*4882a593Smuzhiyun 			return -1;
547*4882a593Smuzhiyun 	}
548*4882a593Smuzhiyun 
549*4882a593Smuzhiyun 	return 0;
550*4882a593Smuzhiyun }
551*4882a593Smuzhiyun 
smc_pnet_add(struct sk_buff * skb,struct genl_info * info)552*4882a593Smuzhiyun static int smc_pnet_add(struct sk_buff *skb, struct genl_info *info)
553*4882a593Smuzhiyun {
554*4882a593Smuzhiyun 	struct net *net = genl_info_net(info);
555*4882a593Smuzhiyun 
556*4882a593Smuzhiyun 	return smc_pnet_enter(net, info->attrs);
557*4882a593Smuzhiyun }
558*4882a593Smuzhiyun 
smc_pnet_del(struct sk_buff * skb,struct genl_info * info)559*4882a593Smuzhiyun static int smc_pnet_del(struct sk_buff *skb, struct genl_info *info)
560*4882a593Smuzhiyun {
561*4882a593Smuzhiyun 	struct net *net = genl_info_net(info);
562*4882a593Smuzhiyun 
563*4882a593Smuzhiyun 	if (!info->attrs[SMC_PNETID_NAME])
564*4882a593Smuzhiyun 		return -EINVAL;
565*4882a593Smuzhiyun 	return smc_pnet_remove_by_pnetid(net,
566*4882a593Smuzhiyun 				(char *)nla_data(info->attrs[SMC_PNETID_NAME]));
567*4882a593Smuzhiyun }
568*4882a593Smuzhiyun 
smc_pnet_dump_start(struct netlink_callback * cb)569*4882a593Smuzhiyun static int smc_pnet_dump_start(struct netlink_callback *cb)
570*4882a593Smuzhiyun {
571*4882a593Smuzhiyun 	cb->args[0] = 0;
572*4882a593Smuzhiyun 	return 0;
573*4882a593Smuzhiyun }
574*4882a593Smuzhiyun 
/* Write one SMC_PNETID_GET message describing @pnetelem into @skb.
 *
 * Returns 0 on success, -ENOMEM if the message header cannot be added, or
 * -EMSGSIZE if the attributes cannot be added (the partial message is
 * cancelled in that case).
 */
static int smc_pnet_dumpinfo(struct sk_buff *skb,
			     u32 portid, u32 seq, u32 flags,
			     struct smc_pnetentry *pnetelem)
{
	void *hdr = genlmsg_put(skb, portid, seq, &smc_pnet_nl_family,
				flags, SMC_PNETID_GET);

	if (!hdr)
		return -ENOMEM;

	if (smc_pnet_set_nla(skb, pnetelem) >= 0) {
		genlmsg_end(skb, hdr);
		return 0;
	}

	genlmsg_cancel(skb, hdr);
	return -EMSGSIZE;
}
592*4882a593Smuzhiyun 
/* Dump the pnet table entries of @net into @skb.
 *
 * With a non-NULL @pnetid only entries matching that pnetid are considered.
 * The first @start_idx considered entries are skipped. Outside the initial
 * namespace only ETH entries are emitted.
 *
 * Returns the index at which a follow-up call should resume.
 */
static int _smc_pnet_dump(struct net *net, struct sk_buff *skb, u32 portid,
			  u32 seq, u8 *pnetid, int start_idx)
{
	struct smc_net *sn = net_generic(net, smc_net_id);
	struct smc_pnettable *pnettable = &sn->pnettable;
	struct smc_pnetentry *pe;
	int idx = 0;

	mutex_lock(&pnettable->lock);
	list_for_each_entry(pe, &pnettable->pnetlist, list) {
		if (pnetid && !smc_pnet_match(pe->pnet_name, pnetid))
			continue;

		/* count the entry, then skip it if it lies before the start */
		idx++;
		if (idx <= start_idx)
			continue;

		if (pe->type != SMC_PNET_ETH && net != &init_net)
			continue;

		if (smc_pnet_dumpinfo(skb, portid, seq, NLM_F_MULTI, pe)) {
			/* entry was not written; resume with it next time */
			idx--;
			break;
		}
	}
	mutex_unlock(&pnettable->lock);

	return idx;
}
624*4882a593Smuzhiyun 
smc_pnet_dump(struct sk_buff * skb,struct netlink_callback * cb)625*4882a593Smuzhiyun static int smc_pnet_dump(struct sk_buff *skb, struct netlink_callback *cb)
626*4882a593Smuzhiyun {
627*4882a593Smuzhiyun 	struct net *net = sock_net(skb->sk);
628*4882a593Smuzhiyun 	int idx;
629*4882a593Smuzhiyun 
630*4882a593Smuzhiyun 	idx = _smc_pnet_dump(net, skb, NETLINK_CB(cb->skb).portid,
631*4882a593Smuzhiyun 			     cb->nlh->nlmsg_seq, NULL, cb->args[0]);
632*4882a593Smuzhiyun 
633*4882a593Smuzhiyun 	cb->args[0] = idx;
634*4882a593Smuzhiyun 	return skb->len;
635*4882a593Smuzhiyun }
636*4882a593Smuzhiyun 
637*4882a593Smuzhiyun /* Retrieve one PNETID entry */
smc_pnet_get(struct sk_buff * skb,struct genl_info * info)638*4882a593Smuzhiyun static int smc_pnet_get(struct sk_buff *skb, struct genl_info *info)
639*4882a593Smuzhiyun {
640*4882a593Smuzhiyun 	struct net *net = genl_info_net(info);
641*4882a593Smuzhiyun 	struct sk_buff *msg;
642*4882a593Smuzhiyun 	void *hdr;
643*4882a593Smuzhiyun 
644*4882a593Smuzhiyun 	if (!info->attrs[SMC_PNETID_NAME])
645*4882a593Smuzhiyun 		return -EINVAL;
646*4882a593Smuzhiyun 
647*4882a593Smuzhiyun 	msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
648*4882a593Smuzhiyun 	if (!msg)
649*4882a593Smuzhiyun 		return -ENOMEM;
650*4882a593Smuzhiyun 
651*4882a593Smuzhiyun 	_smc_pnet_dump(net, msg, info->snd_portid, info->snd_seq,
652*4882a593Smuzhiyun 		       nla_data(info->attrs[SMC_PNETID_NAME]), 0);
653*4882a593Smuzhiyun 
654*4882a593Smuzhiyun 	/* finish multi part message and send it */
655*4882a593Smuzhiyun 	hdr = nlmsg_put(msg, info->snd_portid, info->snd_seq, NLMSG_DONE, 0,
656*4882a593Smuzhiyun 			NLM_F_MULTI);
657*4882a593Smuzhiyun 	if (!hdr) {
658*4882a593Smuzhiyun 		nlmsg_free(msg);
659*4882a593Smuzhiyun 		return -EMSGSIZE;
660*4882a593Smuzhiyun 	}
661*4882a593Smuzhiyun 	return genlmsg_reply(msg, info);
662*4882a593Smuzhiyun }
663*4882a593Smuzhiyun 
664*4882a593Smuzhiyun /* Remove and delete all pnetids from pnet table.
665*4882a593Smuzhiyun  */
smc_pnet_flush(struct sk_buff * skb,struct genl_info * info)666*4882a593Smuzhiyun static int smc_pnet_flush(struct sk_buff *skb, struct genl_info *info)
667*4882a593Smuzhiyun {
668*4882a593Smuzhiyun 	struct net *net = genl_info_net(info);
669*4882a593Smuzhiyun 
670*4882a593Smuzhiyun 	smc_pnet_remove_by_pnetid(net, NULL);
671*4882a593Smuzhiyun 	return 0;
672*4882a593Smuzhiyun }
673*4882a593Smuzhiyun 
674*4882a593Smuzhiyun /* SMC_PNETID generic netlink operation definition */
675*4882a593Smuzhiyun static const struct genl_ops smc_pnet_ops[] = {
676*4882a593Smuzhiyun 	{
677*4882a593Smuzhiyun 		.cmd = SMC_PNETID_GET,
678*4882a593Smuzhiyun 		.validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
679*4882a593Smuzhiyun 		/* can be retrieved by unprivileged users */
680*4882a593Smuzhiyun 		.doit = smc_pnet_get,
681*4882a593Smuzhiyun 		.dumpit = smc_pnet_dump,
682*4882a593Smuzhiyun 		.start = smc_pnet_dump_start
683*4882a593Smuzhiyun 	},
684*4882a593Smuzhiyun 	{
685*4882a593Smuzhiyun 		.cmd = SMC_PNETID_ADD,
686*4882a593Smuzhiyun 		.validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
687*4882a593Smuzhiyun 		.flags = GENL_ADMIN_PERM,
688*4882a593Smuzhiyun 		.doit = smc_pnet_add
689*4882a593Smuzhiyun 	},
690*4882a593Smuzhiyun 	{
691*4882a593Smuzhiyun 		.cmd = SMC_PNETID_DEL,
692*4882a593Smuzhiyun 		.validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
693*4882a593Smuzhiyun 		.flags = GENL_ADMIN_PERM,
694*4882a593Smuzhiyun 		.doit = smc_pnet_del
695*4882a593Smuzhiyun 	},
696*4882a593Smuzhiyun 	{
697*4882a593Smuzhiyun 		.cmd = SMC_PNETID_FLUSH,
698*4882a593Smuzhiyun 		.validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
699*4882a593Smuzhiyun 		.flags = GENL_ADMIN_PERM,
700*4882a593Smuzhiyun 		.doit = smc_pnet_flush
701*4882a593Smuzhiyun 	}
702*4882a593Smuzhiyun };
703*4882a593Smuzhiyun 
704*4882a593Smuzhiyun /* SMC_PNETID family definition */
705*4882a593Smuzhiyun static struct genl_family smc_pnet_nl_family __ro_after_init = {
706*4882a593Smuzhiyun 	.hdrsize = 0,
707*4882a593Smuzhiyun 	.name = SMCR_GENL_FAMILY_NAME,
708*4882a593Smuzhiyun 	.version = SMCR_GENL_FAMILY_VERSION,
709*4882a593Smuzhiyun 	.maxattr = SMC_PNETID_MAX,
710*4882a593Smuzhiyun 	.policy = smc_pnet_policy,
711*4882a593Smuzhiyun 	.netnsok = true,
712*4882a593Smuzhiyun 	.module = THIS_MODULE,
713*4882a593Smuzhiyun 	.ops = smc_pnet_ops,
714*4882a593Smuzhiyun 	.n_ops =  ARRAY_SIZE(smc_pnet_ops)
715*4882a593Smuzhiyun };
716*4882a593Smuzhiyun 
smc_pnet_is_ndev_pnetid(struct net * net,u8 * pnetid)717*4882a593Smuzhiyun bool smc_pnet_is_ndev_pnetid(struct net *net, u8 *pnetid)
718*4882a593Smuzhiyun {
719*4882a593Smuzhiyun 	struct smc_net *sn = net_generic(net, smc_net_id);
720*4882a593Smuzhiyun 	struct smc_pnetids_ndev_entry *pe;
721*4882a593Smuzhiyun 	bool rc = false;
722*4882a593Smuzhiyun 
723*4882a593Smuzhiyun 	read_lock(&sn->pnetids_ndev.lock);
724*4882a593Smuzhiyun 	list_for_each_entry(pe, &sn->pnetids_ndev.list, list) {
725*4882a593Smuzhiyun 		if (smc_pnet_match(pnetid, pe->pnetid)) {
726*4882a593Smuzhiyun 			rc = true;
727*4882a593Smuzhiyun 			goto unlock;
728*4882a593Smuzhiyun 		}
729*4882a593Smuzhiyun 	}
730*4882a593Smuzhiyun 
731*4882a593Smuzhiyun unlock:
732*4882a593Smuzhiyun 	read_unlock(&sn->pnetids_ndev.lock);
733*4882a593Smuzhiyun 	return rc;
734*4882a593Smuzhiyun }
735*4882a593Smuzhiyun 
/* Add @pnetid to the list of netdevice pnetids of namespace @net.
 * If the pnetid is already listed, only the reference count of the existing
 * entry is incremented; otherwise a new entry with reference count 1 is
 * appended.
 * Returns 0 on success, -ENOMEM if the new entry cannot be allocated.
 */
static int smc_pnet_add_pnetid(struct net *net, u8 *pnetid)
{
	struct smc_net *sn = net_generic(net, smc_net_id);
	struct smc_pnetids_ndev_entry *pe, *pi;

	/* allocate the candidate entry before taking the write lock */
	pe = kzalloc(sizeof(*pe), GFP_KERNEL);
	if (!pe)
		return -ENOMEM;

	write_lock(&sn->pnetids_ndev.lock);
	list_for_each_entry(pi, &sn->pnetids_ndev.list, list) {
		/* compare with the listed entry (pi), not with the new and
		 * still zero-filled entry (pe), which would never match and
		 * lead to duplicate list entries
		 */
		if (smc_pnet_match(pnetid, pi->pnetid)) {
			refcount_inc(&pi->refcnt);
			kfree(pe);
			goto unlock;
		}
	}
	/* not listed yet: initialize the new entry and append it */
	refcount_set(&pe->refcnt, 1);
	memcpy(pe->pnetid, pnetid, SMC_MAX_PNETID_LEN);
	list_add_tail(&pe->list, &sn->pnetids_ndev.list);

unlock:
	write_unlock(&sn->pnetids_ndev.lock);
	return 0;
}
761*4882a593Smuzhiyun 
/* Drop one reference on the entry for @pnetid in the list of netdevice
 * pnetids of namespace @net. The entry is unlinked and freed when its last
 * reference goes away. Only the first matching entry is considered.
 */
static void smc_pnet_remove_pnetid(struct net *net, u8 *pnetid)
{
	struct smc_net *sn = net_generic(net, smc_net_id);
	struct smc_pnetids_ndev_entry *cur, *next;

	write_lock(&sn->pnetids_ndev.lock);
	list_for_each_entry_safe(cur, next, &sn->pnetids_ndev.list, list) {
		if (!smc_pnet_match(pnetid, cur->pnetid))
			continue;

		if (refcount_dec_and_test(&cur->refcnt)) {
			list_del(&cur->list);
			kfree(cur);
		}
		break;
	}
	write_unlock(&sn->pnetids_ndev.lock);
}
779*4882a593Smuzhiyun 
/* Look up the base device of @dev and, if that device is up and a pnetid
 * can be determined for its parent device and port, add this pnetid to the
 * list of netdevice pnetids of @net.
 * @ndev_pnetid is a caller provided buffer that receives the pnetid.
 */
static void smc_pnet_add_base_pnetid(struct net *net, struct net_device *dev,
				     u8 *ndev_pnetid)
{
	struct net_device *base = __pnet_find_base_ndev(dev);

	if (!(base->flags & IFF_UP))
		return;
	/* non-zero return: no pnetid available for this device port */
	if (smc_pnetid_by_dev_port(base->dev.parent, base->dev_port,
				   ndev_pnetid))
		return;

	/* add to PNETIDs list */
	smc_pnet_add_pnetid(net, ndev_pnetid);
}
793*4882a593Smuzhiyun 
794*4882a593Smuzhiyun /* create initial list of netdevice pnetids */
smc_pnet_create_pnetids_list(struct net * net)795*4882a593Smuzhiyun static void smc_pnet_create_pnetids_list(struct net *net)
796*4882a593Smuzhiyun {
797*4882a593Smuzhiyun 	u8 ndev_pnetid[SMC_MAX_PNETID_LEN];
798*4882a593Smuzhiyun 	struct net_device *dev;
799*4882a593Smuzhiyun 
800*4882a593Smuzhiyun 	rtnl_lock();
801*4882a593Smuzhiyun 	for_each_netdev(net, dev)
802*4882a593Smuzhiyun 		smc_pnet_add_base_pnetid(net, dev, ndev_pnetid);
803*4882a593Smuzhiyun 	rtnl_unlock();
804*4882a593Smuzhiyun }
805*4882a593Smuzhiyun 
806*4882a593Smuzhiyun /* clean up list of netdevice pnetids */
smc_pnet_destroy_pnetids_list(struct net * net)807*4882a593Smuzhiyun static void smc_pnet_destroy_pnetids_list(struct net *net)
808*4882a593Smuzhiyun {
809*4882a593Smuzhiyun 	struct smc_net *sn = net_generic(net, smc_net_id);
810*4882a593Smuzhiyun 	struct smc_pnetids_ndev_entry *pe, *temp_pe;
811*4882a593Smuzhiyun 
812*4882a593Smuzhiyun 	write_lock(&sn->pnetids_ndev.lock);
813*4882a593Smuzhiyun 	list_for_each_entry_safe(pe, temp_pe, &sn->pnetids_ndev.list, list) {
814*4882a593Smuzhiyun 		list_del(&pe->list);
815*4882a593Smuzhiyun 		kfree(pe);
816*4882a593Smuzhiyun 	}
817*4882a593Smuzhiyun 	write_unlock(&sn->pnetids_ndev.lock);
818*4882a593Smuzhiyun }
819*4882a593Smuzhiyun 
smc_pnet_netdev_event(struct notifier_block * this,unsigned long event,void * ptr)820*4882a593Smuzhiyun static int smc_pnet_netdev_event(struct notifier_block *this,
821*4882a593Smuzhiyun 				 unsigned long event, void *ptr)
822*4882a593Smuzhiyun {
823*4882a593Smuzhiyun 	struct net_device *event_dev = netdev_notifier_info_to_dev(ptr);
824*4882a593Smuzhiyun 	struct net *net = dev_net(event_dev);
825*4882a593Smuzhiyun 	u8 ndev_pnetid[SMC_MAX_PNETID_LEN];
826*4882a593Smuzhiyun 
827*4882a593Smuzhiyun 	switch (event) {
828*4882a593Smuzhiyun 	case NETDEV_REBOOT:
829*4882a593Smuzhiyun 	case NETDEV_UNREGISTER:
830*4882a593Smuzhiyun 		smc_pnet_remove_by_ndev(event_dev);
831*4882a593Smuzhiyun 		return NOTIFY_OK;
832*4882a593Smuzhiyun 	case NETDEV_REGISTER:
833*4882a593Smuzhiyun 		smc_pnet_add_by_ndev(event_dev);
834*4882a593Smuzhiyun 		return NOTIFY_OK;
835*4882a593Smuzhiyun 	case NETDEV_UP:
836*4882a593Smuzhiyun 		smc_pnet_add_base_pnetid(net, event_dev, ndev_pnetid);
837*4882a593Smuzhiyun 		return NOTIFY_OK;
838*4882a593Smuzhiyun 	case NETDEV_DOWN:
839*4882a593Smuzhiyun 		event_dev = __pnet_find_base_ndev(event_dev);
840*4882a593Smuzhiyun 		if (!smc_pnetid_by_dev_port(event_dev->dev.parent,
841*4882a593Smuzhiyun 					    event_dev->dev_port, ndev_pnetid)) {
842*4882a593Smuzhiyun 			/* remove from PNETIDs list */
843*4882a593Smuzhiyun 			smc_pnet_remove_pnetid(net, ndev_pnetid);
844*4882a593Smuzhiyun 		}
845*4882a593Smuzhiyun 		return NOTIFY_OK;
846*4882a593Smuzhiyun 	default:
847*4882a593Smuzhiyun 		return NOTIFY_DONE;
848*4882a593Smuzhiyun 	}
849*4882a593Smuzhiyun }
850*4882a593Smuzhiyun 
851*4882a593Smuzhiyun static struct notifier_block smc_netdev_notifier = {
852*4882a593Smuzhiyun 	.notifier_call = smc_pnet_netdev_event
853*4882a593Smuzhiyun };
854*4882a593Smuzhiyun 
855*4882a593Smuzhiyun /* init network namespace */
smc_pnet_net_init(struct net * net)856*4882a593Smuzhiyun int smc_pnet_net_init(struct net *net)
857*4882a593Smuzhiyun {
858*4882a593Smuzhiyun 	struct smc_net *sn = net_generic(net, smc_net_id);
859*4882a593Smuzhiyun 	struct smc_pnettable *pnettable = &sn->pnettable;
860*4882a593Smuzhiyun 	struct smc_pnetids_ndev *pnetids_ndev = &sn->pnetids_ndev;
861*4882a593Smuzhiyun 
862*4882a593Smuzhiyun 	INIT_LIST_HEAD(&pnettable->pnetlist);
863*4882a593Smuzhiyun 	mutex_init(&pnettable->lock);
864*4882a593Smuzhiyun 	INIT_LIST_HEAD(&pnetids_ndev->list);
865*4882a593Smuzhiyun 	rwlock_init(&pnetids_ndev->lock);
866*4882a593Smuzhiyun 
867*4882a593Smuzhiyun 	smc_pnet_create_pnetids_list(net);
868*4882a593Smuzhiyun 
869*4882a593Smuzhiyun 	return 0;
870*4882a593Smuzhiyun }
871*4882a593Smuzhiyun 
smc_pnet_init(void)872*4882a593Smuzhiyun int __init smc_pnet_init(void)
873*4882a593Smuzhiyun {
874*4882a593Smuzhiyun 	int rc;
875*4882a593Smuzhiyun 
876*4882a593Smuzhiyun 	rc = genl_register_family(&smc_pnet_nl_family);
877*4882a593Smuzhiyun 	if (rc)
878*4882a593Smuzhiyun 		return rc;
879*4882a593Smuzhiyun 	rc = register_netdevice_notifier(&smc_netdev_notifier);
880*4882a593Smuzhiyun 	if (rc)
881*4882a593Smuzhiyun 		genl_unregister_family(&smc_pnet_nl_family);
882*4882a593Smuzhiyun 
883*4882a593Smuzhiyun 	return rc;
884*4882a593Smuzhiyun }
885*4882a593Smuzhiyun 
886*4882a593Smuzhiyun /* exit network namespace */
smc_pnet_net_exit(struct net * net)887*4882a593Smuzhiyun void smc_pnet_net_exit(struct net *net)
888*4882a593Smuzhiyun {
889*4882a593Smuzhiyun 	/* flush pnet table */
890*4882a593Smuzhiyun 	smc_pnet_remove_by_pnetid(net, NULL);
891*4882a593Smuzhiyun 	smc_pnet_destroy_pnetids_list(net);
892*4882a593Smuzhiyun }
893*4882a593Smuzhiyun 
smc_pnet_exit(void)894*4882a593Smuzhiyun void smc_pnet_exit(void)
895*4882a593Smuzhiyun {
896*4882a593Smuzhiyun 	unregister_netdevice_notifier(&smc_netdev_notifier);
897*4882a593Smuzhiyun 	genl_unregister_family(&smc_pnet_nl_family);
898*4882a593Smuzhiyun }
899*4882a593Smuzhiyun 
__pnet_find_base_ndev(struct net_device * ndev)900*4882a593Smuzhiyun static struct net_device *__pnet_find_base_ndev(struct net_device *ndev)
901*4882a593Smuzhiyun {
902*4882a593Smuzhiyun 	int i, nest_lvl;
903*4882a593Smuzhiyun 
904*4882a593Smuzhiyun 	ASSERT_RTNL();
905*4882a593Smuzhiyun 	nest_lvl = ndev->lower_level;
906*4882a593Smuzhiyun 	for (i = 0; i < nest_lvl; i++) {
907*4882a593Smuzhiyun 		struct list_head *lower = &ndev->adj_list.lower;
908*4882a593Smuzhiyun 
909*4882a593Smuzhiyun 		if (list_empty(lower))
910*4882a593Smuzhiyun 			break;
911*4882a593Smuzhiyun 		lower = lower->next;
912*4882a593Smuzhiyun 		ndev = netdev_lower_get_next(ndev, &lower);
913*4882a593Smuzhiyun 	}
914*4882a593Smuzhiyun 	return ndev;
915*4882a593Smuzhiyun }
916*4882a593Smuzhiyun 
/* Determine one base device for stacked net devices.
 * If the lower device level contains more than one device
 * (for instance with bonding slaves), just the first device
 * is used to reach a base device.
 * Takes and releases the RTNL lock around the lookup.
 */
static struct net_device *pnet_find_base_ndev(struct net_device *ndev)
{
	struct net_device *base;

	rtnl_lock();
	base = __pnet_find_base_ndev(ndev);
	rtnl_unlock();

	return base;
}
929*4882a593Smuzhiyun 
/* Search the pnet table of the namespace @ndev belongs to for an ethernet
 * type entry referring to @ndev and copy its pnet name to @pnetid.
 * Returns 0 if an entry was found, -ENOENT otherwise (@pnetid is left
 * untouched in that case).
 */
static int smc_pnet_find_ndev_pnetid_by_table(struct net_device *ndev,
					      u8 *pnetid)
{
	/* get pnettable for namespace */
	struct smc_net *sn = net_generic(dev_net(ndev), smc_net_id);
	struct smc_pnettable *table = &sn->pnettable;
	struct smc_pnetentry *entry;
	int rc = -ENOENT;

	mutex_lock(&table->lock);
	list_for_each_entry(entry, &table->pnetlist, list) {
		if (entry->type != SMC_PNET_ETH || entry->ndev != ndev)
			continue;

		/* get pnetid of netdev device */
		memcpy(pnetid, entry->pnet_name, SMC_MAX_PNETID_LEN);
		rc = 0;
		break;
	}
	mutex_unlock(&table->lock);

	return rc;
}
955*4882a593Smuzhiyun 
956*4882a593Smuzhiyun /* find a roce device for the given pnetid */
_smc_pnet_find_roce_by_pnetid(u8 * pnet_id,struct smc_init_info * ini,struct smc_ib_device * known_dev)957*4882a593Smuzhiyun static void _smc_pnet_find_roce_by_pnetid(u8 *pnet_id,
958*4882a593Smuzhiyun 					  struct smc_init_info *ini,
959*4882a593Smuzhiyun 					  struct smc_ib_device *known_dev)
960*4882a593Smuzhiyun {
961*4882a593Smuzhiyun 	struct smc_ib_device *ibdev;
962*4882a593Smuzhiyun 	int i;
963*4882a593Smuzhiyun 
964*4882a593Smuzhiyun 	ini->ib_dev = NULL;
965*4882a593Smuzhiyun 	mutex_lock(&smc_ib_devices.mutex);
966*4882a593Smuzhiyun 	list_for_each_entry(ibdev, &smc_ib_devices.list, list) {
967*4882a593Smuzhiyun 		if (ibdev == known_dev)
968*4882a593Smuzhiyun 			continue;
969*4882a593Smuzhiyun 		for (i = 1; i <= SMC_MAX_PORTS; i++) {
970*4882a593Smuzhiyun 			if (!rdma_is_port_valid(ibdev->ibdev, i))
971*4882a593Smuzhiyun 				continue;
972*4882a593Smuzhiyun 			if (smc_pnet_match(ibdev->pnetid[i - 1], pnet_id) &&
973*4882a593Smuzhiyun 			    smc_ib_port_active(ibdev, i) &&
974*4882a593Smuzhiyun 			    !test_bit(i - 1, ibdev->ports_going_away) &&
975*4882a593Smuzhiyun 			    !smc_ib_determine_gid(ibdev, i, ini->vlan_id,
976*4882a593Smuzhiyun 						  ini->ib_gid, NULL)) {
977*4882a593Smuzhiyun 				ini->ib_dev = ibdev;
978*4882a593Smuzhiyun 				ini->ib_port = i;
979*4882a593Smuzhiyun 				goto out;
980*4882a593Smuzhiyun 			}
981*4882a593Smuzhiyun 		}
982*4882a593Smuzhiyun 	}
983*4882a593Smuzhiyun out:
984*4882a593Smuzhiyun 	mutex_unlock(&smc_ib_devices.mutex);
985*4882a593Smuzhiyun }
986*4882a593Smuzhiyun 
987*4882a593Smuzhiyun /* find alternate roce device with same pnet_id and vlan_id */
smc_pnet_find_alt_roce(struct smc_link_group * lgr,struct smc_init_info * ini,struct smc_ib_device * known_dev)988*4882a593Smuzhiyun void smc_pnet_find_alt_roce(struct smc_link_group *lgr,
989*4882a593Smuzhiyun 			    struct smc_init_info *ini,
990*4882a593Smuzhiyun 			    struct smc_ib_device *known_dev)
991*4882a593Smuzhiyun {
992*4882a593Smuzhiyun 	_smc_pnet_find_roce_by_pnetid(lgr->pnet_id, ini, known_dev);
993*4882a593Smuzhiyun }
994*4882a593Smuzhiyun 
995*4882a593Smuzhiyun /* if handshake network device belongs to a roce device, return its
996*4882a593Smuzhiyun  * IB device and port
997*4882a593Smuzhiyun  */
smc_pnet_find_rdma_dev(struct net_device * netdev,struct smc_init_info * ini)998*4882a593Smuzhiyun static void smc_pnet_find_rdma_dev(struct net_device *netdev,
999*4882a593Smuzhiyun 				   struct smc_init_info *ini)
1000*4882a593Smuzhiyun {
1001*4882a593Smuzhiyun 	struct smc_ib_device *ibdev;
1002*4882a593Smuzhiyun 
1003*4882a593Smuzhiyun 	mutex_lock(&smc_ib_devices.mutex);
1004*4882a593Smuzhiyun 	list_for_each_entry(ibdev, &smc_ib_devices.list, list) {
1005*4882a593Smuzhiyun 		struct net_device *ndev;
1006*4882a593Smuzhiyun 		int i;
1007*4882a593Smuzhiyun 
1008*4882a593Smuzhiyun 		for (i = 1; i <= SMC_MAX_PORTS; i++) {
1009*4882a593Smuzhiyun 			if (!rdma_is_port_valid(ibdev->ibdev, i))
1010*4882a593Smuzhiyun 				continue;
1011*4882a593Smuzhiyun 			if (!ibdev->ibdev->ops.get_netdev)
1012*4882a593Smuzhiyun 				continue;
1013*4882a593Smuzhiyun 			ndev = ibdev->ibdev->ops.get_netdev(ibdev->ibdev, i);
1014*4882a593Smuzhiyun 			if (!ndev)
1015*4882a593Smuzhiyun 				continue;
1016*4882a593Smuzhiyun 			dev_put(ndev);
1017*4882a593Smuzhiyun 			if (netdev == ndev &&
1018*4882a593Smuzhiyun 			    smc_ib_port_active(ibdev, i) &&
1019*4882a593Smuzhiyun 			    !test_bit(i - 1, ibdev->ports_going_away) &&
1020*4882a593Smuzhiyun 			    !smc_ib_determine_gid(ibdev, i, ini->vlan_id,
1021*4882a593Smuzhiyun 						  ini->ib_gid, NULL)) {
1022*4882a593Smuzhiyun 				ini->ib_dev = ibdev;
1023*4882a593Smuzhiyun 				ini->ib_port = i;
1024*4882a593Smuzhiyun 				break;
1025*4882a593Smuzhiyun 			}
1026*4882a593Smuzhiyun 		}
1027*4882a593Smuzhiyun 	}
1028*4882a593Smuzhiyun 	mutex_unlock(&smc_ib_devices.mutex);
1029*4882a593Smuzhiyun }
1030*4882a593Smuzhiyun 
1031*4882a593Smuzhiyun /* Determine the corresponding IB device port based on the hardware PNETID.
1032*4882a593Smuzhiyun  * Searching stops at the first matching active IB device port with vlan_id
1033*4882a593Smuzhiyun  * configured.
1034*4882a593Smuzhiyun  * If nothing found, check pnetid table.
1035*4882a593Smuzhiyun  * If nothing found, try to use handshake device
1036*4882a593Smuzhiyun  */
smc_pnet_find_roce_by_pnetid(struct net_device * ndev,struct smc_init_info * ini)1037*4882a593Smuzhiyun static void smc_pnet_find_roce_by_pnetid(struct net_device *ndev,
1038*4882a593Smuzhiyun 					 struct smc_init_info *ini)
1039*4882a593Smuzhiyun {
1040*4882a593Smuzhiyun 	u8 ndev_pnetid[SMC_MAX_PNETID_LEN];
1041*4882a593Smuzhiyun 
1042*4882a593Smuzhiyun 	ndev = pnet_find_base_ndev(ndev);
1043*4882a593Smuzhiyun 	if (smc_pnetid_by_dev_port(ndev->dev.parent, ndev->dev_port,
1044*4882a593Smuzhiyun 				   ndev_pnetid) &&
1045*4882a593Smuzhiyun 	    smc_pnet_find_ndev_pnetid_by_table(ndev, ndev_pnetid)) {
1046*4882a593Smuzhiyun 		smc_pnet_find_rdma_dev(ndev, ini);
1047*4882a593Smuzhiyun 		return; /* pnetid could not be determined */
1048*4882a593Smuzhiyun 	}
1049*4882a593Smuzhiyun 	_smc_pnet_find_roce_by_pnetid(ndev_pnetid, ini, NULL);
1050*4882a593Smuzhiyun }
1051*4882a593Smuzhiyun 
smc_pnet_find_ism_by_pnetid(struct net_device * ndev,struct smc_init_info * ini)1052*4882a593Smuzhiyun static void smc_pnet_find_ism_by_pnetid(struct net_device *ndev,
1053*4882a593Smuzhiyun 					struct smc_init_info *ini)
1054*4882a593Smuzhiyun {
1055*4882a593Smuzhiyun 	u8 ndev_pnetid[SMC_MAX_PNETID_LEN];
1056*4882a593Smuzhiyun 	struct smcd_dev *ismdev;
1057*4882a593Smuzhiyun 
1058*4882a593Smuzhiyun 	ndev = pnet_find_base_ndev(ndev);
1059*4882a593Smuzhiyun 	if (smc_pnetid_by_dev_port(ndev->dev.parent, ndev->dev_port,
1060*4882a593Smuzhiyun 				   ndev_pnetid) &&
1061*4882a593Smuzhiyun 	    smc_pnet_find_ndev_pnetid_by_table(ndev, ndev_pnetid))
1062*4882a593Smuzhiyun 		return; /* pnetid could not be determined */
1063*4882a593Smuzhiyun 
1064*4882a593Smuzhiyun 	mutex_lock(&smcd_dev_list.mutex);
1065*4882a593Smuzhiyun 	list_for_each_entry(ismdev, &smcd_dev_list.list, list) {
1066*4882a593Smuzhiyun 		if (smc_pnet_match(ismdev->pnetid, ndev_pnetid) &&
1067*4882a593Smuzhiyun 		    !ismdev->going_away &&
1068*4882a593Smuzhiyun 		    (!ini->ism_peer_gid[0] ||
1069*4882a593Smuzhiyun 		     !smc_ism_cantalk(ini->ism_peer_gid[0], ini->vlan_id,
1070*4882a593Smuzhiyun 				      ismdev))) {
1071*4882a593Smuzhiyun 			ini->ism_dev[0] = ismdev;
1072*4882a593Smuzhiyun 			break;
1073*4882a593Smuzhiyun 		}
1074*4882a593Smuzhiyun 	}
1075*4882a593Smuzhiyun 	mutex_unlock(&smcd_dev_list.mutex);
1076*4882a593Smuzhiyun }
1077*4882a593Smuzhiyun 
1078*4882a593Smuzhiyun /* PNET table analysis for a given sock:
1079*4882a593Smuzhiyun  * determine ib_device and port belonging to used internal TCP socket
1080*4882a593Smuzhiyun  * ethernet interface.
1081*4882a593Smuzhiyun  */
smc_pnet_find_roce_resource(struct sock * sk,struct smc_init_info * ini)1082*4882a593Smuzhiyun void smc_pnet_find_roce_resource(struct sock *sk, struct smc_init_info *ini)
1083*4882a593Smuzhiyun {
1084*4882a593Smuzhiyun 	struct dst_entry *dst = sk_dst_get(sk);
1085*4882a593Smuzhiyun 
1086*4882a593Smuzhiyun 	ini->ib_dev = NULL;
1087*4882a593Smuzhiyun 	ini->ib_port = 0;
1088*4882a593Smuzhiyun 	if (!dst)
1089*4882a593Smuzhiyun 		goto out;
1090*4882a593Smuzhiyun 	if (!dst->dev)
1091*4882a593Smuzhiyun 		goto out_rel;
1092*4882a593Smuzhiyun 
1093*4882a593Smuzhiyun 	smc_pnet_find_roce_by_pnetid(dst->dev, ini);
1094*4882a593Smuzhiyun 
1095*4882a593Smuzhiyun out_rel:
1096*4882a593Smuzhiyun 	dst_release(dst);
1097*4882a593Smuzhiyun out:
1098*4882a593Smuzhiyun 	return;
1099*4882a593Smuzhiyun }
1100*4882a593Smuzhiyun 
smc_pnet_find_ism_resource(struct sock * sk,struct smc_init_info * ini)1101*4882a593Smuzhiyun void smc_pnet_find_ism_resource(struct sock *sk, struct smc_init_info *ini)
1102*4882a593Smuzhiyun {
1103*4882a593Smuzhiyun 	struct dst_entry *dst = sk_dst_get(sk);
1104*4882a593Smuzhiyun 
1105*4882a593Smuzhiyun 	ini->ism_dev[0] = NULL;
1106*4882a593Smuzhiyun 	if (!dst)
1107*4882a593Smuzhiyun 		goto out;
1108*4882a593Smuzhiyun 	if (!dst->dev)
1109*4882a593Smuzhiyun 		goto out_rel;
1110*4882a593Smuzhiyun 
1111*4882a593Smuzhiyun 	smc_pnet_find_ism_by_pnetid(dst->dev, ini);
1112*4882a593Smuzhiyun 
1113*4882a593Smuzhiyun out_rel:
1114*4882a593Smuzhiyun 	dst_release(dst);
1115*4882a593Smuzhiyun out:
1116*4882a593Smuzhiyun 	return;
1117*4882a593Smuzhiyun }
1118*4882a593Smuzhiyun 
1119*4882a593Smuzhiyun /* Lookup and apply a pnet table entry to the given ib device.
1120*4882a593Smuzhiyun  */
smc_pnetid_by_table_ib(struct smc_ib_device * smcibdev,u8 ib_port)1121*4882a593Smuzhiyun int smc_pnetid_by_table_ib(struct smc_ib_device *smcibdev, u8 ib_port)
1122*4882a593Smuzhiyun {
1123*4882a593Smuzhiyun 	char *ib_name = smcibdev->ibdev->name;
1124*4882a593Smuzhiyun 	struct smc_pnettable *pnettable;
1125*4882a593Smuzhiyun 	struct smc_pnetentry *tmp_pe;
1126*4882a593Smuzhiyun 	struct smc_net *sn;
1127*4882a593Smuzhiyun 	int rc = -ENOENT;
1128*4882a593Smuzhiyun 
1129*4882a593Smuzhiyun 	/* get pnettable for init namespace */
1130*4882a593Smuzhiyun 	sn = net_generic(&init_net, smc_net_id);
1131*4882a593Smuzhiyun 	pnettable = &sn->pnettable;
1132*4882a593Smuzhiyun 
1133*4882a593Smuzhiyun 	mutex_lock(&pnettable->lock);
1134*4882a593Smuzhiyun 	list_for_each_entry(tmp_pe, &pnettable->pnetlist, list) {
1135*4882a593Smuzhiyun 		if (tmp_pe->type == SMC_PNET_IB &&
1136*4882a593Smuzhiyun 		    !strncmp(tmp_pe->ib_name, ib_name, IB_DEVICE_NAME_MAX) &&
1137*4882a593Smuzhiyun 		    tmp_pe->ib_port == ib_port) {
1138*4882a593Smuzhiyun 			smc_pnet_apply_ib(smcibdev, ib_port, tmp_pe->pnet_name);
1139*4882a593Smuzhiyun 			rc = 0;
1140*4882a593Smuzhiyun 			break;
1141*4882a593Smuzhiyun 		}
1142*4882a593Smuzhiyun 	}
1143*4882a593Smuzhiyun 	mutex_unlock(&pnettable->lock);
1144*4882a593Smuzhiyun 
1145*4882a593Smuzhiyun 	return rc;
1146*4882a593Smuzhiyun }
1147*4882a593Smuzhiyun 
1148*4882a593Smuzhiyun /* Lookup and apply a pnet table entry to the given smcd device.
1149*4882a593Smuzhiyun  */
smc_pnetid_by_table_smcd(struct smcd_dev * smcddev)1150*4882a593Smuzhiyun int smc_pnetid_by_table_smcd(struct smcd_dev *smcddev)
1151*4882a593Smuzhiyun {
1152*4882a593Smuzhiyun 	const char *ib_name = dev_name(&smcddev->dev);
1153*4882a593Smuzhiyun 	struct smc_pnettable *pnettable;
1154*4882a593Smuzhiyun 	struct smc_pnetentry *tmp_pe;
1155*4882a593Smuzhiyun 	struct smc_net *sn;
1156*4882a593Smuzhiyun 	int rc = -ENOENT;
1157*4882a593Smuzhiyun 
1158*4882a593Smuzhiyun 	/* get pnettable for init namespace */
1159*4882a593Smuzhiyun 	sn = net_generic(&init_net, smc_net_id);
1160*4882a593Smuzhiyun 	pnettable = &sn->pnettable;
1161*4882a593Smuzhiyun 
1162*4882a593Smuzhiyun 	mutex_lock(&pnettable->lock);
1163*4882a593Smuzhiyun 	list_for_each_entry(tmp_pe, &pnettable->pnetlist, list) {
1164*4882a593Smuzhiyun 		if (tmp_pe->type == SMC_PNET_IB &&
1165*4882a593Smuzhiyun 		    !strncmp(tmp_pe->ib_name, ib_name, IB_DEVICE_NAME_MAX)) {
1166*4882a593Smuzhiyun 			smc_pnet_apply_smcd(smcddev, tmp_pe->pnet_name);
1167*4882a593Smuzhiyun 			rc = 0;
1168*4882a593Smuzhiyun 			break;
1169*4882a593Smuzhiyun 		}
1170*4882a593Smuzhiyun 	}
1171*4882a593Smuzhiyun 	mutex_unlock(&pnettable->lock);
1172*4882a593Smuzhiyun 
1173*4882a593Smuzhiyun 	return rc;
1174*4882a593Smuzhiyun }
1175