xref: /OK3568_Linux_fs/kernel/drivers/infiniband/core/cache.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Copyright (c) 2004 Topspin Communications.  All rights reserved.
3*4882a593Smuzhiyun  * Copyright (c) 2005 Intel Corporation. All rights reserved.
4*4882a593Smuzhiyun  * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
5*4882a593Smuzhiyun  * Copyright (c) 2005 Voltaire, Inc. All rights reserved.
6*4882a593Smuzhiyun  *
7*4882a593Smuzhiyun  * This software is available to you under a choice of one of two
8*4882a593Smuzhiyun  * licenses.  You may choose to be licensed under the terms of the GNU
9*4882a593Smuzhiyun  * General Public License (GPL) Version 2, available from the file
10*4882a593Smuzhiyun  * COPYING in the main directory of this source tree, or the
11*4882a593Smuzhiyun  * OpenIB.org BSD license below:
12*4882a593Smuzhiyun  *
13*4882a593Smuzhiyun  *     Redistribution and use in source and binary forms, with or
14*4882a593Smuzhiyun  *     without modification, are permitted provided that the following
15*4882a593Smuzhiyun  *     conditions are met:
16*4882a593Smuzhiyun  *
17*4882a593Smuzhiyun  *      - Redistributions of source code must retain the above
18*4882a593Smuzhiyun  *        copyright notice, this list of conditions and the following
19*4882a593Smuzhiyun  *        disclaimer.
20*4882a593Smuzhiyun  *
21*4882a593Smuzhiyun  *      - Redistributions in binary form must reproduce the above
22*4882a593Smuzhiyun  *        copyright notice, this list of conditions and the following
23*4882a593Smuzhiyun  *        disclaimer in the documentation and/or other materials
24*4882a593Smuzhiyun  *        provided with the distribution.
25*4882a593Smuzhiyun  *
26*4882a593Smuzhiyun  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
27*4882a593Smuzhiyun  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
28*4882a593Smuzhiyun  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
29*4882a593Smuzhiyun  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
30*4882a593Smuzhiyun  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
31*4882a593Smuzhiyun  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
32*4882a593Smuzhiyun  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
33*4882a593Smuzhiyun  * SOFTWARE.
34*4882a593Smuzhiyun  */
35*4882a593Smuzhiyun 
36*4882a593Smuzhiyun #include <linux/module.h>
37*4882a593Smuzhiyun #include <linux/errno.h>
38*4882a593Smuzhiyun #include <linux/slab.h>
39*4882a593Smuzhiyun #include <linux/workqueue.h>
40*4882a593Smuzhiyun #include <linux/netdevice.h>
41*4882a593Smuzhiyun #include <net/addrconf.h>
42*4882a593Smuzhiyun 
43*4882a593Smuzhiyun #include <rdma/ib_cache.h>
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun #include "core_priv.h"
46*4882a593Smuzhiyun 
47*4882a593Smuzhiyun struct ib_pkey_cache {
48*4882a593Smuzhiyun 	int             table_len;
49*4882a593Smuzhiyun 	u16             table[];
50*4882a593Smuzhiyun };
51*4882a593Smuzhiyun 
52*4882a593Smuzhiyun struct ib_update_work {
53*4882a593Smuzhiyun 	struct work_struct work;
54*4882a593Smuzhiyun 	struct ib_event event;
55*4882a593Smuzhiyun 	bool enforce_security;
56*4882a593Smuzhiyun };
57*4882a593Smuzhiyun 
58*4882a593Smuzhiyun union ib_gid zgid;
59*4882a593Smuzhiyun EXPORT_SYMBOL(zgid);
60*4882a593Smuzhiyun 
/* Bit flags selecting which attributes find_gid() compares. */
enum gid_attr_find_mask {
	/* compare the raw GID value */
	GID_ATTR_FIND_MASK_GID		= 1UL << 0,
	/* compare the associated net_device pointer */
	GID_ATTR_FIND_MASK_NETDEV	= 1UL << 1,
	/* compare whether the slot is a reserved default index */
	GID_ATTR_FIND_MASK_DEFAULT	= 1UL << 2,
	/* compare the GID type */
	GID_ATTR_FIND_MASK_GID_TYPE	= 1UL << 3,
};
67*4882a593Smuzhiyun 
/* Life-cycle state of a GID table entry. */
enum gid_table_entry_state {
	/* State given to a freshly allocated entry by alloc_gid_entry(). */
	GID_TABLE_ENTRY_INVALID		= 1,
	/* Set by store_gid_entry() when the entry is published in the table. */
	GID_TABLE_ENTRY_VALID		= 2,
	/*
	 * The entry is waiting to be removed; it may still have active
	 * users. Once the last user drops its reference, the entry is
	 * detached from the table.
	 */
	GID_TABLE_ENTRY_PENDING_DEL	= 3,
};
79*4882a593Smuzhiyun 
80*4882a593Smuzhiyun struct roce_gid_ndev_storage {
81*4882a593Smuzhiyun 	struct rcu_head rcu_head;
82*4882a593Smuzhiyun 	struct net_device *ndev;
83*4882a593Smuzhiyun };
84*4882a593Smuzhiyun 
85*4882a593Smuzhiyun struct ib_gid_table_entry {
86*4882a593Smuzhiyun 	struct kref			kref;
87*4882a593Smuzhiyun 	struct work_struct		del_work;
88*4882a593Smuzhiyun 	struct ib_gid_attr		attr;
89*4882a593Smuzhiyun 	void				*context;
90*4882a593Smuzhiyun 	/* Store the ndev pointer to release reference later on in
91*4882a593Smuzhiyun 	 * call_rcu context because by that time gid_table_entry
92*4882a593Smuzhiyun 	 * and attr might be already freed. So keep a copy of it.
93*4882a593Smuzhiyun 	 * ndev_storage is freed by rcu callback.
94*4882a593Smuzhiyun 	 */
95*4882a593Smuzhiyun 	struct roce_gid_ndev_storage	*ndev_storage;
96*4882a593Smuzhiyun 	enum gid_table_entry_state	state;
97*4882a593Smuzhiyun };
98*4882a593Smuzhiyun 
99*4882a593Smuzhiyun struct ib_gid_table {
100*4882a593Smuzhiyun 	int				sz;
101*4882a593Smuzhiyun 	/* In RoCE, adding a GID to the table requires:
102*4882a593Smuzhiyun 	 * (a) Find if this GID is already exists.
103*4882a593Smuzhiyun 	 * (b) Find a free space.
104*4882a593Smuzhiyun 	 * (c) Write the new GID
105*4882a593Smuzhiyun 	 *
106*4882a593Smuzhiyun 	 * Delete requires different set of operations:
107*4882a593Smuzhiyun 	 * (a) Find the GID
108*4882a593Smuzhiyun 	 * (b) Delete it.
109*4882a593Smuzhiyun 	 *
110*4882a593Smuzhiyun 	 **/
111*4882a593Smuzhiyun 	/* Any writer to data_vec must hold this lock and the write side of
112*4882a593Smuzhiyun 	 * rwlock. Readers must hold only rwlock. All writers must be in a
113*4882a593Smuzhiyun 	 * sleepable context.
114*4882a593Smuzhiyun 	 */
115*4882a593Smuzhiyun 	struct mutex			lock;
116*4882a593Smuzhiyun 	/* rwlock protects data_vec[ix]->state and entry pointer.
117*4882a593Smuzhiyun 	 */
118*4882a593Smuzhiyun 	rwlock_t			rwlock;
119*4882a593Smuzhiyun 	struct ib_gid_table_entry	**data_vec;
120*4882a593Smuzhiyun 	/* bit field, each bit indicates the index of default GID */
121*4882a593Smuzhiyun 	u32				default_gid_indices;
122*4882a593Smuzhiyun };
123*4882a593Smuzhiyun 
/*
 * Build an IB_EVENT_GID_CHANGE event for @port of @ib_dev and pass it to
 * ib_dispatch_event_clients().
 */
static void dispatch_gid_change_event(struct ib_device *ib_dev, u8 port)
{
	struct ib_event gid_event;

	gid_event.event = IB_EVENT_GID_CHANGE;
	gid_event.element.port_num = port;
	gid_event.device = ib_dev;

	ib_dispatch_event_clients(&gid_event);
}
134*4882a593Smuzhiyun 
135*4882a593Smuzhiyun static const char * const gid_type_str[] = {
136*4882a593Smuzhiyun 	/* IB/RoCE v1 value is set for IB_GID_TYPE_IB and IB_GID_TYPE_ROCE for
137*4882a593Smuzhiyun 	 * user space compatibility reasons.
138*4882a593Smuzhiyun 	 */
139*4882a593Smuzhiyun 	[IB_GID_TYPE_IB]	= "IB/RoCE v1",
140*4882a593Smuzhiyun 	[IB_GID_TYPE_ROCE]	= "IB/RoCE v1",
141*4882a593Smuzhiyun 	[IB_GID_TYPE_ROCE_UDP_ENCAP]	= "RoCE v2",
142*4882a593Smuzhiyun };
143*4882a593Smuzhiyun 
ib_cache_gid_type_str(enum ib_gid_type gid_type)144*4882a593Smuzhiyun const char *ib_cache_gid_type_str(enum ib_gid_type gid_type)
145*4882a593Smuzhiyun {
146*4882a593Smuzhiyun 	if (gid_type < ARRAY_SIZE(gid_type_str) && gid_type_str[gid_type])
147*4882a593Smuzhiyun 		return gid_type_str[gid_type];
148*4882a593Smuzhiyun 
149*4882a593Smuzhiyun 	return "Invalid GID type";
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun EXPORT_SYMBOL(ib_cache_gid_type_str);
152*4882a593Smuzhiyun 
153*4882a593Smuzhiyun /** rdma_is_zero_gid - Check if given GID is zero or not.
154*4882a593Smuzhiyun  * @gid:	GID to check
155*4882a593Smuzhiyun  * Returns true if given GID is zero, returns false otherwise.
156*4882a593Smuzhiyun  */
rdma_is_zero_gid(const union ib_gid * gid)157*4882a593Smuzhiyun bool rdma_is_zero_gid(const union ib_gid *gid)
158*4882a593Smuzhiyun {
159*4882a593Smuzhiyun 	return !memcmp(gid, &zgid, sizeof(*gid));
160*4882a593Smuzhiyun }
161*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_is_zero_gid);
162*4882a593Smuzhiyun 
163*4882a593Smuzhiyun /** is_gid_index_default - Check if a given index belongs to
164*4882a593Smuzhiyun  * reserved default GIDs or not.
165*4882a593Smuzhiyun  * @table:	GID table pointer
166*4882a593Smuzhiyun  * @index:	Index to check in GID table
167*4882a593Smuzhiyun  * Returns true if index is one of the reserved default GID index otherwise
168*4882a593Smuzhiyun  * returns false.
169*4882a593Smuzhiyun  */
is_gid_index_default(const struct ib_gid_table * table,unsigned int index)170*4882a593Smuzhiyun static bool is_gid_index_default(const struct ib_gid_table *table,
171*4882a593Smuzhiyun 				 unsigned int index)
172*4882a593Smuzhiyun {
173*4882a593Smuzhiyun 	return index < 32 && (BIT(index) & table->default_gid_indices);
174*4882a593Smuzhiyun }
175*4882a593Smuzhiyun 
ib_cache_gid_parse_type_str(const char * buf)176*4882a593Smuzhiyun int ib_cache_gid_parse_type_str(const char *buf)
177*4882a593Smuzhiyun {
178*4882a593Smuzhiyun 	unsigned int i;
179*4882a593Smuzhiyun 	size_t len;
180*4882a593Smuzhiyun 	int err = -EINVAL;
181*4882a593Smuzhiyun 
182*4882a593Smuzhiyun 	len = strlen(buf);
183*4882a593Smuzhiyun 	if (len == 0)
184*4882a593Smuzhiyun 		return -EINVAL;
185*4882a593Smuzhiyun 
186*4882a593Smuzhiyun 	if (buf[len - 1] == '\n')
187*4882a593Smuzhiyun 		len--;
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(gid_type_str); ++i)
190*4882a593Smuzhiyun 		if (gid_type_str[i] && !strncmp(buf, gid_type_str[i], len) &&
191*4882a593Smuzhiyun 		    len == strlen(gid_type_str[i])) {
192*4882a593Smuzhiyun 			err = i;
193*4882a593Smuzhiyun 			break;
194*4882a593Smuzhiyun 		}
195*4882a593Smuzhiyun 
196*4882a593Smuzhiyun 	return err;
197*4882a593Smuzhiyun }
198*4882a593Smuzhiyun EXPORT_SYMBOL(ib_cache_gid_parse_type_str);
199*4882a593Smuzhiyun 
/*
 * Return the cached GID table of @port on @device. @port is used directly
 * as the index into device->port_data[]; no range check is done here.
 */
static struct ib_gid_table *rdma_gid_table(struct ib_device *device, u8 port)
{
	return device->port_data[port].cache.gid;
}
204*4882a593Smuzhiyun 
/* A table slot is free when it holds no entry, i.e. the pointer is NULL. */
static bool is_gid_entry_free(const struct ib_gid_table_entry *entry)
{
	return entry == NULL;
}
209*4882a593Smuzhiyun 
is_gid_entry_valid(const struct ib_gid_table_entry * entry)210*4882a593Smuzhiyun static bool is_gid_entry_valid(const struct ib_gid_table_entry *entry)
211*4882a593Smuzhiyun {
212*4882a593Smuzhiyun 	return entry && entry->state == GID_TABLE_ENTRY_VALID;
213*4882a593Smuzhiyun }
214*4882a593Smuzhiyun 
schedule_free_gid(struct kref * kref)215*4882a593Smuzhiyun static void schedule_free_gid(struct kref *kref)
216*4882a593Smuzhiyun {
217*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry =
218*4882a593Smuzhiyun 			container_of(kref, struct ib_gid_table_entry, kref);
219*4882a593Smuzhiyun 
220*4882a593Smuzhiyun 	queue_work(ib_wq, &entry->del_work);
221*4882a593Smuzhiyun }
222*4882a593Smuzhiyun 
put_gid_ndev(struct rcu_head * head)223*4882a593Smuzhiyun static void put_gid_ndev(struct rcu_head *head)
224*4882a593Smuzhiyun {
225*4882a593Smuzhiyun 	struct roce_gid_ndev_storage *storage =
226*4882a593Smuzhiyun 		container_of(head, struct roce_gid_ndev_storage, rcu_head);
227*4882a593Smuzhiyun 
228*4882a593Smuzhiyun 	WARN_ON(!storage->ndev);
229*4882a593Smuzhiyun 	/* At this point its safe to release netdev reference,
230*4882a593Smuzhiyun 	 * as all callers working on gid_attr->ndev are done
231*4882a593Smuzhiyun 	 * using this netdev.
232*4882a593Smuzhiyun 	 */
233*4882a593Smuzhiyun 	dev_put(storage->ndev);
234*4882a593Smuzhiyun 	kfree(storage);
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun 
free_gid_entry_locked(struct ib_gid_table_entry * entry)237*4882a593Smuzhiyun static void free_gid_entry_locked(struct ib_gid_table_entry *entry)
238*4882a593Smuzhiyun {
239*4882a593Smuzhiyun 	struct ib_device *device = entry->attr.device;
240*4882a593Smuzhiyun 	u8 port_num = entry->attr.port_num;
241*4882a593Smuzhiyun 	struct ib_gid_table *table = rdma_gid_table(device, port_num);
242*4882a593Smuzhiyun 
243*4882a593Smuzhiyun 	dev_dbg(&device->dev, "%s port=%d index=%d gid %pI6\n", __func__,
244*4882a593Smuzhiyun 		port_num, entry->attr.index, entry->attr.gid.raw);
245*4882a593Smuzhiyun 
246*4882a593Smuzhiyun 	write_lock_irq(&table->rwlock);
247*4882a593Smuzhiyun 
248*4882a593Smuzhiyun 	/*
249*4882a593Smuzhiyun 	 * The only way to avoid overwriting NULL in table is
250*4882a593Smuzhiyun 	 * by comparing if it is same entry in table or not!
251*4882a593Smuzhiyun 	 * If new entry in table is added by the time we free here,
252*4882a593Smuzhiyun 	 * don't overwrite the table entry.
253*4882a593Smuzhiyun 	 */
254*4882a593Smuzhiyun 	if (entry == table->data_vec[entry->attr.index])
255*4882a593Smuzhiyun 		table->data_vec[entry->attr.index] = NULL;
256*4882a593Smuzhiyun 	/* Now this index is ready to be allocated */
257*4882a593Smuzhiyun 	write_unlock_irq(&table->rwlock);
258*4882a593Smuzhiyun 
259*4882a593Smuzhiyun 	if (entry->ndev_storage)
260*4882a593Smuzhiyun 		call_rcu(&entry->ndev_storage->rcu_head, put_gid_ndev);
261*4882a593Smuzhiyun 	kfree(entry);
262*4882a593Smuzhiyun }
263*4882a593Smuzhiyun 
free_gid_entry(struct kref * kref)264*4882a593Smuzhiyun static void free_gid_entry(struct kref *kref)
265*4882a593Smuzhiyun {
266*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry =
267*4882a593Smuzhiyun 			container_of(kref, struct ib_gid_table_entry, kref);
268*4882a593Smuzhiyun 
269*4882a593Smuzhiyun 	free_gid_entry_locked(entry);
270*4882a593Smuzhiyun }
271*4882a593Smuzhiyun 
272*4882a593Smuzhiyun /**
273*4882a593Smuzhiyun  * free_gid_work - Release reference to the GID entry
274*4882a593Smuzhiyun  * @work: Work structure to refer to GID entry which needs to be
275*4882a593Smuzhiyun  * deleted.
276*4882a593Smuzhiyun  *
277*4882a593Smuzhiyun  * free_gid_work() frees the entry from the HCA's hardware table
278*4882a593Smuzhiyun  * if provider supports it. It releases reference to netdevice.
279*4882a593Smuzhiyun  */
free_gid_work(struct work_struct * work)280*4882a593Smuzhiyun static void free_gid_work(struct work_struct *work)
281*4882a593Smuzhiyun {
282*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry =
283*4882a593Smuzhiyun 		container_of(work, struct ib_gid_table_entry, del_work);
284*4882a593Smuzhiyun 	struct ib_device *device = entry->attr.device;
285*4882a593Smuzhiyun 	u8 port_num = entry->attr.port_num;
286*4882a593Smuzhiyun 	struct ib_gid_table *table = rdma_gid_table(device, port_num);
287*4882a593Smuzhiyun 
288*4882a593Smuzhiyun 	mutex_lock(&table->lock);
289*4882a593Smuzhiyun 	free_gid_entry_locked(entry);
290*4882a593Smuzhiyun 	mutex_unlock(&table->lock);
291*4882a593Smuzhiyun }
292*4882a593Smuzhiyun 
293*4882a593Smuzhiyun static struct ib_gid_table_entry *
alloc_gid_entry(const struct ib_gid_attr * attr)294*4882a593Smuzhiyun alloc_gid_entry(const struct ib_gid_attr *attr)
295*4882a593Smuzhiyun {
296*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry;
297*4882a593Smuzhiyun 	struct net_device *ndev;
298*4882a593Smuzhiyun 
299*4882a593Smuzhiyun 	entry = kzalloc(sizeof(*entry), GFP_KERNEL);
300*4882a593Smuzhiyun 	if (!entry)
301*4882a593Smuzhiyun 		return NULL;
302*4882a593Smuzhiyun 
303*4882a593Smuzhiyun 	ndev = rcu_dereference_protected(attr->ndev, 1);
304*4882a593Smuzhiyun 	if (ndev) {
305*4882a593Smuzhiyun 		entry->ndev_storage = kzalloc(sizeof(*entry->ndev_storage),
306*4882a593Smuzhiyun 					      GFP_KERNEL);
307*4882a593Smuzhiyun 		if (!entry->ndev_storage) {
308*4882a593Smuzhiyun 			kfree(entry);
309*4882a593Smuzhiyun 			return NULL;
310*4882a593Smuzhiyun 		}
311*4882a593Smuzhiyun 		dev_hold(ndev);
312*4882a593Smuzhiyun 		entry->ndev_storage->ndev = ndev;
313*4882a593Smuzhiyun 	}
314*4882a593Smuzhiyun 	kref_init(&entry->kref);
315*4882a593Smuzhiyun 	memcpy(&entry->attr, attr, sizeof(*attr));
316*4882a593Smuzhiyun 	INIT_WORK(&entry->del_work, free_gid_work);
317*4882a593Smuzhiyun 	entry->state = GID_TABLE_ENTRY_INVALID;
318*4882a593Smuzhiyun 	return entry;
319*4882a593Smuzhiyun }
320*4882a593Smuzhiyun 
store_gid_entry(struct ib_gid_table * table,struct ib_gid_table_entry * entry)321*4882a593Smuzhiyun static void store_gid_entry(struct ib_gid_table *table,
322*4882a593Smuzhiyun 			    struct ib_gid_table_entry *entry)
323*4882a593Smuzhiyun {
324*4882a593Smuzhiyun 	entry->state = GID_TABLE_ENTRY_VALID;
325*4882a593Smuzhiyun 
326*4882a593Smuzhiyun 	dev_dbg(&entry->attr.device->dev, "%s port=%d index=%d gid %pI6\n",
327*4882a593Smuzhiyun 		__func__, entry->attr.port_num, entry->attr.index,
328*4882a593Smuzhiyun 		entry->attr.gid.raw);
329*4882a593Smuzhiyun 
330*4882a593Smuzhiyun 	lockdep_assert_held(&table->lock);
331*4882a593Smuzhiyun 	write_lock_irq(&table->rwlock);
332*4882a593Smuzhiyun 	table->data_vec[entry->attr.index] = entry;
333*4882a593Smuzhiyun 	write_unlock_irq(&table->rwlock);
334*4882a593Smuzhiyun }
335*4882a593Smuzhiyun 
get_gid_entry(struct ib_gid_table_entry * entry)336*4882a593Smuzhiyun static void get_gid_entry(struct ib_gid_table_entry *entry)
337*4882a593Smuzhiyun {
338*4882a593Smuzhiyun 	kref_get(&entry->kref);
339*4882a593Smuzhiyun }
340*4882a593Smuzhiyun 
put_gid_entry(struct ib_gid_table_entry * entry)341*4882a593Smuzhiyun static void put_gid_entry(struct ib_gid_table_entry *entry)
342*4882a593Smuzhiyun {
343*4882a593Smuzhiyun 	kref_put(&entry->kref, schedule_free_gid);
344*4882a593Smuzhiyun }
345*4882a593Smuzhiyun 
put_gid_entry_locked(struct ib_gid_table_entry * entry)346*4882a593Smuzhiyun static void put_gid_entry_locked(struct ib_gid_table_entry *entry)
347*4882a593Smuzhiyun {
348*4882a593Smuzhiyun 	kref_put(&entry->kref, free_gid_entry);
349*4882a593Smuzhiyun }
350*4882a593Smuzhiyun 
add_roce_gid(struct ib_gid_table_entry * entry)351*4882a593Smuzhiyun static int add_roce_gid(struct ib_gid_table_entry *entry)
352*4882a593Smuzhiyun {
353*4882a593Smuzhiyun 	const struct ib_gid_attr *attr = &entry->attr;
354*4882a593Smuzhiyun 	int ret;
355*4882a593Smuzhiyun 
356*4882a593Smuzhiyun 	if (!attr->ndev) {
357*4882a593Smuzhiyun 		dev_err(&attr->device->dev, "%s NULL netdev port=%d index=%d\n",
358*4882a593Smuzhiyun 			__func__, attr->port_num, attr->index);
359*4882a593Smuzhiyun 		return -EINVAL;
360*4882a593Smuzhiyun 	}
361*4882a593Smuzhiyun 	if (rdma_cap_roce_gid_table(attr->device, attr->port_num)) {
362*4882a593Smuzhiyun 		ret = attr->device->ops.add_gid(attr, &entry->context);
363*4882a593Smuzhiyun 		if (ret) {
364*4882a593Smuzhiyun 			dev_err(&attr->device->dev,
365*4882a593Smuzhiyun 				"%s GID add failed port=%d index=%d\n",
366*4882a593Smuzhiyun 				__func__, attr->port_num, attr->index);
367*4882a593Smuzhiyun 			return ret;
368*4882a593Smuzhiyun 		}
369*4882a593Smuzhiyun 	}
370*4882a593Smuzhiyun 	return 0;
371*4882a593Smuzhiyun }
372*4882a593Smuzhiyun 
373*4882a593Smuzhiyun /**
374*4882a593Smuzhiyun  * del_gid - Delete GID table entry
375*4882a593Smuzhiyun  *
376*4882a593Smuzhiyun  * @ib_dev:	IB device whose GID entry to be deleted
377*4882a593Smuzhiyun  * @port:	Port number of the IB device
378*4882a593Smuzhiyun  * @table:	GID table of the IB device for a port
379*4882a593Smuzhiyun  * @ix:		GID entry index to delete
380*4882a593Smuzhiyun  *
381*4882a593Smuzhiyun  */
del_gid(struct ib_device * ib_dev,u8 port,struct ib_gid_table * table,int ix)382*4882a593Smuzhiyun static void del_gid(struct ib_device *ib_dev, u8 port,
383*4882a593Smuzhiyun 		    struct ib_gid_table *table, int ix)
384*4882a593Smuzhiyun {
385*4882a593Smuzhiyun 	struct roce_gid_ndev_storage *ndev_storage;
386*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry;
387*4882a593Smuzhiyun 
388*4882a593Smuzhiyun 	lockdep_assert_held(&table->lock);
389*4882a593Smuzhiyun 
390*4882a593Smuzhiyun 	dev_dbg(&ib_dev->dev, "%s port=%d index=%d gid %pI6\n", __func__, port,
391*4882a593Smuzhiyun 		ix, table->data_vec[ix]->attr.gid.raw);
392*4882a593Smuzhiyun 
393*4882a593Smuzhiyun 	write_lock_irq(&table->rwlock);
394*4882a593Smuzhiyun 	entry = table->data_vec[ix];
395*4882a593Smuzhiyun 	entry->state = GID_TABLE_ENTRY_PENDING_DEL;
396*4882a593Smuzhiyun 	/*
397*4882a593Smuzhiyun 	 * For non RoCE protocol, GID entry slot is ready to use.
398*4882a593Smuzhiyun 	 */
399*4882a593Smuzhiyun 	if (!rdma_protocol_roce(ib_dev, port))
400*4882a593Smuzhiyun 		table->data_vec[ix] = NULL;
401*4882a593Smuzhiyun 	write_unlock_irq(&table->rwlock);
402*4882a593Smuzhiyun 
403*4882a593Smuzhiyun 	ndev_storage = entry->ndev_storage;
404*4882a593Smuzhiyun 	if (ndev_storage) {
405*4882a593Smuzhiyun 		entry->ndev_storage = NULL;
406*4882a593Smuzhiyun 		rcu_assign_pointer(entry->attr.ndev, NULL);
407*4882a593Smuzhiyun 		call_rcu(&ndev_storage->rcu_head, put_gid_ndev);
408*4882a593Smuzhiyun 	}
409*4882a593Smuzhiyun 
410*4882a593Smuzhiyun 	if (rdma_cap_roce_gid_table(ib_dev, port))
411*4882a593Smuzhiyun 		ib_dev->ops.del_gid(&entry->attr, &entry->context);
412*4882a593Smuzhiyun 
413*4882a593Smuzhiyun 	put_gid_entry_locked(entry);
414*4882a593Smuzhiyun }
415*4882a593Smuzhiyun 
416*4882a593Smuzhiyun /**
417*4882a593Smuzhiyun  * add_modify_gid - Add or modify GID table entry
418*4882a593Smuzhiyun  *
419*4882a593Smuzhiyun  * @table:	GID table in which GID to be added or modified
420*4882a593Smuzhiyun  * @attr:	Attributes of the GID
421*4882a593Smuzhiyun  *
422*4882a593Smuzhiyun  * Returns 0 on success or appropriate error code. It accepts zero
423*4882a593Smuzhiyun  * GID addition for non RoCE ports for HCA's who report them as valid
424*4882a593Smuzhiyun  * GID. However such zero GIDs are not added to the cache.
425*4882a593Smuzhiyun  */
add_modify_gid(struct ib_gid_table * table,const struct ib_gid_attr * attr)426*4882a593Smuzhiyun static int add_modify_gid(struct ib_gid_table *table,
427*4882a593Smuzhiyun 			  const struct ib_gid_attr *attr)
428*4882a593Smuzhiyun {
429*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry;
430*4882a593Smuzhiyun 	int ret = 0;
431*4882a593Smuzhiyun 
432*4882a593Smuzhiyun 	/*
433*4882a593Smuzhiyun 	 * Invalidate any old entry in the table to make it safe to write to
434*4882a593Smuzhiyun 	 * this index.
435*4882a593Smuzhiyun 	 */
436*4882a593Smuzhiyun 	if (is_gid_entry_valid(table->data_vec[attr->index]))
437*4882a593Smuzhiyun 		del_gid(attr->device, attr->port_num, table, attr->index);
438*4882a593Smuzhiyun 
439*4882a593Smuzhiyun 	/*
440*4882a593Smuzhiyun 	 * Some HCA's report multiple GID entries with only one valid GID, and
441*4882a593Smuzhiyun 	 * leave other unused entries as the zero GID. Convert zero GIDs to
442*4882a593Smuzhiyun 	 * empty table entries instead of storing them.
443*4882a593Smuzhiyun 	 */
444*4882a593Smuzhiyun 	if (rdma_is_zero_gid(&attr->gid))
445*4882a593Smuzhiyun 		return 0;
446*4882a593Smuzhiyun 
447*4882a593Smuzhiyun 	entry = alloc_gid_entry(attr);
448*4882a593Smuzhiyun 	if (!entry)
449*4882a593Smuzhiyun 		return -ENOMEM;
450*4882a593Smuzhiyun 
451*4882a593Smuzhiyun 	if (rdma_protocol_roce(attr->device, attr->port_num)) {
452*4882a593Smuzhiyun 		ret = add_roce_gid(entry);
453*4882a593Smuzhiyun 		if (ret)
454*4882a593Smuzhiyun 			goto done;
455*4882a593Smuzhiyun 	}
456*4882a593Smuzhiyun 
457*4882a593Smuzhiyun 	store_gid_entry(table, entry);
458*4882a593Smuzhiyun 	return 0;
459*4882a593Smuzhiyun 
460*4882a593Smuzhiyun done:
461*4882a593Smuzhiyun 	put_gid_entry(entry);
462*4882a593Smuzhiyun 	return ret;
463*4882a593Smuzhiyun }
464*4882a593Smuzhiyun 
465*4882a593Smuzhiyun /* rwlock should be read locked, or lock should be held */
find_gid(struct ib_gid_table * table,const union ib_gid * gid,const struct ib_gid_attr * val,bool default_gid,unsigned long mask,int * pempty)466*4882a593Smuzhiyun static int find_gid(struct ib_gid_table *table, const union ib_gid *gid,
467*4882a593Smuzhiyun 		    const struct ib_gid_attr *val, bool default_gid,
468*4882a593Smuzhiyun 		    unsigned long mask, int *pempty)
469*4882a593Smuzhiyun {
470*4882a593Smuzhiyun 	int i = 0;
471*4882a593Smuzhiyun 	int found = -1;
472*4882a593Smuzhiyun 	int empty = pempty ? -1 : 0;
473*4882a593Smuzhiyun 
474*4882a593Smuzhiyun 	while (i < table->sz && (found < 0 || empty < 0)) {
475*4882a593Smuzhiyun 		struct ib_gid_table_entry *data = table->data_vec[i];
476*4882a593Smuzhiyun 		struct ib_gid_attr *attr;
477*4882a593Smuzhiyun 		int curr_index = i;
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun 		i++;
480*4882a593Smuzhiyun 
481*4882a593Smuzhiyun 		/* find_gid() is used during GID addition where it is expected
482*4882a593Smuzhiyun 		 * to return a free entry slot which is not duplicate.
483*4882a593Smuzhiyun 		 * Free entry slot is requested and returned if pempty is set,
484*4882a593Smuzhiyun 		 * so lookup free slot only if requested.
485*4882a593Smuzhiyun 		 */
486*4882a593Smuzhiyun 		if (pempty && empty < 0) {
487*4882a593Smuzhiyun 			if (is_gid_entry_free(data) &&
488*4882a593Smuzhiyun 			    default_gid ==
489*4882a593Smuzhiyun 				is_gid_index_default(table, curr_index)) {
490*4882a593Smuzhiyun 				/*
491*4882a593Smuzhiyun 				 * Found an invalid (free) entry; allocate it.
492*4882a593Smuzhiyun 				 * If default GID is requested, then our
493*4882a593Smuzhiyun 				 * found slot must be one of the DEFAULT
494*4882a593Smuzhiyun 				 * reserved slots or we fail.
495*4882a593Smuzhiyun 				 * This ensures that only DEFAULT reserved
496*4882a593Smuzhiyun 				 * slots are used for default property GIDs.
497*4882a593Smuzhiyun 				 */
498*4882a593Smuzhiyun 				empty = curr_index;
499*4882a593Smuzhiyun 			}
500*4882a593Smuzhiyun 		}
501*4882a593Smuzhiyun 
502*4882a593Smuzhiyun 		/*
503*4882a593Smuzhiyun 		 * Additionally find_gid() is used to find valid entry during
504*4882a593Smuzhiyun 		 * lookup operation; so ignore the entries which are marked as
505*4882a593Smuzhiyun 		 * pending for removal and the entries which are marked as
506*4882a593Smuzhiyun 		 * invalid.
507*4882a593Smuzhiyun 		 */
508*4882a593Smuzhiyun 		if (!is_gid_entry_valid(data))
509*4882a593Smuzhiyun 			continue;
510*4882a593Smuzhiyun 
511*4882a593Smuzhiyun 		if (found >= 0)
512*4882a593Smuzhiyun 			continue;
513*4882a593Smuzhiyun 
514*4882a593Smuzhiyun 		attr = &data->attr;
515*4882a593Smuzhiyun 		if (mask & GID_ATTR_FIND_MASK_GID_TYPE &&
516*4882a593Smuzhiyun 		    attr->gid_type != val->gid_type)
517*4882a593Smuzhiyun 			continue;
518*4882a593Smuzhiyun 
519*4882a593Smuzhiyun 		if (mask & GID_ATTR_FIND_MASK_GID &&
520*4882a593Smuzhiyun 		    memcmp(gid, &data->attr.gid, sizeof(*gid)))
521*4882a593Smuzhiyun 			continue;
522*4882a593Smuzhiyun 
523*4882a593Smuzhiyun 		if (mask & GID_ATTR_FIND_MASK_NETDEV &&
524*4882a593Smuzhiyun 		    attr->ndev != val->ndev)
525*4882a593Smuzhiyun 			continue;
526*4882a593Smuzhiyun 
527*4882a593Smuzhiyun 		if (mask & GID_ATTR_FIND_MASK_DEFAULT &&
528*4882a593Smuzhiyun 		    is_gid_index_default(table, curr_index) != default_gid)
529*4882a593Smuzhiyun 			continue;
530*4882a593Smuzhiyun 
531*4882a593Smuzhiyun 		found = curr_index;
532*4882a593Smuzhiyun 	}
533*4882a593Smuzhiyun 
534*4882a593Smuzhiyun 	if (pempty)
535*4882a593Smuzhiyun 		*pempty = empty;
536*4882a593Smuzhiyun 
537*4882a593Smuzhiyun 	return found;
538*4882a593Smuzhiyun }
539*4882a593Smuzhiyun 
make_default_gid(struct net_device * dev,union ib_gid * gid)540*4882a593Smuzhiyun static void make_default_gid(struct  net_device *dev, union ib_gid *gid)
541*4882a593Smuzhiyun {
542*4882a593Smuzhiyun 	gid->global.subnet_prefix = cpu_to_be64(0xfe80000000000000LL);
543*4882a593Smuzhiyun 	addrconf_ifid_eui48(&gid->raw[8], dev);
544*4882a593Smuzhiyun }
545*4882a593Smuzhiyun 
/*
 * Add @gid to the GID table of @port on @ib_dev.
 *
 * @attr is filled in (device, index, port_num, gid) before being passed to
 * add_modify_gid(). @mask and @default_gid are forwarded to find_gid() to
 * detect duplicates and pick a free slot.
 *
 * Returns 0 when the GID was added or an equivalent entry already exists,
 * -EINVAL for the zero GID, -ENOSPC when no suitable free slot exists, or
 * the error from add_modify_gid(). A GID change event is dispatched only
 * when a new entry was actually added.
 */
static int __ib_cache_gid_add(struct ib_device *ib_dev, u8 port,
			      union ib_gid *gid, struct ib_gid_attr *attr,
			      unsigned long mask, bool default_gid)
{
	struct ib_gid_table *gid_tbl;
	int free_ix;
	int dup_ix;
	int err = 0;

	/*
	 * Adding the zero GID is not allowed, in support of IB spec
	 * version 1.3 section 4.1.1 point (6), section 12.7.10 and
	 * section 12.7.20.
	 */
	if (rdma_is_zero_gid(gid))
		return -EINVAL;

	gid_tbl = rdma_gid_table(ib_dev, port);

	mutex_lock(&gid_tbl->lock);

	dup_ix = find_gid(gid_tbl, gid, attr, default_gid, mask, &free_ix);
	if (dup_ix >= 0)
		goto unlock;	/* already present: nothing to do */

	if (free_ix < 0) {
		err = -ENOSPC;
		goto unlock;
	}

	attr->gid = *gid;
	attr->port_num = port;
	attr->index = free_ix;
	attr->device = ib_dev;

	err = add_modify_gid(gid_tbl, attr);
	if (!err)
		dispatch_gid_change_event(ib_dev, port);

unlock:
	mutex_unlock(&gid_tbl->lock);
	if (err)
		pr_warn("%s: unable to add gid %pI6 error=%d\n",
			__func__, gid->raw, err);
	return err;
}
589*4882a593Smuzhiyun 
/*
 * Add a non-default GID. An existing entry counts as a duplicate when the
 * GID value, GID type and netdev all match.
 */
int ib_cache_gid_add(struct ib_device *ib_dev, u8 port,
		     union ib_gid *gid, struct ib_gid_attr *attr)
{
	const unsigned long match_mask = GID_ATTR_FIND_MASK_GID |
					 GID_ATTR_FIND_MASK_GID_TYPE |
					 GID_ATTR_FIND_MASK_NETDEV;

	return __ib_cache_gid_add(ib_dev, port, gid, attr, match_mask, false);
}
599*4882a593Smuzhiyun 
600*4882a593Smuzhiyun static int
_ib_cache_gid_del(struct ib_device * ib_dev,u8 port,union ib_gid * gid,struct ib_gid_attr * attr,unsigned long mask,bool default_gid)601*4882a593Smuzhiyun _ib_cache_gid_del(struct ib_device *ib_dev, u8 port,
602*4882a593Smuzhiyun 		  union ib_gid *gid, struct ib_gid_attr *attr,
603*4882a593Smuzhiyun 		  unsigned long mask, bool default_gid)
604*4882a593Smuzhiyun {
605*4882a593Smuzhiyun 	struct ib_gid_table *table;
606*4882a593Smuzhiyun 	int ret = 0;
607*4882a593Smuzhiyun 	int ix;
608*4882a593Smuzhiyun 
609*4882a593Smuzhiyun 	table = rdma_gid_table(ib_dev, port);
610*4882a593Smuzhiyun 
611*4882a593Smuzhiyun 	mutex_lock(&table->lock);
612*4882a593Smuzhiyun 
613*4882a593Smuzhiyun 	ix = find_gid(table, gid, attr, default_gid, mask, NULL);
614*4882a593Smuzhiyun 	if (ix < 0) {
615*4882a593Smuzhiyun 		ret = -EINVAL;
616*4882a593Smuzhiyun 		goto out_unlock;
617*4882a593Smuzhiyun 	}
618*4882a593Smuzhiyun 
619*4882a593Smuzhiyun 	del_gid(ib_dev, port, table, ix);
620*4882a593Smuzhiyun 	dispatch_gid_change_event(ib_dev, port);
621*4882a593Smuzhiyun 
622*4882a593Smuzhiyun out_unlock:
623*4882a593Smuzhiyun 	mutex_unlock(&table->lock);
624*4882a593Smuzhiyun 	if (ret)
625*4882a593Smuzhiyun 		pr_debug("%s: can't delete gid %pI6 error=%d\n",
626*4882a593Smuzhiyun 			 __func__, gid->raw, ret);
627*4882a593Smuzhiyun 	return ret;
628*4882a593Smuzhiyun }
629*4882a593Smuzhiyun 
/*
 * ib_cache_gid_del - delete a GID from the software GID cache of a port
 *
 * Thin wrapper around _ib_cache_gid_del(). The search mask covers the GID
 * value, GID type, default flag and net device; default_gid is passed as
 * false, so the lookup is for a non-default entry (presumably; the exact
 * matching rules live in find_gid(), which is outside this view).
 *
 * Returns 0 on success or -EINVAL when no matching entry exists.
 */
int ib_cache_gid_del(struct ib_device *ib_dev, u8 port,
		     union ib_gid *gid, struct ib_gid_attr *attr)
{
	const unsigned long find_mask = GID_ATTR_FIND_MASK_NETDEV |
					GID_ATTR_FIND_MASK_DEFAULT |
					GID_ATTR_FIND_MASK_GID_TYPE |
					GID_ATTR_FIND_MASK_GID;

	return _ib_cache_gid_del(ib_dev, port, gid, attr, find_mask, false);
}
640*4882a593Smuzhiyun 
/*
 * ib_cache_gid_del_all_netdev_gids - drop every valid GID bound to @ndev
 *
 * Walks the whole GID table of @port under the table mutex and deletes each
 * valid entry whose attr.ndev equals @ndev. A single GID change event is
 * dispatched afterwards, outside the mutex, and only if at least one entry
 * was deleted.
 *
 * Always returns 0.
 */
int ib_cache_gid_del_all_netdev_gids(struct ib_device *ib_dev, u8 port,
				     struct net_device *ndev)
{
	struct ib_gid_table *tbl = rdma_gid_table(ib_dev, port);
	bool any_removed = false;
	int idx;

	mutex_lock(&tbl->lock);
	for (idx = 0; idx < tbl->sz; idx++) {
		struct ib_gid_table_entry *entry = tbl->data_vec[idx];

		if (!is_gid_entry_valid(entry))
			continue;
		if (entry->attr.ndev != ndev)
			continue;

		del_gid(ib_dev, port, tbl, idx);
		any_removed = true;
	}
	mutex_unlock(&tbl->lock);

	if (any_removed)
		dispatch_gid_change_event(ib_dev, port);

	return 0;
}
667*4882a593Smuzhiyun 
668*4882a593Smuzhiyun /**
669*4882a593Smuzhiyun  * rdma_find_gid_by_port - Returns the GID entry attributes when it finds
670*4882a593Smuzhiyun  * a valid GID entry for given search parameters. It searches for the specified
671*4882a593Smuzhiyun  * GID value in the local software cache.
672*4882a593Smuzhiyun  * @device: The device to query.
673*4882a593Smuzhiyun  * @gid: The GID value to search for.
674*4882a593Smuzhiyun  * @gid_type: The GID type to search for.
675*4882a593Smuzhiyun  * @port_num: The port number of the device where the GID value should be
676*4882a593Smuzhiyun  *   searched.
677*4882a593Smuzhiyun  * @ndev: In RoCE, the net device of the device. NULL means ignore.
678*4882a593Smuzhiyun  *
679*4882a593Smuzhiyun  * Returns sgid attributes if the GID is found with valid reference or
680*4882a593Smuzhiyun  * returns ERR_PTR for the error.
681*4882a593Smuzhiyun  * The caller must invoke rdma_put_gid_attr() to release the reference.
682*4882a593Smuzhiyun  */
683*4882a593Smuzhiyun const struct ib_gid_attr *
rdma_find_gid_by_port(struct ib_device * ib_dev,const union ib_gid * gid,enum ib_gid_type gid_type,u8 port,struct net_device * ndev)684*4882a593Smuzhiyun rdma_find_gid_by_port(struct ib_device *ib_dev,
685*4882a593Smuzhiyun 		      const union ib_gid *gid,
686*4882a593Smuzhiyun 		      enum ib_gid_type gid_type,
687*4882a593Smuzhiyun 		      u8 port, struct net_device *ndev)
688*4882a593Smuzhiyun {
689*4882a593Smuzhiyun 	int local_index;
690*4882a593Smuzhiyun 	struct ib_gid_table *table;
691*4882a593Smuzhiyun 	unsigned long mask = GID_ATTR_FIND_MASK_GID |
692*4882a593Smuzhiyun 			     GID_ATTR_FIND_MASK_GID_TYPE;
693*4882a593Smuzhiyun 	struct ib_gid_attr val = {.ndev = ndev, .gid_type = gid_type};
694*4882a593Smuzhiyun 	const struct ib_gid_attr *attr;
695*4882a593Smuzhiyun 	unsigned long flags;
696*4882a593Smuzhiyun 
697*4882a593Smuzhiyun 	if (!rdma_is_port_valid(ib_dev, port))
698*4882a593Smuzhiyun 		return ERR_PTR(-ENOENT);
699*4882a593Smuzhiyun 
700*4882a593Smuzhiyun 	table = rdma_gid_table(ib_dev, port);
701*4882a593Smuzhiyun 
702*4882a593Smuzhiyun 	if (ndev)
703*4882a593Smuzhiyun 		mask |= GID_ATTR_FIND_MASK_NETDEV;
704*4882a593Smuzhiyun 
705*4882a593Smuzhiyun 	read_lock_irqsave(&table->rwlock, flags);
706*4882a593Smuzhiyun 	local_index = find_gid(table, gid, &val, false, mask, NULL);
707*4882a593Smuzhiyun 	if (local_index >= 0) {
708*4882a593Smuzhiyun 		get_gid_entry(table->data_vec[local_index]);
709*4882a593Smuzhiyun 		attr = &table->data_vec[local_index]->attr;
710*4882a593Smuzhiyun 		read_unlock_irqrestore(&table->rwlock, flags);
711*4882a593Smuzhiyun 		return attr;
712*4882a593Smuzhiyun 	}
713*4882a593Smuzhiyun 
714*4882a593Smuzhiyun 	read_unlock_irqrestore(&table->rwlock, flags);
715*4882a593Smuzhiyun 	return ERR_PTR(-ENOENT);
716*4882a593Smuzhiyun }
717*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_find_gid_by_port);
718*4882a593Smuzhiyun 
719*4882a593Smuzhiyun /**
720*4882a593Smuzhiyun  * rdma_find_gid_by_filter - Returns the GID table attribute where a
721*4882a593Smuzhiyun  * specified GID value occurs
722*4882a593Smuzhiyun  * @device: The device to query.
723*4882a593Smuzhiyun  * @gid: The GID value to search for.
724*4882a593Smuzhiyun  * @port: The port number of the device where the GID value could be
725*4882a593Smuzhiyun  *   searched.
726*4882a593Smuzhiyun  * @filter: The filter function is executed on any matching GID in the table.
727*4882a593Smuzhiyun  *   If the filter function returns true, the corresponding index is returned,
728*4882a593Smuzhiyun  *   otherwise, we continue searching the GID table. It's guaranteed that
729*4882a593Smuzhiyun  *   while filter is executed, ndev field is valid and the structure won't
730*4882a593Smuzhiyun  *   change. filter is executed in an atomic context. filter must not be NULL.
731*4882a593Smuzhiyun  *
732*4882a593Smuzhiyun  * rdma_find_gid_by_filter() searches for the specified GID value
733*4882a593Smuzhiyun  * of which the filter function returns true in the port's GID table.
734*4882a593Smuzhiyun  *
735*4882a593Smuzhiyun  */
rdma_find_gid_by_filter(struct ib_device * ib_dev,const union ib_gid * gid,u8 port,bool (* filter)(const union ib_gid * gid,const struct ib_gid_attr *,void *),void * context)736*4882a593Smuzhiyun const struct ib_gid_attr *rdma_find_gid_by_filter(
737*4882a593Smuzhiyun 	struct ib_device *ib_dev, const union ib_gid *gid, u8 port,
738*4882a593Smuzhiyun 	bool (*filter)(const union ib_gid *gid, const struct ib_gid_attr *,
739*4882a593Smuzhiyun 		       void *),
740*4882a593Smuzhiyun 	void *context)
741*4882a593Smuzhiyun {
742*4882a593Smuzhiyun 	const struct ib_gid_attr *res = ERR_PTR(-ENOENT);
743*4882a593Smuzhiyun 	struct ib_gid_table *table;
744*4882a593Smuzhiyun 	unsigned long flags;
745*4882a593Smuzhiyun 	unsigned int i;
746*4882a593Smuzhiyun 
747*4882a593Smuzhiyun 	if (!rdma_is_port_valid(ib_dev, port))
748*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
749*4882a593Smuzhiyun 
750*4882a593Smuzhiyun 	table = rdma_gid_table(ib_dev, port);
751*4882a593Smuzhiyun 
752*4882a593Smuzhiyun 	read_lock_irqsave(&table->rwlock, flags);
753*4882a593Smuzhiyun 	for (i = 0; i < table->sz; i++) {
754*4882a593Smuzhiyun 		struct ib_gid_table_entry *entry = table->data_vec[i];
755*4882a593Smuzhiyun 
756*4882a593Smuzhiyun 		if (!is_gid_entry_valid(entry))
757*4882a593Smuzhiyun 			continue;
758*4882a593Smuzhiyun 
759*4882a593Smuzhiyun 		if (memcmp(gid, &entry->attr.gid, sizeof(*gid)))
760*4882a593Smuzhiyun 			continue;
761*4882a593Smuzhiyun 
762*4882a593Smuzhiyun 		if (filter(gid, &entry->attr, context)) {
763*4882a593Smuzhiyun 			get_gid_entry(entry);
764*4882a593Smuzhiyun 			res = &entry->attr;
765*4882a593Smuzhiyun 			break;
766*4882a593Smuzhiyun 		}
767*4882a593Smuzhiyun 	}
768*4882a593Smuzhiyun 	read_unlock_irqrestore(&table->rwlock, flags);
769*4882a593Smuzhiyun 	return res;
770*4882a593Smuzhiyun }
771*4882a593Smuzhiyun 
alloc_gid_table(int sz)772*4882a593Smuzhiyun static struct ib_gid_table *alloc_gid_table(int sz)
773*4882a593Smuzhiyun {
774*4882a593Smuzhiyun 	struct ib_gid_table *table = kzalloc(sizeof(*table), GFP_KERNEL);
775*4882a593Smuzhiyun 
776*4882a593Smuzhiyun 	if (!table)
777*4882a593Smuzhiyun 		return NULL;
778*4882a593Smuzhiyun 
779*4882a593Smuzhiyun 	table->data_vec = kcalloc(sz, sizeof(*table->data_vec), GFP_KERNEL);
780*4882a593Smuzhiyun 	if (!table->data_vec)
781*4882a593Smuzhiyun 		goto err_free_table;
782*4882a593Smuzhiyun 
783*4882a593Smuzhiyun 	mutex_init(&table->lock);
784*4882a593Smuzhiyun 
785*4882a593Smuzhiyun 	table->sz = sz;
786*4882a593Smuzhiyun 	rwlock_init(&table->rwlock);
787*4882a593Smuzhiyun 	return table;
788*4882a593Smuzhiyun 
789*4882a593Smuzhiyun err_free_table:
790*4882a593Smuzhiyun 	kfree(table);
791*4882a593Smuzhiyun 	return NULL;
792*4882a593Smuzhiyun }
793*4882a593Smuzhiyun 
release_gid_table(struct ib_device * device,struct ib_gid_table * table)794*4882a593Smuzhiyun static void release_gid_table(struct ib_device *device,
795*4882a593Smuzhiyun 			      struct ib_gid_table *table)
796*4882a593Smuzhiyun {
797*4882a593Smuzhiyun 	bool leak = false;
798*4882a593Smuzhiyun 	int i;
799*4882a593Smuzhiyun 
800*4882a593Smuzhiyun 	if (!table)
801*4882a593Smuzhiyun 		return;
802*4882a593Smuzhiyun 
803*4882a593Smuzhiyun 	for (i = 0; i < table->sz; i++) {
804*4882a593Smuzhiyun 		if (is_gid_entry_free(table->data_vec[i]))
805*4882a593Smuzhiyun 			continue;
806*4882a593Smuzhiyun 		if (kref_read(&table->data_vec[i]->kref) > 1) {
807*4882a593Smuzhiyun 			dev_err(&device->dev,
808*4882a593Smuzhiyun 				"GID entry ref leak for index %d ref=%d\n", i,
809*4882a593Smuzhiyun 				kref_read(&table->data_vec[i]->kref));
810*4882a593Smuzhiyun 			leak = true;
811*4882a593Smuzhiyun 		}
812*4882a593Smuzhiyun 	}
813*4882a593Smuzhiyun 	if (leak)
814*4882a593Smuzhiyun 		return;
815*4882a593Smuzhiyun 
816*4882a593Smuzhiyun 	mutex_destroy(&table->lock);
817*4882a593Smuzhiyun 	kfree(table->data_vec);
818*4882a593Smuzhiyun 	kfree(table);
819*4882a593Smuzhiyun }
820*4882a593Smuzhiyun 
/*
 * cleanup_gid_table_port - delete all valid GID entries of one port
 *
 * Holds the table mutex for the whole walk and calls del_gid() on every
 * valid slot. A NULL @table is silently ignored. The table itself is not
 * freed here.
 */
static void cleanup_gid_table_port(struct ib_device *ib_dev, u8 port,
				   struct ib_gid_table *table)
{
	int idx;

	if (!table)
		return;

	mutex_lock(&table->lock);
	for (idx = 0; idx < table->sz; ++idx) {
		if (!is_gid_entry_valid(table->data_vec[idx]))
			continue;

		del_gid(ib_dev, port, table, idx);
	}
	mutex_unlock(&table->lock);
}
836*4882a593Smuzhiyun 
/*
 * ib_cache_gid_set_default_gid - add or remove the default GIDs of a port
 * @ib_dev: device owning the GID table
 * @port: port number
 * @ndev: net device stored in the attribute used for lookup/insertion
 * @gid_type_mask: bitmask of GID types to process (bit n == GID type n)
 * @mode: IB_CACHE_GID_DEFAULT_MODE_SET to add, IB_CACHE_GID_DEFAULT_MODE_DELETE
 *        to remove; any other value makes the call a no-op
 *
 * For every GID type selected in @gid_type_mask:
 *  - SET: builds the default GID from @ndev with make_default_gid() and adds
 *    it through __ib_cache_gid_add() with the default flag set.
 *  - DELETE: removes the default entry through _ib_cache_gid_del(). The GID
 *    value passed is all zeroes; the search mask used here does not include
 *    GID_ATTR_FIND_MASK_GID.
 *
 * Return values of the add/delete helpers are ignored.
 */
void ib_cache_gid_set_default_gid(struct ib_device *ib_dev, u8 port,
				  struct net_device *ndev,
				  unsigned long gid_type_mask,
				  enum ib_cache_gid_default_mode mode)
{
	const unsigned long find_mask = GID_ATTR_FIND_MASK_NETDEV |
					GID_ATTR_FIND_MASK_DEFAULT |
					GID_ATTR_FIND_MASK_GID_TYPE;
	struct ib_gid_attr attr;
	union ib_gid gid = { };
	unsigned int type;

	memset(&attr, 0, sizeof(attr));
	attr.ndev = ndev;

	for (type = 0; type < IB_GID_TYPE_SIZE; ++type) {
		/* Skip GID types the caller did not ask for. */
		if (!(gid_type_mask & (1UL << type)))
			continue;

		attr.gid_type = type;

		switch (mode) {
		case IB_CACHE_GID_DEFAULT_MODE_SET:
			make_default_gid(ndev, &gid);
			__ib_cache_gid_add(ib_dev, port, &gid,
					   &attr, find_mask, true);
			break;
		case IB_CACHE_GID_DEFAULT_MODE_DELETE:
			_ib_cache_gid_del(ib_dev, port, &gid,
					  &attr, find_mask, true);
			break;
		default:
			break;
		}
	}
}
869*4882a593Smuzhiyun 
/*
 * gid_table_reserve_default - mark the leading table slots as default GIDs
 *
 * One slot is reserved per GID type bit reported by
 * roce_gid_type_mask_support() for this port, starting at index 0 and never
 * exceeding the table size. Reservation means setting the matching bit in
 * table->default_gid_indices.
 */
static void gid_table_reserve_default(struct ib_device *ib_dev, u8 port,
				      struct ib_gid_table *table)
{
	unsigned long type_mask = roce_gid_type_mask_support(ib_dev, port);
	unsigned int wanted = hweight_long(type_mask);
	unsigned int idx = 0;

	/* Reserve starting indices for default GIDs */
	while (idx < wanted && idx < table->sz) {
		table->default_gid_indices |= BIT(idx);
		idx++;
	}
}
883*4882a593Smuzhiyun 
884*4882a593Smuzhiyun 
gid_table_release_one(struct ib_device * ib_dev)885*4882a593Smuzhiyun static void gid_table_release_one(struct ib_device *ib_dev)
886*4882a593Smuzhiyun {
887*4882a593Smuzhiyun 	unsigned int p;
888*4882a593Smuzhiyun 
889*4882a593Smuzhiyun 	rdma_for_each_port (ib_dev, p) {
890*4882a593Smuzhiyun 		release_gid_table(ib_dev, ib_dev->port_data[p].cache.gid);
891*4882a593Smuzhiyun 		ib_dev->port_data[p].cache.gid = NULL;
892*4882a593Smuzhiyun 	}
893*4882a593Smuzhiyun }
894*4882a593Smuzhiyun 
_gid_table_setup_one(struct ib_device * ib_dev)895*4882a593Smuzhiyun static int _gid_table_setup_one(struct ib_device *ib_dev)
896*4882a593Smuzhiyun {
897*4882a593Smuzhiyun 	struct ib_gid_table *table;
898*4882a593Smuzhiyun 	unsigned int rdma_port;
899*4882a593Smuzhiyun 
900*4882a593Smuzhiyun 	rdma_for_each_port (ib_dev, rdma_port) {
901*4882a593Smuzhiyun 		table = alloc_gid_table(
902*4882a593Smuzhiyun 			ib_dev->port_data[rdma_port].immutable.gid_tbl_len);
903*4882a593Smuzhiyun 		if (!table)
904*4882a593Smuzhiyun 			goto rollback_table_setup;
905*4882a593Smuzhiyun 
906*4882a593Smuzhiyun 		gid_table_reserve_default(ib_dev, rdma_port, table);
907*4882a593Smuzhiyun 		ib_dev->port_data[rdma_port].cache.gid = table;
908*4882a593Smuzhiyun 	}
909*4882a593Smuzhiyun 	return 0;
910*4882a593Smuzhiyun 
911*4882a593Smuzhiyun rollback_table_setup:
912*4882a593Smuzhiyun 	gid_table_release_one(ib_dev);
913*4882a593Smuzhiyun 	return -ENOMEM;
914*4882a593Smuzhiyun }
915*4882a593Smuzhiyun 
gid_table_cleanup_one(struct ib_device * ib_dev)916*4882a593Smuzhiyun static void gid_table_cleanup_one(struct ib_device *ib_dev)
917*4882a593Smuzhiyun {
918*4882a593Smuzhiyun 	unsigned int p;
919*4882a593Smuzhiyun 
920*4882a593Smuzhiyun 	rdma_for_each_port (ib_dev, p)
921*4882a593Smuzhiyun 		cleanup_gid_table_port(ib_dev, p,
922*4882a593Smuzhiyun 				       ib_dev->port_data[p].cache.gid);
923*4882a593Smuzhiyun }
924*4882a593Smuzhiyun 
/*
 * gid_table_setup_one - set up the GID tables of a device and rescan RoCE
 *
 * Allocates the per-port tables through _gid_table_setup_one() and, only if
 * that succeeded, calls rdma_roce_rescan_device().
 *
 * Returns 0 on success or the error from _gid_table_setup_one().
 */
static int gid_table_setup_one(struct ib_device *ib_dev)
{
	int err = _gid_table_setup_one(ib_dev);

	if (!err)
		rdma_roce_rescan_device(ib_dev);

	return err;
}
938*4882a593Smuzhiyun 
939*4882a593Smuzhiyun /**
940*4882a593Smuzhiyun  * rdma_query_gid - Read the GID content from the GID software cache
941*4882a593Smuzhiyun  * @device:		Device to query the GID
942*4882a593Smuzhiyun  * @port_num:		Port number of the device
943*4882a593Smuzhiyun  * @index:		Index of the GID table entry to read
944*4882a593Smuzhiyun  * @gid:		Pointer to GID where to store the entry's GID
945*4882a593Smuzhiyun  *
946*4882a593Smuzhiyun  * rdma_query_gid() only reads the GID entry content for requested device,
947*4882a593Smuzhiyun  * port and index. It reads for IB, RoCE and iWarp link layers.  It doesn't
948*4882a593Smuzhiyun  * hold any reference to the GID table entry in the HCA or software cache.
949*4882a593Smuzhiyun  *
950*4882a593Smuzhiyun  * Returns 0 on success or appropriate error code.
951*4882a593Smuzhiyun  *
952*4882a593Smuzhiyun  */
rdma_query_gid(struct ib_device * device,u8 port_num,int index,union ib_gid * gid)953*4882a593Smuzhiyun int rdma_query_gid(struct ib_device *device, u8 port_num,
954*4882a593Smuzhiyun 		   int index, union ib_gid *gid)
955*4882a593Smuzhiyun {
956*4882a593Smuzhiyun 	struct ib_gid_table *table;
957*4882a593Smuzhiyun 	unsigned long flags;
958*4882a593Smuzhiyun 	int res = -EINVAL;
959*4882a593Smuzhiyun 
960*4882a593Smuzhiyun 	if (!rdma_is_port_valid(device, port_num))
961*4882a593Smuzhiyun 		return -EINVAL;
962*4882a593Smuzhiyun 
963*4882a593Smuzhiyun 	table = rdma_gid_table(device, port_num);
964*4882a593Smuzhiyun 	read_lock_irqsave(&table->rwlock, flags);
965*4882a593Smuzhiyun 
966*4882a593Smuzhiyun 	if (index < 0 || index >= table->sz ||
967*4882a593Smuzhiyun 	    !is_gid_entry_valid(table->data_vec[index]))
968*4882a593Smuzhiyun 		goto done;
969*4882a593Smuzhiyun 
970*4882a593Smuzhiyun 	memcpy(gid, &table->data_vec[index]->attr.gid, sizeof(*gid));
971*4882a593Smuzhiyun 	res = 0;
972*4882a593Smuzhiyun 
973*4882a593Smuzhiyun done:
974*4882a593Smuzhiyun 	read_unlock_irqrestore(&table->rwlock, flags);
975*4882a593Smuzhiyun 	return res;
976*4882a593Smuzhiyun }
977*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_query_gid);
978*4882a593Smuzhiyun 
979*4882a593Smuzhiyun /**
980*4882a593Smuzhiyun  * rdma_read_gid_hw_context - Read the HW GID context from GID attribute
981*4882a593Smuzhiyun  * @attr:		Potinter to the GID attribute
982*4882a593Smuzhiyun  *
983*4882a593Smuzhiyun  * rdma_read_gid_hw_context() reads the drivers GID HW context corresponding
984*4882a593Smuzhiyun  * to the SGID attr. Callers are required to already be holding the reference
985*4882a593Smuzhiyun  * to an existing GID entry.
986*4882a593Smuzhiyun  *
987*4882a593Smuzhiyun  * Returns the HW GID context
988*4882a593Smuzhiyun  *
989*4882a593Smuzhiyun  */
rdma_read_gid_hw_context(const struct ib_gid_attr * attr)990*4882a593Smuzhiyun void *rdma_read_gid_hw_context(const struct ib_gid_attr *attr)
991*4882a593Smuzhiyun {
992*4882a593Smuzhiyun 	return container_of(attr, struct ib_gid_table_entry, attr)->context;
993*4882a593Smuzhiyun }
994*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_read_gid_hw_context);
995*4882a593Smuzhiyun 
996*4882a593Smuzhiyun /**
997*4882a593Smuzhiyun  * rdma_find_gid - Returns SGID attributes if the matching GID is found.
998*4882a593Smuzhiyun  * @device: The device to query.
999*4882a593Smuzhiyun  * @gid: The GID value to search for.
1000*4882a593Smuzhiyun  * @gid_type: The GID type to search for.
1001*4882a593Smuzhiyun  * @ndev: In RoCE, the net device of the device. NULL means ignore.
1002*4882a593Smuzhiyun  *
1003*4882a593Smuzhiyun  * rdma_find_gid() searches for the specified GID value in the software cache.
1004*4882a593Smuzhiyun  *
1005*4882a593Smuzhiyun  * Returns GID attributes if a valid GID is found or returns ERR_PTR for the
1006*4882a593Smuzhiyun  * error. The caller must invoke rdma_put_gid_attr() to release the reference.
1007*4882a593Smuzhiyun  *
1008*4882a593Smuzhiyun  */
rdma_find_gid(struct ib_device * device,const union ib_gid * gid,enum ib_gid_type gid_type,struct net_device * ndev)1009*4882a593Smuzhiyun const struct ib_gid_attr *rdma_find_gid(struct ib_device *device,
1010*4882a593Smuzhiyun 					const union ib_gid *gid,
1011*4882a593Smuzhiyun 					enum ib_gid_type gid_type,
1012*4882a593Smuzhiyun 					struct net_device *ndev)
1013*4882a593Smuzhiyun {
1014*4882a593Smuzhiyun 	unsigned long mask = GID_ATTR_FIND_MASK_GID |
1015*4882a593Smuzhiyun 			     GID_ATTR_FIND_MASK_GID_TYPE;
1016*4882a593Smuzhiyun 	struct ib_gid_attr gid_attr_val = {.ndev = ndev, .gid_type = gid_type};
1017*4882a593Smuzhiyun 	unsigned int p;
1018*4882a593Smuzhiyun 
1019*4882a593Smuzhiyun 	if (ndev)
1020*4882a593Smuzhiyun 		mask |= GID_ATTR_FIND_MASK_NETDEV;
1021*4882a593Smuzhiyun 
1022*4882a593Smuzhiyun 	rdma_for_each_port(device, p) {
1023*4882a593Smuzhiyun 		struct ib_gid_table *table;
1024*4882a593Smuzhiyun 		unsigned long flags;
1025*4882a593Smuzhiyun 		int index;
1026*4882a593Smuzhiyun 
1027*4882a593Smuzhiyun 		table = device->port_data[p].cache.gid;
1028*4882a593Smuzhiyun 		read_lock_irqsave(&table->rwlock, flags);
1029*4882a593Smuzhiyun 		index = find_gid(table, gid, &gid_attr_val, false, mask, NULL);
1030*4882a593Smuzhiyun 		if (index >= 0) {
1031*4882a593Smuzhiyun 			const struct ib_gid_attr *attr;
1032*4882a593Smuzhiyun 
1033*4882a593Smuzhiyun 			get_gid_entry(table->data_vec[index]);
1034*4882a593Smuzhiyun 			attr = &table->data_vec[index]->attr;
1035*4882a593Smuzhiyun 			read_unlock_irqrestore(&table->rwlock, flags);
1036*4882a593Smuzhiyun 			return attr;
1037*4882a593Smuzhiyun 		}
1038*4882a593Smuzhiyun 		read_unlock_irqrestore(&table->rwlock, flags);
1039*4882a593Smuzhiyun 	}
1040*4882a593Smuzhiyun 
1041*4882a593Smuzhiyun 	return ERR_PTR(-ENOENT);
1042*4882a593Smuzhiyun }
1043*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_find_gid);
1044*4882a593Smuzhiyun 
/*
 * ib_get_cached_pkey - read one entry of the cached P_Key table of a port
 * @device: device to query
 * @port_num: port number
 * @index: index into the cached P_Key table
 * @pkey: where to store the P_Key; written only on success
 *
 * Returns 0 on success, or -EINVAL if the port is not valid, the port has
 * no P_Key cache, or @index is outside the cached table.
 */
int ib_get_cached_pkey(struct ib_device *device,
		       u8                port_num,
		       int               index,
		       u16              *pkey)
{
	struct ib_pkey_cache *pkeys;
	unsigned long irq_flags;
	int rc = -EINVAL;

	if (!rdma_is_port_valid(device, port_num))
		return -EINVAL;

	read_lock_irqsave(&device->cache_lock, irq_flags);

	pkeys = device->port_data[port_num].cache.pkey;
	if (pkeys && index >= 0 && index < pkeys->table_len) {
		*pkey = pkeys->table[index];
		rc = 0;
	}

	read_unlock_irqrestore(&device->cache_lock, irq_flags);

	return rc;
}
EXPORT_SYMBOL(ib_get_cached_pkey);
1071*4882a593Smuzhiyun 
/*
 * ib_get_cached_subnet_prefix - read the cached subnet prefix of a port
 * @device: device to query
 * @port_num: port number
 * @sn_pfx: where to store the cached subnet prefix
 *
 * The cached value is sampled under the device cache_lock (read side).
 *
 * Returns 0 on success or -EINVAL if the port is not valid.
 */
int ib_get_cached_subnet_prefix(struct ib_device *device,
				u8                port_num,
				u64              *sn_pfx)
{
	unsigned long irq_flags;
	u64 prefix;

	if (!rdma_is_port_valid(device, port_num))
		return -EINVAL;

	read_lock_irqsave(&device->cache_lock, irq_flags);
	prefix = device->port_data[port_num].cache.subnet_prefix;
	read_unlock_irqrestore(&device->cache_lock, irq_flags);

	*sn_pfx = prefix;
	return 0;
}
EXPORT_SYMBOL(ib_get_cached_subnet_prefix);
1088*4882a593Smuzhiyun 
/*
 * ib_find_cached_pkey - find a P_Key in the cached P_Key table of a port
 * @device: device to query
 * @port_num: port number
 * @pkey: P_Key to look for; only the low 15 bits take part in the comparison
 * @index: where to store the table index of the match
 *
 * The first entry that matches and has bit 0x8000 set wins immediately.
 * Otherwise the last matching entry without that bit is used as a fallback
 * (presumably bit 0x8000 is the IB "full membership" bit - confirm against
 * the IB specification).
 *
 * Returns 0 with *@index set on a match, -ENOENT with *@index set to
 * (u16)-1 when nothing matches, or -EINVAL (and *@index untouched) when the
 * port is not valid or has no P_Key cache.
 */
int ib_find_cached_pkey(struct ib_device *device,
			u8                port_num,
			u16               pkey,
			u16              *index)
{
	struct ib_pkey_cache *pkeys;
	unsigned long irq_flags;
	int fallback_idx = -1;
	int rc = -EINVAL;
	int pos;

	if (!rdma_is_port_valid(device, port_num))
		return -EINVAL;

	read_lock_irqsave(&device->cache_lock, irq_flags);

	pkeys = device->port_data[port_num].cache.pkey;
	if (!pkeys)
		goto unlock;

	*index = -1;
	rc = -ENOENT;

	for (pos = 0; pos < pkeys->table_len; ++pos) {
		if ((pkeys->table[pos] & 0x7fff) != (pkey & 0x7fff))
			continue;

		if (pkeys->table[pos] & 0x8000) {
			*index = pos;
			rc = 0;
			break;
		}

		/* Remember it, but keep looking for a 0x8000 entry. */
		fallback_idx = pos;
	}

	if (rc && fallback_idx >= 0) {
		*index = fallback_idx;
		rc = 0;
	}

unlock:
	read_unlock_irqrestore(&device->cache_lock, irq_flags);

	return rc;
}
EXPORT_SYMBOL(ib_find_cached_pkey);
1134*4882a593Smuzhiyun 
/*
 * ib_find_exact_cached_pkey - find an exact P_Key value in the cached table
 * @device: device to query
 * @port_num: port number
 * @pkey: P_Key to look for; all 16 bits must match
 * @index: where to store the table index of the first match
 *
 * Returns 0 with *@index set on a match, -ENOENT with *@index set to
 * (u16)-1 when nothing matches, or -EINVAL (and *@index untouched) when the
 * port is not valid or has no P_Key cache.
 */
int ib_find_exact_cached_pkey(struct ib_device *device,
			      u8                port_num,
			      u16               pkey,
			      u16              *index)
{
	struct ib_pkey_cache *pkeys;
	unsigned long irq_flags;
	int rc = -EINVAL;
	int pos;

	if (!rdma_is_port_valid(device, port_num))
		return -EINVAL;

	read_lock_irqsave(&device->cache_lock, irq_flags);

	pkeys = device->port_data[port_num].cache.pkey;
	if (pkeys) {
		*index = -1;
		rc = -ENOENT;

		for (pos = 0; pos < pkeys->table_len; ++pos) {
			if (pkeys->table[pos] != pkey)
				continue;

			*index = pos;
			rc = 0;
			break;
		}
	}

	read_unlock_irqrestore(&device->cache_lock, irq_flags);

	return rc;
}
EXPORT_SYMBOL(ib_find_exact_cached_pkey);
1171*4882a593Smuzhiyun 
/*
 * ib_get_cached_lmc - read the cached LMC value of a port
 * @device: device to query
 * @port_num: port number
 * @lmc: where to store the cached value
 *
 * The cached value is sampled under the device cache_lock (read side).
 *
 * Returns 0 on success or -EINVAL if the port is not valid.
 */
int ib_get_cached_lmc(struct ib_device *device,
		      u8                port_num,
		      u8                *lmc)
{
	unsigned long irq_flags;
	u8 cached;

	if (!rdma_is_port_valid(device, port_num))
		return -EINVAL;

	read_lock_irqsave(&device->cache_lock, irq_flags);
	cached = device->port_data[port_num].cache.lmc;
	read_unlock_irqrestore(&device->cache_lock, irq_flags);

	*lmc = cached;
	return 0;
}
EXPORT_SYMBOL(ib_get_cached_lmc);
1189*4882a593Smuzhiyun 
/*
 * ib_get_cached_port_state - read the cached state of a port
 * @device: device to query
 * @port_num: port number
 * @port_state: where to store the cached port state
 *
 * The cached value is sampled under the device cache_lock (read side).
 *
 * Returns 0 on success or -EINVAL if the port is not valid.
 */
int ib_get_cached_port_state(struct ib_device   *device,
			     u8                  port_num,
			     enum ib_port_state *port_state)
{
	enum ib_port_state cached;
	unsigned long irq_flags;

	if (!rdma_is_port_valid(device, port_num))
		return -EINVAL;

	read_lock_irqsave(&device->cache_lock, irq_flags);
	cached = device->port_data[port_num].cache.port_state;
	read_unlock_irqrestore(&device->cache_lock, irq_flags);

	*port_state = cached;
	return 0;
}
EXPORT_SYMBOL(ib_get_cached_port_state);
1207*4882a593Smuzhiyun 
1208*4882a593Smuzhiyun /**
1209*4882a593Smuzhiyun  * rdma_get_gid_attr - Returns GID attributes for a port of a device
1210*4882a593Smuzhiyun  * at a requested gid_index, if a valid GID entry exists.
1211*4882a593Smuzhiyun  * @device:		The device to query.
1212*4882a593Smuzhiyun  * @port_num:		The port number on the device where the GID value
1213*4882a593Smuzhiyun  *			is to be queried.
1214*4882a593Smuzhiyun  * @index:		Index of the GID table entry whose attributes are to
1215*4882a593Smuzhiyun  *                      be queried.
1216*4882a593Smuzhiyun  *
1217*4882a593Smuzhiyun  * rdma_get_gid_attr() acquires reference count of gid attributes from the
1218*4882a593Smuzhiyun  * cached GID table. Caller must invoke rdma_put_gid_attr() to release
1219*4882a593Smuzhiyun  * reference to gid attribute regardless of link layer.
1220*4882a593Smuzhiyun  *
1221*4882a593Smuzhiyun  * Returns pointer to valid gid attribute or ERR_PTR for the appropriate error
1222*4882a593Smuzhiyun  * code.
1223*4882a593Smuzhiyun  */
1224*4882a593Smuzhiyun const struct ib_gid_attr *
rdma_get_gid_attr(struct ib_device * device,u8 port_num,int index)1225*4882a593Smuzhiyun rdma_get_gid_attr(struct ib_device *device, u8 port_num, int index)
1226*4882a593Smuzhiyun {
1227*4882a593Smuzhiyun 	const struct ib_gid_attr *attr = ERR_PTR(-ENODATA);
1228*4882a593Smuzhiyun 	struct ib_gid_table *table;
1229*4882a593Smuzhiyun 	unsigned long flags;
1230*4882a593Smuzhiyun 
1231*4882a593Smuzhiyun 	if (!rdma_is_port_valid(device, port_num))
1232*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
1233*4882a593Smuzhiyun 
1234*4882a593Smuzhiyun 	table = rdma_gid_table(device, port_num);
1235*4882a593Smuzhiyun 	if (index < 0 || index >= table->sz)
1236*4882a593Smuzhiyun 		return ERR_PTR(-EINVAL);
1237*4882a593Smuzhiyun 
1238*4882a593Smuzhiyun 	read_lock_irqsave(&table->rwlock, flags);
1239*4882a593Smuzhiyun 	if (!is_gid_entry_valid(table->data_vec[index]))
1240*4882a593Smuzhiyun 		goto done;
1241*4882a593Smuzhiyun 
1242*4882a593Smuzhiyun 	get_gid_entry(table->data_vec[index]);
1243*4882a593Smuzhiyun 	attr = &table->data_vec[index]->attr;
1244*4882a593Smuzhiyun done:
1245*4882a593Smuzhiyun 	read_unlock_irqrestore(&table->rwlock, flags);
1246*4882a593Smuzhiyun 	return attr;
1247*4882a593Smuzhiyun }
1248*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_get_gid_attr);
1249*4882a593Smuzhiyun 
1250*4882a593Smuzhiyun /**
1251*4882a593Smuzhiyun  * rdma_query_gid_table - Reads GID table entries of all the ports of a device up to max_entries.
1252*4882a593Smuzhiyun  * @device: The device to query.
1253*4882a593Smuzhiyun  * @entries: Entries where GID entries are returned.
1254*4882a593Smuzhiyun  * @max_entries: Maximum number of entries that can be returned.
1255*4882a593Smuzhiyun  * Entries array must be allocated to hold max_entries number of entries.
1256*4882a593Smuzhiyun  * @num_entries: Updated to the number of entries that were successfully read.
1257*4882a593Smuzhiyun  *
1258*4882a593Smuzhiyun  * Returns number of entries on success or appropriate error code.
1259*4882a593Smuzhiyun  */
rdma_query_gid_table(struct ib_device * device,struct ib_uverbs_gid_entry * entries,size_t max_entries)1260*4882a593Smuzhiyun ssize_t rdma_query_gid_table(struct ib_device *device,
1261*4882a593Smuzhiyun 			     struct ib_uverbs_gid_entry *entries,
1262*4882a593Smuzhiyun 			     size_t max_entries)
1263*4882a593Smuzhiyun {
1264*4882a593Smuzhiyun 	const struct ib_gid_attr *gid_attr;
1265*4882a593Smuzhiyun 	ssize_t num_entries = 0, ret;
1266*4882a593Smuzhiyun 	struct ib_gid_table *table;
1267*4882a593Smuzhiyun 	unsigned int port_num, i;
1268*4882a593Smuzhiyun 	struct net_device *ndev;
1269*4882a593Smuzhiyun 	unsigned long flags;
1270*4882a593Smuzhiyun 
1271*4882a593Smuzhiyun 	rdma_for_each_port(device, port_num) {
1272*4882a593Smuzhiyun 		table = rdma_gid_table(device, port_num);
1273*4882a593Smuzhiyun 		read_lock_irqsave(&table->rwlock, flags);
1274*4882a593Smuzhiyun 		for (i = 0; i < table->sz; i++) {
1275*4882a593Smuzhiyun 			if (!is_gid_entry_valid(table->data_vec[i]))
1276*4882a593Smuzhiyun 				continue;
1277*4882a593Smuzhiyun 			if (num_entries >= max_entries) {
1278*4882a593Smuzhiyun 				ret = -EINVAL;
1279*4882a593Smuzhiyun 				goto err;
1280*4882a593Smuzhiyun 			}
1281*4882a593Smuzhiyun 
1282*4882a593Smuzhiyun 			gid_attr = &table->data_vec[i]->attr;
1283*4882a593Smuzhiyun 
1284*4882a593Smuzhiyun 			memcpy(&entries->gid, &gid_attr->gid,
1285*4882a593Smuzhiyun 			       sizeof(gid_attr->gid));
1286*4882a593Smuzhiyun 			entries->gid_index = gid_attr->index;
1287*4882a593Smuzhiyun 			entries->port_num = gid_attr->port_num;
1288*4882a593Smuzhiyun 			entries->gid_type = gid_attr->gid_type;
1289*4882a593Smuzhiyun 			ndev = rcu_dereference_protected(
1290*4882a593Smuzhiyun 				gid_attr->ndev,
1291*4882a593Smuzhiyun 				lockdep_is_held(&table->rwlock));
1292*4882a593Smuzhiyun 			if (ndev)
1293*4882a593Smuzhiyun 				entries->netdev_ifindex = ndev->ifindex;
1294*4882a593Smuzhiyun 
1295*4882a593Smuzhiyun 			num_entries++;
1296*4882a593Smuzhiyun 			entries++;
1297*4882a593Smuzhiyun 		}
1298*4882a593Smuzhiyun 		read_unlock_irqrestore(&table->rwlock, flags);
1299*4882a593Smuzhiyun 	}
1300*4882a593Smuzhiyun 
1301*4882a593Smuzhiyun 	return num_entries;
1302*4882a593Smuzhiyun err:
1303*4882a593Smuzhiyun 	read_unlock_irqrestore(&table->rwlock, flags);
1304*4882a593Smuzhiyun 	return ret;
1305*4882a593Smuzhiyun }
1306*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_query_gid_table);
1307*4882a593Smuzhiyun 
1308*4882a593Smuzhiyun /**
1309*4882a593Smuzhiyun  * rdma_put_gid_attr - Release reference to the GID attribute
1310*4882a593Smuzhiyun  * @attr:		Pointer to the GID attribute whose reference
1311*4882a593Smuzhiyun  *			needs to be released.
1312*4882a593Smuzhiyun  *
1313*4882a593Smuzhiyun  * rdma_put_gid_attr() must be used to release reference whose
1314*4882a593Smuzhiyun  * reference is acquired using rdma_get_gid_attr() or any APIs
1315*4882a593Smuzhiyun  * which returns a pointer to the ib_gid_attr regardless of link layer
1316*4882a593Smuzhiyun  * of IB or RoCE.
1317*4882a593Smuzhiyun  *
1318*4882a593Smuzhiyun  */
rdma_put_gid_attr(const struct ib_gid_attr * attr)1319*4882a593Smuzhiyun void rdma_put_gid_attr(const struct ib_gid_attr *attr)
1320*4882a593Smuzhiyun {
1321*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry =
1322*4882a593Smuzhiyun 		container_of(attr, struct ib_gid_table_entry, attr);
1323*4882a593Smuzhiyun 
1324*4882a593Smuzhiyun 	put_gid_entry(entry);
1325*4882a593Smuzhiyun }
1326*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_put_gid_attr);
1327*4882a593Smuzhiyun 
1328*4882a593Smuzhiyun /**
1329*4882a593Smuzhiyun  * rdma_hold_gid_attr - Get reference to existing GID attribute
1330*4882a593Smuzhiyun  *
1331*4882a593Smuzhiyun  * @attr:		Pointer to the GID attribute whose reference
1332*4882a593Smuzhiyun  *			needs to be taken.
1333*4882a593Smuzhiyun  *
1334*4882a593Smuzhiyun  * Increase the reference count to a GID attribute to keep it from being
1335*4882a593Smuzhiyun  * freed. Callers are required to already be holding a reference to attribute.
1336*4882a593Smuzhiyun  *
1337*4882a593Smuzhiyun  */
rdma_hold_gid_attr(const struct ib_gid_attr * attr)1338*4882a593Smuzhiyun void rdma_hold_gid_attr(const struct ib_gid_attr *attr)
1339*4882a593Smuzhiyun {
1340*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry =
1341*4882a593Smuzhiyun 		container_of(attr, struct ib_gid_table_entry, attr);
1342*4882a593Smuzhiyun 
1343*4882a593Smuzhiyun 	get_gid_entry(entry);
1344*4882a593Smuzhiyun }
1345*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_hold_gid_attr);
1346*4882a593Smuzhiyun 
1347*4882a593Smuzhiyun /**
1348*4882a593Smuzhiyun  * rdma_read_gid_attr_ndev_rcu - Read GID attribute netdevice
1349*4882a593Smuzhiyun  * which must be in UP state.
1350*4882a593Smuzhiyun  *
1351*4882a593Smuzhiyun  * @attr:Pointer to the GID attribute
1352*4882a593Smuzhiyun  *
1353*4882a593Smuzhiyun  * Returns pointer to netdevice if the netdevice was attached to GID and
1354*4882a593Smuzhiyun  * netdevice is in UP state. Caller must hold RCU lock as this API
1355*4882a593Smuzhiyun  * reads the netdev flags which can change while netdevice migrates to
1356*4882a593Smuzhiyun  * different net namespace. Returns ERR_PTR with error code otherwise.
1357*4882a593Smuzhiyun  *
1358*4882a593Smuzhiyun  */
rdma_read_gid_attr_ndev_rcu(const struct ib_gid_attr * attr)1359*4882a593Smuzhiyun struct net_device *rdma_read_gid_attr_ndev_rcu(const struct ib_gid_attr *attr)
1360*4882a593Smuzhiyun {
1361*4882a593Smuzhiyun 	struct ib_gid_table_entry *entry =
1362*4882a593Smuzhiyun 			container_of(attr, struct ib_gid_table_entry, attr);
1363*4882a593Smuzhiyun 	struct ib_device *device = entry->attr.device;
1364*4882a593Smuzhiyun 	struct net_device *ndev = ERR_PTR(-EINVAL);
1365*4882a593Smuzhiyun 	u8 port_num = entry->attr.port_num;
1366*4882a593Smuzhiyun 	struct ib_gid_table *table;
1367*4882a593Smuzhiyun 	unsigned long flags;
1368*4882a593Smuzhiyun 	bool valid;
1369*4882a593Smuzhiyun 
1370*4882a593Smuzhiyun 	table = rdma_gid_table(device, port_num);
1371*4882a593Smuzhiyun 
1372*4882a593Smuzhiyun 	read_lock_irqsave(&table->rwlock, flags);
1373*4882a593Smuzhiyun 	valid = is_gid_entry_valid(table->data_vec[attr->index]);
1374*4882a593Smuzhiyun 	if (valid) {
1375*4882a593Smuzhiyun 		ndev = rcu_dereference(attr->ndev);
1376*4882a593Smuzhiyun 		if (!ndev)
1377*4882a593Smuzhiyun 			ndev = ERR_PTR(-ENODEV);
1378*4882a593Smuzhiyun 	}
1379*4882a593Smuzhiyun 	read_unlock_irqrestore(&table->rwlock, flags);
1380*4882a593Smuzhiyun 	return ndev;
1381*4882a593Smuzhiyun }
1382*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_read_gid_attr_ndev_rcu);
1383*4882a593Smuzhiyun 
get_lower_dev_vlan(struct net_device * lower_dev,struct netdev_nested_priv * priv)1384*4882a593Smuzhiyun static int get_lower_dev_vlan(struct net_device *lower_dev,
1385*4882a593Smuzhiyun 			      struct netdev_nested_priv *priv)
1386*4882a593Smuzhiyun {
1387*4882a593Smuzhiyun 	u16 *vlan_id = (u16 *)priv->data;
1388*4882a593Smuzhiyun 
1389*4882a593Smuzhiyun 	if (is_vlan_dev(lower_dev))
1390*4882a593Smuzhiyun 		*vlan_id = vlan_dev_vlan_id(lower_dev);
1391*4882a593Smuzhiyun 
1392*4882a593Smuzhiyun 	/* We are interested only in first level vlan device, so
1393*4882a593Smuzhiyun 	 * always return 1 to stop iterating over next level devices.
1394*4882a593Smuzhiyun 	 */
1395*4882a593Smuzhiyun 	return 1;
1396*4882a593Smuzhiyun }
1397*4882a593Smuzhiyun 
1398*4882a593Smuzhiyun /**
1399*4882a593Smuzhiyun  * rdma_read_gid_l2_fields - Read the vlan ID and source MAC address
1400*4882a593Smuzhiyun  *			     of a GID entry.
1401*4882a593Smuzhiyun  *
1402*4882a593Smuzhiyun  * @attr:	GID attribute pointer whose L2 fields to be read
1403*4882a593Smuzhiyun  * @vlan_id:	Pointer to vlan id to fill up if the GID entry has
1404*4882a593Smuzhiyun  *		vlan id. It is optional.
1405*4882a593Smuzhiyun  * @smac:	Pointer to smac to fill up for a GID entry. It is optional.
1406*4882a593Smuzhiyun  *
1407*4882a593Smuzhiyun  * rdma_read_gid_l2_fields() returns 0 on success and returns vlan id
1408*4882a593Smuzhiyun  * (if gid entry has vlan) and source MAC, or returns error.
1409*4882a593Smuzhiyun  */
rdma_read_gid_l2_fields(const struct ib_gid_attr * attr,u16 * vlan_id,u8 * smac)1410*4882a593Smuzhiyun int rdma_read_gid_l2_fields(const struct ib_gid_attr *attr,
1411*4882a593Smuzhiyun 			    u16 *vlan_id, u8 *smac)
1412*4882a593Smuzhiyun {
1413*4882a593Smuzhiyun 	struct netdev_nested_priv priv = {
1414*4882a593Smuzhiyun 		.data = (void *)vlan_id,
1415*4882a593Smuzhiyun 	};
1416*4882a593Smuzhiyun 	struct net_device *ndev;
1417*4882a593Smuzhiyun 
1418*4882a593Smuzhiyun 	rcu_read_lock();
1419*4882a593Smuzhiyun 	ndev = rcu_dereference(attr->ndev);
1420*4882a593Smuzhiyun 	if (!ndev) {
1421*4882a593Smuzhiyun 		rcu_read_unlock();
1422*4882a593Smuzhiyun 		return -ENODEV;
1423*4882a593Smuzhiyun 	}
1424*4882a593Smuzhiyun 	if (smac)
1425*4882a593Smuzhiyun 		ether_addr_copy(smac, ndev->dev_addr);
1426*4882a593Smuzhiyun 	if (vlan_id) {
1427*4882a593Smuzhiyun 		*vlan_id = 0xffff;
1428*4882a593Smuzhiyun 		if (is_vlan_dev(ndev)) {
1429*4882a593Smuzhiyun 			*vlan_id = vlan_dev_vlan_id(ndev);
1430*4882a593Smuzhiyun 		} else {
1431*4882a593Smuzhiyun 			/* If the netdev is upper device and if it's lower
1432*4882a593Smuzhiyun 			 * device is vlan device, consider vlan id of the
1433*4882a593Smuzhiyun 			 * the lower vlan device for this gid entry.
1434*4882a593Smuzhiyun 			 */
1435*4882a593Smuzhiyun 			netdev_walk_all_lower_dev_rcu(attr->ndev,
1436*4882a593Smuzhiyun 					get_lower_dev_vlan, &priv);
1437*4882a593Smuzhiyun 		}
1438*4882a593Smuzhiyun 	}
1439*4882a593Smuzhiyun 	rcu_read_unlock();
1440*4882a593Smuzhiyun 	return 0;
1441*4882a593Smuzhiyun }
1442*4882a593Smuzhiyun EXPORT_SYMBOL(rdma_read_gid_l2_fields);
1443*4882a593Smuzhiyun 
/*
 * Refresh the cached GID table of @port by asking the driver for each of
 * the first @gid_tbl_len GID indices and storing the answer in the table.
 *
 * The whole refresh runs with the table mutex held. If the driver has no
 * query_gid operation nothing is stored and 0 is returned. The first
 * query_gid failure is logged, stops the refresh and is returned to the
 * caller; entries stored before the failure are kept.
 */
static int config_non_roce_gid_cache(struct ib_device *device,
				     u8 port, int gid_tbl_len)
{
	struct ib_gid_attr gid_attr = {
		.device = device,
		.port_num = port,
	};
	struct ib_gid_table *table = rdma_gid_table(device, port);
	int status = 0;
	int idx;

	mutex_lock(&table->lock);
	for (idx = 0; idx < gid_tbl_len; ++idx) {
		if (!device->ops.query_gid)
			continue;

		status = device->ops.query_gid(device, port, idx,
					       &gid_attr.gid);
		if (status) {
			dev_warn(&device->dev,
				 "query_gid failed (%d) for index %d\n", status,
				 idx);
			break;
		}

		gid_attr.index = idx;
		add_modify_gid(table, &gid_attr);
	}
	mutex_unlock(&table->lock);

	return status;
}
1474*4882a593Smuzhiyun 
1475*4882a593Smuzhiyun static int
ib_cache_update(struct ib_device * device,u8 port,bool enforce_security)1476*4882a593Smuzhiyun ib_cache_update(struct ib_device *device, u8 port, bool enforce_security)
1477*4882a593Smuzhiyun {
1478*4882a593Smuzhiyun 	struct ib_port_attr       *tprops = NULL;
1479*4882a593Smuzhiyun 	struct ib_pkey_cache      *pkey_cache = NULL, *old_pkey_cache;
1480*4882a593Smuzhiyun 	int                        i;
1481*4882a593Smuzhiyun 	int                        ret;
1482*4882a593Smuzhiyun 
1483*4882a593Smuzhiyun 	if (!rdma_is_port_valid(device, port))
1484*4882a593Smuzhiyun 		return -EINVAL;
1485*4882a593Smuzhiyun 
1486*4882a593Smuzhiyun 	tprops = kmalloc(sizeof *tprops, GFP_KERNEL);
1487*4882a593Smuzhiyun 	if (!tprops)
1488*4882a593Smuzhiyun 		return -ENOMEM;
1489*4882a593Smuzhiyun 
1490*4882a593Smuzhiyun 	ret = ib_query_port(device, port, tprops);
1491*4882a593Smuzhiyun 	if (ret) {
1492*4882a593Smuzhiyun 		dev_warn(&device->dev, "ib_query_port failed (%d)\n", ret);
1493*4882a593Smuzhiyun 		goto err;
1494*4882a593Smuzhiyun 	}
1495*4882a593Smuzhiyun 
1496*4882a593Smuzhiyun 	if (!rdma_protocol_roce(device, port)) {
1497*4882a593Smuzhiyun 		ret = config_non_roce_gid_cache(device, port,
1498*4882a593Smuzhiyun 						tprops->gid_tbl_len);
1499*4882a593Smuzhiyun 		if (ret)
1500*4882a593Smuzhiyun 			goto err;
1501*4882a593Smuzhiyun 	}
1502*4882a593Smuzhiyun 
1503*4882a593Smuzhiyun 	if (tprops->pkey_tbl_len) {
1504*4882a593Smuzhiyun 		pkey_cache = kmalloc(struct_size(pkey_cache, table,
1505*4882a593Smuzhiyun 						 tprops->pkey_tbl_len),
1506*4882a593Smuzhiyun 				     GFP_KERNEL);
1507*4882a593Smuzhiyun 		if (!pkey_cache) {
1508*4882a593Smuzhiyun 			ret = -ENOMEM;
1509*4882a593Smuzhiyun 			goto err;
1510*4882a593Smuzhiyun 		}
1511*4882a593Smuzhiyun 
1512*4882a593Smuzhiyun 		pkey_cache->table_len = tprops->pkey_tbl_len;
1513*4882a593Smuzhiyun 
1514*4882a593Smuzhiyun 		for (i = 0; i < pkey_cache->table_len; ++i) {
1515*4882a593Smuzhiyun 			ret = ib_query_pkey(device, port, i,
1516*4882a593Smuzhiyun 					    pkey_cache->table + i);
1517*4882a593Smuzhiyun 			if (ret) {
1518*4882a593Smuzhiyun 				dev_warn(&device->dev,
1519*4882a593Smuzhiyun 					 "ib_query_pkey failed (%d) for index %d\n",
1520*4882a593Smuzhiyun 					 ret, i);
1521*4882a593Smuzhiyun 				goto err;
1522*4882a593Smuzhiyun 			}
1523*4882a593Smuzhiyun 		}
1524*4882a593Smuzhiyun 	}
1525*4882a593Smuzhiyun 
1526*4882a593Smuzhiyun 	write_lock_irq(&device->cache_lock);
1527*4882a593Smuzhiyun 
1528*4882a593Smuzhiyun 	old_pkey_cache = device->port_data[port].cache.pkey;
1529*4882a593Smuzhiyun 
1530*4882a593Smuzhiyun 	device->port_data[port].cache.pkey = pkey_cache;
1531*4882a593Smuzhiyun 	device->port_data[port].cache.lmc = tprops->lmc;
1532*4882a593Smuzhiyun 	device->port_data[port].cache.port_state = tprops->state;
1533*4882a593Smuzhiyun 
1534*4882a593Smuzhiyun 	device->port_data[port].cache.subnet_prefix = tprops->subnet_prefix;
1535*4882a593Smuzhiyun 	write_unlock_irq(&device->cache_lock);
1536*4882a593Smuzhiyun 
1537*4882a593Smuzhiyun 	if (enforce_security)
1538*4882a593Smuzhiyun 		ib_security_cache_change(device,
1539*4882a593Smuzhiyun 					 port,
1540*4882a593Smuzhiyun 					 tprops->subnet_prefix);
1541*4882a593Smuzhiyun 
1542*4882a593Smuzhiyun 	kfree(old_pkey_cache);
1543*4882a593Smuzhiyun 	kfree(tprops);
1544*4882a593Smuzhiyun 	return 0;
1545*4882a593Smuzhiyun 
1546*4882a593Smuzhiyun err:
1547*4882a593Smuzhiyun 	kfree(pkey_cache);
1548*4882a593Smuzhiyun 	kfree(tprops);
1549*4882a593Smuzhiyun 	return ret;
1550*4882a593Smuzhiyun }
1551*4882a593Smuzhiyun 
ib_cache_event_task(struct work_struct * _work)1552*4882a593Smuzhiyun static void ib_cache_event_task(struct work_struct *_work)
1553*4882a593Smuzhiyun {
1554*4882a593Smuzhiyun 	struct ib_update_work *work =
1555*4882a593Smuzhiyun 		container_of(_work, struct ib_update_work, work);
1556*4882a593Smuzhiyun 	int ret;
1557*4882a593Smuzhiyun 
1558*4882a593Smuzhiyun 	/* Before distributing the cache update event, first sync
1559*4882a593Smuzhiyun 	 * the cache.
1560*4882a593Smuzhiyun 	 */
1561*4882a593Smuzhiyun 	ret = ib_cache_update(work->event.device, work->event.element.port_num,
1562*4882a593Smuzhiyun 			      work->enforce_security);
1563*4882a593Smuzhiyun 
1564*4882a593Smuzhiyun 	/* GID event is notified already for individual GID entries by
1565*4882a593Smuzhiyun 	 * dispatch_gid_change_event(). Hence, notifiy for rest of the
1566*4882a593Smuzhiyun 	 * events.
1567*4882a593Smuzhiyun 	 */
1568*4882a593Smuzhiyun 	if (!ret && work->event.event != IB_EVENT_GID_CHANGE)
1569*4882a593Smuzhiyun 		ib_dispatch_event_clients(&work->event);
1570*4882a593Smuzhiyun 
1571*4882a593Smuzhiyun 	kfree(work);
1572*4882a593Smuzhiyun }
1573*4882a593Smuzhiyun 
ib_generic_event_task(struct work_struct * _work)1574*4882a593Smuzhiyun static void ib_generic_event_task(struct work_struct *_work)
1575*4882a593Smuzhiyun {
1576*4882a593Smuzhiyun 	struct ib_update_work *work =
1577*4882a593Smuzhiyun 		container_of(_work, struct ib_update_work, work);
1578*4882a593Smuzhiyun 
1579*4882a593Smuzhiyun 	ib_dispatch_event_clients(&work->event);
1580*4882a593Smuzhiyun 	kfree(work);
1581*4882a593Smuzhiyun }
1582*4882a593Smuzhiyun 
is_cache_update_event(const struct ib_event * event)1583*4882a593Smuzhiyun static bool is_cache_update_event(const struct ib_event *event)
1584*4882a593Smuzhiyun {
1585*4882a593Smuzhiyun 	return (event->event == IB_EVENT_PORT_ERR    ||
1586*4882a593Smuzhiyun 		event->event == IB_EVENT_PORT_ACTIVE ||
1587*4882a593Smuzhiyun 		event->event == IB_EVENT_LID_CHANGE  ||
1588*4882a593Smuzhiyun 		event->event == IB_EVENT_PKEY_CHANGE ||
1589*4882a593Smuzhiyun 		event->event == IB_EVENT_CLIENT_REREGISTER ||
1590*4882a593Smuzhiyun 		event->event == IB_EVENT_GID_CHANGE);
1591*4882a593Smuzhiyun }
1592*4882a593Smuzhiyun 
1593*4882a593Smuzhiyun /**
1594*4882a593Smuzhiyun  * ib_dispatch_event - Dispatch an asynchronous event
1595*4882a593Smuzhiyun  * @event:Event to dispatch
1596*4882a593Smuzhiyun  *
1597*4882a593Smuzhiyun  * Low-level drivers must call ib_dispatch_event() to dispatch the
1598*4882a593Smuzhiyun  * event to all registered event handlers when an asynchronous event
1599*4882a593Smuzhiyun  * occurs.
1600*4882a593Smuzhiyun  */
ib_dispatch_event(const struct ib_event * event)1601*4882a593Smuzhiyun void ib_dispatch_event(const struct ib_event *event)
1602*4882a593Smuzhiyun {
1603*4882a593Smuzhiyun 	struct ib_update_work *work;
1604*4882a593Smuzhiyun 
1605*4882a593Smuzhiyun 	work = kzalloc(sizeof(*work), GFP_ATOMIC);
1606*4882a593Smuzhiyun 	if (!work)
1607*4882a593Smuzhiyun 		return;
1608*4882a593Smuzhiyun 
1609*4882a593Smuzhiyun 	if (is_cache_update_event(event))
1610*4882a593Smuzhiyun 		INIT_WORK(&work->work, ib_cache_event_task);
1611*4882a593Smuzhiyun 	else
1612*4882a593Smuzhiyun 		INIT_WORK(&work->work, ib_generic_event_task);
1613*4882a593Smuzhiyun 
1614*4882a593Smuzhiyun 	work->event = *event;
1615*4882a593Smuzhiyun 	if (event->event == IB_EVENT_PKEY_CHANGE ||
1616*4882a593Smuzhiyun 	    event->event == IB_EVENT_GID_CHANGE)
1617*4882a593Smuzhiyun 		work->enforce_security = true;
1618*4882a593Smuzhiyun 
1619*4882a593Smuzhiyun 	queue_work(ib_wq, &work->work);
1620*4882a593Smuzhiyun }
1621*4882a593Smuzhiyun EXPORT_SYMBOL(ib_dispatch_event);
1622*4882a593Smuzhiyun 
ib_cache_setup_one(struct ib_device * device)1623*4882a593Smuzhiyun int ib_cache_setup_one(struct ib_device *device)
1624*4882a593Smuzhiyun {
1625*4882a593Smuzhiyun 	unsigned int p;
1626*4882a593Smuzhiyun 	int err;
1627*4882a593Smuzhiyun 
1628*4882a593Smuzhiyun 	rwlock_init(&device->cache_lock);
1629*4882a593Smuzhiyun 
1630*4882a593Smuzhiyun 	err = gid_table_setup_one(device);
1631*4882a593Smuzhiyun 	if (err)
1632*4882a593Smuzhiyun 		return err;
1633*4882a593Smuzhiyun 
1634*4882a593Smuzhiyun 	rdma_for_each_port (device, p) {
1635*4882a593Smuzhiyun 		err = ib_cache_update(device, p, true);
1636*4882a593Smuzhiyun 		if (err)
1637*4882a593Smuzhiyun 			return err;
1638*4882a593Smuzhiyun 	}
1639*4882a593Smuzhiyun 
1640*4882a593Smuzhiyun 	return 0;
1641*4882a593Smuzhiyun }
1642*4882a593Smuzhiyun 
ib_cache_release_one(struct ib_device * device)1643*4882a593Smuzhiyun void ib_cache_release_one(struct ib_device *device)
1644*4882a593Smuzhiyun {
1645*4882a593Smuzhiyun 	unsigned int p;
1646*4882a593Smuzhiyun 
1647*4882a593Smuzhiyun 	/*
1648*4882a593Smuzhiyun 	 * The release function frees all the cache elements.
1649*4882a593Smuzhiyun 	 * This function should be called as part of freeing
1650*4882a593Smuzhiyun 	 * all the device's resources when the cache could no
1651*4882a593Smuzhiyun 	 * longer be accessed.
1652*4882a593Smuzhiyun 	 */
1653*4882a593Smuzhiyun 	rdma_for_each_port (device, p)
1654*4882a593Smuzhiyun 		kfree(device->port_data[p].cache.pkey);
1655*4882a593Smuzhiyun 
1656*4882a593Smuzhiyun 	gid_table_release_one(device);
1657*4882a593Smuzhiyun }
1658*4882a593Smuzhiyun 
ib_cache_cleanup_one(struct ib_device * device)1659*4882a593Smuzhiyun void ib_cache_cleanup_one(struct ib_device *device)
1660*4882a593Smuzhiyun {
1661*4882a593Smuzhiyun 	/* The cleanup function waits for all in-progress workqueue
1662*4882a593Smuzhiyun 	 * elements and cleans up the GID cache. This function should be
1663*4882a593Smuzhiyun 	 * called after the device was removed from the devices list and
1664*4882a593Smuzhiyun 	 * all clients were removed, so the cache exists but is
1665*4882a593Smuzhiyun 	 * non-functional and shouldn't be updated anymore.
1666*4882a593Smuzhiyun 	 */
1667*4882a593Smuzhiyun 	flush_workqueue(ib_wq);
1668*4882a593Smuzhiyun 	gid_table_cleanup_one(device);
1669*4882a593Smuzhiyun 
1670*4882a593Smuzhiyun 	/*
1671*4882a593Smuzhiyun 	 * Flush the wq second time for any pending GID delete work.
1672*4882a593Smuzhiyun 	 */
1673*4882a593Smuzhiyun 	flush_workqueue(ib_wq);
1674*4882a593Smuzhiyun }
1675