// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * net/l3mdev/l3mdev.c - L3 master device implementation
 * Copyright (c) 2015 Cumulus Networks
 * Copyright (c) 2015 David Ahern <dsa@cumulusnetworks.com>
 */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <linux/netdevice.h>
9*4882a593Smuzhiyun #include <net/fib_rules.h>
10*4882a593Smuzhiyun #include <net/l3mdev.h>
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun static DEFINE_SPINLOCK(l3mdev_lock);
13*4882a593Smuzhiyun
14*4882a593Smuzhiyun struct l3mdev_handler {
15*4882a593Smuzhiyun lookup_by_table_id_t dev_lookup;
16*4882a593Smuzhiyun };
17*4882a593Smuzhiyun
18*4882a593Smuzhiyun static struct l3mdev_handler l3mdev_handlers[L3MDEV_TYPE_MAX + 1];
19*4882a593Smuzhiyun
l3mdev_check_type(enum l3mdev_type l3type)20*4882a593Smuzhiyun static int l3mdev_check_type(enum l3mdev_type l3type)
21*4882a593Smuzhiyun {
22*4882a593Smuzhiyun if (l3type <= L3MDEV_TYPE_UNSPEC || l3type > L3MDEV_TYPE_MAX)
23*4882a593Smuzhiyun return -EINVAL;
24*4882a593Smuzhiyun
25*4882a593Smuzhiyun return 0;
26*4882a593Smuzhiyun }
27*4882a593Smuzhiyun
/**
 * l3mdev_table_lookup_register - install a table-id lookup handler
 * @l3type: l3mdev type the handler is installed for
 * @fn: lookup callback to store in the handler slot of @l3type
 *
 * Return: 0 on success, -EINVAL if @l3type is out of range or @fn is
 * NULL, -EBUSY if a handler is already installed for @l3type.
 */
int l3mdev_table_lookup_register(enum l3mdev_type l3type,
				 lookup_by_table_id_t fn)
{
	struct l3mdev_handler *hdlr;
	int res;

	res = l3mdev_check_type(l3type);
	if (res)
		return res;

	/* Storing NULL would leave the slot empty while reporting success. */
	if (!fn)
		return -EINVAL;

	hdlr = &l3mdev_handlers[l3type];

	spin_lock(&l3mdev_lock);

	/* A slot holds a single handler; never replace an existing one. */
	if (hdlr->dev_lookup) {
		res = -EBUSY;
		goto unlock;
	}

	hdlr->dev_lookup = fn;

unlock:
	spin_unlock(&l3mdev_lock);

	return res;
}
EXPORT_SYMBOL_GPL(l3mdev_table_lookup_register);
56*4882a593Smuzhiyun
/**
 * l3mdev_table_lookup_unregister - remove a table-id lookup handler
 * @l3type: l3mdev type whose handler slot is to be cleared
 * @fn: callback expected to be installed in that slot
 *
 * Does nothing when @l3type is out of range or when the slot currently
 * holds a callback other than @fn.
 */
void l3mdev_table_lookup_unregister(enum l3mdev_type l3type,
				    lookup_by_table_id_t fn)
{
	struct l3mdev_handler *slot;

	if (l3mdev_check_type(l3type) != 0)
		return;

	slot = l3mdev_handlers + l3type;

	spin_lock(&l3mdev_lock);
	/* Clear the slot only if it still holds the caller's callback. */
	if (slot->dev_lookup == fn)
		slot->dev_lookup = NULL;
	spin_unlock(&l3mdev_lock);
}
EXPORT_SYMBOL_GPL(l3mdev_table_lookup_unregister);
75*4882a593Smuzhiyun
/**
 * l3mdev_ifindex_lookup_by_table_id - run the registered table-id lookup
 * @l3type: l3mdev type selecting the handler slot
 * @net: network namespace passed through to the handler
 * @table_id: table id passed through to the handler
 *
 * The handler is invoked with l3mdev_lock held.
 *
 * Return: the value returned by the registered handler, or -EINVAL if
 * @l3type is out of range or no handler is registered for it.
 */
int l3mdev_ifindex_lookup_by_table_id(enum l3mdev_type l3type,
				      struct net *net, u32 table_id)
{
	lookup_by_table_id_t cb;
	int ret;

	ret = l3mdev_check_type(l3type);
	if (ret)
		return ret;

	/* Result reported when the slot turns out to be empty. */
	ret = -EINVAL;

	spin_lock(&l3mdev_lock);
	cb = l3mdev_handlers[l3type].dev_lookup;
	if (cb)
		ret = cb(net, table_id);
	spin_unlock(&l3mdev_lock);

	return ret;
}
EXPORT_SYMBOL_GPL(l3mdev_ifindex_lookup_by_table_id);
104*4882a593Smuzhiyun
105*4882a593Smuzhiyun /**
106*4882a593Smuzhiyun * l3mdev_master_ifindex - get index of L3 master device
107*4882a593Smuzhiyun * @dev: targeted interface
108*4882a593Smuzhiyun */
109*4882a593Smuzhiyun
l3mdev_master_ifindex_rcu(const struct net_device * dev)110*4882a593Smuzhiyun int l3mdev_master_ifindex_rcu(const struct net_device *dev)
111*4882a593Smuzhiyun {
112*4882a593Smuzhiyun int ifindex = 0;
113*4882a593Smuzhiyun
114*4882a593Smuzhiyun if (!dev)
115*4882a593Smuzhiyun return 0;
116*4882a593Smuzhiyun
117*4882a593Smuzhiyun if (netif_is_l3_master(dev)) {
118*4882a593Smuzhiyun ifindex = dev->ifindex;
119*4882a593Smuzhiyun } else if (netif_is_l3_slave(dev)) {
120*4882a593Smuzhiyun struct net_device *master;
121*4882a593Smuzhiyun struct net_device *_dev = (struct net_device *)dev;
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun /* netdev_master_upper_dev_get_rcu calls
124*4882a593Smuzhiyun * list_first_or_null_rcu to walk the upper dev list.
125*4882a593Smuzhiyun * list_first_or_null_rcu does not handle a const arg. We aren't
126*4882a593Smuzhiyun * making changes, just want the master device from that list so
127*4882a593Smuzhiyun * typecast to remove the const
128*4882a593Smuzhiyun */
129*4882a593Smuzhiyun master = netdev_master_upper_dev_get_rcu(_dev);
130*4882a593Smuzhiyun if (master)
131*4882a593Smuzhiyun ifindex = master->ifindex;
132*4882a593Smuzhiyun }
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun return ifindex;
135*4882a593Smuzhiyun }
136*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(l3mdev_master_ifindex_rcu);
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun /**
139*4882a593Smuzhiyun * l3mdev_master_upper_ifindex_by_index - get index of upper l3 master
140*4882a593Smuzhiyun * device
141*4882a593Smuzhiyun * @net: network namespace for device index lookup
142*4882a593Smuzhiyun * @ifindex: targeted interface
143*4882a593Smuzhiyun */
l3mdev_master_upper_ifindex_by_index_rcu(struct net * net,int ifindex)144*4882a593Smuzhiyun int l3mdev_master_upper_ifindex_by_index_rcu(struct net *net, int ifindex)
145*4882a593Smuzhiyun {
146*4882a593Smuzhiyun struct net_device *dev;
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun dev = dev_get_by_index_rcu(net, ifindex);
149*4882a593Smuzhiyun while (dev && !netif_is_l3_master(dev))
150*4882a593Smuzhiyun dev = netdev_master_upper_dev_get_rcu(dev);
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun return dev ? dev->ifindex : 0;
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(l3mdev_master_upper_ifindex_by_index_rcu);
155*4882a593Smuzhiyun
156*4882a593Smuzhiyun /**
157*4882a593Smuzhiyun * l3mdev_fib_table_rcu - get FIB table id associated with an L3
158*4882a593Smuzhiyun * master interface
159*4882a593Smuzhiyun * @dev: targeted interface
160*4882a593Smuzhiyun */
161*4882a593Smuzhiyun
l3mdev_fib_table_rcu(const struct net_device * dev)162*4882a593Smuzhiyun u32 l3mdev_fib_table_rcu(const struct net_device *dev)
163*4882a593Smuzhiyun {
164*4882a593Smuzhiyun u32 tb_id = 0;
165*4882a593Smuzhiyun
166*4882a593Smuzhiyun if (!dev)
167*4882a593Smuzhiyun return 0;
168*4882a593Smuzhiyun
169*4882a593Smuzhiyun if (netif_is_l3_master(dev)) {
170*4882a593Smuzhiyun if (dev->l3mdev_ops->l3mdev_fib_table)
171*4882a593Smuzhiyun tb_id = dev->l3mdev_ops->l3mdev_fib_table(dev);
172*4882a593Smuzhiyun } else if (netif_is_l3_slave(dev)) {
173*4882a593Smuzhiyun /* Users of netdev_master_upper_dev_get_rcu need non-const,
174*4882a593Smuzhiyun * but current inet_*type functions take a const
175*4882a593Smuzhiyun */
176*4882a593Smuzhiyun struct net_device *_dev = (struct net_device *) dev;
177*4882a593Smuzhiyun const struct net_device *master;
178*4882a593Smuzhiyun
179*4882a593Smuzhiyun master = netdev_master_upper_dev_get_rcu(_dev);
180*4882a593Smuzhiyun if (master &&
181*4882a593Smuzhiyun master->l3mdev_ops->l3mdev_fib_table)
182*4882a593Smuzhiyun tb_id = master->l3mdev_ops->l3mdev_fib_table(master);
183*4882a593Smuzhiyun }
184*4882a593Smuzhiyun
185*4882a593Smuzhiyun return tb_id;
186*4882a593Smuzhiyun }
187*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(l3mdev_fib_table_rcu);
188*4882a593Smuzhiyun
l3mdev_fib_table_by_index(struct net * net,int ifindex)189*4882a593Smuzhiyun u32 l3mdev_fib_table_by_index(struct net *net, int ifindex)
190*4882a593Smuzhiyun {
191*4882a593Smuzhiyun struct net_device *dev;
192*4882a593Smuzhiyun u32 tb_id = 0;
193*4882a593Smuzhiyun
194*4882a593Smuzhiyun if (!ifindex)
195*4882a593Smuzhiyun return 0;
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun rcu_read_lock();
198*4882a593Smuzhiyun
199*4882a593Smuzhiyun dev = dev_get_by_index_rcu(net, ifindex);
200*4882a593Smuzhiyun if (dev)
201*4882a593Smuzhiyun tb_id = l3mdev_fib_table_rcu(dev);
202*4882a593Smuzhiyun
203*4882a593Smuzhiyun rcu_read_unlock();
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun return tb_id;
206*4882a593Smuzhiyun }
207*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(l3mdev_fib_table_by_index);
208*4882a593Smuzhiyun
209*4882a593Smuzhiyun /**
210*4882a593Smuzhiyun * l3mdev_link_scope_lookup - IPv6 route lookup based on flow for link
211*4882a593Smuzhiyun * local and multicast addresses
212*4882a593Smuzhiyun * @net: network namespace for device index lookup
213*4882a593Smuzhiyun * @fl6: IPv6 flow struct for lookup
214*4882a593Smuzhiyun * This function does not hold refcnt on the returned dst.
215*4882a593Smuzhiyun * Caller must hold rcu_read_lock().
216*4882a593Smuzhiyun */
217*4882a593Smuzhiyun
l3mdev_link_scope_lookup(struct net * net,struct flowi6 * fl6)218*4882a593Smuzhiyun struct dst_entry *l3mdev_link_scope_lookup(struct net *net,
219*4882a593Smuzhiyun struct flowi6 *fl6)
220*4882a593Smuzhiyun {
221*4882a593Smuzhiyun struct dst_entry *dst = NULL;
222*4882a593Smuzhiyun struct net_device *dev;
223*4882a593Smuzhiyun
224*4882a593Smuzhiyun WARN_ON_ONCE(!rcu_read_lock_held());
225*4882a593Smuzhiyun if (fl6->flowi6_oif) {
226*4882a593Smuzhiyun dev = dev_get_by_index_rcu(net, fl6->flowi6_oif);
227*4882a593Smuzhiyun if (dev && netif_is_l3_slave(dev))
228*4882a593Smuzhiyun dev = netdev_master_upper_dev_get_rcu(dev);
229*4882a593Smuzhiyun
230*4882a593Smuzhiyun if (dev && netif_is_l3_master(dev) &&
231*4882a593Smuzhiyun dev->l3mdev_ops->l3mdev_link_scope_lookup)
232*4882a593Smuzhiyun dst = dev->l3mdev_ops->l3mdev_link_scope_lookup(dev, fl6);
233*4882a593Smuzhiyun }
234*4882a593Smuzhiyun
235*4882a593Smuzhiyun return dst;
236*4882a593Smuzhiyun }
237*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(l3mdev_link_scope_lookup);
238*4882a593Smuzhiyun
239*4882a593Smuzhiyun /**
240*4882a593Smuzhiyun * l3mdev_fib_rule_match - Determine if flowi references an
241*4882a593Smuzhiyun * L3 master device
242*4882a593Smuzhiyun * @net: network namespace for device index lookup
243*4882a593Smuzhiyun * @fl: flow struct
244*4882a593Smuzhiyun */
245*4882a593Smuzhiyun
l3mdev_fib_rule_match(struct net * net,struct flowi * fl,struct fib_lookup_arg * arg)246*4882a593Smuzhiyun int l3mdev_fib_rule_match(struct net *net, struct flowi *fl,
247*4882a593Smuzhiyun struct fib_lookup_arg *arg)
248*4882a593Smuzhiyun {
249*4882a593Smuzhiyun struct net_device *dev;
250*4882a593Smuzhiyun int rc = 0;
251*4882a593Smuzhiyun
252*4882a593Smuzhiyun rcu_read_lock();
253*4882a593Smuzhiyun
254*4882a593Smuzhiyun dev = dev_get_by_index_rcu(net, fl->flowi_oif);
255*4882a593Smuzhiyun if (dev && netif_is_l3_master(dev) &&
256*4882a593Smuzhiyun dev->l3mdev_ops->l3mdev_fib_table) {
257*4882a593Smuzhiyun arg->table = dev->l3mdev_ops->l3mdev_fib_table(dev);
258*4882a593Smuzhiyun rc = 1;
259*4882a593Smuzhiyun goto out;
260*4882a593Smuzhiyun }
261*4882a593Smuzhiyun
262*4882a593Smuzhiyun dev = dev_get_by_index_rcu(net, fl->flowi_iif);
263*4882a593Smuzhiyun if (dev && netif_is_l3_master(dev) &&
264*4882a593Smuzhiyun dev->l3mdev_ops->l3mdev_fib_table) {
265*4882a593Smuzhiyun arg->table = dev->l3mdev_ops->l3mdev_fib_table(dev);
266*4882a593Smuzhiyun rc = 1;
267*4882a593Smuzhiyun goto out;
268*4882a593Smuzhiyun }
269*4882a593Smuzhiyun
270*4882a593Smuzhiyun out:
271*4882a593Smuzhiyun rcu_read_unlock();
272*4882a593Smuzhiyun
273*4882a593Smuzhiyun return rc;
274*4882a593Smuzhiyun }
275*4882a593Smuzhiyun
l3mdev_update_flow(struct net * net,struct flowi * fl)276*4882a593Smuzhiyun void l3mdev_update_flow(struct net *net, struct flowi *fl)
277*4882a593Smuzhiyun {
278*4882a593Smuzhiyun struct net_device *dev;
279*4882a593Smuzhiyun int ifindex;
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun rcu_read_lock();
282*4882a593Smuzhiyun
283*4882a593Smuzhiyun if (fl->flowi_oif) {
284*4882a593Smuzhiyun dev = dev_get_by_index_rcu(net, fl->flowi_oif);
285*4882a593Smuzhiyun if (dev) {
286*4882a593Smuzhiyun ifindex = l3mdev_master_ifindex_rcu(dev);
287*4882a593Smuzhiyun if (ifindex) {
288*4882a593Smuzhiyun fl->flowi_oif = ifindex;
289*4882a593Smuzhiyun fl->flowi_flags |= FLOWI_FLAG_SKIP_NH_OIF;
290*4882a593Smuzhiyun goto out;
291*4882a593Smuzhiyun }
292*4882a593Smuzhiyun }
293*4882a593Smuzhiyun }
294*4882a593Smuzhiyun
295*4882a593Smuzhiyun if (fl->flowi_iif) {
296*4882a593Smuzhiyun dev = dev_get_by_index_rcu(net, fl->flowi_iif);
297*4882a593Smuzhiyun if (dev) {
298*4882a593Smuzhiyun ifindex = l3mdev_master_ifindex_rcu(dev);
299*4882a593Smuzhiyun if (ifindex) {
300*4882a593Smuzhiyun fl->flowi_iif = ifindex;
301*4882a593Smuzhiyun fl->flowi_flags |= FLOWI_FLAG_SKIP_NH_OIF;
302*4882a593Smuzhiyun }
303*4882a593Smuzhiyun }
304*4882a593Smuzhiyun }
305*4882a593Smuzhiyun
306*4882a593Smuzhiyun out:
307*4882a593Smuzhiyun rcu_read_unlock();
308*4882a593Smuzhiyun }
309*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(l3mdev_update_flow);
310