1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Forwarding decision
4*4882a593Smuzhiyun * Linux ethernet bridge
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * Authors:
7*4882a593Smuzhiyun * Lennert Buytenhek <buytenh@gnu.org>
8*4882a593Smuzhiyun */
9*4882a593Smuzhiyun
10*4882a593Smuzhiyun #include <linux/err.h>
11*4882a593Smuzhiyun #include <linux/slab.h>
12*4882a593Smuzhiyun #include <linux/kernel.h>
13*4882a593Smuzhiyun #include <linux/netdevice.h>
14*4882a593Smuzhiyun #include <linux/netpoll.h>
15*4882a593Smuzhiyun #include <linux/skbuff.h>
16*4882a593Smuzhiyun #include <linux/if_vlan.h>
17*4882a593Smuzhiyun #include <linux/netfilter_bridge.h>
18*4882a593Smuzhiyun #include "br_private.h"
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun /* Don't forward packets to originating port or forwarding disabled */
should_deliver(const struct net_bridge_port * p,const struct sk_buff * skb)21*4882a593Smuzhiyun static inline int should_deliver(const struct net_bridge_port *p,
22*4882a593Smuzhiyun const struct sk_buff *skb)
23*4882a593Smuzhiyun {
24*4882a593Smuzhiyun struct net_bridge_vlan_group *vg;
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun vg = nbp_vlan_group_rcu(p);
27*4882a593Smuzhiyun return ((p->flags & BR_HAIRPIN_MODE) || skb->dev != p->dev) &&
28*4882a593Smuzhiyun p->state == BR_STATE_FORWARDING && br_allowed_egress(vg, skb) &&
29*4882a593Smuzhiyun nbp_switchdev_allowed_egress(p, skb) &&
30*4882a593Smuzhiyun !br_skb_isolated(p, skb);
31*4882a593Smuzhiyun }
32*4882a593Smuzhiyun
br_dev_queue_push_xmit(struct net * net,struct sock * sk,struct sk_buff * skb)33*4882a593Smuzhiyun int br_dev_queue_push_xmit(struct net *net, struct sock *sk, struct sk_buff *skb)
34*4882a593Smuzhiyun {
35*4882a593Smuzhiyun skb_push(skb, ETH_HLEN);
36*4882a593Smuzhiyun if (!is_skb_forwardable(skb->dev, skb))
37*4882a593Smuzhiyun goto drop;
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun br_drop_fake_rtable(skb);
40*4882a593Smuzhiyun
41*4882a593Smuzhiyun if (skb->ip_summed == CHECKSUM_PARTIAL &&
42*4882a593Smuzhiyun (skb->protocol == htons(ETH_P_8021Q) ||
43*4882a593Smuzhiyun skb->protocol == htons(ETH_P_8021AD))) {
44*4882a593Smuzhiyun int depth;
45*4882a593Smuzhiyun
46*4882a593Smuzhiyun if (!__vlan_get_protocol(skb, skb->protocol, &depth))
47*4882a593Smuzhiyun goto drop;
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun skb_set_network_header(skb, depth);
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun
52*4882a593Smuzhiyun dev_queue_xmit(skb);
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun return 0;
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun drop:
57*4882a593Smuzhiyun kfree_skb(skb);
58*4882a593Smuzhiyun return 0;
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(br_dev_queue_push_xmit);
61*4882a593Smuzhiyun
br_forward_finish(struct net * net,struct sock * sk,struct sk_buff * skb)62*4882a593Smuzhiyun int br_forward_finish(struct net *net, struct sock *sk, struct sk_buff *skb)
63*4882a593Smuzhiyun {
64*4882a593Smuzhiyun skb->tstamp = 0;
65*4882a593Smuzhiyun return NF_HOOK(NFPROTO_BRIDGE, NF_BR_POST_ROUTING,
66*4882a593Smuzhiyun net, sk, skb, NULL, skb->dev,
67*4882a593Smuzhiyun br_dev_queue_push_xmit);
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun }
70*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(br_forward_finish);
71*4882a593Smuzhiyun
/*
 * Send @skb out of port @to without any further eligibility checks.
 *
 * The frame first goes through br_handle_vlan(); if that returns NULL
 * there is nothing left to send. skb->dev is then switched to the port's
 * device and the frame is handed to a bridge netfilter hook:
 *
 *  - @local_orig set: NF_BR_LOCAL_OUT with no input device. If netpoll
 *    transmission is running on the bridge device the hook is bypassed
 *    and the frame is sent through br_netpoll_send_skb() (or freed when
 *    is_skb_forwardable() rejects it).
 *  - @local_orig clear: NF_BR_FORWARD with the previous skb->dev as the
 *    input device. Frames flagged by skb_warn_if_lro() are freed.
 *
 * In both hook cases br_forward_finish() is passed to NF_HOOK().
 */
static void __br_forward(const struct net_bridge_port *to,
			 struct sk_buff *skb, bool local_orig)
{
	struct net_bridge_vlan_group *vlan_grp;
	struct net_device *in_dev;
	struct net *netns;
	int hook;

	vlan_grp = nbp_vlan_group_rcu(to);
	skb = br_handle_vlan(to->br, to, vlan_grp, skb);
	if (!skb)
		return;

	/* remember where the frame came from before retargeting it */
	in_dev = skb->dev;
	skb->dev = to->dev;

	if (local_orig) {
		if (unlikely(netpoll_tx_running(to->br->dev))) {
			skb_push(skb, ETH_HLEN);
			if (is_skb_forwardable(skb->dev, skb))
				br_netpoll_send_skb(to, skb);
			else
				kfree_skb(skb);
			return;
		}

		hook = NF_BR_LOCAL_OUT;
		netns = dev_net(skb->dev);
		in_dev = NULL;
	} else {
		if (skb_warn_if_lro(skb)) {
			kfree_skb(skb);
			return;
		}

		hook = NF_BR_FORWARD;
		skb_forward_csum(skb);
		netns = dev_net(in_dev);
	}

	NF_HOOK(NFPROTO_BRIDGE, hook, netns, NULL, skb, in_dev, skb->dev,
		br_forward_finish);
}
113*4882a593Smuzhiyun
/*
 * Forward a clone of @skb through port @prev, leaving @skb itself with
 * the caller.
 *
 * Returns 0 once the clone has been passed to __br_forward(). If the
 * GFP_ATOMIC clone fails, tx_dropped is incremented on the bridge device
 * recorded in the skb control block and -ENOMEM is returned.
 */
static int deliver_clone(const struct net_bridge_port *prev,
			 struct sk_buff *skb, bool local_orig)
{
	struct net_device *brdev = BR_INPUT_SKB_CB(skb)->brdev;
	struct sk_buff *clone = skb_clone(skb, GFP_ATOMIC);

	if (clone) {
		__br_forward(prev, clone, local_orig);
		return 0;
	}

	brdev->stats.tx_dropped++;
	return -ENOMEM;
}
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun /**
130*4882a593Smuzhiyun * br_forward - forward a packet to a specific port
131*4882a593Smuzhiyun * @to: destination port
132*4882a593Smuzhiyun * @skb: packet being forwarded
133*4882a593Smuzhiyun * @local_rcv: packet will be received locally after forwarding
134*4882a593Smuzhiyun * @local_orig: packet is locally originated
135*4882a593Smuzhiyun *
136*4882a593Smuzhiyun * Should be called with rcu_read_lock.
137*4882a593Smuzhiyun */
br_forward(const struct net_bridge_port * to,struct sk_buff * skb,bool local_rcv,bool local_orig)138*4882a593Smuzhiyun void br_forward(const struct net_bridge_port *to,
139*4882a593Smuzhiyun struct sk_buff *skb, bool local_rcv, bool local_orig)
140*4882a593Smuzhiyun {
141*4882a593Smuzhiyun if (unlikely(!to))
142*4882a593Smuzhiyun goto out;
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun /* redirect to backup link if the destination port is down */
145*4882a593Smuzhiyun if (rcu_access_pointer(to->backup_port) && !netif_carrier_ok(to->dev)) {
146*4882a593Smuzhiyun struct net_bridge_port *backup_port;
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun backup_port = rcu_dereference(to->backup_port);
149*4882a593Smuzhiyun if (unlikely(!backup_port))
150*4882a593Smuzhiyun goto out;
151*4882a593Smuzhiyun to = backup_port;
152*4882a593Smuzhiyun }
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun if (should_deliver(to, skb)) {
155*4882a593Smuzhiyun if (local_rcv)
156*4882a593Smuzhiyun deliver_clone(to, skb, local_orig);
157*4882a593Smuzhiyun else
158*4882a593Smuzhiyun __br_forward(to, skb, local_orig);
159*4882a593Smuzhiyun return;
160*4882a593Smuzhiyun }
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun out:
163*4882a593Smuzhiyun if (!local_rcv)
164*4882a593Smuzhiyun kfree_skb(skb);
165*4882a593Smuzhiyun }
166*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(br_forward);
167*4882a593Smuzhiyun
/*
 * One step of the "deliver to the previous port, remember the current
 * one" scheme used by the flooding loops.
 *
 * If @p fails should_deliver(), nothing happens and @prev is returned
 * unchanged. Otherwise a clone of @skb is sent to @prev (when @prev is
 * not NULL), a TX multicast counter update is recorded for @p, and @p is
 * returned so the caller can pass it back as the next @prev.
 *
 * Returns an ERR_PTR() carrying the deliver_clone() error if cloning for
 * @prev fails; no counter update is made for @p in that case.
 */
static struct net_bridge_port *maybe_deliver(
	struct net_bridge_port *prev, struct net_bridge_port *p,
	struct sk_buff *skb, bool local_orig)
{
	u8 igmp_type = br_multicast_igmp_type(skb);

	if (!should_deliver(p, skb))
		return prev;

	if (prev) {
		int rc = deliver_clone(prev, skb, local_orig);

		if (rc)
			return ERR_PTR(rc);
	}

	br_multicast_count(p->br, p, skb, igmp_type, BR_MCAST_DIR_TX);
	return p;
}
189*4882a593Smuzhiyun
190*4882a593Smuzhiyun /* called under rcu_read_lock */
br_flood(struct net_bridge * br,struct sk_buff * skb,enum br_pkt_type pkt_type,bool local_rcv,bool local_orig)191*4882a593Smuzhiyun void br_flood(struct net_bridge *br, struct sk_buff *skb,
192*4882a593Smuzhiyun enum br_pkt_type pkt_type, bool local_rcv, bool local_orig)
193*4882a593Smuzhiyun {
194*4882a593Smuzhiyun struct net_bridge_port *prev = NULL;
195*4882a593Smuzhiyun struct net_bridge_port *p;
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun list_for_each_entry_rcu(p, &br->port_list, list) {
198*4882a593Smuzhiyun /* Do not flood unicast traffic to ports that turn it off, nor
199*4882a593Smuzhiyun * other traffic if flood off, except for traffic we originate
200*4882a593Smuzhiyun */
201*4882a593Smuzhiyun switch (pkt_type) {
202*4882a593Smuzhiyun case BR_PKT_UNICAST:
203*4882a593Smuzhiyun if (!(p->flags & BR_FLOOD))
204*4882a593Smuzhiyun continue;
205*4882a593Smuzhiyun break;
206*4882a593Smuzhiyun case BR_PKT_MULTICAST:
207*4882a593Smuzhiyun if (!(p->flags & BR_MCAST_FLOOD) && skb->dev != br->dev)
208*4882a593Smuzhiyun continue;
209*4882a593Smuzhiyun break;
210*4882a593Smuzhiyun case BR_PKT_BROADCAST:
211*4882a593Smuzhiyun if (!(p->flags & BR_BCAST_FLOOD) && skb->dev != br->dev)
212*4882a593Smuzhiyun continue;
213*4882a593Smuzhiyun break;
214*4882a593Smuzhiyun }
215*4882a593Smuzhiyun
216*4882a593Smuzhiyun /* Do not flood to ports that enable proxy ARP */
217*4882a593Smuzhiyun if (p->flags & BR_PROXYARP)
218*4882a593Smuzhiyun continue;
219*4882a593Smuzhiyun if ((p->flags & (BR_PROXYARP_WIFI | BR_NEIGH_SUPPRESS)) &&
220*4882a593Smuzhiyun BR_INPUT_SKB_CB(skb)->proxyarp_replied)
221*4882a593Smuzhiyun continue;
222*4882a593Smuzhiyun
223*4882a593Smuzhiyun prev = maybe_deliver(prev, p, skb, local_orig);
224*4882a593Smuzhiyun if (IS_ERR(prev))
225*4882a593Smuzhiyun goto out;
226*4882a593Smuzhiyun }
227*4882a593Smuzhiyun
228*4882a593Smuzhiyun if (!prev)
229*4882a593Smuzhiyun goto out;
230*4882a593Smuzhiyun
231*4882a593Smuzhiyun if (local_rcv)
232*4882a593Smuzhiyun deliver_clone(prev, skb, local_orig);
233*4882a593Smuzhiyun else
234*4882a593Smuzhiyun __br_forward(prev, skb, local_orig);
235*4882a593Smuzhiyun return;
236*4882a593Smuzhiyun
237*4882a593Smuzhiyun out:
238*4882a593Smuzhiyun if (!local_rcv)
239*4882a593Smuzhiyun kfree_skb(skb);
240*4882a593Smuzhiyun }
241*4882a593Smuzhiyun
242*4882a593Smuzhiyun #ifdef CONFIG_BRIDGE_IGMP_SNOOPING
/*
 * Send a private copy of @skb to port @p, addressed to @addr.
 *
 * Nothing is sent when should_deliver() rejects the port, or when the
 * frame is attached to @p's own device and its Ethernet source address
 * equals @addr. The destination MAC of the copy is overwritten with
 * @addr unless @addr is the broadcast address. @skb itself is left
 * untouched.
 *
 * If the GFP_ATOMIC copy fails, tx_dropped is incremented on the bridge
 * device recorded in the skb control block.
 */
static void maybe_deliver_addr(struct net_bridge_port *p, struct sk_buff *skb,
			       const unsigned char *addr, bool local_orig)
{
	struct net_device *brdev = BR_INPUT_SKB_CB(skb)->brdev;
	struct sk_buff *copy;

	if (!should_deliver(p, skb))
		return;

	/* Even with hairpin, never echo a host's own frame back to it;
	 * doing so would break IPv6 DAD.
	 */
	if (skb->dev == p->dev &&
	    ether_addr_equal(eth_hdr(skb)->h_source, addr))
		return;

	copy = skb_copy(skb, GFP_ATOMIC);
	if (!copy) {
		brdev->stats.tx_dropped++;
		return;
	}

	if (!is_broadcast_ether_addr(addr))
		memcpy(eth_hdr(copy)->h_dest, addr, ETH_ALEN);

	__br_forward(p, copy, local_orig);
}
267*4882a593Smuzhiyun
268*4882a593Smuzhiyun /* called with rcu_read_lock */
br_multicast_flood(struct net_bridge_mdb_entry * mdst,struct sk_buff * skb,bool local_rcv,bool local_orig)269*4882a593Smuzhiyun void br_multicast_flood(struct net_bridge_mdb_entry *mdst,
270*4882a593Smuzhiyun struct sk_buff *skb,
271*4882a593Smuzhiyun bool local_rcv, bool local_orig)
272*4882a593Smuzhiyun {
273*4882a593Smuzhiyun struct net_device *dev = BR_INPUT_SKB_CB(skb)->brdev;
274*4882a593Smuzhiyun struct net_bridge *br = netdev_priv(dev);
275*4882a593Smuzhiyun struct net_bridge_port *prev = NULL;
276*4882a593Smuzhiyun struct net_bridge_port_group *p;
277*4882a593Smuzhiyun bool allow_mode_include = true;
278*4882a593Smuzhiyun struct hlist_node *rp;
279*4882a593Smuzhiyun
280*4882a593Smuzhiyun rp = rcu_dereference(hlist_first_rcu(&br->router_list));
281*4882a593Smuzhiyun if (mdst) {
282*4882a593Smuzhiyun p = rcu_dereference(mdst->ports);
283*4882a593Smuzhiyun if (br_multicast_should_handle_mode(br, mdst->addr.proto) &&
284*4882a593Smuzhiyun br_multicast_is_star_g(&mdst->addr))
285*4882a593Smuzhiyun allow_mode_include = false;
286*4882a593Smuzhiyun } else {
287*4882a593Smuzhiyun p = NULL;
288*4882a593Smuzhiyun }
289*4882a593Smuzhiyun
290*4882a593Smuzhiyun while (p || rp) {
291*4882a593Smuzhiyun struct net_bridge_port *port, *lport, *rport;
292*4882a593Smuzhiyun
293*4882a593Smuzhiyun lport = p ? p->key.port : NULL;
294*4882a593Smuzhiyun rport = hlist_entry_safe(rp, struct net_bridge_port, rlist);
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun if ((unsigned long)lport > (unsigned long)rport) {
297*4882a593Smuzhiyun port = lport;
298*4882a593Smuzhiyun
299*4882a593Smuzhiyun if (port->flags & BR_MULTICAST_TO_UNICAST) {
300*4882a593Smuzhiyun maybe_deliver_addr(lport, skb, p->eth_addr,
301*4882a593Smuzhiyun local_orig);
302*4882a593Smuzhiyun goto delivered;
303*4882a593Smuzhiyun }
304*4882a593Smuzhiyun if ((!allow_mode_include &&
305*4882a593Smuzhiyun p->filter_mode == MCAST_INCLUDE) ||
306*4882a593Smuzhiyun (p->flags & MDB_PG_FLAGS_BLOCKED))
307*4882a593Smuzhiyun goto delivered;
308*4882a593Smuzhiyun } else {
309*4882a593Smuzhiyun port = rport;
310*4882a593Smuzhiyun }
311*4882a593Smuzhiyun
312*4882a593Smuzhiyun prev = maybe_deliver(prev, port, skb, local_orig);
313*4882a593Smuzhiyun if (IS_ERR(prev))
314*4882a593Smuzhiyun goto out;
315*4882a593Smuzhiyun delivered:
316*4882a593Smuzhiyun if ((unsigned long)lport >= (unsigned long)port)
317*4882a593Smuzhiyun p = rcu_dereference(p->next);
318*4882a593Smuzhiyun if ((unsigned long)rport >= (unsigned long)port)
319*4882a593Smuzhiyun rp = rcu_dereference(hlist_next_rcu(rp));
320*4882a593Smuzhiyun }
321*4882a593Smuzhiyun
322*4882a593Smuzhiyun if (!prev)
323*4882a593Smuzhiyun goto out;
324*4882a593Smuzhiyun
325*4882a593Smuzhiyun if (local_rcv)
326*4882a593Smuzhiyun deliver_clone(prev, skb, local_orig);
327*4882a593Smuzhiyun else
328*4882a593Smuzhiyun __br_forward(prev, skb, local_orig);
329*4882a593Smuzhiyun return;
330*4882a593Smuzhiyun
331*4882a593Smuzhiyun out:
332*4882a593Smuzhiyun if (!local_rcv)
333*4882a593Smuzhiyun kfree_skb(skb);
334*4882a593Smuzhiyun }
335*4882a593Smuzhiyun #endif
336