1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Linux network device link state notification
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Author:
6*4882a593Smuzhiyun * Stefan Rompf <sux@loplof.de>
7*4882a593Smuzhiyun */
8*4882a593Smuzhiyun
9*4882a593Smuzhiyun #include <linux/module.h>
10*4882a593Smuzhiyun #include <linux/netdevice.h>
11*4882a593Smuzhiyun #include <linux/if.h>
12*4882a593Smuzhiyun #include <net/sock.h>
13*4882a593Smuzhiyun #include <net/pkt_sched.h>
14*4882a593Smuzhiyun #include <linux/rtnetlink.h>
15*4882a593Smuzhiyun #include <linux/jiffies.h>
16*4882a593Smuzhiyun #include <linux/spinlock.h>
17*4882a593Smuzhiyun #include <linux/workqueue.h>
18*4882a593Smuzhiyun #include <linux/bitops.h>
19*4882a593Smuzhiyun #include <linux/types.h>
20*4882a593Smuzhiyun
21*4882a593Smuzhiyun
/* Bit indices used with the bitops helpers on linkwatch_flags. */
enum lw_bits {
	/*
	 * Tested and set in linkwatch_schedule_work(), cleared at the
	 * start of every __linkwatch_run_queue() pass.
	 */
	LW_URGENT = 0,
};
25*4882a593Smuzhiyun
/* Flag word for the link watcher; bit indices come from enum lw_bits. */
static unsigned long linkwatch_flags;
/* Jiffies value used to rate-limit non-urgent runs of the event queue. */
static unsigned long linkwatch_nextevent;

/* Work handler; defined further down, declared here for the work item. */
static void linkwatch_event(struct work_struct *dummy);
static DECLARE_DELAYED_WORK(linkwatch_work, linkwatch_event);

/* Devices with a queued link event, chained via dev->link_watch_list. */
static LIST_HEAD(lweventlist);
/* Taken around every access to lweventlist in this file. */
static DEFINE_SPINLOCK(lweventlist_lock);
34*4882a593Smuzhiyun
default_operstate(const struct net_device * dev)35*4882a593Smuzhiyun static unsigned char default_operstate(const struct net_device *dev)
36*4882a593Smuzhiyun {
37*4882a593Smuzhiyun if (netif_testing(dev))
38*4882a593Smuzhiyun return IF_OPER_TESTING;
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun if (!netif_carrier_ok(dev))
41*4882a593Smuzhiyun return (dev->ifindex != dev_get_iflink(dev) ?
42*4882a593Smuzhiyun IF_OPER_LOWERLAYERDOWN : IF_OPER_DOWN);
43*4882a593Smuzhiyun
44*4882a593Smuzhiyun if (netif_dormant(dev))
45*4882a593Smuzhiyun return IF_OPER_DORMANT;
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun return IF_OPER_UP;
48*4882a593Smuzhiyun }
49*4882a593Smuzhiyun
50*4882a593Smuzhiyun
rfc2863_policy(struct net_device * dev)51*4882a593Smuzhiyun static void rfc2863_policy(struct net_device *dev)
52*4882a593Smuzhiyun {
53*4882a593Smuzhiyun unsigned char operstate = default_operstate(dev);
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun if (operstate == dev->operstate)
56*4882a593Smuzhiyun return;
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun write_lock_bh(&dev_base_lock);
59*4882a593Smuzhiyun
60*4882a593Smuzhiyun switch(dev->link_mode) {
61*4882a593Smuzhiyun case IF_LINK_MODE_TESTING:
62*4882a593Smuzhiyun if (operstate == IF_OPER_UP)
63*4882a593Smuzhiyun operstate = IF_OPER_TESTING;
64*4882a593Smuzhiyun break;
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun case IF_LINK_MODE_DORMANT:
67*4882a593Smuzhiyun if (operstate == IF_OPER_UP)
68*4882a593Smuzhiyun operstate = IF_OPER_DORMANT;
69*4882a593Smuzhiyun break;
70*4882a593Smuzhiyun case IF_LINK_MODE_DEFAULT:
71*4882a593Smuzhiyun default:
72*4882a593Smuzhiyun break;
73*4882a593Smuzhiyun }
74*4882a593Smuzhiyun
75*4882a593Smuzhiyun dev->operstate = operstate;
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun write_unlock_bh(&dev_base_lock);
78*4882a593Smuzhiyun }
79*4882a593Smuzhiyun
80*4882a593Smuzhiyun
/*
 * Handle pre-registration link state changes: apply rfc2863_policy()
 * to @dev unless it has carrier and is neither dormant nor testing.
 */
void linkwatch_init_dev(struct net_device *dev)
{
	if (netif_carrier_ok(dev) && !netif_dormant(dev) &&
	    !netif_testing(dev))
		return;

	rfc2863_policy(dev);
}
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun
linkwatch_urgent_event(struct net_device * dev)90*4882a593Smuzhiyun static bool linkwatch_urgent_event(struct net_device *dev)
91*4882a593Smuzhiyun {
92*4882a593Smuzhiyun if (!netif_running(dev))
93*4882a593Smuzhiyun return false;
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun if (dev->ifindex != dev_get_iflink(dev))
96*4882a593Smuzhiyun return true;
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun if (netif_is_lag_port(dev) || netif_is_lag_master(dev))
99*4882a593Smuzhiyun return true;
100*4882a593Smuzhiyun
101*4882a593Smuzhiyun return netif_carrier_ok(dev) && qdisc_tx_changing(dev);
102*4882a593Smuzhiyun }
103*4882a593Smuzhiyun
104*4882a593Smuzhiyun
linkwatch_add_event(struct net_device * dev)105*4882a593Smuzhiyun static void linkwatch_add_event(struct net_device *dev)
106*4882a593Smuzhiyun {
107*4882a593Smuzhiyun unsigned long flags;
108*4882a593Smuzhiyun
109*4882a593Smuzhiyun spin_lock_irqsave(&lweventlist_lock, flags);
110*4882a593Smuzhiyun if (list_empty(&dev->link_watch_list)) {
111*4882a593Smuzhiyun list_add_tail(&dev->link_watch_list, &lweventlist);
112*4882a593Smuzhiyun dev_hold(dev);
113*4882a593Smuzhiyun }
114*4882a593Smuzhiyun spin_unlock_irqrestore(&lweventlist_lock, flags);
115*4882a593Smuzhiyun }
116*4882a593Smuzhiyun
117*4882a593Smuzhiyun
linkwatch_schedule_work(int urgent)118*4882a593Smuzhiyun static void linkwatch_schedule_work(int urgent)
119*4882a593Smuzhiyun {
120*4882a593Smuzhiyun unsigned long delay = linkwatch_nextevent - jiffies;
121*4882a593Smuzhiyun
122*4882a593Smuzhiyun if (test_bit(LW_URGENT, &linkwatch_flags))
123*4882a593Smuzhiyun return;
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun /* Minimise down-time: drop delay for up event. */
126*4882a593Smuzhiyun if (urgent) {
127*4882a593Smuzhiyun if (test_and_set_bit(LW_URGENT, &linkwatch_flags))
128*4882a593Smuzhiyun return;
129*4882a593Smuzhiyun delay = 0;
130*4882a593Smuzhiyun }
131*4882a593Smuzhiyun
132*4882a593Smuzhiyun /* If we wrap around we'll delay it by at most HZ. */
133*4882a593Smuzhiyun if (delay > HZ)
134*4882a593Smuzhiyun delay = 0;
135*4882a593Smuzhiyun
136*4882a593Smuzhiyun /*
137*4882a593Smuzhiyun * If urgent, schedule immediate execution; otherwise, don't
138*4882a593Smuzhiyun * override the existing timer.
139*4882a593Smuzhiyun */
140*4882a593Smuzhiyun if (test_bit(LW_URGENT, &linkwatch_flags))
141*4882a593Smuzhiyun mod_delayed_work(system_wq, &linkwatch_work, 0);
142*4882a593Smuzhiyun else
143*4882a593Smuzhiyun schedule_delayed_work(&linkwatch_work, delay);
144*4882a593Smuzhiyun }
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun
linkwatch_do_dev(struct net_device * dev)147*4882a593Smuzhiyun static void linkwatch_do_dev(struct net_device *dev)
148*4882a593Smuzhiyun {
149*4882a593Smuzhiyun /*
150*4882a593Smuzhiyun * Make sure the above read is complete since it can be
151*4882a593Smuzhiyun * rewritten as soon as we clear the bit below.
152*4882a593Smuzhiyun */
153*4882a593Smuzhiyun smp_mb__before_atomic();
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun /* We are about to handle this device,
156*4882a593Smuzhiyun * so new events can be accepted
157*4882a593Smuzhiyun */
158*4882a593Smuzhiyun clear_bit(__LINK_STATE_LINKWATCH_PENDING, &dev->state);
159*4882a593Smuzhiyun
160*4882a593Smuzhiyun rfc2863_policy(dev);
161*4882a593Smuzhiyun if (dev->flags & IFF_UP) {
162*4882a593Smuzhiyun if (netif_carrier_ok(dev))
163*4882a593Smuzhiyun dev_activate(dev);
164*4882a593Smuzhiyun else
165*4882a593Smuzhiyun dev_deactivate(dev);
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun netdev_state_change(dev);
168*4882a593Smuzhiyun }
169*4882a593Smuzhiyun dev_put(dev);
170*4882a593Smuzhiyun }
171*4882a593Smuzhiyun
__linkwatch_run_queue(int urgent_only)172*4882a593Smuzhiyun static void __linkwatch_run_queue(int urgent_only)
173*4882a593Smuzhiyun {
174*4882a593Smuzhiyun #define MAX_DO_DEV_PER_LOOP 100
175*4882a593Smuzhiyun
176*4882a593Smuzhiyun int do_dev = MAX_DO_DEV_PER_LOOP;
177*4882a593Smuzhiyun struct net_device *dev;
178*4882a593Smuzhiyun LIST_HEAD(wrk);
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun /* Give urgent case more budget */
181*4882a593Smuzhiyun if (urgent_only)
182*4882a593Smuzhiyun do_dev += MAX_DO_DEV_PER_LOOP;
183*4882a593Smuzhiyun
184*4882a593Smuzhiyun /*
185*4882a593Smuzhiyun * Limit the number of linkwatch events to one
186*4882a593Smuzhiyun * per second so that a runaway driver does not
187*4882a593Smuzhiyun * cause a storm of messages on the netlink
188*4882a593Smuzhiyun * socket. This limit does not apply to up events
189*4882a593Smuzhiyun * while the device qdisc is down.
190*4882a593Smuzhiyun */
191*4882a593Smuzhiyun if (!urgent_only)
192*4882a593Smuzhiyun linkwatch_nextevent = jiffies + HZ;
193*4882a593Smuzhiyun /* Limit wrap-around effect on delay. */
194*4882a593Smuzhiyun else if (time_after(linkwatch_nextevent, jiffies + HZ))
195*4882a593Smuzhiyun linkwatch_nextevent = jiffies;
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun clear_bit(LW_URGENT, &linkwatch_flags);
198*4882a593Smuzhiyun
199*4882a593Smuzhiyun spin_lock_irq(&lweventlist_lock);
200*4882a593Smuzhiyun list_splice_init(&lweventlist, &wrk);
201*4882a593Smuzhiyun
202*4882a593Smuzhiyun while (!list_empty(&wrk) && do_dev > 0) {
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun dev = list_first_entry(&wrk, struct net_device, link_watch_list);
205*4882a593Smuzhiyun list_del_init(&dev->link_watch_list);
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun if (!netif_device_present(dev) ||
208*4882a593Smuzhiyun (urgent_only && !linkwatch_urgent_event(dev))) {
209*4882a593Smuzhiyun list_add_tail(&dev->link_watch_list, &lweventlist);
210*4882a593Smuzhiyun continue;
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun spin_unlock_irq(&lweventlist_lock);
213*4882a593Smuzhiyun linkwatch_do_dev(dev);
214*4882a593Smuzhiyun do_dev--;
215*4882a593Smuzhiyun spin_lock_irq(&lweventlist_lock);
216*4882a593Smuzhiyun }
217*4882a593Smuzhiyun
218*4882a593Smuzhiyun /* Add the remaining work back to lweventlist */
219*4882a593Smuzhiyun list_splice_init(&wrk, &lweventlist);
220*4882a593Smuzhiyun
221*4882a593Smuzhiyun if (!list_empty(&lweventlist))
222*4882a593Smuzhiyun linkwatch_schedule_work(0);
223*4882a593Smuzhiyun spin_unlock_irq(&lweventlist_lock);
224*4882a593Smuzhiyun }
225*4882a593Smuzhiyun
linkwatch_forget_dev(struct net_device * dev)226*4882a593Smuzhiyun void linkwatch_forget_dev(struct net_device *dev)
227*4882a593Smuzhiyun {
228*4882a593Smuzhiyun unsigned long flags;
229*4882a593Smuzhiyun int clean = 0;
230*4882a593Smuzhiyun
231*4882a593Smuzhiyun spin_lock_irqsave(&lweventlist_lock, flags);
232*4882a593Smuzhiyun if (!list_empty(&dev->link_watch_list)) {
233*4882a593Smuzhiyun list_del_init(&dev->link_watch_list);
234*4882a593Smuzhiyun clean = 1;
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun spin_unlock_irqrestore(&lweventlist_lock, flags);
237*4882a593Smuzhiyun if (clean)
238*4882a593Smuzhiyun linkwatch_do_dev(dev);
239*4882a593Smuzhiyun }
240*4882a593Smuzhiyun
241*4882a593Smuzhiyun
/*
 * Run the link watch queue for all queued devices, not just urgent ones.
 *
 * Must be called with the rtnl semaphore held.
 */
void linkwatch_run_queue(void)
{
	const int urgent_only = 0;

	__linkwatch_run_queue(urgent_only);
}
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun
linkwatch_event(struct work_struct * dummy)249*4882a593Smuzhiyun static void linkwatch_event(struct work_struct *dummy)
250*4882a593Smuzhiyun {
251*4882a593Smuzhiyun rtnl_lock();
252*4882a593Smuzhiyun __linkwatch_run_queue(time_after(linkwatch_nextevent, jiffies));
253*4882a593Smuzhiyun rtnl_unlock();
254*4882a593Smuzhiyun }
255*4882a593Smuzhiyun
256*4882a593Smuzhiyun
linkwatch_fire_event(struct net_device * dev)257*4882a593Smuzhiyun void linkwatch_fire_event(struct net_device *dev)
258*4882a593Smuzhiyun {
259*4882a593Smuzhiyun bool urgent = linkwatch_urgent_event(dev);
260*4882a593Smuzhiyun
261*4882a593Smuzhiyun if (!test_and_set_bit(__LINK_STATE_LINKWATCH_PENDING, &dev->state)) {
262*4882a593Smuzhiyun linkwatch_add_event(dev);
263*4882a593Smuzhiyun } else if (!urgent)
264*4882a593Smuzhiyun return;
265*4882a593Smuzhiyun
266*4882a593Smuzhiyun linkwatch_schedule_work(urgent);
267*4882a593Smuzhiyun }
268*4882a593Smuzhiyun EXPORT_SYMBOL(linkwatch_fire_event);
269