162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Linux network device link state notification 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Author: 662306a36Sopenharmony_ci * Stefan Rompf <sux@loplof.de> 762306a36Sopenharmony_ci */ 862306a36Sopenharmony_ci 962306a36Sopenharmony_ci#include <linux/module.h> 1062306a36Sopenharmony_ci#include <linux/netdevice.h> 1162306a36Sopenharmony_ci#include <linux/if.h> 1262306a36Sopenharmony_ci#include <net/sock.h> 1362306a36Sopenharmony_ci#include <net/pkt_sched.h> 1462306a36Sopenharmony_ci#include <linux/rtnetlink.h> 1562306a36Sopenharmony_ci#include <linux/jiffies.h> 1662306a36Sopenharmony_ci#include <linux/spinlock.h> 1762306a36Sopenharmony_ci#include <linux/workqueue.h> 1862306a36Sopenharmony_ci#include <linux/bitops.h> 1962306a36Sopenharmony_ci#include <linux/types.h> 2062306a36Sopenharmony_ci 2162306a36Sopenharmony_ci#include "dev.h" 2262306a36Sopenharmony_ci 2362306a36Sopenharmony_cienum lw_bits { 2462306a36Sopenharmony_ci LW_URGENT = 0, 2562306a36Sopenharmony_ci}; 2662306a36Sopenharmony_ci 2762306a36Sopenharmony_cistatic unsigned long linkwatch_flags; 2862306a36Sopenharmony_cistatic unsigned long linkwatch_nextevent; 2962306a36Sopenharmony_ci 3062306a36Sopenharmony_cistatic void linkwatch_event(struct work_struct *dummy); 3162306a36Sopenharmony_cistatic DECLARE_DELAYED_WORK(linkwatch_work, linkwatch_event); 3262306a36Sopenharmony_ci 3362306a36Sopenharmony_cistatic LIST_HEAD(lweventlist); 3462306a36Sopenharmony_cistatic DEFINE_SPINLOCK(lweventlist_lock); 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_cistatic unsigned char default_operstate(const struct net_device *dev) 3762306a36Sopenharmony_ci{ 3862306a36Sopenharmony_ci if (netif_testing(dev)) 3962306a36Sopenharmony_ci return IF_OPER_TESTING; 4062306a36Sopenharmony_ci 4162306a36Sopenharmony_ci /* Some uppers (DSA) have additional sources for being down, so 4262306a36Sopenharmony_ci * first check whether lower is indeed the source of its down state. 4362306a36Sopenharmony_ci */ 4462306a36Sopenharmony_ci if (!netif_carrier_ok(dev)) { 4562306a36Sopenharmony_ci int iflink = dev_get_iflink(dev); 4662306a36Sopenharmony_ci struct net_device *peer; 4762306a36Sopenharmony_ci 4862306a36Sopenharmony_ci if (iflink == dev->ifindex) 4962306a36Sopenharmony_ci return IF_OPER_DOWN; 5062306a36Sopenharmony_ci 5162306a36Sopenharmony_ci peer = __dev_get_by_index(dev_net(dev), iflink); 5262306a36Sopenharmony_ci if (!peer) 5362306a36Sopenharmony_ci return IF_OPER_DOWN; 5462306a36Sopenharmony_ci 5562306a36Sopenharmony_ci return netif_carrier_ok(peer) ? IF_OPER_DOWN : 5662306a36Sopenharmony_ci IF_OPER_LOWERLAYERDOWN; 5762306a36Sopenharmony_ci } 5862306a36Sopenharmony_ci 5962306a36Sopenharmony_ci if (netif_dormant(dev)) 6062306a36Sopenharmony_ci return IF_OPER_DORMANT; 6162306a36Sopenharmony_ci 6262306a36Sopenharmony_ci return IF_OPER_UP; 6362306a36Sopenharmony_ci} 6462306a36Sopenharmony_ci 6562306a36Sopenharmony_ci 6662306a36Sopenharmony_cistatic void rfc2863_policy(struct net_device *dev) 6762306a36Sopenharmony_ci{ 6862306a36Sopenharmony_ci unsigned char operstate = default_operstate(dev); 6962306a36Sopenharmony_ci 7062306a36Sopenharmony_ci if (operstate == dev->operstate) 7162306a36Sopenharmony_ci return; 7262306a36Sopenharmony_ci 7362306a36Sopenharmony_ci write_lock(&dev_base_lock); 7462306a36Sopenharmony_ci 7562306a36Sopenharmony_ci switch(dev->link_mode) { 7662306a36Sopenharmony_ci case IF_LINK_MODE_TESTING: 7762306a36Sopenharmony_ci if (operstate == IF_OPER_UP) 7862306a36Sopenharmony_ci operstate = IF_OPER_TESTING; 7962306a36Sopenharmony_ci break; 8062306a36Sopenharmony_ci 8162306a36Sopenharmony_ci case IF_LINK_MODE_DORMANT: 8262306a36Sopenharmony_ci if (operstate == IF_OPER_UP) 8362306a36Sopenharmony_ci operstate = IF_OPER_DORMANT; 8462306a36Sopenharmony_ci break; 8562306a36Sopenharmony_ci case IF_LINK_MODE_DEFAULT: 8662306a36Sopenharmony_ci default: 8762306a36Sopenharmony_ci break; 8862306a36Sopenharmony_ci } 8962306a36Sopenharmony_ci 9062306a36Sopenharmony_ci dev->operstate = operstate; 9162306a36Sopenharmony_ci 9262306a36Sopenharmony_ci write_unlock(&dev_base_lock); 9362306a36Sopenharmony_ci} 9462306a36Sopenharmony_ci 9562306a36Sopenharmony_ci 9662306a36Sopenharmony_civoid linkwatch_init_dev(struct net_device *dev) 9762306a36Sopenharmony_ci{ 9862306a36Sopenharmony_ci /* Handle pre-registration link state changes */ 9962306a36Sopenharmony_ci if (!netif_carrier_ok(dev) || netif_dormant(dev) || 10062306a36Sopenharmony_ci netif_testing(dev)) 10162306a36Sopenharmony_ci rfc2863_policy(dev); 10262306a36Sopenharmony_ci} 10362306a36Sopenharmony_ci 10462306a36Sopenharmony_ci 10562306a36Sopenharmony_cistatic bool linkwatch_urgent_event(struct net_device *dev) 10662306a36Sopenharmony_ci{ 10762306a36Sopenharmony_ci if (!netif_running(dev)) 10862306a36Sopenharmony_ci return false; 10962306a36Sopenharmony_ci 11062306a36Sopenharmony_ci if (dev->ifindex != dev_get_iflink(dev)) 11162306a36Sopenharmony_ci return true; 11262306a36Sopenharmony_ci 11362306a36Sopenharmony_ci if (netif_is_lag_port(dev) || netif_is_lag_master(dev)) 11462306a36Sopenharmony_ci return true; 11562306a36Sopenharmony_ci 11662306a36Sopenharmony_ci return netif_carrier_ok(dev) && qdisc_tx_changing(dev); 11762306a36Sopenharmony_ci} 11862306a36Sopenharmony_ci 11962306a36Sopenharmony_ci 12062306a36Sopenharmony_cistatic void linkwatch_add_event(struct net_device *dev) 12162306a36Sopenharmony_ci{ 12262306a36Sopenharmony_ci unsigned long flags; 12362306a36Sopenharmony_ci 12462306a36Sopenharmony_ci spin_lock_irqsave(&lweventlist_lock, flags); 12562306a36Sopenharmony_ci if (list_empty(&dev->link_watch_list)) { 12662306a36Sopenharmony_ci list_add_tail(&dev->link_watch_list, &lweventlist); 12762306a36Sopenharmony_ci netdev_hold(dev, &dev->linkwatch_dev_tracker, GFP_ATOMIC); 12862306a36Sopenharmony_ci } 12962306a36Sopenharmony_ci spin_unlock_irqrestore(&lweventlist_lock, flags); 13062306a36Sopenharmony_ci} 13162306a36Sopenharmony_ci 13262306a36Sopenharmony_ci 13362306a36Sopenharmony_cistatic void linkwatch_schedule_work(int urgent) 13462306a36Sopenharmony_ci{ 13562306a36Sopenharmony_ci unsigned long delay = linkwatch_nextevent - jiffies; 13662306a36Sopenharmony_ci 13762306a36Sopenharmony_ci if (test_bit(LW_URGENT, &linkwatch_flags)) 13862306a36Sopenharmony_ci return; 13962306a36Sopenharmony_ci 14062306a36Sopenharmony_ci /* Minimise down-time: drop delay for up event. */ 14162306a36Sopenharmony_ci if (urgent) { 14262306a36Sopenharmony_ci if (test_and_set_bit(LW_URGENT, &linkwatch_flags)) 14362306a36Sopenharmony_ci return; 14462306a36Sopenharmony_ci delay = 0; 14562306a36Sopenharmony_ci } 14662306a36Sopenharmony_ci 14762306a36Sopenharmony_ci /* If we wrap around we'll delay it by at most HZ. */ 14862306a36Sopenharmony_ci if (delay > HZ) 14962306a36Sopenharmony_ci delay = 0; 15062306a36Sopenharmony_ci 15162306a36Sopenharmony_ci /* 15262306a36Sopenharmony_ci * If urgent, schedule immediate execution; otherwise, don't 15362306a36Sopenharmony_ci * override the existing timer. 15462306a36Sopenharmony_ci */ 15562306a36Sopenharmony_ci if (test_bit(LW_URGENT, &linkwatch_flags)) 15662306a36Sopenharmony_ci mod_delayed_work(system_wq, &linkwatch_work, 0); 15762306a36Sopenharmony_ci else 15862306a36Sopenharmony_ci schedule_delayed_work(&linkwatch_work, delay); 15962306a36Sopenharmony_ci} 16062306a36Sopenharmony_ci 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_cistatic void linkwatch_do_dev(struct net_device *dev) 16362306a36Sopenharmony_ci{ 16462306a36Sopenharmony_ci /* 16562306a36Sopenharmony_ci * Make sure the above read is complete since it can be 16662306a36Sopenharmony_ci * rewritten as soon as we clear the bit below. 16762306a36Sopenharmony_ci */ 16862306a36Sopenharmony_ci smp_mb__before_atomic(); 16962306a36Sopenharmony_ci 17062306a36Sopenharmony_ci /* We are about to handle this device, 17162306a36Sopenharmony_ci * so new events can be accepted 17262306a36Sopenharmony_ci */ 17362306a36Sopenharmony_ci clear_bit(__LINK_STATE_LINKWATCH_PENDING, &dev->state); 17462306a36Sopenharmony_ci 17562306a36Sopenharmony_ci rfc2863_policy(dev); 17662306a36Sopenharmony_ci if (dev->flags & IFF_UP) { 17762306a36Sopenharmony_ci if (netif_carrier_ok(dev)) 17862306a36Sopenharmony_ci dev_activate(dev); 17962306a36Sopenharmony_ci else 18062306a36Sopenharmony_ci dev_deactivate(dev); 18162306a36Sopenharmony_ci 18262306a36Sopenharmony_ci netdev_state_change(dev); 18362306a36Sopenharmony_ci } 18462306a36Sopenharmony_ci /* Note: our callers are responsible for calling netdev_tracker_free(). 18562306a36Sopenharmony_ci * This is the reason we use __dev_put() instead of dev_put(). 18662306a36Sopenharmony_ci */ 18762306a36Sopenharmony_ci __dev_put(dev); 18862306a36Sopenharmony_ci} 18962306a36Sopenharmony_ci 19062306a36Sopenharmony_cistatic void __linkwatch_run_queue(int urgent_only) 19162306a36Sopenharmony_ci{ 19262306a36Sopenharmony_ci#define MAX_DO_DEV_PER_LOOP 100 19362306a36Sopenharmony_ci 19462306a36Sopenharmony_ci int do_dev = MAX_DO_DEV_PER_LOOP; 19562306a36Sopenharmony_ci struct net_device *dev; 19662306a36Sopenharmony_ci LIST_HEAD(wrk); 19762306a36Sopenharmony_ci 19862306a36Sopenharmony_ci /* Give urgent case more budget */ 19962306a36Sopenharmony_ci if (urgent_only) 20062306a36Sopenharmony_ci do_dev += MAX_DO_DEV_PER_LOOP; 20162306a36Sopenharmony_ci 20262306a36Sopenharmony_ci /* 20362306a36Sopenharmony_ci * Limit the number of linkwatch events to one 20462306a36Sopenharmony_ci * per second so that a runaway driver does not 20562306a36Sopenharmony_ci * cause a storm of messages on the netlink 20662306a36Sopenharmony_ci * socket. This limit does not apply to up events 20762306a36Sopenharmony_ci * while the device qdisc is down. 20862306a36Sopenharmony_ci */ 20962306a36Sopenharmony_ci if (!urgent_only) 21062306a36Sopenharmony_ci linkwatch_nextevent = jiffies + HZ; 21162306a36Sopenharmony_ci /* Limit wrap-around effect on delay. */ 21262306a36Sopenharmony_ci else if (time_after(linkwatch_nextevent, jiffies + HZ)) 21362306a36Sopenharmony_ci linkwatch_nextevent = jiffies; 21462306a36Sopenharmony_ci 21562306a36Sopenharmony_ci clear_bit(LW_URGENT, &linkwatch_flags); 21662306a36Sopenharmony_ci 21762306a36Sopenharmony_ci spin_lock_irq(&lweventlist_lock); 21862306a36Sopenharmony_ci list_splice_init(&lweventlist, &wrk); 21962306a36Sopenharmony_ci 22062306a36Sopenharmony_ci while (!list_empty(&wrk) && do_dev > 0) { 22162306a36Sopenharmony_ci 22262306a36Sopenharmony_ci dev = list_first_entry(&wrk, struct net_device, link_watch_list); 22362306a36Sopenharmony_ci list_del_init(&dev->link_watch_list); 22462306a36Sopenharmony_ci 22562306a36Sopenharmony_ci if (!netif_device_present(dev) || 22662306a36Sopenharmony_ci (urgent_only && !linkwatch_urgent_event(dev))) { 22762306a36Sopenharmony_ci list_add_tail(&dev->link_watch_list, &lweventlist); 22862306a36Sopenharmony_ci continue; 22962306a36Sopenharmony_ci } 23062306a36Sopenharmony_ci /* We must free netdev tracker under 23162306a36Sopenharmony_ci * the spinlock protection. 23262306a36Sopenharmony_ci */ 23362306a36Sopenharmony_ci netdev_tracker_free(dev, &dev->linkwatch_dev_tracker); 23462306a36Sopenharmony_ci spin_unlock_irq(&lweventlist_lock); 23562306a36Sopenharmony_ci linkwatch_do_dev(dev); 23662306a36Sopenharmony_ci do_dev--; 23762306a36Sopenharmony_ci spin_lock_irq(&lweventlist_lock); 23862306a36Sopenharmony_ci } 23962306a36Sopenharmony_ci 24062306a36Sopenharmony_ci /* Add the remaining work back to lweventlist */ 24162306a36Sopenharmony_ci list_splice_init(&wrk, &lweventlist); 24262306a36Sopenharmony_ci 24362306a36Sopenharmony_ci if (!list_empty(&lweventlist)) 24462306a36Sopenharmony_ci linkwatch_schedule_work(0); 24562306a36Sopenharmony_ci spin_unlock_irq(&lweventlist_lock); 24662306a36Sopenharmony_ci} 24762306a36Sopenharmony_ci 24862306a36Sopenharmony_civoid linkwatch_forget_dev(struct net_device *dev) 24962306a36Sopenharmony_ci{ 25062306a36Sopenharmony_ci unsigned long flags; 25162306a36Sopenharmony_ci int clean = 0; 25262306a36Sopenharmony_ci 25362306a36Sopenharmony_ci spin_lock_irqsave(&lweventlist_lock, flags); 25462306a36Sopenharmony_ci if (!list_empty(&dev->link_watch_list)) { 25562306a36Sopenharmony_ci list_del_init(&dev->link_watch_list); 25662306a36Sopenharmony_ci clean = 1; 25762306a36Sopenharmony_ci /* We must release netdev tracker under 25862306a36Sopenharmony_ci * the spinlock protection. 25962306a36Sopenharmony_ci */ 26062306a36Sopenharmony_ci netdev_tracker_free(dev, &dev->linkwatch_dev_tracker); 26162306a36Sopenharmony_ci } 26262306a36Sopenharmony_ci spin_unlock_irqrestore(&lweventlist_lock, flags); 26362306a36Sopenharmony_ci if (clean) 26462306a36Sopenharmony_ci linkwatch_do_dev(dev); 26562306a36Sopenharmony_ci} 26662306a36Sopenharmony_ci 26762306a36Sopenharmony_ci 26862306a36Sopenharmony_ci/* Must be called with the rtnl semaphore held */ 26962306a36Sopenharmony_civoid linkwatch_run_queue(void) 27062306a36Sopenharmony_ci{ 27162306a36Sopenharmony_ci __linkwatch_run_queue(0); 27262306a36Sopenharmony_ci} 27362306a36Sopenharmony_ci 27462306a36Sopenharmony_ci 27562306a36Sopenharmony_cistatic void linkwatch_event(struct work_struct *dummy) 27662306a36Sopenharmony_ci{ 27762306a36Sopenharmony_ci rtnl_lock(); 27862306a36Sopenharmony_ci __linkwatch_run_queue(time_after(linkwatch_nextevent, jiffies)); 27962306a36Sopenharmony_ci rtnl_unlock(); 28062306a36Sopenharmony_ci} 28162306a36Sopenharmony_ci 28262306a36Sopenharmony_ci 28362306a36Sopenharmony_civoid linkwatch_fire_event(struct net_device *dev) 28462306a36Sopenharmony_ci{ 28562306a36Sopenharmony_ci bool urgent = linkwatch_urgent_event(dev); 28662306a36Sopenharmony_ci 28762306a36Sopenharmony_ci if (!test_and_set_bit(__LINK_STATE_LINKWATCH_PENDING, &dev->state)) { 28862306a36Sopenharmony_ci linkwatch_add_event(dev); 28962306a36Sopenharmony_ci } else if (!urgent) 29062306a36Sopenharmony_ci return; 29162306a36Sopenharmony_ci 29262306a36Sopenharmony_ci linkwatch_schedule_work(urgent); 29362306a36Sopenharmony_ci} 29462306a36Sopenharmony_ciEXPORT_SYMBOL(linkwatch_fire_event); 295