1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * INET An implementation of the TCP/IP protocol suite for the LINUX
4*4882a593Smuzhiyun * operating system. INET is implemented using the BSD Socket
5*4882a593Smuzhiyun * interface as the means of communication with the user level.
6*4882a593Smuzhiyun *
7*4882a593Smuzhiyun * Pseudo-driver for the loopback interface.
8*4882a593Smuzhiyun *
9*4882a593Smuzhiyun * Version: @(#)loopback.c 1.0.4b 08/16/93
10*4882a593Smuzhiyun *
11*4882a593Smuzhiyun * Authors: Ross Biro
12*4882a593Smuzhiyun * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
13*4882a593Smuzhiyun * Donald Becker, <becker@scyld.com>
14*4882a593Smuzhiyun *
15*4882a593Smuzhiyun * Alan Cox : Fixed oddments for NET3.014
16*4882a593Smuzhiyun * Alan Cox : Rejig for NET3.029 snap #3
17*4882a593Smuzhiyun * Alan Cox : Fixed NET3.029 bugs and sped up
18*4882a593Smuzhiyun * Larry McVoy : Tiny tweak to double performance
19*4882a593Smuzhiyun * Alan Cox : Backed out LMV's tweak - the linux mm
20*4882a593Smuzhiyun * can't take it...
21*4882a593Smuzhiyun * Michael Griffith: Don't bother computing the checksums
22*4882a593Smuzhiyun * on packets received on the loopback
23*4882a593Smuzhiyun * interface.
24*4882a593Smuzhiyun * Alexey Kuznetsov: Potential hang under some extreme
25*4882a593Smuzhiyun * cases removed.
26*4882a593Smuzhiyun */
27*4882a593Smuzhiyun #include <linux/kernel.h>
28*4882a593Smuzhiyun #include <linux/jiffies.h>
29*4882a593Smuzhiyun #include <linux/module.h>
30*4882a593Smuzhiyun #include <linux/interrupt.h>
31*4882a593Smuzhiyun #include <linux/fs.h>
32*4882a593Smuzhiyun #include <linux/types.h>
33*4882a593Smuzhiyun #include <linux/string.h>
34*4882a593Smuzhiyun #include <linux/socket.h>
35*4882a593Smuzhiyun #include <linux/errno.h>
36*4882a593Smuzhiyun #include <linux/fcntl.h>
37*4882a593Smuzhiyun #include <linux/in.h>
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun #include <linux/uaccess.h>
40*4882a593Smuzhiyun #include <linux/io.h>
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun #include <linux/inet.h>
43*4882a593Smuzhiyun #include <linux/netdevice.h>
44*4882a593Smuzhiyun #include <linux/etherdevice.h>
45*4882a593Smuzhiyun #include <linux/skbuff.h>
46*4882a593Smuzhiyun #include <linux/ethtool.h>
47*4882a593Smuzhiyun #include <net/sock.h>
48*4882a593Smuzhiyun #include <net/checksum.h>
49*4882a593Smuzhiyun #include <linux/if_ether.h> /* For the statistics structure. */
50*4882a593Smuzhiyun #include <linux/if_arp.h> /* For ARPHRD_ETHER */
51*4882a593Smuzhiyun #include <linux/ip.h>
52*4882a593Smuzhiyun #include <linux/tcp.h>
53*4882a593Smuzhiyun #include <linux/percpu.h>
54*4882a593Smuzhiyun #include <linux/net_tstamp.h>
55*4882a593Smuzhiyun #include <net/net_namespace.h>
56*4882a593Smuzhiyun #include <linux/u64_stats_sync.h>
57*4882a593Smuzhiyun
/* blackhole_netdev - device used for dsts that have been marked expired.
 *
 * A single global instance is kept (rather than one per network
 * namespace) because per-namespace state is not needed; it is set up
 * at boot time.
 */
struct net_device *blackhole_netdev;
EXPORT_SYMBOL(blackhole_netdev);
64*4882a593Smuzhiyun
65*4882a593Smuzhiyun /* The higher levels take care of making this non-reentrant (it's
66*4882a593Smuzhiyun * called with bh's disabled).
67*4882a593Smuzhiyun */
loopback_xmit(struct sk_buff * skb,struct net_device * dev)68*4882a593Smuzhiyun static netdev_tx_t loopback_xmit(struct sk_buff *skb,
69*4882a593Smuzhiyun struct net_device *dev)
70*4882a593Smuzhiyun {
71*4882a593Smuzhiyun int len;
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun skb_tx_timestamp(skb);
74*4882a593Smuzhiyun
75*4882a593Smuzhiyun /* do not fool net_timestamp_check() with various clock bases */
76*4882a593Smuzhiyun skb->tstamp = 0;
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun skb_orphan(skb);
79*4882a593Smuzhiyun
80*4882a593Smuzhiyun /* Before queueing this packet to netif_rx(),
81*4882a593Smuzhiyun * make sure dst is refcounted.
82*4882a593Smuzhiyun */
83*4882a593Smuzhiyun skb_dst_force(skb);
84*4882a593Smuzhiyun
85*4882a593Smuzhiyun skb->protocol = eth_type_trans(skb, dev);
86*4882a593Smuzhiyun
87*4882a593Smuzhiyun len = skb->len;
88*4882a593Smuzhiyun if (likely(netif_rx(skb) == NET_RX_SUCCESS))
89*4882a593Smuzhiyun dev_lstats_add(dev, len);
90*4882a593Smuzhiyun
91*4882a593Smuzhiyun return NETDEV_TX_OK;
92*4882a593Smuzhiyun }
93*4882a593Smuzhiyun
/* dev_lstats_read - sum the per-CPU lstats counters of a device.
 * @dev:     device whose dev->lstats per-CPU area is read
 * @packets: output; receives the packet total
 * @bytes:   output; receives the byte total
 *
 * Both outputs are zeroed first and then accumulated over every
 * possible CPU.
 */
void dev_lstats_read(struct net_device *dev, u64 *packets, u64 *bytes)
{
	int cpu;

	*packets = 0;
	*bytes = 0;

	for_each_possible_cpu(cpu) {
		const struct pcpu_lstats *stats = per_cpu_ptr(dev->lstats, cpu);
		u64 cpu_packets, cpu_bytes;
		unsigned int seq;

		/* Re-read both counters for as long as the syncp retry
		 * check asks us to.
		 */
		do {
			seq = u64_stats_fetch_begin_irq(&stats->syncp);
			cpu_packets = u64_stats_read(&stats->packets);
			cpu_bytes = u64_stats_read(&stats->bytes);
		} while (u64_stats_fetch_retry_irq(&stats->syncp, seq));

		*packets += cpu_packets;
		*bytes += cpu_bytes;
	}
}
EXPORT_SYMBOL(dev_lstats_read);
117*4882a593Smuzhiyun
loopback_get_stats64(struct net_device * dev,struct rtnl_link_stats64 * stats)118*4882a593Smuzhiyun static void loopback_get_stats64(struct net_device *dev,
119*4882a593Smuzhiyun struct rtnl_link_stats64 *stats)
120*4882a593Smuzhiyun {
121*4882a593Smuzhiyun u64 packets, bytes;
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun dev_lstats_read(dev, &packets, &bytes);
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun stats->rx_packets = packets;
126*4882a593Smuzhiyun stats->tx_packets = packets;
127*4882a593Smuzhiyun stats->rx_bytes = bytes;
128*4882a593Smuzhiyun stats->tx_bytes = bytes;
129*4882a593Smuzhiyun }
130*4882a593Smuzhiyun
always_on(struct net_device * dev)131*4882a593Smuzhiyun static u32 always_on(struct net_device *dev)
132*4882a593Smuzhiyun {
133*4882a593Smuzhiyun return 1;
134*4882a593Smuzhiyun }
135*4882a593Smuzhiyun
136*4882a593Smuzhiyun static const struct ethtool_ops loopback_ethtool_ops = {
137*4882a593Smuzhiyun .get_link = always_on,
138*4882a593Smuzhiyun .get_ts_info = ethtool_op_get_ts_info,
139*4882a593Smuzhiyun };
140*4882a593Smuzhiyun
loopback_dev_init(struct net_device * dev)141*4882a593Smuzhiyun static int loopback_dev_init(struct net_device *dev)
142*4882a593Smuzhiyun {
143*4882a593Smuzhiyun dev->lstats = netdev_alloc_pcpu_stats(struct pcpu_lstats);
144*4882a593Smuzhiyun if (!dev->lstats)
145*4882a593Smuzhiyun return -ENOMEM;
146*4882a593Smuzhiyun return 0;
147*4882a593Smuzhiyun }
148*4882a593Smuzhiyun
loopback_dev_free(struct net_device * dev)149*4882a593Smuzhiyun static void loopback_dev_free(struct net_device *dev)
150*4882a593Smuzhiyun {
151*4882a593Smuzhiyun dev_net(dev)->loopback_dev = NULL;
152*4882a593Smuzhiyun free_percpu(dev->lstats);
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun static const struct net_device_ops loopback_ops = {
156*4882a593Smuzhiyun .ndo_init = loopback_dev_init,
157*4882a593Smuzhiyun .ndo_start_xmit = loopback_xmit,
158*4882a593Smuzhiyun .ndo_get_stats64 = loopback_get_stats64,
159*4882a593Smuzhiyun .ndo_set_mac_address = eth_mac_addr,
160*4882a593Smuzhiyun };
161*4882a593Smuzhiyun
gen_lo_setup(struct net_device * dev,unsigned int mtu,const struct ethtool_ops * eth_ops,const struct header_ops * hdr_ops,const struct net_device_ops * dev_ops,void (* dev_destructor)(struct net_device * dev))162*4882a593Smuzhiyun static void gen_lo_setup(struct net_device *dev,
163*4882a593Smuzhiyun unsigned int mtu,
164*4882a593Smuzhiyun const struct ethtool_ops *eth_ops,
165*4882a593Smuzhiyun const struct header_ops *hdr_ops,
166*4882a593Smuzhiyun const struct net_device_ops *dev_ops,
167*4882a593Smuzhiyun void (*dev_destructor)(struct net_device *dev))
168*4882a593Smuzhiyun {
169*4882a593Smuzhiyun dev->mtu = mtu;
170*4882a593Smuzhiyun dev->hard_header_len = ETH_HLEN; /* 14 */
171*4882a593Smuzhiyun dev->min_header_len = ETH_HLEN; /* 14 */
172*4882a593Smuzhiyun dev->addr_len = ETH_ALEN; /* 6 */
173*4882a593Smuzhiyun dev->type = ARPHRD_LOOPBACK; /* 0x0001*/
174*4882a593Smuzhiyun dev->flags = IFF_LOOPBACK;
175*4882a593Smuzhiyun dev->priv_flags |= IFF_LIVE_ADDR_CHANGE | IFF_NO_QUEUE;
176*4882a593Smuzhiyun netif_keep_dst(dev);
177*4882a593Smuzhiyun dev->hw_features = NETIF_F_GSO_SOFTWARE;
178*4882a593Smuzhiyun dev->features = NETIF_F_SG | NETIF_F_FRAGLIST
179*4882a593Smuzhiyun | NETIF_F_GSO_SOFTWARE
180*4882a593Smuzhiyun | NETIF_F_HW_CSUM
181*4882a593Smuzhiyun | NETIF_F_RXCSUM
182*4882a593Smuzhiyun | NETIF_F_SCTP_CRC
183*4882a593Smuzhiyun | NETIF_F_HIGHDMA
184*4882a593Smuzhiyun | NETIF_F_LLTX
185*4882a593Smuzhiyun | NETIF_F_NETNS_LOCAL
186*4882a593Smuzhiyun | NETIF_F_VLAN_CHALLENGED
187*4882a593Smuzhiyun | NETIF_F_LOOPBACK;
188*4882a593Smuzhiyun dev->ethtool_ops = eth_ops;
189*4882a593Smuzhiyun dev->header_ops = hdr_ops;
190*4882a593Smuzhiyun dev->netdev_ops = dev_ops;
191*4882a593Smuzhiyun dev->needs_free_netdev = true;
192*4882a593Smuzhiyun dev->priv_destructor = dev_destructor;
193*4882a593Smuzhiyun }
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun /* The loopback device is special. There is only one instance
196*4882a593Smuzhiyun * per network namespace.
197*4882a593Smuzhiyun */
loopback_setup(struct net_device * dev)198*4882a593Smuzhiyun static void loopback_setup(struct net_device *dev)
199*4882a593Smuzhiyun {
200*4882a593Smuzhiyun gen_lo_setup(dev, (64 * 1024), &loopback_ethtool_ops, ð_header_ops,
201*4882a593Smuzhiyun &loopback_ops, loopback_dev_free);
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun /* Setup and register the loopback device. */
loopback_net_init(struct net * net)205*4882a593Smuzhiyun static __net_init int loopback_net_init(struct net *net)
206*4882a593Smuzhiyun {
207*4882a593Smuzhiyun struct net_device *dev;
208*4882a593Smuzhiyun int err;
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun err = -ENOMEM;
211*4882a593Smuzhiyun dev = alloc_netdev(0, "lo", NET_NAME_PREDICTABLE, loopback_setup);
212*4882a593Smuzhiyun if (!dev)
213*4882a593Smuzhiyun goto out;
214*4882a593Smuzhiyun
215*4882a593Smuzhiyun dev_net_set(dev, net);
216*4882a593Smuzhiyun err = register_netdev(dev);
217*4882a593Smuzhiyun if (err)
218*4882a593Smuzhiyun goto out_free_netdev;
219*4882a593Smuzhiyun
220*4882a593Smuzhiyun BUG_ON(dev->ifindex != LOOPBACK_IFINDEX);
221*4882a593Smuzhiyun net->loopback_dev = dev;
222*4882a593Smuzhiyun return 0;
223*4882a593Smuzhiyun
224*4882a593Smuzhiyun out_free_netdev:
225*4882a593Smuzhiyun free_netdev(dev);
226*4882a593Smuzhiyun out:
227*4882a593Smuzhiyun if (net_eq(net, &init_net))
228*4882a593Smuzhiyun panic("loopback: Failed to register netdevice: %d\n", err);
229*4882a593Smuzhiyun return err;
230*4882a593Smuzhiyun }
231*4882a593Smuzhiyun
232*4882a593Smuzhiyun /* Registered in net/core/dev.c */
233*4882a593Smuzhiyun struct pernet_operations __net_initdata loopback_net_ops = {
234*4882a593Smuzhiyun .init = loopback_net_init,
235*4882a593Smuzhiyun };
236*4882a593Smuzhiyun
237*4882a593Smuzhiyun /* blackhole netdevice */
blackhole_netdev_xmit(struct sk_buff * skb,struct net_device * dev)238*4882a593Smuzhiyun static netdev_tx_t blackhole_netdev_xmit(struct sk_buff *skb,
239*4882a593Smuzhiyun struct net_device *dev)
240*4882a593Smuzhiyun {
241*4882a593Smuzhiyun kfree_skb(skb);
242*4882a593Smuzhiyun net_warn_ratelimited("%s(): Dropping skb.\n", __func__);
243*4882a593Smuzhiyun return NETDEV_TX_OK;
244*4882a593Smuzhiyun }
245*4882a593Smuzhiyun
246*4882a593Smuzhiyun static const struct net_device_ops blackhole_netdev_ops = {
247*4882a593Smuzhiyun .ndo_start_xmit = blackhole_netdev_xmit,
248*4882a593Smuzhiyun };
249*4882a593Smuzhiyun
250*4882a593Smuzhiyun /* This is a dst-dummy device used specifically for invalidated
251*4882a593Smuzhiyun * DSTs and unlike loopback, this is not per-ns.
252*4882a593Smuzhiyun */
blackhole_netdev_setup(struct net_device * dev)253*4882a593Smuzhiyun static void blackhole_netdev_setup(struct net_device *dev)
254*4882a593Smuzhiyun {
255*4882a593Smuzhiyun gen_lo_setup(dev, ETH_MIN_MTU, NULL, NULL, &blackhole_netdev_ops, NULL);
256*4882a593Smuzhiyun }
257*4882a593Smuzhiyun
258*4882a593Smuzhiyun /* Setup and register the blackhole_netdev. */
blackhole_netdev_init(void)259*4882a593Smuzhiyun static int __init blackhole_netdev_init(void)
260*4882a593Smuzhiyun {
261*4882a593Smuzhiyun blackhole_netdev = alloc_netdev(0, "blackhole_dev", NET_NAME_UNKNOWN,
262*4882a593Smuzhiyun blackhole_netdev_setup);
263*4882a593Smuzhiyun if (!blackhole_netdev)
264*4882a593Smuzhiyun return -ENOMEM;
265*4882a593Smuzhiyun
266*4882a593Smuzhiyun rtnl_lock();
267*4882a593Smuzhiyun dev_init_scheduler(blackhole_netdev);
268*4882a593Smuzhiyun dev_activate(blackhole_netdev);
269*4882a593Smuzhiyun rtnl_unlock();
270*4882a593Smuzhiyun
271*4882a593Smuzhiyun blackhole_netdev->flags |= IFF_UP | IFF_RUNNING;
272*4882a593Smuzhiyun dev_net_set(blackhole_netdev, &init_net);
273*4882a593Smuzhiyun
274*4882a593Smuzhiyun return 0;
275*4882a593Smuzhiyun }
276*4882a593Smuzhiyun
277*4882a593Smuzhiyun device_initcall(blackhole_netdev_init);
278