// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * INET		An implementation of the TCP/IP protocol suite for the LINUX
 *		operating system.  INET is implemented using the  BSD Socket
 *		interface as the means of communication with the user level.
 *
 *		Pseudo-driver for the loopback interface.
 *
 * Version:	@(#)loopback.c	1.0.4b	08/16/93
 *
 * Authors:	Ross Biro
 *		Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
 *		Donald Becker, <becker@scyld.com>
 *
 *		Alan Cox	:	Fixed oddments for NET3.014
 *		Alan Cox	:	Rejig for NET3.029 snap #3
 *		Alan Cox	:	Fixed NET3.029 bugs and sped up
 *		Larry McVoy	:	Tiny tweak to double performance
 *		Alan Cox	:	Backed out LMV's tweak - the linux mm
 *					can't take it...
 *              Michael Griffith:       Don't bother computing the checksums
 *                                      on packets received on the loopback
 *                                      interface.
 *		Alexey Kuznetsov:	Potential hang under some extreme
 *					cases removed.
 */
#include <linux/kernel.h>
#include <linux/jiffies.h>
#include <linux/module.h>
#include <linux/interrupt.h>
#include <linux/fs.h>
#include <linux/types.h>
#include <linux/string.h>
#include <linux/socket.h>
#include <linux/errno.h>
#include <linux/fcntl.h>
#include <linux/in.h>

#include <linux/uaccess.h>
#include <linux/io.h>

#include <linux/inet.h>
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
#include <linux/skbuff.h>
#include <linux/ethtool.h>
#include <net/sock.h>
#include <net/checksum.h>
#include <linux/if_ether.h>	/* For the statistics structure. */
#include <linux/if_arp.h>	/* For ARPHRD_ETHER */
#include <linux/ip.h>
#include <linux/tcp.h>
#include <linux/percpu.h>
#include <linux/net_tstamp.h>
#include <net/net_namespace.h>
#include <linux/u64_stats_sync.h>

/* blackhole_netdev - device used for dsts that are marked expired.
 * It is a single global device rather than a per-net-namespace one,
 * because per-namespace instances are not needed; it is initialized
 * at boot time.
 */
struct net_device *blackhole_netdev;
EXPORT_SYMBOL(blackhole_netdev);

65
/* The higher levels take care of making this non-reentrant (it's
L
Linus Torvalds 已提交
66 67
 * called with bh's disabled).
 */
68 69
static netdev_tx_t loopback_xmit(struct sk_buff *skb,
				 struct net_device *dev)
L
Linus Torvalds 已提交
70
{
E
Eric Dumazet 已提交
71
	int len;
L
Linus Torvalds 已提交
72

73
	skb_tx_timestamp(skb);
74 75 76 77

	/* do not fool net_timestamp_check() with various clock bases */
	skb->tstamp = 0;

L
Linus Torvalds 已提交
78 79
	skb_orphan(skb);

80 81 82 83 84
	/* Before queueing this packet to netif_rx(),
	 * make sure dst is refcounted.
	 */
	skb_dst_force(skb);

E
Eric Dumazet 已提交
85
	skb->protocol = eth_type_trans(skb, dev);
L
Linus Torvalds 已提交
86

E
Eric Dumazet 已提交
87
	len = skb->len;
88 89
	if (likely(netif_rx(skb) == NET_RX_SUCCESS))
		dev_lstats_add(dev, len);
L
Linus Torvalds 已提交
90

91
	return NETDEV_TX_OK;
L
Linus Torvalds 已提交
92 93
}

94
void dev_lstats_read(struct net_device *dev, u64 *packets, u64 *bytes)
L
Linus Torvalds 已提交
95 96 97
{
	int i;

98 99 100
	*packets = 0;
	*bytes = 0;

101
	for_each_possible_cpu(i) {
102
		const struct pcpu_lstats *lb_stats;
103 104
		u64 tbytes, tpackets;
		unsigned int start;
L
Linus Torvalds 已提交
105

E
Eric Dumazet 已提交
106
		lb_stats = per_cpu_ptr(dev->lstats, i);
107
		do {
108
			start = u64_stats_fetch_begin_irq(&lb_stats->syncp);
109
			tpackets = lb_stats->packets;
110
			tbytes = lb_stats->bytes;
111
		} while (u64_stats_fetch_retry_irq(&lb_stats->syncp, start));
112 113
		*bytes   += tbytes;
		*packets += tpackets;
L
Linus Torvalds 已提交
114
	}
115 116 117 118 119 120 121 122 123 124
}
EXPORT_SYMBOL(dev_lstats_read);

/* ndo_get_stats64 handler: the totals returned by dev_lstats_read() are
 * reported as both the RX and the TX figures.
 */
static void loopback_get_stats64(struct net_device *dev,
				 struct rtnl_link_stats64 *stats)
{
	u64 npackets, nbytes;

	dev_lstats_read(dev, &npackets, &nbytes);

	stats->rx_packets = npackets;
	stats->rx_bytes   = nbytes;

	stats->tx_packets = npackets;
	stats->tx_bytes   = nbytes;
}

131
static u32 always_on(struct net_device *dev)
L
Linus Torvalds 已提交
132 133 134 135
{
	return 1;
}

136
static const struct ethtool_ops loopback_ethtool_ops = {
137
	.get_link		= always_on,
138
	.get_ts_info		= ethtool_op_get_ts_info,
L
Linus Torvalds 已提交
139 140
};

141 142
static int loopback_dev_init(struct net_device *dev)
{
143
	dev->lstats = netdev_alloc_pcpu_stats(struct pcpu_lstats);
E
Eric Dumazet 已提交
144
	if (!dev->lstats)
145 146 147 148 149 150
		return -ENOMEM;
	return 0;
}

static void loopback_dev_free(struct net_device *dev)
{
151
	dev_net(dev)->loopback_dev = NULL;
E
Eric Dumazet 已提交
152
	free_percpu(dev->lstats);
153 154
}

155
static const struct net_device_ops loopback_ops = {
156 157
	.ndo_init        = loopback_dev_init,
	.ndo_start_xmit  = loopback_xmit,
158
	.ndo_get_stats64 = loopback_get_stats64,
159
	.ndo_set_mac_address = eth_mac_addr,
160 161
};

162 163 164 165 166 167
static void gen_lo_setup(struct net_device *dev,
			 unsigned int mtu,
			 const struct ethtool_ops *eth_ops,
			 const struct header_ops *hdr_ops,
			 const struct net_device_ops *dev_ops,
			 void (*dev_destructor)(struct net_device *dev))
168
{
169
	dev->mtu		= mtu;
170
	dev->hard_header_len	= ETH_HLEN;	/* 14	*/
171
	dev->min_header_len	= ETH_HLEN;	/* 14	*/
172 173 174
	dev->addr_len		= ETH_ALEN;	/* 6	*/
	dev->type		= ARPHRD_LOOPBACK;	/* 0x0001*/
	dev->flags		= IFF_LOOPBACK;
175
	dev->priv_flags		|= IFF_LIVE_ADDR_CHANGE | IFF_NO_QUEUE;
176
	netif_keep_dst(dev);
177
	dev->hw_features	= NETIF_F_GSO_SOFTWARE;
178
	dev->features		= NETIF_F_SG | NETIF_F_FRAGLIST
179
		| NETIF_F_GSO_SOFTWARE
180
		| NETIF_F_HW_CSUM
181
		| NETIF_F_RXCSUM
182
		| NETIF_F_SCTP_CRC
183 184
		| NETIF_F_HIGHDMA
		| NETIF_F_LLTX
185
		| NETIF_F_NETNS_LOCAL
186 187
		| NETIF_F_VLAN_CHALLENGED
		| NETIF_F_LOOPBACK;
188 189 190
	dev->ethtool_ops	= eth_ops;
	dev->header_ops		= hdr_ops;
	dev->netdev_ops		= dev_ops;
191
	dev->needs_free_netdev	= true;
192 193 194 195 196 197 198 199 200 201
	dev->priv_destructor	= dev_destructor;
}

/* Setup callback given to alloc_netdev() for "lo".  The loopback device
 * is special: there is only one instance per network namespace.
 */
static void loopback_setup(struct net_device *dev)
{
	const unsigned int lo_mtu = 64 * 1024;

	gen_lo_setup(dev, lo_mtu, &loopback_ethtool_ops, &eth_header_ops,
		     &loopback_ops, loopback_dev_free);
}
203

204
/* Setup and register the loopback device. */
205
static __net_init int loopback_net_init(struct net *net)
L
Linus Torvalds 已提交
206
{
207 208 209 210
	struct net_device *dev;
	int err;

	err = -ENOMEM;
211
	dev = alloc_netdev(0, "lo", NET_NAME_UNKNOWN, loopback_setup);
212 213
	if (!dev)
		goto out;
214

215
	dev_net_set(dev, net);
216
	err = register_netdev(dev);
217
	if (err)
218
		goto out_free_netdev;
219

220
	BUG_ON(dev->ifindex != LOOPBACK_IFINDEX);
221
	net->loopback_dev = dev;
222
	return 0;
223 224 225

out_free_netdev:
	free_netdev(dev);
226
out:
O
Octavian Purdila 已提交
227
	if (net_eq(net, &init_net))
228 229
		panic("loopback: Failed to register netdevice: %d\n", err);
	return err;
230 231
}

232 233
/* Registered in net/core/dev.c */
struct pernet_operations __net_initdata loopback_net_ops = {
234
	.init = loopback_net_init,
235
};
236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265

/* blackhole netdevice */
static netdev_tx_t blackhole_netdev_xmit(struct sk_buff *skb,
					 struct net_device *dev)
{
	kfree_skb(skb);
	net_warn_ratelimited("%s(): Dropping skb.\n", __func__);
	return NETDEV_TX_OK;
}

/* net_device operations of the blackhole device: transmit only. */
static const struct net_device_ops blackhole_netdev_ops = {
	.ndo_start_xmit	= blackhole_netdev_xmit,
};

/* Setup callback for the blackhole device, a dummy device used
 * specifically for invalidated DSTs.  Unlike loopback it is not
 * per-namespace.  It gets the minimum MTU and no ethtool ops, header ops
 * or destructor.
 */
static void blackhole_netdev_setup(struct net_device *dev)
{
	gen_lo_setup(dev, ETH_MIN_MTU,
		     NULL,			/* eth_ops */
		     NULL,			/* hdr_ops */
		     &blackhole_netdev_ops,
		     NULL);			/* dev_destructor */
}

/* Initcall that sets up the global blackhole_netdev.
 *
 * The device is allocated, dev_init_scheduler() and dev_activate() are
 * run on it under the RTNL lock, and it is then flagged up/running and
 * attached to init_net.  register_netdev() is not called here.
 *
 * Returns 0 on success, -ENOMEM if the allocation fails.
 */
static int __init blackhole_netdev_init(void)
{
	struct net_device *bh_dev;

	bh_dev = alloc_netdev(0, "blackhole_dev", NET_NAME_UNKNOWN,
			      blackhole_netdev_setup);
	blackhole_netdev = bh_dev;
	if (!bh_dev)
		return -ENOMEM;

	rtnl_lock();
	dev_init_scheduler(bh_dev);
	dev_activate(bh_dev);
	rtnl_unlock();

	bh_dev->flags |= IFF_UP | IFF_RUNNING;
	dev_net_set(bh_dev, &init_net);

	return 0;
}

device_initcall(blackhole_netdev_init);