/*
 * Copyright (c) 2007-2012 Nicira, Inc.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of version 2 of the GNU General Public
 * License as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
 * 02110-1301, USA
 */

#include <linux/hardirq.h>
#include <linux/if_vlan.h>
#include <linux/kernel.h>
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
#include <linux/ethtool.h>
#include <linux/skbuff.h>

27 28
#include <net/dst.h>
#include <net/xfrm.h>
29
#include <net/rtnetlink.h>
30

31 32 33 34 35 36 37 38
#include "datapath.h"
#include "vport-internal_dev.h"
#include "vport-netdev.h"

/* Per-device private data of an internal device.  It occupies the
 * net_device private area (alloc_netdev() in internal_dev_create() sizes
 * that area with sizeof(struct internal_dev)) and is reached through
 * internal_dev_priv(). */
struct internal_dev {
	/* Set to the owning vport by internal_dev_create(). */
	struct vport *vport;
};

39 40
/* Forward declaration.  The initialised definition sits near the end of
 * this file, after the callbacks it points at; internal_dev_create()
 * needs the name before then. */
static struct vport_ops ovs_internal_vport_ops;

41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
/* Returns the struct internal_dev stored in @netdev's private area, i.e.
 * whatever netdev_priv() hands back for @netdev. */
static struct internal_dev *internal_dev_priv(struct net_device *netdev)
{
	return netdev_priv(netdev);
}

/* This function is only called by the kernel network layer.*/
static struct rtnl_link_stats64 *internal_dev_get_stats(struct net_device *netdev,
							struct rtnl_link_stats64 *stats)
{
	struct vport *vport = ovs_internal_dev_get_vport(netdev);
	struct ovs_vport_stats vport_stats;

	ovs_vport_get_stats(vport, &vport_stats);

	/* The tx and rx stats need to be swapped because the
	 * switch and host OS have opposite perspectives. */
	stats->rx_packets	= vport_stats.tx_packets;
	stats->tx_packets	= vport_stats.rx_packets;
	stats->rx_bytes		= vport_stats.tx_bytes;
	stats->tx_bytes		= vport_stats.rx_bytes;
	stats->rx_errors	= vport_stats.tx_errors;
	stats->tx_errors	= vport_stats.rx_errors;
	stats->rx_dropped	= vport_stats.tx_dropped;
	stats->tx_dropped	= vport_stats.rx_dropped;

	return stats;
}

/* Called with rcu_read_lock_bh. */
static int internal_dev_xmit(struct sk_buff *skb, struct net_device *netdev)
{
	rcu_read_lock();
73
	ovs_vport_receive(internal_dev_priv(netdev)->vport, skb, NULL);
74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92
	rcu_read_unlock();
	return 0;
}

/* ndo_open callback (see internal_dev_netdev_ops): calls
 * netif_start_queue() on @netdev.  Always returns 0. */
static int internal_dev_open(struct net_device *netdev)
{
	netif_start_queue(netdev);
	return 0;
}

/* ndo_stop callback (see internal_dev_netdev_ops): calls
 * netif_stop_queue() on @netdev.  Always returns 0. */
static int internal_dev_stop(struct net_device *netdev)
{
	netif_stop_queue(netdev);
	return 0;
}

static void internal_dev_getinfo(struct net_device *netdev,
				 struct ethtool_drvinfo *info)
{
93
	strlcpy(info->driver, "openvswitch", sizeof(info->driver));
94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121
}

/* ethtool operations for internal devices; do_setup() installs this table
 * as netdev->ethtool_ops. */
static const struct ethtool_ops internal_dev_ethtool_ops = {
	.get_drvinfo	= internal_dev_getinfo,
	.get_link	= ethtool_op_get_link,
};

/* ndo_change_mtu callback (see internal_dev_netdev_ops): stores @new_mtu
 * in @netdev->mtu.
 *
 * Returns 0 on success, or -EINVAL (leaving the MTU untouched) when
 * @new_mtu is below 68.  No upper bound is enforced here. */
static int internal_dev_change_mtu(struct net_device *netdev, int new_mtu)
{
	/* Smallest MTU this callback accepts. */
	enum { INTERNAL_DEV_MIN_MTU = 68 };

	if (new_mtu >= INTERNAL_DEV_MIN_MTU) {
		netdev->mtu = new_mtu;
		return 0;
	}

	return -EINVAL;
}

/* netdev->destructor hook (installed by do_setup()): releases the vport
 * attached to @dev, then @dev itself. */
static void internal_dev_destructor(struct net_device *dev)
{
	/* The vport pointer is read out of @dev's private data, so it has to
	 * be fetched before @dev is handed to free_netdev(). */
	ovs_vport_free(ovs_internal_dev_get_vport(dev));
	free_netdev(dev);
}

static const struct net_device_ops internal_dev_netdev_ops = {
	.ndo_open = internal_dev_open,
	.ndo_stop = internal_dev_stop,
	.ndo_start_xmit = internal_dev_xmit,
122
	.ndo_set_mac_address = eth_mac_addr,
123 124 125 126
	.ndo_change_mtu = internal_dev_change_mtu,
	.ndo_get_stats64 = internal_dev_get_stats,
};

127 128 129 130
/* rtnl link ops carrying the "openvswitch" link kind.  Registered by
 * ovs_internal_dev_rtnl_link_register() and attached to each internal
 * device by do_setup(). */
static struct rtnl_link_ops internal_dev_link_ops __read_mostly = {
	.kind = "openvswitch",
};

131 132 133 134 135 136 137
static void do_setup(struct net_device *netdev)
{
	ether_setup(netdev);

	netdev->netdev_ops = &internal_dev_netdev_ops;

	netdev->priv_flags &= ~IFF_TX_SKB_SHARING;
138
	netdev->priv_flags |= IFF_LIVE_ADDR_CHANGE | IFF_OPENVSWITCH;
139
	netdev->destructor = internal_dev_destructor;
140
	netdev->ethtool_ops = &internal_dev_ethtool_ops;
141
	netdev->rtnl_link_ops = &internal_dev_link_ops;
142 143 144
	netdev->tx_queue_len = 0;

	netdev->features = NETIF_F_LLTX | NETIF_F_SG | NETIF_F_FRAGLIST |
145 146
			   NETIF_F_HIGHDMA | NETIF_F_HW_CSUM |
			   NETIF_F_GSO_SOFTWARE | NETIF_F_GSO_ENCAP_ALL;
147 148

	netdev->vlan_features = netdev->features;
149
	netdev->hw_enc_features = netdev->features;
150
	netdev->features |= NETIF_F_HW_VLAN_CTAG_TX;
151
	netdev->hw_features = netdev->features & ~NETIF_F_LLTX;
152

153
	eth_hw_addr_random(netdev);
154 155 156 157 158 159 160 161
}

static struct vport *internal_dev_create(const struct vport_parms *parms)
{
	struct vport *vport;
	struct internal_dev *internal_dev;
	int err;

162
	vport = ovs_vport_alloc(0, &ovs_internal_vport_ops, parms);
163 164 165 166 167
	if (IS_ERR(vport)) {
		err = PTR_ERR(vport);
		goto error;
	}

168 169 170
	vport->dev = alloc_netdev(sizeof(struct internal_dev),
				  parms->name, NET_NAME_UNKNOWN, do_setup);
	if (!vport->dev) {
171 172 173 174
		err = -ENOMEM;
		goto error_free_vport;
	}

175 176
	dev_net_set(vport->dev, ovs_dp_get_net(vport->dp));
	internal_dev = internal_dev_priv(vport->dev);
177 178
	internal_dev->vport = vport;

179 180
	/* Restrict bridge port to current netns. */
	if (vport->port_no == OVSP_LOCAL)
181
		vport->dev->features |= NETIF_F_NETNS_LOCAL;
182

183
	rtnl_lock();
184
	err = register_netdevice(vport->dev);
185 186 187
	if (err)
		goto error_free_netdev;

188
	dev_set_promiscuity(vport->dev, 1);
189
	rtnl_unlock();
190
	netif_start_queue(vport->dev);
191 192 193 194

	return vport;

error_free_netdev:
195
	rtnl_unlock();
196
	free_netdev(vport->dev);
197 198 199 200 201 202 203 204
error_free_vport:
	ovs_vport_free(vport);
error:
	return ERR_PTR(err);
}

static void internal_dev_destroy(struct vport *vport)
{
205
	netif_stop_queue(vport->dev);
206
	rtnl_lock();
207
	dev_set_promiscuity(vport->dev, -1);
208 209

	/* unregister_netdevice() waits for an RCU grace period. */
210
	unregister_netdevice(vport->dev);
211 212

	rtnl_unlock();
213 214 215 216
}

static int internal_dev_recv(struct vport *vport, struct sk_buff *skb)
{
217
	struct net_device *netdev = vport->dev;
218 219
	int len;

220 221 222 223 224
	if (unlikely(!(netdev->flags & IFF_UP))) {
		kfree_skb(skb);
		return 0;
	}

225
	len = skb->len;
226 227 228 229 230

	skb_dst_drop(skb);
	nf_reset(skb);
	secpath_reset(skb);

231 232 233
	skb->dev = netdev;
	skb->pkt_type = PACKET_HOST;
	skb->protocol = eth_type_trans(skb, netdev);
234
	skb_postpull_rcsum(skb, eth_hdr(skb), ETH_HLEN);
235 236 237 238 239 240

	netif_rx(skb);

	return len;
}

241
static struct vport_ops ovs_internal_vport_ops = {
242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259
	.type		= OVS_VPORT_TYPE_INTERNAL,
	.create		= internal_dev_create,
	.destroy	= internal_dev_destroy,
	.send		= internal_dev_recv,
};

/* Returns nonzero if @netdev is an internal device, i.e. its netdev_ops
 * pointer is the internal_dev_netdev_ops table that do_setup() installs;
 * returns 0 otherwise. */
int ovs_is_internal_dev(const struct net_device *netdev)
{
	return netdev->netdev_ops == &internal_dev_netdev_ops;
}

/* Returns the vport stored in @netdev's private data, or NULL when
 * @netdev is not an internal device (see ovs_is_internal_dev()). */
struct vport *ovs_internal_dev_get_vport(struct net_device *netdev)
{
	/* Only an internal device has a struct internal_dev in its private
	 * area, so check before reading it. */
	if (ovs_is_internal_dev(netdev))
		return internal_dev_priv(netdev)->vport;

	return NULL;
}
260 261 262

/* Registers the "openvswitch" rtnl link ops and then the internal vport
 * ops.
 *
 * Returns the result of the last registration attempted: negative on
 * failure.  If the vport ops registration fails, the link ops
 * registration is rolled back, so a failure leaves nothing registered. */
int ovs_internal_dev_rtnl_link_register(void)
{
	int ret;

	ret = rtnl_link_register(&internal_dev_link_ops);
	if (ret < 0)
		return ret;

	ret = ovs_vport_ops_register(&ovs_internal_vport_ops);
	if (ret >= 0)
		return ret;

	/* Second step failed: undo the first. */
	rtnl_link_unregister(&internal_dev_link_ops);
	return ret;
}

void ovs_internal_dev_rtnl_link_unregister(void)
{
278
	ovs_vport_ops_unregister(&ovs_internal_vport_ops);
279 280
	rtnl_link_unregister(&internal_dev_link_ops);
}