2 * Copyright (c) 2009, 2010 Nicira Networks.
3 * Distributed under the terms of the GNU GPL version 2.
5 * Significant portions of this file may be copied from parts of the Linux
6 * kernel, by Linus Torvalds and others.
9 #include <linux/kernel.h>
10 #include <linux/netdevice.h>
11 #include <linux/etherdevice.h>
12 #include <linux/ethtool.h>
13 #include <linux/percpu.h>
14 #include <linux/rcupdate.h>
15 #include <linux/skbuff.h>
18 #include "openvswitch/internal_dev.h"
19 #include "vport-internal_dev.h"
20 #include "vport-netdev.h"
/* Receive/transmit packet and byte counters.
 * NOTE(review): the enclosing struct header is not visible in this extract;
 * these appear to be the members of 'struct pcpu_lstats', which is used below
 * for the per-CPU 'lstats' counters and for 'extra_stats'. */
/* Incremented per packet in internal_dev_recv(). */
23 unsigned long rx_packets;
/* Grows by the packet length in internal_dev_recv(). */
24 unsigned long rx_bytes;
/* Incremented per packet in internal_dev_xmit(). */
25 unsigned long tx_packets;
/* Grows by skb->len in internal_dev_xmit(). */
26 unsigned long tx_bytes;
/* Members of the per-device private data that internal_dev_priv() returns.
 * NOTE(review): the struct header and any shorter members are not visible in
 * this extract (code further down also dereferences a 'vport' member). */
/* Totals handed out by internal_dev_get_stats(), which rewrites the rx/tx
 * byte and packet fields on every call. */
32 struct net_device_stats stats;
/* Per-CPU counters; allocated in internal_dev_init() with alloc_percpu() and
 * released in internal_dev_free(). */
33 struct pcpu_lstats *lstats;
35 /* This is warty support for XAPI, which does not support summing bond
36 * device statistics itself. 'extra_stats' can be set by userspace via
37 * the INTERNAL_DEV_SET_STATS ioctl and, if they are, then they are added to
38 * the real device stats. */
39 struct pcpu_lstats extra_stats;
/* Tentative definition so that internal_dev_create() can take the address of
 * the ops table before its initialized definition later in this file. */
42 struct vport_ops internal_vport_ops;
/* Typed wrapper around netdev_priv(): returns the private-data pointer of
 * 'netdev' as a struct internal_dev pointer. */
44 static inline struct internal_dev *internal_dev_priv(struct net_device *netdev)
46 return netdev_priv(netdev);
/* Statistics handler (installed as get_stats / ndo_get_stats).
 *
 * Rebuilds the rx/tx byte and packet totals in internal_dev->stats: they are
 * first overwritten with the userspace-supplied 'extra_stats' and then every
 * possible CPU's 'lstats' counters are added on top.  No other field of
 * 'stats' is written by the visible code.
 *
 * NOTE(review): the declaration of 'i' and the return statement are not
 * visible in this extract; presumably the function returns 'stats'. */
49 static struct net_device_stats *internal_dev_get_stats(struct net_device *netdev)
51 struct internal_dev *internal_dev = internal_dev_priv(netdev);
52 struct net_device_stats *stats;
55 stats = &internal_dev->stats;
/* Start from extra_stats (plain assignment, so earlier totals are discarded). */
56 stats->rx_bytes = internal_dev->extra_stats.rx_bytes;
57 stats->rx_packets = internal_dev->extra_stats.rx_packets;
58 stats->tx_bytes = internal_dev->extra_stats.tx_bytes;
59 stats->tx_packets = internal_dev->extra_stats.tx_packets;
/* Accumulate the per-CPU counters maintained by xmit/recv. */
60 for_each_possible_cpu(i) {
61 const struct pcpu_lstats *lb_stats;
63 lb_stats = per_cpu_ptr(internal_dev->lstats, i);
64 stats->rx_bytes += lb_stats->rx_bytes;
65 stats->rx_packets += lb_stats->rx_packets;
66 stats->tx_bytes += lb_stats->tx_bytes;
67 stats->tx_packets += lb_stats->tx_packets;
/* Set-MAC-address handler (set_mac_address / ndo_set_mac_address).
 *
 * 'p' is treated as a struct sockaddr.  Returns -EADDRNOTAVAIL when
 * is_valid_ether_addr() rejects addr->sa_data; otherwise copies
 * dev->addr_len bytes of it into dev->dev_addr.
 *
 * NOTE(review): the success return is not visible in this extract. */
72 static int internal_dev_mac_addr(struct net_device *dev, void *p)
74 struct sockaddr *addr = p;
76 if (!is_valid_ether_addr(addr->sa_data))
77 return -EADDRNOTAVAIL;
78 memcpy(dev->dev_addr, addr->sa_data, dev->addr_len);
/* Transmit handler (hard_start_xmit / ndo_start_xmit).
 *
 * A packet the network stack sends on this device is counted in the current
 * CPU's tx counters and then passed to vport_receive() on the device's vport.
 *
 * NOTE(review): the return statement(s) are not visible in this extract. */
82 /* Called with rcu_read_lock and bottom-halves disabled. */
83 static int internal_dev_xmit(struct sk_buff *skb, struct net_device *netdev)
85 struct internal_dev *internal_dev = internal_dev_priv(netdev);
86 struct vport *vport = internal_dev_get_vport(netdev);
87 struct pcpu_lstats *lb_stats;
89 /* We need our own clone. */
/* NOTE(review): skb_share_check() can return NULL; the NULL check is
 * presumably on a line missing from this extract -- confirm. */
90 skb = skb_share_check(skb, GFP_ATOMIC);
/* Account the packet on this CPU's counters. */
94 lb_stats = per_cpu_ptr(internal_dev->lstats, smp_processor_id());
95 lb_stats->tx_packets++;
96 lb_stats->tx_bytes += skb->len;
98 skb_reset_mac_header(skb);
99 compute_ip_summed(skb, true);
101 vport_receive(vport, skb);
/* Open handler (open / ndo_open): starts the device's transmit queue.
 * Its address is also the identity check used by is_internal_dev() when
 * HAVE_NET_DEVICE_OPS is not defined.
 * NOTE(review): the return statement is not visible in this extract. */
106 static int internal_dev_open(struct net_device *netdev)
108 netif_start_queue(netdev);
/* Stop handler (stop / ndo_stop): stops the device's transmit queue.
 * NOTE(review): the return statement is not visible in this extract. */
112 static int internal_dev_stop(struct net_device *netdev)
114 netif_stop_queue(netdev);
/* ethtool get_drvinfo handler.
 *
 * Reports the driver name "openvswitch" and a bus_info string of the form
 * "<dp_idx>.<port_no>" taken from the dp_port behind this device's vport.
 *
 * NOTE(review): strcpy()/sprintf() are unbounded writes into fixed-size
 * ethtool_drvinfo fields; the current strings are short, but bounded variants
 * would be safer.  Lines are missing from this extract between the visible
 * statements, so a NULL guard on 'dp_port' may exist but cannot be confirmed
 * here. */
118 static void internal_dev_getinfo(struct net_device *netdev,
119 struct ethtool_drvinfo *info)
121 struct dp_port *dp_port = vport_get_dp_port(internal_dev_get_vport(netdev));
123 strcpy(info->driver, "openvswitch");
125 sprintf(info->bus_info, "%d.%d", dp_port->dp->dp_idx, dp_port->port_no);
/* ethtool operations installed on the device by do_setup() through
 * SET_ETHTOOL_OPS().  Only get_drvinfo is implemented in this file; every
 * other entry is an ethtool_op_* helper.  The scatter-gather, tx-checksum and
 * TSO accessors mirror the NETIF_F_SG / NETIF_F_HW_CSUM / NETIF_F_TSO feature
 * bits that do_setup() advertises. */
128 static struct ethtool_ops internal_dev_ethtool_ops = {
129 .get_drvinfo = internal_dev_getinfo,
130 .get_link = ethtool_op_get_link,
131 .get_sg = ethtool_op_get_sg,
132 .set_sg = ethtool_op_set_sg,
133 .get_tx_csum = ethtool_op_get_tx_csum,
134 .set_tx_csum = ethtool_op_set_tx_hw_csum,
135 .get_tso = ethtool_op_get_tso,
136 .set_tso = ethtool_op_set_tso,
/* MTU change handler (change_mtu / ndo_change_mtu).
 *
 * The visible code compares 'new_mtu' against dp_min_mtu() of the datapath
 * that owns this device's port and stores 'new_mtu' in netdev->mtu.
 *
 * NOTE(review): the statement guarded by the comparison, any other range
 * checks and the return values are not visible in this extract; presumably
 * an MTU above dp_min_mtu() is rejected -- confirm against the full file. */
139 static int internal_dev_change_mtu(struct net_device *netdev, int new_mtu)
141 struct dp_port *dp_port = vport_get_dp_port(internal_dev_get_vport(netdev));
147 if (new_mtu > dp_min_mtu(dp_port->dp))
151 netdev->mtu = new_mtu;
/* Init handler (init / ndo_init): allocates the per-CPU 'lstats' counters
 * that internal_dev_xmit(), internal_dev_recv() and internal_dev_get_stats()
 * use.
 *
 * NOTE(review): the body of the allocation-failure branch and the success
 * return are not visible in this extract; presumably an error code is
 * returned when alloc_percpu() fails. */
155 static int internal_dev_init(struct net_device *netdev)
157 struct internal_dev *internal_dev = internal_dev_priv(netdev);
159 internal_dev->lstats = alloc_percpu(struct pcpu_lstats);
160 if (!internal_dev->lstats)
/* Destructor installed as netdev->destructor by do_setup(): releases the
 * per-CPU counters allocated in internal_dev_init().
 *
 * NOTE(review): any further teardown (e.g. freeing the net_device itself)
 * would be on lines not visible in this extract. */
166 static void internal_dev_free(struct net_device *netdev)
168 struct internal_dev *internal_dev = internal_dev_priv(netdev);
170 free_percpu(internal_dev->lstats);
/* ioctl handler (do_ioctl / ndo_do_ioctl).
 *
 * INTERNAL_DEV_SET_STATS: copies a struct internal_dev_stats from the
 * userspace pointer ifr->ifr_data and overwrites the device's 'extra_stats'
 * with its rx/tx byte and packet counts; internal_dev_get_stats() adds these
 * to the reported totals.
 *
 * The final visible statement forwards the request to dp_ioctl_hook().
 *
 * NOTE(review): the error return for a failed copy_from_user() and whatever
 * follows the four assignments inside the 'if' are not visible in this
 * extract, so it cannot be confirmed here whether SET_STATS also falls
 * through to dp_ioctl_hook(). */
174 static int internal_dev_do_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
176 struct internal_dev *internal_dev = internal_dev_priv(dev);
178 if (cmd == INTERNAL_DEV_SET_STATS) {
179 struct internal_dev_stats stats;
181 if (copy_from_user(&stats, ifr->ifr_data, sizeof(stats)))
184 internal_dev->extra_stats.rx_bytes = stats.rx_bytes;
185 internal_dev->extra_stats.rx_packets = stats.rx_packets;
186 internal_dev->extra_stats.tx_bytes = stats.tx_bytes;
187 internal_dev->extra_stats.tx_packets = stats.tx_packets;
193 return dp_ioctl_hook(dev, ifr, cmd);
/* Handler table used when HAVE_NET_DEVICE_OPS is defined.  do_setup() installs
 * this table in that configuration and otherwise assigns the same handlers to
 * the individual net_device function-pointer fields.  is_internal_dev() uses
 * the table's address to recognise devices created by this file.
 * NOTE(review): the closing brace and #endif are not visible in this
 * extract. */
197 #ifdef HAVE_NET_DEVICE_OPS
198 static const struct net_device_ops internal_dev_netdev_ops = {
199 .ndo_init = internal_dev_init,
200 .ndo_open = internal_dev_open,
201 .ndo_stop = internal_dev_stop,
202 .ndo_start_xmit = internal_dev_xmit,
203 .ndo_set_mac_address = internal_dev_mac_addr,
204 .ndo_do_ioctl = internal_dev_do_ioctl,
205 .ndo_change_mtu = internal_dev_change_mtu,
206 .ndo_get_stats = internal_dev_get_stats,
/* Setup callback passed to alloc_netdev() by internal_dev_create().
 *
 * Installs this file's handlers (via netdev_ops when HAVE_NET_DEVICE_OPS is
 * defined, otherwise via the individual net_device fields), the destructor
 * and the ethtool ops, then sets queue length, interface flags and feature
 * bits and generates a MAC address with vport_gen_ether_addr().
 *
 * NOTE(review): the return-type line, the #else/#endif lines and any other
 * short statements of this function are not visible in this extract. */
211 do_setup(struct net_device *netdev)
215 #ifdef HAVE_NET_DEVICE_OPS
216 netdev->netdev_ops = &internal_dev_netdev_ops;
/* The assignments below mirror internal_dev_netdev_ops entry for entry;
 * presumably they form the branch for kernels without net_device_ops. */
218 netdev->do_ioctl = internal_dev_do_ioctl;
219 netdev->get_stats = internal_dev_get_stats;
220 netdev->hard_start_xmit = internal_dev_xmit;
221 netdev->open = internal_dev_open;
222 netdev->stop = internal_dev_stop;
223 netdev->set_mac_address = internal_dev_mac_addr;
224 netdev->change_mtu = internal_dev_change_mtu;
225 netdev->init = internal_dev_init;
/* Frees the per-CPU counters allocated by internal_dev_init(). */
228 netdev->destructor = internal_dev_free;
229 SET_ETHTOOL_OPS(netdev, &internal_dev_ethtool_ops);
230 netdev->tx_queue_len = 0;
/* Plain assignment: replaces whatever flags were set before this point. */
232 netdev->flags = IFF_BROADCAST | IFF_MULTICAST;
233 netdev->features = NETIF_F_LLTX | NETIF_F_SG | NETIF_F_HIGHDMA
234 | NETIF_F_HW_CSUM | NETIF_F_TSO;
236 vport_gen_ether_addr(netdev->dev_addr);
/* vport 'create' operation for internal devices.
 *
 * Visible steps:
 *   1. vport_alloc() a vport with room for a struct netdev_vport, bound to
 *      internal_vport_ops.
 *   2. alloc_netdev() a net_device named 'name' whose private area is a
 *      struct internal_dev and whose setup callback is do_setup().
 *   3. Store the vport back-pointer in the private area (read later through
 *      internal_dev_get_vport()).
 *   4. register_netdevice() the device; a failure path frees it again with
 *      free_netdev().
 *
 * 'config' is not referenced by any visible line.
 *
 * NOTE(review): the declarations of 'vport' and 'err', the error tests, the
 * goto labels and all return statements are not visible in this extract.
 * register_netdevice() (unlike register_netdev()) expects the caller to hold
 * the RTNL lock -- presumably guaranteed by the caller; confirm. */
239 static struct vport *
240 internal_dev_create(const char *name, const void __user *config)
243 struct netdev_vport *netdev_vport;
244 struct internal_dev *internal_dev;
247 vport = vport_alloc(sizeof(struct netdev_vport), &internal_vport_ops);
249 err = PTR_ERR(vport);
253 netdev_vport = netdev_vport_priv(vport);
255 netdev_vport->dev = alloc_netdev(sizeof(struct internal_dev), name, do_setup);
256 if (!netdev_vport->dev) {
258 goto error_free_vport;
261 internal_dev = internal_dev_priv(netdev_vport->dev);
262 internal_dev->vport = vport;
264 err = register_netdevice(netdev_vport->dev);
266 goto error_free_netdev;
271 free_netdev(netdev_vport->dev);
/* vport 'destroy' operation: unregisters the net_device that backs 'vport'.
 *
 * NOTE(review): the return-type line, any release of the vport itself and
 * the return statement are not visible in this extract. */
279 internal_dev_destroy(struct vport *vport)
281 struct netdev_vport *netdev_vport = netdev_vport_priv(vport);
283 unregister_netdevice(netdev_vport->dev);
/* vport 'attach' operation: takes one promiscuity reference on the backing
 * net_device; internal_dev_detach() drops it again.
 *
 * NOTE(review): the return-type line and any statements after the comment
 * below (including the return) are not visible in this extract. */
290 internal_dev_attach(struct vport *vport)
292 struct netdev_vport *netdev_vport = netdev_vport_priv(vport);
294 dev_set_promiscuity(netdev_vport->dev, 1);
296 /* It would make sense to assign dev->br_port here too, but
297 * that causes packets received on internal ports to get caught
298 * in netdev_frame_hook(). In turn netdev_frame_hook() can reject them
299 * back to the network stack, but that's a waste of time. */
/* vport 'detach' operation: drops the promiscuity reference taken by
 * internal_dev_attach() and disables transmission on the backing net_device.
 *
 * NOTE(review): the return-type line and the return statement are not
 * visible in this extract. */
305 internal_dev_detach(struct vport *vport)
307 struct netdev_vport *netdev_vport = netdev_vport_priv(vport);
309 dev_set_promiscuity(netdev_vport->dev, -1);
/* NOTE(review): the visible internal_dev_xmit() obtains its vport through
 * internal_dev_get_vport(), not p->dp->ports[]; the wording of the comment
 * below may predate that change -- confirm and update. */
311 /* Make sure that no packets arrive from now on, since
312 * internal_dev_xmit() will try to find itself through
313 * p->dp->ports[], and we're about to set that to null. */
314 netif_tx_disable(netdev_vport->dev);
/* vport 'send' operation (see internal_vport_ops): a packet sent out of this
 * vport is prepared as a packet received on the internal net_device.
 *
 * Visible steps: mark the skb PACKET_HOST, set its protocol with
 * eth_type_trans(), refresh netdev->last_rx, and add the packet to the
 * current CPU's rx counters.
 *
 * NOTE(review): the return-type line, the definition and assignment of
 * 'len', the call that hands the skb to the network stack and the return
 * value are not visible in this extract.  Presumably 'len' is captured from
 * the skb before eth_type_trans() adjusts it -- confirm. */
320 internal_dev_recv(struct vport *vport, struct sk_buff *skb)
322 struct net_device *netdev = netdev_vport_priv(vport)->dev;
323 struct internal_dev *internal_dev = internal_dev_priv(netdev);
324 struct pcpu_lstats *lb_stats;
329 skb->pkt_type = PACKET_HOST;
330 skb->protocol = eth_type_trans(skb, netdev);
336 netdev->last_rx = jiffies;
/* Account the packet on this CPU's counters. */
339 lb_stats = per_cpu_ptr(internal_dev->lstats, smp_processor_id());
340 lb_stats->rx_packets++;
341 lb_stats->rx_bytes += len;
/* vport operations for internal devices.
 *
 * create/destroy/attach/detach/send are implemented in this file; the
 * remaining callbacks are netdev_* helpers (presumably declared in
 * "vport-netdev.h").  Note that .send is internal_dev_recv(): sending a packet
 * to this vport means the internal net_device receives it.
 *
 * NOTE(review): some initializer lines (and the closing brace) are not
 * visible in this extract. */
347 struct vport_ops internal_vport_ops = {
349 .flags = VPORT_F_REQUIRED,
350 .create = internal_dev_create,
351 .destroy = internal_dev_destroy,
352 .attach = internal_dev_attach,
353 .detach = internal_dev_detach,
354 .set_mtu = netdev_set_mtu,
355 .set_addr = netdev_set_addr,
356 .get_name = netdev_get_name,
357 .get_addr = netdev_get_addr,
358 .get_kobj = netdev_get_kobj,
359 .get_stats = netdev_get_stats,
360 .get_dev_flags = netdev_get_dev_flags,
361 .is_running = netdev_is_running,
362 .get_operstate = netdev_get_operstate,
363 .get_ifindex = netdev_get_ifindex,
364 .get_iflink = netdev_get_iflink,
365 .get_mtu = netdev_get_mtu,
366 .send = internal_dev_recv,
/* Returns nonzero if 'netdev' was set up by this file's do_setup().
 *
 * With HAVE_NET_DEVICE_OPS the test compares the device's ops table against
 * internal_dev_netdev_ops; the other visible return compares its open handler
 * against internal_dev_open (the #else/#endif lines are not visible in this
 * extract). */
369 int is_internal_dev(const struct net_device *netdev)
371 #ifdef HAVE_NET_DEVICE_OPS
372 return netdev->netdev_ops == &internal_dev_netdev_ops;
374 return netdev->open == internal_dev_open;
/* Returns nonzero if 'vport' uses internal_vport_ops, i.e. was allocated by
 * internal_dev_create().
 * NOTE(review): the return-type line is not visible in this extract. */
379 is_internal_vport(const struct vport *vport)
381 return vport->ops == &internal_vport_ops;
/* Returns the vport back-pointer stored in the private data of 'netdev' by
 * internal_dev_create().
 *
 * The pointer is read with rcu_dereference(), so callers are presumably
 * expected to be inside an RCU read-side critical section (internal_dev_xmit()
 * documents that it is) -- confirm for the other callers.
 * NOTE(review): the return-type line is not visible in this extract. */
385 internal_dev_get_vport(struct net_device *netdev)
387 struct internal_dev *internal_dev = internal_dev_priv(netdev);
388 return rcu_dereference(internal_dev->vport);