2
0
mirror of https://github.com/openvswitch/ovs synced 2025-08-22 09:58:01 +00:00
ovs/lib/netdev-bsd.c
Ilya Maximets 77ac0b28c8 netdev: Always clear struct ifreq before ioctl.
It's not nice to send random stack memory to a kernel over ioctl:

  Uninitialized bytes in ioctl_common_pre
    at offset 20 inside [0x7fff8899f3c0, 40)
  WARNING: MemorySanitizer: use-of-uninitialized-value
   0 0x1180b7 in af_inet_ioctl lib/socket-util-unix.c:417:15
   1 0x1180ff in af_inet_ifreq_ioctl lib/socket-util-unix.c:428:13
   2 0x11e4fd in netdev_linux_set_mtu lib/netdev-linux.c:2005:13
   3 0xba250b in netdev_set_mtu lib/netdev.c:1132:30
   4 0x59a19f in update_mtu_ofproto ofproto/ofproto.c:3042:18
   5 0x596947 in update_mtu ofproto/ofproto.c:3024:5
   6 0x5976d6 in ofport_install ofproto/ofproto.c:2617:5
   7 0x572e96 in update_port ofproto/ofproto.c:2893:21
   8 0x57636b in ofproto_port_add ofproto/ofproto.c:2208:17
   9 0x4f9e0b in iface_do_create vswitchd/bridge.c:2203:13
  10 0x4f7f43 in iface_create vswitchd/bridge.c:2246:13
  11 0x4f7a63 in bridge_add_ports__ vswitchd/bridge.c:1225:21
  12 0x4d8ea4 in bridge_add_ports vswitchd/bridge.c:1241:5
  13 0x4cce3a in bridge_reconfigure vswitchd/bridge.c:952:9
  14 0x4ca156 in bridge_run vswitchd/bridge.c:3439:9
  15 0x5278e7 in main vswitchd/ovs-vswitchd.c:137:9
  16 0x7f9def in __libc_start_call_main
  17 0x7f9def in __libc_start_main@GLIBC_2.2.5
  18 0x432b14 in _start (vswitchd/ovs-vswitchd+0x432b14)

We do already initialize this structure for a few ioctls, let's
do that for all of them.

Acked-by: Eelco Chaudron <echaudro@redhat.com>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>
2024-12-02 20:22:01 +01:00

1752 lines
48 KiB
C
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

/*
* Copyright (c) 2011, 2013, 2014 Gaetano Catalli.
* Copyright (c) 2013, 2014 YAMAMOTO Takashi.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#if !defined(__MACH__)
#include <config.h>
#include "netdev-provider.h"
#include <stdlib.h>
#include <errno.h>
#include <fcntl.h>
#include <sys/types.h>
#include <sys/time.h>
#include <sys/ioctl.h>
#include <sys/socket.h>
#include <sys/sockio.h>
#include <net/bpf.h>
#include <ifaddrs.h>
#include <pcap/pcap.h>
#include <net/if.h>
#include <net/if_dl.h>
#include <net/if_media.h>
#include <net/if_tap.h>
#include <netinet/in.h>
#ifdef HAVE_NET_IF_MIB_H
#include <net/if_mib.h>
#endif
#include <poll.h>
#include <string.h>
#include <unistd.h>
#include <sys/sysctl.h>
#if defined(__NetBSD__)
#include <net/route.h>
#include <netinet/if_inarp.h>
#endif
#include "rtbsd.h"
#include "coverage.h"
#include "dp-packet.h"
#include "dpif-netdev.h"
#include "openvswitch/dynamic-string.h"
#include "fatal-signal.h"
#include "openflow/openflow.h"
#include "ovs-thread.h"
#include "packets.h"
#include "openvswitch/poll-loop.h"
#include "openvswitch/shash.h"
#include "socket-util.h"
#include "svec.h"
#include "util.h"
#include "openvswitch/vlog.h"
VLOG_DEFINE_THIS_MODULE(netdev_bsd);
struct netdev_rxq_bsd {
struct netdev_rxq up;
/* Packet capture descriptor for a system network device.
* For a tap device this is NULL. */
pcap_t *pcap_handle;
/* Selectable file descriptor for the network device.
* This descriptor will be used for polling operations. */
int fd;
};
struct netdev_bsd {
struct netdev up;
/* Never changes after initialization. */
char *kernel_name;
/* Protects all members below. */
struct ovs_mutex mutex;
unsigned int cache_valid;
int ifindex;
struct eth_addr etheraddr;
int mtu;
int carrier;
int tap_fd; /* TAP character device, if any, otherwise -1. */
/* Used for sending packets on non-tap devices. */
pcap_t *pcap;
int fd;
};
enum {
VALID_IFINDEX = 1 << 0,
VALID_ETHERADDR = 1 << 1,
VALID_IN = 1 << 2,
VALID_MTU = 1 << 3,
VALID_CARRIER = 1 << 4
};
#define PCAP_SNAPLEN 2048
/*
* Notifier used to invalidate device informations in case of status change.
*
* It will be registered with a 'rtbsd_notifier_register()' when the first
* device will be created with the call of either 'netdev_bsd_tap_create()' or
* 'netdev_bsd_system_create()'.
*
* The callback associated with this notifier ('netdev_bsd_cache_cb()') will
* invalidate cached information about the device.
*/
static struct rtbsd_notifier netdev_bsd_cache_notifier;
static int cache_notifier_refcount;
static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(5, 20);
static void destroy_tap(int fd, const char *name);
static int get_flags(const struct netdev *, int *flagsp);
static int set_flags(const char *, int flags);
static int do_set_addr(struct netdev *netdev,
unsigned long ioctl_nr, const char *ioctl_name,
struct in_addr addr);
static int get_etheraddr(const char *netdev_name, struct eth_addr *ea);
static int set_etheraddr(const char *netdev_name, int hwaddr_family,
int hwaddr_len, const struct eth_addr);
static int get_ifindex(const struct netdev *, int *ifindexp);
static int ifr_get_flags(const struct ifreq *);
static void ifr_set_flags(struct ifreq *, int flags);
#ifdef __NetBSD__
static int af_link_ioctl(unsigned long command, const void *arg);
#endif
static void netdev_bsd_run(const struct netdev_class *);
static int netdev_bsd_get_mtu(const struct netdev *netdev_, int *mtup);
static bool
is_netdev_bsd_class(const struct netdev_class *netdev_class)
{
return netdev_class->run == netdev_bsd_run;
}
static struct netdev_bsd *
netdev_bsd_cast(const struct netdev *netdev)
{
ovs_assert(is_netdev_bsd_class(netdev_get_class(netdev)));
return CONTAINER_OF(netdev, struct netdev_bsd, up);
}
static struct netdev_rxq_bsd *
netdev_rxq_bsd_cast(const struct netdev_rxq *rxq)
{
ovs_assert(is_netdev_bsd_class(netdev_get_class(rxq->netdev)));
return CONTAINER_OF(rxq, struct netdev_rxq_bsd, up);
}
static const char *
netdev_get_kernel_name(const struct netdev *netdev)
{
return netdev_bsd_cast(netdev)->kernel_name;
}
/*
* Perform periodic work needed by netdev. In BSD netdevs it checks for any
* interface status changes, and eventually calls all the user callbacks.
*/
static void
netdev_bsd_run(const struct netdev_class *netdev_class OVS_UNUSED)
{
rtbsd_notifier_run();
}
/*
* Arranges for poll_block() to wake up if the "run" member function needs to
* be called.
*/
static void
netdev_bsd_wait(const struct netdev_class *netdev_class OVS_UNUSED)
{
rtbsd_notifier_wait();
}
/* Invalidate cache in case of interface status change. */
static void
netdev_bsd_cache_cb(const struct rtbsd_change *change,
void *aux OVS_UNUSED)
{
struct netdev_bsd *dev;
if (change) {
struct netdev *base_dev = netdev_from_name(change->if_name);
if (base_dev) {
const struct netdev_class *netdev_class =
netdev_get_class(base_dev);
if (is_netdev_bsd_class(netdev_class)) {
dev = netdev_bsd_cast(base_dev);
dev->cache_valid = 0;
netdev_change_seq_changed(base_dev);
}
netdev_close(base_dev);
}
} else {
/*
* XXX the API is lacking, we should be able to iterate on the list of
* netdevs without having to store the info in a temp shash.
*/
struct shash device_shash;
struct shash_node *node;
shash_init(&device_shash);
netdev_get_devices(&netdev_bsd_class, &device_shash);
SHASH_FOR_EACH (node, &device_shash) {
struct netdev *netdev = node->data;
dev = netdev_bsd_cast(netdev);
dev->cache_valid = 0;
netdev_change_seq_changed(netdev);
netdev_close(netdev);
}
shash_destroy(&device_shash);
}
}
static int
cache_notifier_ref(void)
{
int ret = 0;
if (!cache_notifier_refcount) {
ret = rtbsd_notifier_register(&netdev_bsd_cache_notifier,
netdev_bsd_cache_cb, NULL);
if (ret) {
return ret;
}
}
cache_notifier_refcount++;
return 0;
}
static int
cache_notifier_unref(void)
{
cache_notifier_refcount--;
if (cache_notifier_refcount == 0) {
rtbsd_notifier_unregister(&netdev_bsd_cache_notifier);
}
return 0;
}
static struct netdev *
netdev_bsd_alloc(void)
{
struct netdev_bsd *netdev = xzalloc(sizeof *netdev);
return &netdev->up;
}
static int
netdev_bsd_construct_system(struct netdev *netdev_)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
enum netdev_flags flags;
int error;
error = cache_notifier_ref();
if (error) {
return error;
}
ovs_mutex_init(&netdev->mutex);
netdev->tap_fd = -1;
netdev->kernel_name = xstrdup(netdev_->name);
/* Verify that the netdev really exists by attempting to read its flags */
error = netdev_get_flags(netdev_, &flags);
if (error == ENXIO) {
free(netdev->kernel_name);
cache_notifier_unref();
ovs_mutex_destroy(&netdev->mutex);
return error;
}
return 0;
}
static int
netdev_bsd_construct_tap(struct netdev *netdev_)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
const char *name = netdev_->name;
int error = 0;
struct ifreq ifr;
char *kernel_name = NULL;
error = cache_notifier_ref();
if (error) {
goto error;
}
memset(&ifr, 0, sizeof(ifr));
/* Create a tap device by opening /dev/tap. The TAPGIFNAME ioctl is used
* to retrieve the name of the tap device. */
ovs_mutex_init(&netdev->mutex);
netdev->tap_fd = open("/dev/tap", O_RDWR);
if (netdev->tap_fd < 0) {
error = errno;
VLOG_WARN("opening \"/dev/tap\" failed: %s", ovs_strerror(error));
goto error_unref_notifier;
}
/* Retrieve tap name (e.g. tap0) */
if (ioctl(netdev->tap_fd, TAPGIFNAME, &ifr) == -1) {
/* XXX Need to destroy the device? */
error = errno;
close(netdev->tap_fd);
goto error_unref_notifier;
}
/* Change the name of the tap device */
#if defined(SIOCSIFNAME)
ifr.ifr_data = (void *)name;
error = af_inet_ioctl(SIOCSIFNAME, &ifr);
if (error) {
destroy_tap(netdev->tap_fd, ifr.ifr_name);
goto error_unref_notifier;
}
kernel_name = xstrdup(name);
#else
/*
* NetBSD doesn't support inteface renaming.
*/
VLOG_INFO("tap %s is created for bridge %s", ifr.ifr_name, name);
kernel_name = xstrdup(ifr.ifr_name);
#endif
/* set non-blocking. */
error = set_nonblocking(netdev->tap_fd);
if (error) {
destroy_tap(netdev->tap_fd, kernel_name);
goto error_unref_notifier;
}
/* Turn device UP */
ifr_set_flags(&ifr, IFF_UP);
ovs_strlcpy(ifr.ifr_name, kernel_name, sizeof ifr.ifr_name);
error = af_inet_ioctl(SIOCSIFFLAGS, &ifr);
if (error) {
destroy_tap(netdev->tap_fd, kernel_name);
goto error_unref_notifier;
}
netdev->kernel_name = kernel_name;
return 0;
error_unref_notifier:
ovs_mutex_destroy(&netdev->mutex);
cache_notifier_unref();
error:
free(kernel_name);
return error;
}
static void
netdev_bsd_destruct(struct netdev *netdev_)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
cache_notifier_unref();
if (netdev->tap_fd >= 0) {
destroy_tap(netdev->tap_fd, netdev_get_kernel_name(netdev_));
}
if (netdev->pcap) {
pcap_close(netdev->pcap);
}
free(netdev->kernel_name);
ovs_mutex_destroy(&netdev->mutex);
}
static void
netdev_bsd_dealloc(struct netdev *netdev_)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
free(netdev);
}
static int
netdev_bsd_open_pcap(const char *name, pcap_t **pcapp, int *fdp)
{
char errbuf[PCAP_ERRBUF_SIZE];
pcap_t *pcap = NULL;
int one = 1;
int error;
int fd;
/* Open the pcap device. The device is opened in non-promiscuous mode
* because the interface flags are manually set by the caller. */
errbuf[0] = '\0';
pcap = pcap_open_live(name, PCAP_SNAPLEN, 0, 1000, errbuf);
if (!pcap) {
VLOG_ERR_RL(&rl, "%s: pcap_open_live failed: %s", name, errbuf);
error = EIO;
goto error;
}
if (errbuf[0] != '\0') {
VLOG_WARN_RL(&rl, "%s: pcap_open_live: %s", name, errbuf);
}
/* Get the underlying fd. */
fd = pcap_get_selectable_fd(pcap);
if (fd == -1) {
VLOG_WARN_RL(&rl, "%s: no selectable file descriptor", name);
error = errno;
goto error;
}
/* Set non-blocking mode. Also the BIOCIMMEDIATE ioctl must be called
* on the file descriptor returned by pcap_get_selectable_fd to achieve
* a real non-blocking behaviour.*/
error = pcap_setnonblock(pcap, 1, errbuf);
if (error == -1) {
error = errno;
goto error;
}
/* This call assure that reads return immediately upon packet
* reception. Otherwise, a read will block until either the kernel
* buffer becomes full or a timeout occurs. */
if (ioctl(fd, BIOCIMMEDIATE, &one) < 0 ) {
VLOG_ERR_RL(&rl, "ioctl(BIOCIMMEDIATE) on %s device failed: %s",
name, ovs_strerror(errno));
error = errno;
goto error;
}
/* Capture only incoming packets. */
error = pcap_setdirection(pcap, PCAP_D_IN);
if (error == -1) {
error = errno;
goto error;
}
*pcapp = pcap;
*fdp = fd;
return 0;
error:
if (pcap) {
pcap_close(pcap);
}
*pcapp = NULL;
*fdp = -1;
return error;
}
static struct netdev_rxq *
netdev_bsd_rxq_alloc(void)
{
struct netdev_rxq_bsd *rxq = xzalloc(sizeof *rxq);
return &rxq->up;
}
static int
netdev_bsd_rxq_construct(struct netdev_rxq *rxq_)
{
struct netdev_rxq_bsd *rxq = netdev_rxq_bsd_cast(rxq_);
struct netdev *netdev_ = rxq->up.netdev;
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
int error;
if (!strcmp(netdev_get_type(netdev_), "tap")) {
rxq->pcap_handle = NULL;
rxq->fd = netdev->tap_fd;
error = 0;
} else {
ovs_mutex_lock(&netdev->mutex);
error = netdev_bsd_open_pcap(netdev_get_kernel_name(netdev_),
&rxq->pcap_handle, &rxq->fd);
ovs_mutex_unlock(&netdev->mutex);
}
return error;
}
static void
netdev_bsd_rxq_destruct(struct netdev_rxq *rxq_)
{
struct netdev_rxq_bsd *rxq = netdev_rxq_bsd_cast(rxq_);
if (rxq->pcap_handle) {
pcap_close(rxq->pcap_handle);
}
}
static void
netdev_bsd_rxq_dealloc(struct netdev_rxq *rxq_)
{
struct netdev_rxq_bsd *rxq = netdev_rxq_bsd_cast(rxq_);
free(rxq);
}
/* The recv callback of the netdev class returns the number of bytes of the
* received packet.
*
* This can be done by the pcap_next() function. Unfortunately pcap_next() does
* not make difference between a missing packet on the capture interface and
* an error during the file capture. We can use the pcap_dispatch() function
* instead, which is able to distinguish between errors and null packet.
*
* To make pcap_dispatch() returns the number of bytes read from the interface
* we need to define the following callback and argument.
*/
struct pcap_arg {
void *data;
int size;
int retval;
};
/*
* This callback will be executed on every captured packet.
*
* If the packet captured by pcap_dispatch() does not fit the pcap buffer,
* pcap returns a truncated packet and we follow this behavior.
*
* The argument args->retval is the packet size in bytes.
*/
static void
proc_pkt(u_char *args_, const struct pcap_pkthdr *hdr, const u_char *packet)
{
struct pcap_arg *args = ALIGNED_CAST(struct pcap_arg *, args_);
if (args->size < hdr->len) {
VLOG_WARN_RL(&rl, "packet truncated");
args->retval = args->size;
} else {
args->retval = hdr->len;
}
/* copy the packet to our buffer */
memcpy(args->data, packet, args->retval);
}
/*
* This function attempts to receive a packet from the specified network
* device. It is assumed that the network device is a system device or a tap
* device opened as a system one. In this case the read operation is performed
* from rxq->pcap.
*/
static int
netdev_rxq_bsd_recv_pcap(struct netdev_rxq_bsd *rxq, struct dp_packet *buffer)
{
struct pcap_arg arg;
int ret;
/* prepare the pcap argument to store the packet */
arg.size = dp_packet_tailroom(buffer);
arg.data = dp_packet_data(buffer);
for (;;) {
ret = pcap_dispatch(rxq->pcap_handle, 1, proc_pkt, (u_char *) &arg);
if (ret > 0) {
dp_packet_set_size(buffer, dp_packet_size(buffer) + arg.retval);
return 0;
}
if (ret == -1) {
if (errno == EINTR) {
continue;
}
}
return EAGAIN;
}
}
/*
* This function attempts to receive a packet from the specified network
* device. It is assumed that the network device is a tap device and
* 'rxq->fd' is initialized with the tap file descriptor.
*/
static int
netdev_rxq_bsd_recv_tap(struct netdev_rxq_bsd *rxq, struct dp_packet *buffer)
{
size_t size = dp_packet_tailroom(buffer);
for (;;) {
ssize_t retval = read(rxq->fd, dp_packet_data(buffer), size);
if (retval >= 0) {
dp_packet_set_size(buffer, dp_packet_size(buffer) + retval);
return 0;
} else if (errno != EINTR) {
if (errno != EAGAIN) {
VLOG_WARN_RL(&rl, "error receiving Ethernet packet on %s: %s",
ovs_strerror(errno), netdev_rxq_get_name(&rxq->up));
}
return errno;
}
}
}
static int
netdev_bsd_rxq_recv(struct netdev_rxq *rxq_, struct dp_packet_batch *batch,
int *qfill)
{
struct netdev_rxq_bsd *rxq = netdev_rxq_bsd_cast(rxq_);
struct netdev *netdev = rxq->up.netdev;
struct dp_packet *packet;
ssize_t retval;
int mtu;
if (netdev_bsd_get_mtu(netdev, &mtu)) {
mtu = ETH_PAYLOAD_MAX;
}
/* Assume Ethernet port. No need to set packet_type. */
packet = dp_packet_new_with_headroom(VLAN_ETH_HEADER_LEN + mtu,
DP_NETDEV_HEADROOM);
retval = (rxq->pcap_handle
? netdev_rxq_bsd_recv_pcap(rxq, packet)
: netdev_rxq_bsd_recv_tap(rxq, packet));
if (retval) {
dp_packet_delete(packet);
} else {
dp_packet_batch_init_packet(batch, packet);
}
if (qfill) {
*qfill = -ENOTSUP;
}
return retval;
}
/*
* Registers with the poll loop to wake up from the next call to poll_block()
* when a packet is ready to be received with netdev_rxq_recv() on 'rxq'.
*/
static void
netdev_bsd_rxq_wait(struct netdev_rxq *rxq_)
{
struct netdev_rxq_bsd *rxq = netdev_rxq_bsd_cast(rxq_);
poll_fd_wait(rxq->fd, POLLIN);
}
/* Discards all packets waiting to be received from 'rxq'. */
static int
netdev_bsd_rxq_drain(struct netdev_rxq *rxq_)
{
struct ifreq ifr;
struct netdev_rxq_bsd *rxq = netdev_rxq_bsd_cast(rxq_);
memset(&ifr, 0, sizeof ifr);
strcpy(ifr.ifr_name, netdev_get_kernel_name(netdev_rxq_get_netdev(rxq_)));
if (ioctl(rxq->fd, BIOCFLUSH, &ifr) == -1) {
VLOG_DBG_RL(&rl, "%s: ioctl(BIOCFLUSH) failed: %s",
netdev_rxq_get_name(rxq_), ovs_strerror(errno));
return errno;
}
return 0;
}
/*
* Send a packet on the specified network device. The device could be either a
* system or a tap device.
*/
static int
netdev_bsd_send(struct netdev *netdev_, int qid OVS_UNUSED,
struct dp_packet_batch *batch,
bool concurrent_txq OVS_UNUSED)
{
struct netdev_bsd *dev = netdev_bsd_cast(netdev_);
const char *name = netdev_get_name(netdev_);
struct dp_packet *packet;
int error;
ovs_mutex_lock(&dev->mutex);
if (dev->tap_fd < 0 && !dev->pcap) {
error = netdev_bsd_open_pcap(name, &dev->pcap, &dev->fd);
} else {
error = 0;
}
DP_PACKET_BATCH_FOR_EACH (i, packet, batch) {
const void *data = dp_packet_data(packet);
size_t size = dp_packet_size(packet);
while (!error) {
ssize_t retval;
if (dev->tap_fd >= 0) {
retval = write(dev->tap_fd, data, size);
} else {
retval = pcap_inject(dev->pcap, data, size);
}
if (retval < 0) {
if (errno == EINTR) {
continue;
} else {
error = errno;
if (error != EAGAIN) {
VLOG_WARN_RL(&rl, "error sending Ethernet packet on"
" %s: %s", name, ovs_strerror(error));
}
}
} else if (retval != size) {
VLOG_WARN_RL(&rl, "sent partial Ethernet packet "
"(%"PRIuSIZE" bytes of "
"%"PRIuSIZE") on %s", retval, size, name);
error = EMSGSIZE;
} else {
break;
}
}
}
ovs_mutex_unlock(&dev->mutex);
dp_packet_delete_batch(batch, true);
return error;
}
/*
* Registers with the poll loop to wake up from the next call to poll_block()
* when the packet transmission queue has sufficient room to transmit a packet
* with netdev_send().
*/
static void
netdev_bsd_send_wait(struct netdev *netdev_, int qid OVS_UNUSED)
{
struct netdev_bsd *dev = netdev_bsd_cast(netdev_);
ovs_mutex_lock(&dev->mutex);
if (dev->tap_fd >= 0) {
/* TAP device always accepts packets. */
poll_immediate_wake();
} else if (dev->pcap) {
poll_fd_wait(dev->fd, POLLOUT);
} else {
/* We haven't even tried to send a packet yet. */
poll_immediate_wake();
}
ovs_mutex_unlock(&dev->mutex);
}
/*
* Attempts to set 'netdev''s MAC address to 'mac'. Returns 0 if successful,
* otherwise a positive errno value.
*/
static int
netdev_bsd_set_etheraddr(struct netdev *netdev_,
const struct eth_addr mac)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
int error = 0;
ovs_mutex_lock(&netdev->mutex);
if (!(netdev->cache_valid & VALID_ETHERADDR)
|| !eth_addr_equals(netdev->etheraddr, mac)) {
error = set_etheraddr(netdev_get_kernel_name(netdev_), AF_LINK,
ETH_ADDR_LEN, mac);
if (!error) {
netdev->cache_valid |= VALID_ETHERADDR;
netdev->etheraddr = mac;
netdev_change_seq_changed(netdev_);
}
}
ovs_mutex_unlock(&netdev->mutex);
return error;
}
/*
* Returns a pointer to 'netdev''s MAC address. The caller must not modify or
* free the returned buffer.
*/
static int
netdev_bsd_get_etheraddr(const struct netdev *netdev_, struct eth_addr *mac)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
int error = 0;
ovs_mutex_lock(&netdev->mutex);
if (!(netdev->cache_valid & VALID_ETHERADDR)) {
error = get_etheraddr(netdev_get_kernel_name(netdev_),
&netdev->etheraddr);
if (!error) {
netdev->cache_valid |= VALID_ETHERADDR;
}
}
if (!error) {
*mac = netdev->etheraddr;
}
ovs_mutex_unlock(&netdev->mutex);
return error;
}
/*
* Returns the maximum size of transmitted (and received) packets on 'netdev',
* in bytes, not including the hardware header; thus, this is typically 1500
* bytes for Ethernet devices.
*/
static int
netdev_bsd_get_mtu(const struct netdev *netdev_, int *mtup)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
int error = 0;
ovs_mutex_lock(&netdev->mutex);
if (!(netdev->cache_valid & VALID_MTU)) {
struct ifreq ifr;
memset(&ifr, 0, sizeof ifr);
error = af_inet_ifreq_ioctl(netdev_get_kernel_name(netdev_), &ifr,
SIOCGIFMTU, "SIOCGIFMTU");
if (!error) {
netdev->mtu = ifr.ifr_mtu;
netdev->cache_valid |= VALID_MTU;
}
}
if (!error) {
*mtup = netdev->mtu;
}
ovs_mutex_unlock(&netdev->mutex);
return error;
}
static int
netdev_bsd_get_ifindex(const struct netdev *netdev_)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
int ifindex, error;
ovs_mutex_lock(&netdev->mutex);
error = get_ifindex(netdev_, &ifindex);
ovs_mutex_unlock(&netdev->mutex);
return error ? -error : ifindex;
}
static int
netdev_bsd_get_carrier(const struct netdev *netdev_, bool *carrier)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
int error = 0;
ovs_mutex_lock(&netdev->mutex);
if (!(netdev->cache_valid & VALID_CARRIER)) {
struct ifmediareq ifmr;
memset(&ifmr, 0, sizeof(ifmr));
ovs_strlcpy(ifmr.ifm_name, netdev_get_kernel_name(netdev_),
sizeof ifmr.ifm_name);
error = af_inet_ioctl(SIOCGIFMEDIA, &ifmr);
if (!error) {
netdev->carrier = (ifmr.ifm_status & IFM_ACTIVE) == IFM_ACTIVE;
netdev->cache_valid |= VALID_CARRIER;
/* If the interface doesn't report whether the media is active,
* just assume it is active. */
if ((ifmr.ifm_status & IFM_AVALID) == 0) {
netdev->carrier = true;
}
} else {
VLOG_DBG_RL(&rl, "%s: ioctl(SIOCGIFMEDIA) failed: %s",
netdev_get_name(netdev_), ovs_strerror(error));
}
}
if (!error) {
*carrier = netdev->carrier;
}
ovs_mutex_unlock(&netdev->mutex);
return error;
}
static void
convert_stats_system(struct netdev_stats *stats, const struct if_data *ifd)
{
/*
* note: UINT64_MAX means unsupported
*/
stats->rx_packets = ifd->ifi_ipackets;
stats->tx_packets = ifd->ifi_opackets;
stats->rx_bytes = ifd->ifi_obytes;
stats->tx_bytes = ifd->ifi_ibytes;
stats->rx_errors = ifd->ifi_ierrors;
stats->tx_errors = ifd->ifi_oerrors;
stats->rx_dropped = ifd->ifi_iqdrops;
stats->tx_dropped = UINT64_MAX;
stats->multicast = ifd->ifi_imcasts;
stats->collisions = ifd->ifi_collisions;
stats->rx_length_errors = UINT64_MAX;
stats->rx_over_errors = UINT64_MAX;
stats->rx_crc_errors = UINT64_MAX;
stats->rx_frame_errors = UINT64_MAX;
stats->rx_fifo_errors = UINT64_MAX;
stats->rx_missed_errors = UINT64_MAX;
stats->tx_aborted_errors = UINT64_MAX;
stats->tx_carrier_errors = UINT64_MAX;
stats->tx_fifo_errors = UINT64_MAX;
stats->tx_heartbeat_errors = UINT64_MAX;
stats->tx_window_errors = UINT64_MAX;
}
static void
convert_stats_tap(struct netdev_stats *stats, const struct if_data *ifd)
{
/*
* Similar to convert_stats_system but swapping rxq and tx
* because 'ifd' is stats for the network interface side of the
* tap device and what the caller wants is one for the character
* device side.
*
* note: UINT64_MAX means unsupported
*/
stats->rx_packets = ifd->ifi_opackets;
stats->tx_packets = ifd->ifi_ipackets;
stats->rx_bytes = ifd->ifi_ibytes;
stats->tx_bytes = ifd->ifi_obytes;
stats->rx_errors = ifd->ifi_oerrors;
stats->tx_errors = ifd->ifi_ierrors;
stats->rx_dropped = UINT64_MAX;
stats->tx_dropped = ifd->ifi_iqdrops;
stats->multicast = ifd->ifi_omcasts;
stats->collisions = UINT64_MAX;
stats->rx_length_errors = UINT64_MAX;
stats->rx_over_errors = UINT64_MAX;
stats->rx_crc_errors = UINT64_MAX;
stats->rx_frame_errors = UINT64_MAX;
stats->rx_fifo_errors = UINT64_MAX;
stats->rx_missed_errors = UINT64_MAX;
stats->tx_aborted_errors = UINT64_MAX;
stats->tx_carrier_errors = UINT64_MAX;
stats->tx_fifo_errors = UINT64_MAX;
stats->tx_heartbeat_errors = UINT64_MAX;
stats->tx_window_errors = UINT64_MAX;
}
static void
convert_stats(const struct netdev *netdev, struct netdev_stats *stats,
const struct if_data *ifd)
{
if (netdev_bsd_cast(netdev)->tap_fd == -1) {
convert_stats_system(stats, ifd);
} else {
convert_stats_tap(stats, ifd);
}
}
/* Retrieves current device stats for 'netdev'. */
static int
netdev_bsd_get_stats(const struct netdev *netdev_, struct netdev_stats *stats)
{
#if defined(__FreeBSD__)
int if_count, i;
int mib[6];
size_t len;
struct ifmibdata ifmd;
mib[0] = CTL_NET;
mib[1] = PF_LINK;
mib[2] = NETLINK_GENERIC;
mib[3] = IFMIB_SYSTEM;
mib[4] = IFMIB_IFCOUNT;
len = sizeof(if_count);
if (sysctl(mib, 5, &if_count, &len, (void *)0, 0) == -1) {
VLOG_DBG_RL(&rl, "%s: sysctl failed: %s",
netdev_get_name(netdev_), ovs_strerror(errno));
return errno;
}
mib[5] = IFDATA_GENERAL;
mib[3] = IFMIB_IFDATA;
len = sizeof(ifmd);
for (i = 1; i <= if_count; i++) {
mib[4] = i; /* row */
if (sysctl(mib, 6, &ifmd, &len, (void *)0, 0) == -1) {
VLOG_DBG_RL(&rl, "%s: sysctl failed: %s",
netdev_get_name(netdev_), ovs_strerror(errno));
return errno;
} else if (!strcmp(ifmd.ifmd_name, netdev_get_name(netdev_))) {
convert_stats(netdev_, stats, &ifmd.ifmd_data);
break;
}
}
return 0;
#elif defined(__NetBSD__)
struct ifdatareq ifdr;
int error;
memset(&ifdr, 0, sizeof(ifdr));
ovs_strlcpy(ifdr.ifdr_name, netdev_get_kernel_name(netdev_),
sizeof(ifdr.ifdr_name));
error = af_link_ioctl(SIOCGIFDATA, &ifdr);
if (!error) {
convert_stats(netdev_, stats, &ifdr.ifdr_data);
}
return error;
#else
#error not implemented
#endif
}
static uint32_t
netdev_bsd_parse_media(int media)
{
uint32_t supported = 0;
bool half_duplex = media & IFM_HDX ? true : false;
switch (IFM_SUBTYPE(media)) {
case IFM_10_2:
case IFM_10_5:
case IFM_10_STP:
case IFM_10_T:
supported |= half_duplex ? NETDEV_F_10MB_HD : NETDEV_F_10MB_FD;
supported |= NETDEV_F_COPPER;
break;
case IFM_10_FL:
supported |= half_duplex ? NETDEV_F_10MB_HD : NETDEV_F_10MB_FD;
supported |= NETDEV_F_FIBER;
break;
case IFM_100_T2:
case IFM_100_T4:
case IFM_100_TX:
case IFM_100_VG:
supported |= half_duplex ? NETDEV_F_100MB_HD : NETDEV_F_100MB_FD;
supported |= NETDEV_F_COPPER;
break;
case IFM_100_FX:
supported |= half_duplex ? NETDEV_F_100MB_HD : NETDEV_F_100MB_FD;
supported |= NETDEV_F_FIBER;
break;
case IFM_1000_CX:
case IFM_1000_T:
supported |= half_duplex ? NETDEV_F_1GB_HD : NETDEV_F_1GB_FD;
supported |= NETDEV_F_COPPER;
break;
case IFM_1000_LX:
case IFM_1000_SX:
supported |= half_duplex ? NETDEV_F_1GB_HD : NETDEV_F_1GB_FD;
supported |= NETDEV_F_FIBER;
break;
case IFM_10G_CX4:
supported |= NETDEV_F_10GB_FD;
supported |= NETDEV_F_COPPER;
break;
case IFM_10G_LR:
case IFM_10G_SR:
supported |= NETDEV_F_10GB_FD;
supported |= NETDEV_F_FIBER;
break;
default:
return 0;
}
if (IFM_SUBTYPE(media) == IFM_AUTO) {
supported |= NETDEV_F_AUTONEG;
}
/*
if (media & IFM_ETH_FMASK) {
supported |= NETDEV_F_PAUSE;
}
*/
return supported;
}
/*
* Stores the features supported by 'netdev' into each of '*current',
* '*advertised', '*supported', and '*peer' that are non-null. Each value is a
* bitmap of "enum ofp_port_features" bits, in host byte order. Returns 0 if
* successful, otherwise a positive errno value. On failure, all of the
* passed-in values are set to 0.
*/
static int
netdev_bsd_get_features(const struct netdev *netdev,
enum netdev_features *current, uint32_t *advertised,
enum netdev_features *supported, uint32_t *peer)
{
struct ifmediareq ifmr;
int *media_list;
int i;
int error;
/* XXX Look into SIOCGIFCAP instead of SIOCGIFMEDIA */
memset(&ifmr, 0, sizeof(ifmr));
ovs_strlcpy(ifmr.ifm_name, netdev_get_name(netdev), sizeof ifmr.ifm_name);
/* We make two SIOCGIFMEDIA ioctl calls. The first to determine the
* number of supported modes, and a second with a buffer to retrieve
* them. */
error = af_inet_ioctl(SIOCGIFMEDIA, &ifmr);
if (error) {
VLOG_DBG_RL(&rl, "%s: ioctl(SIOCGIFMEDIA) failed: %s",
netdev_get_name(netdev), ovs_strerror(error));
return error;
}
media_list = xcalloc(ifmr.ifm_count, sizeof(int));
ifmr.ifm_ulist = media_list;
if (IFM_TYPE(ifmr.ifm_current) != IFM_ETHER) {
VLOG_DBG_RL(&rl, "%s: doesn't appear to be ethernet",
netdev_get_name(netdev));
error = EINVAL;
goto cleanup;
}
error = af_inet_ioctl(SIOCGIFMEDIA, &ifmr);
if (error) {
VLOG_DBG_RL(&rl, "%s: ioctl(SIOCGIFMEDIA) failed: %s",
netdev_get_name(netdev), ovs_strerror(error));
goto cleanup;
}
/* Current settings. */
*current = netdev_bsd_parse_media(ifmr.ifm_active);
/* Advertised features. */
*advertised = netdev_bsd_parse_media(ifmr.ifm_current);
/* Supported features. */
*supported = 0;
for (i = 0; i < ifmr.ifm_count; i++) {
*supported |= netdev_bsd_parse_media(ifmr.ifm_ulist[i]);
}
/* Peer advertisements. */
*peer = 0; /* XXX */
error = 0;
cleanup:
free(media_list);
return error;
}
static int
netdev_bsd_get_speed(const struct netdev *netdev, uint32_t *current,
uint32_t *max)
{
enum netdev_features f_current, f_supported, f_advertised, f_peer;
int error;
error = netdev_bsd_get_features(netdev, &f_current, &f_advertised,
&f_supported, &f_peer);
if (error) {
return error;
}
*current = MIN(UINT32_MAX,
netdev_features_to_bps(f_current, 0) / 1000000ULL);
*max = MIN(UINT32_MAX,
netdev_features_to_bps(f_supported, 0) / 1000000ULL);
return 0;
}
/*
* Assigns 'addr' as 'netdev''s IPv4 address and 'mask' as its netmask. If
* 'addr' is INADDR_ANY, 'netdev''s IPv4 address is cleared. Returns a
* positive errno value.
*/
static int
netdev_bsd_set_in4(struct netdev *netdev_, struct in_addr addr,
struct in_addr mask)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
int error;
ovs_mutex_lock(&netdev->mutex);
error = do_set_addr(netdev_, SIOCSIFADDR, "SIOCSIFADDR", addr);
if (!error) {
if (addr.s_addr != INADDR_ANY) {
error = do_set_addr(netdev_, SIOCSIFNETMASK,
"SIOCSIFNETMASK", mask);
}
netdev_change_seq_changed(netdev_);
}
ovs_mutex_unlock(&netdev->mutex);
return error;
}
static int
netdev_bsd_get_addr_list(const struct netdev *netdev_,
struct in6_addr **addr, struct in6_addr **mask, int *n_cnt)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
int error;
if (!(netdev->cache_valid & VALID_IN)) {
netdev_get_addrs_list_flush();
}
error = netdev_get_addrs(netdev_get_name(netdev_), addr, mask, n_cnt);
if (!error) {
netdev->cache_valid |= VALID_IN;
}
return error;
}
#if defined(__NetBSD__)
static char *
netdev_bsd_kernel_name_to_ovs_name(const char *kernel_name)
{
char *ovs_name = NULL;
struct shash device_shash;
struct shash_node *node;
shash_init(&device_shash);
netdev_get_devices(&netdev_tap_class, &device_shash);
SHASH_FOR_EACH(node, &device_shash) {
struct netdev *netdev = node->data;
struct netdev_bsd * const dev = netdev_bsd_cast(netdev);
if (!strcmp(dev->kernel_name, kernel_name)) {
free(ovs_name);
ovs_name = xstrdup(netdev_get_name(&dev->up));
}
netdev_close(netdev);
}
shash_destroy(&device_shash);
return ovs_name ? ovs_name : xstrdup(kernel_name);
}
#endif
static int
netdev_bsd_get_next_hop(const struct in_addr *host OVS_UNUSED,
struct in_addr *next_hop OVS_UNUSED,
char **netdev_name OVS_UNUSED)
{
#if defined(__NetBSD__)
static int seq = 0;
struct sockaddr_in sin;
struct sockaddr_dl sdl;
int s;
int i;
struct {
struct rt_msghdr h;
char space[512];
} buf;
struct rt_msghdr *rtm = &buf.h;
const pid_t pid = getpid();
char *cp;
ssize_t ssz;
bool gateway = false;
char *ifname = NULL;
int saved_errno;
memset(next_hop, 0, sizeof(*next_hop));
*netdev_name = NULL;
memset(&sin, 0, sizeof(sin));
sin.sin_len = sizeof(sin);
sin.sin_family = AF_INET;
sin.sin_port = 0;
sin.sin_addr = *host;
memset(&sdl, 0, sizeof(sdl));
sdl.sdl_len = sizeof(sdl);
sdl.sdl_family = AF_LINK;
s = socket(PF_ROUTE, SOCK_RAW, 0);
memset(&buf, 0, sizeof(buf));
rtm->rtm_flags = RTF_HOST|RTF_UP;
rtm->rtm_version = RTM_VERSION;
rtm->rtm_addrs = RTA_DST|RTA_IFP;
cp = (void *)&buf.space;
memcpy(cp, &sin, sizeof(sin));
RT_ADVANCE(cp, (struct sockaddr *)(void *)&sin);
memcpy(cp, &sdl, sizeof(sdl));
RT_ADVANCE(cp, (struct sockaddr *)(void *)&sdl);
rtm->rtm_msglen = cp - (char *)(void *)rtm;
rtm->rtm_seq = ++seq;
rtm->rtm_type = RTM_GET;
rtm->rtm_pid = pid;
write(s, rtm, rtm->rtm_msglen);
memset(&buf, 0, sizeof(buf));
do {
ssz = read(s, &buf, sizeof(buf));
} while (ssz > 0 && (rtm->rtm_seq != seq || rtm->rtm_pid != pid));
saved_errno = errno;
close(s);
if (ssz <= 0) {
if (ssz < 0) {
return saved_errno;
}
return EPIPE; /* XXX */
}
cp = (void *)&buf.space;
for (i = 1; i; i <<= 1) {
if ((rtm->rtm_addrs & i) != 0) {
const struct sockaddr *sa = (const void *)cp;
if ((i == RTA_GATEWAY) && sa->sa_family == AF_INET) {
const struct sockaddr_in * const sin =
ALIGNED_CAST(const struct sockaddr_in *, sa);
*next_hop = sin->sin_addr;
gateway = true;
}
if ((i == RTA_IFP) && sa->sa_family == AF_LINK) {
const struct sockaddr_dl * const sdl =
ALIGNED_CAST(const struct sockaddr_dl *, sa);
char *kernel_name;
kernel_name = xmemdup0(sdl->sdl_data, sdl->sdl_nlen);
ifname = netdev_bsd_kernel_name_to_ovs_name(kernel_name);
free(kernel_name);
}
RT_ADVANCE(cp, sa);
}
}
if (ifname == NULL) {
return ENXIO;
}
if (!gateway) {
*next_hop = *host;
}
*netdev_name = ifname;
VLOG_DBG("host " IP_FMT " next-hop " IP_FMT " if %s",
IP_ARGS(host->s_addr), IP_ARGS(next_hop->s_addr), *netdev_name);
return 0;
#else
return EOPNOTSUPP;
#endif
}
static int
netdev_bsd_arp_lookup(const struct netdev *netdev OVS_UNUSED,
ovs_be32 ip OVS_UNUSED,
struct eth_addr *mac OVS_UNUSED)
{
#if defined(__NetBSD__)
const struct rt_msghdr *rtm;
size_t needed;
char *buf;
const char *cp;
const char *ep;
int mib[6];
int error;
buf = NULL;
mib[0] = CTL_NET;
mib[1] = PF_ROUTE;
mib[2] = 0;
mib[3] = AF_INET;
mib[4] = NET_RT_FLAGS;
#ifdef RTF_LLINFO
mib[5] = RTF_LLINFO;
#else
mib[5] = 0;
#endif
if (sysctl(mib, 6, NULL, &needed, NULL, 0) == -1) {
error = errno;
goto error;
}
buf = xmalloc(needed);
if (sysctl(mib, 6, buf, &needed, NULL, 0) == -1) {
error = errno;
goto error;
}
ep = buf + needed;
for (cp = buf; cp < ep; cp += rtm->rtm_msglen) {
const struct sockaddr_inarp *sina;
const struct sockaddr_dl *sdl;
rtm = (const void *)cp;
sina = (const void *)(rtm + 1);
if (ip != sina->sin_addr.s_addr) {
continue;
}
sdl = (const void *)
((const char *)(const void *)sina + RT_ROUNDUP(sina->sin_len));
if (sdl->sdl_alen == ETH_ADDR_LEN) {
memcpy(mac, &sdl->sdl_data[sdl->sdl_nlen], ETH_ADDR_LEN);
error = 0;
goto error;
}
}
error = ENXIO;
error:
free(buf);
return error;
#else
return EOPNOTSUPP;
#endif
}
static void
make_in4_sockaddr(struct sockaddr *sa, struct in_addr addr)
{
struct sockaddr_in sin;
memset(&sin, 0, sizeof sin);
sin.sin_family = AF_INET;
sin.sin_addr = addr;
sin.sin_port = 0;
memset(sa, 0, sizeof *sa);
memcpy(sa, &sin, sizeof sin);
}
static int
do_set_addr(struct netdev *netdev,
unsigned long ioctl_nr, const char *ioctl_name,
struct in_addr addr)
{
struct ifreq ifr;
memset(&ifr, 0, sizeof ifr);
make_in4_sockaddr(&ifr.ifr_addr, addr);
return af_inet_ifreq_ioctl(netdev_get_kernel_name(netdev), &ifr, ioctl_nr,
ioctl_name);
}
static int
nd_to_iff_flags(enum netdev_flags nd)
{
int iff = 0;
if (nd & NETDEV_UP) {
iff |= IFF_UP;
}
if (nd & NETDEV_PROMISC) {
iff |= IFF_PROMISC;
#if defined(IFF_PPROMISC)
iff |= IFF_PPROMISC;
#endif
}
if (nd & NETDEV_LOOPBACK) {
iff |= IFF_LOOPBACK;
}
return iff;
}
static int
iff_to_nd_flags(int iff)
{
enum netdev_flags nd = 0;
if (iff & IFF_UP) {
nd |= NETDEV_UP;
}
if (iff & IFF_PROMISC) {
nd |= NETDEV_PROMISC;
}
if (iff & IFF_LOOPBACK) {
nd |= NETDEV_LOOPBACK;
}
return nd;
}
static int
netdev_bsd_update_flags(struct netdev *netdev_, enum netdev_flags off,
enum netdev_flags on, enum netdev_flags *old_flagsp)
{
int old_flags, new_flags;
int error;
error = get_flags(netdev_, &old_flags);
if (!error) {
*old_flagsp = iff_to_nd_flags(old_flags);
new_flags = (old_flags & ~nd_to_iff_flags(off)) | nd_to_iff_flags(on);
if (new_flags != old_flags) {
error = set_flags(netdev_get_kernel_name(netdev_), new_flags);
netdev_change_seq_changed(netdev_);
}
}
return error;
}
#define NETDEV_BSD_CLASS_COMMON \
.run = netdev_bsd_run, \
.wait = netdev_bsd_wait, \
.alloc = netdev_bsd_alloc, \
.destruct = netdev_bsd_destruct, \
.dealloc = netdev_bsd_dealloc, \
.send = netdev_bsd_send, \
.send_wait = netdev_bsd_send_wait, \
.set_etheraddr = netdev_bsd_set_etheraddr, \
.get_etheraddr = netdev_bsd_get_etheraddr, \
.get_mtu = netdev_bsd_get_mtu, \
.get_ifindex = netdev_bsd_get_ifindex, \
.get_carrier = netdev_bsd_get_carrier, \
.get_stats = netdev_bsd_get_stats, \
.get_features = netdev_bsd_get_features, \
.get_speed = netdev_bsd_get_speed, \
.set_in4 = netdev_bsd_set_in4, \
.get_addr_list = netdev_bsd_get_addr_list, \
.get_next_hop = netdev_bsd_get_next_hop, \
.arp_lookup = netdev_bsd_arp_lookup, \
.update_flags = netdev_bsd_update_flags, \
.rxq_alloc = netdev_bsd_rxq_alloc, \
.rxq_construct = netdev_bsd_rxq_construct, \
.rxq_destruct = netdev_bsd_rxq_destruct, \
.rxq_dealloc = netdev_bsd_rxq_dealloc, \
.rxq_recv = netdev_bsd_rxq_recv, \
.rxq_wait = netdev_bsd_rxq_wait, \
.rxq_drain = netdev_bsd_rxq_drain
const struct netdev_class netdev_bsd_class = {
NETDEV_BSD_CLASS_COMMON,
.type = "system",
.construct = netdev_bsd_construct_system,
};
const struct netdev_class netdev_tap_class = {
NETDEV_BSD_CLASS_COMMON,
.type = "tap",
.construct = netdev_bsd_construct_tap,
};
static void
destroy_tap(int fd, const char *name)
{
struct ifreq ifr;
close(fd);
memset(&ifr, 0, sizeof ifr);
strcpy(ifr.ifr_name, name);
/* XXX What to do if this call fails? */
af_inet_ioctl(SIOCIFDESTROY, &ifr);
}
static int
get_flags(const struct netdev *netdev, int *flags)
{
struct ifreq ifr;
int error;
memset(&ifr, 0, sizeof ifr);
error = af_inet_ifreq_ioctl(netdev_get_kernel_name(netdev), &ifr,
SIOCGIFFLAGS, "SIOCGIFFLAGS");
*flags = ifr_get_flags(&ifr);
return error;
}
static int
set_flags(const char *name, int flags)
{
struct ifreq ifr;
memset(&ifr, 0, sizeof ifr);
ifr_set_flags(&ifr, flags);
return af_inet_ifreq_ioctl(name, &ifr, SIOCSIFFLAGS, "SIOCSIFFLAGS");
}
static int
get_ifindex(const struct netdev *netdev_, int *ifindexp)
{
struct netdev_bsd *netdev = netdev_bsd_cast(netdev_);
*ifindexp = 0;
if (!(netdev->cache_valid & VALID_IFINDEX)) {
int ifindex = if_nametoindex(netdev_get_name(netdev_));
if (ifindex <= 0) {
return errno;
}
netdev->cache_valid |= VALID_IFINDEX;
netdev->ifindex = ifindex;
}
*ifindexp = netdev->ifindex;
return 0;
}
static int
get_etheraddr(const char *netdev_name, struct eth_addr *ea)
{
struct ifaddrs *head;
struct ifaddrs *ifa;
struct sockaddr_dl *sdl;
if (getifaddrs(&head) != 0) {
VLOG_ERR("getifaddrs on %s device failed: %s", netdev_name,
ovs_strerror(errno));
return errno;
}
for (ifa = head; ifa; ifa = ifa->ifa_next) {
if (ifa->ifa_addr->sa_family == AF_LINK) {
if (!strcmp(ifa->ifa_name, netdev_name)) {
sdl = ALIGNED_CAST(struct sockaddr_dl *, ifa->ifa_addr);
if (sdl) {
memcpy(ea, LLADDR(sdl), sdl->sdl_alen);
freeifaddrs(head);
return 0;
}
}
}
}
VLOG_ERR("could not find ethernet address for %s device", netdev_name);
freeifaddrs(head);
return ENODEV;
}
static int
set_etheraddr(const char *netdev_name OVS_UNUSED, int hwaddr_family OVS_UNUSED,
int hwaddr_len OVS_UNUSED,
const struct eth_addr mac OVS_UNUSED)
{
#if defined(__FreeBSD__)
struct ifreq ifr;
int error;
memset(&ifr, 0, sizeof ifr);
ovs_strlcpy(ifr.ifr_name, netdev_name, sizeof ifr.ifr_name);
ifr.ifr_addr.sa_family = hwaddr_family;
ifr.ifr_addr.sa_len = hwaddr_len;
memcpy(ifr.ifr_addr.sa_data, &mac, hwaddr_len);
error = af_inet_ioctl(SIOCSIFLLADDR, &ifr);
if (error) {
VLOG_ERR("ioctl(SIOCSIFLLADDR) on %s device failed: %s",
netdev_name, ovs_strerror(error));
return error;
}
return 0;
#elif defined(__NetBSD__)
struct if_laddrreq req;
struct sockaddr_dl *sdl;
struct sockaddr_storage oldaddr;
int error;
/*
* get the old address, add new one, and then remove old one.
*/
if (hwaddr_len != ETH_ADDR_LEN) {
/* just to be safe about sockaddr storage size */
return EOPNOTSUPP;
}
memset(&req, 0, sizeof(req));
ovs_strlcpy(req.iflr_name, netdev_name, sizeof(req.iflr_name));
req.addr.ss_len = sizeof(req.addr);
req.addr.ss_family = hwaddr_family;
sdl = (struct sockaddr_dl *)&req.addr;
sdl->sdl_alen = hwaddr_len;
error = af_link_ioctl(SIOCGLIFADDR, &req);
if (error) {
return error;
}
if (!memcmp(&sdl->sdl_data[sdl->sdl_nlen], &mac, hwaddr_len)) {
return 0;
}
oldaddr = req.addr;
memset(&req, 0, sizeof(req));
ovs_strlcpy(req.iflr_name, netdev_name, sizeof(req.iflr_name));
req.flags = IFLR_ACTIVE;
sdl = (struct sockaddr_dl *)&req.addr;
sdl->sdl_len = offsetof(struct sockaddr_dl, sdl_data) + hwaddr_len;
sdl->sdl_alen = hwaddr_len;
sdl->sdl_family = hwaddr_family;
memcpy(sdl->sdl_data, &mac, hwaddr_len);
error = af_link_ioctl(SIOCALIFADDR, &req);
if (error) {
return error;
}
memset(&req, 0, sizeof(req));
ovs_strlcpy(req.iflr_name, netdev_name, sizeof(req.iflr_name));
req.addr = oldaddr;
return af_link_ioctl(SIOCDLIFADDR, &req);
#else
#error not implemented
#endif
}
static int
ifr_get_flags(const struct ifreq *ifr)
{
#ifdef HAVE_STRUCT_IFREQ_IFR_FLAGSHIGH
return (ifr->ifr_flagshigh << 16) | (ifr->ifr_flags & 0xffff);
#else
return ifr->ifr_flags;
#endif
}
static void
ifr_set_flags(struct ifreq *ifr, int flags)
{
#ifdef HAVE_STRUCT_IFREQ_IFR_FLAGSHIGH
ifr->ifr_flags = flags & 0xffff;
ifr->ifr_flagshigh = flags >> 16;
#else
ifr->ifr_flags = flags;
#endif
}
#if defined(__NetBSD__)
/* Calls ioctl() on an AF_LINK sock, passing the specified 'command' and
* 'arg'. Returns 0 if successful, otherwise a positive errno value. */
int
af_link_ioctl(unsigned long command, const void *arg)
{
static struct ovsthread_once once = OVSTHREAD_ONCE_INITIALIZER;
static int sock;
if (ovsthread_once_start(&once)) {
sock = socket(AF_LINK, SOCK_DGRAM, 0);
if (sock < 0) {
sock = -errno;
VLOG_ERR("failed to create link socket: %s", ovs_strerror(errno));
}
ovsthread_once_done(&once);
}
return (sock < 0 ? -sock
: ioctl(sock, command, arg) == -1 ? errno
: 0);
}
#endif
#endif /* !defined(__MACH__) */