/*
* Copyright (c) 2008, 2009, 2010, 2011, 2012, 2013, 2014, 2015, 2016 Nicira, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include <config.h>
#include "util.h"
#include <ctype.h>
#include <errno.h>
#include <limits.h>
#include <pthread.h>
#include <stdarg.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#ifdef __linux__
#include <sys/prctl.h>
#include <sys/utsname.h>
#endif
#include <sys/stat.h>
#include <unistd.h>
#include "bitmap.h"
#include "byte-order.h"
#include "coverage.h"
#include "ovs-rcu.h"
#include "ovs-thread.h"
#include "socket-util.h"
#include "timeval.h"
#include "openvswitch/vlog.h"
#ifdef HAVE_PTHREAD_SET_NAME_NP
#include <pthread_np.h>
#endif
#ifdef _WIN32
#include <shlwapi.h>
#endif
VLOG_DEFINE_THIS_MODULE(util);
#ifdef __linux__
#define LINUX 1
#include <asm/param.h>
#else
#define LINUX 0
#endif
COVERAGE_DEFINE(util_xalloc);
/* argv[0] without directory names. */
char *program_name;
/* Name for the currently running thread or process, for log messages, process
* listings, and debuggers. */
DEFINE_PER_THREAD_MALLOCED_DATA(char *, subprogram_name);
/* --version option output. */
static char *program_version;
/* 'true' if mlockall() succeeded, but doesn't support ONFAULT. */
static bool is_all_memory_locked = false;
/* Buffer used by ovs_strerror() and ovs_format_message(). */
DEFINE_STATIC_PER_THREAD_DATA(struct { char s[128]; },
strerror_buffer,
{ "" });
static char *xreadlink(const char *filename);
void
ovs_assert_failure(const char *where, const char *function,
const char *condition)
{
/* Prevent an infinite loop (or stack overflow) in case VLOG_ABORT happens
* to trigger an assertion failure of its own. */
static int reentry = 0;
switch (reentry++) {
case 0:
VLOG_ABORT("%s: assertion %s failed in %s()",
where, condition, function);
OVS_NOT_REACHED();
case 1:
fprintf(stderr, "%s: assertion %s failed in %s()",
where, condition, function);
abort();
default:
abort();
}
}
void
set_all_memory_locked(void)
{
is_all_memory_locked = true;
}
bool
memory_all_locked(void)
{
return is_all_memory_locked;
}
void
out_of_memory(void)
{
ovs_abort(0, "virtual memory exhausted");
}
void *
xcalloc__(size_t count, size_t size)
{
void *p = count && size ? calloc(count, size) : malloc(1);
if (p == NULL) {
out_of_memory();
}
return p;
}
void *
xzalloc__(size_t size)
{
return xcalloc__(1, size);
}
void *
xmalloc__(size_t size)
{
void *p = malloc(size ? size : 1);
if (p == NULL) {
out_of_memory();
}
return p;
}
void *
xrealloc__(void *p, size_t size)
{
p = realloc(p, size ? size : 1);
if (p == NULL) {
out_of_memory();
}
return p;
}
void *
xcalloc(size_t count, size_t size)
{
COVERAGE_INC(util_xalloc);
return xcalloc__(count, size);
}
void *
xzalloc(size_t size)
{
COVERAGE_INC(util_xalloc);
return xzalloc__(size);
}
void *
xmalloc(size_t size)
{
COVERAGE_INC(util_xalloc);
return xmalloc__(size);
}
void *
xrealloc(void *p, size_t size)
{
COVERAGE_INC(util_xalloc);
return xrealloc__(p, size);
}
void *
xmemdup(const void *p_, size_t size)
{
void *p = xmalloc(size);
nullable_memcpy(p, p_, size);
return p;
}
char *
xmemdup0(const char *p_, size_t length)
{
char *p = xmalloc(length + 1);
memcpy(p, p_, length);
p[length] = '\0';
return p;
}
char *
xstrdup(const char *s)
{
return xmemdup0(s, strlen(s));
}
char * MALLOC_LIKE
nullable_xstrdup(const char *s)
{
return s ? xstrdup(s) : NULL;
}
bool
nullable_string_is_equal(const char *a, const char *b)
{
return a ? b && !strcmp(a, b) : !b;
}
char *
xvasprintf(const char *format, va_list args)
{
va_list args2;
size_t needed;
char *s;
va_copy(args2, args);
needed = vsnprintf(NULL, 0, format, args);
s = xmalloc(needed + 1);
vsnprintf(s, needed + 1, format, args2);
va_end(args2);
return s;
}
void *
x2nrealloc(void *p, size_t *n, size_t s)
{
*n = *n == 0 ? 1 : 2 * *n;
return xrealloc(p, *n * s);
}
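/* Usage sketch (illustrative only; the variable names are hypothetical):
 * x2nrealloc() implements the usual doubling growth pattern for a dynamic
 * array, so a caller only reallocates when the element count reaches the
 * allocated capacity:
 *
 *     size_t allocated = 0, n = 0;
 *     int *arr = NULL;
 *
 *     for (int i = 0; i < 100; i++) {
 *         if (n >= allocated) {
 *             arr = x2nrealloc(arr, &allocated, sizeof *arr);
 *         }
 *         arr[n++] = i;
 *     }
 *     free(arr);
 */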
/* Allocates and returns 'size' bytes of memory aligned to 'alignment' bytes.
* 'alignment' must be a power of two and a multiple of sizeof(void *).
*
* Use free_size_align() to free the returned memory block. */
void *
xmalloc_size_align(size_t size, size_t alignment)
{
#ifdef HAVE_POSIX_MEMALIGN
void *p;
int error;
COVERAGE_INC(util_xalloc);
error = posix_memalign(&p, alignment, size ? size : 1);
if (error != 0) {
out_of_memory();
}
return p;
#else
/* Allocate room for:
*
* - Header padding: Up to alignment - 1 bytes, to allow the
* pointer 'q' to be aligned exactly sizeof(void *) bytes before the
* beginning of the alignment.
*
* - Pointer: A pointer to the start of the header padding, to allow us
* to free() the block later.
*
* - User data: 'size' bytes.
*
* - Trailer padding: Enough to bring the user data up to an alignment
* multiple.
*
* +---------------+---------+------------------------+---------+
* | header | pointer | user data | trailer |
* +---------------+---------+------------------------+---------+
* ^ ^ ^
* | | |
* p q r
*
*/
void *p, *r, **q;
bool runt;
if (!IS_POW2(alignment) || (alignment % sizeof(void *) != 0)) {
ovs_abort(0, "Invalid alignment");
}
p = xmalloc((alignment - 1)
+ sizeof(void *)
+ ROUND_UP(size, alignment));
runt = PAD_SIZE((uintptr_t) p, alignment) < sizeof(void *);
/* When the padding size < sizeof(void *), we don't have enough room for
 * pointer 'q'.  As a result, we need to move 'r' up to the next alignment
 * boundary.  So we ROUND_UP in the xmalloc() above, and ROUND_UP again when
 * calculating 'r' below.
*/
r = (void *) ROUND_UP((uintptr_t) p + (runt ? alignment : 0), alignment);
q = (void **) r - 1;
*q = p;
return r;
#endif
}
void
free_size_align(void *p)
{
#ifdef HAVE_POSIX_MEMALIGN
free(p);
#else
if (p) {
void **q = (void **) p - 1;
free(*q);
}
#endif
}
/* Allocates and returns 'size' bytes of memory aligned to a cache line and in
* dedicated cache lines. That is, the memory block returned will not share a
* cache line with other data, avoiding "false sharing".
*
* Use free_cacheline() to free the returned memory block. */
void *
xmalloc_cacheline(size_t size)
{
return xmalloc_size_align(size, CACHE_LINE_SIZE);
}
/* Like xmalloc_cacheline() but clears the allocated memory to all zero
* bytes. */
void *
xzalloc_cacheline(size_t size)
{
void *p = xmalloc_cacheline(size);
memset(p, 0, size);
return p;
}
/* Frees a memory block allocated with xmalloc_cacheline() or
* xzalloc_cacheline(). */
void
free_cacheline(void *p)
{
free_size_align(p);
}
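/* Usage sketch (illustrative only; 'struct counter' is a hypothetical type):
 * per-thread statistics are a typical use of the cache-line allocators,
 * because giving each instance its own cache line avoids false sharing:
 *
 *     struct counter {
 *         uint64_t packets;
 *         uint64_t bytes;
 *     };
 *
 *     struct counter *c = xzalloc_cacheline(sizeof *c);
 *     c->packets++;
 *     ...
 *     free_cacheline(c);
 *
 * xzalloc_cacheline() returns zeroed, cache-line-aligned memory, and
 * free_cacheline() must be used to release it.
 */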
void *
xmalloc_pagealign(size_t size)
{
return xmalloc_size_align(size, get_page_size());
}
void
free_pagealign(void *p)
{
free_size_align(p);
}
char *
xasprintf(const char *format, ...)
{
va_list args;
char *s;
va_start(args, format);
s = xvasprintf(format, args);
va_end(args);
return s;
}
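/* Usage sketch (illustrative only): xasprintf() allocates exactly enough
 * space for the formatted result, so the caller never sizes a buffer but
 * must eventually free() the returned string:
 *
 *     char *msg = xasprintf("port %d is %s", 5, "up");
 *
 * Here 'msg' holds "port 5 is up" in freshly allocated memory, and the
 * caller later calls free(msg).
 */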
/* Similar to strlcpy() from OpenBSD, but it never reads more than 'size - 1'
* bytes from 'src' and doesn't return anything. */
void
ovs_strlcpy(char *dst, const char *src, size_t size)
{
if (size > 0) {
size_t len = strnlen(src, size - 1);
memcpy(dst, src, len);
dst[len] = '\0';
}
}
/* Copies 'src' to 'dst'. Reads no more than 'size - 1' bytes from 'src'.
* Always null-terminates 'dst' (if 'size' is nonzero), and writes a zero byte
* to every otherwise unused byte in 'dst'.
*
* Except for performance, the following call:
* ovs_strzcpy(dst, src, size);
* is equivalent to these two calls:
* memset(dst, '\0', size);
* ovs_strlcpy(dst, src, size);
*
* (Thus, ovs_strzcpy() is similar to strncpy() without some of the pitfalls.)
*/
void
ovs_strzcpy(char *dst, const char *src, size_t size)
{
if (size > 0) {
size_t len = strnlen(src, size - 1);
memcpy(dst, src, len);
memset(dst + len, '\0', size - len);
}
}
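/* Usage sketch (illustrative only): both copies truncate to fit and always
 * null-terminate, but only ovs_strzcpy() zeros the unused tail of 'dst':
 *
 *     char buf[8];
 *
 *     ovs_strlcpy(buf, "openvswitch", sizeof buf);
 *     ovs_strzcpy(buf, "ovs", sizeof buf);
 *
 * The first call stores the truncated string "openvsw" plus a terminator;
 * the second stores "ovs" and zeros the remaining five bytes of 'buf'.
 */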
/*
* Returns true if 'str' ends with given 'suffix'.
*/
int
string_ends_with(const char *str, const char *suffix)
{
int str_len = strlen(str);
int suffix_len = strlen(suffix);
return (str_len >= suffix_len) &&
(0 == strcmp(str + (str_len - suffix_len), suffix));
}
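/* For example (illustrative only):
 *
 *     string_ends_with("br-int.snoop", ".snoop")   returns 1 (true)
 *     string_ends_with("br-int", ".snoop")         returns 0 (false)
 */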
/* Prints 'format' on stderr, formatting it like printf() does. If 'err_no' is
* nonzero, then it is formatted with ovs_retval_to_string() and appended to
* the message inside parentheses. Then, terminates with abort().
*
* This function is preferred to ovs_fatal() in a situation where it would make
* sense for a monitoring process to restart the daemon.
*
* 'format' should not end with a new-line, because this function will add one
* itself. */
void
ovs_abort(int err_no, const char *format, ...)
{
va_list args;
va_start(args, format);
ovs_abort_valist(err_no, format, args);
}
/* Same as ovs_abort() except that the arguments are supplied as a va_list. */
void
ovs_abort_valist(int err_no, const char *format, va_list args)
{
ovs_error_valist(err_no, format, args);
abort();
}
/* Prints 'format' on stderr, formatting it like printf() does. If 'err_no' is
* nonzero, then it is formatted with ovs_retval_to_string() and appended to
* the message inside parentheses. Then, terminates with EXIT_FAILURE.
*
* 'format' should not end with a new-line, because this function will add one
* itself. */
void
ovs_fatal(int err_no, const char *format, ...)
{
va_list args;
va_start(args, format);
ovs_fatal_valist(err_no, format, args);
}
/* Same as ovs_fatal() except that the arguments are supplied as a va_list. */
void
ovs_fatal_valist(int err_no, const char *format, va_list args)
{
ovs_error_valist(err_no, format, args);
exit(EXIT_FAILURE);
}
/* Prints 'format' on stderr, formatting it like printf() does. If 'err_no' is
* nonzero, then it is formatted with ovs_retval_to_string() and appended to
* the message inside parentheses.
*
* 'format' should not end with a new-line, because this function will add one
* itself. */
void
ovs_error(int err_no, const char *format, ...)
{
va_list args;
va_start(args, format);
ovs_error_valist(err_no, format, args);
va_end(args);
}
/* Same as ovs_error() except that the arguments are supplied as a va_list. */
void
ovs_error_valist(int err_no, const char *format, va_list args)
{
const char *subprogram_name = get_subprogram_name();
int save_errno = errno;
if (subprogram_name[0]) {
fprintf(stderr, "%s(%s): ", program_name, subprogram_name);
} else {
fprintf(stderr, "%s: ", program_name);
}
vfprintf(stderr, format, args);
if (err_no != 0) {
fprintf(stderr, " (%s)", ovs_retval_to_string(err_no));
}
putc('\n', stderr);
errno = save_errno;
}
/* Many OVS functions return an int which is one of:
* - 0: no error yet
* - >0: errno value
* - EOF: end of file (not necessarily an error; depends on the function called)
*
* Returns the appropriate human-readable string. The caller must copy the
* string if it wants to hold onto it, as the storage may be overwritten on
* subsequent function calls.
*/
const char *
ovs_retval_to_string(int retval)
{
return (!retval ? ""
: retval == EOF ? "End of file"
: ovs_strerror(retval));
}
/* This function returns the string describing the error number in 'error'
* for POSIX platforms. For Windows, this function can be used for C library
* calls. For socket calls that are also used in Windows, use sock_strerror()
* instead. For WINAPI calls, look at ovs_lasterror_to_string(). */
const char *
ovs_strerror(int error)
{
enum { BUFSIZE = sizeof strerror_buffer_get()->s };
int save_errno;
char *buffer;
char *s;
if (error == 0) {
/*
* strerror(0) varies among platforms:
*
* Success
* No error
* Undefined error: 0
*
* We want to provide a consistent result here because
* our testsuite has test cases that strictly match
* log messages containing this string.
*/
return "Success";
}
save_errno = errno;
buffer = strerror_buffer_get()->s;
#if STRERROR_R_CHAR_P
/* GNU style strerror_r() might return an immutable static string, or it
* might write and return 'buffer', but in either case we can pass the
* returned string directly to the caller. */
s = strerror_r(error, buffer, BUFSIZE);
#else /* strerror_r() returns an int. */
s = buffer;
if (strerror_r(error, buffer, BUFSIZE)) {
/* strerror_r() is only allowed to fail on ERANGE (because the buffer
* is too short). We don't check the actual failure reason because
* POSIX requires strerror_r() to return the error but old glibc
* (before 2.13) returns -1 and sets errno. */
snprintf(buffer, BUFSIZE, "Unknown error %d", error);
}
#endif
errno = save_errno;
return s;
}
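/* Usage sketch (illustrative only): the returned string lives in per-thread
 * storage, so it is safe to use in concurrent log messages, but it must be
 * copied if it needs to outlive the next ovs_strerror() call on the same
 * thread:
 *
 *     VLOG_WARN("open failed (%s)", ovs_strerror(ENOENT));
 *
 * On glibc this logs "open failed (No such file or directory)"; the exact
 * wording is platform dependent.
 */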
/* Sets global "program_name" and "program_version" variables. Should
* be called at the beginning of main() with "argv[0]" as the argument
* to 'argv0'.
*
* 'version' should contain the version of the caller's program. If 'version'
* is the same as the VERSION #define, the caller is assumed to be part of Open
* vSwitch. Otherwise, it is assumed to be an external program linking against
* the Open vSwitch libraries.
*
*/
void
ovs_set_program_name(const char *argv0, const char *version)
{
char *basename;
#ifdef _WIN32
size_t max_len = strlen(argv0) + 1;
SetErrorMode(GetErrorMode() | SEM_NOGPFAULTERRORBOX);
#if _MSC_VER < 1900
/* This function was deprecated in _MSC_VER 1900 (Visual Studio 2015). */
_set_output_format(_TWO_DIGIT_EXPONENT);
#endif
basename = xmalloc(max_len);
_splitpath_s(argv0, NULL, 0, NULL, 0, basename, max_len, NULL, 0);
#else
const char *slash = strrchr(argv0, '/');
basename = xstrdup(slash ? slash + 1 : argv0);
#endif
assert_single_threaded();
free(program_name);
/* Remove libtool prefix, if it is there */
if (strncmp(basename, "lt-", 3) == 0) {
char *tmp_name = basename;
basename = xstrdup(basename + 3);
free(tmp_name);
}
program_name = basename;
free(program_version);
if (!strcmp(version, VERSION)) {
program_version = xasprintf("%s (Open vSwitch) "VERSION"\n",
program_name);
} else {
program_version = xasprintf("%s %s\n"
"Open vSwitch Library "VERSION"\n",
program_name, version);
}
}
/* Returns the name of the currently running thread or process. */
const char *
get_subprogram_name(void)
{
const char *name = subprogram_name_get();
return name ? name : "";
}
/* Sets 'subprogram_name' as the name of the currently running thread or
* process. (This appears in log messages and may also be visible in system
* process listings and debuggers.) */
void
set_subprogram_name(const char *subprogram_name)
{
char *pname = xstrdup(subprogram_name ? subprogram_name : program_name);
free(subprogram_name_set(pname));
#if HAVE_GLIBC_PTHREAD_SETNAME_NP
/* The maximum supported thread name including '\0' is 16.
* Add '>' at 0th position to highlight that the name was truncated. */
if (strlen(pname) > 15) {
memmove(pname, &pname[strlen(pname) - 15], 15 + 1);
pname[0] = '>';
}
pthread_setname_np(pthread_self(), pname);
#elif HAVE_NETBSD_PTHREAD_SETNAME_NP
pthread_setname_np(pthread_self(), "%s", pname);
#elif HAVE_PTHREAD_SET_NAME_NP
pthread_set_name_np(pthread_self(), pname);
#endif
}
unsigned int
get_page_size(void)
{
static unsigned int cached;
if (!cached) {
#ifndef _WIN32
long int value = sysconf(_SC_PAGESIZE);
#else
long int value;
SYSTEM_INFO sysinfo;
GetSystemInfo(&sysinfo);
value = sysinfo.dwPageSize;
#endif
if (value >= 0) {
cached = value;
}
}
return cached;
}
/* Returns the time at which the system booted, as the number of milliseconds
* since the epoch, or 0 if the time of boot cannot be determined. */
long long int
get_boot_time(void)
{
static long long int cache_expiration = LLONG_MIN;
static long long int boot_time;
ovs_assert(LINUX);
if (time_msec() >= cache_expiration) {
static const char stat_file[] = "/proc/stat";
char line[128];
FILE *stream;
cache_expiration = time_msec() + 5 * 1000;
stream = fopen(stat_file, "r");
if (!stream) {
VLOG_ERR_ONCE("%s: open failed (%s)",
stat_file, ovs_strerror(errno));
return boot_time;
}
while (fgets(line, sizeof line, stream)) {
long long int btime;
if (ovs_scan(line, "btime %lld", &btime)) {
boot_time = btime * 1000;
goto done;
}
}
VLOG_ERR_ONCE("%s: btime not found", stat_file);
done:
fclose(stream);
}
return boot_time;
}
/* This is a wrapper for setting the timeout in control utilities.
 * The value of the OVS_CTL_TIMEOUT environment variable is used by
 * default if 'secs' is not specified. */
void
ctl_timeout_setup(unsigned int secs)
{
if (!secs) {
char *env = getenv("OVS_CTL_TIMEOUT");
if (env && env[0]) {
str_to_uint(env, 10, &secs);
}
}
if (secs) {
time_alarm(secs);
}
}
/* Returns a pointer to a string describing the program version. The
* caller must not modify or free the returned string.
*/
const char *
ovs_get_program_version(void)
{
return program_version;
}
/* Returns a pointer to a string describing the program name. The
* caller must not modify or free the returned string.
*/
const char *
ovs_get_program_name(void)
{
return program_name;
}
/* Print the version information for the program. */
void
ovs_print_version(uint8_t min_ofp, uint8_t max_ofp)
{
printf("%s", program_version);
if (min_ofp || max_ofp) {
printf("OpenFlow versions %#x:%#x\n", min_ofp, max_ofp);
}
}
/* Writes the 'size' bytes in 'buf' to 'stream' as hex bytes arranged 16 per
* line. Numeric offsets are also included, starting at 'ofs' for the first
* byte in 'buf'. If 'ascii' is true then the corresponding ASCII characters
* are also rendered alongside. */
void
ovs_hex_dump(FILE *stream, const void *buf_, size_t size,
uintptr_t ofs, bool ascii)
{
const uint8_t *buf = buf_;
const size_t per_line = 16; /* Maximum bytes per line. */
while (size > 0) {
size_t i;
/* Number of bytes on this line. */
size_t start = ofs % per_line;
size_t end = per_line;
if (end - start > size) {
end = start + size;
}
size_t n = end - start;
/* Print line. */
fprintf(stream, "%08"PRIxMAX" ",
(uintmax_t) ROUND_DOWN(ofs, per_line));
for (i = 0; i < start; i++) {
fprintf(stream, " ");
}
for (; i < end; i++) {
fprintf(stream, "%c%02x",
i == per_line / 2 ? '-' : ' ', buf[i - start]);
}
if (ascii) {
fprintf(stream, " ");
for (; i < per_line; i++) {
fprintf(stream, " ");
}
fprintf(stream, "|");
for (i = 0; i < start; i++) {
fprintf(stream, " ");
}
for (; i < end; i++) {
int c = buf[i - start];
putc(c >= 32 && c < 127 ? c : '.', stream);
}
for (; i < per_line; i++) {
fprintf(stream, " ");
}
fprintf(stream, "|");
}
fprintf(stream, "\n");
ofs += n;
buf += n;
size -= n;
}
}
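/* Usage sketch (illustrative only; 'pkt' is a hypothetical buffer): dumping
 * a received buffer to stderr in the classic "offset, hex bytes, ASCII"
 * layout, starting the offset column at 0:
 *
 *     uint8_t pkt[64];
 *     ...
 *     ovs_hex_dump(stderr, pkt, sizeof pkt, 0, true);
 */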
bool
str_to_int(const char *s, int base, int *i)
{
long long ll;
bool ok = str_to_llong(s, base, &ll);
if (!ok || ll < INT_MIN || ll > INT_MAX) {
*i = 0;
return false;
}
*i = ll;
return true;
}
bool
str_to_long(const char *s, int base, long *li)
{
long long ll;
bool ok = str_to_llong(s, base, &ll);
if (!ok || ll < LONG_MIN || ll > LONG_MAX) {
*li = 0;
return false;
}
*li = ll;
return true;
}
bool
str_to_llong(const char *s, int base, long long *x)
{
char *tail;
bool ok = str_to_llong_with_tail(s, &tail, base, x);
if (*tail != '\0') {
*x = 0;
return false;
}
return ok;
}
bool
str_to_llong_with_tail(const char *s, char **tail, int base, long long *x)
{
int save_errno = errno;
errno = 0;
*x = strtoll(s, tail, base);
if (errno == EINVAL || errno == ERANGE || *tail == s) {
errno = save_errno;
*x = 0;
return false;
} else {
errno = save_errno;
return true;
}
}
bool
str_to_uint(const char *s, int base, unsigned int *u)
{
long long ll;
bool ok = str_to_llong(s, base, &ll);
if (!ok || ll < 0 || ll > UINT_MAX) {
*u = 0;
return false;
} else {
*u = ll;
return true;
}
}
bool
str_to_ullong(const char *s, int base, unsigned long long *x)
{
int save_errno = errno;
char *tail;
errno = 0;
*x = strtoull(s, &tail, base);
if (errno == EINVAL || errno == ERANGE || tail == s || *tail != '\0') {
errno = save_errno;
*x = 0;
return false;
} else {
errno = save_errno;
return true;
}
}
bool
str_to_llong_range(const char *s, int base, long long *begin,
long long *end)
{
char *tail;
if (str_to_llong_with_tail(s, &tail, base, begin)
&& *tail == '-'
&& str_to_llong(tail + 1, base, end)) {
return true;
}
*begin = 0;
*end = 0;
return false;
}
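/* Usage sketch (illustrative only): the str_to_*() helpers return false and
 * store 0 on any parse or range error, so callers can test the return value
 * without inspecting errno:
 *
 *     int port;
 *     long long lo, hi;
 *
 *     str_to_int("6653", 10, &port)               true, port == 6653
 *     str_to_int("0x10", 16, &port)               true, port == 16
 *     str_to_int("6653x", 10, &port)              false, port == 0
 *     str_to_llong_range("10-20", 10, &lo, &hi)   true, lo == 10, hi == 20
 */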
/* Converts floating-point string 's' into a double. If successful, stores
* the double in '*d' and returns true; on failure, stores 0 in '*d' and
* returns false.
*
* Underflow (e.g. "1e-9999") is not considered an error, but overflow
* (e.g. "1e9999)" is. */
bool
str_to_double(const char *s, double *d)
{
int save_errno = errno;
char *tail;
errno = 0;
*d = strtod(s, &tail);
if (errno == EINVAL || (errno == ERANGE && *d != 0)
|| tail == s || *tail != '\0') {
errno = save_errno;
*d = 0;
return false;
} else {
errno = save_errno;
return true;
}
}
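/* For example (illustrative only):
 *
 *     double d;
 *
 *     str_to_double("2.5e3", &d)      true, d == 2500.0
 *     str_to_double("1e-9999", &d)    true: underflow is not an error
 *     str_to_double("1e9999", &d)     false: overflow, d set to 0
 *     str_to_double("2.5 Mbps", &d)   false: trailing garbage, d set to 0
 */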
/* Returns the value of 'c' as a hexadecimal digit. */
int
hexit_value(unsigned char c)
{
static const signed char tbl[UCHAR_MAX + 1] = {
#define TBL(x) \
( x >= '0' && x <= '9' ? x - '0' \
: x >= 'a' && x <= 'f' ? x - 'a' + 0xa \
: x >= 'A' && x <= 'F' ? x - 'A' + 0xa \
: -1)
#define TBL0(x) TBL(x), TBL((x) + 1), TBL((x) + 2), TBL((x) + 3)
#define TBL1(x) TBL0(x), TBL0((x) + 4), TBL0((x) + 8), TBL0((x) + 12)
#define TBL2(x) TBL1(x), TBL1((x) + 16), TBL1((x) + 32), TBL1((x) + 48)
TBL2(0), TBL2(64), TBL2(128), TBL2(192)
};
return tbl[c];
}
/* Returns the integer value of the 'n' hexadecimal digits starting at 's', or
* UINTMAX_MAX if one of those "digits" is not really a hex digit. Sets '*ok'
* to true if the conversion succeeds or to false if a non-hex digit is
* detected. */
uintmax_t
hexits_value(const char *s, size_t n, bool *ok)
{
uintmax_t value;
size_t i;
value = 0;
for (i = 0; i < n; i++) {
int hexit = hexit_value(s[i]);
if (hexit < 0) {
*ok = false;
return UINTMAX_MAX;
}
value = (value << 4) + hexit;
}
*ok = true;
return value;
}
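/* For example (illustrative only):
 *
 *     bool ok;
 *
 *     hexits_value("beef", 4, &ok)   returns 0xbeef, ok == true
 *     hexits_value("be:f", 4, &ok)   returns UINTMAX_MAX, ok == false
 */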
/* Parses the string in 's' as an integer in either hex or decimal format and
* puts the result right justified in the array 'valuep' that is 'field_width'
* big. If the string is in hex format, the value may be arbitrarily large;
* integers are limited to 64-bit values. (The rationale is that decimal is
* likely to represent a number and 64 bits is a reasonable maximum whereas
* hex could either be a number or a byte string.)
*
* On return 'tail' points to the first character in the string that was
* not parsed as part of the value. ERANGE is returned if the value is too
* large to fit in the given field. */
int
parse_int_string(const char *s, uint8_t *valuep, int field_width, char **tail)
{
unsigned long long int integer;
int i;
if (!strncmp(s, "0x", 2) || !strncmp(s, "0X", 2)) {
uint8_t *hexit_str;
int len = 0;
int val_idx;
int err = 0;
s += 2;
hexit_str = xmalloc(field_width * 2);
for (;;) {
uint8_t hexit;
bool ok;
s += strspn(s, " \t\r\n");
hexit = hexits_value(s, 1, &ok);
if (!ok) {
*tail = CONST_CAST(char *, s);
break;
}
if (hexit != 0 || len) {
if (DIV_ROUND_UP(len + 1, 2) > field_width) {
err = ERANGE;
goto free;
}
hexit_str[len] = hexit;
len++;
}
s++;
}
val_idx = field_width;
for (i = len - 1; i >= 0; i -= 2) {
val_idx--;
valuep[val_idx] = hexit_str[i];
if (i > 0) {
valuep[val_idx] += hexit_str[i - 1] << 4;
}
}
memset(valuep, 0, val_idx);
free:
free(hexit_str);
return err;
}
errno = 0;
integer = strtoull(s, tail, 0);
if (errno || s == *tail) {
return errno ? errno : EINVAL;
}
for (i = field_width - 1; i >= 0; i--) {
valuep[i] = integer;
integer >>= 8;
}
if (integer) {
return ERANGE;
}
return 0;
}
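/* Usage sketch (illustrative only): filling a 2-byte field from either a hex
 * byte string or a decimal number:
 *
 *     uint8_t value[2];
 *     char *tail;
 *
 *     parse_int_string("0x1234", value, 2, &tail)    value: 0x12 0x34
 *     parse_int_string("258", value, 2, &tail)       value: 0x01 0x02
 *     parse_int_string("0x10000", value, 2, &tail)   returns ERANGE
 */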
/* Returns the current working directory as a malloc()'d string, or a null
* pointer if the current working directory cannot be determined. */
char *
get_cwd(void)
{
long int path_max;
size_t size;
/* Get maximum path length or at least a reasonable estimate. */
#ifndef _WIN32
path_max = pathconf(".", _PC_PATH_MAX);
#else
path_max = MAX_PATH;
#endif
size = (path_max < 0 ? 1024
: path_max > 10240 ? 10240
: path_max);
/* Get current working directory. */
for (;;) {
char *buf = xmalloc(size);
if (getcwd(buf, size)) {
return xrealloc(buf, strlen(buf) + 1);
} else {
int error = errno;
free(buf);
if (error != ERANGE) {
VLOG_WARN("getcwd failed (%s)", ovs_strerror(error));
return NULL;
}
size *= 2;
}
}
}
static char *
all_slashes_name(const char *s)
{
return xstrdup(s[0] == '/' && s[1] == '/' && s[2] != '/' ? "//"
: s[0] == '/' ? "/"
: ".");
}
#ifndef _WIN32
/* Returns the directory name portion of 'file_name' as a malloc()'d string,
* similar to the POSIX dirname() function but thread-safe. */
char *
dir_name(const char *file_name)
{
size_t len = strlen(file_name);
while (len > 0 && file_name[len - 1] == '/') {
len--;
}
while (len > 0 && file_name[len - 1] != '/') {
len--;
}
while (len > 0 && file_name[len - 1] == '/') {
len--;
}
return len ? xmemdup0(file_name, len) : all_slashes_name(file_name);
}
/* Returns the file name portion of 'file_name' as a malloc()'d string,
* similar to the POSIX basename() function but thread-safe. */
char *
base_name(const char *file_name)
{
size_t end, start;
end = strlen(file_name);
while (end > 0 && file_name[end - 1] == '/') {
end--;
}
if (!end) {
return all_slashes_name(file_name);
}
start = end;
while (start > 0 && file_name[start - 1] != '/') {
start--;
}
return xmemdup0(file_name + start, end - start);
}
#endif /* _WIN32 */
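/* For example (illustrative only), both functions mirror the POSIX
 * utilities:
 *
 *     dir_name("/usr/lib/")    returns "/usr"
 *     dir_name("conf.db")      returns "."
 *     base_name("/usr/lib/")   returns "lib"
 *     base_name("/")           returns "/"
 *
 * Each result is freshly allocated and must be free()d by the caller.
 */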
bool
is_file_name_absolute(const char *fn)
{
#ifdef _WIN32
/* Use the platform-specific API. */
return !PathIsRelative(fn);
#else
/* An absolute path begins with /. */
return fn[0] == '/';
#endif
}
/* If 'file_name' is absolute, returns a copy of 'file_name'. Otherwise,
* returns an absolute path to 'file_name' considering it relative to 'dir',
* which itself must be absolute. 'dir' may be null or the empty string, in
* which case the current working directory is used.
*
* Returns a null pointer if 'dir' is null and getcwd() fails. */
char *
abs_file_name(const char *dir, const char *file_name)
{
/* If it's already absolute, return a copy. */
if (is_file_name_absolute(file_name)) {
return xstrdup(file_name);
}
/* If a base dir was supplied, use it. We assume, without checking, that
* the base dir is absolute. */
if (dir && dir[0]) {
char *separator = dir[strlen(dir) - 1] == '/' ? "" : "/";
return xasprintf("%s%s%s", dir, separator, file_name);
}
#if _WIN32
/* It's a little complicated to make an absolute path on Windows because a
* relative path might still specify a drive letter. The OS has a function
* to do the job for us, so use it. */
char abs_path[MAX_PATH];
DWORD n = GetFullPathName(file_name, sizeof abs_path, abs_path, NULL);
return n > 0 && n <= sizeof abs_path ? xmemdup0(abs_path, n) : NULL;
#else
/* Outside Windows, do the job ourselves. */
char *cwd = get_cwd();
if (!cwd) {
return NULL;
}
char *abs_name = xasprintf("%s/%s", cwd, file_name);
free(cwd);
return abs_name;
#endif
}
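/* Usage sketch (illustrative only; the paths are hypothetical):
 *
 *     abs_file_name("/etc/openvswitch", "conf.db")
 *         returns "/etc/openvswitch/conf.db"
 *     abs_file_name(NULL, "conf.db")
 *         returns the current working directory with "/conf.db" appended,
 *         or NULL if getcwd() fails
 *     abs_file_name(NULL, "/var/run/db.sock")
 *         returns "/var/run/db.sock"
 *
 * The caller owns and must free() the returned string.
 */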
/* Like readlink(), but returns the link name as a null-terminated string in
* allocated memory that the caller must eventually free (with free()).
* Returns NULL on error, in which case errno is set appropriately. */
static char *
xreadlink(const char *filename)
{
#ifdef _WIN32
errno = ENOENT;
return NULL;
#else
size_t size;
for (size = 64; ; size *= 2) {
char *buf = xmalloc(size);
ssize_t retval = readlink(filename, buf, size);
int error = errno;
if (retval >= 0 && retval < size) {
buf[retval] = '\0';
return buf;
}
free(buf);
if (retval < 0) {
errno = error;
return NULL;
}
}
#endif
}
/* Returns a version of 'filename' with symlinks in the final component
* dereferenced. This differs from realpath() in that:
*
* - 'filename' need not exist.
*
* - If 'filename' does exist as a symlink, its referent need not exist.
*
* - Only symlinks in the final component of 'filename' are dereferenced.
*
* For Windows platform, this function returns a string that has the same
* value as the passed string.
*
* The caller must eventually free the returned string (with free()). */
char *
follow_symlinks(const char *filename)
{
#ifndef _WIN32
struct stat s;
char *fn;
int i;
fn = xstrdup(filename);
for (i = 0; i < 10; i++) {
char *linkname;
char *next_fn;
if (lstat(fn, &s) != 0 || !S_ISLNK(s.st_mode)) {
return fn;
}
linkname = xreadlink(fn);
if (!linkname) {
VLOG_WARN("%s: readlink failed (%s)",
filename, ovs_strerror(errno));
return fn;
}
if (linkname[0] == '/') {
/* Target of symlink is absolute so use it raw. */
next_fn = linkname;
} else {
/* Target of symlink is relative so add to 'fn''s directory. */
char *dir = dir_name(fn);
if (!strcmp(dir, ".")) {
next_fn = linkname;
} else {
char *separator = dir[strlen(dir) - 1] == '/' ? "" : "/";
next_fn = xasprintf("%s%s%s", dir, separator, linkname);
free(linkname);
}
free(dir);
}
free(fn);
fn = next_fn;
}
VLOG_WARN("%s: too many levels of symlinks", filename);
free(fn);
#endif
return xstrdup(filename);
}
/* Pass a value to this function if it is marked with
* __attribute__((warn_unused_result)) and you genuinely want to ignore
* its return value. (Note that every scalar type can be implicitly
* converted to bool.) */
void ignore(bool x OVS_UNUSED) { }
/* Returns an appropriate delimiter for inserting just before the 0-based item
* 'index' in a list that has 'total' items in it. */
const char *
english_list_delimiter(size_t index, size_t total)
{
return (index == 0 ? ""
: index < total - 1 ? ", "
: total > 2 ? ", and "
: " and ");
}
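/* Usage sketch (illustrative only; 'ports' and 'n_ports' are hypothetical):
 * printing a list with proper English punctuation, e.g. "eth0",
 * "eth0 and eth1", or "eth0, eth1, and eth2":
 *
 *     for (size_t i = 0; i < n_ports; i++) {
 *         printf("%s%s", english_list_delimiter(i, n_ports), ports[i]);
 *     }
 */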
/* Returns the number of trailing 0-bits in 'n'. Undefined if 'n' == 0. */
#if __GNUC__ >= 4 || _MSC_VER
/* Defined inline in util.h. */
#else
/* Returns the number of trailing 0-bits in 'n'. Undefined if 'n' == 0. */
int
raw_ctz(uint64_t n)
{
uint64_t k;
int count = 63;
#define CTZ_STEP(X) \
k = n << (X); \
if (k) { \
count -= X; \
n = k; \
}
CTZ_STEP(32);
CTZ_STEP(16);
CTZ_STEP(8);
CTZ_STEP(4);
CTZ_STEP(2);
CTZ_STEP(1);
#undef CTZ_STEP
return count;
}
/* Returns the number of leading 0-bits in 'n'. Undefined if 'n' == 0. */
int
raw_clz64(uint64_t n)
{
uint64_t k;
int count = 63;
#define CLZ_STEP(X) \
k = n >> (X); \
if (k) { \
count -= X; \
n = k; \
}
CLZ_STEP(32);
CLZ_STEP(16);
CLZ_STEP(8);
CLZ_STEP(4);
CLZ_STEP(2);
CLZ_STEP(1);
#undef CLZ_STEP
return count;
}
#endif
#if NEED_COUNT_1BITS_8
#define INIT1(X) \
((((X) & (1 << 0)) != 0) + \
(((X) & (1 << 1)) != 0) + \
(((X) & (1 << 2)) != 0) + \
(((X) & (1 << 3)) != 0) + \
(((X) & (1 << 4)) != 0) + \
(((X) & (1 << 5)) != 0) + \
(((X) & (1 << 6)) != 0) + \
(((X) & (1 << 7)) != 0))
#define INIT2(X) INIT1(X), INIT1((X) + 1)
#define INIT4(X) INIT2(X), INIT2((X) + 2)
#define INIT8(X) INIT4(X), INIT4((X) + 4)
#define INIT16(X) INIT8(X), INIT8((X) + 8)
#define INIT32(X) INIT16(X), INIT16((X) + 16)
#define INIT64(X) INIT32(X), INIT32((X) + 32)
const uint8_t count_1bits_8[256] = {
INIT64(0), INIT64(64), INIT64(128), INIT64(192)
};
#endif
/* Returns true if the 'n' bytes starting at 'p' are 'byte'. */
bool
is_all_byte(const void *p_, size_t n, uint8_t byte)
{
const uint8_t *p = p_;
size_t i;
for (i = 0; i < n; i++) {
if (p[i] != byte) {
return false;
}
}
return true;
}
/* Returns true if the 'n' bytes starting at 'p' are zeros. */
bool
is_all_zeros(const void *p, size_t n)
{
return is_all_byte(p, n, 0);
}
/* Returns true if the 'n' bytes starting at 'p' are 0xff. */
bool
is_all_ones(const void *p, size_t n)
{
return is_all_byte(p, n, 0xff);
}
/* *dst |= *src for 'n' bytes. */
void
or_bytes(void *dst_, const void *src_, size_t n)
{
const uint8_t *src = src_;
uint8_t *dst = dst_;
size_t i;
for (i = 0; i < n; i++) {
*dst++ |= *src++;
}
}
/* Copies 'n_bits' bits starting from bit 'src_ofs' in 'src' to the 'n_bits'
* starting from bit 'dst_ofs' in 'dst'. 'src' is 'src_len' bytes long and
* 'dst' is 'dst_len' bytes long.
*
* If you consider all of 'src' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in src[src_len - 1], bit 1 is the bit with value 2, bit 2 is
* the bit with value 4, ..., bit 8 is the bit with value 1 in src[src_len -
* 2], and so on. Similarly for 'dst'.
*
* Required invariants:
* src_ofs + n_bits <= src_len * 8
* dst_ofs + n_bits <= dst_len * 8
* 'src' and 'dst' must not overlap.
*/
void
bitwise_copy(const void *src_, unsigned int src_len, unsigned int src_ofs,
void *dst_, unsigned int dst_len, unsigned int dst_ofs,
unsigned int n_bits)
{
const uint8_t *src = src_;
uint8_t *dst = dst_;
src += src_len - (src_ofs / 8 + 1);
src_ofs %= 8;
dst += dst_len - (dst_ofs / 8 + 1);
dst_ofs %= 8;
if (src_ofs == 0 && dst_ofs == 0) {
unsigned int n_bytes = n_bits / 8;
if (n_bytes) {
dst -= n_bytes - 1;
src -= n_bytes - 1;
memcpy(dst, src, n_bytes);
n_bits %= 8;
src--;
dst--;
}
if (n_bits) {
uint8_t mask = (1 << n_bits) - 1;
*dst = (*dst & ~mask) | (*src & mask);
}
} else {
while (n_bits > 0) {
unsigned int max_copy = 8 - MAX(src_ofs, dst_ofs);
unsigned int chunk = MIN(n_bits, max_copy);
uint8_t mask = ((1 << chunk) - 1) << dst_ofs;
*dst &= ~mask;
*dst |= ((*src >> src_ofs) << dst_ofs) & mask;
src_ofs += chunk;
if (src_ofs == 8) {
src--;
src_ofs = 0;
}
dst_ofs += chunk;
if (dst_ofs == 8) {
dst--;
dst_ofs = 0;
}
n_bits -= chunk;
}
}
}
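/* Usage sketch (illustrative only): the bit numbering treats the buffer as
 * one big-endian integer, so bit 0 is the least-significant bit of the last
 * byte.  Copying the low 9 bits of a 16-bit value into a 2-byte buffer:
 *
 *     ovs_be16 src = htons(0x01ff);
 *     uint8_t dst[2] = { 0, 0 };
 *
 *     bitwise_copy(&src, sizeof src, 0, dst, sizeof dst, 0, 9);
 *
 * Afterwards dst[0] == 0x01 and dst[1] == 0xff.
 */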
/* Zeros the 'n_bits' bits starting from bit 'dst_ofs' in 'dst'. 'dst' is
* 'dst_len' bytes long.
*
* If you consider all of 'dst' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in dst[dst_len - 1], bit 1 is the bit with value 2, bit 2 is
* the bit with value 4, ..., bit 8 is the bit with value 1 in dst[dst_len -
* 2], and so on.
*
* Required invariant:
* dst_ofs + n_bits <= dst_len * 8
*/
void
bitwise_zero(void *dst_, unsigned int dst_len, unsigned dst_ofs,
unsigned int n_bits)
{
uint8_t *dst = dst_;
if (!n_bits) {
return;
}
dst += dst_len - (dst_ofs / 8 + 1);
dst_ofs %= 8;
if (dst_ofs) {
unsigned int chunk = MIN(n_bits, 8 - dst_ofs);
*dst &= ~(((1 << chunk) - 1) << dst_ofs);
n_bits -= chunk;
if (!n_bits) {
return;
}
dst--;
}
while (n_bits >= 8) {
*dst-- = 0;
n_bits -= 8;
}
if (n_bits) {
*dst &= ~((1 << n_bits) - 1);
}
}
/* Sets to 1 all of the 'n_bits' bits starting from bit 'dst_ofs' in 'dst'.
* 'dst' is 'dst_len' bytes long.
*
* If you consider all of 'dst' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in dst[dst_len - 1], bit 1 is the bit with value 2, bit 2 is
* the bit with value 4, ..., bit 8 is the bit with value 1 in dst[dst_len -
* 2], and so on.
*
* Required invariant:
* dst_ofs + n_bits <= dst_len * 8
*/
void
bitwise_one(void *dst_, unsigned int dst_len, unsigned dst_ofs,
unsigned int n_bits)
{
uint8_t *dst = dst_;
if (!n_bits) {
return;
}
dst += dst_len - (dst_ofs / 8 + 1);
dst_ofs %= 8;
if (dst_ofs) {
unsigned int chunk = MIN(n_bits, 8 - dst_ofs);
*dst |= ((1 << chunk) - 1) << dst_ofs;
n_bits -= chunk;
if (!n_bits) {
return;
}
dst--;
}
while (n_bits >= 8) {
*dst-- = 0xff;
n_bits -= 8;
}
if (n_bits) {
*dst |= (1 << n_bits) - 1;
}
}
/* Scans the 'n_bits' bits starting from bit 'ofs' in 'p' for 1-bits.
 * Returns false if any 1-bits are found, otherwise true.  'p' is 'len'
 * bytes long.
 *
 * If you consider all of 'p' to be a single unsigned integer in network byte
 * order, then bit N is the bit with value 2**N.  That is, bit 0 is the bit
 * with value 1 in p[len - 1], bit 1 is the bit with value 2, bit 2 is the
 * bit with value 4, ..., bit 8 is the bit with value 1 in p[len - 2], and so
 * on.
 *
 * Required invariant:
 * ofs + n_bits <= len * 8
*/
bool
bitwise_is_all_zeros(const void *p_, unsigned int len, unsigned int ofs,
unsigned int n_bits)
{
const uint8_t *p = p_;
if (!n_bits) {
return true;
}
p += len - (ofs / 8 + 1);
ofs %= 8;
if (ofs) {
unsigned int chunk = MIN(n_bits, 8 - ofs);
if (*p & (((1 << chunk) - 1) << ofs)) {
return false;
}
n_bits -= chunk;
if (!n_bits) {
return true;
}
p--;
}
while (n_bits >= 8) {
if (*p) {
return false;
}
n_bits -= 8;
p--;
}
if (n_bits && *p & ((1 << n_bits) - 1)) {
return false;
}
return true;
}
/* Scans the bits in 'p' that have bit offsets 'start' (inclusive) through
* 'end' (exclusive) for the first bit with value 'target'. If one is found,
* returns its offset, otherwise 'end'. 'p' is 'len' bytes long.
*
* If you consider all of 'p' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in p[len - 1], bit 1 is the bit with value 2, bit 2 is the bit
* with value 4, ..., bit 8 is the bit with value 1 in p[len - 2], and so on.
*
* Required invariant:
* start <= end
*/
unsigned int
bitwise_scan(const void *p, unsigned int len, bool target, unsigned int start,
unsigned int end)
{
unsigned int ofs;
for (ofs = start; ofs < end; ofs++) {
if (bitwise_get_bit(p, len, ofs) == target) {
break;
}
}
return ofs;
}
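/* For example (illustrative only), scanning a 2-byte map in which only bit 4
 * (the 0x10 bit of map[1]) is set:
 *
 *     uint8_t map[2] = { 0x00, 0x10 };
 *
 *     bitwise_scan(map, sizeof map, true, 0, 16)    returns 4
 *     bitwise_scan(map, sizeof map, false, 4, 16)   returns 5
 */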
/* Scans the bits in 'p' that have bit offsets 'start' (inclusive) through
* 'end' (exclusive) for the first bit with value 'target', in reverse order.
* If one is found, returns its offset, otherwise 'end'. 'p' is 'len' bytes
* long.
*
* If you consider all of 'p' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in p[len - 1], bit 1 is the bit with value 2, bit 2 is the bit
* with value 4, ..., bit 8 is the bit with value 1 in p[len - 2], and so on.
*
* To scan an entire bit array in reverse order, specify start == len * 8 - 1
* and end == -1, in which case the return value is nonnegative if successful
* and -1 if no 'target' match is found.
*
* Required invariant:
* start >= end
*/
int
bitwise_rscan(const void *p, unsigned int len, bool target, int start, int end)
{
const uint8_t *s = p;
int start_byte = len - (start / 8 + 1);
int end_byte = len - (end / 8 + 1);
int ofs_byte;
int ofs;
uint8_t the_byte;
/* Find the target in the start_byte from starting offset */
ofs_byte = start_byte;
the_byte = s[ofs_byte];
for (ofs = start % 8; ofs >= 0; ofs--) {
if (((the_byte & (1u << ofs)) != 0) == target) {
break;
}
}
if (ofs < 0) {
/* Target not found in start byte, continue searching byte by byte */
for (ofs_byte = start_byte + 1; ofs_byte <= end_byte; ofs_byte++) {
if ((target && s[ofs_byte])
|| (!target && (s[ofs_byte] != 0xff))) {
break;
}
}
if (ofs_byte > end_byte) {
return end;
}
the_byte = s[ofs_byte];
/* Target is in the_byte, find it bit by bit */
for (ofs = 7; ofs >= 0; ofs--) {
if (((the_byte & (1u << ofs)) != 0) == target) {
break;
}
}
}
int ret = (len - ofs_byte) * 8 - (8 - ofs);
if (ret < end) {
return end;
}
return ret;
}
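/* For example (illustrative only), scanning a 2-byte map in reverse for the
 * highest 1-bit, where only bit 15 (the 0x80 bit of map[0]) is set:
 *
 *     uint8_t map[2] = { 0x80, 0x00 };
 *
 *     bitwise_rscan(map, sizeof map, true, 15, -1)   returns 15
 *     bitwise_rscan(map, sizeof map, true, 14, -1)   returns -1
 */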
/* Copies the 'n_bits' low-order bits of 'value' into the 'n_bits' bits
* starting at bit 'dst_ofs' in 'dst', which is 'dst_len' bytes long.
*
* If you consider all of 'dst' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in dst[dst_len - 1], bit 1 is the bit with value 2, bit 2 is
* the bit with value 4, ..., bit 8 is the bit with value 1 in dst[dst_len -
* 2], and so on.
*
* Required invariants:
* dst_ofs + n_bits <= dst_len * 8
* n_bits <= 64
*/
void
bitwise_put(uint64_t value,
void *dst, unsigned int dst_len, unsigned int dst_ofs,
unsigned int n_bits)
{
ovs_be64 n_value = htonll(value);
bitwise_copy(&n_value, sizeof n_value, 0,
dst, dst_len, dst_ofs,
n_bits);
}
/* Returns the value of the 'n_bits' bits starting at bit 'src_ofs' in 'src',
* which is 'src_len' bytes long.
*
* If you consider all of 'src' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in src[src_len - 1], bit 1 is the bit with value 2, bit 2 is
* the bit with value 4, ..., bit 8 is the bit with value 1 in src[src_len -
* 2], and so on.
*
* Required invariants:
* src_ofs + n_bits <= src_len * 8
* n_bits <= 64
*/
uint64_t
bitwise_get(const void *src, unsigned int src_len,
unsigned int src_ofs, unsigned int n_bits)
{
ovs_be64 value = htonll(0);
bitwise_copy(src, src_len, src_ofs,
&value, sizeof value, 0,
n_bits);
return ntohll(value);
}
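/* Usage sketch (illustrative only): writing and then reading back a 3-bit
 * field at bit offset 4 of a 3-byte buffer:
 *
 *     uint8_t buf[3] = { 0, 0, 0 };
 *
 *     bitwise_put(0x5, buf, sizeof buf, 4, 3);   buf[2] becomes 0x50
 *     bitwise_get(buf, sizeof buf, 4, 3)         returns 0x5
 */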
/* Returns the value of the bit with offset 'ofs' in 'src', which is 'len'
* bytes long.
*
* If you consider all of 'src' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in src[len - 1], bit 1 is the bit with value 2, bit 2 is the
* bit with value 4, ..., bit 8 is the bit with value 1 in src[len - 2], and so
* on.
*
* Required invariants:
* ofs < len * 8
*/
bool
bitwise_get_bit(const void *src_, unsigned int len, unsigned int ofs)
{
const uint8_t *src = src_;
return (src[len - (ofs / 8 + 1)] & (1u << (ofs % 8))) != 0;
}
/* Sets the bit with offset 'ofs' in 'dst', which is 'len' bytes long, to 0.
*
* If you consider all of 'dst' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in dst[len - 1], bit 1 is the bit with value 2, bit 2 is the
* bit with value 4, ..., bit 8 is the bit with value 1 in dst[len - 2], and so
* on.
*
* Required invariants:
* ofs < len * 8
*/
void
bitwise_put0(void *dst_, unsigned int len, unsigned int ofs)
{
uint8_t *dst = dst_;
dst[len - (ofs / 8 + 1)] &= ~(1u << (ofs % 8));
}
/* Sets the bit with offset 'ofs' in 'dst', which is 'len' bytes long, to 1.
*
* If you consider all of 'dst' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in dst[len - 1], bit 1 is the bit with value 2, bit 2 is the
* bit with value 4, ..., bit 8 is the bit with value 1 in dst[len - 2], and so
* on.
*
* Required invariants:
* ofs < len * 8
*/
void
bitwise_put1(void *dst_, unsigned int len, unsigned int ofs)
{
uint8_t *dst = dst_;
dst[len - (ofs / 8 + 1)] |= 1u << (ofs % 8);
}
/* Sets the bit with offset 'ofs' in 'dst', which is 'len' bytes long, to 'b'.
*
* If you consider all of 'dst' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in dst[len - 1], bit 1 is the bit with value 2, bit 2 is the
* bit with value 4, ..., bit 8 is the bit with value 1 in dst[len - 2], and so
* on.
*
* Required invariants:
* ofs < len * 8
*/
void
bitwise_put_bit(void *dst, unsigned int len, unsigned int ofs, bool b)
{
if (b) {
bitwise_put1(dst, len, ofs);
} else {
bitwise_put0(dst, len, ofs);
}
}
/* Flips the bit with offset 'ofs' in 'dst', which is 'len' bytes long.
*
* If you consider all of 'dst' to be a single unsigned integer in network byte
* order, then bit N is the bit with value 2**N. That is, bit 0 is the bit
* with value 1 in dst[len - 1], bit 1 is the bit with value 2, bit 2 is the
* bit with value 4, ..., bit 8 is the bit with value 1 in dst[len - 2], and so
* on.
*
* Required invariants:
* ofs < len * 8
*/
void
bitwise_toggle_bit(void *dst_, unsigned int len, unsigned int ofs)
{
uint8_t *dst = dst_;
dst[len - (ofs / 8 + 1)] ^= 1u << (ofs % 8);
}
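/* Illustrative sketch only: the single-bit helpers above all share the same
 * network-byte-order bit numbering.  The 3-byte buffer and the values checked
 * here are hypothetical examples. */
static void OVS_UNUSED
bitwise_bit_example(void)
{
    uint8_t buf[3] = { 0x00, 0x00, 0x00 };

    bitwise_put1(buf, sizeof buf, 0);        /* Lowest bit: buf[2] |= 0x01. */
    bitwise_put1(buf, sizeof buf, 9);        /* buf[1] |= 0x02. */
    ovs_assert(buf[0] == 0x00 && buf[1] == 0x02 && buf[2] == 0x01);

    bitwise_toggle_bit(buf, sizeof buf, 9);  /* Flips bit 9 back to 0. */
    ovs_assert(!bitwise_get_bit(buf, sizeof buf, 9));

    bitwise_put_bit(buf, sizeof buf, 23, true);  /* Highest bit of buf[0]. */
    ovs_assert(buf[0] == 0x80);
}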
/* ovs_scan */
struct scan_spec {
unsigned int width;
enum {
SCAN_DISCARD,
SCAN_CHAR,
SCAN_SHORT,
SCAN_INT,
SCAN_LONG,
SCAN_LLONG,
SCAN_INTMAX_T,
SCAN_PTRDIFF_T,
SCAN_SIZE_T
} type;
};
static const char *
skip_spaces(const char *s)
{
while (isspace((unsigned char) *s)) {
s++;
}
return s;
}
static const char *
scan_int(const char *s, const struct scan_spec *spec, int base, va_list *args)
{
const char *start = s;
uintmax_t value;
bool negative;
int n_digits;
negative = *s == '-';
s += *s == '-' || *s == '+';
if ((!base || base == 16) && *s == '0' && (s[1] == 'x' || s[1] == 'X')) {
base = 16;
s += 2;
} else if (!base) {
base = *s == '0' ? 8 : 10;
}
if (s - start >= spec->width) {
return NULL;
}
value = 0;
n_digits = 0;
while (s - start < spec->width) {
int digit = hexit_value(*s);
if (digit < 0 || digit >= base) {
break;
}
value = value * base + digit;
n_digits++;
s++;
}
if (!n_digits) {
return NULL;
}
if (negative) {
value = -value;
}
switch (spec->type) {
case SCAN_DISCARD:
break;
case SCAN_CHAR:
*va_arg(*args, char *) = value;
break;
case SCAN_SHORT:
*va_arg(*args, short int *) = value;
break;
case SCAN_INT:
*va_arg(*args, int *) = value;
break;
case SCAN_LONG:
*va_arg(*args, long int *) = value;
break;
case SCAN_LLONG:
*va_arg(*args, long long int *) = value;
break;
case SCAN_INTMAX_T:
*va_arg(*args, intmax_t *) = value;
break;
case SCAN_PTRDIFF_T:
*va_arg(*args, ptrdiff_t *) = value;
break;
case SCAN_SIZE_T:
*va_arg(*args, size_t *) = value;
break;
}
return s;
}
static const char *
skip_digits(const char *s)
{
while (*s >= '0' && *s <= '9') {
s++;
}
return s;
}
static const char *
scan_float(const char *s, const struct scan_spec *spec, va_list *args)
{
const char *start = s;
long double value;
char *tail;
char *copy;
bool ok;
s += *s == '+' || *s == '-';
s = skip_digits(s);
if (*s == '.') {
s = skip_digits(s + 1);
}
if (*s == 'e' || *s == 'E') {
s++;
s += *s == '+' || *s == '-';
s = skip_digits(s);
}
if (s - start > spec->width) {
s = start + spec->width;
}
copy = xmemdup0(start, s - start);
value = strtold(copy, &tail);
ok = *tail == '\0';
free(copy);
if (!ok) {
return NULL;
}
    switch (spec->type) {
    case SCAN_DISCARD:
        break;
    case SCAN_INT:
        /* No length modifier: the argument is a 'float *'. */
        *va_arg(*args, float *) = value;
        break;
    case SCAN_LONG:
        /* 'l' modifier: the argument is a 'double *'. */
        *va_arg(*args, double *) = value;
        break;
    case SCAN_LLONG:
        /* 'L', 'q', or 'll' modifier: the argument is a 'long double *'. */
        *va_arg(*args, long double *) = value;
        break;
case SCAN_CHAR:
case SCAN_SHORT:
case SCAN_INTMAX_T:
case SCAN_PTRDIFF_T:
case SCAN_SIZE_T:
OVS_NOT_REACHED();
}
return s;
}
static void
scan_output_string(const struct scan_spec *spec,
const char *s, size_t n,
va_list *args)
{
if (spec->type != SCAN_DISCARD) {
char *out = va_arg(*args, char *);
memcpy(out, s, n);
out[n] = '\0';
}
}
static const char *
scan_string(const char *s, const struct scan_spec *spec, va_list *args)
{
size_t n;
for (n = 0; n < spec->width; n++) {
if (!s[n] || isspace((unsigned char) s[n])) {
break;
}
}
if (!n) {
return NULL;
}
scan_output_string(spec, s, n, args);
return s + n;
}
static const char *
parse_scanset(const char *p_, unsigned long *set, bool *complemented)
{
const uint8_t *p = (const uint8_t *) p_;
*complemented = *p == '^';
p += *complemented;
if (*p == ']') {
bitmap_set1(set, ']');
p++;
}
while (*p && *p != ']') {
if (p[1] == '-' && p[2] != ']' && p[2] > *p) {
bitmap_set_multiple(set, *p, p[2] - *p + 1, true);
p += 3;
} else {
bitmap_set1(set, *p++);
}
}
if (*p == ']') {
p++;
}
return (const char *) p;
}
static const char *
scan_set(const char *s, const struct scan_spec *spec, const char **pp,
va_list *args)
{
unsigned long set[BITMAP_N_LONGS(UCHAR_MAX + 1)];
bool complemented;
unsigned int n;
/* Parse the scan set. */
memset(set, 0, sizeof set);
*pp = parse_scanset(*pp, set, &complemented);
/* Parse the data. */
n = 0;
while (s[n]
&& bitmap_is_set(set, (unsigned char) s[n]) == !complemented
&& n < spec->width) {
n++;
}
if (!n) {
return NULL;
}
scan_output_string(spec, s, n, args);
return s + n;
}
static const char *
scan_chars(const char *s, const struct scan_spec *spec, va_list *args)
{
unsigned int n = spec->width == UINT_MAX ? 1 : spec->width;
if (strlen(s) < n) {
return NULL;
}
if (spec->type != SCAN_DISCARD) {
memcpy(va_arg(*args, char *), s, n);
}
return s + n;
}
static bool
ovs_scan__(const char *s, int *n, const char *format, va_list *args)
{
const char *const start = s;
bool ok = false;
const char *p;
p = format;
while (*p != '\0') {
struct scan_spec spec;
unsigned char c = *p++;
bool discard;
if (isspace(c)) {
s = skip_spaces(s);
continue;
} else if (c != '%') {
if (*s != c) {
goto exit;
}
s++;
continue;
} else if (*p == '%') {
if (*s++ != '%') {
goto exit;
}
p++;
continue;
}
/* Parse '*' flag. */
discard = *p == '*';
p += discard;
/* Parse field width. */
spec.width = 0;
while (*p >= '0' && *p <= '9') {
spec.width = spec.width * 10 + (*p++ - '0');
}
if (spec.width == 0) {
spec.width = UINT_MAX;
}
/* Parse type modifier. */
switch (*p) {
case 'h':
if (p[1] == 'h') {
spec.type = SCAN_CHAR;
p += 2;
} else {
spec.type = SCAN_SHORT;
p++;
}
break;
case 'j':
spec.type = SCAN_INTMAX_T;
p++;
break;
case 'l':
if (p[1] == 'l') {
spec.type = SCAN_LLONG;
p += 2;
} else {
spec.type = SCAN_LONG;
p++;
}
break;
case 'L':
case 'q':
spec.type = SCAN_LLONG;
p++;
break;
case 't':
spec.type = SCAN_PTRDIFF_T;
p++;
break;
case 'z':
spec.type = SCAN_SIZE_T;
p++;
break;
default:
spec.type = SCAN_INT;
break;
}
if (discard) {
spec.type = SCAN_DISCARD;
}
c = *p++;
if (c != 'c' && c != 'n' && c != '[') {
s = skip_spaces(s);
}
switch (c) {
case 'd':
s = scan_int(s, &spec, 10, args);
break;
case 'i':
s = scan_int(s, &spec, 0, args);
break;
case 'o':
s = scan_int(s, &spec, 8, args);
break;
case 'u':
s = scan_int(s, &spec, 10, args);
break;
case 'x':
case 'X':
s = scan_int(s, &spec, 16, args);
break;
case 'e':
case 'f':
case 'g':
case 'E':
case 'G':
s = scan_float(s, &spec, args);
break;
case 's':
s = scan_string(s, &spec, args);
break;
case '[':
s = scan_set(s, &spec, &p, args);
break;
case 'c':
s = scan_chars(s, &spec, args);
break;
case 'n':
if (spec.type != SCAN_DISCARD) {
*va_arg(*args, int *) = s - start;
}
break;
}
if (!s) {
goto exit;
}
}
if (n) {
*n = s - start;
}
ok = true;
exit:
return ok;
}
/* This is an implementation of the standard sscanf() function, with the
* following exceptions:
*
* - It returns true if the entire format was successfully scanned and
* converted, false if any conversion failed.
*
* - The standard doesn't define sscanf() behavior when an out-of-range value
* is scanned, e.g. if a "%"PRIi8 conversion scans "-1" or "0x1ff". Some
* implementations consider this an error and stop scanning. This
* implementation never considers an out-of-range value an error; instead,
* it stores the least-significant bits of the converted value in the
* destination, e.g. the value 255 for both examples earlier.
*
* - Only single-byte characters are supported, that is, the 'l' modifier
* on %s, %[, and %c is not supported. The GNU extension 'a' modifier is
* also not supported.
*
* - %p is not supported.
*/
bool
ovs_scan(const char *s, const char *format, ...)
{
va_list args;
bool res;
va_start(args, format);
res = ovs_scan__(s, NULL, format, &args);
va_end(args);
return res;
}
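/* Illustrative sketch only: a few hypothetical ovs_scan() calls showing the
 * all-or-nothing return value, scan sets, and the out-of-range behavior
 * described above.  The strings and variable names are made-up examples. */
static void OVS_UNUSED
ovs_scan_example(void)
{
    int vlan, prio;
    char ifname[16];
    unsigned char small;

    /* Succeeds only if every literal and conversion matches. */
    ovs_assert(ovs_scan("vlan=100,prio=7", "vlan=%d,prio=%d", &vlan, &prio));
    ovs_assert(vlan == 100 && prio == 7);

    /* A scan set: accept lowercase letters and digits into a bounded buffer. */
    ovs_assert(ovs_scan("eth0 up", "%15[a-z0-9]", ifname));
    ovs_assert(!strcmp(ifname, "eth0"));

    /* Out-of-range values are truncated to the destination width rather than
     * rejected: 0x1ff stored through "%hhx" leaves 0xff. */
    ovs_assert(ovs_scan("1ff", "%hhx", &small));
    ovs_assert(small == 0xff);

    /* Returns false when the format is not fully matched. */
    ovs_assert(!ovs_scan("vlan=abc", "vlan=%d", &vlan));
}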
/*
 * This function is similar to ovs_scan(), with an extra parameter 'n'.
 * Scanning starts at offset '*n' within 's'; on success, '*n' is advanced by
 * the number of characters consumed.
 */
bool
ovs_scan_len(const char *s, int *n, const char *format, ...)
{
va_list args;
bool success;
int n1;
va_start(args, format);
success = ovs_scan__(s + *n, &n1, format, &args);
va_end(args);
if (success) {
*n = *n + n1;
}
return success;
}
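/* Illustrative sketch only: a hypothetical use of ovs_scan_len() to consume a
 * string in several steps, carrying the offset forward in 'ofs'. */
static void OVS_UNUSED
ovs_scan_len_example(void)
{
    const char *s = "actions=output:3";
    int ofs = 0;
    int port;

    ovs_assert(ovs_scan_len(s, &ofs, "actions=output"));
    ovs_assert(ofs == 14);

    /* The next call picks up where the previous one stopped. */
    ovs_assert(ovs_scan_len(s, &ofs, ":%d", &port));
    ovs_assert(port == 3 && ofs == (int) strlen(s));
}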
void
xsleep(unsigned int seconds)
{
ovsrcu_quiesce_start();
#ifdef _WIN32
Sleep(seconds * 1000);
#else
sleep(seconds);
#endif
ovsrcu_quiesce_end();
}
static void
xnanosleep__(uint64_t nanoseconds)
{
#ifndef _WIN32
int retval;
struct timespec ts_sleep;
nsec_to_timespec(nanoseconds, &ts_sleep);
int error = 0;
do {
retval = nanosleep(&ts_sleep, NULL);
error = retval < 0 ? errno : 0;
} while (error == EINTR);
#else
HANDLE timer = CreateWaitableTimer(NULL, FALSE, NULL);
if (timer) {
LARGE_INTEGER duetime;
        /* A negative due time is relative, and the unit is 100-nanosecond
         * intervals, so convert from nanoseconds. */
        duetime.QuadPart = -(LONGLONG) (nanoseconds / 100);
if (SetWaitableTimer(timer, &duetime, 0, NULL, NULL, FALSE)) {
WaitForSingleObject(timer, INFINITE);
} else {
VLOG_ERR_ONCE("SetWaitableTimer Failed (%s)",
ovs_lasterror_to_string());
}
CloseHandle(timer);
} else {
VLOG_ERR_ONCE("CreateWaitableTimer Failed (%s)",
ovs_lasterror_to_string());
}
#endif
}
/* High resolution sleep with thread quiesce. */
void
xnanosleep(uint64_t nanoseconds)
{
ovsrcu_quiesce_start();
xnanosleep__(nanoseconds);
ovsrcu_quiesce_end();
}
/* High resolution sleep without thread quiesce. */
void
xnanosleep_no_quiesce(uint64_t nanoseconds)
{
xnanosleep__(nanoseconds);
}
#if __linux__
void
set_timer_resolution(unsigned long nanoseconds)
{
prctl(PR_SET_TIMERSLACK, nanoseconds);
}
#else
void
set_timer_resolution(unsigned long nanoseconds OVS_UNUSED)
{
}
#endif
/* Returns true if standard output is an interactive terminal, i.e. it is a
 * tty and $TERM is not set to "dumb".  This is useful for deciding whether to
 * emit color output when a utility's --color option is set to 'auto'. */
bool
is_stdout_a_tty(void)
{
char const *t = getenv("TERM");
return (isatty(STDOUT_FILENO) && t && strcmp(t, "dumb") != 0);
}
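/* Illustrative sketch only: how a utility might use is_stdout_a_tty() to act
 * on its --color option.  'color_option' and this helper are hypothetical,
 * not an existing OVS interface. */
static bool OVS_UNUSED
example_should_use_color(const char *color_option)
{
    if (!strcmp(color_option, "always")) {
        return true;
    } else if (!strcmp(color_option, "never")) {
        return false;
    } else {
        /* "auto": color only when writing to an interactive terminal. */
        return is_stdout_a_tty();
    }
}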
#ifdef _WIN32
char *
ovs_format_message(int error)
{
enum { BUFSIZE = sizeof strerror_buffer_get()->s };
char *buffer = strerror_buffer_get()->s;
if (error == 0) {
/* See ovs_strerror */
return "Success";
}
FormatMessage(FORMAT_MESSAGE_FROM_SYSTEM | FORMAT_MESSAGE_IGNORE_INSERTS,
NULL, error, 0, buffer, BUFSIZE, NULL);
return buffer;
}
/* Returns a null-terminated string that explains the last error.
* Use this function to get the error string for WINAPI calls. */
char *
ovs_lasterror_to_string(void)
{
return ovs_format_message(GetLastError());
}
int
ftruncate(int fd, off_t length)
{
int error;
error = _chsize_s(fd, length);
if (error) {
return -1;
}
return 0;
}
OVS_CONSTRUCTOR(winsock_start) {
WSADATA wsaData;
int error;
error = WSAStartup(MAKEWORD(2, 2), &wsaData);
if (error != 0) {
VLOG_FATAL("WSAStartup failed: %s", sock_strerror(sock_errno()));
}
}
#endif
#ifdef __linux__
bool
ovs_kernel_is_version_or_newer(int target_major, int target_minor)
{
static struct ovsthread_once once = OVSTHREAD_ONCE_INITIALIZER;
    static int current_major = -1, current_minor = -1;
if (ovsthread_once_start(&once)) {
struct utsname utsname;
if (uname(&utsname) == -1) {
VLOG_WARN("uname failed (%s)", ovs_strerror(errno));
} else if (!ovs_scan(utsname.release, "%d.%d",
&current_major, &current_minor)) {
VLOG_WARN("uname reported bad OS release (%s)", utsname.release);
}
ovsthread_once_done(&once);
}
if (current_major == -1 || current_minor == -1) {
return false;
}
return current_major > target_major || (
current_major == target_major && current_minor >= target_minor);
}
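/* Illustrative sketch only: a hypothetical caller that enables an optional
 * code path on newer kernels.  The version numbers are made-up examples. */
static bool OVS_UNUSED
example_kernel_feature_available(void)
{
    /* True on Linux 5.4 and newer (the comparison is inclusive); false on
     * older kernels, and also when uname() fails or reports an unparsable
     * release string, since the helper conservatively reports false then. */
    return ovs_kernel_is_version_or_newer(5, 4);
}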
#endif