ovs/lib/hash.h

/*
 * Copyright (c) 2008, 2009, 2010, 2012, 2013, 2014, 2016 Nicira, Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
#ifndef HASH_H
#define HASH_H 1

#include <stdbool.h>
#include <stddef.h>
#include <stdint.h>
#include <string.h>
#include "util.h"

#ifdef __cplusplus
extern "C" {
#endif

/* Returns 'x' rotated left by 'k' bit positions within 32 bits.
 *
 * The rotation count is reduced modulo 32, so 'k' == 0 (or any multiple of
 * 32) returns 'x' unchanged instead of evaluating a shift by the full width
 * of the type, which C leaves undefined.  For 'k' in the range 1...31 the
 * result is the same as the plain "(x << k) | (x >> (32 - k))" form. */
static inline uint32_t
hash_rot(uint32_t x, int k)
{
    const unsigned int left = (unsigned int) k & 31u;
    const unsigned int right = (32u - left) & 31u;

    return (x << left) | (x >> right);
}

/* Byte-buffer hashes.  Only declared here; their definitions are not part of
 * this header.  hash_string() below uses hash_bytes() to hash the bytes of a
 * C string. */
uint32_t hash_bytes(const void *, size_t n_bytes, uint32_t basis);
/* The hash input must be a word larger than 128 bits.
 * NOTE(review): the result is presumably stored through 'out', since the
 * function returns void -- confirm against the definition. */
void hash_bytes128(const void *_, size_t n_bytes, uint32_t basis,
                   ovs_u128 *out);

/* Fixed-size integer hashes.  The 'static inline' ones are defined later in
 * this header (some of them once per architecture-specific branch);
 * hash_3words() is only declared here. */
static inline uint32_t hash_int(uint32_t x, uint32_t basis);
static inline uint32_t hash_2words(uint32_t, uint32_t);
static inline uint32_t hash_uint64(const uint64_t);
static inline uint32_t hash_uint64_basis(const uint64_t x,
                                         const uint32_t basis);
uint32_t hash_3words(uint32_t, uint32_t, uint32_t);

/* Hashes for other scalar types.  hash_boolean() is defined later in this
 * header; hash_double() is only declared here. */
static inline uint32_t hash_boolean(bool x, uint32_t basis);
uint32_t hash_double(double, uint32_t basis);

/* Hashes for a pointer value and for a null-terminated string, both defined
 * later in this header. */
static inline uint32_t hash_pointer(const void *, uint32_t basis);
static inline uint32_t hash_string(const char *, uint32_t basis);

/* Murmurhash by Austin Appleby,
 * from https://github.com/aappleby/smhasher/blob/master/src/MurmurHash3.cpp
 *
 * The upstream license there says:
 *
 *    MurmurHash3 was written by Austin Appleby, and is placed in the public
 *    domain. The author hereby disclaims copyright to this source code.
 *
 * See hash_words() for sample usage. */

/* Mixes the 32-bit word 'data' into 'hash' and returns the result, without
 * the trailing rotate and multiply-add step that mhash_add() applies. */
static inline uint32_t mhash_add__(uint32_t hash, uint32_t data)
{
    uint32_t mixed;

    /* Zero stays zero through both multiplications and the rotation, so the
     * XOR at the end would leave 'hash' untouched.  Skip the arithmetic. */
    if (data == 0) {
        return hash;
    }

    mixed = data * 0xcc9e2d51;
    mixed = hash_rot(mixed, 15);
    mixed *= 0x1b873593;
    return hash ^ mixed;
}

/* Mixes the 32-bit word 'data' into 'hash': applies mhash_add__(), rotates
 * the result left by 13 bits, then multiplies by 5 and adds a constant.
 * Returns the updated hash, which still needs mhash_finish(). */
static inline uint32_t mhash_add(uint32_t hash, uint32_t data)
{
    const uint32_t rotated = hash_rot(mhash_add__(hash, data), 13);

    return rotated * 5 + 0xe6546b64;
}

/* Final mixing step for the murmurhash-based functions: alternates
 * xor-with-right-shift and multiplication by odd constants so that every
 * input bit can influence every output bit.  Returns the finished hash. */
static inline uint32_t mhash_finish(uint32_t hash)
{
    uint32_t h = hash;

    h = (h ^ (h >> 16)) * 0x85ebca6b;
    h = (h ^ (h >> 13)) * 0xc2b2ae35;
    return h ^ (h >> 16);
}

/* Incremental hashing primitives.  hash_add() and hash_add64() are defined
 * once per architecture-specific branch below (or, on aarch64 with CRC32
 * support, presumably by "hash-aarch64.h"). */
static inline uint32_t hash_add(uint32_t hash, uint32_t data);
static inline uint32_t hash_add64(uint32_t hash, uint64_t data);

/* Buffer helpers built on hash_add() and hash_add64(); defined near the end
 * of this header. */
static inline uint32_t hash_add_words(uint32_t, const uint32_t *, size_t);
static inline uint32_t hash_add_words64(uint32_t, const uint64_t *, size_t);
static inline uint32_t hash_add_bytes32(uint32_t, const uint32_t *, size_t);
static inline uint32_t hash_add_bytes64(uint32_t, const uint64_t *, size_t);

#if (defined(__ARM_FEATURE_CRC32) && defined(__aarch64__))
#include "hash-aarch64.h"

#elif !(defined(__SSE4_2__) && defined(__x86_64__))
/* Mhash-based implementation. */

/* Mixes the 32-bit word 'data' into the running hash 'hash' and returns the
 * new running hash.  In this branch the work is done by mhash_add(). */
static inline uint32_t hash_add(uint32_t hash, uint32_t data)
{
    const uint32_t updated = mhash_add(hash, data);

    return updated;
}

/* Mixes the 64-bit value 'data' into the running hash 'hash' as two 32-bit
 * words, low half first and high half second.  Returns the new running
 * hash. */
static inline uint32_t hash_add64(uint32_t hash, uint64_t data)
{
    const uint32_t low = (uint32_t) data;
    const uint32_t high = (uint32_t) (data >> 32);

    hash = hash_add(hash, low);
    return hash_add(hash, high);
}

/* Completes a hash built with hash_add(): XORs 'final' into the running
 * hash 'hash' and runs the result through mhash_finish().  The callers in
 * this header pass the input length in bytes as 'final'. */
static inline uint32_t hash_finish(uint32_t hash, uint32_t final)
{
    const uint32_t seeded = hash ^ final;

    return mhash_finish(seeded);
}

/* Returns the hash of the 'n_words' 32-bit words at 'p', starting from
 * 'basis'.  'p' must be properly aligned.
 *
 * The body is kept inline so that the compiler can see 'n_words', which is
 * a constant at many call sites. */
static inline uint32_t
hash_words_inline(const uint32_t *p, size_t n_words, uint32_t basis)
{
    const uint32_t accumulated = hash_add_words(basis, p, n_words);

    /* The input length in bytes is folded in by the finishing step. */
    return hash_finish(accumulated, n_words * 4);
}

/* Returns the hash of the 'n_words' 64-bit words at 'p', starting from
 * 'basis'.  The input length in bytes is folded in by the finishing step. */
static inline uint32_t
hash_words64_inline(const uint64_t *p, size_t n_words, uint32_t basis)
{
    const uint32_t accumulated = hash_add_words64(basis, p, n_words);

    return hash_finish(accumulated, n_words * 8);
}

/* Returns a hash of the pointer value 'p', starting from 'basis'. */
static inline uint32_t hash_pointer(const void *p, uint32_t basis)
{
    /* Pointers are often hashed by casting them straight to an integer, but
     * the low bits of a pointer tend to be all zero because of alignment.
     * It is hard to guess where the entropy really is, so do not try: run
     * the value through a high-quality hash function instead.
     *
     * Converting through uintptr_t first suppresses the warning that 64-bit
     * systems give for casting a pointer to an integer of a different size.
     * Dropping the upper bits is acceptable here, since most of the entropy
     * in the pointer is almost certainly in the lower 32 bits. */
    const uintptr_t address = (uintptr_t) p;

    return hash_int((uint32_t) address, basis);
}

/* Returns a hash of the two 32-bit words 'x' and 'y'.  'x' is used as the
 * initial running hash; a zero word and then 'y' are mixed into it, and the
 * result is finished with a length of 8 bytes. */
static inline uint32_t hash_2words(uint32_t x, uint32_t y)
{
    uint32_t hash = hash_add(x, 0);

    hash = hash_add(hash, y);
    return hash_finish(hash, 8);
}

/* Returns a hash of the 64-bit value 'x', starting from 'basis'.  The value
 * is mixed in with hash_add64() and finished with a length of 8 bytes. */
static inline uint32_t hash_uint64_basis(const uint64_t x,
                                         const uint32_t basis)
{
    const uint32_t mixed = hash_add64(basis, x);

    return hash_finish(mixed, 8);
}

/* Returns a hash of the 64-bit value 'x', using a basis of zero. */
static inline uint32_t hash_uint64(const uint64_t x)
{
    const uint32_t zero_basis = 0;

    return hash_uint64_basis(x, zero_basis);
}

#else /* __SSE4_2__ && __x86_64__ */
#include <smmintrin.h>

/* Mixes the 32-bit word 'data' into the running hash 'hash' with the SSE4.2
 * CRC32 instruction and returns the new running hash. */
static inline uint32_t hash_add(uint32_t hash, uint32_t data)
{
    const uint32_t crc = _mm_crc32_u32(hash, data);

    return crc;
}

/* Mixes the 64-bit value 'data' into the running hash 'hash' with a single
 * 64-bit CRC32 instruction, which adds the two halves of 'data' in memory
 * order.  Returns the new running hash (the CRC is a 32-bit quantity). */
static inline uint32_t hash_add64(uint32_t hash, uint64_t data)
{
    const uint64_t crc = _mm_crc32_u64(hash, data);

    return (uint32_t) crc;
}

/* Completes a CRC32-based hash: mixes 'final' into the running hash 'hash',
 * multiplies by a finishing constant, and folds the upper half of the low
 * 32 bits into the lower half.  Returns the 32-bit result. */
static inline uint32_t hash_finish(uint64_t hash, uint64_t final)
{
    /* The finishing multiplier 0x805204f3 has been experimentally
     * derived to pass the testsuite hash tests. */
    const uint64_t scaled = _mm_crc32_u64(hash, final) * 0x805204f3;
    const uint32_t low = (uint32_t) scaled;

    /* Only the low 32 bits survive the return; XOR in their upper half to
     * increase entropy in the LSBs. */
    return low ^ (low >> 16);
}

/* Completes a CRC32-based hash from 32-bit pieces: mixes 'semifinal' and
 * then 'final' into the low 32 bits of 'hash', multiplies by a finishing
 * constant, and folds the upper half of the low 32 bits into the lower
 * half.  Returns the 32-bit result. */
static inline uint32_t
hash_finish32(uint64_t hash, uint32_t final, uint32_t semifinal)
{
    /* The 32-bit CRC32 instruction consumes only the low 32 bits of the
     * running hash. */
    const uint32_t with_semifinal = _mm_crc32_u32((uint32_t) hash, semifinal);

    /* The finishing multiplier 0x805204f3 has been experimentally
     * derived to pass the testsuite hash tests. */
    const uint64_t scaled = _mm_crc32_u32(with_semifinal, final)
                            * 0x805204f3ULL;
    const uint32_t low = (uint32_t) scaled;

    return low ^ (low >> 16); /* Increase entropy in LSBs. */
}

/* Returns the hash of the 'n_words' 32-bit words at 'p', starting from
 * 'basis', reading the input one 32-bit word at a time.  hash_words_inline()
 * falls back to this function when its input is not 64-bit aligned.
 *
 * Three CRC32 accumulators are maintained.  'hash1' starts from 'basis',
 * 'hash2' from zero and 'hash3' from 'n_words'; each group of six input
 * words feeds two consecutive words to each accumulator.  The accumulators
 * are combined by hash_finish32().
 *
 * The main loop is bounded by the number of words that remain rather than
 * by a precomputed "end minus six" pointer.  For inputs shorter than six
 * words such a pointer would lie before the start of the buffer, and merely
 * forming it is undefined behavior in C. */
static inline uint32_t
hash_words_32aligned(const uint32_t *p, size_t n_words, uint32_t basis)
{
    uint32_t hash1 = basis;
    uint32_t hash2 = 0;
    uint32_t hash3 = n_words;
    const uint32_t *endp = p + n_words;

    while (endp - p >= 6) {
        hash1 = _mm_crc32_u32(hash1, p[0]);
        hash1 = _mm_crc32_u32(hash1, p[1]);
        hash2 = _mm_crc32_u32(hash2, p[2]);
        hash2 = _mm_crc32_u32(hash2, p[3]);
        hash3 = _mm_crc32_u32(hash3, p[4]);
        hash3 = _mm_crc32_u32(hash3, p[5]);
        p += 6;
    }

    /* Between zero and five words remain.  They are distributed over the
     * accumulators in the same order as in the main loop. */
    switch (endp - p) {
    case 1:
        hash1 = _mm_crc32_u32(hash1, p[0]);
        break;
    case 2:
        hash1 = _mm_crc32_u32(hash1, p[0]);
        hash1 = _mm_crc32_u32(hash1, p[1]);
        break;
    case 3:
        hash1 = _mm_crc32_u32(hash1, p[0]);
        hash1 = _mm_crc32_u32(hash1, p[1]);
        hash2 = _mm_crc32_u32(hash2, p[2]);
        break;
    case 4:
        hash1 = _mm_crc32_u32(hash1, p[0]);
        hash1 = _mm_crc32_u32(hash1, p[1]);
        hash2 = _mm_crc32_u32(hash2, p[2]);
        hash2 = _mm_crc32_u32(hash2, p[3]);
        break;
    case 5:
        hash1 = _mm_crc32_u32(hash1, p[0]);
        hash1 = _mm_crc32_u32(hash1, p[1]);
        hash2 = _mm_crc32_u32(hash2, p[2]);
        hash2 = _mm_crc32_u32(hash2, p[3]);
        hash3 = _mm_crc32_u32(hash3, p[4]);
        break;
    default:
        /* Nothing left over. */
        break;
    }
    return hash_finish32(hash1, hash2, hash3);
}

/* Returns the hash of the 'n_words' 32-bit words at 'p_', starting from
 * 'basis'.  We access 'p_' as a uint64_t pointer, which is fine for
 * __SSE_4_2__.  Input that is not 64-bit aligned is handed to
 * hash_words_32aligned() instead.
 *
 * Three CRC32 accumulators are maintained.  'hash1' starts from 'basis',
 * 'hash2' from zero and 'hash3' from 'n_words'; each group of six 32-bit
 * words feeds one 64-bit word to each accumulator.  The accumulators are
 * combined by hash_finish().
 *
 * The main loop is bounded by the number of 32-bit words that remain rather
 * than by a precomputed "end minus three" pointer.  For inputs shorter than
 * six words such a pointer would lie before the start of the buffer, and
 * merely forming it is undefined behavior in C.
 *
 * This is inlined for the compiler to have access to the 'n_words', which
 * in many cases is a constant. */
static inline uint32_t
hash_words_inline(const uint32_t *p_, size_t n_words, uint32_t basis)
{
    const uint64_t *p = ALIGNED_CAST(const uint64_t *, p_);
    uint64_t hash1 = basis;
    uint64_t hash2 = 0;
    uint64_t hash3 = n_words;
    const uint32_t *endp = (const uint32_t *) p + n_words;

    if (OVS_UNLIKELY(((intptr_t) p & ((sizeof(uint64_t)) - 1)) != 0)) {
        return hash_words_32aligned(p_, n_words, basis);
    }

    /* At least six 32-bit words, that is three 64-bit words, remain. */
    while (endp - (const uint32_t *) p >= 6) {
        hash1 = _mm_crc32_u64(hash1, p[0]);
        hash2 = _mm_crc32_u64(hash2, p[1]);
        hash3 = _mm_crc32_u64(hash3, p[2]);
        p += 3;
    }

    /* Between zero and five 32-bit words remain.  Whole pairs are consumed
     * as 64-bit words; an odd trailing word is read as 32 bits. */
    switch (endp - (const uint32_t *) p) {
    case 1:
        hash1 = _mm_crc32_u32(hash1, *(const uint32_t *) &p[0]);
        break;
    case 2:
        hash1 = _mm_crc32_u64(hash1, p[0]);
        break;
    case 3:
        hash1 = _mm_crc32_u64(hash1, p[0]);
        hash2 = _mm_crc32_u32(hash2, *(const uint32_t *) &p[1]);
        break;
    case 4:
        hash1 = _mm_crc32_u64(hash1, p[0]);
        hash2 = _mm_crc32_u64(hash2, p[1]);
        break;
    case 5:
        hash1 = _mm_crc32_u64(hash1, p[0]);
        hash2 = _mm_crc32_u64(hash2, p[1]);
        hash3 = _mm_crc32_u32(hash3, *(const uint32_t *) &p[2]);
        break;
    default:
        /* Nothing left over. */
        break;
    }
    return hash_finish(hash1, hash2 << 32 | hash3);
}

/* A simpler version for 64-bit data.  Returns the hash of the 'n_words'
 * 64-bit words at 'p', starting from the 32-bit 'basis' (which is widened
 * to 64 bits to seed the first accumulator).
 *
 * Three CRC32 accumulators are maintained.  'hash1' starts from 'basis',
 * 'hash2' from zero and 'hash3' from 'n_words'; each group of three input
 * words feeds one word to each accumulator.  The accumulators are combined
 * by hash_finish().
 *
 * The main loop is bounded by the number of words that remain rather than
 * by a precomputed "end minus three" pointer.  For inputs shorter than
 * three words such a pointer would lie before the start of the buffer, and
 * merely forming it is undefined behavior in C. */
static inline uint32_t
hash_words64_inline(const uint64_t *p, size_t n_words, uint32_t basis)
{
    uint64_t hash1 = basis;
    uint64_t hash2 = 0;
    uint64_t hash3 = n_words;
    const uint64_t *endp = p + n_words;

    while (endp - p >= 3) {
        hash1 = _mm_crc32_u64(hash1, p[0]);
        hash2 = _mm_crc32_u64(hash2, p[1]);
        hash3 = _mm_crc32_u64(hash3, p[2]);
        p += 3;
    }

    /* Zero, one or two words remain. */
    switch (endp - p) {
    case 1:
        hash1 = _mm_crc32_u64(hash1, p[0]);
        break;
    case 2:
        hash1 = _mm_crc32_u64(hash1, p[0]);
        hash2 = _mm_crc32_u64(hash2, p[1]);
        break;
    default:
        /* Nothing left over. */
        break;
    }
    return hash_finish(hash1, hash2 << 32 | hash3);
}

/* Returns a hash of the 64-bit value 'x', starting from 'basis'. */
static inline uint32_t hash_uint64_basis(const uint64_t x,
                                         const uint32_t basis)
{
    const uint32_t mixed = hash_add64(basis, x);

    /* '23' chosen to mix bits enough for the test-hash to pass. */
    return hash_finish(mixed, 23);
}

/* Returns a hash of the 64-bit value 'x', using a basis of zero. */
static inline uint32_t hash_uint64(const uint64_t x)
{
    const uint32_t zero_basis = 0;

    return hash_uint64_basis(x, zero_basis);
}

/* Returns a hash of the two 32-bit words 'x' and 'y'.  They are packed into
 * one 64-bit value, 'y' in the upper half and 'x' in the lower half, which
 * is then hashed with hash_uint64(). */
static inline uint32_t hash_2words(uint32_t x, uint32_t y)
{
    const uint64_t packed = ((uint64_t) y << 32) | x;

    return hash_uint64(packed);
}

/* Returns a hash of the pointer value 'p', starting from 'basis'.  The
 * address is widened to 64 bits and hashed with hash_uint64_basis(). */
static inline uint32_t hash_pointer(const void *p, uint32_t basis)
{
    const uint64_t address = (uint64_t) (uintptr_t) p;

    return hash_uint64_basis(address, basis);
}
#endif

uint32_t hash_words__(const uint32_t *p, size_t n_words, uint32_t basis);
uint32_t hash_words64__(const uint64_t *p, size_t n_words, uint32_t basis);

/* Inline the larger hash functions only when 'n_words' is known to be
 * compile-time constant. */
#if __GNUC__ >= 4
/* Returns the hash of the 'n_words' 32-bit words at 'p', starting from
 * 'basis'.
 *
 * The inline implementation is used only when the compiler reports
 * 'n_words' as a compile-time constant; every other call goes to the
 * out-of-line hash_words__(). */
static inline uint32_t
hash_words(const uint32_t *p, size_t n_words, uint32_t basis)
{
    if (!__builtin_constant_p(n_words)) {
        return hash_words__(p, n_words, basis);
    }
    return hash_words_inline(p, n_words, basis);
}

/* Returns the hash of the 'n_words' 64-bit words at 'p', starting from
 * 'basis'.
 *
 * The inline implementation is used only when the compiler reports
 * 'n_words' as a compile-time constant; every other call goes to the
 * out-of-line hash_words64__(). */
static inline uint32_t
hash_words64(const uint64_t *p, size_t n_words, uint32_t basis)
{
    if (!__builtin_constant_p(n_words)) {
        return hash_words64__(p, n_words, basis);
    }
    return hash_words64_inline(p, n_words, basis);
}

#else

/* Returns the hash of the 'n_words' 32-bit words at 'p', starting from
 * 'basis'.  This variant always calls the out-of-line hash_words__(). */
static inline uint32_t
hash_words(const uint32_t *p, size_t n_words, uint32_t basis)
{
    const uint32_t hash = hash_words__(p, n_words, basis);

    return hash;
}

/* Returns the hash of the 'n_words' 64-bit words at 'p', starting from
 * 'basis'.  This variant always calls the out-of-line hash_words64__(). */
static inline uint32_t
hash_words64(const uint64_t *p, size_t n_words, uint32_t basis)
{
    const uint32_t hash = hash_words64__(p, n_words, basis);

    return hash;
}
#endif

/* Like hash_words(), but takes the input length in bytes.  'n_bytes' is
 * divided by 4 with integer division, so any bytes beyond the last whole
 * 32-bit word are not hashed. */
static inline uint32_t
hash_bytes32(const uint32_t *p, size_t n_bytes, uint32_t basis)
{
    const size_t n_words = n_bytes / 4;

    return hash_words(p, n_words, basis);
}

/* Like hash_words64(), but takes the input length in bytes.  'n_bytes' is
 * divided by 8 with integer division, so any bytes beyond the last whole
 * 64-bit word are not hashed. */
static inline uint32_t
hash_bytes64(const uint64_t *p, size_t n_bytes, uint32_t basis)
{
    const size_t n_words = n_bytes / 8;

    return hash_words64(p, n_words, basis);
}

/* Returns a hash of the null-terminated string 's', starting from 'basis'.
 * The strlen(s) bytes before the terminator are passed to hash_bytes(); the
 * terminator itself is not included. */
static inline uint32_t hash_string(const char *s, uint32_t basis)
{
    const size_t length = strlen(s);

    return hash_bytes(s, length, basis);
}

/* Returns a hash of the 32-bit value 'x', starting from 'basis'.  This is
 * hash_2words() applied to 'x' and 'basis', in that order. */
static inline uint32_t hash_int(uint32_t x, uint32_t basis)
{
    const uint32_t hash = hash_2words(x, basis);

    return hash;
}

/* An attempt at a useful 1-bit hash function.  Has not been analyzed for
 * quality.
 *
 * Picks one of two fixed constants according to 'x' and XORs it with
 * 'basis' rotated left by one bit. */
static inline uint32_t hash_boolean(bool x, uint32_t basis)
{
    /* Fixed constants, originally documented as hash_int(1, 0) for the true
     * case and hash_int(2, 0) for the false case. */
    const uint32_t when_true = 0xc2b73583;
    const uint32_t when_false = 0xe90f1258;
    uint32_t selected;

    if (x) {
        selected = when_true;
    } else {
        selected = when_false;
    }
    return selected ^ hash_rot(basis, 1);
}

/* Helper functions for calling hash_add() for several 32- or 64-bit words in a
 * buffer.  These are not hash functions by themselves, since they need
 * hash_finish() to be called, so if you are looking for a full hash function
 * see hash_words(), etc. */

/* Mixes the 'n_words' 32-bit words at 'p' into the running hash 'hash', in
 * order, using hash_add().  Returns the new running hash, which has not been
 * through hash_finish(). */
static inline uint32_t
hash_add_words(uint32_t hash, const uint32_t *p, size_t n_words)
{
    size_t remaining = n_words;

    while (remaining-- > 0) {
        hash = hash_add(hash, *p++);
    }
    return hash;
}

/* Mixes the 'n_words' 64-bit words at 'p' into the running hash 'hash', in
 * order, using hash_add64().  Returns the new running hash, which has not
 * been through hash_finish(). */
static inline uint32_t
hash_add_words64(uint32_t hash, const uint64_t *p, size_t n_words)
{
    size_t remaining = n_words;

    while (remaining-- > 0) {
        hash = hash_add64(hash, *p++);
    }
    return hash;
}

/* Like hash_add_words(), but takes the input length in bytes.  'n_bytes' is
 * divided by 4 with integer division, so any bytes beyond the last whole
 * 32-bit word are not mixed in. */
static inline uint32_t
hash_add_bytes32(uint32_t hash, const uint32_t *p, size_t n_bytes)
{
    const size_t n_words = n_bytes / 4;

    return hash_add_words(hash, p, n_words);
}

/* Like hash_add_words64(), but takes the input length in bytes.  'n_bytes'
 * is divided by 8 with integer division, so any bytes beyond the last whole
 * 64-bit word are not mixed in. */
static inline uint32_t
hash_add_bytes64(uint32_t hash, const uint64_t *p, size_t n_bytes)
{
    const size_t n_words = n_bytes / 8;

    return hash_add_words64(hash, p, n_words);
}

#ifdef __cplusplus
}
#endif

#endif /* hash.h */
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
+								/*
-												hash: New helper functions hash_bytes32() and hash_bytes64().

All of the callers of hash_words() and hash_words64() actually find it
easier to pass in the number of bytes instead of the number of 32-bit
or 64-bit words.  These new functions allow the callers to be a little
simpler.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Jarno Rajahalme <jarno@ovn.org>

											
										
										
											2016-01-18 22:52:48 -08:00
+								 * Copyright (c) 2008, 2009, 2010, 2012, 2013, 2014, 2016 Nicira, Inc.
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
+								 *
-												Update primary code license to Apache 2.0.

											
										
										
											2009-06-15 15:11:30 -07:00
+								 * Licensed under the Apache License, Version 2.0 (the "License");
 								 * you may not use this file except in compliance with the License.
 								 * You may obtain a copy of the License at:
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
+								 *
-												Update primary code license to Apache 2.0.

											
										
										
											2009-06-15 15:11:30 -07:00
+								 *     http://www.apache.org/licenses/LICENSE-2.0
 								 *
 								 * Unless required by applicable law or agreed to in writing, software
 								 * distributed under the License is distributed on an "AS IS" BASIS,
 								 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 								 * See the License for the specific language governing permissions and
 								 * limitations under the License.
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
+								 */
 								#ifndef HASH_H
 								#define HASH_H 1
-												hash: Implement hash function for Boolean values.

This will be used by the configuration database, and it's generally useful
to have around.

											
										
										
											2009-11-04 15:01:00 -08:00
+								#include <stdbool.h>
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
+								#include <stddef.h>
 								#include <stdint.h>
 								#include <string.h>
-												hash: Implement hash function for "double" values.

This will be used by the configuration database, which can store real
numbers.

											
										
										
											2009-10-14 17:03:55 -07:00
+								#include "util.h"
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
-												lib: Adapt headers for use in C++.

This commit makes several library headers suitable for inclusion in C++.

It adds [extern "C"] guards and makes minor changes to fix casting and
keyword issues.

											
										
										
											2011-08-04 16:18:59 -07:00
+								#ifdef __cplusplus
 								extern "C" {
 								#endif
-												hash: Convert macros to inline functions.

I always assumed that macros would generate better code.  I was wrong.  The
generated code was identical with inline functions, with GCC version 4.4.5.

Signed-off-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2012-01-18 11:29:57 -08:00
+								static inline uint32_t
 								hash_rot(uint32_t x, int k)
 								{
 								    return (x << k) | (x >> (32 - k));
 								}
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								uint32_t hash_bytes(const void *, size_t n_bytes, uint32_t basis);
-												test-hash: Remove the check_word_hash() for hash_bytes128_cb.

The original test fails on big-endian system due to the hash function
performing not as well when input is uint32_t.  In reality, users should
only use hash_bytes128() to hash words larger than 128 bits (e.g. struct
flow).  Besides, we do check the 1-bit set case for 16 128-bit words in
following test case.  Therefore, the cleanest way to fix the failure
in big-endian system seems to be just removing the check_word_hash()
test for hash_bytes128_cb.

Signed-off-by: Alex Wang <alexw@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2015-02-27 09:07:18 -08:00
+								/* The hash input must be a word larger than 128 bits. */
-												hash: Add 128-bit murmurhash.

Add the 128-bit murmurhash by Austin Appleby, r150 from:
http://code.google.com/p/smhasher/source/browse/trunk/MurmurHash3.cpp

Signed-off-by: Joe Stringer <joestringer@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-08-12 11:12:12 +12:00
+								void hash_bytes128(const void *_, size_t n_bytes, uint32_t basis,
 								                   ovs_u128 *out);
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
 								static inline uint32_t hash_int(uint32_t x, uint32_t basis);
 								static inline uint32_t hash_2words(uint32_t, uint32_t);
-												hash.h: Avoid compiler warnings with MSVC.

The lack of 'const' in function declaration causes MSVC to complain
because the function definition uses it.

Signed-off-by: Gurucharan Shetty <gshetty@nicira.com>
Acked-by: Alin Gabriel Serdean <aserdean@cloudbasesolutions.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-09-09 14:16:16 -07:00
+								static inline uint32_t hash_uint64(const uint64_t);
 								static inline uint32_t hash_uint64_basis(const uint64_t x,
 								                                         const uint32_t basis);
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								uint32_t hash_3words(uint32_t, uint32_t, uint32_t);
 								static inline uint32_t hash_boolean(bool x, uint32_t basis);
 								uint32_t hash_double(double, uint32_t basis);
 								static inline uint32_t hash_pointer(const void *, uint32_t basis);
 								static inline uint32_t hash_string(const char *, uint32_t basis);
 								/* Murmurhash by Austin Appleby,
-												hash: Update murmurhash repo link in comments

The MurmurHash code repo has moved from code.google to github. Update
the link to reflect this.

Signed-off-by: Cian Ferriter <cian.ferriter@intel.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2016-12-21 16:39:16 +00:00
+								 * from https://github.com/aappleby/smhasher/blob/master/src/MurmurHash3.cpp
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								 *
 								 * The upstream license there says:
 								 *
-												treewide: Get rid of // comments, even inside comments.

Just a style fix.

With this patch, the following reports no hits:

git ls-files | grep '\.[ch]$' | grep -vE 'datapath|sflow' \
    | xargs grep -n // | grep -vE "http|s/|'|\""

Acked-by: Ilya Maximets <i.maximets@samsung.com>
Reported-by: Ilya Maximets <i.maximets@samsung.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2019-01-23 12:09:46 -08:00
+								 *    MurmurHash3 was written by Austin Appleby, and is placed in the public
 								 *    domain. The author hereby disclaims copyright to this source code.
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								 *
 								 * See hash_words() for sample usage. */
 								static inline uint32_t mhash_add__(uint32_t hash, uint32_t data)
-												hash: Convert macros to inline functions.

I always assumed that macros would generate better code.  I was wrong.  The
generated code was identical with inline functions, with GCC version 4.4.5.

Signed-off-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2012-01-18 11:29:57 -08:00
+								{
-												hash: Skip Invoking mhash_add__() with zero input.

mhash_add__() is expensive and should be only called with valid input.
zero-valued 'data' will not affect the 'hash' value and expensive hash
computation can be skipped when input is zero.

This patch will validate the input in mhash_add__ to save some cpu
cycles.

Signed-off-by: Bhanuprakash Bodireddy <bhanuprakash.bodireddy@intel.com>
Co-authored-by: Antonio Fischetti <antonio.fischetti@intel.com>
Signed-off-by: Antonio Fischetti <antonio.fischetti@intel.com>
Acked-by: Daniele Di Proietto <diproiettod@vmware.com>

											
										
										
											2016-10-14 15:37:07 +01:00
+								    /* zero-valued 'data' will not change the 'hash' value */
 								    if (!data) {
 								        return hash;
 								    }
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								    data *= 0xcc9e2d51;
 								    data = hash_rot(data, 15);
 								    data *= 0x1b873593;
 								    return hash ^ data;
-												hash: Convert macros to inline functions.

I always assumed that macros would generate better code.  I was wrong.  The
generated code was identical with inline functions, with GCC version 4.4.5.

Signed-off-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2012-01-18 11:29:57 -08:00
+								}
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								static inline uint32_t mhash_add(uint32_t hash, uint32_t data)
-												hash: Convert macros to inline functions.

I always assumed that macros would generate better code.  I was wrong.  The
generated code was identical with inline functions, with GCC version 4.4.5.

Signed-off-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2012-01-18 11:29:57 -08:00
+								{
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								    hash = mhash_add__(hash, data);
 								    hash = hash_rot(hash, 13);
 								    return hash * 5 + 0xe6546b64;
-												hash: Convert macros to inline functions.

I always assumed that macros would generate better code.  I was wrong.  The
generated code was identical with inline functions, with GCC version 4.4.5.

Signed-off-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2012-01-18 11:29:57 -08:00
+								}
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
-												hash: Add 128-bit murmurhash.

Add the 128-bit murmurhash by Austin Appleby, r150 from:
http://code.google.com/p/smhasher/source/browse/trunk/MurmurHash3.cpp

Signed-off-by: Joe Stringer <joestringer@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-08-12 11:12:12 +12:00
+								static inline uint32_t mhash_finish(uint32_t hash)
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								{
 								    hash ^= hash >> 16;
 								    hash *= 0x85ebca6b;
 								    hash ^= hash >> 13;
 								    hash *= 0xc2b2ae35;
 								    hash ^= hash >> 16;
 								    return hash;
 								}
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
-												hash: New helper functions for adding words in a buffer to a hash.

These will receive their first user (outside of hash.h) in the following
commit.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Darrell Ball <dlu998@gmail.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2017-06-09 15:30:42 -07:00
+								static inline uint32_t hash_add(uint32_t hash, uint32_t data);
 								static inline uint32_t hash_add64(uint32_t hash, uint64_t data);
 								static inline uint32_t hash_add_words(uint32_t, const uint32_t *, size_t);
 								static inline uint32_t hash_add_words64(uint32_t, const uint64_t *, size_t);
 								static inline uint32_t hash_add_bytes32(uint32_t, const uint32_t *, size_t);
 								static inline uint32_t hash_add_bytes64(uint32_t, const uint64_t *, size_t);
-												hash: Implement hash for aarch64 using CRC32c intrinsics.

This commit adds lib/hash-aarch64.h to implement hash for aarch64.
It is based on aarch64 built-in CRC32c intrinsics, which accelerates
hash function for datapath performance.

test:
1. "test-hash" case passed in aarch64 platform.
2.  OVS-DPDK datapath performance test was run (NIC to NIC).
    Test bed: aarch64 (Centriq 2400) platform.
    Test case: DPCLS forwarding (disable EMC + avg 10 subtable lookups)
    Test result: improved by around 10%.

Signed-off-by: Yanqin Wei <yanqin.wei@arm.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2019-01-25 11:28:01 +00:00
+								#if (defined(__ARM_FEATURE_CRC32) && defined(__aarch64__))
 								#include "hash-aarch64.h"
 								#elif !(defined(__SSE4_2__) && defined(__x86_64__))
-												hash: Add 128-bit murmurhash.

Add the 128-bit murmurhash by Austin Appleby, r150 from:
http://code.google.com/p/smhasher/source/browse/trunk/MurmurHash3.cpp

Signed-off-by: Joe Stringer <joestringer@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-08-12 11:12:12 +12:00
+								/* Mhash-based implementation. */
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
-												lib/hash: Abstract hash interface.

Use generic names hash_add() and hash_finish() instead of mhash_*
equivalents.  This makes future changes to hash implementations more
localized.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-04 07:57:18 -07:00
+								static inline uint32_t hash_add(uint32_t hash, uint32_t data)
 								{
 								    /* Generic name for the murmurhash mixing step: folds the 32-bit word
 								     * 'data' into the running value 'hash' and returns the new value. */
 								    return mhash_add(hash, data);
 								}
-												hash: Add hash_add64().

Add support for adding 64-bit words to hashes.  This will be used by
subsequent patches.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>
											
										
										
											2015-01-06 11:10:42 -08:00
+								static inline uint32_t hash_add64(uint32_t hash, uint64_t data)
 								{
 								    /* Folds in the low 32 bits of 'data' first (the inner call implicitly
 								     * truncates 'data' to uint32_t), then the high 32 bits. */
 								    return hash_add(hash_add(hash, data), data >> 32);
 								}
-												lib/hash: Abstract hash interface.

Use generic names hash_add() and hash_finish() instead of mhash_*
equivalents.  This makes future changes to hash implementations more
localized.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-04 07:57:18 -07:00
+								static inline uint32_t hash_finish(uint32_t hash, uint32_t final)
 								{
-												hash: Add 128-bit murmurhash.

Add the 128-bit murmurhash by Austin Appleby, r150 from:
http://code.google.com/p/smhasher/source/browse/trunk/MurmurHash3.cpp

Signed-off-by: Joe Stringer <joestringer@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-08-12 11:12:12 +12:00
+								    return mhash_finish(hash ^ final);
-												lib/hash: Abstract hash interface.

Use generic names hash_add() and hash_finish() instead of mhash_*
equivalents.  This makes future changes to hash implementations more
localized.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-04 07:57:18 -07:00
+								}
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								/* Returns the hash of the 'n_words' 32-bit words at 'p', starting from
 								 * 'basis'.  'p' must be properly aligned.
 								 *
 								 * This is inlined for the compiler to have access to the 'n_words', which
 								 * in many cases is a constant. */
 								static inline uint32_t
-												hash: New helper functions for adding words in a buffer to a hash.

These will receive their first user (outside of hash.h) in the following
commit.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Darrell Ball <dlu998@gmail.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2017-06-09 15:30:42 -07:00
+								hash_words_inline(const uint32_t *p, size_t n_words, uint32_t basis)
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
+								{
-												hash: New helper functions for adding words in a buffer to a hash.

These will receive their first user (outside of hash.h) in the following
commit.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Darrell Ball <dlu998@gmail.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2017-06-09 15:30:42 -07:00
+								    return hash_finish(hash_add_words(basis, p, n_words), n_words * 4);
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
+								}
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								static inline uint32_t
-												hash: New helper functions for adding words in a buffer to a hash.

These will receive their first user (outside of hash.h) in the following
commit.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Darrell Ball <dlu998@gmail.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2017-06-09 15:30:42 -07:00
+								hash_words64_inline(const uint64_t *p, size_t n_words, uint32_t basis)
-												hash: Implement hash function for Boolean values.

This will be used by the configuration database, and it's generally useful
to have around.

											
										
										
											2009-11-04 15:01:00 -08:00
+								{
-												hash: New helper functions for adding words in a buffer to a hash.

These will receive their first user (outside of hash.h) in the following
commit.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Darrell Ball <dlu998@gmail.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2017-06-09 15:30:42 -07:00
+								    return hash_finish(hash_add_words64(basis, p, n_words), n_words * 8);
-												hash: Implement hash function for Boolean values.

This will be used by the configuration database, and it's generally useful
to have around.

											
										
										
											2009-11-04 15:01:00 -08:00
+								}
-												hash: Implement hash function for pointer values.

This will be used by an upcoming commit, and it's generally useful to
have around.

											
										
										
											2009-11-04 15:00:28 -08:00
+								static inline uint32_t hash_pointer(const void *p, uint32_t basis)
 								{
 								    /* Returns a hash of the pointer value 'p' itself (the pointed-to data
 								     * is never read), starting from 'basis'.
 								     *
 								     * Often pointers are hashed simply by casting to integer type, but that
 								     * has pitfalls since the lower bits of a pointer are often all 0 for
 								     * alignment reasons.  It's hard to guess where the entropy really is, so
 								     * we give up here and just use a high-quality hash function.
 								     *
 								     * The double cast suppresses a warning on 64-bit systems about casting a
 								     * pointer to an integer of different size.  That's OK in this case, since
 								     * most of the entropy in the pointer is almost certainly in the lower 32
 								     * bits. */
 								    return hash_int((uint32_t) (uintptr_t) p, basis);
 								}
-												hash: Replace primary hash functions by murmurhash.

murmurhash is faster than Jenkins and slightly higher quality, so switch to
it for hashing words.

The best timings I got for hashing for data lengths of the following
numbers of 32-bit words, in seconds per 1,000,000,000 hashes, were:

words     murmurhash      Jenkins hash
-----     ----------      ------------
   1           8.4              10.4
   2          10.3              10.3
   3          11.2              10.7
   4          12.6              18.0
   5          13.9              18.3
   6          15.2              18.7

In other words, murmurhash outperforms Jenkins for all input lengths other
than exactly 3 32-bit words (12 bytes).  (It's understandable that Jenkins
would have a best case at 12 bytes, because Jenkins works in 12-byte
chunks.)  Even in the case where Jenkins is faster, it's only by 5%.  On
average within this data set, murmurhash is 15% faster, and for 4-word
input it is 30% faster.

We retain Jenkins for flow_hash_symmetric_l4() and flow_hash_fields(),
which are cases where the hash value is exposed externally.

This commit appears to improve "ovs-benchmark rate" results slightly by
a few hundred connections per second (under 1%), when used with an NVP
controller.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2013-01-16 16:14:42 -08:00
+								static inline uint32_t hash_2words(uint32_t x, uint32_t y)
-												hash: Introduce an implementation of murmurhash.

Murmurhash is generally superior to the Jenkins lookup3 hash according to
the available figures.  Perhaps we should generally replace our current
hashes by murmurhash.

For now, I'm introducing a parallel implementation to allow it to be used
in cases where an incremental one-word-at-a-time hash is desirable.  The
first user will be added in an upcoming commit.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2012-08-21 14:26:23 -07:00
+								{
-												lib/hash: Abstract hash interface.

Use generic names hash_add() and hash_finish() instead of mhash_*
equivalents.  This makes future changes to hash implementations more
localized.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-04 07:57:18 -07:00
+								    return hash_finish(hash_add(hash_add(x, 0), y), 8);
-												hash: Introduce an implementation of murmurhash.

Murmurhash is generally superior to the Jenkins lookup3 hash according to
the available figures.  Perhaps we should generally replace our current
hashes by murmurhash.

For now, I'm introducing a parallel implementation to allow it to be used
in cases where an incremental one-word-at-a-time hash is desirable.  The
first user will be added in an upcoming commit.

Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Ethan Jackson <ethan@nicira.com>

											
										
										
											2012-08-21 14:26:23 -07:00
+								}
-												hash: Add hash_add64().

Add support for adding 64-bit words to hashes.  This will be used by
subsequent patches.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>
											
										
										
											2015-01-06 11:10:42 -08:00
+								static inline uint32_t hash_uint64_basis(const uint64_t x,
 								                                         const uint32_t basis)
-												lib/hash.h: add hash_uint64()

Add hash_uint64() and apply it when appropriate.

Signed-off-by: Andy Zhou <azhou@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-03-27 19:38:04 -07:00
+								{
-												hash: Add hash_add64().

Add support for adding 64-bit words to hashes.  This will be used by
subsequent patches.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>
											
										
										
											2015-01-06 11:10:42 -08:00
+								    return hash_finish(hash_add64(basis, x), 8);
-												lib/hash.h: add hash_uint64()

Add hash_uint64() and apply it when appropriate.

Signed-off-by: Andy Zhou <azhou@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-03-27 19:38:04 -07:00
+								}
-												hash: Add hash_add64().

Add support for adding 64-bit words to hashes.  This will be used by
subsequent patches.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>
											
										
										
											2015-01-06 11:10:42 -08:00
+								static inline uint32_t hash_uint64(const uint64_t x)
-												lib/packet.h: add hash_mac()

Add hash_mac() and apply it when appropriate.

Signed-off-by: Andy Zhou <azhou@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-03-27 20:22:37 -07:00
+								{
-												hash: Add hash_add64().

Add support for adding 64-bit words to hashes.  This will be used by
subsequent patches.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>
											
										
										
											2015-01-06 11:10:42 -08:00
+								    return hash_uint64_basis(x, 0);
-												lib/packet.h: add hash_mac()

Add hash_mac() and apply it when appropriate.

Signed-off-by: Andy Zhou <azhou@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-03-27 20:22:37 -07:00
+								}
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
 								#else /* __SSE4_2__ && __x86_64__ */
 								#include <smmintrin.h>
 								static inline uint32_t hash_add(uint32_t hash, uint32_t data)
 								{
 								    /* Folds the 32-bit word 'data' into the running value 'hash' using the
 								     * 32-bit CRC32 intrinsic and returns the new value. */
 								    return _mm_crc32_u32(hash, data);
 								}
-												hash: Add hash_add64().

Add support for adding 64-bit words to hashes.  This will be used by
subsequent patches.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>
											
										
										
											2015-01-06 11:10:42 -08:00
+								/* Folds all 64 bits of 'data' into 'hash' with a single 64-bit CRC32
 								 * intrinsic, which adds the halves of 'data' in the memory order. */
 								static inline uint32_t hash_add64(uint32_t hash, uint64_t data)
 								{
 								    /* The intrinsic's result is narrowed to the uint32_t return type. */
 								    return _mm_crc32_u64(hash, data);
 								}
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								static inline uint32_t hash_finish(uint64_t hash, uint64_t final)
 								{
 								    /* Folds the last value 'final' into 'hash' and scrambles the result
 								     * into the 32-bit hash that is returned.
 								     *
 								     * The finishing multiplier 0x805204f3 has been experimentally
 								     * derived to pass the testsuite hash tests. */
 								    hash = _mm_crc32_u64(hash, final) * 0x805204f3;
 								    /* The cast binds tighter than '>>', which binds tighter than '^', so
 								     * this computes hash ^ (((uint32_t) hash) >> 16); the 64-bit result is
 								     * then truncated to the uint32_t return type. */
 								    return hash ^ (uint32_t)hash >> 16; /* Increase entropy in LSBs. */
 								}
-												hash: Avoid 64bit crc intrinsics on 32bit aligned data.

UB Sanitizer report:

lib/hash.h:219:17: runtime error: load of misaligned address
0x7ffc164a88b4 for type 'const uint64_t', which requires 8 byte
alignment

    #0 in hash_words_inline lib/hash.h:219
    #1 in hash_words lib/hash.h:297
    [...]

Signed-off-by: Mike Pattrick <mkp@redhat.com>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2023-01-30 17:04:17 -05:00
+								static inline uint32_t
 								hash_finish32(uint64_t hash, uint32_t final, uint32_t semifinal)
 								{
 								    /* The finishing multiplier 0x805204f3 has been experimentally
 								     * derived to pass the testsuite hash tests. */
 								    hash = _mm_crc32_u32(hash, semifinal);
-												hash: Fix integer overflow before widen in hash_finish32().

Fix unintentional integer overflow reported by Coverity by adding
the ULL suffix to the numerical literals used in the multiplication.

Fixes: e85e8a7541cb ("hash: Avoid 64bit crc intrinsics on 32bit aligned data.")
Signed-off-by: Eelco Chaudron <echaudro@redhat.com>
Acked-by: Aaron Conole <aconole@redhat.com>

											
										
										
											2024-08-28 15:28:38 +02:00
+								    hash = _mm_crc32_u32(hash, final) * 0x805204f3ULL;
-												hash: Avoid 64bit crc intrinsics on 32bit aligned data.

UB Sanitizer report:

lib/hash.h:219:17: runtime error: load of misaligned address
0x7ffc164a88b4 for type 'const uint64_t', which requires 8 byte
alignment

    #0 in hash_words_inline lib/hash.h:219
    #1 in hash_words lib/hash.h:297
    [...]

Signed-off-by: Mike Pattrick <mkp@redhat.com>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2023-01-30 17:04:17 -05:00
+								    return hash ^ ((uint32_t) hash >> 16); /* Increase entropy in LSBs. */
 								}
 								static inline uint32_t
-												hash: Add explicit typecasts to fix C++ compilation issues.

C++ does not allow implicit conversion from void pointer to a specific
pointer type. This change removes the cast from uint32_t* to void* in
`hash_words_32aligned` and adds an explicit typecast from uint32_t* to
uint64_t* in `hash_words_inline`.

This issue was initially discovered on G++ v9.2.0 when a downstream C++
application included the hash.h header file and was compiled on an AMD
Ryzen Zen 2 CPU (__SSE4_2__ && __x86_64__). On the latest G++ version,
it would throw an error. On the latest GCC version with `-Wc++-compat`,
it would throw a warning.

Acked-by: Mike Pattrick <mkp@redhat.com>
Signed-off-by: James Raphael Tiovalen <jamestiotio@gmail.com>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2023-09-16 15:28:54 +08:00
+								hash_words_32aligned(const uint32_t *p, size_t n_words, uint32_t basis)
-												hash: Avoid 64bit crc intrinsics on 32bit aligned data.

UB Sanitizer report:

lib/hash.h:219:17: runtime error: load of misaligned address
0x7ffc164a88b4 for type 'const uint64_t', which requires 8 byte
alignment

    #0 in hash_words_inline lib/hash.h:219
    #1 in hash_words lib/hash.h:297
    [...]

Signed-off-by: Mike Pattrick <mkp@redhat.com>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2023-01-30 17:04:17 -05:00
+								{
 								    uint32_t hash1 = basis;
 								    uint32_t hash2 = 0;
 								    uint32_t hash3 = n_words;
 								    const uint32_t *endp = (const uint32_t *) p + n_words;
 								    const uint32_t *limit = p + n_words - 6;
 								    while (p <= limit) {
 								        hash1 = _mm_crc32_u32(hash1, p[0]);
 								        hash1 = _mm_crc32_u32(hash1, p[1]);
 								        hash2 = _mm_crc32_u32(hash2, p[2]);
 								        hash2 = _mm_crc32_u32(hash2, p[3]);
 								        hash3 = _mm_crc32_u32(hash3, p[4]);
 								        hash3 = _mm_crc32_u32(hash3, p[5]);
 								        p += 6;
 								    }
 								    switch (endp - (const uint32_t *) p) {
 								    case 1:
 								        hash1 = _mm_crc32_u32(hash1, p[0]);
 								        break;
 								    case 2:
 								        hash1 = _mm_crc32_u32(hash1, p[0]);
 								        hash1 = _mm_crc32_u32(hash1, p[1]);
 								        break;
 								    case 3:
 								        hash1 = _mm_crc32_u32(hash1, p[0]);
 								        hash1 = _mm_crc32_u32(hash1, p[1]);
 								        hash2 = _mm_crc32_u32(hash2, p[2]);
 								        break;
 								    case 4:
 								        hash1 = _mm_crc32_u32(hash1, p[0]);
 								        hash1 = _mm_crc32_u32(hash1, p[1]);
 								        hash2 = _mm_crc32_u32(hash2, p[2]);
 								        hash2 = _mm_crc32_u32(hash2, p[3]);
 								        break;
 								    case 5:
 								        hash1 = _mm_crc32_u32(hash1, p[0]);
 								        hash1 = _mm_crc32_u32(hash1, p[1]);
 								        hash2 = _mm_crc32_u32(hash2, p[2]);
 								        hash2 = _mm_crc32_u32(hash2, p[3]);
 								        hash3 = _mm_crc32_u32(hash3, p[4]);
 								        break;
 								    }
 								    return hash_finish32(hash1, hash2, hash3);
 								}
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								/* Returns the hash of the 'n_words' 32-bit words at 'p_', starting from
 								 * 'basis'.  We access 'p_' as a uint64_t pointer, which is fine for
 								 * __SSE4_2__ as long as 'p_' is 8-byte aligned; otherwise
 								 * hash_words_32aligned() is used instead.
 								 *
 								 * This is inlined for the compiler to have access to the 'n_words', which
 								 * in many cases is a constant. */
 								static inline uint32_t
-												hash: Avoid 64bit crc intrinsics on 32bit aligned data.

UB Sanitizer report:

lib/hash.h:219:17: runtime error: load of misaligned address
0x7ffc164a88b4 for type 'const uint64_t', which requires 8 byte
alignment

    #0 in hash_words_inline lib/hash.h:219
    #1 in hash_words lib/hash.h:297
    [...]

Signed-off-by: Mike Pattrick <mkp@redhat.com>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2023-01-30 17:04:17 -05:00
+								hash_words_inline(const uint32_t *p_, size_t n_words, uint32_t basis)
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								{
-												hash: Add explicit typecasts to fix C++ compilation issues.

C++ does not allow implicit conversion from void pointer to a specific
pointer type. This change removes the cast from uint32_t* to void* in
`hash_words_32aligned` and adds an explicit typecast from uint32_t* to
uint64_t* in `hash_words_inline`.

This issue was initially discovered on G++ v9.2.0 when a downstream C++
application included the hash.h header file and was compiled on an AMD
Ryzen Zen 2 CPU (__SSE4_2__ && __x86_64__). On the latest G++ version,
it would throw an error. On the latest GCC version with `-Wc++-compat`,
it would throw a warning.

Acked-by: Mike Pattrick <mkp@redhat.com>
Signed-off-by: James Raphael Tiovalen <jamestiotio@gmail.com>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2023-09-16 15:28:54 +08:00
+								    const uint64_t *p = ALIGNED_CAST(const uint64_t *, p_);
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								    uint64_t hash1 = basis;
 								    uint64_t hash2 = 0;
 								    uint64_t hash3 = n_words;
 								    const uint32_t *endp = (const uint32_t *)p + n_words;
 								    const uint64_t *limit = p + n_words / 2 - 3;
-												hash: Avoid 64bit crc intrinsics on 32bit aligned data.

UB Sanitizer report:

lib/hash.h:219:17: runtime error: load of misaligned address
0x7ffc164a88b4 for type 'const uint64_t', which requires 8 byte
alignment

    #0 in hash_words_inline lib/hash.h:219
    #1 in hash_words lib/hash.h:297
    [...]

Signed-off-by: Mike Pattrick <mkp@redhat.com>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2023-01-30 17:04:17 -05:00
+								    if (OVS_UNLIKELY(((intptr_t) p & ((sizeof(uint64_t)) - 1)) != 0)) {
 								        return hash_words_32aligned(p_, n_words, basis);
 								    }
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								    while (p <= limit) {
 								        hash1 = _mm_crc32_u64(hash1, p[0]);
 								        hash2 = _mm_crc32_u64(hash2, p[1]);
 								        hash3 = _mm_crc32_u64(hash3, p[2]);
 								        p += 3;
 								    }
 								    switch (endp - (const uint32_t *)p) {
 								    case 1:
 								        hash1 = _mm_crc32_u32(hash1, *(const uint32_t *)&p[0]);
 								        break;
 								    case 2:
 								        hash1 = _mm_crc32_u64(hash1, p[0]);
 								        break;
 								    case 3:
 								        hash1 = _mm_crc32_u64(hash1, p[0]);
 								        hash2 = _mm_crc32_u32(hash2, *(const uint32_t *)&p[1]);
 								        break;
 								    case 4:
 								        hash1 = _mm_crc32_u64(hash1, p[0]);
 								        hash2 = _mm_crc32_u64(hash2, p[1]);
 								        break;
 								    case 5:
 								        hash1 = _mm_crc32_u64(hash1, p[0]);
 								        hash2 = _mm_crc32_u64(hash2, p[1]);
 								        hash3 = _mm_crc32_u32(hash3, *(const uint32_t *)&p[2]);
 								        break;
 								    }
 								    return hash_finish(hash1, hash2 << 32 | hash3);
 								}
 								/* A simpler version for 64-bit data.
 								 * 'n_words' is the count of 64-bit words, basis is 64 bits. */
 								static inline uint32_t
-												hash: Fix compilation error on Fedora 34 with GCC 11 and -O0.

With the newest version of GCC, OVS fails to compile with -O0 due to
false-positive overread detection in hash-related functions.  Those
functions declare "const uint32_t p[]" as an argument, which throws off
the compiler into thinking that they read from a memory region of size 0.

To fix that behavior, a change in argument declaration needs to be made:
instead of using "[]" notation for a pointer, simply use "*".

The reported error in question:

lib/conntrack.c: In function ‘conn_key_hash’:
lib/conntrack.c:2154:12: error: ‘hash_words’ reading 4 bytes \
                   from a region of size 0 [-Werror=stringop-overread]
 2154| return hash_words((uint32_t *) (&key->dst + 1),
     |        ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2155|                   (uint32_t *) (key + 1) - (uint32_t *) (&key->dst + 1),
     |                   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2156|                   hash);
     |                   ~~~~~
lib/conntrack.c:2154:12: note: referencing argument 1 \
        of type ‘const uint32_t *’ {aka ‘const unsigned int *’}
In file included from lib/packets.h:31,
                 from lib/ct-dpif.h:21,
                 from lib/conntrack.h:23,
                 from lib/conntrack.c:26:
lib/hash.h:294:1: note: in a call to function ‘hash_words’
  294 | hash_words(const uint32_t p[], size_t n_words, uint32_t basis)
      | ^~~~~~~~~~

Signed-off-by: Guzowski Adrian <adrian.guzowski@exatel.pl>
Tested-by: Numan Siddique <numans@ovn.org>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2021-07-28 12:03:29 +00:00
+								hash_words64_inline(const uint64_t *p, size_t n_words, uint32_t basis)
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								{
-												hash: Make basis of hash_words64() 32 bits.

The basis of hash_words64() was 64 bits, even when the hash value is
32 bits, thus confusing the domain and the range of the function.
This patch fixes this by making the basis an uint32_t.

Suggested-by: Ben Pfaff <blp@nicira.com>
Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
											
										
										
											2015-01-06 13:48:54 -08:00
+								    uint64_t hash1 = basis;
 								    uint64_t hash2 = 0;
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								    uint64_t hash3 = n_words;
 								    const uint64_t *endp = p + n_words;
 								    const uint64_t *limit = endp - 3;
 								    while (p <= limit) {
 								        hash1 = _mm_crc32_u64(hash1, p[0]);
 								        hash2 = _mm_crc32_u64(hash2, p[1]);
 								        hash3 = _mm_crc32_u64(hash3, p[2]);
 								        p += 3;
 								    }
 								    switch (endp - p) {
 								    case 1:
 								        hash1 = _mm_crc32_u64(hash1, p[0]);
 								        break;
 								    case 2:
 								        hash1 = _mm_crc32_u64(hash1, p[0]);
 								        hash2 = _mm_crc32_u64(hash2, p[1]);
 								        break;
 								    }
 								    return hash_finish(hash1, hash2 << 32 | hash3);
 								}
 								static inline uint32_t hash_uint64_basis(const uint64_t x,
 								                                         const uint32_t basis)
 								{
 								    /* '23' chosen to mix bits enough for the test-hash to pass. */
-												hash: Add hash_add64().

Add support for adding 64-bit words to hashes.  This will be used by
subsequent patches.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>
											
										
										
											2015-01-06 11:10:42 -08:00
+								    return hash_finish(hash_add64(basis, x), 23);
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								}
 								/* Returns a hash of the 64-bit value 'x', using 0 as the basis. */
 								static inline uint32_t
 								hash_uint64(const uint64_t x)
 								{
 								    const uint32_t zero_basis = 0;
 								    return hash_uint64_basis(x, zero_basis);
 								}
 								/* Returns a hash of the two 32-bit words 'x' and 'y'.  The words are packed
 								 * into one 64-bit value, 'y' in the upper half and 'x' in the lower half,
 								 * which is then passed to hash_uint64(). */
 								static inline uint32_t
 								hash_2words(uint32_t x, uint32_t y)
 								{
 								    const uint64_t upper = (uint64_t) y << 32;
 								    const uint64_t packed = upper | x;
 								    return hash_uint64(packed);
 								}
 								/* Returns a hash of the address held in 'p', using 'basis' as the basis.
 								 * Only the pointer value itself is hashed; the memory it points to is never
 								 * read. */
 								static inline uint32_t
 								hash_pointer(const void *p, uint32_t basis)
 								{
 								    const uintptr_t address = (uintptr_t) p;
 								    const uint64_t widened = (uint64_t) address;
 								    return hash_uint64_basis(widened, basis);
 								}
 								#endif
-												hash: Fix compilation error on Fedora 34 with GCC 11 and -O0.

With newest version of GCC, OVS fails to compile with -O0 due to
false-positive overread detection in hash-related functions.  Those
function declares "const uint32_t p[]" as argument and it throws off
the compiler into thinking that it reads from memory region of size 0.

To fix that behavior, a change in argument declaration needs to be made:
instead of using "[]" notation for a pointer, simply use "*".

The reported error in question:

lib/conntrack.c: In function ‘conn_key_hash’:
lib/conntrack.c:2154:12: error: ‘hash_words’ reading 4 bytes \
                   from a region of size 0 [-Werror=stringop-overread]
 2154| return hash_words((uint32_t *) (&key->dst + 1),
     |        ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2155|                   (uint32_t *) (key + 1) - (uint32_t *) (&key->dst + 1),
     |                   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2156|                   hash);
     |                   ~~~~~
lib/conntrack.c:2154:12: note: referencing argument 1 \
        of type ‘const uint32_t *’ {aka ‘const unsigned int *’}
In file included from lib/packets.h:31,
                 from lib/ct-dpif.h:21,
                 from lib/conntrack.h:23,
                 from lib/conntrack.c:26:
lib/hash.h:294:1: note: in a call to function ‘hash_words’
  294 | hash_words(const uint32_t p[], size_t n_words, uint32_t basis)
      | ^~~~~~~~~~

Signed-off-by: Guzowski Adrian <adrian.guzowski@exatel.pl>
Tested-by: Numan Siddique <numans@ovn.org>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2021-07-28 12:03:29 +00:00
+								uint32_t hash_words__(const uint32_t *p, size_t n_words, uint32_t basis);
 								uint32_t hash_words64__(const uint64_t *p, size_t n_words, uint32_t basis);
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
 								/* Inline the larger hash functions only when 'n_words' is known to be a
 								 * compile-time constant. */
 								#if __GNUC__ >= 4
 								static inline uint32_t
-												hash: Fix compilation error on Fedora 34 with GCC 11 and -O0.

With newest version of GCC, OVS fails to compile with -O0 due to
false-positive overread detection in hash-related functions.  Those
function declares "const uint32_t p[]" as argument and it throws off
the compiler into thinking that it reads from memory region of size 0.

To fix that behavior, a change in argument declaration needs to be made:
instead of using "[]" notation for a pointer, simply use "*".

The reported error in question:

lib/conntrack.c: In function ‘conn_key_hash’:
lib/conntrack.c:2154:12: error: ‘hash_words’ reading 4 bytes \
                   from a region of size 0 [-Werror=stringop-overread]
 2154| return hash_words((uint32_t *) (&key->dst + 1),
     |        ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2155|                   (uint32_t *) (key + 1) - (uint32_t *) (&key->dst + 1),
     |                   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2156|                   hash);
     |                   ~~~~~
lib/conntrack.c:2154:12: note: referencing argument 1 \
        of type ‘const uint32_t *’ {aka ‘const unsigned int *’}
In file included from lib/packets.h:31,
                 from lib/ct-dpif.h:21,
                 from lib/conntrack.h:23,
                 from lib/conntrack.c:26:
lib/hash.h:294:1: note: in a call to function ‘hash_words’
  294 | hash_words(const uint32_t p[], size_t n_words, uint32_t basis)
      | ^~~~~~~~~~

Signed-off-by: Guzowski Adrian <adrian.guzowski@exatel.pl>
Tested-by: Numan Siddique <numans@ovn.org>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2021-07-28 12:03:29 +00:00
+								hash_words(const uint32_t *p, size_t n_words, uint32_t basis)
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								{
 								    if (__builtin_constant_p(n_words)) {
 								        return hash_words_inline(p, n_words, basis);
 								    } else {
 								        return hash_words__(p, n_words, basis);
 								    }
 								}
 								static inline uint32_t
-												hash: Fix compilation error on Fedora 34 with GCC 11 and -O0.

With newest version of GCC, OVS fails to compile with -O0 due to
false-positive overread detection in hash-related functions.  Those
function declares "const uint32_t p[]" as argument and it throws off
the compiler into thinking that it reads from memory region of size 0.

To fix that behavior, a change in argument declaration needs to be made:
instead of using "[]" notation for a pointer, simply use "*".

The reported error in question:

lib/conntrack.c: In function ‘conn_key_hash’:
lib/conntrack.c:2154:12: error: ‘hash_words’ reading 4 bytes \
                   from a region of size 0 [-Werror=stringop-overread]
 2154| return hash_words((uint32_t *) (&key->dst + 1),
     |        ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2155|                   (uint32_t *) (key + 1) - (uint32_t *) (&key->dst + 1),
     |                   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2156|                   hash);
     |                   ~~~~~
lib/conntrack.c:2154:12: note: referencing argument 1 \
        of type ‘const uint32_t *’ {aka ‘const unsigned int *’}
In file included from lib/packets.h:31,
                 from lib/ct-dpif.h:21,
                 from lib/conntrack.h:23,
                 from lib/conntrack.c:26:
lib/hash.h:294:1: note: in a call to function ‘hash_words’
  294 | hash_words(const uint32_t p[], size_t n_words, uint32_t basis)
      | ^~~~~~~~~~

Signed-off-by: Guzowski Adrian <adrian.guzowski@exatel.pl>
Tested-by: Numan Siddique <numans@ovn.org>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2021-07-28 12:03:29 +00:00
+								hash_words64(const uint64_t *p, size_t n_words, uint32_t basis)
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								{
 								    if (__builtin_constant_p(n_words)) {
 								        return hash_words64_inline(p, n_words, basis);
 								    } else {
 								        return hash_words64__(p, n_words, basis);
 								    }
 								}
 								#else
 								static inline uint32_t
-												hash: Fix compilation error on Fedora 34 with GCC 11 and -O0.

With newest version of GCC, OVS fails to compile with -O0 due to
false-positive overread detection in hash-related functions.  Those
function declares "const uint32_t p[]" as argument and it throws off
the compiler into thinking that it reads from memory region of size 0.

To fix that behavior, a change in argument declaration needs to be made:
instead of using "[]" notation for a pointer, simply use "*".

The reported error in question:

lib/conntrack.c: In function ‘conn_key_hash’:
lib/conntrack.c:2154:12: error: ‘hash_words’ reading 4 bytes \
                   from a region of size 0 [-Werror=stringop-overread]
 2154| return hash_words((uint32_t *) (&key->dst + 1),
     |        ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2155|                   (uint32_t *) (key + 1) - (uint32_t *) (&key->dst + 1),
     |                   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2156|                   hash);
     |                   ~~~~~
lib/conntrack.c:2154:12: note: referencing argument 1 \
        of type ‘const uint32_t *’ {aka ‘const unsigned int *’}
In file included from lib/packets.h:31,
                 from lib/ct-dpif.h:21,
                 from lib/conntrack.h:23,
                 from lib/conntrack.c:26:
lib/hash.h:294:1: note: in a call to function ‘hash_words’
  294 | hash_words(const uint32_t p[], size_t n_words, uint32_t basis)
      | ^~~~~~~~~~

Signed-off-by: Guzowski Adrian <adrian.guzowski@exatel.pl>
Tested-by: Numan Siddique <numans@ovn.org>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2021-07-28 12:03:29 +00:00
+								hash_words(const uint32_t *p, size_t n_words, uint32_t basis)
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								{
 								    return hash_words__(p, n_words, basis);
 								}
 								static inline uint32_t
-												hash: Fix compilation error on Fedora 34 with GCC 11 and -O0.

With newest version of GCC, OVS fails to compile with -O0 due to
false-positive overread detection in hash-related functions.  Those
function declares "const uint32_t p[]" as argument and it throws off
the compiler into thinking that it reads from memory region of size 0.

To fix that behavior, a change in argument declaration needs to be made:
instead of using "[]" notation for a pointer, simply use "*".

The reported error in question:

lib/conntrack.c: In function ‘conn_key_hash’:
lib/conntrack.c:2154:12: error: ‘hash_words’ reading 4 bytes \
                   from a region of size 0 [-Werror=stringop-overread]
 2154| return hash_words((uint32_t *) (&key->dst + 1),
     |        ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2155|                   (uint32_t *) (key + 1) - (uint32_t *) (&key->dst + 1),
     |                   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2156|                   hash);
     |                   ~~~~~
lib/conntrack.c:2154:12: note: referencing argument 1 \
        of type ‘const uint32_t *’ {aka ‘const unsigned int *’}
In file included from lib/packets.h:31,
                 from lib/ct-dpif.h:21,
                 from lib/conntrack.h:23,
                 from lib/conntrack.c:26:
lib/hash.h:294:1: note: in a call to function ‘hash_words’
  294 | hash_words(const uint32_t p[], size_t n_words, uint32_t basis)
      | ^~~~~~~~~~

Signed-off-by: Guzowski Adrian <adrian.guzowski@exatel.pl>
Tested-by: Numan Siddique <numans@ovn.org>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2021-07-28 12:03:29 +00:00
+								hash_words64(const uint64_t *p, size_t n_words, uint32_t basis)
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								{
 								    return hash_words64__(p, n_words, basis);
 								}
 								#endif
-												hash: New helper functions hash_bytes32() and hash_bytes64().

All of the callers of hash_words() and hash_words64() actually find it
easier to pass in the number of bytes instead of the number of 32-bit
or 64-bit words.  These new functions allow the callers to be a little
simpler.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Jarno Rajahalme <jarno@ovn.org>

											
										
										
											2016-01-18 22:52:48 -08:00
+								static inline uint32_t
-												hash: Fix compilation error on Fedora 34 with GCC 11 and -O0.

With newest version of GCC, OVS fails to compile with -O0 due to
false-positive overread detection in hash-related functions.  Those
function declares "const uint32_t p[]" as argument and it throws off
the compiler into thinking that it reads from memory region of size 0.

To fix that behavior, a change in argument declaration needs to be made:
instead of using "[]" notation for a pointer, simply use "*".

The reported error in question:

lib/conntrack.c: In function ‘conn_key_hash’:
lib/conntrack.c:2154:12: error: ‘hash_words’ reading 4 bytes \
                   from a region of size 0 [-Werror=stringop-overread]
 2154| return hash_words((uint32_t *) (&key->dst + 1),
     |        ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2155|                   (uint32_t *) (key + 1) - (uint32_t *) (&key->dst + 1),
     |                   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2156|                   hash);
     |                   ~~~~~
lib/conntrack.c:2154:12: note: referencing argument 1 \
        of type ‘const uint32_t *’ {aka ‘const unsigned int *’}
In file included from lib/packets.h:31,
                 from lib/ct-dpif.h:21,
                 from lib/conntrack.h:23,
                 from lib/conntrack.c:26:
lib/hash.h:294:1: note: in a call to function ‘hash_words’
  294 | hash_words(const uint32_t p[], size_t n_words, uint32_t basis)
      | ^~~~~~~~~~

Signed-off-by: Guzowski Adrian <adrian.guzowski@exatel.pl>
Tested-by: Numan Siddique <numans@ovn.org>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2021-07-28 12:03:29 +00:00
+								hash_bytes32(const uint32_t *p, size_t n_bytes, uint32_t basis)
-												hash: New helper functions hash_bytes32() and hash_bytes64().

All of the callers of hash_words() and hash_words64() actually find it
easier to pass in the number of bytes instead of the number of 32-bit
or 64-bit words.  These new functions allow the callers to be a little
simpler.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Jarno Rajahalme <jarno@ovn.org>

											
										
										
											2016-01-18 22:52:48 -08:00
+								{
 								    return hash_words(p, n_bytes / 4, basis);
 								}
 								static inline uint32_t
-												hash: Fix compilation error on Fedora 34 with GCC 11 and -O0.

With newest version of GCC, OVS fails to compile with -O0 due to
false-positive overread detection in hash-related functions.  Those
function declares "const uint32_t p[]" as argument and it throws off
the compiler into thinking that it reads from memory region of size 0.

To fix that behavior, a change in argument declaration needs to be made:
instead of using "[]" notation for a pointer, simply use "*".

The reported error in question:

lib/conntrack.c: In function ‘conn_key_hash’:
lib/conntrack.c:2154:12: error: ‘hash_words’ reading 4 bytes \
                   from a region of size 0 [-Werror=stringop-overread]
 2154| return hash_words((uint32_t *) (&key->dst + 1),
     |        ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2155|                   (uint32_t *) (key + 1) - (uint32_t *) (&key->dst + 1),
     |                   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 2156|                   hash);
     |                   ~~~~~
lib/conntrack.c:2154:12: note: referencing argument 1 \
        of type ‘const uint32_t *’ {aka ‘const unsigned int *’}
In file included from lib/packets.h:31,
                 from lib/ct-dpif.h:21,
                 from lib/conntrack.h:23,
                 from lib/conntrack.c:26:
lib/hash.h:294:1: note: in a call to function ‘hash_words’
  294 | hash_words(const uint32_t p[], size_t n_words, uint32_t basis)
      | ^~~~~~~~~~

Signed-off-by: Guzowski Adrian <adrian.guzowski@exatel.pl>
Tested-by: Numan Siddique <numans@ovn.org>
Signed-off-by: Ilya Maximets <i.maximets@ovn.org>

											
										
										
											2021-07-28 12:03:29 +00:00
+								hash_bytes64(const uint64_t *p, size_t n_bytes, uint32_t basis)
-												hash: New helper functions hash_bytes32() and hash_bytes64().

All of the callers of hash_words() and hash_words64() actually find it
easier to pass in the number of bytes instead of the number of 32-bit
or 64-bit words.  These new functions allow the callers to be a little
simpler.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Jarno Rajahalme <jarno@ovn.org>

											
										
										
											2016-01-18 22:52:48 -08:00
+								{
 								    return hash_words64(p, n_bytes / 8, basis);
 								}
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
+								static inline uint32_t hash_string(const char *s, uint32_t basis)
 								{
 								    /* Hashes the strlen(s) bytes of 's', i.e. everything up to but not
 								     * including the terminating null byte, passing 'basis' through to
 								     * hash_bytes(). */
 								    return hash_bytes(s, strlen(s), basis);
 								}
 								/* Returns a hash of 'x' and 'basis', computed by handing the two values to
 								 * hash_2words() as a pair of 32-bit words. */
 								static inline uint32_t
 								hash_int(uint32_t x, uint32_t basis)
 								{
 								    const uint32_t hashed = hash_2words(x, basis);
 								    return hashed;
 								}
 								/* An attempt at a useful 1-bit hash function.  Has not been analyzed for
 								 * quality.
 								 *
 								 * Picks one of two fixed constants according to 'x' and XORs it with
 								 * 'basis' rotated left by one bit. */
 								static inline uint32_t
 								hash_boolean(bool x, uint32_t basis)
 								{
 								    const uint32_t if_true = 0xc2b73583;    /* This is hash_int(1, 0). */
 								    const uint32_t if_false = 0xe90f1258;   /* This is hash_int(2, 0). */
 								    const uint32_t rotated = hash_rot(basis, 1);
 								    if (x) {
 								        return if_true ^ rotated;
 								    }
 								    return if_false ^ rotated;
 								}
-												hash: New helper functions for adding words in a buffer to a hash.

These will receive their first user (outside of hash.h) in the following
commit.

Signed-off-by: Ben Pfaff <blp@ovn.org>
Acked-by: Darrell Ball <dlu998@gmail.com>
Signed-off-by: Ben Pfaff <blp@ovn.org>

											
										
										
											2017-06-09 15:30:42 -07:00
 								/* Helper functions for calling hash_add() for several 32- or 64-bit words in a
 								 * buffer.  These are not hash functions by themselves, since they need
 								 * hash_finish() to be called, so if you are looking for a full hash function
 								 * see hash_words(), etc. */
 								/* Folds the 'n_words' 32-bit words starting at 'p' into 'hash', one
 								 * hash_add() call per word in buffer order, and returns the updated value.
 								 * The result has not been through hash_finish(). */
 								static inline uint32_t
 								hash_add_words(uint32_t hash, const uint32_t *p, size_t n_words)
 								{
 								    size_t remaining = n_words;
 								    while (remaining > 0) {
 								        hash = hash_add(hash, *p);
 								        p++;
 								        remaining--;
 								    }
 								    return hash;
 								}
 								/* Folds the 'n_words' 64-bit words starting at 'p' into 'hash', one
 								 * hash_add64() call per word in buffer order, and returns the updated
 								 * value.  The result has not been through hash_finish(). */
 								static inline uint32_t
 								hash_add_words64(uint32_t hash, const uint64_t *p, size_t n_words)
 								{
 								    size_t remaining = n_words;
 								    while (remaining > 0) {
 								        hash = hash_add64(hash, *p);
 								        p++;
 								        remaining--;
 								    }
 								    return hash;
 								}
 								/* Byte-count front end for hash_add_words(): folds the first
 								 * 'n_bytes' / 4 32-bit words at 'p' into 'hash'.  The division truncates,
 								 * so any trailing bytes that do not make up a whole word are ignored. */
 								static inline uint32_t
 								hash_add_bytes32(uint32_t hash, const uint32_t *p, size_t n_bytes)
 								{
 								    const size_t n_words = n_bytes / 4;
 								    return hash_add_words(hash, p, n_words);
 								}
 								/* Byte-count front end for hash_add_words64(): folds the first
 								 * 'n_bytes' / 8 64-bit words at 'p' into 'hash'.  The division truncates,
 								 * so any trailing bytes that do not make up a whole word are ignored. */
 								static inline uint32_t
 								hash_add_bytes64(uint32_t hash, const uint64_t *p, size_t n_bytes)
 								{
 								    const size_t n_words = n_bytes / 8;
 								    return hash_add_words64(hash, p, n_words);
 								}
-												lib/hash: Use CRC32 for hashing.

Use CRC32 intrinsics for hash computations when building for
X86_64 with SSE4_2.

Add a new hash_words64() and change hash_words() to be inlined when
'n_words' is a compile-time constant.

Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com>
Acked-by: Ben Pfaff <blp@nicira.com>

											
										
										
											2014-07-11 05:57:11 -07:00
-												lib: Adapt headers for use in C++.

This commit makes several library headers suitable for inclusion in C++.

It adds [extern "C"] guards and makes minor changes to fix casting and
keyword issues.

											
										
										
											2011-08-04 16:18:59 -07:00
+								#ifdef __cplusplus
 								}
 								#endif
-												Import from old repository commit 61ef2b42a9c4ba8e1600f15bb0236765edc2ad45.

											
										
										
											2009-07-08 13:19:16 -07:00
+								#endif /* hash.h */