ovs/lib/mpsc-queue.h

/*
 * Copyright (c) 2021 NVIDIA Corporation.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef MPSC_QUEUE_H
#define MPSC_QUEUE_H 1

#include <stdbool.h>
#include <stdint.h>
#include <stddef.h>

#include <openvswitch/thread.h>
#include <openvswitch/util.h>

#include "ovs-atomic.h"

/* Multi-producer, single-consumer queue
 * =====================================
 *
 * This data structure is a lockless queue implementation with
 * the following properties:
 *
 *  * Multi-producer: multiple threads can write concurrently.
 *    Insertion in the queue is thread-safe, no inter-thread
 *    synchronization is necessary.
 *
 *  * Single-consumer: only a single thread can safely remove
 *    nodes from the queue.  The queue must be 'acquired' using
 *    'mpsc_queue_acquire()' before removing nodes.
 *
 *  * Unbounded: the queue is backed by a linked-list and is not
 *    limited in number of elements.
 *
 *  * Intrusive: queue elements are allocated as part of larger
 *    objects.  Objects are retrieved by offset manipulation.
 *
 *  * per-producer FIFO: Elements in the queue are kept in the
 *    order their producer inserted them.  The consumer retrieves
 *    them in in the same insertion order.  When multiple
 *    producers insert at the same time, either will proceed.
 *
 * This queue is well-suited for message passing between threads,
 * where any number of thread can insert a message and a single
 * thread is meant to receive and process it.
 *
 * Thread-safety
 * =============
 *
 *  The consumer thread must acquire the queue using 'mpsc_queue_acquire()'.
 *  Once the queue is protected against concurrent reads, the thread can call
 *  the consumer API:
 *
 *      * mpsc_queue_poll() to peek and return the tail of the queue
 *      * mpsc_queue_pop() to remove the tail of the queue
 *      * mpsc_queue_tail() to read the current tail
 *      * mpsc_queue_push_front() to enqueue an element safely at the tail
 *      * MPSC_QUEUE_FOR_EACH() to iterate over the current elements,
 *        without removing them.
 *      * MPSC_QUEUE_FOR_EACH_POP() to iterate over the elements while
 *        removing them.
 *
 *  When a thread is finished with reading the queue, it can release the
 *  reader lock using 'mpsc_queue_release()'.
 *
 *  Producers can always insert elements in the queue, even if no consumer
 *  acquired the reader lock.  No inter-producer synchronization is needed.
 *
 *  The consumer thread is also allowed to insert elements while it holds the
 *  reader lock.
 *
 *  Producer threads must never be cancelled while writing to the queue.
 *  This will block the consumer, that will then lose any subsequent elements
 *  in the queue.  Producers should ideally be cooperatively managed or
 *  the queue insertion should be within non-cancellable sections.
 *
 * Queue state
 * ===========
 *
 *  When polling the queue, three states can be observed: 'empty', 'non-empty',
 *  and 'inconsistent'.  Three polling results are defined, respectively:
 *
 *   * MPSC_QUEUE_EMPTY: the queue is empty.
 *   * MPSC_QUEUE_ITEM: an item was available and has been removed.
 *   * MPSC_QUEUE_RETRY: the queue is inconsistent.
 *
 *  If 'MPSC_QUEUE_RETRY' is returned, then a producer has not yet finished
 *  writing to the queue and the list of nodes is not coherent.  The consumer
 *  can retry shortly to check if the producer has finished.
 *
 *  This behavior is the reason the removal function is called
 *  'mpsc_queue_poll()'.
 *
 */

struct mpsc_queue_node {
    ATOMIC(struct mpsc_queue_node *) next;
};

struct mpsc_queue {
    ATOMIC(struct mpsc_queue_node *) head;
    ATOMIC(struct mpsc_queue_node *) tail;
    struct mpsc_queue_node stub;
    struct ovs_mutex read_lock;
};

#define MPSC_QUEUE_INITIALIZER(Q) { \
    .head = &(Q)->stub, \
    .tail = &(Q)->stub, \
    .stub = { .next = NULL }, \
    .read_lock = OVS_MUTEX_INITIALIZER, \
}

/* Consumer API. */

/* Initialize the queue. Not necessary is 'MPSC_QUEUE_INITIALIZER' was used. */
void mpsc_queue_init(struct mpsc_queue *queue);
/* The reader lock must be released prior to destroying the queue. */
void mpsc_queue_destroy(struct mpsc_queue *queue);

/* Acquire and release the consumer lock. */
#define mpsc_queue_acquire(q) do { \
        ovs_mutex_lock(&(q)->read_lock); \
    } while (0)
#define mpsc_queue_release(q) do { \
        ovs_mutex_unlock(&(q)->read_lock); \
    } while (0)

enum mpsc_queue_poll_result {
    /* Queue is empty. */
    MPSC_QUEUE_EMPTY,
    /* Polling the queue returned an item. */
    MPSC_QUEUE_ITEM,
    /* Data has been enqueued but one or more producer thread have not
     * finished writing it. The queue is in an inconsistent state.
     * Retrying shortly, if the producer threads are still active, will
     * return the data.
     */
    MPSC_QUEUE_RETRY,
};

/* Set 'node' to a removed item from the queue if 'MPSC_QUEUE_ITEM' is
 * returned, otherwise 'node' is not set.
 */
enum mpsc_queue_poll_result mpsc_queue_poll(struct mpsc_queue *queue,
                                            struct mpsc_queue_node **node)
    OVS_REQUIRES(queue->read_lock);

/* Pop an element if there is any in the queue. */
struct mpsc_queue_node *mpsc_queue_pop(struct mpsc_queue *queue)
    OVS_REQUIRES(queue->read_lock);

/* Insert at the front of the queue. Only the consumer can do it. */
void mpsc_queue_push_front(struct mpsc_queue *queue,
                           struct mpsc_queue_node *node)
    OVS_REQUIRES(queue->read_lock);

/* Get the current queue tail. */
struct mpsc_queue_node *mpsc_queue_tail(struct mpsc_queue *queue)
    OVS_REQUIRES(queue->read_lock);

/* Get the next element of a node. */
struct mpsc_queue_node *mpsc_queue_next(struct mpsc_queue *queue,
                                        struct mpsc_queue_node *prev)
    OVS_REQUIRES(queue->read_lock);

#define MPSC_QUEUE_FOR_EACH(node, queue) \
    for (node = mpsc_queue_tail(queue); node != NULL; \
         node = mpsc_queue_next((queue), node))

#define MPSC_QUEUE_FOR_EACH_POP(node, queue) \
    for (node = mpsc_queue_pop(queue); node != NULL; \
         node = mpsc_queue_pop(queue))

/* Producer API. */

void mpsc_queue_insert(struct mpsc_queue *queue, struct mpsc_queue_node *node);

#endif /* MPSC_QUEUE_H */
mpsc-queue: Module for lock-free message passing. Add a lockless multi-producer/single-consumer (MPSC), linked-list based, intrusive, unbounded queue that does not require deferred memory management. The queue is designed to improve the specific MPSC setup. A benchmark accompanies the unit tests to measure the difference in this configuration. A single reader thread polls the queue while N writers enqueue elements as fast as possible. The mpsc-queue is compared against the regular ovs-list as well as the guarded list. The latter usually offers a slight improvement by batching the element removal, however the mpsc-queue is faster. The average is of each producer threads time: $ ./tests/ovstest test-mpsc-queue benchmark 3000000 1 Benchmarking n=3000000 on 1 + 1 threads. type\thread: Reader 1 Avg mpsc-queue: 167 167 167 ms list(spin): 89 80 80 ms list(mutex): 745 745 745 ms guarded list: 788 788 788 ms $ ./tests/ovstest test-mpsc-queue benchmark 3000000 2 Benchmarking n=3000000 on 1 + 2 threads. type\thread: Reader 1 2 Avg mpsc-queue: 98 97 94 95 ms list(spin): 185 171 173 172 ms list(mutex): 203 199 203 201 ms guarded list: 269 269 188 228 ms $ ./tests/ovstest test-mpsc-queue benchmark 3000000 3 Benchmarking n=3000000 on 1 + 3 threads. type\thread: Reader 1 2 3 Avg mpsc-queue: 76 76 65 76 72 ms list(spin): 246 110 240 238 196 ms list(mutex): 542 541 541 539 540 ms guarded list: 535 535 507 511 517 ms $ ./tests/ovstest test-mpsc-queue benchmark 3000000 4 Benchmarking n=3000000 on 1 + 4 threads. type\thread: Reader 1 2 3 4 Avg mpsc-queue: 73 68 68 68 68 68 ms list(spin): 294 275 279 277 282 278 ms list(mutex): 346 309 287 345 302 310 ms guarded list: 378 319 334 378 351 345 ms Signed-off-by: Gaetan Rivet <grive@u256.net> Reviewed-by: Eli Britstein <elibr@nvidia.com> Reviewed-by: Maxime Coquelin <maxime.coquelin@redhat.com> Signed-off-by: Ilya Maximets <i.maximets@ovn.org> 2021-09-08 11:47:36 +02:00			`/*`
			`* Copyright (c) 2021 NVIDIA Corporation.`
			`*`
			`* Licensed under the Apache License, Version 2.0 (the "License");`
			`* you may not use this file except in compliance with the License.`
			`* You may obtain a copy of the License at:`
			`*`
			`* http://www.apache.org/licenses/LICENSE-2.0`
			`*`
			`* Unless required by applicable law or agreed to in writing, software`
			`* distributed under the License is distributed on an "AS IS" BASIS,`
			`* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`* See the License for the specific language governing permissions and`
			`* limitations under the License.`
			`*/`

			`#ifndef MPSC_QUEUE_H`
			`#define MPSC_QUEUE_H 1`

			`#include <stdbool.h>`
			`#include <stdint.h>`
			`#include <stddef.h>`

			`#include <openvswitch/thread.h>`
			`#include <openvswitch/util.h>`

			`#include "ovs-atomic.h"`

			`/* Multi-producer, single-consumer queue`
			`* =====================================`
			`*`
			`* This data structure is a lockless queue implementation with`
			`* the following properties:`
			`*`
			`* * Multi-producer: multiple threads can write concurrently.`
			`* Insertion in the queue is thread-safe, no inter-thread`
			`* synchronization is necessary.`
			`*`
			`* * Single-consumer: only a single thread can safely remove`
			`* nodes from the queue. The queue must be 'acquired' using`
			`* 'mpsc_queue_acquire()' before removing nodes.`
			`*`
			`* * Unbounded: the queue is backed by a linked-list and is not`
			`* limited in number of elements.`
			`*`
			`* * Intrusive: queue elements are allocated as part of larger`
			`* objects. Objects are retrieved by offset manipulation.`
			`*`
			`* * per-producer FIFO: Elements in the queue are kept in the`
			`* order their producer inserted them. The consumer retrieves`
			`* them in in the same insertion order. When multiple`
			`* producers insert at the same time, either will proceed.`
			`*`
			`* This queue is well-suited for message passing between threads,`
			`* where any number of thread can insert a message and a single`
			`* thread is meant to receive and process it.`
			`*`
			`* Thread-safety`
			`* =============`
			`*`
			`* The consumer thread must acquire the queue using 'mpsc_queue_acquire()'.`
			`* Once the queue is protected against concurrent reads, the thread can call`
			`* the consumer API:`
			`*`
			`* * mpsc_queue_poll() to peek and return the tail of the queue`
			`* * mpsc_queue_pop() to remove the tail of the queue`
			`* * mpsc_queue_tail() to read the current tail`
			`* * mpsc_queue_push_front() to enqueue an element safely at the tail`
			`* * MPSC_QUEUE_FOR_EACH() to iterate over the current elements,`
			`* without removing them.`
			`* * MPSC_QUEUE_FOR_EACH_POP() to iterate over the elements while`
			`* removing them.`
			`*`
			`* When a thread is finished with reading the queue, it can release the`
			`* reader lock using 'mpsc_queue_release()'.`
			`*`
			`* Producers can always insert elements in the queue, even if no consumer`
			`* acquired the reader lock. No inter-producer synchronization is needed.`
			`*`
			`* The consumer thread is also allowed to insert elements while it holds the`
			`* reader lock.`
			`*`
			`* Producer threads must never be cancelled while writing to the queue.`
			`* This will block the consumer, that will then lose any subsequent elements`
			`* in the queue. Producers should ideally be cooperatively managed or`
			`* the queue insertion should be within non-cancellable sections.`
			`*`
			`* Queue state`
			`* ===========`
			`*`
			`* When polling the queue, three states can be observed: 'empty', 'non-empty',`
			`* and 'inconsistent'. Three polling results are defined, respectively:`
			`*`
			`* * MPSC_QUEUE_EMPTY: the queue is empty.`
			`* * MPSC_QUEUE_ITEM: an item was available and has been removed.`
			`* * MPSC_QUEUE_RETRY: the queue is inconsistent.`
			`*`
			`* If 'MPSC_QUEUE_RETRY' is returned, then a producer has not yet finished`
			`* writing to the queue and the list of nodes is not coherent. The consumer`
			`* can retry shortly to check if the producer has finished.`
			`*`
			`* This behavior is the reason the removal function is called`
			`* 'mpsc_queue_poll()'.`
			`*`
			`*/`

			`struct mpsc_queue_node {`
			`ATOMIC(struct mpsc_queue_node *) next;`
			`};`

			`struct mpsc_queue {`
			`ATOMIC(struct mpsc_queue_node *) head;`
			`ATOMIC(struct mpsc_queue_node *) tail;`
			`struct mpsc_queue_node stub;`
			`struct ovs_mutex read_lock;`
			`};`

			`#define MPSC_QUEUE_INITIALIZER(Q) { \`
treewide: Remove uses of ATOMIC_VAR_INIT. ATOMIC_VAR_INIT has a trivial definition `#define ATOMIC_VAR_INIT(value) (value)`, is deprecated in C17/C++20, and will be removed in newer standards in newer GCC/Clang (e.g. https://reviews.llvm.org/D144196). Signed-off-by: Fangrui Song <maskray@google.com> Signed-off-by: Ilya Maximets <i.maximets@ovn.org> 2023-02-28 18:30:56 -08:00			`.head = &(Q)->stub, \`
			`.tail = &(Q)->stub, \`
			`.stub = { .next = NULL }, \`
mpsc-queue: Module for lock-free message passing. Add a lockless multi-producer/single-consumer (MPSC), linked-list based, intrusive, unbounded queue that does not require deferred memory management. The queue is designed to improve the specific MPSC setup. A benchmark accompanies the unit tests to measure the difference in this configuration. A single reader thread polls the queue while N writers enqueue elements as fast as possible. The mpsc-queue is compared against the regular ovs-list as well as the guarded list. The latter usually offers a slight improvement by batching the element removal, however the mpsc-queue is faster. The average is of each producer threads time: $ ./tests/ovstest test-mpsc-queue benchmark 3000000 1 Benchmarking n=3000000 on 1 + 1 threads. type\thread: Reader 1 Avg mpsc-queue: 167 167 167 ms list(spin): 89 80 80 ms list(mutex): 745 745 745 ms guarded list: 788 788 788 ms $ ./tests/ovstest test-mpsc-queue benchmark 3000000 2 Benchmarking n=3000000 on 1 + 2 threads. type\thread: Reader 1 2 Avg mpsc-queue: 98 97 94 95 ms list(spin): 185 171 173 172 ms list(mutex): 203 199 203 201 ms guarded list: 269 269 188 228 ms $ ./tests/ovstest test-mpsc-queue benchmark 3000000 3 Benchmarking n=3000000 on 1 + 3 threads. type\thread: Reader 1 2 3 Avg mpsc-queue: 76 76 65 76 72 ms list(spin): 246 110 240 238 196 ms list(mutex): 542 541 541 539 540 ms guarded list: 535 535 507 511 517 ms $ ./tests/ovstest test-mpsc-queue benchmark 3000000 4 Benchmarking n=3000000 on 1 + 4 threads. type\thread: Reader 1 2 3 4 Avg mpsc-queue: 73 68 68 68 68 68 ms list(spin): 294 275 279 277 282 278 ms list(mutex): 346 309 287 345 302 310 ms guarded list: 378 319 334 378 351 345 ms Signed-off-by: Gaetan Rivet <grive@u256.net> Reviewed-by: Eli Britstein <elibr@nvidia.com> Reviewed-by: Maxime Coquelin <maxime.coquelin@redhat.com> Signed-off-by: Ilya Maximets <i.maximets@ovn.org> 2021-09-08 11:47:36 +02:00			`.read_lock = OVS_MUTEX_INITIALIZER, \`
			`}`

			`/* Consumer API. */`

			`/* Initialize the queue. Not necessary is 'MPSC_QUEUE_INITIALIZER' was used. */`
			`void mpsc_queue_init(struct mpsc_queue *queue);`
			`/* The reader lock must be released prior to destroying the queue. */`
			`void mpsc_queue_destroy(struct mpsc_queue *queue);`

			`/* Acquire and release the consumer lock. */`
			`#define mpsc_queue_acquire(q) do { \`
			`ovs_mutex_lock(&(q)->read_lock); \`
			`} while (0)`
			`#define mpsc_queue_release(q) do { \`
			`ovs_mutex_unlock(&(q)->read_lock); \`
			`} while (0)`

			`enum mpsc_queue_poll_result {`
			`/* Queue is empty. */`
			`MPSC_QUEUE_EMPTY,`
			`/* Polling the queue returned an item. */`
			`MPSC_QUEUE_ITEM,`
			`/* Data has been enqueued but one or more producer thread have not`
			`* finished writing it. The queue is in an inconsistent state.`
			`* Retrying shortly, if the producer threads are still active, will`
			`* return the data.`
			`*/`
			`MPSC_QUEUE_RETRY,`
			`};`

			`/* Set 'node' to a removed item from the queue if 'MPSC_QUEUE_ITEM' is`
			`* returned, otherwise 'node' is not set.`
			`*/`
			`enum mpsc_queue_poll_result mpsc_queue_poll(struct mpsc_queue *queue,`
			`struct mpsc_queue_node **node)`
			`OVS_REQUIRES(queue->read_lock);`

			`/* Pop an element if there is any in the queue. */`
			`struct mpsc_queue_node mpsc_queue_pop(struct mpsc_queue queue)`
			`OVS_REQUIRES(queue->read_lock);`

			`/* Insert at the front of the queue. Only the consumer can do it. */`
			`void mpsc_queue_push_front(struct mpsc_queue *queue,`
			`struct mpsc_queue_node *node)`
			`OVS_REQUIRES(queue->read_lock);`

			`/* Get the current queue tail. */`
			`struct mpsc_queue_node mpsc_queue_tail(struct mpsc_queue queue)`
			`OVS_REQUIRES(queue->read_lock);`

			`/* Get the next element of a node. */`
			`struct mpsc_queue_node mpsc_queue_next(struct mpsc_queue queue,`
			`struct mpsc_queue_node *prev)`
			`OVS_REQUIRES(queue->read_lock);`

			`#define MPSC_QUEUE_FOR_EACH(node, queue) \`
			`for (node = mpsc_queue_tail(queue); node != NULL; \`
			`node = mpsc_queue_next((queue), node))`

			`#define MPSC_QUEUE_FOR_EACH_POP(node, queue) \`
			`for (node = mpsc_queue_pop(queue); node != NULL; \`
			`node = mpsc_queue_pop(queue))`

			`/* Producer API. */`

			`void mpsc_queue_insert(struct mpsc_queue queue, struct mpsc_queue_node node);`

			`#endif /* MPSC_QUEUE_H */`