mirror of
				https://github.com/openvswitch/ovs
				synced 2025-10-25 15:07:05 +00:00 
			
		
		
		
	This patch adds a new functions classifier_defer() and classifier_publish(), which control when the classifier modifications are made available to lookups. By default, all modifications are made available to lookups immediately. Modifications made after a classifier_defer() call MAY be 'deferred' for later 'publication'. A call to classifier_publish() will both publish any deferred modifications, and cause subsequent changes to to be published immediately. Currently any deferring is limited to the visibility of the subtable vector changes. pvector now processes modifications mostly in a working copy, which needs to be explicitly published with pvector_publish(). pvector_publish() sorts the working copy and removes gaps before publishing it. This change helps avoiding O(n**2) memory behavior in corner cases, where large number of rules with different masks are inserted or deleted. VMware-BZ: #1322017 Signed-off-by: Jarno Rajahalme <jrajahalme@nicira.com> Acked-by: Ben Pfaff <blp@nicira.com>
		
			
				
	
	
		
			242 lines
		
	
	
		
			8.4 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			242 lines
		
	
	
		
			8.4 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | ||
|  * Copyright (c) 2014 Nicira, Inc.
 | ||
|  *
 | ||
|  * Licensed under the Apache License, Version 2.0 (the "License");
 | ||
|  * you may not use this file except in compliance with the License.
 | ||
|  * You may obtain a copy of the License at:
 | ||
|  *
 | ||
|  *     http://www.apache.org/licenses/LICENSE-2.0
 | ||
|  *
 | ||
|  * Unless required by applicable law or agreed to in writing, software
 | ||
|  * distributed under the License is distributed on an "AS IS" BASIS,
 | ||
|  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||
|  * See the License for the specific language governing permissions and
 | ||
|  * limitations under the License.
 | ||
|  */
 | ||
| 
 | ||
| #ifndef PVECTOR_H
 | ||
| #define PVECTOR_H 1
 | ||
| 
 | ||
| #include <stdbool.h>
 | ||
| #include <stdint.h>
 | ||
| #include <stdlib.h>
 | ||
| #include "ovs-rcu.h"
 | ||
| #include "util.h"
 | ||
| 
 | ||
| /* Concurrent Priority Vector
 | ||
|  * ==========================
 | ||
|  *
 | ||
|  * Concurrent priority vector holds non-NULL pointers to objects in an
 | ||
|  * increasing priority order and allows readers to traverse the vector without
 | ||
|  * being concerned about writers modifying the vector as they are traversing
 | ||
|  * it.
 | ||
|  *
 | ||
|  * The priority order is maintained as a linear vector of elements to allow
 | ||
|  * for efficient memory prefetching.
 | ||
|  *
 | ||
|  * Concurrency is implemented with OVS RCU so that the readers can assume
 | ||
|  * that once they have taken a pointer to the vector with
 | ||
|  * pvector_cursor_init(), the 'size' member will not decrease, so that
 | ||
|  * they can safely read 'size' entries from 'vector', and find that each
 | ||
|  * entry has a valid, non-NULL 'ptr', and the vector is in order from highest
 | ||
|  * to lowest 'priority'.  The 'priority' values can change any time, but only
 | ||
|  * so that the order of the entries does not change, so readers can use
 | ||
|  * 'priority' values read at any time after acquisition of the vector pointer.
 | ||
|  *
 | ||
|  * Writers can concurrently add entries to the end of the vector, incrementing
 | ||
|  * 'size', or update the 'priority' value of an entry, but only if that does
 | ||
|  * not change the ordering of the entries.  Writers will never change the 'ptr'
 | ||
|  * values, or decrement the 'size' on a copy that readers have access to.
 | ||
|  *
 | ||
|  * Most modifications are internally staged at the 'temp' vector, from which
 | ||
|  * they can be published at 'impl' by calling pvector_publish().  This saves
 | ||
|  * unnecessary memory allocations when many changes are done back-to-back.
 | ||
|  * 'temp' may contain NULL pointers and it may be in unsorted order.  It is
 | ||
|  * sorted before it is published at 'impl', which also removes the NULLs from
 | ||
|  * the published vector.
 | ||
|  *
 | ||
|  * Clients should not use priority INT_MIN.
 | ||
|  */
 | ||
| 
 | ||
| struct pvector_entry {
 | ||
|     int priority;
 | ||
|     void *ptr;
 | ||
| };
 | ||
| 
 | ||
| /* Writers will preallocate space for some entries at the end to avoid future
 | ||
|  * reallocations. */
 | ||
| enum { PVECTOR_EXTRA_ALLOC = 4 };
 | ||
| 
 | ||
| struct pvector_impl {
 | ||
|     size_t size;       /* Number of entries in the vector. */
 | ||
|     size_t allocated;  /* Number of allocated entries. */
 | ||
|     struct pvector_entry vector[];
 | ||
| };
 | ||
| 
 | ||
| /* Concurrent priority vector. */
 | ||
| struct pvector {
 | ||
|     OVSRCU_TYPE(struct pvector_impl *) impl;
 | ||
|     struct pvector_impl *temp;
 | ||
| };
 | ||
| 
 | ||
| /* Initialization. */
 | ||
| void pvector_init(struct pvector *);
 | ||
| void pvector_destroy(struct pvector *);
 | ||
| 
 | ||
| /* Insertion and deletion.  These work on 'temp'.  */
 | ||
| void pvector_insert(struct pvector *, void *, int priority);
 | ||
| void pvector_change_priority(struct pvector *, void *, int priority);
 | ||
| void pvector_remove(struct pvector *, void *);
 | ||
| 
 | ||
| /* Make the modified pvector available for iteration. */
 | ||
| static inline void pvector_publish(struct pvector *);
 | ||
| 
 | ||
| /* Count.  These operate on the published pvector. */
 | ||
| static inline size_t pvector_count(const struct pvector *);
 | ||
| static inline bool pvector_is_empty(const struct pvector *);
 | ||
| 
 | ||
| /* Iteration.
 | ||
|  *
 | ||
|  *
 | ||
|  * Thread-safety
 | ||
|  * =============
 | ||
|  *
 | ||
|  * Iteration is safe even in a pvector that is changing concurrently.
 | ||
|  * Multiple writers must exclude each other via e.g., a mutex.
 | ||
|  *
 | ||
|  * Example
 | ||
|  * =======
 | ||
|  *
 | ||
|  *     struct my_node {
 | ||
|  *         int data;
 | ||
|  *     };
 | ||
|  *
 | ||
|  *     struct my_node elem1, elem2, *iter;
 | ||
|  *     struct pvector my_pvector;
 | ||
|  *
 | ||
|  *     pvector_init(&my_pvector);
 | ||
|  *     ...add data...
 | ||
|  *     pvector_insert(&my_pvector, &elem1, 1);
 | ||
|  *     pvector_insert(&my_pvector, &elem2, 2);
 | ||
|  *     ...
 | ||
|  *     PVECTOR_FOR_EACH (iter, &my_pvector) {
 | ||
|  *         ...operate on '*iter'...
 | ||
|  *         ...elem2 to be seen before elem1...
 | ||
|  *     }
 | ||
|  *     ...
 | ||
|  *     pvector_destroy(&my_pvector);
 | ||
|  *
 | ||
|  * There is no PVECTOR_FOR_EACH_SAFE variant as iteration is performed on RCU
 | ||
|  * protected instance of the priority vector.  Any concurrent modifications
 | ||
|  * that would be disruptive for readers (such as deletions), will be performed
 | ||
|  * on a new instance.  To see any of the modifications, a new iteration loop
 | ||
|  * has to be started.
 | ||
|  *
 | ||
|  * The PVECTOR_FOR_EACH_PRIORITY limits the iteration to entries with higher
 | ||
|  * than given priority and allows for object lookahead.
 | ||
|  *
 | ||
|  * The iteration loop must be completed without entering the OVS RCU quiescent
 | ||
|  * period.  That is, an old iteration loop must not be continued after any
 | ||
|  * blocking IO (VLOG is non-blocking, so that is OK).
 | ||
|  */
 | ||
| struct pvector_cursor {
 | ||
|     size_t size;        /* Number of entries in the vector. */
 | ||
|     size_t entry_idx;   /* Current index. */
 | ||
|     const struct pvector_entry *vector;
 | ||
| };
 | ||
| 
 | ||
| static inline struct pvector_cursor pvector_cursor_init(const struct pvector *,
 | ||
|                                                         size_t n_ahead,
 | ||
|                                                         size_t obj_size);
 | ||
| static inline void *pvector_cursor_next(struct pvector_cursor *,
 | ||
|                                         int stop_at_priority,
 | ||
|                                         size_t n_ahead, size_t obj_size);
 | ||
| static inline void pvector_cursor_lookahead(const struct pvector_cursor *,
 | ||
|                                             int n, size_t size);
 | ||
| 
 | ||
| #define PVECTOR_FOR_EACH(PTR, PVECTOR)                                  \
 | ||
|     for (struct pvector_cursor cursor__ = pvector_cursor_init(PVECTOR, 0, 0); \
 | ||
|          ((PTR) = pvector_cursor_next(&cursor__, INT_MIN, 0, 0)) != NULL; )
 | ||
| 
 | ||
| /* Loop while priority is higher than 'PRIORITY' and prefetch objects
 | ||
|  * of size 'SZ' 'N' objects ahead from the current object. */
 | ||
| #define PVECTOR_FOR_EACH_PRIORITY(PTR, PRIORITY, N, SZ, PVECTOR)        \
 | ||
|     for (struct pvector_cursor cursor__ = pvector_cursor_init(PVECTOR, N, SZ); \
 | ||
|          ((PTR) = pvector_cursor_next(&cursor__, PRIORITY, N, SZ)) != NULL; )
 | ||
| 
 | ||
| #define PVECTOR_CURSOR_FOR_EACH(PTR, CURSOR, PVECTOR)                \
 | ||
|     for (*(CURSOR) = pvector_cursor_init(PVECTOR, 0, 0);             \
 | ||
|          ((PTR) = pvector_cursor_next(CURSOR, INT_MIN, 0, 0)) != NULL; )
 | ||
| 
 | ||
| #define PVECTOR_CURSOR_FOR_EACH_CONTINUE(PTR, CURSOR)                   \
 | ||
|     for (; ((PTR) = pvector_cursor_next(CURSOR, INT_MIN, 0, 0)) != NULL; )
 | ||
| 
 | ||
| 
 | ||
| /* Inline implementations. */
 | ||
| 
 | ||
| static inline struct pvector_cursor
 | ||
| pvector_cursor_init(const struct pvector *pvec,
 | ||
|                     size_t n_ahead, size_t obj_size)
 | ||
| {
 | ||
|     const struct pvector_impl *impl;
 | ||
|     struct pvector_cursor cursor;
 | ||
| 
 | ||
|     impl = ovsrcu_get(struct pvector_impl *, &pvec->impl);
 | ||
| 
 | ||
|     ovs_prefetch_range(impl->vector, impl->size * sizeof impl->vector[0]);
 | ||
| 
 | ||
|     cursor.size = impl->size;
 | ||
|     cursor.vector = impl->vector;
 | ||
|     cursor.entry_idx = -1;
 | ||
| 
 | ||
|     for (size_t i = 0; i < n_ahead; i++) {
 | ||
|         /* Prefetch the first objects. */
 | ||
|         pvector_cursor_lookahead(&cursor, i, obj_size);
 | ||
|     }
 | ||
|     return cursor;
 | ||
| }
 | ||
| 
 | ||
| static inline void *pvector_cursor_next(struct pvector_cursor *cursor,
 | ||
|                                         int stop_at_priority,
 | ||
|                                         size_t n_ahead, size_t obj_size)
 | ||
| {
 | ||
|     if (++cursor->entry_idx < cursor->size &&
 | ||
|         cursor->vector[cursor->entry_idx].priority > stop_at_priority) {
 | ||
|         if (n_ahead) {
 | ||
|             pvector_cursor_lookahead(cursor, n_ahead, obj_size);
 | ||
|         }
 | ||
|         return cursor->vector[cursor->entry_idx].ptr;
 | ||
|     }
 | ||
|     return NULL;
 | ||
| }
 | ||
| 
 | ||
| static inline void pvector_cursor_lookahead(const struct pvector_cursor *cursor,
 | ||
|                                             int n, size_t size)
 | ||
| {
 | ||
|     if (cursor->entry_idx + n < cursor->size) {
 | ||
|         ovs_prefetch_range(cursor->vector[cursor->entry_idx + n].ptr, size);
 | ||
|     }
 | ||
| }
 | ||
| 
 | ||
| static inline size_t pvector_count(const struct pvector *pvec)
 | ||
| {
 | ||
|     return ovsrcu_get(struct pvector_impl *, &pvec->impl)->size;
 | ||
| }
 | ||
| 
 | ||
| static inline bool pvector_is_empty(const struct pvector *pvec)
 | ||
| {
 | ||
|     return pvector_count(pvec) == 0;
 | ||
| }
 | ||
| 
 | ||
| void pvector_publish__(struct pvector *);
 | ||
| 
 | ||
| /* Make the modified pvector available for iteration. */
 | ||
| static inline void pvector_publish(struct pvector *pvec)
 | ||
| {
 | ||
|     if (pvec->temp) {
 | ||
|         pvector_publish__(pvec);
 | ||
|     }
 | ||
| }
 | ||
| 
 | ||
| #endif /* pvector.h */
 |