Add atomic bit test/set/clear/assign/flip and
test-and-set/clear/assign/flip functions.

All atomic bit functions allow (and indeed, require) the caller to
specify a memory order.

RFC v8:
 * Add missing macro #undef for C++ version of atomic bit flip.

RFC v7:
 * Replace compare-exchange-based rte_bitset_atomic_test_and_*() and
   flip() with implementations that use the previous value as returned
   by the atomic fetch function.
 * Reword documentation to match the non-atomic macro variants.
 * Remove pointer to <rte_stdatomic.h> for memory model documentation,
   since there is no documentation for that API.

RFC v6:
 * Have rte_bit_atomic_test() accept const-marked bitsets.

RFC v4:
 * Add atomic bit flip.
 * Mark macro-generated private functions experimental.

RFC v3:
 * Work around lack of C++ support for _Generic (Tyler Retzlaff).

RFC v2:
 o Add rte_bit_atomic_test_and_assign() (for consistency).
 o Fix bugs in rte_bit_atomic_test_and_[set|clear]().
 o Use <rte_stdatomics.h> to support MSVC.

Signed-off-by: Mattias Rönnblom <mattias.ronnb...@ericsson.com>
Acked-by: Morten Brørup <m...@smartsharesystems.com>
Acked-by: Tyler Retzlaff <roret...@linux.microsoft.com>
---
 lib/eal/include/rte_bitops.h | 414 +++++++++++++++++++++++++++++++++++
 1 file changed, 414 insertions(+)

diff --git a/lib/eal/include/rte_bitops.h b/lib/eal/include/rte_bitops.h
index 3297133e22..4d878099ed 100644
--- a/lib/eal/include/rte_bitops.h
+++ b/lib/eal/include/rte_bitops.h
@@ -21,6 +21,7 @@
 
 #include <rte_compat.h>
 #include <rte_debug.h>
+#include <rte_stdatomic.h>
 
 #ifdef __cplusplus
 extern "C" {
@@ -226,6 +227,204 @@ extern "C" {
                 uint32_t *: __rte_bit_flip32,                          \
                 uint64_t *: __rte_bit_flip64)(addr, nr)
 
+/**
+ * @warning
+ * @b EXPERIMENTAL: this API may change without prior notice.
+ *
+ * Test if a particular bit in a word is set with a particular memory
+ * order.
+ *
+ * Test a bit with the resulting memory load ordered as per the
+ * specified memory order.
+ *
+ * @param addr
+ *   A pointer to the word to query.
+ * @param nr
+ *   The index of the bit.
+ * @param memory_order
+ *   The memory order to use.
+ * @return
+ *   Returns true if the bit is set, and false otherwise.
+ */
+#define rte_bit_atomic_test(addr, nr, memory_order)                    \
+       _Generic((addr),                                                \
+                uint32_t *: __rte_bit_atomic_test32,                   \
+                const uint32_t *: __rte_bit_atomic_test32,             \
+                uint64_t *: __rte_bit_atomic_test64,                   \
+                const uint64_t *: __rte_bit_atomic_test64)(addr, nr,   \
+                                                           memory_order)
+
+/**
+ * @warning
+ * @b EXPERIMENTAL: this API may change without prior notice.
+ *
+ * Atomically set bit in word.
+ *
+ * Generic selection macro to atomically set bit specified by @c nr in
+ * the word pointed to by @c addr to '1', with the memory ordering as
+ * specified by @c memory_order.
+ *
+ * @param addr
+ *   A pointer to the word to modify.
+ * @param nr
+ *   The index of the bit.
+ * @param memory_order
+ *   The memory order to use.
+ */
+#define rte_bit_atomic_set(addr, nr, memory_order)                     \
+       _Generic((addr),                                                \
+                uint32_t *: __rte_bit_atomic_set32,                    \
+                uint64_t *: __rte_bit_atomic_set64)(addr, nr, memory_order)
+
+/**
+ * @warning
+ * @b EXPERIMENTAL: this API may change without prior notice.
+ *
+ * Atomically clear bit in word.
+ *
+ * Generic selection macro to atomically set bit specified by @c nr in
+ * the word pointed to by @c addr to '0', with the memory ordering as
+ * specified by @c memory_order.
+ *
+ * @param addr
+ *   A pointer to the word to modify.
+ * @param nr
+ *   The index of the bit.
+ * @param memory_order
+ *   The memory order to use.
+ */
+#define rte_bit_atomic_clear(addr, nr, memory_order)                   \
+       _Generic((addr),                                                \
+                uint32_t *: __rte_bit_atomic_clear32,                  \
+                uint64_t *: __rte_bit_atomic_clear64)(addr, nr, memory_order)
+
+/**
+ * @warning
+ * @b EXPERIMENTAL: this API may change without prior notice.
+ *
+ * Atomically assign a value to bit in word.
+ *
+ * Generic selection macro to atomically set bit specified by @c nr in the
+ * word pointed to by @c addr to the value indicated by @c value, with
+ * the memory ordering as specified with @c memory_order.
+ *
+ * @param addr
+ *   A pointer to the word to modify.
+ * @param nr
+ *   The index of the bit.
+ * @param value
+ *   The new value of the bit - true for '1', or false for '0'.
+ * @param memory_order
+ *   The memory order to use.
+ */
+#define rte_bit_atomic_assign(addr, nr, value, memory_order)           \
+       _Generic((addr),                                                \
+                uint32_t *: __rte_bit_atomic_assign32,                 \
+                uint64_t *: __rte_bit_atomic_assign64)(addr, nr, value, \
+                                                       memory_order)
+
+/**
+ * @warning
+ * @b EXPERIMENTAL: this API may change without prior notice.
+ *
+ * Atomically flip bit in word.
+ *
+ * Generic selection macro to atomically negate the value of the bit
+ * specified by @c nr in the word pointed to by @c addr to the value
+ * indicated by @c value, with the memory ordering as specified with
+ * @c memory_order.
+ *
+ * @param addr
+ *   A pointer to the word to modify.
+ * @param nr
+ *   The index of the bit.
+ * @param memory_order
+ *   The memory order to use.
+ */
+#define rte_bit_atomic_flip(addr, nr, memory_order)                    \
+       _Generic((addr),                                                \
+                uint32_t *: __rte_bit_atomic_flip32,                   \
+                uint64_t *: __rte_bit_atomic_flip64)(addr, nr, memory_order)
+
+/**
+ * @warning
+ * @b EXPERIMENTAL: this API may change without prior notice.
+ *
+ * Atomically test and set a bit in word.
+ *
+ * Generic selection macro to atomically test and set bit specified by
+ * @c nr in the word pointed to by @c addr to '1', with the memory
+ * ordering as specified with @c memory_order.
+ *
+ * @param addr
+ *   A pointer to the word to modify.
+ * @param nr
+ *   The index of the bit.
+ * @param memory_order
+ *   The memory order to use.
+ * @return
+ *   Returns true if the bit was set, and false otherwise.
+ */
+#define rte_bit_atomic_test_and_set(addr, nr, memory_order)            \
+       _Generic((addr),                                                \
+                uint32_t *: __rte_bit_atomic_test_and_set32,           \
+                uint64_t *: __rte_bit_atomic_test_and_set64)(addr, nr, \
+                                                             memory_order)
+
+/**
+ * @warning
+ * @b EXPERIMENTAL: this API may change without prior notice.
+ *
+ * Atomically test and clear a bit in word.
+ *
+ * Generic selection macro to atomically test and clear bit specified
+ * by @c nr in the word pointed to by @c addr to '0', with the memory
+ * ordering as specified with @c memory_order.
+ *
+ * @param addr
+ *   A pointer to the word to modify.
+ * @param nr
+ *   The index of the bit.
+ * @param memory_order
+ *   The memory order to use.
+ * @return
+ *   Returns true if the bit was set, and false otherwise.
+ */
+#define rte_bit_atomic_test_and_clear(addr, nr, memory_order)          \
+       _Generic((addr),                                                \
+                uint32_t *: __rte_bit_atomic_test_and_clear32,         \
+                uint64_t *: __rte_bit_atomic_test_and_clear64)(addr, nr, \
+                                                               memory_order)
+
+/**
+ * @warning
+ * @b EXPERIMENTAL: this API may change without prior notice.
+ *
+ * Atomically test and assign a bit in word.
+ *
+ * Generic selection macro to atomically test and assign bit specified
+ * by @c nr in the word pointed to by @c addr the value specified by
+ * @c value, with the memory ordering as specified with @c
+ * memory_order.
+ *
+ * @param addr
+ *   A pointer to the word to modify.
+ * @param nr
+ *   The index of the bit.
+ * @param value
+ *   The new value of the bit - true for '1', or false for '0'.
+ * @param memory_order
+ *   The memory order to use.
+ * @return
+ *   Returns true if the bit was set, and false otherwise.
+ */
+#define rte_bit_atomic_test_and_assign(addr, nr, value, memory_order)  \
+       _Generic((addr),                                                \
+                uint32_t *: __rte_bit_atomic_test_and_assign32,        \
+                uint64_t *: __rte_bit_atomic_test_and_assign64)(addr, nr, \
+                                                                value, \
+                                                                memory_order)
+
 #define __RTE_GEN_BIT_TEST(family, fun, qualifier, size)               \
        __rte_experimental                                              \
        static inline bool                                              \
@@ -298,6 +497,145 @@ __RTE_GEN_BIT_CLEAR(, clear,, 64)
 __RTE_GEN_BIT_ASSIGN(, assign,, 64)
 __RTE_GEN_BIT_FLIP(, flip,, 64)
 
+#define __RTE_GEN_BIT_ATOMIC_TEST(size)                                        
\
+       __rte_experimental                                              \
+       static inline bool                                              \
+       __rte_bit_atomic_test ## size(const uint ## size ## _t *addr,   \
+                                     unsigned int nr, int memory_order) \
+       {                                                               \
+               RTE_ASSERT(nr < size);                                  \
+                                                                       \
+               const RTE_ATOMIC(uint ## size ## _t) *a_addr =          \
+                       (const RTE_ATOMIC(uint ## size ## _t) *)addr;   \
+               uint ## size ## _t mask = (uint ## size ## _t)1 << nr;  \
+               return rte_atomic_load_explicit(a_addr, memory_order) & mask; \
+       }
+
+#define __RTE_GEN_BIT_ATOMIC_SET(size)                                 \
+       __rte_experimental                                              \
+       static inline void                                              \
+       __rte_bit_atomic_set ## size(uint ## size ## _t *addr,          \
+                                    unsigned int nr, int memory_order) \
+       {                                                               \
+               RTE_ASSERT(nr < size);                                  \
+                                                                       \
+               RTE_ATOMIC(uint ## size ## _t) *a_addr =                \
+                       (RTE_ATOMIC(uint ## size ## _t) *)addr;         \
+               uint ## size ## _t mask = (uint ## size ## _t)1 << nr;  \
+               rte_atomic_fetch_or_explicit(a_addr, mask, memory_order); \
+       }
+
+#define __RTE_GEN_BIT_ATOMIC_CLEAR(size)                               \
+       __rte_experimental                                              \
+       static inline void                                              \
+       __rte_bit_atomic_clear ## size(uint ## size ## _t *addr,        \
+                                      unsigned int nr, int memory_order) \
+       {                                                               \
+               RTE_ASSERT(nr < size);                                  \
+                                                                       \
+               RTE_ATOMIC(uint ## size ## _t) *a_addr =                \
+                       (RTE_ATOMIC(uint ## size ## _t) *)addr;         \
+               uint ## size ## _t mask = (uint ## size ## _t)1 << nr;  \
+               rte_atomic_fetch_and_explicit(a_addr, ~mask, memory_order); \
+       }
+
+#define __RTE_GEN_BIT_ATOMIC_FLIP(size)                                        
\
+       __rte_experimental                                              \
+       static inline void                                              \
+       __rte_bit_atomic_flip ## size(uint ## size ## _t *addr,         \
+                                      unsigned int nr, int memory_order) \
+       {                                                               \
+               RTE_ASSERT(nr < size);                                  \
+                                                                       \
+               RTE_ATOMIC(uint ## size ## _t) *a_addr =                \
+                       (RTE_ATOMIC(uint ## size ## _t) *)addr;         \
+               uint ## size ## _t mask = (uint ## size ## _t)1 << nr;  \
+               rte_atomic_fetch_xor_explicit(a_addr, mask, memory_order); \
+       }
+
+#define __RTE_GEN_BIT_ATOMIC_ASSIGN(size)                              \
+       __rte_experimental                                              \
+       static inline void                                              \
+       __rte_bit_atomic_assign ## size(uint ## size ## _t *addr,       \
+                                       unsigned int nr, bool value,    \
+                                       int memory_order)               \
+       {                                                               \
+               if (value)                                              \
+                       __rte_bit_atomic_set ## size(addr, nr, memory_order); \
+               else                                                    \
+                       __rte_bit_atomic_clear ## size(addr, nr,        \
+                                                      memory_order);   \
+       }
+
+#define __RTE_GEN_BIT_ATOMIC_TEST_AND_SET(size)                                
\
+       __rte_experimental                                              \
+       static inline bool                                              \
+       __rte_bit_atomic_test_and_set ## size(uint ## size ## _t *addr, \
+                                             unsigned int nr,          \
+                                             int memory_order)         \
+       {                                                               \
+               RTE_ASSERT(nr < size);                                  \
+                                                                       \
+               RTE_ATOMIC(uint ## size ## _t) *a_addr =                \
+                       (RTE_ATOMIC(uint ## size ## _t) *)addr;         \
+               uint ## size ## _t mask = (uint ## size ## _t)1 << nr;  \
+               uint ## size ## _t prev;                                \
+                                                                       \
+               prev = rte_atomic_fetch_or_explicit(a_addr, mask,       \
+                                                   memory_order);      \
+                                                                       \
+               return prev & mask;                                     \
+       }
+
+#define __RTE_GEN_BIT_ATOMIC_TEST_AND_CLEAR(size)                      \
+       __rte_experimental                                              \
+       static inline bool                                              \
+       __rte_bit_atomic_test_and_clear ## size(uint ## size ## _t *addr, \
+                                               unsigned int nr,        \
+                                               int memory_order)       \
+       {                                                               \
+               RTE_ASSERT(nr < size);                                  \
+                                                                       \
+               RTE_ATOMIC(uint ## size ## _t) *a_addr =                \
+                       (RTE_ATOMIC(uint ## size ## _t) *)addr;         \
+               uint ## size ## _t mask = (uint ## size ## _t)1 << nr;  \
+               uint ## size ## _t prev;                                \
+                                                                       \
+               prev = rte_atomic_fetch_and_explicit(a_addr, ~mask,     \
+                                                    memory_order);     \
+                                                                       \
+               return prev & mask;                                     \
+       }
+
+#define __RTE_GEN_BIT_ATOMIC_TEST_AND_ASSIGN(size)                     \
+       __rte_experimental                                              \
+       static inline bool                                              \
+       __rte_bit_atomic_test_and_assign ## size(uint ## size ## _t *addr, \
+                                                unsigned int nr,       \
+                                                bool value,            \
+                                                int memory_order)      \
+       {                                                               \
+               if (value)                                              \
+                       return __rte_bit_atomic_test_and_set ## size(addr, nr, \
+                                                                    
memory_order); \
+               else                                                    \
+                       return __rte_bit_atomic_test_and_clear ## size(addr, 
nr, \
+                                                                      
memory_order); \
+       }
+
+#define __RTE_GEN_BIT_ATOMIC_OPS(size)                 \
+       __RTE_GEN_BIT_ATOMIC_TEST(size)                 \
+       __RTE_GEN_BIT_ATOMIC_SET(size)                  \
+       __RTE_GEN_BIT_ATOMIC_CLEAR(size)                \
+       __RTE_GEN_BIT_ATOMIC_ASSIGN(size)               \
+       __RTE_GEN_BIT_ATOMIC_TEST_AND_SET(size)         \
+       __RTE_GEN_BIT_ATOMIC_TEST_AND_CLEAR(size)       \
+       __RTE_GEN_BIT_ATOMIC_TEST_AND_ASSIGN(size)      \
+       __RTE_GEN_BIT_ATOMIC_FLIP(size)
+
+__RTE_GEN_BIT_ATOMIC_OPS(32)
+__RTE_GEN_BIT_ATOMIC_OPS(64)
+
 /*------------------------ 32-bit relaxed operations ------------------------*/
 
 /**
@@ -993,6 +1331,15 @@ rte_log2_u64(uint64_t v)
 #undef rte_bit_assign
 #undef rte_bit_flip
 
+#undef rte_bit_atomic_test
+#undef rte_bit_atomic_set
+#undef rte_bit_atomic_clear
+#undef rte_bit_atomic_assign
+#undef rte_bit_atomic_flip
+#undef rte_bit_atomic_test_and_set
+#undef rte_bit_atomic_test_and_clear
+#undef rte_bit_atomic_test_and_assign
+
 #define __RTE_BIT_OVERLOAD_SZ_2(fun, qualifier, size, arg1_type, arg1_name) \
        static inline void                                              \
        rte_bit_ ## fun(qualifier uint ## size ## _t *addr,             \
@@ -1036,12 +1383,79 @@ rte_log2_u64(uint64_t v)
        __RTE_BIT_OVERLOAD_SZ_3(fun, qualifier, 64, arg1_type, arg1_name, \
                                arg2_type, arg2_name)
 
+#define __RTE_BIT_OVERLOAD_SZ_3R(fun, qualifier, size, ret_type, arg1_type, \
+                                arg1_name, arg2_type, arg2_name)       \
+       static inline ret_type                                          \
+       rte_bit_ ## fun(uint ## size ## _t *addr, arg1_type arg1_name,  \
+                       arg2_type arg2_name)                            \
+       {                                                               \
+               return __rte_bit_ ## fun ## size(addr, arg1_name, arg2_name); \
+       }
+
+#define __RTE_BIT_OVERLOAD_3R(fun, qualifier, ret_type, arg1_type, arg1_name, \
+                             arg2_type, arg2_name)                     \
+       __RTE_BIT_OVERLOAD_SZ_3R(fun, qualifier, 32, ret_type, arg1_type, \
+                                arg1_name, arg2_type, arg2_name)       \
+       __RTE_BIT_OVERLOAD_SZ_3R(fun, qualifier, 64, ret_type, arg1_type, \
+                                arg1_name, arg2_type, arg2_name)
+
+#define __RTE_BIT_OVERLOAD_SZ_4(fun, qualifier, size, arg1_type, arg1_name, \
+                               arg2_type, arg2_name, arg3_type, arg3_name) \
+       static inline void                                              \
+       rte_bit_ ## fun(uint ## size ## _t *addr, arg1_type arg1_name,  \
+                       arg2_type arg2_name, arg3_type arg3_name)       \
+       {                                                               \
+               __rte_bit_ ## fun ## size(addr, arg1_name, arg2_name,   \
+                                         arg3_name);                 \
+       }
+
+#define __RTE_BIT_OVERLOAD_4(fun, qualifier, arg1_type, arg1_name, arg2_type, \
+                            arg2_name, arg3_type, arg3_name)           \
+       __RTE_BIT_OVERLOAD_SZ_4(fun, qualifier, 32, arg1_type, arg1_name, \
+                               arg2_type, arg2_name, arg3_type, arg3_name) \
+       __RTE_BIT_OVERLOAD_SZ_4(fun, qualifier, 64, arg1_type, arg1_name, \
+                               arg2_type, arg2_name, arg3_type, arg3_name)
+
+#define __RTE_BIT_OVERLOAD_SZ_4R(fun, qualifier, size, ret_type, arg1_type, \
+                                arg1_name, arg2_type, arg2_name, arg3_type, \
+                                arg3_name)                             \
+       static inline ret_type                                          \
+       rte_bit_ ## fun(uint ## size ## _t *addr, arg1_type arg1_name,  \
+                       arg2_type arg2_name, arg3_type arg3_name)       \
+       {                                                               \
+               return __rte_bit_ ## fun ## size(addr, arg1_name, arg2_name, \
+                                                arg3_name);            \
+       }
+
+#define __RTE_BIT_OVERLOAD_4R(fun, qualifier, ret_type, arg1_type, arg1_name, \
+                             arg2_type, arg2_name, arg3_type, arg3_name) \
+       __RTE_BIT_OVERLOAD_SZ_4R(fun, qualifier, 32, ret_type, arg1_type, \
+                                arg1_name, arg2_type, arg2_name, arg3_type, \
+                                arg3_name)                             \
+       __RTE_BIT_OVERLOAD_SZ_4R(fun, qualifier, 64, ret_type, arg1_type, \
+                                arg1_name, arg2_type, arg2_name, arg3_type, \
+                                arg3_name)
+
 __RTE_BIT_OVERLOAD_2R(test, const, bool, unsigned int, nr)
 __RTE_BIT_OVERLOAD_2(set,, unsigned int, nr)
 __RTE_BIT_OVERLOAD_2(clear,, unsigned int, nr)
 __RTE_BIT_OVERLOAD_3(assign,, unsigned int, nr, bool, value)
 __RTE_BIT_OVERLOAD_2(flip,, unsigned int, nr)
 
+__RTE_BIT_OVERLOAD_3R(atomic_test, const, bool, unsigned int, nr,
+                     int, memory_order)
+__RTE_BIT_OVERLOAD_3(atomic_set,, unsigned int, nr, int, memory_order)
+__RTE_BIT_OVERLOAD_3(atomic_clear,, unsigned int, nr, int, memory_order)
+__RTE_BIT_OVERLOAD_4(atomic_assign,, unsigned int, nr, bool, value,
+                    int, memory_order)
+__RTE_BIT_OVERLOAD_3(atomic_flip,, unsigned int, nr, int, memory_order)
+__RTE_BIT_OVERLOAD_3R(atomic_test_and_set,, bool, unsigned int, nr,
+                     int, memory_order)
+__RTE_BIT_OVERLOAD_3R(atomic_test_and_clear,, bool, unsigned int, nr,
+                     int, memory_order)
+__RTE_BIT_OVERLOAD_4R(atomic_test_and_assign,, bool, unsigned int, nr,
+                     bool, value, int, memory_order)
+
 #endif
 
 #endif /* _RTE_BITOPS_H_ */
-- 
2.34.1

Reply via email to