diff options
author | Damjan Marion <damarion@cisco.com> | 2022-01-13 00:28:14 +0100 |
---|---|---|
committer | Florin Coras <florin.coras@gmail.com> | 2022-01-16 18:54:52 +0000 |
commit | 7b90f669d83f432f3610ec0da522bd8ccc4dff01 (patch) | |
tree | f2e47bdf50dfa3c353ddc8ff7916b7d4ef50c9d1 /src/vppinfra | |
parent | 5233d4619cd0a4a154c35e88ccee92c24cacd377 (diff) |
vppinfra: bitops cleanup
Type: refactor
Change-Id: I7fa113e924640f9d798c1eb6ae64b9c0a9e2104c
Signed-off-by: Damjan Marion <damarion@cisco.com>
Diffstat (limited to 'src/vppinfra')
-rw-r--r-- | src/vppinfra/bitmap.h | 1 | ||||
-rw-r--r-- | src/vppinfra/bitops.h | 83 | ||||
-rw-r--r-- | src/vppinfra/clib.h | 71 | ||||
-rw-r--r-- | src/vppinfra/interrupt.c | 1 | ||||
-rw-r--r-- | src/vppinfra/interrupt.h | 1 | ||||
-rw-r--r-- | src/vppinfra/sparse_vec.h | 2 | ||||
-rw-r--r-- | src/vppinfra/unix-formats.c | 1 | ||||
-rw-r--r-- | src/vppinfra/vector/compress.h | 36 |
8 files changed, 54 insertions, 142 deletions
diff --git a/src/vppinfra/bitmap.h b/src/vppinfra/bitmap.h index d9bdd0fac7d..459e6f2b9b4 100644 --- a/src/vppinfra/bitmap.h +++ b/src/vppinfra/bitmap.h @@ -45,7 +45,6 @@ #include <vppinfra/vec.h> #include <vppinfra/random.h> #include <vppinfra/error.h> -#include <vppinfra/bitops.h> /* for count_set_bits */ typedef uword clib_bitmap_t; diff --git a/src/vppinfra/bitops.h b/src/vppinfra/bitops.h index 04365699f93..15454ca5036 100644 --- a/src/vppinfra/bitops.h +++ b/src/vppinfra/bitops.h @@ -38,18 +38,38 @@ #ifndef included_clib_bitops_h #define included_clib_bitops_h -#include <vppinfra/clib.h> +static_always_inline uword +clear_lowest_set_bit (uword x) +{ +#ifdef __BMI__ + return uword_bits > 32 ? _blsr_u64 (x) : _blsr_u32 (x); +#else + return x & (x - 1); +#endif +} + +static_always_inline uword +get_lowest_set_bit (uword x) +{ +#ifdef __BMI__ + return uword_bits > 32 ? _blsi_u64 (x) : _blsi_u32 (x); +#else + return x & -x; +#endif +} + +static_always_inline u8 +get_lowest_set_bit_index (uword x) +{ + return uword_bits > 32 ? __builtin_ctzll (x) : __builtin_ctz (x); +} /* Population count from Hacker's Delight. */ always_inline uword count_set_bits (uword x) { #ifdef __POPCNT__ -#if uword_bits == 64 - return __builtin_popcountll (x); -#else - return __builtin_popcount (x); -#endif + return uword_bits > 32 ? __builtin_popcountll (x) : __builtin_popcount (x); #else #if uword_bits == 64 const uword c1 = 0x5555555555555555; @@ -81,6 +101,15 @@ count_set_bits (uword x) #endif } +#if uword_bits == 64 +#define count_leading_zeros(x) __builtin_clzll (x) +#else +#define count_leading_zeros(x) __builtin_clzll (x) +#endif + +#define count_trailing_zeros(x) get_lowest_set_bit_index (x) +#define log2_first_set(x) get_lowest_set_bit_index (x) + /* Based on "Hacker's Delight" code from GLS. */ typedef struct { @@ -163,45 +192,13 @@ next_with_same_number_of_set_bits (uword x) return ripple | ones; } -#define foreach_set_bit(var,mask,body) \ -do { \ - uword _foreach_set_bit_m_##var = (mask); \ - uword _foreach_set_bit_f_##var; \ - while (_foreach_set_bit_m_##var != 0) \ - { \ - _foreach_set_bit_f_##var = first_set (_foreach_set_bit_m_##var); \ - _foreach_set_bit_m_##var ^= _foreach_set_bit_f_##var; \ - (var) = min_log2 (_foreach_set_bit_f_##var); \ - do { body; } while (0); \ - } \ -} while (0) - -static_always_inline u64 -reset_lowest_set_bit (u64 x) -{ -#ifdef __BMI__ - return _blsr_u64 (x); -#else - return x & (x - 1); -#endif -} +#define foreach_set_bit_index(i, v) \ + for (uword _tmp = (v) + 0 * (uword) (i = get_lowest_set_bit_index (v)); \ + _tmp; \ + i = get_lowest_set_bit_index (_tmp = clear_lowest_set_bit (_tmp))) -static_always_inline u64 -get_lowest_set_bit (u64 x) -{ -#ifdef __BMI__ - return _blsi_u64 (x); #else - return x & -x; -#endif -} - -static_always_inline u64 -get_lowest_set_bit_index (u64 x) -{ - return __builtin_ctzll (x); -} - +#warning "already included" #endif /* included_clib_bitops_h */ /* diff --git a/src/vppinfra/clib.h b/src/vppinfra/clib.h index 1b6ab4157d7..b3a2580e73a 100644 --- a/src/vppinfra/clib.h +++ b/src/vppinfra/clib.h @@ -164,25 +164,7 @@ decl __attribute ((destructor)); \ decl -/* Use __builtin_clz if available. */ -#if uword_bits == 64 -#define count_leading_zeros(x) __builtin_clzll (x) -#define count_trailing_zeros(x) __builtin_ctzll (x) -#else -#define count_leading_zeros(x) __builtin_clzl (x) -#define count_trailing_zeros(x) __builtin_ctzl (x) -#endif - -#if defined (count_leading_zeros) -always_inline uword -clear_lowest_set_bit (uword x) -{ -#ifdef __BMI2__ - return _blsr_u64 (x); -#else - return x ^ (1ULL << count_trailing_zeros (x)); -#endif -} +#include <vppinfra/bitops.h> always_inline uword min_log2 (uword x) @@ -191,45 +173,6 @@ min_log2 (uword x) n = count_leading_zeros (x); return BITS (uword) - n - 1; } -#else -always_inline uword -min_log2 (uword x) -{ - uword a = x, b = BITS (uword) / 2, c = 0, r = 0; - - /* Reduce x to 4 bit result. */ -#define _ \ -{ \ - c = a >> b; \ - if (c) a = c; \ - if (c) r += b; \ - b /= 2; \ -} - - if (BITS (uword) > 32) - _; - _; - _; - _; -#undef _ - - /* Do table lookup on 4 bit partial. */ - if (BITS (uword) > 32) - { - const u64 table = 0x3333333322221104LL; - uword t = (table >> (4 * a)) & 0xf; - r = t < 4 ? r + t : ~0; - } - else - { - const u32 table = 0x22221104; - uword t = (a & 8) ? 3 : ((table >> (4 * a)) & 0xf); - r = t < 4 ? r + t : ~0; - } - - return r; -} -#endif always_inline uword max_log2 (uword x) @@ -308,18 +251,6 @@ first_set (uword x) return x & -x; } -always_inline uword -log2_first_set (uword x) -{ - uword result; -#ifdef count_trailing_zeros - result = count_trailing_zeros (x); -#else - result = min_log2 (first_set (x)); -#endif - return result; -} - always_inline f64 flt_round_down (f64 x) { diff --git a/src/vppinfra/interrupt.c b/src/vppinfra/interrupt.c index 20b7450ceed..df242d932b6 100644 --- a/src/vppinfra/interrupt.c +++ b/src/vppinfra/interrupt.c @@ -15,7 +15,6 @@ */ #include <vppinfra/clib.h> -#include <vppinfra/bitops.h> /* for count_set_bits */ #include <vppinfra/vec.h> #include <vppinfra/interrupt.h> #include <vppinfra/format.h> diff --git a/src/vppinfra/interrupt.h b/src/vppinfra/interrupt.h index 60c01fa0248..393574b076b 100644 --- a/src/vppinfra/interrupt.h +++ b/src/vppinfra/interrupt.h @@ -17,7 +17,6 @@ #define included_clib_interrupt_h #include <vppinfra/clib.h> -#include <vppinfra/bitops.h> /* for count_set_bits */ #include <vppinfra/vec.h> typedef struct diff --git a/src/vppinfra/sparse_vec.h b/src/vppinfra/sparse_vec.h index 54a92ce7a84..fc8b3cf1e8e 100644 --- a/src/vppinfra/sparse_vec.h +++ b/src/vppinfra/sparse_vec.h @@ -38,8 +38,8 @@ #ifndef included_sparse_vec_h #define included_sparse_vec_h +#include <vppinfra/clib.h> #include <vppinfra/vec.h> -#include <vppinfra/bitops.h> /* Sparsely indexed vectors. Basic idea taken from Hacker's delight. Eliot added ranges. */ diff --git a/src/vppinfra/unix-formats.c b/src/vppinfra/unix-formats.c index fd112675fa7..fb3a7286020 100644 --- a/src/vppinfra/unix-formats.c +++ b/src/vppinfra/unix-formats.c @@ -91,7 +91,6 @@ # include <netinet/if_ether.h> #endif /* __KERNEL__ */ -#include <vppinfra/bitops.h> /* foreach_set_bit */ #include <vppinfra/format.h> #include <vppinfra/error.h> diff --git a/src/vppinfra/vector/compress.h b/src/vppinfra/vector/compress.h index adb6503f711..d2ed716ac8e 100644 --- a/src/vppinfra/vector/compress.h +++ b/src/vppinfra/vector/compress.h @@ -27,12 +27,9 @@ clib_compress_u64_x64 (u64 *dst, u64 *src, u64 mask) mask >>= 4; } #else - while (mask) - { - u16 bit = count_trailing_zeros (mask); - mask = clear_lowest_set_bit (mask); - dst++[0] = src[bit]; - } + u32 i; + foreach_set_bit_index (i, mask) + dst++[0] = src[i]; #endif return dst; } @@ -93,12 +90,9 @@ clib_compress_u32_x64 (u32 *dst, u32 *src, u64 mask) mask >>= 8; } #else - while (mask) - { - u16 bit = count_trailing_zeros (mask); - mask = clear_lowest_set_bit (mask); - dst++[0] = src[bit]; - } + u32 i; + foreach_set_bit_index (i, mask) + dst++[0] = src[i]; #endif return dst; } @@ -150,12 +144,9 @@ clib_compress_u16_x64 (u16 *dst, u16 *src, u64 mask) mask >>= 32; } #else - while (mask) - { - u16 bit = count_trailing_zeros (mask); - mask = clear_lowest_set_bit (mask); - dst++[0] = src[bit]; - } + u32 i; + foreach_set_bit_index (i, mask) + dst++[0] = src[i]; #endif return dst; } @@ -203,12 +194,9 @@ clib_compress_u8_x64 (u8 *dst, u8 *src, u64 mask) u8x64_compress_store (sv[0], mask, dst); dst += _popcnt64 (mask); #else - while (mask) - { - u16 bit = count_trailing_zeros (mask); - mask = clear_lowest_set_bit (mask); - dst++[0] = src[bit]; - } + u32 i; + foreach_set_bit_index (i, mask) + dst++[0] = src[i]; #endif return dst; } |