diff options
author | Mohsin Kazmi <sykazmi@cisco.com> | 2021-07-15 10:34:36 +0000 |
---|---|---|
committer | Damjan Marion <damarion@cisco.com> | 2021-07-16 11:31:27 +0200 |
commit | 0ec7dad7a00852663eb88554561347987f87bb53 (patch) | |
tree | c5312a27935c0556fee511b9fa2aea8b936276f8 /src/vppinfra/vector/array_mask.h | |
parent | b31ddb5bb14f6975afe912bc07275a9a8e0aa29f (diff) |
vppinfra: add array mask func
Type: feature
Signed-off-by: Mohsin Kazmi <sykazmi@cisco.com>
Change-Id: I6869221917f30f7e59709e20571b4615bc68dc8c
Diffstat (limited to 'src/vppinfra/vector/array_mask.h')
-rw-r--r-- | src/vppinfra/vector/array_mask.h | 75 |
1 files changed, 75 insertions, 0 deletions
diff --git a/src/vppinfra/vector/array_mask.h b/src/vppinfra/vector/array_mask.h new file mode 100644 index 00000000000..8f2e1d7d88c --- /dev/null +++ b/src/vppinfra/vector/array_mask.h @@ -0,0 +1,75 @@ +/* SPDX-License-Identifier: Apache-2.0 + * Copyright(c) 2021 Cisco Systems, Inc. + */ + +#ifndef included_vector_array_mask_h +#define included_vector_array_mask_h +#include <vppinfra/clib.h> + +/** \brief Mask array of 32-bit elemments + + @param src source array of u32 elements + @param mask use to mask the values of source array + @param n_elts number of elements in the source array + @return masked values are return in source array +*/ + +static_always_inline void +clib_array_mask_u32 (u32 *src, u32 mask, u32 n_elts) +{ + u32 i; +#if defined(CLIB_HAVE_VEC512) + u32x16 mask16 = u32x16_splat (mask); + + for (i = 0; i + 16 <= n_elts; i += 16) + *((u32x16u *) (src + i)) &= mask16; + n_elts -= i; + if (n_elts) + { + u16 m = pow2_mask (n_elts); + u32x16_mask_store (u32x16_mask_load_zero (src + i, m) & mask16, src + i, + m); + } + return; +#elif defined(CLIB_HAVE_VEC256) + u32x8 mask8 = u32x8_splat (mask); + + for (i = 0; i + 8 <= n_elts; i += 8) + *((u32x8u *) (src + i)) &= mask8; + n_elts -= i; +#if defined(CLIB_HAVE_VEC256_MASK_LOAD_STORE) + if (n_elts) + { + u8 m = pow2_mask (n_elts); + u32x8_mask_store (u32x8_mask_load_zero (src + i, m) & mask8, src + i, m); + } + return; +#endif +#elif defined(CLIB_HAVE_VEC128) + u32x4 mask4 = u32x4_splat (mask); + + for (i = 0; i + 4 <= n_elts; i += 4) + *((u32x4u *) (src + i)) &= mask4; + n_elts -= i; + switch (n_elts) + { + case 3: + src[2] &= mask; + case 2: + src[1] &= mask; + case 1: + src[0] &= mask; + case 0: + default:; + } + return; +#endif + while (n_elts > 0) + { + src[0] &= mask; + src++; + n_elts--; + } +} + +#endif |