summaryrefslogtreecommitdiffstats
path: root/src/vppinfra/vector/array_mask.h
diff options
context:
space:
mode:
authorMohsin Kazmi <sykazmi@cisco.com>2021-07-15 10:34:36 +0000
committerDamjan Marion <damarion@cisco.com>2021-07-16 11:31:27 +0200
commit0ec7dad7a00852663eb88554561347987f87bb53 (patch)
treec5312a27935c0556fee511b9fa2aea8b936276f8 /src/vppinfra/vector/array_mask.h
parentb31ddb5bb14f6975afe912bc07275a9a8e0aa29f (diff)
vppinfra: add array mask func
Type: feature Signed-off-by: Mohsin Kazmi <sykazmi@cisco.com> Change-Id: I6869221917f30f7e59709e20571b4615bc68dc8c
Diffstat (limited to 'src/vppinfra/vector/array_mask.h')
-rw-r--r--src/vppinfra/vector/array_mask.h75
1 files changed, 75 insertions, 0 deletions
diff --git a/src/vppinfra/vector/array_mask.h b/src/vppinfra/vector/array_mask.h
new file mode 100644
index 00000000000..8f2e1d7d88c
--- /dev/null
+++ b/src/vppinfra/vector/array_mask.h
@@ -0,0 +1,75 @@
+/* SPDX-License-Identifier: Apache-2.0
+ * Copyright(c) 2021 Cisco Systems, Inc.
+ */
+
+#ifndef included_vector_array_mask_h
+#define included_vector_array_mask_h
+#include <vppinfra/clib.h>
+
+/** \brief Mask array of 32-bit elemments
+
+ @param src source array of u32 elements
+ @param mask use to mask the values of source array
+ @param n_elts number of elements in the source array
+ @return masked values are return in source array
+*/
+
+static_always_inline void
+clib_array_mask_u32 (u32 *src, u32 mask, u32 n_elts)
+{
+ u32 i;
+#if defined(CLIB_HAVE_VEC512)
+ u32x16 mask16 = u32x16_splat (mask);
+
+ for (i = 0; i + 16 <= n_elts; i += 16)
+ *((u32x16u *) (src + i)) &= mask16;
+ n_elts -= i;
+ if (n_elts)
+ {
+ u16 m = pow2_mask (n_elts);
+ u32x16_mask_store (u32x16_mask_load_zero (src + i, m) & mask16, src + i,
+ m);
+ }
+ return;
+#elif defined(CLIB_HAVE_VEC256)
+ u32x8 mask8 = u32x8_splat (mask);
+
+ for (i = 0; i + 8 <= n_elts; i += 8)
+ *((u32x8u *) (src + i)) &= mask8;
+ n_elts -= i;
+#if defined(CLIB_HAVE_VEC256_MASK_LOAD_STORE)
+ if (n_elts)
+ {
+ u8 m = pow2_mask (n_elts);
+ u32x8_mask_store (u32x8_mask_load_zero (src + i, m) & mask8, src + i, m);
+ }
+ return;
+#endif
+#elif defined(CLIB_HAVE_VEC128)
+ u32x4 mask4 = u32x4_splat (mask);
+
+ for (i = 0; i + 4 <= n_elts; i += 4)
+ *((u32x4u *) (src + i)) &= mask4;
+ n_elts -= i;
+ switch (n_elts)
+ {
+ case 3:
+ src[2] &= mask;
+ case 2:
+ src[1] &= mask;
+ case 1:
+ src[0] &= mask;
+ case 0:
+ default:;
+ }
+ return;
+#endif
+ while (n_elts > 0)
+ {
+ src[0] &= mask;
+ src++;
+ n_elts--;
+ }
+}
+
+#endif