summaryrefslogtreecommitdiffstats
path: root/src/vppinfra/vector/array_mask.h
blob: 778ed3e638f0c07f07d9fc2608914d7041b98fe0 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
/* SPDX-License-Identifier: Apache-2.0
 * Copyright(c) 2021 Cisco Systems, Inc.
 */

#ifndef included_vector_array_mask_h
#define included_vector_array_mask_h
#include <vppinfra/clib.h>

/** \brief Mask array of 32-bit elemments

    @param src source array of u32 elements
    @param mask use to mask the values of source array
    @param n_elts number of elements in the source array
    @return masked values are return in source array
*/

static_always_inline void
clib_array_mask_u32 (u32 *src, u32 mask, u32 n_elts)
{
  u32 i;
#if defined(CLIB_HAVE_VEC512)
  u32x16 mask16 = u32x16_splat (mask);

  for (i = 0; i + 16 <= n_elts; i += 16)
    *((u32x16u *) (src + i)) &= mask16;
  n_elts -= i;
  if (n_elts)
    {
      u16 m = pow2_mask (n_elts);
      u32x16_mask_store (u32x16_mask_load_zero (src + i, m) & mask16, src + i,
			 m);
    }
  return;
#elif defined(CLIB_HAVE_VEC256)
  u32x8 mask8 = u32x8_splat (mask);

  for (i = 0; i + 8 <= n_elts; i += 8)
    *((u32x8u *) (src + i)) &= mask8;
  n_elts -= i;
  src += i;
#if defined(CLIB_HAVE_VEC256_MASK_LOAD_STORE)
  if (n_elts)
    {
      u8 m = pow2_mask (n_elts);
      u32x8_mask_store (u32x8_mask_load_zero (src, m) & mask8, src, m);
    }
  return;
#endif
#elif defined(CLIB_HAVE_VEC128)
  u32x4 mask4 = u32x4_splat (mask);

  for (i = 0; i + 4 <= n_elts; i += 4)
    *((u32x4u *) (src + i)) &= mask4;
  n_elts -= i;
  src += i;
  switch (n_elts)
    {
    case 3:
      src[2] &= mask;
    case 2:
      src[1] &= mask;
    case 1:
      src[0] &= mask;
    case 0:
    default:;
    }
  return;
#endif
  while (n_elts > 0)
    {
      src[0] &= mask;
      src++;
      n_elts--;
    }
}

#endif