aboutsummaryrefslogtreecommitdiffstats
path: root/docs/gettingstarted/developers/multiarch/nodefns.rst
blob: a43d40e301f20b9f66005925160dc1528857c17b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
Multi-Architecture Graph Node Cookbook
======================================

In the context of graph node dispatch functions, it's easy enough to
use the vpp multi-architecture support setup. The point of the scheme
is simple: for performance-critical nodes, generate multiple CPU
hardware-dependent versions of the node dispatch functions, and pick
the best one at runtime.

The vpp scheme is simple enough to use, but details matter.

100,000 foot view
-----------------

We compile entire graph node dispatch function implementation files
multiple times. These compilations give rise to multiple versions of
the graph node dispatch functions. Per-node constructor-functions
interrogate CPU hardware, select the node dispatch function variant to
use, and set the vlib_node_registration_t ".function" member to the
address of the selected variant.

Details
-------

Declare the node dispatch function as shown, using the VLIB\_NODE\_FN macro. The
name of the node function **MUST** match the name of the graph node. 

:: 

    VLIB_NODE_FN (ip4_sdp_node) (vlib_main_t * vm, vlib_node_runtime_t * node,
                                 vlib_frame_t * frame)
    {
      if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
        return ip46_sdp_inline (vm, node, frame, 1 /* is_ip4 */ ,
    			    1 /* is_trace */ );
      else
        return ip46_sdp_inline (vm, node, frame, 1 /* is_ip4 */ ,
    			    0 /* is_trace */ );
    }   

We need to generate *precisely one copy* of the
vlib_node_registration_t, error strings, and packet trace decode function.

Simply bracket these items with "#ifndef CLIB_MARCH_VARIANT...#endif":

::

    #ifndef CLIB_MARCH_VARIANT
    static u8 *
    format_sdp_trace (u8 * s, va_list * args)
    {
       <snip>
    }
    #endif

    ...

    #ifndef CLIB_MARCH_VARIANT
    static char *sdp_error_strings[] = {
    #define _(sym,string) string,
      foreach_sdp_error
    #undef _
    };
    #endif

    ...

    #ifndef CLIB_MARCH_VARIANT
    VLIB_REGISTER_NODE (ip4_sdp_node) =
    {
      // DO NOT set the .function structure member.
      // The multiarch selection __attribute__((constructor)) function
      // takes care of it at runtime
      .name = "ip4-sdp",
      .vector_size = sizeof (u32),
      .format_trace = format_sdp_trace,
      .type = VLIB_NODE_TYPE_INTERNAL,

      .n_errors = ARRAY_LEN(sdp_error_strings),
      .error_strings = sdp_error_strings,

      .n_next_nodes = SDP_N_NEXT,

      /* edit / add dispositions here */
      .next_nodes =
      {
        [SDP_NEXT_DROP] = "ip4-drop",
      },
    };
    #endif

To belabor the point: *do not* set the ".function" member! That's the job of the multi-arch
selection \_\_attribute\_\_((constructor)) function

Always inline node dispatch functions
-------------------------------------

It's typical for a graph dispatch function to contain one or more
calls to an inline function. See above. If your node dispatch function
is structured that way, make *ABSOLUTELY CERTAIN* to use the
"always_inline" macro:

::

    always_inline uword
    ip46_sdp_inline (vlib_main_t * vm, vlib_node_runtime_t * node, 
                 vlib_frame_t * frame,
    		 int is_ip4, int is_trace)
    { ... }

Otherwise, the compiler is highly likely NOT to build multiple
versions of the guts of your dispatch function. 

It's fairly easy to spot this mistake in "perf top." If you see, for
example, a bunch of functions with names of the form
"xxx_node_fn_avx2" in the profile, *BUT* your brand-new node function
shows up with a name of the form "xxx_inline.isra.1", it's quite likely
that the inline was declared "static inline" instead of "always_inline".

Modify CMakeLists.txt
---------------------

If the component in question already lists "MULTIARCH_SOURCES", simply
add the indicated .c file to the list.  Otherwise, add as shown
below. Note that the added file "new_multiarch_node.c" should appear in
*both* SOURCES and MULTIARCH_SOURCES:

::

    add_vpp_plugin(myplugin
      SOURCES
      new_multiarch_node.c
      ...  

      MULTIARCH_SOURCES
      new_ multiarch_node.c
      ...
     )
in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sublicense, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * The above copyright notice and this permission notice shall be * included in all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ #include <vlib/vlib.h> #include <vlib/unix/unix.h> #include <sys/types.h> #include <sys/stat.h> #include <fcntl.h> #include <dirent.h> clib_error_t * foreach_directory_file (char *dir_name, clib_error_t * (*f) (void *arg, u8 * path_name, u8 * file_name), void *arg, int scan_dirs) { DIR *d; struct dirent *e; clib_error_t *error = 0; u8 *s, *t; d = opendir (dir_name); if (!d) { if (errno == ENOENT) return 0; return clib_error_return_unix (0, "open `%s'", dir_name); } s = t = 0; while (1) { e = readdir (d); if (!e) break; if (scan_dirs) { if (e->d_type == DT_DIR && (!strcmp (e->d_name, ".") || !strcmp (e->d_name, ".."))) continue; } else { if (e->d_type == DT_DIR) continue; } s = format (s, "%s/%s", dir_name, e->d_name); t = format (t, "%s", e->d_name); error = f (arg, s, t); _vec_len (s) = 0; _vec_len (t) = 0; if (error) break; } vec_free (s); closedir (d); return error; } clib_error_t * vlib_sysfs_write (char *file_name, char *fmt, ...) { u8 *s; int fd; clib_error_t *error = 0; fd = open (file_name, O_WRONLY); if (fd < 0) return clib_error_return_unix (0, "open `%s'", file_name); va_list va; va_start (va, fmt); s = va_format (0, fmt, &va); va_end (va); if (write (fd, s, vec_len (s)) < 0) error = clib_error_return_unix (0, "write `%s'", file_name); vec_free (s); close (fd); return error; } clib_error_t * vlib_sysfs_read (char *file_name, char *fmt, ...) { unformat_input_t input; u8 *s = 0; int fd; ssize_t sz; uword result; fd = open (file_name, O_RDONLY); if (fd < 0) return clib_error_return_unix (0, "open `%s'", file_name); vec_validate (s, 4095); sz = read (fd, s, vec_len (s)); if (sz < 0) { close (fd); vec_free (s); return clib_error_return_unix (0, "read `%s'", file_name); } _vec_len (s) = sz; unformat_init_vector (&input, s); va_list va; va_start (va, fmt); result = va_unformat (&input, fmt, &va); va_end (va); vec_free (s); close (fd); if (result == 0) return clib_error_return (0, "unformat error"); return 0; } u8 * vlib_sysfs_link_to_name (char *link) { char *p, buffer[64]; unformat_input_t in; u8 *s = 0; int r; r = readlink (link, buffer, sizeof (buffer) - 1); if (r < 0) return 0; buffer[r] = 0; p = strrchr (buffer, '/'); if (!p) return 0; unformat_init_string (&in, p + 1, strlen (p + 1)); if (unformat (&in, "%s", &s) != 1) clib_unix_warning ("no string?"); unformat_free (&in); return s; } int vlib_sysfs_get_free_hugepages (unsigned int numa_node, int page_size) { struct stat sb; u8 *p = 0; int r = -1; p = format (p, "/sys/devices/system/node/node%u%c", numa_node, 0); if (stat ((char *) p, &sb) == 0) { if (S_ISDIR (sb.st_mode) == 0) goto done; } else if (numa_node == 0) { vec_reset_length (p); p = format (p, "/sys/kernel/mm%c", 0); if (stat ((char *) p, &sb) < 0 || S_ISDIR (sb.st_mode) == 0) goto done; } else goto done; _vec_len (p) -= 1; p = format (p, "/hugepages/hugepages-%ukB/free_hugepages%c", page_size, 0); vlib_sysfs_read ((char *) p, "%d", &r); done: vec_free (p); return r; } clib_error_t * vlib_unix_recursive_mkdir (char *path) { clib_error_t *error = 0; char *c = 0; int i = 0; while (path[i] != 0) { if (c && path[i] == '/') { vec_add1 (c, 0); if ((mkdir (c, 0755)) && (errno != EEXIST)) { error = clib_error_return_unix (0, "mkdir '%s'", c); goto done; } _vec_len (c)--; } vec_add1 (c, path[i]); i++; } if ((mkdir (path, 0755)) && (errno != EEXIST)) { error = clib_error_return_unix (0, "mkdir '%s'", path); goto done; } done: vec_free (c); return error; } clib_error_t * vlib_unix_validate_runtime_file (unix_main_t * um, const char *path, u8 ** full_path) { u8 *fp = 0; char *last_slash = 0; if (path[0] == '\0') { return clib_error_return (0, "path is an empty string"); } else if (strncmp (path, "../", 3) == 0 || strstr (path, "/../")) { return clib_error_return (0, "'..' not allowed in runtime path"); } else if (path[0] == '/') { /* Absolute path. Has to start with runtime directory */ if (strncmp ((char *) um->runtime_dir, path, strlen ((char *) um->runtime_dir))) { return clib_error_return (0, "file %s is not in runtime directory %s", path, um->runtime_dir); } fp = format (0, "%s%c", path, '\0'); } else { /* Relative path, just append to runtime */ fp = format (0, "%s/%s%c", um->runtime_dir, path, '\0'); } /* We don't want to create a directory out of the last file */ if ((last_slash = strrchr ((char *) fp, '/')) != NULL) *last_slash = '\0'; clib_error_t *error = vlib_unix_recursive_mkdir ((char *) fp); if (last_slash != NULL) *last_slash = '/'; if (error) vec_free (fp); *full_path = fp; return error; } /* * fd.io coding-style-patch-verification: ON * * Local Variables: * eval: (c-set-style "gnu") * End: */