diff options
Diffstat (limited to 'src/vnet')
-rw-r--r-- | src/vnet/CMakeLists.txt | 24 | ||||
-rw-r--r-- | src/vnet/vxlan/FEATURE.yaml | 14 | ||||
-rw-r--r-- | src/vnet/vxlan/decap.c | 1330 | ||||
-rw-r--r-- | src/vnet/vxlan/dir.dox | 24 | ||||
-rw-r--r-- | src/vnet/vxlan/encap.c | 540 | ||||
-rw-r--r-- | src/vnet/vxlan/vxlan.api | 198 | ||||
-rw-r--r-- | src/vnet/vxlan/vxlan.c | 1349 | ||||
-rw-r--r-- | src/vnet/vxlan/vxlan.h | 242 | ||||
-rw-r--r-- | src/vnet/vxlan/vxlan_api.c | 376 | ||||
-rw-r--r-- | src/vnet/vxlan/vxlan_error.def | 17 | ||||
-rw-r--r-- | src/vnet/vxlan/vxlan_packet.h | 80 |
11 files changed, 0 insertions, 4194 deletions
diff --git a/src/vnet/CMakeLists.txt b/src/vnet/CMakeLists.txt index 963e000807c..c1c9acc41a0 100644 --- a/src/vnet/CMakeLists.txt +++ b/src/vnet/CMakeLists.txt @@ -297,30 +297,6 @@ list(APPEND VNET_HEADERS ) ############################################################################## -# Layer 2 / vxlan -############################################################################## -list(APPEND VNET_SOURCES - vxlan/vxlan.c - vxlan/encap.c - vxlan/decap.c - vxlan/vxlan_api.c -) - -list(APPEND VNET_MULTIARCH_SOURCES - vxlan/encap.c -) - -list(APPEND VNET_HEADERS - vxlan/vxlan.h - vxlan/vxlan_packet.h - vxlan/vxlan_error.def -) - -list(APPEND VNET_MULTIARCH_SOURCES vxlan/decap.c) - -list(APPEND VNET_API_FILES vxlan/vxlan.api) - -############################################################################## # Layer 2 / Bonding ############################################################################## list(APPEND VNET_SOURCES diff --git a/src/vnet/vxlan/FEATURE.yaml b/src/vnet/vxlan/FEATURE.yaml deleted file mode 100644 index dc7d21b010e..00000000000 --- a/src/vnet/vxlan/FEATURE.yaml +++ /dev/null @@ -1,14 +0,0 @@ ---- -name: Virtual eXtensible LAN -maintainer: John Lo <loj@cisco.com> -features: - - VXLAN tunnel for support of L2 overlay/virtual networks (RFC-7348) - - Support either IPv4 or IPv6 underlay network VTEPs - - Flooding via headend replication if all VXLAN tunnels in BD are unicast ones - - Multicast VXLAN tunnel can be added to BD to flood via IP multicast - - VXLAN encap with flow-hashed source port for better underlay IP load balance - - VXLAN decap optimization via vxlan-bypass IP feature on underlay interfaces - - VXLAN decap HW offload using flow director with DPDK on Intel Fortville NICs -description: "Virtual eXtensible LAN (VXLAN) tunnels support L2 overlay networks that span L3 networks" -state: production -properties: [API, CLI, MULTITHREAD] diff --git a/src/vnet/vxlan/decap.c b/src/vnet/vxlan/decap.c deleted file mode 100644 index 729293fb3e5..00000000000 --- a/src/vnet/vxlan/decap.c +++ /dev/null @@ -1,1330 +0,0 @@ -/* - * decap.c: vxlan tunnel decap packet processing - * - * Copyright (c) 2013 Cisco and/or its affiliates. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -#include <vlib/vlib.h> -#include <vnet/vxlan/vxlan.h> -#include <vnet/udp/udp_local.h> - -#ifndef CLIB_MARCH_VARIANT -vlib_node_registration_t vxlan4_input_node; -vlib_node_registration_t vxlan6_input_node; -#endif - -typedef struct -{ - u32 next_index; - u32 tunnel_index; - u32 error; - u32 vni; -} vxlan_rx_trace_t; - -static u8 * -format_vxlan_rx_trace (u8 * s, va_list * args) -{ - CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *); - CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *); - vxlan_rx_trace_t *t = va_arg (*args, vxlan_rx_trace_t *); - - if (t->tunnel_index == ~0) - return format (s, "VXLAN decap error - tunnel for vni %d does not exist", - t->vni); - return format (s, "VXLAN decap from vxlan_tunnel%d vni %d next %d error %d", - t->tunnel_index, t->vni, t->next_index, t->error); -} - -typedef vxlan4_tunnel_key_t last_tunnel_cache4; - -static const vxlan_decap_info_t decap_not_found = { - .sw_if_index = ~0, - .next_index = VXLAN_INPUT_NEXT_DROP, - .error = VXLAN_ERROR_NO_SUCH_TUNNEL -}; - -static const vxlan_decap_info_t decap_bad_flags = { - .sw_if_index = ~0, - .next_index = VXLAN_INPUT_NEXT_DROP, - .error = VXLAN_ERROR_BAD_FLAGS -}; - -always_inline vxlan_decap_info_t -vxlan4_find_tunnel (vxlan_main_t * vxm, last_tunnel_cache4 * cache, - u32 fib_index, ip4_header_t * ip4_0, - vxlan_header_t * vxlan0, u32 * stats_sw_if_index) -{ - if (PREDICT_FALSE (vxlan0->flags != VXLAN_FLAGS_I)) - return decap_bad_flags; - - /* Make sure VXLAN tunnel exist according to packet S/D IP, UDP port, VRF, - * and VNI */ - u32 dst = ip4_0->dst_address.as_u32; - u32 src = ip4_0->src_address.as_u32; - udp_header_t *udp = ip4_next_header (ip4_0); - vxlan4_tunnel_key_t key4 = { - .key[0] = ((u64) dst << 32) | src, - .key[1] = ((u64) udp->dst_port << 48) | ((u64) fib_index << 32) | - vxlan0->vni_reserved, - }; - - if (PREDICT_TRUE - (key4.key[0] == cache->key[0] && key4.key[1] == cache->key[1])) - { - /* cache hit */ - vxlan_decap_info_t di = {.as_u64 = cache->value }; - *stats_sw_if_index = di.sw_if_index; - return di; - } - - int rv = clib_bihash_search_inline_16_8 (&vxm->vxlan4_tunnel_by_key, &key4); - if (PREDICT_TRUE (rv == 0)) - { - *cache = key4; - vxlan_decap_info_t di = {.as_u64 = key4.value }; - *stats_sw_if_index = di.sw_if_index; - return di; - } - - /* try multicast */ - if (PREDICT_TRUE (!ip4_address_is_multicast (&ip4_0->dst_address))) - return decap_not_found; - - /* search for mcast decap info by mcast address */ - key4.key[0] = dst; - rv = clib_bihash_search_inline_16_8 (&vxm->vxlan4_tunnel_by_key, &key4); - if (rv != 0) - return decap_not_found; - - /* search for unicast tunnel using the mcast tunnel local(src) ip */ - vxlan_decap_info_t mdi = {.as_u64 = key4.value }; - key4.key[0] = ((u64) mdi.local_ip.as_u32 << 32) | src; - rv = clib_bihash_search_inline_16_8 (&vxm->vxlan4_tunnel_by_key, &key4); - if (PREDICT_FALSE (rv != 0)) - return decap_not_found; - - /* mcast traffic does not update the cache */ - *stats_sw_if_index = mdi.sw_if_index; - vxlan_decap_info_t di = {.as_u64 = key4.value }; - return di; -} - -typedef vxlan6_tunnel_key_t last_tunnel_cache6; - -always_inline vxlan_decap_info_t -vxlan6_find_tunnel (vxlan_main_t * vxm, last_tunnel_cache6 * cache, - u32 fib_index, ip6_header_t * ip6_0, - vxlan_header_t * vxlan0, u32 * stats_sw_if_index) -{ - if (PREDICT_FALSE (vxlan0->flags != VXLAN_FLAGS_I)) - return decap_bad_flags; - - /* Make sure VXLAN tunnel exist according to packet SIP, UDP port, VRF, and - * VNI */ - udp_header_t *udp = ip6_next_header (ip6_0); - vxlan6_tunnel_key_t key6 = { - .key[0] = ip6_0->src_address.as_u64[0], - .key[1] = ip6_0->src_address.as_u64[1], - .key[2] = ((u64) udp->dst_port << 48) | ((u64) fib_index << 32) | - vxlan0->vni_reserved, - }; - - if (PREDICT_FALSE - (clib_bihash_key_compare_24_8 (key6.key, cache->key) == 0)) - { - int rv = - clib_bihash_search_inline_24_8 (&vxm->vxlan6_tunnel_by_key, &key6); - if (PREDICT_FALSE (rv != 0)) - return decap_not_found; - - *cache = key6; - } - vxlan_tunnel_t *t0 = pool_elt_at_index (vxm->tunnels, cache->value); - - /* Validate VXLAN tunnel SIP against packet DIP */ - if (PREDICT_TRUE (ip6_address_is_equal (&ip6_0->dst_address, &t0->src.ip6))) - *stats_sw_if_index = t0->sw_if_index; - else - { - /* try multicast */ - if (PREDICT_TRUE (!ip6_address_is_multicast (&ip6_0->dst_address))) - return decap_not_found; - - /* Make sure mcast VXLAN tunnel exist by packet DIP and VNI */ - key6.key[0] = ip6_0->dst_address.as_u64[0]; - key6.key[1] = ip6_0->dst_address.as_u64[1]; - int rv = - clib_bihash_search_inline_24_8 (&vxm->vxlan6_tunnel_by_key, &key6); - if (PREDICT_FALSE (rv != 0)) - return decap_not_found; - - vxlan_tunnel_t *mcast_t0 = pool_elt_at_index (vxm->tunnels, key6.value); - *stats_sw_if_index = mcast_t0->sw_if_index; - } - - vxlan_decap_info_t di = { - .sw_if_index = t0->sw_if_index, - .next_index = t0->decap_next_index, - }; - return di; -} - -always_inline uword -vxlan_input (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * from_frame, u32 is_ip4) -{ - vxlan_main_t *vxm = &vxlan_main; - vnet_main_t *vnm = vxm->vnet_main; - vnet_interface_main_t *im = &vnm->interface_main; - vlib_combined_counter_main_t *rx_counter = - im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX; - last_tunnel_cache4 last4; - last_tunnel_cache6 last6; - u32 pkts_dropped = 0; - u32 thread_index = vlib_get_thread_index (); - - if (is_ip4) - clib_memset (&last4, 0xff, sizeof last4); - else - clib_memset (&last6, 0xff, sizeof last6); - - u32 *from = vlib_frame_vector_args (from_frame); - u32 n_left_from = from_frame->n_vectors; - - vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b = bufs; - vlib_get_buffers (vm, from, bufs, n_left_from); - - u32 stats_if0 = ~0, stats_if1 = ~0; - u16 nexts[VLIB_FRAME_SIZE], *next = nexts; - while (n_left_from >= 4) - { - /* Prefetch next iteration. */ - vlib_prefetch_buffer_header (b[2], LOAD); - vlib_prefetch_buffer_header (b[3], LOAD); - - /* udp leaves current_data pointing at the vxlan header */ - void *cur0 = vlib_buffer_get_current (b[0]); - void *cur1 = vlib_buffer_get_current (b[1]); - vxlan_header_t *vxlan0 = cur0; - vxlan_header_t *vxlan1 = cur1; - - - ip4_header_t *ip4_0, *ip4_1; - ip6_header_t *ip6_0, *ip6_1; - if (is_ip4) - { - ip4_0 = cur0 - sizeof (udp_header_t) - sizeof (ip4_header_t); - ip4_1 = cur1 - sizeof (udp_header_t) - sizeof (ip4_header_t); - } - else - { - ip6_0 = cur0 - sizeof (udp_header_t) - sizeof (ip6_header_t); - ip6_1 = cur1 - sizeof (udp_header_t) - sizeof (ip6_header_t); - } - - /* pop vxlan */ - vlib_buffer_advance (b[0], sizeof *vxlan0); - vlib_buffer_advance (b[1], sizeof *vxlan1); - - u32 fi0 = vlib_buffer_get_ip_fib_index (b[0], is_ip4); - u32 fi1 = vlib_buffer_get_ip_fib_index (b[1], is_ip4); - - vxlan_decap_info_t di0 = is_ip4 ? - vxlan4_find_tunnel (vxm, &last4, fi0, ip4_0, vxlan0, &stats_if0) : - vxlan6_find_tunnel (vxm, &last6, fi0, ip6_0, vxlan0, &stats_if0); - vxlan_decap_info_t di1 = is_ip4 ? - vxlan4_find_tunnel (vxm, &last4, fi1, ip4_1, vxlan1, &stats_if1) : - vxlan6_find_tunnel (vxm, &last6, fi1, ip6_1, vxlan1, &stats_if1); - - /* Prefetch next iteration. */ - clib_prefetch_load (b[2]->data); - clib_prefetch_load (b[3]->data); - - u32 len0 = vlib_buffer_length_in_chain (vm, b[0]); - u32 len1 = vlib_buffer_length_in_chain (vm, b[1]); - - next[0] = di0.next_index; - next[1] = di1.next_index; - - u8 any_error = di0.error | di1.error; - if (PREDICT_TRUE (any_error == 0)) - { - /* Required to make the l2 tag push / pop code work on l2 subifs */ - vnet_update_l2_len (b[0]); - vnet_update_l2_len (b[1]); - /* Set packet input sw_if_index to unicast VXLAN tunnel for learning */ - vnet_buffer (b[0])->sw_if_index[VLIB_RX] = di0.sw_if_index; - vnet_buffer (b[1])->sw_if_index[VLIB_RX] = di1.sw_if_index; - vlib_increment_combined_counter (rx_counter, thread_index, - stats_if0, 1, len0); - vlib_increment_combined_counter (rx_counter, thread_index, - stats_if1, 1, len1); - } - else - { - if (di0.error == 0) - { - vnet_update_l2_len (b[0]); - vnet_buffer (b[0])->sw_if_index[VLIB_RX] = di0.sw_if_index; - vlib_increment_combined_counter (rx_counter, thread_index, - stats_if0, 1, len0); - } - else - { - b[0]->error = node->errors[di0.error]; - pkts_dropped++; - } - - if (di1.error == 0) - { - vnet_update_l2_len (b[1]); - vnet_buffer (b[1])->sw_if_index[VLIB_RX] = di1.sw_if_index; - vlib_increment_combined_counter (rx_counter, thread_index, - stats_if1, 1, len1); - } - else - { - b[1]->error = node->errors[di1.error]; - pkts_dropped++; - } - } - - if (PREDICT_FALSE (b[0]->flags & VLIB_BUFFER_IS_TRACED)) - { - vxlan_rx_trace_t *tr = - vlib_add_trace (vm, node, b[0], sizeof (*tr)); - tr->next_index = next[0]; - tr->error = di0.error; - tr->tunnel_index = di0.sw_if_index == ~0 ? - ~0 : vxm->tunnel_index_by_sw_if_index[di0.sw_if_index]; - tr->vni = vnet_get_vni (vxlan0); - } - if (PREDICT_FALSE (b[1]->flags & VLIB_BUFFER_IS_TRACED)) - { - vxlan_rx_trace_t *tr = - vlib_add_trace (vm, node, b[1], sizeof (*tr)); - tr->next_index = next[1]; - tr->error = di1.error; - tr->tunnel_index = di1.sw_if_index == ~0 ? - ~0 : vxm->tunnel_index_by_sw_if_index[di1.sw_if_index]; - tr->vni = vnet_get_vni (vxlan1); - } - b += 2; - next += 2; - n_left_from -= 2; - } - - while (n_left_from > 0) - { - /* udp leaves current_data pointing at the vxlan header */ - void *cur0 = vlib_buffer_get_current (b[0]); - vxlan_header_t *vxlan0 = cur0; - ip4_header_t *ip4_0; - ip6_header_t *ip6_0; - if (is_ip4) - ip4_0 = cur0 - sizeof (udp_header_t) - sizeof (ip4_header_t); - else - ip6_0 = cur0 - sizeof (udp_header_t) - sizeof (ip6_header_t); - - /* pop (ip, udp, vxlan) */ - vlib_buffer_advance (b[0], sizeof (*vxlan0)); - - u32 fi0 = vlib_buffer_get_ip_fib_index (b[0], is_ip4); - - vxlan_decap_info_t di0 = is_ip4 ? - vxlan4_find_tunnel (vxm, &last4, fi0, ip4_0, vxlan0, &stats_if0) : - vxlan6_find_tunnel (vxm, &last6, fi0, ip6_0, vxlan0, &stats_if0); - - uword len0 = vlib_buffer_length_in_chain (vm, b[0]); - - next[0] = di0.next_index; - - /* Validate VXLAN tunnel encap-fib index against packet */ - if (di0.error == 0) - { - /* Required to make the l2 tag push / pop code work on l2 subifs */ - vnet_update_l2_len (b[0]); - - /* Set packet input sw_if_index to unicast VXLAN tunnel for learning */ - vnet_buffer (b[0])->sw_if_index[VLIB_RX] = di0.sw_if_index; - - vlib_increment_combined_counter (rx_counter, thread_index, - stats_if0, 1, len0); - } - else - { - b[0]->error = node->errors[di0.error]; - pkts_dropped++; - } - - if (PREDICT_FALSE (b[0]->flags & VLIB_BUFFER_IS_TRACED)) - { - vxlan_rx_trace_t *tr - = vlib_add_trace (vm, node, b[0], sizeof (*tr)); - tr->next_index = next[0]; - tr->error = di0.error; - tr->tunnel_index = di0.sw_if_index == ~0 ? - ~0 : vxm->tunnel_index_by_sw_if_index[di0.sw_if_index]; - tr->vni = vnet_get_vni (vxlan0); - } - b += 1; - next += 1; - n_left_from -= 1; - } - vlib_buffer_enqueue_to_next (vm, node, from, nexts, from_frame->n_vectors); - /* Do we still need this now that tunnel tx stats is kept? */ - u32 node_idx = is_ip4 ? vxlan4_input_node.index : vxlan6_input_node.index; - vlib_node_increment_counter (vm, node_idx, VXLAN_ERROR_DECAPSULATED, - from_frame->n_vectors - pkts_dropped); - - return from_frame->n_vectors; -} - -VLIB_NODE_FN (vxlan4_input_node) (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * from_frame) -{ - return vxlan_input (vm, node, from_frame, /* is_ip4 */ 1); -} - -VLIB_NODE_FN (vxlan6_input_node) (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * from_frame) -{ - return vxlan_input (vm, node, from_frame, /* is_ip4 */ 0); -} - -static char *vxlan_error_strings[] = { -#define vxlan_error(n,s) s, -#include <vnet/vxlan/vxlan_error.def> -#undef vxlan_error -}; - -/* *INDENT-OFF* */ -VLIB_REGISTER_NODE (vxlan4_input_node) = -{ - .name = "vxlan4-input", - .vector_size = sizeof (u32), - .n_errors = VXLAN_N_ERROR, - .error_strings = vxlan_error_strings, - .n_next_nodes = VXLAN_INPUT_N_NEXT, - .format_trace = format_vxlan_rx_trace, - .next_nodes = { -#define _(s,n) [VXLAN_INPUT_NEXT_##s] = n, - foreach_vxlan_input_next -#undef _ - }, -}; - -VLIB_REGISTER_NODE (vxlan6_input_node) = -{ - .name = "vxlan6-input", - .vector_size = sizeof (u32), - .n_errors = VXLAN_N_ERROR, - .error_strings = vxlan_error_strings, - .n_next_nodes = VXLAN_INPUT_N_NEXT, - .next_nodes = { -#define _(s,n) [VXLAN_INPUT_NEXT_##s] = n, - foreach_vxlan_input_next -#undef _ - }, - .format_trace = format_vxlan_rx_trace, -}; -/* *INDENT-ON* */ - -typedef enum -{ - IP_VXLAN_BYPASS_NEXT_DROP, - IP_VXLAN_BYPASS_NEXT_VXLAN, - IP_VXLAN_BYPASS_N_NEXT, -} ip_vxlan_bypass_next_t; - -always_inline uword -ip_vxlan_bypass_inline (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * frame, u32 is_ip4) -{ - vxlan_main_t *vxm = &vxlan_main; - u32 *from, *to_next, n_left_from, n_left_to_next, next_index; - vlib_node_runtime_t *error_node = - vlib_node_get_runtime (vm, ip4_input_node.index); - vtep4_key_t last_vtep4; /* last IPv4 address / fib index - matching a local VTEP address */ - vtep6_key_t last_vtep6; /* last IPv6 address / fib index - matching a local VTEP address */ - vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b = bufs; - - last_tunnel_cache4 last4; - last_tunnel_cache6 last6; - - from = vlib_frame_vector_args (frame); - n_left_from = frame->n_vectors; - next_index = node->cached_next_index; - - vlib_get_buffers (vm, from, bufs, n_left_from); - - if (node->flags & VLIB_NODE_FLAG_TRACE) - ip4_forward_next_trace (vm, node, frame, VLIB_TX); - - if (is_ip4) - { - vtep4_key_init (&last_vtep4); - clib_memset (&last4, 0xff, sizeof last4); - } - else - { - vtep6_key_init (&last_vtep6); - clib_memset (&last6, 0xff, sizeof last6); - } - - while (n_left_from > 0) - { - vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next); - - while (n_left_from >= 4 && n_left_to_next >= 2) - { - vlib_buffer_t *b0, *b1; - ip4_header_t *ip40, *ip41; - ip6_header_t *ip60, *ip61; - udp_header_t *udp0, *udp1; - vxlan_header_t *vxlan0, *vxlan1; - u32 bi0, ip_len0, udp_len0, flags0, next0; - u32 bi1, ip_len1, udp_len1, flags1, next1; - i32 len_diff0, len_diff1; - u8 error0, good_udp0, proto0; - u8 error1, good_udp1, proto1; - u32 stats_if0 = ~0, stats_if1 = ~0; - - /* Prefetch next iteration. */ - { - vlib_prefetch_buffer_header (b[2], LOAD); - vlib_prefetch_buffer_header (b[3], LOAD); - - CLIB_PREFETCH (b[2]->data, 2 * CLIB_CACHE_LINE_BYTES, LOAD); - CLIB_PREFETCH (b[3]->data, 2 * CLIB_CACHE_LINE_BYTES, LOAD); - } - - bi0 = to_next[0] = from[0]; - bi1 = to_next[1] = from[1]; - from += 2; - n_left_from -= 2; - to_next += 2; - n_left_to_next -= 2; - - b0 = b[0]; - b1 = b[1]; - b += 2; - if (is_ip4) - { - ip40 = vlib_buffer_get_current (b0); - ip41 = vlib_buffer_get_current (b1); - } - else - { - ip60 = vlib_buffer_get_current (b0); - ip61 = vlib_buffer_get_current (b1); - } - - /* Setup packet for next IP feature */ - vnet_feature_next (&next0, b0); - vnet_feature_next (&next1, b1); - - if (is_ip4) - { - /* Treat IP frag packets as "experimental" protocol for now - until support of IP frag reassembly is implemented */ - proto0 = ip4_is_fragment (ip40) ? 0xfe : ip40->protocol; - proto1 = ip4_is_fragment (ip41) ? 0xfe : ip41->protocol; - } - else - { - proto0 = ip60->protocol; - proto1 = ip61->protocol; - } - - /* Process packet 0 */ - if (proto0 != IP_PROTOCOL_UDP) - goto exit0; /* not UDP packet */ - - if (is_ip4) - udp0 = ip4_next_header (ip40); - else - udp0 = ip6_next_header (ip60); - - u32 fi0 = vlib_buffer_get_ip_fib_index (b0, is_ip4); - vxlan0 = vlib_buffer_get_current (b0) + sizeof (udp_header_t) + - sizeof (ip4_header_t); - - vxlan_decap_info_t di0 = - is_ip4 ? - vxlan4_find_tunnel (vxm, &last4, fi0, ip40, vxlan0, &stats_if0) : - vxlan6_find_tunnel (vxm, &last6, fi0, ip60, vxlan0, &stats_if0); - - if (PREDICT_FALSE (di0.sw_if_index == ~0)) - goto exit0; /* unknown interface */ - - /* Validate DIP against VTEPs */ - if (is_ip4) - { -#ifdef CLIB_HAVE_VEC512 - if (!vtep4_check_vector (&vxm->vtep_table, b0, ip40, &last_vtep4, - &vxm->vtep4_u512)) -#else - if (!vtep4_check (&vxm->vtep_table, b0, ip40, &last_vtep4)) -#endif - goto exit0; /* no local VTEP for VXLAN packet */ - } - else - { - if (!vtep6_check (&vxm->vtep_table, b0, ip60, &last_vtep6)) - goto exit0; /* no local VTEP for VXLAN packet */ - } - - flags0 = b0->flags; - good_udp0 = (flags0 & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0; - - /* Don't verify UDP checksum for packets with explicit zero checksum. */ - good_udp0 |= udp0->checksum == 0; - - /* Verify UDP length */ - if (is_ip4) - ip_len0 = clib_net_to_host_u16 (ip40->length); - else - ip_len0 = clib_net_to_host_u16 (ip60->payload_length); - udp_len0 = clib_net_to_host_u16 (udp0->length); - len_diff0 = ip_len0 - udp_len0; - - /* Verify UDP checksum */ - if (PREDICT_FALSE (!good_udp0)) - { - if (is_ip4) - flags0 = ip4_tcp_udp_validate_checksum (vm, b0); - else - flags0 = ip6_tcp_udp_icmp_validate_checksum (vm, b0); - good_udp0 = (flags0 & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0; - } - - if (is_ip4) - { - error0 = good_udp0 ? 0 : IP4_ERROR_UDP_CHECKSUM; - error0 = (len_diff0 >= 0) ? error0 : IP4_ERROR_UDP_LENGTH; - } - else - { - error0 = good_udp0 ? 0 : IP6_ERROR_UDP_CHECKSUM; - error0 = (len_diff0 >= 0) ? error0 : IP6_ERROR_UDP_LENGTH; - } - - next0 = error0 ? - IP_VXLAN_BYPASS_NEXT_DROP : IP_VXLAN_BYPASS_NEXT_VXLAN; - b0->error = error0 ? error_node->errors[error0] : 0; - - /* vxlan-input node expect current at VXLAN header */ - if (is_ip4) - vlib_buffer_advance (b0, - sizeof (ip4_header_t) + - sizeof (udp_header_t)); - else - vlib_buffer_advance (b0, - sizeof (ip6_header_t) + - sizeof (udp_header_t)); - - exit0: - /* Process packet 1 */ - if (proto1 != IP_PROTOCOL_UDP) - goto exit1; /* not UDP packet */ - - if (is_ip4) - udp1 = ip4_next_header (ip41); - else - udp1 = ip6_next_header (ip61); - - u32 fi1 = vlib_buffer_get_ip_fib_index (b1, is_ip4); - vxlan1 = vlib_buffer_get_current (b1) + sizeof (udp_header_t) + - sizeof (ip4_header_t); - - vxlan_decap_info_t di1 = - is_ip4 ? - vxlan4_find_tunnel (vxm, &last4, fi1, ip41, vxlan1, &stats_if1) : - vxlan6_find_tunnel (vxm, &last6, fi1, ip61, vxlan1, &stats_if1); - - if (PREDICT_FALSE (di1.sw_if_index == ~0)) - goto exit1; /* unknown interface */ - - /* Validate DIP against VTEPs */ - if (is_ip4) - { -#ifdef CLIB_HAVE_VEC512 - if (!vtep4_check_vector (&vxm->vtep_table, b1, ip41, &last_vtep4, - &vxm->vtep4_u512)) -#else - if (!vtep4_check (&vxm->vtep_table, b1, ip41, &last_vtep4)) -#endif - goto exit1; /* no local VTEP for VXLAN packet */ - } - else - { - if (!vtep6_check (&vxm->vtep_table, b1, ip61, &last_vtep6)) - goto exit1; /* no local VTEP for VXLAN packet */ - } - - flags1 = b1->flags; - good_udp1 = (flags1 & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0; - - /* Don't verify UDP checksum for packets with explicit zero checksum. */ - good_udp1 |= udp1->checksum == 0; - - /* Verify UDP length */ - if (is_ip4) - ip_len1 = clib_net_to_host_u16 (ip41->length); - else - ip_len1 = clib_net_to_host_u16 (ip61->payload_length); - udp_len1 = clib_net_to_host_u16 (udp1->length); - len_diff1 = ip_len1 - udp_len1; - - /* Verify UDP checksum */ - if (PREDICT_FALSE (!good_udp1)) - { - if (is_ip4) - flags1 = ip4_tcp_udp_validate_checksum (vm, b1); - else - flags1 = ip6_tcp_udp_icmp_validate_checksum (vm, b1); - good_udp1 = (flags1 & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0; - } - - if (is_ip4) - { - error1 = good_udp1 ? 0 : IP4_ERROR_UDP_CHECKSUM; - error1 = (len_diff1 >= 0) ? error1 : IP4_ERROR_UDP_LENGTH; - } - else - { - error1 = good_udp1 ? 0 : IP6_ERROR_UDP_CHECKSUM; - error1 = (len_diff1 >= 0) ? error1 : IP6_ERROR_UDP_LENGTH; - } - - next1 = error1 ? - IP_VXLAN_BYPASS_NEXT_DROP : IP_VXLAN_BYPASS_NEXT_VXLAN; - b1->error = error1 ? error_node->errors[error1] : 0; - - /* vxlan-input node expect current at VXLAN header */ - if (is_ip4) - vlib_buffer_advance (b1, - sizeof (ip4_header_t) + - sizeof (udp_header_t)); - else - vlib_buffer_advance (b1, - sizeof (ip6_header_t) + - sizeof (udp_header_t)); - - exit1: - vlib_validate_buffer_enqueue_x2 (vm, node, next_index, - to_next, n_left_to_next, - bi0, bi1, next0, next1); - } - - while (n_left_from > 0 && n_left_to_next > 0) - { - vlib_buffer_t *b0; - ip4_header_t *ip40; - ip6_header_t *ip60; - udp_header_t *udp0; - vxlan_header_t *vxlan0; - u32 bi0, ip_len0, udp_len0, flags0, next0; - i32 len_diff0; - u8 error0, good_udp0, proto0; - u32 stats_if0 = ~0; - - bi0 = to_next[0] = from[0]; - from += 1; - n_left_from -= 1; - to_next += 1; - n_left_to_next -= 1; - - b0 = b[0]; - b++; - if (is_ip4) - ip40 = vlib_buffer_get_current (b0); - else - ip60 = vlib_buffer_get_current (b0); - - /* Setup packet for next IP feature */ - vnet_feature_next (&next0, b0); - - if (is_ip4) - /* Treat IP4 frag packets as "experimental" protocol for now - until support of IP frag reassembly is implemented */ - proto0 = ip4_is_fragment (ip40) ? 0xfe : ip40->protocol; - else - proto0 = ip60->protocol; - - if (proto0 != IP_PROTOCOL_UDP) - goto exit; /* not UDP packet */ - - if (is_ip4) - udp0 = ip4_next_header (ip40); - else - udp0 = ip6_next_header (ip60); - - u32 fi0 = vlib_buffer_get_ip_fib_index (b0, is_ip4); - vxlan0 = vlib_buffer_get_current (b0) + sizeof (udp_header_t) + - sizeof (ip4_header_t); - - vxlan_decap_info_t di0 = - is_ip4 ? - vxlan4_find_tunnel (vxm, &last4, fi0, ip40, vxlan0, &stats_if0) : - vxlan6_find_tunnel (vxm, &last6, fi0, ip60, vxlan0, &stats_if0); - - if (PREDICT_FALSE (di0.sw_if_index == ~0)) - goto exit; /* unknown interface */ - - /* Validate DIP against VTEPs */ - if (is_ip4) - { -#ifdef CLIB_HAVE_VEC512 - if (!vtep4_check_vector (&vxm->vtep_table, b0, ip40, &last_vtep4, - &vxm->vtep4_u512)) -#else - if (!vtep4_check (&vxm->vtep_table, b0, ip40, &last_vtep4)) -#endif - goto exit; /* no local VTEP for VXLAN packet */ - } - else - { - if (!vtep6_check (&vxm->vtep_table, b0, ip60, &last_vtep6)) - goto exit; /* no local VTEP for VXLAN packet */ - } - - flags0 = b0->flags; - good_udp0 = (flags0 & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0; - - /* Don't verify UDP checksum for packets with explicit zero checksum. */ - good_udp0 |= udp0->checksum == 0; - - /* Verify UDP length */ - if (is_ip4) - ip_len0 = clib_net_to_host_u16 (ip40->length); - else - ip_len0 = clib_net_to_host_u16 (ip60->payload_length); - udp_len0 = clib_net_to_host_u16 (udp0->length); - len_diff0 = ip_len0 - udp_len0; - - /* Verify UDP checksum */ - if (PREDICT_FALSE (!good_udp0)) - { - if (is_ip4) - flags0 = ip4_tcp_udp_validate_checksum (vm, b0); - else - flags0 = ip6_tcp_udp_icmp_validate_checksum (vm, b0); - good_udp0 = (flags0 & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0; - } - - if (is_ip4) - { - error0 = good_udp0 ? 0 : IP4_ERROR_UDP_CHECKSUM; - error0 = (len_diff0 >= 0) ? error0 : IP4_ERROR_UDP_LENGTH; - } - else - { - error0 = good_udp0 ? 0 : IP6_ERROR_UDP_CHECKSUM; - error0 = (len_diff0 >= 0) ? error0 : IP6_ERROR_UDP_LENGTH; - } - - next0 = error0 ? - IP_VXLAN_BYPASS_NEXT_DROP : IP_VXLAN_BYPASS_NEXT_VXLAN; - b0->error = error0 ? error_node->errors[error0] : 0; - - /* vxlan-input node expect current at VXLAN header */ - if (is_ip4) - vlib_buffer_advance (b0, - sizeof (ip4_header_t) + - sizeof (udp_header_t)); - else - vlib_buffer_advance (b0, - sizeof (ip6_header_t) + - sizeof (udp_header_t)); - - exit: - vlib_validate_buffer_enqueue_x1 (vm, node, next_index, - to_next, n_left_to_next, - bi0, next0); - } - - vlib_put_next_frame (vm, node, next_index, n_left_to_next); - } - - return frame->n_vectors; -} - -VLIB_NODE_FN (ip4_vxlan_bypass_node) (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * frame) -{ - return ip_vxlan_bypass_inline (vm, node, frame, /* is_ip4 */ 1); -} - -/* *INDENT-OFF* */ -VLIB_REGISTER_NODE (ip4_vxlan_bypass_node) = -{ - .name = "ip4-vxlan-bypass", - .vector_size = sizeof (u32), - .n_next_nodes = IP_VXLAN_BYPASS_N_NEXT, - .next_nodes = { - [IP_VXLAN_BYPASS_NEXT_DROP] = "error-drop", - [IP_VXLAN_BYPASS_NEXT_VXLAN] = "vxlan4-input", - }, - .format_buffer = format_ip4_header, - .format_trace = format_ip4_forward_next_trace, -}; - -/* *INDENT-ON* */ - -/* Dummy init function to get us linked in. */ -static clib_error_t * -ip4_vxlan_bypass_init (vlib_main_t * vm) -{ - return 0; -} - -VLIB_INIT_FUNCTION (ip4_vxlan_bypass_init); - -VLIB_NODE_FN (ip6_vxlan_bypass_node) (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * frame) -{ - return ip_vxlan_bypass_inline (vm, node, frame, /* is_ip4 */ 0); -} - -/* *INDENT-OFF* */ -VLIB_REGISTER_NODE (ip6_vxlan_bypass_node) = -{ - .name = "ip6-vxlan-bypass", - .vector_size = sizeof (u32), - .n_next_nodes = IP_VXLAN_BYPASS_N_NEXT, - .next_nodes = { - [IP_VXLAN_BYPASS_NEXT_DROP] = "error-drop", - [IP_VXLAN_BYPASS_NEXT_VXLAN] = "vxlan6-input", - }, - .format_buffer = format_ip6_header, - .format_trace = format_ip6_forward_next_trace, -}; - -/* *INDENT-ON* */ - -/* Dummy init function to get us linked in. */ -static clib_error_t * -ip6_vxlan_bypass_init (vlib_main_t * vm) -{ - return 0; -} - -VLIB_INIT_FUNCTION (ip6_vxlan_bypass_init); - -#define foreach_vxlan_flow_input_next \ -_(DROP, "error-drop") \ -_(L2_INPUT, "l2-input") - -typedef enum -{ -#define _(s,n) VXLAN_FLOW_NEXT_##s, - foreach_vxlan_flow_input_next -#undef _ - VXLAN_FLOW_N_NEXT, -} vxlan_flow_input_next_t; - -#define foreach_vxlan_flow_error \ - _(NONE, "no error") \ - _(IP_CHECKSUM_ERROR, "Rx ip checksum errors") \ - _(IP_HEADER_ERROR, "Rx ip header errors") \ - _(UDP_CHECKSUM_ERROR, "Rx udp checksum errors") \ - _(UDP_LENGTH_ERROR, "Rx udp length errors") - -typedef enum -{ -#define _(f,s) VXLAN_FLOW_ERROR_##f, - foreach_vxlan_flow_error -#undef _ - VXLAN_FLOW_N_ERROR, -} vxlan_flow_error_t; - -static char *vxlan_flow_error_strings[] = { -#define _(n,s) s, - foreach_vxlan_flow_error -#undef _ -}; - - -static_always_inline u8 -vxlan_validate_udp_csum (vlib_main_t * vm, vlib_buffer_t * b) -{ - u32 flags = b->flags; - enum - { offset = - sizeof (ip4_header_t) + sizeof (udp_header_t) + sizeof (vxlan_header_t), - }; - - /* Verify UDP checksum */ - if ((flags & VNET_BUFFER_F_L4_CHECKSUM_COMPUTED) == 0) - { - vlib_buffer_advance (b, -offset); - flags = ip4_tcp_udp_validate_checksum (vm, b); - vlib_buffer_advance (b, offset); - } - - return (flags & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0; -} - -static_always_inline u8 -vxlan_check_udp_csum (vlib_main_t * vm, vlib_buffer_t * b) -{ - ip4_vxlan_header_t *hdr = vlib_buffer_get_current (b) - sizeof *hdr; - udp_header_t *udp = &hdr->udp; - /* Don't verify UDP checksum for packets with explicit zero checksum. */ - u8 good_csum = (b->flags & VNET_BUFFER_F_L4_CHECKSUM_CORRECT) != 0 || - udp->checksum == 0; - - return !good_csum; -} - -static_always_inline u8 -vxlan_check_ip (vlib_buffer_t * b, u16 payload_len) -{ - ip4_vxlan_header_t *hdr = vlib_buffer_get_current (b) - sizeof *hdr; - u16 ip_len = clib_net_to_host_u16 (hdr->ip4.length); - u16 expected = payload_len + sizeof *hdr; - return ip_len > expected || hdr->ip4.ttl == 0 - || hdr->ip4.ip_version_and_header_length != 0x45; -} - -static_always_inline u8 -vxlan_check_ip_udp_len (vlib_buffer_t * b) -{ - ip4_vxlan_header_t *hdr = vlib_buffer_get_current (b) - sizeof *hdr; - u16 ip_len = clib_net_to_host_u16 (hdr->ip4.length); - u16 udp_len = clib_net_to_host_u16 (hdr->udp.length); - return udp_len > ip_len; -} - -static_always_inline u8 -vxlan_err_code (u8 ip_err0, u8 udp_err0, u8 csum_err0) -{ - u8 error0 = VXLAN_FLOW_ERROR_NONE; - if (ip_err0) - error0 = VXLAN_FLOW_ERROR_IP_HEADER_ERROR; - if (udp_err0) - error0 = VXLAN_FLOW_ERROR_UDP_LENGTH_ERROR; - if (csum_err0) - error0 = VXLAN_FLOW_ERROR_UDP_CHECKSUM_ERROR; - return error0; -} - -VLIB_NODE_FN (vxlan4_flow_input_node) (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * f) -{ - enum - { payload_offset = sizeof (ip4_vxlan_header_t) }; - - vxlan_main_t *vxm = &vxlan_main; - vnet_interface_main_t *im = &vnet_main.interface_main; - vlib_combined_counter_main_t *rx_counter[VXLAN_FLOW_N_NEXT] = { - [VXLAN_FLOW_NEXT_DROP] = - im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_DROP, - [VXLAN_FLOW_NEXT_L2_INPUT] = - im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX, - }; - u32 thread_index = vlib_get_thread_index (); - - u32 *from = vlib_frame_vector_args (f); - u32 n_left_from = f->n_vectors; - u32 next_index = VXLAN_FLOW_NEXT_L2_INPUT; - - while (n_left_from > 0) - { - u32 n_left_to_next, *to_next; - - vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next); - - while (n_left_from > 3 && n_left_to_next > 3) - { - u32 bi0 = to_next[0] = from[0]; - u32 bi1 = to_next[1] = from[1]; - u32 bi2 = to_next[2] = from[2]; - u32 bi3 = to_next[3] = from[3]; - from += 4; - n_left_from -= 4; - to_next += 4; - n_left_to_next -= 4; - - vlib_buffer_t *b0 = vlib_get_buffer (vm, bi0); - vlib_buffer_t *b1 = vlib_get_buffer (vm, bi1); - vlib_buffer_t *b2 = vlib_get_buffer (vm, bi2); - vlib_buffer_t *b3 = vlib_get_buffer (vm, bi3); - - vlib_buffer_advance (b0, payload_offset); - vlib_buffer_advance (b1, payload_offset); - vlib_buffer_advance (b2, payload_offset); - vlib_buffer_advance (b3, payload_offset); - - u16 len0 = vlib_buffer_length_in_chain (vm, b0); - u16 len1 = vlib_buffer_length_in_chain (vm, b1); - u16 len2 = vlib_buffer_length_in_chain (vm, b2); - u16 len3 = vlib_buffer_length_in_chain (vm, b3); - - u32 next0 = VXLAN_FLOW_NEXT_L2_INPUT, next1 = - VXLAN_FLOW_NEXT_L2_INPUT, next2 = - VXLAN_FLOW_NEXT_L2_INPUT, next3 = VXLAN_FLOW_NEXT_L2_INPUT; - - u8 ip_err0 = vxlan_check_ip (b0, len0); - u8 ip_err1 = vxlan_check_ip (b1, len1); - u8 ip_err2 = vxlan_check_ip (b2, len2); - u8 ip_err3 = vxlan_check_ip (b3, len3); - u8 ip_err = ip_err0 | ip_err1 | ip_err2 | ip_err3; - - u8 udp_err0 = vxlan_check_ip_udp_len (b0); - u8 udp_err1 = vxlan_check_ip_udp_len (b1); - u8 udp_err2 = vxlan_check_ip_udp_len (b2); - u8 udp_err3 = vxlan_check_ip_udp_len (b3); - u8 udp_err = udp_err0 | udp_err1 | udp_err2 | udp_err3; - - u8 csum_err0 = vxlan_check_udp_csum (vm, b0); - u8 csum_err1 = vxlan_check_udp_csum (vm, b1); - u8 csum_err2 = vxlan_check_udp_csum (vm, b2); - u8 csum_err3 = vxlan_check_udp_csum (vm, b3); - u8 csum_err = csum_err0 | csum_err1 | csum_err2 | csum_err3; - - if (PREDICT_FALSE (csum_err)) - { - if (csum_err0) - csum_err0 = !vxlan_validate_udp_csum (vm, b0); - if (csum_err1) - csum_err1 = !vxlan_validate_udp_csum (vm, b1); - if (csum_err2) - csum_err2 = !vxlan_validate_udp_csum (vm, b2); - if (csum_err3) - csum_err3 = !vxlan_validate_udp_csum (vm, b3); - csum_err = csum_err0 | csum_err1 | csum_err2 | csum_err3; - } - - if (PREDICT_FALSE (ip_err || udp_err || csum_err)) - { - if (ip_err0 || udp_err0 || csum_err0) - { - next0 = VXLAN_FLOW_NEXT_DROP; - u8 error0 = vxlan_err_code (ip_err0, udp_err0, csum_err0); - b0->error = node->errors[error0]; - } - if (ip_err1 || udp_err1 || csum_err1) - { - next1 = VXLAN_FLOW_NEXT_DROP; - u8 error1 = vxlan_err_code (ip_err1, udp_err1, csum_err1); - b1->error = node->errors[error1]; - } - if (ip_err2 || udp_err2 || csum_err2) - { - next2 = VXLAN_FLOW_NEXT_DROP; - u8 error2 = vxlan_err_code (ip_err2, udp_err2, csum_err2); - b2->error = node->errors[error2]; - } - if (ip_err3 || udp_err3 || csum_err3) - { - next3 = VXLAN_FLOW_NEXT_DROP; - u8 error3 = vxlan_err_code (ip_err3, udp_err3, csum_err3); - b3->error = node->errors[error3]; - } - } - - vnet_update_l2_len (b0); - vnet_update_l2_len (b1); - vnet_update_l2_len (b2); - vnet_update_l2_len (b3); - - ASSERT (b0->flow_id != 0); - ASSERT (b1->flow_id != 0); - ASSERT (b2->flow_id != 0); - ASSERT (b3->flow_id != 0); - - u32 t_index0 = b0->flow_id - vxm->flow_id_start; - u32 t_index1 = b1->flow_id - vxm->flow_id_start; - u32 t_index2 = b2->flow_id - vxm->flow_id_start; - u32 t_index3 = b3->flow_id - vxm->flow_id_start; - - vxlan_tunnel_t *t0 = &vxm->tunnels[t_index0]; - vxlan_tunnel_t *t1 = &vxm->tunnels[t_index1]; - vxlan_tunnel_t *t2 = &vxm->tunnels[t_index2]; - vxlan_tunnel_t *t3 = &vxm->tunnels[t_index3]; - - /* flow id consumed */ - b0->flow_id = 0; - b1->flow_id = 0; - b2->flow_id = 0; - b3->flow_id = 0; - - u32 sw_if_index0 = vnet_buffer (b0)->sw_if_index[VLIB_RX] = - t0->sw_if_index; - u32 sw_if_index1 = vnet_buffer (b1)->sw_if_index[VLIB_RX] = - t1->sw_if_index; - u32 sw_if_index2 = vnet_buffer (b2)->sw_if_index[VLIB_RX] = - t2->sw_if_index; - u32 sw_if_index3 = vnet_buffer (b3)->sw_if_index[VLIB_RX] = - t3->sw_if_index; - - vlib_increment_combined_counter (rx_counter[next0], thread_index, - sw_if_index0, 1, len0); - vlib_increment_combined_counter (rx_counter[next1], thread_index, - sw_if_index1, 1, len1); - vlib_increment_combined_counter (rx_counter[next2], thread_index, - sw_if_index2, 1, len2); - vlib_increment_combined_counter (rx_counter[next3], thread_index, - sw_if_index3, 1, len3); - - u32 flags = b0->flags | b1->flags | b2->flags | b3->flags; - - if (PREDICT_FALSE (flags & VLIB_BUFFER_IS_TRACED)) - { - if (b0->flags & VLIB_BUFFER_IS_TRACED) - { - vxlan_rx_trace_t *tr = - vlib_add_trace (vm, node, b0, sizeof *tr); - u8 error0 = vxlan_err_code (ip_err0, udp_err0, csum_err0); - tr->next_index = next0; - tr->error = error0; - tr->tunnel_index = t_index0; - tr->vni = t0->vni; - } - if (b1->flags & VLIB_BUFFER_IS_TRACED) - { - vxlan_rx_trace_t *tr = - vlib_add_trace (vm, node, b1, sizeof *tr); - u8 error1 = vxlan_err_code (ip_err1, udp_err1, csum_err1); - tr->next_index = next1; - tr->error = error1; - tr->tunnel_index = t_index1; - tr->vni = t1->vni; - } - if (b2->flags & VLIB_BUFFER_IS_TRACED) - { - vxlan_rx_trace_t *tr = - vlib_add_trace (vm, node, b2, sizeof *tr); - u8 error2 = vxlan_err_code (ip_err2, udp_err2, csum_err2); - tr->next_index = next2; - tr->error = error2; - tr->tunnel_index = t_index2; - tr->vni = t2->vni; - } - if (b3->flags & VLIB_BUFFER_IS_TRACED) - { - vxlan_rx_trace_t *tr = - vlib_add_trace (vm, node, b3, sizeof *tr); - u8 error3 = vxlan_err_code (ip_err3, udp_err3, csum_err3); - tr->next_index = next3; - tr->error = error3; - tr->tunnel_index = t_index3; - tr->vni = t3->vni; - } - } - vlib_validate_buffer_enqueue_x4 - (vm, node, next_index, to_next, n_left_to_next, - bi0, bi1, bi2, bi3, next0, next1, next2, next3); - } - while (n_left_from > 0 && n_left_to_next > 0) - { - u32 bi0 = to_next[0] = from[0]; - from++; - n_left_from--; - to_next++; - n_left_to_next--; - - vlib_buffer_t *b0 = vlib_get_buffer (vm, bi0); - vlib_buffer_advance (b0, payload_offset); - - u16 len0 = vlib_buffer_length_in_chain (vm, b0); - u32 next0 = VXLAN_FLOW_NEXT_L2_INPUT; - - u8 ip_err0 = vxlan_check_ip (b0, len0); - u8 udp_err0 = vxlan_check_ip_udp_len (b0); - u8 csum_err0 = vxlan_check_udp_csum (vm, b0); - - if (csum_err0) - csum_err0 = !vxlan_validate_udp_csum (vm, b0); - if (ip_err0 || udp_err0 || csum_err0) - { - next0 = VXLAN_FLOW_NEXT_DROP; - u8 error0 = vxlan_err_code (ip_err0, udp_err0, csum_err0); - b0->error = node->errors[error0]; - } - - vnet_update_l2_len (b0); - - ASSERT (b0->flow_id != 0); - u32 t_index0 = b0->flow_id - vxm->flow_id_start; - vxlan_tunnel_t *t0 = &vxm->tunnels[t_index0]; - b0->flow_id = 0; - - u32 sw_if_index0 = vnet_buffer (b0)->sw_if_index[VLIB_RX] = - t0->sw_if_index; - vlib_increment_combined_counter (rx_counter[next0], thread_index, - sw_if_index0, 1, len0); - - if (PREDICT_FALSE (b0->flags & VLIB_BUFFER_IS_TRACED)) - { - vxlan_rx_trace_t *tr = - vlib_add_trace (vm, node, b0, sizeof *tr); - u8 error0 = vxlan_err_code (ip_err0, udp_err0, csum_err0); - tr->next_index = next0; - tr->error = error0; - tr->tunnel_index = t_index0; - tr->vni = t0->vni; - } - vlib_validate_buffer_enqueue_x1 (vm, node, next_index, - to_next, n_left_to_next, - bi0, next0); - } - - vlib_put_next_frame (vm, node, next_index, n_left_to_next); - } - - return f->n_vectors; -} - -/* *INDENT-OFF* */ -#ifndef CLIB_MULTIARCH_VARIANT -VLIB_REGISTER_NODE (vxlan4_flow_input_node) = { - .name = "vxlan-flow-input", - .type = VLIB_NODE_TYPE_INTERNAL, - .vector_size = sizeof (u32), - - .format_trace = format_vxlan_rx_trace, - - .n_errors = VXLAN_FLOW_N_ERROR, - .error_strings = vxlan_flow_error_strings, - - .n_next_nodes = VXLAN_FLOW_N_NEXT, - .next_nodes = { -#define _(s,n) [VXLAN_FLOW_NEXT_##s] = n, - foreach_vxlan_flow_input_next -#undef _ - }, -}; -#endif -/* *INDENT-ON* */ - -/* - * fd.io coding-style-patch-verification: ON - * - * Local Variables: - * eval: (c-set-style "gnu") - * End: - */ diff --git a/src/vnet/vxlan/dir.dox b/src/vnet/vxlan/dir.dox deleted file mode 100644 index 31a9e2b6112..00000000000 --- a/src/vnet/vxlan/dir.dox +++ /dev/null @@ -1,24 +0,0 @@ -/* - * Copyright (c) 2016 Cisco and/or its affiliates. - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -/** -@dir -@brief VXLAN Code. - -This directory contains source code to support VXLAN. - -*/ -/*? %%clicmd:group_label VXLAN CLI %% ?*/ diff --git a/src/vnet/vxlan/encap.c b/src/vnet/vxlan/encap.c deleted file mode 100644 index 0961a27942d..00000000000 --- a/src/vnet/vxlan/encap.c +++ /dev/null @@ -1,540 +0,0 @@ - -/* - * Copyright (c) 2015 Cisco and/or its affiliates. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -#include <vppinfra/error.h> -#include <vppinfra/hash.h> -#include <vnet/vnet.h> -#include <vnet/ip/ip.h> -#include <vnet/ethernet/ethernet.h> -#include <vnet/interface_output.h> -#include <vnet/vxlan/vxlan.h> -#include <vnet/qos/qos_types.h> -#include <vnet/adj/rewrite.h> - -/* Statistics (not all errors) */ -#define foreach_vxlan_encap_error \ -_(ENCAPSULATED, "good packets encapsulated") - -static char *vxlan_encap_error_strings[] = { -#define _(sym,string) string, - foreach_vxlan_encap_error -#undef _ -}; - -typedef enum -{ -#define _(sym,str) VXLAN_ENCAP_ERROR_##sym, - foreach_vxlan_encap_error -#undef _ - VXLAN_ENCAP_N_ERROR, -} vxlan_encap_error_t; - -typedef enum -{ - VXLAN_ENCAP_NEXT_DROP, - VXLAN_ENCAP_N_NEXT, -} vxlan_encap_next_t; - -typedef struct -{ - u32 tunnel_index; - u32 vni; -} vxlan_encap_trace_t; - -#ifndef CLIB_MARCH_VARIANT -u8 * -format_vxlan_encap_trace (u8 * s, va_list * args) -{ - CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *); - CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *); - vxlan_encap_trace_t *t = va_arg (*args, vxlan_encap_trace_t *); - - s = format (s, "VXLAN encap to vxlan_tunnel%d vni %d", - t->tunnel_index, t->vni); - return s; -} -#endif - -always_inline uword -vxlan_encap_inline (vlib_main_t *vm, vlib_node_runtime_t *node, - vlib_frame_t *from_frame, u8 is_ip4) -{ - u32 n_left_from, next_index, *from, *to_next; - vxlan_main_t *vxm = &vxlan_main; - vnet_main_t *vnm = vxm->vnet_main; - vnet_interface_main_t *im = &vnm->interface_main; - vlib_combined_counter_main_t *tx_counter = - im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_TX; - u32 pkts_encapsulated = 0; - u32 thread_index = vlib_get_thread_index (); - u32 sw_if_index0 = 0, sw_if_index1 = 0; - u32 next0 = 0, next1 = 0; - vxlan_tunnel_t *t0 = NULL, *t1 = NULL; - index_t dpoi_idx0 = INDEX_INVALID, dpoi_idx1 = INDEX_INVALID; - vlib_buffer_t *bufs[VLIB_FRAME_SIZE]; - vlib_buffer_t **b = bufs; - - from = vlib_frame_vector_args (from_frame); - n_left_from = from_frame->n_vectors; - - next_index = node->cached_next_index; - - STATIC_ASSERT_SIZEOF (ip6_vxlan_header_t, 56); - STATIC_ASSERT_SIZEOF (ip4_vxlan_header_t, 36); - - u8 const underlay_hdr_len = is_ip4 ? - sizeof (ip4_vxlan_header_t) : sizeof (ip6_vxlan_header_t); - u16 const l3_len = is_ip4 ? sizeof (ip4_header_t) : sizeof (ip6_header_t); - u32 const outer_packet_csum_offload_flags = - is_ip4 ? (VNET_BUFFER_OFFLOAD_F_OUTER_IP_CKSUM | - VNET_BUFFER_OFFLOAD_F_TNL_VXLAN) : - (VNET_BUFFER_OFFLOAD_F_OUTER_UDP_CKSUM | - VNET_BUFFER_OFFLOAD_F_TNL_VXLAN); - - vlib_get_buffers (vm, from, bufs, n_left_from); - - while (n_left_from > 0) - { - u32 n_left_to_next; - - vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next); - - while (n_left_from >= 4 && n_left_to_next >= 2) - { - /* Prefetch next iteration. */ - { - vlib_prefetch_buffer_header (b[2], LOAD); - vlib_prefetch_buffer_header (b[3], LOAD); - - CLIB_PREFETCH (b[2]->data - CLIB_CACHE_LINE_BYTES, - 2 * CLIB_CACHE_LINE_BYTES, LOAD); - CLIB_PREFETCH (b[3]->data - CLIB_CACHE_LINE_BYTES, - 2 * CLIB_CACHE_LINE_BYTES, LOAD); - } - - u32 bi0 = to_next[0] = from[0]; - u32 bi1 = to_next[1] = from[1]; - from += 2; - to_next += 2; - n_left_to_next -= 2; - n_left_from -= 2; - - vlib_buffer_t *b0 = b[0]; - vlib_buffer_t *b1 = b[1]; - b += 2; - - u32 flow_hash0 = vnet_l2_compute_flow_hash (b0); - u32 flow_hash1 = vnet_l2_compute_flow_hash (b1); - - /* Get next node index and adj index from tunnel next_dpo */ - if (sw_if_index0 != vnet_buffer (b0)->sw_if_index[VLIB_TX]) - { - sw_if_index0 = vnet_buffer (b0)->sw_if_index[VLIB_TX]; - vnet_hw_interface_t *hi0 = - vnet_get_sup_hw_interface (vnm, sw_if_index0); - t0 = &vxm->tunnels[hi0->dev_instance]; - /* Note: change to always set next0 if it may set to drop */ - next0 = t0->next_dpo.dpoi_next_node; - dpoi_idx0 = t0->next_dpo.dpoi_index; - } - - /* Get next node index and adj index from tunnel next_dpo */ - if (sw_if_index1 != vnet_buffer (b1)->sw_if_index[VLIB_TX]) - { - if (sw_if_index0 == vnet_buffer (b1)->sw_if_index[VLIB_TX]) - { - sw_if_index1 = sw_if_index0; - t1 = t0; - next1 = next0; - dpoi_idx1 = dpoi_idx0; - } - else - { - sw_if_index1 = vnet_buffer (b1)->sw_if_index[VLIB_TX]; - vnet_hw_interface_t *hi1 = - vnet_get_sup_hw_interface (vnm, sw_if_index1); - t1 = &vxm->tunnels[hi1->dev_instance]; - /* Note: change to always set next1 if it may set to drop */ - next1 = t1->next_dpo.dpoi_next_node; - dpoi_idx1 = t1->next_dpo.dpoi_index; - } - } - - vnet_buffer (b0)->ip.adj_index[VLIB_TX] = dpoi_idx0; - vnet_buffer (b1)->ip.adj_index[VLIB_TX] = dpoi_idx1; - - ASSERT (t0->rewrite_header.data_bytes == underlay_hdr_len); - ASSERT (t1->rewrite_header.data_bytes == underlay_hdr_len); - vnet_rewrite_two_headers (*t0, *t1, vlib_buffer_get_current (b0), - vlib_buffer_get_current (b1), - underlay_hdr_len); - - vlib_buffer_advance (b0, -underlay_hdr_len); - vlib_buffer_advance (b1, -underlay_hdr_len); - - u32 len0 = vlib_buffer_length_in_chain (vm, b0); - u32 len1 = vlib_buffer_length_in_chain (vm, b1); - u16 payload_l0 = clib_host_to_net_u16 (len0 - l3_len); - u16 payload_l1 = clib_host_to_net_u16 (len1 - l3_len); - - void *underlay0 = vlib_buffer_get_current (b0); - void *underlay1 = vlib_buffer_get_current (b1); - - ip4_header_t *ip4_0, *ip4_1; - qos_bits_t ip4_0_tos = 0, ip4_1_tos = 0; - ip6_header_t *ip6_0, *ip6_1; - udp_header_t *udp0, *udp1; - u8 *l3_0, *l3_1; - if (is_ip4) - { - ip4_vxlan_header_t *hdr0 = underlay0; - ip4_vxlan_header_t *hdr1 = underlay1; - - /* Fix the IP4 checksum and length */ - ip4_0 = &hdr0->ip4; - ip4_1 = &hdr1->ip4; - ip4_0->length = clib_host_to_net_u16 (len0); - ip4_1->length = clib_host_to_net_u16 (len1); - - if (PREDICT_FALSE (b0->flags & VNET_BUFFER_F_QOS_DATA_VALID)) - { - ip4_0_tos = vnet_buffer2 (b0)->qos.bits; - ip4_0->tos = ip4_0_tos; - } - if (PREDICT_FALSE (b1->flags & VNET_BUFFER_F_QOS_DATA_VALID)) - { - ip4_1_tos = vnet_buffer2 (b1)->qos.bits; - ip4_1->tos = ip4_1_tos; - } - - l3_0 = (u8 *) ip4_0; - l3_1 = (u8 *) ip4_1; - udp0 = &hdr0->udp; - udp1 = &hdr1->udp; - } - else /* ipv6 */ - { - ip6_vxlan_header_t *hdr0 = underlay0; - ip6_vxlan_header_t *hdr1 = underlay1; - - /* Fix IP6 payload length */ - ip6_0 = &hdr0->ip6; - ip6_1 = &hdr1->ip6; - ip6_0->payload_length = payload_l0; - ip6_1->payload_length = payload_l1; - - l3_0 = (u8 *) ip6_0; - l3_1 = (u8 *) ip6_1; - udp0 = &hdr0->udp; - udp1 = &hdr1->udp; - } - - /* Fix UDP length and set source port */ - udp0->length = payload_l0; - udp0->src_port = flow_hash0; - udp1->length = payload_l1; - udp1->src_port = flow_hash1; - - if (b0->flags & VNET_BUFFER_F_OFFLOAD) - { - vnet_buffer2 (b0)->outer_l3_hdr_offset = l3_0 - b0->data; - vnet_buffer2 (b0)->outer_l4_hdr_offset = (u8 *) udp0 - b0->data; - vnet_buffer_offload_flags_set (b0, - outer_packet_csum_offload_flags); - } - /* IPv4 checksum only */ - else if (is_ip4) - { - ip_csum_t sum0 = ip4_0->checksum; - sum0 = ip_csum_update (sum0, 0, ip4_0->length, ip4_header_t, - length /* changed member */); - if (PREDICT_FALSE (ip4_0_tos)) - { - sum0 = ip_csum_update (sum0, 0, ip4_0_tos, ip4_header_t, - tos /* changed member */); - } - ip4_0->checksum = ip_csum_fold (sum0); - } - /* IPv6 UDP checksum is mandatory */ - else - { - int bogus = 0; - - udp0->checksum = - ip6_tcp_udp_icmp_compute_checksum (vm, b0, ip6_0, &bogus); - ASSERT (bogus == 0); - if (udp0->checksum == 0) - udp0->checksum = 0xffff; - } - - if (b1->flags & VNET_BUFFER_F_OFFLOAD) - { - vnet_buffer2 (b1)->outer_l3_hdr_offset = l3_1 - b1->data; - vnet_buffer2 (b1)->outer_l4_hdr_offset = (u8 *) udp1 - b1->data; - vnet_buffer_offload_flags_set (b1, - outer_packet_csum_offload_flags); - } - /* IPv4 checksum only */ - else if (is_ip4) - { - ip_csum_t sum1 = ip4_1->checksum; - sum1 = ip_csum_update (sum1, 0, ip4_1->length, ip4_header_t, - length /* changed member */); - if (PREDICT_FALSE (ip4_1_tos)) - { - sum1 = ip_csum_update (sum1, 0, ip4_1_tos, ip4_header_t, - tos /* changed member */); - } - ip4_1->checksum = ip_csum_fold (sum1); - } - /* IPv6 UDP checksum is mandatory */ - else - { - int bogus = 0; - - udp1->checksum = ip6_tcp_udp_icmp_compute_checksum - (vm, b1, ip6_1, &bogus); - ASSERT (bogus == 0); - if (udp1->checksum == 0) - udp1->checksum = 0xffff; - } - - /* save inner packet flow_hash for load-balance node */ - vnet_buffer (b0)->ip.flow_hash = flow_hash0; - vnet_buffer (b1)->ip.flow_hash = flow_hash1; - - if (sw_if_index0 == sw_if_index1) - { - vlib_increment_combined_counter (tx_counter, thread_index, - sw_if_index0, 2, len0 + len1); - } - else - { - vlib_increment_combined_counter (tx_counter, thread_index, - sw_if_index0, 1, len0); - vlib_increment_combined_counter (tx_counter, thread_index, - sw_if_index1, 1, len1); - } - pkts_encapsulated += 2; - - if (PREDICT_FALSE (b0->flags & VLIB_BUFFER_IS_TRACED)) - { - vxlan_encap_trace_t *tr = - vlib_add_trace (vm, node, b0, sizeof (*tr)); - tr->tunnel_index = t0 - vxm->tunnels; - tr->vni = t0->vni; - } - - if (PREDICT_FALSE (b1->flags & VLIB_BUFFER_IS_TRACED)) - { - vxlan_encap_trace_t *tr = - vlib_add_trace (vm, node, b1, sizeof (*tr)); - tr->tunnel_index = t1 - vxm->tunnels; - tr->vni = t1->vni; - } - - vlib_validate_buffer_enqueue_x2 (vm, node, next_index, - to_next, n_left_to_next, - bi0, bi1, next0, next1); - } - - while (n_left_from > 0 && n_left_to_next > 0) - { - u32 bi0 = to_next[0] = from[0]; - from += 1; - to_next += 1; - n_left_from -= 1; - n_left_to_next -= 1; - - vlib_buffer_t *b0 = b[0]; - b += 1; - - u32 flow_hash0 = vnet_l2_compute_flow_hash (b0); - - /* Get next node index and adj index from tunnel next_dpo */ - if (sw_if_index0 != vnet_buffer (b0)->sw_if_index[VLIB_TX]) - { - sw_if_index0 = vnet_buffer (b0)->sw_if_index[VLIB_TX]; - vnet_hw_interface_t *hi0 = - vnet_get_sup_hw_interface (vnm, sw_if_index0); - t0 = &vxm->tunnels[hi0->dev_instance]; - /* Note: change to always set next0 if it may be set to drop */ - next0 = t0->next_dpo.dpoi_next_node; - dpoi_idx0 = t0->next_dpo.dpoi_index; - } - vnet_buffer (b0)->ip.adj_index[VLIB_TX] = dpoi_idx0; - - ASSERT (t0->rewrite_header.data_bytes == underlay_hdr_len); - vnet_rewrite_one_header (*t0, vlib_buffer_get_current (b0), - underlay_hdr_len); - - vlib_buffer_advance (b0, -underlay_hdr_len); - void *underlay0 = vlib_buffer_get_current (b0); - - u32 len0 = vlib_buffer_length_in_chain (vm, b0); - u16 payload_l0 = clib_host_to_net_u16 (len0 - l3_len); - - udp_header_t *udp0; - ip4_header_t *ip4_0; - qos_bits_t ip4_0_tos = 0; - ip6_header_t *ip6_0; - u8 *l3_0; - if (is_ip4) - { - ip4_vxlan_header_t *hdr = underlay0; - - /* Fix the IP4 checksum and length */ - ip4_0 = &hdr->ip4; - ip4_0->length = clib_host_to_net_u16 (len0); - - if (PREDICT_FALSE (b0->flags & VNET_BUFFER_F_QOS_DATA_VALID)) - { - ip4_0_tos = vnet_buffer2 (b0)->qos.bits; - ip4_0->tos = ip4_0_tos; - } - - l3_0 = (u8 *) ip4_0; - udp0 = &hdr->udp; - } - else /* ip6 path */ - { - ip6_vxlan_header_t *hdr = underlay0; - - /* Fix IP6 payload length */ - ip6_0 = &hdr->ip6; - ip6_0->payload_length = payload_l0; - - l3_0 = (u8 *) ip6_0; - udp0 = &hdr->udp; - } - - /* Fix UDP length and set source port */ - udp0->length = payload_l0; - udp0->src_port = flow_hash0; - - if (b0->flags & VNET_BUFFER_F_OFFLOAD) - { - vnet_buffer2 (b0)->outer_l3_hdr_offset = l3_0 - b0->data; - vnet_buffer2 (b0)->outer_l4_hdr_offset = (u8 *) udp0 - b0->data; - vnet_buffer_offload_flags_set (b0, - outer_packet_csum_offload_flags); - } - /* IPv4 checksum only */ - else if (is_ip4) - { - ip_csum_t sum0 = ip4_0->checksum; - sum0 = ip_csum_update (sum0, 0, ip4_0->length, ip4_header_t, - length /* changed member */); - if (PREDICT_FALSE (ip4_0_tos)) - { - sum0 = ip_csum_update (sum0, 0, ip4_0_tos, ip4_header_t, - tos /* changed member */); - } - ip4_0->checksum = ip_csum_fold (sum0); - } - /* IPv6 UDP checksum is mandatory */ - else - { - int bogus = 0; - - udp0->checksum = ip6_tcp_udp_icmp_compute_checksum - (vm, b0, ip6_0, &bogus); - ASSERT (bogus == 0); - if (udp0->checksum == 0) - udp0->checksum = 0xffff; - } - - /* reuse inner packet flow_hash for load-balance node */ - vnet_buffer (b0)->ip.flow_hash = flow_hash0; - - vlib_increment_combined_counter (tx_counter, thread_index, - sw_if_index0, 1, len0); - pkts_encapsulated++; - - if (PREDICT_FALSE (b0->flags & VLIB_BUFFER_IS_TRACED)) - { - vxlan_encap_trace_t *tr = - vlib_add_trace (vm, node, b0, sizeof (*tr)); - tr->tunnel_index = t0 - vxm->tunnels; - tr->vni = t0->vni; - } - vlib_validate_buffer_enqueue_x1 (vm, node, next_index, - to_next, n_left_to_next, - bi0, next0); - } - - vlib_put_next_frame (vm, node, next_index, n_left_to_next); - } - - /* Do we still need this now that tunnel tx stats is kept? */ - vlib_node_increment_counter (vm, node->node_index, - VXLAN_ENCAP_ERROR_ENCAPSULATED, - pkts_encapsulated); - - return from_frame->n_vectors; -} - -VLIB_NODE_FN (vxlan4_encap_node) (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * from_frame) -{ - /* Disable chksum offload as setup overhead in tx node is not worthwhile - for ip4 header checksum only, unless udp checksum is also required */ - return vxlan_encap_inline (vm, node, from_frame, /* is_ip4 */ 1); -} - -VLIB_NODE_FN (vxlan6_encap_node) (vlib_main_t * vm, - vlib_node_runtime_t * node, - vlib_frame_t * from_frame) -{ - /* Enable checksum offload for ip6 as udp checksum is mandatory, */ - return vxlan_encap_inline (vm, node, from_frame, /* is_ip4 */ 0); -} - -/* *INDENT-OFF* */ -VLIB_REGISTER_NODE (vxlan4_encap_node) = { - .name = "vxlan4-encap", - .vector_size = sizeof (u32), - .format_trace = format_vxlan_encap_trace, - .type = VLIB_NODE_TYPE_INTERNAL, - .n_errors = ARRAY_LEN(vxlan_encap_error_strings), - .error_strings = vxlan_encap_error_strings, - .n_next_nodes = VXLAN_ENCAP_N_NEXT, - .next_nodes = { - [VXLAN_ENCAP_NEXT_DROP] = "error-drop", - }, -}; - -VLIB_REGISTER_NODE (vxlan6_encap_node) = { - .name = "vxlan6-encap", - .vector_size = sizeof (u32), - .format_trace = format_vxlan_encap_trace, - .type = VLIB_NODE_TYPE_INTERNAL, - .n_errors = ARRAY_LEN(vxlan_encap_error_strings), - .error_strings = vxlan_encap_error_strings, - .n_next_nodes = VXLAN_ENCAP_N_NEXT, - .next_nodes = { - [VXLAN_ENCAP_NEXT_DROP] = "error-drop", - }, -}; -/* *INDENT-ON* */ - -/* - * fd.io coding-style-patch-verification: ON - * - * Local Variables: - * eval: (c-set-style "gnu") - * End: - */ diff --git a/src/vnet/vxlan/vxlan.api b/src/vnet/vxlan/vxlan.api deleted file mode 100644 index b7e678595d8..00000000000 --- a/src/vnet/vxlan/vxlan.api +++ /dev/null @@ -1,198 +0,0 @@ -/* - * Copyright (c) 2015-2016 Cisco and/or its affiliates. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -option version = "2.1.0"; - -import "vnet/interface_types.api"; -import "vnet/ip/ip_types.api"; - -/** \brief Create or delete a VXLAN tunnel - @param client_index - opaque cookie to identify the sender - @param context - sender context, to match reply w/ request - @param is_add - Use 1 to create the tunnel, 0 to remove it - @param instance - optional unique custom device instance, else ~0. - @param src_address - Source IP address - @param dst_address - Destination IP address, can be multicast - @param mcast_sw_if_index - Interface for multicast destination - @param encap_vrf_id - Encap route table FIB index - @param decap_next_index - index of decap next graph node - @param vni - The VXLAN Network Identifier, uint24 -*/ -define vxlan_add_del_tunnel -{ - u32 client_index; - u32 context; - bool is_add [default=true]; - u32 instance; /* If non-~0, specifies a custom dev instance */ - vl_api_address_t src_address; - vl_api_address_t dst_address; - vl_api_interface_index_t mcast_sw_if_index; - u32 encap_vrf_id; - u32 decap_next_index; - u32 vni; -}; - -/** \brief Create or delete a VXLAN tunnel - @param client_index - opaque cookie to identify the sender - @param context - sender context, to match reply w/ request - @param is_add - Use 1 to create the tunnel, 0 to remove it - @param instance - optional unique custom device instance, else ~0. - @param src_address - Source IP address - @param dst_address - Destination IP address, can be multicast - @param src_port - Source UDP port. It is not included in sent packets. Used only for port registration - @param dst_port - Destination UDP port - @param mcast_sw_if_index - Interface for multicast destination - @param encap_vrf_id - Encap route table FIB index - @param decap_next_index - index of decap next graph node - @param vni - The VXLAN Network Identifier, uint24 -*/ -define vxlan_add_del_tunnel_v2 -{ - u32 client_index; - u32 context; - bool is_add [default=true]; - u32 instance [default=0xffffffff]; /* If non-~0, specifies a custom dev instance */ - vl_api_address_t src_address; - vl_api_address_t dst_address; - u16 src_port; - u16 dst_port; - vl_api_interface_index_t mcast_sw_if_index; - u32 encap_vrf_id; - u32 decap_next_index; - u32 vni; -}; - -/** \brief Create or delete a VXLAN tunnel - @param client_index - opaque cookie to identify the sender - @param context - sender context, to match reply w/ request - @param is_add - Use 1 to create the tunnel, 0 to remove it - @param instance - optional unique custom device instance, else ~0. - @param src_address - Source IP address - @param dst_address - Destination IP address, can be multicast - @param src_port - Source UDP port. It is not included in sent packets. Used only for port registration - @param dst_port - Destination UDP port - @param mcast_sw_if_index - Interface for multicast destination - @param encap_vrf_id - Encap route table FIB index - @param decap_next_index - index of decap next graph node - @param vni - The VXLAN Network Identifier, uint24 - @param is_l3 - if true, create the interface in L3 mode, w/o MAC -*/ -define vxlan_add_del_tunnel_v3 -{ - u32 client_index; - u32 context; - bool is_add [default=true]; - u32 instance [default=0xffffffff]; /* If non-~0, specifies a custom dev instance */ - vl_api_address_t src_address; - vl_api_address_t dst_address; - u16 src_port; - u16 dst_port; - vl_api_interface_index_t mcast_sw_if_index; - u32 encap_vrf_id; - u32 decap_next_index; - u32 vni; - bool is_l3 [default=false]; -}; - -define vxlan_add_del_tunnel_reply -{ - u32 context; - i32 retval; - vl_api_interface_index_t sw_if_index; -}; -define vxlan_add_del_tunnel_v2_reply -{ - u32 context; - i32 retval; - vl_api_interface_index_t sw_if_index; -}; -define vxlan_add_del_tunnel_v3_reply -{ - u32 context; - i32 retval; - vl_api_interface_index_t sw_if_index; -}; - -define vxlan_tunnel_dump -{ - u32 client_index; - u32 context; - vl_api_interface_index_t sw_if_index; -}; -define vxlan_tunnel_v2_dump -{ - u32 client_index; - u32 context; - vl_api_interface_index_t sw_if_index; -}; - -define vxlan_tunnel_details -{ - u32 context; - vl_api_interface_index_t sw_if_index; - u32 instance; - vl_api_address_t src_address; - vl_api_address_t dst_address; - vl_api_interface_index_t mcast_sw_if_index; - u32 encap_vrf_id; - u32 decap_next_index; - u32 vni; -}; -define vxlan_tunnel_v2_details -{ - u32 context; - vl_api_interface_index_t sw_if_index; - u32 instance; - vl_api_address_t src_address; - vl_api_address_t dst_address; - u16 src_port; - u16 dst_port; - vl_api_interface_index_t mcast_sw_if_index; - u32 encap_vrf_id; - u32 decap_next_index; - u32 vni; -}; - -/** \brief Interface set vxlan-bypass request - @param client_index - opaque cookie to identify the sender - @param context - sender context, to match reply w/ request - @param sw_if_index - interface used to reach neighbor - @param is_ipv6 - if non-zero, enable ipv6-vxlan-bypass, else ipv4-vxlan-bypass - @param enable - if non-zero enable, else disable -*/ -autoreply define sw_interface_set_vxlan_bypass -{ - u32 client_index; - u32 context; - vl_api_interface_index_t sw_if_index; - bool is_ipv6; - bool enable [default=true]; -}; - -/** \brief Offload vxlan rx request - @param client_index - opaque cookie to identify the sender - @param context - sender context, to match reply w/ request - @param hw_if_index - rx hw interface - @param sw_if_index - vxlan interface to offload - @param enable - if non-zero enable, else disable -*/ -autoreply define vxlan_offload_rx -{ - u32 client_index; - u32 context; - vl_api_interface_index_t hw_if_index; - vl_api_interface_index_t sw_if_index; - bool enable [default=true]; -}; diff --git a/src/vnet/vxlan/vxlan.c b/src/vnet/vxlan/vxlan.c deleted file mode 100644 index 1871e5d71d2..00000000000 --- a/src/vnet/vxlan/vxlan.c +++ /dev/null @@ -1,1349 +0,0 @@ -/* - * Copyright (c) 2015 Cisco and/or its affiliates. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -#include <vnet/vxlan/vxlan.h> -#include <vnet/ip/format.h> -#include <vnet/fib/fib_entry.h> -#include <vnet/fib/fib_table.h> -#include <vnet/fib/fib_entry_track.h> -#include <vnet/mfib/mfib_table.h> -#include <vnet/adj/adj_mcast.h> -#include <vnet/adj/rewrite.h> -#include <vnet/dpo/drop_dpo.h> -#include <vnet/interface.h> -#include <vnet/flow/flow.h> -#include <vnet/udp/udp_local.h> -#include <vlib/vlib.h> - -/** - * @file - * @brief VXLAN. - * - * VXLAN provides the features needed to allow L2 bridge domains (BDs) - * to span multiple servers. This is done by building an L2 overlay on - * top of an L3 network underlay using VXLAN tunnels. - * - * This makes it possible for servers to be co-located in the same data - * center or be separated geographically as long as they are reachable - * through the underlay L3 network. - * - * You can refer to this kind of L2 overlay bridge domain as a VXLAN - * (Virtual eXtensible VLAN) segment. - */ - - -vxlan_main_t vxlan_main; - -static u32 -vxlan_eth_flag_change (vnet_main_t *vnm, vnet_hw_interface_t *hi, u32 flags) -{ - /* nothing for now */ - return 0; -} - -static clib_error_t * -vxlan_eth_set_max_frame_size (vnet_main_t *vnm, vnet_hw_interface_t *hw, - u32 frame_size) -{ - /* nothing for now */ - return 0; -} - -static u8 * -format_decap_next (u8 * s, va_list * args) -{ - u32 next_index = va_arg (*args, u32); - - if (next_index == VXLAN_INPUT_NEXT_DROP) - return format (s, "drop"); - else - return format (s, "index %d", next_index); - return s; -} - -u8 * -format_vxlan_tunnel (u8 * s, va_list * args) -{ - vxlan_tunnel_t *t = va_arg (*args, vxlan_tunnel_t *); - - s = format (s, - "[%d] instance %d src %U dst %U src_port %d dst_port %d vni %d " - "fib-idx %d sw-if-idx %d ", - t->dev_instance, t->user_instance, format_ip46_address, &t->src, - IP46_TYPE_ANY, format_ip46_address, &t->dst, IP46_TYPE_ANY, - t->src_port, t->dst_port, t->vni, t->encap_fib_index, - t->sw_if_index); - - s = format (s, "encap-dpo-idx %d ", t->next_dpo.dpoi_index); - - if (PREDICT_FALSE (t->decap_next_index != VXLAN_INPUT_NEXT_L2_INPUT)) - s = format (s, "decap-next-%U ", format_decap_next, t->decap_next_index); - - if (PREDICT_FALSE (ip46_address_is_multicast (&t->dst))) - s = format (s, "mcast-sw-if-idx %d ", t->mcast_sw_if_index); - - if (t->flow_index != ~0) - s = format (s, "flow-index %d [%U]", t->flow_index, - format_flow_enabled_hw, t->flow_index); - - return s; -} - -static u8 * -format_vxlan_name (u8 * s, va_list * args) -{ - u32 dev_instance = va_arg (*args, u32); - vxlan_main_t *vxm = &vxlan_main; - vxlan_tunnel_t *t; - - if (dev_instance == ~0) - return format (s, "<cached-unused>"); - - if (dev_instance >= vec_len (vxm->tunnels)) - return format (s, "<improperly-referenced>"); - - t = pool_elt_at_index (vxm->tunnels, dev_instance); - - return format (s, "vxlan_tunnel%d", t->user_instance); -} - -static clib_error_t * -vxlan_interface_admin_up_down (vnet_main_t * vnm, u32 hw_if_index, u32 flags) -{ - u32 hw_flags = (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) ? - VNET_HW_INTERFACE_FLAG_LINK_UP : 0; - vnet_hw_interface_set_flags (vnm, hw_if_index, hw_flags); - - return /* no error */ 0; -} - -/* *INDENT-OFF* */ -VNET_DEVICE_CLASS (vxlan_device_class, static) = { - .name = "VXLAN", - .format_device_name = format_vxlan_name, - .format_tx_trace = format_vxlan_encap_trace, - .admin_up_down_function = vxlan_interface_admin_up_down, -}; -/* *INDENT-ON* */ - -static u8 * -format_vxlan_header_with_length (u8 * s, va_list * args) -{ - u32 dev_instance = va_arg (*args, u32); - s = format (s, "unimplemented dev %u", dev_instance); - return s; -} - -/* *INDENT-OFF* */ -VNET_HW_INTERFACE_CLASS (vxlan_hw_class) = { - .name = "VXLAN", - .format_header = format_vxlan_header_with_length, - .build_rewrite = default_build_rewrite, -}; -/* *INDENT-ON* */ - -static void -vxlan_tunnel_restack_dpo (vxlan_tunnel_t * t) -{ - u8 is_ip4 = ip46_address_is_ip4 (&t->dst); - dpo_id_t dpo = DPO_INVALID; - fib_forward_chain_type_t forw_type = is_ip4 ? - FIB_FORW_CHAIN_TYPE_UNICAST_IP4 : FIB_FORW_CHAIN_TYPE_UNICAST_IP6; - - fib_entry_contribute_forwarding (t->fib_entry_index, forw_type, &dpo); - - /* vxlan uses the payload hash as the udp source port - * hence the packet's hash is unknown - * skip single bucket load balance dpo's */ - while (DPO_LOAD_BALANCE == dpo.dpoi_type) - { - const load_balance_t *lb; - const dpo_id_t *choice; - - lb = load_balance_get (dpo.dpoi_index); - if (lb->lb_n_buckets > 1) - break; - - choice = load_balance_get_bucket_i (lb, 0); - - if (DPO_RECEIVE == choice->dpoi_type) - dpo_copy (&dpo, drop_dpo_get (choice->dpoi_proto)); - else - dpo_copy (&dpo, choice); - } - - u32 encap_index = is_ip4 ? - vxlan4_encap_node.index : vxlan6_encap_node.index; - dpo_stack_from_node (encap_index, &t->next_dpo, &dpo); - dpo_reset (&dpo); -} - -static vxlan_tunnel_t * -vxlan_tunnel_from_fib_node (fib_node_t * node) -{ - ASSERT (FIB_NODE_TYPE_VXLAN_TUNNEL == node->fn_type); - return ((vxlan_tunnel_t *) (((char *) node) - - STRUCT_OFFSET_OF (vxlan_tunnel_t, node))); -} - -/** - * Function definition to backwalk a FIB node - - * Here we will restack the new dpo of VXLAN DIP to encap node. - */ -static fib_node_back_walk_rc_t -vxlan_tunnel_back_walk (fib_node_t * node, fib_node_back_walk_ctx_t * ctx) -{ - vxlan_tunnel_restack_dpo (vxlan_tunnel_from_fib_node (node)); - return (FIB_NODE_BACK_WALK_CONTINUE); -} - -/** - * Function definition to get a FIB node from its index - */ -static fib_node_t * -vxlan_tunnel_fib_node_get (fib_node_index_t index) -{ - vxlan_tunnel_t *t; - vxlan_main_t *vxm = &vxlan_main; - - t = pool_elt_at_index (vxm->tunnels, index); - - return (&t->node); -} - -/** - * Function definition to inform the FIB node that its last lock has gone. - */ -static void -vxlan_tunnel_last_lock_gone (fib_node_t * node) -{ - /* - * The VXLAN tunnel is a root of the graph. As such - * it never has children and thus is never locked. - */ - ASSERT (0); -} - -/* - * Virtual function table registered by VXLAN tunnels - * for participation in the FIB object graph. - */ -const static fib_node_vft_t vxlan_vft = { - .fnv_get = vxlan_tunnel_fib_node_get, - .fnv_last_lock = vxlan_tunnel_last_lock_gone, - .fnv_back_walk = vxlan_tunnel_back_walk, -}; - -#define foreach_copy_field \ - _ (vni) \ - _ (mcast_sw_if_index) \ - _ (encap_fib_index) \ - _ (decap_next_index) \ - _ (src) \ - _ (dst) \ - _ (src_port) \ - _ (dst_port) - -static void -vxlan_rewrite (vxlan_tunnel_t * t, bool is_ip6) -{ - union - { - ip4_vxlan_header_t h4; - ip6_vxlan_header_t h6; - } h; - int len = is_ip6 ? sizeof h.h6 : sizeof h.h4; - - udp_header_t *udp; - vxlan_header_t *vxlan; - /* Fixed portion of the (outer) ip header */ - - clib_memset (&h, 0, sizeof (h)); - if (!is_ip6) - { - ip4_header_t *ip = &h.h4.ip4; - udp = &h.h4.udp, vxlan = &h.h4.vxlan; - ip->ip_version_and_header_length = 0x45; - ip->ttl = 254; - ip->protocol = IP_PROTOCOL_UDP; - - ip->src_address = t->src.ip4; - ip->dst_address = t->dst.ip4; - - /* we fix up the ip4 header length and checksum after-the-fact */ - ip->checksum = ip4_header_checksum (ip); - } - else - { - ip6_header_t *ip = &h.h6.ip6; - udp = &h.h6.udp, vxlan = &h.h6.vxlan; - ip->ip_version_traffic_class_and_flow_label = - clib_host_to_net_u32 (6 << 28); - ip->hop_limit = 255; - ip->protocol = IP_PROTOCOL_UDP; - - ip->src_address = t->src.ip6; - ip->dst_address = t->dst.ip6; - } - - /* UDP header, randomize src port on something, maybe? */ - udp->src_port = clib_host_to_net_u16 (t->src_port); - udp->dst_port = clib_host_to_net_u16 (t->dst_port); - - /* VXLAN header */ - vnet_set_vni_and_flags (vxlan, t->vni); - vnet_rewrite_set_data (*t, &h, len); -} - -static bool -vxlan_decap_next_is_valid (vxlan_main_t * vxm, u32 is_ip6, - u32 decap_next_index) -{ - vlib_main_t *vm = vxm->vlib_main; - u32 input_idx = (!is_ip6) ? - vxlan4_input_node.index : vxlan6_input_node.index; - vlib_node_runtime_t *r = vlib_node_get_runtime (vm, input_idx); - - return decap_next_index < r->n_next_nodes; -} - -/* *INDENT-OFF* */ -typedef CLIB_PACKED(union -{ - struct - { - fib_node_index_t mfib_entry_index; - adj_index_t mcast_adj_index; - }; - u64 as_u64; -}) mcast_shared_t; -/* *INDENT-ON* */ - -static inline mcast_shared_t -mcast_shared_get (ip46_address_t * ip) -{ - ASSERT (ip46_address_is_multicast (ip)); - uword *p = hash_get_mem (vxlan_main.mcast_shared, ip); - ALWAYS_ASSERT (p); - mcast_shared_t ret = {.as_u64 = *p }; - return ret; -} - -static inline void -mcast_shared_add (ip46_address_t * dst, fib_node_index_t mfei, adj_index_t ai) -{ - mcast_shared_t new_ep = { - .mcast_adj_index = ai, - .mfib_entry_index = mfei, - }; - - hash_set_mem_alloc (&vxlan_main.mcast_shared, dst, new_ep.as_u64); -} - -static inline void -mcast_shared_remove (ip46_address_t * dst) -{ - mcast_shared_t ep = mcast_shared_get (dst); - - adj_unlock (ep.mcast_adj_index); - mfib_table_entry_delete_index (ep.mfib_entry_index, MFIB_SOURCE_VXLAN); - - hash_unset_mem_free (&vxlan_main.mcast_shared, dst); -} - -int vnet_vxlan_add_del_tunnel - (vnet_vxlan_add_del_tunnel_args_t * a, u32 * sw_if_indexp) -{ - vxlan_main_t *vxm = &vxlan_main; - vnet_main_t *vnm = vxm->vnet_main; - vxlan_decap_info_t *p; - u32 sw_if_index = ~0; - vxlan4_tunnel_key_t key4; - vxlan6_tunnel_key_t key6; - u32 is_ip6 = a->is_ip6; - vlib_main_t *vm = vlib_get_main (); - u8 hw_addr[6]; - - /* Set udp-ports */ - if (a->src_port == 0) - a->src_port = is_ip6 ? UDP_DST_PORT_vxlan6 : UDP_DST_PORT_vxlan; - - if (a->dst_port == 0) - a->dst_port = is_ip6 ? UDP_DST_PORT_vxlan6 : UDP_DST_PORT_vxlan; - - int not_found; - if (!is_ip6) - { - /* ip4 mcast is indexed by mcast addr only */ - key4.key[0] = ip46_address_is_multicast (&a->dst) ? - a->dst.ip4.as_u32 : - a->dst.ip4.as_u32 | (((u64) a->src.ip4.as_u32) << 32); - key4.key[1] = ((u64) clib_host_to_net_u16 (a->src_port) << 48) | - (((u64) a->encap_fib_index) << 32) | - clib_host_to_net_u32 (a->vni << 8); - not_found = - clib_bihash_search_inline_16_8 (&vxm->vxlan4_tunnel_by_key, &key4); - p = (void *) &key4.value; - } - else - { - key6.key[0] = a->dst.ip6.as_u64[0]; - key6.key[1] = a->dst.ip6.as_u64[1]; - key6.key[2] = (((u64) clib_host_to_net_u16 (a->src_port) << 48) | - ((u64) a->encap_fib_index) << 32) | - clib_host_to_net_u32 (a->vni << 8); - not_found = - clib_bihash_search_inline_24_8 (&vxm->vxlan6_tunnel_by_key, &key6); - p = (void *) &key6.value; - } - - if (not_found) - p = 0; - - if (a->is_add) - { - l2input_main_t *l2im = &l2input_main; - u32 dev_instance; /* real dev instance tunnel index */ - u32 user_instance; /* request and actual instance number */ - - /* adding a tunnel: tunnel must not already exist */ - if (p) - return VNET_API_ERROR_TUNNEL_EXIST; - - /*if not set explicitly, default to l2 */ - if (a->decap_next_index == ~0) - a->decap_next_index = VXLAN_INPUT_NEXT_L2_INPUT; - if (!vxlan_decap_next_is_valid (vxm, is_ip6, a->decap_next_index)) - return VNET_API_ERROR_INVALID_DECAP_NEXT; - - vxlan_tunnel_t *t; - pool_get_aligned (vxm->tunnels, t, CLIB_CACHE_LINE_BYTES); - clib_memset (t, 0, sizeof (*t)); - dev_instance = t - vxm->tunnels; - - /* copy from arg structure */ -#define _(x) t->x = a->x; - foreach_copy_field; -#undef _ - - vxlan_rewrite (t, is_ip6); - /* - * Reconcile the real dev_instance and a possible requested instance. - */ - user_instance = a->instance; - if (user_instance == ~0) - user_instance = dev_instance; - if (hash_get (vxm->instance_used, user_instance)) - { - pool_put (vxm->tunnels, t); - return VNET_API_ERROR_INSTANCE_IN_USE; - } - - hash_set (vxm->instance_used, user_instance, 1); - - t->dev_instance = dev_instance; /* actual */ - t->user_instance = user_instance; /* name */ - t->flow_index = ~0; - - if (a->is_l3) - t->hw_if_index = - vnet_register_interface (vnm, vxlan_device_class.index, dev_instance, - vxlan_hw_class.index, dev_instance); - else - { - vnet_eth_interface_registration_t eir = {}; - f64 now = vlib_time_now (vm); - u32 rnd; - rnd = (u32) (now * 1e6); - rnd = random_u32 (&rnd); - memcpy (hw_addr + 2, &rnd, sizeof (rnd)); - hw_addr[0] = 2; - hw_addr[1] = 0xfe; - - eir.dev_class_index = vxlan_device_class.index; - eir.dev_instance = dev_instance; - eir.address = hw_addr; - eir.cb.flag_change = vxlan_eth_flag_change; - eir.cb.set_max_frame_size = vxlan_eth_set_max_frame_size; - t->hw_if_index = vnet_eth_register_interface (vnm, &eir); - } - - vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, t->hw_if_index); - - /* Set vxlan tunnel output node */ - u32 encap_index = !is_ip6 ? - vxlan4_encap_node.index : vxlan6_encap_node.index; - vnet_set_interface_output_node (vnm, t->hw_if_index, encap_index); - - t->sw_if_index = sw_if_index = hi->sw_if_index; - - /* copy the key */ - int add_failed; - if (is_ip6) - { - key6.value = (u64) dev_instance; - add_failed = clib_bihash_add_del_24_8 (&vxm->vxlan6_tunnel_by_key, - &key6, 1 /*add */ ); - } - else - { - vxlan_decap_info_t di = {.sw_if_index = t->sw_if_index, }; - if (ip46_address_is_multicast (&t->dst)) - di.local_ip = t->src.ip4; - else - di.next_index = t->decap_next_index; - key4.value = di.as_u64; - add_failed = clib_bihash_add_del_16_8 (&vxm->vxlan4_tunnel_by_key, - &key4, 1 /*add */ ); - } - - if (add_failed) - { - if (a->is_l3) - vnet_delete_hw_interface (vnm, t->hw_if_index); - else - ethernet_delete_interface (vnm, t->hw_if_index); - hash_unset (vxm->instance_used, t->user_instance); - pool_put (vxm->tunnels, t); - return VNET_API_ERROR_INVALID_REGISTRATION; - } - - vec_validate_init_empty (vxm->tunnel_index_by_sw_if_index, sw_if_index, - ~0); - vxm->tunnel_index_by_sw_if_index[sw_if_index] = dev_instance; - - /* setup l2 input config with l2 feature and bd 0 to drop packet */ - vec_validate (l2im->configs, sw_if_index); - l2im->configs[sw_if_index].feature_bitmap = L2INPUT_FEAT_DROP; - l2im->configs[sw_if_index].bd_index = 0; - - vnet_sw_interface_t *si = vnet_get_sw_interface (vnm, sw_if_index); - si->flags &= ~VNET_SW_INTERFACE_FLAG_HIDDEN; - vnet_sw_interface_set_flags (vnm, sw_if_index, - VNET_SW_INTERFACE_FLAG_ADMIN_UP); - - fib_node_init (&t->node, FIB_NODE_TYPE_VXLAN_TUNNEL); - fib_prefix_t tun_dst_pfx; - vnet_flood_class_t flood_class = VNET_FLOOD_CLASS_TUNNEL_NORMAL; - - fib_protocol_t fp = fib_ip_proto (is_ip6); - fib_prefix_from_ip46_addr (fp, &t->dst, &tun_dst_pfx); - if (!ip46_address_is_multicast (&t->dst)) - { - /* Unicast tunnel - - * source the FIB entry for the tunnel's destination - * and become a child thereof. The tunnel will then get poked - * when the forwarding for the entry updates, and the tunnel can - * re-stack accordingly - */ - vtep_addr_ref (&vxm->vtep_table, t->encap_fib_index, &t->src); - t->fib_entry_index = fib_entry_track (t->encap_fib_index, - &tun_dst_pfx, - FIB_NODE_TYPE_VXLAN_TUNNEL, - dev_instance, - &t->sibling_index); - vxlan_tunnel_restack_dpo (t); - } - else - { - /* Multicast tunnel - - * as the same mcast group can be used for multiple mcast tunnels - * with different VNIs, create the output fib adjacency only if - * it does not already exist - */ - if (vtep_addr_ref (&vxm->vtep_table, - t->encap_fib_index, &t->dst) == 1) - { - fib_node_index_t mfei; - adj_index_t ai; - fib_route_path_t path = { - .frp_proto = fib_proto_to_dpo (fp), - .frp_addr = zero_addr, - .frp_sw_if_index = 0xffffffff, - .frp_fib_index = ~0, - .frp_weight = 1, - .frp_flags = FIB_ROUTE_PATH_LOCAL, - .frp_mitf_flags = MFIB_ITF_FLAG_FORWARD, - }; - const mfib_prefix_t mpfx = { - .fp_proto = fp, - .fp_len = (is_ip6 ? 128 : 32), - .fp_grp_addr = tun_dst_pfx.fp_addr, - }; - - /* - * Setup the (*,G) to receive traffic on the mcast group - * - the forwarding interface is for-us - * - the accepting interface is that from the API - */ - mfib_table_entry_path_update (t->encap_fib_index, &mpfx, - MFIB_SOURCE_VXLAN, - MFIB_ENTRY_FLAG_NONE, &path); - - path.frp_sw_if_index = a->mcast_sw_if_index; - path.frp_flags = FIB_ROUTE_PATH_FLAG_NONE; - path.frp_mitf_flags = MFIB_ITF_FLAG_ACCEPT; - mfei = mfib_table_entry_path_update ( - t->encap_fib_index, &mpfx, MFIB_SOURCE_VXLAN, - MFIB_ENTRY_FLAG_NONE, &path); - - /* - * Create the mcast adjacency to send traffic to the group - */ - ai = adj_mcast_add_or_lock (fp, - fib_proto_to_link (fp), - a->mcast_sw_if_index); - - /* - * create a new end-point - */ - mcast_shared_add (&t->dst, mfei, ai); - } - - dpo_id_t dpo = DPO_INVALID; - mcast_shared_t ep = mcast_shared_get (&t->dst); - - /* Stack shared mcast dst mac addr rewrite on encap */ - dpo_set (&dpo, DPO_ADJACENCY_MCAST, - fib_proto_to_dpo (fp), ep.mcast_adj_index); - - dpo_stack_from_node (encap_index, &t->next_dpo, &dpo); - dpo_reset (&dpo); - flood_class = VNET_FLOOD_CLASS_TUNNEL_MASTER; - } - - vnet_get_sw_interface (vnet_get_main (), sw_if_index)->flood_class = - flood_class; - } - else - { - /* deleting a tunnel: tunnel must exist */ - if (!p) - return VNET_API_ERROR_NO_SUCH_ENTRY; - - u32 instance = is_ip6 ? key6.value : - vxm->tunnel_index_by_sw_if_index[p->sw_if_index]; - vxlan_tunnel_t *t = pool_elt_at_index (vxm->tunnels, instance); - - sw_if_index = t->sw_if_index; - vnet_sw_interface_set_flags (vnm, sw_if_index, 0 /* down */ ); - - vxm->tunnel_index_by_sw_if_index[sw_if_index] = ~0; - - if (!is_ip6) - clib_bihash_add_del_16_8 (&vxm->vxlan4_tunnel_by_key, &key4, - 0 /*del */ ); - else - clib_bihash_add_del_24_8 (&vxm->vxlan6_tunnel_by_key, &key6, - 0 /*del */ ); - - if (!ip46_address_is_multicast (&t->dst)) - { - if (t->flow_index != ~0) - vnet_flow_del (vnm, t->flow_index); - - vtep_addr_unref (&vxm->vtep_table, t->encap_fib_index, &t->src); - fib_entry_untrack (t->fib_entry_index, t->sibling_index); - } - else if (vtep_addr_unref (&vxm->vtep_table, - t->encap_fib_index, &t->dst) == 0) - { - mcast_shared_remove (&t->dst); - } - - vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, t->hw_if_index); - if (hw->dev_class_index == vxlan_device_class.index) - vnet_delete_hw_interface (vnm, t->hw_if_index); - else - ethernet_delete_interface (vnm, t->hw_if_index); - hash_unset (vxm->instance_used, t->user_instance); - - fib_node_deinit (&t->node); - pool_put (vxm->tunnels, t); - } - - if (sw_if_indexp) - *sw_if_indexp = sw_if_index; - - if (a->is_add) - { - /* register udp ports */ - if (!is_ip6 && !udp_is_valid_dst_port (a->src_port, 1)) - udp_register_dst_port (vxm->vlib_main, a->src_port, - vxlan4_input_node.index, 1); - if (is_ip6 && !udp_is_valid_dst_port (a->src_port, 0)) - udp_register_dst_port (vxm->vlib_main, a->src_port, - vxlan6_input_node.index, 0); - } - - return 0; -} - -static uword -get_decap_next_for_node (u32 node_index, u32 ipv4_set) -{ - vxlan_main_t *vxm = &vxlan_main; - vlib_main_t *vm = vxm->vlib_main; - uword input_node = (ipv4_set) ? vxlan4_input_node.index : - vxlan6_input_node.index; - - return vlib_node_add_next (vm, input_node, node_index); -} - -static uword -unformat_decap_next (unformat_input_t * input, va_list * args) -{ - u32 *result = va_arg (*args, u32 *); - u32 ipv4_set = va_arg (*args, int); - vxlan_main_t *vxm = &vxlan_main; - vlib_main_t *vm = vxm->vlib_main; - u32 node_index; - u32 tmp; - - if (unformat (input, "l2")) - *result = VXLAN_INPUT_NEXT_L2_INPUT; - else if (unformat (input, "node %U", unformat_vlib_node, vm, &node_index)) - *result = get_decap_next_for_node (node_index, ipv4_set); - else if (unformat (input, "%d", &tmp)) - *result = tmp; - else - return 0; - return 1; -} - -static clib_error_t * -vxlan_add_del_tunnel_command_fn (vlib_main_t * vm, - unformat_input_t * input, - vlib_cli_command_t * cmd) -{ - unformat_input_t _line_input, *line_input = &_line_input; - ip46_address_t src = ip46_address_initializer, dst = - ip46_address_initializer; - u8 is_add = 1; - u8 src_set = 0; - u8 dst_set = 0; - u8 grp_set = 0; - u8 ipv4_set = 0; - u8 ipv6_set = 0; - u8 is_l3 = 0; - u32 instance = ~0; - u32 encap_fib_index = 0; - u32 mcast_sw_if_index = ~0; - u32 decap_next_index = VXLAN_INPUT_NEXT_L2_INPUT; - u32 vni = 0; - u32 src_port = 0; - u32 dst_port = 0; - u32 table_id; - clib_error_t *parse_error = NULL; - - /* Get a line of input. */ - if (!unformat_user (input, unformat_line_input, line_input)) - return 0; - - while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT) - { - if (unformat (line_input, "del")) - { - is_add = 0; - } - else if (unformat (line_input, "instance %d", &instance)) - ; - else if (unformat (line_input, "src %U", - unformat_ip46_address, &src, IP46_TYPE_ANY)) - { - src_set = 1; - ip46_address_is_ip4 (&src) ? (ipv4_set = 1) : (ipv6_set = 1); - } - else if (unformat (line_input, "dst %U", - unformat_ip46_address, &dst, IP46_TYPE_ANY)) - { - dst_set = 1; - ip46_address_is_ip4 (&dst) ? (ipv4_set = 1) : (ipv6_set = 1); - } - else if (unformat (line_input, "group %U %U", - unformat_ip46_address, &dst, IP46_TYPE_ANY, - unformat_vnet_sw_interface, - vnet_get_main (), &mcast_sw_if_index)) - { - grp_set = dst_set = 1; - ip46_address_is_ip4 (&dst) ? (ipv4_set = 1) : (ipv6_set = 1); - } - else if (unformat (line_input, "encap-vrf-id %d", &table_id)) - { - encap_fib_index = - fib_table_find (fib_ip_proto (ipv6_set), table_id); - } - else if (unformat (line_input, "l3")) - is_l3 = 1; - else if (unformat (line_input, "decap-next %U", unformat_decap_next, - &decap_next_index, ipv4_set)) - ; - else if (unformat (line_input, "vni %d", &vni)) - ; - else if (unformat (line_input, "src_port %d", &src_port)) - ; - else if (unformat (line_input, "dst_port %d", &dst_port)) - ; - else - { - parse_error = clib_error_return (0, "parse error: '%U'", - format_unformat_error, line_input); - break; - } - } - - unformat_free (line_input); - - if (parse_error) - return parse_error; - - if (is_l3 && decap_next_index == VXLAN_INPUT_NEXT_L2_INPUT) - { - vlib_node_t *node = vlib_get_node_by_name ( - vm, (u8 *) (ipv4_set ? "ip4-input" : "ip6-input")); - decap_next_index = get_decap_next_for_node (node->index, ipv4_set); - } - - if (encap_fib_index == ~0) - return clib_error_return (0, "nonexistent encap-vrf-id %d", table_id); - - if (src_set == 0) - return clib_error_return (0, "tunnel src address not specified"); - - if (dst_set == 0) - return clib_error_return (0, "tunnel dst address not specified"); - - if (grp_set && !ip46_address_is_multicast (&dst)) - return clib_error_return (0, "tunnel group address not multicast"); - - if (grp_set == 0 && ip46_address_is_multicast (&dst)) - return clib_error_return (0, "dst address must be unicast"); - - if (grp_set && mcast_sw_if_index == ~0) - return clib_error_return (0, "tunnel nonexistent multicast device"); - - if (ipv4_set && ipv6_set) - return clib_error_return (0, "both IPv4 and IPv6 addresses specified"); - - if (ip46_address_cmp (&src, &dst) == 0) - return clib_error_return (0, "src and dst addresses are identical"); - - if (decap_next_index == ~0) - return clib_error_return (0, "next node not found"); - - if (vni == 0) - return clib_error_return (0, "vni not specified"); - - if (vni >> 24) - return clib_error_return (0, "vni %d out of range", vni); - - vnet_vxlan_add_del_tunnel_args_t a = { .is_add = is_add, - .is_ip6 = ipv6_set, - .is_l3 = is_l3, - .instance = instance, -#define _(x) .x = x, - foreach_copy_field -#undef _ - }; - - u32 tunnel_sw_if_index; - int rv = vnet_vxlan_add_del_tunnel (&a, &tunnel_sw_if_index); - - switch (rv) - { - case 0: - if (is_add) - vlib_cli_output (vm, "%U\n", format_vnet_sw_if_index_name, - vnet_get_main (), tunnel_sw_if_index); - break; - - case VNET_API_ERROR_TUNNEL_EXIST: - return clib_error_return (0, "tunnel already exists..."); - - case VNET_API_ERROR_NO_SUCH_ENTRY: - return clib_error_return (0, "tunnel does not exist..."); - - case VNET_API_ERROR_INSTANCE_IN_USE: - return clib_error_return (0, "Instance is in use"); - - default: - return clib_error_return - (0, "vnet_vxlan_add_del_tunnel returned %d", rv); - } - - return 0; -} - -/*? - * Add or delete a VXLAN Tunnel. - * - * VXLAN provides the features needed to allow L2 bridge domains (BDs) - * to span multiple servers. This is done by building an L2 overlay on - * top of an L3 network underlay using VXLAN tunnels. - * - * This makes it possible for servers to be co-located in the same data - * center or be separated geographically as long as they are reachable - * through the underlay L3 network. - * - * You can refer to this kind of L2 overlay bridge domain as a VXLAN - * (Virtual eXtensible VLAN) segment. - * - * @cliexpar - * Example of how to create a VXLAN Tunnel: - * @cliexcmd{create vxlan tunnel src 10.0.3.1 dst 10.0.3.3 vni 13 encap-vrf-id - 7} - * Example of how to create a VXLAN Tunnel with a known name, vxlan_tunnel42: - * @cliexcmd{create vxlan tunnel src 10.0.3.1 dst 10.0.3.3 instance 42} - * Example of how to create a multicast VXLAN Tunnel with a known name, - vxlan_tunnel23: - * @cliexcmd{create vxlan tunnel src 10.0.3.1 group 239.1.1.1 - GigabitEthernet0/8/0 instance 23} - * Example of how to create a VXLAN Tunnel with custom udp-ports: - * @cliexcmd{create vxlan tunnel src 10.0.3.1 dst 10.0.3.3 vni 13 src_port - 59000 dst_port 59001} - * Example of how to delete a VXLAN Tunnel: - * @cliexcmd{create vxlan tunnel src 10.0.3.1 dst 10.0.3.3 vni 13 del} - ?*/ -/* *INDENT-OFF* */ -VLIB_CLI_COMMAND (create_vxlan_tunnel_command, static) = { - .path = "create vxlan tunnel", - .short_help = - "create vxlan tunnel src <local-vtep-addr>" - " {dst <remote-vtep-addr>|group <mcast-vtep-addr> <intf-name>} vni <nn>" - " [instance <id>]" - " [encap-vrf-id <nn>] [decap-next [l2|node <name>]] [del] [l3]" - " [src_port <local-vtep-udp-port>] [dst_port <remote-vtep-udp-port>]", - .function = vxlan_add_del_tunnel_command_fn, -}; -/* *INDENT-ON* */ - -static clib_error_t * -show_vxlan_tunnel_command_fn (vlib_main_t * vm, - unformat_input_t * input, - vlib_cli_command_t * cmd) -{ - vxlan_main_t *vxm = &vxlan_main; - vxlan_tunnel_t *t; - int raw = 0; - - while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT) - { - if (unformat (input, "raw")) - raw = 1; - else - return clib_error_return (0, "parse error: '%U'", - format_unformat_error, input); - } - - if (pool_elts (vxm->tunnels) == 0) - vlib_cli_output (vm, "No vxlan tunnels configured..."); - -/* *INDENT-OFF* */ - pool_foreach (t, vxm->tunnels) - { - vlib_cli_output (vm, "%U", format_vxlan_tunnel, t); - } -/* *INDENT-ON* */ - - if (raw) - { - vlib_cli_output (vm, "Raw IPv4 Hash Table:\n%U\n", - format_bihash_16_8, &vxm->vxlan4_tunnel_by_key, - 1 /* verbose */ ); - vlib_cli_output (vm, "Raw IPv6 Hash Table:\n%U\n", - format_bihash_24_8, &vxm->vxlan6_tunnel_by_key, - 1 /* verbose */ ); - } - - return 0; -} - -/*? - * Display all the VXLAN Tunnel entries. - * - * @cliexpar - * Example of how to display the VXLAN Tunnel entries: - * @cliexstart{show vxlan tunnel} - * [0] src 10.0.3.1 dst 10.0.3.3 src_port 4789 dst_port 4789 vni 13 - encap_fib_index 0 sw_if_index 5 decap_next l2 - * @cliexend - ?*/ -/* *INDENT-OFF* */ -VLIB_CLI_COMMAND (show_vxlan_tunnel_command, static) = { - .path = "show vxlan tunnel", - .short_help = "show vxlan tunnel [raw]", - .function = show_vxlan_tunnel_command_fn, -}; -/* *INDENT-ON* */ - - -void -vnet_int_vxlan_bypass_mode (u32 sw_if_index, u8 is_ip6, u8 is_enable) -{ - vxlan_main_t *vxm = &vxlan_main; - - if (pool_is_free_index (vxm->vnet_main->interface_main.sw_interfaces, - sw_if_index)) - return; - - is_enable = ! !is_enable; - - if (is_ip6) - { - if (clib_bitmap_get (vxm->bm_ip6_bypass_enabled_by_sw_if, sw_if_index) - != is_enable) - { - vnet_feature_enable_disable ("ip6-unicast", "ip6-vxlan-bypass", - sw_if_index, is_enable, 0, 0); - vxm->bm_ip6_bypass_enabled_by_sw_if = - clib_bitmap_set (vxm->bm_ip6_bypass_enabled_by_sw_if, - sw_if_index, is_enable); - } - } - else - { - if (clib_bitmap_get (vxm->bm_ip4_bypass_enabled_by_sw_if, sw_if_index) - != is_enable) - { - vnet_feature_enable_disable ("ip4-unicast", "ip4-vxlan-bypass", - sw_if_index, is_enable, 0, 0); - vxm->bm_ip4_bypass_enabled_by_sw_if = - clib_bitmap_set (vxm->bm_ip4_bypass_enabled_by_sw_if, - sw_if_index, is_enable); - } - } -} - - -static clib_error_t * -set_ip_vxlan_bypass (u32 is_ip6, - unformat_input_t * input, vlib_cli_command_t * cmd) -{ - unformat_input_t _line_input, *line_input = &_line_input; - vnet_main_t *vnm = vnet_get_main (); - clib_error_t *error = 0; - u32 sw_if_index, is_enable; - - sw_if_index = ~0; - is_enable = 1; - - if (!unformat_user (input, unformat_line_input, line_input)) - return 0; - - while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT) - { - if (unformat_user - (line_input, unformat_vnet_sw_interface, vnm, &sw_if_index)) - ; - else if (unformat (line_input, "del")) - is_enable = 0; - else - { - error = unformat_parse_error (line_input); - goto done; - } - } - - if (~0 == sw_if_index) - { - error = clib_error_return (0, "unknown interface `%U'", - format_unformat_error, line_input); - goto done; - } - - vnet_int_vxlan_bypass_mode (sw_if_index, is_ip6, is_enable); - -done: - unformat_free (line_input); - - return error; -} - -static clib_error_t * -set_ip4_vxlan_bypass (vlib_main_t * vm, - unformat_input_t * input, vlib_cli_command_t * cmd) -{ - return set_ip_vxlan_bypass (0, input, cmd); -} - -/*? - * This command adds the 'ip4-vxlan-bypass' graph node for a given interface. - * By adding the IPv4 vxlan-bypass graph node to an interface, the node checks - * for and validate input vxlan packet and bypass ip4-lookup, ip4-local, - * ip4-udp-lookup nodes to speedup vxlan packet forwarding. This node will - * cause extra overhead to for non-vxlan packets which is kept at a minimum. - * - * @cliexpar - * @parblock - * Example of graph node before ip4-vxlan-bypass is enabled: - * @cliexstart{show vlib graph ip4-vxlan-bypass} - * Name Next Previous - * ip4-vxlan-bypass error-drop [0] - * vxlan4-input [1] - * ip4-lookup [2] - * @cliexend - * - * Example of how to enable ip4-vxlan-bypass on an interface: - * @cliexcmd{set interface ip vxlan-bypass GigabitEthernet2/0/0} - * - * Example of graph node after ip4-vxlan-bypass is enabled: - * @cliexstart{show vlib graph ip4-vxlan-bypass} - * Name Next Previous - * ip4-vxlan-bypass error-drop [0] ip4-input - * vxlan4-input [1] ip4-input-no-checksum - * ip4-lookup [2] - * @cliexend - * - * Example of how to display the feature enabled on an interface: - * @cliexstart{show ip interface features GigabitEthernet2/0/0} - * IP feature paths configured on GigabitEthernet2/0/0... - * ... - * ipv4 unicast: - * ip4-vxlan-bypass - * ip4-lookup - * ... - * @cliexend - * - * Example of how to disable ip4-vxlan-bypass on an interface: - * @cliexcmd{set interface ip vxlan-bypass GigabitEthernet2/0/0 del} - * @endparblock -?*/ -/* *INDENT-OFF* */ -VLIB_CLI_COMMAND (set_interface_ip_vxlan_bypass_command, static) = { - .path = "set interface ip vxlan-bypass", - .function = set_ip4_vxlan_bypass, - .short_help = "set interface ip vxlan-bypass <interface> [del]", -}; -/* *INDENT-ON* */ - -static clib_error_t * -set_ip6_vxlan_bypass (vlib_main_t * vm, - unformat_input_t * input, vlib_cli_command_t * cmd) -{ - return set_ip_vxlan_bypass (1, input, cmd); -} - -/*? - * This command adds the 'ip6-vxlan-bypass' graph node for a given interface. - * By adding the IPv6 vxlan-bypass graph node to an interface, the node checks - * for and validate input vxlan packet and bypass ip6-lookup, ip6-local, - * ip6-udp-lookup nodes to speedup vxlan packet forwarding. This node will - * cause extra overhead to for non-vxlan packets which is kept at a minimum. - * - * @cliexpar - * @parblock - * Example of graph node before ip6-vxlan-bypass is enabled: - * @cliexstart{show vlib graph ip6-vxlan-bypass} - * Name Next Previous - * ip6-vxlan-bypass error-drop [0] - * vxlan6-input [1] - * ip6-lookup [2] - * @cliexend - * - * Example of how to enable ip6-vxlan-bypass on an interface: - * @cliexcmd{set interface ip6 vxlan-bypass GigabitEthernet2/0/0} - * - * Example of graph node after ip6-vxlan-bypass is enabled: - * @cliexstart{show vlib graph ip6-vxlan-bypass} - * Name Next Previous - * ip6-vxlan-bypass error-drop [0] ip6-input - * vxlan6-input [1] ip4-input-no-checksum - * ip6-lookup [2] - * @cliexend - * - * Example of how to display the feature enabled on an interface: - * @cliexstart{show ip interface features GigabitEthernet2/0/0} - * IP feature paths configured on GigabitEthernet2/0/0... - * ... - * ipv6 unicast: - * ip6-vxlan-bypass - * ip6-lookup - * ... - * @cliexend - * - * Example of how to disable ip6-vxlan-bypass on an interface: - * @cliexcmd{set interface ip6 vxlan-bypass GigabitEthernet2/0/0 del} - * @endparblock -?*/ -/* *INDENT-OFF* */ -VLIB_CLI_COMMAND (set_interface_ip6_vxlan_bypass_command, static) = { - .path = "set interface ip6 vxlan-bypass", - .function = set_ip6_vxlan_bypass, - .short_help = "set interface ip6 vxlan-bypass <interface> [del]", -}; -/* *INDENT-ON* */ - -int -vnet_vxlan_add_del_rx_flow (u32 hw_if_index, u32 t_index, int is_add) -{ - vxlan_main_t *vxm = &vxlan_main; - vxlan_tunnel_t *t = pool_elt_at_index (vxm->tunnels, t_index); - vnet_main_t *vnm = vnet_get_main (); - if (is_add) - { - if (t->flow_index == ~0) - { - vxlan_main_t *vxm = &vxlan_main; - vnet_flow_t flow = { - .actions = - VNET_FLOW_ACTION_REDIRECT_TO_NODE | VNET_FLOW_ACTION_MARK | - VNET_FLOW_ACTION_BUFFER_ADVANCE, - .mark_flow_id = t->dev_instance + vxm->flow_id_start, - .redirect_node_index = vxlan4_flow_input_node.index, - .buffer_advance = sizeof (ethernet_header_t), - .type = VNET_FLOW_TYPE_IP4_VXLAN, - .ip4_vxlan = { - .protocol.prot = IP_PROTOCOL_UDP, - .src_addr.addr = t->dst.ip4, - .dst_addr.addr = t->src.ip4, - .src_addr.mask.as_u32 = ~0, - .dst_addr.mask.as_u32 = ~0, - .dst_port.port = t->src_port, - .dst_port.mask = 0xFF, - .vni = t->vni, - } - , - }; - vnet_flow_add (vnm, &flow, &t->flow_index); - } - return vnet_flow_enable (vnm, t->flow_index, hw_if_index); - } - /* flow index is removed when the tunnel is deleted */ - return vnet_flow_disable (vnm, t->flow_index, hw_if_index); -} - -u32 -vnet_vxlan_get_tunnel_index (u32 sw_if_index) -{ - vxlan_main_t *vxm = &vxlan_main; - - if (sw_if_index >= vec_len (vxm->tunnel_index_by_sw_if_index)) - return ~0; - return vxm->tunnel_index_by_sw_if_index[sw_if_index]; -} - -static clib_error_t * -vxlan_offload_command_fn (vlib_main_t * vm, - unformat_input_t * input, vlib_cli_command_t * cmd) -{ - unformat_input_t _line_input, *line_input = &_line_input; - - /* Get a line of input. */ - if (!unformat_user (input, unformat_line_input, line_input)) - return 0; - - vnet_main_t *vnm = vnet_get_main (); - u32 rx_sw_if_index = ~0; - u32 hw_if_index = ~0; - int is_add = 1; - - while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT) - { - if (unformat (line_input, "hw %U", unformat_vnet_hw_interface, vnm, - &hw_if_index)) - continue; - if (unformat (line_input, "rx %U", unformat_vnet_sw_interface, vnm, - &rx_sw_if_index)) - continue; - if (unformat (line_input, "del")) - { - is_add = 0; - continue; - } - return clib_error_return (0, "unknown input `%U'", - format_unformat_error, line_input); - } - - if (rx_sw_if_index == ~0) - return clib_error_return (0, "missing rx interface"); - if (hw_if_index == ~0) - return clib_error_return (0, "missing hw interface"); - - u32 t_index = vnet_vxlan_get_tunnel_index (rx_sw_if_index);; - if (t_index == ~0) - return clib_error_return (0, "%U is not a vxlan tunnel", - format_vnet_sw_if_index_name, vnm, - rx_sw_if_index); - - vxlan_main_t *vxm = &vxlan_main; - vxlan_tunnel_t *t = pool_elt_at_index (vxm->tunnels, t_index); - - if (!ip46_address_is_ip4 (&t->dst)) - return clib_error_return (0, "currently only IPV4 tunnels are supported"); - - vnet_hw_interface_t *hw_if = vnet_get_hw_interface (vnm, hw_if_index); - ip4_main_t *im = &ip4_main; - u32 rx_fib_index = - vec_elt (im->fib_index_by_sw_if_index, hw_if->sw_if_index); - - if (t->encap_fib_index != rx_fib_index) - return clib_error_return (0, "interface/tunnel fib mismatch"); - - if (vnet_vxlan_add_del_rx_flow (hw_if_index, t_index, is_add)) - return clib_error_return (0, "error %s flow", - is_add ? "enabling" : "disabling"); - - return 0; -} - -/* *INDENT-OFF* */ -VLIB_CLI_COMMAND (vxlan_offload_command, static) = { - .path = "set flow-offload vxlan", - .short_help = - "set flow-offload vxlan hw <interface-name> rx <tunnel-name> [del]", - .function = vxlan_offload_command_fn, -}; -/* *INDENT-ON* */ - -#define VXLAN_HASH_NUM_BUCKETS (2 * 1024) -#define VXLAN_HASH_MEMORY_SIZE (1 << 20) - -clib_error_t * -vxlan_init (vlib_main_t * vm) -{ - vxlan_main_t *vxm = &vxlan_main; - - vxm->vnet_main = vnet_get_main (); - vxm->vlib_main = vm; - - vnet_flow_get_range (vxm->vnet_main, "vxlan", 1024 * 1024, - &vxm->flow_id_start); - - vxm->bm_ip4_bypass_enabled_by_sw_if = 0; - vxm->bm_ip6_bypass_enabled_by_sw_if = 0; - - /* initialize the ip6 hash */ - clib_bihash_init_16_8 (&vxm->vxlan4_tunnel_by_key, "vxlan4", - VXLAN_HASH_NUM_BUCKETS, VXLAN_HASH_MEMORY_SIZE); - clib_bihash_init_24_8 (&vxm->vxlan6_tunnel_by_key, "vxlan6", - VXLAN_HASH_NUM_BUCKETS, VXLAN_HASH_MEMORY_SIZE); - vxm->vtep_table = vtep_table_create (); - vxm->mcast_shared = hash_create_mem (0, - sizeof (ip46_address_t), - sizeof (mcast_shared_t)); - - fib_node_register_type (FIB_NODE_TYPE_VXLAN_TUNNEL, &vxlan_vft); - - return 0; -} - -VLIB_INIT_FUNCTION (vxlan_init); - -/* - * fd.io coding-style-patch-verification: ON - * - * Local Variables: - * eval: (c-set-style "gnu") - * End: - */ diff --git a/src/vnet/vxlan/vxlan.h b/src/vnet/vxlan/vxlan.h deleted file mode 100644 index fa47605e42d..00000000000 --- a/src/vnet/vxlan/vxlan.h +++ /dev/null @@ -1,242 +0,0 @@ -/* - * Copyright (c) 2015 Cisco and/or its affiliates. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -#ifndef included_vnet_vxlan_h -#define included_vnet_vxlan_h - -#include <vppinfra/error.h> -#include <vppinfra/hash.h> -#include <vppinfra/bihash_16_8.h> -#include <vppinfra/bihash_24_8.h> -#include <vnet/vnet.h> -#include <vnet/ip/ip.h> -#include <vnet/ip/vtep.h> -#include <vnet/l2/l2_input.h> -#include <vnet/l2/l2_output.h> -#include <vnet/l2/l2_bd.h> -#include <vnet/ethernet/ethernet.h> -#include <vnet/vxlan/vxlan_packet.h> -#include <vnet/ip/ip4_packet.h> -#include <vnet/ip/ip6_packet.h> -#include <vnet/udp/udp_packet.h> -#include <vnet/dpo/dpo.h> -#include <vnet/adj/adj_types.h> - -/* *INDENT-OFF* */ -typedef CLIB_PACKED (struct { - ip4_header_t ip4; /* 20 bytes */ - udp_header_t udp; /* 8 bytes */ - vxlan_header_t vxlan; /* 8 bytes */ -}) ip4_vxlan_header_t; - -typedef CLIB_PACKED (struct { - ip6_header_t ip6; /* 40 bytes */ - udp_header_t udp; /* 8 bytes */ - vxlan_header_t vxlan; /* 8 bytes */ -}) ip6_vxlan_header_t; -/* *INDENT-ON* */ - -/* -* Key fields: remote ip, vni on incoming VXLAN packet -* all fields in NET byte order -*/ -typedef clib_bihash_kv_16_8_t vxlan4_tunnel_key_t; - -/* -* Key fields: remote ip, vni and fib index on incoming VXLAN packet -* ip, vni fields in NET byte order -* fib index field in host byte order -*/ -typedef clib_bihash_kv_24_8_t vxlan6_tunnel_key_t; - -typedef union -{ - struct - { - u32 sw_if_index; /* unicast - input interface / mcast - stats interface */ - union - { - struct /* unicast action */ - { - u16 next_index; - u8 error; - }; - ip4_address_t local_ip; /* used as dst ip for mcast pkts to assign them to unicast tunnel */ - }; - }; - u64 as_u64; -} vxlan_decap_info_t; - -typedef struct -{ - /* Required for pool_get_aligned */ - CLIB_CACHE_LINE_ALIGN_MARK (cacheline0); - - /* FIB DPO for IP forwarding of VXLAN encap packet */ - dpo_id_t next_dpo; - - /* vxlan VNI in HOST byte order */ - u32 vni; - - /* tunnel src and dst addresses */ - ip46_address_t src; - ip46_address_t dst; - - /* udp-ports */ - u16 src_port; - u16 dst_port; - - /* mcast packet output intfc index (used only if dst is mcast) */ - u32 mcast_sw_if_index; - - /* decap next index */ - u16 decap_next_index; - - /* The FIB index for src/dst addresses */ - u32 encap_fib_index; - - /* vnet intfc index */ - u32 sw_if_index; - u32 hw_if_index; - - /** - * Linkage into the FIB object graph - */ - fib_node_t node; - - /* - * The FIB entry for (depending on VXLAN tunnel is unicast or mcast) - * sending unicast VXLAN encap packets or receiving mcast VXLAN packets - */ - fib_node_index_t fib_entry_index; - adj_index_t mcast_adj_index; - - /** - * The tunnel is a child of the FIB entry for its destination. This is - * so it receives updates when the forwarding information for that entry - * changes. - * The tunnels sibling index on the FIB entry's dependency list. - */ - u32 sibling_index; - - u32 flow_index; /* infra flow index */ - u32 dev_instance; /* Real device instance in tunnel vector */ - u32 user_instance; /* Instance name being shown to user */ - - VNET_DECLARE_REWRITE; -} vxlan_tunnel_t; - -#define foreach_vxlan_input_next \ -_(DROP, "error-drop") \ -_(L2_INPUT, "l2-input") - -typedef enum -{ -#define _(s,n) VXLAN_INPUT_NEXT_##s, - foreach_vxlan_input_next -#undef _ - VXLAN_INPUT_N_NEXT, -} vxlan_input_next_t; - -typedef enum -{ -#define vxlan_error(n,s) VXLAN_ERROR_##n, -#include <vnet/vxlan/vxlan_error.def> -#undef vxlan_error - VXLAN_N_ERROR, -} vxlan_input_error_t; - -typedef struct -{ - /* vector of encap tunnel instances */ - vxlan_tunnel_t *tunnels; - - /* lookup tunnel by key */ - clib_bihash_16_8_t - vxlan4_tunnel_by_key; /* keyed on ipv4.dst + src_port + fib + vni */ - clib_bihash_24_8_t - vxlan6_tunnel_by_key; /* keyed on ipv6.dst + src_port + fib + vni */ - - /* local VTEP IPs ref count used by vxlan-bypass node to check if - received VXLAN packet DIP matches any local VTEP address */ - vtep_table_t vtep_table; - - /* mcast shared info */ - uword *mcast_shared; /* keyed on mcast ip46 addr */ - - /* Mapping from sw_if_index to tunnel index */ - u32 *tunnel_index_by_sw_if_index; - - /* graph node state */ - uword *bm_ip4_bypass_enabled_by_sw_if; - uword *bm_ip6_bypass_enabled_by_sw_if; - - /* convenience */ - vlib_main_t *vlib_main; - vnet_main_t *vnet_main; - - /* Record used instances */ - uword *instance_used; - u32 flow_id_start; - - /* cache for last 8 vxlan tunnel */ - vtep4_cache_t vtep4_u512; - -} vxlan_main_t; - -extern vxlan_main_t vxlan_main; - -extern vlib_node_registration_t vxlan4_input_node; -extern vlib_node_registration_t vxlan6_input_node; -extern vlib_node_registration_t vxlan4_encap_node; -extern vlib_node_registration_t vxlan6_encap_node; -extern vlib_node_registration_t vxlan4_flow_input_node; - -u8 *format_vxlan_encap_trace (u8 * s, va_list * args); - -typedef struct -{ - u8 is_add; - - /* we normally use is_ip4, but since this adds to the - * structure, this seems less of a breaking change */ - u8 is_ip6; - u8 is_l3; - u32 instance; - ip46_address_t src, dst; - u32 mcast_sw_if_index; - u32 encap_fib_index; - u32 decap_next_index; - u32 vni; - u16 src_port; - u16 dst_port; -} vnet_vxlan_add_del_tunnel_args_t; - -int vnet_vxlan_add_del_tunnel - (vnet_vxlan_add_del_tunnel_args_t * a, u32 * sw_if_indexp); - -void vnet_int_vxlan_bypass_mode (u32 sw_if_index, u8 is_ip6, u8 is_enable); - -int vnet_vxlan_add_del_rx_flow (u32 hw_if_index, u32 t_imdex, int is_add); - -u32 vnet_vxlan_get_tunnel_index (u32 sw_if_index); -#endif /* included_vnet_vxlan_h */ - -/* - * fd.io coding-style-patch-verification: ON - * - * Local Variables: - * eval: (c-set-style "gnu") - * End: - */ diff --git a/src/vnet/vxlan/vxlan_api.c b/src/vnet/vxlan/vxlan_api.c deleted file mode 100644 index 56fd654951f..00000000000 --- a/src/vnet/vxlan/vxlan_api.c +++ /dev/null @@ -1,376 +0,0 @@ -/* - *------------------------------------------------------------------ - * vxlan_api.c - vxlan api - * - * Copyright (c) 2016 Cisco and/or its affiliates. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - *------------------------------------------------------------------ - */ - -#include <vnet/vnet.h> -#include <vlibmemory/api.h> - -#include <vnet/interface.h> -#include <vnet/api_errno.h> -#include <vnet/feature/feature.h> -#include <vnet/vxlan/vxlan.h> -#include <vnet/fib/fib_table.h> -#include <vnet/ip/ip_types_api.h> -#include <vnet/udp/udp_local.h> -#include <vnet/format_fns.h> -#include <vxlan/vxlan.api_enum.h> -#include <vxlan/vxlan.api_types.h> - -static u16 msg_id_base; - -#define REPLY_MSG_ID_BASE msg_id_base -#include <vlibapi/api_helper_macros.h> - -static void -vl_api_vxlan_offload_rx_t_handler (vl_api_vxlan_offload_rx_t * mp) -{ - vl_api_vxlan_offload_rx_reply_t *rmp; - int rv = 0; - u32 hw_if_index = ntohl (mp->hw_if_index); - u32 sw_if_index = ntohl (mp->sw_if_index); - - if (!vnet_hw_interface_is_valid (vnet_get_main (), hw_if_index)) - { - rv = VNET_API_ERROR_NO_SUCH_ENTRY; - goto err; - } - VALIDATE_SW_IF_INDEX (mp); - - u32 t_index = vnet_vxlan_get_tunnel_index (sw_if_index); - if (t_index == ~0) - { - rv = VNET_API_ERROR_INVALID_SW_IF_INDEX_2; - goto err; - } - - vxlan_main_t *vxm = &vxlan_main; - vxlan_tunnel_t *t = pool_elt_at_index (vxm->tunnels, t_index); - if (!ip46_address_is_ip4 (&t->dst)) - { - rv = VNET_API_ERROR_INVALID_ADDRESS_FAMILY; - goto err; - } - - vnet_main_t *vnm = vnet_get_main (); - vnet_hw_interface_t *hw_if = vnet_get_hw_interface (vnm, hw_if_index); - ip4_main_t *im = &ip4_main; - u32 rx_fib_index = - vec_elt (im->fib_index_by_sw_if_index, hw_if->sw_if_index); - - if (t->encap_fib_index != rx_fib_index) - { - rv = VNET_API_ERROR_NO_SUCH_FIB; - goto err; - } - - if (vnet_vxlan_add_del_rx_flow (hw_if_index, t_index, mp->enable)) - { - rv = VNET_API_ERROR_UNSPECIFIED; - goto err; - } - BAD_SW_IF_INDEX_LABEL; -err: - - REPLY_MACRO (VL_API_VXLAN_OFFLOAD_RX_REPLY); -} - -static void - vl_api_sw_interface_set_vxlan_bypass_t_handler - (vl_api_sw_interface_set_vxlan_bypass_t * mp) -{ - vl_api_sw_interface_set_vxlan_bypass_reply_t *rmp; - int rv = 0; - u32 sw_if_index = ntohl (mp->sw_if_index); - - VALIDATE_SW_IF_INDEX (mp); - - vnet_int_vxlan_bypass_mode (sw_if_index, mp->is_ipv6, mp->enable); - BAD_SW_IF_INDEX_LABEL; - - REPLY_MACRO (VL_API_SW_INTERFACE_SET_VXLAN_BYPASS_REPLY); -} - -static int -vxlan_add_del_tunnel_clean_input (vnet_vxlan_add_del_tunnel_args_t *a, - u32 encap_vrf_id) -{ - a->is_ip6 = !ip46_address_is_ip4 (&a->src); - - a->encap_fib_index = fib_table_find (fib_ip_proto (a->is_ip6), encap_vrf_id); - if (a->encap_fib_index == ~0) - { - return VNET_API_ERROR_NO_SUCH_FIB; - } - - if (ip46_address_is_ip4 (&a->src) != ip46_address_is_ip4 (&a->dst)) - { - return VNET_API_ERROR_INVALID_VALUE; - } - - /* Check src & dst are different */ - if (ip46_address_cmp (&a->dst, &a->src) == 0) - { - return VNET_API_ERROR_SAME_SRC_DST; - } - if (ip46_address_is_multicast (&a->dst) && - !vnet_sw_if_index_is_api_valid (a->mcast_sw_if_index)) - { - return VNET_API_ERROR_INVALID_SW_IF_INDEX; - } - return 0; -} - -static void -vl_api_vxlan_add_del_tunnel_t_handler (vl_api_vxlan_add_del_tunnel_t *mp) -{ - vl_api_vxlan_add_del_tunnel_reply_t *rmp; - u32 sw_if_index = ~0; - int rv = 0; - - vnet_vxlan_add_del_tunnel_args_t a = { - .is_add = mp->is_add, - .instance = ntohl (mp->instance), - .mcast_sw_if_index = ntohl (mp->mcast_sw_if_index), - .decap_next_index = ntohl (mp->decap_next_index), - .vni = ntohl (mp->vni), - }; - ip_address_decode (&mp->src_address, &a.src); - ip_address_decode (&mp->dst_address, &a.dst); - - rv = vxlan_add_del_tunnel_clean_input (&a, ntohl (mp->encap_vrf_id)); - if (rv) - goto out; - a.dst_port = a.is_ip6 ? UDP_DST_PORT_vxlan6 : UDP_DST_PORT_vxlan, - a.src_port = a.is_ip6 ? UDP_DST_PORT_vxlan6 : UDP_DST_PORT_vxlan, - rv = vnet_vxlan_add_del_tunnel (&a, &sw_if_index); - -out: - REPLY_MACRO2(VL_API_VXLAN_ADD_DEL_TUNNEL_REPLY, - ({ - rmp->sw_if_index = ntohl (sw_if_index); - })); -} - -static void -vl_api_vxlan_add_del_tunnel_v2_t_handler (vl_api_vxlan_add_del_tunnel_v2_t *mp) -{ - vl_api_vxlan_add_del_tunnel_v2_reply_t *rmp; - u32 sw_if_index = ~0; - int rv = 0; - - vnet_vxlan_add_del_tunnel_args_t a = { - .is_add = mp->is_add, - .instance = ntohl (mp->instance), - .mcast_sw_if_index = ntohl (mp->mcast_sw_if_index), - .decap_next_index = ntohl (mp->decap_next_index), - .vni = ntohl (mp->vni), - .dst_port = ntohs (mp->dst_port), - .src_port = ntohs (mp->src_port), - }; - - ip_address_decode (&mp->src_address, &a.src); - ip_address_decode (&mp->dst_address, &a.dst); - - rv = vxlan_add_del_tunnel_clean_input (&a, ntohl (mp->encap_vrf_id)); - if (rv) - goto out; - rv = vnet_vxlan_add_del_tunnel (&a, &sw_if_index); -out: - REPLY_MACRO2 (VL_API_VXLAN_ADD_DEL_TUNNEL_V2_REPLY, - ({ rmp->sw_if_index = ntohl (sw_if_index); })); -} - -static void -vl_api_vxlan_add_del_tunnel_v3_t_handler (vl_api_vxlan_add_del_tunnel_v3_t *mp) -{ - vl_api_vxlan_add_del_tunnel_v3_reply_t *rmp; - u32 sw_if_index = ~0; - int rv = 0; - - vnet_vxlan_add_del_tunnel_args_t a = { - .is_add = mp->is_add, - .instance = ntohl (mp->instance), - .mcast_sw_if_index = ntohl (mp->mcast_sw_if_index), - .decap_next_index = ntohl (mp->decap_next_index), - .vni = ntohl (mp->vni), - .dst_port = ntohs (mp->dst_port), - .src_port = ntohs (mp->src_port), - .is_l3 = mp->is_l3, - }; - - ip_address_decode (&mp->src_address, &a.src); - ip_address_decode (&mp->dst_address, &a.dst); - - rv = vxlan_add_del_tunnel_clean_input (&a, ntohl (mp->encap_vrf_id)); - if (rv) - goto out; - rv = vnet_vxlan_add_del_tunnel (&a, &sw_if_index); -out: - REPLY_MACRO2 (VL_API_VXLAN_ADD_DEL_TUNNEL_V3_REPLY, - ({ rmp->sw_if_index = ntohl (sw_if_index); })); -} - -static void send_vxlan_tunnel_details - (vxlan_tunnel_t * t, vl_api_registration_t * reg, u32 context) -{ - vl_api_vxlan_tunnel_details_t *rmp; - ip4_main_t *im4 = &ip4_main; - ip6_main_t *im6 = &ip6_main; - - rmp = vl_msg_api_alloc (sizeof (*rmp)); - clib_memset (rmp, 0, sizeof (*rmp)); - rmp->_vl_msg_id = ntohs (REPLY_MSG_ID_BASE + VL_API_VXLAN_TUNNEL_DETAILS); - - ip_address_encode (&t->src, IP46_TYPE_ANY, &rmp->src_address); - ip_address_encode (&t->dst, IP46_TYPE_ANY, &rmp->dst_address); - - if (ip46_address_is_ip4 (&t->dst)) - rmp->encap_vrf_id = htonl (im4->fibs[t->encap_fib_index].ft_table_id); - else - rmp->encap_vrf_id = htonl (im6->fibs[t->encap_fib_index].ft_table_id); - - rmp->instance = htonl (t->user_instance); - rmp->mcast_sw_if_index = htonl (t->mcast_sw_if_index); - rmp->vni = htonl (t->vni); - rmp->decap_next_index = htonl (t->decap_next_index); - rmp->sw_if_index = htonl (t->sw_if_index); - rmp->context = context; - - vl_api_send_msg (reg, (u8 *) rmp); -} - -static void vl_api_vxlan_tunnel_dump_t_handler - (vl_api_vxlan_tunnel_dump_t * mp) -{ - vl_api_registration_t *reg; - vxlan_main_t *vxm = &vxlan_main; - vxlan_tunnel_t *t; - u32 sw_if_index; - - reg = vl_api_client_index_to_registration (mp->client_index); - if (!reg) - return; - - sw_if_index = ntohl (mp->sw_if_index); - - if (~0 == sw_if_index) - { - pool_foreach (t, vxm->tunnels) - send_vxlan_tunnel_details(t, reg, mp->context); - } - else - { - if ((sw_if_index >= vec_len (vxm->tunnel_index_by_sw_if_index)) || - (~0 == vxm->tunnel_index_by_sw_if_index[sw_if_index])) - { - return; - } - t = &vxm->tunnels[vxm->tunnel_index_by_sw_if_index[sw_if_index]]; - send_vxlan_tunnel_details (t, reg, mp->context); - } -} - -static void -send_vxlan_tunnel_v2_details (vxlan_tunnel_t *t, vl_api_registration_t *reg, - u32 context) -{ - vl_api_vxlan_tunnel_v2_details_t *rmp; - ip4_main_t *im4 = &ip4_main; - ip6_main_t *im6 = &ip6_main; - - rmp = vl_msg_api_alloc (sizeof (*rmp)); - clib_memset (rmp, 0, sizeof (*rmp)); - rmp->_vl_msg_id = ntohs (REPLY_MSG_ID_BASE + VL_API_VXLAN_TUNNEL_V2_DETAILS); - - ip_address_encode (&t->src, IP46_TYPE_ANY, &rmp->src_address); - ip_address_encode (&t->dst, IP46_TYPE_ANY, &rmp->dst_address); - rmp->src_port = htons (t->src_port); - rmp->dst_port = htons (t->dst_port); - - if (ip46_address_is_ip4 (&t->dst)) - rmp->encap_vrf_id = htonl (im4->fibs[t->encap_fib_index].ft_table_id); - else - rmp->encap_vrf_id = htonl (im6->fibs[t->encap_fib_index].ft_table_id); - - rmp->instance = htonl (t->user_instance); - rmp->mcast_sw_if_index = htonl (t->mcast_sw_if_index); - rmp->vni = htonl (t->vni); - rmp->decap_next_index = htonl (t->decap_next_index); - rmp->sw_if_index = htonl (t->sw_if_index); - rmp->context = context; - - vl_api_send_msg (reg, (u8 *) rmp); -} - -static void -vl_api_vxlan_tunnel_v2_dump_t_handler (vl_api_vxlan_tunnel_v2_dump_t *mp) -{ - vl_api_registration_t *reg; - vxlan_main_t *vxm = &vxlan_main; - vxlan_tunnel_t *t; - u32 sw_if_index; - - reg = vl_api_client_index_to_registration (mp->client_index); - if (!reg) - return; - - sw_if_index = ntohl (mp->sw_if_index); - - if (~0 == sw_if_index) - { - pool_foreach (t, vxm->tunnels) - send_vxlan_tunnel_v2_details (t, reg, mp->context); - } - else - { - if ((sw_if_index >= vec_len (vxm->tunnel_index_by_sw_if_index)) || - (~0 == vxm->tunnel_index_by_sw_if_index[sw_if_index])) - { - return; - } - t = &vxm->tunnels[vxm->tunnel_index_by_sw_if_index[sw_if_index]]; - send_vxlan_tunnel_v2_details (t, reg, mp->context); - } -} - -#include <vxlan/vxlan.api.c> -static clib_error_t * -vxlan_api_hookup (vlib_main_t * vm) -{ - api_main_t *am = vlibapi_get_main (); - - vl_api_increase_msg_trace_size (am, VL_API_VXLAN_ADD_DEL_TUNNEL, - 16 * sizeof (u32)); - - /* - * Set up the (msg_name, crc, message-id) table - */ - msg_id_base = setup_message_id_table (); - - return 0; -} - -VLIB_API_INIT_FUNCTION (vxlan_api_hookup); - -/* - * fd.io coding-style-patch-verification: ON - * - * Local Variables: - * eval: (c-set-style "gnu") - * End: - */ diff --git a/src/vnet/vxlan/vxlan_error.def b/src/vnet/vxlan/vxlan_error.def deleted file mode 100644 index 17f905950f5..00000000000 --- a/src/vnet/vxlan/vxlan_error.def +++ /dev/null @@ -1,17 +0,0 @@ -/* - * Copyright (c) 2015 Cisco and/or its affiliates. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -vxlan_error (DECAPSULATED, "good packets decapsulated") -vxlan_error (NO_SUCH_TUNNEL, "no such tunnel packets") -vxlan_error (BAD_FLAGS, "packets with bad flags field in vxlan header") diff --git a/src/vnet/vxlan/vxlan_packet.h b/src/vnet/vxlan/vxlan_packet.h deleted file mode 100644 index d1d1ed813e5..00000000000 --- a/src/vnet/vxlan/vxlan_packet.h +++ /dev/null @@ -1,80 +0,0 @@ -/* - * Copyright (c) 2015 Cisco and/or its affiliates. - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at: - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -#ifndef __included_vxlan_packet_h__ -#define __included_vxlan_packet_h__ 1 - -/* - * From RFC-7348 - * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - * |R|R|R|R|I|R|R|R| Reserved | - * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - * | VXLAN Network Identifier (VNI) | Reserved | - * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ - * - * VXLAN Header: This is an 8-byte field that has: - * - * - Flags (8 bits): where the I flag MUST be set to 1 for a valid - * VXLAN Network ID (VNI). The other 7 bits (designated "R") are - * reserved fields and MUST be set to zero on transmission and - * ignored on receipt. - * - * - VXLAN Segment ID/VXLAN Network Identifier (VNI): this is a - * 24-bit value used to designate the individual VXLAN overlay - * network on which the communicating VMs are situated. VMs in - * different VXLAN overlay networks cannot communicate with each - * other. - * - * - Reserved fields (24 bits and 8 bits): MUST be set to zero on - * transmission and ignored on receipt. - * - */ - -typedef struct -{ - u8 flags; - u8 res1; - u8 res2; - u8 res3; - u32 vni_reserved; -} vxlan_header_t; - -#define VXLAN_FLAGS_I 0x08 - -static inline u32 -vnet_get_vni (vxlan_header_t * h) -{ - u32 vni_reserved_host_byte_order; - - vni_reserved_host_byte_order = clib_net_to_host_u32 (h->vni_reserved); - return vni_reserved_host_byte_order >> 8; -} - -static inline void -vnet_set_vni_and_flags (vxlan_header_t * h, u32 vni) -{ - h->vni_reserved = clib_host_to_net_u32 (vni << 8); - *(u32 *) h = 0; - h->flags = VXLAN_FLAGS_I; -} - -#endif /* __included_vxlan_packet_h__ */ - -/* - * fd.io coding-style-patch-verification: ON - * - * Local Variables: - * eval: (c-set-style "gnu") - * End: - */ |