/*
 *------------------------------------------------------------------
 * Copyright (c) 2017 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *------------------------------------------------------------------
 */

/*
 * NOTE(review): the header names of the include directives below are missing
 * in this copy of the file; they must be restored from the original source
 * before this file can compile.
 */
#include #include #include #include #include #include

/*
 * Remove a member from the active-member vector of its bond.
 *
 * The bond is looked up from mif->bif_dev_instance and the search/removal is
 * done while holding bif->lockp (if the lock is initialised).
 *
 * - In active-backup mode, removing the entry at index 0 while more than one
 *   active member exists means another member takes over, so
 *   BOND_SEND_GARP_NA is signalled to bond_process_node for the bond's
 *   hw_if_index.
 * - For an LACP-enabled member on a numa_only bond, n_numa_members is
 *   decremented when the removed index lies below it.
 *
 * Nothing happens when the member is not in the active vector.
 * The vm argument is not used by this function.
 */
void
bond_disable_collecting_distributing (vlib_main_t * vm, member_if_t * mif)
{
  bond_main_t *bm = &bond_main;
  bond_if_t *bif;
  int i;
  uword p;
  u8 switching_active = 0;

  bif = bond_get_bond_if_by_dev_instance (mif->bif_dev_instance);
  clib_spinlock_lock_if_init (&bif->lockp);
  vec_foreach_index (i, bif->active_members)
  {
    p = *vec_elt_at_index (bif->active_members, i);
    if (p == mif->sw_if_index)
      {
        if ((bif->mode == BOND_MODE_ACTIVE_BACKUP) && (i == 0) &&
            (vec_len (bif->active_members) > 1))
          /* deleting the active member for active-backup */
          switching_active = 1;
        vec_del1 (bif->active_members, i);
        if (mif->lacp_enabled && bif->numa_only)
          {
            /* For lacp mode, if we check it is a member on local numa node,
               bif->n_numa_members should be decreased by 1 because the first
               bif->n_numa_members are all members on local numa node */
            if (i < bif->n_numa_members)
              {
                bif->n_numa_members--;
                ASSERT (bif->n_numa_members >= 0);
              }
          }
        /* sw_if_index was found and removed; stop scanning */
        break;
      }
  }

  /* We get a new member just becoming active */
  if (switching_active)
    vlib_process_signal_event (bm->vlib_main, bond_process_node.index,
                               BOND_SEND_GARP_NA, bif->hw_if_index);
  clib_spinlock_unlock_if_init (&bif->lockp);
}

/*
 * Comparison callback used to order the active-member vector.
 * a1 and a2 point at u32 sw_if_index values of bond members.
 *
 * return 1 if s2 is preferred.
 * return -1 if s1 is preferred.
 *
 * Both indices must resolve to a member (enforced with ALWAYS_ASSERT).
 * The trailing "return 0" is only reached when the two sw_if_index values
 * are equal, which is treated as a programming error (ASSERT (0)).
 */
static int
bond_member_sort (void *a1, void *a2)
{
  u32 *s1 = a1;
  u32 *s2 = a2;
  member_if_t *mif1 = bond_get_member_by_sw_if_index (*s1);
  member_if_t *mif2 = bond_get_member_by_sw_if_index (*s2);
  bond_if_t *bif;

  ALWAYS_ASSERT (mif1);
  ALWAYS_ASSERT (mif2);
  /*
   * sort entries according to preference rules:
   * 1. biggest weight
   * 2. numa-node
   * 3. current active member (to prevent churning)
   * 4. lowest sw_if_index (for deterministic behavior)
   *
   */
  if (mif2->weight > mif1->weight)
    return 1;
  if (mif2->weight < mif1->weight)
    return -1;
  else
    {
      if (mif2->is_local_numa > mif1->is_local_numa)
        return 1;
      if (mif2->is_local_numa < mif1->is_local_numa)
        return -1;
      else
        {
          /* the bond is looked up through the first member only */
          bif = bond_get_bond_if_by_dev_instance (mif1->bif_dev_instance);
          /* Favor the current active member to avoid churning */
          if (bif->active_members[0] == mif2->sw_if_index)
            return 1;
          if (bif->active_members[0] == mif1->sw_if_index)
            return -1;
          /* go for the tiebreaker as the last resort */
          if (mif1->sw_if_index > mif2->sw_if_index)
            return 1;
          if (mif1->sw_if_index < mif2->sw_if_index)
            return -1;
          else
            ASSERT (0);
        }
    }
  return 0;
}

/*
 * Re-sort bif->active_members with bond_member_sort and, when the entry at
 * index 0 changed as a result, signal BOND_SEND_GARP_NA to bond_process_node.
 *
 * active_members[0] is read before sorting, so the vector must not be empty.
 * This function does not take bif->lockp itself.
 */
static void
bond_sort_members (bond_if_t * bif)
{
  bond_main_t *bm = &bond_main;
  u32 old_active = bif->active_members[0];

  vec_sort_with_function (bif->active_members, bond_member_sort);
  if (old_active != bif->active_members[0])
    vlib_process_signal_event (bm->vlib_main, bond_process_node.index,
                               BOND_SEND_GARP_NA, bif->hw_if_index);
}

/*
 * Add a member to the active-member vector of its bond.
 *
 * Under bif->lockp the vector is first scanned; a member that is already
 * present jumps to the "done" label. An LACP-enabled member of a numa_only
 * bond whose hardware interface is on the same numa node as vm is inserted
 * at position n_numa_members (which is then incremented); every other member
 * is appended.
 *
 * NOTE(review): this definition is cut off in this copy of the file; the
 * remainder of the body, including the "done" label, is not visible here.
 */
void
bond_enable_collecting_distributing (vlib_main_t * vm, member_if_t * mif)
{
  bond_if_t *bif;
  bond_main_t *bm = &bond_main;
  vnet_main_t *vnm = vnet_get_main ();
  vnet_hw_interface_t *hw = vnet_get_sup_hw_interface (vnm, mif->sw_if_index);
  int i;
  uword p;

  bif = bond_get_bond_if_by_dev_instance (mif->bif_dev_instance);
  clib_spinlock_lock_if_init (&bif->lockp);
  vec_foreach_index (i, bif->active_members)
  {
    p = *vec_elt_at_index (bif->active_members, i);
    if (p == mif->sw_if_index)
      goto done;
  }

  if (mif->lacp_enabled && bif->numa_only &&
      (vm->numa_node == hw->numa_node))
    {
      vec_insert_elts (bif->active_members, &mif->sw_if_index, 1,
                       bif->n_numa_members);
      bif->n_numa_members++;
    }
  else
    vec_add1 (bif->active_members, mif->sw_if_index);

  mif->is_local_numa = (vm->numa_node == hw->numa_node) ? 1 : 0;
  if (bif->mode == BOND_MODE_ACTIVE_BACKUP)
    {
      if (vec_len (bif->active_members) == 1)
        /* First member becomes active? */
        vlib_process_signal_event (bm->vlib_main, bond_process_node.index,
                                   BOND_SEND
vpp (@VPP_VERSION@) unstable; urgency=low

  * no description

 -- fd.io VPP <vpp-dev@fd.io>  @TIMESTAMP@
ad-balance %U", unformat_bond_load_balance, &args.lb)) ; else if (unformat (line_input, "hw-addr %U", unformat_ethernet_address, args.hw_addr)) args.hw_addr_set = 1; else if (unformat (line_input, "id %u", &args.id)) ; else if (unformat (line_input, "gso")) args.gso = 1; else if (unformat (line_input, "numa-only")) { if (args.mode == BOND_MODE_LACP) args.numa_only = 1; else return clib_error_return (0, "Only lacp mode supports numa-only so far!"); } else return clib_error_return (0, "unknown input `%U'", format_unformat_error, input); } unformat_free (line_input); if (mode_is_set == 0) return clib_error_return (0, "Missing bond mode"); bond_create_if (vm, &args); if (!args.rv) vlib_cli_output (vm, "%U\n", format_vnet_sw_if_index_name, vnet_get_main (), args.sw_if_index); return args.error; } /* *INDENT-OFF* */ VLIB_CLI_COMMAND (bond_create_command, static) = { .path = "create bond", .short_help = "create bond mode {round-robin | active-backup | broadcast | " "{lacp | xor} [load-balance { l2 | l23 | l34 } [numa-only]]} " "[hw-addr ] [id ] [gso]", .function = bond_create_command_fn, }; /* *INDENT-ON* */ static clib_error_t * bond_delete_command_fn (vlib_main_t * vm, unformat_input_t * input, vlib_cli_command_t * cmd) { unformat_input_t _line_input, *line_input = &_line_input; u32 sw_if_index = ~0; vnet_main_t *vnm = vnet_get_main (); int rv; /* Get a line of input. 
*/ if (!unformat_user (input, unformat_line_input, line_input)) return clib_error_return (0, "Missing "); while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT) { if (unformat (line_input, "sw_if_index %d", &sw_if_index)) ; else if (unformat (line_input, "%U", unformat_vnet_sw_interface, vnm, &sw_if_index)) ; else return clib_error_return (0, "unknown input `%U'", format_unformat_error, input); } unformat_free (line_input); if (sw_if_index == ~0) return clib_error_return (0, "please specify interface name or sw_if_index"); rv = bond_delete_if (vm, sw_if_index); if (rv == VNET_API_ERROR_INVALID_SW_IF_INDEX) return clib_error_return (0, "not a bond interface"); else if (rv != 0) return clib_error_return (0, "error on deleting bond interface"); return 0; } /* *INDENT-OFF* */ VLIB_CLI_COMMAND (bond_delete__command, static) = { .path = "delete bond", .short_help = "delete bond { | sw_if_index }", .function = bond_delete_command_fn, }; /* *INDENT-ON* */ void bond_add_member (vlib_main_t * vm, bond_add_member_args_t * args) { bond_main_t *bm = &bond_main; vnet_main_t *vnm = vnet_get_main (); bond_if_t *bif; member_if_t *mif; vnet_interface_main_t *im = &vnm->interface_main; vnet_hw_interface_t *bif_hw, *mif_hw; vnet_sw_interface_t *sw; u32 thread_index; u32 mif_if_index; bif = bond_get_bond_if_by_sw_if_index (args->group); if (!bif) { args->rv = VNET_API_ERROR_INVALID_INTERFACE; args->error = clib_error_return (0, "bond interface not found"); return; } // make sure the interface is not already added as member if (bond_get_member_by_sw_if_index (args->member)) { args->rv = VNET_API_ERROR_VALUE_EXIST; args->error = clib_error_return (0, "interface was already added as member"); return; } mif_hw = vnet_get_sup_hw_interface (vnm, args->member); if (mif_hw->dev_class_index == bond_dev_class.index) { args->rv = VNET_API_ERROR_INVALID_INTERFACE; args->error = clib_error_return (0, "bond interface cannot be added as member"); return; } if (bif->gso && !(mif_hw->flags 
& VNET_HW_INTERFACE_FLAG_SUPPORTS_GSO)) { args->rv = VNET_API_ERROR_INVALID_INTERFACE; args->error = clib_error_return (0, "member interface is not gso capable"); return; } if (bif->mode == BOND_MODE_LACP) { u8 *name = format (0, "/if/lacp/%u/%u/state%c", bif->sw_if_index, args->member, 0); vec_validate (bm->stats, bif->sw_if_index); vec_validate (bm->stats[bif->sw_if_index], args->member); args->error = stat_segment_register_state_counter (name, &bm->stats[bif->sw_if_index][args->member].actor_state); if (args->error != 0) { args->rv = VNET_API_ERROR_INVALID_INTERFACE; vec_free (name); return; } vec_reset_length (name); name = format (0, "/if/lacp/%u/%u/partner-state%c", bif->sw_if_index, args->member, 0); args->error = stat_segment_register_state_counter (name, &bm->stats[bif->sw_if_index][args->member].partner_state); vec_free (name); if (args->error != 0) { args->rv = VNET_API_ERROR_INVALID_INTERFACE; return; } } pool_get (bm->neighbors, mif); clib_memset (mif, 0, sizeof (*mif)); sw = pool_elt_at_index (im->sw_interfaces, args->member); /* port_enabled is both admin up and hw link up */ mif->port_enabled = vnet_sw_interface_is_up (vnm, sw->sw_if_index); mif->sw_if_index = sw->sw_if_index; mif->hw_if_index = sw->hw_if_index; mif->packet_template_index = (u8) ~ 0; mif->is_passive = args->is_passive; mif->group = args->group; mif->bif_dev_instance = bif->dev_instance; mif->mode = bif->mode; mif->is_long_timeout = args->is_long_timeout; if (args->is_long_timeout) mif->ttl_in_seconds = LACP_LONG_TIMOUT_TIME; else mif->ttl_in_seconds = LACP_SHORT_TIMOUT_TIME; vec_validate_aligned (bm->member_by_sw_if_index, mif->sw_if_index, CLIB_CACHE_LINE_BYTES); /* * mif - bm->neighbors may be 0 * Left shift it by 1 bit to distinguish the valid entry that we actually * store from the null entries */ bm->member_by_sw_if_index[mif->sw_if_index] = (uword) (((mif - bm->neighbors) << 1) | 1); vec_add1 (bif->members, mif->sw_if_index); mif_hw = vnet_get_sup_hw_interface (vnm, 
mif->sw_if_index); /* Save the old mac */ memcpy (mif->persistent_hw_address, mif_hw->hw_address, 6); bif_hw = vnet_get_sup_hw_interface (vnm, bif->sw_if_index); if (bif->use_custom_mac) { vnet_hw_interface_change_mac_address (vnm, mif_hw->hw_if_index, bif->hw_address); } else { // bond interface gets the mac address from the first member if (vec_len (bif->members) == 1) { memcpy (bif->hw_address, mif_hw->hw_address, 6); vnet_hw_interface_change_mac_address (vnm, bif_hw->hw_if_index, mif_hw->hw_address); } else { // subsequent members gets the mac address of the bond interface vnet_hw_interface_change_mac_address (vnm, mif_hw->hw_if_index, bif->hw_address); } } /* if there are secondary/virtual mac addrs, propagate to the member */ bond_member_add_del_mac_addrs (bif, mif->sw_if_index, 1 /* is_add */ ); if (bif_hw->l2_if_count) ethernet_set_flags (vnm, mif_hw->hw_if_index, ETHERNET_INTERFACE_FLAG_ACCEPT_ALL); else ethernet_set_flags (vnm, mif_hw->hw_if_index, /*ETHERNET_INTERFACE_FLAG_DEFAULT_L3 */ 0); if (bif->mode == BOND_MODE_LACP) { if (bm->lacp_enable_disable) (*bm->lacp_enable_disable) (vm, bif, mif, 1); } else if (mif->port_enabled) { bond_enable_collecting_distributing (vm, mif); } vec_foreach_index (thread_index, bm->per_thread_data) { bond_per_thread_data_t *ptd = vec_elt_at_index (bm->per_thread_data, thread_index); vec_validate_aligned (ptd->per_port_queue, vec_len (bif->members) - 1, CLIB_CACHE_LINE_BYTES); vec_foreach_index (mif_if_index, ptd->per_port_queue) { ptd->per_port_queue[mif_if_index].n_buffers = 0; } } args->rv = vnet_feature_enable_disable ("device-input", "bond-input", mif->sw_if_index, 1, 0, 0); if (args->rv) { args->error = clib_error_return (0, "Error encountered on input feature arc enable"); } } static clib_error_t * add_member_interface_command_fn (vlib_main_t * vm, unformat_input_t * input, vlib_cli_command_t * cmd) { bond_add_member_args_t args = { 0 }; unformat_input_t _line_input, *line_input = &_line_input; vnet_main_t *vnm = 
vnet_get_main (); /* Get a line of input. */ if (!unformat_user (input, unformat_line_input, line_input)) return clib_error_return (0, "Missing required arguments."); args.member = ~0; args.group = ~0; while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT) { if (unformat (line_input, "%U %U", unformat_vnet_sw_interface, vnm, &args.group, unformat_vnet_sw_interface, vnm, &args.member)) ; else if (unformat (line_input, "passive")) args.is_passive = 1; else if (unformat (line_input, "long-timeout")) args.is_long_timeout = 1; else { args.error = clib_error_return (0, "unknown input `%U'", format_unformat_error, input); break; } } unformat_free (line_input); if (args.error) return args.error; if (args.group == ~0) return clib_error_return (0, "Missing bond interface"); if (args.member == ~0) return clib_error_return (0, "please specify valid member interface name"); bond_add_member (vm, &args); return args.error; } /* *INDENT-OFF* */ VLIB_CLI_COMMAND (add_member_interface_command, static) = { .path = "bond add", .short_help = "bond add " "[passive] [long-timeout]", .function = add_member_interface_command_fn, }; /* *INDENT-ON* */ void bond_detach_member (vlib_main_t * vm, bond_detach_member_args_t * args) { bond_if_t *bif; member_if_t *mif; mif = bond_get_member_by_sw_if_index (args->member); if (!mif) { args->rv = VNET_API_ERROR_INVALID_INTERFACE; args->error = clib_error_return (0, "interface was not a member"); return; } bif = bond_get_bond_if_by_dev_instance (mif->bif_dev_instance); bond_delete_neighbor (vm, bif, mif); } static clib_error_t * detach_interface_command_fn (vlib_main_t * vm, unformat_input_t * input, vlib_cli_command_t * cmd) { bond_detach_member_args_t args = { 0 }; unformat_input_t _line_input, *line_input = &_line_input; vnet_main_t *vnm = vnet_get_main (); /* Get a line of input. 
*/ if (!unformat_user (input, unformat_line_input, line_input)) return clib_error_return (0, "Missing required arguments."); args.member = ~0; while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT) { if (unformat (line_input, "%U", unformat_vnet_sw_interface, vnm, &args.member)) ; else { args.error = clib_error_return (0, "unknown input `%U'", format_unformat_error, input); break; } } unformat_free (line_input); if (args.error) return args.error; if (args.member == ~0) return clib_error_return (0, "please specify valid member interface name"); bond_detach_member (vm, &args); return args.error; } /* *INDENT-OFF* */ VLIB_CLI_COMMAND (detach_interface_command, static) = { .path = "bond del", .short_help = "bond del ", .function = detach_interface_command_fn, }; /* *INDENT-ON* */ static void show_bond (vlib_main_t * vm) { bond_main_t *bm = &bond_main; bond_if_t *bif; vlib_cli_output (vm, "%-16s %-12s %-13s %-13s %-14s %s", "interface name", "sw_if_index", "mode", "load balance", "active members", "members"); /* *INDENT-OFF* */ pool_foreach (bif, bm->interfaces) { vlib_cli_output (vm, "%-16U %-12d %-13U %-13U %-14u %u", format_bond_interface_name, bif->dev_instance, bif->sw_if_index, format_bond_mode, bif->mode, format_bond_load_balance, bif->lb, vec_len (bif->active_members), vec_len (bif->members)); } /* *INDENT-ON* */ } static void show_bond_details (vlib_main_t * vm) { bond_main_t *bm = &bond_main; bond_if_t *bif; u32 *sw_if_index; /* *INDENT-OFF* */ pool_foreach (bif, bm->interfaces) { vlib_cli_output (vm, "%U", format_bond_interface_name, bif->dev_instance); vlib_cli_output (vm, " mode: %U", format_bond_mode, bif->mode); vlib_cli_output (vm, " load balance: %U", format_bond_load_balance, bif->lb); if (bif->gso) vlib_cli_output (vm, " gso enable"); if (bif->mode == BOND_MODE_ROUND_ROBIN) vlib_cli_output (vm, " last xmit member index: %u", bif->lb_rr_last_index); vlib_cli_output (vm, " number of active members: %d", vec_len (bif->active_members)); 
vec_foreach (sw_if_index, bif->active_members) { vlib_cli_output (vm, " %U", format_vnet_sw_if_index_name, vnet_get_main (), *sw_if_index); if (bif->mode == BOND_MODE_ACTIVE_BACKUP) { member_if_t *mif = bond_get_member_by_sw_if_index (*sw_if_index); if (mif) vlib_cli_output (vm, " weight: %u, is_local_numa: %u, " "sw_if_index: %u", mif->weight, mif->is_local_numa, mif->sw_if_index); } } vlib_cli_output (vm, " number of members: %d", vec_len (bif->members)); vec_foreach (sw_if_index, bif->members) { vlib_cli_output (vm, " %U", format_vnet_sw_if_index_name, vnet_get_main (), *sw_if_index); } vlib_cli_output (vm, " device instance: %d", bif->dev_instance); vlib_cli_output (vm, " interface id: %d", bif->id); vlib_cli_output (vm, " sw_if_index: %d", bif->sw_if_index); vlib_cli_output (vm, " hw_if_index: %d", bif->hw_if_index); } /* *INDENT-ON* */ } static clib_error_t * show_bond_fn (vlib_main_t * vm, unformat_input_t * input, vlib_cli_command_t * cmd) { u8 details = 0; while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT) { if (unformat (input, "details")) details = 1; else { return clib_error_return (0, "unknown input `%U'", format_unformat_error, input); } } if (details) show_bond_details (vm); else show_bond (vm); return 0; } /* *INDENT-OFF* */ VLIB_CLI_COMMAND (show_bond_command, static) = { .path = "show bond", .short_help = "show bond [details]", .function = show_bond_fn, }; /* *INDENT-ON* */ void bond_set_intf_weight (vlib_main_t * vm, bond_set_intf_weight_args_t * args) { member_if_t *mif; bond_if_t *bif; vnet_main_t *vnm; u32 old_weight; mif = bond_get_member_by_sw_if_index (args->sw_if_index); if (!mif) { args->rv = VNET_API_ERROR_INVALID_INTERFACE; args->error = clib_error_return (0, "Interface not a member"); return; } bif = bond_get_bond_if_by_dev_instance (mif->bif_dev_instance); if (!bif) { args->rv = VNET_API_ERROR_INVALID_INTERFACE; args->error = clib_error_return (0, "bond interface not found"); return; } if (bif->mode != 
BOND_MODE_ACTIVE_BACKUP) { args->rv = VNET_API_ERROR_INVALID_ARGUMENT; args->error = clib_error_return (0, "Weight valid for active-backup only"); return; } old_weight = mif->weight; mif->weight = args->weight; vnm = vnet_get_main (); /* * No need to sort the list if the affected member is not up (not in active * member set), active member count is 1, or the current member is already the * primary member and new weight > old weight. */ if (!vnet_sw_interface_is_up (vnm, mif->sw_if_index) || (vec_len (bif->active_members) == 1) || ((bif->active_members[0] == mif->sw_if_index) && (mif->weight >= old_weight))) return; bond_sort_members (bif); } static clib_error_t * bond_set_intf_cmd (vlib_main_t * vm, unformat_input_t * input, vlib_cli_command_t * cmd) { bond_set_intf_weight_args_t args = { 0 }; u32 sw_if_index = (u32) ~ 0; unformat_input_t _line_input, *line_input = &_line_input; vnet_main_t *vnm = vnet_get_main (); u8 weight_enter = 0; u32 weight = 0; /* Get a line of input. */ if (!unformat_user (input, unformat_line_input, line_input)) return clib_error_return (0, "Missing required arguments."); while (unformat_check_input (line_input) != UNFORMAT_END_OF_INPUT) { if (unformat (line_input, "sw_if_index %d", &sw_if_index)) ; else if (unformat (line_input, "%U", unformat_vnet_sw_interface, vnm, &sw_if_index)) ; else if (unformat (line_input, "weight %u", &weight)) weight_enter = 1; else { clib_error_return (0, "unknown input `%U'", format_unformat_error, input); break; } } unformat_free (line_input); if (sw_if_index == (u32) ~ 0) { args.rv = VNET_API_ERROR_INVALID_INTERFACE; clib_error_return (0, "Interface name is invalid!"); } if (weight_enter == 0) { args.rv = VNET_API_ERROR_INVALID_ARGUMENT; clib_error_return (0, "weight missing"); } args.sw_if_index = sw_if_index; args.weight = weight; bond_set_intf_weight (vm, &args); return args.error; } /* *INDENT-OFF* */ VLIB_CLI_COMMAND(set_interface_bond_cmd, static) = { .path = "set interface bond", .short_help = "set 
interface bond | sw_if_index " " weight ", .function = bond_set_intf_cmd, }; /* *INDENT-ON* */ clib_error_t * bond_cli_init (vlib_main_t * vm) { bond_main_t *bm = &bond_main; bm->vlib_main = vm; bm->vnet_main = vnet_get_main (); vec_validate_aligned (bm->member_by_sw_if_index, 1, CLIB_CACHE_LINE_BYTES); vec_validate_aligned (bm->per_thread_data, vlib_get_thread_main ()->n_vlib_mains - 1, CLIB_CACHE_LINE_BYTES); return 0; } VLIB_INIT_FUNCTION (bond_cli_init); /* * fd.io coding-style-patch-verification: ON * * Local Variables: * eval: (c-set-style "gnu") * End: */