When ovn-monitor-all is set to false ovn-controller sets ovn-installed on OVS interfaces too early. ovn-controller needs to wait for the response from the southbound database with the updates to the newly monitored fields only then can it install flows and label the OVS interface as installed.
Reported-at: https://redhat.atlassian.net/browse/FDP-2887 Signed-off-by: Jacob Tanenbaum <[email protected]> --- v7->v8 * removed printing in the system testcases that shouldn't be there and caused failure. v6->v7 * added an sset that holds the uuid's of datapaths that are waiting for sb updates * added back the the state OIF_WAITING_SB_COND to the if_mgr state machine. * no longer hold if the datapath is updated in the local_datapaths struct as that is generated each transaction and cannot be relied upon. * removed some leftover logic from previous patch versions v5->v6 * simplified the logic as requested, Ales saw that we did not need to save the seqno if we checked before the engine run. * removing the extra state from the state machine * removing some leftover logic that was seen. v4->v5 * corrected a sanitizer error: used bool update_seqno without initializing v3->v4 * Added state OIF_WAITING_SB_COND to the state machine that manages the adding of interfaces. This state waits until the Southbound has updated the ovn-controller of relevent information about ports related to it * Addressed several nits v2->v3 * adding the ld->monitor_updated required the additiona of checking for monitor_all in update_sb_monitors. I didn't account for being able to toggle on monitor_all v1->v2 * if_status_mgr_run() will run everytime the conditional seqno is changed so it should be safe to only skip when the expected_seqno and seqno returned from ovn are strictly not equal, that way we do not have to deal with overflow in the seqno. Additionally add a boolean to the local_datapath in the event that the seqno wraps around at the same time the datapath would go back into the state OIF_INSTALL_FLOWS. * remove setting the state to itself for OIF_INSTALL_FLOWS in if_status_mgr_update() * added assert(pb) in if_status_mgr_run() * removed a manual loop looking for the local_datapath and replaced with get_local_datapath() in if_status_mgr_run * remove a few nit spelling errors in the test case diff --git a/controller/if-status.c b/controller/if-status.c index ee9337e63..34875d23e 100644 --- a/controller/if-status.c +++ b/controller/if-status.c @@ -18,6 +18,7 @@ #include "binding.h" #include "if-status.h" #include "lib/ofctrl-seqno.h" +#include "local_data.h" #include "ovsport.h" #include "simap.h" @@ -58,6 +59,11 @@ VLOG_DEFINE_THIS_MODULE(if_status); enum if_state { OIF_CLAIMED, /* Newly claimed interface. pb->chassis update not yet initiated. */ + OIF_WAITING_SB_COND, /* Waiting for the Southbound database to update + * ovn-controller for a given datapath. We should + * only be waiting in this state when monitor_all + * is false AND it is the first time that we see + * a specific datapath. */ OIF_INSTALL_FLOWS, /* Claimed interface with pb->chassis update sent to * SB (but update notification not confirmed, so the * update may be resent in any of the following @@ -87,6 +93,7 @@ enum if_state { static const char *if_state_names[] = { [OIF_CLAIMED] = "CLAIMED", + [OIF_WAITING_SB_COND] = "WAITING_SB_COND", [OIF_INSTALL_FLOWS] = "INSTALL_FLOWS", [OIF_REM_OLD_OVN_INST] = "REM_OLD_OVN_INST", [OIF_MARK_UP] = "MARK_UP", @@ -114,7 +121,18 @@ static const char *if_state_names[] = { * | | | +--+ | | | * | | | | | | * | | | mgr_update(when sb is rw i.e. pb->chassis) | | | - * | | | has been updated | | | + * | | V has been updated | | | + * | | +----------------------+ | | | + * | | | | | | | + * | | | WAITING_SB_COND | | | | + * | | | | | | | + * | | | | | | | + * | | +----------------------+ | | | + * | | | | | | + * | | | | | | + * | | | mgr_update(when sb_cond_seqno == expected) | | | + * | | | - request seqno | | | + * | | | | | | * | | release_iface | - request seqno | | | * | | | | | | * | | V | | | @@ -335,6 +353,7 @@ if_status_mgr_claim_iface(struct if_status_mgr *mgr, switch (iface->state) { case OIF_CLAIMED: + case OIF_WAITING_SB_COND: case OIF_INSTALL_FLOWS: case OIF_REM_OLD_OVN_INST: case OIF_MARK_UP: @@ -383,6 +402,7 @@ if_status_mgr_release_iface(struct if_status_mgr *mgr, const char *iface_id) switch (iface->state) { case OIF_CLAIMED: + case OIF_WAITING_SB_COND: case OIF_INSTALL_FLOWS: /* Not yet fully installed interfaces: * pb->chassis still need to be deleted. @@ -424,6 +444,7 @@ if_status_mgr_delete_iface(struct if_status_mgr *mgr, const char *iface_id, switch (iface->state) { case OIF_CLAIMED: + case OIF_WAITING_SB_COND: case OIF_INSTALL_FLOWS: /* Not yet fully installed interfaces: * pb->chassis still need to be deleted. @@ -500,6 +521,8 @@ if_status_mgr_update(struct if_status_mgr *mgr, const struct sbrec_chassis *chassis_rec, const struct ovsrec_interface_table *iface_table, const struct sbrec_port_binding_table *pb_table, + const struct hmap *local_datapaths, + const struct sset *waiting_sb_update, bool ovs_readonly, bool sb_readonly) { @@ -622,9 +645,7 @@ if_status_mgr_update(struct if_status_mgr *mgr, * in if_status_handle_claims or if_status_mgr_claim_iface */ if (iface->is_vif) { - ovs_iface_set_state(mgr, iface, OIF_INSTALL_FLOWS); - iface->install_seqno = mgr->iface_seqno + 1; - new_ifaces = true; + ovs_iface_set_state(mgr, iface, OIF_WAITING_SB_COND); } else { ovs_iface_set_state(mgr, iface, OIF_MARK_UP); } @@ -639,6 +660,32 @@ if_status_mgr_update(struct if_status_mgr *mgr, } } + if (!sb_readonly) { + HMAPX_FOR_EACH_SAFE (node, + &mgr->ifaces_per_state[OIF_WAITING_SB_COND]) { + struct ovs_iface *iface = node->data; + if (local_datapaths) { + const struct sbrec_port_binding *pb = + sbrec_port_binding_table_get_for_uuid(pb_table, + &iface->pb_uuid); + ovs_assert(pb); + struct local_datapath *ld = + get_local_datapath(local_datapaths, + pb->datapath->tunnel_key); + if (!ld) { + continue; + } + char *uuid = uuid_to_string(&ld->datapath->header_.uuid); + if (!sset_contains(waiting_sb_update, uuid)) { + ovs_iface_set_state(mgr, iface, OIF_INSTALL_FLOWS); + iface->install_seqno = mgr->iface_seqno + 1; + new_ifaces = true; + } + free(uuid); + } + } + } + if (!sb_readonly) { HMAPX_FOR_EACH_SAFE (node, &mgr->ifaces_per_state[OIF_UPDATE_PORT]) { struct ovs_iface *iface = node->data; diff --git a/controller/if-status.h b/controller/if-status.h index d15ca3008..67018d113 100644 --- a/controller/if-status.h +++ b/controller/if-status.h @@ -43,6 +43,8 @@ void if_status_mgr_update(struct if_status_mgr *, struct local_binding_data *, const struct sbrec_chassis *chassis, const struct ovsrec_interface_table *iface_table, const struct sbrec_port_binding_table *pb_table, + const struct hmap *local_datapaths, + const struct sset *waiting_sb_update, bool ovs_readonly, bool sb_readonly); void if_status_mgr_run(struct if_status_mgr *mgr, struct local_binding_data *, diff --git a/controller/ovn-controller.c b/controller/ovn-controller.c index da43051ed..a25892056 100644 --- a/controller/ovn-controller.c +++ b/controller/ovn-controller.c @@ -1511,6 +1511,7 @@ en_runtime_data_clear_tracked_data(void *data_) } static void * + en_runtime_data_init(struct engine_node *node OVS_UNUSED, struct engine_arg *arg OVS_UNUSED) { @@ -7596,6 +7597,8 @@ main(int argc, char *argv[]) int ovs_txn_status = 1; bool sb_monitor_all = false; struct tracked_acl_ids *tracked_acl_ids = NULL; + struct sset waiting_sb_update; + sset_init(&waiting_sb_update); while (!exit_args.exiting) { ovsrcu_quiesce_end(); @@ -7842,6 +7845,7 @@ main(int argc, char *argv[]) bool recompute_allowed = (ovnsb_idl_txn && !ofctrl_has_backlog()); + engine_run(recompute_allowed); tracked_acl_ids = engine_get_data(&en_acl_id); @@ -7951,6 +7955,9 @@ main(int argc, char *argv[]) sbrec_mirror_table_get(ovnsb_idl_loop.idl), br_int, &runtime_data->lbinding_data.bindings); + if (ovnsb_cond_seqno == ovnsb_expected_cond_seqno) { + sset_clear(&waiting_sb_update); + } /* Updating monitor conditions if runtime data or * logical datapath goups changed. */ if (engine_node_changed(&en_runtime_data) @@ -7973,6 +7980,23 @@ main(int argc, char *argv[]) * a continuous reason for monitor updates. */ daemon_started_recently_countdown(); } + + if (!sb_monitor_all && runtime_data) { + struct hmap *tracked_dp_bindings = + &runtime_data->tracked_dp_bindings; + struct tracked_datapath *tdp; + HMAP_FOR_EACH_SAFE (tdp, + node, + tracked_dp_bindings) { + char *uuid = + uuid_to_string(&tdp->dp->header_.uuid); + if (tdp->tracked_type == + TRACKED_RESOURCE_NEW) { + sset_add(&waiting_sb_update, uuid); + } + free(uuid); + } + } } /* If there is no new expected seqno we have finished * loading all needed data from southbound. We then @@ -8017,6 +8041,10 @@ main(int argc, char *argv[]) ovs_idl_loop.idl), sbrec_port_binding_table_get( ovnsb_idl_loop.idl), + runtime_data ? + &runtime_data->local_datapaths + : NULL, + &waiting_sb_update, !ovs_idl_txn, !ovnsb_idl_txn); stopwatch_stop(IF_STATUS_MGR_UPDATE_STOPWATCH_NAME, diff --git a/tests/ovn-controller.at b/tests/ovn-controller.at index c98de9bc4..9dc7555ba 100644 --- a/tests/ovn-controller.at +++ b/tests/ovn-controller.at @@ -3944,3 +3944,69 @@ OVN_CLEANUP([hv1], [hv2 /already has encap ip.*cannot duplicate on/d]) AT_CLEANUP ]) + +OVN_FOR_EACH_NORTHD([ +AT_SETUP([ovn-installed]) +ovn_start + +net_add n1 +sim_add hv1 + +as hv1 +ovs-vsctl add-br br-phys +ovn_attach n1 br-phys 192.168.0.1 +ovn-appctl vlog/set dbg +ovs-vsctl add-port br-int vif1 -- \ + set Interface vif1 external-ids:iface-id=lsp1 + +check ovn-nbctl ls-add ls1 +sleep_controller hv1 +check ovn-nbctl --wait=sb lsp-add ls1 lsp1 -- \ + lsp-set-addresses lsp1 "f0:00:00:00:00:01 10.0.0.1" + +sleep_sb +wake_up_controller hv1 + +# Wait for pflow for lsp1 +OVS_WAIT_UNTIL([ + ofport=$(as hv1 ovs-vsctl --bare --columns ofport find Interface name=vif1) + echo "vif1 port=$ofport" + test -n "$ofport" && test 1 -le $(as hv1 ovs-ofctl dump-flows br-int | grep -c in_port=$ofport) +]) + +# If ovn-installed in ovs, all flows should be installed. +# In that case, there should be at least one flow with lsp1 address. +OVS_WAIT_UNTIL([ + ovn_installed=$(as hv1 ovs-vsctl get Interface vif1 external_ids:ovn-installed) + echo $ovn_installed + flow_count=$(as hv1 ovs-ofctl dump-flows br-int | grep -Fc "10.0.0.1") + # for the monitor-all=true case the flow gets installed because ovn-controller is monitoring all + # tables in OVN_SOUTHBOUND. + if test -n "$ovn_installed"; then + as hv1 ovs-ofctl dump-flows br-int > output + test $flow_count -ge 1 + else + true + fi +]) + +wake_up_sb +# After the southbound db has woken up and can send the update to the +# ovn-controller not monitoring all tables in the southbound db it +# should be able to install the interface. +OVS_WAIT_UNTIL([ + ovn_installed=$(as hv1 ovs-vsctl get Interface vif1 external_ids:ovn-installed) + flow_count=$(as hv1 ovs-ofctl dump-flows br-int | grep -Fc "10.0.0.1") + echo "installed=$ovn_installed, count=$flow_count" + if test -n "$ovn_installed"; then + as hv1 ovs-ofctl dump-flows br-int > output + test $flow_count -ge 1 + else + false + fi +]) +wait_for_ports_up + +OVN_CLEANUP([hv1]) +AT_CLEANUP +]) -- 2.53.0 _______________________________________________ dev mailing list [email protected] https://mail.openvswitch.org/mailman/listinfo/ovs-dev
