When ovn-monitor-all is set to false, ovn-controller sets ovn-installed
on OVS interfaces too early. ovn-controller needs to wait for the
response from the southbound database with the updates to the newly
monitored fields; only then can it install flows and label the OVS
interface as installed.

Reported-at: https://redhat.atlassian.net/browse/FDP-2887
Signed-off-by: Jacob Tanenbaum <[email protected]>

---
v7->v8
* removed printing in the system testcases that shouldn't be there and
  caused failure.

v6->v7
* added an sset that holds the UUIDs of datapaths that are waiting for
  sb updates
* added back the state OIF_WAITING_SB_COND to the if_mgr state
  machine.
* no longer hold if the datapath is updated in the local_datapaths
  struct as that is generated each transaction and cannot be relied
  upon.
* removed some leftover logic from previous patch versions

v5->v6
* simplified the logic as requested, Ales saw that we did not need to
  save the seqno if we checked before the engine run.
* removing the extra state from the state machine
* removing some leftover logic that was seen.

v4->v5
* corrected a sanitizer error: used bool update_seqno without
  initializing

v3->v4
* Added state OIF_WAITING_SB_COND to the state machine that manages
  the adding of interfaces. This state waits until the Southbound has
  sent ovn-controller the relevant information about the ports related
  to it
* Addressed several nits

v2->v3
* adding the ld->monitor_updated required the addition of a check for
  monitor_all in update_sb_monitors. I didn't account for being able to
  toggle on monitor_all

v1->v2
* if_status_mgr_run() will run every time the conditional seqno is
  changed, so it should be safe to only skip when the expected_seqno and
  seqno returned from ovn are strictly not equal; that way we do not
  have to deal with overflow in the seqno. Additionally, add a boolean to
  the local_datapath in the event that the seqno wraps around at the
  same time the datapath would go back into the state OIF_INSTALL_FLOWS.
* remove setting the state to itself for OIF_INSTALL_FLOWS in
  if_status_mgr_update()
* added assert(pb) in if_status_mgr_run()
* removed a manual loop looking for the local_datapath and replaced with
  get_local_datapath() in if_status_mgr_run
* remove a few nit spelling errors in the test case

diff --git a/controller/if-status.c b/controller/if-status.c
index ee9337e63..34875d23e 100644
--- a/controller/if-status.c
+++ b/controller/if-status.c
@@ -18,6 +18,7 @@
 #include "binding.h"
 #include "if-status.h"
 #include "lib/ofctrl-seqno.h"
+#include "local_data.h"
 #include "ovsport.h"
 #include "simap.h"
 
@@ -58,6 +59,11 @@ VLOG_DEFINE_THIS_MODULE(if_status);
 enum if_state {
     OIF_CLAIMED,          /* Newly claimed interface. pb->chassis update not
                              yet initiated. */
+    OIF_WAITING_SB_COND,  /* Waiting for the Southbound database to update
+                           * ovn-controller for a given datapath. We should
+                           * only be waiting in this state when monitor_all
+                           * is false AND it is the first time that we see
+                           * a specific datapath. */
     OIF_INSTALL_FLOWS,    /* Claimed interface with pb->chassis update sent to
                            * SB (but update notification not confirmed, so the
                            * update may be resent in any of the following
@@ -87,6 +93,7 @@ enum if_state {
 
 static const char *if_state_names[] = {
     [OIF_CLAIMED]          = "CLAIMED",
+    [OIF_WAITING_SB_COND]  = "WAITING_SB_COND",
     [OIF_INSTALL_FLOWS]    = "INSTALL_FLOWS",
     [OIF_REM_OLD_OVN_INST] = "REM_OLD_OVN_INST",
     [OIF_MARK_UP]          = "MARK_UP",
@@ -114,7 +121,18 @@ static const char *if_state_names[] = {
  * | |                 |  +--+                                           | | |
  * | |                 |                                                 | | |
  * | |                 | mgr_update(when sb is rw i.e. pb->chassis)      | | |
- * | |                 |            has been updated                     | | |
+ * | |                 V            has been updated                     | | |
+ * | |   +----------------------+                                        | | |
+ * | |   |                      |                                        | | |
+ * | |   |    WAITING_SB_COND   |                                        | | |
+ * | |   |                      |                                        | | |
+ * | |   |                      |                                        | | |
+ * | |   +----------------------+                                        | | |
+ * | |                 |                                                 | | |
+ * | |                 |                                                 | | |
+ * | |                 |   mgr_update(when sb_cond_seqno == expected)    | | |
+ * | |                 |   - request seqno                               | | |
+ * | |                 |                                                 | | |
  * | | release_iface   | - request seqno                                 | | |
  * | |                 |                                                 | | |
  * | |                 V                                                 | | |
@@ -335,6 +353,7 @@ if_status_mgr_claim_iface(struct if_status_mgr *mgr,
 
     switch (iface->state) {
     case OIF_CLAIMED:
+    case OIF_WAITING_SB_COND:
     case OIF_INSTALL_FLOWS:
     case OIF_REM_OLD_OVN_INST:
     case OIF_MARK_UP:
@@ -383,6 +402,7 @@ if_status_mgr_release_iface(struct if_status_mgr *mgr, const char *iface_id)
 
     switch (iface->state) {
     case OIF_CLAIMED:
+    case OIF_WAITING_SB_COND:
     case OIF_INSTALL_FLOWS:
         /* Not yet fully installed interfaces:
          * pb->chassis still need to be deleted.
@@ -424,6 +444,7 @@ if_status_mgr_delete_iface(struct if_status_mgr *mgr, const char *iface_id,
 
     switch (iface->state) {
     case OIF_CLAIMED:
+    case OIF_WAITING_SB_COND:
     case OIF_INSTALL_FLOWS:
         /* Not yet fully installed interfaces:
          * pb->chassis still need to be deleted.
@@ -500,6 +521,8 @@ if_status_mgr_update(struct if_status_mgr *mgr,
                      const struct sbrec_chassis *chassis_rec,
                      const struct ovsrec_interface_table *iface_table,
                      const struct sbrec_port_binding_table *pb_table,
+                     const struct hmap *local_datapaths,
+                     const struct sset *waiting_sb_update,
                      bool ovs_readonly,
                      bool sb_readonly)
 {
@@ -622,9 +645,7 @@ if_status_mgr_update(struct if_status_mgr *mgr,
              * in if_status_handle_claims or if_status_mgr_claim_iface
              */
             if (iface->is_vif) {
-                ovs_iface_set_state(mgr, iface, OIF_INSTALL_FLOWS);
-                iface->install_seqno = mgr->iface_seqno + 1;
-                new_ifaces = true;
+                ovs_iface_set_state(mgr, iface, OIF_WAITING_SB_COND);
             } else {
                 ovs_iface_set_state(mgr, iface, OIF_MARK_UP);
             }
@@ -639,6 +660,32 @@ if_status_mgr_update(struct if_status_mgr *mgr,
         }
     }
 
+    if (!sb_readonly) {
+        HMAPX_FOR_EACH_SAFE (node,
+                             &mgr->ifaces_per_state[OIF_WAITING_SB_COND]) {
+            struct ovs_iface *iface = node->data;
+            if (local_datapaths) {
+                const struct sbrec_port_binding *pb =
+                    sbrec_port_binding_table_get_for_uuid(pb_table,
+                                                          &iface->pb_uuid);
+                ovs_assert(pb);
+                struct local_datapath *ld =
+                    get_local_datapath(local_datapaths,
+                                       pb->datapath->tunnel_key);
+                if (!ld) {
+                    continue;
+                }
+                char *uuid = uuid_to_string(&ld->datapath->header_.uuid);
+                if (!sset_contains(waiting_sb_update, uuid)) {
+                    ovs_iface_set_state(mgr, iface, OIF_INSTALL_FLOWS);
+                    iface->install_seqno = mgr->iface_seqno + 1;
+                    new_ifaces = true;
+                }
+                free(uuid);
+            }
+        }
+    }
+
     if (!sb_readonly) {
         HMAPX_FOR_EACH_SAFE (node, &mgr->ifaces_per_state[OIF_UPDATE_PORT]) {
             struct ovs_iface *iface = node->data;
diff --git a/controller/if-status.h b/controller/if-status.h
index d15ca3008..67018d113 100644
--- a/controller/if-status.h
+++ b/controller/if-status.h
@@ -43,6 +43,8 @@ void if_status_mgr_update(struct if_status_mgr *, struct local_binding_data *,
                           const struct sbrec_chassis *chassis,
                           const struct ovsrec_interface_table *iface_table,
                           const struct sbrec_port_binding_table *pb_table,
+                          const struct hmap *local_datapaths,
+                          const struct sset *waiting_sb_update,
                           bool ovs_readonly,
                           bool sb_readonly);
 void if_status_mgr_run(struct if_status_mgr *mgr, struct local_binding_data *,
diff --git a/controller/ovn-controller.c b/controller/ovn-controller.c
index da43051ed..a25892056 100644
--- a/controller/ovn-controller.c
+++ b/controller/ovn-controller.c
@@ -1511,6 +1511,7 @@ en_runtime_data_clear_tracked_data(void *data_)
 }
 
 static void *
+
 en_runtime_data_init(struct engine_node *node OVS_UNUSED,
                      struct engine_arg *arg OVS_UNUSED)
 {
@@ -7596,6 +7597,8 @@ main(int argc, char *argv[])
     int ovs_txn_status = 1;
     bool sb_monitor_all = false;
     struct tracked_acl_ids *tracked_acl_ids = NULL;
+    struct sset waiting_sb_update;
+    sset_init(&waiting_sb_update);
     while (!exit_args.exiting) {
         ovsrcu_quiesce_end();
 
@@ -7842,6 +7845,7 @@ main(int argc, char *argv[])
 
                     bool recompute_allowed = (ovnsb_idl_txn &&
                                               !ofctrl_has_backlog());
+
                     engine_run(recompute_allowed);
                     tracked_acl_ids = engine_get_data(&en_acl_id);
 
@@ -7951,6 +7955,9 @@ main(int argc, char *argv[])
                                    sbrec_mirror_table_get(ovnsb_idl_loop.idl),
                                    br_int,
                                    &runtime_data->lbinding_data.bindings);
+                        if (ovnsb_cond_seqno == ovnsb_expected_cond_seqno) {
+                            sset_clear(&waiting_sb_update);
+                        }
                         /* Updating monitor conditions if runtime data or
                          * logical datapath goups changed. */
                         if (engine_node_changed(&en_runtime_data)
@@ -7973,6 +7980,23 @@ main(int argc, char *argv[])
                                  * a continuous reason for monitor updates. */
                                 daemon_started_recently_countdown();
                             }
+
+                            if (!sb_monitor_all && runtime_data) {
+                                struct hmap *tracked_dp_bindings =
+                                    &runtime_data->tracked_dp_bindings;
+                                struct tracked_datapath *tdp;
+                                HMAP_FOR_EACH_SAFE (tdp,
+                                                    node,
+                                                    tracked_dp_bindings) {
+                                    char *uuid =
+                                        uuid_to_string(&tdp->dp->header_.uuid);
+                                    if (tdp->tracked_type ==
+                                        TRACKED_RESOURCE_NEW) {
+                                        sset_add(&waiting_sb_update, uuid);
+                                    }
+                                    free(uuid);
+                                }
+                            }
                         }
                         /* If there is no new expected seqno we have finished
                          * loading all needed data from southbound. We then
@@ -8017,6 +8041,10 @@ main(int argc, char *argv[])
                                                     ovs_idl_loop.idl),
                                          sbrec_port_binding_table_get(
                                                     ovnsb_idl_loop.idl),
+                                         runtime_data ?
+                                               &runtime_data->local_datapaths
+                                               : NULL,
+                                         &waiting_sb_update,
                                          !ovs_idl_txn,
                                          !ovnsb_idl_txn);
                     stopwatch_stop(IF_STATUS_MGR_UPDATE_STOPWATCH_NAME,
diff --git a/tests/ovn-controller.at b/tests/ovn-controller.at
index c98de9bc4..9dc7555ba 100644
--- a/tests/ovn-controller.at
+++ b/tests/ovn-controller.at
@@ -3944,3 +3944,69 @@ OVN_CLEANUP([hv1], [hv2
 /already has encap ip.*cannot duplicate on/d])
 AT_CLEANUP
 ])
+
+OVN_FOR_EACH_NORTHD([
+AT_SETUP([ovn-installed])
+ovn_start
+
+net_add n1
+sim_add hv1
+
+as hv1
+ovs-vsctl add-br br-phys
+ovn_attach n1 br-phys 192.168.0.1
+ovn-appctl vlog/set dbg
+ovs-vsctl add-port br-int vif1 -- \
+    set Interface vif1 external-ids:iface-id=lsp1
+
+check ovn-nbctl ls-add ls1
+sleep_controller hv1
+check ovn-nbctl --wait=sb lsp-add ls1 lsp1 -- \
+                          lsp-set-addresses lsp1 "f0:00:00:00:00:01 10.0.0.1"
+
+sleep_sb
+wake_up_controller hv1
+
+# Wait for pflow for lsp1
+OVS_WAIT_UNTIL([
+    ofport=$(as hv1 ovs-vsctl --bare --columns ofport find Interface name=vif1)
+    echo "vif1 port=$ofport"
+    test -n "$ofport" && test 1 -le $(as hv1 ovs-ofctl dump-flows br-int | 
grep -c in_port=$ofport)
+])
+
+# If ovn-installed in ovs, all flows should be installed.
+# In that case, there should be at least one flow with lsp1 address.
+OVS_WAIT_UNTIL([
+    ovn_installed=$(as hv1 ovs-vsctl get Interface vif1 
external_ids:ovn-installed)
+    echo $ovn_installed
+    flow_count=$(as hv1 ovs-ofctl dump-flows br-int | grep -Fc "10.0.0.1")
+    # For the monitor-all=true case the flow gets installed because
+    # ovn-controller is monitoring all tables in OVN_SOUTHBOUND.
+    if test -n "$ovn_installed"; then
+        as hv1 ovs-ofctl dump-flows br-int > output
+        test $flow_count -ge 1
+    else
+        true
+    fi
+])
+
+wake_up_sb
+# After the southbound db has woken up and can send the update to the
+# ovn-controller not monitoring all tables in the southbound db it
+# should be able to install the interface.
+OVS_WAIT_UNTIL([
+    ovn_installed=$(as hv1 ovs-vsctl get Interface vif1 
external_ids:ovn-installed)
+    flow_count=$(as hv1 ovs-ofctl dump-flows br-int | grep -Fc "10.0.0.1")
+    echo "installed=$ovn_installed, count=$flow_count"
+    if test -n "$ovn_installed"; then
+        as hv1 ovs-ofctl dump-flows br-int > output
+        test $flow_count -ge 1
+    else
+        false
+    fi
+])
+wait_for_ports_up
+
+OVN_CLEANUP([hv1])
+AT_CLEANUP
+])
-- 
2.53.0

_______________________________________________
dev mailing list
[email protected]
https://mail.openvswitch.org/mailman/listinfo/ovs-dev

Reply via email to