On Fri, Sep 1, 2023 at 2:41 AM Han Zhou <hz...@ovn.org> wrote:
>
> On Fri, Aug 18, 2023 at 1:58 AM <num...@ovn.org> wrote:
> >
> > From: Numan Siddique <num...@ovn.org>
> >
> > A new engine node 'sync_to_sb_pb' is added within 'sync_to_sb'
> > node to sync NAT column of Port bindings table.  This separation
> > is required in order to add load balancer group I-P handling
> > in 'northd' engine node (which is handled in the next commit).
> >
> > 'sync_to_sb_pb' engine node can be later expanded to sync other
> > Port binding columns if required.
> >
> > Signed-off-by: Numan Siddique <num...@ovn.org>
> > ---
> >  northd/en-sync-sb.c      |  31 +++++
> >  northd/en-sync-sb.h      |   4 +
> >  northd/inc-proc-northd.c |   8 +-
> >  northd/northd.c          | 243 +++++++++++++++++++++------------------
> >  northd/northd.h          |   2 +
> >  5 files changed, 174 insertions(+), 114 deletions(-)
> >
> > diff --git a/northd/en-sync-sb.c b/northd/en-sync-sb.c
> > index 9832fce30a..552ed56452 100644
> > --- a/northd/en-sync-sb.c
> > +++ b/northd/en-sync-sb.c
> > @@ -254,6 +254,37 @@ sync_to_sb_lb_northd_handler(struct engine_node
> *node, void *data OVS_UNUSED)
> >      return false;
> >  }
> >
> > +/* sync_to_sb_pb engine node functions.
> > + * This engine node syncs the SB Port Bindings (partly).
> > + * en_northd engine create the SB Port binding rows and
> > + * updates most of the columns.
> > + * This engine node updates the port binding columns which
> > + * needs to be updated after northd engine is run.
> > + */
> > +
> > +void *
> > +en_sync_to_sb_pb_init(struct engine_node *node OVS_UNUSED,
> > +                      struct engine_arg *arg OVS_UNUSED)
> > +{
> > +    return NULL;
> > +}
> > +
> > +void
> > +en_sync_to_sb_pb_run(struct engine_node *node, void *data OVS_UNUSED)
> > +{
> > +    const struct engine_context *eng_ctx = engine_get_context();
> > +    struct northd_data *northd_data = engine_get_input_data("northd",
> node);
> > +
> > +    sync_pbs(eng_ctx->ovnsb_idl_txn, &northd_data->ls_ports);
> > +    engine_set_node_state(node, EN_UPDATED);
> > +}
> > +
> > +void
> > +en_sync_to_sb_pb_cleanup(void *data OVS_UNUSED)
> > +{
> > +
> > +}
> > +
> >  /* static functions. */
> >  static void
> >  sync_addr_set(struct ovsdb_idl_txn *ovnsb_txn, const char *name,
> > diff --git a/northd/en-sync-sb.h b/northd/en-sync-sb.h
> > index 06d2a57710..700d3340e4 100644
> > --- a/northd/en-sync-sb.h
> > +++ b/northd/en-sync-sb.h
> > @@ -22,4 +22,8 @@ void en_sync_to_sb_lb_run(struct engine_node *, void
> *data);
> >  void en_sync_to_sb_lb_cleanup(void *data);
> >  bool sync_to_sb_lb_northd_handler(struct engine_node *, void *data
> OVS_UNUSED);
> >
> > +void *en_sync_to_sb_pb_init(struct engine_node *, struct engine_arg *);
> > +void en_sync_to_sb_pb_run(struct engine_node *, void *data);
> > +void en_sync_to_sb_pb_cleanup(void *data);
> > +
> >  #endif /* end of EN_SYNC_SB_H */
> > diff --git a/northd/inc-proc-northd.c b/northd/inc-proc-northd.c
> > index 402c94e88c..dc8b880fd8 100644
> > --- a/northd/inc-proc-northd.c
> > +++ b/northd/inc-proc-northd.c
> > @@ -141,6 +141,7 @@ static ENGINE_NODE(sync_to_sb_addr_set,
> "sync_to_sb_addr_set");
> >  static ENGINE_NODE(fdb_aging, "fdb_aging");
> >  static ENGINE_NODE(fdb_aging_waker, "fdb_aging_waker");
> >  static ENGINE_NODE(sync_to_sb_lb, "sync_to_sb_lb");
> > +static ENGINE_NODE(sync_to_sb_pb, "sync_to_sb_pb");
> >  static ENGINE_NODE_WITH_CLEAR_TRACK_DATA(lb_data, "lb_data");
> >
> >  void inc_proc_northd_init(struct ovsdb_idl_loop *nb,
> > @@ -215,13 +216,16 @@ void inc_proc_northd_init(struct ovsdb_idl_loop *nb,
> >                       sync_to_sb_lb_northd_handler);
> >      engine_add_input(&en_sync_to_sb_lb, &en_sb_load_balancer, NULL);
> >
> > +    engine_add_input(&en_sync_to_sb_pb, &en_northd, NULL);
>
> NULL handler here always triggers recompute for any en_northd change, which
> causes a performance regression for VIF I-P. Before this change, only
> tracked LSP changes will have related SB port-binding synced to SB, but now
> it iterates through all the ls_ports and resync each of them even if there
> is only one LSP in tracked_changes.
>
> I ran the scale test of the simulated ovn-k8s topology of 500 chassis x 50
> lsp, for each single VIF creation/deletion the "ovn-northd completion" time
> increased from 25ms to 40ms - nearly doubled.
>
> I think a simple handler can be implemented so that only sync tracked LSPs,
> and fallback to recompute only if changes are not tracked.

Thanks for the reviews.  I've added a handler in v7.  Please take a look.

Thanks
Numan

>
> Thanks,
> Han
>
> > +
> >      /* en_sync_to_sb engine node syncs the SB database tables from
> >       * the NB database tables.
> > -     * Right now this engine syncs the SB Address_Set table and
> > -     * SB Load_Balancer table.
> > +     * Right now this engine syncs the SB Address_Set table,
> > +     * SB Load_Balancer table and (partly) SB Port_Binding table.
> >       */
> >      engine_add_input(&en_sync_to_sb, &en_sync_to_sb_addr_set, NULL);
> >      engine_add_input(&en_sync_to_sb, &en_sync_to_sb_lb, NULL);
> > +    engine_add_input(&en_sync_to_sb, &en_sync_to_sb_pb, NULL);
> >
> >      engine_add_input(&en_sync_from_sb, &en_northd,
> >                       sync_from_sb_northd_handler);
> > diff --git a/northd/northd.c b/northd/northd.c
> > index 1477b79331..a3bd21e0b4 100644
> > --- a/northd/northd.c
> > +++ b/northd/northd.c
> > @@ -3514,8 +3514,6 @@ ovn_port_update_sbrec(struct ovsdb_idl_txn
> *ovnsb_txn,
> >          ds_destroy(&s);
> >
> >          sbrec_port_binding_set_external_ids(op->sb,
> &op->nbrp->external_ids);
> > -
> > -        sbrec_port_binding_set_nat_addresses(op->sb, NULL, 0);
> >      } else {
> >          if (!lsp_is_router(op->nbsp)) {
> >              uint32_t queue_id = smap_get_int(
> > @@ -3631,116 +3629,6 @@ ovn_port_update_sbrec(struct ovsdb_idl_txn
> *ovnsb_txn,
> >              } else {
> >                  sbrec_port_binding_set_options(op->sb, NULL);
> >              }
> > -            const char *nat_addresses = smap_get(&op->nbsp->options,
> > -                                           "nat-addresses");
> > -            size_t n_nats = 0;
> > -            char **nats = NULL;
> > -            bool l3dgw_ports = op->peer && op->peer->od &&
> > -                               op->peer->od->n_l3dgw_ports;
> > -            if (nat_addresses && !strcmp(nat_addresses, "router")) {
> > -                if (op->peer && op->peer->od
> > -                    && (chassis || op->peer->od->n_l3dgw_ports)) {
> > -                    bool exclude_lb_vips =
> smap_get_bool(&op->nbsp->options,
> > -                            "exclude-lb-vips-from-garp", false);
> > -                    nats = get_nat_addresses(op->peer, &n_nats, false,
> > -                                             !exclude_lb_vips);
> > -                }
> > -            } else if (nat_addresses && (chassis || l3dgw_ports)) {
> > -                struct lport_addresses laddrs;
> > -                if (!extract_lsp_addresses(nat_addresses, &laddrs)) {
> > -                    static struct vlog_rate_limit rl =
> > -                        VLOG_RATE_LIMIT_INIT(1, 1);
> > -                    VLOG_WARN_RL(&rl, "Error extracting nat-addresses.");
> > -                } else {
> > -                    destroy_lport_addresses(&laddrs);
> > -                    n_nats = 1;
> > -                    nats = xcalloc(1, sizeof *nats);
> > -                    struct ds nat_addr = DS_EMPTY_INITIALIZER;
> > -                    ds_put_format(&nat_addr, "%s", nat_addresses);
> > -                    if (l3dgw_ports) {
> > -                        const struct ovn_port *l3dgw_port = (
> > -                            is_l3dgw_port(op->peer)
> > -                            ? op->peer
> > -                            : op->peer->od->l3dgw_ports[0]);
> > -                        ds_put_format(&nat_addr, "
> is_chassis_resident(%s)",
> > -                            l3dgw_port->cr_port->json_key);
> > -                    }
> > -                    nats[0] = xstrdup(ds_cstr(&nat_addr));
> > -                    ds_destroy(&nat_addr);
> > -                }
> > -            }
> > -
> > -            /* Add the router mac and IPv4 addresses to
> > -             * Port_Binding.nat_addresses so that GARP is sent for these
> > -             * IPs by the ovn-controller on which the distributed gateway
> > -             * router port resides if:
> > -             *
> > -             * -  op->peer has 'reside-on-redirect-chassis' set and the
> > -             *    the logical router datapath has distributed router
> port.
> > -             *
> > -             * -  op->peer is distributed gateway router port.
> > -             *
> > -             * -  op->peer's router is a gateway router and op has a
> localnet
> > -             *    port.
> > -             *
> > -             * Note: Port_Binding.nat_addresses column is also used for
> > -             * sending the GARPs for the router port IPs.
> > -             * */
> > -            bool add_router_port_garp = false;
> > -            if (op->peer && op->peer->nbrp &&
> op->peer->od->n_l3dgw_ports) {
> > -                if (is_l3dgw_port(op->peer)) {
> > -                    add_router_port_garp = true;
> > -                } else if (smap_get_bool(&op->peer->nbrp->options,
> > -                               "reside-on-redirect-chassis", false)) {
> > -                    if (op->peer->od->n_l3dgw_ports == 1) {
> > -                        add_router_port_garp = true;
> > -                    } else {
> > -                        static struct vlog_rate_limit rl =
> > -                            VLOG_RATE_LIMIT_INIT(1, 1);
> > -                        VLOG_WARN_RL(&rl,
> "\"reside-on-redirect-chassis\" is "
> > -                                     "set on logical router port %s,
> which "
> > -                                     "is on logical router %s, which has
> %"
> > -                                     PRIuSIZE" distributed gateway
> ports. This"
> > -                                     "option can only be used when there
> is "
> > -                                     "a single distributed gateway
> port.",
> > -                                     op->peer->key,
> op->peer->od->nbr->name,
> > -                                     op->peer->od->n_l3dgw_ports);
> > -                    }
> > -                }
> > -            } else if (chassis && op->od->n_localnet_ports) {
> > -                add_router_port_garp = true;
> > -            }
> > -
> > -            if (add_router_port_garp) {
> > -                struct ds garp_info = DS_EMPTY_INITIALIZER;
> > -                ds_put_format(&garp_info, "%s",
> op->peer->lrp_networks.ea_s);
> > -
> > -                for (size_t i = 0; i <
> op->peer->lrp_networks.n_ipv4_addrs;
> > -                     i++) {
> > -                    ds_put_format(&garp_info, " %s",
> > -
>  op->peer->lrp_networks.ipv4_addrs[i].addr_s);
> > -                }
> > -
> > -                if (op->peer->od->n_l3dgw_ports) {
> > -                    const struct ovn_port *l3dgw_port = (
> > -                        is_l3dgw_port(op->peer)
> > -                        ? op->peer
> > -                        : op->peer->od->l3dgw_ports[0]);
> > -                    ds_put_format(&garp_info, " is_chassis_resident(%s)",
> > -                                  l3dgw_port->cr_port->json_key);
> > -                }
> > -
> > -                n_nats++;
> > -                nats = xrealloc(nats, (n_nats * sizeof *nats));
> > -                nats[n_nats - 1] = ds_steal_cstr(&garp_info);
> > -                ds_destroy(&garp_info);
> > -            }
> > -            sbrec_port_binding_set_nat_addresses(op->sb,
> > -                                                 (const char **) nats,
> n_nats);
> > -            for (size_t i = 0; i < n_nats; i++) {
> > -                free(nats[i]);
> > -            }
> > -            free(nats);
> >          }
> >
> >          sbrec_port_binding_set_parent_port(op->sb,
> op->nbsp->parent_name);
> > @@ -4695,6 +4583,137 @@ sync_lbs(struct ovsdb_idl_txn *ovnsb_txn,
> >      }
> >  }
> >
> > +/* Sync the SB Port bindings which needs to be updated.
> > + * Presently it syncs the nat column of port bindings corresponding to
> > + * the logical switch ports. */
> > +void sync_pbs(struct ovsdb_idl_txn *ovnsb_idl_txn, struct hmap *ls_ports)
> > +{
> > +    ovs_assert(ovnsb_idl_txn);
> > +
> > +    struct ovn_port *op;
> > +    HMAP_FOR_EACH (op, key_node, ls_ports) {
> > +        if (lsp_is_router(op->nbsp)) {
> > +            const char *chassis = NULL;
> > +            if (op->peer && op->peer->od && op->peer->od->nbr) {
> > +                chassis = smap_get(&op->peer->od->nbr->options,
> "chassis");
> > +            }
> > +
> > +            const char *nat_addresses = smap_get(&op->nbsp->options,
> > +                                                 "nat-addresses");
> > +            size_t n_nats = 0;
> > +            char **nats = NULL;
> > +            bool l3dgw_ports = op->peer && op->peer->od &&
> > +                               op->peer->od->n_l3dgw_ports;
> > +            if (nat_addresses && !strcmp(nat_addresses, "router")) {
> > +                if (op->peer && op->peer->od
> > +                    && (chassis || op->peer->od->n_l3dgw_ports)) {
> > +                    bool exclude_lb_vips =
> smap_get_bool(&op->nbsp->options,
> > +                            "exclude-lb-vips-from-garp", false);
> > +                    nats = get_nat_addresses(op->peer, &n_nats, false,
> > +                                             !exclude_lb_vips);
> > +                }
> > +            } else if (nat_addresses && (chassis || l3dgw_ports)) {
> > +                struct lport_addresses laddrs;
> > +                if (!extract_lsp_addresses(nat_addresses, &laddrs)) {
> > +                    static struct vlog_rate_limit rl =
> > +                        VLOG_RATE_LIMIT_INIT(1, 1);
> > +                    VLOG_WARN_RL(&rl, "Error extracting nat-addresses.");
> > +                } else {
> > +                    destroy_lport_addresses(&laddrs);
> > +                    n_nats = 1;
> > +                    nats = xcalloc(1, sizeof *nats);
> > +                    struct ds nat_addr = DS_EMPTY_INITIALIZER;
> > +                    ds_put_format(&nat_addr, "%s", nat_addresses);
> > +                    if (l3dgw_ports) {
> > +                        const struct ovn_port *l3dgw_port = (
> > +                            is_l3dgw_port(op->peer)
> > +                            ? op->peer
> > +                            : op->peer->od->l3dgw_ports[0]);
> > +                        ds_put_format(&nat_addr, "
> is_chassis_resident(%s)",
> > +                            l3dgw_port->cr_port->json_key);
> > +                    }
> > +                    nats[0] = xstrdup(ds_cstr(&nat_addr));
> > +                    ds_destroy(&nat_addr);
> > +                }
> > +            }
> > +
> > +            /* Add the router mac and IPv4 addresses to
> > +             * Port_Binding.nat_addresses so that GARP is sent for these
> > +             * IPs by the ovn-controller on which the distributed gateway
> > +             * router port resides if:
> > +             *
> > +             * -  op->peer has 'reside-on-redirect-chassis' set and the
> > +             *    the logical router datapath has distributed router
> port.
> > +             *
> > +             * -  op->peer is distributed gateway router port.
> > +             *
> > +             * -  op->peer's router is a gateway router and op has a
> localnet
> > +             *    port.
> > +             *
> > +             * Note: Port_Binding.nat_addresses column is also used for
> > +             * sending the GARPs for the router port IPs.
> > +             * */
> > +            bool add_router_port_garp = false;
> > +            if (op->peer && op->peer->nbrp &&
> op->peer->od->n_l3dgw_ports) {
> > +                if (is_l3dgw_port(op->peer)) {
> > +                    add_router_port_garp = true;
> > +                } else if (smap_get_bool(&op->peer->nbrp->options,
> > +                               "reside-on-redirect-chassis", false)) {
> > +                    if (op->peer->od->n_l3dgw_ports == 1) {
> > +                        add_router_port_garp = true;
> > +                    } else {
> > +                        static struct vlog_rate_limit rl =
> > +                            VLOG_RATE_LIMIT_INIT(1, 1);
> > +                        VLOG_WARN_RL(&rl,
> "\"reside-on-redirect-chassis\" is "
> > +                                     "set on logical router port %s,
> which "
> > +                                     "is on logical router %s, which has
> %"
> > +                                     PRIuSIZE" distributed gateway
> ports. This"
> > +                                     "option can only be used when there
> is "
> > +                                     "a single distributed gateway
> port.",
> > +                                     op->peer->key,
> op->peer->od->nbr->name,
> > +                                     op->peer->od->n_l3dgw_ports);
> > +                    }
> > +                }
> > +            } else if (chassis && op->od->n_localnet_ports) {
> > +                add_router_port_garp = true;
> > +            }
> > +
> > +            if (add_router_port_garp) {
> > +                struct ds garp_info = DS_EMPTY_INITIALIZER;
> > +                ds_put_format(&garp_info, "%s",
> op->peer->lrp_networks.ea_s);
> > +
> > +                for (size_t i = 0; i <
> op->peer->lrp_networks.n_ipv4_addrs;
> > +                     i++) {
> > +                    ds_put_format(&garp_info, " %s",
> > +
>  op->peer->lrp_networks.ipv4_addrs[i].addr_s);
> > +                }
> > +
> > +                if (op->peer->od->n_l3dgw_ports) {
> > +                    const struct ovn_port *l3dgw_port = (
> > +                        is_l3dgw_port(op->peer)
> > +                        ? op->peer
> > +                        : op->peer->od->l3dgw_ports[0]);
> > +                    ds_put_format(&garp_info, " is_chassis_resident(%s)",
> > +                                  l3dgw_port->cr_port->json_key);
> > +                }
> > +
> > +                n_nats++;
> > +                nats = xrealloc(nats, (n_nats * sizeof *nats));
> > +                nats[n_nats - 1] = ds_steal_cstr(&garp_info);
> > +                ds_destroy(&garp_info);
> > +            }
> > +            sbrec_port_binding_set_nat_addresses(op->sb,
> > +                                                 (const char **) nats,
> n_nats);
> > +            for (size_t i = 0; i < n_nats; i++) {
> > +                free(nats[i]);
> > +            }
> > +            free(nats);
> > +        } else {
> > +            sbrec_port_binding_set_nat_addresses(op->sb, NULL, 0);
> > +        }
> > +    }
> > +}
> > +
> >  static bool
> >  ovn_port_add_tnlid(struct ovn_port *op, uint32_t tunnel_key)
> >  {
> > diff --git a/northd/northd.h b/northd/northd.h
> > index 044d4ee0c0..cd2e5394c2 100644
> > --- a/northd/northd.h
> > +++ b/northd/northd.h
> > @@ -374,4 +374,6 @@ const char *northd_get_svc_monitor_mac(void);
> >  void sync_lbs(struct ovsdb_idl_txn *, const struct
> sbrec_load_balancer_table *,
> >                struct ovn_datapaths *ls_datapaths, struct hmap *lbs);
> >
> > +void sync_pbs(struct ovsdb_idl_txn *, struct hmap *ls_ports);
> > +
> >  #endif /* NORTHD_H */
> > --
> > 2.40.1
> >
> > _______________________________________________
> > dev mailing list
> > d...@openvswitch.org
> > https://mail.openvswitch.org/mailman/listinfo/ovs-dev
> _______________________________________________
> dev mailing list
> d...@openvswitch.org
> https://mail.openvswitch.org/mailman/listinfo/ovs-dev
_______________________________________________
dev mailing list
d...@openvswitch.org
https://mail.openvswitch.org/mailman/listinfo/ovs-dev

Reply via email to