On Mon, Feb 03, 2025 at 04:04:30PM +0100, Dumitru Ceara wrote:
> On 1/31/25 4:05 PM, Dumitru Ceara wrote:
> > On 1/29/25 12:15 PM, Felix Huettner via dev wrote:
> >> For each vrf we use we open a netlink watcher.
> >> This allows us to reconcile on changed route entries from outside
> >> routing agents.
> >>
> >> Signed-off-by: Felix Huettner <felix.huettner@stackit.cloud>
> >> ---
> > 
> > Hi Felix,
> > 
> > This is not a full review, just some things I noticed while trying to
> > debug some test failures.
> > 
> 
> This is a follow up which includes the rest of the review. :)

Hi Dumitru,

thanks a lot for the reviews.

> 
> >>  controller/automake.mk               |   7 +-
> >>  controller/ovn-controller.c          |  48 ++++++-
> >>  controller/route-exchange.c          |   6 +-
> >>  controller/route-exchange.h          |   3 +
> >>  controller/route-table-notify-stub.c |  44 +++++++
> >>  controller/route-table-notify.c      | 179 +++++++++++++++++++++++++++
> >>  controller/route-table-notify.h      |  37 ++++++
> >>  tests/system-ovn.at                  |   4 -
> >>  8 files changed, 319 insertions(+), 9 deletions(-)
> >>  create mode 100644 controller/route-table-notify-stub.c
> >>  create mode 100644 controller/route-table-notify.c
> >>  create mode 100644 controller/route-table-notify.h
> >>
> >> diff --git a/controller/automake.mk b/controller/automake.mk
> >> index 66aff8643..df24a674f 100644
> >> --- a/controller/automake.mk
> >> +++ b/controller/automake.mk
> >> @@ -53,6 +53,7 @@ controller_ovn_controller_SOURCES = \
> >>    controller/ovn-dns.c \
> >>    controller/ovn-dns.h \
> >>    controller/route-exchange.h \
> >> +  controller/route-table-notify.h \
> >>    controller/route.h \
> >>    controller/route.c
> >>  
> >> @@ -60,10 +61,12 @@ if HAVE_NETLINK
> >>  controller_ovn_controller_SOURCES += \
> >>    controller/route-exchange-netlink.h \
> >>    controller/route-exchange-netlink.c \
> >> -  controller/route-exchange.c
> >> +  controller/route-exchange.c \
> >> +  controller/route-table-notify.c
> >>  else
> >>  controller_ovn_controller_SOURCES += \
> >> -  controller/route-exchange-stub.c
> >> +  controller/route-exchange-stub.c \
> >> +  controller/route-table-notify-stub.c
> >>  endif
> >>  
> >>  controller_ovn_controller_LDADD = lib/libovn.la 
> >> $(OVS_LIBDIR)/libopenvswitch.la
> >> diff --git a/controller/ovn-controller.c b/controller/ovn-controller.c
> >> index 612fccb42..70c3a5d1a 100644
> >> --- a/controller/ovn-controller.c
> >> +++ b/controller/ovn-controller.c
> >> @@ -90,6 +90,7 @@
> >>  #include "ovn-dns.h"
> >>  #include "route.h"
> >>  #include "route-exchange.h"
> >> +#include "route-table-notify.h"
> >>  
> >>  VLOG_DEFINE_THIS_MODULE(main);
> >>  
> >> @@ -5104,10 +5105,14 @@ en_route_exchange_run(struct engine_node *node, 
> >> void *data)
> >>          .announce_routes = &route_data->announce_routes,
> >>      };
> >>  
> >> -    struct route_exchange_ctx_out r_ctx_out = {
> >> -    };
> >> +    struct route_exchange_ctx_out r_ctx_out = {};
> >> +
> >> +    hmap_init(&r_ctx_out.route_table_watches);
> >>  
> >>      route_exchange_run(&r_ctx_in, &r_ctx_out);
> >> +    route_table_notify_update_watches(&r_ctx_out.route_table_watches);
> >> +
> >> +    hmap_destroy(&r_ctx_out.route_table_watches);
> >>  
> >>      engine_set_node_state(node, EN_UPDATED);
> >>  }
> >> @@ -5126,6 +5131,38 @@ static void
> >>  en_route_exchange_cleanup(void *data OVS_UNUSED)
> >>  {}
> >>  
> >> +struct ed_type_route_table_notify {
> >> +    /* For incremental processing this could be tracked per datapath in
> >> +     * the future. */
> >> +    bool changed;
> >> +};
> >> +
> >> +static void
> >> +en_route_table_notify_run(struct engine_node *node, void *data)
> >> +{
> >> +    struct ed_type_route_table_notify *rtn = data;
> >> +    if (rtn->changed) {
> >> +        engine_set_node_state(node, EN_UPDATED);
> >> +    } else {
> >> +        engine_set_node_state(node, EN_UNCHANGED);
> >> +    }
> >> +    rtn->changed = false;
> >> +}
> >> +
> >> +
> >> +static void *
> >> +en_route_table_notify_init(struct engine_node *node OVS_UNUSED,
> >> +                       struct engine_arg *arg OVS_UNUSED)
> >> +{
> >> +    struct ed_type_route_table_notify *rtn = xzalloc(sizeof *rtn);
> >> +    rtn->changed = true;
> >> +    return rtn;
> >> +}
> >> +
> >> +static void
> >> +en_route_table_notify_cleanup(void *data OVS_UNUSED)
> >> +{}
> >> +
> >>  /* Returns false if the northd internal version stored in SB_Global
> >>   * and ovn-controller internal version don't match.
> >>   */
> >> @@ -5425,6 +5462,7 @@ main(int argc, char *argv[])
> >>      ENGINE_NODE(bfd_chassis, "bfd_chassis");
> >>      ENGINE_NODE(dns_cache, "dns_cache");
> >>      ENGINE_NODE(route, "route");
> >> +    ENGINE_NODE(route_table_notify, "route_table_notify");
> >>      ENGINE_NODE(route_exchange, "route_exchange");
> >>  
> >>  #define SB_NODE(NAME, NAME_STR) ENGINE_NODE_SB(NAME, NAME_STR);
> >> @@ -5462,6 +5500,7 @@ main(int argc, char *argv[])
> >>                       engine_noop_handler);
> >>      engine_add_input(&en_route_exchange, &en_sb_port_binding,
> >>                       engine_noop_handler);
> >> +    engine_add_input(&en_route_exchange, &en_route_table_notify, NULL);
> > 
> > I know we for now we didn't really cover the route learning/advertising
> > incremental processing part but this dependency here will cause
> > en_route_exchange_run() to execute every time anything changes in the
> > host routing.
> > 
> >>  
> >>      engine_add_input(&en_addr_sets, &en_sb_address_set,
> >>                       addr_sets_sb_address_set_handler);
> >> @@ -5979,6 +6018,10 @@ main(int argc, char *argv[])
> >>                                 &transport_zones,
> >>                                 bridge_table);
> >>  
> >> +                    struct ed_type_route_table_notify *rtn =
> >> +                        engine_get_internal_data(&en_route_table_notify);
> >> +                    route_table_notify_run(&rtn->changed);
> >> +
> >>                      stopwatch_start(CONTROLLER_LOOP_STOPWATCH_NAME,
> >>                                      time_msec());
> >>  
> >> @@ -6254,6 +6297,7 @@ main(int argc, char *argv[])
> >>              }
> >>  
> >>              binding_wait();
> >> +            route_table_notify_wait();
> >>          }
> >>  
> >>          unixctl_server_run(unixctl);
> >> diff --git a/controller/route-exchange.c b/controller/route-exchange.c
> >> index dc3e5657c..e7a85eecf 100644
> >> --- a/controller/route-exchange.c
> >> +++ b/controller/route-exchange.c
> >> @@ -29,6 +29,7 @@
> >>  #include "ha-chassis.h"
> >>  #include "local_data.h"
> >>  #include "route.h"
> >> +#include "route-table-notify.h"
> >>  #include "route-exchange.h"
> >>  #include "route-exchange-netlink.h"
> >>  
> >> @@ -169,7 +170,7 @@ sb_sync_learned_routes(const struct ovs_list 
> >> *learned_routes,
> >>  
> >>  void
> >>  route_exchange_run(struct route_exchange_ctx_in *r_ctx_in,
> >> -                   struct route_exchange_ctx_out *r_ctx_out OVS_UNUSED)
> >> +                   struct route_exchange_ctx_out *r_ctx_out)
> >>  {
> >>      struct sset old_maintained_vrfs = 
> >> SSET_INITIALIZER(&old_maintained_vrfs);
> >>      sset_swap(&_maintained_vrfs, &old_maintained_vrfs);
> >> @@ -211,6 +212,9 @@ route_exchange_run(struct route_exchange_ctx_in 
> >> *r_ctx_in,
> >>                                 r_ctx_in->sbrec_port_binding_by_name,
> >>                                 r_ctx_in->sbrec_learned_route_by_datapath);
> >>  
> >> +        route_table_add_watch_request(
> >> +            &r_ctx_out->route_table_watches, table_id);
> >> +
> >>          re_nl_learned_routes_destroy(&received_routes);
> >>      }
> >>  
> >> diff --git a/controller/route-exchange.h b/controller/route-exchange.h
> >> index d23bb37a2..0eb0477ee 100644
> >> --- a/controller/route-exchange.h
> >> +++ b/controller/route-exchange.h
> >> @@ -18,6 +18,8 @@
> >>  #ifndef ROUTE_EXCHANGE_H
> >>  #define ROUTE_EXCHANGE_H 1
> >>  
> >> +#include "openvswitch/hmap.h"
> >> +
> >>  struct route_exchange_ctx_in {
> >>      struct ovsdb_idl_txn *ovnsb_idl_txn;
> >>      struct ovsdb_idl_index *sbrec_port_binding_by_name;
> >> @@ -27,6 +29,7 @@ struct route_exchange_ctx_in {
> >>  };
> >>  
> >>  struct route_exchange_ctx_out {
> >> +    struct hmap route_table_watches;
> >>  };
> >>  
> >>  void route_exchange_run(struct route_exchange_ctx_in *,
> >> diff --git a/controller/route-table-notify-stub.c 
> >> b/controller/route-table-notify-stub.c
> >> new file mode 100644
> >> index 000000000..0a83a3e93
> >> --- /dev/null
> >> +++ b/controller/route-table-notify-stub.c
> >> @@ -0,0 +1,44 @@
> >> +/*
> >> + * Copyright (c) 2024, STACKIT GmbH & Co. KG
> > 
> > 2025
> > 
> >> + *
> >> + * Licensed under the Apache License, Version 2.0 (the "License");
> >> + * you may not use this file except in compliance with the License.
> >> + * You may obtain a copy of the License at:
> >> + *
> >> + *     http://www.apache.org/licenses/LICENSE-2.0
> >> + *
> >> + * Unless required by applicable law or agreed to in writing, software
> >> + * distributed under the License is distributed on an "AS IS" BASIS,
> >> + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or 
> >> implied.
> >> + * See the License for the specific language governing permissions and
> >> + * limitations under the License.
> >> + */
> >> +
> >> +#include <config.h>
> >> +
> >> +#include <stdbool.h>
> >> +
> >> +#include "openvswitch/compiler.h"
> >> +#include "route-table-notify.h"
> >> +
> >> +void
> >> +route_table_notify_run(bool *changed)
> >> +{
> >> +    *changed = false;
> >> +}
> >> +
> >> +void
> >> +route_table_notify_wait(void)
> >> +{
> >> +}
> >> +
> >> +void
> >> +route_table_add_watch_request(struct hmap *route_table_watches OVS_UNUSED,
> >> +                              uint32_t table_id OVS_UNUSED) {
> >> +}
> >> +
> >> +void
> >> +route_table_notify_update_watches(struct hmap *route_table_watches 
> >> OVS_UNUSED)
> >> +{
> >> +}
> >> +
> >> diff --git a/controller/route-table-notify.c 
> >> b/controller/route-table-notify.c
> >> new file mode 100644
> >> index 000000000..0d931e133
> >> --- /dev/null
> >> +++ b/controller/route-table-notify.c
> >> @@ -0,0 +1,179 @@
> >> +/*
> >> + * Copyright (c) 2024, STACKIT GmbH & Co. KG
> > 
> > 2025
> > 
> >> + *
> >> + * Licensed under the Apache License, Version 2.0 (the "License");
> >> + * you may not use this file except in compliance with the License.
> >> + * You may obtain a copy of the License at:
> >> + *
> >> + *     http://www.apache.org/licenses/LICENSE-2.0
> >> + *
> >> + * Unless required by applicable law or agreed to in writing, software
> >> + * distributed under the License is distributed on an "AS IS" BASIS,
> >> + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or 
> >> implied.
> >> + * See the License for the specific language governing permissions and
> >> + * limitations under the License.
> >> + */
> >> +
> >> +#include <config.h>
> >> +
> >> +#include <net/if.h>
> >> +#include <linux/rtnetlink.h>
> >> +
> >> +#include "netlink-notifier.h"
> >> +#include "openvswitch/vlog.h"
> >> +
> >> +#include "binding.h"
> >> +#include "hash.h"
> >> +#include "hmapx.h"
> >> +#include "route-table.h"
> >> +#include "route.h"
> >> +#include "route-table-notify.h"
> >> +#include "route-exchange-netlink.h"
> >> +
> >> +VLOG_DEFINE_THIS_MODULE(route_table_notify);
> >> +
> >> +struct route_table_watch_request {
> >> +    struct hmap_node node;
> >> +    uint32_t table_id;
> >> +};
> >> +
> >> +struct route_table_watch_entry {
> >> +    struct hmap_node node;
> >> +    uint32_t table_id;
> >> +    struct nln *nln;
> >> +    struct nln_notifier *route_notifier;
> >> +    struct nln_notifier *route6_notifier;
> >> +};
> >> +
> >> +static struct hmap watches = HMAP_INITIALIZER(&watches);
> >> +static bool any_route_table_changed;
> >> +static struct route_table_msg rtmsg;
> >> +
> >> +static uint32_t
> >> +route_table_notify_hash_watch(uint32_t table_id)
> >> +{
> >> +    return hash_add(0, table_id);
> >> +}
> >> +
> >> +void
> >> +route_table_add_watch_request(struct hmap *route_table_watches,
> >> +                              uint32_t table_id)
> >> +{
> >> +    struct route_table_watch_request *wr = xzalloc(sizeof *wr);
> >> +    wr->table_id = table_id;
> >> +    hmap_insert(route_table_watches, &wr->node,
> >> +                route_table_notify_hash_watch(wr->table_id));
> >> +}
> >> +
> >> +static void
> >> +route_table_change(const void *change_, void *aux OVS_UNUSED)
> >> +{
> >> +    const struct route_table_msg *change = change_;
> >> +    if (change && change->rd.rtm_protocol != RTPROT_OVN) {
> >> +        any_route_table_changed = true;
> >> +    }
> >> +}
> > 
> > What do you think of this to avoid having to do en_route_exchange_run()
> > for each and every host route table change?
> > 
> > static void
> > route_table_change(const void *change_, void *aux OVS_UNUSED)
> > {
> >     const struct route_table_msg *change = change_;
> >     if (change && change->rd.rtm_protocol != RTPROT_OVN) {
> >         if (find_watch_entry(change->rd.rta_table_id)) {
> >             any_route_table_changed = true;
> >         }
> >     }
> > }
> > 

Yes that makes it significantly more efficient. I'll add that.

> >> +
> >> +static void
> >> +add_watch_entry(uint32_t table_id)
> >> +{
> >> +    struct route_table_watch_entry *we;
> >> +    uint32_t hash = route_table_notify_hash_watch(table_id);
> >> +    we = xzalloc(sizeof *we);
> >> +    we->table_id = table_id;
> >> +    VLOG_INFO("Registering new route table watcher for table %d.",
> >> +             table_id);
> >> +    we->nln = nln_create(NETLINK_ROUTE, route_table_parse, &rtmsg);
> >> +
> >> +    we->route_notifier =
> >> +        nln_notifier_create(we->nln, RTNLGRP_IPV4_ROUTE,
> >> +                            route_table_change, NULL);
> >> +    if (!we->route_notifier) {
> >> +        VLOG_WARN("Failed to create ipv4 route table watcher for "
> 
> It's probably a good idea to rate limit this warning message.
> 
> >> +                  "table %d. We will miss routing table updates.", 
> >> table_id);
> >> +    }
> >> +
> >> +    we->route6_notifier =
> >> +        nln_notifier_create(we->nln, RTNLGRP_IPV6_ROUTE,
> >> +                            route_table_change, NULL);
> >> +    if (!we->route6_notifier) {
> >> +        VLOG_WARN("Failed to create ipv6 route table watcher for "
> 
> It's probably a good idea to rate limit this warning message.
> 
> >> +                  "table %d. We will miss routing table updates.", 
> >> table_id);
> >> +    }
> >> +
> >> +    hmap_insert(&watches, &we->node, hash);
> >> +}
> >> +
> >> +static void
> >> +remove_watch_entry(struct route_table_watch_entry *we)
> >> +{
> >> +    hmap_remove(&watches, &we->node);
> >> +    VLOG_INFO("Removing route table watcher for table %d.",
> >> +             we->table_id);
> 
> Nit: fits on one line.
> 
> >> +    nln_notifier_destroy(we->route_notifier);
> >> +    nln_notifier_destroy(we->route6_notifier);
> >> +    nln_destroy(we->nln);
> >> +    free(we);
> >> +}
> >> +
> >> +void
> >> +route_table_notify_run(bool *changed)
> >> +{
> >> +    any_route_table_changed = false;
> >> +
> >> +    struct route_table_watch_entry *we;
> >> +    HMAP_FOR_EACH (we, node, &watches) {
> >> +        nln_run(we->nln);
> >> +    }
> >> +
> >> +    *changed = any_route_table_changed;
> >> +}
> >> +
> >> +void
> >> +route_table_notify_wait(void)
> >> +{
> >> +    struct route_table_watch_entry *we;
> >> +    HMAP_FOR_EACH (we, node, &watches) {
> >> +        nln_wait(we->nln);
> >> +    }
> >> +}
> >> +
> >> +static struct route_table_watch_entry*
> > 
> > Nit: missing space before '*'.
> > 
> >> +find_watch_entry(uint32_t table_id)
> >> +{
> >> +    struct route_table_watch_entry *we;
> >> +    uint32_t hash = route_table_notify_hash_watch(table_id);
> >> +    HMAP_FOR_EACH_WITH_HASH (we, node, hash, &watches) {
> >> +        if (table_id == we->table_id) {
> >> +            return we;
> >> +        }
> >> +    }
> >> +    return NULL;
> >> +}
> >> +
> >> +void
> >> +route_table_notify_update_watches(struct hmap *route_table_watches)
> 
> This should be 'const struct hmap *route_table_watches'.
> 
> I know we remove from the map below but we don't have to.  This is the
> "desired" state we want to reconcile the host to.

The thing is that this hmap is just passed to here and afterwards needs
to be freed again. So i would leave this here, as we otherwise need to
have a separate loop freeing everything.

> 
> >> +{
> >> +    struct hmapx sync_watches = HMAPX_INITIALIZER(&sync_watches);
> >> +    struct route_table_watch_entry *we;
> >> +    HMAP_FOR_EACH (we, node, &watches) {
> >> +        hmapx_add(&sync_watches, we);
> >> +    }
> >> +
> >> +    struct route_table_watch_request *wr;
> >> +    HMAP_FOR_EACH_SAFE (wr, node, route_table_watches) {
> >> +        we = find_watch_entry(wr->table_id);
> >> +        if (we) {
> >> +            hmapx_find_and_delete(&sync_watches, we);
> >> +        } else {
> >> +            add_watch_entry(wr->table_id);
> >> +        }
> >> +        hmap_remove(route_table_watches, &wr->node);
> >> +        free(wr);
> 
> No need to remove here, so no need to free and that means
> HMAP_FOR_EACH() is enough.
> 
> >> +    }
> >> +
> >> +    struct hmapx_node *node;
> >> +    HMAPX_FOR_EACH (node, &sync_watches) {
> >> +        remove_watch_entry(node->data);
> >> +    }
> 
> Kind of a nit because I assume exiting the process will probably cleanup
> fine but shouldn't we remove all watch entries on exit like we do with
> other resources?

Yea, i'll add a *_destroy.

> 
> >> +}
> >> diff --git a/controller/route-table-notify.h 
> >> b/controller/route-table-notify.h
> >> new file mode 100644
> >> index 000000000..b7211f6e7
> >> --- /dev/null
> >> +++ b/controller/route-table-notify.h
> >> @@ -0,0 +1,37 @@
> >> +/*
> >> + * Copyright (c) 2024, STACKIT GmbH & Co. KG
> > 
> > 2025
> > 
> >> + *
> >> + * Licensed under the Apache License, Version 2.0 (the "License");
> >> + * you may not use this file except in compliance with the License.
> >> + * You may obtain a copy of the License at:
> >> + *
> >> + *     http://www.apache.org/licenses/LICENSE-2.0
> >> + *
> >> + * Unless required by applicable law or agreed to in writing, software
> >> + * distributed under the License is distributed on an "AS IS" BASIS,
> >> + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or 
> >> implied.
> >> + * See the License for the specific language governing permissions and
> >> + * limitations under the License.
> >> + */
> >> +
> >> +#ifndef ROUTE_TABLE_NOTIFY_H
> >> +#define ROUTE_TABLE_NOTIFY_H 1
> >> +
> >> +#include <stdbool.h>
> >> +#include "openvswitch/hmap.h"
> >> +
> >> +/* Sets "changed" to true if any route table has changed enough that we 
> >> need
> >> + * to learn new routes. */
> >> +void route_table_notify_run(bool *changed);
> 
> Why not just return true if any relevant table changed and false
> otherwise?  It feels a bit weird to do that through a 'bool *' argument.

That came from your comment at
https://patchwork.ozlabs.org/project/ovn/patch/ae5de92e1880da09e7d27770f0b0a3214f0a2985.1735830931.git.felix.huettner@stackit.cloud/
But maybe i misunderstood it?

"""
Maybe it's a bit cleaner if we pass &rtn->changed to
route_table_notify_run() instead of setting it here?
"""

But i can change it back if you want.

Thanks a lot,
Felix

> 
> >> +void route_table_notify_wait(void);
> >> +
> >> +/* Add a watch request to the hmap. The hmap should later be passed to
> >> + * route_table_notify_update_watches*/
> >> +void route_table_add_watch_request(struct hmap *route_table_watches,
> >> +                                   uint32_t table_id);
> >> +
> >> +/* Updates the list of route table watches that are currently active.
> >> + * hmap should contain struct route_table_watch_request */
> >> +void route_table_notify_update_watches(struct hmap *route_table_watches);
> >> +
> >> +#endif /* ROUTE_TABLE_NOTIFY_H */
> >> diff --git a/tests/system-ovn.at b/tests/system-ovn.at
> >> index ef43e242e..3f5672dad 100644
> >> --- a/tests/system-ovn.at
> >> +++ b/tests/system-ovn.at
> >> @@ -15075,8 +15075,6 @@ blackhole 198.51.100.0/24 proto 84 metric 1000])
> >>  # Now we test route learning.
> >>  check_row_count Learned_Route 0
> >>  check ip route add 233.252.0.0/24 via 192.168.10.10 dev lo onlink vrf 
> >> ovnvrf1337
> >> -# For now we trigger a recompute as route watching is not yet implemented.
> >> -check ovn-appctl -t ovn-controller inc-engine/recompute
> >>  check ovn-nbctl --wait=hv sync
> >>  check_row_count Learned_Route 1
> >>  lp=$(fetch_column port_binding _uuid logical_port=internet-phys)
> >> @@ -15324,8 +15322,6 @@ blackhole 198.51.100.0/24 proto 84 metric 1000])
> >>  # Now we test route learning.
> >>  check_row_count Learned_Route 0
> >>  check ip route add 233.252.0.0/24 via 192.168.10.10 dev lo onlink vrf 
> >> ovnvrf1337
> >> -# For now we trigger a recompute as route watching is not yet implemented.
> >> -check ovn-appctl -t ovn-controller inc-engine/recompute
> >>  check ovn-nbctl --wait=hv sync
> >>  check_row_count Learned_Route 1
> >>  lp=$(fetch_column port_binding _uuid logical_port=internet-phys)
> > 
> 
> Thanks,
> Dumitru
> 
_______________________________________________
dev mailing list
d...@openvswitch.org
https://mail.openvswitch.org/mailman/listinfo/ovs-dev

Reply via email to