On Fri, Sep 15, 2023 at 3:09 AM Ales Musil <[email protected]> wrote:
>
> On Fri, Sep 15, 2023 at 8:21 AM Xavier Simonart <[email protected]> wrote:
> >
> > QoS was not configured in OVS db when db was read only: the configuration
> > was just ignored and not done later when OVS db became writable.
> > It was sometimes set later, if/when a recompute happened.
> > This is now fixed: when OVS db is read only, the ports on which qos
> > must be applied are stored and qos will be applied when OVS db becomes
> > writable.
> > To avoid race conditions between delayed qos and new qos changes (e.g. a qos
> > configuration delayed in one loop as ovs is ro, followed in next loop, when
> > ovs
> > becomes rw, by another qos on the same port), all qos changes are done at
> > the
> > same time.
> >
> > This issue was identified by some random failures in system test
> > "egress qos".
> >
> > Signed-off-by: Xavier Simonart <[email protected]>
>
> Hi Xavier,
>
> I believe that we are missing Reported-at:
> https://bugzilla.redhat.com/2234349.
I added this tag to the commit message and applied the patch to main
and branch-23.09.
Let me know if this needs to be backported further down.
Thanks
Numan
>
> >
> > ---
> > v2: - rebased on origin/main
> > - handled comments from Ales
> > ---
> > controller/binding.c | 133 ++++++++++++++++++++++++------------
> > controller/binding.h | 8 +++
> > controller/ovn-controller.c | 7 ++
> > tests/ovn.at | 1 -
> > tests/system-ovn.at | 22 ++++++
> > 5 files changed, 125 insertions(+), 46 deletions(-)
> >
> > diff --git a/controller/binding.c b/controller/binding.c
> > index a521f2828..fd08aaafa 100644
> > --- a/controller/binding.c
> > +++ b/controller/binding.c
> > @@ -55,8 +55,13 @@ struct claimed_port {
> > long long int last_claimed;
> > };
> >
> > +struct qos_port {
> > + bool added;
> > +};
> > +
> > static struct shash _claimed_ports = SHASH_INITIALIZER(&_claimed_ports);
> > static struct sset _postponed_ports = SSET_INITIALIZER(&_postponed_ports);
> > +static struct shash _qos_ports = SHASH_INITIALIZER(&_qos_ports);
> >
> > static void
> > remove_additional_chassis(const struct sbrec_port_binding *pb,
> > @@ -218,6 +223,17 @@ get_qos_egress_port_interface(struct shash
> > *bridge_mappings,
> > return NULL;
> > }
> >
> > +static void
> > +add_or_del_qos_port(const char *ovn_port, bool add)
> > +{
> > + struct qos_port *qos_port = shash_find_data(&_qos_ports, ovn_port);
> > + if (!qos_port) {
> > + qos_port = xzalloc(sizeof *qos_port);
> > + shash_add(&_qos_ports, ovn_port, qos_port);
> > + }
> > + qos_port->added = add;
> > +}
> > +
> > /* 34359738360 == (2^32 - 1) * 8. netdev_set_qos() doesn't support
> > * 64-bit rate netlink attributes, so the maximum value is 2^32 - 1
> > * bytes. The 'max-rate' config option is in bits, so multiplying by 8.
> > @@ -225,7 +241,7 @@ get_qos_egress_port_interface(struct shash
> > *bridge_mappings,
> > * can be unrecognized for certain NICs or reported too low for virtual
> > * interfaces. */
> > #define OVN_QOS_MAX_RATE 34359738360ULL
> > -static void
> > +static bool
> > add_ovs_qos_table_entry(struct ovsdb_idl_txn *ovs_idl_txn,
> > const struct ovsrec_port *port,
> > unsigned long long min_rate,
> > @@ -239,7 +255,7 @@ add_ovs_qos_table_entry(struct ovsdb_idl_txn
> > *ovs_idl_txn,
> > const struct ovsrec_qos *qos = port->qos;
> > if (qos && !smap_get_bool(&qos->external_ids, "ovn_qos", false)) {
> > /* External configured QoS, do not overwrite it. */
> > - return;
> > + return false;
> > }
> >
> > if (!qos) {
> > @@ -282,22 +298,18 @@ add_ovs_qos_table_entry(struct ovsdb_idl_txn
> > *ovs_idl_txn,
> > ovsrec_queue_verify_external_ids(queue);
> > ovsrec_queue_set_external_ids(queue, &external_ids);
> > smap_destroy(&external_ids);
> > + return true;
> > }
> >
> > static void
> > -remove_stale_qos_entry(struct ovsdb_idl_txn *ovs_idl_txn,
> > - const struct sbrec_port_binding *pb,
> > +remove_stale_qos_entry( const char *logical_port,
> > struct ovsdb_idl_index *ovsrec_port_by_qos,
> > const struct ovsrec_qos_table *qos_table,
> > struct hmap *queue_map)
> > {
> > - if (!ovs_idl_txn) {
> > - return;
> > - }
> > -
> > struct qos_queue *q = find_qos_queue(
> > - queue_map, hash_string(pb->logical_port, 0),
> > - pb->logical_port);
> > + queue_map, hash_string(logical_port, 0),
> > + logical_port);
> > if (!q) {
> > return;
> > }
> > @@ -338,8 +350,12 @@ remove_stale_qos_entry(struct ovsdb_idl_txn
> > *ovs_idl_txn,
> >
> > static void
> > configure_qos(const struct sbrec_port_binding *pb,
> > - struct binding_ctx_in *b_ctx_in,
> > - struct binding_ctx_out *b_ctx_out)
> > + struct ovsdb_idl_txn *ovs_idl_txn,
> > + struct ovsdb_idl_index *ovsrec_port_by_qos,
> > + const struct ovsrec_qos_table *qos_table,
> > + struct hmap *qos_map,
> > + const struct ovsrec_open_vswitch_table *ovs_table,
> > + const struct ovsrec_bridge_table *bridge_table)
> > {
> > unsigned long long min_rate = smap_get_ullong(
> > &pb->options, "qos_min_rate", 0);
> > @@ -351,20 +367,20 @@ configure_qos(const struct sbrec_port_binding *pb,
> >
> > if ((!min_rate && !max_rate && !burst) || !queue_id) {
> > /* Qos is not configured for this port. */
> > - remove_stale_qos_entry(b_ctx_in->ovs_idl_txn, pb,
> > - b_ctx_in->ovsrec_port_by_qos,
> > - b_ctx_in->qos_table, b_ctx_out->qos_map);
> > + remove_stale_qos_entry(pb->logical_port,
> > + ovsrec_port_by_qos,
> > + qos_table, qos_map);
> > return;
> > }
> >
> > const char *network = smap_get(&pb->options, "qos_physical_network");
> > uint32_t hash = hash_string(pb->logical_port, 0);
> > - struct qos_queue *q = find_qos_queue(b_ctx_out->qos_map, hash,
> > + struct qos_queue *q = find_qos_queue(qos_map, hash,
> > pb->logical_port);
> > if (!q || q->min_rate != min_rate || q->max_rate != max_rate ||
> > q->burst != burst || (network && strcmp(network, q->network))) {
> > struct shash bridge_mappings = SHASH_INITIALIZER(&bridge_mappings);
> > - add_ovs_bridge_mappings(b_ctx_in->ovs_table,
> > b_ctx_in->bridge_table,
> > + add_ovs_bridge_mappings(ovs_table, bridge_table,
> > &bridge_mappings);
> >
> > const struct ovsrec_port *port = NULL;
> > @@ -375,25 +391,58 @@ configure_qos(const struct sbrec_port_binding *pb,
> > }
> > if (iface) {
> > /* Add new QoS entries. */
> > - add_ovs_qos_table_entry(b_ctx_in->ovs_idl_txn, port, min_rate,
> > + if (add_ovs_qos_table_entry(ovs_idl_txn, port, min_rate,
> > max_rate, burst, queue_id,
> > - pb->logical_port);
> > - if (!q) {
> > - q = xzalloc(sizeof *q);
> > - hmap_insert(b_ctx_out->qos_map, &q->node, hash);
> > - q->port = xstrdup(pb->logical_port);
> > - q->queue_id = queue_id;
> > + pb->logical_port)) {
> > + if (!q) {
> > + q = xzalloc(sizeof *q);
> > + hmap_insert(qos_map, &q->node, hash);
> > + q->port = xstrdup(pb->logical_port);
> > + q->queue_id = queue_id;
> > + }
> > + free(q->network);
> > + q->network = network ? xstrdup(network) : NULL;
> > + q->min_rate = min_rate;
> > + q->max_rate = max_rate;
> > + q->burst = burst;
> > }
> > - free(q->network);
> > - q->network = network ? xstrdup(network) : NULL;
> > - q->min_rate = min_rate;
> > - q->max_rate = max_rate;
> > - q->burst = burst;
> > }
> > shash_destroy(&bridge_mappings);
> > }
> > }
> >
> > +void
> > +update_qos(struct ovsdb_idl_index *sbrec_port_binding_by_name,
> > + struct ovsdb_idl_txn *ovs_idl_txn,
> > + struct ovsdb_idl_index *ovsrec_port_by_qos,
> > + const struct ovsrec_qos_table *qos_table,
> > + struct hmap *qos_map,
> > + const struct ovsrec_open_vswitch_table *ovs_table,
> > + const struct ovsrec_bridge_table *bridge_table)
> > +{
> > + /* Remove qos for any ports for which we could not do it before */
> > + const struct sbrec_port_binding *pb;
> > +
> > + struct shash_node *node;
> > + SHASH_FOR_EACH_SAFE (node, &_qos_ports) {
> > + struct qos_port *qos_port = (struct qos_port *) node->data;
> > + if (qos_port->added) {
> > + pb = lport_lookup_by_name(sbrec_port_binding_by_name,
> > + node->name);
> > + if (pb) {
> > + configure_qos(pb, ovs_idl_txn, ovsrec_port_by_qos,
> > qos_table,
> > + qos_map, ovs_table, bridge_table);
> > + }
> > + } else {
> > + remove_stale_qos_entry(node->name,
> > + ovsrec_port_by_qos,
> > + qos_table, qos_map);
> > + }
> > + free(qos_port);
> > + shash_delete(&_qos_ports, node);
> > + }
> > +}
> > +
> > static const struct ovsrec_queue *
> > find_qos_queue_by_external_ids(const struct smap *external_ids,
> > struct ovsdb_idl_index *ovsrec_queue_by_external_ids)
> > @@ -1524,8 +1573,8 @@ consider_vif_lport_(const struct sbrec_port_binding
> > *pb,
> > tracked_datapath_lport_add(pb, TRACKED_RESOURCE_UPDATED,
> > b_ctx_out->tracked_dp_bindings);
> > }
> > - if (b_lport->lbinding->iface && b_ctx_in->ovs_idl_txn) {
> > - configure_qos(pb, b_ctx_in, b_ctx_out);
> > + if (b_lport->lbinding->iface) {
> > + add_or_del_qos_port(pb->logical_port, true);
> > }
> > } else {
> > /* We could, but can't claim the lport. */
> > @@ -1851,7 +1900,6 @@ consider_l3gw_lport(const struct sbrec_port_binding
> > *pb,
> >
> > static void
> > consider_localnet_lport(const struct sbrec_port_binding *pb,
> > - struct binding_ctx_in *b_ctx_in,
> > struct binding_ctx_out *b_ctx_out)
> > {
> > struct local_datapath *ld
> > @@ -1864,10 +1912,7 @@ consider_localnet_lport(const struct
> > sbrec_port_binding *pb,
> > * for them. */
> > update_local_lports(pb->logical_port, b_ctx_out);
> >
> > - if (b_ctx_in->ovs_idl_txn) {
> > - configure_qos(pb, b_ctx_in, b_ctx_out);
> > - }
> > -
> > + add_or_del_qos_port(pb->logical_port, true);
> > update_related_lport(pb, b_ctx_out);
> > }
> >
> > @@ -1988,6 +2033,7 @@ binding_run(struct binding_ctx_in *b_ctx_in, struct
> > binding_ctx_out *b_ctx_out)
> > return;
> > }
> >
> > + shash_clear_free_data(&_qos_ports);
> > struct shash bridge_mappings = SHASH_INITIALIZER(&bridge_mappings);
> >
> > if (b_ctx_in->br_int) {
> > @@ -2103,7 +2149,7 @@ binding_run(struct binding_ctx_in *b_ctx_in, struct
> > binding_ctx_out *b_ctx_out)
> > * accordingly. */
> > struct lport *lnet_lport;
> > LIST_FOR_EACH_POP (lnet_lport, list_node, &localnet_lports) {
> > - consider_localnet_lport(lnet_lport->pb, b_ctx_in, b_ctx_out);
> > + consider_localnet_lport(lnet_lport->pb, b_ctx_out);
> > update_ld_localnet_port(lnet_lport->pb, &bridge_mappings,
> > b_ctx_out->local_datapaths);
> > free(lnet_lport);
> > @@ -2378,9 +2424,7 @@ consider_iface_release(const struct ovsrec_interface
> > *iface_rec,
> > b_ctx_out, ld);
> > }
> >
> > - remove_stale_qos_entry(b_ctx_in->ovs_idl_txn, b_lport->pb,
> > - b_ctx_in->ovsrec_port_by_qos,
> > - b_ctx_in->qos_table, b_ctx_out->qos_map);
> > + add_or_del_qos_port(b_lport->pb->logical_port, false);
> >
> > /* Release the primary binding lport and other children lports if
> > * any. */
> > @@ -2938,7 +2982,7 @@ handle_updated_port(struct binding_ctx_in *b_ctx_in,
> > break;
> >
> > case LP_LOCALNET: {
> > - consider_localnet_lport(pb, b_ctx_in, b_ctx_out);
> > + consider_localnet_lport(pb, b_ctx_out);
> >
> > struct shash bridge_mappings =
> > SHASH_INITIALIZER(&bridge_mappings);
> > @@ -3026,9 +3070,7 @@ binding_handle_port_binding_changes(struct
> > binding_ctx_in *b_ctx_in,
> > shash_add(&deleted_other_pbs, pb->logical_port, pb);
> > }
> >
> > - remove_stale_qos_entry(b_ctx_in->ovs_idl_txn, pb,
> > - b_ctx_in->ovsrec_port_by_qos,
> > - b_ctx_in->qos_table, b_ctx_out->qos_map);
> > + add_or_del_qos_port(pb->logical_port, false);
> > }
> >
> > struct shash_node *node;
> > @@ -3140,7 +3182,7 @@ delete_done:
> > b_ctx_in->sbrec_port_binding_by_datapath) {
> > enum en_lport_type lport_type = get_lport_type(pb);
> > if (lport_type == LP_LOCALNET) {
> > - consider_localnet_lport(pb, b_ctx_in, b_ctx_out);
> > + consider_localnet_lport(pb, b_ctx_out);
> > update_ld_localnet_port(pb, &bridge_mappings,
> > b_ctx_out->local_datapaths);
> > } else if (lport_type == LP_EXTERNAL) {
> > @@ -3614,5 +3656,6 @@ void
> > binding_destroy(void)
> > {
> > shash_destroy_free_data(&_claimed_ports);
> > + shash_destroy_free_data(&_qos_ports);
> > sset_clear(&_postponed_ports);
> > }
> > diff --git a/controller/binding.h b/controller/binding.h
> > index 24bc84079..47df668a2 100644
> > --- a/controller/binding.h
> > +++ b/controller/binding.h
> > @@ -250,4 +250,12 @@ void binding_destroy(void);
> >
> > void destroy_qos_map(struct hmap *);
> >
> > +void update_qos(struct ovsdb_idl_index * sbrec_port_binding_by_name,
> > + struct ovsdb_idl_txn *ovs_idl_txn,
> > + struct ovsdb_idl_index *ovsrec_port_by_qos,
> > + const struct ovsrec_qos_table *qos_table,
> > + struct hmap *qos_map,
> > + const struct ovsrec_open_vswitch_table *ovs_table,
> > + const struct ovsrec_bridge_table *bridge_table);
> > +
> > #endif /* controller/binding.h */
> > diff --git a/controller/ovn-controller.c b/controller/ovn-controller.c
> > index b3e4e0da8..859d9cab9 100644
> > --- a/controller/ovn-controller.c
> > +++ b/controller/ovn-controller.c
> > @@ -5809,6 +5809,13 @@ main(int argc, char *argv[])
> > &runtime_data->local_datapaths,
> > sb_monitor_all);
> > }
> > + if (ovs_idl_txn) {
> > + update_qos(sbrec_port_binding_by_name,
> > ovs_idl_txn,
> > + ovsrec_port_by_qos,
> > +
> > ovsrec_qos_table_get(ovs_idl_loop.idl),
> > + &runtime_data->qos_map,
> > + ovs_table, bridge_table);
> > + }
> > }
> >
> > if (mac_cache_data) {
> > diff --git a/tests/ovn.at b/tests/ovn.at
> > index e127530f6..ba5ce298a 100644
> > --- a/tests/ovn.at
> > +++ b/tests/ovn.at
> > @@ -36728,7 +36728,6 @@ check ovn-nbctl lsp-add ls2 public2
> > check ovn-nbctl lsp-set-addresses public2 unknown
> > check ovn-nbctl lsp-set-type public2 localnet
> > check ovn-nbctl --wait=sb set Logical_Switch_Port public2
> > options:qos_min_rate=6000000000 options:qos_max_rate=7000000000
> > options:qos_burst=8000000000 options:network_name=phys
> > -check ovn-nbctl --wait=sb lsp-set-options public2 qos_min_rate=6000000000
> > qos_max_rate=7000000000 qos_burst=8000000000
> >
> > # Let's now send ovn controller to sleep, so it will receive both ofport
> > notification and ls deletion simultaneously
> > sleep_controller hv-1
> > diff --git a/tests/system-ovn.at b/tests/system-ovn.at
> > index 59d0cb2a0..75611c1d5 100644
> > --- a/tests/system-ovn.at
> > +++ b/tests/system-ovn.at
> > @@ -6630,6 +6630,28 @@ AT_CHECK([ovn-nbctl set Logical_Switch_Port ext
> > options:qos_min_rate=400000])
> > AT_CHECK([ovn-nbctl set Logical_Switch_Port ext
> > options:qos_max_rate=600000])
> > AT_CHECK([ovn-nbctl set Logical_Switch_Port ext options:qos_burst=6000000])
> >
> > +OVS_WAIT_UNTIL([tc qdisc show | grep -q 'htb 1: dev ovs-public'])
> > +OVS_WAIT_UNTIL([tc class show dev ovs-public | \
> > + grep -q 'class htb .* rate 200Kbit ceil 300Kbit burst
> > 375000b cburst 375000b'])
> > +
> > +OVS_WAIT_UNTIL([tc qdisc show | grep -q 'htb 1: dev ovs-ext'])
> > +OVS_WAIT_UNTIL([tc class show dev ovs-ext | \
> > + grep -q 'class htb .* rate 400Kbit ceil 600Kbit burst
> > 750000b cburst 750000b'])
> > +
> > +# The same now with ovs db read only
> > +#
> > +AT_CHECK([ovn-nbctl remove Logical_Switch_Port ext options
> > qos_min_rate=400000])
> > +AT_CHECK([ovn-nbctl remove Logical_Switch_Port ext options
> > qos_max_rate=600000])
> > +AT_CHECK([ovn-nbctl remove Logical_Switch_Port ext options
> > qos_burst=6000000])
> > +OVS_WAIT_UNTIL([test "$(tc class show dev ovs-ext | grep 'class htb')" ==
> > ""])
> > +
> > +sleep_ovsdb .
> > +
> > +AT_CHECK([ovn-nbctl set Logical_Switch_Port ext
> > options:qos_min_rate=400000])
> > +AT_CHECK([ovn-nbctl set Logical_Switch_Port ext
> > options:qos_max_rate=600000])
> > +AT_CHECK([ovn-nbctl set Logical_Switch_Port ext options:qos_burst=6000000])
> > +wake_up_ovsdb .
> > +
> > OVS_WAIT_UNTIL([tc qdisc show | grep -q 'htb 1: dev ovs-public'])
> > OVS_WAIT_UNTIL([tc class show dev ovs-public | \
> > grep -q 'class htb .* rate 200Kbit ceil 300Kbit burst
> > 375000b cburst 375000b'])
> > --
> > 2.31.1
> >
>
> Other than that it looks good.
>
> Acked-by: Ales Musil <[email protected]>
>
> Thanks,
> Ales
>
>
> --
>
> Ales Musil
>
> Senior Software Engineer - OVN Core
>
> Red Hat EMEA
>
> [email protected] IM: amusil
>
> _______________________________________________
> dev mailing list
> [email protected]
> https://mail.openvswitch.org/mailman/listinfo/ovs-dev
_______________________________________________
dev mailing list
[email protected]
https://mail.openvswitch.org/mailman/listinfo/ovs-dev