On Mon, Jul 10, 2023 at 5:26 PM Dumitru Ceara <dce...@redhat.com> wrote:
> If we want to catch new failures faster we have a better chance if CI > doesn't auto-retry (once). > > There are some tests that are still "unstable" and fail every now and > then. In order to reduce the number of false negatives keep the > --recheck for them. To achieve that we use a new macro, TAG_UNSTABLE, > to tag all these tests. The list of "unstable" tests is compiled based > on the following discussion: > https://mail.openvswitch.org/pipermail/ovs-dev/2023-June/405465.html > > In order to avoid new GitHub actions jobs, we re-purpose the last job of > each target type to also run the unstable tests. These jobs were > already running less tests than others so the additional run time should > not be an issue. > > Signed-off-by: Dumitru Ceara <dce...@redhat.com> > --- > V2: > - Addressed Ales' comments: > - always run stable and unstable tests before declaring pass/fail > Changes in v1 (since RFC): > - kept recheck for unstable tests > - introduced TAG_UNSTABLE > - changed test.yml to run unstable tests in the last batch of every > test target type. > --- > .ci/ci.sh | 2 +- > .ci/linux-build.sh | 76 ++++++++++++++++++++++++++++++-------- > .github/workflows/test.yml | 15 ++++---- > tests/ovn-ic.at | 1 + > tests/ovn-ipsec.at | 1 + > tests/ovn-macros.at | 5 +++ > tests/ovn-northd.at | 1 + > tests/ovn-performance.at | 1 + > tests/ovn.at | 13 +++++++ > 9 files changed, 92 insertions(+), 23 deletions(-) > > diff --git a/.ci/ci.sh b/.ci/ci.sh > index 10f11939c5..a500aba764 100755 > --- a/.ci/ci.sh > +++ b/.ci/ci.sh > @@ -101,7 +101,7 @@ function run_tests() { > && \ > ARCH=$ARCH CC=$CC LIBS=$LIBS OPTS=$OPTS TESTSUITE=$TESTSUITE \ > TEST_RANGE=$TEST_RANGE SANITIZERS=$SANITIZERS DPDK=$DPDK \ > - ./.ci/linux-build.sh > + UNSTABLE=$UNSTABLE ./.ci/linux-build.sh > " > } > > diff --git a/.ci/linux-build.sh b/.ci/linux-build.sh > index 5a79a52daf..4c5361f3ca 100755 > --- a/.ci/linux-build.sh > +++ b/.ci/linux-build.sh > @@ -9,6 +9,7 @@ COMMON_CFLAGS="" > OVN_CFLAGS="" > OPTS="$OPTS --enable-Werror" > JOBS=${JOBS:-"-j4"} > +RECHECK=${RECHECK:-"no"} > > function install_dpdk() > { > @@ -99,6 +100,17 @@ function configure_clang() > COMMON_CFLAGS="${COMMON_CFLAGS} > -Wno-error=unused-command-line-argument" > } > > +function run_tests() > +{ > + if ! make distcheck CFLAGS="${COMMON_CFLAGS} ${OVN_CFLAGS}" $JOBS \ > + TESTSUITEFLAGS="$JOBS $TEST_RANGE" RECHECK=$RECHECK > + then > + # testsuite.log is necessary for debugging. > + cat */_build/sub/tests/testsuite.log > + return 1 > + fi > +} > + > function execute_tests() > { > # 'distcheck' will reconfigure with required options. > @@ -106,27 +118,61 @@ function execute_tests() > configure_ovn > > export DISTCHECK_CONFIGURE_FLAGS="$OPTS" > - if ! make distcheck CFLAGS="${COMMON_CFLAGS} ${OVN_CFLAGS}" $JOBS \ > - TESTSUITEFLAGS="$JOBS $TEST_RANGE" RECHECK=yes > - then > - # testsuite.log is necessary for debugging. > - cat */_build/sub/tests/testsuite.log > + > + local stable_rc=0 > + local unstable_rc=0 > + > + if ! SKIP_UNSTABLE=yes run_tests; then > + stable_rc=1 > + fi > + > + if [ "$UNSTABLE" ]; then > + if ! SKIP_UNSTABLE=no TEST_RANGE="-k unstable" RECHECK=yes \ > + run_tests; then > + unstable_rc=1 > + fi > + fi > + > + if [[ $stable_rc -ne 0 ]] || [[ $unstable_rc -ne 0 ]]; then > exit 1 > fi > } > > +function run_system_tests() > +{ > + local type=$1 > + local log_file=$2 > + > + if ! sudo make $JOBS $type TESTSUITEFLAGS="$TEST_RANGE" \ > + RECHECK=$RECHECK; then > + # $log_file is necessary for debugging. > + cat tests/$log_file > + return 1 > + fi > +} > + > function execute_system_tests() > { > - type=$1 > - log_file=$2 > - > - configure_ovn $OPTS > - make $JOBS || { cat config.log; exit 1; } > - if ! sudo make $JOBS $type TESTSUITEFLAGS="$TEST_RANGE" > RECHECK=yes; then > - # $log_file is necessary for debugging. > - cat tests/$log_file > - exit 1 > - fi > + configure_ovn $OPTS > + make $JOBS || { cat config.log; exit 1; } > + > + local stable_rc=0 > + local unstable_rc=0 > + > + if ! SKIP_UNSTABLE=yes run_system_tests $@; then > + stable_rc=1 > + fi > + > + if [ "$UNSTABLE" ]; then > + if ! SKIP_UNSTABLE=no TEST_RANGE="-k unstable" RECHECK=yes \ > + run_system_tests $@; then > + unstable_rc=1 > + fi > + fi > + > + if [[ $stable_rc -ne 0 ]] || [[ $unstable_rc -ne 0 ]]; then > + exit 1 > + fi > } > > configure_$CC > diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml > index fe2a14c401..7d40251003 100644 > --- a/.github/workflows/test.yml > +++ b/.github/workflows/test.yml > @@ -92,6 +92,7 @@ jobs: > TESTSUITE: ${{ matrix.cfg.testsuite }} > TEST_RANGE: ${{ matrix.cfg.test_range }} > SANITIZERS: ${{ matrix.cfg.sanitizers }} > + UNSTABLE: ${{ matrix.cfg.unstable }} > > name: linux ${{ join(matrix.cfg.*, ' ') }} > runs-on: ubuntu-latest > @@ -104,27 +105,27 @@ jobs: > - { compiler: clang, opts: --disable-ssl } > - { compiler: gcc, testsuite: test, test_range: "-500" } > - { compiler: gcc, testsuite: test, test_range: "501-1000" } > - - { compiler: gcc, testsuite: test, test_range: "1001-" } > + - { compiler: gcc, testsuite: test, test_range: "1001-", > unstable: unstable } > - { compiler: clang, testsuite: test, sanitizers: sanitizers, > test_range: "-300" } > - { compiler: clang, testsuite: test, sanitizers: sanitizers, > test_range: "301-600" } > - { compiler: clang, testsuite: test, sanitizers: sanitizers, > test_range: "601-900" } > - { compiler: clang, testsuite: test, sanitizers: sanitizers, > test_range: "901-1200" } > - - { compiler: clang, testsuite: test, sanitizers: sanitizers, > test_range: "1201-" } > + - { compiler: clang, testsuite: test, sanitizers: sanitizers, > test_range: "1201-", unstable: unstable } > - { compiler: gcc, testsuite: test, libs: -ljemalloc, test_range: > "-500" } > - { compiler: gcc, testsuite: test, libs: -ljemalloc, test_range: > "501-1000" } > - - { compiler: gcc, testsuite: test, libs: -ljemalloc, test_range: > "1001-" } > + - { compiler: gcc, testsuite: test, libs: -ljemalloc, test_range: > "1001-", unstable: unstable } > - { compiler: gcc, testsuite: system-test-dpdk, dpdk: dpdk, > test_range: "-100" } > - { compiler: gcc, testsuite: system-test-dpdk, dpdk: dpdk, > test_range: "101-200" } > - - { compiler: gcc, testsuite: system-test-dpdk, dpdk: dpdk, > test_range: "201-" } > + - { compiler: gcc, testsuite: system-test-dpdk, dpdk: dpdk, > test_range: "201-", unstable: unstable } > - { compiler: gcc, testsuite: system-test-userspace, test_range: > "-100" } > - { compiler: gcc, testsuite: system-test-userspace, test_range: > "101-200" } > - - { compiler: gcc, testsuite: system-test-userspace, test_range: > "201-" } > + - { compiler: gcc, testsuite: system-test-userspace, test_range: > "201-", unstable: unstable } > - { compiler: gcc, testsuite: system-test, test_range: "-100" } > - { compiler: gcc, testsuite: system-test, test_range: "101-200" } > - - { compiler: gcc, testsuite: system-test, test_range: "201-" } > + - { compiler: gcc, testsuite: system-test, test_range: "201-", > unstable: unstable } > - { compiler: clang, testsuite: system-test, sanitizers: > sanitizers, test_range: "-100" } > - { compiler: clang, testsuite: system-test, sanitizers: > sanitizers, test_range: "101-200" } > - - { compiler: clang, testsuite: system-test, sanitizers: > sanitizers, test_range: "201-" } > + - { compiler: clang, testsuite: system-test, sanitizers: > sanitizers, test_range: "201-", unstable: unstable } > - { arch: x86, compiler: gcc, opts: --disable-ssl } > > steps: > diff --git a/tests/ovn-ic.at b/tests/ovn-ic.at > index ceee450925..285662e3b8 100644 > --- a/tests/ovn-ic.at > +++ b/tests/ovn-ic.at > @@ -256,6 +256,7 @@ AT_CLEANUP > > OVN_FOR_EACH_NORTHD([ > AT_SETUP([ovn-ic -- gateway sync]) > +TAG_UNSTABLE > > ovn_init_ic_db > net_add n1 > diff --git a/tests/ovn-ipsec.at b/tests/ovn-ipsec.at > index 10ef978780..e621547c59 100644 > --- a/tests/ovn-ipsec.at > +++ b/tests/ovn-ipsec.at > @@ -1,6 +1,7 @@ > AT_BANNER([OVN - IPsec]) > > AT_SETUP([ipsec -- basic configuration]) > +TAG_UNSTABLE > ovn_start > > # Configure the Northbound database > diff --git a/tests/ovn-macros.at b/tests/ovn-macros.at > index 6f2d085ae4..6420721740 100644 > --- a/tests/ovn-macros.at > +++ b/tests/ovn-macros.at > @@ -871,3 +871,8 @@ m4_define([RUN_OVN_NBCTL], [ > check ovn-nbctl ${command} > unset command > ]) > + > +m4_define([TAG_UNSTABLE], [ > + AT_KEYWORDS([unstable]) > + AT_SKIP_IF([test X"$SKIP_UNSTABLE" = Xyes]) > +]) > diff --git a/tests/ovn-northd.at b/tests/ovn-northd.at > index 3e06f14c94..c1c8287e03 100644 > --- a/tests/ovn-northd.at > +++ b/tests/ovn-northd.at > @@ -4531,6 +4531,7 @@ AT_CLEANUP > > OVN_FOR_EACH_NORTHD_NO_HV([ > AT_SETUP([northd ssl file change]) > +TAG_UNSTABLE > AT_SKIP_IF([test "$HAVE_OPENSSL" = no]) > PKIDIR="$(cd $abs_top_builddir/tests && pwd)" > AT_SKIP_IF([expr "$PKIDIR" : ".*[[ '\" > diff --git a/tests/ovn-performance.at b/tests/ovn-performance.at > index ba329f0f64..9de0a4e770 100644 > --- a/tests/ovn-performance.at > +++ b/tests/ovn-performance.at > @@ -225,6 +225,7 @@ m4_define([OVN_CONTROLLER_EXPECT_HIT_COND],[ > ]) > > AT_SETUP([ovn-controller incremental processing]) > +TAG_UNSTABLE > # Check which operations the trigger full logical flow processing. > # > # Create and destroy logical routers, switches, ports, address sets and > ACLs > diff --git a/tests/ovn.at b/tests/ovn.at > index cd6d4b9ff4..cd8f481bbc 100644 > --- a/tests/ovn.at > +++ b/tests/ovn.at > @@ -7853,6 +7853,7 @@ AT_CLEANUP > OVN_FOR_EACH_NORTHD([ > AT_SETUP([policy-based routing: 1 HVs, 2 LSs, 1 lport/LS, 1 LR]) > AT_KEYWORDS([policy-based-routing]) > +TAG_UNSTABLE > ovn_start > > # Logical network: > @@ -8025,6 +8026,7 @@ AT_CLEANUP > OVN_FOR_EACH_NORTHD([ > AT_SETUP([policy-based routing IPv6: 1 HVs, 3 LSs, 1 lport/LS, 1 LR]) > AT_KEYWORDS([policy-based-routing]) > +TAG_UNSTABLE > ovn_start > > # Logical network: > @@ -14405,6 +14407,7 @@ AT_CLEANUP > OVN_FOR_EACH_NORTHD([ > AT_SETUP([options:multiple requested-chassis for logical port]) > AT_KEYWORDS([multi-chassis]) > +TAG_UNSTABLE > ovn_start > > net_add n1 > @@ -14507,6 +14510,7 @@ AT_CLEANUP > OVN_FOR_EACH_NORTHD([ > AT_SETUP([options:multiple requested-chassis for logical port: change > chassis role]) > AT_KEYWORDS([multi-chassis]) > +TAG_UNSTABLE > ovn_start > > net_add n1 > @@ -14557,6 +14561,7 @@ AT_CLEANUP > OVN_FOR_EACH_NORTHD([ > AT_SETUP([options:multiple requested-chassis for logical port: unclaimed > behavior]) > AT_KEYWORDS([multi-chassis]) > +TAG_UNSTABLE > ovn_start > > net_add n1 > @@ -16130,6 +16135,7 @@ AT_CLEANUP > > OVN_FOR_EACH_NORTHD([ > AT_SETUP([tug-of-war between two chassis for the same port]) > +TAG_UNSTABLE > ovn_start > > ovn-nbctl ls-add ls0 > @@ -29503,6 +29509,7 @@ AT_CLEANUP > > OVN_FOR_EACH_NORTHD([ > AT_SETUP([nb_cfg timestamp]) > +TAG_UNSTABLE > ovn_start > > check ovn-nbctl ls-add s2 > @@ -29604,6 +29611,7 @@ AT_CLEANUP > OVN_FOR_EACH_NORTHD([ > AT_SETUP([ARP replies for SNAT external ips]) > AT_KEYWORDS([slowtest]) > +TAG_UNSTABLE > ovn_start > > net_add n1 > @@ -29970,6 +29978,7 @@ AT_CLEANUP > # It is to cover a corner case when flows are re-processed in the I-P > # iteration, combined with the scenario of conflicting ACLs. > AT_SETUP([conflict ACLs with address set]) > +TAG_UNSTABLE > ovn_start > > ovn-nbctl ls-add ls1 > @@ -30165,6 +30174,7 @@ AT_CLEANUP > # > OVN_FOR_EACH_NORTHD([ > AT_SETUP([multi-vtep SB Chassis encap updates]) > +TAG_UNSTABLE > ovn_start > > net_add n1 > @@ -32354,6 +32364,7 @@ AT_CLEANUP > # - 2 for expanding the port group @pg1 to the 2 locally bound lports. > OVN_FOR_EACH_NORTHD([ > AT_SETUP([ACL with Port Group conjunction flow efficiency]) > +TAG_UNSTABLE > ovn_start > > net_add n1 > @@ -34606,6 +34617,7 @@ AT_CLEANUP > > OVN_FOR_EACH_NORTHD([ > AT_SETUP([recomputes]) > +TAG_UNSTABLE > ovn_start > > net_add n1 > @@ -35040,6 +35052,7 @@ MULTIPLE_OVS_INT([]) > > OVN_FOR_EACH_NORTHD([ > AT_SETUP([Check default openflow flows]) > +TAG_UNSTABLE > ovn_start > > # Check that every table has a default (i.e: priority=0) flow. > -- > 2.31.1 > > Looks good to me, thanks. Acked-by: Ales Musil <amu...@redhat.com> -- Ales Musil Senior Software Engineer - OVN Core Red Hat EMEA <https://www.redhat.com> amu...@redhat.com IM: amusil <https://red.ht/sig> _______________________________________________ dev mailing list d...@openvswitch.org https://mail.openvswitch.org/mailman/listinfo/ovs-dev