On Tue, Jul 11, 2023 at 7:14 AM Ales Musil <amu...@redhat.com> wrote:

>
>
> On Mon, Jul 10, 2023 at 5:26 PM Dumitru Ceara <dce...@redhat.com> wrote:
>
>> If we want to catch new failures faster we have a better chance if CI
>> doesn't auto-retry (once).
>>
>> There are some tests that are still "unstable" and fail every now and
>> then.  In order to reduce the number of false negatives keep the
>> --recheck for them.  To achieve that we use a new macro, TAG_UNSTABLE,
>> to tag all these tests.  The list of "unstable" tests is compiled based
>> on the following discussion:
>> https://mail.openvswitch.org/pipermail/ovs-dev/2023-June/405465.html
>>
>> In order to avoid new GitHub actions jobs, we re-purpose the last job of
>> each target type to also run the unstable tests.  These jobs were
>> already running less tests than others so the additional run time should
>> not be an issue.
>>
>> Signed-off-by: Dumitru Ceara <dce...@redhat.com>
>> ---
>> V2:
>> - Addressed Ales' comments:
>>   - always run stable and unstable tests before declaring pass/fail
>> Changes in v1 (since RFC):
>> - kept recheck for unstable tests
>> - introduced TAG_UNSTABLE
>> - changed test.yml to run unstable tests in the last batch of every
>>   test target type.
>> ---
>>  .ci/ci.sh                  |  2 +-
>>  .ci/linux-build.sh         | 76 ++++++++++++++++++++++++++++++--------
>>  .github/workflows/test.yml | 15 ++++----
>>  tests/ovn-ic.at            |  1 +
>>  tests/ovn-ipsec.at         |  1 +
>>  tests/ovn-macros.at        |  5 +++
>>  tests/ovn-northd.at        |  1 +
>>  tests/ovn-performance.at   |  1 +
>>  tests/ovn.at               | 13 +++++++
>>  9 files changed, 92 insertions(+), 23 deletions(-)
>>
>> diff --git a/.ci/ci.sh b/.ci/ci.sh
>> index 10f11939c5..a500aba764 100755
>> --- a/.ci/ci.sh
>> +++ b/.ci/ci.sh
>> @@ -101,7 +101,7 @@ function run_tests() {
>>          && \
>>          ARCH=$ARCH CC=$CC LIBS=$LIBS OPTS=$OPTS TESTSUITE=$TESTSUITE \
>>          TEST_RANGE=$TEST_RANGE SANITIZERS=$SANITIZERS DPDK=$DPDK \
>> -        ./.ci/linux-build.sh
>> +        UNSTABLE=$UNSTABLE ./.ci/linux-build.sh
>>
>
I've missed one thing, please add the recheck here as well.


>      "
>>  }
>>
>> diff --git a/.ci/linux-build.sh b/.ci/linux-build.sh
>> index 5a79a52daf..4c5361f3ca 100755
>> --- a/.ci/linux-build.sh
>> +++ b/.ci/linux-build.sh
>> @@ -9,6 +9,7 @@ COMMON_CFLAGS=""
>>  OVN_CFLAGS=""
>>  OPTS="$OPTS --enable-Werror"
>>  JOBS=${JOBS:-"-j4"}
>> +RECHECK=${RECHECK:-"no"}
>>
>>  function install_dpdk()
>>  {
>> @@ -99,6 +100,17 @@ function configure_clang()
>>      COMMON_CFLAGS="${COMMON_CFLAGS}
>> -Wno-error=unused-command-line-argument"
>>  }
>>
>> +function run_tests()
>> +{
>> +    if ! make distcheck CFLAGS="${COMMON_CFLAGS} ${OVN_CFLAGS}" $JOBS \
>> +        TESTSUITEFLAGS="$JOBS $TEST_RANGE" RECHECK=$RECHECK
>> +    then
>> +        # testsuite.log is necessary for debugging.
>> +        cat */_build/sub/tests/testsuite.log
>> +        return 1
>> +    fi
>> +}
>> +
>>  function execute_tests()
>>  {
>>      # 'distcheck' will reconfigure with required options.
>> @@ -106,27 +118,61 @@ function execute_tests()
>>      configure_ovn
>>
>>      export DISTCHECK_CONFIGURE_FLAGS="$OPTS"
>> -    if ! make distcheck CFLAGS="${COMMON_CFLAGS} ${OVN_CFLAGS}" $JOBS \
>> -        TESTSUITEFLAGS="$JOBS $TEST_RANGE" RECHECK=yes
>> -    then
>> -        # testsuite.log is necessary for debugging.
>> -        cat */_build/sub/tests/testsuite.log
>> +
>> +    local stable_rc=0
>> +    local unstable_rc=0
>> +
>> +    if ! SKIP_UNSTABLE=yes run_tests; then
>> +        stable_rc=1
>> +    fi
>> +
>> +    if [ "$UNSTABLE" ]; then
>> +        if ! SKIP_UNSTABLE=no TEST_RANGE="-k unstable" RECHECK=yes \
>> +                run_tests; then
>> +            unstable_rc=1
>> +        fi
>> +    fi
>> +
>> +    if [[ $stable_rc -ne 0 ]] || [[ $unstable_rc -ne 0 ]]; then
>>          exit 1
>>      fi
>>  }
>>
>> +function run_system_tests()
>> +{
>> +    local type=$1
>> +    local log_file=$2
>> +
>> +    if ! sudo make $JOBS $type TESTSUITEFLAGS="$TEST_RANGE" \
>> +            RECHECK=$RECHECK; then
>> +        # $log_file is necessary for debugging.
>> +        cat tests/$log_file
>> +        return 1
>> +    fi
>> +}
>> +
>>  function execute_system_tests()
>>  {
>> -      type=$1
>> -      log_file=$2
>> -
>> -      configure_ovn $OPTS
>> -      make $JOBS || { cat config.log; exit 1; }
>> -      if ! sudo make $JOBS $type TESTSUITEFLAGS="$TEST_RANGE"
>> RECHECK=yes; then
>> -          # $log_file is necessary for debugging.
>> -          cat tests/$log_file
>> -          exit 1
>> -      fi
>> +    configure_ovn $OPTS
>> +    make $JOBS || { cat config.log; exit 1; }
>> +
>> +    local stable_rc=0
>> +    local unstable_rc=0
>> +
>> +    if ! SKIP_UNSTABLE=yes run_system_tests $@; then
>> +        stable_rc=1
>> +    fi
>> +
>> +    if [ "$UNSTABLE" ]; then
>> +        if ! SKIP_UNSTABLE=no TEST_RANGE="-k unstable" RECHECK=yes \
>> +                run_system_tests $@; then
>> +            unstable_rc=1
>> +        fi
>> +    fi
>> +
>> +    if [[ $stable_rc -ne 0 ]] || [[ $unstable_rc -ne 0 ]]; then
>> +        exit 1
>> +    fi
>>  }
>>
>>  configure_$CC
>> diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
>> index fe2a14c401..7d40251003 100644
>> --- a/.github/workflows/test.yml
>> +++ b/.github/workflows/test.yml
>> @@ -92,6 +92,7 @@ jobs:
>>        TESTSUITE:   ${{ matrix.cfg.testsuite }}
>>        TEST_RANGE:  ${{ matrix.cfg.test_range }}
>>        SANITIZERS:  ${{ matrix.cfg.sanitizers }}
>> +      UNSTABLE:    ${{ matrix.cfg.unstable }}
>>
>>      name: linux ${{ join(matrix.cfg.*, ' ') }}
>>      runs-on: ubuntu-latest
>> @@ -104,27 +105,27 @@ jobs:
>>          - { compiler: clang, opts: --disable-ssl }
>>          - { compiler: gcc, testsuite: test, test_range: "-500" }
>>          - { compiler: gcc, testsuite: test, test_range: "501-1000" }
>> -        - { compiler: gcc, testsuite: test, test_range: "1001-" }
>> +        - { compiler: gcc, testsuite: test, test_range: "1001-",
>> unstable: unstable }
>>          - { compiler: clang, testsuite: test, sanitizers: sanitizers,
>> test_range: "-300" }
>>          - { compiler: clang, testsuite: test, sanitizers: sanitizers,
>> test_range: "301-600" }
>>          - { compiler: clang, testsuite: test, sanitizers: sanitizers,
>> test_range: "601-900" }
>>          - { compiler: clang, testsuite: test, sanitizers: sanitizers,
>> test_range: "901-1200" }
>> -        - { compiler: clang, testsuite: test, sanitizers: sanitizers,
>> test_range: "1201-" }
>> +        - { compiler: clang, testsuite: test, sanitizers: sanitizers,
>> test_range: "1201-", unstable: unstable }
>>          - { compiler: gcc, testsuite: test, libs: -ljemalloc,
>> test_range: "-500" }
>>          - { compiler: gcc, testsuite: test, libs: -ljemalloc,
>> test_range: "501-1000" }
>> -        - { compiler: gcc, testsuite: test, libs: -ljemalloc,
>> test_range: "1001-" }
>> +        - { compiler: gcc, testsuite: test, libs: -ljemalloc,
>> test_range: "1001-", unstable: unstable }
>>          - { compiler: gcc, testsuite: system-test-dpdk, dpdk: dpdk,
>> test_range: "-100" }
>>          - { compiler: gcc, testsuite: system-test-dpdk, dpdk: dpdk,
>> test_range: "101-200" }
>> -        - { compiler: gcc, testsuite: system-test-dpdk, dpdk: dpdk,
>> test_range: "201-" }
>> +        - { compiler: gcc, testsuite: system-test-dpdk, dpdk: dpdk,
>> test_range: "201-", unstable: unstable }
>>          - { compiler: gcc, testsuite: system-test-userspace, test_range:
>> "-100" }
>>          - { compiler: gcc, testsuite: system-test-userspace, test_range:
>> "101-200" }
>> -        - { compiler: gcc, testsuite: system-test-userspace, test_range:
>> "201-" }
>> +        - { compiler: gcc, testsuite: system-test-userspace, test_range:
>> "201-", unstable: unstable }
>>          - { compiler: gcc, testsuite: system-test, test_range: "-100" }
>>          - { compiler: gcc, testsuite: system-test, test_range: "101-200"
>> }
>> -        - { compiler: gcc, testsuite: system-test, test_range: "201-" }
>> +        - { compiler: gcc, testsuite: system-test, test_range: "201-",
>> unstable: unstable }
>>          - { compiler: clang, testsuite: system-test, sanitizers:
>> sanitizers, test_range: "-100" }
>>          - { compiler: clang, testsuite: system-test, sanitizers:
>> sanitizers, test_range: "101-200" }
>> -        - { compiler: clang, testsuite: system-test, sanitizers:
>> sanitizers, test_range: "201-" }
>> +        - { compiler: clang, testsuite: system-test, sanitizers:
>> sanitizers, test_range: "201-", unstable: unstable }
>>          - { arch: x86, compiler: gcc, opts: --disable-ssl }
>>
>>      steps:
>> diff --git a/tests/ovn-ic.at b/tests/ovn-ic.at
>> index ceee450925..285662e3b8 100644
>> --- a/tests/ovn-ic.at
>> +++ b/tests/ovn-ic.at
>> @@ -256,6 +256,7 @@ AT_CLEANUP
>>
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([ovn-ic -- gateway sync])
>> +TAG_UNSTABLE
>>
>>  ovn_init_ic_db
>>  net_add n1
>> diff --git a/tests/ovn-ipsec.at b/tests/ovn-ipsec.at
>> index 10ef978780..e621547c59 100644
>> --- a/tests/ovn-ipsec.at
>> +++ b/tests/ovn-ipsec.at
>> @@ -1,6 +1,7 @@
>>  AT_BANNER([OVN - IPsec])
>>
>>  AT_SETUP([ipsec -- basic configuration])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  # Configure the Northbound database
>> diff --git a/tests/ovn-macros.at b/tests/ovn-macros.at
>> index 6f2d085ae4..6420721740 100644
>> --- a/tests/ovn-macros.at
>> +++ b/tests/ovn-macros.at
>> @@ -871,3 +871,8 @@ m4_define([RUN_OVN_NBCTL], [
>>      check ovn-nbctl ${command}
>>      unset command
>>  ])
>> +
>> +m4_define([TAG_UNSTABLE], [
>> +    AT_KEYWORDS([unstable])
>> +    AT_SKIP_IF([test X"$SKIP_UNSTABLE" = Xyes])
>> +])
>> diff --git a/tests/ovn-northd.at b/tests/ovn-northd.at
>> index 3e06f14c94..c1c8287e03 100644
>> --- a/tests/ovn-northd.at
>> +++ b/tests/ovn-northd.at
>> @@ -4531,6 +4531,7 @@ AT_CLEANUP
>>
>>  OVN_FOR_EACH_NORTHD_NO_HV([
>>  AT_SETUP([northd ssl file change])
>> +TAG_UNSTABLE
>>  AT_SKIP_IF([test "$HAVE_OPENSSL" = no])
>>  PKIDIR="$(cd $abs_top_builddir/tests && pwd)"
>>  AT_SKIP_IF([expr "$PKIDIR" : ".*[[     '\"
>> diff --git a/tests/ovn-performance.at b/tests/ovn-performance.at
>> index ba329f0f64..9de0a4e770 100644
>> --- a/tests/ovn-performance.at
>> +++ b/tests/ovn-performance.at
>> @@ -225,6 +225,7 @@ m4_define([OVN_CONTROLLER_EXPECT_HIT_COND],[
>>  ])
>>
>>  AT_SETUP([ovn-controller incremental processing])
>> +TAG_UNSTABLE
>>  # Check which operations the trigger full logical flow processing.
>>  #
>>  # Create and destroy logical routers, switches, ports, address sets and
>> ACLs
>> diff --git a/tests/ovn.at b/tests/ovn.at
>> index cd6d4b9ff4..cd8f481bbc 100644
>> --- a/tests/ovn.at
>> +++ b/tests/ovn.at
>> @@ -7853,6 +7853,7 @@ AT_CLEANUP
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([policy-based routing: 1 HVs, 2 LSs, 1 lport/LS, 1 LR])
>>  AT_KEYWORDS([policy-based-routing])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  # Logical network:
>> @@ -8025,6 +8026,7 @@ AT_CLEANUP
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([policy-based routing IPv6: 1 HVs, 3 LSs, 1 lport/LS, 1 LR])
>>  AT_KEYWORDS([policy-based-routing])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  # Logical network:
>> @@ -14405,6 +14407,7 @@ AT_CLEANUP
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([options:multiple requested-chassis for logical port])
>>  AT_KEYWORDS([multi-chassis])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  net_add n1
>> @@ -14507,6 +14510,7 @@ AT_CLEANUP
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([options:multiple requested-chassis for logical port: change
>> chassis role])
>>  AT_KEYWORDS([multi-chassis])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  net_add n1
>> @@ -14557,6 +14561,7 @@ AT_CLEANUP
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([options:multiple requested-chassis for logical port: unclaimed
>> behavior])
>>  AT_KEYWORDS([multi-chassis])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  net_add n1
>> @@ -16130,6 +16135,7 @@ AT_CLEANUP
>>
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([tug-of-war between two chassis for the same port])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  ovn-nbctl ls-add ls0
>> @@ -29503,6 +29509,7 @@ AT_CLEANUP
>>
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([nb_cfg timestamp])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  check ovn-nbctl ls-add s2
>> @@ -29604,6 +29611,7 @@ AT_CLEANUP
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([ARP replies for SNAT external ips])
>>  AT_KEYWORDS([slowtest])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  net_add n1
>> @@ -29970,6 +29978,7 @@ AT_CLEANUP
>>  # It is to cover a corner case when flows are re-processed in the I-P
>>  # iteration, combined with the scenario of conflicting ACLs.
>>  AT_SETUP([conflict ACLs with address set])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  ovn-nbctl ls-add ls1
>> @@ -30165,6 +30174,7 @@ AT_CLEANUP
>>  #
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([multi-vtep SB Chassis encap updates])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  net_add n1
>> @@ -32354,6 +32364,7 @@ AT_CLEANUP
>>  # - 2 for expanding the port group @pg1 to the 2 locally bound lports.
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([ACL with Port Group conjunction flow efficiency])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  net_add n1
>> @@ -34606,6 +34617,7 @@ AT_CLEANUP
>>
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([recomputes])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  net_add n1
>> @@ -35040,6 +35052,7 @@ MULTIPLE_OVS_INT([])
>>
>>  OVN_FOR_EACH_NORTHD([
>>  AT_SETUP([Check default openflow flows])
>> +TAG_UNSTABLE
>>  ovn_start
>>
>>  # Check that every table has a default (i.e: priority=0) flow.
>> --
>> 2.31.1
>>
>>
> Looks good to me, thanks.
>
> Acked-by: Ales Musil <amu...@redhat.com>
>
> --
>
> Ales Musil
>
> Senior Software Engineer - OVN Core
>
> Red Hat EMEA <https://www.redhat.com>
>
> amu...@redhat.com    IM: amusil
> <https://red.ht/sig>
>

Thanks,
Ales
-- 

Ales Musil

Senior Software Engineer - OVN Core

Red Hat EMEA <https://www.redhat.com>

amu...@redhat.com    IM: amusil
<https://red.ht/sig>
_______________________________________________
dev mailing list
d...@openvswitch.org
https://mail.openvswitch.org/mailman/listinfo/ovs-dev

Reply via email to