From dd23d4774376f8647cbb6dab0d647dd2c9037db6 Mon Sep 17 00:00:00 2001 From: Weny Xu Date: Wed, 31 Jul 2024 15:29:31 +0800 Subject: [PATCH] chore(ci): bring back chaos tests (#4456) * Revert "chore: temporarily disable fuzz chaos tests (#4457)" This reverts commit f0c953f84a4eb7b3453548733848d7bb08169601. * chore: update config * Update .github/actions/setup-greptimedb-cluster/with-remote-wal.yaml Co-authored-by: Ruihang Xia --------- Co-authored-by: Ruihang Xia --- .../with-remote-wal.yaml | 5 + .github/workflows/develop.yml | 254 +++++++++--------- 2 files changed, 132 insertions(+), 127 deletions(-) diff --git a/.github/actions/setup-greptimedb-cluster/with-remote-wal.yaml b/.github/actions/setup-greptimedb-cluster/with-remote-wal.yaml index e5fc71cfe382..b5a7dec358fe 100644 --- a/.github/actions/setup-greptimedb-cluster/with-remote-wal.yaml +++ b/.github/actions/setup-greptimedb-cluster/with-remote-wal.yaml @@ -38,3 +38,8 @@ objectStorage: credentials: accessKeyId: rootuser secretAccessKey: rootpass123 +remoteWal: + enabled: true + kafka: + brokerEndpoints: + - "kafka.kafka-cluster.svc.cluster.local:9092" diff --git a/.github/workflows/develop.yml b/.github/workflows/develop.yml index 61e27352e9b5..4a3982b585fd 100644 --- a/.github/workflows/develop.yml +++ b/.github/workflows/develop.yml @@ -412,133 +412,133 @@ jobs: docker stop $(docker ps -a -q) docker rm $(docker ps -a -q) docker system prune -f - # FIXME(weny): wait for the chart to release a new version. - # distributed-fuzztest-with-chaos: - # name: Fuzz Test with Chaos (Distributed, ${{ matrix.mode.name }}, ${{ matrix.target }}) - # runs-on: ubuntu-latest - # needs: build-greptime-ci - # timeout-minutes: 60 - # strategy: - # matrix: - # target: ["fuzz_migrate_mito_regions", "fuzz_failover_mito_regions", "fuzz_failover_metric_regions"] - # mode: - # - name: "Remote WAL" - # minio: true - # kafka: true - # values: "with-remote-wal.yaml" - # steps: - # - uses: actions/checkout@v4 - # - name: Setup Kind - # uses: ./.github/actions/setup-kind - # - name: Setup Chaos Mesh - # uses: ./.github/actions/setup-chaos - # - if: matrix.mode.minio - # name: Setup Minio - # uses: ./.github/actions/setup-minio - # - if: matrix.mode.kafka - # name: Setup Kafka cluser - # uses: ./.github/actions/setup-kafka-cluster - # - name: Setup Etcd cluser - # uses: ./.github/actions/setup-etcd-cluster - # # Prepares for fuzz tests - # - uses: arduino/setup-protoc@v3 - # with: - # repo-token: ${{ secrets.GITHUB_TOKEN }} - # - uses: dtolnay/rust-toolchain@master - # with: - # toolchain: ${{ env.RUST_TOOLCHAIN }} - # - name: Rust Cache - # uses: Swatinem/rust-cache@v2 - # with: - # # Shares across multiple jobs - # shared-key: "fuzz-test-targets" - # - name: Set Rust Fuzz - # shell: bash - # run: | - # sudo apt-get install -y libfuzzer-14-dev - # rustup install nightly - # cargo +nightly install cargo-fuzz cargo-gc-bin - # # Downloads ci image - # - name: Download pre-built binariy - # uses: actions/download-artifact@v4 - # with: - # name: bin - # path: . - # - name: Unzip binary - # run: | - # tar -xvf ./bin.tar.gz - # rm ./bin.tar.gz - # - name: Build and push GreptimeDB image - # uses: ./.github/actions/build-and-push-ci-image - # - name: Wait for etcd - # run: | - # kubectl wait \ - # --for=condition=Ready \ - # pod -l app.kubernetes.io/instance=etcd \ - # --timeout=120s \ - # -n etcd-cluster - # - if: matrix.mode.minio - # name: Wait for minio - # run: | - # kubectl wait \ - # --for=condition=Ready \ - # pod -l app=minio \ - # --timeout=120s \ - # -n minio - # - if: matrix.mode.kafka - # name: Wait for kafka - # run: | - # kubectl wait \ - # --for=condition=Ready \ - # pod -l app.kubernetes.io/instance=kafka \ - # --timeout=120s \ - # -n kafka-cluster - # - name: Print etcd info - # shell: bash - # run: kubectl get all --show-labels -n etcd-cluster - # # Setup cluster for test - # - name: Setup GreptimeDB cluster - # uses: ./.github/actions/setup-greptimedb-cluster - # with: - # image-registry: localhost:5001 - # values-filename: ${{ matrix.mode.values }} - # enable-region-failover: true - # - name: Port forward (mysql) - # run: | - # kubectl port-forward service/my-greptimedb-frontend 4002:4002 -n my-greptimedb& - # - name: Fuzz Test - # uses: ./.github/actions/fuzz-test - # env: - # CUSTOM_LIBFUZZER_PATH: /usr/lib/llvm-14/lib/libFuzzer.a - # GT_MYSQL_ADDR: 127.0.0.1:4002 - # with: - # target: ${{ matrix.target }} - # max-total-time: 120 - # - name: Describe Nodes - # if: failure() - # shell: bash - # run: | - # kubectl describe nodes - # - name: Export kind logs - # if: failure() - # shell: bash - # run: | - # kind export logs /tmp/kind - # - name: Upload logs - # if: failure() - # uses: actions/upload-artifact@v4 - # with: - # name: fuzz-tests-kind-logs-${{ matrix.mode.name }}-${{ matrix.target }} - # path: /tmp/kind - # retention-days: 3 - # - name: Delete cluster - # if: success() - # shell: bash - # run: | - # kind delete cluster - # docker stop $(docker ps -a -q) - # docker rm $(docker ps -a -q) - # docker system prune -f + + distributed-fuzztest-with-chaos: + name: Fuzz Test with Chaos (Distributed, ${{ matrix.mode.name }}, ${{ matrix.target }}) + runs-on: ubuntu-latest + needs: build-greptime-ci + timeout-minutes: 60 + strategy: + matrix: + target: ["fuzz_migrate_mito_regions", "fuzz_failover_mito_regions", "fuzz_failover_metric_regions"] + mode: + - name: "Remote WAL" + minio: true + kafka: true + values: "with-remote-wal.yaml" + steps: + - uses: actions/checkout@v4 + - name: Setup Kind + uses: ./.github/actions/setup-kind + - name: Setup Chaos Mesh + uses: ./.github/actions/setup-chaos + - if: matrix.mode.minio + name: Setup Minio + uses: ./.github/actions/setup-minio + - if: matrix.mode.kafka + name: Setup Kafka cluser + uses: ./.github/actions/setup-kafka-cluster + - name: Setup Etcd cluser + uses: ./.github/actions/setup-etcd-cluster + # Prepares for fuzz tests + - uses: arduino/setup-protoc@v3 + with: + repo-token: ${{ secrets.GITHUB_TOKEN }} + - uses: dtolnay/rust-toolchain@master + with: + toolchain: ${{ env.RUST_TOOLCHAIN }} + - name: Rust Cache + uses: Swatinem/rust-cache@v2 + with: + # Shares across multiple jobs + shared-key: "fuzz-test-targets" + - name: Set Rust Fuzz + shell: bash + run: | + sudo apt-get install -y libfuzzer-14-dev + rustup install nightly + cargo +nightly install cargo-fuzz cargo-gc-bin + # Downloads ci image + - name: Download pre-built binariy + uses: actions/download-artifact@v4 + with: + name: bin + path: . + - name: Unzip binary + run: | + tar -xvf ./bin.tar.gz + rm ./bin.tar.gz + - name: Build and push GreptimeDB image + uses: ./.github/actions/build-and-push-ci-image + - name: Wait for etcd + run: | + kubectl wait \ + --for=condition=Ready \ + pod -l app.kubernetes.io/instance=etcd \ + --timeout=120s \ + -n etcd-cluster + - if: matrix.mode.minio + name: Wait for minio + run: | + kubectl wait \ + --for=condition=Ready \ + pod -l app=minio \ + --timeout=120s \ + -n minio + - if: matrix.mode.kafka + name: Wait for kafka + run: | + kubectl wait \ + --for=condition=Ready \ + pod -l app.kubernetes.io/instance=kafka \ + --timeout=120s \ + -n kafka-cluster + - name: Print etcd info + shell: bash + run: kubectl get all --show-labels -n etcd-cluster + # Setup cluster for test + - name: Setup GreptimeDB cluster + uses: ./.github/actions/setup-greptimedb-cluster + with: + image-registry: localhost:5001 + values-filename: ${{ matrix.mode.values }} + enable-region-failover: true + - name: Port forward (mysql) + run: | + kubectl port-forward service/my-greptimedb-frontend 4002:4002 -n my-greptimedb& + - name: Fuzz Test + uses: ./.github/actions/fuzz-test + env: + CUSTOM_LIBFUZZER_PATH: /usr/lib/llvm-14/lib/libFuzzer.a + GT_MYSQL_ADDR: 127.0.0.1:4002 + with: + target: ${{ matrix.target }} + max-total-time: 120 + - name: Describe Nodes + if: failure() + shell: bash + run: | + kubectl describe nodes + - name: Export kind logs + if: failure() + shell: bash + run: | + kind export logs /tmp/kind + - name: Upload logs + if: failure() + uses: actions/upload-artifact@v4 + with: + name: fuzz-tests-kind-logs-${{ matrix.mode.name }}-${{ matrix.target }} + path: /tmp/kind + retention-days: 3 + - name: Delete cluster + if: success() + shell: bash + run: | + kind delete cluster + docker stop $(docker ps -a -q) + docker rm $(docker ps -a -q) + docker system prune -f sqlness: name: Sqlness Test (${{ matrix.mode.name }})