Skip to content

Commit 4024279

Browse files
committed
[Test][Autoscaler] deflaky unexpected dead actors with a new ci runner
Signed-off-by: Rueian <[email protected]>
1 parent 6322758 commit 4024279

File tree

1 file changed

+20
-0
lines changed

1 file changed

+20
-0
lines changed

.buildkite/test-e2e.yml

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -78,6 +78,26 @@
7878
- KUBERAY_TEST_TIMEOUT_SHORT=1m KUBERAY_TEST_TIMEOUT_MEDIUM=5m KUBERAY_TEST_TIMEOUT_LONG=10m go test -timeout 60m -v ./test/e2eautoscaler/raycluster_autoscaler_part2_test.go ./test/e2eautoscaler/support.go 2>&1 | awk -f ../.buildkite/format.awk | tee $$KUBERAY_TEST_OUTPUT_DIR/gotest.log || (kubectl logs --tail -1 -l app.kubernetes.io/name=kuberay | tee $$KUBERAY_TEST_OUTPUT_DIR/kuberay-operator.log && cd $$KUBERAY_TEST_OUTPUT_DIR && find . -name "*.log" | tar -cf /artifact-mount/e2e-autoscaler-log.tar -T - && exit 1)
7979
- echo "--- END:Autoscaler E2E Part 2 (nightly operator) tests finished"
8080

81+
- label: 'Test Autoscaler E2E Part 3 (detached actor workaround) (nightly operator)'
82+
instance_size: large
83+
image: golang:1.24
84+
commands:
85+
- source .buildkite/setup-env.sh
86+
- kind create cluster --wait 900s --config ./ci/kind-config-buildkite.yml
87+
- kubectl config set clusters.kind-kind.server https://docker:6443
88+
# Build nightly KubeRay operator image
89+
- pushd ray-operator
90+
- bash ../.buildkite/build-start-operator.sh
91+
- kubectl wait --timeout=90s --for=condition=Available=true deployment kuberay-operator
92+
# Run e2e tests and print KubeRay operator logs if tests fail
93+
- echo "--- START:Running Autoscaler E2E Part 3 (detached actor workaround) (nightly operator) tests"
94+
# Print the Ray image override when one is set. `[` needs `]` as its own final argument, so keep the space before it.
- if [ -n "${KUBERAY_TEST_RAY_IMAGE}" ]; then echo "Using Ray Image ${KUBERAY_TEST_RAY_IMAGE}"; fi
95+
- set -o pipefail
96+
- mkdir -p "$(pwd)/tmp" && export KUBERAY_TEST_OUTPUT_DIR=$(pwd)/tmp
97+
- echo "KUBERAY_TEST_OUTPUT_DIR=$$KUBERAY_TEST_OUTPUT_DIR"
98+
- KUBERAY_TEST_TIMEOUT_SHORT=1m KUBERAY_TEST_TIMEOUT_MEDIUM=5m KUBERAY_TEST_TIMEOUT_LONG=10m go test -timeout 150m -v -count=30 -run=TestRayClusterAutoscalerMaxReplicasUpdate ./test/e2eautoscaler/raycluster_autoscaler_part2_test.go ./test/e2eautoscaler/support.go 2>&1 | awk -f ../.buildkite/format.awk | tee $$KUBERAY_TEST_OUTPUT_DIR/gotest.log || (kubectl logs --tail -1 -l app.kubernetes.io/name=kuberay | tee $$KUBERAY_TEST_OUTPUT_DIR/kuberay-operator.log && cd $$KUBERAY_TEST_OUTPUT_DIR && find . -name "*.log" | tar -cf /artifact-mount/e2e-autoscaler-log.tar -T - && exit 1)
99+
- echo "--- END:Autoscaler E2E Part 3 (detached actor workaround) (nightly operator) tests finished"
100+
81101
- label: 'Test E2E Operator Version Upgrade (v1.3.0)'
82102
instance_size: large
83103
image: golang:1.24

0 commit comments

Comments
 (0)