Skip to content

Commit ed31404

Browse files
committed
Debug GPU failures
1 parent dd41e8d commit ed31404

File tree

2 files changed

+6
-2
lines changed

2 files changed

+6
-2
lines changed

.github/workflows/bazel_gpu_local.yml

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -37,3 +37,5 @@ jobs:
3737
uses: ./actions/ci_connection/
3838
- name: Run Bazel GPU tests locally
3939
run: ./ci/run_bazel_test.sh "ci/envs/run_tests/bazel_gpu_local"
40+
- name: Test if step runs
41+
run: echo "This step ran!"

ci/run_bazel_test.sh

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -59,14 +59,16 @@ if [[ $JAXCI_RUN_BAZEL_TEST_GPU_LOCAL == 1 ]]; then
5959
--repo_env=HERMETIC_PYTHON_VERSION="$JAXCI_HERMETIC_PYTHON_VERSION" \
6060
--override_repository=xla="${JAXCI_XLA_GIT_DIR}" \
6161
--run_under "${JAXCI_JAX_GIT_DIR}/build/parallel_accelerator_execute.sh" \
62-
//tests:gpu_tests //tests:backend_independent_tests //tests/pallas:gpu_tests //tests/pallas:backend_independent_tests
62+
//tests:gpu_tests //tests:backend_independent_tests //tests/pallas:gpu_tests //tests/pallas:backend_independent_tests || true
63+
echo "Finished running non-multiaccelerator tests..."
6364

6465
# Runs multiaccelerator tests with all GPUs.
6566
check_if_to_run_in_docker bazel --bazelrc=ci/.bazelrc test --config=ci_linux_x86_64_cuda \
6667
--config=multiaccelerator_local \
6768
--repo_env=HERMETIC_PYTHON_VERSION="$JAXCI_HERMETIC_PYTHON_VERSION" \
6869
--override_repository=xla="${JAXCI_XLA_GIT_DIR}" \
69-
//tests:gpu_tests //tests/pallas:gpu_tests
70+
//tests:gpu_tests //tests/pallas:gpu_tests || true
71+
echo "Finished running multiaccelerator tests..."
7072
fi
7173

7274
# Run Bazel GPU tests with RBE.

0 commit comments

Comments
 (0)