mirror of
https://github.com/ROCm/jax.git
synced 2025-04-16 11:56:07 +00:00
[TPU CI] Send chat notification on cancellation as well as failure.
In particular, this makes it notify on timeouts (which usually indicates a test hang, but should be addressed in any case).
This commit is contained in:
parent
78599e65d1
commit
582578220d
4
.github/workflows/cloud-tpu-ci-nightly.yml
vendored
4
.github/workflows/cloud-tpu-ci-nightly.yml
vendored
@ -63,10 +63,10 @@ jobs:
|
||||
python -m pytest -m "multiaccelerator" --tb=short --maxfail=20 tests
|
||||
- name: Send chat on failure
|
||||
# Don't notify when testing the workflow from a branch.
|
||||
if: ${{ failure() && github.ref_name == 'main' }}
|
||||
if: ${{ (failure() || cancelled()) && github.ref_name == 'main' }}
|
||||
run: |
|
||||
curl --location --request POST '${{ secrets.BUILD_CHAT_WEBHOOK }}' \
|
||||
--header 'Content-Type: application/json' \
|
||||
--data-raw "{
|
||||
'text': '\"$GITHUB_WORKFLOW\", jaxlib/libtpu version \"${{ matrix.jaxlib-version }}\", TPU type ${{ matrix.tpu-type }} job failed: $GITHUB_SERVER_URL/$GITHUB_REPOSITORY/actions/runs/$GITHUB_RUN_ID'
|
||||
'text': '\"$GITHUB_WORKFLOW\", jaxlib/libtpu version \"${{ matrix.jaxlib-version }}\", TPU type ${{ matrix.tpu-type }} job failed, timed out, or was cancelled: $GITHUB_SERVER_URL/$GITHUB_REPOSITORY/actions/runs/$GITHUB_RUN_ID'
|
||||
}"
|
||||
|
Loading…
x
Reference in New Issue
Block a user