[workflow] hook compatibility test failure to lark (#2586)

pull/2591/head
Frank Lee 2023-02-06 14:56:31 +08:00 committed by GitHub
parent 186ddce2c4
commit 5767f8e394
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
1 changed files with 20 additions and 0 deletions

View File

@ -4,6 +4,7 @@ on:
# run at 03:00 every Sunday (Singapore time, UTC+8), which is Saturday 19:00 UTC # run at 03:00 every Sunday (Singapore time, UTC+8), which is Saturday 19:00 UTC
schedule: schedule:
- cron: '0 19 * * 6' - cron: '0 19 * * 6'
workflow_dispatch:
jobs: jobs:
matrix_preparation: matrix_preparation:
@ -43,11 +44,13 @@ jobs:
- name: Install dependencies - name: Install dependencies
run: | run: |
pip install -U pip setuptools wheel --user pip install -U pip setuptools wheel --user
- uses: actions/checkout@v2 - uses: actions/checkout@v2
with: with:
repository: hpcaitech/TensorNVMe repository: hpcaitech/TensorNVMe
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }} ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
path: TensorNVMe path: TensorNVMe
- name: Install tensornvme - name: Install tensornvme
run: | run: |
cd TensorNVMe cd TensorNVMe
@ -57,10 +60,12 @@ jobs:
- uses: actions/checkout@v2 - uses: actions/checkout@v2
with: with:
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }} ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
- name: Install Colossal-AI - name: Install Colossal-AI
run: | run: |
pip install -v --no-cache-dir . pip install -v --no-cache-dir .
pip install -r requirements/requirements-test.txt pip install -r requirements/requirements-test.txt
- name: Unit Testing - name: Unit Testing
run: | run: |
PYTHONPATH=$PWD pytest tests PYTHONPATH=$PWD pytest tests
@ -68,3 +73,18 @@ jobs:
DATA: /data/scratch/cifar-10 DATA: /data/scratch/cifar-10
NCCL_SHM_DISABLE: 1 NCCL_SHM_DISABLE: 1
LD_LIBRARY_PATH: /github/home/.tensornvme/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64 LD_LIBRARY_PATH: /github/home/.tensornvme/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64
# Send a failure notice to Lark, linking back to this workflow run.
- name: Notify Lark
  id: message-preparation
  # Run this step only when an earlier step in the job has failed.
  if: ${{ failure() }}
  run: |
    # Build the link to this run's page so the message points at the logs.
    url="$SERVER_URL/$REPO/actions/runs/$RUN_ID"
    msg="Compatibility test failed with $container, please visit $url for details"
    # Quote every expansion so the shell neither word-splits nor globs the
    # message or the webhook URL before they reach echo / the Python script.
    echo "$msg"
    python .github/workflows/scripts/send_message_to_lark.py -m "$msg" -u "$WEBHOOK_URL"
  env:
    # Values are passed through the environment instead of being
    # interpolated directly into the script text.
    SERVER_URL: ${{ github.server_url }}
    REPO: ${{ github.repository }}
    RUN_ID: ${{ github.run_id }}
    WEBHOOK_URL: ${{ secrets.LARK_NOTIFICATION_WEBHOOK_URL }}
    # Lower-case name kept as-is: the script above reads $container.
    container: ${{ matrix.container }}