[workflow] disable p2p via shared memory on non-nvlink machine (#1086)

2022-06-09 15:24:35 +08:00 · 2022-06-09 15:24:35 +08:00 · 1bd8a72fc9
parent 65ee6dcc20
commit 1bd8a72fc9
1 changed file with 2 additions and 1 deletion
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -15,7 +15,7 @@ jobs:
    runs-on: [self-hosted, gpu]
    container:
      image: hpcaitech/pytorch-cuda:1.10.1-11.3.0
-      options: --shm-size=2gb --gpus all --rm -v /data/scratch/cifar-10:/data/scratch/cifar-10
+      options: --gpus all --rm -v /data/scratch/cifar-10:/data/scratch/cifar-10
    timeout-minutes: 40
    steps:
      - uses: actions/checkout@v2
@@ -34,3 +34,4 @@ jobs:
          PYTHONPATH=$PWD pytest tests
        env:
          DATA: /data/scratch/cifar-10
+          NCCL_SHM_DISABLE: 1