mirror of https://github.com/hpcaitech/ColossalAI
[misc] support torch2.3 (#5893)
* [misc] support torch2.3
* [devops] update compatibility ci
* [devops] update compatibility ci
* [devops] add debug
* [devops] add debug
* [devops] add debug
* [devops] add debug
* [devops] remove debug
* [devops] remove debug
pull/5912/head
parent
530283dba0
commit
27a72f0de1
|
@@ -1,2 +1,3 @@
|
||||||
2.1.0-12.1.0
|
2.1.0-12.1.0
|
||||||
2.2.2-12.1.0
|
2.2.2-12.1.0
|
||||||
|
2.3.0-12.1.0
|
||||||
|
|
|
@@ -55,41 +55,27 @@ jobs:
|
||||||
steps:
|
steps:
|
||||||
- name: Install dependencies
|
- name: Install dependencies
|
||||||
run: |
|
run: |
|
||||||
pip install -U pip setuptools==68.2.2 wheel --user
|
|
||||||
- uses: actions/checkout@v2
|
|
||||||
with:
|
|
||||||
repository: hpcaitech/TensorNVMe
|
|
||||||
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
|
||||||
path: TensorNVMe
|
|
||||||
- name: Install tensornvme
|
|
||||||
run: |
|
|
||||||
cd TensorNVMe
|
|
||||||
apt update && apt install -y cmake
|
apt update && apt install -y cmake
|
||||||
pip install -r requirements.txt
|
pip install -U pip setuptools==68.2.2 wheel --user
|
||||||
DISABLE_URING=1 pip install -v .
|
|
||||||
- uses: actions/checkout@v2
|
- uses: actions/checkout@v2
|
||||||
with:
|
with:
|
||||||
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
||||||
- name: Download cub for CUDA 10.2
|
|
||||||
run: |
|
|
||||||
CUDA_VERSION=$(nvcc -V | awk -F ',| ' '/release/{print $6}')
|
|
||||||
|
|
||||||
# check if it is CUDA 10.2
|
|
||||||
# download cub
|
|
||||||
if [ "$CUDA_VERSION" = "10.2" ]; then
|
|
||||||
wget https://github.com/NVIDIA/cub/archive/refs/tags/1.8.0.zip
|
|
||||||
unzip 1.8.0.zip
|
|
||||||
cp -r cub-1.8.0/cub/ colossalai/kernel/cuda_native/csrc/kernels/include/
|
|
||||||
fi
|
|
||||||
- name: Install Colossal-AI
|
- name: Install Colossal-AI
|
||||||
run: |
|
run: |
|
||||||
BUILD_EXT=1 pip install -v .
|
BUILD_EXT=1 pip install -v .
|
||||||
pip install -r requirements/requirements-test.txt
|
pip install --no-cache-dir -r requirements/requirements-test.txt
|
||||||
|
|
||||||
|
- name: Install tensornvme
|
||||||
|
run: |
|
||||||
|
DISABLE_URING=1 pip install -v git+https://github.com/hpcaitech/TensorNVMe.git
|
||||||
|
|
||||||
- name: Unit Testing
|
- name: Unit Testing
|
||||||
run: |
|
run: |
|
||||||
PYTHONPATH=$PWD pytest --durations=0 tests
|
PYTHONPATH=$PWD pytest --durations=0 tests
|
||||||
env:
|
env:
|
||||||
DATA: /data/scratch/cifar-10
|
DATA: /data/scratch/cifar-10
|
||||||
LD_LIBRARY_PATH: /github/home/.tensornvme/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64
|
LD_LIBRARY_PATH: /github/home/.tensornvme/lib
|
||||||
LLAMA_PATH: /data/scratch/llama-tiny
|
LLAMA_PATH: /data/scratch/llama-tiny
|
||||||
MOE_TENSOR_PATH: /data/scratch/moe_tensors
|
MOE_TENSOR_PATH: /data/scratch/moe_tensors
|
||||||
|
|
|
@@ -49,42 +49,27 @@ jobs:
|
||||||
steps:
|
steps:
|
||||||
- name: Install dependencies
|
- name: Install dependencies
|
||||||
run: |
|
run: |
|
||||||
pip install -U pip setuptools==68.2.2 wheel --user
|
|
||||||
- uses: actions/checkout@v2
|
|
||||||
with:
|
|
||||||
repository: hpcaitech/TensorNVMe
|
|
||||||
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
|
||||||
path: TensorNVMe
|
|
||||||
- name: Install tensornvme
|
|
||||||
run: |
|
|
||||||
cd TensorNVMe
|
|
||||||
apt update && apt install -y cmake
|
apt update && apt install -y cmake
|
||||||
pip install -r requirements.txt
|
pip install -U pip setuptools==68.2.2 wheel --user
|
||||||
DISABLE_URING=1 pip install -v .
|
|
||||||
- uses: actions/checkout@v2
|
- uses: actions/checkout@v2
|
||||||
with:
|
with:
|
||||||
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
||||||
- name: Download cub for CUDA 10.2
|
|
||||||
run: |
|
|
||||||
CUDA_VERSION=$(nvcc -V | awk -F ',| ' '/release/{print $6}')
|
|
||||||
|
|
||||||
# check if it is CUDA 10.2
|
|
||||||
# download cub
|
|
||||||
if [ "$CUDA_VERSION" = "10.2" ]; then
|
|
||||||
wget https://github.com/NVIDIA/cub/archive/refs/tags/1.8.0.zip
|
|
||||||
unzip 1.8.0.zip
|
|
||||||
cp -r cub-1.8.0/cub/ colossalai/kernel/cuda_native/csrc/kernels/include/
|
|
||||||
fi
|
|
||||||
|
|
||||||
- name: Install Colossal-AI
|
- name: Install Colossal-AI
|
||||||
run: |
|
run: |
|
||||||
BUILD_EXT=1 pip install -v .
|
BUILD_EXT=1 pip install -v .
|
||||||
pip install -r requirements/requirements-test.txt
|
pip install --no-cache-dir -r requirements/requirements-test.txt
|
||||||
|
|
||||||
|
- name: Install tensornvme
|
||||||
|
run: |
|
||||||
|
DISABLE_URING=1 pip install -v git+https://github.com/hpcaitech/TensorNVMe.git
|
||||||
|
|
||||||
- name: Unit Testing
|
- name: Unit Testing
|
||||||
run: |
|
run: |
|
||||||
PYTHONPATH=$PWD pytest --durations=0 tests
|
PYTHONPATH=$PWD pytest --durations=0 tests
|
||||||
env:
|
env:
|
||||||
DATA: /data/scratch/cifar-10
|
DATA: /data/scratch/cifar-10
|
||||||
LD_LIBRARY_PATH: /github/home/.tensornvme/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64
|
LD_LIBRARY_PATH: /github/home/.tensornvme/lib
|
||||||
LLAMA_PATH: /data/scratch/llama-tiny
|
LLAMA_PATH: /data/scratch/llama-tiny
|
||||||
MOE_TENSOR_PATH: /data/scratch/moe_tensors
|
MOE_TENSOR_PATH: /data/scratch/moe_tensors
|
||||||
|
|
|
@@ -43,47 +43,28 @@ jobs:
|
||||||
steps:
|
steps:
|
||||||
- name: Install dependencies
|
- name: Install dependencies
|
||||||
run: |
|
run: |
|
||||||
|
apt update && apt install -y cmake
|
||||||
pip install -U pip setuptools==68.2.2 wheel --user
|
pip install -U pip setuptools==68.2.2 wheel --user
|
||||||
|
|
||||||
- uses: actions/checkout@v2
|
- uses: actions/checkout@v2
|
||||||
with:
|
with:
|
||||||
repository: hpcaitech/TensorNVMe
|
|
||||||
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
||||||
path: TensorNVMe
|
|
||||||
|
|
||||||
- name: Install tensornvme
|
|
||||||
run: |
|
|
||||||
cd TensorNVMe
|
|
||||||
apt update && apt install -y cmake
|
|
||||||
pip install -r requirements.txt
|
|
||||||
DISABLE_URING=1 pip install -v .
|
|
||||||
- uses: actions/checkout@v2
|
|
||||||
with:
|
|
||||||
ssh-key: ${{ secrets.SSH_KEY_FOR_CI }}
|
|
||||||
|
|
||||||
- name: Download cub for CUDA 10.2
|
|
||||||
run: |
|
|
||||||
CUDA_VERSION=$(nvcc -V | awk -F ',| ' '/release/{print $6}')
|
|
||||||
|
|
||||||
# check if it is CUDA 10.2
|
|
||||||
# download cub
|
|
||||||
if [ "$CUDA_VERSION" = "10.2" ]; then
|
|
||||||
wget https://github.com/NVIDIA/cub/archive/refs/tags/1.8.0.zip
|
|
||||||
unzip 1.8.0.zip
|
|
||||||
cp -r cub-1.8.0/cub/ colossalai/kernel/cuda_native/csrc/kernels/include/
|
|
||||||
fi
|
|
||||||
|
|
||||||
- name: Install Colossal-AI
|
- name: Install Colossal-AI
|
||||||
run: |
|
run: |
|
||||||
BUILD_EXT=1 pip install -v .
|
BUILD_EXT=1 pip install -v .
|
||||||
pip install -r requirements/requirements-test.txt
|
pip install --no-cache-dir -r requirements/requirements-test.txt
|
||||||
|
|
||||||
|
- name: Install tensornvme
|
||||||
|
run: |
|
||||||
|
DISABLE_URING=1 pip install -v git+https://github.com/hpcaitech/TensorNVMe.git
|
||||||
|
|
||||||
- name: Unit Testing
|
- name: Unit Testing
|
||||||
run: |
|
run: |
|
||||||
PYTHONPATH=$PWD pytest --durations=0 tests
|
PYTHONPATH=$PWD pytest --durations=0 tests
|
||||||
env:
|
env:
|
||||||
DATA: /data/scratch/cifar-10
|
DATA: /data/scratch/cifar-10
|
||||||
LD_LIBRARY_PATH: /github/home/.tensornvme/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64
|
LD_LIBRARY_PATH: /github/home/.tensornvme/lib
|
||||||
LLAMA_PATH: /data/scratch/llama-tiny
|
LLAMA_PATH: /data/scratch/llama-tiny
|
||||||
MOE_TENSOR_PATH: /data/scratch/moe_tensors
|
MOE_TENSOR_PATH: /data/scratch/moe_tensors
|
||||||
|
|
||||||
|
|
|
@@ -8,7 +8,7 @@ click
|
||||||
fabric
|
fabric
|
||||||
contexttimer
|
contexttimer
|
||||||
ninja
|
ninja
|
||||||
torch>=2.1.0,<2.3.0
|
torch>=2.1.0,<=2.3.0
|
||||||
safetensors
|
safetensors
|
||||||
einops
|
einops
|
||||||
pydantic
|
pydantic
|
||||||
|
|
Loading…
Reference in New Issue