[dicp][ascend] Add llama hf unit test. (#537) #1
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: dipu ci | |
on: | |
workflow_dispatch: | |
push: | |
branches: | |
- main | |
- dev_v0.25 | |
pull_request: | |
paths-ignore: | |
- "dicp/**" | |
env: | |
CAMB_CI_PATH: '/mnt/lustre/share/parrotsci/github/cibuild/${{ github.repository }}' | |
CAMB_PARTATION: ${{ vars.CAMB_SLURM_PAR != '' && vars.CAMB_SLURM_PAR || 'camb_mlu370_m8' }} | |
CAMB_CLUSTER: CAMB | |
CAMB_TORCH_BASE_DIR: '/mnt/lustre/share/parrotsci/github/cibuild/pytorchbase' | |
CUDA_CI_PATH: '/mnt/cache/share/parrotsci/github/cibuild/${{ github.repository }}' | |
CUDA_PARTATION: ${{ vars.SH1988_SLURM_PAR != '' && vars.SH1988_SLURM_PAR || 'pat_rd -x SH-IDC1-10-198-8-60' }} | |
CUDA_CLUSTER: SH1988 | |
DEEPLINK_PATH: '/mnt/cache/share/deeplinkci/github/${{ github.repository }}' | |
ASCEND_CLUSTER: ASCEND | |
CLUSTER_ASCEND_910B: ASCEND-910B | |
ASCEND_TORCH_DIR: '/mnt/cache/share/platform/cienv/pytorch' | |
CI_BUILD_FLAG: "ci_build_flag" | |
PYTORCH_COMMIT: ${{ vars.PYTORCH_COMMIT != '' && vars.PYTORCH_COMMIT || 'c263bd43e8e8502d4726643bc6fd046f0130ac0e' }} # pytorch tag 2.0 | |
ALL_COVERAGE: ${{ (contains( github.ref, 'main') || startsWith(github.ref, 'refs/heads/v') || startsWith(github.ref, 'refs/heads/dev')) && 'ON' || 'OFF' }} | |
REQUIRE_COVERAGE: ${{ vars.REQUIRE_COVERAGE != '' && vars.REQUIRE_COVERAGE || '40' }} | |
REPO: ${{ github.event.repository.name }} | |
concurrency: | |
group: dipu-${{ github.head_ref || github.ref }} | |
cancel-in-progress: true | |
jobs: | |
Rsync: | |
name: Rsync code | |
runs-on: github-poc-ci | |
steps: | |
- name: clone repo | |
run: | | |
set -ex | |
cd ${GITHUB_WORKSPACE} && rm -rf DIPU ${REPO}_DIOPI ${REPO} ${REPO}.dev | |
if [ -n "${{ github.event.pull_request.head.repo.full_name }}" ] && [[ ! "${{ github.event.pull_request.head.repo.full_name }}" == "${{ github.repository }}" ]]; then | |
git clone ${{ github.event.pull_request.head.repo.ssh_url }} ${REPO} | |
cd ${GITHUB_WORKSPACE}/${REPO} && git checkout ${{ github.event.pull_request.head.sha }} | |
git remote add mainrepo [email protected]:${GITHUB_REPOSITORY}.git | |
git fetch mainrepo && git merge --no-edit mainrepo/${{ github.base_ref }} | |
else | |
git clone https://github.com/DeepLink-org/${REPO}.git && cd ${REPO} | |
if [ $GITHUB_EVENT_NAME == "pull_request" ]; then | |
echo "${{ github.base_ref }} " | |
git checkout ${{ github.event.pull_request.head.sha }} && git merge --no-edit origin/${{ github.base_ref }} | |
else | |
echo $GITHUB_EVENT_NAME | |
git checkout ${{ github.sha }} | |
fi | |
fi | |
cd ${GITHUB_WORKSPACE}/${REPO}/dipu && rm -rf third_party/kineto | |
git clone --reference /home/autolink/rsync/sourcecode/DeepLink-org/kineto https://github.com/DeepLink-org/kineto.git third_party/kineto | |
git submodule update --init && cd third_party/kineto && git submodule update --init | |
cd ${GITHUB_WORKSPACE} && cp -R ${REPO} ${REPO}_DIOPI | |
cd ${REPO}/dipu && bash /home/autolink/rsync/sourcecode/update_code.sh | |
rsync -a /home/autolink/rsync/sourcecode/mmlab_pack . && cd mmlab_pack | |
bash ../scripts/ci/ci_one_iter.sh clone | |
# dipu_diopi depend on latest target diopi branch, not diopi in submodule. here assume diopi and dipu use same 'target branch' " github.base_ref " | |
cd ${GITHUB_WORKSPACE}/${REPO}_DIOPI/dipu/third_party && rm -rf DIOPI && git clone https://github.com/DeepLink-org/DIOPI.git | |
if [ $GITHUB_EVENT_NAME == "pull_request" ]; then | |
cd ./DIOPI && git checkout ${{ github.base_ref }} | |
fi | |
- name: Rsync to Server | |
run: | | |
ssh ${CAMB_CLUSTER} "mkdir -p ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/source ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/source-main" | |
rsync -a --delete ${GITHUB_WORKSPACE}/${REPO}/ ${CAMB_CLUSTER}:${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/source/ | |
rsync -a --delete ${GITHUB_WORKSPACE}/${REPO}_DIOPI/ ${CAMB_CLUSTER}:${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/source-main/ | |
ssh ${CUDA_CLUSTER} "mkdir -p ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/source ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/source-main" | |
rsync -a --delete ${GITHUB_WORKSPACE}/${REPO}/ ${CUDA_CLUSTER}:${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/source/ | |
rsync -a --delete ${GITHUB_WORKSPACE}/${REPO}_DIOPI/ ${CUDA_CLUSTER}:${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/source-main/ | |
ssh ${CLUSTER_ASCEND_910B} "mkdir -p ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/source ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/source-main" | |
rsync -a --delete ${GITHUB_WORKSPACE}/${REPO}/ ${CLUSTER_ASCEND_910B}:${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/source/ | |
rsync -a --delete ${GITHUB_WORKSPACE}/${REPO}_DIOPI/ ${CLUSTER_ASCEND_910B}:${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/source-main/ | |
Build-Camb: | |
name: Build-dipu-camb | |
needs: [Rsync] | |
runs-on: github-poc-ci | |
env: | |
MLU_REQUESTS: 1 | |
steps: | |
- name: Build dipu | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -ex | |
export USE_COVERAGE=ON | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && cp -R source ${GITHUB_JOB} && cd ${GITHUB_JOB}/dipu | |
export PYTORCH_DIR=${CAMB_TORCH_BASE_DIR}/${PYTORCH_COMMIT} | |
source scripts/ci/camb/ci_camb_env.sh | |
rsync -a /mnt/lustre/share_data/PAT/datasets/huggingface mmlab_pack/ | |
srun --job-name=${GITHUB_JOB} --partition=${CAMB_PARTATION} --time=40 \ | |
--gres=mlu:${MLU_REQUESTS} bash scripts/ci/camb/ci_camb_script.sh build_dipu \ | |
|| ( cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && exit 1 ) | |
""" | |
Test-Camb: | |
name: Test-dipu-camb | |
needs: [Build-Camb] | |
runs-on: github-poc-ci | |
env: | |
MLU_REQUESTS: 1 | |
steps: | |
- name: Run-test | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -ex | |
export USE_COVERAGE=ON | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/ && cd Build-Camb/dipu | |
export PYTORCH_DIR=${CAMB_TORCH_BASE_DIR}/${PYTORCH_COMMIT} | |
source scripts/ci/camb/ci_camb_env.sh | |
srun --job-name=${GITHUB_JOB} --partition=${CAMB_PARTATION} --time=40 --gres=mlu:${MLU_REQUESTS} sh tests/run_camb_tests.sh | |
if [ "${ALL_COVERAGE}" = "ON" ]; then | |
sh /mnt/lustre/share/platform/dep/sonar/coverage_DIPU_camb.sh ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb ${GITHUB_RUN_NUMBER} || echo "get coverage fail" | |
fi | |
""" | |
- name: increment coverage check | |
if: ${{ contains( github.event_name, 'pull_request' ) && contains( github.base_ref, 'main' ) }} | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -e | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb | |
rm -rf scripts | |
ln -s ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/source-main/dipu/third_party/DIOPI/scripts scripts | |
source /mnt/cache/share/platform/env/pt2.0_diopi | |
bash scripts/increment_coverage.sh ${REQUIRE_COVERAGE} | |
""" | |
Test-One-Iter-Camb: | |
name: Test-one-iter-camb | |
needs: [Build-Camb] | |
runs-on: github-poc-ci | |
env: | |
MLU_REQUESTS: 1 | |
steps: | |
- name: build-some-env | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -ex | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb/dipu | |
export PYTORCH_DIR=${CAMB_TORCH_BASE_DIR}/${PYTORCH_COMMIT} | |
echo "pytorch dir: \${PYTORCH_DIR}" | |
source scripts/ci/camb/ci_camb_env.sh | |
basic_path=${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb/dipu/mmlab_pack | |
export PYTHONPATH=\${basic_path}/mmengine:\$PYTHONPATH | |
export PYTHONPATH=\${basic_path}/mmcv:\$PYTHONPATH | |
export PYTHONPATH=\$(pwd):\$PYTHONPATH | |
cd mmlab_pack | |
srun --job-name=${GITHUB_RUN_NUMBER}_${GITHUB_JOB} --partition=${CAMB_PARTATION} --gres=mlu:${MLU_REQUESTS} sh ../scripts/ci/ci_one_iter.sh build_camb | |
""" | |
- name: run-one-iter-for-tradition | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -ex | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb/dipu | |
export PYTORCH_DIR=${CAMB_TORCH_BASE_DIR}/${PYTORCH_COMMIT} | |
echo "pytorch dir: \${PYTORCH_DIR}" | |
source scripts/ci/camb/ci_camb_env.sh | |
basic_path=${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb/dipu/mmlab_pack | |
source scripts/ci/ci_one_iter.sh export_pythonpath_camb \${basic_path} | |
export PYTHONPATH=\$(pwd):\$PYTHONPATH | |
cd mmlab_pack | |
rm -rf one_iter_data | |
python ../scripts/ci/ci_run_one_iter.py camb ${GITHUB_JOB} "mlu:${MLU_REQUESTS}" \"${CAMB_PARTATION}\" && rm -rf one_iter_data || (rm -rf one_iter_data && exit 1) | |
""" | |
- name: run-one-iter-for-llm | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -ex | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb/dipu | |
export PYTORCH_DIR=${CAMB_TORCH_BASE_DIR}/${PYTORCH_COMMIT} | |
echo "pytorch dir: \${PYTORCH_DIR}" | |
source scripts/ci/camb/ci_camb_env.sh | |
basic_path=${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb/dipu/mmlab_pack | |
source scripts/ci/ci_one_iter.sh export_pythonpath_camb \${basic_path} | |
export PYTHONPATH=\$(pwd):\$PYTHONPATH | |
cd mmlab_pack | |
rm -rf one_iter_data | |
python ../scripts/ci/ci_run_one_iter.py camb ${GITHUB_JOB} "mlu:${MLU_REQUESTS}" \"${CAMB_PARTATION}\" "llm" && rm -rf one_iter_data || (rm -rf one_iter_data && exit 1) | |
""" | |
- name: Perform cleanup one iter data | |
if: always() | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -ex | |
echo "${GITHUB_RUN_NUMBER}_${GITHUB_JOB}" | |
scancel -n "${GITHUB_RUN_NUMBER}_${GITHUB_JOB}" | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Camb/dipu/mmlab_pack | |
rm -rf one_iter_data | |
touch one_iter_data #用于占位,防止创建新的one_iter_data文件夹 | |
""" | |
- name: Check for failure | |
if: ${{ failure() }} | |
run: exit 1 | |
Build-Camb-Latest-Target: | |
name: Build-dipu-camb-latest-target | |
needs: [Rsync] | |
runs-on: github-poc-ci | |
env: | |
MLU_REQUESTS: 1 | |
steps: | |
- name: Build dipu diopi-latest-target | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -ex | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && cp -R source-main ${GITHUB_JOB} && cd ${GITHUB_JOB}/dipu | |
export PYTORCH_DIR=${CAMB_TORCH_BASE_DIR}/${PYTORCH_COMMIT} | |
source scripts/ci/camb/ci_camb_env.sh | |
srun --job-name=${GITHUB_JOB} --partition=${CAMB_PARTATION} --time=40 \ | |
--gres=mlu:${MLU_REQUESTS} bash scripts/ci/camb/ci_camb_script.sh build_dipu \ | |
|| ( cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && exit 1 ) | |
""" | |
Test-Camb-Latest-Target: | |
name: Test-dipu-camb-latest-target | |
needs: [Build-Camb-Latest-Target] | |
runs-on: github-poc-ci | |
env: | |
MLU_REQUESTS: 1 | |
steps: | |
- name: Run-test | |
run: | | |
ssh ${CAMB_CLUSTER} """ | |
set -ex | |
cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/ && cd Build-Camb-Latest-Target/dipu | |
export PYTORCH_DIR=${CAMB_TORCH_BASE_DIR}/${PYTORCH_COMMIT} | |
source scripts/ci/camb/ci_camb_env.sh | |
srun --job-name=${GITHUB_JOB} --partition=${CAMB_PARTATION} --time=40 --gres=mlu:${MLU_REQUESTS} sh tests/run_camb_tests.sh && rm -rf Build-Camb-Diopi \ | |
|| ( cd ${CAMB_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf Build-Camb-Latest-Target && exit 1 ) | |
""" | |
Build-Cuda: | |
name: Build-dipu-cuda | |
needs: [Rsync] | |
runs-on: github-poc-ci | |
env: | |
GPU_REQUESTS: 1 | |
steps: | |
- name: Build dipu | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
set -e | |
export USE_COVERAGE=ON | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER} && rm -rf ${GITHUB_JOB} && cp -R source ${GITHUB_JOB} && cd ${GITHUB_JOB}/dipu | |
source scripts/ci/nv/ci_nv_env.sh | |
rsync -a /mnt/lustre/share_data/PAT/datasets/huggingface mmlab_pack/ | |
srun --job-name=${GITHUB_RUN_NUMBER}_${GITHUB_JOB} --partition=${CUDA_PARTATION} --gres=gpu:${GPU_REQUESTS} --time=30 bash scripts/ci/nv/ci_nv_script.sh build_dipu \ | |
|| ( cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && exit 1 ) | |
""" | |
Test-Cuda: | |
name: Test-dipu-cuda | |
needs: [Build-Cuda] | |
runs-on: github-poc-ci | |
env: | |
GPU_REQUESTS: 1 | |
steps: | |
- name: Run-test | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
set -ex | |
export USE_COVERAGE=ON | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && cd Build-Cuda/dipu | |
source scripts/ci/nv/ci_nv_env.sh | |
srun --job-name=${GITHUB_RUN_NUMBER}_${GITHUB_JOB} --partition=${CUDA_PARTATION} --gres=gpu:${GPU_REQUESTS} --cpus-per-task=5 --mem=16G --time=70 sh tests/run_nv_tests.sh | |
if [ "${ALL_COVERAGE}" = "ON" ]; then | |
bash /mnt/cache/share/platform/dep/sonar/coverage_DIPU_nv.sh ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Cuda ${GITHUB_RUN_NUMBER} || echo "get coverage fail" | |
fi | |
""" | |
- name: increment coverage check | |
if: ${{ contains( github.event_name, 'pull_request' ) && contains( github.base_ref, 'main' ) }} | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
set -e | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Cuda/ | |
rm -rf scripts | |
ln -s ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/source-main/dipu/third_party/DIOPI/scripts scripts | |
source /mnt/cache/share/platform/env/pt2.0_diopi | |
bash scripts/increment_coverage.sh ${REQUIRE_COVERAGE} | |
""" | |
Test-One-Iter_Cuda: | |
name: Test-one-iter-cuda | |
needs: [Build-Cuda] | |
runs-on: github-poc-ci | |
env: | |
GPU_REQUESTS: 1 | |
steps: | |
- name: build some env | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
set -ex | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && cd Build-Cuda/dipu | |
source scripts/ci/nv/ci_nv_env.sh | |
basic_path=${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Cuda/dipu/mmlab_pack | |
export PYTHONPATH=\${basic_path}/mmengine:\$PYTHONPATH | |
export PYTHONPATH=\${basic_path}/mmcv:\$PYTHONPATH | |
export PYTHONPATH=\$(pwd):\$PYTHONPATH | |
cd mmlab_pack | |
srun --job-name=${GITHUB_RUN_NUMBER}_${GITHUB_JOB} --partition=${CUDA_PARTATION} --gres=gpu:${GPU_REQUESTS} --time=20 bash ../scripts/ci/ci_one_iter.sh build_cuda | |
""" | |
- name: run-one-iter-for-tradition | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && cd Build-Cuda/dipu | |
source scripts/ci/nv/ci_nv_env.sh | |
basic_path=${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Cuda/dipu/mmlab_pack | |
source scripts/ci/ci_one_iter.sh export_pythonpath_cuda \${basic_path} | |
export PYTHONPATH=\$(pwd):\$PYTHONPATH | |
cd mmlab_pack | |
rm -rf one_iter_data | |
python ../scripts/ci/ci_run_one_iter.py cuda ${GITHUB_RUN_NUMBER}_${GITHUB_JOB} "gpu:${GPU_REQUESTS}" \"${CUDA_PARTATION}\" && rm -rf one_iter_data || (rm -rf one_iter_data && exit 1) | |
""" | |
- name: run-one-iter-for-llm | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && cd Build-Cuda/dipu | |
source scripts/ci/nv/ci_nv_env.sh | |
basic_path=${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Cuda/dipu/mmlab_pack | |
source scripts/ci/ci_one_iter.sh export_pythonpath_cuda \${basic_path} | |
export PYTHONPATH=\$(pwd):\$PYTHONPATH | |
cd mmlab_pack | |
rm -rf one_iter_data | |
python ../scripts/ci/ci_run_one_iter.py cuda ${GITHUB_RUN_NUMBER}_${GITHUB_JOB} "gpu:${GPU_REQUESTS}" \"${CUDA_PARTATION}\" "llm" && rm -rf one_iter_data || (rm -rf one_iter_data && exit 1) | |
""" | |
- name: Perform cleanup one iter data | |
if: always() | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
set -ex | |
echo "${GITHUB_RUN_NUMBER}_${GITHUB_JOB}" | |
scancel -n "${GITHUB_RUN_NUMBER}_${GITHUB_JOB}" | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/Build-Cuda/dipu/mmlab_pack | |
rm -rf one_iter_data | |
touch one_iter_data #用于占位,防止创建新的one_iter_data文件夹 | |
""" | |
- name: Check for failure | |
if: ${{ failure() }} | |
run: exit 1 | |
Build-Cuda-Latest-Target: | |
name: Build-dipu-cuda-latest-target | |
needs: [Rsync] | |
runs-on: github-poc-ci | |
env: | |
GPU_REQUESTS: 1 | |
steps: | |
- name: Build dipu diopi-latest-target | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
set -ex | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER} && rm -rf ${GITHUB_JOB} && cp -R source-main ${GITHUB_JOB} && cd ${GITHUB_JOB}/dipu | |
source scripts/ci/nv/ci_nv_env.sh | |
srun --job-name=${GITHUB_RUN_NUMBER}_${GITHUB_JOB} --partition=${CUDA_PARTATION} --gres=gpu:${GPU_REQUESTS} --cpus-per-task=5 --mem=16G --time=30 bash scripts/ci/nv/ci_nv_script.sh build_dipu \ | |
|| ( cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && exit 1 ) | |
""" | |
Test-Cuda-Latest-Target: | |
name: Test-dipu-cuda-latest-target | |
needs: [Build-Cuda-Latest-Target] | |
runs-on: github-poc-ci | |
env: | |
GPU_REQUESTS: 1 | |
steps: | |
- name: Run-test | |
run: | | |
ssh ${CUDA_CLUSTER} """ | |
set -ex | |
cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && cd Build-Cuda-Latest-Target/dipu | |
source scripts/ci/nv/ci_nv_env.sh | |
srun --job-name=${GITHUB_RUN_NUMBER}_${GITHUB_JOB} --partition=${CUDA_PARTATION} --gres=gpu:${GPU_REQUESTS} --cpus-per-task=5 --mem=16G --time=60 sh tests/run_nv_tests.sh && cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf Build-Cuda-Latest-Target \ | |
|| ( cd ${CUDA_CI_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && exit 1 ) | |
""" | |
Build-PyTorch-For-Ascend-910b: | |
name: Build-dipu-pytorch-for-ascend-910b | |
needs: [Rsync] | |
runs-on: tps-ascend-ci-910b | |
steps: | |
- name: Build PyTorch | |
run: | | |
set -ex | |
cd ${ASCEND_TORCH_DIR} | |
if [ "$(git rev-parse HEAD)" != "${PYTORCH_COMMIT}" ]; then | |
rm -rf build | |
fi | |
if [ ! -d "build" ]; then | |
source ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/source/dipu/scripts/ci/ascend/ci_ascend_env.sh | |
export CMAKE_PREFIX_PATH=${CONDA_PREFIX:-"$(dirname $(which conda))/../"} | |
BUILD_BINARY=0 USE_PRECOMPILED_HEADERS=1 BUILD_TEST=0 USE_CUDA=0 python setup.py build_ext -i || (rm -rf build && exit 1) | |
fi | |
Build-Ascend-910b: | |
name: Build-dipu-ascend-910b | |
needs: [Build-PyTorch-For-Ascend-910b] | |
runs-on: tps-ascend-ci-910b | |
steps: | |
- name: Build dipu | |
run: | | |
set -ex | |
cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && cp -R source ${GITHUB_JOB} && cd ${GITHUB_JOB}/dipu | |
source scripts/ci/ascend/ci_ascend_env.sh | |
bash scripts/ci/ascend/ci_ascend_script.sh build_dipu \ | |
|| ( cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && exit 1 ) | |
Test-Ascend-910b: | |
name: Test-dipu-ascend-910b | |
needs: [Build-Ascend-910b] | |
runs-on: tps-ascend-ci-910b | |
steps: | |
- name: Run a test | |
run: | | |
set -ex | |
cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/Build-Ascend-910b/dipu | |
source scripts/ci/ascend/ci_ascend_env.sh | |
bash tests/run_ascend_tests.sh | |
Test-One-Iter-Ascend-910b: | |
name: Test-one-iter-ascend-910b | |
needs: [Build-Ascend-910b] | |
runs-on: tps-ascend-ci-910b | |
steps: | |
- name: Build some env | |
run: | | |
set -ex | |
cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/Build-Ascend-910b/dipu | |
source scripts/ci/ascend/ci_ascend_env.sh | |
basic_path=${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/Build-Ascend-910b/dipu/mmlab_pack | |
source scripts/ci/ci_one_iter.sh export_pythonpath_ascend ${basic_path} | |
cd mmlab_pack | |
bash ../scripts/ci/ci_one_iter.sh build_ascend910b | |
- name: Run one iter tools | |
run: | | |
set -ex | |
cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/Build-Ascend-910b/dipu | |
source scripts/ci/ascend/ci_ascend_env.sh | |
basic_path=${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/Build-Ascend-910b/dipu/mmlab_pack | |
source scripts/ci/ci_one_iter.sh export_pythonpath_ascend ${basic_path} | |
cd mmlab_pack | |
rm -rf one_iter_data | |
python ../scripts/ci/ci_run_one_iter.py ascend "" "" "" && rm -rf one_iter_data || (rm -rf one_iter_data && exit 1) | |
- name: Perform cleanup one iter data | |
if: always() | |
run: | | |
set -ex | |
cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/Build-Ascend-910b/dipu/mmlab_pack | |
rm -rf one_iter_data | |
touch one_iter_data #用于占位,防止创建新的one_iter_data文件夹 | |
- name: Check for failure | |
if: ${{ failure() }} | |
run: exit 1 | |
Build-Ascend-Latest-Target-910b: | |
name: Build-dipu-ascend-latest-target-910b | |
needs: [Build-PyTorch-For-Ascend-910b] | |
runs-on: tps-ascend-ci-910b | |
steps: | |
- name: Build dipu diopi-latest-target | |
run: | | |
set -ex | |
cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && cp -R source-main ${GITHUB_JOB} && cd ${GITHUB_JOB}/dipu | |
source scripts/ci/ascend/ci_ascend_env.sh | |
bash scripts/ci/ascend/ci_ascend_script.sh build_dipu \ | |
|| ( cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf ${GITHUB_JOB} && exit 1 ) | |
Test-Ascend-Latest-Target-910b: | |
name: Test-dipu-ascend-latest-target-910b | |
needs: [Build-Ascend-Latest-Target-910b] | |
runs-on: tps-ascend-ci-910b | |
steps: | |
- name: Run a test | |
run: | | |
set -ex | |
cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/Build-Ascend-Latest-Target-910b/dipu | |
source scripts/ci/ascend/ci_ascend_env.sh | |
bash tests/run_ascend_tests.sh && cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf Build-Ascend-Latest-Target \ | |
|| ( cd ${DEEPLINK_PATH}/${GITHUB_RUN_NUMBER}/ && rm -rf Build-Ascend-Latest-Target && exit 1 ) |