From de2dc61091137fe93eb94db4b18a69a207cef200 Mon Sep 17 00:00:00 2001
From: Oliver Koenig
Date: Fri, 25 Oct 2024 10:15:48 +0200
Subject: [PATCH] cpu

Allow the test template to start its container on CPU-only runners.

The "Start container" step now passes `--runtime=nvidia --gpus all` to
`docker run` only when the RUNNER input does not contain "cpu"; on CPU
runners these flags are omitted. The job additionally exposes the
`potential_infra_failure` output of the `main` step.

Signed-off-by: Oliver Koenig
---
 .github/workflows/_test_template.yml | 9 ++++++++-
 1 file changed, 8 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/_test_template.yml b/.github/workflows/_test_template.yml
index 76549af5dfa4e..56623c8fbff04 100644
--- a/.github/workflows/_test_template.yml
+++ b/.github/workflows/_test_template.yml
@@ -43,6 +43,7 @@ jobs:
     outputs:
       conclusion: ${{ steps.main.conclusion }}
       log: ${{ steps.main.outputs.log }}
+      potential_infra_failure: ${{ steps.main.outputs.potential_infra_failure }}
     steps:
       - name: Docker system cleanup
         run: |
@@ -54,7 +55,13 @@ jobs:
 
       - name: Start container
         run: |
-          docker run --rm -d --name nemo_container_${{ github.run_id }} --runtime=nvidia --gpus all --shm-size=64g --env TRANSFORMERS_OFFLINE=0 --env HYDRA_FULL_ERROR=1 --volume /mnt/datadrive/TestData:/home/TestData nemoci.azurecr.io/nemo_container_${{ github.run_id }} bash -c "sleep $(( ${{ inputs.TIMEOUT }} * 60 + 60 ))"
+          # GPU flags are opt-in: runners whose name contains "cpu" get none.
+          ARG=()
+          if [[ "${{ inputs.RUNNER }}" != *cpu* ]]; then
+            ARG=(--runtime=nvidia --gpus all)
+          fi
+
+          docker run --rm -d --name nemo_container_${{ github.run_id }} "${ARG[@]}" --shm-size=64g --env TRANSFORMERS_OFFLINE=0 --env HYDRA_FULL_ERROR=1 --volume /mnt/datadrive/TestData:/home/TestData nemoci.azurecr.io/nemo_container_${{ github.run_id }} bash -c "sleep $(( ${{ inputs.TIMEOUT }} * 60 + 60 ))"
 
       - id: main
         name: Run main script