lammps-migration-net: add migration + compute and network bound bench… #166
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Test example applications | |
on: | |
push: | |
branches: [main] | |
pull_request: | |
branches: [main] | |
types: [opened, synchronize, reopened, ready_for_review] | |
jobs: | |
# Cancel previous running actions for the same PR | |
cancel_previous: | |
if: github.event.pull_request.draft == false | |
runs-on: ubuntu-latest | |
steps: | |
- name: Cancel Workflow Action | |
uses: styfle/[email protected] | |
checks: | |
if: github.event.pull_request.draft == false | |
runs-on: ubuntu-latest | |
steps: | |
# --- Update code --- | |
- name: "Checkout code" | |
uses: actions/checkout@v4 | |
with: | |
submodules: true | |
# --- Formatting --- | |
- name: "Format code" | |
run: ./bin/inv_wrapper.sh format-code --check | |
# Work-out whether we need to re-build the examples. We need to re-build the | |
# examples if either _any_ fo the examples has changed, or the WASM cache | |
# has expired | |
needs-build: | |
if: github.event.pull_request.draft == false | |
runs-on: ubuntu-latest | |
outputs: | |
needs-wasm: ${{ (steps.filter.outputs.examples-changed == 'true') || (steps.wasm-cache.outputs.cache-hit != 'true') }} | |
steps: | |
- name: "Checkout code" | |
uses: actions/checkout@v4 | |
# Check if any of the submodules have been modified | |
- uses: dorny/paths-filter@v2 | |
id: filter | |
with: | |
filters: | | |
examples-changed: | |
- './examples/**' | |
# Check if we have a WASM cache hit | |
- name: "Get CPP/Python commits" | |
id: submodule-commit | |
run: | | |
git submodule update --init ./cpp | |
git submodule update --init ./python | |
sudo apt install -y zstd | |
git config --global --add safe.directory "$GITHUB_WORKSPACE" | |
echo "cpp-commit=$(git submodule status ./cpp | cut '-d ' -f 2)" >> $GITHUB_OUTPUT | |
echo "py-commit=$(git submodule status ./python | cut '-d ' -f 2)" >> $GITHUB_OUTPUT | |
- uses: actions/cache/[email protected] | |
id: wasm-cache | |
with: | |
path: ./wasm | |
key: wasm-${{ steps.submodule-commit.outputs.cpp-commit }}-${{ steps.submodule-commit.outputs.py-commit }} | |
lookup-only: true | |
build-examples: | |
needs: needs-build | |
if: ${{ needs.needs-build.outputs.needs-wasm == 'true' }} | |
runs-on: ubuntu-latest | |
container: | |
image: faasm.azurecr.io/examples-build:0.3.1_0.3.1 | |
credentials: | |
username: ${{ secrets.ACR_SERVICE_PRINCIPAL_ID }} | |
password: ${{ secrets.ACR_SERVICE_PRINCIPAL_PASSWORD }} | |
steps: | |
- name: "Checkout code" | |
uses: actions/checkout@v4 | |
with: | |
submodules: true | |
- name: "Build FFmpeg" | |
run: ./bin/inv_wrapper.sh ffmpeg | |
- name: "Build ImageMagick" | |
run: ./bin/inv_wrapper.sh libpng imagemagick | |
- name: "Build Kernels" | |
run: ./bin/inv_wrapper.sh kernels kernels --native | |
- name: "Build LAMMPS" | |
run: ./bin/inv_wrapper.sh lammps lammps --native | |
- name: "Build LAMMPS with migration" | |
run: ./bin/inv_wrapper.sh lammps --migration lammps --native --migration | |
- name: "Build LAMMPS with migration and network phase" | |
run: ./bin/inv_wrapper.sh lammps --migration-net lammps --native --migration-net | |
- name: "Build Lulesh" | |
run: ./bin/inv_wrapper.sh lulesh lulesh --native | |
- name: "Build TensorFlow" | |
run: ./bin/inv_wrapper.sh tensorflow | |
- name: "Build PolyBench/C" | |
run: ./bin/inv_wrapper.sh polybench polybench --native | |
- name: "Build functions used in the tests" | |
run: ./bin/inv_wrapper.sh func.tests | |
- name: "Get CPP/Python commits" | |
id: submodule-commit | |
run: | | |
apt install -y zstd | |
git config --global --add safe.directory "$GITHUB_WORKSPACE" | |
echo "cpp-commit=$(git submodule status ./cpp | cut '-d ' -f 2)" >> $GITHUB_OUTPUT | |
echo "py-commit=$(git submodule status ./python | cut '-d ' -f 2)" >> $GITHUB_OUTPUT | |
# Also move to a different path to restore from | |
mv /usr/local/faasm/wasm ./wasm | |
# If we are here we _always_ want to overwrite the cache | |
- name: "Prepare WASM cache" | |
uses: actions/cache/[email protected] | |
if: always() | |
with: | |
path: ./wasm | |
key: wasm-${{ steps.submodule-commit.outputs.cpp-commit }}-${{ steps.submodule-commit.outputs.py-commit }} | |
run-examples-faasmctl: | |
needs: [build-examples] | |
if: | |
always() && | |
!cancelled() && | |
github.event.pull_request.draft == false && | |
(needs.build-examples.result == 'success' || needs.build-examples.result == 'skipped') | |
runs-on: ubuntu-latest | |
strategy: | |
fail-fast: false | |
matrix: | |
faasm_wasm_vm: [wavm, wamr] | |
defaults: | |
run: | |
shell: bash | |
env: | |
CONAN_CACHE_MOUNT_SOURCE: ~/.conan | |
FAASM_INI_FILE: ./faasm.ini | |
FAASM_VERSION: 0.20.1 | |
FAASM_WASM_VM: ${{ matrix.faasm_wasm_vm }} | |
steps: | |
- uses: csegarragonz/set-compose-version-action@main | |
with: | |
compose-version: "2.22.0" | |
# A regular `faasmctl` deployment pulls a lot of docker images, so we | |
# may run out of disk space | |
- name: "Maximize build space" | |
uses: easimon/maximize-build-space@master | |
with: | |
# Leave 25 GB for the / partition for docker images (stored under | |
# /var/lib/docker) | |
root-reserve-mb: 25600 | |
remove-android: 'true' | |
remove-codeql: 'true' | |
remove-docker-images: 'true' | |
remove-dotnet: 'true' | |
remove-haskell: 'true' | |
- name: "Checkout code" | |
uses: actions/checkout@v4 | |
- name: "Install faasmctl" | |
run: pip3 install $(cat ./requirements.txt | grep faasmctl | tr -d '\n') | |
- name: "Start a Faasm cluster to run the examples" | |
run: faasmctl deploy.compose --workers=2 | |
# This can fail when the container isn't ready, so we want to retry | |
- name: "Wait for upload server to be available" | |
run: | | |
(echo "Attempt 1" && faasmctl cli.faasm --cmd "./deploy/local/wait_for_upload.sh upload 8002") || \ | |
(echo "Attempt 2" && faasmctl cli.faasm --cmd "./deploy/local/wait_for_upload.sh upload 8002") || \ | |
(echo "Attempt 3" && faasmctl cli.faasm --cmd "./deploy/local/wait_for_upload.sh upload 8002") || \ | |
(echo "Wait for upload failed after retries" && faasmctl logs -s upload && exit 1) | |
- name: "Get CPP/Python commits" | |
id: submodule-commit | |
run: | | |
sudo apt install -y zstd | |
git config --global --add safe.directory "$GITHUB_WORKSPACE" | |
git submodule update --init ./cpp | |
git submodule update --init ./python | |
echo "cpp-commit=$(git submodule status ./cpp | cut '-d ' -f 2)" >> $GITHUB_OUTPUT | |
echo "py-commit=$(git submodule status ./python | cut '-d ' -f 2)" >> $GITHUB_OUTPUT | |
- name: "Get WASM cache" | |
uses: actions/cache/[email protected] | |
id: cpp-wasm-cache | |
with: | |
path: ./wasm | |
key: wasm-${{ steps.submodule-commit.outputs.cpp-commit }}-${{ steps.submodule-commit.outputs.py-commit }} | |
fail-on-cache-miss: true | |
- name: "Upload all WASM files to the cluster" | |
run: ./bin/inv_wrapper.sh wasm.upload | |
- name: "Run MPI kernels" | |
# TODO: MPI kernels still not run in WAMR because there's a seg. fault | |
# with the `exit` syscall | |
if: "contains(env.FAASM_WASM_VM, 'wavm')" | |
timeout-minutes: 2 | |
run: | | |
# The global MPI kernel stopped working when enabling SIMD | |
# faasmctl invoke kernels-mpi global --cmdline '10 1024' | |
faasmctl invoke kernels-mpi p2p --cmdline '10 1024 1024' --mpi-world-size 4 | |
faasmctl invoke kernels-mpi sparse --cmdline '10 10 5' --mpi-world-size 4 | |
faasmctl invoke kernels-mpi transpose --cmdline '10 1024 32' --mpi-world-size 4 | |
faasmctl invoke kernels-mpi stencil --cmdline '10 1000' --mpi-world-size 4 | |
# The dgemm MPI kernel does not work because we are missing | |
# implementations for MPI_Comm_group, MPI_Group_incl, and MPI_Comm_create | |
# faasmctl invoke kernels-mpi dgemm --cmdline '10 1024 32 1' --mpi-world-size 4 | |
faasmctl invoke kernels-mpi nstream --cmdline '10 1024 32' --mpi-world-size 4 | |
faasmctl invoke kernels-mpi reduce --cmdline '10 1024' --mpi-world-size 4 | |
# The random MPI kernel does not work because we are missing | |
# implementations for MPI_Alltoallv | |
# faasmctl invoke kernels-mpi random --cmdline '32 20' --mpi-world-size 4 | |
- name: "Run OpenMP kernels" | |
if: "contains(env.FAASM_WASM_VM, 'wavm')" | |
timeout-minutes: 2 | |
run: | | |
faasmctl invoke kernels-omp global --cmdline '2 10 1024' | |
faasmctl invoke kernels-omp p2p --cmdline '2 10 1024 1024' | |
# The sparse OpenMP kernel fails during the result integrity checks | |
# faasmctl invoke kernels-omp sparse --cmdline '2 10 10 5' | |
# The transpose OpenMP kernel can not be cross-compiled due to problems | |
# with the static_for signature and symbol definition | |
# faasmctl invoke kernels-omp transpose --cmdline '10 1024 32' | |
# The stencil OpenMP kernel can not be cross-compiled due to a problem | |
# with the faasm_sm_reduce signature | |
# faasmctl invoke kernels-omp stencil --cmdline '10 1000' | |
faasmctl invoke kernels-omp dgemm --cmdline '2 2 1024 32' | |
faasmctl invoke kernels-omp nstream --cmdline '2 10 1024 32' | |
faasmctl invoke kernels-omp reduce --cmdline '2 10 1024' | |
# The random OpenMP kernel can not be cross-compiled due to a problem | |
# with the faasm_sm_reduce signature | |
# faasmctl invoke kernels-omp random --cmdline '32 20' | |
- name: "Run PolyBench/C" | |
timeout-minutes: 2 | |
# We deliberately enumerate all the supported functions here and | |
# execute them individually, rather than using the microbench runner. | |
# This is so that we can more easily track what functions are supported | |
# and what functions are not | |
run: | | |
faasmctl invoke polybench poly_covariance | |
faasmctl invoke polybench poly_correlation | |
faasmctl invoke polybench poly_2mm | |
faasmctl invoke polybench poly_3mm | |
faasmctl invoke polybench poly_atax | |
faasmctl invoke polybench poly_bicg | |
faasmctl invoke polybench poly_doitgen | |
faasmctl invoke polybench poly_mvt | |
faasmctl invoke polybench poly_cholesky | |
faasmctl invoke polybench poly_durbin | |
faasmctl invoke polybench poly_gramschmidt | |
faasmctl invoke polybench poly_lu | |
faasmctl invoke polybench poly_ludcmp | |
faasmctl invoke polybench poly_trisolv | |
faasmctl invoke polybench poly_deriche | |
faasmctl invoke polybench poly_floyd-warshall | |
faasmctl invoke polybench poly_nussinov | |
faasmctl invoke polybench poly_adi | |
faasmctl invoke polybench poly_fdtd-2d | |
faasmctl invoke polybench poly_heat-3d | |
faasmctl invoke polybench poly_jacobi-1d | |
faasmctl invoke polybench poly_jacobi-2d | |
faasmctl invoke polybench poly_seidel-2d | |
- name: "Run ImageMagick" | |
if: "contains(env.FAASM_WASM_VM, 'wavm')" | |
timeout-minutes: 1 | |
run: faasmctl invoke imagemagick main --cmdline 'faasm://im/sample_image.png -flip faasm://im/image_out.png' | |
- name: "Run LAMMPS" | |
timeout-minutes: 1 | |
run: faasmctl invoke lammps main --cmdline '-in faasm://lammps-data/in.controller.wall' --mpi-world-size 4 | |
# Note that the migration experiment does not migrate, it just checks the binary | |
- name: "Run LAMMPS migration binary" | |
timeout-minutes: 1 | |
run: faasmctl invoke lammps migration --cmdline '-in faasm://lammps-data/in.controller.wall' --mpi-world-size 4 --input-data '1 2' | |
- name: "Run LAMMPS migration-net binary" | |
timeout-minutes: 1 | |
run: faasmctl invoke lammps migration-net --cmdline '-in faasm://lammps-data/in.controller.wall' --mpi-world-size 4 --input-data '1 2' | |
# 08/12/2023 - LULESH is broken with a memory leak | |
# - name: "Run LULESH" | |
# timeout-minutes: 1 | |
# if: "contains(env.FAASM_WASM_VM, 'wavm')" | |
# run: faasmctl invoke lulesh main --cmdline '-i 5 -s 20 -r 11 -c 1 -b 1' --input-data '4' | |
- name: "Run TFlite check" | |
timeout-minutes: 1 | |
if: "contains(env.FAASM_WASM_VM, 'wavm')" | |
run: faasmctl invoke tf check | |
- name: "Run FFmpeg check" | |
timeout-minutes: 1 | |
run: faasmctl invoke ffmpeg check |