# chore: cortex.llamacpp v0.1.4 (#2) — CI quality-gate workflow for cortex-cpp
# Quality gate for cortex-cpp: builds and packages the engine across the full
# OS / instruction-set / CUDA matrix, and runs the e2e suite on one
# representative configuration per OS (run-e2e: true).
name: CI Quality Gate Cortex CPP

# Triggered by PR activity touching cortex-cpp sources, or manually.
on:
  pull_request:
    types: [opened, synchronize, reopened]
    paths:
      - "cortex-cpp/**"
  workflow_dispatch:

env:
  # Small models so the e2e run stays fast; overridable per-run if needed.
  LLM_MODEL_URL: https://delta.jan.ai/tinyllama-1.1b-chat-v0.3.Q2_K.gguf
  EMBEDDING_MODEL_URL: https://catalog.jan.ai/dist/models/embeds/nomic-embed-text-v1.5.f16.gguf

jobs:
  build-and-test:
    runs-on: ${{ matrix.runs-on }}
    timeout-minutes: 40
    strategy:
      # Keep all matrix legs running even if one fails, so a single broken
      # variant doesn't hide failures in the others.
      fail-fast: false
      matrix:
        include:
          - os: "linux"
            name: "amd64-avx2"
            runs-on: "ubuntu-18-04"
            cmake-flags: "-DLLAMA_AVX2=ON -DLLAMA_NATIVE=OFF"
            run-e2e: true
          - os: "linux"
            name: "amd64-avx"
            runs-on: "ubuntu-18-04"
            cmake-flags: "-DLLAMA_AVX2=OFF -DLLAMA_NATIVE=OFF"
            run-e2e: false
          - os: "linux"
            name: "amd64-avx512"
            runs-on: "ubuntu-18-04"
            cmake-flags: "-DLLAMA_AVX512=ON -DLLAMA_NATIVE=OFF"
            run-e2e: false
          - os: "linux"
            name: "amd64-vulkan"
            runs-on: "ubuntu-18-04-cuda-11-7"
            cmake-flags: "-DLLAMA_VULKAN=ON -DLLAMA_NATIVE=OFF"
            run-e2e: false
          - os: "linux"
            name: "amd64-cuda-11-7"
            runs-on: "ubuntu-18-04-cuda-11-7"
            cmake-flags: "-DCUDA_11_7=ON -DLLAMA_NATIVE=OFF -DLLAMA_CUDA=ON"
            run-e2e: false
          - os: "linux"
            name: "amd64-cuda-12-0"
            runs-on: "ubuntu-18-04-cuda-12-0"
            cmake-flags: "-DCUDA_12_0=ON -DLLAMA_NATIVE=OFF -DLLAMA_CUDA=ON"
            run-e2e: false
          - os: "mac"
            name: "amd64"
            runs-on: "macos-13"
            cmake-flags: ""
            run-e2e: true
          - os: "mac"
            name: "arm64"
            runs-on: "mac-silicon"
            cmake-flags: "-DMAC_ARM64=ON"
            run-e2e: true
          - os: "windows"
            name: "amd64-avx2"
            runs-on: "windows-latest"
            cmake-flags: "-DLLAMA_AVX2=ON -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_BLAS=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: true
          - os: "windows"
            name: "amd64-avx"
            runs-on: "windows-latest"
            cmake-flags: "-DLLAMA_AVX2=OFF -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_BLAS=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
          - os: "windows"
            name: "amd64-avx512"
            runs-on: "windows-latest"
            cmake-flags: "-DLLAMA_AVX512=ON -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_BLAS=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
          - os: "windows"
            name: "amd64-vulkan"
            runs-on: "windows-latest"
            cmake-flags: "-DLLAMA_VULKAN=ON -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
          - os: "windows"
            name: "amd64-avx2-cuda-12-0"
            runs-on: "windows-cuda-12-0"
            cmake-flags: "-DLLAMA_AVX2=ON -DLLAMA_NATIVE=OFF -DCUDA_12_0=ON -DLLAMA_BUILD_SERVER=ON -DLLAMA_CUDA=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
          - os: "windows"
            name: "amd64-avx-cuda-12-0"
            runs-on: "windows-cuda-12-0"
            cmake-flags: "-DLLAMA_AVX2=OFF -DLLAMA_NATIVE=OFF -DCUDA_12_0=ON -DLLAMA_BUILD_SERVER=ON -DLLAMA_CUDA=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
          - os: "windows"
            name: "amd64-avx512-cuda-12-0"
            runs-on: "windows-cuda-12-0"
            cmake-flags: "-DLLAMA_AVX512=ON -DLLAMA_NATIVE=OFF -DCUDA_12_0=ON -DLLAMA_BUILD_SERVER=ON -DLLAMA_CUDA=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
          - os: "windows"
            name: "amd64-avx2-cuda-11-7"
            runs-on: "windows-cuda-11-7"
            cmake-flags: "-DLLAMA_AVX2=ON -DLLAMA_NATIVE=OFF -DCUDA_11_7=ON -DLLAMA_BUILD_SERVER=ON -DLLAMA_CUDA=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
          - os: "windows"
            name: "amd64-avx-cuda-11-7"
            runs-on: "windows-cuda-11-7"
            cmake-flags: "-DLLAMA_AVX2=OFF -DLLAMA_NATIVE=OFF -DCUDA_11_7=ON -DLLAMA_BUILD_SERVER=ON -DLLAMA_CUDA=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
          - os: "windows"
            name: "amd64-avx512-cuda-11-7"
            runs-on: "windows-cuda-11-7"
            cmake-flags: "-DLLAMA_AVX512=ON -DLLAMA_NATIVE=OFF -DCUDA_11_7=ON -DLLAMA_BUILD_SERVER=ON -DLLAMA_CUDA=ON -DBUILD_SHARED_LIBS=OFF -DCMAKE_BUILD_TYPE=RELEASE"
            run-e2e: false
    steps:
      - name: Clone
        id: checkout
        # v4 — v3 runs on the deprecated Node 16 runtime.
        uses: actions/checkout@v4
        with:
          submodules: recursive

      - name: Install choco on Windows
        if: runner.os == 'Windows'
        run: |
          choco install make -y

      - name: Build
        run: |
          cd cortex-cpp
          make build CMAKE_EXTRA_FLAGS="${{ matrix.cmake-flags }}"

      - name: Pre-package
        run: |
          cd cortex-cpp
          make pre-package

      - name: Package
        run: |
          cd cortex-cpp
          make package

      # e2e runs only on the representative leg per OS (run-e2e: true).
      - name: Run e2e testing
        if: ${{ matrix.run-e2e }}
        run: |
          cd cortex-cpp
          make run-e2e-test RUN_TESTS=true LLM_MODEL_URL=${{ env.LLM_MODEL_URL }} EMBEDDING_MODEL_URL=${{ env.EMBEDDING_MODEL_URL }}

      - name: Upload Artifact
        # v4 — upload-artifact v1/v2 were disabled by GitHub on 2024-06-30;
        # artifact names are unique per matrix leg, as v4 requires.
        uses: actions/upload-artifact@v4
        with:
          name: cortex-cpp-${{ matrix.os }}-${{ matrix.name }}
          path: ./cortex-cpp/cortex-cpp