diff --git a/rllm/rllm-cuda/server.sh b/rllm/rllm-cuda/server.sh
index 3c6ca131..73c1caf9 100755
--- a/rllm/rllm-cuda/server.sh
+++ b/rllm/rllm-cuda/server.sh
@@ -41,6 +41,42 @@ while [ "$1" != "" ] ; do
                 exit 1
             fi
             ;;
+        # SYCL build variants (llama.cpp only).  Feature lists are written
+        # bare, without embedded \" characters: quotes stored inside a
+        # variable survive expansion as literal text (assuming $VER is later
+        # expanded unquoted onto the build command line - TODO confirm).
+        --sycl )
+            if [ "$CPP" = 1 ] ; then
+                VER="$VER --features sycl"
+            else
+                echo "--sycl only valid for llama.cpp"
+                exit 1
+            fi
+            ;;
+        --sycl-fp16 )
+            if [ "$CPP" = 1 ] ; then
+                VER="$VER --features sycl,sycl-fp16"
+            else
+                echo "--sycl-fp16 only valid for llama.cpp"
+                exit 1
+            fi
+            ;;
+        --sycl-nvidia )
+            if [ "$CPP" = 1 ] ; then
+                VER="$VER --features sycl,sycl-nvidia"
+            else
+                echo "--sycl-nvidia only valid for llama.cpp"
+                exit 1
+            fi
+            ;;
+        --sycl-nvidia-fp16 )
+            if [ "$CPP" = 1 ] ; then
+                VER="$VER --features sycl,sycl-nvidia,sycl-fp16"
+            else
+                echo "--sycl-nvidia-fp16 only valid for llama.cpp"
+                exit 1
+            fi
+            ;;
         --trace )
             R_LOG=info,tokenizers=error,rllm=trace,aicirt=info,llama_cpp_low=trace
             ;;
@@ -84,7 +120,7 @@ if [ "$CPP" = 1 ] ; then
         * )
             SELF="server.sh"
             cat <