Update server-llm.sh

This commit is contained in:
Olivier Chafik 2024-06-07 11:52:40 +01:00
parent af8f0169da
commit 0dba58269f

View File

@@ -380,13 +380,13 @@ fi
if [[ "$backend" == "cuda" ]]; then if [[ "$backend" == "cuda" ]]; then
printf "[+] Building with CUDA backend\n" printf "[+] Building with CUDA backend\n"
LLAMA_CUDA=1 make -j server $log LLAMA_CUDA=1 make -j llama-server $log
elif [[ "$backend" == "cpu" ]]; then elif [[ "$backend" == "cpu" ]]; then
printf "[+] Building with CPU backend\n" printf "[+] Building with CPU backend\n"
make -j server $log make -j llama-server $log
elif [[ "$backend" == "metal" ]]; then elif [[ "$backend" == "metal" ]]; then
printf "[+] Building with Metal backend\n" printf "[+] Building with Metal backend\n"
make -j server $log make -j llama-server $log
else else
printf "[-] Unknown backend: %s\n" "$backend" printf "[-] Unknown backend: %s\n" "$backend"
exit 1 exit 1
@@ -413,6 +413,6 @@ if [[ $verbose -eq 1 ]]; then
args="$args --verbose" args="$args --verbose"
fi fi
./server -m "../$wfile" --host 0.0.0.0 --port "$port" -c $n_kv -np "$n_parallel" $args ./llama-server -m "../$wfile" --host 0.0.0.0 --port "$port" -c $n_kv -np "$n_parallel" $args
exit 0 exit 0