mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-23 18:09:18 +01:00
f482bb2e49
* llama: llama_split_prefix fix strncpy does not include string termination common: llama_load_model_from_url: - fix header name case sensitive - support downloading additional split in parallel - hide password in url * common: EOL EOF * common: remove redundant LLAMA_CURL_MAX_PATH_LENGTH definition * common: change max url max length * common: minor comment * server: support HF URL options * llama: llama_model_loader fix log * common: use a constant for max url length * common: clean up curl if file cannot be loaded in gguf * server: tests: add split tests, and HF options params * common: move llama_download_hide_password_in_url inside llama_download_file as a lambda * server: tests: enable back Release test on PR * spacing Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> * spacing Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> * spacing Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> --------- Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
155 lines
4.6 KiB
YAML
155 lines
4.6 KiB
YAML
# Server build and tests
name: Server

on:
  # Manual trigger from the Actions UI. The caller has to state explicitly
  # whether the slow test suite should run as well.
  workflow_dispatch:
    inputs:
      slow_tests:
        description: "Run slow tests"
        required: true
        type: boolean

  # Pushes to master that touch this workflow, the build files, the
  # C/C++/CUDA/Swift/Objective-C sources or the server test suite.
  push:
    branches: [master]
    paths:
      - '.github/workflows/server.yml'
      - '**/CMakeLists.txt'
      - '**/Makefile'
      - '**/*.h'
      - '**/*.hpp'
      - '**/*.c'
      - '**/*.cpp'
      - '**/*.cu'
      - '**/*.swift'
      - '**/*.m'
      - 'examples/server/tests/**.*'

  # Pull requests, filtered by the same path list as pushes.
  pull_request:
    types:
      - opened
      - synchronize
      - reopened
    paths:
      - '.github/workflows/server.yml'
      - '**/CMakeLists.txt'
      - '**/Makefile'
      - '**/*.h'
      - '**/*.hpp'
      - '**/*.c'
      - '**/*.cpp'
      - '**/*.cu'
      - '**/*.swift'
      - '**/*.m'
      - 'examples/server/tests/**.*'

  # Daily run at minute 0 of hour 0.
  schedule:
    - cron: '0 0 * * *'
|
|
|
|
# Runs are grouped per workflow name and git ref; when a new run starts in a
# group, the run still in progress for that group is cancelled.
concurrency:
  cancel-in-progress: true
  group: "${{ github.workflow }}-${{ github.ref }}"
|
|
|
|
jobs:
|
|
# Linux job (an entry of the workflow's `jobs` mapping): builds the server
# target inside an Ubuntu container and runs the integration tests against it.
server:
  runs-on: ubuntu-latest

  strategy:
    # Let the other matrix entries finish when one of them fails
    # (kept while -DLLAMA_SANITIZE_THREAD=ON is broken).
    fail-fast: false
    matrix:
      # TODO: temporary disabled due to linux kernel issues
      # sanitizer: [ADDRESS, THREAD, UNDEFINED]
      sanitizer:
        - UNDEFINED
      build_type:
        - Debug
      include:
        # Additional Release entry with an empty sanitizer value.
        - build_type: Release
          sanitizer: ''

  container:
    image: ubuntu:latest
    ports:
      - 8888
    options: --cpus 4

  steps:
    - name: Clone
      id: checkout
      uses: actions/checkout@v3
      with:
        fetch-depth: 0

    - name: Dependencies
      id: depends
      run: |
        apt-get update
        apt-get -y install \
          build-essential \
          git \
          cmake \
          python3-pip \
          wget \
          language-pack-en \
          libcurl4-openssl-dev

    # The sanitizer flag is assembled from the matrix value; for the Release
    # entry (empty sanitizer) it expands to -DLLAMA_SANITIZE_=ON.
    - name: Build
      id: cmake_build
      run: |
        mkdir build
        cd build
        cmake .. \
          -DLLAMA_NATIVE=OFF \
          -DLLAMA_BUILD_SERVER=ON \
          -DLLAMA_CURL=ON \
          -DCMAKE_BUILD_TYPE=${{ matrix.build_type }} \
          -DLLAMA_SANITIZE_${{ matrix.sanitizer }}=ON ;
        cmake --build . --config ${{ matrix.build_type }} -j $(nproc) --target server

    - name: Tests dependencies
      id: test_dependencies
      run: pip install -r examples/server/tests/requirements.txt

    # A matrix entry can opt out of pull-request runs by setting
    # `disabled_on_pr`; none of the entries defined in this job sets it.
    - name: Tests
      id: server_integration_tests
      if: ${{ !matrix.disabled_on_pr || !github.event.pull_request }}
      run: |
        cd examples/server/tests
        PORT=8888 ./tests.sh

    # Slow suite: Release entry only, and only for scheduled runs or manual
    # runs started with the `slow_tests` input set to true.
    - name: Slow tests
      id: server_integration_tests_slow
      if: ${{ (github.event.schedule || github.event.inputs.slow_tests == 'true') && matrix.build_type == 'Release' }}
      run: |
        cd examples/server/tests
        PORT=8888 ./tests.sh --stop --no-skipped --no-capture --tags slow
|
|
|
|
|
|
# Windows job (an entry of the workflow's `jobs` mapping): builds the server
# target in Release configuration against a downloaded libcurl package and
# runs the behave test suite with behave.exe.
#
# This job defines no `strategy.matrix`, so its step conditions must not
# depend on the `matrix` context: every `matrix.*` lookup is empty here and a
# comparison such as `matrix.build_type == 'Release'` can never be true.
server-windows:
  runs-on: windows-latest

  steps:
    - name: Clone
      id: checkout
      uses: actions/checkout@v3
      with:
        fetch-depth: 0

    # Download the curl package for CURL_VERSION and unpack it into
    # $RUNNER_TEMP/libcurl (the archive's top-level directory is stripped).
    - name: libCURL
      id: get_libcurl
      env:
        # Quoted so the version can never be read as anything but a string.
        CURL_VERSION: '8.6.0_6'
      run: |
        curl.exe -o $env:RUNNER_TEMP/curl.zip -L "https://curl.se/windows/dl-${env:CURL_VERSION}/curl-${env:CURL_VERSION}-win64-mingw.zip"
        mkdir $env:RUNNER_TEMP/libcurl
        tar.exe -xvf $env:RUNNER_TEMP/curl.zip --strip-components=1 -C $env:RUNNER_TEMP/libcurl

    # Configure with the import library and headers unpacked by the libCURL step.
    - name: Build
      id: cmake_build
      run: |
        mkdir build
        cd build
        cmake .. -DLLAMA_CURL=ON -DCURL_LIBRARY="$env:RUNNER_TEMP/libcurl/lib/libcurl.dll.a" -DCURL_INCLUDE_DIR="$env:RUNNER_TEMP/libcurl/include"
        cmake --build . --config Release -j ${env:NUMBER_OF_PROCESSORS} --target server

    - name: Python setup
      id: setup_python
      uses: actions/setup-python@v5
      with:
        python-version: '3.11'

    - name: Tests dependencies
      id: test_dependencies
      run: |
        pip install -r examples/server/tests/requirements.txt

    # Place the libcurl DLL in the Release output directory of the build.
    - name: Copy Libcurl
      id: prepare_libcurl
      run: |
        cp $env:RUNNER_TEMP/libcurl/bin/libcurl-x64.dll ./build/bin/Release/libcurl-x64.dll

    # Runs on every trigger: there is no matrix entry that could disable it.
    - name: Tests
      id: server_integration_tests
      run: |
        cd examples/server/tests
        behave.exe --summary --stop --no-capture --exclude 'issues|wrong_usages|passkey' --tags llama.cpp

    # Slow suite: only for scheduled runs or manual runs started with the
    # `slow_tests` input set to true. No build-type check is needed because
    # the Build step of this job always uses the Release configuration.
    - name: Slow tests
      id: server_integration_tests_slow
      if: ${{ github.event.schedule || github.event.inputs.slow_tests == 'true' }}
      run: |
        cd examples/server/tests
        behave.exe --stop --no-skipped --no-capture --tags slow
|