# llama.cpp/.devops/full-cuda.Dockerfile

# CUDA toolkit release; keep it generally in line with the container host's environment.
ARG CUDA_VERSION=12.6.0
# Ubuntu release named in the base image tag.
ARG UBUNTU_VERSION=22.04
# CUDA development (devel) image that the build stage starts from.
ARG BASE_CUDA_DEV_CONTAINER=nvidia/cuda:${CUDA_VERSION}-devel-ubuntu${UBUNTU_VERSION}

FROM ${BASE_CUDA_DEV_CONTAINER} AS build

# CUDA architecture(s) to compile for; "default" means no explicit
# architecture list is handed to CMake.
ARG CUDA_DOCKER_ARCH=default

# Install the compiler toolchain, CMake, Python/pip, git and the curl/OpenMP
# libraries. The apt package index is deleted in the same layer so it is not
# carried in the image; removing it in a later RUN would not shrink the image.
# Recommended packages are still installed on purpose, to keep the installed
# package set unchanged.
RUN apt-get update && \
    apt-get install -y \
        build-essential \
        cmake \
        git \
        libcurl4-openssl-dev \
        libgomp1 \
        python3 \
        python3-pip && \
    rm -rf /var/lib/apt/lists/*

# Copy only the requirement files first, so the dependency layer below can be
# cached independently of the rest of the source tree (copied later).
COPY requirements.txt   requirements.txt
COPY requirements       requirements

# --no-cache-dir keeps pip's download/wheel cache out of the image layer.
RUN pip install --no-cache-dir --upgrade pip setuptools wheel \
    && pip install --no-cache-dir -r requirements.txt

WORKDIR /app

# Bring the whole build context into the working directory.
COPY . ./

# Configure and compile with CUDA and curl support, then place the built
# binaries next to the sources in /app. An explicit architecture list is only
# passed to CMake when CUDA_DOCKER_ARCH is something other than "default".
RUN case "${CUDA_DOCKER_ARCH}" in \
        default) ;; \
        *) export CMAKE_ARGS="-DCMAKE_CUDA_ARCHITECTURES=${CUDA_DOCKER_ARCH}" ;; \
    esac && \
    cmake -B build \
        -DGGML_NATIVE=OFF \
        -DGGML_CUDA=ON \
        -DLLAMA_CURL=ON \
        ${CMAKE_ARGS} \
        -DCMAKE_EXE_LINKER_FLAGS=-Wl,--allow-shlib-undefined \
        . && \
    cmake --build build --config Release -j "$(nproc)" && \
    cp build/bin/* ./

# Containers start through the tools.sh script shipped in the copied sources.
ENTRYPOINT ["/app/.devops/tools.sh"]
docker : add support for CUDA in docker (#1461) Co-authored-by: canardleteer <eris.has.a.dad+github@gmail.com> Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> 2023-07-07 20:25:25 +02:00			`ARG UBUNTU_VERSION=22.04`
			`# This needs to generally match the container host's environment.`
docker : update CUDA images (#9213) 2024-08-28 13:20:36 +02:00			`ARG CUDA_VERSION=12.6.0`
docker : add support for CUDA in docker (#1461) Co-authored-by: canardleteer <eris.has.a.dad+github@gmail.com> Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> 2023-07-07 20:25:25 +02:00			`# Target the CUDA build image`
			`ARG BASE_CUDA_DEV_CONTAINER=nvidia/cuda:${CUDA_VERSION}-devel-ubuntu${UBUNTU_VERSION}`

build : Fix docker build warnings (#8535) (#8537) 2024-07-17 20:21:55 +02:00			`FROM ${BASE_CUDA_DEV_CONTAINER} AS build`
docker : add support for CUDA in docker (#1461) Co-authored-by: canardleteer <eris.has.a.dad+github@gmail.com> Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> 2023-07-07 20:25:25 +02:00
docker : update CUDA images (#9213) 2024-08-28 13:20:36 +02:00			`# CUDA architecture to build for (defaults to all supported archs)`
			`ARG CUDA_DOCKER_ARCH=default`
docker : add support for CUDA in docker (#1461) Co-authored-by: canardleteer <eris.has.a.dad+github@gmail.com> Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> 2023-07-07 20:25:25 +02:00
			`RUN apt-get update && \`
docker : update CUDA images (#9213) 2024-08-28 13:20:36 +02:00			`apt-get install -y build-essential cmake python3 python3-pip git libcurl4-openssl-dev libgomp1`
docker : add support for CUDA in docker (#1461) Co-authored-by: canardleteer <eris.has.a.dad+github@gmail.com> Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> 2023-07-07 20:25:25 +02:00
python : add check-requirements.sh and GitHub workflow (#4585) * python: add check-requirements.sh and GitHub workflow This script and workflow forces package versions to remain compatible across all convert.py scripts, while allowing secondary convert scripts to import dependencies not wanted in convert.py. Move requirements into ./requirements * Fail on "==" being used for package requirements (but can be suppressed) * Enforce "compatible release" syntax instead of == * Update workflow * Add upper version bound for transformers and protobuf * improve check-requirements.sh * small syntax change * don't remove venvs if nocleanup is passed * See if this fixes docker workflow * Move check-requirements.sh into ./scripts/ --------- Co-authored-by: Jared Van Bortel <jared@nomic.ai> 2023-12-29 15:50:29 +01:00			`COPY requirements.txt requirements.txt`
			`COPY requirements requirements`
docker : add support for CUDA in docker (#1461) Co-authored-by: canardleteer <eris.has.a.dad+github@gmail.com> Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> 2023-07-07 20:25:25 +02:00
			`RUN pip install --upgrade pip setuptools wheel \`
			`&& pip install -r requirements.txt`

			`WORKDIR /app`

			`COPY . .`

docker : update CUDA images (#9213) 2024-08-28 13:20:36 +02:00			`# Use the default CUDA archs if not specified`
			`RUN if [ "${CUDA_DOCKER_ARCH}" != "default" ]; then \`
			`export CMAKE_ARGS="-DCMAKE_CUDA_ARCHITECTURES=${CUDA_DOCKER_ARCH}"; \`
			`fi && \`
docker: use GGML_NATIVE=OFF (#10368) 2024-11-18 00:21:53 +01:00			`cmake -B build -DGGML_NATIVE=OFF -DGGML_CUDA=ON -DLLAMA_CURL=ON ${CMAKE_ARGS} -DCMAKE_EXE_LINKER_FLAGS=-Wl,--allow-shlib-undefined . && \`
docker : fix missing binaries in full-cuda image (#9278) 2024-09-02 18:11:13 +02:00			`cmake --build build --config Release -j$(nproc) && \`
docker : update CUDA images (#9213) 2024-08-28 13:20:36 +02:00			`cp build/bin/* .`
docker : add support for CUDA in docker (#1461) Co-authored-by: canardleteer <eris.has.a.dad+github@gmail.com> Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> 2023-07-07 20:25:25 +02:00
			`ENTRYPOINT ["/app/.devops/tools.sh"]`