llama.cpp/.devops/nix/sif.nix

{
  lib,
  singularity-tools,
  llama-cpp,
  bashInteractive,
  interactive ? false,
}:

let
    optionalInt = cond: x: if cond then x else 0;
in
singularity-tools.buildImage rec {
  inherit (llama-cpp) name;
  contents = [ llama-cpp ] ++ lib.optionals interactive [ bashInteractive ];

  # These are excessive (but safe) for most variants. Building singularity
  # images requires superuser privileges, so we build them inside a VM in a
  # writable image of pre-determined size.
  #
  # ROCm is currently affected by https://github.com/NixOS/nixpkgs/issues/276846
  #
  # Expected image sizes:
  # - cpu/blas: 150M,
  # - cuda, all gencodes: 560M,
  diskSize = 4096 + optionalInt llama-cpp.useRocm 16384;
  memSize = diskSize;
}
nix: init singularity and docker images (#5056) Exposes a few attributes demonstrating how to build [singularity](https://docs.sylabs.io/guides/latest/user-guide/)/[apptainer](https://apptainer.org/) and Docker images re-using llama.cpp's Nix expression. Built locally on `x86_64-linux` with `nix build github:someoneserge/llama.cpp/feat/nix/images#llamaPackages.{docker,docker-min,sif,llama-cpp}` and it's fast and effective. 2024-02-22 20:44:10 +01:00			`{`
			`lib,`
			`singularity-tools,`
			`llama-cpp,`
			`bashInteractive,`
			`interactive ? false,`
			`}:`

			`let`
			`optionalInt = cond: x: if cond then x else 0;`
			`in`
			`singularity-tools.buildImage rec {`
			`inherit (llama-cpp) name;`
			`contents = [ llama-cpp ] ++ lib.optionals interactive [ bashInteractive ];`

			`# These are excessive (but safe) for most variants. Building singularity`
			`# images requires superuser privileges, so we build them inside a VM in a`
			`# writable image of pre-determined size.`
			`#`
			`# ROCm is currently affected by https://github.com/NixOS/nixpkgs/issues/276846`
			`#`
			`# Expected image sizes:`
			`# - cpu/blas: 150M,`
			`# - cuda, all gencodes: 560M,`
			`diskSize = 4096 + optionalInt llama-cpp.useRocm 16384;`
			`memSize = diskSize;`
			`}`