From 247678afc7c74c98f64e8d19f67355d128946974 Mon Sep 17 00:00:00 2001
From: Ben Sima
Date: Thu, 10 Aug 2023 21:11:23 -0400
Subject: Add llama-cpp and exllama

---
 Biz/Bild/Deps/llama-cpp.nix | 51 +++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 51 insertions(+)
 create mode 100644 Biz/Bild/Deps/llama-cpp.nix

(limited to 'Biz/Bild/Deps/llama-cpp.nix')

diff --git a/Biz/Bild/Deps/llama-cpp.nix b/Biz/Bild/Deps/llama-cpp.nix
new file mode 100644
index 0000000..85bd778
--- /dev/null
+++ b/Biz/Bild/Deps/llama-cpp.nix
@@ -0,0 +1,51 @@
+# Builds llama.cpp from the pinned sources.llama-cpp checkout with the server,
+# MPI, shared-library and cuBLAS CMake options enabled.
+{ stdenv
+, pkgs # not referenced in this file; kept so the argument list is unchanged
+, sources
+, python3
+, cmake
+, pkgconfig # NOTE(review): newer nixpkgs spell this pkg-config; confirm the pin
+, openmpi
+, cudaPackages
+}:
+let
+  # Python with numpy and sentencepiece, substituted into ./*.py by postPatch.
+  llama-python = python3.withPackages (ps: with ps; [ numpy sentencepiece ]);
+in stdenv.mkDerivation {
+  # pname + version instead of a bare name: with name set explicitly,
+  # version would not become part of the derivation name.
+  pname = "llama.cpp";
+  version = sources.llama-cpp.rev;
+
+  src = sources.llama-cpp;
+
+  # Replace the bundle resource lookup in ggml-metal.m with the fixed path
+  # $out/bin/ggml-metal.metal, and point the /usr/bin/env python references in
+  # the top-level *.py files at llama-python.
+  postPatch = ''
+    substituteInPlace ./ggml-metal.m \
+      --replace '[bundle pathForResource:@"ggml-metal" ofType:@"metal"];' "@\"$out/bin/ggml-metal.metal\";"
+    substituteInPlace ./*.py --replace '/usr/bin/env python' '${llama-python}/bin/python'
+  '';
+
+  nativeBuildInputs = [ cmake pkgconfig ];
+  buildInputs = [ openmpi cudaPackages.cudatoolkit ];
+
+  cmakeFlags = [
+    "-DLLAMA_BUILD_SERVER=ON"
+    "-DLLAMA_MPI=ON"
+    "-DBUILD_SHARED_LIBS=ON"
+    "-DCMAKE_SKIP_BUILD_RPATH=ON"
+    "-DLLAMA_CUBLAS=ON"
+  ];
+
+  # Give the generically named main and server binaries llama-prefixed names.
+  postInstall = ''
+    mv $out/bin/main $out/bin/llama
+    mv $out/bin/server $out/bin/llama-server
+  '';
+
+  # Matches the main binary as renamed in postInstall.
+  meta.mainProgram = "llama";
+}
-- 
cgit v1.2.3