From 247678afc7c74c98f64e8d19f67355d128946974 Mon Sep 17 00:00:00 2001
From: Ben Sima <ben@bsima.me>
Date: Thu, 10 Aug 2023 21:11:23 -0400
Subject: Add llama-cpp and exllama

---
 Biz/Bild/Deps/llama-cpp.nix | 41 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 41 insertions(+)
 create mode 100644 Biz/Bild/Deps/llama-cpp.nix

(limited to 'Biz/Bild/Deps/llama-cpp.nix')

diff --git a/Biz/Bild/Deps/llama-cpp.nix b/Biz/Bild/Deps/llama-cpp.nix
new file mode 100644
index 0000000..85bd778
--- /dev/null
+++ b/Biz/Bild/Deps/llama-cpp.nix
@@ -0,0 +1,41 @@
+# llama.cpp from the pinned sources, built with server, MPI and cuBLAS enabled.
+{ stdenv
+, pkgs # not referenced in this file; kept so existing call sites still work
+, sources
+, python3
+, cmake
+, pkgconfig
+, openmpi
+, cudaPackages
+}:
+let
+  llama-python = python3.withPackages (ps: with ps; [ numpy sentencepiece ]);
+in stdenv.mkDerivation {
+  pname = "llama.cpp"; # pname + version => derivation name "llama.cpp-<rev>"
+  version = sources.llama-cpp.rev;
+  src = sources.llama-cpp;
+
+  # Hard-code the Metal shader path and run the *.py scripts with llama-python.
+  postPatch = ''
+    substituteInPlace ./ggml-metal.m \
+      --replace '[bundle pathForResource:@"ggml-metal" ofType:@"metal"];' "@\"$out/bin/ggml-metal.metal\";"
+    substituteInPlace ./*.py --replace '/usr/bin/env python' '${llama-python}/bin/python'
+  '';
+
+  nativeBuildInputs = [ cmake pkgconfig ];
+  buildInputs = [ openmpi cudaPackages.cudatoolkit ];
+  cmakeFlags = [
+    "-DLLAMA_BUILD_SERVER=ON"
+    "-DLLAMA_MPI=ON"
+    "-DBUILD_SHARED_LIBS=ON"
+    "-DCMAKE_SKIP_BUILD_RPATH=ON"
+    "-DLLAMA_CUBLAS=ON"
+  ];
+
+  # Rename the generically named installed binaries to llama-specific names.
+  postInstall = ''
+    mv $out/bin/main $out/bin/llama
+    mv $out/bin/server $out/bin/llama-server
+  '';
+  meta.mainProgram = "llama"; # must match the renamed `main` binary above
+}
-- 
cgit v1.2.3