diff options
author | Ben Sima <ben@bsima.me> | 2024-10-25 02:10:20 -0400 |
---|---|---|
committer | Ben Sima <ben@bsima.me> | 2024-12-21 10:06:48 -0500 |
commit | 8ceebbdb53ea5c67310a5281c30f53c9cf504d70 (patch) | |
tree | 17ef6c8bbe37959202ff3a77401f255573336dd1 /Biz/Bild/Deps | |
parent | 9293fd18d4df5383bb596fabbc6a0f2f7a46923e (diff) |
Use newer ollama in system service
Ollama releases often, and nixos-24.05 ships a very old version, which was
preventing me from doing work. Here I'm overlaying the newer nixos-unstable
package set onto the 24.05 version so I can pull in newer versions as needed.
Diffstat (limited to 'Biz/Bild/Deps')
-rw-r--r-- | Biz/Bild/Deps/ollama.nix | 193 |
1 file changed, 0 insertions, 193 deletions
diff --git a/Biz/Bild/Deps/ollama.nix b/Biz/Bild/Deps/ollama.nix deleted file mode 100644 index 72e31f7..0000000 --- a/Biz/Bild/Deps/ollama.nix +++ /dev/null @@ -1,193 +0,0 @@ -# This was cribbed from an open pull request: https://github.com/NixOS/nixpkgs/pull/309330 -{ lib, buildGo122Module, fetchFromGitHub, fetchpatch, buildEnv, linkFarm -, overrideCC, makeWrapper, stdenv, nixosTests - -, pkgs, cmake, gcc12, clblast, libdrm, rocmPackages, cudaPackages, linuxPackages -, darwin - -, testers, ollama - -, config -# one of `[ null false "rocm" "cuda" ]` -, acceleration ? null }: - -let - pname = "ollama"; - # don't forget to invalidate all hashes each update - version = "0.1.33"; - - src = fetchFromGitHub { - owner = "jmorganca"; - repo = "ollama"; - rev = "v${version}"; - hash = "sha256-+iZIuHr90d5OijrXl6kzPycsHmx5XnKAKKOtppycjsk="; - fetchSubmodules = true; - }; - vendorHash = "sha256-7x/n60WiKmwHFFuN0GfzkibUREvxAXNHcD3fHmihZvs="; - # ollama's patches of llama.cpp's example server - # `ollama/llm/generate/gen_common.sh` -> "apply temporary patches until fix is upstream" - # each update, these patches should be synchronized with the contents of `ollama/llm/patches/` - llamacppPatches = [ - (preparePatch "02-clip-log.diff" - "sha256-rMWbl3QgrPlhisTeHwD7EnGRJyOhLB4UeS7rqa0tdXM=") - (preparePatch "03-load_exception.diff" - "sha256-1DfNahFYYxqlx4E4pwMKQpL+XR0bibYnDFGt6dCL4TM=") - (preparePatch "04-metal.diff" - "sha256-Ne8J9R8NndUosSK0qoMvFfKNwqV5xhhce1nSoYrZo7Y=") - ]; - - preparePatch = patch: hash: - fetchpatch { - url = "file://${src}/llm/patches/${patch}"; - inherit hash; - stripLen = 1; - extraPrefix = "llm/llama.cpp/"; - }; - - accelIsValid = builtins.elem acceleration [ null false "rocm" "cuda" ]; - validateFallback = lib.warnIf (config.rocmSupport && config.cudaSupport) - (lib.concatStrings [ - "both `nixpkgs.config.rocmSupport` and `nixpkgs.config.cudaSupport` are enabled, " - "but they are mutually exclusive; falling back to cpu" - ]) (!(config.rocmSupport && 
config.cudaSupport)); - validateLinux = api: - (lib.warnIfNot stdenv.isLinux - "building ollama with `${api}` is only supported on linux; falling back to cpu" - stdenv.isLinux); - shouldEnable = assert accelIsValid; - mode: fallback: - ((acceleration == mode) - || (fallback && acceleration == null && validateFallback)) - && (validateLinux mode); - - enableRocm = shouldEnable "rocm" config.rocmSupport; - enableCuda = shouldEnable "cuda" config.cudaSupport; - - rocmClang = linkFarm "rocm-clang" { llvm = rocmPackages.llvm.clang; }; - rocmPath = buildEnv { - name = "rocm-path"; - paths = [ - rocmPackages.clr - rocmPackages.hipblas - rocmPackages.rocblas - rocmPackages.rocsolver - rocmPackages.rocsparse - rocmPackages.rocm-device-libs - rocmClang - ]; - }; - - cudaToolkit = buildEnv { - name = "cuda-toolkit"; - ignoreCollisions = - true; # FIXME: find a cleaner way to do this without ignoring collisions - paths = [ - cudaPackages.cudatoolkit - cudaPackages.cuda_cudart - cudaPackages.cuda_cudart.static - ]; - }; - - runtimeLibs = lib.optionals enableRocm [ rocmPackages.rocm-smi ] - ++ lib.optionals enableCuda [ linuxPackages.nvidia_x11 ]; - - appleFrameworks = darwin.apple_sdk_11_0.frameworks; - metalFrameworks = [ - appleFrameworks.Accelerate - appleFrameworks.Metal - appleFrameworks.MetalKit - appleFrameworks.MetalPerformanceShaders - ]; - - goBuild = if enableCuda then - buildGo122Module.override { stdenv = overrideCC stdenv gcc12; } - else - buildGo122Module; - inherit (lib) licenses platforms maintainers; -in goBuild ((lib.optionalAttrs enableRocm { - ROCM_PATH = rocmPath; - CLBlast_DIR = "${clblast}/lib/cmake/CLBlast"; -}) // (lib.optionalAttrs enableCuda { - CUDA_LIB_DIR = "${cudaToolkit}/lib"; - CUDACXX = "${cudaToolkit}/bin/nvcc"; - CUDAToolkit_ROOT = cudaToolkit; -}) // { - inherit pname version src vendorHash; - - nativeBuildInputs = [ cmake ] - ++ lib.optionals enableRocm [ rocmPackages.llvm.bintools ] - ++ lib.optionals (enableRocm || enableCuda) [ 
makeWrapper ] - ++ lib.optionals stdenv.isDarwin metalFrameworks; - - buildInputs = lib.optionals enableRocm [ - rocmPackages.clr - rocmPackages.hipblas - rocmPackages.rocblas - rocmPackages.rocsolver - rocmPackages.rocsparse - libdrm - ] ++ lib.optionals enableCuda [ cudaPackages.cuda_cudart ] - ++ lib.optionals stdenv.isDarwin metalFrameworks; - - patches = [ - # disable uses of `git` in the `go generate` script - # ollama's build script assumes the source is a git repo, but nix removes the git directory - # this also disables necessary patches contained in `ollama/llm/patches/` - # those patches are added to `llamacppPatches`, and reapplied here in the patch phase - (fetchpatch { - url = - "https://raw.githubusercontent.com/NixOS/nixpkgs/70998b85f2dd9b48faa474134678277a03dfa107/pkgs/by-name/ol/ollama/disable-git.patch"; - hash = "sha256-7DthNfvk4VACdJb5L+4n9JmFzQn9qqDP2N4Hwuuhtgg="; - }) - ] ++ llamacppPatches; - postPatch = '' - # replace inaccurate version number with actual release version - substituteInPlace version/version.go --replace-fail 0.0.0 '${version}' - ''; - preBuild = '' - # disable uses of `git`, since nix removes the git directory - export OLLAMA_SKIP_PATCHING=true - # build llama.cpp libraries for ollama - go generate ./... 
- ''; - postFixup = '' - # the app doesn't appear functional at the moment, so hide it - mv "$out/bin/app" "$out/bin/.ollama-app" - '' + lib.optionalString (enableRocm || enableCuda) '' - # expose runtime libraries necessary to use the gpu - mv "$out/bin/ollama" "$out/bin/.ollama-unwrapped" - makeWrapper "$out/bin/.ollama-unwrapped" "$out/bin/ollama" ${ - lib.optionalString enableRocm "--set-default HIP_PATH '${rocmPath}' " - } \ - --suffix LD_LIBRARY_PATH : '/run/opengl-driver/lib:${ - lib.makeLibraryPath runtimeLibs - }' - ''; - - ldflags = [ - "-s" - "-w" - "-X=github.com/jmorganca/ollama/version.Version=${version}" - "-X=github.com/jmorganca/ollama/server.mode=release" - ]; - - passthru.tests = { - service = nixosTests.ollama; - rocm = pkgs.ollama.override { acceleration = "rocm"; }; - cuda = pkgs.ollama.override { acceleration = "cuda"; }; - version = testers.testVersion { - inherit version; - package = ollama; - }; - }; - - meta = { - description = "Get up and running with large language models locally"; - homepage = "https://github.com/ollama/ollama"; - changelog = "https://github.com/ollama/ollama/releases/tag/v${version}"; - license = licenses.mit; - platforms = platforms.unix; - mainProgram = "ollama"; - maintainers = with maintainers; [ abysssol dit7ya elohmeier ]; - }; -}) |