# Package expression for koboldcpp.
#
# Acceleration backends (OpenBLAS, cuBLAS, CLBlast, Vulkan, Metal) are toggled
# through the `*Support` arguments; each one adds the matching libraries to
# `buildInputs` and the matching `LLAMA_*=1` flag to `makeFlags`.
{
  lib,
  fetchFromGitHub,
  stdenv,
  makeWrapper,
  gitUpdater,
  python3Packages,
  python311Packages ? null, # Ignored. Kept for compatibility with the release
  tk,
  addDriverRunpath,

  darwin,

  # When false, the bundled kcpp_docs.embd and klite.embd files are removed
  # from the output.
  koboldLiteSupport ? true,

  config,
  cudaPackages ? { },

  openblasSupport ? !stdenv.isDarwin,
  openblas,

  cublasSupport ? config.cudaSupport,
  # You can find a full list here: https://arnon.dk/matching-sm-architectures-arch-and-gencode-for-various-nvidia-cards/
  # For example, if you're on a GTX 1080 that means you're using "Pascal"
  # (compute capability 6.1) and you need to pass "sm_61".
  # Only the first entry of the list is used.
  cudaArches ? cudaPackages.cudaFlags.realArches or [ ],

  clblastSupport ? stdenv.isLinux,
  clblast,
  ocl-icd,

  vulkanSupport ? true,
  vulkan-loader,

  metalSupport ? stdenv.isDarwin && stdenv.isAarch64,

  # Deprecated: kept for compatibility only, a warning is emitted when set.
  march ? "",
  mtune ? "",
}:

let
  # Yields [ "<option>=1" ] when `enabled` is true and [ ] otherwise, so that
  # disabled backends contribute nothing (not even an empty string) to makeFlags.
  makeFlag = option: enabled: lib.optional enabled "${option}=1";

  # Extra makeWrapper arguments exposing the driver library directory at
  # runtime. Gated on `cublasSupport` (which defaults to `config.cudaSupport`)
  # so that the wrapper always matches the backend that was actually built.
  libraryPathWrapperArgs = lib.optionalString cublasSupport ''
    --prefix LD_LIBRARY_PATH : "${lib.makeLibraryPath [ addDriverRunpath.driverLink ]}"
  '';

  darwinFrameworks =
    if (stdenv.isDarwin && stdenv.isx86_64) then
      darwin.apple_sdk.frameworks
    else
      darwin.apple_sdk_11_0.frameworks;

  # Use the CUDA backend stdenv whenever the cuBLAS backend is enabled.
  effectiveStdenv = if cublasSupport then cudaPackages.backendStdenv else stdenv;

  # Architecture handed to the Makefile through CUDA_DOCKER_ARCH. Only
  # evaluated when cublasSupport is enabled; fails with a descriptive message
  # instead of an opaque "list index out of bounds" error.
  cudaArch =
    if cudaArches == [ ] then
      throw "koboldcpp: cublasSupport is enabled but cudaArches is empty; pass e.g. cudaArches = [ \"sm_61\" ]"
    else
      builtins.head cudaArches;
in
effectiveStdenv.mkDerivation (finalAttrs: {
  pname = "koboldcpp";
  version = "1.71.1";

  src = fetchFromGitHub {
    owner = "LostRuins";
    repo = "koboldcpp";
    rev = "refs/tags/v${finalAttrs.version}";
    hash = "sha256-69iqpXzG9NXrqv08lJ36hlHWXwXUJs6yqcaGr32cHPw=";
  };

  enableParallelBuilding = true;

  nativeBuildInputs = [
    makeWrapper
    python3Packages.wrapPython
  ];

  # Python modules shared between buildInputs and pythonPath.
  pythonInputs = builtins.attrValues { inherit (python3Packages) tkinter customtkinter packaging; };

  buildInputs =
    [ tk ]
    ++ finalAttrs.pythonInputs
    ++ lib.optionals effectiveStdenv.isDarwin [
      darwinFrameworks.Accelerate
      darwinFrameworks.CoreVideo
      darwinFrameworks.CoreGraphics
      darwinFrameworks.CoreServices
    ]
    ++ lib.optionals metalSupport [
      darwinFrameworks.MetalKit
      darwinFrameworks.Foundation
      darwinFrameworks.MetalPerformanceShaders
    ]
    ++ lib.optionals openblasSupport [ openblas ]
    ++ lib.optionals cublasSupport [
      cudaPackages.libcublas
      cudaPackages.cuda_nvcc
      cudaPackages.cuda_cudart
      cudaPackages.cuda_cccl
    ]
    ++ lib.optionals clblastSupport [
      clblast
      ocl-icd
    ]
    ++ lib.optionals vulkanSupport [ vulkan-loader ];

  pythonPath = finalAttrs.pythonInputs;

  darwinLdFlags = lib.optionals stdenv.isDarwin [
    "-F${darwinFrameworks.CoreServices}/Library/Frameworks"
    "-F${darwinFrameworks.Accelerate}/Library/Frameworks"
    "-framework CoreServices"
    "-framework Accelerate"
  ];

  metalLdFlags = lib.optionals metalSupport [
    "-F${darwinFrameworks.Foundation}/Library/Frameworks"
    "-F${darwinFrameworks.Metal}/Library/Frameworks"
    "-framework Foundation"
    "-framework Metal"
  ];

  env.NIX_LDFLAGS = lib.concatStringsSep " " (finalAttrs.darwinLdFlags ++ finalAttrs.metalLdFlags);

  # Joined with a space so that setting both `march` and `mtune` yields two
  # separate compiler flags rather than one fused "-march=X-mtune=Y" token.
  # `lib.optional` is lazy in its element, so each warning only fires when the
  # corresponding argument is actually set.
  env.NIX_CFLAGS_COMPILE = lib.concatStringsSep " " (
    lib.optional (march != "") (
      lib.warn "koboldcpp: the march argument is only kept for compatibility; use overrideAttrs instead" "-march=${march}"
    )
    ++ lib.optional (mtune != "") (
      lib.warn "koboldcpp: the mtune argument is only kept for compatibility; use overrideAttrs instead" "-mtune=${mtune}"
    )
  );

  makeFlags =
    makeFlag "LLAMA_OPENBLAS" openblasSupport
    ++ makeFlag "LLAMA_CUBLAS" cublasSupport
    ++ makeFlag "LLAMA_CLBLAST" clblastSupport
    ++ makeFlag "LLAMA_VULKAN" vulkanSupport
    ++ makeFlag "LLAMA_METAL" metalSupport
    ++ lib.optionals cublasSupport [ "CUDA_DOCKER_ARCH=${cudaArch}" ];

  installPhase = ''
    runHook preInstall

    mkdir -p "$out/bin"

    install -Dm755 koboldcpp.py "$out/bin/koboldcpp.unwrapped"
    cp *.so "$out/bin"
    cp *.embd "$out/bin"

    ${lib.optionalString (!koboldLiteSupport) ''
      rm "$out/bin/kcpp_docs.embd"
      rm "$out/bin/klite.embd"
    ''}

    runHook postInstall
  '';

  # Remove an unused argument, mainly intended for Darwin to reduce warnings
  postPatch = ''
    substituteInPlace Makefile \
      --replace-warn " -s " " "
  '';

  # Wrap the Python entry point, then add a `koboldcpp` launcher that puts tk
  # on PATH and, for cuBLAS builds, the driver libraries on LD_LIBRARY_PATH.
  postFixup = ''
    wrapPythonProgramsIn "$out/bin" "$pythonPath"
    makeWrapper "$out/bin/koboldcpp.unwrapped" "$out/bin/koboldcpp" \
      --prefix PATH : ${lib.makeBinPath [ tk ]} ${libraryPathWrapperArgs}
  '';

  passthru.updateScript = gitUpdater { rev-prefix = "v"; };

  meta = {
    description = "Way to run various GGML and GGUF models";
    license = lib.licenses.agpl3Only;
    maintainers = with lib.maintainers; [
      maxstrid
      donteatoreo
    ];
    mainProgram = "koboldcpp";
    platforms = lib.platforms.unix;
  };
})