depot/third_party/nixpkgs/pkgs/by-name/lo/local-ai/package.nix

# Arguments of the package function: generic build helpers and libraries
# first, then feature toggles (`enable_*` / `with_*`). Each `with_*` toggle is
# followed by the packages that the body only uses when that toggle is set.
# NOTE(review): `fetchpatch` is not referenced anywhere in the visible body.
{ config
, callPackages
, stdenv
, lib
, addDriverRunpath
, fetchpatch
, fetchFromGitHub
, protobuf
, grpc
, openssl
, llama-cpp
  # needed for audio-to-text
, ffmpeg
, cmake
, pkg-config
, buildGoModule
, makeWrapper

  # apply feature parameter names according to
  # https://github.com/NixOS/rfcs/pull/169

  # CPU extensions
  # (forwarded as cmake switches to the llama.cpp, whisper.cpp and ncnn builds)
, enable_avx ? true
, enable_avx2 ? true
, enable_avx512 ? stdenv.hostPlatform.avx512Support
, enable_f16c ? true
, enable_fma ? true

  # BLAS backends: at most one of with_openblas / with_cublas / with_clblas
  # may be true (asserted where BUILD_TYPE is computed).
, with_openblas ? false
, openblas

  # follows the nixpkgs-wide `config.cudaSupport` setting by default
, with_cublas ? config.cudaSupport
, cudaPackages

, with_clblas ? false
, clblast
, ocl-icd
, opencl-headers

, with_tinydream ? false # do not compile with cublas
, ncnn

, with_stablediffusion ? true
, opencv

, with_tts ? true
, onnxruntime
, sonic
, spdlog
, fmt
, espeak-ng
, piper-tts
}:
let
  # Value passed to the Makefiles as BUILD_TYPE=...: the name of the selected
  # BLAS backend, or the empty string when none is enabled.
  BUILD_TYPE =
    # The backends are mutually exclusive, so at most one of the three
    # fragments below is non-empty.
    assert (lib.count lib.id [ with_openblas with_cublas with_clblas ]) <= 1;
    lib.optionalString with_openblas "openblas"
    + lib.optionalString with_cublas "cublas"
    + lib.optionalString with_clblas "clblas";

  # CUDA components; every use below is guarded by `with_cublas`.
  inherit (cudaPackages) libcublas cuda_nvcc cuda_cccl cuda_cudart cudatoolkit;

  # Builds the `libbinding.a` make target of go-skynet/go-llama.cpp for the
  # selected BUILD_TYPE. The output is a copy of the build tree without the
  # `build` and `CMakeFiles` directories and without object files.
  go-llama-ggml = effectiveStdenv.mkDerivation {
    name = "go-llama-ggml";

    src = fetchFromGitHub {
      repo = "go-llama.cpp";
      owner = "go-skynet";
      fetchSubmodules = true;
      rev = "2b57a8ae43e4699d3dc5d1496a1ccd42922993be";
      hash = "sha256-D6SEg5pPcswGyKAmF4QTJP6/Y1vjRr7m7REguag+too=";
    };

    # cmake is on the tool path, but its configure hook is switched off; the
    # default make-based build phase runs with the flags below.
    dontUseCmakeConfigure = true;

    nativeBuildInputs = [ cmake ]
      # backward compatibility with nixos-23.11
      # use cuda_nvcc after release of nixos-24.05
      ++ lib.optionals with_cublas [ cudatoolkit ];

    buildInputs = lib.concatLists [
      (lib.optionals with_clblas [ clblast ocl-icd opencl-headers ])
      (lib.optionals with_openblas [ openblas.dev ])
    ];

    buildFlags = [
      "libbinding.a"
      "BUILD_TYPE=${BUILD_TYPE}"
    ];

    installPhase = ''
      mkdir $out
      tar cf - --exclude=build --exclude=CMakeFiles --exclude="*.o" . \
        | tar xf - -C $out
    '';
  };

  # nixpkgs' llama-cpp, rebuilt from a pinned llama.cpp revision with
  # LocalAI's gRPC server added as an extra example target.
  #
  # `${src}` inside postPatch is the LocalAI source bound further down in this
  # let block (the attribute set is not `rec`), not the llama.cpp source.
  #
  # The `or` fallbacks keep evaluation working if the base llama-cpp package
  # stops defining one of the overridden attributes; when the attribute is
  # present the result is unchanged.
  llama-cpp-grpc = (llama-cpp.overrideAttrs (final: prev: {
    name = "llama-cpp-grpc";
    src = fetchFromGitHub {
      owner = "ggerganov";
      repo = "llama.cpp";
      rev = "1b67731e184e27a465b8c5476061294a4af668ea";
      hash = "sha256-0WWbsklpW6HhFRkvWpYh8Lhi8VIansS/zmyIKNQRkIs=";
      fetchSubmodules = true;
    };
    # Copies LocalAI's backend/cpp/llama into examples/grpc-server together
    # with the llava sources and backend.proto, registers the directory in
    # examples/CMakeLists.txt and appends an install rule for the target.
    postPatch = (prev.postPatch or "") + ''
      cd examples
      cp -r --no-preserve=mode ${src}/backend/cpp/llama grpc-server
      cp llava/clip.* llava/llava.* grpc-server
      printf "\nadd_subdirectory(grpc-server)" >> CMakeLists.txt

      cp ${src}/backend/backend.proto grpc-server
      sed -i grpc-server/CMakeLists.txt \
        -e '/get_filename_component/ s;[.\/]*backend/;;' \
        -e '$a\install(TARGETS ''${TARGET} RUNTIME)'
      cd ..
    '';
    cmakeFlags = (prev.cmakeFlags or [ ]) ++ [
      (lib.cmakeBool "BUILD_SHARED_LIBS" false)
      (lib.cmakeBool "LLAMA_AVX" enable_avx)
      (lib.cmakeBool "LLAMA_AVX2" enable_avx2)
      (lib.cmakeBool "LLAMA_AVX512" enable_avx512)
      (lib.cmakeBool "LLAMA_FMA" enable_fma)
      (lib.cmakeBool "LLAMA_F16C" enable_f16c)
    ];
    buildInputs = (prev.buildInputs or [ ]) ++ [
      protobuf # provides also abseil_cpp as propagated build input
      grpc
      openssl
    ];
  })).override {
    # Map this package's backend toggles onto llama-cpp's own switches.
    cudaSupport = with_cublas;
    rocmSupport = false;
    openclSupport = with_clblas;
    blasSupport = with_openblas;
  };

  # Builds the `libgpt4all.a` target of the Go bindings in nomic-ai/gpt4all.
  # The output is a copy of the build tree without `CMakeFiles` directories.
  gpt4all = stdenv.mkDerivation {
    name = "gpt4all";
    src = fetchFromGitHub {
      owner = "nomic-ai";
      repo = "gpt4all";
      rev = "27a8b020c36b0df8f8b82a252d261cda47cf44b8";
      hash = "sha256-djq1eK6ncvhkO3MNDgasDBUY/7WWcmZt/GJsHAulLdI=";
      fetchSubmodules = true;
    };
    # One list element per make argument. The former single string
    # "-C gpt4all-bindings/golang" only worked because the list is flattened
    # to a whitespace-split string; as separate elements it stays correct if
    # the flags are ever passed as a real array (structured attrs).
    makeFlags = [ "-C" "gpt4all-bindings/golang" ];
    buildFlags = [ "libgpt4all.a" ];
    # cmake is on the tool path only; its configure hook is disabled.
    dontUseCmakeConfigure = true;
    nativeBuildInputs = [ cmake ];
    installPhase = ''
      mkdir $out
      tar cf - --exclude=CMakeFiles . \
        | tar xf - -C $out
    '';
  };

  # espeak-ng built with cmake from the `espeak` directory of the go-piper
  # source, as a shared library with the optional features switched off.
  # The base package's patches, preConfigure and postInstall are dropped.
  espeak-ng' = espeak-ng.overrideAttrs (prev: {
    name = "espeak-ng'";

    inherit (go-piper) src;
    sourceRoot = "source/espeak";

    patches = [ ];
    preConfigure = null;
    postInstall = null;

    nativeBuildInputs = [ cmake ];

    cmakeFlags = (prev.cmakeFlags or [ ])
      ++ [ (lib.cmakeBool "BUILD_SHARED_LIBS" true) ]
      # every optional espeak-ng feature is disabled
      ++ map (feature: lib.cmakeBool feature false) [
        "USE_ASYNC"
        "USE_MBROLA"
        "USE_LIBPCAUDIO"
        "USE_KLATT"
        "USE_SPEECHPLAYER"
        "USE_LIBSONIC"
      ]
      ++ [ (lib.cmakeBool "CMAKE_POSITION_INDEPENDENT_CODE" true) ];
  });

  # piper-phonemize built from the `piper-phonemize` directory of the go-piper
  # source against the local espeak-ng' and onnxruntime.
  piper-phonemize = stdenv.mkDerivation {
    name = "piper-phonemize";

    inherit (go-piper) src;
    sourceRoot = "source/piper-phonemize";

    nativeBuildInputs = [ cmake pkg-config ];
    buildInputs = [ espeak-ng' onnxruntime ];

    # Point the cmake build at the prebuilt dependencies.
    cmakeFlags = [
      (lib.cmakeFeature "ONNXRUNTIME_DIR" "${onnxruntime.dev}")
      (lib.cmakeFeature "ESPEAK_NG_DIR" "${espeak-ng'}")
    ];

    # Expose the espeak-ng variant this build was linked against.
    passthru = {
      espeak-ng = espeak-ng';
    };
  };

  # piper-tts built from the `piper` directory of the go-piper source against
  # the local piper-phonemize. postInstall additionally keeps the compiled
  # piper.o and sorts the installed files into bin/ and lib/.
  piper-tts' = (piper-tts.override { inherit piper-phonemize; }).overrideAttrs (_: {
    name = "piper-tts'";

    inherit (go-piper) src;
    sourceRoot = "source/piper";

    # Unset the base package's installPhase
    # (presumably so that the default install phase runs - TODO confirm).
    installPhase = null;

    postInstall = ''
      cp CMakeFiles/piper.dir/src/cpp/piper.cpp.o $out/piper.o
      cd $out
      mkdir bin lib
      mv lib*so* lib/
      mv piper piper_phonemize bin/
      rm -rf cmake pkgconfig espeak-ng-data *.ort
    '';
  });

  # Builds the `libpiper_binding.a` target of mudler/go-piper.
  # The output holds the pristine source, the piper-phonemize `share`
  # directory under piper-phonemize/pi, and the static libraries built here.
  go-piper = stdenv.mkDerivation {
    name = "go-piper";

    src = fetchFromGitHub {
      repo = "go-piper";
      owner = "mudler";
      fetchSubmodules = true;
      rev = "9d0100873a7dbb0824dfea40e8cec70a1b110759";
      hash = "sha256-Yv9LQkWwGpYdOS0FvtP0vZ0tRyBAx27sdmziBR4U4n8=";
    };

    buildInputs = [ piper-tts' espeak-ng' piper-phonemize sonic fmt spdlog onnxruntime ];

    # Overlay the prebuilt piper-tts' output onto the unpacked source tree.
    postUnpack = ''
      cp -r --no-preserve=mode ${piper-tts'}/* source
    '';

    # Append -DSPDLOG_FMT_EXTERNAL=1 to the Makefile's CXXFLAGS assignment.
    postPatch = ''
      sed -i Makefile \
        -e '/CXXFLAGS *= / s;$; -DSPDLOG_FMT_EXTERNAL=1;'
    '';

    buildFlags = [ "libpiper_binding.a" ];

    installPhase = ''
      cp -r --no-preserve=mode $src $out
      mkdir -p $out/piper-phonemize/pi
      cp -r --no-preserve=mode ${piper-phonemize}/share $out/piper-phonemize/pi
      cp *.a $out
    '';
  };

  # Builds the `librwkv.a` target of donomii/go-rwkv.cpp. The output is the
  # pristine source plus the static libraries produced by the build.
  go-rwkv = stdenv.mkDerivation {
    name = "go-rwkv";

    src = fetchFromGitHub {
      repo = "go-rwkv.cpp";
      owner = "donomii";
      fetchSubmodules = true;
      rev = "661e7ae26d442f5cfebd2a0881b44e8c55949ec6";
      hash = "sha256-byTNZQSnt7qpBMng3ANJmpISh3GJiz+F15UqfXaz6nQ=";
    };

    # cmake is on the tool path only; its configure hook is disabled.
    nativeBuildInputs = [ cmake ];
    dontUseCmakeConfigure = true;

    buildFlags = [ "librwkv.a" ];

    installPhase = ''
      cp -r --no-preserve=mode $src $out
      cp *.a $out
    '';
  };

  # try to merge with openai-whisper-cpp in future
  #
  # Static cmake build of ggerganov/whisper.cpp with the selected BLAS backend
  # and CPU extensions; the binaries from the build's bin/ directory are
  # installed as well.
  whisper-cpp = effectiveStdenv.mkDerivation {
    name = "whisper-cpp";

    src = fetchFromGitHub {
      repo = "whisper.cpp";
      owner = "ggerganov";
      rev = "8f253ef3af1c62c04316ba4afa7145fc4d701a8c";
      hash = "sha256-yHHjhpQIn99A/hqFwAb7TfTf4Q9KnKat93zyXS70bT8=";
    };

    nativeBuildInputs = [ cmake pkg-config ]
      ++ lib.optionals with_cublas [ cuda_nvcc ];

    buildInputs = lib.concatLists [
      (lib.optionals with_cublas [ cuda_cccl cuda_cudart libcublas ])
      (lib.optionals with_clblas [ clblast ocl-icd opencl-headers ])
      (lib.optionals with_openblas [ openblas.dev ])
    ];

    cmakeFlags = [
      # BLAS backend selection
      (lib.cmakeBool "WHISPER_CUDA" with_cublas)
      (lib.cmakeBool "WHISPER_CLBLAST" with_clblas)
      (lib.cmakeBool "WHISPER_OPENBLAS" with_openblas)
      # CPU extensions: the cmake options are opt-out, hence the negation
      (lib.cmakeBool "WHISPER_NO_AVX" (!enable_avx))
      (lib.cmakeBool "WHISPER_NO_AVX2" (!enable_avx2))
      (lib.cmakeBool "WHISPER_NO_FMA" (!enable_fma))
      (lib.cmakeBool "WHISPER_NO_F16C" (!enable_f16c))
      (lib.cmakeBool "BUILD_SHARED_LIBS" false)
    ];

    postInstall = ''
      install -Dt $out/bin bin/*
    '';
  };

  # Builds the `libgobert.a` target of go-skynet/go-bert.cpp. The output is
  # the pristine source plus the static libraries produced by the build.
  go-bert = stdenv.mkDerivation {
    name = "go-bert";

    src = fetchFromGitHub {
      repo = "go-bert.cpp";
      owner = "go-skynet";
      fetchSubmodules = true;
      rev = "6abe312cded14042f6b7c3cd8edf082713334a4d";
      hash = "sha256-lh9cvXc032Eq31kysxFOkRd0zPjsCznRl0tzg9P2ygo=";
    };

    # cmake is on the tool path only; its configure hook is disabled.
    nativeBuildInputs = [ cmake ];
    dontUseCmakeConfigure = true;

    env.NIX_CFLAGS_COMPILE = "-Wformat";

    buildFlags = [ "libgobert.a" ];

    installPhase = ''
      cp -r --no-preserve=mode $src $out
      cp *.a $out
    '';
  };

  # Builds the `libstablediffusion.a` target of mudler/go-stable-diffusion
  # against opencv. The output is a copy of the build tree without
  # `CMakeFiles`, object files and shared objects.
  go-stable-diffusion = stdenv.mkDerivation {
    name = "go-stable-diffusion";

    src = fetchFromGitHub {
      repo = "go-stable-diffusion";
      owner = "mudler";
      fetchSubmodules = true;
      rev = "362df9da29f882dbf09ade61972d16a1f53c3485";
      hash = "sha256-A5KvMZOviPsIpPHxM8cacT+qE2x1iFJAbPsRs4sLijY=";
    };

    # cmake is on the tool path only; its configure hook is disabled.
    nativeBuildInputs = [ cmake ];
    dontUseCmakeConfigure = true;

    buildInputs = [ opencv ];
    # Add opencv's include/opencv4 directory to the compiler's system include path.
    env.NIX_CFLAGS_COMPILE = " -isystem ${opencv}/include/opencv4";

    buildFlags = [ "libstablediffusion.a" ];

    installPhase = ''
      mkdir $out
      tar cf - --exclude=CMakeFiles --exclude="*.o" --exclude="*.so" --exclude="*.so.*" . \
        | tar xf - -C $out
    '';
  };

  # ncnn built from the `ncnn` directory of the go-tiny-dream source as a
  # static library, without OpenMP and Vulkan, with the configured CPU
  # extensions.
  go-tiny-dream-ncnn = ncnn.overrideAttrs (prev: {
    name = "go-tiny-dream-ncnn";

    inherit (go-tiny-dream) src;
    sourceRoot = "source/ncnn";

    cmakeFlags = prev.cmakeFlags
      ++ map (option: lib.cmakeBool option false) [
        "NCNN_SHARED_LIB"
        "NCNN_OPENMP"
        "NCNN_VULKAN"
      ]
      ++ [
        (lib.cmakeBool "NCNN_AVX" enable_avx)
        (lib.cmakeBool "NCNN_AVX2" enable_avx2)
        (lib.cmakeBool "NCNN_AVX512" enable_avx512)
        (lib.cmakeBool "NCNN_FMA" enable_fma)
        (lib.cmakeBool "NCNN_F16C" enable_f16c)
      ];
  });

  # Builds the `libtinydream.a` target of M0Rf30/go-tiny-dream. The bundled
  # ncnn directory is replaced by the libraries and headers of
  # go-tiny-dream-ncnn. The output is a copy of the build tree without
  # object files.
  go-tiny-dream = effectiveStdenv.mkDerivation {
    name = "go-tiny-dream";

    src = fetchFromGitHub {
      repo = "go-tiny-dream";
      owner = "M0Rf30";
      fetchSubmodules = true;
      rev = "22a12a4bc0ac5455856f28f3b771331a551a4293";
      hash = "sha256-DAVHD6E0OKHf4C2ldoI0Mm7813DIrmWFONUhSCQPCfc=";
    };

    # Put the prebuilt ncnn lib/ and include/ contents where the Makefile
    # presumably expects an in-tree ncnn build (ncnn/build/src).
    postUnpack = ''
      rm -rf source/ncnn
      mkdir -p source/ncnn/build/src
      cp -r --no-preserve=mode ${go-tiny-dream-ncnn}/lib/. ${go-tiny-dream-ncnn}/include/. source/ncnn/build/src
    '';

    buildFlags = [ "libtinydream.a" ];

    installPhase = ''
      mkdir $out
      tar cf - --exclude="*.o" . \
        | tar xf - -C $out
    '';

    # Marked broken when the compiler of this derivation's stdenv is older
    # than version 13.
    meta.broken = lib.versionOlder go-tiny-dream.stdenv.cc.version "13";
  };

  # Go build tags for the optional features that are enabled; exported to the
  # build as a space-separated GO_TAGS environment variable.
  GO_TAGS = lib.concatLists [
    (lib.optional with_tinydream "tinydream")
    (lib.optional with_tts "tts")
    (lib.optional with_stablediffusion "stablediffusion")
  ];

  # stdenv used for everything that may link against CUDA.
  # It's necessary to consistently use backendStdenv when building with CUDA
  # support, otherwise we get libstdc++ errors downstream.
  effectiveStdenv = if with_cublas then cudaPackages.backendStdenv else stdenv;

  # Name, version and source of the LocalAI release being packaged.
  # The fetched git tag is "v" followed by `version`; `src` is also read by
  # llama-cpp-grpc to obtain the gRPC backend sources.
  pname = "local-ai";
  version = "2.12.4";
  src = fetchFromGitHub {
    owner = "go-skynet";
    repo = "LocalAI";
    rev = "v${version}";
    hash = "sha256-piu2B6u4ZfxiOd9SXrE7jiiiwL2SM8EqXo2s5qeKRl0=";
  };

  # The LocalAI server. buildGoModule is switched to effectiveStdenv so the Go
  # build uses the same stdenv as the native backends defined above.
  #
  # Build outline:
  #   * postPatch rewrites the Makefile's `git clone` steps into copies of the
  #     prebuilt backends (or of their plain sources when a feature is
  #     disabled) and drops the prebuilt grpc-server binary in place;
  #   * modBuildPhase prepares the same sources before `go mod tidy` for the
  #     vendored module set;
  #   * buildPhase runs `make build` with makeFlags/buildFlags;
  #   * postFixup wraps the binary with the runtime library and tool paths.
  self = buildGoModule.override { stdenv = effectiveStdenv; } {
    inherit pname version src;

    vendorHash = "sha256-8Hu1y/PK21twnB7D22ltslFFzRrsB8d1R2hkgIFB/XY=";

    env.NIX_CFLAGS_COMPILE = lib.optionalString with_stablediffusion " -isystem ${opencv}/include/opencv4";

    postPatch =
      let
        cp = "cp -r --no-preserve=mode,ownership";
      in
      ''
        sed -i Makefile \
          -e 's;git clone.*go-llama-ggml$;${cp} ${go-llama-ggml} sources/go-llama-ggml;' \
          -e 's;git clone.*gpt4all$;${cp} ${gpt4all} sources/gpt4all;' \
          -e 's;git clone.*go-piper$;${cp} ${if with_tts then go-piper else go-piper.src} sources/go-piper;' \
          -e 's;git clone.*go-rwkv$;${cp} ${go-rwkv} sources/go-rwkv;' \
          -e 's;git clone.*whisper\.cpp$;${cp} ${whisper-cpp.src} sources/whisper\.cpp;' \
          -e 's;git clone.*go-bert$;${cp} ${go-bert} sources/go-bert;' \
          -e 's;git clone.*diffusion$;${cp} ${if with_stablediffusion then go-stable-diffusion else go-stable-diffusion.src} sources/go-stable-diffusion;' \
          -e 's;git clone.*go-tiny-dream$;${cp} ${if with_tinydream then go-tiny-dream else go-tiny-dream.src} sources/go-tiny-dream;' \
          -e 's, && git checkout.*,,g' \
          -e '/mod download/ d' \

        ${cp} ${llama-cpp-grpc}/bin/*grpc-server backend/cpp/llama/grpc-server
        echo "grpc-server:" > backend/cpp/llama/Makefile
      ''
    ;

    buildInputs = [ ]
      ++ lib.optionals with_cublas [ libcublas ]
      ++ lib.optionals with_clblas [ clblast ocl-icd opencl-headers ]
      ++ lib.optionals with_openblas [ openblas.dev ]
      ++ lib.optionals with_stablediffusion go-stable-diffusion.buildInputs
      ++ lib.optionals with_tts go-piper.buildInputs;

    nativeBuildInputs = [ makeWrapper ]
      ++ lib.optionals with_cublas [ cuda_nvcc ];

    enableParallelBuilding = false;

    modBuildPhase = ''
      mkdir sources
      make prepare-sources
      go mod tidy -v
    '';

    proxyVendor = true;

    # should be passed as makeFlags, but the build system fails with strings
    # containing spaces
    env.GO_TAGS = builtins.concatStringsSep " " GO_TAGS;

    makeFlags = [
      "VERSION=v${version}"
      "BUILD_TYPE=${BUILD_TYPE}"
    ]
    ++ lib.optional with_cublas "CUDA_LIBPATH=${cuda_cudart}/lib"
    ++ lib.optional with_tts "PIPER_CGO_CXXFLAGS=-DSPDLOG_FMT_EXTERNAL=1";

    # Custom build phase: prepare the sources, refresh the timestamps of the
    # prebuilt static libraries, add whisper.cpp's static libraries, then run
    # `make build` with the accumulated flags.
    # NOTE(review): `sources/**/lib*.a` only recurses when bash's globstar
    # option is on; otherwise `**` matches like `*` - confirm which is intended.
    buildPhase = ''
      runHook preBuild

      mkdir sources
      make prepare-sources
      # avoid rebuild of prebuilt libraries
      touch sources/**/lib*.a
      cp ${whisper-cpp}/lib/static/lib*.a sources/whisper.cpp

      local flagsArray=(
        ''${enableParallelBuilding:+-j''${NIX_BUILD_CORES}}
        SHELL=$SHELL
      )
      _accumFlagsArray makeFlags makeFlagsArray buildFlags buildFlagsArray
      echoCmd 'build flags' "''${flagsArray[@]}"
      make build "''${flagsArray[@]}"
      unset flagsArray

      runHook postBuild
    '';

    installPhase = ''
      runHook preInstall

      install -Dt $out/bin ${pname}

      runHook postInstall
    '';

    # patching rpath with patchelf doesn't work. The executable
    # raises a segmentation fault
    postFixup =
      let
        LD_LIBRARY_PATH = [ ]
          ++ lib.optionals with_cublas [ (lib.getLib libcublas) cuda_cudart addDriverRunpath.driverLink ]
          ++ lib.optionals with_clblas [ clblast ocl-icd ]
          ++ lib.optionals with_openblas [ openblas ]
          ++ lib.optionals with_tts [ piper-phonemize ];
      in
      ''
        wrapProgram $out/bin/${pname} \
        --prefix LD_LIBRARY_PATH : "${lib.makeLibraryPath LD_LIBRARY_PATH}" \
        --prefix PATH : "${ffmpeg}/bin"
      '';

    # Every helper derivation defined in this file, exposed for inspection and
    # individual builds. go-stable-diffusion is listed as well so that no
    # locally built backend is missing from the set.
    passthru.local-packages = {
      inherit
        go-tiny-dream go-rwkv go-bert go-llama-ggml gpt4all go-piper
        llama-cpp-grpc whisper-cpp go-tiny-dream-ncnn espeak-ng' piper-phonemize
        piper-tts' go-stable-diffusion;
    };

    # The feature toggles this package was evaluated with.
    passthru.features = {
      inherit
        with_cublas with_openblas with_tts with_stablediffusion
        with_tinydream with_clblas;
    };

    passthru.tests = callPackages ./tests.nix { inherit self; };

    meta = with lib; {
      description = "OpenAI alternative to run local LLMs, image and audio generation";
      homepage = "https://localai.io";
      license = licenses.mit;
      maintainers = with maintainers; [ onny ck3d ];
      platforms = platforms.linux;
    };
  };
in
self
Project import generated by Copybara. GitOrigin-RevId: 6143fc5eeb9c4f00163267708e26191d1e918932 2024-04-21 15:54:59 +00:00			`{ config`
			`, callPackages`
			`, stdenv`
			`, lib`
			`, addDriverRunpath`
			`, fetchpatch`
			`, fetchFromGitHub`
			`, protobuf`
			`, grpc`
			`, openssl`
			`, llama-cpp`
			`# needed for audio-to-text`
			`, ffmpeg`
			`, cmake`
			`, pkg-config`
			`, buildGoModule`
			`, makeWrapper`

			`# apply feature parameter names according to`
			`# https://github.com/NixOS/rfcs/pull/169`

			`# CPU extensions`
			`, enable_avx ? true`
			`, enable_avx2 ? true`
			`, enable_avx512 ? stdenv.hostPlatform.avx512Support`
			`, enable_f16c ? true`
			`, enable_fma ? true`

			`, with_openblas ? false`
			`, openblas`

			`, with_cublas ? config.cudaSupport`
			`, cudaPackages`

			`, with_clblas ? false`
			`, clblast`
			`, ocl-icd`
			`, opencl-headers`

			`, with_tinydream ? false # do not compile with cublas`
			`, ncnn`

			`, with_stablediffusion ? true`
			`, opencv`

			`, with_tts ? true`
			`, onnxruntime`
			`, sonic`
			`, spdlog`
			`, fmt`
			`, espeak-ng`
			`, piper-tts`
			`}:`
			`let`
			`BUILD_TYPE =`
			`assert (lib.count lib.id [ with_openblas with_cublas with_clblas ]) <= 1;`
			`if with_openblas then "openblas"`
			`else if with_cublas then "cublas"`
			`else if with_clblas then "clblas"`
			`else "";`

			`inherit (cudaPackages) libcublas cuda_nvcc cuda_cccl cuda_cudart cudatoolkit;`

			`go-llama-ggml = effectiveStdenv.mkDerivation {`
			`name = "go-llama-ggml";`
			`src = fetchFromGitHub {`
			`owner = "go-skynet";`
			`repo = "go-llama.cpp";`
			`rev = "2b57a8ae43e4699d3dc5d1496a1ccd42922993be";`
			`hash = "sha256-D6SEg5pPcswGyKAmF4QTJP6/Y1vjRr7m7REguag+too=";`
			`fetchSubmodules = true;`
			`};`
			`buildFlags = [`
			`"libbinding.a"`
			`"BUILD_TYPE=${BUILD_TYPE}"`
			`];`

			`buildInputs = [ ]`
			`++ lib.optionals with_clblas [ clblast ocl-icd opencl-headers ]`
			`++ lib.optionals with_openblas [ openblas.dev ];`

			`nativeBuildInputs = [ cmake ]`
			`# backward compatiblity with nixos-23.11`
			`# use cuda_nvcc after release of nixos-24.05`
			`++ lib.optionals with_cublas [ cudatoolkit ];`

			`dontUseCmakeConfigure = true;`

			`installPhase = ''`
			`mkdir $out`
			`tar cf - --exclude=build --exclude=CMakeFiles --exclude="*.o" . \`
			`\| tar xf - -C $out`
			`'';`
			`};`

			`llama-cpp-grpc = (llama-cpp.overrideAttrs (final: prev: {`
			`name = "llama-cpp-grpc";`
			`src = fetchFromGitHub {`
			`owner = "ggerganov";`
			`repo = "llama.cpp";`
			`rev = "1b67731e184e27a465b8c5476061294a4af668ea";`
			`hash = "sha256-0WWbsklpW6HhFRkvWpYh8Lhi8VIansS/zmyIKNQRkIs=";`
			`fetchSubmodules = true;`
			`};`
			`postPatch = prev.postPatch + ''`
			`cd examples`
			`cp -r --no-preserve=mode ${src}/backend/cpp/llama grpc-server`
			`cp llava/clip.* llava/llava.* grpc-server`
			`printf "\nadd_subdirectory(grpc-server)" >> CMakeLists.txt`

			`cp ${src}/backend/backend.proto grpc-server`
			`sed -i grpc-server/CMakeLists.txt \`
			`-e '/get_filename_component/ s;[.\/]*backend/;;' \`
			`-e '$a\install(TARGETS ''${TARGET} RUNTIME)'`
			`cd ..`
			`'';`
			`cmakeFlags = prev.cmakeFlags ++ [`
			`(lib.cmakeBool "BUILD_SHARED_LIBS" false)`
			`(lib.cmakeBool "LLAMA_AVX" enable_avx)`
			`(lib.cmakeBool "LLAMA_AVX2" enable_avx2)`
			`(lib.cmakeBool "LLAMA_AVX512" enable_avx512)`
			`(lib.cmakeBool "LLAMA_FMA" enable_fma)`
			`(lib.cmakeBool "LLAMA_F16C" enable_f16c)`
			`];`
			`buildInputs = prev.buildInputs ++ [`
			`protobuf # provides also abseil_cpp as propagated build input`
			`grpc`
			`openssl`
			`];`
			`})).override {`
			`cudaSupport = with_cublas;`
			`rocmSupport = false;`
			`openclSupport = with_clblas;`
			`blasSupport = with_openblas;`
			`};`

			`gpt4all = stdenv.mkDerivation {`
			`name = "gpt4all";`
			`src = fetchFromGitHub {`
			`owner = "nomic-ai";`
			`repo = "gpt4all";`
			`rev = "27a8b020c36b0df8f8b82a252d261cda47cf44b8";`
			`hash = "sha256-djq1eK6ncvhkO3MNDgasDBUY/7WWcmZt/GJsHAulLdI=";`
			`fetchSubmodules = true;`
			`};`
			`makeFlags = [ "-C gpt4all-bindings/golang" ];`
			`buildFlags = [ "libgpt4all.a" ];`
			`dontUseCmakeConfigure = true;`
			`nativeBuildInputs = [ cmake ];`
			`installPhase = ''`
			`mkdir $out`
			`tar cf - --exclude=CMakeFiles . \`
			`\| tar xf - -C $out`
			`'';`
			`};`

			`espeak-ng' = espeak-ng.overrideAttrs (self: {`
			`name = "espeak-ng'";`
			`inherit (go-piper) src;`
			`sourceRoot = "source/espeak";`
			`patches = [ ];`
			`nativeBuildInputs = [ cmake ];`
			`cmakeFlags = (self.cmakeFlags or [ ]) ++ [`
			`(lib.cmakeBool "BUILD_SHARED_LIBS" true)`
			`(lib.cmakeBool "USE_ASYNC" false)`
			`(lib.cmakeBool "USE_MBROLA" false)`
			`(lib.cmakeBool "USE_LIBPCAUDIO" false)`
			`(lib.cmakeBool "USE_KLATT" false)`
			`(lib.cmakeBool "USE_SPEECHPLAYER" false)`
			`(lib.cmakeBool "USE_LIBSONIC" false)`
			`(lib.cmakeBool "CMAKE_POSITION_INDEPENDENT_CODE" true)`
			`];`
			`preConfigure = null;`
			`postInstall = null;`
			`});`

			`piper-phonemize = stdenv.mkDerivation {`
			`name = "piper-phonemize";`
			`inherit (go-piper) src;`
			`sourceRoot = "source/piper-phonemize";`
			`buildInputs = [ espeak-ng' onnxruntime ];`
			`nativeBuildInputs = [ cmake pkg-config ];`
			`cmakeFlags = [`
			`(lib.cmakeFeature "ONNXRUNTIME_DIR" "${onnxruntime.dev}")`
			`(lib.cmakeFeature "ESPEAK_NG_DIR" "${espeak-ng'}")`
			`];`
			`passthru.espeak-ng = espeak-ng';`
			`};`

			`piper-tts' = (piper-tts.override { inherit piper-phonemize; }).overrideAttrs (self: {`
			`name = "piper-tts'";`
			`inherit (go-piper) src;`
			`sourceRoot = "source/piper";`
			`installPhase = null;`
			`postInstall = ''`
			`cp CMakeFiles/piper.dir/src/cpp/piper.cpp.o $out/piper.o`
			`cd $out`
			`mkdir bin lib`
			`mv lib*so* lib/`
			`mv piper piper_phonemize bin/`
			`rm -rf cmake pkgconfig espeak-ng-data *.ort`
			`'';`
			`});`

			`go-piper = stdenv.mkDerivation {`
			`name = "go-piper";`
			`src = fetchFromGitHub {`
			`owner = "mudler";`
			`repo = "go-piper";`
			`rev = "9d0100873a7dbb0824dfea40e8cec70a1b110759";`
			`hash = "sha256-Yv9LQkWwGpYdOS0FvtP0vZ0tRyBAx27sdmziBR4U4n8=";`
			`fetchSubmodules = true;`
			`};`
			`postUnpack = ''`
			`cp -r --no-preserve=mode ${piper-tts'}/* source`
			`'';`
			`postPatch = ''`
			`sed -i Makefile \`
			`-e '/CXXFLAGS *= / s;$; -DSPDLOG_FMT_EXTERNAL=1;'`
			`'';`
			`buildFlags = [ "libpiper_binding.a" ];`
			`buildInputs = [ piper-tts' espeak-ng' piper-phonemize sonic fmt spdlog onnxruntime ];`
			`installPhase = ''`
			`cp -r --no-preserve=mode $src $out`
			`mkdir -p $out/piper-phonemize/pi`
			`cp -r --no-preserve=mode ${piper-phonemize}/share $out/piper-phonemize/pi`
			`cp *.a $out`
			`'';`
			`};`

			`go-rwkv = stdenv.mkDerivation {`
			`name = "go-rwkv";`
			`src = fetchFromGitHub {`
			`owner = "donomii";`
			`repo = "go-rwkv.cpp";`
			`rev = "661e7ae26d442f5cfebd2a0881b44e8c55949ec6";`
			`hash = "sha256-byTNZQSnt7qpBMng3ANJmpISh3GJiz+F15UqfXaz6nQ=";`
			`fetchSubmodules = true;`
			`};`
			`buildFlags = [ "librwkv.a" ];`
			`dontUseCmakeConfigure = true;`
			`nativeBuildInputs = [ cmake ];`
			`installPhase = ''`
			`cp -r --no-preserve=mode $src $out`
			`cp *.a $out`
			`'';`
			`};`

			`# try to merge with openai-whisper-cpp in future`
			`whisper-cpp = effectiveStdenv.mkDerivation {`
			`name = "whisper-cpp";`
			`src = fetchFromGitHub {`
			`owner = "ggerganov";`
			`repo = "whisper.cpp";`
			`rev = "8f253ef3af1c62c04316ba4afa7145fc4d701a8c";`
			`hash = "sha256-yHHjhpQIn99A/hqFwAb7TfTf4Q9KnKat93zyXS70bT8=";`
			`};`

			`nativeBuildInputs = [ cmake pkg-config ]`
			`++ lib.optionals with_cublas [ cuda_nvcc ];`

			`buildInputs = [ ]`
			`++ lib.optionals with_cublas [ cuda_cccl cuda_cudart libcublas ]`
			`++ lib.optionals with_clblas [ clblast ocl-icd opencl-headers ]`
			`++ lib.optionals with_openblas [ openblas.dev ];`

			`cmakeFlags = [`
			`(lib.cmakeBool "WHISPER_CUDA" with_cublas)`
			`(lib.cmakeBool "WHISPER_CLBLAST" with_clblas)`
			`(lib.cmakeBool "WHISPER_OPENBLAS" with_openblas)`
			`(lib.cmakeBool "WHISPER_NO_AVX" (!enable_avx))`
			`(lib.cmakeBool "WHISPER_NO_AVX2" (!enable_avx2))`
			`(lib.cmakeBool "WHISPER_NO_FMA" (!enable_fma))`
			`(lib.cmakeBool "WHISPER_NO_F16C" (!enable_f16c))`
			`(lib.cmakeBool "BUILD_SHARED_LIBS" false)`
			`];`
			`postInstall = ''`
			`install -Dt $out/bin bin/*`
			`'';`
			`};`

			`go-bert = stdenv.mkDerivation {`
			`name = "go-bert";`
			`src = fetchFromGitHub {`
			`owner = "go-skynet";`
			`repo = "go-bert.cpp";`
			`rev = "6abe312cded14042f6b7c3cd8edf082713334a4d";`
			`hash = "sha256-lh9cvXc032Eq31kysxFOkRd0zPjsCznRl0tzg9P2ygo=";`
			`fetchSubmodules = true;`
			`};`
			`buildFlags = [ "libgobert.a" ];`
			`dontUseCmakeConfigure = true;`
			`nativeBuildInputs = [ cmake ];`
			`env.NIX_CFLAGS_COMPILE = "-Wformat";`
			`installPhase = ''`
			`cp -r --no-preserve=mode $src $out`
			`cp *.a $out`
			`'';`
			`};`

			`go-stable-diffusion = stdenv.mkDerivation {`
			`name = "go-stable-diffusion";`
			`src = fetchFromGitHub {`
			`owner = "mudler";`
			`repo = "go-stable-diffusion";`
			`rev = "362df9da29f882dbf09ade61972d16a1f53c3485";`
			`hash = "sha256-A5KvMZOviPsIpPHxM8cacT+qE2x1iFJAbPsRs4sLijY=";`
			`fetchSubmodules = true;`
			`};`
			`buildFlags = [ "libstablediffusion.a" ];`
			`dontUseCmakeConfigure = true;`
			`nativeBuildInputs = [ cmake ];`
			`buildInputs = [ opencv ];`
			`env.NIX_CFLAGS_COMPILE = " -isystem ${opencv}/include/opencv4";`
			`installPhase = ''`
			`mkdir $out`
			`tar cf - --exclude=CMakeFiles --exclude="*.o" --exclude="*.so" --exclude="*.so.*" . \`
			`\| tar xf - -C $out`
			`'';`
			`};`

			`go-tiny-dream-ncnn = ncnn.overrideAttrs (self: {`
			`name = "go-tiny-dream-ncnn";`
			`inherit (go-tiny-dream) src;`
			`sourceRoot = "source/ncnn";`
			`cmakeFlags = self.cmakeFlags ++ [`
			`(lib.cmakeBool "NCNN_SHARED_LIB" false)`
			`(lib.cmakeBool "NCNN_OPENMP" false)`
			`(lib.cmakeBool "NCNN_VULKAN" false)`
			`(lib.cmakeBool "NCNN_AVX" enable_avx)`
			`(lib.cmakeBool "NCNN_AVX2" enable_avx2)`
			`(lib.cmakeBool "NCNN_AVX512" enable_avx512)`
			`(lib.cmakeBool "NCNN_FMA" enable_fma)`
			`(lib.cmakeBool "NCNN_F16C" enable_f16c)`
			`];`
			`});`

			`go-tiny-dream = effectiveStdenv.mkDerivation {`
			`name = "go-tiny-dream";`
			`src = fetchFromGitHub {`
			`owner = "M0Rf30";`
			`repo = "go-tiny-dream";`
			`rev = "22a12a4bc0ac5455856f28f3b771331a551a4293";`
			`hash = "sha256-DAVHD6E0OKHf4C2ldoI0Mm7813DIrmWFONUhSCQPCfc=";`
			`fetchSubmodules = true;`
			`};`
			`postUnpack = ''`
			`rm -rf source/ncnn`
			`mkdir -p source/ncnn/build/src`
			`cp -r --no-preserve=mode ${go-tiny-dream-ncnn}/lib/. ${go-tiny-dream-ncnn}/include/. source/ncnn/build/src`
			`'';`
			`buildFlags = [ "libtinydream.a" ];`
			`installPhase = ''`
			`mkdir $out`
			`tar cf - --exclude="*.o" . \`
			`\| tar xf - -C $out`
			`'';`
			`meta.broken = lib.versionOlder go-tiny-dream.stdenv.cc.version "13";`
			`};`

			`GO_TAGS = lib.optional with_tinydream "tinydream"`
			`++ lib.optional with_tts "tts"`
			`++ lib.optional with_stablediffusion "stablediffusion";`

			`effectiveStdenv =`
			`if with_cublas then`
			`# It's necessary to consistently use backendStdenv when building with CUDA support,`
			`# otherwise we get libstdc++ errors downstream.`
			`cudaPackages.backendStdenv`
			`else`
			`stdenv;`

			`pname = "local-ai";`
			`version = "2.12.4";`
			`src = fetchFromGitHub {`
			`owner = "go-skynet";`
			`repo = "LocalAI";`
			`rev = "v${version}";`
			`hash = "sha256-piu2B6u4ZfxiOd9SXrE7jiiiwL2SM8EqXo2s5qeKRl0=";`
			`};`

			`self = buildGoModule.override { stdenv = effectiveStdenv; } {`
			`inherit pname version src;`

			`vendorHash = "sha256-8Hu1y/PK21twnB7D22ltslFFzRrsB8d1R2hkgIFB/XY=";`

			`env.NIX_CFLAGS_COMPILE = lib.optionalString with_stablediffusion " -isystem ${opencv}/include/opencv4";`

			`postPatch =`
			`let`
			`cp = "cp -r --no-preserve=mode,ownership";`
			`in`
			`''`
			`sed -i Makefile \`
			`-e 's;git clone.*go-llama-ggml$;${cp} ${go-llama-ggml} sources/go-llama-ggml;' \`
			`-e 's;git clone.*gpt4all$;${cp} ${gpt4all} sources/gpt4all;' \`
			`-e 's;git clone.*go-piper$;${cp} ${if with_tts then go-piper else go-piper.src} sources/go-piper;' \`
			`-e 's;git clone.*go-rwkv$;${cp} ${go-rwkv} sources/go-rwkv;' \`
			`-e 's;git clone.*whisper\.cpp$;${cp} ${whisper-cpp.src} sources/whisper\.cpp;' \`
			`-e 's;git clone.*go-bert$;${cp} ${go-bert} sources/go-bert;' \`
			`-e 's;git clone.*diffusion$;${cp} ${if with_stablediffusion then go-stable-diffusion else go-stable-diffusion.src} sources/go-stable-diffusion;' \`
			`-e 's;git clone.*go-tiny-dream$;${cp} ${if with_tinydream then go-tiny-dream else go-tiny-dream.src} sources/go-tiny-dream;' \`
			`-e 's, && git checkout.*,,g' \`
			`-e '/mod download/ d' \`

			`${cp} ${llama-cpp-grpc}/bin/*grpc-server backend/cpp/llama/grpc-server`
			`echo "grpc-server:" > backend/cpp/llama/Makefile`
			`''`
			`;`

			`buildInputs = [ ]`
			`++ lib.optionals with_cublas [ libcublas ]`
			`++ lib.optionals with_clblas [ clblast ocl-icd opencl-headers ]`
			`++ lib.optionals with_openblas [ openblas.dev ]`
			`++ lib.optionals with_stablediffusion go-stable-diffusion.buildInputs`
			`++ lib.optionals with_tts go-piper.buildInputs;`

			`nativeBuildInputs = [ makeWrapper ]`
			`++ lib.optionals with_cublas [ cuda_nvcc ];`

			`enableParallelBuilding = false;`

			`modBuildPhase = ''`
			`mkdir sources`
			`make prepare-sources`
			`go mod tidy -v`
			`'';`

			`proxyVendor = true;`

			`# should be passed as makeFlags, but build system failes with strings`
			`# containing spaces`
			`env.GO_TAGS = builtins.concatStringsSep " " GO_TAGS;`

			`makeFlags = [`
			`"VERSION=v${version}"`
			`"BUILD_TYPE=${BUILD_TYPE}"`
			`]`
			`++ lib.optional with_cublas "CUDA_LIBPATH=${cuda_cudart}/lib"`
			`++ lib.optional with_tts "PIPER_CGO_CXXFLAGS=-DSPDLOG_FMT_EXTERNAL=1";`

			`buildPhase = ''`
			`runHook preBuild`

			`mkdir sources`
			`make prepare-sources`
			`# avoid rebuild of prebuilt libraries`
			`touch sources/**/lib*.a`
			`cp ${whisper-cpp}/lib/static/lib*.a sources/whisper.cpp`

			`local flagsArray=(`
			`''${enableParallelBuilding:+-j''${NIX_BUILD_CORES}}`
			`SHELL=$SHELL`
			`)`
			`_accumFlagsArray makeFlags makeFlagsArray buildFlags buildFlagsArray`
			`echoCmd 'build flags' "''${flagsArray[@]}"`
			`make build "''${flagsArray[@]}"`
			`unset flagsArray`

			`runHook postBuild`
			`'';`

			`installPhase = ''`
			`runHook preInstall`

			`install -Dt $out/bin ${pname}`

			`runHook postInstall`
			`'';`

			`# patching rpath with patchelf doens't work. The execuable`
			`# raises an segmentation fault`
			`postFixup =`
			`let`
			`LD_LIBRARY_PATH = [ ]`
			`++ lib.optionals with_cublas [ (lib.getLib libcublas) cuda_cudart addDriverRunpath.driverLink ]`
			`++ lib.optionals with_clblas [ clblast ocl-icd ]`
			`++ lib.optionals with_openblas [ openblas ]`
			`++ lib.optionals with_tts [ piper-phonemize ];`
			`in`
			`''`
			`wrapProgram $out/bin/${pname} \`
			`--prefix LD_LIBRARY_PATH : "${lib.makeLibraryPath LD_LIBRARY_PATH}" \`
			`--prefix PATH : "${ffmpeg}/bin"`
			`'';`

			`passthru.local-packages = {`
			`inherit`
			`go-tiny-dream go-rwkv go-bert go-llama-ggml gpt4all go-piper`
			`llama-cpp-grpc whisper-cpp go-tiny-dream-ncnn espeak-ng' piper-phonemize`
			`piper-tts';`
			`};`

			`passthru.features = {`
			`inherit`
			`with_cublas with_openblas with_tts with_stablediffusion`
			`with_tinydream with_clblas;`
			`};`

			`passthru.tests = callPackages ./tests.nix { inherit self; };`

			`meta = with lib; {`
			`description = "OpenAI alternative to run local LLMs, image and audio generation";`
			`homepage = "https://localai.io";`
			`license = licenses.mit;`
			`maintainers = with maintainers; [ onny ck3d ];`
			`platforms = platforms.linux;`
			`};`
			`};`
			`in`
			`self`