211 lines
6 KiB
Nix
211 lines
6 KiB
Nix
{
|
|
config,
|
|
lib,
|
|
rustPlatform,
|
|
fetchFromGitHub,
|
|
nix-update-script,
|
|
stdenv,
|
|
|
|
git,
|
|
openssl,
|
|
pkg-config,
|
|
protobuf,
|
|
|
|
llama-cpp,
|
|
|
|
apple-sdk_15,
|
|
autoAddDriverRunpath,
|
|
versionCheckHook,
|
|
|
|
cudaSupport ? config.cudaSupport,
|
|
rocmSupport ? config.rocmSupport,
|
|
metalSupport ? stdenv.hostPlatform.isDarwin && stdenv.hostPlatform.isAarch64,
|
|
# one of [ null "cpu" "rocm" "cuda" "metal" ];
|
|
acceleration ? null,
|
|
}:
|
|
|
|
let
|
|
inherit (lib) optional optionals flatten;
|
|
# References:
|
|
# https://github.com/NixOS/nixpkgs/blob/master/pkgs/by-name/ll/llama-cpp/package.nix
|
|
# https://github.com/NixOS/nixpkgs/blob/master/pkgs/tools/misc/ollama/default.nix
|
|
|
|
pname = "tabby";
|
|
version = "0.20.0";
|
|
|
|
availableAccelerations = flatten [
|
|
(optional cudaSupport "cuda")
|
|
(optional rocmSupport "rocm")
|
|
(optional metalSupport "metal")
|
|
];
|
|
|
|
warnIfMultipleAccelerationMethods =
|
|
configured:
|
|
(
|
|
let
|
|
len = builtins.length configured;
|
|
result = if len == 0 then "cpu" else (builtins.head configured);
|
|
in
|
|
lib.warnIf (len > 1) ''
|
|
building tabby with multiple acceleration methods enabled is not
|
|
supported; falling back to `${result}`
|
|
'' result
|
|
);
|
|
|
|
# If user did not not override the acceleration attribute, then try to use one of
|
|
# - nixpkgs.config.cudaSupport
|
|
# - nixpkgs.config.rocmSupport
|
|
# - metal if (stdenv.hostPlatform.isDarwin && stdenv.hostPlatform.isAarch64)
|
|
# !! warn if multiple acceleration methods are enabled and default to the first one in the list
|
|
featureDevice =
|
|
if (builtins.isNull acceleration) then
|
|
(warnIfMultipleAccelerationMethods availableAccelerations)
|
|
else
|
|
acceleration;
|
|
|
|
warnIfNotLinux =
|
|
api:
|
|
(lib.warnIfNot stdenv.hostPlatform.isLinux
|
|
"building tabby with `${api}` is only supported on linux; falling back to cpu"
|
|
stdenv.hostPlatform.isLinux
|
|
);
|
|
warnIfNotDarwinAarch64 =
|
|
api:
|
|
(lib.warnIfNot (stdenv.hostPlatform.isDarwin && stdenv.hostPlatform.isAarch64)
|
|
"building tabby with `${api}` is only supported on Darwin-aarch64; falling back to cpu"
|
|
(stdenv.hostPlatform.isDarwin && stdenv.hostPlatform.isAarch64)
|
|
);
|
|
|
|
validAccel = lib.assertOneOf "tabby.featureDevice" featureDevice [
|
|
"cpu"
|
|
"rocm"
|
|
"cuda"
|
|
"metal"
|
|
];
|
|
|
|
# TODO(ghthor): there is a bug here where featureDevice could be cuda, but enableCuda is false
|
|
# The would result in a startup failure of the service module.
|
|
enableRocm = validAccel && (featureDevice == "rocm") && (warnIfNotLinux "rocm");
|
|
enableCuda = validAccel && (featureDevice == "cuda") && (warnIfNotLinux "cuda");
|
|
enableMetal = validAccel && (featureDevice == "metal") && (warnIfNotDarwinAarch64 "metal");
|
|
|
|
# We have to use override here because tabby doesn't actually tell llama-cpp
|
|
# to use a specific device type as it is relying on llama-cpp only being
|
|
# built to use one type of device.
|
|
#
|
|
# See: https://github.com/TabbyML/tabby/blob/v0.11.1/crates/llama-cpp-bindings/include/engine.h#L20
|
|
#
|
|
llamaccpPackage = llama-cpp.override {
|
|
rocmSupport = enableRocm;
|
|
cudaSupport = enableCuda;
|
|
metalSupport = enableMetal;
|
|
};
|
|
|
|
# TODO(ghthor): some of this can be removed
|
|
darwinBuildInputs =
|
|
[ llamaccpPackage ]
|
|
++ optionals stdenv.hostPlatform.isDarwin ([
|
|
apple-sdk_15
|
|
]);
|
|
|
|
cudaBuildInputs = [ llamaccpPackage ];
|
|
rocmBuildInputs = [ llamaccpPackage ];
|
|
|
|
in
|
|
rustPlatform.buildRustPackage {
|
|
inherit pname version;
|
|
inherit featureDevice;
|
|
|
|
src = fetchFromGitHub {
|
|
owner = "TabbyML";
|
|
repo = "tabby";
|
|
rev = "refs/tags/v${version}";
|
|
hash = "sha256-Vhl5oNVYY3pizoA0PuV4c9UXH3F2L+WiXQMOM0Pqxks=";
|
|
fetchSubmodules = true;
|
|
};
|
|
|
|
cargoLock = {
|
|
lockFile = ./Cargo.lock;
|
|
outputHashes = {
|
|
"ollama-rs-0.1.9" = "sha256-d6sKUxc8VQbRkVqMOeNFqDdKesq5k32AQShK67y2ssg=";
|
|
"oneshot-0.1.6" = "sha256-PmYuHuNTqToMyMHPRFDUaHUvFkVftx9ZCOBwXj+4Hc4=";
|
|
"ownedbytes-0.7.0" = "sha256-p0+ohtW0VLmfDTZw/LfwX2gYfuYuoOBcE+JsguK7Wn8=";
|
|
"sqlx-0.7.4" = "sha256-tcISzoSfOZ0jjNgGpuPPxjMxmBUPw/5FVDoALZEAHKY=";
|
|
"tree-sitter-c-0.21.3" = "sha256-ucbHLS2xyGo1uyKZv/K1HNXuMo4GpTY327cgdVS9F3c=";
|
|
"tree-sitter-cpp-0.22.1" = "sha256-3akSuQltFMF6I32HwRU08+Hcl9ojxPGk2ZuOX3gAObw=";
|
|
"tree-sitter-solidity-1.2.6" = "sha256-S00hdzMoIccPYBEvE092/RIMnG8YEnDGk6GJhXlr4ng=";
|
|
};
|
|
};
|
|
|
|
# https://github.com/TabbyML/tabby/blob/v0.7.0/.github/workflows/release.yml#L39
|
|
cargoBuildFlags =
|
|
[
|
|
# Don't need to build llama-cpp-server (included in default build)
|
|
"--no-default-features"
|
|
"--features"
|
|
"ee"
|
|
"--package"
|
|
"tabby"
|
|
]
|
|
++ optionals enableRocm [
|
|
"--features"
|
|
"rocm"
|
|
]
|
|
++ optionals enableCuda [
|
|
"--features"
|
|
"cuda"
|
|
];
|
|
|
|
nativeInstallCheckInputs = [
|
|
versionCheckHook
|
|
];
|
|
versionCheckProgramArg = [ "--version" ];
|
|
doInstallCheck = true;
|
|
|
|
nativeBuildInputs =
|
|
[
|
|
git
|
|
pkg-config
|
|
protobuf
|
|
]
|
|
++ optionals enableCuda [
|
|
autoAddDriverRunpath
|
|
];
|
|
|
|
buildInputs =
|
|
[ openssl ]
|
|
++ optionals stdenv.hostPlatform.isDarwin darwinBuildInputs
|
|
++ optionals enableCuda cudaBuildInputs
|
|
++ optionals enableRocm rocmBuildInputs;
|
|
|
|
postInstall = ''
|
|
# NOTE: Project contains a subproject for building llama-server
|
|
# But, we already have a derivation for this
|
|
ln -s ${lib.getExe' llama-cpp "llama-server"} $out/bin/llama-server
|
|
'';
|
|
|
|
env = {
|
|
OPENSSL_NO_VENDOR = 1;
|
|
};
|
|
|
|
# Fails with:
|
|
# file cannot create directory: /var/empty/local/lib64/cmake/Llama
|
|
doCheck = false;
|
|
|
|
passthru.updateScript = nix-update-script {
|
|
extraArgs = [
|
|
"--version-regex"
|
|
"^v([0-9.]+)$"
|
|
];
|
|
};
|
|
|
|
meta = with lib; {
|
|
homepage = "https://github.com/TabbyML/tabby";
|
|
changelog = "https://github.com/TabbyML/tabby/releases/tag/v${version}";
|
|
description = "Self-hosted AI coding assistant";
|
|
mainProgram = "tabby";
|
|
license = licenses.asl20;
|
|
maintainers = [ maintainers.ghthor ];
|
|
broken = stdenv.hostPlatform.isDarwin && !stdenv.hostPlatform.isAarch64;
|
|
};
|
|
}
|