# NixOS module that runs the `local-ai` server as a systemd service.
#
# Declares the `services.local-ai.*` options and, when
# `services.local-ai.enable` is set, defines `systemd.services.local-ai`
# whose command line is assembled from those options.
{
  pkgs,
  config,
  lib,
  ...
}:
let
  # Shorthand for this module's own option values.
  cfg = config.services.local-ai;
  inherit (lib) mkOption types;
in
{
  options.services.local-ai = {
    enable = lib.mkEnableOption "local-ai";

    package = lib.mkPackageOption pkgs "local-ai" { };

    extraArgs = mkOption {
      type = types.listOf types.str;
      default = [ ];
      description = ''
        Additional command line arguments appended, in order, after all
        arguments generated by this module.
      '';
    };

    port = mkOption {
      type = types.port;
      default = 8080;
      description = ''
        Port the server listens on. Passed to the service as
        `--address=:<port>`, i.e. without a host part.
      '';
    };

    threads = mkOption {
      type = types.int;
      default = 1;
      description = ''
        Value passed to the service as `--threads`.
      '';
    };

    models = mkOption {
      type = types.either types.package types.str;
      default = "models";
      description = ''
        Location of the models, passed to the service as `--models-path`.
        Either a package (its store path is used) or a string. A relative
        string such as the default is resolved against the working
        directory of the service, which is its runtime directory.
      '';
    };

    parallelRequests = mkOption {
      type = types.int;
      default = 1;
      description = ''
        Value exported to the service as the `LLAMACPP_PARALLEL`
        environment variable. When greater than 1, the
        `--parallel-requests` flag is additionally passed.
      '';
    };

    logLevel = mkOption {
      type = types.enum [
        "error"
        "warn"
        "info"
        "debug"
        "trace"
      ];
      default = "warn";
      description = ''
        Value passed to the service as `--log-level`.
      '';
    };
  };

  config = lib.mkIf cfg.enable {
    systemd.services.local-ai = {
      wantedBy = [ "multi-user.target" ];

      # Always exported, even when parallelRequests is 1; only the
      # command line flag below is conditional.
      environment.LLAMACPP_PARALLEL = toString cfg.parallelRequests;

      serviceConfig = {
        DynamicUser = true;

        # NOTE(review): escapeShellArgs applies POSIX shell quoting. systemd
        # still interprets `%` specifiers in ExecStart, so a literal `%` in
        # extraArgs is presumably not passed through verbatim - confirm
        # whether a systemd-specific escaping helper should be used instead.
        ExecStart = lib.escapeShellArgs (
          [
            "${cfg.package}/bin/local-ai"
            "--address=:${toString cfg.port}"
            "--threads=${toString cfg.threads}"
            # "." is relative to WorkingDirectory below.
            "--localai-config-dir=."
            "--models-path=${cfg.models}"
            "--log-level=${cfg.logLevel}"
          ]
          ++ lib.optional (cfg.parallelRequests > 1) "--parallel-requests"
          ++ cfg.extraArgs
        );

        # The service runs inside its own runtime directory: `%t` is the
        # systemd specifier for the runtime directory root, so this points
        # at the directory created by RuntimeDirectory.
        RuntimeDirectory = "local-ai";
        WorkingDirectory = "%t/local-ai";
      };
    };
  };
}