# Package expression for ollama, built from the upstream GitHub release tag
# with buildGoModule. The bundled llama.cpp server invocation is patched so
# that the binary from the separate `llama-cpp` package is used instead.
#
# NOTE(review): `stdenv` is accepted but not referenced in this expression;
# it is kept so the argument interface (and any `.override`) stays unchanged.
{ lib
, buildGoModule
, fetchFromGitHub
, llama-cpp
, stdenv
}:

buildGoModule rec {
  pname = "ollama";
  version = "0.1.7";

  src = fetchFromGitHub {
    owner = "jmorganca";
    repo = "ollama";
    rev = "v${version}";
    hash = "sha256-rzcuRU2qcYTMo/GxiSHwJYnvA9samfWlztMEhOGzbRg=";
  };

  patches = [
    # disable passing the deprecated gqa flag to llama-cpp-server
    # see https://github.com/ggerganov/llama.cpp/issues/2975
    ./disable-gqa.patch

    # replace the call to the bundled llama-cpp-server with the one in the llama-cpp package
    ./set-llamacpp-path.patch
  ];

  # Fill in the @llamaCppServer@ placeholder in llm/llama.go with the absolute
  # store path of the llama-cpp server binary.
  # NOTE(review): the placeholder is presumably introduced by
  # set-llamacpp-path.patch above -- confirm against the patch file.
  postPatch = ''
    substituteInPlace llm/llama.go \
      --subst-var-by llamaCppServer "${llama-cpp}/bin/llama-cpp-server"
  '';

  # Hash of the vendored Go module dependencies; must be refreshed whenever
  # `version` (and therefore go.sum) changes.
  vendorHash = "sha256-Qt5QVqRkwK61BJPVhFWtox6b9E8BpAIseNB0yhh+/90=";

  ldflags = [
    # Omit the symbol table and DWARF debug information from the binary.
    "-s"
    "-w"
    # Set the version string and server mode variables at link time.
    "-X=github.com/jmorganca/ollama/version.Version=${version}"
    "-X=github.com/jmorganca/ollama/server.mode=release"
  ];

  meta = with lib; {
    description = "Get up and running with large language models locally";
    homepage = "https://github.com/jmorganca/ollama";
    license = licenses.mit;
    mainProgram = "ollama";
    maintainers = with maintainers; [ dit7ya elohmeier ];
    platforms = platforms.unix;
  };
}