472aeafc57
GitOrigin-RevId: c31898adf5a8ed202ce5bea9f347b1c6871f32d1
92 lines
1.6 KiB
Nix
92 lines
1.6 KiB
Nix
{
|
|
lib,
|
|
buildPythonPackage,
|
|
fetchFromGitHub,
|
|
|
|
# build-system
|
|
poetry-core,
|
|
|
|
# dependencies
|
|
boltons,
|
|
gensim,
|
|
gitpython,
|
|
greek-accentuation,
|
|
nltk,
|
|
pyyaml,
|
|
rapidfuzz,
|
|
requests,
|
|
scikit-learn,
|
|
scipy,
|
|
spacy,
|
|
stanza,
|
|
stringcase,
|
|
torch,
|
|
tqdm,
|
|
|
|
# tests
|
|
pytestCheckHook,
|
|
}:
|
|
buildPythonPackage rec {
|
|
pname = "cltk";
|
|
version = "1.3.0";
|
|
|
|
pyproject = true;
|
|
|
|
src = fetchFromGitHub {
|
|
owner = "cltk";
|
|
repo = "cltk";
|
|
rev = "refs/tags/v${version}";
|
|
hash = "sha256-/rdv96lnSGN+aJJmPSIan79zoXxnStokFEAjBtCLKy4=";
|
|
};
|
|
|
|
postPatch = ''
|
|
substituteInPlace pyproject.toml \
|
|
--replace-fail "poetry>=1.1.13" poetry-core \
|
|
--replace-fail "poetry.masonry.api" "poetry.core.masonry.api" \
|
|
--replace-fail 'scipy = "<1.13.0"' 'scipy = "^1"' \
|
|
--replace-fail 'boltons = "^21.0.0"' 'boltons = "^24.0.0"'
|
|
'';
|
|
|
|
build-system = [ poetry-core ];
|
|
|
|
pythonRelaxDeps = [
|
|
"spacy"
|
|
];
|
|
|
|
dependencies = [
|
|
boltons
|
|
gensim
|
|
gitpython
|
|
greek-accentuation
|
|
nltk
|
|
pyyaml
|
|
rapidfuzz
|
|
requests
|
|
scikit-learn
|
|
scipy
|
|
spacy
|
|
stanza
|
|
stringcase
|
|
torch
|
|
tqdm
|
|
];
|
|
|
|
nativeCheckInputs = [
|
|
pytestCheckHook
|
|
];
|
|
|
|
preCheck = ''
|
|
export HOME=$(mktemp -d)
|
|
'';
|
|
|
|
# Most of tests fail as they require local files to be present and also internet access
|
|
doCheck = false;
|
|
|
|
meta = {
|
|
description = "Natural language processing (NLP) framework for pre-modern languages";
|
|
homepage = "https://cltk.org";
|
|
changelog = "https://github.com/cltk/cltk/releases/tag/v${version}";
|
|
license = lib.licenses.mit;
|
|
maintainers = with lib.maintainers; [ kmein ];
|
|
};
|
|
}
|