5ca88bfbb9
GitOrigin-RevId: 9f918d616c5321ad374ae6cb5ea89c9e04bf3e58
41 lines
825 B
Nix
41 lines
825 B
Nix
{
  lib,
  stdenv,
  fetchFromGitHub,
  buildPythonPackage,
  pythonOlder,
  setuptools,
  regex,
}:

# Python package definition for SoMaJo, built from the tagged GitHub source
# with a pyproject-based (setuptools) build.
buildPythonPackage rec {
  pname = "somajo";
  version = "2.4.2";
  pyproject = true;

  # Refuse to build for interpreters older than Python 3.7.
  disabled = pythonOlder "3.7";

  src = fetchFromGitHub {
    owner = "tsproisl";
    repo = "SoMaJo";
    # Upstream release tags carry a "v" prefix.
    rev = "refs/tags/v${version}";
    hash = "sha256-5rlgDnPYTtuVMincG5CgVwNh/IGmZk6ItvzdB/wHmgg=";
  };

  # Build backend needed at build time only.
  build-system = [ setuptools ];

  # Runtime Python dependencies, propagated to consumers of this package.
  dependencies = [ regex ];

  # The test suite loops forever on Darwin, so checks only run on other platforms.
  doCheck = !stdenv.hostPlatform.isDarwin;

  # Smoke test: the top-level module must be importable after installation.
  pythonImportsCheck = [ "somajo" ];

  meta = {
    description = "Tokenizer and sentence splitter for German and English web texts";
    mainProgram = "somajo-tokenizer";
    homepage = "https://github.com/tsproisl/SoMaJo";
    license = lib.licenses.gpl3Plus;
    maintainers = [ ];
  };
}
|