depot/third_party/nixpkgs/pkgs/development/python-modules/somajo/default.nix
Default email 7e47f3658e Project import generated by Copybara.
GitOrigin-RevId: 1925c603f17fc89f4c8f6bf6f631a802ad85d784
2024-09-26 11:04:55 +00:00

42 lines
907 B
Nix

# Package expression for SoMaJo, a tokenizer and sentence splitter for German
# and English web texts. Called with the Python package set's builders and
# dependencies; returns the result of `buildPythonPackage`.
{
  lib,
  stdenv,
  fetchFromGitHub,
  buildPythonPackage,
  pythonOlder,
  setuptools,
  regex,
}:

buildPythonPackage rec {
  pname = "somajo";
  version = "2.4.3";
  pyproject = true;

  # Not available for Python interpreters older than 3.8.
  disabled = pythonOlder "3.8";

  # Source is fetched from the upstream GitHub tag matching `version`.
  src = fetchFromGitHub {
    owner = "tsproisl";
    repo = "SoMaJo";
    rev = "refs/tags/v${version}";
    hash = "sha256-fq891LX6PukUEfrXplulhnisuPX/RqLAQ/5ty/Fvm9k=";
  };

  build-system = [ setuptools ];

  dependencies = [ regex ];

  # The check phase loops forever on Darwin, so checks are only enabled on
  # other host platforms.
  doCheck = !stdenv.hostPlatform.isDarwin;

  # Smoke test: the top-level module must be importable after installation.
  pythonImportsCheck = [ "somajo" ];

  # `lib` is referenced explicitly instead of via `with lib;` so that every
  # name in this set can be resolved by reading the file alone.
  meta = {
    description = "Tokenizer and sentence splitter for German and English web texts";
    homepage = "https://github.com/tsproisl/SoMaJo";
    changelog = "https://github.com/tsproisl/SoMaJo/blob/v${version}/CHANGES.txt";
    license = lib.licenses.gpl3Plus;
    maintainers = [ ];
    mainProgram = "somajo-tokenizer";
  };
}