# Package definition for SoMaJo, built with buildPythonPackage.
#
# Arguments:
#   lib, stdenv           - used for `meta` and the platform check below
#   fetchFromGitHub       - fetches the tagged source from GitHub
#   buildPythonPackage    - builder for the package
#   isPy3k                - flag used to disable the package when it is false
#   regex                 - runtime dependency, propagated to dependents
{ lib, stdenv, fetchFromGitHub, buildPythonPackage, isPy3k, regex }:

buildPythonPackage rec {
  pname = "SoMaJo";
  version = "2.1.5";

  # The package is disabled whenever isPy3k is false.
  disabled = !isPy3k;

  src = fetchFromGitHub {
    owner = "tsproisl";
    repo = pname;
    # Upstream release tags are the version prefixed with "v".
    rev = "v${version}";
    sha256 = "17v1vmbjwpxwql25vlbm7xsair7945ljmyaricxx8fd6fxvgn9rr";
  };

  propagatedBuildInputs = [ regex ];

  # The check phase loops forever on Darwin, so it is only run on other platforms.
  doCheck = !stdenv.isDarwin;

  meta = with lib; {
    description = "Tokenizer and sentence splitter for German and English web texts";
    homepage = "https://github.com/tsproisl/SoMaJo";
    license = licenses.gpl3Plus;
    # No maintainers are currently listed for this package.
    maintainers = [ ];
  };
}