02cf88bb76
GitOrigin-RevId: c4a0efdd5a728e20791b8d8d2f26f90ac228ee8d
96 lines
1.7 KiB
Nix
96 lines
1.7 KiB
Nix
# gruut: tokenizer, text cleaner, and phonemizer.
#
# Builds the main `gruut` package from the upstream GitHub tag and propagates
# one language pack (built by ./language-pack.nix from the same source) for
# every language code listed in `langPkgs`.
{
  lib,
  buildPythonPackage,
  callPackage,
  pythonOlder,
  fetchFromGitHub,
  babel,
  gruut-ipa,
  dateparser,
  jsonlines,
  num2words,
  python-crfsuite,
  dataclasses,
  python,
  networkx,
  glibcLocales,
  pytestCheckHook,
}:

let
  # Language codes for which a language pack is built and propagated.
  langPkgs = [
    "ar" "cs" "de" "en" "es" "fa" "fr"
    "it" "lb" "nl" "pt" "ru" "sv" "sw"
  ];
in
buildPythonPackage rec {
  pname = "gruut";
  version = "2.3.4";
  format = "setuptools";

  src = fetchFromGitHub {
    owner = "rhasspy";
    repo = pname;
    rev = "refs/tags/v${version}";
    sha256 = "sha256-DD7gnvH9T2R6E19+exWE7Si+XEpfh0Iy5FYbycjgzgM=";
  };

  # Drop the `~=` version pins on these three requirements.
  postPatch = ''
    substituteInPlace requirements.txt \
    --replace "dateparser~=1.0.0" "dateparser" \
    --replace "gruut_lang_en~=2.0.0" "gruut_lang_en" \
    --replace "jsonlines~=1.2.0" "jsonlines"
  '';

  propagatedBuildInputs =
    let
      # Each language pack shares this package's version, format and source.
      mkLanguagePack =
        lang:
        callPackage ./language-pack.nix {
          inherit
            lang
            version
            format
            src
            ;
        };
    in
    [
      babel
      gruut-ipa
      jsonlines
      num2words
      python-crfsuite
      dateparser
      networkx
    ]
    ++ lib.optionals (pythonOlder "3.7") [ dataclasses ]
    ++ map mkLanguagePack langPkgs;

  checkInputs = [
    glibcLocales
    pytestCheckHook
  ];

  disabledTests = [
    # https://github.com/rhasspy/gruut/issues/25
    "test_lexicon_external"

    # requires mishkal library
    "test_fa"
    "test_ar"
    "test_lb"
  ];

  # The test phase runs with LC_ALL set to a UTF-8 locale.
  preCheck = ''
    export LC_ALL=en_US.utf-8
  '';

  pythonImportsCheck = [ "gruut" ];

  meta = {
    description = "A tokenizer, text cleaner, and phonemizer for many human languages";
    homepage = "https://github.com/rhasspy/gruut";
    license = lib.licenses.mit;
    maintainers = lib.teams.tts.members;
  };
}