{ lib , python3 , fetchFromGitHub , fetchpatch , espeak-ng }: # USAGE: # $ tts-server --list_models # # pick your favorite vocoder/tts model # $ tts-server --model_name tts_models/en/ljspeech/glow-tts --vocoder_name vocoder_models/universal/libri-tts/fullband-melgan # # If you upgrade from an old version you may have to delete old models from ~/.local/share/tts # # For now, for deployment check the systemd unit in the pull request: # https://github.com/NixOS/nixpkgs/pull/103851#issue-521121136 let python = python3.override { packageOverrides = self: super: { # API breakage with 0.9.0 # TypeError: mel() takes 0 positional arguments but 2 positional arguments (and 3 keyword-only arguments) were given librosa = super.librosa.overridePythonAttrs (oldAttrs: rec { version = "0.8.1"; src = super.fetchPypi { pname = "librosa"; inherit version; hash = "sha256-xT0F52iuSj5VOuIcLlAVKT5e+/1cEtSX8RBMtRnMprM="; }; }); }; }; in python.pkgs.buildPythonApplication rec { pname = "tts"; version = "0.11.1"; format = "pyproject"; src = fetchFromGitHub { owner = "coqui-ai"; repo = "TTS"; rev = "refs/tags/v${version}"; hash = "sha256-EVFFETiGbrouUsrIhMFZEex3UGCCWTI3CC4yFAcERyw="; }; postPatch = let relaxedConstraints = [ "cython" "gruut" "inflect" "librosa" "mecab-python3" "numba" "numpy" "unidic-lite" ]; in '' sed -r -i \ ${lib.concatStringsSep "\n" (map (package: ''-e 's/${package}.*[<>=]+.*/${package}/g' \'' ) relaxedConstraints)} requirements.txt # only used for notebooks and visualization sed -r -i -e '/umap-learn/d' requirements.txt ''; nativeBuildInputs = with python.pkgs; [ cython packaging ]; propagatedBuildInputs = with python.pkgs; [ anyascii coqpit flask fsspec g2pkk gdown gruut inflect jamo jieba librosa matplotlib mecab-python3 nltk numba packaging pandas pypinyin pysbd scipy soundfile tensorflow torch-bin torchaudio-bin tqdm trainer unidic-lite webrtcvad ]; postInstall = '' cp -r TTS/server/templates/ $out/${python.sitePackages}/TTS/server # cython modules are not installed for some reasons ( cd TTS/tts/utils/monotonic_align ${python.interpreter} setup.py install --prefix=$out ) ''; nativeCheckInputs = with python.pkgs; [ espeak-ng pytestCheckHook ]; preCheck = '' # use the installed TTS in $PYTHONPATH instead of the one from source to also have cython modules. mv TTS{,.old} export PATH=$out/bin:$PATH # numba tries to write to HOME directory export HOME=$TMPDIR for file in $(grep -rl 'python TTS/bin' tests); do substituteInPlace "$file" \ --replace "python TTS/bin" "${python.interpreter} $out/lib/${python.libPrefix}/site-packages/TTS/bin" done ''; disabledTests = [ # Requires network acccess to download models "test_korean_text_to_phonemes" "test_models_offset_0_step_3" "test_models_offset_1_step_3" "test_models_offset_2_step_3" "test_run_all_models" "test_synthesize" "test_voice_cloning" "test_voice_conversion" "test_multi_speaker_multi_lingual_model" "test_single_speaker_model" # Mismatch between phonemes "test_text_to_ids_phonemes_with_eos_bos_and_blank" # Takes too long "test_parametrized_wavernn_dataset" ]; disabledTestPaths = [ # phonemes mismatch between espeak-ng and gruuts phonemizer "tests/text_tests/test_phonemizer.py" # no training, it takes too long "tests/aux_tests/test_speaker_encoder_train.py" "tests/tts_tests/test_align_tts_train.py" "tests/tts_tests/test_fast_pitch_speaker_emb_train.py" "tests/tts_tests/test_fast_pitch_train.py" "tests/tts_tests/test_fastspeech_2_speaker_emb_train.py" "tests/tts_tests/test_fastspeech_2_train.py" "tests/tts_tests/test_glow_tts_d-vectors_train.py" "tests/tts_tests/test_glow_tts_speaker_emb_train.py" "tests/tts_tests/test_glow_tts_train.py" "tests/tts_tests/test_neuralhmm_tts_train.py" "tests/tts_tests/test_overflow_train.py" "tests/tts_tests/test_speedy_speech_train.py" "tests/tts_tests/test_tacotron2_d-vectors_train.py" "tests/tts_tests/test_tacotron2_speaker_emb_train.py" "tests/tts_tests/test_tacotron2_train.py" "tests/tts_tests/test_tacotron_train.py" "tests/tts_tests/test_vits_d-vectors_train.py" "tests/tts_tests/test_vits_multilingual_speaker_emb_train.py" "tests/tts_tests/test_vits_multilingual_train-d_vectors.py" "tests/tts_tests/test_vits_speaker_emb_train.py" "tests/tts_tests/test_vits_train.py" "tests/vocoder_tests/test_wavegrad_train.py" "tests/vocoder_tests/test_parallel_wavegan_train.py" "tests/vocoder_tests/test_fullband_melgan_train.py" "tests/vocoder_tests/test_hifigan_train.py" "tests/vocoder_tests/test_multiband_melgan_train.py" "tests/vocoder_tests/test_melgan_train.py" "tests/vocoder_tests/test_wavernn_train.py" ]; meta = with lib; { homepage = "https://github.com/coqui-ai/TTS"; changelog = "https://github.com/coqui-ai/TTS/releases/tag/v${version}"; description = "Deep learning toolkit for Text-to-Speech, battle-tested in research and production"; license = licenses.mpl20; maintainers = teams.tts.members; }; }