summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorDanny Milosavljevic <dannym@friendly-machines.com>2026-03-11 01:03:05 +0100
committerDanny Milosavljevic <dannym@friendly-machines.com>2026-03-11 10:33:24 +0100
commit08c1be701d833da632eb77a6d0ccd0be6acc8b31 (patch)
treed1873c2c2dc7a0e8b6b49228da33286587d8bb37
parentae1d77b36d17d5886b4cc24ec0291c8bce4fc7bf (diff)
gnu: Add python-pocket-tts.
* gnu/packages/speech.scm (python-pocket-tts): New variable. Change-Id: Id91307c0c934ba36db3c488e606230249ff50363
-rw-r--r--gnu/packages/speech.scm46
1 files changed, 46 insertions, 0 deletions
diff --git a/gnu/packages/speech.scm b/gnu/packages/speech.scm
index 38858a6e684..4ee5962c599 100644
--- a/gnu/packages/speech.scm
+++ b/gnu/packages/speech.scm
@@ -953,3 +953,49 @@ using a Python-based domain-specific language.")
ONNX Runtime. It supports models including Whisper and NeMo Parakeet.
Includes bundled Parakeet TDT V3 model weights (int8, CC-BY-4.0, NVIDIA).")
(license license:expat)))
+
+(define-public python-pocket-tts
+ (package
+ (name "python-pocket-tts")
+ (version "1.1.1")
+ (source
+ (origin
+ (method git-fetch)
+ (uri (git-reference
+ (url "https://github.com/kyutai-labs/pocket-tts")
+ (commit (string-append "v" version))))
+ (file-name (git-file-name name version))
+ (sha256
+ (base32 "0b9xxyrwa8vsz6r6fi7p47z8rd7q2gjjnwq47br89zp2lkzym3zm"))))
+ (build-system pyproject-build-system)
+ (arguments
+ (list
+ #:test-flags
+ #~(list ;;; These tests try to download models from HuggingFace Hub.
+ "--ignore=tests/test_cli_generate.py"
+ "--ignore=tests/test_documentation_examples.py")))
+ (propagated-inputs
+ (list python-beartype
+ python-einops
+ python-fastapi
+ python-huggingface-hub
+ python-numpy
+ python-pydantic
+ python-pytorch
+ python-safetensors
+ python-scipy
+ python-sentencepiece
+ python-soundfile
+ python-typer
+ python-typing-extensions
+ python-uvicorn))
+ (native-inputs
+ (list nss-certs-for-test
+ python-hatchling
+ python-pytest))
+ (home-page "https://github.com/kyutai-labs/pocket-tts")
+ (synopsis "Fast neural text-to-speech")
+ (description
+ "Pocket TTS is a fast neural text-to-speech engine with ~100M parameters,
+running at approximately 6x realtime on CPU. English only.")
+ (license license:expat)))