diff --git a/README.md b/README.md index 1a15bd3..ef7ba45 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,12 @@ # Kitten TTS 😻 +THIS IS A MODIFIED VERSION +- modified to be able to install on Python 3.13 +- modified to remove a dependency on Torch + +It was modified in order to explore using it in: +https://github.com/createcandle/voco + Screenshot 2026-02-18 at 8 33 04 PM diff --git a/kittentts/get_model.py b/kittentts/get_model.py index e9b346d..10bbd36 100644 --- a/kittentts/get_model.py +++ b/kittentts/get_model.py @@ -34,7 +34,7 @@ def generate(self, text, voice="expr-voice-5-m", speed=1.0, clean_text=False): Returns: Audio data as numpy array """ - print(f"Generating audio for text: {text}") + #print(f"Generating audio for text: {text}") return self.model.generate(text, voice=voice, speed=speed, clean_text=clean_text) def generate_to_file(self, text, output_path, voice="expr-voice-5-m", speed=1.0, sample_rate=24000): diff --git a/pyproject.toml b/pyproject.toml index 8a60547..43f08d2 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -19,13 +19,13 @@ classifiers = [ ] dependencies = [ "num2words", - "spacy", "espeakng_loader", - "misaki[en]>=0.9.4", "onnxruntime", "soundfile", "numpy", "huggingface_hub", + "transformers", + "phonemizer-fork" ] [project.urls] diff --git a/requirements.txt b/requirements.txt index 37bfbb3..3b61c2b 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,8 +1,8 @@ num2words -spacy espeakng_loader -misaki[en]>=0.9.4 onnxruntime soundfile numpy huggingface_hub +transformers +phonemizer-fork diff --git a/setup.py b/setup.py index 5ff10c6..eaaf62b 100644 --- a/setup.py +++ b/setup.py @@ -24,19 +24,22 @@ "Programming Language :: Python :: 3.10", "Programming Language :: Python :: 3.11", "Programming Language :: Python :: 3.12", + "Programming Language :: Python :: 3.13", "Topic :: Multimedia :: Sound/Audio :: Speech", "Topic :: Scientific/Engineering :: Artificial Intelligence", ], python_requires=">=3.8", install_requires=[ "num2words", - "spacy", + #"spacy", "espeakng_loader", - "misaki[en]>=0.9.4", + #"misaki@git+https://github.com/createcandle/misaki", "onnxruntime", "soundfile", "numpy", "huggingface_hub", + "transformers", + "phonemizer-fork", ], keywords="text-to-speech, tts, speech-synthesis, neural-networks, onnx", project_urls={