RoboServant/tts.py
2025-09-30 12:01:44 -05:00

21 lines
549 B
Python

from kokoro import KPipeline
from IPython.display import display, Audio
import soundfile as sf
import torch
class TTS:
    """Text-to-speech helper built on a Kokoro ``KPipeline``.

    The pipeline is created once, when the class body executes, and is
    shared by every instance of the class.
    """

    # Sample rate (Hz) used for both notebook playback and the saved file.
    SAMPLE_RATE = 24000

    # Shared synthesis pipeline, constructed with lang_code='a'.
    pipeline = KPipeline(lang_code='a')

    def __init__(self):
        pass

    def create_audio(self, text: str, save_path: str, voice: str = 'af_heart') -> None:
        """Synthesize *text* and write the complete audio to *save_path*.

        The pipeline yields the speech as a sequence of segments. Every
        segment is printed and displayed (the first one autoplays), and all
        segments are concatenated in order before a single write, so the
        output file holds the whole utterance rather than only the last
        segment.

        Args:
            text: Text to synthesize.
            save_path: Destination audio file; should be a ``.wav`` path.
            voice: Voice name passed to the pipeline. Defaults to
                ``'af_heart'``.

        Returns:
            None. If the pipeline produces no audio, no file is written.
        """
        segments = []
        for i, (gs, ps, audio) in enumerate(self.pipeline(text, voice=voice)):
            print(i, gs, ps)
            # NOTE(review): presumably a segment can come back without audio;
            # skip it rather than fail on display/concatenation - confirm.
            if audio is None:
                continue
            display(Audio(data=audio, rate=self.SAMPLE_RATE, autoplay=i == 0))
            # as_tensor accepts both torch tensors and array-likes, so the
            # segments can be joined with torch.cat regardless of which one
            # the pipeline yields.
            segments.append(torch.as_tensor(audio).detach().cpu())

        if not segments:
            # Nothing was synthesized (e.g. empty text): leave the path alone.
            return

        # One write of the joined segments; writing per segment to the same
        # path would overwrite the file each time and keep only the last one.
        sf.write(save_path, torch.cat(segments).numpy(), self.SAMPLE_RATE)