mirror of
https://github.com/tcsenpai/agenticSeek.git
synced 2025-06-03 01:30:11 +00:00
37 lines
1.3 KiB
Python
37 lines
1.3 KiB
Python
from kokoro import KPipeline
|
|
from IPython.display import display, Audio
|
|
import soundfile as sf
|
|
import subprocess
|
|
import re
|
|
|
|
# 🇺🇸 'a' => American English, 🇬🇧 'b' => British English
|
|
# 🇯🇵 'j' => Japanese: pip install misaki[ja]
|
|
# 🇨🇳 'z' => Mandarin Chinese: pip install misaki[zh]
|
|
pipeline = KPipeline(lang_code='a') # <= make sure lang_code matches voice
|
|
|
|
class Speech():
|
|
def __init__(self) -> None:
|
|
self.pipeline = KPipeline(lang_code='a')
|
|
|
|
def speak(self, sentence):
|
|
sentence = self.clean_sentence(sentence)
|
|
generator = self.pipeline(
|
|
sentence, voice='af_heart', # <= change voice here
|
|
speed=1, split_pattern=r'\n+'
|
|
)
|
|
for i, (gs, ps, audio) in enumerate(generator):
|
|
audio_file = f'sample.wav'
|
|
display(Audio(data=audio, rate=24000, autoplay=i==0))
|
|
sf.write(audio_file, audio, 24000) # save each audio file
|
|
subprocess.call(["afplay", audio_file])
|
|
|
|
def clean_sentence(self, sentence):
|
|
sentence = re.sub(r'`.*?`', '', sentence)
|
|
sentence = re.sub(r'[^a-zA-Z0-9.,!? ]+', '', sentence)
|
|
sentence = re.sub(r'\s+', ' ', sentence).strip()
|
|
return sentence
|
|
|
|
if __name__ == "__main__":
|
|
speech = Speech()
|
|
speech.speak("hello would you like coffee ?")
|