import re
import string

import soundfile as sf

from fam.llm.fast_inference import TTS


def remove_punctuation(sentence):
    """Return *sentence* without ASCII punctuation or line breaks.

    Every character in ``string.punctuation`` is deleted, each newline is
    replaced by a single space, and carriage returns are dropped.

    Args:
        sentence: The text to clean.

    Returns:
        The cleaned text as a new string.
    """
    # One translation table covers all three rewrites in a single pass:
    # '\n' maps to ' ', while punctuation and '\r' map to "delete".
    table = str.maketrans('\n', ' ', string.punctuation + '\r')
    return sentence.translate(table)


def _spell_out_acronyms(text):
    """Return *text* with each all-caps word rewritten letter by letter."""
    # Candidates are found on a punctuation-free copy of the text so that
    # a word such as "NASA," is still recognised as "NASA".
    acronyms = {
        word
        for word in remove_punctuation(text).split()
        if len(word) >= 2 and word.isupper()
    }
    if not acronyms:
        return text

    # Match whole words only. A plain substring replace would also rewrite
    # the "AI" inside "MAIN" or "AIs" and corrupt those words.
    alternatives = "|".join(
        re.escape(word) for word in sorted(acronyms, key=len, reverse=True)
    )
    pattern = re.compile(r"(?<!\w)(?:" + alternatives + r")(?!\w)")
    return pattern.sub(lambda match: " ".join(match.group()), text)


def run_audio_generation_v2(new_text, accent='None'):
    """Synthesise speech for *new_text* and write it to ``audio/output.wav``.

    Line breaks are flattened first. Every all-caps word of two or more
    characters is then spaced out (``"NASA"`` -> ``"N A S A"``), presumably
    so the engine reads it as individual letters, before the text is passed
    to the TTS engine.

    Args:
        new_text: The text to speak.
        accent: Currently unused; kept so existing callers keep working.

    Returns:
        None. The audio is written to ``audio/output.wav`` with a sample
        rate of 22050.
    """
    tts = TTS()

    new_text = new_text.replace('\n', ' ').replace('\r', '')
    new_text = _spell_out_acronyms(new_text)

    wav_file = tts.synthesise(
        text=new_text,
        spk_ref_path="./tmp/audio/speaker_wav.wav",
    )
    # NOTE(review): sf.write expects array-like sample data. Confirm that
    # TTS.synthesise returns samples rather than a path to a written file.
    sf.write('audio/output.wav', wav_file, samplerate=22050)