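# NOTE(review): the code in this section is commented out and does not run.
# Either restore it or delete it; version control already keeps the history.
# from fam.llm.fast_inference import TTS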
# import string
# import soundfile as sf

# def remove_punctuation(sentence):
#     translator = str.maketrans('', '', string.punctuation)
#     sentence = sentence.translate(translator)

#     # Remove line breaks
#     sentence = sentence.replace('\n', ' ').replace('\r', '')

#     return sentence

# def run_audio_generation_v2(new_text,accent='None'):
#     tts = TTS()
#     new_text =  new_text.replace('\n', ' ').replace('\r', '')
#     new_text_mod = remove_punctuation(new_text)

#     new_text_split = new_text_mod.split()
#     for word in new_text_split:
#         if len(word)>=2 and word.isupper():
#             new_text = new_text.replace(word, " ".join([*word]))
            
#     wav_file = tts.synthesise(
#     text=new_text,
#     spk_ref_path="./tmp/audio/speaker_wav.wav"  # Any speaker reference file can be used (WAV, OGG, MP3, FLAC, etc.).
#     )     
#     sf.write('audio/output.wav', wav_file, samplerate=22050)