Update tts.py
tts.py CHANGED
@@ -71,11 +71,9 @@ def generate_speech(text, language="vi", speaker_wav=None, normalize_text=True):
         raise ValueError(f"Ngôn ngữ {language} không được hỗ trợ.")
     if len(text) < 2:
         raise ValueError("Văn bản quá ngắn.")
-
     try:
         if normalize_text and language == "vi":
             text = normalize_vietnamese_text(text)
-
         with torch.no_grad():
             with autocast(enabled=use_fp16):
                 gpt_cond_latent, speaker_embedding = MODEL.get_conditioning_latents(
@@ -93,8 +91,7 @@ def generate_speech(text, language="vi", speaker_wav=None, normalize_text=True):
                     temperature=0.75,
                     enable_text_splitting=True,
                 )
-
-        output_file = "output.wav"
+        output_file = f"output_{os.urandom(4).hex()}.wav"
         torchaudio.save(output_file, torch.tensor(out["wav"]).unsqueeze(0).to("cpu"), 24000)
         return output_file
     except Exception as e:
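The only functional change is the output path: the fixed name "output.wav" becomes output_{os.urandom(4).hex()}.wav, so repeated or concurrent calls no longer write to the same file (note that the new f-string relies on os being imported in tts.py). A minimal standalone sketch of the same unique-filename idea; the helper name unique_output_path is illustrative and not part of the repository:

import os

def unique_output_path(prefix: str = "output", ext: str = "wav") -> str:
    """Return a collision-resistant file name like 'output_a3f09c1d.wav'.

    os.urandom(4).hex() yields 8 random hex characters, so two requests
    handled at the same time are very unlikely to target the same file.
    """
    return f"{prefix}_{os.urandom(4).hex()}.{ext}"

if __name__ == "__main__":
    print(unique_output_path())  # e.g. output_3fa1c07b.wav

uuid.uuid4().hex or tempfile.mkstemp would give similar uniqueness if stronger collision resistance or managed temporary files were preferred.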