Spaces:

akbarazimifar
/

Persian-TTS

Runtime error

App Files Files Community

akbarazimifar committed on Jun 8, 2024

Commit

e0bb698

verified ·

1 Parent(s): 6ae3876

Update app.py

Browse files

Files changed (1) hide show

app.py +69 -60

app.py CHANGED Viewed

@@ -1,12 +1,13 @@
-import tempfile ,os
-from TTS.config import load_config
 import gradio as gr
 from TTS.utils.manage import ModelManager
 from TTS.utils.synthesizer import Synthesizer
-MODEL_NAMES=[
     "vits male1 (best)",
     "vits female (best)",
     "vits-male",
@@ -15,70 +16,78 @@ MODEL_NAMES=[
     "glowtts-female",
     "female tacotron2"
 ]
-MAX_TXT_LEN = 800
-model_path = os.getcwd() + "/best_model.pth"
-config_path = os.getcwd() + "/config.json"
-from TTS.utils.download import download_url
-modelInfo=[
-    ["vits-male","best_model_65633.pth","config-0.json","https://huggingface.co/Kamtera/persian-tts-male-vits/resolve/main/"],
-    ["vits female (best)","checkpoint_48000.pth","config-2.json","https://huggingface.co/Kamtera/persian-tts-female-vits/resolve/main/"],
-    ["glowtts-male","best_model_77797.pth","config-1.json","https://huggingface.co/Kamtera/persian-tts-male-glow_tts/resolve/main/"],
-    ["glowtts-female","best_model.pth","config.json","https://huggingface.co/Kamtera/persian-tts-female-glow_tts/resolve/main/"],
-    ["vits male1 (best)","checkpoint_88000.pth","config.json","https://huggingface.co/Kamtera/persian-tts-male1-vits/resolve/main/"],
-    ["vits female1","checkpoint_50000.pth","config.json","https://huggingface.co/Kamtera/persian-tts-female1-vits/resolve/main/"],
-    ["female tacotron2","checkpoint_313000.pth","config-2.json","https://huggingface.co/Kamtera/persian-tts-female-tacotron2/resolve/main/"]
 ]
-for d in modelInfo:
-    directory=d[0]
-    if not os.path.exists(directory):
-        os.makedirs(directory)
-    print("|> Downloading: ",directory)
-    download_url(
-        d[3]+d[1],directory,"best_model.pth"
-    )
-    download_url(
-        d[3]+d[2],directory,"config.json"
-    )
-def tts(text: str,model_name: str):
-    if len(text) > MAX_TXT_LEN:
-        text = text[:MAX_TXT_LEN]
-        print(f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")
-    print(text)
-    # synthesize
-    synthesizer = Synthesizer(
-        model_name+"/best_model.pth", model_name+"/config.json"
-    )
-    if synthesizer is None:
-        raise NameError("model not found")
-    wavs = synthesizer.tts(text)
-    # return output
-    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
-        synthesizer.save_wav(wavs, fp)
-        return fp.name
-description="""
-"""
-article= ""
-examples=[
-    ["و خداوند شما را با ارسال روح در جسم زندگانی و حیات بخشید","vits-male"],
-    ["تاجر تو چه تجارت می کنی ، تو را چه که چه تجارت می کنم؟","vits female (best)"],
-    ["شیش سیخ جیگر سیخی شیش هزار","vits female (best)"],
-    ["سه شیشه شیر ، سه سیر سرشیر","vits female (best)"],
-    ["دزدی دزدید ز بز دزدی بزی ، عجب دزدی که دزدید ز بز دزدی بزی","vits male1 (best)"],
-    ["مثنوی یکی از قالب های شعری است ک هر بیت قافیه ی جداگانه دارد","vits female1"],
-    ["در گلو ماند خس او سالها، چیست آن خس مهر جاه و مالها","vits male1 (best)"],
 ]
 iface = gr.Interface(
-    fn=tts,
     inputs=[
         gr.Textbox(
             label="Text",
@@ -90,11 +99,11 @@ iface = gr.Interface(
             value="vits-female",
         ),
     ],
-    outputs=gr.Audio(label="Output",type='filepath'),
     examples=examples,
     title="🗣️ Persian tts 🗣️",
     description=description,
     article=article,
     live=False
 )
-iface.launch(share=False)

+import tempfile
+import os
 import gradio as gr
+from TTS.config import load_config
 from TTS.utils.manage import ModelManager
 from TTS.utils.synthesizer import Synthesizer
+from TTS.utils.download import download_url
+from concurrent.futures import ThreadPoolExecutor
+MODEL_NAMES = [
     "vits male1 (best)",
     "vits female (best)",
     "vits-male",
     "glowtts-female",
     "female tacotron2"
 ]
+MAX_TXT_LEN = 800  # maximum number of input characters synthesized per request; tts() truncates longer text
+MODELS_DIRECTORY = "models"  # path of the models directory
+modelInfo = [  # one entry per voice: [model name, checkpoint filename, config filename, base download URL]
+    ["vits-male", "best_model_65633.pth", "config-0.json",
+     "https://huggingface.co/Kamtera/persian-tts-male-vits/resolve/main/"],
+    ["vits female (best)", "checkpoint_48000.pth", "config-2.json",
+     "https://huggingface.co/Kamtera/persian-tts-female-vits/resolve/main/"],
+    ["glowtts-male", "best_model_77797.pth", "config-1.json",
+     "https://huggingface.co/Kamtera/persian-tts-male-glow_tts/resolve/main/"],
+    ["glowtts-female", "best_model.pth", "config.json",
+     "https://huggingface.co/Kamtera/persian-tts-female-glow_tts/resolve/main/"],
+    ["vits male1 (best)", "checkpoint_88000.pth", "config.json",
+     "https://huggingface.co/Kamtera/persian-tts-male1-vits/resolve/main/"],
+    ["vits female1", "checkpoint_50000.pth", "config.json",
+     "https://huggingface.co/Kamtera/persian-tts-female1-vits/resolve/main/"],
+    ["female tacotron2", "checkpoint_313000.pth", "config-2.json",
+     "https://huggingface.co/Kamtera/persian-tts-female-tacotron2/resolve/main/"]
 ]
+class PersianTTS:
+    def __init__(self):
+        self.model_manager = ModelManager(MODELS_DIRECTORY)
+        self.download_models()
+    def download_models(self):
+        with ThreadPoolExecutor(max_workers=5) as executor:
+            for model in modelInfo:
+                model_name, model_filename, config_filename, model_url = model
+                model_directory = os.path.join(MODELS_DIRECTORY, model_name)
+                if not os.path.exists(model_directory):
+                    os.makedirs(model_directory)
+                print("|> Downloading: ", model_directory)
+                executor.submit(download_url, model_url + model_filename, model_directory, "best_model.pth")
+                executor.submit(download_url, model_url + config_filename, model_directory, "config.json")
+    def tts(self, text: str, model_name: str):
+        if len(text) > MAX_TXT_LEN:
+            text = text[:MAX_TXT_LEN]
+            print(f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")
+        # synthesize
+        model_path, config_path = self.model_manager.get_model_paths(model_name)
+        synthesizer = Synthesizer(model_path, config_path)
+        if synthesizer is None:
+            raise NameError("model not found")
+        wavs = synthesizer.tts(text)
+        # return output
+        with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
+            synthesizer.save_wav(wavs, fp)
+            return fp.name
+description = """
+"""  # description text is just a newline; passed to gr.Interface(description=...)
+article = ""  # passed to gr.Interface(article=...)
+examples = [  # [text, model name] rows passed to gr.Interface(examples=...)
+    ["و خداوند شما را با ارسال روح در جسم زندگانی و حیات بخشید", "vits-male"],
+    ["تاجر تو چه تجارت می کنی ، تو را چه که چه تجارت می کنم؟", "vits female (best)"],
+    ["شیش سیخ جیگر سیخی شیش هزار", "vits female (best)"],
+    ["سه شیشه شیر ، سه سیر سرشیر", "vits female (best)"],
+    ["دزدی دزدید ز بز دزدی بزی ، عجب دزدی که دزدید ز بز دزدی بزی", "vits male1 (best)"],
+    ["مثنوی یکی از قالب های شعری است ک هر بیت قافیه ی جداگانه دارد", "vits female1"],
+    ["در گلو ماند خس او سالها، چیست آن خس مهر جاه و مالها", "vits male1 (best)"],
 ]
+persian_tts = PersianTTS()
 iface = gr.Interface(
+    fn=persian_tts.tts,
     inputs=[
         gr.Textbox(
             label="Text",
             value="vits-female",
         ),
     ],
+    outputs=gr.Audio(label="Output", type='filepath'),
     examples=examples,
     title="🗣️ Persian tts 🗣️",
     description=description,
     article=article,
     live=False
 )
+iface.launch(share=False)