Spaces:

akbarazimifar
/

Persian-TTS

Runtime error

App Files Files Community

Persian-TTS / app.py

akbarazimifar

Create app.py

2070617 verified over 1 year ago

raw

history blame

5.39 kB

	import tempfile
	import os
	import gradio as gr
	from TTS.config import load_config
	from TTS.utils.manage import ModelManager
	from TTS.utils.synthesizer import Synthesizer
	from TTS.utils.download import download_url

	MODEL_NAMES = [
	"vits male1 (best)",
	"vits female (best)",
	"vits-male",
	"vits female1",
	"glowtts-male",
	"glowtts-female",
	"female tacotron2"
	]

	MAX_TXT_LEN = 800
	MODELS_DIRECTORY = os.path.join(os.path.dirname(__file__), "models")

	modelInfo = [
	["vits-male", "best_model_65633.pth", "config-0.json",
	"https://huggingface.co/Kamtera/persian-tts-male-vits/resolve/main/"],
	["vits female (best)", "checkpoint_48000.pth", "config-2.json",
	"https://huggingface.co/Kamtera/persian-tts-female-vits/resolve/main/"],
	["glowtts-male", "best_model_77797.pth", "config-1.json",
	"https://huggingface.co/Kamtera/persian-tts-male-glow_tts/resolve/main/"],
	["glowtts-female", "best_model.pth", "config.json",
	"https://huggingface.co/Kamtera/persian-tts-female-glow_tts/resolve/main/"],
	["vits male1 (best)", "checkpoint_88000.pth", "config.json",
	"https://huggingface.co/Kamtera/persian-tts-male1-vits/resolve/main/"],
	["vits female1", "checkpoint_50000.pth", "config.json",
	"https://huggingface.co/Kamtera/persian-tts-female1-vits/resolve/main/"],
	["female tacotron2", "checkpoint_313000.pth", "config-2.json",
	"https://huggingface.co/Kamtera/persian-tts-female-tacotron2/resolve/main/"]
	]

	for model in modelInfo:
	model_name, model_filename, config_filename, model_url = model
	model_directory = os.path.join(MODELS_DIRECTORY, model_name)
	if not os.path.exists(model_directory):
	os.makedirs(model_directory)
	print("\|> Downloading: ", model_directory)
	download_url(model_url + model_filename, model_directory, "best_model.pth")
	download_url(model_url + config_filename, model_directory, "config.json")


	def tts(text: str, model_name: str):
	if len(text) > MAX_TXT_LEN:
	text = text[:MAX_TXT_LEN]
	print(f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")

	# synthesize
	model_directory = os.path.join(MODELS_DIRECTORY, model_name)
	model_path = os.path.join(model_directory, "best_model.pth")
	config_path = os.path.join(model_directory, "config.json")
	synthesizer = Synthesizer(model_path, config_path)
	if synthesizer is None:
	raise NameError("model not found")
	wavs = synthesizer.tts(text)
	# return output
	with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
	synthesizer.save_wav(wavs, fp)
	return fp.name


	description = """
	This is a demo of persian text to speech model.

	Github : https://github.com/karim23657/Persian-tts-coqui

	Models can be found here: <br>

	\|Model\|Dataset\|
	\|----\|------\|
	\|[vits female (best)](https://huggingface.co/Kamtera/persian-tts-female-vits)\|[persian-tts-dataset-famale](https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset-famale)\|
	\|[vits male1 (best)](https://huggingface.co/Kamtera/persian-tts-male1-vits)\|[persian-tts-dataset-male](https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset-male)\|
	\|[vits female1](https://huggingface.co/Kamtera/persian-tts-female1-vits)\|[ParsiGoo](https://github.com/karim23657/ParsiGoo)\|
	\|[vits male](https://huggingface.co/Kamtera/persian-tts-male-vits)\|[persian-tts-dataset](https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset)\|
	\|[glowtts female](https://huggingface.co/Kamtera/persian-tts-female-glow_tts)\|[persian-tts-dataset-famale](https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset-famale)\|
	\|[glowtts male](https://huggingface.co/Kamtera/persian-tts-male-glow_tts)\|[persian-tts-dataset](https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset)\|
	\|[tacotron2 female](https://huggingface.co/Kamtera/persian-tts-female-tacotron2)\|[persian-tts-dataset-famale](https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset-famale)\|


	"""
	article = ""
	examples = [
	["و خداوند شما را با ارسال روح در جسم زندگانی و حیات بخشید", "vits-male"],
	["تاجر تو چه تجارت می کنی ، تو را چه که چه تجارت می کنم؟", "vits female (best)"],
	["شیش سیخ جیگر سیخی شیش هزار", "vits female (best)"],
	["سه شیشه شیر ، سه سیر سرشیر", "vits female (best)"],
	["دزدی دزدید ز بز دزدی بزی ، عجب دزدی که دزدید ز بز دزدی بزی", "vits male1 (best)"],
	["مثنوی یکی از قالب های شعری است ک هر بیت قافیه ی جداگانه دارد", "vits female1"],
	["در گلو ماند خس او سالها، چیست آن خس مهر جاه و مالها", "vits male1 (best)"],
	]

	iface = gr.Interface(
	fn=tts,
	inputs=[
	gr.Textbox(
	label="Text",
	value="زندگی فقط یک بار است؛ از آن به خوبی استفاده کن",
	),
	gr.Radio(
	label="Pick a TTS Model ",
	choices=MODEL_NAMES,
	value="vits-female",
	),
	],
	outputs=gr.Audio(label="Output", type='filepath'),
	examples=examples,
	title="🗣️ Persian tts 🗣️",
	description=description,
	article=article,
	live=False
	)
	iface.launch(share=False)