Spaces:

TDN-M
/

GV-a

Sleeping

App Files Community

TDN-M committed on Jan 13

Commit

070807c

verified ·

1 Parent(s): f77bed0

Update app.py

Browse files

Files changed (1) hide show

app.py +8 -24

app.py CHANGED Viewed

@@ -8,13 +8,12 @@ import gradio as gr
 from docx import Document
 from content_generation import create_content, CONTENT_TYPES
 from openai import OpenAI
-from gradio_client import Client, handle_file
 import subprocess
 import time
 # Khởi tạo client OpenAI với API key từ biến môi trường
 client_openai = OpenAI(api_key=os.environ.get('OPENAI_API_KEY'))
-client_vixtts = Client("thinhlpg/vixtts-demo")
 def create_docx(content, output_path):
     """
@@ -44,30 +43,15 @@ def process_docx(file_path):
         text += para.text
     return text
-def convert_text_to_speech(text, language='vi', timeout=60):
     """
-    Chuyển đổi văn bản thành giọng nói với thời gian chờ đợi.
     """
     try:
-        start_time = time.time()
-        future = client_vixtts.predict(
-            prompt=text,
-            language=language,
-            audio_file_pth=handle_file(''),
-            normalize_text=True,
-            api_name="/predict"
-        )
-        while not future.done():
-            elapsed_time = time.time() - start_time
-            if elapsed_time > timeout:
-                raise TimeoutError(f"Chờ quá lâu cho API chuyển đổi văn bản thành giọng nói (>{timeout} giây)")
-            time.sleep(1)  # Kiểm tra mỗi giây
-        result = future.result()
-        audio_file_path = result.audio_file_pth
-        if not audio_file_path or not os.path.exists(audio_file_path):
-            raise FileNotFoundError(f"File âm thanh không được tạo ra hoặc không tồn tại: {audio_file_path}")
-        return audio_file_path
     except Exception as e:
         raise Exception(f"Lỗi khi chuyển đổi văn bản thành giọng nói: {str(e)}")
@@ -183,7 +167,7 @@ def interface():
                     docx_path = "script.docx"
                     create_docx(text_to_convert, docx_path)
                     status_message.value = "Đang chuyển đổi văn bản thành giọng nói..."
-                    audio_path = convert_text_to_speech(text_to_convert, language)
                     status_message.value = "Đã chuyển đổi văn bản thành giọng nói thành công!"
                     status_message.value = "Đang tạo video..."
                     video_path = create_video(audio_path, mc_choice, text_color)

 from docx import Document
 from content_generation import create_content, CONTENT_TYPES
 from openai import OpenAI
+import edge_tts
 import subprocess
 import time
 # Khởi tạo client OpenAI với API key từ biến môi trường
 client_openai = OpenAI(api_key=os.environ.get('OPENAI_API_KEY'))
 def create_docx(content, output_path):
     """
         text += para.text
     return text
+async def convert_text_to_speech(text, language='vi', output_file="output.wav"):
     """
+    Chuyển đổi văn bản thành giọng nói sử dụng edge_tts.
     """
     try:
+        communicate = edge_tts.Communicate(text, "vi-VN-JennyNeural")
+        with open(output_file, "wb") as file:
+            await communicate.save(file)
+        return output_file
     except Exception as e:
         raise Exception(f"Lỗi khi chuyển đổi văn bản thành giọng nói: {str(e)}")
                     docx_path = "script.docx"
                     create_docx(text_to_convert, docx_path)
                     status_message.value = "Đang chuyển đổi văn bản thành giọng nói..."
+                    audio_path = await convert_text_to_speech(text_to_convert, language)
                     status_message.value = "Đã chuyển đổi văn bản thành giọng nói thành công!"
                     status_message.value = "Đang tạo video..."
                     video_path = create_video(audio_path, mc_choice, text_color)