Spaces:

TDN-M
/

GV-a

Running on Zero

App Files Files Community

TDN-M committed on Oct 13, 2024

Commit

2b12a37

verified ·

1 Parent(s): e163cb1

Upload 5 files

Browse files

Files changed (3) hide show

app.py +12 -9
utils.py +1 -1
video_processing.py +58 -24

app.py CHANGED Viewed

@@ -75,9 +75,6 @@ def extract_key_contents(script, num_contents=10):
     except Exception as e:
         print(f"Lỗi khi trích xuất nội dung: {str(e)}")
         return []
-# Định nghĩa danh sách giọng đọc
-VOICES = ["alloy", "echo", "fable", "onyx", "nova", "shimmer"]
 # Giao diện Gradio
 def interface():
@@ -143,18 +140,24 @@ def interface():
             confirm_button.click(lambda x: asyncio.run(confirm_content(x)),
                                  inputs=[content_output],
                                  outputs=[download_docx, download_audio, status_message])
         with gr.Tab("Tạo Âm thanh"):
             text_input = gr.Textbox(label="Nhập văn bản để chuyển đổi")
-            voice_select = gr.Dropdown(label="Chọn giọng đọc",
-                                       choices=VOICES)  # Dropdown cho voice_select
             audio_button = gr.Button("Tạo Âm thanh")
             audio_output = gr.Audio(label="Âm thanh tạo ra")
             download_audio = gr.File(label="Tải xuống file âm thanh", interactive=False)
             def text_to_speech_func(text, voice):
-                audio_path = text_to_speech(text, voice, "Tiếng Việt")
-                return audio_path, audio_path
             audio_button.click(text_to_speech_func,
                                inputs=[text_input, voice_select],
@@ -175,6 +178,7 @@ def interface():
                 """ Tạo video từ các thông tin đầu vào. """
                 try:
                     status_message.update("Đang xử lý...")  # Cập nhật trạng thái
                     # 1. Tính toán thời lượng video
                     audio_clip = AudioFileClip(audio_file)
                     video_duration = audio_clip.duration
@@ -207,8 +211,7 @@ def interface():
                 except Exception as e:
                     status_message.update(f"Lỗi khi tạo video: {e}")  # Cập nhật trạng thái
                     return None
-        return app
 # Khởi chạy ứng dụng
 if __name__ == "__main__":

     except Exception as e:
         print(f"Lỗi khi trích xuất nội dung: {str(e)}")
         return []
 # Giao diện Gradio
 def interface():
             confirm_button.click(lambda x: asyncio.run(confirm_content(x)),
                                  inputs=[content_output],
                                  outputs=[download_docx, download_audio, status_message])
+        # Định nghĩa danh sách giọng đọc
+        VOICES = ["alloy", "echo", "fable", "onyx", "nova", "shimmer"]
         with gr.Tab("Tạo Âm thanh"):
             text_input = gr.Textbox(label="Nhập văn bản để chuyển đổi")
+            voice_select = gr.Dropdown(label="Chọn giọng đọc", choices=VOICES)  # Dropdown cho voice_select
             audio_button = gr.Button("Tạo Âm thanh")
             audio_output = gr.Audio(label="Âm thanh tạo ra")
             download_audio = gr.File(label="Tải xuống file âm thanh", interactive=False)
             def text_to_speech_func(text, voice):
+                try:
+                    audio_path = text_to_speech(text, voice, "Tiếng Việt")
+                    return audio_path, audio_path
+                except Exception as e:
+                    print(f"Lỗi khi chuyển đổi văn bản thành giọng nói: {e}")
+                    return None, None
             audio_button.click(text_to_speech_func,
                                inputs=[text_input, voice_select],
                 """ Tạo video từ các thông tin đầu vào. """
                 try:
                     status_message.update("Đang xử lý...")  # Cập nhật trạng thái
                     # 1. Tính toán thời lượng video
                     audio_clip = AudioFileClip(audio_file)
                     video_duration = audio_clip.duration
                 except Exception as e:
                     status_message.update(f"Lỗi khi tạo video: {e}")  # Cập nhật trạng thái
                     return None
+                    return app
 # Khởi chạy ứng dụng
 if __name__ == "__main__":

utils.py CHANGED Viewed

@@ -10,7 +10,7 @@ def check_file_exists(file_path):
         raise FileNotFoundError(f"Tệp {file_path} không tồn tại.")
 # Đường dẫn đầy đủ tới các file
-bgm_file = "data/bg_music/output000.mp3"
 output_path = "output/final_video.mp4"
 check_file_exists(bgm_file)

         raise FileNotFoundError(f"Tệp {file_path} không tồn tại.")
 # Đường dẫn đầy đủ tới các file
+bgm_file = "data/bg_music.mp3"
 output_path = "output/final_video.mp4"
 check_file_exists(bgm_file)

video_processing.py CHANGED Viewed

@@ -1,5 +1,6 @@
 import os
 import random
 import shutil
 import tempfile
 from concurrent.futures import ThreadPoolExecutor
@@ -82,6 +83,35 @@ def process_images_parallel(image_patch, clip_duration):
     return clips
 def process_script_for_video(script, dataset_path, use_dataset):
     """
     Xử lý script để tạo video.
@@ -93,30 +123,34 @@ def create_video_func(script, audio_path, dataset_path, use_dataset):
     """
     Hàm chính để tạo video.
     """
-    sentences = process_script_for_video(script, dataset_path, use_dataset)
-    # Tạo thư mục tạm thời để lưu các file âm thanh tách biệt
-    temp_dir = tempfile.mkdtemp()
-    # Tách file âm thanh thành các đoạn nhỏ
-    audio_clips = split_audio(audio_path, len(sentences), temp_dir)
-    # Lấy đường dẫn của các video từ dataset
-    video_files = glob.glob(os.path.join(dataset_path, "*.mp4")) if use_dataset else []
-    # Đảm bảo số lượng câu, âm thanh và video là bằng nhau
-    min_length = min(len(sentences), len(audio_clips), len(video_files))
-    sentences = sentences[:min_length]
-    audio_clips = audio_clips[:min_length]
-    video_files = video_files[:min_length]
-    output_path = "output_video.mp4"
-    create_video(sentences, audio_clips, video_files, output_path)
-    # Xóa thư mục tạm thời
-    shutil.rmtree(temp_dir)
-    return output_path, output_path
 def split_audio(audio_path, num_segments, output_dir):
     """

 import os
 import random
+import glob
 import shutil
 import tempfile
 from concurrent.futures import ThreadPoolExecutor
     return clips
+# Định nghĩa hàm extract_key_contents
+def extract_key_contents(script: str) -> list[str]:
+    """
+    Split a script into sentences and return each one as a key point.
+    Parameters:
+    - script (str): The text to split.
+    Returns:
+    - list[str]: The non-empty, whitespace-stripped pieces of the script,
+      in their original order. An empty (or otherwise falsy) script yields [].
+    Processing logic:
+    - The script is split on the period character ('.') only; '?' and '!'
+      are not treated as sentence boundaries, and periods inside numbers or
+      abbreviations also cause a split.
+    - Each resulting piece is treated as one key point and added to the result list.
+    """
+    # Nothing to split when the script is empty (or None)
+    if not script:
+        return []
+    # Split the script into candidate sentences on '.'
+    sentences = script.split('.')
+    # Strip surrounding whitespace and drop pieces that are empty after stripping
+    sentences = [sentence.strip() for sentence in sentences if sentence.strip()]
+    # Return the list of sentences
+    return sentences
 def process_script_for_video(script, dataset_path, use_dataset):
     """
     Xử lý script để tạo video.
     """
     Hàm chính để tạo video.
     """
+    try:
+        sentences = process_script_for_video(script, dataset_path, use_dataset)
+        # Tạo thư mục tạm thời để lưu các file âm thanh tách biệt
+        temp_dir = tempfile.mkdtemp()
+        # Tách file âm thanh thành các đoạn nhỏ
+        audio_clips = split_audio(audio_path, len(sentences), temp_dir)
+        # Lấy đường dẫn của các video từ dataset
+        video_files = glob.glob(os.path.join(dataset_path, "*.mp4")) if use_dataset else []
+        # Đảm bảo số lượng câu, âm thanh và video là bằng nhau
+        min_length = min(len(sentences), len(audio_clips), len(video_files))
+        sentences = sentences[:min_length]
+        audio_clips = audio_clips[:min_length]
+        video_files = video_files[:min_length]
+        output_path = "output_video.mp4"
+        create_video(sentences, audio_clips, video_files, output_path)
+        return output_path
+    except Exception as e:
+        print(f"Lỗi khi tạo video: {e}")
+        return None
+    finally:
+        # Xóa thư mục tạm thời
+        shutil.rmtree(temp_dir)
 def split_audio(audio_path, num_segments, output_dir):
     """