Spaces:

TDN-M
/

GV-a

Running on Zero

App Files Files Community

TDN-M committed on Feb 12

Commit

26b60de

verified ·

1 Parent(s): 33c29ad

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -19

app.py CHANGED Viewed

@@ -3,8 +3,12 @@ import mimetypes
 import gradio as gr
 from docx import Document
 from content_generation import create_content, CONTENT_TYPES
 from tts import generate_speech
 # Đường dẫn đến thư mục chứa các file âm thanh
 VOICES_DIR = "voices"
@@ -29,28 +33,21 @@ def process_pdf(file_path):
     """
     Xử lý file PDF và trích xuất nội dung.
     """
-    try:
-        import fitz
-        doc = fitz.open(file_path)
-        text = ""
-        for page in doc:
-            text += page.get_text()
-        return text
-    except Exception as e:
-        raise ValueError(f"Lỗi khi xử lý file PDF: {str(e)}")
 def process_docx(file_path):
     """
     Xử lý file DOCX và trích xuất nội dung.
     """
-    try:
-        doc = Document(file_path)
-        text = ""
-        for para in doc.paragraphs:
-            text += para.text + "\n"
-        return text
-    except Exception as e:
-        raise ValueError(f"Lỗi khi xử lý file DOCX: {str(e)}")
 def text_to_speech(content, voice_file):
     """
@@ -60,6 +57,7 @@ def text_to_speech(content, voice_file):
         print(f"Đường dẫn file âm thanh mẫu: {voice_file}")  # Log đường dẫn file
         if voice_file is None or not os.path.exists(voice_file):
             return f"Lỗi: File âm thanh mẫu không tồn tại hoặc không hợp lệ. Đường dẫn: {voice_file}"
         print(f"Chuyển đổi nội dung thành giọng nói: {content}")  # Log nội dung trước khi chuyển đổi
         output_audio = generate_speech(content, language="vi", speaker_wav=voice_file)
         print(f"File âm thanh đã được tạo: {output_audio}")  # Log file âm thanh
@@ -81,6 +79,7 @@ def convert_content_to_speech(content, voice_file):
 def interface():
     with gr.Blocks() as app:
         gr.Markdown("# TTV@tdnm")
         with gr.Tab("Tạo Nội dung"):
             with gr.Row():
                 with gr.Column():
@@ -95,6 +94,7 @@ def interface():
                     else:
                         voice_selector = gr.Dropdown(label="Chọn giọng đọc", choices=[], value=None)  # Nếu không có file, để trống
                     content_button = gr.Button("Tạo Nội dung")
                 with gr.Column():
                     content_output = gr.Textbox(label="Nội dung tạo ra", interactive=True)
                     download_docx = gr.File(label="Tải xuống file DOCX", interactive=False)
@@ -111,20 +111,24 @@ def interface():
                             file_content = process_pdf(file)
                             prompt = f"{prompt}\n\nDưới đây là nội dung của file tài liệu:\n\n{file_content}"
                         elif mime_type in (
-                                "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-                                "application/msword"):
                             file_content = process_docx(file)
                             prompt = f"{prompt}\n\nDưới đây là nội dung của file tài liệu:\n\n{file_content}"
                         else:
                             raise ValueError("Định dạng file không được hỗ trợ.")
                     if not content_type:
                         raise ValueError("Vui lòng chọn một loại nội dung")
                     script_content = create_content(prompt, content_type, "Tiếng Việt")
                     print(f"Nội dung từ LLM: {script_content}")  # Log nội dung từ LLM
                     if script_content is None:
                         raise ValueError("Nội dung từ LLM là None. Vui lòng kiểm tra lại hàm create_content.")
                     docx_path = "script.docx"
                     create_docx(script_content, docx_path)
                     status = "Đã tạo nội dung thành công!"
                     return script_content, docx_path, status
                 except Exception as e:
@@ -138,6 +142,7 @@ def interface():
             content_button.click(generate_content,
                                  inputs=[prompt, file_upload, content_type],
                                  outputs=[content_output, download_docx, status_message])
             convert_to_speech_button.click(convert_content_to_speech,
                                            inputs=[content_output, voice_selector],
                                            outputs=[audio_output])

 import gradio as gr
 from docx import Document
 from content_generation import create_content, CONTENT_TYPES
+from openai import OpenAI
 from tts import generate_speech
+# Khởi tạo client OpenAI với API key từ biến môi trường
+client = OpenAI(api_key=os.environ.get('OPENAI_API_KEY'))
 # Đường dẫn đến thư mục chứa các file âm thanh
 VOICES_DIR = "voices"
     """
     Xử lý file PDF và trích xuất nội dung.
     """
+    doc = fitz.open(file_path)
+    text = ""
+    for page in doc:
+        text += page.get_text()
+    return text
 def process_docx(file_path):
     """
     Xử lý file DOCX và trích xuất nội dung.
     """
+    doc = Document(file_path)
+    text = ""
+    for para in doc.paragraphs:
+        text += para.text
+    return text
 def text_to_speech(content, voice_file):
     """
         print(f"Đường dẫn file âm thanh mẫu: {voice_file}")  # Log đường dẫn file
         if voice_file is None or not os.path.exists(voice_file):
             return f"Lỗi: File âm thanh mẫu không tồn tại hoặc không hợp lệ. Đường dẫn: {voice_file}"
         print(f"Chuyển đổi nội dung thành giọng nói: {content}")  # Log nội dung trước khi chuyển đổi
         output_audio = generate_speech(content, language="vi", speaker_wav=voice_file)
         print(f"File âm thanh đã được tạo: {output_audio}")  # Log file âm thanh
 def interface():
     with gr.Blocks() as app:
         gr.Markdown("# TTV@tdnm")
         with gr.Tab("Tạo Nội dung"):
             with gr.Row():
                 with gr.Column():
                     else:
                         voice_selector = gr.Dropdown(label="Chọn giọng đọc", choices=[], value=None)  # Nếu không có file, để trống
                     content_button = gr.Button("Tạo Nội dung")
                 with gr.Column():
                     content_output = gr.Textbox(label="Nội dung tạo ra", interactive=True)
                     download_docx = gr.File(label="Tải xuống file DOCX", interactive=False)
                             file_content = process_pdf(file)
                             prompt = f"{prompt}\n\nDưới đây là nội dung của file tài liệu:\n\n{file_content}"
                         elif mime_type in (
+                            "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
+                            "application/msword"):
                             file_content = process_docx(file)
                             prompt = f"{prompt}\n\nDưới đây là nội dung của file tài liệu:\n\n{file_content}"
                         else:
                             raise ValueError("Định dạng file không được hỗ trợ.")
                     if not content_type:
                         raise ValueError("Vui lòng chọn một loại nội dung")
                     script_content = create_content(prompt, content_type, "Tiếng Việt")
                     print(f"Nội dung từ LLM: {script_content}")  # Log nội dung từ LLM
                     if script_content is None:
                         raise ValueError("Nội dung từ LLM là None. Vui lòng kiểm tra lại hàm create_content.")
                     docx_path = "script.docx"
                     create_docx(script_content, docx_path)
                     status = "Đã tạo nội dung thành công!"
                     return script_content, docx_path, status
                 except Exception as e:
             content_button.click(generate_content,
                                  inputs=[prompt, file_upload, content_type],
                                  outputs=[content_output, download_docx, status_message])
             convert_to_speech_button.click(convert_content_to_speech,
                                            inputs=[content_output, voice_selector],
                                            outputs=[audio_output])