openfree committed · Commit 75c3863 (verified) · 1 Parent(s): 604df90

Update app-backup1.py

Files changed (1): app-backup1.py (+472 -79)
app-backup1.py CHANGED
@@ -55,24 +55,68 @@ hf_token = os.getenv("HF_TOKEN")
55
  openai_api_key = os.getenv("OPENAI_API_KEY")
56
  client = OpenAI(api_key=openai_api_key)
57
 
58
- # Initialize translation pipeline
59
- translator = pipeline("translation", model="Helsinki-NLP/opus-mt-ko-en")
60
 
61
  # Korean text detection function
62
  def contains_korean(text):
63
  korean_pattern = re.compile('[γ„±-γ…Žγ…-γ…£κ°€-힣]')
64
  return bool(korean_pattern.search(text))
65
 
66
- def translate_korean_prompt(prompt):
67
  """
68
  Translate Korean prompt to English if Korean text is detected
 
69
  """
70
- if contains_korean(prompt):
71
- translated = translator(prompt)[0]['translation_text']
72
  print(f"Original Korean prompt: {prompt}")
73
- print(f"Translated English prompt: {translated}")
74
- return translated
75
- return prompt
76
 
77
  def enhance_prompt(prompt, type="t2v"):
78
  system_prompt = system_prompt_t2v if type == "t2v" else system_prompt_i2v
@@ -195,58 +239,55 @@ pipeline = XoraVideoPipeline(
195
  vae=vae,
196
  ).to(device)
197
 
198
  # Preset options for resolution and frame configuration
199
  # Convert frames to seconds assuming 25 FPS
200
  preset_options = [
201
- {"label": "1216x704, 1.6초", "width": 1216, "height": 704, "num_frames": 41},
202
- {"label": "1088x704, 2.0초", "width": 1088, "height": 704, "num_frames": 49},
203
- {"label": "1056x640, 2.3초", "width": 1056, "height": 640, "num_frames": 57},
204
- {"label": "992x608, 2.6초", "width": 992, "height": 608, "num_frames": 65},
205
- {"label": "896x608, 2.9초", "width": 896, "height": 608, "num_frames": 73},
206
- {"label": "896x544, 3.2초", "width": 896, "height": 544, "num_frames": 81},
207
- {"label": "832x544, 3.6초", "width": 832, "height": 544, "num_frames": 89},
208
- {"label": "800x512, 3.9초", "width": 800, "height": 512, "num_frames": 97},
209
- {"label": "768x512, 3.9초", "width": 768, "height": 512, "num_frames": 97},
210
- {"label": "800x480, 4.2초", "width": 800, "height": 480, "num_frames": 105},
211
- {"label": "736x480, 4.5초", "width": 736, "height": 480, "num_frames": 113},
212
- {"label": "704x480, 4.8초", "width": 704, "height": 480, "num_frames": 121},
213
- {"label": "704x448, 5.2초", "width": 704, "height": 448, "num_frames": 129},
214
- {"label": "672x448, 5.5초", "width": 672, "height": 448, "num_frames": 137},
215
- {"label": "640x416, 6.1초", "width": 640, "height": 416, "num_frames": 153},
216
- {"label": "672x384, 6.4초", "width": 672, "height": 384, "num_frames": 161},
217
- {"label": "640x384, 6.8초", "width": 640, "height": 384, "num_frames": 169},
218
- {"label": "608x384, 7.1초", "width": 608, "height": 384, "num_frames": 177},
219
- {"label": "576x384, 7.4초", "width": 576, "height": 384, "num_frames": 185},
220
- {"label": "608x352, 7.7초", "width": 608, "height": 352, "num_frames": 193},
221
- {"label": "576x352, 8.0초", "width": 576, "height": 352, "num_frames": 201},
222
- {"label": "544x352, 8.4초", "width": 544, "height": 352, "num_frames": 209},
223
- {"label": "512x352, 9.3초", "width": 512, "height": 352, "num_frames": 233},
224
- {"label": "544x320, 9.6초", "width": 544, "height": 320, "num_frames": 241},
225
- {"label": "512x320, 10.3초", "width": 512, "height": 320, "num_frames": 257},
226
  ]
227
 
228
  def preset_changed(preset):
229
- if preset != "Custom":
230
- selected = next(item for item in preset_options if item["label"] == preset)
231
- # height, width, num_frames 값을 global λ³€μˆ˜λ‘œ μ—…λ°μ΄νŠΈ
232
- return (
233
- selected["height"],
234
- selected["width"],
235
- selected["num_frames"],
236
- gr.update(visible=False),
237
- gr.update(visible=False),
238
- gr.update(visible=False),
239
- )
240
- else:
241
- return (
242
- None,
243
- None,
244
- None,
245
- gr.update(visible=True),
246
- gr.update(visible=True),
247
- gr.update(visible=True),
248
- )
249
-
250
 
251
  def generate_video_from_text(
252
  prompt="",
@@ -256,8 +297,8 @@ def generate_video_from_text(
256
  seed=171198,
257
  num_inference_steps=41,
258
  guidance_scale=4,
259
- height=512,
260
- width=320,
261
  num_frames=257,
262
  progress=gr.Progress(),
263
  ):
@@ -335,11 +376,11 @@ def generate_video_from_image(
335
  negative_prompt="low quality, worst quality, deformed, distorted, warped, motion smear, motion artifacts, fused fingers, incorrect anatomy, strange hands, unattractive",
336
  frame_rate=25,
337
  seed=171198,
338
- num_inference_steps=50,
339
  guidance_scale=4,
340
- height=512,
341
- width=768,
342
- num_frames=121,
343
  progress=gr.Progress(),
344
  ):
345
  print("Height: ", height)
@@ -432,7 +473,7 @@ def create_advanced_options():
432
  minimum=1,
433
  maximum=50,
434
  step=1,
435
- value=50,
436
  visible=False
437
  )
438
  guidance_scale = gr.Slider(
@@ -448,7 +489,7 @@ def create_advanced_options():
448
  minimum=256,
449
  maximum=1024,
450
  step=64,
451
- value=512,
452
  visible=False,
453
  )
454
  width_slider = gr.Slider(
@@ -456,7 +497,7 @@ def create_advanced_options():
456
  minimum=256,
457
  maximum=1024,
458
  step=64,
459
- value=768,
460
  visible=False,
461
  )
462
  num_frames_slider = gr.Slider(
@@ -464,7 +505,7 @@ def create_advanced_options():
464
  minimum=1,
465
  maximum=200,
466
  step=1,
467
- value=121,
468
  visible=False,
469
  )
470
 
@@ -477,6 +518,180 @@ def create_advanced_options():
477
  num_frames_slider,
478
  ]
479
 
480
  # Gradio Interface Definition
481
  with gr.Blocks(theme=gr.themes.Soft()) as iface:
482
  with gr.Tabs():
@@ -504,14 +719,9 @@ with gr.Blocks(theme=gr.themes.Soft()) as iface:
504
  visible=False
505
  )
506
 
507
- # ν˜„μž¬ μ„ νƒλœ 값듀을 μ €μž₯ν•  μƒνƒœ λ³€μˆ˜λ“€
508
- txt2vid_current_height = gr.State(value=512)
509
- txt2vid_current_width = gr.State(value=320)
510
- txt2vid_current_num_frames = gr.State(value=257)
511
-
512
  txt2vid_preset = gr.Dropdown(
513
  choices=[p["label"] for p in preset_options],
514
- value="512x320, 10.3초",
515
  label="Step 2: 해상도 프리셋 선택",
516
  )
517
 
@@ -562,14 +772,9 @@ with gr.Blocks(theme=gr.themes.Soft()) as iface:
562
  visible=False
563
  )
564
 
565
- # ν˜„μž¬ μ„ νƒλœ 값듀을 μ €μž₯ν•  μƒνƒœ λ³€μˆ˜λ“€
566
- img2vid_current_height = gr.State(value=512)
567
- img2vid_current_width = gr.State(value=768)
568
- img2vid_current_num_frames = gr.State(value=97)
569
-
570
  img2vid_preset = gr.Dropdown(
571
  choices=[p["label"] for p in preset_options],
572
- value="512x320, 10.3초",
573
  label="Step 3: 해상도 프리셋 선택",
574
  )
575
 
@@ -592,7 +797,101 @@ with gr.Blocks(theme=gr.themes.Soft()) as iface:
592
  with gr.Column():
593
  img2vid_output = gr.Video(label="μƒμ„±λœ λΉ„λ””μ˜€")
594
 
595
- # Event handlers
596
  txt2vid_preset.change(
597
  fn=preset_changed,
598
  inputs=[txt2vid_preset],
@@ -617,7 +916,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as iface:
617
  txt2vid_enhance_toggle,
618
  txt2vid_negative_prompt,
619
  txt2vid_frame_rate,
620
- *txt2vid_advanced[:3], # seed, inference_steps, guidance_scale
621
  txt2vid_current_height,
622
  txt2vid_current_width,
623
  txt2vid_current_num_frames,
@@ -653,7 +952,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as iface:
653
  img2vid_enhance_toggle,
654
  img2vid_negative_prompt,
655
  img2vid_frame_rate,
656
- *img2vid_advanced[:3], # seed, inference_steps, guidance_scale
657
  img2vid_current_height,
658
  img2vid_current_width,
659
  img2vid_current_num_frames,
@@ -664,6 +963,100 @@ with gr.Blocks(theme=gr.themes.Soft()) as iface:
664
  queue=True,
665
  )
666
 
667
  if __name__ == "__main__":
668
  iface.queue(max_size=64, default_concurrency_limit=1, api_open=False).launch(
669
  share=True, show_api=False
 
55
  openai_api_key = os.getenv("OPENAI_API_KEY")
56
  client = OpenAI(api_key=openai_api_key)
57
 
58
+ # Initialize translation pipeline with device and clean_up settings
59
+ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
60
+ translator = pipeline(
61
+ "translation",
62
+ model="Helsinki-NLP/opus-mt-ko-en",
63
+ device=device,
64
+ clean_up_tokenization_spaces=True
65
+ )
66
 
67
  # Korean text detection function
68
  def contains_korean(text):
69
  korean_pattern = re.compile('[γ„±-γ…Žγ…-γ…£κ°€-힣]')
70
  return bool(korean_pattern.search(text))
71
 
72
+ def translate_korean_prompt(prompt, max_length=450):
73
  """
74
  Translate Korean prompt to English if Korean text is detected
75
+ Split long text into chunks if necessary
76
  """
77
+ if not contains_korean(prompt):
78
+ return prompt
79
+
80
+ # Split long text into chunks
81
+ def split_text(text, max_length):
82
+ words = text.split()
83
+ chunks = []
84
+ current_chunk = []
85
+ current_length = 0
86
+
87
+ for word in words:
88
+ if current_length + len(word) + 1 > max_length:
89
+ chunks.append(' '.join(current_chunk))
90
+ current_chunk = [word]
91
+ current_length = len(word)
92
+ else:
93
+ current_chunk.append(word)
94
+ current_length += len(word) + 1
95
+
96
+ if current_chunk:
97
+ chunks.append(' '.join(current_chunk))
98
+ return chunks
99
+
100
+ try:
101
+ if len(prompt) > max_length:
102
+ chunks = split_text(prompt, max_length)
103
+ translated_chunks = []
104
+
105
+ for chunk in chunks:
106
+ translated = translator(chunk, max_length=512)[0]['translation_text']
107
+ translated_chunks.append(translated)
108
+
109
+ final_translation = ' '.join(translated_chunks)
110
+ else:
111
+ final_translation = translator(prompt, max_length=512)[0]['translation_text']
112
+
113
  print(f"Original Korean prompt: {prompt}")
114
+ print(f"Translated English prompt: {final_translation}")
115
+ return final_translation
116
+
117
+ except Exception as e:
118
+ print(f"Translation error: {e}")
119
+ return prompt # Return original prompt if translation fails
120
 
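A minimal usage sketch for the chunked translation path added above (assumptions: the Helsinki-NLP/opus-mt-ko-en weights are downloadable and translator / translate_korean_prompt are defined as in this hunk; the sample prompts are illustrative):

    # Short prompt: Korean is detected and translated in a single pass.
    print(translate_korean_prompt("ν•΄λ³€μ—μ„œ λ›°μ–΄λ…ΈλŠ” 강아지"))

    # Prompt longer than max_length characters: split_text() breaks it into
    # whitespace-delimited chunks of at most 450 characters, each chunk is
    # translated with max_length=512, and the pieces are re-joined with spaces.
    long_prompt = " ".join(["λ°”λ‹€ μœ„λ‘œ 해가 λ– μ˜€λ₯΄λŠ” μž₯λ©΄"] * 40)
    print(translate_korean_prompt(long_prompt, max_length=450))

    # English input is returned unchanged because contains_korean() is False.
    print(translate_korean_prompt("a dog running on the beach"))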
121
  def enhance_prompt(prompt, type="t2v"):
122
  system_prompt = system_prompt_t2v if type == "t2v" else system_prompt_i2v
 
239
  vae=vae,
240
  ).to(device)
241
 
242
+ # State λ³€μˆ˜λ“€μ˜ μ΄ˆκΈ°ν™” μˆ˜μ •
243
+ txt2vid_current_height = gr.State(value=320)
244
+ txt2vid_current_width = gr.State(value=512)
245
+ txt2vid_current_num_frames = gr.State(value=257)
246
+
247
+ img2vid_current_height = gr.State(value=320)
248
+ img2vid_current_width = gr.State(value=512)
249
+ img2vid_current_num_frames = gr.State(value=257)
250
+
251
  # Preset options for resolution and frame configuration
252
  # Convert frames to seconds assuming 25 FPS
253
  preset_options = [
254
+ {"label": "[16:9 HD] 1216x704, 1.6초", "width": 1216, "height": 704, "num_frames": 41},
255
+ {"label": "[16:9] 1088x704, 2.0초", "width": 1088, "height": 704, "num_frames": 49},
256
+ {"label": "[16:9] 1056x640, 2.3초", "width": 1056, "height": 640, "num_frames": 57},
257
+ {"label": "[16:9] 992x608, 2.6초", "width": 992, "height": 608, "num_frames": 65},
258
+ {"label": "[16:9] 896x608, 2.9초", "width": 896, "height": 608, "num_frames": 73},
259
+ {"label": "[16:9] 896x544, 3.2초", "width": 896, "height": 544, "num_frames": 81},
260
+ {"label": "[16:9] 832x544, 3.6초", "width": 832, "height": 544, "num_frames": 89},
261
+ {"label": "[16:9] 800x512, 3.9초", "width": 800, "height": 512, "num_frames": 97},
262
+ {"label": "[16:9] 768x512, 3.9초", "width": 768, "height": 512, "num_frames": 97},
263
+ {"label": "[16:9] 800x480, 4.2초", "width": 800, "height": 480, "num_frames": 105},
264
+ {"label": "[16:9] 736x480, 4.5초", "width": 736, "height": 480, "num_frames": 113},
265
+ {"label": "[3:2] 704x480, 4.8초", "width": 704, "height": 480, "num_frames": 121},
266
+ {"label": "[16:9] 704x448, 5.2초", "width": 704, "height": 448, "num_frames": 129},
267
+ {"label": "[16:9] 672x448, 5.5초", "width": 672, "height": 448, "num_frames": 137},
268
+ {"label": "[16:9] 640x416, 6.1초", "width": 640, "height": 416, "num_frames": 153},
269
+ {"label": "[16:9] 672x384, 6.4초", "width": 672, "height": 384, "num_frames": 161},
270
+ {"label": "[16:9] 640x384, 6.8초", "width": 640, "height": 384, "num_frames": 169},
271
+ {"label": "[16:9] 608x384, 7.1초", "width": 608, "height": 384, "num_frames": 177},
272
+ {"label": "[16:9] 576x384, 7.4초", "width": 576, "height": 384, "num_frames": 185},
273
+ {"label": "[16:9] 608x352, 7.7초", "width": 608, "height": 352, "num_frames": 193},
274
+ {"label": "[16:9] 576x352, 8.0초", "width": 576, "height": 352, "num_frames": 201},
275
+ {"label": "[16:9] 544x352, 8.4초", "width": 544, "height": 352, "num_frames": 209},
276
+ {"label": "[3:2] 512x352, 9.3초", "width": 512, "height": 352, "num_frames": 233},
277
+ {"label": "[16:9] 544x320, 9.6초", "width": 544, "height": 320, "num_frames": 241},
278
+ {"label": "[16:9] 512x320, 10.3초", "width": 512, "height": 320, "num_frames": 257},
279
  ]
280
 
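The durations in the new labels track num_frames / 25 FPS rounded to one decimal (41 frames gives 1.6초, 257 frames gives 10.3초); a small self-check that rebuilds the numeric part of each label from its width/height/num_frames (the aspect-ratio tag is taken from the existing label, not recomputed):

    for p in preset_options:
        expected_suffix = f"{p['width']}x{p['height']}, {p['num_frames'] / 25:.1f}초"
        assert p["label"].endswith(expected_suffix), p["label"]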
281
  def preset_changed(preset):
282
+ selected = next(item for item in preset_options if item["label"] == preset)
283
+ return [
284
+ selected["height"],
285
+ selected["width"],
286
+ selected["num_frames"],
287
+ gr.update(visible=False),
288
+ gr.update(visible=False),
289
+ gr.update(visible=False),
290
+ ]
291
 
292
  def generate_video_from_text(
293
  prompt="",
 
297
  seed=171198,
298
  num_inference_steps=41,
299
  guidance_scale=4,
300
+ height=320,
301
+ width=512,
302
  num_frames=257,
303
  progress=gr.Progress(),
304
  ):
 
376
  negative_prompt="low quality, worst quality, deformed, distorted, warped, motion smear, motion artifacts, fused fingers, incorrect anatomy, strange hands, unattractive",
377
  frame_rate=25,
378
  seed=171198,
379
+ num_inference_steps=41,
380
  guidance_scale=4,
381
+ height=320,
382
+ width=512,
383
+ num_frames=257,
384
  progress=gr.Progress(),
385
  ):
386
  print("Height: ", height)
 
473
  minimum=1,
474
  maximum=50,
475
  step=1,
476
+ value=41,
477
  visible=False
478
  )
479
  guidance_scale = gr.Slider(
 
489
  minimum=256,
490
  maximum=1024,
491
  step=64,
492
+ value=320,
493
  visible=False,
494
  )
495
  width_slider = gr.Slider(
 
497
  minimum=256,
498
  maximum=1024,
499
  step=64,
500
+ value=512,
501
  visible=False,
502
  )
503
  num_frames_slider = gr.Slider(
 
505
  minimum=1,
506
  maximum=200,
507
  step=1,
508
+ value=257,
509
  visible=False,
510
  )
511
 
 
518
  num_frames_slider,
519
  ]
520
 
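The click handlers later in this diff pass *txt2vid_advanced[:3] (and *img2vid_advanced[:3]) for seed, inference steps and guidance scale, the ordering stated in the comment this commit removes, while height, width and num_frames now come from the gr.State values added above. A hedged guard for that ordering assumption, using the names from this hunk:

    # Assumed order of the list returned by create_advanced_options():
    # [seed, inference_steps, guidance_scale, height_slider, width_slider, num_frames_slider]
    txt2vid_advanced = create_advanced_options()
    assert len(txt2vid_advanced) == 6, "expected six advanced components"
    seed, inference_steps, guidance_scale = txt2vid_advanced[:3]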
521
+ system_prompt_scenario = """당신은 μ˜μƒ μŠ€ν¬λ¦½νŠΈμ— λ§žλŠ” λ°°κ²½ μ˜μƒμ„ μƒμ„±ν•˜κΈ° μœ„ν•œ ν”„λ‘¬ν”„νŠΈ μ „λ¬Έκ°€μž…λ‹ˆλ‹€.
522
+ 주어진 슀크립트의 λΆ„μœ„κΈ°μ™€ λ§₯락을 μ‹œκ°μ  배경으둜 ν‘œν˜„ν•˜λ˜, λ‹€μŒ 원칙을 λ°˜λ“œμ‹œ μ€€μˆ˜ν•˜μ„Έμš”:
523
+
524
+ 1. μ œν’ˆμ΄λ‚˜ μ„œλΉ„μŠ€λ₯Ό μ§μ ‘μ μœΌλ‘œ λ¬˜μ‚¬ν•˜μ§€ 말 것
525
+ 2. 슀크립트의 감성과 ν†€μ•€λ§€λ„ˆλ₯Ό ν‘œν˜„ν•˜λŠ” λ°°κ²½ μ˜μƒμ— 집쀑할 것
526
+ 3. 5개 μ„Ήμ…˜μ΄ ν•˜λ‚˜μ˜ μ΄μ•ΌκΈ°μ²˜λŸΌ μžμ—°μŠ€λŸ½κ²Œ μ—°κ²°λ˜λ„λ‘ ν•  것
527
+ 4. 좔상적이고 μ€μœ μ μΈ μ‹œκ° ν‘œν˜„μ„ ν™œμš©ν•  것
528
+
529
+ 각 μ„Ήμ…˜λ³„ ν”„λ‘¬ν”„νŠΈ μž‘μ„± κ°€μ΄λ“œ:
530
+ 1. λ°°κ²½ 및 ν•„μš”μ„±: 주제의 μ „λ°˜μ μΈ λΆ„μœ„κΈ°λ₯Ό ν‘œν˜„ν•˜λŠ” λ°°κ²½ 씬
531
+ 2. 문제 제기: κΈ΄μž₯κ°μ΄λ‚˜ κ°ˆλ“±μ„ μ•”μ‹œν•˜λŠ” λΆ„μœ„κΈ° μžˆλŠ” λ°°κ²½
532
+ 3. ν•΄κ²°μ±… μ œμ‹œ: 희망적이고 밝은 ν†€μ˜ λ°°κ²½ μ „ν™˜
533
+ 4. λ³Έλ‘ : μ•ˆμ •κ° 있고 신뒰도λ₯Ό λ†’μ΄λŠ” λ°°κ²½
534
+ 5. κ²°λ‘ : μž„νŒ©νŠΈ μžˆλŠ” 마무리λ₯Ό μœ„ν•œ 역동적인 λ°°κ²½
535
+
536
+ λͺ¨λ“  μ„Ήμ…˜μ΄ μΌκ΄€λœ μŠ€νƒ€μΌκ³Ό 톀을 μœ μ§€ν•˜λ©΄μ„œλ„ μžμ—°μŠ€λŸ½κ²Œ 이어지도둝 κ΅¬μ„±ν•˜μ„Έμš”.
537
+
538
+ 각 μ„Ήμ…˜μ˜ ν”„λ‘¬ν”„νŠΈ μž‘μ„±μ‹œ λ°˜λ“œμ‹œ λ‹€μŒ ꡬ쑰에 맞게 κ°œμ„ ν•΄μ£Όμ„Έμš”:
539
+ 1. μ£Όμš” λ™μž‘μ„ λͺ…ν™•ν•œ ν•œ λ¬Έμž₯으둜 μ‹œμž‘
540
+ 2. ꡬ체적인 λ™μž‘κ³Ό 제슀처λ₯Ό μ‹œκ°„ μˆœμ„œλŒ€λ‘œ μ„€λͺ…
541
+ 3. 캐릭터/객체의 μ™Έλͺ¨λ₯Ό μƒμ„Ένžˆ λ¬˜μ‚¬
542
+ 4. λ°°κ²½κ³Ό ν™˜κ²½ μ„ΈλΆ€ 사항을 ꡬ체적으둜 포함
543
+ 5. 카메라 각도와 μ›€μ§μž„μ„ λͺ…μ‹œ
544
+ 6. μ‘°λͺ…κ³Ό 색상을 μžμ„Ένžˆ μ„€λͺ…
545
+ 7. λ³€ν™”λ‚˜ κ°‘μž‘μŠ€λŸ¬μš΄ 사건을 μžμ—°μŠ€λŸ½κ²Œ 포함
546
+ λͺ¨λ“  μ„€λͺ…은 ν•˜λ‚˜μ˜ μžμ—°μŠ€λŸ¬μš΄ λ¬Έλ‹¨μœΌλ‘œ μž‘μ„±ν•˜κ³ ,
547
+ 촬영 감독이 촬영 λͺ©λ‘μ„ μ„€λͺ…ν•˜λŠ” κ²ƒμ²˜λŸΌ ꡬ체적이고 μ‹œκ°μ μœΌλ‘œ μž‘μ„±ν•˜μ„Έμš”.
548
+ 200단어λ₯Ό λ„˜μ§€ μ•Šλ„λ‘ ν•˜λ˜, μ΅œλŒ€ν•œ μƒμ„Έν•˜κ²Œ μž‘μ„±ν•˜μ„Έμš”.
549
+
550
+ """
551
+
552
+
553
+ def analyze_scenario(scenario):
554
+ """μ‹œλ‚˜λ¦¬μ˜€λ₯Ό λΆ„μ„ν•˜μ—¬ λ°°κ²½ μ˜μƒμš© ν”„λ‘¬ν”„νŠΈ 생성"""
555
+ messages = [
556
+ {"role": "system", "content": system_prompt_scenario},
557
+ {"role": "user", "content": f"""
558
+ λ‹€μŒ 슀크립트의 λΆ„μœ„κΈ°μ™€ 감성을 ν‘œν˜„ν•  수 μžˆλŠ” λ°°κ²½ μ˜μƒ ν”„λ‘¬ν”„νŠΈλ₯Ό μƒμ„±ν•΄μ£Όμ„Έμš”:
559
+
560
+ {scenario}
561
+
562
+ 각 μ„Ήμ…˜λ³„λ‘œ 직접적인 μ œν’ˆ λ¬˜μ‚¬λŠ” ν”Όν•˜κ³ , 슀크립트의 감성을 ν‘œν˜„ν•˜λŠ” λ°°κ²½ μ˜μƒμ— μ§‘μ€‘ν•΄μ£Όμ„Έμš”."""},
563
+ ]
564
+
565
+ try:
566
+ response = client.chat.completions.create(
567
+ model="gpt-4-1106-preview",
568
+ messages=messages,
569
+ max_tokens=2000,
570
+ )
571
+ prompts = response.choices[0].message.content.strip().split("\n\n")
572
+
573
+ # ν”„λ‘¬ν”„νŠΈ 처리 λ‘œμ§μ€ 동일
574
+ section_prompts = []
575
+ current_section = ""
576
+ for line in prompts:
577
+ if line.strip():
578
+ if any(section in line for section in ["1.", "2.", "3.", "4.", "5."]):
579
+ if current_section:
580
+ section_prompts.append(current_section)
581
+ current_section = line
582
+ else:
583
+ current_section += "\n" + line
584
+ if current_section:
585
+ section_prompts.append(current_section)
586
+
587
+ while len(section_prompts) < 5:
588
+ section_prompts.append("μΆ”κ°€ μ„Ήμ…˜μ΄ ν•„μš”ν•©λ‹ˆλ‹€.")
589
+ return section_prompts[:5]
590
+ except Exception as e:
591
+ print(f"Error during scenario analysis: {e}")
592
+ return ["Error occurred during analysis"] * 5
593
+
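A quick offline walk-through of the section-splitting loop above, on a hypothetical three-paragraph model reply (no API call involved); analyze_scenario() would then pad the result out to five entries:

    sample = ("1. λ°°κ²½: 고요한 μƒˆλ²½ λ„μ‹œ 전경\nλΆ€λ“œλŸ¬μš΄ μ•ˆκ°œ\n\n"
              "2. 문제 제기: μ–΄λ‘μš΄ 골λͺ©\n\n"
              "3. ν•΄κ²°μ±…: 밝아지λŠ” ν•˜λŠ˜")
    section_prompts = []
    current_section = ""
    for line in sample.strip().split("\n\n"):
        if line.strip():
            if any(section in line for section in ["1.", "2.", "3.", "4.", "5."]):
                if current_section:
                    section_prompts.append(current_section)
                current_section = line
            else:
                current_section += "\n" + line
    if current_section:
        section_prompts.append(current_section)
    print(section_prompts)  # three entries, one per numbered section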
594
+ def generate_section_video(prompt, preset, section_number=1, base_seed=171198, progress=gr.Progress()):
595
+ """각 μ„Ήμ…˜μ˜ λΉ„λ””μ˜€ 생성 - μ—λŸ¬ 처리 μΆ”κ°€"""
596
+ try:
597
+ if not prompt or len(prompt.strip()) < 50:
598
+ raise gr.Error("ν”„λ‘¬ν”„νŠΈλŠ” μ΅œμ†Œ 50자 이상이어야 ν•©λ‹ˆλ‹€.")
599
+
600
+ selected = next(item for item in preset_options if item["label"] == preset)
601
+ section_seed = base_seed + section_number
602
+
603
+ return generate_video_from_text(
604
+ prompt=prompt,
605
+ height=selected["height"],
606
+ width=selected["width"],
607
+ num_frames=selected["num_frames"],
608
+ seed=section_seed,
609
+ progress=progress
610
+ )
611
+ except Exception as e:
612
+ print(f"Error in section {section_number}: {e}")
613
+ raise gr.Error(f"μ„Ήμ…˜ {section_number} 생성 쀑 였λ₯˜: {str(e)}")
614
+
615
+
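A sketch of driving all five sections in one pass with the function above (assumes the five prompts are already filled in; generate_section_video offsets the seed by section_number internally, so sections stay deterministic but distinct):

    def generate_all_sections(prompts, preset, base_seed=171198):
        # Hypothetical batch helper: one clip per section prompt.
        return [
            generate_section_video(prompt, preset, section_number=i, base_seed=base_seed)
            for i, prompt in enumerate(prompts, start=1)
        ]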
616
+ # κ°œλ³„ μ„Ήμ…˜ ν”„λ‘¬ν”„νŠΈ 생성 ν•¨μˆ˜ μΆ”κ°€
617
+ def generate_single_section_prompt(scenario, section_number):
618
+ """κ°œλ³„ μ„Ήμ…˜μ— λŒ€ν•œ ν”„λ‘¬ν”„νŠΈ 생성"""
619
+ section_descriptions = {
620
+ 1: "λ°°κ²½ 및 ν•„μš”μ„±: 주제의 μ „λ°˜μ μΈ λΆ„μœ„κΈ°λ₯Ό ν‘œν˜„ν•˜λŠ” λ°°κ²½ 씬",
621
+ 2: "ν₯λ―Έ 유발: ν₯λ―Έλ₯Ό μœ λ°œν•˜κ³  κΈ°λŒ€κ°μ„ μ¦ν­μ‹œν‚€λŠ” λ°°κ²½",
622
+ 3: "ν•΄κ²°μ±… μ œμ‹œ: 희망적이고 밝은 ν†€μ˜ λ°°κ²½ μ „ν™˜",
623
+ 4: "λ³Έλ‘ : μ•ˆμ •κ° 있고 신뒰도λ₯Ό λ†’μ΄λŠ” λ°°κ²½",
624
+ 5: "κ²°λ‘ : μž„νŒ©νŠΈ μžˆλŠ” 마무리λ₯Ό μœ„ν•œ 역동적인 λ°°κ²½"
625
+ }
626
+
627
+ messages = [
628
+ {"role": "system", "content": system_prompt_scenario},
629
+ {"role": "user", "content": f"""
630
+ λ‹€μŒ 슀크립트의 {section_number}번째 μ„Ήμ…˜({section_descriptions[section_number]})에 λŒ€ν•œ
631
+ λ°°κ²½ μ˜μƒ ν”„λ‘¬ν”„νŠΈλ§Œμ„ μƒμ„±ν•΄μ£Όμ„Έμš”:
632
+
633
+ {scenario}
634
+
635
+ 직접적인 μ œν’ˆ λ¬˜μ‚¬λŠ” ν”Όν•˜κ³ , 슀크립트의 μ£Όμ œμ™€ 감성을 ν‘œν˜„ν•˜λŠ” 핡심 ν‚€μ›Œλ“œλ₯Ό λ°˜μ˜ν•œ λ°°κ²½ μ˜μƒμ— μ§‘μ€‘ν•΄μ£Όμ„Έμš”."""}
636
+ ]
637
+
638
+ try:
639
+ response = client.chat.completions.create(
640
+ model="gpt-4-1106-preview",
641
+ messages=messages,
642
+ max_tokens=500,
643
+ )
644
+ return response.choices[0].message.content.strip()
645
+ except Exception as e:
646
+ print(f"Error during prompt generation: {e}")
647
+ return "Error occurred during prompt generation"
648
+
649
+
650
+ # λΉ„λ””μ˜€ κ²°ν•© ν•¨μˆ˜ μΆ”κ°€
651
+ def combine_videos(video_paths, output_path):
652
+ """μ—¬λŸ¬ λΉ„λ””μ˜€λ₯Ό ν•˜λ‚˜λ‘œ κ²°ν•©"""
653
+ if not all(video_paths):
654
+ raise gr.Error("λͺ¨λ“  μ„Ήμ…˜μ˜ μ˜μƒμ΄ μƒμ„±λ˜μ–΄μ•Ό ν•©λ‹ˆλ‹€.")
655
+
656
+ try:
657
+ # 첫 번째 λΉ„λ””μ˜€μ˜ 속성 κ°€μ Έμ˜€κΈ°
658
+ cap = cv2.VideoCapture(video_paths[0])
659
+ fps = int(cap.get(cv2.CAP_PROP_FPS))
660
+ width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
661
+ height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
662
+ cap.release()
663
+
664
+ # 좜λ ₯ λΉ„λ””μ˜€ μ„€μ •
665
+ fourcc = cv2.VideoWriter_fourcc(*'mp4v')
666
+ out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))
667
+
668
+ # 각 λΉ„λ””μ˜€ 순차적으둜 κ²°ν•©
669
+ for video_path in video_paths:
670
+ if video_path and os.path.exists(video_path):
671
+ cap = cv2.VideoCapture(video_path)
672
+ while True:
673
+ ret, frame = cap.read()
674
+ if not ret:
675
+ break
676
+ out.write(frame)
677
+ cap.release()
678
+
679
+ out.release()
680
+ return output_path
681
+ except Exception as e:
682
+ raise gr.Error(f"λΉ„λ””μ˜€ κ²°ν•© 쀑 였λ₯˜ λ°œμƒ: {e}")
683
+
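combine_videos() above sizes the VideoWriter from the first clip, so a section rendered at a different preset would be written with mismatched dimensions; a hedged variant of the inner read/write loop that resizes stray frames first (same cv2 API, audio is dropped either way):

    def append_frames(out, cap, width, height):
        # Copy every frame from cap into out, resizing to (width, height) when needed.
        while True:
            ret, frame = cap.read()
            if not ret:
                break
            if frame.shape[1] != width or frame.shape[0] != height:
                frame = cv2.resize(frame, (width, height))
            out.write(frame)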
684
+ def merge_section_videos(section1, section2, section3, section4, section5):
685
+ """μ„Ήμ…˜ λΉ„λ””μ˜€λ“€μ„ ν•˜λ‚˜λ‘œ κ²°ν•©"""
686
+ videos = [section1, section2, section3, section4, section5]
687
+
688
+ if not all(videos):
689
+ raise gr.Error("λͺ¨λ“  μ„Ήμ…˜μ˜ μ˜μƒμ΄ λ¨Όμ € μƒμ„±λ˜μ–΄μ•Ό ν•©λ‹ˆλ‹€.")
690
+
691
+ output_path = tempfile.mktemp(suffix=".mp4")
692
+ return combine_videos(videos, output_path)
693
+
694
+
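merge_section_videos() builds its output path with tempfile.mktemp(), which the standard library documents as race-prone; if that matters here, a drop-in sketch using NamedTemporaryFile would be:

    import tempfile

    def make_output_path(suffix=".mp4"):
        # Create the file up front and return its path; the caller still owns cleanup.
        tmp = tempfile.NamedTemporaryFile(suffix=suffix, delete=False)
        tmp.close()
        return tmp.name

output_path = make_output_path() would then replace the tempfile.mktemp(suffix=".mp4") call above.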
695
  # Gradio Interface Definition
696
  with gr.Blocks(theme=gr.themes.Soft()) as iface:
697
  with gr.Tabs():
 
719
  visible=False
720
  )
721
 
722
  txt2vid_preset = gr.Dropdown(
723
  choices=[p["label"] for p in preset_options],
724
+ value="[16:9] 512x320, 10.3초",
725
  label="Step 2: 해상도 프리셋 선택",
726
  )
727
 
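This commit renames every preset label (adding the [16:9] / [3:2] prefixes) and updates the Dropdown defaults here, in the img2vid tab and in the scenario tab to match; a small guard that would catch the default drifting away from the table again:

    preset_labels = [p["label"] for p in preset_options]
    assert "[16:9] 512x320, 10.3초" in preset_labels, "dropdown default is not a preset label"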
 
772
  visible=False
773
  )
774
 
775
  img2vid_preset = gr.Dropdown(
776
  choices=[p["label"] for p in preset_options],
777
+ value="[16:9] 512x320, 10.3초",
778
  label="Step 3: 해상도 프리셋 선택",
779
  )
780
 
 
797
  with gr.Column():
798
  img2vid_output = gr.Video(label="μƒμ„±λœ λΉ„λ””μ˜€")
799
 
800
+
801
+ # Scenario to Video Tab (Modified)
802
+ with gr.TabItem("μ‹œλ‚˜λ¦¬μ˜€λ‘œ λΉ„λ””μ˜€ λ§Œλ“€κΈ°(숏폼)"):
803
+ with gr.Row():
804
+ with gr.Column(scale=1):
805
+ scenario_input = gr.Textbox(
806
+ label="μ˜μƒ 슀크립트 μž…λ ₯",
807
+ placeholder="전체 μ‹œλ‚˜λ¦¬μ˜€λ₯Ό μž…λ ₯ν•˜μ„Έμš”...",
808
+ lines=10
809
+ )
810
+ scenario_preset = gr.Dropdown(
811
+ choices=[p["label"] for p in preset_options],
812
+ value="[16:9] 512x320, 10.3초",
813
+ label="ν™”λ©΄ 크기 선택"
814
+ )
815
+ analyze_btn = gr.Button("μ‹œλ‚˜λ¦¬μ˜€ 뢄석 및 ν”„λ‘¬ν”„νŠΈ 생성", variant="primary")
816
+
817
+ with gr.Column(scale=2):
818
+ with gr.Row():
819
+ # μ„Ήμ…˜ 1
820
+ with gr.Column():
821
+ section1_prompt = gr.Textbox(
822
+ label="1. λ°°κ²½ 및 ν•„μš”μ„±",
823
+ lines=4
824
+ )
825
+ with gr.Row():
826
+ section1_regenerate = gr.Button("πŸ”„ ν”„λ‘¬ν”„νŠΈ 생성")
827
+ section1_generate = gr.Button("πŸ”„ μ˜μƒ 생성")
828
+ section1_video = gr.Video(label="μ„Ήμ…˜ 1 μ˜μƒ")
829
+
830
+ # μ„Ήμ…˜ 2
831
+ with gr.Column():
832
+ section2_prompt = gr.Textbox(
833
+ label="2. ν₯λ―Έ 유발",
834
+ lines=4
835
+ )
836
+ with gr.Row():
837
+ section2_regenerate = gr.Button("πŸ”„ ν”„λ‘¬ν”„νŠΈ 생성")
838
+ section2_generate = gr.Button("πŸ”„ μ˜μƒ 생성")
839
+ section2_video = gr.Video(label="μ„Ήμ…˜ 2 μ˜μƒ")
840
+
841
+ with gr.Row():
842
+ # μ„Ήμ…˜ 3
843
+ with gr.Column():
844
+ section3_prompt = gr.Textbox(
845
+ label="3. ν•΄κ²°μ±… μ œμ‹œ",
846
+ lines=4
847
+ )
848
+ with gr.Row():
849
+ section3_regenerate = gr.Button("πŸ”„ ν”„λ‘¬ν”„νŠΈ 생성")
850
+ section3_generate = gr.Button("πŸ”„ μ˜μƒ 생성")
851
+ section3_video = gr.Video(label="μ„Ήμ…˜ 3 μ˜μƒ")
852
+
853
+ # μ„Ήμ…˜ 4
854
+ with gr.Column():
855
+ section4_prompt = gr.Textbox(
856
+ label="4. λ³Έλ‘ ",
857
+ lines=4
858
+ )
859
+ with gr.Row():
860
+ section4_regenerate = gr.Button("πŸ”„ ν”„λ‘¬ν”„νŠΈ 생성")
861
+ section4_generate = gr.Button("πŸ”„ μ˜μƒ 생성")
862
+ section4_video = gr.Video(label="μ„Ήμ…˜ 4 μ˜μƒ")
863
+
864
+ with gr.Row():
865
+ # μ„Ήμ…˜ 5
866
+ with gr.Column():
867
+ section5_prompt = gr.Textbox(
868
+ label="5. κ²°λ‘  및 κ°•μ‘°",
869
+ lines=4
870
+ )
871
+ with gr.Row():
872
+ section5_regenerate = gr.Button("πŸ”„ ν”„λ‘¬ν”„νŠΈ 생성")
873
+ section5_generate = gr.Button("πŸ”„ μ˜μƒ 생성")
874
+ section5_video = gr.Video(label="μ„Ήμ…˜ 5 μ˜μƒ")
875
+
876
+
877
+
878
+ # 톡합 μ˜μƒ μ„Ήμ…˜ μΆ”κ°€
879
+ with gr.Row():
880
+ with gr.Column(scale=1):
881
+ # 기쑴의 scenario_inputκ³Ό analyze_btn μœ μ§€
882
+ merge_videos_btn = gr.Button("톡합 μ˜μƒ 생성", variant="primary", size="lg")
883
+
884
+ with gr.Column(scale=2):
885
+ # 기쑴의 μ„Ήμ…˜ 1-5 μœ μ§€
886
+
887
+ # 톡합 μ˜μƒ 좜λ ₯ μ„Ήμ…˜ μΆ”κ°€
888
+ with gr.Row():
889
+ merged_video_output = gr.Video(label="톡합 μ˜μƒ")
890
+
891
+
892
+
893
+
894
+ # Event handlers
895
  txt2vid_preset.change(
896
  fn=preset_changed,
897
  inputs=[txt2vid_preset],
 
916
  txt2vid_enhance_toggle,
917
  txt2vid_negative_prompt,
918
  txt2vid_frame_rate,
919
+ *txt2vid_advanced[:3],
920
  txt2vid_current_height,
921
  txt2vid_current_width,
922
  txt2vid_current_num_frames,
 
952
  img2vid_enhance_toggle,
953
  img2vid_negative_prompt,
954
  img2vid_frame_rate,
955
+ *img2vid_advanced[:3],
956
  img2vid_current_height,
957
  img2vid_current_width,
958
  img2vid_current_num_frames,
 
963
  queue=True,
964
  )
965
 
966
+ # Scenario tab event handlers
967
+ analyze_btn.click(
968
+ fn=analyze_scenario,
969
+ inputs=[scenario_input],
970
+ outputs=[
971
+ section1_prompt, section2_prompt, section3_prompt,
972
+ section4_prompt, section5_prompt
973
+ ]
974
+ )
975
+
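The per-section "πŸ”„ ν”„λ‘¬ν”„νŠΈ 생성" buttons (section1_regenerate through section5_regenerate) are created in the tab above, but no .click wiring for them appears in this diff; if they are meant to call generate_single_section_prompt, one plausible wiring would be:

    for idx, (btn, box) in enumerate(
        [(section1_regenerate, section1_prompt),
         (section2_regenerate, section2_prompt),
         (section3_regenerate, section3_prompt),
         (section4_regenerate, section4_prompt),
         (section5_regenerate, section5_prompt)],
        start=1,
    ):
        btn.click(
            fn=lambda scenario, n=idx: generate_single_section_prompt(scenario, n),
            inputs=[scenario_input],
            outputs=box,
        )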
976
+ # μ„Ήμ…˜ 생성 이벀트 ν•Έλ“€λŸ¬
977
+ section1_generate.click(
978
+ fn=generate_section_video,
979
+ inputs=[section1_prompt, scenario_preset],
980
+ outputs=section1_video,
981
+ api_name=f"generate_section1"
982
+ )
983
+
984
+ section2_generate.click(
985
+ fn=lambda p, pr: generate_section_video(p, pr, 2),
986
+ inputs=[section2_prompt, scenario_preset],
987
+ outputs=section2_video,
988
+ api_name=f"generate_section2"
989
+ )
990
+
991
+ section3_generate.click(
992
+ fn=lambda p, pr: generate_section_video(p, pr, 3),
993
+ inputs=[section3_prompt, scenario_preset],
994
+ outputs=section3_video,
995
+ api_name=f"generate_section3"
996
+ )
997
+
998
+ section4_generate.click(
999
+ fn=lambda p, pr: generate_section_video(p, pr, 4),
1000
+ inputs=[section4_prompt, scenario_preset],
1001
+ outputs=section4_video,
1002
+ api_name=f"generate_section4"
1003
+ )
1004
+
1005
+ section5_generate.click(
1006
+ fn=lambda p, pr: generate_section_video(p, pr, 5),
1007
+ inputs=[section5_prompt, scenario_preset],
1008
+ outputs=section5_video,
1009
+ api_name=f"generate_section5"
1010
+ )
1011
+
1012
+
1013
+
1014
+ # μ„Ήμ…˜ 생성 이벀트 ν•Έλ“€λŸ¬
1015
+ section1_generate.click(
1016
+ fn=lambda p, pr: generate_section_video(p, pr, 1),
1017
+ inputs=[section1_prompt, scenario_preset],
1018
+ outputs=section1_video
1019
+ )
1020
+
1021
+ section2_generate.click(
1022
+ fn=lambda p, pr: generate_section_video(p, pr, 2),
1023
+ inputs=[section2_prompt, scenario_preset],
1024
+ outputs=section2_video
1025
+ )
1026
+
1027
+ section3_generate.click(
1028
+ fn=lambda p, pr: generate_section_video(p, pr, 3),
1029
+ inputs=[section3_prompt, scenario_preset],
1030
+ outputs=section3_video
1031
+ )
1032
+
1033
+ section4_generate.click(
1034
+ fn=lambda p, pr: generate_section_video(p, pr, 4),
1035
+ inputs=[section4_prompt, scenario_preset],
1036
+ outputs=section4_video
1037
+ )
1038
+
1039
+ section5_generate.click(
1040
+ fn=lambda p, pr: generate_section_video(p, pr, 5),
1041
+ inputs=[section5_prompt, scenario_preset],
1042
+ outputs=section5_video
1043
+ )
1044
+
1045
+
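As committed, each sectionN_generate button is registered twice (once in the block with api_name=..., once in the block just above), so one click will trigger both handlers; if a single run per click is the intent, a consolidated registration could look like:

    for n, (btn, prompt_box, video_out) in enumerate(
        [(section1_generate, section1_prompt, section1_video),
         (section2_generate, section2_prompt, section2_video),
         (section3_generate, section3_prompt, section3_video),
         (section4_generate, section4_prompt, section4_video),
         (section5_generate, section5_prompt, section5_video)],
        start=1,
    ):
        btn.click(
            fn=lambda p, pr, n=n: generate_section_video(p, pr, n),
            inputs=[prompt_box, scenario_preset],
            outputs=video_out,
            api_name=f"generate_section{n}",
        )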
1046
+ # 이벀트 ν•Έλ“€λŸ¬ μΆ”κ°€
1047
+ merge_videos_btn.click(
1048
+ fn=merge_section_videos,
1049
+ inputs=[
1050
+ section1_video,
1051
+ section2_video,
1052
+ section3_video,
1053
+ section4_video,
1054
+ section5_video
1055
+ ],
1056
+ outputs=merged_video_output
1057
+ )
1058
+
1059
+
1060
  if __name__ == "__main__":
1061
  iface.queue(max_size=64, default_concurrency_limit=1, api_open=False).launch(
1062
  share=True, show_api=False