Spaces:

VIDraft
/

Portrait-Animation

Running on Zero

App Files Files Community

openfree committed on May 10

Commit

1fc29a2

verified ·

1 Parent(s): 2a1d7cf

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -14

app.py CHANGED Viewed

@@ -31,24 +31,21 @@ os.makedirs(res_path, exist_ok=True)
 @spaces.GPU(duration=600)  # 긴 비디오 처리를 위해 duration 600초로 설정 (10분)
 def get_video_res(img_path, audio_path, res_video_path, dynamic_scale=1.0):
     # ============================
-    # 1) 오디오 길이에 따라 프레임 수 계산 (최대 1분까지)
-    # 2) 원본 비율 유지(크롭 제거)
     # ============================
-    ## 수정됨: expand_ratio를 0으로 (기존 0.5)
-    expand_ratio = 0.0
     min_resolution = 512
-    ## 수정됨: 오디오 길이에 따라 inference_steps 계산
     audio = AudioSegment.from_file(audio_path)
     duration = len(audio) / 1000.0  # 초 단위
     # 오디오 길이에 따라 inference_steps 계산 (초당 약 12.5 프레임)
-    # 최소 25 프레임, 최대 750 프레임 (60초 x 12.5)
     inference_steps = min(max(int(duration * 12.5), 25), 750)
-    print(f"Audio duration: {duration} seconds, using inference_steps: {inference_steps}")
     # 얼굴 인식 (face_info는 참고용)
     face_info = pipe.preprocess(img_path, expand_ratio=expand_ratio)
@@ -57,8 +54,7 @@ def get_video_res(img_path, audio_path, res_video_path, dynamic_scale=1.0):
     # 얼굴이 하나라도 검출되면(>0), 원본 이미지 비율 유지
     if face_info['face_num'] > 0:
         os.makedirs(os.path.dirname(res_video_path), exist_ok=True)
-        # 원본 이미지를 그대로 전달
         pipe.process(
             img_path,
             audio_path,
@@ -96,7 +92,7 @@ def process_sonic(image, audio, dynamic_scale):
     audio_segment = audio_segment.set_frame_rate(sampling_rate)
     # 오디오 길이 제한 확인 (최대 60초)
-    MAX_DURATION_MS = 60000  # 60초 (60,000ms)
     if len(audio_segment) > MAX_DURATION_MS:
         print(f"Audio longer than 60 seconds ({len(audio_segment)/1000:.2f}s). Truncating to 60 seconds.")
         audio_segment = audio_segment[:MAX_DURATION_MS]
@@ -112,7 +108,7 @@ def process_sonic(image, audio, dynamic_scale):
     if not os.path.exists(audio_path):
         audio_segment.export(audio_path, format="wav")
-    # 캐시된 결과가 있으면 바로 사용, 없으면 새로 생성
     if os.path.exists(res_video_path):
         print(f"Using cached result: {res_video_path}")
         return res_video_path
@@ -120,7 +116,7 @@ def process_sonic(image, audio, dynamic_scale):
         print(f"Generating new video with dynamic scale: {dynamic_scale}")
         return get_video_res(image_path, audio_path, res_video_path, dynamic_scale)
-# 예시 데이터를 위한 dummy 함수 (필요시 실제 예시 데이터 추가)
 def get_example():
     return []
@@ -217,4 +213,4 @@ with gr.Blocks(css=css) as demo:
     """)
 # 공개 링크 생성
-demo.launch(share=True)

 @spaces.GPU(duration=600)  # 긴 비디오 처리를 위해 duration 600초로 설정 (10분)
 def get_video_res(img_path, audio_path, res_video_path, dynamic_scale=1.0):
     # ============================
+    # 최대 60초까지 오디오를 반영
     # ============================
+    expand_ratio = 0.0
     min_resolution = 512
+    # pydub으로 오디오 길이 계산
     audio = AudioSegment.from_file(audio_path)
     duration = len(audio) / 1000.0  # 초 단위
     # 오디오 길이에 따라 inference_steps 계산 (초당 약 12.5 프레임)
+    # 최소 25 프레임, 최대 750 프레임 (60초 => 60*12.5=750)
     inference_steps = min(max(int(duration * 12.5), 25), 750)
+    print(f"Audio duration: {duration:.2f} seconds, using inference_steps: {inference_steps}")
     # 얼굴 인식 (face_info는 참고용)
     face_info = pipe.preprocess(img_path, expand_ratio=expand_ratio)
     # 얼굴이 하나라도 검출되면(>0), 원본 이미지 비율 유지
     if face_info['face_num'] > 0:
         os.makedirs(os.path.dirname(res_video_path), exist_ok=True)
         pipe.process(
             img_path,
             audio_path,
     audio_segment = audio_segment.set_frame_rate(sampling_rate)
     # 오디오 길이 제한 확인 (최대 60초)
+    MAX_DURATION_MS = 60000  # 60초
     if len(audio_segment) > MAX_DURATION_MS:
         print(f"Audio longer than 60 seconds ({len(audio_segment)/1000:.2f}s). Truncating to 60 seconds.")
         audio_segment = audio_segment[:MAX_DURATION_MS]
     if not os.path.exists(audio_path):
         audio_segment.export(audio_path, format="wav")
+    # 캐시된 결과가 있으면 바로 사용
     if os.path.exists(res_video_path):
         print(f"Using cached result: {res_video_path}")
         return res_video_path
         print(f"Generating new video with dynamic scale: {dynamic_scale}")
         return get_video_res(image_path, audio_path, res_video_path, dynamic_scale)
+# 예시 데이터를 위한 dummy 함수
 def get_example():
     return []
     """)
 # 공개 링크 생성
+demo.launch(share=True)