Spaces:

Curify
/

studio_V1

Sleeping

App Files Files Community

qqwjq1981 committed on Feb 25

Commit

4291f64

verified ·

1 Parent(s): b0d613e

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -4

app.py CHANGED Viewed

@@ -277,13 +277,13 @@ def process_entry(entry, i, video_width, video_height, add_voiceover, target_lan
     audio_segment = None
     if add_voiceover:
         segment_audio_path = f"segment_{i}_voiceover.wav"
-        generate_voiceover_OpenAI([entry], target_language, segment_audio_path)
         audio_clip = AudioFileClip(segment_audio_path)
         # Get and log all methods in AudioFileClip
         logger.info("Methods in AudioFileClip:")
         for method in dir(audio_clip):
             logger.info(method)
-        desired_duration = entry["end"] - entry["start"]
         # Log duration of the audio clip and the desired duration for debugging.
         logger.debug(f"Audio clip duration: {audio_clip.duration}, Desired duration: {desired_duration}")
@@ -362,7 +362,26 @@ def generate_voiceover(translated_json, language, output_audio_path):
     except Exception as e:
         raise ValueError(f"Error generating voiceover: {e}")
-def generate_voiceover_OpenAI(translated_json, language, output_audio_path):
     """
     Generate voiceover from translated text for a given language using OpenAI TTS API.
     """
@@ -380,12 +399,13 @@ def generate_voiceover_OpenAI(translated_json, language, output_audio_path):
     while retry_count < max_retries:
         try:
             # Create the speech using OpenAI TTS API
             response = client.audio.speech.create(
                 model=model,
                 voice=voice,
                 input=full_text,
-                speed=1.1
             )
             # Save the audio to the specified path
             with open(output_audio_path, 'wb') as f:

     audio_segment = None
     if add_voiceover:
         segment_audio_path = f"segment_{i}_voiceover.wav"
+        desired_duration = entry["end"] - entry["start"]
+        generate_voiceover_OpenAI([entry], target_language, desired_duration, segment_audio_path)
         audio_clip = AudioFileClip(segment_audio_path)
         # Get and log all methods in AudioFileClip
         logger.info("Methods in AudioFileClip:")
         for method in dir(audio_clip):
             logger.info(method)
         # Log duration of the audio clip and the desired duration for debugging.
         logger.debug(f"Audio clip duration: {audio_clip.duration}, Desired duration: {desired_duration}")
     except Exception as e:
         raise ValueError(f"Error generating voiceover: {e}")
def truncated_linear(x, *, low=15, high=25, min_speed=1.0, max_speed=1.2):
    """Map a rate ``x`` onto a speed multiplier using a clamped linear ramp.

    Below ``low`` the result is ``min_speed``; above ``high`` it is
    ``max_speed``; in between it rises linearly from ``min_speed`` to
    ``max_speed``.  With the default arguments this is the mapping
    15 -> 1.0 and 25 -> 1.2.

    Args:
        x: The input rate (the caller in this file passes characters per
            second).
        low: Input value at or below which the ramp has not started.
        high: Input value at or above which the ramp is saturated.
        min_speed: Multiplier returned for ``x < low``.
        max_speed: Multiplier returned for ``x > high``.

    Returns:
        A float multiplier between ``min_speed`` and ``max_speed``.

    Raises:
        ValueError: If ``high`` is not strictly greater than ``low`` (the
            slope would be undefined or inverted).
    """
    if high <= low:
        raise ValueError("high must be strictly greater than low")
    if x < low:
        return min_speed
    if x > high:
        return max_speed
    # Linear interpolation across the [low, high] ramp.
    slope = (max_speed - min_speed) / (high - low)
    return min_speed + slope * (x - low)
def calculate_speed(text, desired_duration):
    """Choose a TTS speed multiplier so ``text`` better fits a time window.

    The character density (characters per second) of ``text`` over
    ``desired_duration`` is computed and passed through
    ``truncated_linear`` to obtain the speed value.

    Args:
        text: The text that will be spoken; only its length is used.
        desired_duration: Length of the target window (the caller computes
            it as ``entry["end"] - entry["start"]``).

    Returns:
        The speed multiplier returned by ``truncated_linear``.
    """
    # A negative window (end before start) is treated as an empty one so the
    # epsilon below can never cancel out to a zero or negative denominator.
    window = max(desired_duration, 0) + 0.001  # epsilon avoids division by zero
    chars_per_second = len(text) / window
    return truncated_linear(chars_per_second)
+def generate_voiceover_OpenAI(translated_json, language, desired_duration, output_audio_path):
     """
     Generate voiceover from translated text for a given language using OpenAI TTS API.
     """
     while retry_count < max_retries:
         try:
+            speed_tts = calculate_speed(full_text, desired_duration)
             # Create the speech using OpenAI TTS API
             response = client.audio.speech.create(
                 model=model,
                 voice=voice,
                 input=full_text,
+                speed=speed_tts
             )
             # Save the audio to the specified path
             with open(output_audio_path, 'wb') as f: