TextToVideo-Dalle

Running

App Files Community

ruslanmv committed on Jan 17

Commit

108e243

verified ·

1 Parent(s): 6668dc9

Update app.py

Browse files

Files changed (1) hide show

app.py +33 -18

app.py CHANGED Viewed

@@ -10,6 +10,7 @@ import nltk
 import textwrap
 import os
 import glob
 # Ensure 'punkt' is downloaded for nltk
 try:
@@ -17,22 +18,26 @@ try:
 except LookupError:
     nltk.download('punkt')
-# Download ffmpeg if not found (using a more robust method)
-try:
-    from imageio_ffmpeg import get_ffmpeg_exe
-    get_ffmpeg_exe()
-except Exception as e:
-    print(f"Error downloading ffmpeg: {e}")
-    print("Attempting to download ffmpeg using a different method...")
     try:
-        import imageio
-        imageio.plugins.ffmpeg.download(directory=os.path.join(os.path.expanduser("~"), ".imageio"))
-        print("ffmpeg downloaded successfully.")
-    except Exception as e:
-        print(f"Failed to download ffmpeg: {e}")
-        print("Please ensure you have an internet connection and that imageio and imageio_ffmpeg are installed.")
-        raise
 description = " Video Story Generator with Audio \n PS:  Generation of video by using Artificial Intelligence by dalle-mini and distilbart and gtss "
 title = "Video Story Generator with Audio by using dalle-mini and distilbart and gtss  "
@@ -59,9 +64,9 @@ def get_output_video(text):
     The required models will be downloaded to models_root if they are not already there.
     Set the dtype to torch.float16 to save GPU memory.
     If you have an Ampere architecture GPU you can use torch.bfloat16.
-      Set the device to either "cuda" or "cpu". Once everything has finished initializing,
     float32 is faster than float16 but uses more GPU memory.
-          '''
     def generate_image(
             is_mega: bool,
@@ -123,7 +128,7 @@ def get_output_video(text):
         y_text = text_start_height
         lines = textwrap.wrap(text, width=40)
         for line in lines:
-            line_width, line_height = font.getsize(line)
             draw.text(((image_width - line_width) / 2, y_text),
                       line, font=font, fill=text_color)
             y_text += line_height
@@ -133,7 +138,7 @@ def get_output_video(text):
         Testing draw_multiple_line_text
         '''
         image = image_input
-        fontsize = 13  # starting font size
         path_font = "/usr/share/fonts/truetype/liberation/LiberationSans-Bold.ttf"
         if not os.path.exists(path_font):
           # Try alternative location on different systems
@@ -239,6 +244,16 @@ def get_output_video(text):
         final_clip.write_videofile(outname, fps=fps)
     combine_audio(movie_name, export_path, movie_final)  # create a new file
     return 'result_final.mp4'

 import textwrap
 import os
 import glob
+import subprocess
 # Ensure 'punkt' is downloaded for nltk
 try:
 except LookupError:
     nltk.download('punkt')
+# Function to check and install FFmpeg if not found
+def ensure_ffmpeg_installed():
     try:
+        # Check if FFmpeg is installed by running ffmpeg -version
+        subprocess.run(['ffmpeg', '-version'], check=True, capture_output=True, text=True)
+        print("FFmpeg is already installed.")
+    except (subprocess.CalledProcessError, FileNotFoundError):
+        print("FFmpeg not found. Attempting to install...")
+        try:
+            # Install FFmpeg using the system package manager (apt for Debian/Ubuntu)
+            subprocess.run(['apt', 'update'], check=True)
+            subprocess.run(['apt', 'install', '-y', 'ffmpeg'], check=True)
+            print("FFmpeg installed successfully using apt.")
+        except subprocess.CalledProcessError as e:
+            print(f"Failed to install FFmpeg using apt: {e}")
+            print("Please install FFmpeg manually and ensure it is in your system's PATH.")
+            raise
+# Ensure FFmpeg is installed before proceeding
+ensure_ffmpeg_installed()
 description = " Video Story Generator with Audio \n PS:  Generation of video by using Artificial Intelligence by dalle-mini and distilbart and gtss "
 title = "Video Story Generator with Audio by using dalle-mini and distilbart and gtss  "
     The required models will be downloaded to models_root if they are not already there.
     Set the dtype to torch.float16 to save GPU memory.
     If you have an Ampere architecture GPU you can use torch.bfloat16.
+        Set the device to either "cuda" or "cpu". Once everything has finished initializing,
     float32 is faster than float16 but uses more GPU memory.
+        '''
     def generate_image(
             is_mega: bool,
         y_text = text_start_height
         lines = textwrap.wrap(text, width=40)
         for line in lines:
+            line_width, line_height = font.getbbox(line)[2:4] # Use getbbox for better size calculation
             draw.text(((image_width - line_width) / 2, y_text),
                       line, font=font, fill=text_color)
             y_text += line_height
         Testing draw_multiple_line_text
         '''
         image = image_input
+        fontsize = 20  # Increased font size
         path_font = "/usr/share/fonts/truetype/liberation/LiberationSans-Bold.ttf"
         if not os.path.exists(path_font):
           # Try alternative location on different systems
         final_clip.write_videofile(outname, fps=fps)
     combine_audio(movie_name, export_path, movie_final)  # create a new file
+    # Cleanup intermediate files
+    for f in file_names:
+        os.remove(f)
+    for f in mp3_names:
+        os.remove(f)
+    os.remove("result_new.mp4")
+    os.remove("result.mp3")
     return 'result_final.mp4'