ysharma (HF staff) committed
Commit d5c7b7a · Parent(s): 8d3fb0e
Files changed (1): app.py +10 -10
app.py CHANGED
@@ -78,20 +78,20 @@ def engine(text_input):
   img = gr.Interface.load("spaces/multimodalart/latentdiffusion")(ent[0],'50','256','256','1',10)[0]
   img_list.append(img)

-  #Resizing all images produced to same size
-  resize_img_list = resize(img_list)
+  #Resizing all images produced to same size
+  resize_img_list = resize(img_list)

-  #Convert text to speech using facebook's latest model from HF hub
-  speech = text2speech(text_input)
+  #Convert text to speech using facebook's latest model from HF hub
+  speech = text2speech(text_input)

-  #Calculate the desired frame per second based on given audio length and entities identified
-  fps= entities_num / 19 #length of audio file #13 / 19
+  #Calculate the desired frame per second based on given audio length and entities identified
+  fps= entities_num / 19 #length of audio file #13 / 19

-  #Convert string of images into a video
-  clip = images_to_video(fps, resize_img_list)
+  #Convert string of images into a video
+  clip = images_to_video(fps, resize_img_list)

-  #Merge video and audio created above
-  merged_file = merge_audio_video(speech, clip)
+  #Merge video and audio created above
+  merged_file = merge_audio_video(speech, clip)
   #{'prompt':text_input,'steps':'50','width':'256','height':'256','images':'1','scale':10}).launch()
   #img_intfc = gr.Interface.load("spaces/multimodalart/latentdiffusion", inputs=[gr.inputs.Textbox(lines=1, label="Input Text"), gr.inputs.Textbox(lines=1, label="Input Text"), gr.inputs.Textbox(lines=1, label="Input Text"), gr.inputs.Textbox(lines=1, label="Input Text"), gr.inputs.Textbox(lines=1, label="Input Text"), gr.inputs.Textbox(lines=1, label="Input Text")],
   #outputs=[gr.outputs.Image(type="pil", label="output image"),gr.outputs.Carousel(label="Individual images",components=["image"]),gr.outputs.Textbox(label="Error")], )
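The removed and added lines above are textually identical, so this commit appears to change only leading whitespace/indentation inside engine(). For context on what the hunk calls: resize() is only referenced here, not defined. A minimal sketch of what it might look like, assuming img_list holds PIL images and reusing the 256x256 size requested from the latentdiffusion space (the real helper is not shown in this diff):

from PIL import Image  # pillow; img_list is assumed to hold PIL images

def resize(img_list, size=(256, 256)):
    """Resize every generated image to one common size so the frames
    can later be stacked into a single video track."""
    return [img.resize(size) for img in img_list]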
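text2speech() is likewise only referenced. The comment "facebook's latest model from HF hub" suggests a fairseq FastSpeech 2 checkpoint; a sketch along the lines of the fastspeech2-en-ljspeech model card, where the model name and output path are assumptions:

import soundfile as sf
from fairseq.checkpoint_utils import load_model_ensemble_and_task_from_hf_hub
from fairseq.models.text_to_speech.hub_interface import TTSHubInterface

def text2speech(text, out_path="speech.wav"):
    # Assumed checkpoint; the diff does not name the actual model.
    models, cfg, task = load_model_ensemble_and_task_from_hf_hub(
        "facebook/fastspeech2-en-ljspeech",
        arg_overrides={"vocoder": "hifigan", "fp16": False},
    )
    model = models[0]
    TTSHubInterface.update_cfg_with_data_cfg(cfg, task.data_cfg)
    generator = task.build_generator([model], cfg)

    sample = TTSHubInterface.get_model_input(task, text)
    wav, rate = TTSHubInterface.get_prediction(task, model, generator, sample)
    sf.write(out_path, wav.numpy(), rate)  # wav is a torch tensor
    return out_path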
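The fps line spreads one image per recognized entity across a roughly 19-second narration: with 5 entities, fps = 5 / 19 ≈ 0.26, so each frame is held for about 3.8 seconds and the slideshow spans the audio. A sketch of images_to_video() assuming moviepy (the library actually used is not visible in this hunk):

import numpy as np
from moviepy.editor import ImageSequenceClip

def images_to_video(fps, resize_img_list):
    # ImageSequenceClip accepts filenames or numpy arrays, so convert
    # the (assumed) PIL images first.
    frames = [np.array(img) for img in resize_img_list]
    return ImageSequenceClip(frames, fps=fps)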
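Finally, merge_audio_video() presumably muxes the narration onto the slideshow. A moviepy sketch under the same assumptions, with the output filename hypothetical:

from moviepy.editor import AudioFileClip

def merge_audio_video(speech, clip, out_path="final_video.mp4"):
    # speech: path to the generated wav; clip: the ImageSequenceClip above
    clip = clip.set_audio(AudioFileClip(speech))
    clip.write_videofile(out_path, audio_codec="aac")  # mp4 containers need AAC audio
    return out_path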