Spaces:

Nepjune
/

Project_image_captioning_blip

Runtime error

Nepjune committed on Feb 15, 2024

Commit

ff7ab28

verified ·

1 Parent(s): 97599f2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,12 +2,8 @@ import gradio as gr
 from transformers import BlipProcessor, BlipForConditionalGeneration
 from gtts import gTTS
 from playsound import playsound
-from transformers import pipeline
-# Load the text-to-speech model
-tts_synthesizer = pipeline("text-to-speech", "suno/bark")
-# Load the image-to-text model
 model_id = "dblasko/blip-dalle3-img2prompt"
 model = BlipForConditionalGeneration.from_pretrained(model_id)
 processor = BlipProcessor.from_pretrained(model_id)
@@ -20,10 +16,9 @@ def generate_caption(image):
     generated_caption = processor.batch_decode(generated_ids, skip_special_tokens=True, temperature=0.8, top_k=40, top_p=0.9)[0]
     # Convert the generated caption to speech
-    speech = tts_synthesizer(generated_caption)
-    audio_path = "generated_audio.wav"
-    with open(audio_path, "wb") as f:
-        f.write(speech["audio"])
     return generated_caption, audio_path
@@ -37,6 +32,7 @@ demo = gr.Interface(
     outputs=[
         gr.Textbox(label="Generated caption"),
         gr.Button("Convert to Audio", play_audio),
-    ]
 )
 demo.launch(share=True)

 from transformers import BlipProcessor, BlipForConditionalGeneration
 from gtts import gTTS
 from playsound import playsound
+from concurrent.futures import ThreadPoolExecutor
 model_id = "dblasko/blip-dalle3-img2prompt"
 model = BlipForConditionalGeneration.from_pretrained(model_id)
 processor = BlipProcessor.from_pretrained(model_id)
     generated_caption = processor.batch_decode(generated_ids, skip_special_tokens=True, temperature=0.8, top_k=40, top_p=0.9)[0]
     # Convert the generated caption to speech
+    tts = gTTS(text=generated_caption, lang='en')
+    audio_path = "generated_audio.mp3"
+    tts.save(audio_path)
     return generated_caption, audio_path
     outputs=[
         gr.Textbox(label="Generated caption"),
         gr.Button("Convert to Audio", play_audio),
+    ],
+    live=True  # intended to make Gradio run without blocking (note: live=True re-runs the interface whenever an input changes)
 )
 demo.launch(share=True)