Nepjune committed on
Commit
f1b8b86
·
verified ·
1 Parent(s): 86126aa

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -1,5 +1,6 @@
1
  import gradio as gr
2
  from transformers import BlipProcessor, BlipForConditionalGeneration, AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
 
3
 
4
  # Initialize Blip model for image captioning
5
  model_id = "dblasko/blip-dalle3-img2prompt"
@@ -7,9 +8,9 @@ blip_model = BlipForConditionalGeneration.from_pretrained(model_id)
7
  blip_processor = BlipProcessor.from_pretrained(model_id)
8
 
9
  # Initialize TTS model from Hugging Face
10
- tts_model_name = "tts-mozilla/tts-ljspeech-multilingual"
11
- tts_tokenizer = AutoTokenizer.from_pretrained(tts_model_name)
12
- tts_model = AutoModelForSeq2SeqLM.from_pretrained(tts_model_name)
13
  tts = pipeline(task="text2speech", model=tts_model, tokenizer=tts_tokenizer)
14
 
15
  def generate_caption(image):
 
1
  import gradio as gr
2
  from transformers import BlipProcessor, BlipForConditionalGeneration, AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
3
+ from transformers import AutoTokenizer
4
 
5
  # Initialize Blip model for image captioning
6
  model_id = "dblasko/blip-dalle3-img2prompt"
 
8
  blip_processor = BlipProcessor.from_pretrained(model_id)
9
 
10
  # Initialize TTS model from Hugging Face
11
+ model_name = "facebook/tts-crdnn-baker-softmax"
12
+ tts_tokenizer = AutoTokenizer.from_pretrained(model_name)
13
+ tts_model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
14
  tts = pipeline(task="text2speech", model=tts_model, tokenizer=tts_tokenizer)
15
 
16
  def generate_caption(image):