# tts1/app.py
# Install dependencies if missing (e.g. on a fresh Colab runtime), then import
try:
    import whisper
    import gradio as gr
    from gtts import gTTS
    from groq import Groq
except ImportError:
    import subprocess
    import sys
    subprocess.check_call([
        sys.executable, "-m", "pip", "install",
        "openai-whisper", "gradio", "gTTS", "groq",
    ])
    import whisper
    import gradio as gr
    from gtts import gTTS
    from groq import Groq
import os
import tempfile
# Load Whisper model
whisper_model = whisper.load_model("base")
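# Note: "base" favors speed over accuracy; whisper.load_model also accepts
# "tiny", "small", "medium", and "large".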
# Groq API key: read from the environment instead of hardcoding a secret
GROQ_API_KEY = os.environ.get("GROQ_API_KEY")
client = Groq(api_key=GROQ_API_KEY)
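# Example (assumed setup): provide the key before launching, e.g.
#   export GROQ_API_KEY="gsk_..."              # shell
#   os.environ["GROQ_API_KEY"] = "gsk_..."     # notebook cell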
# Core logic
def voice_chat(audio_path):
    # Guard against empty input (the microphone component can emit None)
    if audio_path is None:
        return "", "", None
    # Step 1: Transcribe the recording with Whisper
    result = whisper_model.transcribe(audio_path)
    user_text = result["text"]
    # Step 2: Generate a reply with the Groq LLM
    response = client.chat.completions.create(
        messages=[{"role": "user", "content": user_text}],
        model="llama3-8b-8192",
    )
    bot_reply = response.choices[0].message.content
    # Step 3: Convert the reply to speech with gTTS
    tts = gTTS(bot_reply)
    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as f:
        tts.save(f.name)
        audio_response_path = f.name
    return user_text, bot_reply, audio_response_path
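# Quick sanity check without the UI (assumes a local recording named
# question.wav exists):
#   text, reply, mp3_path = voice_chat("question.wav")
#   print(text, "->", reply, "->", mp3_path)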
# Gradio interface
iface = gr.Interface(
    fn=voice_chat,
    inputs=gr.Microphone(label="🎤 Speak your question", type="filepath"),
    outputs=[
        gr.Text(label="📝 Transcribed Input"),
        gr.Text(label="🤖 LLM Reply"),
        gr.Audio(label="🔉 Spoken Reply", type="filepath"),
    ],
    title="🗣️ Real-Time Voice-to-Voice Chatbot (Whisper + Groq + gTTS)",
    live=True,
)
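# Note: when running inside Colab or another notebook, Gradio typically needs
# a public tunnel: iface.launch(share=True)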
if __name__ == "__main__":
    iface.launch()