Spaces:

palbha
/

conversational_ai

Running

palbha committed on Mar 18

Commit

176259d

verified ·

1 Parent(s): 6a5b9ba

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,14 +1,14 @@
 import os
 import gradio as gr
-import google.generativeai as genai
 from gtts import gTTS
 import tempfile
 import time
 # Configure the Gemini API
 GOOGLE_API_KEY = os.getenv("gemini_api") # Replace with your actual API key
-genai.configure(api_key=GOOGLE_API_KEY)
 # Initialize the model
 model = genai.GenerativeModel('gemini-pro')
@@ -21,7 +21,12 @@ def transcribe_audio(audio_path):
     """
     # For demonstration, we're returning a placeholder message
     # In a real app, you would connect to a speech-to-text service
-    return "This is a placeholder for speech-to-text transcription. In a real application, this would be the transcribed text from your audio."
 def text_to_speech(text):
     """Convert text to speech using gTTS and return the path to the audio file"""
@@ -37,13 +42,9 @@ def chat_with_gemini(user_input, history):
     # Initialize conversation or continue existing one
     if not history:
         history = []
-        chat = model.start_chat(history=[])
-    else:
-        # Reconstruct the chat session with history
-        chat = model.start_chat(history=[
-            {"role": "user" if i % 2 == 0 else "model", "parts": [msg]}
-            for i, msg in enumerate(history)
-        ])
     # Generate response
     response = chat.send_message(user_input)

 import os
 import gradio as gr
+from google import genai
 from gtts import gTTS
 import tempfile
 import time
 # Configure the Gemini API
 GOOGLE_API_KEY = os.getenv("gemini_api") # Replace with your actual API key
+client = genai.Client(api_key=GOOGLE_API_KEY)
 # Initialize the model
 model = genai.GenerativeModel('gemini-pro')
     """
     # For demonstration, we're returning a placeholder message
     # In a real app, you would connect to a speech-to-text service
+    response = client.models.generate_content(
+          model='gemini-2.0-flash',
+          contents=['Describe this audio clip', audio_path]
+        )
+    return response.text
 def text_to_speech(text):
     """Convert text to speech using gTTS and return the path to the audio file"""
     # Initialize conversation or continue existing one
     if not history:
         history = []
+        chat = client.chats.create(model="gemini-2.0-flash")
     # Generate response
     response = chat.send_message(user_input)