Spaces:

GoodML
/

dishDecode

Running

App Files Community

GoodML committed on Nov 25, 2024

Commit

b6e7946

verified ·

1 Parent(s): c139644

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -31

app.py CHANGED Viewed

@@ -208,41 +208,31 @@ def process_audio():
     audio_file = request.files['audio']
     print("AUDIO FILE NAME: ", audio_file)
     try:
-        print("SAVING THE FILE TEMPO, ANIKET")
-        # Step 1: Save audio to a temporary file
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio_file:
-            audio_file.save(temp_audio_file.name)
-            print(f"Audio file saved: {temp_audio_file.name}")
-            print("STARTING TRANSCRIPTION, ANIKET")
-            # Step 2: Transcribe the audio using Whisper AI
-            transcription = transcribe_audio(temp_audio_file.name)
-            print("BEFORE THE transcription FAILED ERROR, CHECKING IF I GOT THE TRANSCRIPTION", transcription)
-            if not transcription:
-                return jsonify({"error": "Audio transcription failed"}), 500
-            print("GOT THE transcription")
-            print("Starting the GEMINI REQUEST TO STRUCTURE IT")
-            # Step 3: Generate structured recipe information using Gemini API
-            structured_data = query_gemini_api(transcription)
-            print("GOT THE STRUCTURED DATA", structured_data)
-            # Step 4: Return the structured data
-            return jsonify(structured_data)
     except Exception as e:
         return jsonify({"error": str(e)}), 500
-    finally:
-        # Clean up temporary files
-        if os.path.exists(temp_audio_file.name):
-            os.remove(temp_audio_file.name)
 def transcribe_audio(audio_path):
     """
     Transcribe audio using Whisper AI.

     audio_file = request.files['audio']
     print("AUDIO FILE NAME: ", audio_file)
     try:
+        print("STARTING TRANSCRIPTION, ANIKET")
+        # Step 1: Transcribe the uploaded audio file directly
+        audio_file = request.files['audio']
+        transcription = transcribe_audio(audio_file)
+        print("BEFORE THE transcription FAILED ERROR, CHECKING IF I GOT THE TRANSCRIPTION", transcription)
+        if not transcription:
+            return jsonify({"error": "Audio transcription failed"}), 500
+        print("GOT THE transcription")
+        print("Starting the GEMINI REQUEST TO STRUCTURE IT")
+        # Step 2: Generate structured recipe information using Gemini API
+        structured_data = query_gemini_api(transcription)
+        print("GOT THE STRUCTURED DATA", structured_data)
+        # Step 3: Return the structured data
+        return jsonify(structured_data)
     except Exception as e:
         return jsonify({"error": str(e)}), 500
 def transcribe_audio(audio_path):
     """
     Transcribe audio using Whisper AI.