Spaces:

jdalfonso
/

SISE-ULTIMATE-CHALLENGE

Sleeping

App Files Files Community

SISE-ULTIMATE-CHALLENGE / views /application.py

Cyr-CK

Added real-time emotion detection over an uploaded audio file

aaa3b8b 9 months ago

raw

history blame

9.7 kB

	import streamlit as st
	import pandas as pd
	from st_audiorec import st_audiorec
	import datetime
	import os
	import matplotlib.pyplot as plt
	import librosa
	from src.model.transcriber import transcribe_audio
	from src.model.predict import predict_emotion


	# Folder and file name under which the uploaded audio is written by the
	# upload tab of application().
	DIRECTORY = "audios"
	FILE_NAME = "audio.wav"
	# Recording parameters; CHUNK and CHANNELS are not referenced in the visible
	# part of this module -- presumably left over from a pyaudio-based recorder
	# (see the commented-out FORMAT below). TODO confirm before removing.
	CHUNK = 1024
	# FORMAT = pyaudio.paInt16
	CHANNELS = 1
	# Sampling rate (Hz) used both to resample the uploaded audio with librosa
	# and as the `sampling_rate` passed to predict_emotion().
	RATE = 16000

	def application():
	    """Render the main page of the Streamlit application.

	    The page shows a short introduction followed by three tabs:

	    1. upload of a pre-recorded audio file, sliding-window emotion
	       recognition over it, and a feedback form;
	    2. in-browser audio recording;
	    3. a speech-to-text placeholder (the transcription itself is still
	       disabled, see the TODO in that tab).
	    """
	    st.title("SISE ultimate challenge")
	    st.write("C'est le dernier challenge de la formation SISE.")
	    st.markdown("""
	Overview:
	- Analyse de logs
	- Analyse de données
	- Machine learning
	""")

	    st.markdown("---")

	    tab1, tab2, tab3 = st.tabs(["⬆️ Record Audio", "🔈 Realtime Audio", "📝 Transcription"])

	    with tab1:
	        _render_upload_tab()

	    with tab2:
	        st.header("🔈 Realtime Audio Record")
	        st.write("Here you can record an audio.")

	        if st.button("Register", key="register-button"):
	            st.success("Audio registered successfully.")

	        audio_file = st_audiorec()

	        if audio_file is not None:
	            st.audio(audio_file, format='audio/wav')

	    with tab3:
	        st.header("📝 Speech2Text Transcription")
	        st.write("Here you can get the audio transcript.")

	        # Not read yet: only the disabled code below uses it.
	        save = st.checkbox("Save transcription to .txt", value=False, key="save-transcript")

	        # TODO: uncomment the transcription code once it has been debugged.
	        if st.button("Transcribe", key="transcribe-button"):
	            # # Load and transcribe the audio
	            # # audio, rate = load_audio(audio_file_path)  # reload the audio if needed
	            # transcription = transcribe_audio(audio_file, sampling_rate=16000)

	            # # Display the transcription
	            # st.write("Transcription :", transcription)

	            st.success("Audio registered successfully.")
	            # if save:
	            #     file_path = "transcript.txt"

	            #     # Write the text to the file
	            #     with open(file_path, "w") as file:
	            #         file.write(transcription)

	            #     st.success(f"Text saved to {file_path}")


	# Session-state key under which the last prediction is kept. Streamlit re-runs
	# the whole script on every interaction, so a plain local variable set while
	# handling the "start" button no longer exists when the feedback form is
	# submitted.
	_PREDICTION_STATE_KEY = "last_emotion_prediction"


	def _render_upload_tab():
	    """Render the upload tab: file upload, emotion analysis and feedback form."""
	    st.header("⬆️ Upload Audio Record")
	    st.write("Here you can upload a pre-recorded audio.")
	    audio_file = st.file_uploader("Upload an audio file", type=["wav", "mp3", "ogg"])

	    if audio_file is not None:
	        # The target folder may not exist on a fresh checkout/deployment.
	        os.makedirs(DIRECTORY, exist_ok=True)
	        with open(os.path.join(DIRECTORY, FILE_NAME), "wb") as f:
	            f.write(audio_file.getbuffer())
	        st.success(f"Saved file: {FILE_NAME}")

	    start_inference = st.button("Start emotion recogniton", key="inf_on_upl_btn")

	    if start_inference:
	        with st.spinner("Real-time emotion analysis..."):
	            if audio_file is not None:
	                predicted = _run_emotion_analysis(audio_file)
	                if predicted is not None:
	                    # Remember which file the prediction belongs to so that
	                    # feedback is never attached to a different upload.
	                    st.session_state[_PREDICTION_STATE_KEY] = {
	                        "filepath": audio_file.name,
	                        "prediction": predicted,
	                    }
	            else:
	                st.warning("You need to load an audio file !")

	    _render_feedback_form(audio_file)


	def _run_emotion_analysis(audio_file):
	    """Run sliding-window emotion recognition and display the results.

	    The audio is resampled to RATE, cut into 1 s windows every 0.5 s, and each
	    window is scored with predict_emotion(). A line chart is refreshed after
	    every window, then the mean score of each emotion is shown in coloured
	    boxes sorted from highest to lowest.

	    Args:
	        audio_file: The uploaded file object (anything librosa.load accepts
	            that also supports ``seek``).

	    Returns:
	        The emotion label with the highest mean score, or ``None`` when the
	        audio is shorter than one analysis window.

	    Note:
	        predict_emotion() is assumed to return a mapping that contains a
	        score for every label below -- TODO confirm against src.model.predict.
	    """
	    emotion_colors = {"joie": '#f6d60a', "colère": '#f71c1c', "neutre": '#cac8c8'}

	    # Rewind in case the upload buffer was already consumed during this run.
	    audio_file.seek(0)
	    # Load and resample the audio.
	    audio, sr = librosa.load(audio_file, sr=RATE)

	    # Sliding-window parameters.
	    window_size = 1  # seconds
	    hop_length = 0.5  # seconds
	    window_samples = int(window_size * sr)
	    hop_samples = int(hop_length * sr)

	    if len(audio) < window_samples:
	        # No complete window: there is nothing to score or to average.
	        st.warning("The audio is too short to be analysed (at least 1 second is required).")
	        return None

	    # Chart that is redrawn as the windows are processed.
	    fig, ax = plt.subplots()
	    lines = {emotion: ax.plot([], [], label=emotion)[0] for emotion in emotion_colors}
	    ax.set_ylim(0, 1)
	    ax.set_xlim(0, len(audio) / sr)
	    ax.set_xlabel("Temps (s)")
	    ax.set_ylabel("Probabilité")
	    ax.legend()

	    chart = st.pyplot(fig)

	    # Scores are keyed by label so they cannot be mixed up if the model
	    # returns its emotions in a different order (or returns extra ones).
	    scores = {emotion: [] for emotion in emotion_colors}
	    timestamps = []

	    try:
	        # Only complete windows are processed.
	        for start in range(0, len(audio) - window_samples + 1, hop_samples):
	            chunk = audio[start:start + window_samples]
	            emotion_scores = predict_emotion(chunk, output_probs=True, sampling_rate=RATE)

	            # Update the chart.
	            timestamps.append(start / sr)
	            for emotion, line in lines.items():
	                scores[emotion].append(emotion_scores[emotion])
	                line.set_data(timestamps, scores[emotion])

	            ax.relim()
	            ax.autoscale_view()
	            chart.pyplot(fig, use_container_width=True)
	    finally:
	        # pyplot keeps every figure alive until it is closed explicitly;
	        # without this each analysis would leak one figure.
	        plt.close(fig)

	    # Prepare the styling
	    st.markdown("""
	<style>
	.colored-box {
	padding: 10px;
	border-radius: 5px;
	color: white;
	font-weight: bold;
	text-align: center;
	}
	</style>
	"""
	    , unsafe_allow_html=True)

	    emotion_scores_mean = {emotion: sum(values) / len(values) for emotion, values in scores.items()}
	    ranked = sorted(emotion_scores_mean.items(), key=lambda item: item[1], reverse=True)

	    # One column per emotion, highest mean score first.
	    columns = st.columns(len(ranked))
	    for col, (emotion, mean_score) in zip(columns, ranked):
	        color = emotion_colors[emotion]
	        col.markdown(f"""
	<div class="colored-box" style="background-color: {color};">
	{emotion} : {100*mean_score:.2f} %
	</div>
	"""
	        , unsafe_allow_html=True)

	    st.success("Analyse terminée !")

	    # The predicted emotion is the one with the highest mean score (not the
	    # alphabetically greatest label, which is what max() over the dict gives).
	    return ranked[0][0]


	def _render_feedback_form(audio_file):
	    """Render the feedback form and persist a submitted answer.

	    On submit, one row (filepath, prediction, feedback) is appended to
	    ``src/predictions/feedback.csv`` and the uploaded audio is copied to
	    ``src/predictions/data/<file name>``.

	    Args:
	        audio_file: The currently uploaded file, or ``None``.
	    """
	    st.subheader("Feedback")

	    with st.form("feedback_form"):
	        st.write("What should have been the correct prediction ? (Choose the same emotion if the prediction was correct).")
	        feedback = st.selectbox("Your answer :", ['Sadness','Anger', 'Disgust', 'Fear', 'Surprise', 'Joy', 'Neutral'])
	        submit_button = st.form_submit_button("Submit")
	        st.write("En cliquant sur ce bouton, vous acceptez que votre audio soit sauvegardé dans notre base de données.")

	    if not submit_button:
	        return

	    if audio_file is None:
	        st.warning("You need to load an audio file !")
	        return

	    last_prediction = st.session_state.get(_PREDICTION_STATE_KEY)
	    if last_prediction is None or last_prediction["filepath"] != audio_file.name:
	        st.warning("Run the emotion recognition on this file before sending feedback.")
	        return

	    predictions_dir = os.path.join("src", "predictions")
	    csv_file = os.path.join(predictions_dir, "feedback.csv")
	    data_dir = os.path.join(predictions_dir, "data")
	    os.makedirs(data_dir, exist_ok=True)

	    # Append the feedback as a single CSV row; the header is written only
	    # when the file is new or empty. (DataFrame.append no longer exists in
	    # pandas >= 2.0, and appending avoids re-reading the whole file.)
	    new_entry = {
	        "filepath": audio_file.name,
	        "prediction": last_prediction["prediction"],
	        "feedback": feedback,
	    }
	    write_header = not os.path.exists(csv_file) or os.path.getsize(csv_file) == 0
	    pd.DataFrame([new_entry], columns=["filepath", "prediction", "feedback"]).to_csv(
	        csv_file, mode="a", header=write_header, index=False
	    )

	    # Save the audio file inside the data folder. The name comes from the
	    # client, so only its final component is used.
	    with open(os.path.join(data_dir, os.path.basename(audio_file.name)), "wb") as f:
	        f.write(audio_file.getbuffer())

	    # Confirmation for the user
	    st.success("Merci pour votre retour ! Vos données ont été sauvegardées.")