Create app.py
Browse files
app.py
CHANGED
@@ -1,63 +1,54 @@
|
|
1 |
-
# 파일 구조
|
2 |
-
digital-gut/
|
3 |
-
├── app.py # 메인 Gradio 앱
|
4 |
-
├── requirements.txt # 필요한 패키지
|
5 |
-
└── README.md # 설명 문서
|
6 |
-
|
7 |
-
# app.py
|
8 |
import gradio as gr
|
9 |
import numpy as np
|
10 |
import librosa
|
11 |
from transformers import pipeline
|
12 |
|
13 |
-
#
|
14 |
emotion_analyzer = pipeline("audio-classification", model="MIT/ast-finetuned-speech-commands-v2")
|
15 |
-
|
16 |
-
# 한국어 음성인식 모델
|
17 |
speech_recognizer = pipeline("automatic-speech-recognition",
|
18 |
model="kresnik/wav2vec2-large-xlsr-korean")
|
19 |
|
20 |
def analyze_voice(audio_file):
|
21 |
-
"""
|
22 |
try:
|
23 |
-
#
|
24 |
y, sr = librosa.load(audio_file)
|
25 |
|
26 |
-
# 1.
|
27 |
emotions = emotion_analyzer(y)
|
28 |
primary_emotion = emotions[0]
|
29 |
|
30 |
-
# 2.
|
31 |
text_result = speech_recognizer(y)
|
32 |
|
33 |
-
# 3.
|
34 |
mfccs = librosa.feature.mfcc(y=y, sr=sr, n_mfcc=13)
|
35 |
energy = np.mean(librosa.feature.rms(y=y))
|
36 |
|
37 |
return {
|
38 |
-
"
|
39 |
-
"
|
40 |
-
"
|
41 |
-
"
|
42 |
-
"
|
43 |
}
|
44 |
except Exception as e:
|
45 |
return {
|
46 |
"error": str(e),
|
47 |
-
"
|
48 |
}
|
49 |
|
50 |
-
# Gradio
|
51 |
interface = gr.Interface(
|
52 |
fn=analyze_voice,
|
53 |
-
inputs=gr.Audio(source="microphone", type="filepath", label="
|
54 |
-
outputs=gr.JSON(label="
|
55 |
-
title="
|
56 |
-
description="
|
57 |
theme=gr.themes.Soft(),
|
58 |
analytics_enabled=True
|
59 |
)
|
60 |
|
61 |
-
#
|
62 |
if __name__ == "__main__":
|
63 |
interface.launch()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
import gradio as gr
|
2 |
import numpy as np
|
3 |
import librosa
|
4 |
from transformers import pipeline
|
5 |
|
# --- Model setup ---------------------------------------------------------
# Audio classifier used for the "emotion" step.
# NOTE(review): this checkpoint is fine-tuned on speech *commands*, not
# emotions — confirm it is the intended model for emotion analysis.
emotion_analyzer = pipeline(
    "audio-classification",
    model="MIT/ast-finetuned-speech-commands-v2",
)

# Korean speech-to-text (wav2vec2 XLSR fine-tuned on Korean).
speech_recognizer = pipeline(
    "automatic-speech-recognition",
    model="kresnik/wav2vec2-large-xlsr-korean",
)
def analyze_voice(audio_file):
    """Analyze a recorded voice clip and return the results as a dict.

    Pipeline:
      1. audio classification via the module-level ``emotion_analyzer``
      2. Korean speech-to-text via the module-level ``speech_recognizer``
      3. mean RMS energy extraction with librosa (loudness proxy)

    Args:
        audio_file: Path to the audio file produced by the Gradio
            microphone component (``type="filepath"``); may be None if
            no recording was made.

    Returns:
        dict: On success — predicted label, its score, the transcribed
        text, the mean RMS energy, and a status string. On failure — a
        dict with ``error`` and ``status`` keys (keeps the UI alive).
    """
    if not audio_file:
        # Gradio passes None when the user submits without recording.
        return {"error": "No audio received", "status": "Error occurred"}
    try:
        # Load at 16 kHz: both the AST classifier and the wav2vec2 ASR
        # model were trained on 16 kHz audio, while librosa's default
        # resample rate is 22050 Hz — feeding the raw array at the wrong
        # rate silently degrades both predictions.
        y, sr = librosa.load(audio_file, sr=16000)

        # 1. Voice emotion analysis — keep only the top-scoring class.
        emotions = emotion_analyzer(y)
        primary_emotion = emotions[0]

        # 2. Speech to text.
        text_result = speech_recognizer(y)

        # 3. Audio feature extraction: mean RMS energy.
        # (The original also computed MFCCs but never used them; dropped.)
        energy = np.mean(librosa.feature.rms(y=y))

        return {
            "emotion": primary_emotion['label'],
            "emotion_probability": f"{primary_emotion['score']:.2f}",
            "transcribed_text": text_result['text'],
            "energy_level": f"{energy:.2f}",
            "status": "Analysis complete"
        }
    except Exception as e:
        # Surface the failure in the JSON output instead of crashing the UI.
        return {
            "error": str(e),
            "status": "Error occurred"
        }
# --- Gradio UI -----------------------------------------------------------
# Single-function interface: microphone audio in, JSON analysis out.
# NOTE(review): gr.Audio(source=...) was renamed to sources=[...] in
# Gradio 4.x — confirm the pinned gradio version before upgrading.
voice_input = gr.Audio(source="microphone", type="filepath", label="Voice Input")
json_output = gr.JSON(label="Analysis Results")

interface = gr.Interface(
    fn=analyze_voice,
    inputs=voice_input,
    outputs=json_output,
    title="Digital Gut - Voice Emotion Analysis",
    description="Performs emotion analysis and text conversion from voice input.",
    theme=gr.themes.Soft(),
    analytics_enabled=True,
)

# Launch only when executed as a script, not when imported as a module.
if __name__ == "__main__":
    interface.launch()