Spaces:

haepada
/

roots

Sleeping

App Files Community

haepada committed on Nov 7, 2024

Commit

6f76a92

verified ·

1 Parent(s): bed0080

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -109

app.py CHANGED Viewed

@@ -250,59 +250,63 @@ def analyze_voice(audio_data, state):
         return state, "음성을 먼저 녹음해주세요.", "", "", ""
     try:
-        features = calculate_baseline_features(audio_data)
-        if features is None:
             return state, "음성 분석에 실패했습니다.", "", "", ""
-        # 기준점과 비교하여 감정 분석
-        voice_emotion = map_acoustic_to_emotion(
-            features,
-            state.get("baseline_features")  # 기준점 전달
-        )
-        # 음성 인식 (필요한 경우)
-        text = "음성이 인식되었습니다."
         if speech_recognizer:
             try:
-                sr, y = audio_data
                 transcription = speech_recognizer({"sampling_rate": sr, "raw": y.astype(np.float32)})
                 text = transcription["text"]
             except Exception as e:
                 print(f"Speech recognition error: {e}")
-                text = "음성 인식은 실패했으나, 감정 분석은 진행합니다."
-        # 감정 상태 변화 분석
-        baseline_emotion = state.get("baseline_emotion", {})
-        emotion_change = ""
-        if baseline_emotion:
-            baseline_intensity = baseline_emotion.get("intensity", 0)
-            current_intensity = voice_emotion["intensity"]
-            intensity_change = current_intensity - baseline_intensity
-            emotion_change = f"""
-            💫 기준 상태와의 비교:
-            • 감정 변화: {baseline_emotion['primary']} → {voice_emotion['primary']}
-            • 강도 변화: {intensity_change:+.1f}%
-            """
-        voice_result = f"""
-        🎭 현재 감정 상태:
-        • 주요 감정: {voice_emotion['primary']}
-        • 감정 강도: {voice_emotion['intensity']:.1f}%
-        • 특징: {', '.join(voice_emotion['characteristics'])}
-        {emotion_change}
-        """
         # 프롬프트 생성
-        prompt = generate_detailed_prompt(text, voice_emotion, {"label": "neutral", "score": 0.5})
         state = {**state, "final_prompt": prompt}
-        return state, text, voice_result, "", prompt
     except Exception as e:
         print(f"Error in analyze_voice: {str(e)}")
-        return state, f"오류가 발생했습니다: {str(e)}", "", "", ""
 def generate_detailed_prompt(text, emotions, text_sentiment):
@@ -649,77 +653,14 @@ def create_interface():
                 with blessing_section:
                     gr.Markdown("### 축원의식을 시작하겠습니다")
                     gr.Markdown("'명짐 복짐 짊어지고 안가태평하시기를 비도발원 축원 드립니다'")
-                    with gr.Column() as recording_section:
-                        baseline_audio = gr.Audio(
-                            label="축원 문장 녹음하기",
-                            sources=["microphone"],
-                            type="numpy",
-                            streaming=False
-                        )
-                        set_baseline_btn = gr.Button("축원 마치기", variant="primary")
-                    # 분석 결과 표시 영역
-                    baseline_status = gr.Markdown("")  # 상태 메시지
-                    analysis_results = gr.Markdown(visible=False)  # 분석 결과
-                def handle_blessing_complete(audio, state):
-                    """축원 완료 및 기준점 설정 핸들러"""
-                    if audio is None:
-                        return (
-                            state,
-                            "음성을 먼저 녹음해주세요.",
-                            gr.update(visible=True),
-                            gr.update(visible=False)
-                        )
-                    try:
-                        # 기준점 설정을 위한 음성 분석
-                        features = calculate_baseline_features(audio)
-                        if features is None:
-                            return (
-                                state,
-                                "음성 분석에 실패했습니다. 다시 시도해주세요.",
-                                gr.update(visible=True),
-                                gr.update(visible=False)
-                            )
-                        # 기본 감정 상태 분석
-                        baseline_emotion = map_acoustic_to_emotion(features)
-                        # 상태 업데이트
-                        new_state = safe_state_update(state, {
-                            "baseline_features": features,
-                            "baseline_emotion": baseline_emotion
-                        })
-                        # 분석 결과 표시
-                        result_text = f"""
-                        ✨ 축원이 완료되었습니다.
-                        🎭 기본 감정 상태:
-                        • 주요 감정: {baseline_emotion['primary']}
-                        • 감정 강도: {baseline_emotion['intensity']:.1f}%
-                        • 특징: {', '.join(baseline_emotion['characteristics'])}
-                        다음 단계로 진행해주세요.
-                        """
-                        return (
-                            new_state,
-                            result_text,
-                            gr.update(visible=False),
-                            gr.update(visible=True)
-                        )
-                    except Exception as e:
-                        print(f"Error in handle_blessing_complete: {str(e)}")
-                        return (
-                            state,
-                            f"오류가 발생했습니다. 다시 시도해주세요.",
-                            gr.update(visible=True),
-                            gr.update(visible=False)
-                        )
                 # 4단계: 굿판 입장 안내
                 entry_guide_section = gr.Column(visible=False)

         return state, "음성을 먼저 녹음해주세요.", "", "", ""
     try:
+        sr, y = audio_data
+        y = y.astype(np.float32)
+        if len(y) == 0:
+            return state, "음성이 감지되지 않았습니다.", "", "", ""
+        acoustic_features = calculate_baseline_features((sr, y))
+        if acoustic_features is None:
             return state, "음성 분석에 실패했습니다.", "", "", ""
+        # 음성 인식
         if speech_recognizer:
             try:
                 transcription = speech_recognizer({"sampling_rate": sr, "raw": y.astype(np.float32)})
                 text = transcription["text"]
             except Exception as e:
                 print(f"Speech recognition error: {e}")
+                text = "음성 인식 실패"
+        else:
+            text = "음성 인식 모델을 불러올 수 없습니다."
+        # 음성 감정 분석
+        voice_emotion = map_acoustic_to_emotion(acoustic_features, state.get("baseline_features"))
+        # 텍스트 감정 분석
+        if text_analyzer and text:
+            try:
+                text_sentiment = text_analyzer(text)[0]
+                text_result = f"텍스트 감정 분석: {text_sentiment['label']} (점수: {text_sentiment['score']:.2f})"
+            except Exception as e:
+                print(f"Text analysis error: {e}")
+                text_sentiment = {"label": "unknown", "score": 0.0}
+                text_result = "텍스트 감정 분석 실패"
+        else:
+            text_sentiment = {"label": "unknown", "score": 0.0}
+            text_result = "텍스트 감정 분석을 수행할 수 없습니다."
+        voice_result = (
+            f"음성 감정: {voice_emotion['primary']} "
+            f"(강도: {voice_emotion['intensity']:.1f}%, 신뢰도: {voice_emotion['confidence']:.2f})\n"
+            f"특징: {', '.join(voice_emotion['characteristics'])}\n"
+            f"상세 분석:\n"
+            f"- 에너지 레벨: {voice_emotion['details']['energy_level']}\n"
+            f"- 말하기 속도: {voice_emotion['details']['speech_rate']}\n"
+            f"- 음높이 변화: {voice_emotion['details']['pitch_variation']}\n"
+            f"- 음성 크기: {voice_emotion['details']['voice_volume']}"
+        )
         # 프롬프트 생성
+        prompt = generate_detailed_prompt(text, voice_emotion, text_sentiment)
         state = {**state, "final_prompt": prompt}
+        return state, text, voice_result, text_result, prompt
     except Exception as e:
         print(f"Error in analyze_voice: {str(e)}")
+        return state, f"오류 발생: {str(e)}", "", "", ""
 def generate_detailed_prompt(text, emotions, text_sentiment):
                 with blessing_section:
                     gr.Markdown("### 축원의식을 시작하겠습니다")
                     gr.Markdown("'명짐 복짐 짊어지고 안가태평하시기를 비도발원 축원 드립니다'")
+                    baseline_audio = gr.Audio(
+                        label="축원 문장 녹음하기",
+                        sources=["microphone"],
+                        type="numpy",
+                        streaming=False
+                    )
+                    set_baseline_btn = gr.Button("축원 마치기", variant="primary")
+                    baseline_status = gr.Markdown("")
                 # 4단계: 굿판 입장 안내
                 entry_guide_section = gr.Column(visible=False)