Spaces:

haepada
/

roots

Sleeping

App Files Files Community

haepada committed on Nov 6, 2024

Commit

36c54bd

verified ·

1 Parent(s): 7eac455

Update app.py

Browse files

Files changed (1) hide show

app.py +128 -73

app.py CHANGED Viewed

@@ -8,12 +8,40 @@ import requests
 import json
 import time
 import threading
-# 데이터 저장을 위한 DB 클래스
 class SimpleDB:
     def __init__(self, file_path="wishes.json"):
         self.file_path = file_path
         self.wishes = self._load_wishes()
     def _load_wishes(self):
         try:
@@ -42,43 +70,34 @@ class SimpleDB:
             print(f"Error saving wish: {e}")
             return False
-# 환경변수 및 API 설정
-HF_API_TOKEN = os.getenv("roots")
 if not HF_API_TOKEN:
-    raise ValueError("roots token not found in environment variables")
 API_URL = "https://api-inference.huggingface.co/models/stabilityai/stable-diffusion-xl-base-1.0"
-headers = {"Authorization": f"Bearer {HF_API_TOKEN}"}
 # AI 모델 초기화
-speech_recognizer = pipeline(
-    "automatic-speech-recognition",
-    model="kresnik/wav2vec2-large-xlsr-korean"
-)
-text_analyzer = pipeline(
-    "sentiment-analysis",
-    model="nlptown/bert-base-multilingual-uncased-sentiment"
-)
-IMAGE_DISPLAY_TIME = 30
-WELCOME_MESSAGE = """
-# 디지털 굿판에 오신 것을 환영합니다
-디지털 굿판은 현대 도시 속에서 잊혀진 전통 굿의 정수를 담아낸 **디지털 의례의 공간**입니다.
-이곳에서는 사람들의 목소리와 감정을 통해 **영적 교감**을 나누고, **자연과 도시의 에너지가 연결**됩니다.
-이제, 평온함과 치유의 여정을 시작해보세요.
-"""
-WORLDVIEW_MESSAGE = """
-## 굿판의 세계관 🌌
-온천천의 물줄기는 신성한 금샘에서 시작됩니다. 금샘은 생명과 창조의 원천이며,
-천상의 생명이 지상에서 숨을 틔우는 자리입니다. 도시의 소음 속에서도 신성한 생명력을 느껴보세요.
-이곳에서 영적인 교감을 경험하며, 자연과 하나 되는 순간을 맞이해 보시기 바랍니다.
-이 앱은 온천천의 사운드스케이프를 녹음하여 제작되었으며,
-온천천 온천장역에서 장전역까지 걸으며 더 깊은 체험이 가능합니다.
-"""
 def calculate_baseline_features(audio_data):
     """기준점 음성 특성 분석"""
     try:
@@ -90,6 +109,11 @@ def calculate_baseline_features(audio_data):
             print("Unsupported audio format")
             return None
         features = {
             "energy": float(np.mean(librosa.feature.rms(y=y))),
             "tempo": float(librosa.beat.tempo(y, sr=sr)[0]),
@@ -104,6 +128,21 @@ def calculate_baseline_features(audio_data):
 def map_acoustic_to_emotion(features, baseline_features=None):
     """음향학적 특성을 감정으로 매핑"""
     energy_norm = min(features["energy"] * 100, 100)
     tempo_norm = min(features["tempo"] / 200, 1)
     pitch_norm = min(features["pitch"] * 2, 1)
@@ -121,6 +160,7 @@ def map_acoustic_to_emotion(features, baseline_features=None):
         "characteristics": []
     }
     if energy_norm > 70:
         if tempo_norm > 0.6:
             emotions["primary"] = "기쁨/열정"
@@ -178,22 +218,27 @@ def analyze_voice(audio_data, state):
             return state, "오디오 형식을 지원하지 않습니다.", "", "", ""
         # 음향학적 특성 분석
-        acoustic_features = {
-            "energy": float(np.mean(librosa.feature.rms(y=y))),
-            "tempo": float(librosa.beat.tempo(y, sr=sr)[0]),
-            "pitch": float(np.mean(librosa.feature.zero_crossing_rate(y))),
-            "volume": float(np.mean(np.abs(y)))
-        }
         # 음성 감정 분석
         voice_emotion = map_acoustic_to_emotion(acoustic_features, state.get("baseline_features"))
         # 음성 인식
-        transcription = speech_recognizer(y, sampling_rate=sr)
-        text = transcription["text"]
         # 텍스트 감정 분석
-        text_sentiment = text_analyzer(text)[0]
         # 결과 포맷팅
         voice_result = (
@@ -207,8 +252,6 @@ def analyze_voice(audio_data, state):
             f"- 음성 크기: {voice_emotion['details']['voice_volume']}"
         )
-        text_result = f"텍스트 감정 분석: {text_sentiment['label']} (점수: {text_sentiment['score']:.2f})"
         # 프롬프트 생성
         prompt = generate_detailed_prompt(text, voice_emotion, text_sentiment)
@@ -217,6 +260,7 @@ def analyze_voice(audio_data, state):
         return state, text, voice_result, text_result, prompt
     except Exception as e:
         return state, f"오류 발생: {str(e)}", "", "", ""
 def generate_detailed_prompt(text, emotions, text_sentiment):
@@ -248,12 +292,11 @@ def generate_detailed_prompt(text, emotions, text_sentiment):
 def generate_image_from_prompt(prompt):
     """이미지 생성 함수"""
-    print(f"Generating image with prompt: {prompt}")
-    try:
-        if not prompt:
-            print("No prompt provided")
-            return None, None
         response = requests.post(
             API_URL,
             headers=headers,
@@ -268,10 +311,8 @@ def generate_image_from_prompt(prompt):
         )
         if response.status_code == 200:
-            print("Image generated successfully")
             timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
             image_path = f"generated_images/{timestamp}.png"
-            os.makedirs("generated_images", exist_ok=True)
             with open(image_path, "wb") as f:
                 f.write(response.content)
             return response.content, image_path
@@ -286,11 +327,11 @@ def generate_image_from_prompt(prompt):
 def save_reflection(text, state):
     """감상 저장"""
     if not text.strip():
-        return state, state.get("reflections", [])
     try:
         current_time = datetime.now().strftime("%H:%M:%S")
-        sentiment = text_analyzer(text)[0]
         new_reflection = [current_time, text, f"{sentiment['label']} ({sentiment['score']:.2f})"]
         reflections = state.get("reflections", [])
@@ -302,18 +343,22 @@ def save_reflection(text, state):
         return state, []
 def create_interface():
     db = SimpleDB()
     with gr.Blocks(theme=gr.themes.Soft()) as app:
-        state = gr.State({
-            "user_name": "",
-            "baseline_features": None,
-            "reflections": [],
-            "wish": None,
-            "final_prompt": "",
-            "image_path": None
-        })
         header = gr.Markdown("# 디지털 굿판")
         user_display = gr.Markdown("")
@@ -331,8 +376,10 @@ def create_interface():
                 gr.Markdown("""### 축원의 문장을 평온한 마음으로 읽어주세요""")
                 gr.Markdown("'당신의 건강과 행복이 늘 가득하기를'")
                 baseline_audio = gr.Audio(
-                   label="축원 문장 녹음하기",
-                   type="numpy"
                 )
                 set_baseline_btn = gr.Button("기준점 설정 완료")
                 baseline_status = gr.Markdown("")
@@ -346,7 +393,8 @@ def create_interface():
                         type="filepath",
                         label="온천천의 소리",
                         interactive=False,
-                        autoplay=False
                     )
                     with gr.Column():
                         reflection_input = gr.Textbox(
@@ -357,9 +405,8 @@ def create_interface():
                         reflections_display = gr.Dataframe(
                             headers=["시간", "감상", "감정 분석"],
                             label="기록된 감상들",
-                            datatype=["str", "str", "str"],
-                            row_count=(0, "dynamic"),
-                            col_count=(3, "fixed")
                         )
             with gr.Tab("기원"):
@@ -368,7 +415,9 @@ def create_interface():
                     with gr.Column():
                         voice_input = gr.Audio(
                             label="소원을 나누고 싶은 마음을 말해주세요",
-                            type="numpy"
                         )
                         clear_btn = gr.Button("녹음 지우기")
                         analyze_btn = gr.Button("소원 분석하기")
@@ -400,7 +449,7 @@ def create_interface():
         start_btn.click(
             fn=lambda name, state: (
                 WORLDVIEW_MESSAGE if name.strip() else "이름을 입력해주세요",
-                gr.update(visible=True) if name.strip() else gr.update(),
                 {**state, "user_name": name} if name.strip() else state
             ),
             inputs=[name_input, state],
@@ -420,7 +469,7 @@ def create_interface():
         )
         clear_btn.click(
-            fn=lambda: None,
             outputs=[voice_input]
         )
@@ -452,7 +501,13 @@ def create_interface():
     return app
-# 파일 맨 아래 부분
 if __name__ == "__main__":
     demo = create_interface()
-    demo.launch(debug=True, share=True)

 import json
 import time
 import threading
+from dotenv import load_dotenv
+# 환경변수 로드
+load_dotenv()
+# 상수 정의
+WELCOME_MESSAGE = """
+# 디지털 굿판에 오신 것을 환영합니다
+디지털 굿판은 현대 도시 속에서 잊혀진 전통 굿의 정수를 담아낸 **디지털 의례의 공간**입니다.
+이곳에서는 사람들의 목소리와 감정을 통해 **영적 교감**을 나누고, **자연과 도시의 에너지가 연결**됩니다.
+이제, 평온함과 치유의 여정을 시작해보세요.
+"""
+WORLDVIEW_MESSAGE = """
+## 굿판의 세계관 🌌
+온천천의 물줄기는 신성한 금샘에서 시작됩니다. 금샘은 생명과 창조의 원천이며,
+천상의 생명이 지상에서 숨을 틔우는 자리입니다. 도시의 소음 속에서도 신성한 생명력을 느껴보세요.
+이곳에서 영적인 교감을 경험하며, 자연과 하나 되는 순간을 맞이해 보시기 바랍니다.
+이 앱은 온천천의 사운드스케이프를 녹음하여 제작되었으며,
+온천천 온천장역에서 장전역까지 걸으며 더 깊은 체험이 가능합니다.
+"""
 class SimpleDB:
     def __init__(self, file_path="wishes.json"):
         self.file_path = file_path
         self.wishes = self._load_wishes()
+        # wishes.json 파일이 없으면 생성
+        if not os.path.exists(self.file_path):
+            with open(self.file_path, 'w', encoding='utf-8') as f:
+                json.dump([], f, ensure_ascii=False, indent=2)
     def _load_wishes(self):
         try:
             print(f"Error saving wish: {e}")
             return False
+# API 설정
+HF_API_TOKEN = os.getenv("roots", "")  # 기본값을 빈 문자열로 설정
 if not HF_API_TOKEN:
+    print("Warning: HuggingFace API token not found. Some features may be limited.")
 API_URL = "https://api-inference.huggingface.co/models/stabilityai/stable-diffusion-xl-base-1.0"
+headers = {"Authorization": f"Bearer {HF_API_TOKEN}"} if HF_API_TOKEN else {}
 # AI 모델 초기화
+try:
+    speech_recognizer = pipeline(
+        "automatic-speech-recognition",
+        model="kresnik/wav2vec2-large-xlsr-korean"
+    )
+    text_analyzer = pipeline(
+        "sentiment-analysis",
+        model="nlptown/bert-base-multilingual-uncased-sentiment"
+    )
+except Exception as e:
+    print(f"Error initializing AI models: {e}")
+    # 기본 파이프라인 설정
+    speech_recognizer = None
+    text_analyzer = None
+# 필요한 디렉토리 생성
+os.makedirs("generated_images", exist_ok=True)
+# 음성 분석 관련 함수들
 def calculate_baseline_features(audio_data):
     """기준점 음성 특성 분석"""
     try:
             print("Unsupported audio format")
             return None
+        # 음성이 없는 경우 처리
+        if len(y) == 0:
+            print("Empty audio data")
+            return None
         features = {
             "energy": float(np.mean(librosa.feature.rms(y=y))),
             "tempo": float(librosa.beat.tempo(y, sr=sr)[0]),
 def map_acoustic_to_emotion(features, baseline_features=None):
     """음향학적 특성을 감정으로 매핑"""
+    if features is None:
+        return {
+            "primary": "알 수 없음",
+            "intensity": 0,
+            "confidence": 0.0,
+            "secondary": "",
+            "characteristics": ["음성 분석 실패"],
+            "details": {
+                "energy_level": "0%",
+                "speech_rate": "알 수 없음",
+                "pitch_variation": "알 수 없음",
+                "voice_volume": "알 수 없음"
+            }
+        }
     energy_norm = min(features["energy"] * 100, 100)
     tempo_norm = min(features["tempo"] / 200, 1)
     pitch_norm = min(features["pitch"] * 2, 1)
         "characteristics": []
     }
+    # 감정 매핑 로직
     if energy_norm > 70:
         if tempo_norm > 0.6:
             emotions["primary"] = "기쁨/열정"
             return state, "오디오 형식을 지원하지 않습니다.", "", "", ""
         # 음향학적 특성 분석
+        acoustic_features = calculate_baseline_features(audio_data)
+        if acoustic_features is None:
+            return state, "음성 분석에 실패했습니다.", "", "", ""
         # 음성 감정 분석
         voice_emotion = map_acoustic_to_emotion(acoustic_features, state.get("baseline_features"))
         # 음성 인식
+        if speech_recognizer:
+            transcription = speech_recognizer({"sampling_rate": sr, "raw": y})
+            text = transcription["text"]
+        else:
+            text = "음성 인식 모델을 불러올 수 없습니다."
         # 텍스트 감정 분석
+        if text_analyzer and text:
+            text_sentiment = text_analyzer(text)[0]
+            text_result = f"텍스트 감정 분석: {text_sentiment['label']} (점수: {text_sentiment['score']:.2f})"
+        else:
+            text_sentiment = {"label": "unknown", "score": 0.0}
+            text_result = "텍스트 감정 분석을 수행할 수 없습니다."
         # 결과 포맷팅
         voice_result = (
             f"- 음성 크기: {voice_emotion['details']['voice_volume']}"
         )
         # 프롬프트 생성
         prompt = generate_detailed_prompt(text, voice_emotion, text_sentiment)
         return state, text, voice_result, text_result, prompt
     except Exception as e:
+        print(f"Error in analyze_voice: {str(e)}")
         return state, f"오류 발생: {str(e)}", "", "", ""
 def generate_detailed_prompt(text, emotions, text_sentiment):
 def generate_image_from_prompt(prompt):
     """이미지 생성 함수"""
+    if not prompt:
+        print("No prompt provided")
+        return None, None
+    try:
         response = requests.post(
             API_URL,
             headers=headers,
         )
         if response.status_code == 200:
             timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
             image_path = f"generated_images/{timestamp}.png"
             with open(image_path, "wb") as f:
                 f.write(response.content)
             return response.content, image_path
 def save_reflection(text, state):
     """감상 저장"""
     if not text.strip():
+        return state, []
     try:
         current_time = datetime.now().strftime("%H:%M:%S")
+        sentiment = text_analyzer(text)[0] if text_analyzer else {"label": "unknown", "score": 0.0}
         new_reflection = [current_time, text, f"{sentiment['label']} ({sentiment['score']:.2f})"]
         reflections = state.get("reflections", [])
         return state, []
 def create_interface():
+    """Gradio 인터페이스 생성"""
     db = SimpleDB()
+    # 초기 상태값 설정
+    initial_state = {
+        "user_name": "",
+        "baseline_features": None,
+        "reflections": [],
+        "wish": None,
+        "final_prompt": "",
+        "image_path": None
+    }
     with gr.Blocks(theme=gr.themes.Soft()) as app:
+        state = gr.State(value=initial_state)
         header = gr.Markdown("# 디지털 굿판")
         user_display = gr.Markdown("")
                 gr.Markdown("""### 축원의 문장을 평온한 마음으로 읽어주세요""")
                 gr.Markdown("'당신의 건강과 행복이 늘 가득하기를'")
                 baseline_audio = gr.Audio(
+                    label="축원 문장 녹음하기",
+                    type="numpy",
+                    source="microphone",
+                    streaming=False
                 )
                 set_baseline_btn = gr.Button("기준점 설정 완료")
                 baseline_status = gr.Markdown("")
                         type="filepath",
                         label="온천천의 소리",
                         interactive=False,
+                        autoplay=False,
+                        visible=True
                     )
                     with gr.Column():
                         reflection_input = gr.Textbox(
                         reflections_display = gr.Dataframe(
                             headers=["시간", "감상", "감정 분석"],
                             label="기록된 감상들",
+                            value=[[]],
+                            interactive=False
                         )
             with gr.Tab("기원"):
                     with gr.Column():
                         voice_input = gr.Audio(
                             label="소원을 나누고 싶은 마음을 말해주세요",
+                            type="numpy",
+                            source="microphone",
+                            streaming=False
                         )
                         clear_btn = gr.Button("녹음 지우기")
                         analyze_btn = gr.Button("소원 분석하기")
         start_btn.click(
             fn=lambda name, state: (
                 WORLDVIEW_MESSAGE if name.strip() else "이름을 입력해주세요",
+                gr.update(visible=True) if name.strip() else gr.update(visible=False),
                 {**state, "user_name": name} if name.strip() else state
             ),
             inputs=[name_input, state],
         )
         clear_btn.click(
+            fn=lambda: gr.update(value=None),
             outputs=[voice_input]
         )
     return app
 if __name__ == "__main__":
     demo = create_interface()
+    demo.launch(
+        debug=True,
+        share=True,
+        show_error=True,
+        server_name="0.0.0.0",
+        server_port=7860
+    )