Spaces:

MoiMoi-01
/

Ollama_TTS_RVC

Runtime error

App Files Community

MoiMoi-01 committed on Feb 4

Commit

6e54df2

verified ·

1 Parent(s): 6150e28

Update app.py

Browse files

Files changed (1) hide show

app.py +11 -9

app.py CHANGED Viewed

@@ -5,9 +5,11 @@ from TTS.api import TTS
 import os
 import subprocess
-# Load TTS Model
-device = "cuda" if torch.cuda.is_available() else "cpu"
-tts_model = TTS("tts_models/en/ljspeech/tacotron2-DDC").to(device)
 # Hugging Face LLM Client (DeepSeek R1 7B)
 client = InferenceClient("deepseek-ai/deepseek-r1-7b")
@@ -16,13 +18,13 @@ client = InferenceClient("deepseek-ai/deepseek-r1-7b")
 RVC_MODEL_PATH = "zeldabotw.pth"
 RVC_INDEX_PATH = "zeldabotw.index"
-# Function to call RVC for voice conversion
 def convert_voice(input_wav, output_wav):
-    """Converts input TTS audio to ZeldaBotW voice using RVC."""
     if not os.path.exists(RVC_MODEL_PATH) or not os.path.exists(RVC_INDEX_PATH):
         raise FileNotFoundError("RVC model files not found! Ensure zeldabotw.pth and zeldabotw.index are in the same directory.")
-    command = f"python infer_rvc.py --input {input_wav} --output {output_wav} --model {RVC_MODEL_PATH} --index {RVC_INDEX_PATH} --pitch_shift 0"
     process = subprocess.run(command, shell=True, capture_output=True, text=True)
     if process.returncode != 0:
@@ -46,11 +48,11 @@ def respond(message, history, system_message, max_tokens, temperature, top_p):
         response += token
         yield response, None, None  # Text first
-    # Generate Speech from Text
     tts_audio_path = "tts_output.wav"
     tts_model.tts_to_file(text=response, file_path=tts_audio_path)
-    # Convert TTS output to ZeldaBotW voice
     rvc_audio_path = "rvc_output.wav"
     rvc_converted_path = convert_voice(tts_audio_path, rvc_audio_path)
@@ -58,7 +60,7 @@ def respond(message, history, system_message, max_tokens, temperature, top_p):
 # Gradio UI
 with gr.Blocks() as demo:
-    gr.Markdown("## DeepSeek R1 7B Chatbot with ZeldaBotW Voice")
     chatbot = gr.Chatbot()
     msg = gr.Textbox(label="User Input")

 import os
 import subprocess
+# Force CPU usage
+device = "cpu"
+# Load TTS Model (Running on CPU)
+tts_model = TTS("tts_models/en/ljspeech/tacotron2-DDC", gpu=False)  # ✅ Ensures CPU-only execution
 # Hugging Face LLM Client (DeepSeek R1 7B)
 client = InferenceClient("deepseek-ai/deepseek-r1-7b")
 RVC_MODEL_PATH = "zeldabotw.pth"
 RVC_INDEX_PATH = "zeldabotw.index"
+# Function to call RVC for voice conversion (CPU Mode)
 def convert_voice(input_wav, output_wav):
+    """Converts input TTS audio to ZeldaBotW voice using RVC (CPU Mode)."""
     if not os.path.exists(RVC_MODEL_PATH) or not os.path.exists(RVC_INDEX_PATH):
         raise FileNotFoundError("RVC model files not found! Ensure zeldabotw.pth and zeldabotw.index are in the same directory.")
+    command = f"python infer_rvc.py --input {input_wav} --output {output_wav} --model {RVC_MODEL_PATH} --index {RVC_INDEX_PATH} --pitch_shift 0 --device cpu"
     process = subprocess.run(command, shell=True, capture_output=True, text=True)
     if process.returncode != 0:
         response += token
         yield response, None, None  # Text first
+    # Generate Speech from Text (CPU Mode)
     tts_audio_path = "tts_output.wav"
     tts_model.tts_to_file(text=response, file_path=tts_audio_path)
+    # Convert TTS output to ZeldaBotW voice (CPU Mode)
     rvc_audio_path = "rvc_output.wav"
     rvc_converted_path = convert_voice(tts_audio_path, rvc_audio_path)
 # Gradio UI
 with gr.Blocks() as demo:
+    gr.Markdown("## DeepSeek R1 7B Chatbot with ZeldaBotW Voice (CPU Mode)")
     chatbot = gr.Chatbot()
     msg = gr.Textbox(label="User Input")