Spaces:

Athagi
/

Gttggtt

Sleeping

App Files Files Community

Athagi committed on Jun 4

Commit

f48cab7

verified ·

1 Parent(s): fdd092a

Create app.py

Browse files

Files changed (1) hide show

app.py +63 -0

app.py ADDED Viewed

	@@ -0,0 +1,63 @@

+import os
+import gradio as gr
+import torch
+import librosa
+import numpy as np
+import soundfile as sf
+import requests
+# ========== DOWNLOAD PRETRAINED MODEL ==========
+# Local path where the pretrained checkpoint file is stored.
+MODEL_PATH = "model/D_v13_20231020.pth"
+# Create the target directory at import time; exist_ok avoids an error when it is already there.
+os.makedirs("model", exist_ok=True)
+def download_model():
+    """Fetch the pretrained checkpoint to MODEL_PATH unless it already exists.
+
+    The body is streamed to a temporary ".part" sibling and renamed into place
+    only after the whole response has been written, so a failed or interrupted
+    download never leaves a truncated file at MODEL_PATH that a later run
+    would mistake for the model.
+
+    Raises:
+        requests.RequestException: if the request fails, times out, or the
+            server answers with an HTTP error status.
+    """
+    if os.path.exists(MODEL_PATH):
+        return
+    url = "https://huggingface.co/MMVC/prelearned-model/resolve/main/D_v13_20231020.pth"
+    partial_path = MODEL_PATH + ".part"
+    print("Downloading model...")
+    # stream=True keeps the checkpoint out of memory; the timeout stops a
+    # stalled connection from hanging start-up indefinitely.
+    with requests.get(url, stream=True, timeout=60) as response:
+        # Without this check an HTML error page would be saved as the model file.
+        response.raise_for_status()
+        with open(partial_path, "wb") as f:
+            for chunk in response.iter_content(chunk_size=1 << 20):
+                f.write(chunk)
+    # Rename only after a complete write so MODEL_PATH is either absent or whole.
+    os.replace(partial_path, MODEL_PATH)
+    print("Model downloaded.")
+# Runs at import time so the checkpoint is on disk before torch.load reads it further down.
+download_model()
+# ========== DUMMY MODEL LOADER (Placeholder for real MMVC model) ==========
+class DummyVoiceChanger(torch.nn.Module):
+    """Stand-in model that multiplies the waveform by a single learnable gain.
+
+    The gain is initialised to 1.0, so with untouched weights the output
+    equals the input (converted to float32).
+    """
+
+    def __init__(self):
+        super().__init__()
+        self.gain = torch.nn.Parameter(torch.tensor(1.0))
+
+    def forward(self, audio):
+        """Scale ``audio`` by the gain and return the result as a NumPy array.
+
+        Args:
+            audio: array-like of samples; converted to a float32 tensor.
+
+        Returns:
+            A float32 ``numpy.ndarray`` with the same shape as the input.
+        """
+        audio = torch.as_tensor(audio, dtype=torch.float32)
+        # ``gain`` is a Parameter, so the product would track gradients and
+        # ``Tensor.numpy()`` raises on such tensors. Inference needs no
+        # autograd, so compute the product with gradient tracking disabled.
+        with torch.no_grad():
+            scaled = audio * self.gain
+        return scaled.numpy()
+# Load dummy model (Replace this with real MMVC model loading)
+model = DummyVoiceChanger()
+# NOTE(review): torch.load unpickles the downloaded file, and unpickling an
+# untrusted checkpoint can execute arbitrary code — consider weights_only=True
+# if the installed torch version supports it (TODO confirm).
+# The loaded state_dict is not applied to the model while the line below stays commented out.
+state_dict = torch.load(MODEL_PATH, map_location="cpu")
+# model.load_state_dict(state_dict)  # Normally you'd load real weights
+# ========== VOICE CONVERSION ==========
+def convert_voice(audio):
+    """Run the uploaded clip through the model and return the output file path.
+
+    Args:
+        audio: path of the uploaded audio file, or None when the form was
+            submitted without a file.
+
+    Returns:
+        Path of a 16 kHz WAV file containing the peak-normalised model output.
+
+    Raises:
+        gr.Error: if no audio file was supplied.
+    """
+    import tempfile  # local import: only this function needs it
+
+    if audio is None:
+        # Loading a missing path fails with an opaque error; show a readable one in the UI instead.
+        raise gr.Error("Please upload an audio file first.")
+    # Load input at 16 kHz, then pad or truncate to exactly 5 seconds of samples
+    audio_data, _ = librosa.load(audio, sr=16000)
+    audio_data = librosa.util.fix_length(audio_data, size=16000 * 5)
+    # Process with dummy model
+    converted = model(audio_data)
+    # Peak-normalise; the epsilon keeps an all-silent clip from dividing by zero
+    converted /= np.max(np.abs(converted)) + 1e-6
+    # Save output to a unique file so overlapping requests cannot overwrite each other's result
+    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as handle:
+        output_path = handle.name
+    sf.write(output_path, converted, 16000)
+    return output_path
+# ========== GRADIO INTERFACE ==========
+# Build the input and output widgets first, then wire them to convert_voice.
+_upload_widget = gr.Audio(source="upload", type="filepath", label="Upload Voice")
+_result_widget = gr.Audio(type="filepath", label="Converted Voice")
+interface = gr.Interface(
+    fn=convert_voice,
+    inputs=_upload_widget,
+    outputs=_result_widget,
+    title="AI Voice Changer (No RVC / No TTS)",
+    description="This app loads a pretrained AI model (D_v13_20231020.pth) and simulates voice conversion using PyTorch. Replace dummy model with full MMVC logic for advanced use.",
+)
+# Start the web server as soon as the script is executed.
+interface.launch()