Spaces:

Athagi
/

Gttggtt

Sleeping

App Files Community

Athagi committed on Jun 4

Commit

29c9c4c

verified ·

1 Parent(s): 3800f2c

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -11

app.py CHANGED Viewed

@@ -6,22 +6,22 @@ import numpy as np
 import soundfile as sf
 import requests
-# ========== DOWNLOAD PRETRAINED MODEL ==========
 MODEL_PATH = "model/D_v13_20231020.pth"
 os.makedirs("model", exist_ok=True)
 def download_model():
     if not os.path.exists(MODEL_PATH):
-        url = "https://huggingface.co/MMVC/prelearned-model/resolve/main/D_v13_20231020.pth"
         print("Downloading model...")
-        response = requests.get(url)
         with open(MODEL_PATH, "wb") as f:
             f.write(response.content)
         print("Model downloaded.")
 download_model()
-# ========== DUMMY MODEL LOADER (Placeholder for real MMVC model) ==========
 class DummyVoiceChanger(torch.nn.Module):
     def __init__(self):
         super().__init__()
@@ -29,14 +29,13 @@ class DummyVoiceChanger(torch.nn.Module):
     def forward(self, audio):
         audio = torch.tensor(audio, dtype=torch.float32)
-        return (audio * self.gain).numpy()
-# Load dummy model
 model = DummyVoiceChanger()
-state_dict = torch.load(MODEL_PATH, map_location="cpu")
-# model.load_state_dict(state_dict)  # Skip loading for this dummy model
-# ========== VOICE CONVERSION FUNCTION ==========
 def convert_voice(audio_file):
     audio_data, sr = librosa.load(audio_file, sr=16000)
     audio_data = librosa.util.fix_length(audio_data, size=16000 * 5)
@@ -53,8 +52,8 @@ interface = gr.Interface(
     fn=convert_voice,
     inputs=gr.Audio(type="filepath", label="Upload Voice"),
     outputs=gr.Audio(type="filepath", label="Converted Voice"),
-    title="AI Voice Changer (No RVC / No TTS)",
-    description="Uploads a voice file, downloads AI model, and changes the voice using PyTorch. Replace dummy model with real MMVC inference logic for full functionality."
 )
 interface.launch()

 import soundfile as sf
 import requests
+# ========== MODEL SETUP ==========
+MODEL_URL = "https://huggingface.co/MMVC/prelearned-model/resolve/main/D_v13_20231020.pth"
 MODEL_PATH = "model/D_v13_20231020.pth"
 os.makedirs("model", exist_ok=True)
 def download_model():
     if not os.path.exists(MODEL_PATH):
         print("Downloading model...")
+        response = requests.get(MODEL_URL)
         with open(MODEL_PATH, "wb") as f:
             f.write(response.content)
         print("Model downloaded.")
 download_model()
+# ========== DUMMY VOICE CHANGER MODEL ==========
 class DummyVoiceChanger(torch.nn.Module):
     def __init__(self):
         super().__init__()
     def forward(self, audio):
         audio = torch.tensor(audio, dtype=torch.float32)
+        return (audio * self.gain).detach().numpy()  # FIXED
 model = DummyVoiceChanger()
+# Skipping real loading of .pth, as it's just a placeholder
+# torch.load(MODEL_PATH) would load it here if needed
+# ========== INFERENCE FUNCTION ==========
 def convert_voice(audio_file):
     audio_data, sr = librosa.load(audio_file, sr=16000)
     audio_data = librosa.util.fix_length(audio_data, size=16000 * 5)
     fn=convert_voice,
     inputs=gr.Audio(type="filepath", label="Upload Voice"),
     outputs=gr.Audio(type="filepath", label="Converted Voice"),
+    title="🗣️ AI Voice Changer (No RVC / No TTS)",
+    description="Simple PyTorch voice changer using a dummy model and direct model download. Replace dummy model with real MMVC for production."
 )
 interface.launch()