YuE-music-generator-demo-zero

Paused

KingNish committed on Jan 30

Commit

5c20a01

verified ·

1 Parent(s): f24e46c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -65,14 +65,6 @@ from models.soundstream_hubert_new import SoundStream
 from vocoder import build_codec_model, process_audio
 from post_process_audio import replace_low_freq_with_energy_matched
-# Install flash attention
-print("Installing flash-attn...")
-subprocess.run(
-    "pip install flash-attn --no-build-isolation",
-    env={"FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"},
-    shell=True,
-)
 # Initialize device
 device = "cuda:0"
@@ -211,7 +203,7 @@ def generate_music(genre_txt, lyrics_txt, max_new_tokens=5, run_n_segments=2, us
     decoded_instrumentals = codec_model.decode(torch.as_tensor(instrumentals.astype(np.int16), dtype=torch.long).unsqueeze(0).permute(1, 0, 2).to(device)).cpu().squeeze(0)
     mixed_audio = (decoded_vocals + decoded_instrumentals) / 2
-    return (16000, mixed_audio.tensor.detach().numpy())
 @spaces.GPU(duration=120)
 def infer(genre_txt_content, lyrics_txt_content, num_segments=2, max_new_tokens=10):

 from vocoder import build_codec_model, process_audio
 from post_process_audio import replace_low_freq_with_energy_matched
 # Initialize device
 device = "cuda:0"
     decoded_instrumentals = codec_model.decode(torch.as_tensor(instrumentals.astype(np.int16), dtype=torch.long).unsqueeze(0).permute(1, 0, 2).to(device)).cpu().squeeze(0)
     mixed_audio = (decoded_vocals + decoded_instrumentals) / 2
+    return (16000, mixed_audio.detach().numpy())
 @spaces.GPU(duration=120)
 def infer(genre_txt_content, lyrics_txt_content, num_segments=2, max_new_tokens=10):