KingNish committed on
Commit
0695bb5
·
1 Parent(s): 1999a7f

modified: app.py

Browse files
Files changed (1) hide show
  1. app.py +48 -48
app.py CHANGED
@@ -380,58 +380,58 @@ def generate_music(
380
  instrumental_stem, _ = sf.read(vocal_path)
381
  mix_stem = (vocal_stem + instrumental_stem) / 1
382
  sf.write(recons_mix, mix_stem, sr)
383
- return recons_mix
384
  except Exception as e:
385
  print(e)
 
386
 
387
  # vocoder to upsample audios
388
- vocal_decoder, inst_decoder = build_codec_model(config_path, vocal_decoder_path, inst_decoder_path)
389
- vocoder_output_dir = os.path.join(output_dir, 'vocoder')
390
- vocoder_stems_dir = os.path.join(vocoder_output_dir, 'stems')
391
- vocoder_mix_dir = os.path.join(vocoder_output_dir, 'mix')
392
- os.makedirs(vocoder_mix_dir, exist_ok=True)
393
- os.makedirs(vocoder_stems_dir, exist_ok=True)
394
- instrumental_output = None
395
- vocal_output = None
396
- for npy in stage1_output_set:
397
- if 'instrumental' in npy:
398
- # Process instrumental
399
- instrumental_output = process_audio(
400
- npy,
401
- os.path.join(vocoder_stems_dir, 'instrumental.mp3'),
402
- rescale,
403
- argparse.Namespace(**locals()), # Convert local variables to argparse.Namespace
404
- inst_decoder,
405
- codec_model
406
- )
407
- else:
408
- # Process vocal
409
- vocal_output = process_audio(
410
- npy,
411
- os.path.join(vocoder_stems_dir, 'vocal.mp3'),
412
- rescale,
413
- argparse.Namespace(**locals()), # Convert local variables to argparse.Namespace
414
- vocal_decoder,
415
- codec_model
416
- )
417
- # mix tracks
418
- try:
419
- mix_output = instrumental_output + vocal_output
420
- vocoder_mix = os.path.join(vocoder_mix_dir, os.path.basename(recons_mix))
421
- save_audio(mix_output, vocoder_mix, 44100, rescale)
422
- print(f"Created mix: {vocoder_mix}")
423
- except RuntimeError as e:
424
- print(e)
425
- print(f"mix {vocoder_mix} failed! inst: {instrumental_output.shape}, vocal: {vocal_output.shape}")
426
-
427
- # Post process
428
- replace_low_freq_with_energy_matched(
429
- a_file=recons_mix, # 16kHz
430
- b_file=vocoder_mix, # 48kHz
431
- c_file=os.path.join(output_dir, os.path.basename(recons_mix)),
432
- cutoff_freq=5500.0
433
- )
434
- print("All process Done")
435
 
436
 
437
  @spaces.GPU(duration=120)
 
380
  instrumental_stem, _ = sf.read(vocal_path)
381
  mix_stem = (vocal_stem + instrumental_stem) / 1
382
  sf.write(recons_mix, mix_stem, sr)
 
383
  except Exception as e:
384
  print(e)
385
+ return recons_mix
386
 
387
  # vocoder to upsample audios
388
+ # vocal_decoder, inst_decoder = build_codec_model(config_path, vocal_decoder_path, inst_decoder_path)
389
+ # vocoder_output_dir = os.path.join(output_dir, 'vocoder')
390
+ # vocoder_stems_dir = os.path.join(vocoder_output_dir, 'stems')
391
+ # vocoder_mix_dir = os.path.join(vocoder_output_dir, 'mix')
392
+ # os.makedirs(vocoder_mix_dir, exist_ok=True)
393
+ # os.makedirs(vocoder_stems_dir, exist_ok=True)
394
+ # instrumental_output = None
395
+ # vocal_output = None
396
+ # for npy in stage1_output_set:
397
+ # if 'instrumental' in npy:
398
+ # # Process instrumental
399
+ # instrumental_output = process_audio(
400
+ # npy,
401
+ # os.path.join(vocoder_stems_dir, 'instrumental.mp3'),
402
+ # rescale,
403
+ # argparse.Namespace(**locals()), # Convert local variables to argparse.Namespace
404
+ # inst_decoder,
405
+ # codec_model
406
+ # )
407
+ # else:
408
+ # # Process vocal
409
+ # vocal_output = process_audio(
410
+ # npy,
411
+ # os.path.join(vocoder_stems_dir, 'vocal.mp3'),
412
+ # rescale,
413
+ # argparse.Namespace(**locals()), # Convert local variables to argparse.Namespace
414
+ # vocal_decoder,
415
+ # codec_model
416
+ # )
417
+ # # mix tracks
418
+ # try:
419
+ # mix_output = instrumental_output + vocal_output
420
+ # vocoder_mix = os.path.join(vocoder_mix_dir, os.path.basename(recons_mix))
421
+ # save_audio(mix_output, vocoder_mix, 44100, rescale)
422
+ # print(f"Created mix: {vocoder_mix}")
423
+ # except RuntimeError as e:
424
+ # print(e)
425
+ # print(f"mix {vocoder_mix} failed! inst: {instrumental_output.shape}, vocal: {vocal_output.shape}")
426
+
427
+ # # Post process
428
+ # replace_low_freq_with_energy_matched(
429
+ # a_file=recons_mix, # 16kHz
430
+ # b_file=vocoder_mix, # 48kHz
431
+ # c_file=os.path.join(output_dir, os.path.basename(recons_mix)),
432
+ # cutoff_freq=5500.0
433
+ # )
434
+ # print("All process Done")
435
 
436
 
437
  @spaces.GPU(duration=120)