Spaces:

rc19477
/

dev_only_useless

Sleeping

roychao19477 committed on Jun 24

Commit

3a0e329

1 Parent(s): 0d22451

Update module

Files changed (1) hide show

app.py CHANGED Viewed

@@ -83,19 +83,19 @@ avse_model.eval()
 @spaces.GPU
 def run_avse_inference(video_path, audio_path):
     # Load audio
-    noisy, _ = sf.read(audio_path, dtype='float32')  # (N, )
-    noisy = torch.tensor(noisy).unsqueeze(0)  # (1, N)
     # Load grayscale video
     vr = VideoReader(video_path, ctx=cpu(0))
     frames = vr.get_batch(list(range(len(vr)))).asnumpy()
     bg_frames = np.array([cv2.cvtColor(f, cv2.COLOR_RGB2GRAY) for f in frames]).astype(np.float32) / 255.0
-    bg_frames = torch.tensor(bg_frames).unsqueeze(0).unsqueeze(0)  # (1, 1, T, H, W)
     # Combine into input dict (match what model.enhance expects)
     data = {
-        "noisy_audio": noisy.numpy(),
-        "video_frames": bg_frames.numpy()
     }
     with torch.no_grad():
@@ -189,7 +189,6 @@ def extract_faces(video_file):
     # ------------------------------- #
     # AVSE models
-    noisy = wavfile.read(audio_path)[1].astype(np.float32) / (2 ** 15)
     vr = VideoReader(output_path, ctx=cpu(0))
     frames = vr.get_batch(list(range(len(vr)))).asnumpy()

 @spaces.GPU
 def run_avse_inference(video_path, audio_path):
     # Load audio
+    #noisy, _ = sf.read(audio_path, dtype='float32')  # (N, )
+    #noisy = torch.tensor(noisy).unsqueeze(0)  # (1, N)
+    noisy = wavfile.read(audio_path)[1].astype(np.float32) / (2 ** 15)
     # Load grayscale video
     vr = VideoReader(video_path, ctx=cpu(0))
     frames = vr.get_batch(list(range(len(vr)))).asnumpy()
     bg_frames = np.array([cv2.cvtColor(f, cv2.COLOR_RGB2GRAY) for f in frames]).astype(np.float32) / 255.0
     # Combine into input dict (match what model.enhance expects)
     data = {
+        "noisy_audio": noisy,
+        "video_frames": bg_frames
     }
     with torch.no_grad():
     # ------------------------------- #
     # AVSE models
     vr = VideoReader(output_path, ctx=cpu(0))
     frames = vr.get_batch(list(range(len(vr)))).asnumpy()