roychao19477 committed on
Commit
8c03ebe
·
1 Parent(s): 7d86927

Test on lengths

Browse files
Files changed (1) hide show
  1. app.py +4 -2
app.py CHANGED
@@ -64,7 +64,7 @@ from scipy.io import wavfile
64
  from avse_code import run_avse
65
 
66
  # Load face detector
67
- model = YOLO("yolov8n-face.pt").cuda() # assumes CUDA available
68
 
69
 
70
  from decord import VideoReader, cpu
@@ -79,11 +79,12 @@ avse_model = AVSEModule()
79
  #avse_state_dict = torch.load("ckpts/ep215_0906.oat.ckpt")
80
  avse_state_dict = torch.load("ckpts/ep220_0908.oat.ckpt")
81
  avse_model.load_state_dict(avse_state_dict, strict=True)
82
- avse_model.to("cuda")
83
  avse_model.eval()
84
 
85
  @spaces.GPU
86
  def run_avse_inference(video_path, audio_path):
 
87
  estimated = run_avse(video_path, audio_path)
88
  # Load audio
89
  #noisy, _ = sf.read(audio_path, dtype='float32') # (N, )
@@ -147,6 +148,7 @@ def extract_faces(video_file):
147
  break
148
 
149
  # Inference
 
150
  results = model(frame, verbose=False)[0]
151
  for box in results.boxes:
152
  # version 1
 
64
  from avse_code import run_avse
65
 
66
  # Load face detector
67
+ model = YOLO("yolov8n-face.pt") # assumes CUDA available
68
 
69
 
70
  from decord import VideoReader, cpu
 
79
  #avse_state_dict = torch.load("ckpts/ep215_0906.oat.ckpt")
80
  avse_state_dict = torch.load("ckpts/ep220_0908.oat.ckpt")
81
  avse_model.load_state_dict(avse_state_dict, strict=True)
82
+ #avse_model.to("cuda")
83
  avse_model.eval()
84
 
85
  @spaces.GPU
86
  def run_avse_inference(video_path, audio_path):
87
+ avse_model.to("cuda")
88
  estimated = run_avse(video_path, audio_path)
89
  # Load audio
90
  #noisy, _ = sf.read(audio_path, dtype='float32') # (N, )
 
148
  break
149
 
150
  # Inference
151
+ model = model.cuda()
152
  results = model(frame, verbose=False)[0]
153
  for box in results.boxes:
154
  # version 1