roychao19477 committed on
Commit
6792f52
·
1 Parent(s): a5096b9

Test on lengths

Browse files
Files changed (1) hide show
  1. app.py +2 -5
app.py CHANGED
@@ -64,7 +64,7 @@ from scipy.io import wavfile
64
  from avse_code import run_avse
65
 
66
  # Load face detector
67
- model = YOLO("yolov8n-face.pt") # assumes CUDA available
68
 
69
 
70
  from decord import VideoReader, cpu
@@ -79,12 +79,11 @@ avse_model = AVSEModule()
79
  #avse_state_dict = torch.load("ckpts/ep215_0906.oat.ckpt")
80
  avse_state_dict = torch.load("ckpts/ep220_0908.oat.ckpt")
81
  avse_model.load_state_dict(avse_state_dict, strict=True)
82
- #avse_model.to("cuda")
83
  avse_model.eval()
84
 
85
  @spaces.GPU
86
  def run_avse_inference(video_path, audio_path):
87
- avse_model.to("cuda")
88
  estimated = run_avse(video_path, audio_path)
89
  # Load audio
90
  #noisy, _ = sf.read(audio_path, dtype='float32') # (N, )
@@ -148,7 +147,6 @@ def extract_faces(video_file):
148
  break
149
 
150
  # Inference
151
- model = model.cuda()
152
  results = model(frame, verbose=False)[0]
153
  for box in results.boxes:
154
  # version 1
@@ -236,4 +234,3 @@ iface = gr.Interface(
236
 
237
  iface.launch()
238
 
239
-
 
64
  from avse_code import run_avse
65
 
66
  # Load face detector
67
+ model = YOLO("yolov8n-face.pt").cuda() # assumes CUDA available
68
 
69
 
70
  from decord import VideoReader, cpu
 
79
  #avse_state_dict = torch.load("ckpts/ep215_0906.oat.ckpt")
80
  avse_state_dict = torch.load("ckpts/ep220_0908.oat.ckpt")
81
  avse_model.load_state_dict(avse_state_dict, strict=True)
82
+ avse_model.to("cuda")
83
  avse_model.eval()
84
 
85
  @spaces.GPU
86
  def run_avse_inference(video_path, audio_path):
 
87
  estimated = run_avse(video_path, audio_path)
88
  # Load audio
89
  #noisy, _ = sf.read(audio_path, dtype='float32') # (N, )
 
147
  break
148
 
149
  # Inference
 
150
  results = model(frame, verbose=False)[0]
151
  for box in results.boxes:
152
  # version 1
 
234
 
235
  iface.launch()
236