ZebangCheng committed on
Commit
cb91aa8
·
1 Parent(s): 6a13b6a
minigpt4/conversation/conversation.py CHANGED
@@ -260,7 +260,8 @@ class Chat:
260
  samples, sr = extract_audio_from_video(video_path)
261
  # print("samples:", samples)
262
 
263
- model_file = "checkpoints/transformer/chinese-hubert-large"
 
264
  feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(model_file)
265
  input_values = feature_extractor(samples, sampling_rate=sr, return_tensors="pt").input_values
266
  # print("input_values:", input_values)
 
260
  samples, sr = extract_audio_from_video(video_path)
261
  # print("samples:", samples)
262
 
263
+ # model_file = "checkpoints/transformer/chinese-hubert-large"
264
+ model_file = "ZebangCheng/chinese-hubert-large"
265
  feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(model_file)
266
  input_values = feature_extractor(samples, sampling_rate=sr, return_tensors="pt").input_values
267
  # print("input_values:", input_values)
minigpt4/datasets/datasets/first_face.py CHANGED
@@ -12,13 +12,11 @@ import torch.nn.functional as F
12
 
13
  import numpy as np
14
  from PIL import Image
15
- import skimage.io as io
16
  import matplotlib.pyplot as plt
17
  from matplotlib.collections import PatchCollection
18
  from matplotlib.patches import Polygon, Rectangle
19
  import torch
20
  from torch.utils.data import Dataset
21
- import webdataset as wds
22
  import cv2
23
 
24
  from minigpt4.datasets.datasets.base_dataset import BaseDataset
 
12
 
13
  import numpy as np
14
  from PIL import Image
 
15
  import matplotlib.pyplot as plt
16
  from matplotlib.collections import PatchCollection
17
  from matplotlib.patches import Polygon, Rectangle
18
  import torch
19
  from torch.utils.data import Dataset
 
20
  import cv2
21
 
22
  from minigpt4.datasets.datasets.base_dataset import BaseDataset