Spaces: Running
Commit cb91aa8 · 1 Parent(s): 6a13b6a
hubert hf
Browse files
minigpt4/conversation/conversation.py
CHANGED
@@ -260,7 +260,8 @@ class Chat:
|
|
260 |
samples, sr = extract_audio_from_video(video_path)
|
261 |
# print("samples:", samples)
|
262 |
|
263 |
-
model_file = "checkpoints/transformer/chinese-hubert-large"
|
|
|
264 |
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(model_file)
|
265 |
input_values = feature_extractor(samples, sampling_rate=sr, return_tensors="pt").input_values
|
266 |
# print("input_values:", input_values)
|
|
|
260 |
samples, sr = extract_audio_from_video(video_path)
|
261 |
# print("samples:", samples)
|
262 |
|
263 |
+
# model_file = "checkpoints/transformer/chinese-hubert-large"
|
264 |
+
model_file = "ZebangCheng/chinese-hubert-large"
|
265 |
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(model_file)
|
266 |
input_values = feature_extractor(samples, sampling_rate=sr, return_tensors="pt").input_values
|
267 |
# print("input_values:", input_values)
|
minigpt4/datasets/datasets/first_face.py
CHANGED
@@ -12,13 +12,11 @@ import torch.nn.functional as F
|
|
12 |
|
13 |
import numpy as np
|
14 |
from PIL import Image
|
15 |
-
import skimage.io as io
|
16 |
import matplotlib.pyplot as plt
|
17 |
from matplotlib.collections import PatchCollection
|
18 |
from matplotlib.patches import Polygon, Rectangle
|
19 |
import torch
|
20 |
from torch.utils.data import Dataset
|
21 |
-
import webdataset as wds
|
22 |
import cv2
|
23 |
|
24 |
from minigpt4.datasets.datasets.base_dataset import BaseDataset
|
|
|
12 |
|
13 |
import numpy as np
|
14 |
from PIL import Image
|
|
|
15 |
import matplotlib.pyplot as plt
|
16 |
from matplotlib.collections import PatchCollection
|
17 |
from matplotlib.patches import Polygon, Rectangle
|
18 |
import torch
|
19 |
from torch.utils.data import Dataset
|
|
|
20 |
import cv2
|
21 |
|
22 |
from minigpt4.datasets.datasets.base_dataset import BaseDataset
|