File size: 1,200 Bytes
9785847
d685a80
9785847
 
 
 
d685a80
9785847
 
 
 
 
 
 
 
 
dc80a97
9785847
 
d685a80
 
 
9785847
 
d685a80
9785847
1e477d8
9785847
 
 
 
 
4c17e05
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
be471ee
9785847
 
 
 
be471ee
 
5cd3f25
 
9785847
 
 
d685a80
 
9785847
 
d685a80
9785847
 
 
be471ee
9785847
 
d685a80
9785847
 
d685a80
 
9785847
 
1869df3
d685a80
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
# Core dependency for ZeroGPU compatibility.
# No version specifier is given, so pip is free to choose the release.
spaces

# Base AI frameworks (all pinned to exact versions).
transformers==4.37.2
accelerate==0.25.0
datasets==2.17.0
tokenizers==0.15.2
safetensors==0.4.1
huggingface-hub==0.21.1

# Quantization support.
bitsandbytes==0.42.0
peft==0.2.0

# Video and audio processing.
decord==0.6.0
opencv-python==4.7.0.72
moviepy==1.0.3
ffmpeg-python==0.2.0
imageio==2.33.1
imageio-ffmpeg==0.4.9

# Speech processing.
openai-whisper==20231117
soundfile==0.12.1
openai==1.12.0

# Web UI.
# gradio is pinned; gradio-client has no version specifier, so its version is
# left to pip's dependency resolution.
gradio==4.36.1
gradio-client

# Image processing.
scikit-image==0.21.0

# NLP and evaluation.
nltk==3.8.1
pycocoevalcap==1.2

# Visualization and plotting.
matplotlib==3.7.5

# Experiment tracking.
wandb==0.16.2

# Subtitle processing.
pysrt==1.1.2
chardet==5.2.0

# MiniGPT4-Video core dependencies.
# pytubefix is the only entry in this group without a version pin.
omegaconf==2.3.0
einops==0.7.0
webvtt-py==0.4.6
pytubefix
iopath==0.1.10
fairscale==0.4.13
webdataset==0.2.86
visual_genome==1.1.1

# Basic dependencies.
# numpy is only capped below 2.0.0 (not pinned to an exact version);
# tqdm and requests carry no version specifier at all.
numpy<2.0.0
pandas==2.0.0
pillow==10.2.0
tqdm
requests
regex==2023.12.25
pyyaml==6.0.1
filelock==3.13.1
fsspec==2023.10.0
scipy==1.11.4

# Other utilities.
# packaging is the only entry in this group without a version pin.
sentencepiece==0.1.97
protobuf==4.25.1
psutil==5.9.7
six==1.16.0
typing-extensions==4.9.0
packaging

# Git dependency (contains a customized version of timm).
# NOTE(review): the URL has no @<branch|tag|commit> suffix, so the install is
# not tied to a specific revision — consider pinning one for reproducibility.
git+https://github.com/fffiloni/pytorch-image-models