Update app.py
Browse files
app.py
CHANGED
@@ -9,7 +9,10 @@ processor = WhisperProcessor.from_pretrained(model_name)
|
|
9 |
model = WhisperForConditionalGeneration.from_pretrained(model_name)
|
10 |
|
11 |
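# Load the dataset (this comment originally named bigcode/the-stack, but the call below loads CoIR-Retrieval/CodeSearchNet-php-queries-corpus)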
|
12 |
-
dataset = load_dataset("CoIR-Retrieval/CodeSearchNet-php-queries-corpus", data_dir="data", split="train[:80%]")
|
|
|
|
|
|
|
13 |
|
14 |
def transcribe(audio):
|
15 |
# Process the audio for transcription
|
|
|
9 |
model = WhisperForConditionalGeneration.from_pretrained(model_name)
|
10 |
|
11 |
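# Load the dataset (this comment originally named bigcode/the-stack, but the calls below load CoIR-Retrieval/CodeSearchNet-php-queries-corpus)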
|
12 |
+
# dataset = load_dataset("CoIR-Retrieval/CodeSearchNet-php-queries-corpus", data_dir="data", split="train[:80%]")
|
13 |
+
queries_dataset = load_dataset("CoIR-Retrieval/CodeSearchNet-php-queries-corpus", data_dir="data", split="queries")
|
14 |
+
corpus_dataset = load_dataset("CoIR-Retrieval/CodeSearchNet-php-queries-corpus", data_dir="data", split="corpus")
|
15 |
+
|
16 |
|
17 |
def transcribe(audio):
|
18 |
# Process the audio for transcription
|