Spaces:
Runtime error
Runtime error
Remove `html_content`
Browse files
app.py
CHANGED
|
@@ -199,21 +199,6 @@ audio_examples = [
|
|
| 199 |
]
|
| 200 |
|
| 201 |
|
| 202 |
-
|
| 203 |
-
html_content = """
|
| 204 |
-
<div>
|
| 205 |
-
<h2 style="font-size: 22px;margin-left: 0px;">Voice Understanding Model: SenseVoice-Small</h2>
|
| 206 |
-
<p style="font-size: 18px;margin-left: 20px;">SenseVoice-Small is an encoder-only speech foundation model designed for rapid voice understanding. It encompasses a variety of features including automatic speech recognition (ASR), spoken language identification (LID), speech emotion recognition (SER), and acoustic event detection (AED). SenseVoice-Small supports multilingual recognition for Chinese, English, Cantonese, Japanese, and Korean. Additionally, it offers exceptionally low inference latency, performing 7 times faster than Whisper-small and 17 times faster than Whisper-large.</p>
|
| 207 |
-
<h2 style="font-size: 22px;margin-left: 0px;">Usage</h2> <p style="font-size: 18px;margin-left: 20px;">Upload an audio file or input through a microphone, then select the task and language. the audio is transcribed into corresponding text along with associated emotions (😊 happy, 😡 angry/exicting, 😔 sad) and types of sound events (😀 laughter, 🎼 music, 👏 applause, 🤧 cough&sneeze, 😭 cry). The event labels are placed in the front of the text and the emotion are in the back of the text.</p>
|
| 208 |
-
<p style="font-size: 18px;margin-left: 20px;">Recommended audio input duration is below 30 seconds. For audio longer than 30 seconds, local deployment is recommended.</p>
|
| 209 |
-
<h2 style="font-size: 22px;margin-left: 0px;">Repo</h2>
|
| 210 |
-
<p style="font-size: 18px;margin-left: 20px;"><a href="https://github.com/FunAudioLLM/SenseVoice" target="_blank">SenseVoice</a>: multilingual speech understanding model</p>
|
| 211 |
-
<p style="font-size: 18px;margin-left: 20px;"><a href="https://github.com/modelscope/FunASR" target="_blank">FunASR</a>: fundamental speech recognition toolkit</p>
|
| 212 |
-
<p style="font-size: 18px;margin-left: 20px;"><a href="https://github.com/FunAudioLLM/CosyVoice" target="_blank">CosyVoice</a>: high-quality multilingual TTS model</p>
|
| 213 |
-
</div>
|
| 214 |
-
"""
|
| 215 |
-
|
| 216 |
-
|
| 217 |
def launch():
|
| 218 |
with gr.Blocks(theme=gr.themes.Soft()) as demo:
|
| 219 |
# gr.Markdown(description)
|
|
|
|
| 199 |
]
|
| 200 |
|
| 201 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 202 |
def launch():
|
| 203 |
with gr.Blocks(theme=gr.themes.Soft()) as demo:
|
| 204 |
# gr.Markdown(description)
|