LAP-DEV committed on
Commit
d33be88
·
verified ·
1 Parent(s): d17f6fd

Upload default_parameters.yaml

Browse files
Files changed (1) hide show
  1. configs/default_parameters.yaml +76 -0
configs/default_parameters.yaml ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ website_title: "Speech2text"
3
+ website_subtitle: "Automatic speech recognition using Whisper"
4
+ disclaimer_show: true
5
+ disclaimer_popup: false
6
+ disclaimer_text: "Warning: This service is provided as is, please read the disclaimer [here](https://huggingface.co/spaces/LAP-DEV/Demo/blob/main/README.md) before use as well as for more information."
7
+
8
+ whisper:
9
+ model_size: "large-v3"
10
+ lang: "Automatic Detection"
11
+ is_translate: false
12
+ beam_size: 5
13
+ log_prob_threshold: -1
14
+ # no_speech_threshold: 0.6  (commented-out alternative; the active value is set on the next line)
15
+ no_speech_threshold: 0.4
16
+ best_of: 5
17
+ patience: 1
18
+ condition_on_previous_text: false  # Set to false to avoid hallucinations.
19
+ prompt_reset_on_temperature: 0.5
20
+ initial_prompt: null
21
+ temperature: 0
22
+ compression_ratio_threshold: 2.4
23
+ chunk_length: 30
24
+ batch_size: 24
25
+ length_penalty: 1
26
+ repetition_penalty: 1
27
+ no_repeat_ngram_size: 0
28
+ prefix: null
29
+ suppress_blank: true
30
+ suppress_tokens: "[-1]"
31
+ max_initial_timestamp: 1
32
+ word_timestamps: false
33
+ prepend_punctuations: "\"'“¿([{-"
34
+ append_punctuations: "\"'.。,,!!??::”)]}、"
35
+ max_new_tokens: null
36
+ hallucination_silence_threshold: null
37
+ hotwords: null
38
+ language_detection_threshold: 0.5
39
+ language_detection_segments: 1
40
+ add_timestamp_preview: false
41
+ add_timestamp_file: false
42
+ enable_offload: true
43
+
44
+ vad:
45
+ vad_filter: false
46
+ threshold: 0.5
47
+ min_speech_duration_ms: 250
48
+ max_speech_duration_s: 9999
49
+ min_silence_duration_ms: 100
50
+ speech_pad_ms: 30
51
+
52
+ diarization:
53
+ is_diarize: false
54
+ hf_token: ""
55
+ enable_offload: true
56
+
57
+ bgm_separation:
58
+ is_separate_bgm: false
59
+ model_size: "UVR-MDX-NET-Inst_HQ_4"
60
+ segment_size: 256
61
+ save_file: false
62
+ enable_offload: true
63
+
64
+ translation:
65
+ deepl:
66
+ api_key: ""
67
+ is_pro: false
68
+ source_lang: "Automatic Detection"
69
+ target_lang: "English"
70
+ nllb:
71
+ model_size: "facebook/nllb-200-distilled-1.3B"
72
+ source_lang: null
73
+ target_lang: "Dutch"
74
+ max_length: 200
75
+ add_timestamp: true
76
+ translate_output: false