Spaces:
				
			
			
	
			
			
		Runtime error
		
	
	
	
			
			
	
	
	
	
		
		
		Runtime error
		
	Update app.py
Browse files
    	
        app.py
    CHANGED
    
    | @@ -54,6 +54,7 @@ def generate_prompt(instruction, input=None): | |
| 54 | 
             
            def evaluate(
         | 
| 55 | 
             
            #    instruction,
         | 
| 56 | 
             
                audio,
         | 
|  | |
| 57 | 
             
                input=None,
         | 
| 58 | 
             
                token_count=200,
         | 
| 59 | 
             
                temperature=1.0,
         | 
| @@ -61,7 +62,7 @@ def evaluate( | |
| 61 | 
             
                presencePenalty = 0.1,
         | 
| 62 | 
             
                countPenalty = 0.1,
         | 
| 63 | 
             
            ):
         | 
| 64 | 
            -
             | 
| 65 | 
             
                # load audio and pad/trim it to fit 30 seconds
         | 
| 66 | 
             
                audio = whisper.load_audio(audio)
         | 
| 67 | 
             
                audio = whisper.pad_or_trim(audio)
         | 
| @@ -116,13 +117,32 @@ def evaluate( | |
| 116 | 
             
                        out_last = i + 1
         | 
| 117 | 
             
                gc.collect()
         | 
| 118 | 
             
                torch.cuda.empty_cache()
         | 
| 119 | 
            -
             | 
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
| 120 |  | 
| 121 | 
             
            g = gr.Interface(
         | 
| 122 | 
             
                fn=evaluate,
         | 
| 123 | 
             
                inputs=[
         | 
| 124 | 
             
            #        gr.components.Textbox(lines=2, label="Instruction", value="Tell me about ravens."),
         | 
| 125 | 
             
                    gr.Audio(source="microphone", label = "请开始对话吧!", type="filepath"),
         | 
|  | |
| 126 | 
             
                    gr.components.Textbox(lines=2, label="Input", placeholder="none"),
         | 
| 127 | 
             
                    gr.components.Slider(minimum=10, maximum=200, step=10, value=150), # token_count
         | 
| 128 | 
             
                    gr.components.Slider(minimum=0.2, maximum=2.0, step=0.1, value=1.0), # temperature
         | 
| @@ -131,10 +151,15 @@ g = gr.Interface( | |
| 131 | 
             
                    gr.components.Slider(0.0, 1.0, step=0.1, value=0.4),  # countPenalty        
         | 
| 132 | 
             
                ],
         | 
| 133 | 
             
                outputs=[
         | 
|  | |
|  | |
|  | |
|  | |
| 134 | 
             
                    gr.inputs.Textbox(
         | 
| 135 | 
             
                        lines=5,
         | 
| 136 | 
            -
                        label="Output",
         | 
| 137 | 
            -
                    )
         | 
|  | |
| 138 | 
             
                ],
         | 
| 139 | 
             
                title="🥳💬💕 - TalktoAI,随时随地,谈天说地!",
         | 
| 140 | 
             
                description="🤖 - 让有人文关怀的AI造福每一个人!AI向善,文明璀璨!TalktoAI - Enable the future!",
         | 
|  | |
| 54 | 
             
            def evaluate(
         | 
| 55 | 
             
            #    instruction,
         | 
| 56 | 
             
                audio,
         | 
| 57 | 
            +
                upload,
         | 
| 58 | 
             
                input=None,
         | 
| 59 | 
             
                token_count=200,
         | 
| 60 | 
             
                temperature=1.0,
         | 
|  | |
| 62 | 
             
                presencePenalty = 0.1,
         | 
| 63 | 
             
                countPenalty = 0.1,
         | 
| 64 | 
             
            ):
         | 
| 65 | 
            +
                res = []
         | 
| 66 | 
             
                # load audio and pad/trim it to fit 30 seconds
         | 
| 67 | 
             
                audio = whisper.load_audio(audio)
         | 
| 68 | 
             
                audio = whisper.pad_or_trim(audio)
         | 
|  | |
| 117 | 
             
                        out_last = i + 1
         | 
| 118 | 
             
                gc.collect()
         | 
| 119 | 
             
                torch.cuda.empty_cache()
         | 
| 120 | 
            +
             | 
| 121 | 
            +
                res.append(out_str.strip())
         | 
| 122 | 
            +
             | 
| 123 | 
            +
                tts.tts_to_file(res, speaker_wav = upload, language="en", file_path="output.wav")
         | 
| 124 | 
            +
                
         | 
| 125 | 
            +
                voicefixer.restore(input="output.wav", # input wav file path
         | 
| 126 | 
            +
                                output="audio1.wav", # output wav file path
         | 
| 127 | 
            +
                                cuda=True, # whether to use gpu acceleration
         | 
| 128 | 
            +
                                mode = 0) # You can try out mode 0, 1, or 2 to find out the best result
         | 
| 129 | 
            +
                
         | 
| 130 | 
            +
                noisy = enhance_model.load_audio(
         | 
| 131 | 
            +
                "audio1.wav"
         | 
| 132 | 
            +
                ).unsqueeze(0)
         | 
| 133 | 
            +
             | 
| 134 | 
            +
                enhanced = enhance_model.enhance_batch(noisy, lengths=torch.tensor([1.]))
         | 
| 135 | 
            +
                torchaudio.save("enhanced.wav", enhanced.cpu(), 16000)
         | 
| 136 | 
            +
             | 
| 137 | 
            +
                return [result.text, res, "enhanced.wav"]    
         | 
| 138 | 
            +
            #    yield out_str.strip()
         | 
| 139 |  | 
| 140 | 
             
            g = gr.Interface(
         | 
| 141 | 
             
                fn=evaluate,
         | 
| 142 | 
             
                inputs=[
         | 
| 143 | 
             
            #        gr.components.Textbox(lines=2, label="Instruction", value="Tell me about ravens."),
         | 
| 144 | 
             
                    gr.Audio(source="microphone", label = "请开始对话吧!", type="filepath"),
         | 
| 145 | 
            +
                    gr.Audio(source="upload", label = "请上传您喜欢的声音(wav文件)", type="filepath"),
         | 
| 146 | 
             
                    gr.components.Textbox(lines=2, label="Input", placeholder="none"),
         | 
| 147 | 
             
                    gr.components.Slider(minimum=10, maximum=200, step=10, value=150), # token_count
         | 
| 148 | 
             
                    gr.components.Slider(minimum=0.2, maximum=2.0, step=0.1, value=1.0), # temperature
         | 
|  | |
| 151 | 
             
                    gr.components.Slider(0.0, 1.0, step=0.1, value=0.4),  # countPenalty        
         | 
| 152 | 
             
                ],
         | 
| 153 | 
             
                outputs=[
         | 
| 154 | 
            +
                    gr.inputs.Textbox(
         | 
| 155 | 
            +
                        lines=1,
         | 
| 156 | 
            +
                        label="Speech to Text",
         | 
| 157 | 
            +
                    ),
         | 
| 158 | 
             
                    gr.inputs.Textbox(
         | 
| 159 | 
             
                        lines=5,
         | 
| 160 | 
            +
                        label="Raven Output",
         | 
| 161 | 
            +
                    ),
         | 
| 162 | 
            +
                    gr.Audio(label="Audio with Custom Voice"),
         | 
| 163 | 
             
                ],
         | 
| 164 | 
             
                title="🥳💬💕 - TalktoAI,随时随地,谈天说地!",
         | 
| 165 | 
             
                description="🤖 - 让有人文关怀的AI造福每一个人!AI向善,文明璀璨!TalktoAI - Enable the future!",
         | 
 
			
