Spaces:

Isidorophp
/

Talk-to-Dr.Watson

Running

App Files Community

Isidorophp committed on 22 days ago

Commit

88855a8

verified ·

1 Parent(s): 405c709

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -52

app.py CHANGED Viewed

@@ -161,20 +161,18 @@ Male_language_dict = {
 }
 default_lang = "en"
 engines = { default_lang: Model(default_lang) }
 def transcribe(audio):
     lang = "en"
     model = engines[lang]
     text = model.stt_file(audio)[0]
     return text
-client1 = InferenceClient("mistralai/Mixtral-8x7B-Instruct-v0.1")
-system_instructions1 = "<s>[SYSTEM] Answer as Dr. Watson's Famous Sherlock Holmes Assistant, with a male voice and London slang and accent. Remember you are the character and Assistant Dr. Watson, from Sherlock Holmes Novels, Keep the conversation short, clear, friendly, and concise. You will refer to the USER alternatively as: 'DEAR FRIEND' or 'MY HELPMATE' or 'MY BIOGRAPHER' or 'MY COMPANION'. The text provided is a request for a specific type of response from you, the virtual assistant. The request asks you to provide friendly responses as if You are the character Dr. Watson, from the Sherlock Holmes Novels. The expectation is that you will avoid introductions and start answering the query directly, elaborating on all aspects of the request. As an AI-powered assistant, your task is to generate responses that appear as if they are created by a human, Real Person, and not by an AI-powered assistant. Do Not use * or **. [USER]"
 def model(text):
     generate_kwargs = dict(
@@ -185,7 +183,7 @@ def model(text):
         do_sample=True,
         seed=42,
     )
     formatted_prompt = system_instructions1 + text + "[WATSON]"
     stream = client1.text_generation(
         formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
@@ -193,24 +191,13 @@ def model(text):
     for response in stream:
         if not response.token.text == "</s>":
             output += response.token.text
     return output
-async def respond(audio, language_code):
     user = transcribe(audio)
     reply = model(user)
-    #        Random voice choise from Manager base on locale and gender
-    #
-    #voices = await VoicesManager.create()
-    #voice = voices.find(Gender="Male", Locale="en-GB")
-    #communicate = edge_tts.Communicate(reply, random.choice(voice)["Name"])
-    #
-    #        Or the following as one selected Voice for the character.
-    #language_code = 'English (UK)-Ryan- (Male)'
     voice = Male_language_dict.get(language_code, "default_voice")
     communicate = edge_tts.Communicate(reply, voice)
@@ -220,12 +207,7 @@ async def respond(audio, language_code):
     yield tmp_path
-client1 = InferenceClient("mistralai/Mixtral-8x7B-Instruct-v0.1")
-system_instructions1 = "<s>[SYSTEM] Answer as Dr. Watson's Famous Sherlock Holmes Assistant, with a male voice and London slang and accent. Remember you are the character and Assistant Dr. Watson, from Sherlock Holmes Novels, Keep the conversation short, clear, friendly, and concise. You will refer to the USER alternatively as: 'DEAR FRIEND' or 'MY HELPMATE' or 'MY BIOGRAPHER' or 'MY COMPANION'. The text provided is a request for a specific type of response from you, the virtual assistant. The request asks you to provide friendly responses as if You are the character Dr. Watson, from the Sherlock Holmes Novels. The expectation is that you will avoid introductions and start answering the query directly, elaborating on all aspects of the request. As an AI-powered assistant, your task is to generate responses that appear as if they are created by a human, Real Person, and not by an AI-powered assistant. Do Not use * or **. [USER]"
-async def generate1(prompt, language_code):
     generate_kwargs = dict(
         temperature=0.7,
         max_new_tokens=512,
@@ -240,16 +222,6 @@ async def generate1(prompt, language_code):
     for response in stream:
         if not response.token.text == "</s>":
             output += response.token.text
-    #        Random voice choice from VoiceManager base on locale and gender
-    #
-    #voices = await VoicesManager.create()
-    #voice = voices.find(Gender="Male", Locale="en-GB")
-    #communicate = edge_tts.Communicate(reply, random.choice(voice)["Name"])
-    #
-    #        Or the following as one selected voice for the character.
-    #language_code = 'English (UK)-Ryan- (Male)'
     voice = Male_language_dict.get(language_code, "default_voice")
     communicate = edge_tts.Communicate(output, voice)
@@ -257,31 +229,29 @@ async def generate1(prompt, language_code):
         tmp_path = tmp_file.name
         await communicate.save(tmp_path)
     yield tmp_path
-with gr.Blocks(css="style.css") as demo:
-    gr.Markdown(""" # <img src='https://huggingface.co/spaces/Isidorophp/Talk-to-Dr.Watson/resolve/main/logo.png' alt='RJP DEV STUDIO logo' style='height:60px;'>""")
-    gr.Markdown(""" # <center><b> DR. Watson 🤖 🧠 🧬</b></center>
-                     ### <center>I suggest, you ask me for a mystery:</center>
-                     """)
     with gr.Tab("Talk to Dr. WATSON"):
-        with gr.Row():
-             us_input = gr.Audio(label="Your Voice Chat", type="filepath", interactive=True, sources="microphone", waveform_options=False)
              us_output = gr.Audio(label="WATSON", type="filepath", interactive=False, autoplay=True, elem_classes="audio")
-             gr.Interface(fn=respond, inputs=[us_input, gr.Dropdown(choices=list(Male_language_dict.keys()), value="English (UK)-Ryan- (Male)" , label="Select Voice for Dr. WATSON")], outputs=us_output, live=False)
     with gr.Tab("Write to Dr. WATSON"):
-        with gr.Row():
-             user_input = gr.Textbox(label="Your Question", value="Dr. Watson, can you summarize your adventures with Sherlock Holmes?")
-             input_text = gr.Textbox(label="Input Text", elem_id="important")
              output_audio = gr.Audio(label="WATSON", type="filepath", interactive=False, autoplay=True, elem_classes="audio")
-        with gr.Row():
-             translate_btn = gr.Button("Response")
-             translate_btn.click(fn=generate1, inputs=[user_input, gr.Dropdown(choices=list(Male_language_dict.keys()), value="English (UK)-Ryan- (Male)" , label="Select Voice for Dr. WATSON")], outputs=output_audio, api_name="translate")
 if __name__ == "__main__":
     demo.queue(max_size=200, api_open=False).launch()

 }
 default_lang = "en"
 engines = { default_lang: Model(default_lang) }
+client1 = InferenceClient("mistralai/Mixtral-8x7B-Instruct-v0.1")
+system_instructions1 = "<s>[SYSTEM] YOU must Output only plain text. Do not use **bold**, *italic*, ### headings, **number** or any other markdown-specific formatting in content. Answer as Dr. Watson's Famous Sherlock Holmes Assistant, with a male voice and London slang and accent. Remember you are the character and Assistant Dr. Watson, from Sherlock Holmes Novels, Keep the conversation short, clear, friendly, and concise. You will refer to the USER alternatively as: 'DEAR FRIEND' or 'MY HELPMATE' or 'MY BIOGRAPHER' or 'MY COMPANION'. The text provided is a request for a specific type of response from you, the virtual assistant. The request asks you to provide friendly responses as if You are the character Dr. Watson, from the Sherlock Holmes Novels. The expectation is that you will avoid introductions and start answering the query directly, elaborating on all aspects of the request. As an AI powered assistant, your task is to generate responses that appear as if they are created by a human, Real Person, and not by an AI powered assistant."
 def transcribe(audio):
     lang = "en"
     model = engines[lang]
     text = model.stt_file(audio)[0]
     return text
 def model(text):
     generate_kwargs = dict(
         do_sample=True,
         seed=42,
     )
     formatted_prompt = system_instructions1 + text + "[WATSON]"
     stream = client1.text_generation(
         formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     for response in stream:
         if not response.token.text == "</s>":
             output += response.token.text
     return output
+async def respond(language_code, audio):
     user = transcribe(audio)
     reply = model(user)
     voice = Male_language_dict.get(language_code, "default_voice")
     communicate = edge_tts.Communicate(reply, voice)
     yield tmp_path
+async def generate1(language_code, prompt):
     generate_kwargs = dict(
         temperature=0.7,
         max_new_tokens=512,
     for response in stream:
         if not response.token.text == "</s>":
             output += response.token.text
     voice = Male_language_dict.get(language_code, "default_voice")
     communicate = edge_tts.Communicate(output, voice)
         tmp_path = tmp_file.name
         await communicate.save(tmp_path)
     yield tmp_path
+#              css="style.css"
+with gr.Blocks(gr.themes.Soft()) as demo:
+    gr.HTML(""" <img src='https://huggingface.co/spaces/Isidorophp/Talk-to-Dr.Watson/resolve/main/logo.png' alt='RJP DEV STUDIO logo' style='height:60px;'> """
+            """ <center><h1> DR. Watson 🤖 🧠 🧬</h1></center> """
+            """ <center><h3> I suggest, you ask me for a mystery: </h3></center> """)
     with gr.Tab("Talk to Dr. WATSON"):
+        with gr.Group():
+             user_voice = gr.Dropdown(choices=list(Male_language_dict.keys()), value="English (UK)-Ryan- (Male)" ,  label="Select Voice for Dr. WATSON")
+             us_input = gr.Audio(label="Your Voice Chat", type="filepath", interactive=True, sources="microphone", waveform_options=None)
              us_output = gr.Audio(label="WATSON", type="filepath", interactive=False, autoplay=True, elem_classes="audio")
+             gr.Interface(fn=respond, inputs=[user_voice, us_input], outputs=us_output, live=False)
     with gr.Tab("Write to Dr. WATSON"):
+        with gr.Group():
+             user_voice = gr.Dropdown(choices=list(Male_language_dict.keys()), value="English (UK)-Ryan- (Male)" ,  label="Select Voice for Dr. WATSON")
+             user_input = gr.TextArea(label="Your Question", value="Dr. Watson, can you summarize your adventures with Sherlock Holmes?")
              output_audio = gr.Audio(label="WATSON", type="filepath", interactive=False, autoplay=True, elem_classes="audio")
+             gr.Interface(fn=generate1, inputs=[user_voice, user_input], outputs=output_audio, live=False)
 if __name__ == "__main__":
     demo.queue(max_size=200, api_open=False).launch()