conversational-milo

Runtime error

App Files Community

vericudebuget committed on May 18, 2024

Commit

2d89603

verified ·

1 Parent(s): dd5359a

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -5

app.py CHANGED Viewed

@@ -7,23 +7,26 @@ client = InferenceClient(
     "mistralai/Mixtral-8x7B-Instruct-v0.1"
 )
-def format_prompt(message, history):
     prompt = "<s>"
     for user_prompt, bot_response in history:
         prompt += f"[INST] {user_prompt} [/INST]"
         prompt += f" {bot_response}</s> "
     prompt += f"[INST] {message} [/INST]"
     return prompt
 def generate(
     prompt, history, user_system_prompt, temperature=0.9, max_new_tokens=9048, top_p=0.95, repetition_penalty=1.0
 ):
     system_prompt = "Instructions: Everything else is from the user. You are Milo, an AI assistant created by ConvoLite in 2024 (he/him). Be friendly and empathetic, matching the user's tone and vibe. Focus on understanding their perspective and providing caring, contextual responses - no generic platitudes. Keep it conversational, not overly formal. Be friendly and funny, use ASCII emojis or normal ones. Be lovely, kind, and have a great sense of humour. Have Bible based values. Do not talk about yourself unless asked. Never respond to a message with 'as an AI' or something similar. Don't talk a lot!" + str(user_system_prompt)
     temperature = float(temperature)
     if temperature < 1e-2:
         temperature = 1e-2
     top_p = float(top_p)
     generate_kwargs = dict(
         temperature=temperature,
         max_new_tokens=max_new_tokens,
@@ -32,12 +35,16 @@ def generate(
         do_sample=True,
         seed=42,
     )
-    formatted_prompt = format_prompt(f"{prompt}, {system_prompt}", history,)
     stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
     for response in stream:
         output += response.token.text
-        yield output
 additional_inputs = [
     gr.Textbox(label="System Prompt", max_lines=1, interactive=True),
@@ -60,5 +67,5 @@ gr.ChatInterface(
     clear_btn="Clear (New chat)",
     stop_btn="Stop ▢",
     concurrency_limit=20,
-     theme=gr.themes.Soft(primary_hue=gr.themes.colors.cyan),
 ).launch(show_api=False)

     "mistralai/Mixtral-8x7B-Instruct-v0.1"
 )
def format_prompt(message, history, system_prompt=""):
    """Build a Mistral-instruct style prompt from a chat transcript.

    The result always begins with the ``<s>`` token, followed by one
    ``[INST] ... [/INST]`` block per user turn. Each past bot reply is closed
    with ``</s> ``. The new ``message`` forms the final, unanswered
    instruction block.

    Args:
        message: The user's newest message.
        history: Iterable of ``(user_prompt, bot_response)`` pairs for the
            earlier turns, oldest first.
        system_prompt: Optional instructions. When non-empty they are
            inserted exactly once, at the start of the first instruction
            block, separated from the user text by a blank line.

    Returns:
        The fully formatted prompt string.
    """
    # The system text goes inside the first [INST] block rather than in front
    # of "<s>", so nothing precedes the beginning-of-sequence marker.
    system_prefix = f"{system_prompt}\n\n" if system_prompt else ""

    parts = ["<s>"]
    for user_prompt, bot_response in history:
        parts.append(f"[INST] {system_prefix}{user_prompt} [/INST]")
        parts.append(f" {bot_response}</s> ")
        system_prefix = ""  # only the very first instruction carries it
    parts.append(f"[INST] {system_prefix}{message} [/INST]")
    return "".join(parts)
 def generate(
     prompt, history, user_system_prompt, temperature=0.9, max_new_tokens=9048, top_p=0.95, repetition_penalty=1.0
 ):
     system_prompt = "Instructions: Everything else is from the user. You are Milo, an AI assistant created by ConvoLite in 2024 (he/him). Be friendly and empathetic, matching the user's tone and vibe. Focus on understanding their perspective and providing caring, contextual responses - no generic platitudes. Keep it conversational, not overly formal. Be friendly and funny, use ASCII emojis or normal ones. Be lovely, kind, and have a great sense of humour. Have Bible based values. Do not talk about yourself unless asked. Never respond to a message with 'as an AI' or something similar. Don't talk a lot!" + str(user_system_prompt)
     temperature = float(temperature)
     if temperature < 1e-2:
         temperature = 1e-2
     top_p = float(top_p)
     generate_kwargs = dict(
         temperature=temperature,
         max_new_tokens=max_new_tokens,
         do_sample=True,
         seed=42,
     )
+    formatted_prompt = format_prompt(f"{prompt}", history, system_prompt)
     stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
     for response in stream:
         output += response.token.text
+    yield output
 additional_inputs = [
     gr.Textbox(label="System Prompt", max_lines=1, interactive=True),
     clear_btn="Clear (New chat)",
     stop_btn="Stop ▢",
     concurrency_limit=20,
+    theme=gr.themes.Soft(primary_hue=gr.themes.colors.cyan),
 ).launch(show_api=False)