tuyendragon commited on
Commit
338940a
·
1 Parent(s): 58a7ed0

Deploy Discord Bot

Browse files
Files changed (1) hide show
  1. app.py +181 -211
app.py CHANGED
@@ -1,223 +1,193 @@
1
- import json
2
- import gradio as gr
3
  import os
4
- import requests
5
-
6
- hf_token = os.getenv('HF_TOKEN')
7
- api_url = os.getenv('API_URL')
8
- api_url_nostream = os.getenv('API_URL_NOSTREAM')
9
- headers = {
10
- 'Content-Type': 'application/json',
11
- }
12
-
13
- system_message = "\nYou are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.\n\nIf a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information."
14
- title = "Llama2 70B Chatbot"
15
- description = """
16
- This Space demonstrates model [Llama-2-70b-chat-hf](https://huggingface.co/meta-llama/Llama-2-70b-chat-hf) by Meta, a Llama 2 model with 70B parameters fine-tuned for chat instructions. This space is running on Inference Endpoints using text-generation-inference library. If you want to run your own service, you can also [deploy the model on Inference Endpoints](https://ui.endpoints.huggingface.co/).
17
- 🔎 For more details about the Llama 2 family of models and how to use them with `transformers`, take a look [at our blog post](https://huggingface.co/blog/llama2).
18
- 🔨 Looking for lighter chat model versions of Llama-v2?
19
- - 🐇 Check out the [7B Chat model demo](https://huggingface.co/spaces/huggingface-projects/llama-2-7b-chat).
20
- - 🦊 Check out the [13B Chat model demo](https://huggingface.co/spaces/huggingface-projects/llama-2-13b-chat).
21
- Note: As a derivate work of [Llama-2-70b-chat](https://huggingface.co/meta-llama/Llama-2-70b-chat-hf) by Meta,
22
- this demo is governed by the original [license](https://huggingface.co/spaces/ysharma/Explore_llamav2_with_TGI/blob/main/LICENSE.txt) and [acceptable use policy](https://huggingface.co/spaces/ysharma/Explore_llamav2_with_TGI/blob/main/USE_POLICY.md).
23
- """
24
- css = """.toast-wrap { display: none !important } """
25
- examples=[
26
- ['Hello there! How are you doing?'],
27
- ['Can you explain to me briefly what is Python programming language?'],
28
- ['Explain the plot of Cinderella in a sentence.'],
29
- ['How many hours does it take a man to eat a Helicopter?'],
30
- ["Write a 100-word article on 'Benefits of Open-Source in AI research'"],
31
- ]
32
 
33
 
34
- # Stream text
35
- def predict(message, chatbot, system_prompt="", temperature=0.9, max_new_tokens=256, top_p=0.6, repetition_penalty=1.0,):
 
36
 
37
- if system_prompt != "":
38
- system_message = system_prompt
 
 
 
 
 
 
 
 
 
 
39
  else:
40
- system_message = "\nYou are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.\n\nIf a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information."
41
-
42
- temperature = float(temperature)
43
- if temperature < 1e-2:
44
- temperature = 1e-2
45
- top_p = float(top_p)
46
-
47
- input_prompt = f"[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n "
48
- for interaction in chatbot:
49
- input_prompt = input_prompt + str(interaction[0]) + " [/INST] " + str(interaction[1]) + " </s><s> [INST] "
50
-
51
- input_prompt = input_prompt + str(message) + " [/INST] "
52
-
53
- data = {
54
- "inputs": input_prompt,
55
- "parameters": {
56
- "max_new_tokens":max_new_tokens,
57
- "temperature":temperature,
58
- "top_p":top_p,
59
- "repetition_penalty":repetition_penalty,
60
- "do_sample":True,
61
- },
62
- }
63
- response = requests.post(api_url, headers=headers, data=json.dumps(data), auth=('hf', hf_token), stream=True)
64
-
65
- partial_message = ""
66
- for line in response.iter_lines():
67
- if line: # filter out keep-alive new lines
68
- # Decode from bytes to string
69
- decoded_line = line.decode('utf-8')
70
-
71
- # Remove 'data:' prefix
72
- if decoded_line.startswith('data:'):
73
- json_line = decoded_line[5:] # Exclude the first 5 characters ('data:')
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  else:
75
- gr.Warning(f"This line does not start with 'data:': {decoded_line}")
76
- continue
77
-
78
- # Load as JSON
79
- try:
80
- json_obj = json.loads(json_line)
81
- if 'token' in json_obj:
82
- partial_message = partial_message + json_obj['token']['text']
83
- yield partial_message
84
- elif 'error' in json_obj:
85
- yield json_obj['error'] + '. Please refresh and try again with an appropriate smaller input prompt.'
86
- else:
87
- gr.Warning(f"The key 'token' does not exist in this JSON object: {json_obj}")
88
-
89
- except json.JSONDecodeError:
90
- gr.Warning(f"This line is not valid JSON: {json_line}")
91
- continue
92
- except KeyError as e:
93
- gr.Warning(f"KeyError: {e} occurred for JSON object: {json_obj}")
94
- continue
95
-
96
-
97
- # No Stream
98
- def predict_batch(message, chatbot, system_prompt="", temperature=0.9, max_new_tokens=256, top_p=0.6, repetition_penalty=1.0,):
99
-
100
- if system_prompt != "":
101
- system_message = system_prompt
102
  else:
103
- system_message = "\nYou are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.\n\nIf a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information."
104
-
105
- temperature = float(temperature)
106
- if temperature < 1e-2:
107
- temperature = 1e-2
108
- top_p = float(top_p)
 
 
 
 
 
 
 
109
 
110
- input_prompt = f"[INST]<<SYS>>\n{system_message}\n<</SYS>>\n\n "
111
- for interaction in chatbot:
112
- input_prompt = input_prompt + str(interaction[0]) + " [/INST] " + str(interaction[1]) + " </s><s> [INST] "
113
-
114
- input_prompt = input_prompt + str(message) + " [/INST] "
115
-
116
- data = {
117
- "inputs": input_prompt,
118
- "parameters": {
119
- "max_new_tokens":max_new_tokens,
120
- "temperature":temperature,
121
- "top_p":top_p,
122
- "repetition_penalty":repetition_penalty,
123
- "do_sample":True,
124
- },
125
- }
126
-
127
- response = requests.post(api_url_nostream, headers=headers, data=json.dumps(data), auth=('hf', hf_token))
128
 
129
- if response.status_code == 200: # check if the request was successful
130
- try:
131
- json_obj = response.json()
132
- if 'generated_text' in json_obj and len(json_obj['generated_text']) > 0:
133
- return json_obj['generated_text']
134
- elif 'error' in json_obj:
135
- return json_obj['error'] + ' Please refresh and try again with smaller input prompt'
136
- else:
137
- print(f"Unexpected response: {json_obj}")
138
- except json.JSONDecodeError:
139
- print(f"Failed to decode response as JSON: {response.text}")
140
- else:
141
- print(f"Request failed with status code {response.status_code}")
142
 
 
143
 
144
- def vote(data: gr.LikeData):
145
- if data.liked:
146
- print("You upvoted this response: " + data.value)
147
- else:
148
- print("You downvoted this response: " + data.value)
149
-
150
-
151
- additional_inputs=[
152
- gr.Textbox("", label="Optional system prompt"),
153
- gr.Slider(
154
- label="Temperature",
155
- value=0.9,
156
- minimum=0.0,
157
- maximum=1.0,
158
- step=0.05,
159
- interactive=True,
160
- info="Higher values produce more diverse outputs",
161
- ),
162
- gr.Slider(
163
- label="Max new tokens",
164
- value=256,
165
- minimum=0,
166
- maximum=4096,
167
- step=64,
168
- interactive=True,
169
- info="The maximum numbers of new tokens",
170
- ),
171
- gr.Slider(
172
- label="Top-p (nucleus sampling)",
173
- value=0.6,
174
- minimum=0.0,
175
- maximum=1,
176
- step=0.05,
177
- interactive=True,
178
- info="Higher values sample more low-probability tokens",
179
- ),
180
- gr.Slider(
181
- label="Repetition penalty",
182
- value=1.2,
183
- minimum=1.0,
184
- maximum=2.0,
185
- step=0.05,
186
- interactive=True,
187
- info="Penalize repeated tokens",
188
  )
189
- ]
190
-
191
- chatbot_stream = gr.Chatbot(avatar_images=('user.png', 'bot2.png'),bubble_full_width = False)
192
- chatbot_batch = gr.Chatbot(avatar_images=('user1.png', 'bot1.png'),bubble_full_width = False)
193
- chat_interface_stream = gr.ChatInterface(predict,
194
- title=title,
195
- description=description,
196
- chatbot=chatbot_stream,
197
- css=css,
198
- examples=examples,
199
- cache_examples=True,
200
- additional_inputs=additional_inputs,)
201
- chat_interface_batch = gr.ChatInterface(predict_batch,
202
- title=title,
203
- description=description,
204
- chatbot=chatbot_batch,
205
- css=css,
206
- examples=examples,
207
- cache_examples=True,
208
- additional_inputs=additional_inputs,)
209
-
210
- # Gradio Demo
211
- with gr.Blocks() as demo:
212
-
213
- with gr.Tab("Streaming"):
214
- #gr.ChatInterface(predict, title=title, description=description, css=css, examples=examples, cache_examples=True, additional_inputs=additional_inputs,)
215
- chatbot_stream.like(vote, None, None)
216
- chat_interface_stream.render()
217
-
218
- with gr.Tab("Batch"):
219
- #gr.ChatInterface(predict_batch, title=title, description=description, css=css, examples=examples, cache_examples=True, additional_inputs=additional_inputs,)
220
- chatbot_batch.like(vote, None, None)
221
- chat_interface_batch.render()
222
-
223
- demo.queue(concurrency_count=75, max_size=100).launch(debug=True)
 
1
+ import asyncio
  import os
+ import threading
+ from threading import Event
+ from typing import Optional
+
+ import discord
+ import gradio as gr
+ from discord import Permissions
+ from discord.ext import commands
+ from discord.utils import oauth_url
+
+ import gradio_client as grc
+ from gradio_client.utils import QueueError
+
+ event = Event()
+
+ DISCORD_TOKEN = os.getenv("DISCORD_TOKEN")
 
 
 
 
 
 
 
 
 
 
 
 
19
 
20
 
21
async def wait(job):
    """Poll a gradio_client job until it completes, without blocking the loop.

    Sleeps 0.2 s between polls so the Discord bot's asyncio event loop stays
    responsive while the (thread-backed) gradio job runs.
    """
    while not job.done():
        await asyncio.sleep(0.2)
24
 
25
+
26
+ def get_client(session: Optional[str] = None) -> grc.Client:
+     client = grc.Client("https://tuyendragon-echo-chatbot.hf.space", hf_token=os.getenv("HF_TOKEN"))
+     if session:
+         client.session_hash = session
+     return client
31
+
32
+
33
def truncate_response(response: str) -> str:
    """Truncate *response* to at most 2000 characters (Discord's message limit).

    If the text exceeds the limit, it is cut and a notice is appended so the
    final message is exactly 2000 characters; otherwise it is returned as-is.
    """
    ending = "...\nTruncating response to 2000 characters due to discord api limits."
    if len(response) > 2000:
        # Reserve room for the notice so the combined text still fits the limit.
        return response[: 2000 - len(ending)] + ending
    else:
        return response
39
+
40
+
41
+ intents = discord.Intents.default()
+ intents.message_content = True
+ bot = commands.Bot(command_prefix="/", intents=intents)
44
+
45
+
46
+ @bot.event
+ async def on_ready():
+     print(f"Logged in as {bot.user} (ID: {bot.user.id})")
+     synced = await bot.tree.sync()
+     print(f"Synced commands: {', '.join([s.name for s in synced])}.")
+     event.set()
+     print("------")
53
+
54
+
55
+ thread_to_client = {}
+ thread_to_user = {}
57
+
58
+
59
+ @bot.hybrid_command(
+     name="chat",
+     description="Enter some text to chat with the bot! Like this: /chat Hello, how are you?",
+ )
+ async def chat(ctx, prompt: str):
+     if ctx.author.id == bot.user.id:
+         return
+     try:
+         message = await ctx.send("Creating thread...")
+
+         thread = await message.create_thread(name=prompt)
+         loop = asyncio.get_running_loop()
+         client = await loop.run_in_executor(None, get_client, None)
+         job = client.submit(prompt, api_name="/chat")
+         await wait(job)
+
+         try:
+             job.result()
+             response = job.outputs()[-1]
+             await thread.send(truncate_response(response))
+             thread_to_client[thread.id] = client
+             thread_to_user[thread.id] = ctx.author.id
+         except QueueError:
+             await thread.send(
+                 "The gradio space powering this bot is really busy! Please try again later!"
+             )
+
+     except Exception as e:
+         print(f"{e}")
88
+
89
+
90
+ async def continue_chat(message):
+     """Continues a given conversation based on chathistory"""
+     try:
+         client = thread_to_client[message.channel.id]
+         prompt = message.content
+         job = client.submit(prompt, api_name="/chat")
+         await wait(job)
+         try:
+             job.result()
+             response = job.outputs()[-1]
+             await message.reply(truncate_response(response))
+         except QueueError:
+             await message.reply(
+                 "The gradio space powering this bot is really busy! Please try again later!"
+             )
+
+     except Exception as e:
+         print(f"Error: {e}")
108
+
109
+
110
+ @bot.event
+ async def on_message(message):
+     """Continue the chat"""
+     try:
+         if not message.author.bot:
+             if message.channel.id in thread_to_user:
+                 if thread_to_user[message.channel.id] == message.author.id:
+                     await continue_chat(message)
+             else:
+                 await bot.process_commands(message)
+
+     except Exception as e:
+         print(f"Error: {e}")
123
+
124
+
125
+ # running in thread
+ def run_bot():
+     if not DISCORD_TOKEN:
+         print("DISCORD_TOKEN NOT SET")
+         event.set()
+     else:
+         bot.run(DISCORD_TOKEN)
132
+
133
+
134
+ threading.Thread(target=run_bot).start()
+
+ event.wait()
137
+
138
+ if not DISCORD_TOKEN:
+     welcome_message = """
+
+ ## You have not specified a DISCORD_TOKEN, which means you have not created a bot account. Please follow these steps:
+
+ ### 1. Go to https://discord.com/developers/applications and click 'New Application'
+
+ ### 2. Give your bot a name 🤖
+
+ ![](https://gradio-builds.s3.amazonaws.com/demo-files/discordbots/BotName.png)
+
+ ## 3. In Settings > Bot, click the 'Reset Token' button to get a new token. Write it down and keep it safe 🔐
+
+ ![](https://gradio-builds.s3.amazonaws.com/demo-files/discordbots/ResetToken.png)
+
+ ## 4. Optionally make the bot public if you want anyone to be able to add it to their servers
+
+ ## 5. Scroll down and enable 'Message Content Intent' under 'Privileged Gateway Intents'
+
+ ![](https://gradio-builds.s3.amazonaws.com/demo-files/discordbots/MessageContentIntent.png)
+
+ ## 6. Save your changes!
+
+ ## 7. The token from step 3 is the DISCORD_TOKEN. Rerun the deploy_discord command, e.g client.deploy_discord(discord_bot_token=DISCORD_TOKEN, ...), or add the token as a space secret manually.
+ """
+ else:
+     permissions = Permissions(326417525824)
+     url = oauth_url(bot.user.id, permissions=permissions)
+     welcome_message = f"""
+ ## Add this bot to your server by clicking this link:
+
+ {url}
+
+ ## How to use it?
+
+ The bot can be triggered via `/chat` followed by your text prompt.
+
+ This will create a thread with the bot's response to your text prompt.
+ You can reply in the thread (without `/chat`) to continue the conversation.
+ In the thread, the bot will only reply to the original author of the command.
+
+ ⚠️ Note ⚠️: Please make sure this bot's command does not have the same name as another command in your server.
+
+ ⚠️ Note ⚠️: Bot commands do not work in DMs with the bot as of now.
+ """
183
+
184
+
185
+ with gr.Blocks() as demo:
+     gr.Markdown(
+         f"""
+ # Discord bot of https://tuyendragon-echo-chatbot.hf.space
+ {welcome_message}
+ """
+     )
+
+ demo.launch()