Spaces:

rodrisouza
/

demo-chatbot-v3

Configuration error

App Files Files Community

rodrisouza committed on Jul 10, 2024

Commit

58cb3d4

verified ·

1 Parent(s): 88720d3

Update app.py

Browse files

Files changed (1) hide show

app.py +206 -62

app.py CHANGED Viewed

@@ -1,63 +1,207 @@
 import gradio as gr
-from huggingface_hub import InferenceClient
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
-client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
-def respond(
-    message,
-    history: list[tuple[str, str]],
-    system_message,
-    max_tokens,
-    temperature,
-    top_p,
-):
-    messages = [{"role": "system", "content": system_message}]
-    for val in history:
-        if val[0]:
-            messages.append({"role": "user", "content": val[0]})
-        if val[1]:
-            messages.append({"role": "assistant", "content": val[1]})
-    messages.append({"role": "user", "content": message})
-    response = ""
-    for message in client.chat_completion(
-        messages,
-        max_tokens=max_tokens,
-        stream=True,
-        temperature=temperature,
-        top_p=top_p,
-    ):
-        token = message.choices[0].delta.content
-        response += token
-        yield response
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
-demo = gr.ChatInterface(
-    respond,
-    additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
-        gr.Slider(
-            minimum=0.1,
-            maximum=1.0,
-            value=0.95,
-            step=0.05,
-            label="Top-p (nucleus sampling)",
-        ),
-    ],
-)
-if __name__ == "__main__":
-    demo.launch()

+import os
 import gradio as gr
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import pandas as pd
+from datetime import datetime, timedelta, timezone
+import torch
+from config import hugging_face_token, init_google_sheets_client, models, default_model_name, user_names, google_sheets_name
+import spaces
+# Hack for ZeroGPU
+# Replaces torch.jit.script with an identity function, so any caller gets its
+# plain Python callable back unchanged instead of a scripted version.
+torch.jit.script = lambda f: f
+# Initialize Google Sheets client
+# NOTE: these calls run at import time; init_google_sheets_client and
+# google_sheets_name are provided by the config module.
+client = init_google_sheets_client()
+sheet = client.open(google_sheets_name)
+stories_sheet = sheet.get_worksheet(1)  # Assuming stories are in the second sheet (index 1)
+# Load stories from Google Sheets
+def load_stories():
+    stories_data = stories_sheet.get_all_values()
+    stories = [{"title": story[0], "story": story[1]} for story in stories_data if story[0] != "Title"]  # Skip header row
+    return stories
+# Load available stories
+# Fetched once at import time; the story dropdown and send_selected_story read this list.
+stories = load_stories()
+# Initialize the selected model
+# Name (a key of `models`) of the model currently in use; load_model updates it.
+selected_model = default_model_name
+tokenizer, model = None, None
+# Initialize the data list
+# Rows of saved scores/comments; save_comment_score appends to it and
+# send_selected_story resets it.
+data = []
+# Load the model and tokenizer once at the beginning
+def load_model(model_name):
+    global tokenizer, model, selected_model
+    try:
+        # Release the memory of the previous model if exists
+        if model is not None:
+            del model
+            torch.cuda.empty_cache()
+        tokenizer = AutoTokenizer.from_pretrained(models[model_name], padding_side='left', token=hugging_face_token, trust_remote_code=True)
+        # Ensure the padding token is set
+        if tokenizer.pad_token is None:
+            tokenizer.pad_token = tokenizer.eos_token
+            tokenizer.add_special_tokens({'pad_token': tokenizer.eos_token})
+        model = AutoModelForCausalLM.from_pretrained(models[model_name], token=hugging_face_token, trust_remote_code=True).to("cuda")
+        selected_model = model_name
+    except Exception as e:
+        print(f"Error loading model {model_name}: {e}")
+        raise e
+    return tokenizer, model
+# Ensure the initial model is loaded
+# Done eagerly at import time; load_model re-raises on failure, so the app
+# does not start unless the default model loads.
+tokenizer, model = load_model(selected_model)
+# Chat history
+# Module-level conversation state; send_selected_story rebinds it via `global`.
+# NOTE(review): this looks shared by every session of the app -- confirm that is intended.
+chat_history = []
+# Function to handle interaction with model
+@spaces.GPU
+def interact(user_input, history):
+    global tokenizer, model
+    try:
+        if tokenizer is None or model is None:
+            raise ValueError("Tokenizer or model is not initialized.")
+        messages = history + [{"role": "user", "content": user_input}]
+        # Ensure roles alternate correctly
+        for i in range(1, len(messages)):
+            if messages[i-1].get("role") == messages[i].get("role"):
+                raise ValueError("Conversation roles must alternate user/assistant/user/assistant/...")
+        prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
+        # Generate response using selected model
+        input_ids = tokenizer(prompt, return_tensors='pt').input_ids.to("cuda")
+        chat_history_ids = model.generate(input_ids, max_new_tokens=100, pad_token_id=tokenizer.eos_token_id)  # Increase max_new_tokens
+        response = tokenizer.decode(chat_history_ids[:, input_ids.shape[-1]:][0], skip_special_tokens=True)
+        # Update chat history with generated response
+        history.append({"role": "user", "content": user_input})
+        history.append({"role": "assistant", "content": response})
+        formatted_history = [(entry["content"], None) if entry["role"] == "user" else (None, entry["content"]) for entry in history if entry["role"] in ["user", "assistant"]]
+        return "", formatted_history, history
+    except Exception as e:
+        if torch.cuda.is_available():
+            torch.cuda.empty_cache()
+        print(f"Error during interaction: {e}")
+        raise gr.Error(f"An error occurred during interaction: {str(e)}")
+# Function to send selected story and initial message
+def send_selected_story(title, model_name, system_prompt):
+    global chat_history
+    global selected_story
+    global data  # Ensure data is reset
+    data = []  # Reset data for new story
+    tokenizer, model = load_model(model_name)
+    selected_story = title
+    for story in stories:
+        if story["title"] == title:
+            system_prompt = f"""
+{system_prompt}
+Here is the story:
+---
+{story['story']}
+---
+            """
+            combined_message = system_prompt.strip()
+            if combined_message:
+                chat_history = []  # Reset chat history
+                chat_history.append({"role": "system", "content": combined_message})
+                # Generate the first question based on the story
+                question_prompt = "Please ask a simple question about the story to encourage interaction."
+                _, formatted_history, chat_history = interact(question_prompt, chat_history)
+                return formatted_history, chat_history, gr.update(value=[])  # Reset the data table
+            else:
+                print("Combined message is empty.")
+        else:
+            print("Story title does not match.")
+# Function to save comment and score
+def save_comment_score(chat_responses, score, comment, story_name, user_name):
+    last_user_message = ""
+    last_assistant_message = ""
+    # Find the last user and assistant messages
+    for message in reversed(chat_responses):
+        if isinstance(message, list) and len(message) == 2:
+            if message[0] and not last_user_message:
+                last_user_message = message[0]
+            elif message[1] and not last_assistant_message:
+                last_assistant_message = message[1]
+        if last_user_message and last_assistant_message:
+            break
+    timestamp = datetime.now(timezone.utc) - timedelta(hours=3)  # Adjust to GMT-3
+    timestamp_str = timestamp.strftime("%Y-%m-%d %H:%M:%S")
+    model_name = selected_model
+    # Append data to local data storage
+    data.append([
+        timestamp_str,
+        user_name,
+        model_name,
+        story_name,
+        last_user_message,
+        last_assistant_message,
+        score,
+        comment
+    ])
+    # Append data to Google Sheets
+    sheet = client.open(google_sheets_name).sheet1  # Assuming results are saved in sheet1
+    sheet.append_row([timestamp_str, user_name, model_name, story_name, last_user_message, last_assistant_message, score, comment])
+    df = pd.DataFrame(data, columns=["Timestamp", "User Name", "Model Name", "Story Name", "User Input", "Chat Response", "Score", "Comment"])
+    return df, gr.update(value="")  # Clear the comment input box
+# Create the chat interface using Gradio Blocks
+with gr.Blocks() as demo:
+    gr.Markdown("# Chat with Model")
+    # Selection controls: model, user name, and story.
+    model_dropdown = gr.Dropdown(choices=list(models.keys()), label="Select Model", value=selected_model)
+    user_dropdown = gr.Dropdown(choices=user_names, label="Select User Name")
+    # Preselect the first story when any were loaded.
+    initial_story = stories[0]["title"] if stories else None
+    story_dropdown = gr.Dropdown(choices=[story["title"] for story in stories], label="Select Story", value=initial_story)
+    # Editable default instructions; send_selected_story places them before the story text.
+    default_system_prompt = ("You are friendly chatbot and you will interact with a child who speaks Spanish and is learning English as a foreign language. "
+                             "Everything you write should be in English. I will provide you with a short children's story in English. "
+                             "After reading the story, please ask the child a series of five simple questions about it, one at a time, to encourage ongoing interaction. "
+                             "Wait for the child's response to each question before asking the next one.")
+    system_prompt_input = gr.Textbox(lines=5, value=default_system_prompt, label="System Prompt")
+    send_story_button = gr.Button("Send Story")
+    # Chat area: message input on the left, conversation on the right.
+    with gr.Row():
+        with gr.Column(scale=1):
+            chatbot_input = gr.Textbox(placeholder="Type your message here...", label="User Input")
+            send_message_button = gr.Button("Send")
+        with gr.Column(scale=2):
+            chatbot_output = gr.Chatbot(label="Chat History")
+    # Rating controls for the latest exchange.
+    with gr.Row():
+        with gr.Column(scale=1):
+            score_input = gr.Slider(minimum=0, maximum=5, step=1, label="Score")
+            comment_input = gr.Textbox(placeholder="Add a comment...", label="Comment")
+            save_button = gr.Button("Save Score and Comment")
+    data_table = gr.DataFrame(headers=["Timestamp", "User Name", "Model Name", "Story Name", "User Input", "Chat Response", "Score", "Comment"])
+    # Hidden component carrying the role/content message list between callbacks.
+    chat_history_json = gr.JSON(value=[], visible=False)
+    # Wire the buttons to their handlers.
+    send_story_button.click(fn=send_selected_story, inputs=[story_dropdown, model_dropdown, system_prompt_input], outputs=[chatbot_output, chat_history_json, data_table])
+    send_message_button.click(fn=interact, inputs=[chatbot_input, chat_history_json], outputs=[chatbot_input, chatbot_output, chat_history_json])
+    save_button.click(fn=save_comment_score, inputs=[chatbot_output, score_input, comment_input, story_dropdown, user_dropdown], outputs=[data_table, comment_input])
+# Start the app; this runs at import time because there is no __main__ guard.
+demo.launch()