GaiaMiniMed

Runtime error

File size: 1,604 Bytes

f93c2ca
 
 
 
d0dbbcc
f93c2ca
7d36a00
f93c2ca
 
 
00e2bc7
3755403
f93c2ca
 
d0dbbcc
 
 
00e2bc7
d0dbbcc
00e2bc7
 
f93c2ca
d0dbbcc
 
f93c2ca
d0dbbcc
 
a369bf4
d0dbbcc
5debb29
d0dbbcc
 
 
 
 
 
 
 
5debb29
f93c2ca
 
 
 
 
 
d0dbbcc
 
55976ec
d0dbbcc

from transformers import AutoModelForCausalLM, AutoTokenizer
import gradio as gr
import torch


# Text shown in the web UI.
title = "EZChat"
description = (
    "A State-of-the-Art Large-scale Pretrained Response generation model (DialoGPT-medium)"
)
# Sample prompt(s) handed to the interface as clickable examples.
examples = [["How are you?"]]


# The tokenizer and the model are loaded from the same checkpoint name.
_CHECKPOINT = "microsoft/DialoGPT-medium"
tokenizer = AutoTokenizer.from_pretrained(_CHECKPOINT, padding_side="left")
model = AutoModelForCausalLM.from_pretrained(_CHECKPOINT)


def predict(input, history=None):
    """Generate the bot's next reply and return the updated conversation.

    Args:
        input: The user's new message as plain text.
        history: Token ids of the conversation so far, in the nested-list
            form returned by a previous call to this function
            (``model.generate(...).tolist()``). ``None`` or an empty list
            starts a new conversation.

    Returns:
        A ``(response, history)`` tuple. ``response`` is a list of
        ``(user_text, bot_text)`` pairs covering the whole conversation, and
        ``history`` is the nested list of token ids produced by
        ``model.generate``, to be passed back in on the next call.
    """
    # Tokenize the new user turn, terminated by EOS so turns stay separable.
    # A single sequence needs no padding, so none is requested.
    # NOTE(review): the tokenizer loaded in this file may not define a pad
    # token, in which case asking for padding would raise -- confirm.
    new_user_input_ids = tokenizer.encode(
        input + tokenizer.eos_token, truncation=True, return_tensors="pt"
    )

    # Append the new user tokens to the chat history, if there is any.
    if history:
        bot_input_ids = torch.cat(
            [torch.LongTensor(history), new_user_input_ids], dim=-1
        )
    else:
        bot_input_ids = new_user_input_ids

    # The prompt contains no padding, so every position is attended to.
    attention_mask = torch.ones_like(bot_input_ids)

    # Generate a response; the output holds the prompt followed by the reply.
    history = model.generate(
        bot_input_ids,
        attention_mask=attention_mask,
        max_length=4000,
        pad_token_id=tokenizer.eos_token_id,
    ).tolist()

    # Decode the whole conversation and split it into individual turns.
    turns = tokenizer.decode(history[0]).split("<|endoftext|>")
    # Pair consecutive turns as (user, bot); an unpaired trailing piece
    # (e.g. the empty string after the final EOS) is dropped by zip.
    response = list(zip(turns[0::2], turns[1::2]))
    return response, history


# Wire predict() into a Gradio interface: it receives the text box content
# and the stored state, and returns the chatbot transcript and the new state.
demo = gr.Interface(
    fn=predict,
    inputs=["text", "state"],
    outputs=["chatbot", "state"],
    title=title,
    description=description,
    examples=examples,
    theme="ParityError/Anime",
)

# Start serving the app.
demo.launch()