| import gradio as gr | |
| import torch | |
| import random | |
| from transformers import T5Tokenizer, T5ForConditionalGeneration | |
# Choose the compute device before loading the weights so that the weight
# dtype can be matched to what the device handles well.
if torch.cuda.is_available():
    device = "cuda"
    print("Using GPU")
else:
    device = "cpu"
    print("Using CPU")

# Half precision roughly halves memory use on GPU. On CPU, float16 is slow
# and, depending on the PyTorch version, some ops are not implemented for it,
# so full precision is used there instead.
model_dtype = torch.float16 if device == "cuda" else torch.float32

tokenizer = T5Tokenizer.from_pretrained("google/flan-t5-small")
model = T5ForConditionalGeneration.from_pretrained(
    "roborovski/superprompt-v1", torch_dtype=model_dtype
)
model.to(device)
def generate(
    prompt,
    history,
    max_new_tokens,
    repetition_penalty,
    temperature,
    top_p,
    top_k,
    random_seed,
    seed,
):
    """Generate an expanded version of ``prompt`` with the module-level model.

    Args:
        prompt: The user's current message.
        history: Earlier chat turns. Kept in the signature because the chat
            callback receives it, but it is not fed to the model (see below).
        max_new_tokens: Upper bound on the number of generated tokens.
        repetition_penalty: Penalty applied to already generated tokens.
        temperature: Sampling temperature.
        top_p: Nucleus-sampling probability mass.
        top_k: Number of highest-probability tokens kept for sampling.
        random_seed: When truthy, ignore ``seed`` and draw a random one.
        seed: Seed for the torch RNG when ``random_seed`` is falsy.

    Returns:
        The decoded generation as a string, without special tokens.
    """
    # Only the current message is tokenized. Interpolating `history` into the
    # text would append the Python repr of a list (", []" on the first turn),
    # which is noise rather than usable context for the model.
    input_ids = tokenizer(prompt, return_tensors="pt").input_ids.to(device)

    # An emptied seed field arrives as None; fall back to a random seed
    # instead of failing inside torch.manual_seed.
    if random_seed or seed is None:
        seed = random.randint(1, 100000)
    # NOTE(review): this seeds the process-wide torch RNG; with concurrent
    # requests, reproducibility per seed is presumably not guaranteed.
    torch.manual_seed(int(seed))

    # UI widgets may deliver ints where floats are expected and vice versa;
    # coerce explicitly so the sampling arguments have the expected types.
    outputs = model.generate(
        input_ids,
        max_new_tokens=int(max_new_tokens),
        repetition_penalty=float(repetition_penalty),
        do_sample=True,
        temperature=float(temperature),
        top_p=float(top_p),
        top_k=int(top_k),
    )

    # Strip markers such as <pad> and </s> so they do not show up in the chat.
    return tokenizer.decode(outputs[0], skip_special_tokens=True)
# Checkbox that switches between a freshly drawn seed and the manual seed.
use_random_seed = gr.Checkbox(
    value=False,
    label="Use Random Seed",
    info="Check to use a random seed which is a start point for the generation process",
)

# Extra controls passed to `generate` after (prompt, history), in this order:
# max_new_tokens, repetition_penalty, temperature, top_p, top_k,
# random_seed, seed.
additional_inputs = [
    gr.Slider(
        value=512,
        minimum=250,
        maximum=512,
        step=1,
        interactive=True,
        label="Max New Tokens",
        info="The maximum numbers of new tokens, controls how long is the output",
    ),
    gr.Slider(
        value=1.2,
        # The penalty must be strictly positive, so 0 is not offered.
        minimum=0.05,
        maximum=2,
        step=0.05,
        interactive=True,
        label="Repetition Penalty",
        info="Penalize repeated tokens, making the AI repeat less itself",
    ),
    gr.Slider(
        value=0.5,
        # Sampling needs a strictly positive temperature, so 0 is not offered.
        minimum=0.05,
        maximum=1,
        step=0.05,
        interactive=True,
        label="Temperature",
        info="Higher values produce more diverse outputs",
    ),
    gr.Slider(
        value=1,
        # top_p is a probability mass: valid values lie in (0, 1].
        minimum=0.05,
        maximum=1,
        step=0.05,
        interactive=True,
        label="Top P",
        info="Higher values sample more low-probability tokens",
    ),
    gr.Slider(
        value=1,
        minimum=1,
        maximum=100,
        step=1,
        interactive=True,
        label="Top K",
        info="Higher k means more diverse outputs by considering a range of tokens",
    ),
    use_random_seed,
    gr.Number(
        value=42,
        # Round to a whole number so the seed arrives as an integer.
        precision=0,
        interactive=True,
        label="Manual Seed",
        info="A starting point to initiate the generation process",
        # `visible` takes a plain boolean fixed at build time. It cannot track
        # the checkbox state from here; hiding the field dynamically would
        # need an event handler on the checkbox.
        visible=True,
    ),
]
# One sample row for the chat UI: the message followed by a value for each
# additional input (max new tokens, repetition penalty, temperature, top p,
# top k, use-random-seed flag, manual seed).
_EXAMPLE_MESSAGE = (
    "Expand the following prompt to add more detail: "
    "A storefront with 'Text to Image' written on it."
)
examples = [[_EXAMPLE_MESSAGE, 512, 1.2, 0.5, 1, 50, False, 42]]
# Chat display widget: panel layout with copy and like buttons, no label and
# no share button.
chat_display = gr.Chatbot(
    show_label=False,
    show_share_button=False,
    show_copy_button=True,
    likeable=True,
    layout="panel",
)

# Wire the generation callback, the extra controls and the sample row into a
# chat UI, then start the server with the API page turned off.
demo = gr.ChatInterface(
    fn=generate,
    chatbot=chat_display,
    additional_inputs=additional_inputs,
    title="SuperPrompt-v1",
    description="Make your prompts more detailed!",
    examples=examples,
    concurrency_limit=20,
)
demo.launch(show_api=False)
 
			
