tombetthauser committed
Commit 7e14edd · Parent: 3491a10

Working artist concept selector

Files changed (1)
  1. app.py +212 -23
app.py CHANGED
@@ -1,32 +1,201 @@
- # !pip install -Uq diffusers transformers
- # !pip install -Uq gradio
- # !pip install -Uq accelerate

- import gradio
- from diffusers import StableDiffusionPipeline as pipeline
  from accelerate import init_empty_weights
  import torch
  import os

- api_key = os.environ['api_key']
- my_token = api_key

- with init_empty_weights():
-     pipe = pipeline.from_pretrained("CompVis/stable-diffusion-v1-4", revision="fp16", torch_dtype=torch.float16, use_auth_token=my_token).to("cuda")

- DROPDOWNS = {
-     "gustav": " by dan mumford and gustav klimt and john harris and jean delville and victo ngai and josan gonzalez",
-     "hayao": " by studio ghibli",
-     "vinny": " painting by Vincent van Gogh",
-     "danny": " drawn by a child",
-     "jeff": " by jeff koons",
- }

- def image_prompt(prompt, dropdown):
-     prompt = prompt + DROPDOWNS[dropdown]
-     return pipe(prompt=prompt, height=512, width=512).images[0]

- with gradio.Blocks(css="""
  #go-button {
  background-color: white;
  border-radius: 0;
@@ -105,11 +274,31 @@ with gradio.Blocks(css="""
  margin-left: auto;
  margin-right: auto;
  }
- """) as demo:
-     dropdown = gradio.Dropdown(["danny", "gustav", "hayao", "vinny", "jeff"], label="choose style...")
      prompt = gradio.Textbox(label="image prompt...", elem_id="input-text")
      output = gradio.Image(elem_id="output-image")
      go_button = gradio.Button("draw it!", elem_id="go-button")
      go_button.click(fn=image_prompt, inputs=[prompt, dropdown], outputs=output)

- demo.launch()

+
+ #@title 1. General Setup
+
+ !pip install -qq diffusers==0.11.1 transformers ftfy accelerate
+ !pip install -Uq diffusers transformers
+ !pip install -Uq gradio
+ !pip install -Uq accelerate
+
+ from diffusers import StableDiffusionPipeline
+ pipeline = StableDiffusionPipeline
+
+ from transformers import CLIPFeatureExtractor, CLIPTextModel, CLIPTokenizer
  from accelerate import init_empty_weights
+ import gradio
  import torch
  import os

+ # FOR DEPLOYMENT: uncomment these and delete the notebook_login() below
+ # api_key = os.environ['api_key']
+ # my_token = api_key

+ from huggingface_hub import notebook_login
+ notebook_login()

+ import PIL
+ from PIL import Image

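+ # Helper used by the optional test cell below: tiles a list of PIL images into a rows x cols grid.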
+ def image_grid(imgs, rows, cols):
+     assert len(imgs) == rows*cols
+
+     w, h = imgs[0].size
+     grid = Image.new('RGB', size=(cols*w, rows*h))
+     grid_w, grid_h = grid.size
+
+     for i, img in enumerate(imgs):
+         grid.paste(img, box=(i%cols*w, i//cols*h))
+     return grid
+
+ pretrained_model_name_or_path = "stabilityai/stable-diffusion-2"
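+ # Base checkpoint that every concept pipe below starts from; each concept only adds
+ # a single extra token embedding on top of this model's text encoder.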
+
+ from IPython.display import Markdown
+ from huggingface_hub import hf_hub_download
+
+
+ #@title 2. Tell it What Concepts to Load
+
+ models_to_load = [
+     "ahx-model-3",
+     "ahx-model-5",
+     "ahx-model-6",
+     "ahx-model-7",
+     "ahx-model-8",
+     "ahx-model-9",
+     "ahx-model-10",
+     "ahx-model-11",
+ ]
+
+ models_to_load = [f"sd-concepts-library/{model}" for model in models_to_load]
+ completed_concept_pipes = {}
+
+
+ #@title 3. Load the Concepts as Distinct Pipes
+
+ for repo_id_embeds in models_to_load:
+     print(f"loading {repo_id_embeds}")
+     print("----------------------")
+     # repo_id_embeds = "sd-concepts-library/ahx-model-3"
+
+     embeds_url = "" #Add the URL or path to a learned_embeds.bin file in case you have one
+     placeholder_token_string = "" #Add what is the token string in case you are uploading your own embed
+
+     downloaded_embedding_folder = "./downloaded_embedding"
+     if not os.path.exists(downloaded_embedding_folder):
+         os.mkdir(downloaded_embedding_folder)
+     if(not embeds_url):
+         embeds_path = hf_hub_download(repo_id=repo_id_embeds, filename="learned_embeds.bin")
+         token_path = hf_hub_download(repo_id=repo_id_embeds, filename="token_identifier.txt")
+         !cp $embeds_path $downloaded_embedding_folder
+         !cp $token_path $downloaded_embedding_folder
+         with open(f'{downloaded_embedding_folder}/token_identifier.txt', 'r') as file:
+             placeholder_token_string = file.read()
+     else:
+         !wget -q -O $downloaded_embedding_folder/learned_embeds.bin $embeds_url
+
+     learned_embeds_path = f"{downloaded_embedding_folder}/learned_embeds.bin"
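+     # learned_embeds.bin holds the concept's single trained token embedding;
+     # token_identifier.txt holds the placeholder token string used in prompts.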
+
+     # ----
+
+     tokenizer = CLIPTokenizer.from_pretrained(
+         pretrained_model_name_or_path,
+         subfolder="tokenizer",
+     )
+     text_encoder = CLIPTextModel.from_pretrained(
+         pretrained_model_name_or_path, subfolder="text_encoder", torch_dtype=torch.float16
+     )
+
+     # ----
+
+     def load_learned_embed_in_clip(learned_embeds_path, text_encoder, tokenizer, token=None):
+         loaded_learned_embeds = torch.load(learned_embeds_path, map_location="cpu")
+
+         # separate token and the embeds
+         trained_token = list(loaded_learned_embeds.keys())[0]
+         embeds = loaded_learned_embeds[trained_token]
+
+         # cast to dtype of text_encoder
+         dtype = text_encoder.get_input_embeddings().weight.dtype
+         embeds.to(dtype)
+
+         # add the token in tokenizer
+         token = token if token is not None else trained_token
+         num_added_tokens = tokenizer.add_tokens(token)
+         if num_added_tokens == 0:
+             raise ValueError(f"The tokenizer already contains the token {token}. Please pass a different `token` that is not already in the tokenizer.")
+
+         # resize the token embeddings
+         text_encoder.resize_token_embeddings(len(tokenizer))
+
+         # get the id for the token and assign the embeds
+         token_id = tokenizer.convert_tokens_to_ids(token)
+         text_encoder.get_input_embeddings().weight.data[token_id] = embeds
+
+     load_learned_embed_in_clip(learned_embeds_path, text_encoder, tokenizer)
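+     # Each concept gets its own tokenizer/text_encoder copy, so every pipe stored
+     # in completed_concept_pipes recognizes exactly one extra style token.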
+
+     # FOR DEPLOYMENT: add use_auth_token=my_token to pipe keyword args
+     # ie --> pipe = pipeline.from_pretrained("CompVis/stable-diffusion-v1-4", revision="fp16", torch_dtype=torch.float16, use_auth_token=my_token).to("cuda")
+     pipe = StableDiffusionPipeline.from_pretrained(
+         pretrained_model_name_or_path,
+         torch_dtype=torch.float16,
+         text_encoder=text_encoder,
+         tokenizer=tokenizer,
+     ).to("cuda")
+
+     completed_concept_pipes[repo_id_embeds] = pipe
+     print("--> complete !")
+     print("----------------------")
+
+
+

+ #@title 4. Print Available Concept Strings
+
+ print("AVAILABLE CONCEPTS TO SELECT FROM")
+ print("copy one and paste below under 'model'")
+ print("------------------------------------------------------")
+ # list(completed_concept_pipes)
+ for model in completed_concept_pipes:
+     print(f"{model}")
+
+
+ #@title 5. Optionally Test without Gradio
+
+ model = "" #@param {type: "string"}
+ prompt = "" #@param {type:"string"}
+
+ if prompt and model:
+     if model not in completed_concept_pipes:
+         raise ValueError("Invalid Model Name")
+
+     model_token = model.split("/")[1]
+     prompt = f"{prompt} in the style of <{model_token}>"
+
+     if model == "sd-concepts-library/ahx-model-5":
+         prompt = f"{prompt} in the style of "
+
+     num_samples = 1
+     num_rows = 1
+
+     all_images = []
+     pipe = completed_concept_pipes[model]
+
+     for _ in range(num_rows):
+         images = pipe(prompt, num_images_per_prompt=num_samples, height=512, width=512, num_inference_steps=30, guidance_scale=7.5).images
+         all_images.extend(images)
+
+     grid = image_grid(all_images, num_samples, num_rows)
+     grid
+
+
+ #@title 6. Define Custom CSS for Gradio
+
+ use_custom_css = True
+
+ gradio_css = """
+ #output-image {
+ border: 1px solid black;
+ background-color: white;
+ width: 500px;
+ display: block;
+ margin-left: auto;
+ margin-right: auto;
+ }
+ """
+
+ gradio_css_alternative = """
  #go-button {
  background-color: white;
  border-radius: 0;

  margin-left: auto;
  margin-right: auto;
  }
+ """
+
+
+ #@title 7. Build and Launch the Gradio Interface
+
+ DROPDOWNS = {}
+
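+ # Map each loaded concept to the suffix appended to the user's prompt; the same
+ # keys are reused to look up the matching pipe in completed_concept_pipes.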
+ for model in models_to_load:
+     token = model.split("/")[1]
+     DROPDOWNS[model] = f" in the style of <{token}>"
+
+ if "sd-concepts-library/ahx-model-5" in DROPDOWNS:
+     DROPDOWNS["sd-concepts-library/ahx-model-5"] = f"{prompt} in the style of "
+
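+ # Gradio callback: append the selected style suffix, then generate with that concept's pipe.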
+ def image_prompt(prompt, dropdown):
+     prompt = prompt + DROPDOWNS[dropdown]
+     pipe = completed_concept_pipes[dropdown]
+     return pipe(prompt=prompt, height=512, width=512).images[0]
+
+ with gradio.Blocks(css=gradio_css if use_custom_css else "") as demo:
+     dropdown = gradio.Dropdown(list(DROPDOWNS), label="choose style...")
      prompt = gradio.Textbox(label="image prompt...", elem_id="input-text")
      output = gradio.Image(elem_id="output-image")
      go_button = gradio.Button("draw it!", elem_id="go-button")
      go_button.click(fn=image_prompt, inputs=[prompt, dropdown], outputs=output)

+ demo.launch(share=True)
+