min-dalle

Runtime error

App Files Files Community

abidlabs HF Staff

kuprel commited on Dec 20, 2022

Commit

0f51c59

0 Parent(s):

Duplicate from kuprel/min-dalle

Browse files

Co-authored-by: Brett Kuprel <[email protected]>

Files changed (21) hide show

.gitattributes +27 -0
.gitignore +19 -0
README.md +16 -0
app.py +203 -0
examples/astronaut-horse.jpg +0 -0
examples/astronaut-mars.jpg +0 -0
examples/cleopatra-iphone.jpg +0 -0
examples/dali-walle.jpg +0 -0
examples/elmo-riot.jpg +0 -0
examples/funeral-whole-foods.jpg +0 -0
examples/godzilla-trial.jpg +0 -0
examples/gollum.jpg +0 -0
examples/jesus-talent.jpg +0 -0
examples/lofi-nuclear-war.jpg +0 -0
examples/marx-slimed.jpg +0 -0
examples/moai-statue.jpg +0 -0
examples/nuclear-broccoli.jpg +0 -0
examples/rusty-iron-man.jpg +0 -0
examples/scientists-rhyme.jpg +0 -0
examples/singularity.jpg +0 -0
requirements.txt +5 -0

.gitattributes ADDED Viewed

	@@ -0,0 +1,27 @@

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zstandard filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1,19 @@

+**/__pycache__/
+**/.cache/
+**/*.pkl
+**/.DS*
+**/*.pt
+*.mlpackage
+**/*.ckpt
+.vscode
+**/.ipynb_checkpoints
+**/generated
+**/pretrained
+**/*.msgpack
+*.egg-info/
+*.egg
+dist
+build
+README
+.cog
+cog

README.md ADDED Viewed

	@@ -0,0 +1,16 @@

+---
+title: min(DALL·E)
+metaTitle: min(DALL·E)
+emoji: ⚡️ 🥑 ⚡️
+colorFrom: yellow
+colorTo: green
+sdk: gradio
+sdk_version: 3.3.1
+app_file: app.py
+pinned: true
+license: mit
+python_version: 3.10.5
+models:
+- kuprel/min-dalle
+duplicated_from: kuprel/min-dalle
+---

app.py ADDED Viewed

	@@ -0,0 +1,203 @@

+import gradio
+import subprocess
+from PIL import Image
+import torch, torch.backends.cudnn, torch.backends.cuda
+from min_dalle import MinDalle
+from emoji import demojize
+import string
+def filename_from_text(text: str) -> str:
+    text = demojize(text, delimiters=['', ''])
+    text = text.lower().encode('ascii', errors='ignore').decode()
+    allowed_chars = string.ascii_lowercase + ' '
+    text = ''.join(i for i in text.lower() if i in allowed_chars)
+    text = text[:64]
+    text = '-'.join(text.strip().split())
+    if len(text) == 0: text = 'blank'
+    return text
+def log_gpu_memory():
+    print(subprocess.check_output('nvidia-smi').decode('utf-8'))
+log_gpu_memory()
+model = MinDalle(
+    is_mega=True,
+    is_reusable=True,
+    device='cuda',
+    dtype=torch.float32
+)
+log_gpu_memory()
+def run_model(
+    text: str,
+    grid_size: int,
+    is_seamless: bool,
+    save_as_png: bool,
+    temperature: float,
+    supercondition: str,
+    top_k: str
+) -> str:
+    torch.set_grad_enabled(False)
+    torch.backends.cudnn.enabled = True
+    torch.backends.cudnn.deterministic = False
+    torch.backends.cudnn.benchmark = True
+    torch.backends.cuda.matmul.allow_tf32 = True
+    torch.backends.cuda.matmul.allow_fp16_reduced_precision_reduction = True
+    print('text:', text)
+    print('grid_size:', grid_size)
+    print('is_seamless:', is_seamless)
+    print('temperature:', temperature)
+    print('supercondition:', supercondition)
+    print('top_k:', top_k)
+    try:
+        temperature = float(temperature)
+        assert(temperature > 1e-6)
+    except:
+        raise Exception('Temperature must be a positive nonzero number')
+    try:
+        grid_size = int(grid_size)
+        assert(grid_size <= 5)
+        assert(grid_size >= 1)
+    except:
+        raise Exception('Grid size must be between 1 and 5')
+    try:
+        top_k = int(top_k)
+        assert(top_k <= 16384)
+        assert(top_k >= 1)
+    except:
+        raise Exception('Top k must be between 1 and 16384')
+    with torch.no_grad():
+        image = model.generate_image(
+            text = text,
+            seed = -1,
+            grid_size = grid_size,
+            is_seamless = bool(is_seamless),
+            temperature = temperature,
+            supercondition_factor = float(supercondition),
+            top_k = top_k,
+            is_verbose = True
+        )
+    log_gpu_memory()
+    ext = 'png' if bool(save_as_png) else 'jpg'
+    filename = filename_from_text(text)
+    image_path = '{}.{}'.format(filename, ext)
+    image.save(image_path)
+    return image_path
+demo = gradio.Blocks(analytics_enabled=True)
+with demo:
+    with gradio.Row():
+        with gradio.Column():
+            input_text = gradio.Textbox(
+                label='Input Text',
+                value='Moai statue giving a TED Talk',
+                lines=3
+            )
+            run_button = gradio.Button(value='Generate Image').style(full_width=True)
+            output_image = gradio.Image(
+                value='examples/moai-statue.jpg',
+                label='Output Image',
+                type='file',
+                interactive=False
+            )
+        with gradio.Column():
+            gradio.Markdown('## Settings')
+            with gradio.Row():
+                grid_size = gradio.Slider(
+                    label='Grid Size',
+                    value=5,
+                    minimum=1,
+                    maximum=5,
+                    step=1
+                )
+                save_as_png = gradio.Checkbox(
+                    label='Output PNG',
+                    value=False
+                )
+                is_seamless = gradio.Checkbox(
+                    label='Seamless',
+                    value=False
+                )
+            gradio.Markdown('#### Advanced')
+            with gradio.Row():
+                temperature = gradio.Number(
+                    label='Temperature',
+                    value=1
+                )
+                top_k = gradio.Dropdown(
+                    label='Top-k',
+                    choices=[str(2 ** i) for i in range(15)],
+                    value='128'
+                )
+                supercondition = gradio.Dropdown(
+                    label='Super Condition',
+                    choices=[str(2 ** i) for i in range(2, 7)],
+                    value='16'
+                )
+            gradio.Markdown(
+                """
+                ####
+                - **Input Text**: For long prompts, only the first 64 text tokens will be used to generate the image.
+                - **Grid Size**: Size of the image grid. 3x3 takes about 15 seconds.
+                - **Seamless**: Tile images in image token space instead of pixel space.
+                - **Temperature**: High temperature increases the probability of sampling low scoring image tokens.
+                - **Top-k**: Each image token is sampled from the top-k scoring tokens.
+                - **Super Condition**: Higher values can result in better agreement with the text.
+                """
+            )
+    gradio.Examples(
+        examples=[
+            ['Rusty Iron Man suit found abandoned in the woods being reclaimed by nature', 3, 'examples/rusty-iron-man.jpg'],
+            ['Moai statue giving a TED Talk', 5, 'examples/moai-statue.jpg'],
+            ['Court sketch of Godzilla on trial', 5, 'examples/godzilla-trial.jpg'],
+            ['lofi nuclear war to relax and study to', 5, 'examples/lofi-nuclear-war.jpg'],
+            ['Karl Marx slimed at Kids Choice Awards', 4, 'examples/marx-slimed.jpg'],
+            ['Scientists trying to rhyme orange with banana', 4, 'examples/scientists-rhyme.jpg'],
+            ['Jesus turning water into wine on Americas Got Talent', 5, 'examples/jesus-talent.jpg'],
+            ['Elmo in a street riot throwing a Molotov cocktail, hyperrealistic', 5, 'examples/elmo-riot.jpg'],
+            ['Trail cam footage of gollum eating watermelon', 4, 'examples/gollum.jpg'],
+            ['Funeral at Whole Foods', 4, 'examples/funeral-whole-foods.jpg'],
+            ['Singularity, hyperrealism', 5, 'examples/singularity.jpg'],
+            ['Astronaut riding a horse hyperrealistic', 5, 'examples/astronaut-horse.jpg'],
+            ['An astronaut walking on Mars next to a Starship rocket, realistic', 5, 'examples/astronaut-mars.jpg'],
+            ['Nuclear explosion broccoli', 4, 'examples/nuclear-broccoli.jpg'],
+            ['Dali painting of WALL·E', 5, 'examples/dali-walle.jpg'],
+            ['Cleopatra checking her iPhone', 4, 'examples/cleopatra-iphone.jpg'],
+        ],
+        inputs=[
+            input_text,
+            grid_size,
+            output_image
+        ],
+        examples_per_page=20
+    )
+    run_button.click(
+        fn=run_model,
+        inputs=[
+            input_text,
+            grid_size,
+            is_seamless,
+            save_as_png,
+            temperature,
+            supercondition,
+            top_k
+        ],
+        outputs=[
+            output_image
+        ]
+    )
+demo.launch()