Commit cb5daed (verified) by adamelliotfields
Parent: c62ffd9

Add AuraSR GAN
Files changed (5):

1. README.md (+8 -4)
2. app.py (+11 -15)
3. cli.py (+4 -0)
4. generate.py (+47 -20)
5. requirements.txt (+1 -0)
README.md CHANGED

@@ -43,7 +43,14 @@ preload_from_hub:
 
 # diffusion
 
-Gradio-based UI for Stable Diffusion pipelines.
+Gradio app for Stable Diffusion 1.5 including:
+* curated models and TI embeddings
+* multiple samplers with Karras schedule
+* Compel prompting
+* 100+ styles from sdxl_prompt_styler
+* AuraSR GAN
+* DeepCache and ToMe
+* optional TAESD
 
 ## Usage
 
@@ -65,8 +72,5 @@ python cli.py 'an astronaut riding a horse on mars'
 
 ## TODO
 
-- [ ] Hires fix
-- [ ] Support LoRA
 - [ ] Metadata embed and display
 - [ ] Image-to-image
-- [ ] Latent preview
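Reviewer note: the "Compel prompting" bullet refers to the compel library's weighting syntax, where `+`/`-` suffixes up- or down-weight sub-prompts and the result is passed to the pipeline as embeddings rather than a raw string. A minimal sketch of that flow; the checkpoint id and prompt below are illustrative, not from this repo:

import torch
from compel import Compel
from diffusers import StableDiffusionPipeline

# illustrative SD 1.5 checkpoint; the app loads its own curated models
pipe = StableDiffusionPipeline.from_pretrained(
    "runwayml/stable-diffusion-v1-5", torch_dtype=torch.float16
).to("cuda")

compel = Compel(tokenizer=pipe.tokenizer, text_encoder=pipe.text_encoder)

# "++" upweights and "--" downweights the preceding sub-prompt
embeds = compel("a colorful calico cat++ in a garden--")
image = pipe(prompt_embeds=embeds, num_inference_steps=30).images[0]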
app.py CHANGED

@@ -100,7 +100,6 @@ with gr.Blocks(
         style = gr.Dropdown(
             value=cfg.STYLE,
             label="Style",
-            scale=1,
             choices=["None"] + [f"{style['name']}" for style in styles],
         )
         scheduler = gr.Dropdown(
@@ -109,7 +108,6 @@
             label="Scheduler",
             filterable=False,
             min_width=200,
-            scale=1,
             choices=cfg.SCHEDULERS,
         )
 
@@ -119,7 +117,6 @@
             label="Guidance Scale",
             minimum=1.0,
             maximum=15.0,
-            scale=1,
             step=0.1,
         )
         inference_steps = gr.Slider(
@@ -127,7 +124,6 @@
             label="Inference Steps",
             minimum=1,
             maximum=50,
-            scale=1,
             step=1,
         )
         seed = gr.Number(
@@ -135,32 +131,28 @@
             label="Seed",
             minimum=-1,
             maximum=(2**64) - 1,
-            scale=1,
         )
 
         with gr.Row():
             width = gr.Slider(
                 value=cfg.WIDTH,
                 label="Width",
-                minimum=256,
-                maximum=1024,
+                minimum=320,
+                maximum=768,
                 step=32,
-                scale=1,
             )
             height = gr.Slider(
                 value=cfg.HEIGHT,
                 label="Height",
-                minimum=256,
-                maximum=1024,
+                minimum=320,
+                maximum=768,
                 step=32,
-                scale=1,
             )
             num_images = gr.Dropdown(
                 choices=list(range(1, 5)),
                 value=cfg.NUM_IMAGES,
                 filterable=False,
                 label="Images",
-                scale=1,
             )
 
         with gr.Row():
@@ -174,6 +166,12 @@
                 elem_classes=["checkbox"],
                 label="Autoincrement",
                 value=True,
+                scale=1,
+            )
+            upscale_4x = gr.Checkbox(
+                elem_classes=["checkbox"],
+                label="Upscale 4x",
+                value=False,
                 scale=3,
             )
 
@@ -206,19 +204,16 @@
                 elem_classes=["checkbox"],
                 label="Tiny VAE",
                 value=False,
-                scale=1,
             )
             use_clip_skip = gr.Checkbox(
                 elem_classes=["checkbox"],
                 label="Clip skip",
                 value=False,
-                scale=1,
             )
             truncate_prompts = gr.Checkbox(
                 elem_classes=["checkbox"],
                 label="Truncate prompts",
                 value=False,
-                scale=1,
             )
 
         with gr.TabItem("ℹ️ Usage"):
@@ -304,6 +299,7 @@
             increment_seed,
             deepcache_interval,
             tome_ratio,
+            upscale_4x,
         ],
     )
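Reviewer note: in Gradio, a new control only reaches the backend if it is appended to the event's `inputs` list in the same position the matching parameter occupies in the handler's signature, which is why `upscale_4x` is added both as a component and at the end of the inputs above. A stripped-down sketch of that wiring (the handler body here is a stand-in for the real `generate()`):

import gradio as gr

def generate(prompt, upscale_4x=False):
    # stand-in for generate.generate(); just echoes its inputs
    return f"prompt={prompt!r}, upscale_4x={upscale_4x}"

with gr.Blocks() as demo:
    prompt = gr.Textbox(label="Prompt")
    upscale_4x = gr.Checkbox(label="Upscale 4x", value=False)
    output = gr.Textbox(label="Result")
    button = gr.Button("Generate")
    # component order here must match the handler's positional parameters
    button.click(fn=generate, inputs=[prompt, upscale_4x], outputs=output)

demo.launch()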
cli.py CHANGED

@@ -1,3 +1,5 @@
+# CLI
+# usage: python cli.py 'colorful calico cat artstation'
 import argparse
 
 import config as cfg
@@ -31,6 +33,7 @@ def main():
     parser.add_argument("--clip-skip", action="store_true")
     parser.add_argument("--truncate", action="store_true")
     parser.add_argument("--karras", action="store_true")
+    parser.add_argument("--upscale", action="store_true")
     parser.add_argument("--no-increment", action="store_false")
     # fmt: on
 
@@ -54,6 +57,7 @@ def main():
         args.no_increment,
         args.deepcache,
         args.tome,
+        args.upscale,
     )
     save_images(images, args.filename)
 
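Reviewer note: `--upscale` uses `action="store_true"`, so it defaults to False and existing invocations are unaffected; it is then passed positionally into `generate()`, matching the new `upscale` parameter's position. A self-contained illustration of the two flag styles this parser uses:

import argparse

parser = argparse.ArgumentParser()
parser.add_argument("--upscale", action="store_true")        # False unless the flag is passed
parser.add_argument("--no-increment", action="store_false")  # True unless the flag is passed

args = parser.parse_args(["--upscale"])
print(args.upscale)       # True
print(args.no_increment)  # True (flag omitted)

A typical run with upscaling would then be: python cli.py 'colorful calico cat artstation' --upscale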
generate.py CHANGED

@@ -1,16 +1,16 @@
 import json
+import os
 import re
 import time
 from contextlib import contextmanager
 from datetime import datetime
 from itertools import product
-from os import environ
-from types import MethodType
 from typing import Callable
 
 import spaces
 import tomesd
 import torch
+from aura_sr import AuraSR
 from compel import Compel, DiffusersTextualInversionManager, ReturnedEmbeddingsType
 from compel.prompt_parser import PromptParser
 from DeepCache import DeepCacheSDHelper
@@ -27,13 +27,13 @@ from diffusers import (
 from diffusers.models import AutoencoderKL, AutoencoderTiny
 from torch._dynamo import OptimizedModule
 
-# some models use the deprecated CLIPFeatureExtractor class (should use CLIPImageProcessor)
+__import__("warnings").filterwarnings("ignore", category=FutureWarning, module="diffusers")
 __import__("warnings").filterwarnings("ignore", category=FutureWarning, module="transformers")
 __import__("transformers").logging.set_verbosity_error()
 
 ZERO_GPU = (
-    environ.get("SPACES_ZERO_GPU", "").lower() == "true"
-    or environ.get("SPACES_ZERO_GPU", "") == "1"
+    os.environ.get("SPACES_ZERO_GPU", "").lower() == "true"
+    or os.environ.get("SPACES_ZERO_GPU", "") == "1"
 )
 
 EMBEDDINGS = {
@@ -58,6 +58,7 @@ class Loader:
         cls._instance = super(Loader, cls).__new__(cls)
         cls._instance.cpu = torch.device("cpu")
         cls._instance.gpu = torch.device("cuda")
+        cls._instance.gan = None
         cls._instance.pipe = None
         return cls._instance
 
@@ -105,7 +106,7 @@
         )
         return self.pipe.vae
 
-    def load(self, model, scheduler, karras, taesd, deepcache_interval, dtype=None):
+    def load(self, model, scheduler, karras, taesd, deepcache_interval, upscale, dtype=None):
         model_lower = model.lower()
 
         schedulers = {
@@ -127,7 +128,7 @@
             "steps_offset": 1,
         }
 
-        if scheduler == "PNDM" or scheduler == "Euler a":
+        if scheduler in ["Euler a", "PNDM"]:
             del scheduler_kwargs["use_karras_sigmas"]
 
         pipe_kwargs = {
@@ -159,7 +160,7 @@
 
             self._load_vae(model_lower, taesd, dtype)
             self._load_deepcache(interval=deepcache_interval)
-            return self.pipe
+            return self.pipe, self.gan
         else:
             print(f"Unloading {model_name.lower()}...")
             self.pipe = None
@@ -181,7 +182,17 @@
         )
         self._load_vae(model_lower, taesd, dtype)
         self._load_deepcache(interval=deepcache_interval)
-        return self.pipe
+
+        if upscale and self.gan is None:
+            print("Loading fal/AuraSR-v2...")
+            self.gan = AuraSR.from_pretrained("fal/AuraSR-v2")
+
+        if not upscale and self.gan is not None:
+            print("Unloading fal/AuraSR-v2...")
+            self.gan = None
+            torch.cuda.empty_cache()
+
+        return self.pipe, self.gan
 
 
 # applies tome to the pipeline
@@ -227,8 +238,7 @@ def apply_style(prompt, style_name, negative=False):
     return prompt
 
 
-# 1024x1024 for 50 steps can take ~10s each
-@spaces.GPU(duration=44)
+@spaces.GPU(duration=40)
 def generate(
     positive_prompt,
     negative_prompt="",
@@ -248,6 +258,7 @@
     increment_seed=True,
     deepcache_interval=1,
     tome_ratio=0,
+    upscale=False,
     log: Callable[[str], None] = None,
     Error=Exception,
 ):
@@ -258,9 +269,11 @@
     if seed is None or seed < 0:
         seed = int(datetime.now().timestamp() * 1_000_000) % (2**64)
 
+    GPU = torch.device("cuda")
+
     TORCH_DTYPE = (
         torch.bfloat16
-        if torch.cuda.is_available() and torch.cuda.is_bf16_supported()
+        if torch.cuda.is_available() and torch.cuda.is_bf16_supported(including_emulation=False)
         else torch.float16
     )
 
@@ -273,7 +286,15 @@
     with torch.inference_mode():
         start = time.perf_counter()
         loader = Loader()
-        pipe = loader.load(model, scheduler, karras, taesd, deepcache_interval, TORCH_DTYPE)
+        pipe, gan = loader.load(
+            model,
+            scheduler,
+            karras,
+            taesd,
+            deepcache_interval,
+            upscale,
+            TORCH_DTYPE,
+        )
 
         # prompt embeds
         compel = Compel(
@@ -283,7 +304,7 @@
             truncate_long_prompts=truncate_prompts,
             text_encoder=pipe.text_encoder,
             tokenizer=pipe.tokenizer,
-            device=pipe.device,
+            device=GPU,
         )
 
         images = []
@@ -297,7 +318,7 @@
 
         for i in range(num_images):
             # seeded generator for each iteration
-            generator = torch.Generator(device=pipe.device).manual_seed(current_seed)
+            generator = torch.Generator(device=GPU).manual_seed(current_seed)
 
             try:
                 all_positive_prompts = parse_prompt(positive_prompt)
@@ -312,7 +333,7 @@
                 raise Error("ParsingException: Invalid prompt")
 
             with token_merging(pipe, tome_ratio=tome_ratio):
-                result = pipe(
+                image = pipe(
                     num_inference_steps=inference_steps,
                     negative_prompt_embeds=neg_embeds,
                     guidance_scale=guidance_scale,
@@ -320,8 +341,14 @@
                     generator=generator,
                     height=height,
                     width=width,
-                )
-            images.append((result.images[0], str(current_seed)))
+                ).images[0]
+
+            if upscale:
+                print("Upscaling image...")
+                batch_size = 12 if ZERO_GPU else 4  # smaller batch to fit in 8GB
+                image = gan.upscale_4x_overlapped(image, max_batch_size=batch_size)
+
+            images.append((image, str(current_seed)))
 
             if increment_seed:
                 current_seed += 1
@@ -329,9 +356,9 @@
         if ZERO_GPU:
             # spaces always start fresh
             loader.pipe = None
+            loader.gan = None
 
-        end = time.perf_counter()
-        diff = end - start
+        diff = time.perf_counter() - start
         if log:
             log(f"Generated {len(images)} image{'s' if len(images) > 1 else ''} in {diff:.2f}s")
         return images
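Reviewer note: the AuraSR calls introduced here (`AuraSR.from_pretrained` and `upscale_4x_overlapped`) also work standalone, which is handy for testing the upscaler outside the app. A minimal sketch using the same calls as the diff; the filenames are illustrative:

from aura_sr import AuraSR
from PIL import Image

# same checkpoint the Loader pulls in
gan = AuraSR.from_pretrained("fal/AuraSR-v2")

image = Image.open("generated.png")  # e.g. a 512x512 pipeline output
# overlapped tiling upscales in patches; lower max_batch_size on smaller GPUs
upscaled = gan.upscale_4x_overlapped(image, max_batch_size=4)
upscaled.save("generated_4x.png")    # 4x: 2048x2048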
requirements.txt CHANGED

@@ -1,4 +1,5 @@
 accelerate
+aura-sr==0.0.4
 compel
 deepcache==0.1.1
 diffusers