Update pipeline.py
pipeline.py  (+119 -19)
@@ -17,6 +17,7 @@
 # Here is the AGPL-3.0 license https://github.com/AUTOMATIC1111/stable-diffusion-webui/blob/master/LICENSE.txt
 
 import inspect
+import shutil
 from pathlib import Path
 from typing import Any, Callable, Dict, List, Optional, Union
 
@@ -32,7 +33,9 @@ from ppdiffusers.pipelines.stable_diffusion.safety_checker import (
 )
 from ppdiffusers.schedulers import KarrasDiffusionSchedulers
 from ppdiffusers.utils import (
+    PPDIFFUSERS_CACHE,
     logging,
+    ppdiffusers_url_download,
     randn_tensor,
     safetensors_load,
     smart_load,
@@ -42,6 +45,64 @@ from ppdiffusers.utils import (
 logger = logging.get_logger(__name__)  # pylint: disable=invalid-name
 
 
+import copy
+import os
+import os.path
+
+from huggingface_hub.file_download import _request_wrapper, hf_raise_for_status
+
+# lark omegaconf
+
+
+def get_civitai_download_url(display_url, url_prefix="https://civitai.com"):
+    if "api/download" in display_url:
+        return display_url
+    import bs4
+    import requests
+
+    headers = {
+        "User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/63.0.3239.132 Safari/537.36 QIHU 360SE"
+    }
+    r = requests.get(display_url, headers=headers)
+    soup = bs4.BeautifulSoup(r.text, "lxml")
+    download_url = None
+    for a in soup.find_all("a", href=True):
+        if "Download" in str(a):
+            download_url = url_prefix + a["href"].split("?")[0]
+            break
+    return download_url
+
+
+def http_file_name(
+    url: str,
+    *,
+    proxies=None,
+    headers: Optional[Dict[str, str]] = None,
+    timeout=10.0,
+    max_retries=0,
+):
+    """
+    Get a remote file name.
+    """
+    headers = copy.deepcopy(headers) or {}
+    r = _request_wrapper(
+        method="GET",
+        url=url,
+        stream=True,
+        proxies=proxies,
+        headers=headers,
+        timeout=timeout,
+        max_retries=max_retries,
+    )
+    hf_raise_for_status(r)
+    displayed_name = url.split("/")[-1]
+    content_disposition = r.headers.get("Content-Disposition")
+    if content_disposition is not None and "filename=" in content_disposition:
+        # Means file is on CDN
+        displayed_name = content_disposition.split("filename=")[-1]
+    return displayed_name
+
+
 @paddle.no_grad()
 def load_lora(
     pipeline,
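A quick sketch of how the two new helpers combine; the model-page URL is a hypothetical placeholder, and a network round trip plus the bs4/lxml extras are assumed:

    display_url = "https://civitai.com/models/12345"  # hypothetical model page
    download_url = get_civitai_download_url(display_url)  # scrape the page for its Download link
    if download_url is not None:
        # some CDNs quote the Content-Disposition filename, hence the strip('"') used later
        filename = http_file_name(download_url).strip('"')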
@@ -164,6 +225,8 @@ class WebUIStableDiffusionPipeline(DiffusionPipeline):
     _optional_components = ["safety_checker", "feature_extractor"]
     enable_emphasis = True
     comma_padding_backtrack = 20
+    LORA_DIR = os.path.join(PPDIFFUSERS_CACHE, "lora")
+    TI_DIR = os.path.join(PPDIFFUSERS_CACHE, "textual_inversion")
 
     def __init__(
         self,
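The two class attributes anchor every download under the ppdiffusers cache. The exact root is whatever PPDIFFUSERS_CACHE resolves to on the host, so the paths below are illustrative only:

    import os

    from ppdiffusers.utils import PPDIFFUSERS_CACHE

    print(os.path.join(PPDIFFUSERS_CACHE, "lora"))               # <cache root>/lora
    print(os.path.join(PPDIFFUSERS_CACHE, "textual_inversion"))  # <cache root>/textual_inversion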
@@ -227,7 +290,17 @@ class WebUIStableDiffusionPipeline(DiffusionPipeline):
         ]
         self.weights_has_changed = False
 
-    def add_ti_embedding_dir(self, embeddings_dir):
+        # register_state_dict_hook to fix text_encoder, when we save_pretrained text model.
+        def map_to(state_dict, *args, **kwargs):
+            if "text_model.token_embedding.wrapped.weight" in state_dict:
+                state_dict["text_model.token_embedding.weight"] = state_dict.pop(
+                    "text_model.token_embedding.wrapped.weight"
+                )
+            return state_dict
+
+        self.text_encoder.register_state_dict_hook(map_to)
+
+    def add_ti_embedding_dir(self, embeddings_dir=None):
         self.sj.embedding_db.add_embedding_dir(embeddings_dir)
         self.sj.embedding_db.load_textual_inversion_embeddings()
 
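Why the hook is needed: textual-inversion support wraps the token embedding layer, so without the remap its weight would be serialized as text_model.token_embedding.wrapped.weight and from_pretrained could not find it again. A minimal sketch of the same pattern on a toy layer, assuming (as the code above already relies on) that Paddle runs registered state-dict hooks when state_dict() is collected:

    import paddle

    class Toy(paddle.nn.Layer):
        def __init__(self):
            super().__init__()
            self.wrapped = paddle.nn.Embedding(4, 2)  # stands in for the wrapped embedding

    def rename(state_dict, *args, **kwargs):
        # pop the wrapper's key and restore the canonical name at save time
        if "wrapped.weight" in state_dict:
            state_dict["weight"] = state_dict.pop("wrapped.weight")
        return state_dict

    toy = Toy()
    toy.register_state_dict_hook(rename)
    print(list(toy.state_dict().keys()))  # ["weight"] rather than ["wrapped.weight"]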
@@ -235,6 +308,30 @@ class WebUIStableDiffusionPipeline(DiffusionPipeline):
         self.sj.embedding_db.clear_embedding_dirs()
         self.sj.embedding_db.load_textual_inversion_embeddings(True)
 
+    def download_civitai_lora_file(self, url):
+        if os.path.isfile(url):
+            dst = os.path.join(self.LORA_DIR, os.path.basename(url))
+            shutil.copyfile(url, dst)
+            return dst
+
+        download_url = get_civitai_download_url(url) or url
+        file_path = ppdiffusers_url_download(
+            download_url, cache_dir=self.LORA_DIR, filename=http_file_name(download_url).strip('"')
+        )
+        return file_path
+
+    def download_civitai_ti_file(self, url):
+        if os.path.isfile(url):
+            dst = os.path.join(self.TI_DIR, os.path.basename(url))
+            shutil.copyfile(url, dst)
+            return dst
+
+        download_url = get_civitai_download_url(url) or url
+        file_path = ppdiffusers_url_download(
+            download_url, cache_dir=self.TI_DIR, filename=http_file_name(download_url).strip('"')
+        )
+        return file_path
+
     def change_scheduler(self, scheduler_type="ddim"):
         self.switch_scheduler(scheduler_type)
 
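The two download methods accept either a local file, which is copied into the cache, or a Civitai page/API URL, which is resolved via get_civitai_download_url and fetched with ppdiffusers_url_download. A hedged usage sketch; the checkpoint name and model ids are placeholders:

    pipe = WebUIStableDiffusionPipeline.from_pretrained("runwayml/stable-diffusion-v1-5")
    lora_path = pipe.download_civitai_lora_file("https://civitai.com/api/download/models/12345")
    ti_path = pipe.download_civitai_ti_file("https://civitai.com/api/download/models/67890")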
@@ -408,7 +505,6 @@ class WebUIStableDiffusionPipeline(DiffusionPipeline):
         callback_steps: Optional[int] = 1,
         cross_attention_kwargs: Optional[Dict[str, Any]] = None,
         clip_skip: int = 1,
-        lora_dir: str = "./loras",
     ):
         r"""
         Function invoked when calling the pipeline for generation.
@@ -459,10 +555,8 @@ class WebUIStableDiffusionPipeline(DiffusionPipeline):
                 A kwargs dictionary that if specified is passed along to the `AttnProcessor` as defined under
                 `self.processor` in
                 [diffusers.cross_attention](https://github.com/huggingface/diffusers/blob/main/src/diffusers/models/cross_attention.py).
-            clip_skip (`int`, *optional*, defaults to
+            clip_skip (`int`, *optional*, defaults to 1):
                 CLIP_stop_at_last_layers, if clip_skip <= 1, we will use the last_hidden_state from text_encoder.
-            lora_dir (`str`, *optional*):
-                Path to lora which we want to load.
         Examples:
 
         Returns:
@@ -472,6 +566,8 @@ class WebUIStableDiffusionPipeline(DiffusionPipeline):
             list of `bool`s denoting whether the corresponding generated image likely represents "not-safe-for-work"
             (nsfw) content, according to the `safety_checker`.
         """
+        self.add_ti_embedding_dir(self.TI_DIR)
+
         try:
             # 0. Default height and width to unet
             height = height or max(self.unet.config.sample_size * self.vae_scale_factor, 512)
@@ -495,19 +591,23 @@ class WebUIStableDiffusionPipeline(DiffusionPipeline):
 
             prompts, extra_network_data = parse_prompts([prompt])
 
-            if …
-            … 12 more removed lines not shown …
+            if self.LORA_DIR is not None:
+                if os.path.exists(self.LORA_DIR):
+                    lora_mapping = {p.stem: p.absolute() for p in Path(self.LORA_DIR).glob("*.safetensors")}
+                    for params in extra_network_data["lora"]:
+                        assert len(params.items) > 0
+                        name = params.items[0]
+                        if name in lora_mapping:
+                            ratio = float(params.items[1]) if len(params.items) > 1 else 1.0
+                            lora_state_dict = smart_load(lora_mapping[name], map_location=paddle.get_device())
+                            self.weights_has_changed = True
+                            load_lora(self, state_dict=lora_state_dict, ratio=ratio)
+                            del lora_state_dict
+                        else:
+                            print(f"We can't find lora weight: {name}! Please make sure that exists!")
+                else:
+                    if len(extra_network_data["lora"]) > 0:
+                        print(f"{self.LORA_DIR} not exists, so we cant load loras!")
 
             self.sj.clip.CLIP_stop_at_last_layers = clip_skip
             # 3. Encode input prompt
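With the cache wired in, LoRAs are now activated from the prompt instead of the removed lora_dir argument. A sketch assuming a file foo.safetensors already sits in LORA_DIR; the name and ratio are placeholders for the webui-style <lora:name:ratio> syntax that parse_prompts understands:

    # "foo" is matched against the *.safetensors stems in LORA_DIR; 0.7 is the merge ratio
    image = pipe(prompt="a photo of a cat <lora:foo:0.7>", clip_skip=2).images[0]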
@@ -1658,7 +1758,7 @@ class EmbeddingDatabase:
         self.previously_displayed_embeddings = ()
 
     def add_embedding_dir(self, path):
-        if path is not None:
+        if path is not None and path not in self.embedding_dirs:
             self.embedding_dirs[path] = DirWithTextualInversionEmbeddings(path)
 
     def clear_embedding_dirs(self):