Update Lycoris

2023-12-03 11:52:20 -05:00 · 2023-12-03 11:52:20 -05:00 · 821cdda125
parent bf20e17b0c
commit 821cdda125
7 changed files with 224 additions and 104 deletions
--- a/.release
+++ b/.release
@ -1 +1 @@
-v22.2.1
+v22.2.2
--- a/README.md
+++ b/README.md
@ -651,7 +651,12 @@ masterpiece, best quality, 1boy, in business suit, standing at street, looking b


 ## Change History
-* 2023/11/?? (v22.2.1)
+* 2023/12/03 (v22.2.2)
+- Update Lycoris module to 2.0.0 (https://github.com/KohakuBlueleaf/LyCORIS/blob/0006e2ffa05a48d8818112d9f70da74c0cd30b99/README.md)
+- Update Lycoris merge and extract tools
+- Remove anoying warning about local pip modules that is not necessary.
+
+* 2023/11/20 (v22.2.1)
 - Fix issue with `Debiased Estimation loss` not getting properly loaded from json file. Oups.

 * 2023/11/15 (v22.2.0)
--- a/library/extract_lycoris_locon_gui.py
+++ b/library/extract_lycoris_locon_gui.py
@ -25,6 +25,7 @@ def extract_lycoris_locon(
    base_model,
    output_name,
    device,
+    is_sdxl,
    is_v2,
    mode,
    linear_dim,
@ -58,6 +59,8 @@ def extract_lycoris_locon(
        return

    run_cmd = f'{PYTHON} "{os.path.join("tools","lycoris_locon_extract.py")}"'
+    if is_sdxl:
+        run_cmd += f' --is_sdxl'
    if is_v2:
        run_cmd += f' --is_v2'
    run_cmd += f' --device {device}'
@ -196,10 +199,13 @@ def gradio_extract_lycoris_locon_tab(headless=False):
                value='cuda',
                interactive=True,
            )
+            
+            is_sdxl = gr.Checkbox(label='is SDXL', value=False, interactive=True)
+            
            is_v2 = gr.Checkbox(label='is v2', value=False, interactive=True)
        mode = gr.Dropdown(
            label='Mode',
-            choices=['fixed', 'threshold', 'ratio', 'quantile'],
+            choices=['fixed', 'full', 'quantile', 'ratio', 'threshold'],
            value='fixed',
            interactive=True,
        )
@ -211,6 +217,7 @@ def gradio_extract_lycoris_locon_tab(headless=False):
                value=1,
                step=1,
                interactive=True,
+                info="network dim for linear layer in fixed mode",
            )
            conv_dim = gr.Slider(
                minimum=1,
@ -219,6 +226,7 @@ def gradio_extract_lycoris_locon_tab(headless=False):
                value=1,
                step=1,
                interactive=True,
+                info="network dim for conv layer in fixed mode",
            )
        with gr.Row(visible=False) as threshold:
            linear_threshold = gr.Slider(
@ -312,6 +320,7 @@ def gradio_extract_lycoris_locon_tab(headless=False):
                base_model,
                output_name,
                device,
+                is_sdxl,
                is_v2,
                mode,
                linear_dim,
--- a/library/merge_lycoris_gui.py
+++ b/library/merge_lycoris_gui.py
@ -26,6 +26,7 @@ def merge_lycoris(
    output_name,
    dtype,
    device,
+    is_sdxl,
    is_v2,
 ):
    log.info('Merge model...')
@ -37,6 +38,8 @@ def merge_lycoris(
    run_cmd += f' --weight {weight}'
    run_cmd += f' --device {device}'
    run_cmd += f' --dtype {dtype}'
+    if is_sdxl:
+        run_cmd += f' --is_sdxl'
    if is_v2:
        run_cmd += f' --is_v2'

@ -149,12 +152,13 @@ def gradio_merge_lycoris_tab(headless=False):
                label='Device',
                choices=[
                    'cpu',
-                    #  'cuda',
+                    'cuda',
                ],
                value='cpu',
                interactive=True,
            )

+            is_sdxl = gr.Checkbox(label='is sdxl', value=False, interactive=True)
            is_v2 = gr.Checkbox(label='is v2', value=False, interactive=True)

        merge_button = gr.Button('Merge model')
@ -168,6 +172,7 @@ def gradio_merge_lycoris_tab(headless=False):
                output_name,
                dtype,
                device,
+                is_sdxl,
                is_v2,
            ],
            show_progress=False,
--- a/requirements.txt
+++ b/requirements.txt
@ -13,7 +13,7 @@ huggingface-hub==0.15.1
 # for loading Diffusers' SDXL
 invisible-watermark==0.2.0
 lion-pytorch==0.0.6
-lycoris_lora==1.9.0
+lycoris_lora==2.0.0
 # for BLIP captioning
 # requests==2.28.2
 # timm==0.6.12
--- a/tools/lycoris_locon_extract.py
+++ b/tools/lycoris_locon_extract.py
@ -1,4 +1,5 @@
 import os, sys
+
 sys.path.insert(0, os.getcwd())
 import argparse

@ -6,87 +7,125 @@ import argparse
 def get_args():
    parser = argparse.ArgumentParser()
    parser.add_argument(
-        "base_model", help="The model which use it to train the dreambooth model",
-        default='', type=str
+        "base_model",
+        help="The model which use it to train the dreambooth model",
+        default="",
+        type=str,
    )
    parser.add_argument(
-        "db_model", help="the dreambooth model you want to extract the locon",
-        default='', type=str
+        "db_model",
+        help="the dreambooth model you want to extract the locon",
+        default="",
+        type=str,
    )
    parser.add_argument(
-        "output_name", help="the output model",
-        default='./out.pt', type=str
+        "output_name", help="the output model", default="./out.pt", type=str
    )
    parser.add_argument(
-        "--is_v2", help="Your base/db model is sd v2 or not",
-        default=False, action="store_true"
+        "--is_v2",
+        help="Your base/db model is sd v2 or not",
+        default=False,
+        action="store_true",
    )
    parser.add_argument(
-        "--device", help="Which device you want to use to extract the locon",
-        default='cpu', type=str
+        "--is_sdxl",
+        help="Your base/db model is sdxl or not",
+        default=False,
+        action="store_true",
+    )
+    parser.add_argument(
+        "--device",
+        help="Which device you want to use to extract the locon",
+        default="cpu",
+        type=str,
    )
    parser.add_argument(
        "--mode",
        help=(
-            'extraction mode, can be "fixed", "threshold", "ratio", "quantile". '
+            'extraction mode, can be "full", "fixed", "threshold", "ratio", "quantile". '
            'If not "fixed", network_dim and conv_dim will be ignored'
        ),
-        default='fixed', type=str
+        default="fixed",
+        type=str,
    )
    parser.add_argument(
-        "--safetensors", help='use safetensors to save locon model',
-        default=False, action="store_true"
+        "--safetensors",
+        help="use safetensors to save locon model",
+        default=False,
+        action="store_true",
    )
    parser.add_argument(
-        "--linear_dim", help="network dim for linear layer in fixed mode",
-        default=1, type=int
+        "--linear_dim",
+        help="network dim for linear layer in fixed mode",
+        default=1,
+        type=int,
    )
    parser.add_argument(
-        "--conv_dim", help="network dim for conv layer in fixed mode",
-        default=1, type=int
+        "--conv_dim",
+        help="network dim for conv layer in fixed mode",
+        default=1,
+        type=int,
    )
    parser.add_argument(
-        "--linear_threshold", help="singular value threshold for linear layer in threshold mode",
-        default=0., type=float
+        "--linear_threshold",
+        help="singular value threshold for linear layer in threshold mode",
+        default=0.0,
+        type=float,
    )
    parser.add_argument(
-        "--conv_threshold", help="singular value threshold for conv layer in threshold mode",
-        default=0., type=float
+        "--conv_threshold",
+        help="singular value threshold for conv layer in threshold mode",
+        default=0.0,
+        type=float,
    )
    parser.add_argument(
-        "--linear_ratio", help="singular ratio for linear layer in ratio mode",
-        default=0., type=float
+        "--linear_ratio",
+        help="singular ratio for linear layer in ratio mode",
+        default=0.0,
+        type=float,
    )
    parser.add_argument(
-        "--conv_ratio", help="singular ratio for conv layer in ratio mode",
-        default=0., type=float
+        "--conv_ratio",
+        help="singular ratio for conv layer in ratio mode",
+        default=0.0,
+        type=float,
    )
    parser.add_argument(
-        "--linear_quantile", help="singular value quantile for linear layer quantile mode",
-        default=1., type=float
+        "--linear_quantile",
+        help="singular value quantile for linear layer quantile mode",
+        default=1.0,
+        type=float,
    )
    parser.add_argument(
-        "--conv_quantile", help="singular value quantile for conv layer quantile mode",
-        default=1., type=float
+        "--conv_quantile",
+        help="singular value quantile for conv layer quantile mode",
+        default=1.0,
+        type=float,
    )
    parser.add_argument(
-        "--use_sparse_bias", help="enable sparse bias",
-        default=False, action="store_true"
+        "--use_sparse_bias",
+        help="enable sparse bias",
+        default=False,
+        action="store_true",
    )
    parser.add_argument(
-        "--sparsity", help="sparsity for sparse bias",
-        default=0.98, type=float
+        "--sparsity", help="sparsity for sparse bias", default=0.98, type=float
    )
    parser.add_argument(
-        "--disable_cp", help="don't use cp decomposition",
-        default=False, action="store_true"
+        "--disable_cp",
+        help="don't use cp decomposition",
+        default=False,
+        action="store_true",
    )
    return parser.parse_args()
+
+
 ARGS = get_args()


 from lycoris.utils import extract_diff
 from lycoris.kohya.model_utils import load_models_from_stable_diffusion_checkpoint
+from lycoris.kohya.sdxl_model_util import load_models_from_sdxl_checkpoint

 import torch
 from safetensors.torch import save_file
@ -94,29 +133,51 @@ from safetensors.torch import save_file

 def main():
    args = ARGS
-    base = load_models_from_stable_diffusion_checkpoint(args.is_v2, args.base_model)
-    db = load_models_from_stable_diffusion_checkpoint(args.is_v2, args.db_model)
+    if args.is_sdxl:
+        base = load_models_from_sdxl_checkpoint(None, args.base_model, args.device)
+        db = load_models_from_sdxl_checkpoint(None, args.db_model, args.device)
+    else:
+        base = load_models_from_stable_diffusion_checkpoint(args.is_v2, args.base_model)
+        db = load_models_from_stable_diffusion_checkpoint(args.is_v2, args.db_model)

    linear_mode_param = {
-        'fixed': args.linear_dim,
-        'threshold': args.linear_threshold,
-        'ratio': args.linear_ratio,
-        'quantile': args.linear_quantile,
+        "fixed": args.linear_dim,
+        "threshold": args.linear_threshold,
+        "ratio": args.linear_ratio,
+        "quantile": args.linear_quantile,
+        "full": None,
    }[args.mode]
    conv_mode_param = {
-        'fixed': args.conv_dim,
-        'threshold': args.conv_threshold,
-        'ratio': args.conv_ratio,
-        'quantile': args.conv_quantile,
+        "fixed": args.conv_dim,
+        "threshold": args.conv_threshold,
+        "ratio": args.conv_ratio,
+        "quantile": args.conv_quantile,
+        "full": None,
    }[args.mode]

+    if args.is_sdxl:
+        db_tes = [db[0], db[1]]
+        db_unet = db[3]
+        base_tes = [base[0], base[1]]
+        base_unet = base[3]
+    else:
+        db_tes = [db[0]]
+        db_unet = db[2]
+        base_tes = [base[0]]
+        base_unet = base[2]
+
    state_dict = extract_diff(
-        base, db,
+        base_tes,
+        db_tes,
+        base_unet,
+        db_unet,
        args.mode,
-        linear_mode_param, conv_mode_param,
+        linear_mode_param,
+        conv_mode_param,
        args.device,
-        args.use_sparse_bias, args.sparsity,
-        not args.disable_cp
+        args.use_sparse_bias,
+        args.sparsity,
+        not args.disable_cp,
    )

    if args.safetensors:
@ -125,5 +186,5 @@ def main():
        torch.save(state_dict, args.output_name)


-if __name__ == '__main__':
+if __name__ == "__main__":
    main()
--- a/tools/merge_lycoris.py
+++ b/tools/merge_lycoris.py
@ -1,4 +1,5 @@
 import os, sys
+
 sys.path.insert(0, os.getcwd())
 import argparse

@ -6,80 +7,119 @@ import argparse
 def get_args():
    parser = argparse.ArgumentParser()
    parser.add_argument(
-        "base_model", help="The model you want to merge with loha",
-        default='', type=str
+        "base_model", help="The model you want to merge with loha", default="", type=str
    )
    parser.add_argument(
-        "lycoris_model", help="the lyco model you want to merge into sd model",
-        default='', type=str
+        "lycoris_model",
+        help="the lyco model you want to merge into sd model",
+        default="",
+        type=str,
    )
    parser.add_argument(
-        "output_name", help="the output model",
-        default='./out.pt', type=str
+        "output_name", help="the output model", default="./out.pt", type=str
    )
    parser.add_argument(
-        "--is_v2", help="Your base model is sd v2 or not",
-        default=False, action="store_true"
+        "--is_v2",
+        help="Your base model is sd v2 or not",
+        default=False,
+        action="store_true",
    )
    parser.add_argument(
-        "--device", help="Which device you want to use to merge the weight",
-        default='cpu', type=str
+        "--is_sdxl",
+        help="Your base/db model is sdxl or not",
+        default=False,
+        action="store_true",
    )
    parser.add_argument(
-        "--dtype", help='dtype to save',
-        default='float', type=str
+        "--device",
+        help="Which device you want to use to merge the weight",
+        default="cpu",
+        type=str,
    )
+    parser.add_argument("--dtype", help="dtype to save", default="float", type=str)
    parser.add_argument(
-        "--weight", help='weight for the lyco model to merge',
-        default='1.0', type=float
+        "--weight", help="weight for the lyco model to merge", default="1.0", type=float
    )
    return parser.parse_args()
-ARGS = get_args()
+
+
+args = ARGS = get_args()


 from lycoris.utils import merge
 from lycoris.kohya.model_utils import (
    load_models_from_stable_diffusion_checkpoint,
    save_stable_diffusion_checkpoint,
-    load_file
+    load_file,
+)
+from lycoris.kohya.sdxl_model_util import (
+    load_models_from_sdxl_checkpoint,
+    save_stable_diffusion_checkpoint as save_sdxl_checkpoint,
 )

 import torch


+@torch.no_grad()
 def main():
-    base = load_models_from_stable_diffusion_checkpoint(ARGS.is_v2, ARGS.base_model)
-    if ARGS.lycoris_model.rsplit('.', 1)[-1] == 'safetensors':
+    if args.is_sdxl:
+        base = load_models_from_sdxl_checkpoint(
+            None, args.base_model, map_location=args.device
+        )
+    else:
+        base = load_models_from_stable_diffusion_checkpoint(args.is_v2, args.base_model)
+    if ARGS.lycoris_model.rsplit(".", 1)[-1] == "safetensors":
        lyco = load_file(ARGS.lycoris_model)
    else:
        lyco = torch.load(ARGS.lycoris_model)

-    dtype_str = ARGS.dtype.replace('fp', 'float').replace('bf', 'bfloat')
+    dtype_str = ARGS.dtype.replace("fp", "float").replace("bf", "bfloat")
    dtype = {
-        'float': torch.float,
-        'float16': torch.float16,
-        'float32': torch.float32,
-        'float64': torch.float64,
-        'bfloat': torch.bfloat16,
-        'bfloat16': torch.bfloat16,
+        "float": torch.float,
+        "float16": torch.float16,
+        "float32": torch.float32,
+        "float64": torch.float64,
+        "bfloat": torch.bfloat16,
+        "bfloat16": torch.bfloat16,
    }.get(dtype_str, None)
    if dtype is None:
        raise ValueError(f'Cannot Find the dtype "{dtype}"')

-    merge(
-        base,
-        lyco,
-        ARGS.weight,
-        ARGS.device
-    )
+    if args.is_sdxl:
+        base_tes = [base[0], base[1]]
+        base_unet = base[3]
+    else:
+        base_tes = [base[0]]
+        base_unet = base[2]

-    save_stable_diffusion_checkpoint(
-        ARGS.is_v2, ARGS.output_name, 
-        base[0], base[2], 
-        None, 0, 0, dtype, 
-        base[1]
-    )
+    merge(base_tes, base_unet, lyco, ARGS.weight, ARGS.device)
+
+    if args.is_sdxl:
+        save_sdxl_checkpoint(
+            ARGS.output_name,
+            base[0].cpu(),
+            base[1].cpu(),
+            base[3].cpu(),
+            0,
+            0,
+            None,
+            base[2],
+            getattr(base[1], "logit_scale", None),
+            dtype,
+        )
+    else:
+        save_stable_diffusion_checkpoint(
+            ARGS.is_v2,
+            ARGS.output_name,
+            base[0].cpu(),
+            base[2].cpu(),
+            None,
+            0,
+            0,
+            dtype,
+            base[1],
+        )


-if __name__ == '__main__':
+if __name__ == "__main__":
    main()