forked from vladmandic/sdnext
Commit 2744269 (1 parent: 01953b9), showing 3 changed files with 212 additions and 12 deletions.
@@ -0,0 +1,192 @@
import torch
from os import path
from safetensors.torch import save_file
import gradio as gr
from modules import shared, devices
from modules.ui_common import create_refresh_button
# from modules.call_queue import wrap_gradio_gpu_call


class SVDHandler:
    def __init__(self):
        self.network_name = None
        self.U = None
        self.S = None
        self.Vh = None
        self.rank = 0
        self.maxrank = 0
        self.out_size = None
        self.in_size = None
        self.kernel_size = None
        self.conv2d = False
    def decompose(self, weight, backupweight):
        self.conv2d = len(weight.size()) == 4
        self.kernel_size = None if not self.conv2d else weight.size()[2:4]
        self.out_size, self.in_size = weight.size()[0:2]
        diffweight = weight.clone().to(devices.device)
        diffweight -= backupweight.to(devices.device)
        if self.conv2d:
            if self.kernel_size != (1, 1):
                diffweight = diffweight.flatten(start_dim=1)
            else:
                diffweight = diffweight.squeeze()

        self.U, self.S, self.Vh = torch.linalg.svd(diffweight.to(device=devices.device, dtype=torch.float))
        del diffweight
        # keep the factors on CPU in bfloat16 to limit VRAM usage
        self.U = self.U.to(device=devices.cpu, dtype=torch.bfloat16)
        self.S = self.S.to(device=devices.cpu, dtype=torch.bfloat16)
        self.Vh = self.Vh.to(device=devices.cpu, dtype=torch.bfloat16)
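    # Shape walkthrough (illustrative, not from the commit): a 3x3 Conv2d delta
    # of shape (out, in, 3, 3) is flattened to (out, in*9) before the SVD;
    # torch.linalg.svd defaults to full_matrices=True, so U is (out, out),
    # S is (min(out, in*9),) and Vh is (in*9, in*9).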
    def findrank(self, maxrank, rankratio):
        if rankratio < 1:
            S_squared = self.S.pow(2)
            S_fro_sq = float(torch.sum(S_squared))
            sum_S_squared = torch.cumsum(S_squared, dim=0) / S_fro_sq
            index = int(torch.searchsorted(sum_S_squared, rankratio ** 2)) + 1
            index = max(1, min(index, len(self.S) - 1))
            self.rank = index
            if maxrank > 0:
                self.rank = min(self.rank, maxrank)
        elif maxrank == 0:
            self.rank = min(self.in_size, self.out_size)
        else:
            self.rank = min(self.in_size, self.out_size, maxrank)
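    # Worked example (illustrative, not from the commit): for singular values
    # S = [3, 2, 1] the normalized cumulative energy is [9/14, 13/14, 14/14].
    # With rankratio=0.95 the threshold is 0.95**2 = 0.9025; searchsorted
    # returns index 1, so the selected rank is 1 + 1 = 2 before maxrank clamping.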
    def makeweights(self, rankoverride=None):
        if rankoverride:
            self.rank = min(self.in_size, self.out_size, rankoverride)
        up = self.U[:, :self.rank] @ torch.diag(self.S[:self.rank])
        down = self.Vh[:self.rank, :]
        if self.conv2d:
            up = up.reshape(self.out_size, self.rank, 1, 1)
            down = down.reshape(self.rank, self.in_size, self.kernel_size[0], self.kernel_size[1])
        return_dict = {
            f'{self.network_name}.lora_up.weight': up.contiguous(),
            f'{self.network_name}.lora_down.weight': down.contiguous(),
            f'{self.network_name}.alpha': torch.tensor(down.shape[0]),
        }
        return return_dict
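# Standalone usage sketch (hypothetical tensors and network name, not part of
# the UI flow): approximate a weight delta with a rank-8 pair and check the
# relative reconstruction error.
#
#   handler = SVDHandler()
#   handler.network_name = 'lora_unet_example'
#   base = torch.randn(320, 320)
#   tuned = base + 0.01 * torch.randn(320, 320)
#   handler.decompose(tuned, base)
#   handler.findrank(maxrank=8, rankratio=1)
#   pair = handler.makeweights()
#   up = pair['lora_unet_example.lora_up.weight'].to(torch.float)
#   down = pair['lora_unet_example.lora_down.weight'].to(torch.float)
#   rel_err = torch.linalg.norm(up @ down - (tuned - base)) / torch.linalg.norm(tuned - base)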
def loaded_lora():
    if not shared.sd_loaded:
        return ""
    loaded = set()
    if hasattr(shared.sd_model, 'unet'):
        for name, module in shared.sd_model.unet.named_modules():
            current = getattr(module, "network_current_names", None)
            if current is not None:
                current = [item[0] for item in current]
                loaded.update(current)
    return ", ".join(list(loaded))
def make_lora(basename, rank, auto_rank, rank_ratio, constant_rank):
    if not shared.sd_loaded or not shared.native or loaded_lora() == "":
        return
    rank = int(rank)
    rank_ratio = 1 if not auto_rank else rank_ratio
    constant_rank = False if not auto_rank else constant_rank
    rank_override = 0 if constant_rank else None

    if hasattr(shared.sd_model, 'text_encoder') and shared.sd_model.text_encoder is not None:
        for name, module in shared.sd_model.text_encoder.named_modules():
            weights_backup = getattr(module, "network_weights_backup", None)
            if weights_backup is None or getattr(module, "network_current_names", None) is None:
                continue
            prefix = "lora_te1_" if hasattr(shared.sd_model, 'text_encoder_2') else "lora_te_"
            module.svdhandler = SVDHandler()
            module.svdhandler.network_name = prefix + name.replace(".", "_")
            with devices.inference_context():
                module.svdhandler.decompose(module.weight, weights_backup)
            module.svdhandler.findrank(rank, rank_ratio)
    print("TE1 done")

    if hasattr(shared.sd_model, 'text_encoder_2'):
        for name, module in shared.sd_model.text_encoder_2.named_modules():
            weights_backup = getattr(module, "network_weights_backup", None)
            if weights_backup is None or getattr(module, "network_current_names", None) is None:
                continue
            module.svdhandler = SVDHandler()
            module.svdhandler.network_name = "lora_te2_" + name.replace(".", "_")
            with devices.inference_context():
                module.svdhandler.decompose(module.weight, weights_backup)
            module.svdhandler.findrank(rank, rank_ratio)
    print("TE2 done")
    if hasattr(shared.sd_model, 'unet'):
        for name, module in shared.sd_model.unet.named_modules():
            weights_backup = getattr(module, "network_weights_backup", None)
            if weights_backup is None or getattr(module, "network_current_names", None) is None:
                continue
            module.svdhandler = SVDHandler()
            module.svdhandler.network_name = "lora_unet_" + name.replace(".", "_")
            with devices.inference_context():
                module.svdhandler.decompose(module.weight, weights_backup)
            module.svdhandler.findrank(rank, rank_ratio)

    # if hasattr(shared.sd_model, 'transformer'):  # TODO: Handle quant for Flux
    #     for name, module in shared.sd_model.transformer.named_modules():
    #         if "norm" in name and "linear" not in name:
    #             continue
    #         weights_backup = getattr(module, "network_weights_backup", None)
    #         if weights_backup is None:
    #             continue
    #         module.svdhandler = SVDHandler()
    #         module.svdhandler.network_name = "lora_transformer_" + name.replace(".", "_")
    #         module.svdhandler.decompose(module.weight, weights_backup)
    #         module.svdhandler.findrank(rank, rank_ratio)

    submodelname = ['text_encoder', 'text_encoder_2', 'unet', 'transformer']

    if constant_rank:
        for sub in submodelname:
            submodel = getattr(shared.sd_model, sub, None)
            if submodel is not None:
                for name, module in submodel.named_modules():
                    if not hasattr(module, "svdhandler"):
                        continue
                    rank_override = max(rank_override, module.svdhandler.rank)
        print(f"rank_override: {rank_override}")

    lora_state_dict = {}
    for sub in submodelname:
        submodel = getattr(shared.sd_model, sub, None)
        if submodel is not None:
            for name, module in submodel.named_modules():
                if not hasattr(module, "svdhandler"):
                    continue
                lora_state_dict.update(module.svdhandler.makeweights(rank_override))
                del module.svdhandler

    save_file(lora_state_dict, path.join(shared.cmd_opts.lora_dir, basename + ".safetensors"))
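# Round-trip sketch (assumption: a file previously written by make_lora; the
# filename here is hypothetical). The exported network can be inspected with
# safetensors' load_file:
#
#   from safetensors.torch import load_file
#   sd = load_file(path.join(shared.cmd_opts.lora_dir, 'mylora.safetensors'))
#   for key in list(sd)[:6]:
#       print(key, tuple(sd[key].shape), sd[key].dtype)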
def create_ui():
    def gr_show(visible=True):
        return {"visible": visible, "__type__": "update"}

    with gr.Tab(label="Extract LoRA"):
        with gr.Row():
            loaded = gr.Textbox(label="Loaded LoRA", interactive=False)
            # create_refresh_button(loaded, lambda: None, gr.update(value=loaded_lora()), "testid")
            create_refresh_button(loaded, lambda: None, lambda: {'value': loaded_lora()}, "testid")
        with gr.Row():
            rank = gr.Number(value=0, label="Optional max rank")
        with gr.Row():
            auto_rank = gr.Checkbox(value=False, label="Automatically determine rank")
        with gr.Row(visible=False) as rank_options:
            rank_ratio = gr.Slider(minimum=0, maximum=1, value=1, label="Autorank ratio", visible=True)
            constant_rank = gr.Checkbox(value=False, label="Constant rank", visible=True)
        with gr.Row():
            basename = gr.Textbox(label="Base name for LoRA")
        with gr.Row():
            extract = gr.Button(value="Extract LoRA", variant='primary')

        auto_rank.change(fn=lambda x: gr_show(x), inputs=[auto_rank], outputs=[rank_options])
        # extract.click(
        #     fn=wrap_gradio_gpu_call(make_lora(basename, rank, auto_rank, rank_ratio, constant_rank), extra_outputs=None),
        #     _js='loraextract', inputs=[], outputs=[])
        extract.click(fn=make_lora, inputs=[basename, rank, auto_rank, rank_ratio, constant_rank], outputs=[])
        # extract.click(fn=lambda: None)
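# Manual test harness (a sketch; SD.Next normally registers this tab through
# its own script/extension framework, so this is only for running the tab
# standalone):
#
#   with gr.Blocks() as demo:
#       create_ui()
#   demo.launch()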