black and ruff linting pass cleanup #22

Draft · wants to merge 1 commit into master
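Most of the diff below is a mechanical black/ruff pass (double quotes, wrapped long lines, trailing commas), but it also carries a few edits that go beyond formatting: the unused `argparse` import is commented out, `merge()`'s first parameter is renamed from `weights` to `input_weights` (and the dead `weights = None` branch becomes `weights = []`), and `load_model()` now raises a `RuntimeError` on a failed checkpoint lookup instead of crashing later with an `UnboundLocalError` on the unbound `model_file`. A quick way to separate cosmetic changes from behavioral ones is to compare the ASTs of the two file versions; here is a minimal sketch, not part of this PR, with hypothetical before/after paths:

```python
# Minimal sketch (not part of this PR): ast.dump() normalizes quoting and line
# breaks away, so a pure formatting pass leaves it unchanged.
import ast


def same_ast(old_path: str, new_path: str) -> bool:
    """Return True if two Python source files parse to identical ASTs."""
    with open(old_path) as f_old, open(new_path) as f_new:
        return ast.dump(ast.parse(f_old.read())) == ast.dump(ast.parse(f_new.read()))


# For this PR the check would return False: the parameter rename and the
# load_model() error handling are real behavior changes, not formatting.
# Both paths below are hypothetical placeholders.
print(same_ast("merge_block_weighted.py.orig", "scripts/mbw/merge_block_weighted.py"))
```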
99 changes: 66 additions & 33 deletions scripts/mbw/merge_block_weighted.py
@@ -7,7 +7,8 @@
 # bbc-mc
 
 import os
-import argparse
+
+# import argparse
 import re
 import torch
 from tqdm import tqdm
@@ -22,21 +23,30 @@
 
 KEY_POSITION_IDS = "cond_stage_model.transformer.text_model.embeddings.position_ids"
 
+
 def dprint(str, flg):
     if flg:
         print(str)
 
-def merge(weights:list, model_0, model_1, device="cpu", base_alpha=0.5,
-        output_file="", allow_overwrite=False, verbose=False,
-        save_as_safetensors=False,
-        save_as_half=False,
-        skip_position_ids=0
-        ):
-    if weights is None:
-        weights = None
+
+def merge(
+    input_weights: str,
+    model_0,
+    model_1,
+    device="cpu",
+    base_alpha=0.5,
+    output_file="",
+    allow_overwrite=False,
+    verbose=False,
+    save_as_safetensors=False,
+    save_as_half=False,
+    skip_position_ids=0,
+):
+    if input_weights is None:
+        weights = []
     else:
-        weights = [float(w) for w in weights.split(',')]
+        weights = [float(w) for w in input_weights.split(",")]
 
         if len(weights) != NUM_TOTAL_BLOCKS:
             _err_msg = f"weights value must be {NUM_TOTAL_BLOCKS}."
             print(_err_msg)
@@ -46,8 +56,10 @@ def merge(weights:list, model_0, model_1, device="cpu", base_alpha=0.5,
 
     def load_model(_model, _device="cpu"):
         model_info = sd_models.get_closet_checkpoint_match(_model)
-        if model_info:
-            model_file = model_info.filename
+        if model_info is None:
+            raise RuntimeError("invalid model filename")
+
+        model_file = model_info.filename
         return sd_models.read_state_dict(model_file, map_location=_device)
 
     print("loading", model_0)
@@ -69,42 +81,48 @@ def load_model(_model, _device="cpu"):
         print(_err_msg)
         return False, _err_msg
 
-    re_inp = re.compile(r'\.input_blocks\.(\d+)\.') # 12
-    re_mid = re.compile(r'\.middle_block\.(\d+)\.') # 1
-    re_out = re.compile(r'\.output_blocks\.(\d+)\.') # 12
+    re_inp = re.compile(r"\.input_blocks\.(\d+)\.")  # 12
+    re_mid = re.compile(r"\.middle_block\.(\d+)\.")  # 1
+    re_out = re.compile(r"\.output_blocks\.(\d+)\.")  # 12
 
     print(" merging ...")
-    dprint(f"-- start Stage 1/2 --", verbose)
+    dprint("-- start Stage 1/2 --", verbose)
     count_target_of_basealpha = 0
-    for key in (tqdm(theta_0.keys(), desc="Stage 1/2")):
+    for key in tqdm(theta_0.keys(), desc="Stage 1/2"):
         if "model" in key and key in theta_1:
 
             if KEY_POSITION_IDS in key:
                 print(key)
                 if skip_position_ids == 1:
-                    print(f" modelA: skip 'position_ids' : dtype:{theta_0[KEY_POSITION_IDS].dtype}")
+                    print(
+                        f" modelA: skip 'position_ids' : dtype:{theta_0[KEY_POSITION_IDS].dtype}"
+                    )
                     dprint(f"{theta_0[KEY_POSITION_IDS]}", verbose)
                     continue
                 elif skip_position_ids == 2:
                     theta_0[key] = torch.tensor([list(range(77))], dtype=torch.int64)
-                    print(f" modelA: reset 'position_ids': dtype:{theta_0[KEY_POSITION_IDS].dtype}")
+                    print(
+                        f" modelA: reset 'position_ids': dtype:{theta_0[KEY_POSITION_IDS].dtype}"
+                    )
                     dprint(f"{theta_0[KEY_POSITION_IDS]}", verbose)
                     continue
                 else:
-                    print(f" modelA: 'position_ids' key found. do nothing : {skip_position_ids}: dtype:{theta_0[KEY_POSITION_IDS].dtype}")
+                    print(
+                        f" modelA: 'position_ids' key found. do nothing : {skip_position_ids}: dtype:{theta_0[KEY_POSITION_IDS].dtype}"
+                    )
 
             dprint(f" key : {key}", verbose)
             current_alpha = alpha
 
             # check weighted and U-Net or not
-            if weights is not None and 'model.diffusion_model.' in key:
+            if weights is not None and "model.diffusion_model." in key:
                 # check block index
                 weight_index = -1
 
-                if 'time_embed' in key:
-                    weight_index = 0 # before input blocks
-                elif '.out.' in key:
-                    weight_index = NUM_TOTAL_BLOCKS - 1 # after output blocks
+                if "time_embed" in key:
+                    weight_index = 0  # before input blocks
+                elif ".out." in key:
+                    weight_index = NUM_TOTAL_BLOCKS - 1  # after output blocks
                 else:
                     m = re_inp.search(key)
                     if m:
@@ -118,45 +136,56 @@ def load_model(_model, _device="cpu"):
                         m = re_out.search(key)
                         if m:
                             out_idx = int(m.groups()[0])
-                            weight_index = NUM_INPUT_BLOCKS + NUM_MID_BLOCK + out_idx
+                            weight_index = (
+                                NUM_INPUT_BLOCKS + NUM_MID_BLOCK + out_idx
+                            )
 
                 if weight_index >= NUM_TOTAL_BLOCKS:
                     print(f"error. illegal block index: {key}")
                     return False, ""
 
                 if weight_index >= 0:
                     current_alpha = weights[weight_index]
                     dprint(f"weighted '{key}': {current_alpha}", verbose)
                 else:
                     count_target_of_basealpha = count_target_of_basealpha + 1
                     dprint(f"base_alpha applied: [{key}]", verbose)
 
-            theta_0[key] = (1 - current_alpha) * theta_0[key] + current_alpha * theta_1[key]
+            theta_0[key] = (1 - current_alpha) * theta_0[key] + current_alpha * theta_1[
+                key
+            ]
+
             if save_as_half:
                 theta_0[key] = theta_0[key].half()
 
         else:
            dprint(f" key - {key}", verbose)
 
-    dprint(f"-- start Stage 2/2 --", verbose)
+    dprint("-- start Stage 2/2 --", verbose)
     for key in tqdm(theta_1.keys(), desc="Stage 2/2"):
         if "model" in key and key not in theta_0:
 
             if KEY_POSITION_IDS in key:
                 if skip_position_ids == 1:
-                    print(f" modelB: skip 'position_ids' : {theta_0[KEY_POSITION_IDS].dtype}")
+                    print(
+                        f" modelB: skip 'position_ids' : {theta_0[KEY_POSITION_IDS].dtype}"
+                    )
                     dprint(f"{theta_0[KEY_POSITION_IDS]}", verbose)
                     continue
                 elif skip_position_ids == 2:
                     theta_0[key] = torch.tensor([list(range(77))], dtype=torch.int64)
-                    print(f" modelB: reset 'position_ids': {theta_0[KEY_POSITION_IDS].dtype}")
+                    print(
+                        f" modelB: reset 'position_ids': {theta_0[KEY_POSITION_IDS].dtype}"
+                    )
                     dprint(f"{theta_0[KEY_POSITION_IDS]}", verbose)
                     continue
                 else:
-                    print(f" modelB: 'position_ids' key found. do nothing : {skip_position_ids}")
+                    print(
+                        f" modelB: 'position_ids' key found. do nothing : {skip_position_ids}"
+                    )
 
             dprint(f" key : {key}", verbose)
-            theta_0.update({key:theta_1[key]})
+            theta_0.update({key: theta_1[key]})
 
             if save_as_half:
                 theta_0[key] = theta_0[key].half()
@@ -171,10 +200,14 @@ def load_model(_model, _device="cpu"):
     if save_as_safetensors and extension.lower() != ".safetensors":
         output_file = output_file + ".safetensors"
         import safetensors.torch
+
         safetensors.torch.save_file(theta_0, output_file, metadata={"format": "pt"})
     else:
         torch.save({"state_dict": theta_0}, output_file)
 
     print("Done!")
 
-    return True, f"{output_file}<br>base_alpha applied [{count_target_of_basealpha}] times."
+    return (
+        True,
+        f"{output_file}<br>base_alpha applied [{count_target_of_basealpha}] times.",
+    )
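For reference, a hypothetical call against the new signature. The rename clarifies that the first argument is a comma-separated string, not the pre-parsed list the old `weights:list` annotation suggested; the 25 is NUM_TOTAL_BLOCKS (12 input + 1 middle + 12 output blocks, per the regex comments above). Model and output names are placeholders:

```python
# Hypothetical usage sketch of merge() after this PR; not part of the diff.
ok, msg = merge(
    input_weights=",".join(["0.5"] * 25),  # one ratio per U-Net block
    model_0="modelA.ckpt",  # placeholder checkpoint names
    model_1="modelB.ckpt",
    base_alpha=0.5,  # ratio for keys outside the weighted U-Net blocks
    output_file="merged.safetensors",
    save_as_safetensors=True,
)
print(ok, msg)  # merge() returns a (success, message) tuple
```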