feat: reduce batching on flux
db0 committed Sep 11, 2024
1 parent ea24368 commit dca63e0
Showing 3 changed files with 16 additions and 0 deletions.
8 changes: 8 additions & 0 deletions horde/classes/stable/waiting_prompt.py
@@ -18,6 +18,7 @@
KNOWN_LCM_LORA_VERSIONS,
KNOWN_POST_PROCESSORS,
SECOND_ORDER_SAMPLERS,
BASELINE_BATCHING_MULTIPLIERS,
)
from horde.flask import db
from horde.image import convert_pil_to_b64
@@ -511,5 +512,12 @@ def has_heavy_operations(self):
return True
return False

def get_highest_model_batching_multiplier(self):
highest_multiplier = 1
for mn in self.get_model_names():
if BASELINE_BATCHING_MULTIPLIERS.get(mn, 1) > highest_multiplier:
highest_multiplier = BASELINE_BATCHING_MULTIPLIERS.get(mn, 1)
return highest_multiplier

def count_pp(self):
return len(self.params.get("post_processing", []))
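For context, a minimal standalone sketch of what the new helper computes: the request's model names are checked against BASELINE_BATCHING_MULTIPLIERS (added in horde/consts.py below) and the largest multiplier wins, with unlisted models defaulting to 1. The name "some_sdxl_model" and the example requests are assumed purely for illustration.

# Sketch only; mirrors get_highest_model_batching_multiplier outside the class.
BASELINE_BATCHING_MULTIPLIERS = {
    "flux.1": 2,
}

def highest_model_batching_multiplier(model_names):
    # Unlisted models default to 1, so a mixed request is governed by
    # the heaviest (largest-multiplier) model it lists.
    return max((BASELINE_BATCHING_MULTIPLIERS.get(mn, 1) for mn in model_names), default=1)

print(highest_model_batching_multiplier(["some_sdxl_model"]))            # 1
print(highest_model_batching_multiplier(["flux.1", "some_sdxl_model"]))  # 2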
1 change: 1 addition & 0 deletions horde/classes/stable/worker.py
@@ -225,6 +225,7 @@ def get_safe_amount(self, amount, wp):
if wp.has_heavy_operations():
pp_multiplier *= 1.8
mps *= pp_multiplier
mps *= wp.get_highest_model_batching_multiplier()
safe_amount = round(safe_generations / mps)
if safe_amount > amount:
safe_amount = amount
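A rough worked example of the intended effect in get_safe_amount, with every number assumed for illustration (the real safe_generations and mps values come from the worker's tracked performance):

# Assumed figures, for illustration only.
safe_generations = 16   # generations this worker is trusted to batch per job
mps = 2.0               # per-image cost figure, already scaled by pp_multiplier

# Non-flux request: no extra multiplier is applied.
print(round(safe_generations / mps))        # 8 images per batch

# flux.1 request: mps is doubled by the new multiplier, halving the batch.
print(round(safe_generations / (mps * 2)))  # 4 images per batch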
7 changes: 7 additions & 0 deletions horde/consts.py
@@ -38,6 +38,13 @@
"4x_AnimeSharp" "CodeFormers",
}

# These models are very large in VRAM, so we increase the calculated MPS
# used to figure out batches by a set multiplier to reduce how many images are batched
# at a time when these models are used.
BASELINE_BATCHING_MULTIPLIERS = {
"flux.1": 2,
}


KNOWN_SAMPLERS = {
"k_lms",