Merge pull request #14 from Aatricks/cond-dynamic-width-scaling-451456543888025473

Aatricks · web-flow · commit 625ac6f472e3 · 2026-01-10T20:52:54.000+01:00
Dynamic Width Scaling in Condition Encoding
diff --git a/src/Utilities/Latent.py b/src/Utilities/Latent.py
@@ -15,7 +15,8 @@ class LatentFormat:
 
     scale_factor: float = 1.0
     latent_channels: int = 4
-    
+    downscale_factor: int = 8
+
     def process_in(self, latent: torch.Tensor) -> torch.Tensor:
         """#### Process the latent input, by multiplying it by the scale factor.
 
diff --git a/src/cond/cond.py b/src/cond/cond.py
@@ -588,10 +588,19 @@ def encode_model_conds(
         params["device"] = device
         params["noise"] = noise
         default_width = None
-        if len(noise.shape) >= 4:  # TODO: 8 multiple should be set by the model
-            default_width = noise.shape[3] * 8
+
+        downscale_factor = 8
+        if hasattr(model_function, "__self__"):
+            model = model_function.__self__
+            if hasattr(model, "latent_format") and hasattr(
+                model.latent_format, "downscale_factor"
+            ):
+                downscale_factor = model.latent_format.downscale_factor
+
+        if len(noise.shape) >= 4:
+            default_width = noise.shape[3] * downscale_factor
         params["width"] = params.get("width", default_width)
-        params["height"] = params.get("height", noise.shape[2] * 8)
+        params["height"] = params.get("height", noise.shape[2] * downscale_factor)
         params["prompt_type"] = params.get("prompt_type", prompt_type)
         for k in kwargs:
             if k not in params: