Improve comments, optimize memory in blur routine

2026-02-16 00:12:33 +08:00 · 2023-12-07 12:02:40 +01:00 · 2023-12-07 12:02:40 +01:00 · ecd098a7fd
commit ecd098a7fd
parent f8d719f9e7
2 changed files with 5 additions and 8 deletions
--- a/comfy/samplers.py
+++ b/comfy/samplers.py
@@ -257,19 +257,18 @@ def sampling_function(model, x, timestep, uncond, cond, cond_scale, model_option
            return x - model_options["sampler_cfg_function"](args)
        # if cfg = 1.0, we can't do sag
        elif "sag" in model_options:
            assert uncond is not None, "SAG requires uncond guidance"
            sag_scale = model_options["sag_scale"]
            sag_sigma = model_options["sag_sigma"]
            sag_threshold = model_options.get("sag_threshold", 1.0)
-            # this method is added by the sag patcher
+            # these methods are added by the sag patcher
            uncond_attn = model.get_attn_scores()
            mid_shape = model.get_mid_block_shape()
            degraded = create_blur_map(uncond_pred, uncond_attn, mid_shape, sag_sigma, sag_threshold)
            degraded_noised = degraded + x - uncond_pred
-            assert uncond is not None, "SAG requires uncond guidance"
+            # call into the UNet with the adversarially blurred image
            (sag, _) = calc_cond_uncond_batch(model, uncond, None, degraded_noised, timestep, model_options)
            # Unless I've misunderstood the paper, this is supposed to be   (uncond_pred - sag) * sag_scale.
            # but this is what the automatic1111 implementation does, and it works better??
            return uncond_pred + (cond_pred - uncond_pred) * cond_scale + (degraded - sag) * sag_scale
        else:
            return uncond_pred + (cond_pred - uncond_pred) * cond_scale
@@ -277,7 +276,7 @@ def sampling_function(model, x, timestep, uncond, cond, cond_scale, model_option
 def create_blur_map(x0, attn, mid_shape, sigma=3.0, threshold=1.0):
    # reshape and GAP the attention map
    _, hw1, hw2 = attn.shape
-    b, lc, lh, lw = x0.shape
+    b, _, lh, lw = x0.shape
    attn = attn.reshape(b, -1, hw1, hw2)
    # Global Average Pool
    mask = attn.mean(1, keepdim=False).sum(1, keepdim=False) > threshold
@@ -285,7 +284,6 @@ def create_blur_map(x0, attn, mid_shape, sigma=3.0, threshold=1.0):
    mask = (
        mask.reshape(b, *mid_shape)
        .unsqueeze(1)
-        .repeat(1, lc, 1, 1)
        .type(attn.dtype)
    )
    # Upsample
--- a/comfy_extras/nodes_sag.py
+++ b/comfy_extras/nodes_sag.py
@@ -101,7 +101,6 @@ class SagNode:
            if name not in to["patches_replace"]:
                to["patches_replace"][name] = {}
            to["patches_replace"][name][key] = patch
-        # this actually patches 2 attn calls -- confusing, since we only want to get one
        set_model_patch_replace(attn_and_record, "attn1", ("middle", 0, 0))
        # from diffusers:
        # unet.mid_block.attentions[0].register_forward_hook()