-
Notifications
You must be signed in to change notification settings - Fork 2.4k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Modular backend - add rescale cfg (#6640)
## Summary Rescale CFG code from #6577. ## Related Issues / Discussions #6606 https://invokeai.notion.site/Modular-Stable-Diffusion-Backend-Design-Document-e8952daab5d5472faecdc4a72d377b0d ## QA Instructions Run with and without set `USE_MODULAR_DENOISE` environment. ~~Note: for some reasons there slightly different output from run to run, but I able sometimes to get same output on main and this branch.~~ Fix presented in #6641. ## Merge Plan ~~Nope.~~ Merge #6641 firstly, to be able see output difference properly. If you think that there should be some kind of tests - feel free to add. ## Checklist - [x] _The PR has a short but descriptive title, suitable for a changelog_ - [ ] _Tests added / updated (if applicable)_ - [ ] _Documentation added / updated (if applicable)_
- Loading branch information
Showing
5 changed files
with
56 additions
and
15 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
36 changes: 36 additions & 0 deletions
36
invokeai/backend/stable_diffusion/extensions/rescale_cfg.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,36 @@ | ||
from __future__ import annotations | ||
|
||
from typing import TYPE_CHECKING | ||
|
||
import torch | ||
|
||
from invokeai.backend.stable_diffusion.extension_callback_type import ExtensionCallbackType | ||
from invokeai.backend.stable_diffusion.extensions.base import ExtensionBase, callback | ||
|
||
if TYPE_CHECKING: | ||
from invokeai.backend.stable_diffusion.denoise_context import DenoiseContext | ||
|
||
|
||
class RescaleCFGExt(ExtensionBase): | ||
def __init__(self, rescale_multiplier: float): | ||
super().__init__() | ||
self._rescale_multiplier = rescale_multiplier | ||
|
||
@staticmethod | ||
def _rescale_cfg(total_noise_pred: torch.Tensor, pos_noise_pred: torch.Tensor, multiplier: float = 0.7): | ||
"""Implementation of Algorithm 2 from https://arxiv.org/pdf/2305.08891.pdf.""" | ||
ro_pos = torch.std(pos_noise_pred, dim=(1, 2, 3), keepdim=True) | ||
ro_cfg = torch.std(total_noise_pred, dim=(1, 2, 3), keepdim=True) | ||
|
||
x_rescaled = total_noise_pred * (ro_pos / ro_cfg) | ||
x_final = multiplier * x_rescaled + (1.0 - multiplier) * total_noise_pred | ||
return x_final | ||
|
||
@callback(ExtensionCallbackType.POST_COMBINE_NOISE_PREDS) | ||
def rescale_noise_pred(self, ctx: DenoiseContext): | ||
if self._rescale_multiplier > 0: | ||
ctx.noise_pred = self._rescale_cfg( | ||
ctx.noise_pred, | ||
ctx.positive_noise_pred, | ||
self._rescale_multiplier, | ||
) |