my-sd/modules/sd_samplers_cfg_denoiser.py

import torch
from modules import prompt_parser, sd_samplers_common
from modules.shared import state
import modules.shared as shared
from modules.script_callbacks import CFGDenoiserParams, cfg_denoiser_callback
from modules.script_callbacks import AfterCFGCallbackParams, cfg_after_cfg_callback
from modules_forge import forge_sampler


def catenate_conds(conds):
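    # Conds are plain tensors for SD1/SD2; SDXL-style models pass dicts of
    # tensors (e.g. 'crossattn', 'vector'), so concatenate entry-wise per key.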
    if not isinstance(conds[0], dict):
        return torch.cat(conds)

    return {key: torch.cat([x[key] for x in conds]) for key in conds[0].keys()}


def subscript_cond(cond, a, b):
    if not isinstance(cond, dict):
        return cond[a:b]

    return {key: vec[a:b] for key, vec in cond.items()}


def pad_cond(tensor, repeats, empty):
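    # Pad along the token axis by appending `repeats` copies of the
    # empty-prompt embedding; for dict conds only 'crossattn' is padded.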
    if not isinstance(tensor, dict):
        return torch.cat([tensor, empty.repeat((tensor.shape[0], repeats, 1))], dim=1)

    tensor['crossattn'] = pad_cond(tensor['crossattn'], repeats, empty)
    return tensor


class CFGDenoiser(torch.nn.Module):
    """
    Classifier free guidance denoiser. A wrapper for a stable diffusion model (specifically for the unet)
    that takes a noisy picture and produces a noise-free picture using two guidances (prompts)
    instead of one. Originally the second prompt was just an empty string, but we use a non-empty
    negative prompt.
    """

    def __init__(self, sampler):
        super().__init__()
        self.model_wrap = None
        self.mask = None
        self.nmask = None
        self.init_latent = None
        self.steps = None
        """number of steps as specified by user in UI"""
        self.total_steps = None
        """expected number of calls to the denoiser, calculated from self.steps and the specifics of the selected sampler"""
        self.step = 0
        self.image_cfg_scale = None
        self.padded_cond_uncond = False
        self.padded_cond_uncond_v0 = False
        self.sampler = sampler
        self.p = None

        # Backward Compatibility
        self.mask_before_denoising = False
        self.classic_ddim_eps_estimation = False

    @property
    def inner_model(self):
        raise NotImplementedError()

    def combine_denoised(self, x_out, conds_list, uncond, cond_scale, timestep, x_in, cond):
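        # Classic CFG: start from the unconditional prediction and add the
        # weighted difference of each conditional prediction, i.e. roughly
        #   denoised[i] = uncond[i] + sum(weight * cond_scale * (cond_j - uncond[i]))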
        denoised_uncond = x_out[-uncond.shape[0]:]
        denoised = torch.clone(denoised_uncond)

        for i, conds in enumerate(conds_list):
            for cond_index, weight in conds:
                denoised[i] += (x_out[cond_index] - denoised_uncond[i]) * (weight * cond_scale)

        return denoised

    def combine_denoised_for_edit_model(self, x_out, cond_scale):
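        # Two-scale guidance for instruct-pix2pix style edit models: text
        # guidance scaled by cond_scale, image guidance by self.image_cfg_scale.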
        out_cond, out_img_cond, out_uncond = x_out.chunk(3)
        denoised = out_uncond + cond_scale * (out_cond - out_img_cond) + self.image_cfg_scale * (out_img_cond - out_uncond)

        return denoised

    def get_pred_x0(self, x_in, x_out, sigma):
        return x_out

    def update_inner_model(self):
        self.model_wrap = None

        c, uc = self.p.get_conds()
        self.sampler.sampler_extra_args['cond'] = c
        self.sampler.sampler_extra_args['uncond'] = uc

    def pad_cond_uncond(self, cond, uncond):
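        # Make cond and uncond the same token length by appending whole copies
        # of the empty-prompt embedding to whichever is shorter; the length
        # difference is assumed to be a multiple of the empty prompt's length.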
        empty = shared.sd_model.cond_stage_model_empty_prompt
        num_repeats = (cond.shape[1] - uncond.shape[1]) // empty.shape[1]

        if num_repeats < 0:
            cond = pad_cond(cond, -num_repeats, empty)
            self.padded_cond_uncond = True
        elif num_repeats > 0:
            uncond = pad_cond(uncond, num_repeats, empty)
            self.padded_cond_uncond = True

        return cond, uncond

    def pad_cond_uncond_v0(self, cond, uncond):
        """
        Pads the 'uncond' tensor to match the shape of the 'cond' tensor.

        If 'uncond' is a dictionary, it is assumed that the 'crossattn' key holds the tensor to be padded.
        If 'uncond' is a tensor, it is padded directly.

        If the number of columns in 'uncond' is less than the number of columns in 'cond', the last column of
        'uncond' is repeated to match the number of columns in 'cond'.

        If the number of columns in 'uncond' is greater than the number of columns in 'cond', 'uncond' is
        truncated to match the number of columns in 'cond'.

        Args:
            cond (torch.Tensor or DictWithShape): The condition tensor to match the shape of 'uncond'.
            uncond (torch.Tensor or DictWithShape): The tensor to be padded, or a dictionary containing the tensor to be padded.

        Returns:
            tuple: A tuple containing the 'cond' tensor and the padded 'uncond' tensor.

        Note:
            This is the padding that was always used in DDIM before version 1.6.0.
        """

        is_dict_cond = isinstance(uncond, dict)
        uncond_vec = uncond['crossattn'] if is_dict_cond else uncond

        if uncond_vec.shape[1] < cond.shape[1]:
            last_vector = uncond_vec[:, -1:]
            last_vector_repeated = last_vector.repeat([1, cond.shape[1] - uncond_vec.shape[1], 1])
            uncond_vec = torch.hstack([uncond_vec, last_vector_repeated])
            self.padded_cond_uncond_v0 = True
        elif uncond_vec.shape[1] > cond.shape[1]:
            uncond_vec = uncond_vec[:, :cond.shape[1]]
            self.padded_cond_uncond_v0 = True

        if is_dict_cond:
            uncond['crossattn'] = uncond_vec
        else:
            uncond = uncond_vec

        return cond, uncond

    def forward(self, x, sigma, uncond, cond, cond_scale, s_min_uncond, image_cond):
        if state.interrupted or state.skipped:
            raise sd_samplers_common.InterruptedException

        original_x_device = x.device
        original_x_dtype = x.dtype

        if self.classic_ddim_eps_estimation:
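            # Classic DDIM passes a discrete timestep index rather than a
            # continuous sigma; recover the corresponding sigma from
            # alphas_cumprod and rescale x to the variance-exploding convention.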
            acd = self.inner_model.inner_model.alphas_cumprod
            fake_sigmas = ((1 - acd) / acd) ** 0.5
            real_sigma = fake_sigmas[sigma.round().long().clip(0, int(fake_sigmas.shape[0]) - 1)]
            real_sigma_data = 1.0
            x = x * (real_sigma ** 2.0 + real_sigma_data ** 2.0) ** 0.5
            sigma = real_sigma

        if sd_samplers_common.apply_refiner(self, x):
            cond = self.sampler.sampler_extra_args['cond']
            uncond = self.sampler.sampler_extra_args['uncond']

        cond_composition, cond = prompt_parser.reconstruct_multicond_batch(cond, self.step)
        uncond = prompt_parser.reconstruct_cond_batch(uncond, self.step)

        if self.mask is not None:
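            # Inpainting: re-noise the original latent to the current sigma and
            # blend it with x, keeping the masked region from the original image.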
            noisy_initial_latent = self.init_latent + sigma[:, None, None, None] * torch.randn_like(self.init_latent).to(self.init_latent)
            x = x * self.nmask + noisy_initial_latent * self.mask

        denoiser_params = CFGDenoiserParams(x, image_cond, sigma, state.sampling_step, state.sampling_steps, cond, uncond, self)
        cfg_denoiser_callback(denoiser_params)

        denoised = forge_sampler.forge_sample(self, denoiser_params=denoiser_params,
                                              cond_scale=cond_scale, cond_composition=cond_composition)

        if self.mask is not None:
            denoised = denoised * self.nmask + self.init_latent * self.mask

        preview = self.sampler.last_latent = denoised
        sd_samplers_common.store_latent(preview)

        after_cfg_callback_params = AfterCFGCallbackParams(denoised, state.sampling_step, state.sampling_steps)
        cfg_after_cfg_callback(after_cfg_callback_params)
        denoised = after_cfg_callback_params.x

        self.step += 1

        if self.classic_ddim_eps_estimation:
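            # Classic DDIM expects an epsilon prediction, so convert the
            # denoised (x0-style) output back: eps = (x - denoised) / sigma.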
            eps = (x - denoised) / sigma
            return eps

        return denoised.to(device=original_x_device, dtype=original_x_dtype)