better sigmas for sd1.5 as refiner

2023-10-12 18:31:42 -07:00 · 2023-10-12 18:31:42 -07:00 · 3b9266e848
parent 26fe88d8a6
commit 3b9266e848
4 changed files with 49 additions and 33 deletions
--- a/fooocus_version.py
+++ b/fooocus_version.py
@ -1 +1 @@
-version = '2.1.53'
+version = '2.1.54'
--- a/modules/core.py
+++ b/modules/core.py
@ -204,17 +204,19 @@ def get_previewer(model):
 def ksampler(model, positive, negative, latent, seed=None, steps=30, cfg=7.0, sampler_name='dpmpp_fooocus_2m_sde_inpaint_seamless',
             scheduler='karras', denoise=1.0, disable_noise=False, start_step=None, last_step=None,
             force_full_denoise=False, callback_function=None, refiner=None, refiner_switch=-1,
-             previewer_start=None, previewer_end=None, sigmas=None):
+             previewer_start=None, previewer_end=None, sigmas=None, noise=None):

    if sigmas is not None:
        sigmas = sigmas.clone().to(fcbh.model_management.get_torch_device())

    latent_image = latent["samples"]
-    if disable_noise:
-        noise = torch.zeros(latent_image.size(), dtype=latent_image.dtype, layout=latent_image.layout, device="cpu")
-    else:
-        batch_inds = latent["batch_index"] if "batch_index" in latent else None
-        noise = fcbh.sample.prepare_noise(latent_image, seed, batch_inds)
+
+    if noise is None:
+        if disable_noise:
+            noise = torch.zeros(latent_image.size(), dtype=latent_image.dtype, layout=latent_image.layout, device="cpu")
+        else:
+            batch_inds = latent["batch_index"] if "batch_index" in latent else None
+            noise = fcbh.sample.prepare_noise(latent_image, seed, batch_inds)

    noise_mask = None
    if "noise_mask" in latent:
--- a/modules/default_pipeline.py
+++ b/modules/default_pipeline.py
@ -5,6 +5,7 @@ import modules.path
 import fcbh.model_management
 import fcbh.latent_formats
 import modules.inpaint_worker
+import modules.sample_hijack as sample_hijack

 from fcbh.model_base import SDXL, SDXLRefiner
 from modules.expansion import FooocusExpansion
@ -327,6 +328,8 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
    else:
        empty_latent = latent

+    decoded_latent = None
+
    if refiner_swap_method == 'joint':
        sampled_latent = core.ksampler(
            model=final_unet,
@ -346,8 +349,6 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
            previewer_end=steps,
        )
        decoded_latent = core.decode_vae(vae=final_vae, latent_image=sampled_latent, tiled=tiled)
-        images = core.pytorch_to_numpy(decoded_latent)
-        return images

    if refiner_swap_method == 'upscale':
        target_model = final_refiner_unet
@ -374,8 +375,6 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
        if target_model is None:
            target_model = final_vae
        decoded_latent = core.decode_vae(vae=target_model, latent_image=sampled_latent, tiled=tiled)
-        images = core.pytorch_to_numpy(decoded_latent)
-        return images

    if refiner_swap_method == 'separate':
        sampled_latent = core.ksampler(
@ -420,23 +419,10 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
        if target_model is None:
            target_model = final_vae
        decoded_latent = core.decode_vae(vae=target_model, latent_image=sampled_latent, tiled=tiled)
-        images = core.pytorch_to_numpy(decoded_latent)
-        return images

    if refiner_swap_method == 'vae':
-        sigmas = calculate_sigmas(sampler=sampler_name, scheduler=scheduler_name, model=final_unet.model, steps=steps, denoise=denoise)
-        sigmas_a = sigmas[:switch]
-        sigmas_b = sigmas[switch:]
-
-        if final_refiner_unet is not None:
-            k1 = final_refiner_unet.model.latent_format.scale_factor
-            k2 = final_unet.model.latent_format.scale_factor
-            k = float(k1) / float(k2)
-            sigmas_b = sigmas_b * k
-
-        sigmas = torch.cat([sigmas_a, sigmas_b], dim=0)
-
-        sampled_latent = core.ksampler(
+        sample_hijack.history_record = []
+        core.ksampler(
            model=final_unet,
            positive=positive_cond,
            negative=negative_cond,
@ -449,8 +435,7 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
            sampler_name=sampler_name,
            scheduler=scheduler_name,
            previewer_start=0,
-            previewer_end=steps,
-            sigmas=sigmas
+            previewer_end=steps
        )
        print('Fooocus VAE-based swap.')

@ -459,6 +444,28 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
            target_model = final_unet
            print('Use base model to refine itself - this may because of developer mode.')

+        sigmas = None
+        len_sigmas = steps - switch
+
+        if final_refiner_unet is not None:
+            sigmas = calculate_sigmas(sampler=sampler_name,
+                                      scheduler=scheduler_name,
+                                      model=final_refiner_unet.model,
+                                      steps=steps,
+                                      denoise=denoise)[switch:]
+            k1 = final_refiner_unet.model.latent_format.scale_factor
+            k2 = final_unet.model.latent_format.scale_factor
+            k = float(k1) / float(k2)
+            sigmas = sigmas * k
+            len_sigmas = len(sigmas) - 1
+
+        last_step, last_clean_latent, last_noisy_latent = sample_hijack.history_record[-1]
+        last_clean_latent = final_unet.model.process_latent_out(last_clean_latent.cpu().to(torch.float32))
+        last_noisy_latent = final_unet.model.process_latent_out(last_noisy_latent.cpu().to(torch.float32))
+        last_noise = last_noisy_latent - last_clean_latent
+        last_noise = last_noise / last_noise.std()
+
+        sampled_latent = {'samples': last_clean_latent}
        sampled_latent = vae_parse(sampled_latent)

        if modules.inpaint_worker.current_task is not None:
@ -469,8 +476,8 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
            positive=clip_separate(positive_cond, target_model=target_model.model, target_clip=final_clip),
            negative=clip_separate(negative_cond, target_model=target_model.model, target_clip=final_clip),
            latent=sampled_latent,
-            steps=steps, start_step=switch, last_step=steps, disable_noise=False, force_full_denoise=True,
-            seed=image_seed,
+            steps=len_sigmas, start_step=0, last_step=len_sigmas, disable_noise=False, force_full_denoise=True,
+            seed=image_seed+1,  # Avoid artifacts
            denoise=denoise,
            callback_function=callback,
            cfg=cfg_scale,
@ -478,7 +485,8 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
            scheduler=scheduler_name,
            previewer_start=switch,
            previewer_end=steps,
-            sigmas=sigmas
+            sigmas=sigmas,
+            noise=last_noise
        )

        if modules.inpaint_worker.current_task is not None:
@ -488,5 +496,7 @@ def process_diffusion(positive_cond, negative_cond, steps, switch, width, height
        if target_model is None:
            target_model = final_vae
        decoded_latent = core.decode_vae(vae=target_model, latent_image=sampled_latent, tiled=tiled)
-        images = core.pytorch_to_numpy(decoded_latent)
-        return images
+
+    images = core.pytorch_to_numpy(decoded_latent)
+    sample_hijack.history_record = None
+    return images
--- a/modules/sample_hijack.py
+++ b/modules/sample_hijack.py
@ -11,6 +11,7 @@ from fcbh.samplers import resolve_areas_and_cond_masks, wrap_model, calculate_st

 current_refiner = None
 refiner_switch_step = -1
+history_record = None


@torch.no_grad()
@ -127,6 +128,9 @@ def sample_hacked(model, noise, positive, negative, cfg, device, sampler, sigmas
        return

    def callback_wrap(step, x0, x, total_steps):
+        global history_record
+        if isinstance(history_record, list):
+            history_record.append((step, x0, x))
        if step == refiner_switch_step and current_refiner is not None:
            refiner_switch()
        if callback is not None: