blepping
diff --git a/‎NOTICE.txt
Lines changed: 5 additions & 0 deletions b/‎NOTICE.txt
Lines changed: 5 additions & 0 deletions
diff --git a/‎py/config.py
Lines changed: 214 additions & 0 deletions b/‎py/config.py
Lines changed: 214 additions & 0 deletions
diff --git a/‎py/external.py
Lines changed: 7 additions & 0 deletions b/‎py/external.py
Lines changed: 7 additions & 0 deletions
diff --git a/‎py/nodes.py
Lines changed: 95 additions & 18 deletions b/‎py/nodes.py
Lines changed: 95 additions & 18 deletions
@@ -0,0 +1,5 @@
+comfyui_jankdiffusehigh
+
+Copyright https://github.com/blepping
+
+This project was referenced from the original implementation at https://github.com/yhyun225/DiffuseHigh
@@ -0,0 +1,214 @@
+from __future__ import annotations
+
+from comfy.samplers import ksampler
+from pytorch_wavelets import DTCWTForward, DTCWTInverse, DWTForward, DWTInverse
+
+from .tensor_image_ops import (
+    BLENDING_MODES,
+    Sharpen,
+)
+from .upscale import Upscale
+from .utils import fallback
+from .vae import VAEHelper
+
+
+class Config:
+    # Option names a per-iteration override is allowed to change. __init__
+    # filters every override dict against this set; keys that are not listed
+    # here are ignored when the per-iteration Config is built.
+    _overridable_fields = {  # noqa: RUF012
+        "blend_by_mode",
+        "blend_mode",
+        "denoised_wavelet_multiplier",
+        "dtcwt_biort",
+        "dtcwt_mode",
+        "dtcwt_qshift",
+        "dwt_flip_filters",
+        "dwt_level",
+        "dwt_mode",
+        "dwt_wave",
+        "fadeout_factor",
+        "guidance_factor",
+        "guidance_mode",
+        "guidance_restart_s_noise",
+        "guidance_restart",
+        "guidance_steps",
+        "iteration_override",
+        "reference_wavelet_multiplier",
+        "renoise_factor",
+        "resample_mode",
+        "rescale_increment",
+        "scale_factor",
+        "sharpen_gaussian_kernel_size",
+        "sharpen_gaussian_sigma",
+        "sharpen_mode",
+        "sharpen_reference",
+        "sharpen_strength",
+        "sigma_offset",
+        "vae_decode_kwargs",
+        "vae_encode_kwargs",
+        "vae_mode",
+    }
+
+    # Public attribute/method names that as_dict() skips while scanning
+    # dir(self): the two methods, the derived helper objects and the
+    # per-iteration override table. as_dict() re-adds constructor-style
+    # entries for some of the helpers (e.g. "vae") explicitly afterwards.
+    _dict_exclude_keys = {  # noqa: RUF012
+        "as_dict",
+        "blend_function",
+        "dwt",
+        "get_iteration_config",
+        "idwt",
+        "iteration_override",
+        "sharpen",
+        "upscale",
+        "vae",
+    }
+
+    def __init__(
+        self,
+        device,
+        dtype,
+        latent_format,
+        *,
+        blend_mode="lerp",
+        blend_by_mode="image",
+        denoised_wavelet_multiplier=1.0,
+        dtcwt_biort="near_sym_a",
+        dtcwt_mode=False,
+        dtcwt_qshift="qshift_a",
+        dwt_flip_filters=False,
+        dwt_level=1,
+        dwt_mode="symmetric",
+        dwt_wave="db4",
+        fadeout_factor=0.0,
+        guidance_factor=1.0,
+        guidance_mode="image",
+        guidance_restart_s_noise=1.0,
+        guidance_restart=0,
+        guidance_sampler=None,
+        guidance_steps=5,
+        iteration_override=None,
+        iterations=1,
+        reference_sampler=None,
+        reference_wavelet_multiplier=1.0,
+        renoise_factor=1.0,
+        resample_mode="bicubic",
+        rescale_increment=64,
+        sampler=None,
+        scale_factor=2.0,
+        sharpen_gaussian_kernel_size=3,
+        sharpen_gaussian_sigma=(0.1, 2.0),
+        sharpen_mode="gaussian",
+        sharpen_reference=True,
+        sharpen_strength=1.0,
+        sigma_offset=0,
+        upscale_model=None,
+        vae_decode_kwargs=None,
+        vae_encode_kwargs=None,
+        vae_mode="normal",
+        vae=None,
+    ):
+        """Store the options and build the helper objects derived from them.
+
+        ``device``, ``dtype`` and ``latent_format`` are forwarded to the VAE
+        helper (``device`` is also where the wavelet transform modules are
+        moved). Every other option is keyword-only.
+
+        ``iteration_override`` may be ``None``/``{}`` (no overrides) or a dict
+        mapping an iteration key (int or str) to a dict of option overrides.
+        For each entry a child ``Config`` is built from this instance's
+        ``as_dict()`` merged with those override entries whose key is listed
+        in ``_overridable_fields``; other override keys are ignored.
+
+        Raises:
+            ValueError: ``blend_by_mode`` is not image, latent or wavelet.
+            TypeError: ``iteration_override`` is not a dict, or one of its
+                items has a non int/str key or a non-dict value.
+
+        An unknown ``blend_mode`` fails the ``BLENDING_MODES`` lookup.
+        """
+        # NOTE(review): fallback() is defined elsewhere; presumably it returns
+        # the second argument (calling it when default_is_fun is set) if the
+        # first one is None - confirm against .utils.
+        sampler = fallback(
+            sampler,
+            lambda: ksampler("euler"),
+            default_is_fun=True,
+        )
+        self.sigma_offset = sigma_offset
+        self.fadeout_factor = fadeout_factor
+        self.scale_factor = scale_factor
+        self.guidance_factor = guidance_factor
+        self.renoise_factor = renoise_factor
+        self.iterations = iterations
+        self.guidance_steps = guidance_steps
+        self.guidance_mode = guidance_mode
+        self.guidance_restart = guidance_restart
+        self.guidance_restart_s_noise = guidance_restart_s_noise
+        self.sampler = sampler
+        self.guidance_sampler = fallback(guidance_sampler, sampler)
+        self.reference_sampler = fallback(reference_sampler, sampler)
+        self.vae = VAEHelper(
+            vae_mode,
+            latent_format,
+            device=device,
+            dtype=dtype,
+            vae=vae,
+            encode_kwargs=fallback(vae_encode_kwargs, {}),
+            decode_kwargs=fallback(vae_decode_kwargs, {}),
+        )
+        # Keep the raw mode as a public attribute: as_dict() only exports what
+        # it finds on the instance, and without this the per-iteration configs
+        # built below would silently fall back to the default sharpen_mode.
+        self.sharpen_mode = sharpen_mode
+        self.sharpen = Sharpen(
+            mode=sharpen_mode,
+            # A strength of 0 is how "do not sharpen the reference" is encoded.
+            strength=sharpen_strength if sharpen_reference else 0,
+            gaussian_kernel_size=sharpen_gaussian_kernel_size,
+            gaussian_sigma=sharpen_gaussian_sigma,
+        )
+        self.upscale = Upscale(
+            resample_mode=resample_mode,
+            rescale_increment=rescale_increment,
+            upscale_model=upscale_model,
+        )
+        self.dwt_mode = dwt_mode
+        self.dwt_level = dwt_level
+        self.dwt_wave = dwt_wave
+        self.dtcwt_mode = dtcwt_mode
+        self.dtcwt_biort = dtcwt_biort
+        self.dtcwt_qshift = dtcwt_qshift
+        # Pick the forward/inverse wavelet transform pair: dual-tree complex
+        # (DTCWT) when dtcwt_mode is set, plain DWT otherwise.
+        if dtcwt_mode:
+            self.dwt = DTCWTForward(
+                J=dwt_level,
+                mode=dwt_mode,
+                biort=dtcwt_biort,
+                qshift=dtcwt_qshift,
+            ).to(device)
+            self.idwt = DTCWTInverse(
+                mode=dwt_mode,
+                biort=dtcwt_biort,
+                qshift=dtcwt_qshift,
+            ).to(device)
+        else:
+            self.dwt = DWTForward(J=dwt_level, wave=dwt_wave, mode=dwt_mode).to(device)
+            self.idwt = DWTInverse(wave=dwt_wave, mode=dwt_mode).to(device)
+        self.dwt_flip_filters = dwt_flip_filters
+        self.reference_wavelet_multiplier = reference_wavelet_multiplier
+        self.denoised_wavelet_multiplier = denoised_wavelet_multiplier
+        self.blend_mode = blend_mode
+        if blend_by_mode not in {"image", "latent", "wavelet"}:
+            raise ValueError("Bad blend_by_mode: must be one of image, latent, wavelet")
+        self.blend_by_mode = blend_by_mode
+        self.blend_function = BLENDING_MODES[blend_mode]
+        # Must exist before as_dict()/get_iteration_config() are usable, even
+        # when no overrides were supplied.
+        self.iteration_override = {}
+        if iteration_override is None or iteration_override == {}:
+            return
+        if not isinstance(iteration_override, dict):
+            raise TypeError("Iteration override must be an object")
+        selfdict = self.as_dict()
+        overrides = self.iteration_override
+        for k, v in iteration_override.items():
+            if not isinstance(k, (int, str)) or not isinstance(v, dict):
+                raise TypeError(
+                    "Bad type for override item: key must be integer or string, value must be an object",
+                )
+            # Child config = this config's options with the permitted
+            # override entries layered on top.
+            okwargs = selfdict | {
+                ok: ov for ok, ov in v.items() if ok in self._overridable_fields
+            }
+            overrides[k] = self.__class__(device, dtype, latent_format, **okwargs)
+
+    def as_dict(self) -> dict:
+        """Return this config's options as a dict of constructor keywords.
+
+        Every public attribute found via ``dir(self)`` is copied unless its
+        name is in ``_dict_exclude_keys``; the options that only live inside
+        the ``vae``, ``sharpen`` and ``upscale`` helpers are then read back
+        from those helpers. ``__init__`` uses the result as the base keyword
+        set for per-iteration override configs.
+        """
+        skipped = self._dict_exclude_keys
+        exported = {}
+        for attr_name in dir(self):
+            if attr_name.startswith("_") or attr_name in skipped:
+                continue
+            exported[attr_name] = getattr(self, attr_name)
+        vae_helper = self.vae
+        sharpener = self.sharpen
+        upscaler = self.upscale
+        exported.update(
+            vae_mode=vae_helper.mode.name.lower(),
+            vae=vae_helper.vae,
+            vae_encode_kwargs=vae_helper.encode_kwargs,
+            vae_decode_kwargs=vae_helper.decode_kwargs,
+            # Sharpening disabled is stored as strength 0 on the helper.
+            sharpen_reference=sharpener.strength != 0,
+            sharpen_strength=sharpener.strength,
+            sharpen_gaussian_kernel_size=sharpener.gaussian_kernel_size,
+            sharpen_gaussian_sigma=sharpener.gaussian_sigma,
+            resample_mode=upscaler.resample_mode,
+            rescale_increment=upscaler.rescale_increment,
+            upscale_model=upscaler.upscale_model,
+        )
+        return exported
+
+    def get_iteration_config(self, iteration):
+        """Return the config to use for ``iteration``.
+
+        Looks ``iteration`` up in ``self.iteration_override``; when an
+        override config is registered under that key the lookup is delegated
+        to it, otherwise this config itself is returned.
+        """
+        per_iteration = self.iteration_override.get(iteration)
+        if not per_iteration:
+            return self
+        return per_iteration.get_iteration_config(iteration)
@@ -7,3 +7,10 @@
     EXTERNAL["tiled_diffusion"] = importlib.import_module(
         "custom_nodes.ComfyUI-TiledDiffusion",
     )
+
+# Optional integration: register ComfyUI-bleh only when it can be imported
+# and reports BLEH_VERSION >= 1; otherwise leave EXTERNAL untouched.
+with contextlib.suppress(ImportError, NotImplementedError):
+    bleh = importlib.import_module("custom_nodes.ComfyUI-bleh")
+    # Builds that do not define BLEH_VERSION are treated as too old (-1).
+    bleh_version = getattr(bleh, "BLEH_VERSION", -1)
+    if not bleh_version < 1:
+        EXTERNAL["bleh"] = bleh.py
@@ -4,52 +4,129 @@
 from comfy.samplers import KSAMPLER
 
 from .sampler import diffusehigh_sampler
+from .vae import VAEMode
 
 
 class DiffuseHighSamplerNode:
+    DESCRIPTION = "Jank DiffuseHigh sampler node, used for generating directly to resolutions higher than what the model was trained for. Can be connected to a SamplerCustom or other sampler node that supports a SAMPLER input."
+    OUTPUT_TOOLTIPS = (
+        "SAMPLER that can be connected to a SamplerCustom or other sampler node that supports a SAMPLER input.",
+    )
+    CATEGORY = "sampling/custom_sampling/JankDiffuseHigh"
     RETURN_TYPES = ("SAMPLER",)
     FUNCTION = "go"
 
     @classmethod
     def INPUT_TYPES(cls) -> dict:
         return {
             "required": {
-                "highres_sigmas": ("SIGMAS",),
-                "guidance_steps": ("INT", {"default": 5, "min": 0}),
+                "highres_sigmas": (
+                    "SIGMAS",
+                    {
+                        "tooltip": "Sigmas used for steps after upscaling. Generally should be around 0.3-0.5 denoise. NOTE: I do not recommend plugging in raw 1.0 denoise sigmas here.",
+                    },
+                ),
+                "guidance_steps": (
+                    "INT",
+                    {
+                        "default": 5,
+                        "min": 0,
+                        "tooltip": "Number of guidance steps after an upscale.",
+                    },
+                ),
                 "guidance_mode": (
                     (
                         "image",
                         "latent",
                     ),
+                    {
+                        "default": "image",
+                        "tooltip": "The original implementation uses image guidance. This requires a VAE encode/decode per guidance step. Alternatively, you can try using guidance via the latent instead which is much faster.",
+                    },
                 ),
                 "guidance_factor": (
                     "FLOAT",
                     {
                         "default": 1.0,
                         "min": 0.0,
                         "max": 1.0,
+                        "tooltip": "Mix factor used on guidance steps. 1.0 means use 100% DiffuseHigh guidance for those steps (like the original implementation).",
+                    },
+                ),
+                "fadeout_factor": (
+                    "FLOAT",
+                    {
+                        "default": 0.0,
+                        "tooltip": "Can be enabled to fade out guidance_factor. For example, if guidance_factor is 1 and guidance_steps is 4 then fadeout_factor would use these guidance_factors for the guidance steps: 1.00, 0.75, 0.50, 0.25",
+                    },
+                ),
+                "scale_factor": (
+                    "FLOAT",
+                    {
+                        "default": 2.0,
+                        "tooltip": "Upscale factor per iteration.",
+                    },
+                ),
+                "renoise_factor": (
+                    "FLOAT",
+                    {
+                        "default": 1.0,
+                        "tooltip": "Strength of noise added at the start of each iteration. The default of 1.0 (100%) is the normal amount, but you can increase this slightly to add more detail.",
+                    },
+                ),
+                "iterations": (
+                    "INT",
+                    {
+                        "default": 1,
+                        "min": 0,
+                        "tooltip": "Number of upscale iterations to run. Be careful, this can add up fast - if you start at 512x512 with a 2.0 scale factor then 3 iterations will get you to 4096x4096.",
                     },
                 ),
-                "fadeout_factor": ("FLOAT", {"default": 0.0}),
-                "scale_factor": ("FLOAT", {"default": 2.0}),
-                "renoise_factor": ("FLOAT", {"default": 1.0}),
-                "iterations": ("INT", {"default": 1, "min": 0}),
-                "sampler": ("SAMPLER",),
                 "vae_mode": (
-                    (
-                        "taesd",
-                        "normal",
-                        "tiled",
-                        "tiled_diffusion",
-                    ),
+                    tuple(vm.name.lower() for vm in VAEMode),
+                    {
+                        "default": "normal",
+                        "tooltip": "Mode used for encoding/decoding images. TAESD is fast/low VRAM but may reduce quality (you will also need the TAESD encoders installed). Normal will just use the normal VAE node, tiled with use the tiled VAE node. Alternatively, if you have ComfyUI-TiledDiffusion installed you can use tiled_diffusion here.",
+                    },
                 ),
             },
             "optional": {
-                "reference_image_opt": ("IMAGE",),
-                "guidance_sampler_opt": ("SAMPLER",),
-                "reference_sampler_opt": ("SAMPLER",),
-                "vae_opt": ("VAE",),
-                "upscale_model_opt": ("UPSCALE_MODEL",),
+                "sampler": (
+                    "SAMPLER",
+                    {
+                        "tooltip": "Default sampler used for steps. If not specified the sampler will default to non-ancestral Euler.",
+                    },
+                ),
+                "reference_image_opt": (
+                    "IMAGE",
+                    {
+                        "tooltip": "Optional: Image used for the initial pass. If not connected, a low-res initial reference will be generated using the schedule from the normal sigmas.",
+                    },
+                ),
+                "guidance_sampler_opt": (
+                    "SAMPLER",
+                    {
+                        "tooltip": "Optional: Sampler used for guidance steps. If not specified, will fallback to the base sampler. Note: The sampler is called on individual steps, samplers that keep history will not work well here.",
+                    },
+                ),
+                "reference_sampler_opt": (
+                    "SAMPLER",
+                    {
+                        "tooltip": "Optional: Sampler used to generate the initial low-resolution reference. Only used if reference_image_opt is not connected.",
+                    },
+                ),
+                "vae_opt": (
+                    "VAE",
+                    {
+                        "tooltip": "Optional when vae_mode is set to `taesd`, otherwise this is the VAE that will be used for encoding/decoding images.",
+                    },
+                ),
+                "upscale_model_opt": (
+                    "UPSCALE_MODEL",
+                    {
+                        "tooltip": "Optional: Model used for upscaling. When not attached, simple image scaling will be used. Regardless, the image will be scaled to match the size expected based on scale_factor. For example, if you use scale_factor 2 and a 4x upscale model, the image will get scaled down after the upscale model runs.",
+                    },
+                ),
                 "yaml_parameters": (
                     "STRING",
                     {