ComfyUI/comfy_extras/nodes_sd3.py

import folder_paths
import comfy.sd
import comfy.model_management
import nodes
import torch
import re
class TripleCLIPLoader:
    @classmethod
    def INPUT_TYPES(s):
        return {"required": { "clip_name1": (folder_paths.get_filename_list("text_encoders"), ), "clip_name2": (folder_paths.get_filename_list("text_encoders"), ), "clip_name3": (folder_paths.get_filename_list("text_encoders"), )
                             }}
    RETURN_TYPES = ("CLIP",)
    FUNCTION = "load_clip"

    CATEGORY = "advanced/loaders"

    DESCRIPTION = "[Recipes]\n\nsd3: clip-l, clip-g, t5"

    def load_clip(self, clip_name1, clip_name2, clip_name3):
        clip_path1 = folder_paths.get_full_path_or_raise("text_encoders", clip_name1)
        clip_path2 = folder_paths.get_full_path_or_raise("text_encoders", clip_name2)
        clip_path3 = folder_paths.get_full_path_or_raise("text_encoders", clip_name3)
        clip = comfy.sd.load_clip(ckpt_paths=[clip_path1, clip_path2, clip_path3], embedding_directory=folder_paths.get_folder_paths("embeddings"))
        return (clip,)

class EmptySD3LatentImage:
    def __init__(self):
        self.device = comfy.model_management.intermediate_device()

    @classmethod
    def INPUT_TYPES(s):
        return {"required": { "width": ("INT", {"default": 1024, "min": 16, "max": nodes.MAX_RESOLUTION, "step": 16}),
                              "height": ("INT", {"default": 1024, "min": 16, "max": nodes.MAX_RESOLUTION, "step": 16}),
                              "batch_size": ("INT", {"default": 1, "min": 1, "max": 4096})}}
    RETURN_TYPES = ("LATENT",)
    FUNCTION = "generate"

    CATEGORY = "latent/sd3"

    def generate(self, width, height, batch_size=1):
        latent = torch.zeros([batch_size, 16, height // 8, width // 8], device=self.device)
        return ({"samples":latent}, )

class CLIPTextEncodeSD3:
    @classmethod
    def INPUT_TYPES(s):
        return {"required": {
            "clip": ("CLIP", ),
            "clip_l": ("STRING", {"multiline": True, "dynamicPrompts": True}),
            "clip_g": ("STRING", {"multiline": True, "dynamicPrompts": True}),
            "t5xxl": ("STRING", {"multiline": True, "dynamicPrompts": True}),
            "empty_padding": (["none", "empty_prompt"], )
            }}
    RETURN_TYPES = ("CONDITIONING",)
    FUNCTION = "encode"

    CATEGORY = "advanced/conditioning"

    def encode(self, clip, clip_l, clip_g, t5xxl, empty_padding):
        no_padding = empty_padding == "none"

        tokens = clip.tokenize(clip_g)
        if len(clip_g) == 0 and no_padding:
            tokens["g"] = []

        if len(clip_l) == 0 and no_padding:
            tokens["l"] = []
        else:
            tokens["l"] = clip.tokenize(clip_l)["l"]

        if len(t5xxl) == 0 and no_padding:
            tokens["t5xxl"] =  []
        else:
            tokens["t5xxl"] = clip.tokenize(t5xxl)["t5xxl"]
        if len(tokens["l"]) != len(tokens["g"]):
            empty = clip.tokenize("")
            while len(tokens["l"]) < len(tokens["g"]):
                tokens["l"] += empty["l"]
            while len(tokens["l"]) > len(tokens["g"]):
                tokens["g"] += empty["g"]
        cond, pooled = clip.encode_from_tokens(tokens, return_pooled=True)
        return ([[cond, {"pooled_output": pooled}]], )


class ControlNetApplySD3(nodes.ControlNetApplyAdvanced):
    @classmethod
    def INPUT_TYPES(s):
        return {"required": {"positive": ("CONDITIONING", ),
                             "negative": ("CONDITIONING", ),
                             "control_net": ("CONTROL_NET", ),
                             "vae": ("VAE", ),
                             "image": ("IMAGE", ),
                             "strength": ("FLOAT", {"default": 1.0, "min": 0.0, "max": 10.0, "step": 0.01}),
                             "start_percent": ("FLOAT", {"default": 0.0, "min": 0.0, "max": 1.0, "step": 0.001}),
                             "end_percent": ("FLOAT", {"default": 1.0, "min": 0.0, "max": 1.0, "step": 0.001})
                             }}
    CATEGORY = "conditioning/controlnet"
    DEPRECATED = True

class SkipLayerGuidanceSD3:
    '''
    Enhance guidance towards detailed dtructure by having another set of CFG negative with skipped layers.
    Inspired by Perturbed Attention Guidance (https://arxiv.org/abs/2403.17377)
    Experimental implementation by Dango233@StabilityAI.
    '''
    @classmethod
    def INPUT_TYPES(s):
        return {"required": {"model": ("MODEL", ),
                             "layers": ("STRING", {"default": "7, 8, 9", "multiline": False}),
                             "scale": ("FLOAT", {"default": 3.0, "min": 0.0, "max": 10.0, "step": 0.1}),
                             "start_percent": ("FLOAT", {"default": 0.01, "min": 0.0, "max": 1.0, "step": 0.001}),
                             "end_percent": ("FLOAT", {"default": 0.15, "min": 0.0, "max": 1.0, "step": 0.001})
                                }}
    RETURN_TYPES = ("MODEL",)
    FUNCTION = "skip_guidance"

    CATEGORY = "advanced/guidance"


    def skip_guidance(self, model, layers, scale, start_percent, end_percent):
        if layers == "" or layers == None:
            return (model, )
        # check if layer is comma separated integers
        def skip(args, extra_args):
            return args

        model_sampling = model.get_model_object("model_sampling")
        sigma_start = model_sampling.percent_to_sigma(start_percent)
        sigma_end = model_sampling.percent_to_sigma(end_percent)

        def post_cfg_function(args):
            model = args["model"]
            cond_pred = args["cond_denoised"]
            cond = args["cond"]
            cfg_result = args["denoised"]
            sigma = args["sigma"]
            x = args["input"]
            model_options = args["model_options"].copy()
        
            for layer in layers:
                model_options = comfy.model_patcher.set_model_options_patch_replace(model_options, skip, "dit", "double_block", layer)
            model_sampling.percent_to_sigma(start_percent)

            sigma_ = sigma[0].item()
            if scale > 0 and sigma_ >= sigma_end and sigma_ <= sigma_start:
                (slg,) = comfy.samplers.calc_cond_batch(model, [cond], x, sigma, model_options)
                cfg_result = cfg_result + (cond_pred - slg) * scale
            return cfg_result

        layers = re.findall(r'\d+', layers)
        layers = [int(i) for i in layers]
        m = model.clone()
        m.set_model_sampler_post_cfg_function(post_cfg_function)

        return (m, )


NODE_CLASS_MAPPINGS = {
    "TripleCLIPLoader": TripleCLIPLoader,
    "EmptySD3LatentImage": EmptySD3LatentImage,
    "CLIPTextEncodeSD3": CLIPTextEncodeSD3,
    "ControlNetApplySD3": ControlNetApplySD3,
    "SkipLayerGuidanceSD3": SkipLayerGuidanceSD3,
}

NODE_DISPLAY_NAME_MAPPINGS = {
    # Sampling
    "ControlNetApplySD3": "Apply Controlnet with VAE",
}
SD3 Support. 2024-06-10 17:26:25 +00:00			`import folder_paths`
			`import comfy.sd`
			`import comfy.model_management`
			`import nodes`
			`import torch`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`import re`
SD3 Support. 2024-06-10 17:26:25 +00:00			`class TripleCLIPLoader:`
			`@classmethod`
			`def INPUT_TYPES(s):`
Update folder paths: "clip" -> "text_encoders" You can still use models/clip but the folder might get removed eventually on new installs of ComfyUI. 2024-11-02 19:35:38 +00:00			`return {"required": { "clip_name1": (folder_paths.get_filename_list("text_encoders"), ), "clip_name2": (folder_paths.get_filename_list("text_encoders"), ), "clip_name3": (folder_paths.get_filename_list("text_encoders"), )`
SD3 Support. 2024-06-10 17:26:25 +00:00			`}}`
			`RETURN_TYPES = ("CLIP",)`
			`FUNCTION = "load_clip"`

			`CATEGORY = "advanced/loaders"`

improve: add descriptions for clip loaders (#5576) 2024-11-11 10:37:23 +00:00			`DESCRIPTION = "[Recipes]\n\nsd3: clip-l, clip-g, t5"`

SD3 Support. 2024-06-10 17:26:25 +00:00			`def load_clip(self, clip_name1, clip_name2, clip_name3):`
Update folder paths: "clip" -> "text_encoders" You can still use models/clip but the folder might get removed eventually on new installs of ComfyUI. 2024-11-02 19:35:38 +00:00			`clip_path1 = folder_paths.get_full_path_or_raise("text_encoders", clip_name1)`
			`clip_path2 = folder_paths.get_full_path_or_raise("text_encoders", clip_name2)`
			`clip_path3 = folder_paths.get_full_path_or_raise("text_encoders", clip_name3)`
SD3 Support. 2024-06-10 17:26:25 +00:00			`clip = comfy.sd.load_clip(ckpt_paths=[clip_path1, clip_path2, clip_path3], embedding_directory=folder_paths.get_folder_paths("embeddings"))`
			`return (clip,)`

			`class EmptySD3LatentImage:`
			`def __init__(self):`
			`self.device = comfy.model_management.intermediate_device()`

			`@classmethod`
			`def INPUT_TYPES(s):`
Set the step in EmptySD3LatentImage to 16. These models work better when the res is a multiple of 16. 2024-08-04 19:59:02 +00:00			`return {"required": { "width": ("INT", {"default": 1024, "min": 16, "max": nodes.MAX_RESOLUTION, "step": 16}),`
			`"height": ("INT", {"default": 1024, "min": 16, "max": nodes.MAX_RESOLUTION, "step": 16}),`
SD3 Support. 2024-06-10 17:26:25 +00:00			`"batch_size": ("INT", {"default": 1, "min": 1, "max": 4096})}}`
			`RETURN_TYPES = ("LATENT",)`
			`FUNCTION = "generate"`

			`CATEGORY = "latent/sd3"`

			`def generate(self, width, height, batch_size=1):`
Make SD3 empty latent image zeros. This shouldn't change anything. The reason it was not zeros is because it did matter in early versions of the code. 2024-09-21 13:12:31 +00:00			`latent = torch.zeros([batch_size, 16, height // 8, width // 8], device=self.device)`
SD3 Support. 2024-06-10 17:26:25 +00:00			`return ({"samples":latent}, )`

			`class CLIPTextEncodeSD3:`
			`@classmethod`
			`def INPUT_TYPES(s):`
			`return {"required": {`
			`"clip": ("CLIP", ),`
			`"clip_l": ("STRING", {"multiline": True, "dynamicPrompts": True}),`
			`"clip_g": ("STRING", {"multiline": True, "dynamicPrompts": True}),`
			`"t5xxl": ("STRING", {"multiline": True, "dynamicPrompts": True}),`
			`"empty_padding": (["none", "empty_prompt"], )`
			`}}`
			`RETURN_TYPES = ("CONDITIONING",)`
			`FUNCTION = "encode"`

			`CATEGORY = "advanced/conditioning"`

			`def encode(self, clip, clip_l, clip_g, t5xxl, empty_padding):`
			`no_padding = empty_padding == "none"`

			`tokens = clip.tokenize(clip_g)`
			`if len(clip_g) == 0 and no_padding:`
			`tokens["g"] = []`

			`if len(clip_l) == 0 and no_padding:`
			`tokens["l"] = []`
			`else:`
			`tokens["l"] = clip.tokenize(clip_l)["l"]`

			`if len(t5xxl) == 0 and no_padding:`
			`tokens["t5xxl"] = []`
			`else:`
			`tokens["t5xxl"] = clip.tokenize(t5xxl)["t5xxl"]`
			`if len(tokens["l"]) != len(tokens["g"]):`
			`empty = clip.tokenize("")`
			`while len(tokens["l"]) < len(tokens["g"]):`
			`tokens["l"] += empty["l"]`
			`while len(tokens["l"]) > len(tokens["g"]):`
			`tokens["g"] += empty["g"]`
			`cond, pooled = clip.encode_from_tokens(tokens, return_pooled=True)`
			`return ([[cond, {"pooled_output": pooled}]], )`


ControlNetApplySD3 node can now be used to use SD3 controlnets. 2024-06-26 20:14:47 +00:00			`class ControlNetApplySD3(nodes.ControlNetApplyAdvanced):`
			`@classmethod`
			`def INPUT_TYPES(s):`
			`return {"required": {"positive": ("CONDITIONING", ),`
			`"negative": ("CONDITIONING", ),`
			`"control_net": ("CONTROL_NET", ),`
			`"vae": ("VAE", ),`
			`"image": ("IMAGE", ),`
			`"strength": ("FLOAT", {"default": 1.0, "min": 0.0, "max": 10.0, "step": 0.01}),`
			`"start_percent": ("FLOAT", {"default": 0.0, "min": 0.0, "max": 1.0, "step": 0.001}),`
			`"end_percent": ("FLOAT", {"default": 1.0, "min": 0.0, "max": 1.0, "step": 0.001})`
			`}}`
Move controlnet nodes to conditioning/controlnet. 2024-07-16 21:08:25 +00:00			`CATEGORY = "conditioning/controlnet"`
Add an optional VAE input to the ControlNetApplyAdvanced node. Deprecate the other controlnet nodes. 2024-09-22 05:24:52 +00:00			`DEPRECATED = True`
ControlNetApplySD3 node can now be used to use SD3 controlnets. 2024-06-26 20:14:47 +00:00
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`class SkipLayerGuidanceSD3:`
			`'''`
			`Enhance guidance towards detailed dtructure by having another set of CFG negative with skipped layers.`
			`Inspired by Perturbed Attention Guidance (https://arxiv.org/abs/2403.17377)`
			`Experimental implementation by Dango233@StabilityAI.`
			`'''`
			`@classmethod`
			`def INPUT_TYPES(s):`
			`return {"required": {"model": ("MODEL", ),`
Cleanup SkipLayerGuidanceSD3 node. 2024-10-29 14:11:46 +00:00			`"layers": ("STRING", {"default": "7, 8, 9", "multiline": False}),`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`"scale": ("FLOAT", {"default": 3.0, "min": 0.0, "max": 10.0, "step": 0.1}),`
			`"start_percent": ("FLOAT", {"default": 0.01, "min": 0.0, "max": 1.0, "step": 0.001}),`
			`"end_percent": ("FLOAT", {"default": 0.15, "min": 0.0, "max": 1.0, "step": 0.001})`
			`}}`
			`RETURN_TYPES = ("MODEL",)`
			`FUNCTION = "skip_guidance"`

			`CATEGORY = "advanced/guidance"`


			`def skip_guidance(self, model, layers, scale, start_percent, end_percent):`
			`if layers == "" or layers == None:`
			`return (model, )`
			`# check if layer is comma separated integers`
			`def skip(args, extra_args):`
			`return args`

			`model_sampling = model.get_model_object("model_sampling")`
Cleanup SkipLayerGuidanceSD3 node. 2024-10-29 14:11:46 +00:00			`sigma_start = model_sampling.percent_to_sigma(start_percent)`
			`sigma_end = model_sampling.percent_to_sigma(end_percent)`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00
			`def post_cfg_function(args):`
			`model = args["model"]`
			`cond_pred = args["cond_denoised"]`
			`cond = args["cond"]`
			`cfg_result = args["denoised"]`
			`sigma = args["sigma"]`
			`x = args["input"]`
			`model_options = args["model_options"].copy()`

			`for layer in layers:`
			`model_options = comfy.model_patcher.set_model_options_patch_replace(model_options, skip, "dit", "double_block", layer)`
			`model_sampling.percent_to_sigma(start_percent)`
Cleanup SkipLayerGuidanceSD3 node. 2024-10-29 14:11:46 +00:00
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`sigma_ = sigma[0].item()`
Cleanup SkipLayerGuidanceSD3 node. 2024-10-29 14:11:46 +00:00			`if scale > 0 and sigma_ >= sigma_end and sigma_ <= sigma_start:`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`(slg,) = comfy.samplers.calc_cond_batch(model, [cond], x, sigma, model_options)`
			`cfg_result = cfg_result + (cond_pred - slg) * scale`
			`return cfg_result`

			`layers = re.findall(r'\d+', layers)`
			`layers = [int(i) for i in layers]`
			`m = model.clone()`
			`m.set_model_sampler_post_cfg_function(post_cfg_function)`

			`return (m, )`


SD3 Support. 2024-06-10 17:26:25 +00:00			`NODE_CLASS_MAPPINGS = {`
			`"TripleCLIPLoader": TripleCLIPLoader,`
			`"EmptySD3LatentImage": EmptySD3LatentImage,`
			`"CLIPTextEncodeSD3": CLIPTextEncodeSD3,`
ControlNetApplySD3 node can now be used to use SD3 controlnets. 2024-06-26 20:14:47 +00:00			`"ControlNetApplySD3": ControlNetApplySD3,`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`"SkipLayerGuidanceSD3": SkipLayerGuidanceSD3,`
SD3 Support. 2024-06-10 17:26:25 +00:00			`}`
Cleanup HunyuanDit controlnets. Use the: ControlNetApply SD3 and HunyuanDiT node. 2024-08-09 06:35:19 +00:00
			`NODE_DISPLAY_NAME_MAPPINGS = {`
			`# Sampling`
Add an optional VAE input to the ControlNetApplyAdvanced node. Deprecate the other controlnet nodes. 2024-09-22 05:24:52 +00:00			`"ControlNetApplySD3": "Apply Controlnet with VAE",`
Cleanup HunyuanDit controlnets. Use the: ControlNetApply SD3 and HunyuanDiT node. 2024-08-09 06:35:19 +00:00			`}`