ComfyUI/comfy_extras/nodes_sd3.py

import folder_paths
import comfy.sd
import comfy.model_management
import nodes
import torch
import comfy_extras.nodes_slg


class TripleCLIPLoader:
    """Node that loads three text-encoder checkpoints as a single CLIP object.

    All three files are selected from the "text_encoders" model folder and are
    passed together, in slot order, to ``comfy.sd.load_clip``.
    """

    RETURN_TYPES = ("CLIP",)
    FUNCTION = "load_clip"

    CATEGORY = "advanced/loaders"

    DESCRIPTION = "[Recipes]\n\nsd3: clip-l, clip-g, t5"

    @classmethod
    def INPUT_TYPES(s):
        # Every slot offers the filenames reported for the "text_encoders" folder.
        # The list is queried once per slot, so each slot gets its own result.
        slot_names = ("clip_name1", "clip_name2", "clip_name3")
        required = {
            slot: (folder_paths.get_filename_list("text_encoders"), )
            for slot in slot_names
        }
        return {"required": required}

    def load_clip(self, clip_name1, clip_name2, clip_name3):
        """Resolve the three filenames to full paths and load them as one CLIP.

        Returns a 1-tuple holding whatever ``comfy.sd.load_clip`` returns.
        Path resolution goes through ``folder_paths.get_full_path_or_raise``.
        """
        ckpt_paths = [
            folder_paths.get_full_path_or_raise("text_encoders", filename)
            for filename in (clip_name1, clip_name2, clip_name3)
        ]
        embedding_dirs = folder_paths.get_folder_paths("embeddings")
        loaded = comfy.sd.load_clip(ckpt_paths=ckpt_paths, embedding_directory=embedding_dirs)
        return (loaded,)


class EmptySD3LatentImage:
    """Node that creates an all-zero latent batch with 16 channels.

    The latent's spatial size is the requested pixel size integer-divided by 8.
    """

    RETURN_TYPES = ("LATENT",)
    FUNCTION = "generate"

    CATEGORY = "latent/sd3"

    def __init__(self):
        # Device on which generate() allocates the latent tensor.
        self.device = comfy.model_management.intermediate_device()

    @classmethod
    def INPUT_TYPES(s):
        def _dimension_spec():
            # width and height share the same limits and a step of 16.
            return ("INT", {"default": 1024, "min": 16, "max": nodes.MAX_RESOLUTION, "step": 16})

        required = {
            "width": _dimension_spec(),
            "height": _dimension_spec(),
            "batch_size": ("INT", {"default": 1, "min": 1, "max": 4096}),
        }
        return {"required": required}

    def generate(self, width, height, batch_size=1):
        """Return ``({"samples": zeros},)`` shaped [batch_size, 16, height // 8, width // 8]."""
        latent_shape = [batch_size, 16, height // 8, width // 8]
        samples = torch.zeros(latent_shape, device=self.device)
        return ({"samples": samples}, )


class CLIPTextEncodeSD3:
    """Node that encodes separate clip_l / clip_g / t5xxl prompts into one conditioning.

    With ``empty_padding == "none"`` an empty prompt contributes an empty token
    list instead of the tokenization of "". The "l" and "g" token lists are
    then padded with empty-prompt tokens until they have the same length.
    """

    RETURN_TYPES = ("CONDITIONING",)
    FUNCTION = "encode"

    CATEGORY = "advanced/conditioning"

    @classmethod
    def INPUT_TYPES(s):
        def _prompt_spec():
            # All three prompt inputs use the same STRING options.
            return ("STRING", {"multiline": True, "dynamicPrompts": True})

        required = {
            "clip": ("CLIP", ),
            "clip_l": _prompt_spec(),
            "clip_g": _prompt_spec(),
            "t5xxl": _prompt_spec(),
            "empty_padding": (["none", "empty_prompt"], ),
        }
        return {"required": required}

    def encode(self, clip, clip_l, clip_g, t5xxl, empty_padding):
        """Tokenize the three prompts, balance "l" against "g", and encode.

        Returns a 1-tuple containing ``[[cond, {"pooled_output": pooled}]]``,
        where ``cond`` and ``pooled`` come from ``clip.encode_from_tokens``.
        """
        skip_empty = empty_padding == "none"

        # The clip_g tokenization is the base dict; its "l" and "t5xxl"
        # entries are always overwritten below.
        tokens = clip.tokenize(clip_g)
        if len(clip_g) == 0 and skip_empty:
            tokens["g"] = []

        for key, prompt in (("l", clip_l), ("t5xxl", t5xxl)):
            if len(prompt) == 0 and skip_empty:
                tokens[key] = []
            else:
                tokens[key] = clip.tokenize(prompt)[key]

        if len(tokens["l"]) != len(tokens["g"]):
            # Grow whichever of "l" / "g" is shorter using empty-prompt tokens.
            blank = clip.tokenize("")
            while len(tokens["l"]) < len(tokens["g"]):
                tokens["l"] += blank["l"]
            while len(tokens["l"]) > len(tokens["g"]):
                tokens["g"] += blank["g"]

        cond, pooled = clip.encode_from_tokens(tokens, return_pooled=True)
        conditioning = [[cond, {"pooled_output": pooled}]]
        return (conditioning, )


class ControlNetApplySD3(nodes.ControlNetApplyAdvanced):
    """Deprecated ControlNet node whose input schema lists the VAE as required.

    Only the input declaration, category and deprecation flag are defined
    here; everything else comes from ``nodes.ControlNetApplyAdvanced``.
    """

    CATEGORY = "conditioning/controlnet"
    DEPRECATED = True

    @classmethod
    def INPUT_TYPES(s):
        def _percent_spec(default):
            # start_percent and end_percent differ only in their default.
            return ("FLOAT", {"default": default, "min": 0.0, "max": 1.0, "step": 0.001})

        required = {
            "positive": ("CONDITIONING", ),
            "negative": ("CONDITIONING", ),
            "control_net": ("CONTROL_NET", ),
            "vae": ("VAE", ),
            "image": ("IMAGE", ),
            "strength": ("FLOAT", {"default": 1.0, "min": 0.0, "max": 10.0, "step": 0.01}),
            "start_percent": _percent_spec(0.0),
            "end_percent": _percent_spec(1.0),
        }
        return {"required": required}


class SkipLayerGuidanceSD3(comfy_extras.nodes_slg.SkipLayerGuidanceDiT):
    '''
    Enhance guidance towards detailed structure by having another set of CFG negative with skipped layers.
    Inspired by Perturbed Attention Guidance (https://arxiv.org/abs/2403.17377)
    Experimental implementation by Dango233@StabilityAI.

    This node exposes a single "layers" string and forwards it to
    skip_guidance() as the double_layers argument.
    '''

    RETURN_TYPES = ("MODEL",)
    FUNCTION = "skip_guidance_sd3"

    CATEGORY = "advanced/guidance"

    @classmethod
    def INPUT_TYPES(s):
        def _percent_spec(default):
            # start_percent and end_percent differ only in their default.
            return ("FLOAT", {"default": default, "min": 0.0, "max": 1.0, "step": 0.001})

        required = {
            "model": ("MODEL", ),
            "layers": ("STRING", {"default": "7, 8, 9", "multiline": False}),
            "scale": ("FLOAT", {"default": 3.0, "min": 0.0, "max": 10.0, "step": 0.1}),
            "start_percent": _percent_spec(0.01),
            "end_percent": _percent_spec(0.15),
        }
        return {"required": required}

    def skip_guidance_sd3(self, model, layers, scale, start_percent, end_percent):
        """Delegate to skip_guidance(), passing ``layers`` as ``double_layers``.

        skip_guidance() is not defined in this class; it is expected to be
        provided by the SkipLayerGuidanceDiT base class.
        """
        forwarded = {
            "model": model,
            "scale": scale,
            "start_percent": start_percent,
            "end_percent": end_percent,
            "double_layers": layers,
        }
        return self.skip_guidance(**forwarded)


# Registry of the node classes defined in this module, keyed by node name.
# Every key here is identical to the name of the class it maps to.
NODE_CLASS_MAPPINGS = {
    "TripleCLIPLoader": TripleCLIPLoader,
    "EmptySD3LatentImage": EmptySD3LatentImage,
    "CLIPTextEncodeSD3": CLIPTextEncodeSD3,
    "ControlNetApplySD3": ControlNetApplySD3,
    "SkipLayerGuidanceSD3": SkipLayerGuidanceSD3,
}

# Human-readable names for nodes, keyed by the same node names used in
# NODE_CLASS_MAPPINGS. Only ControlNetApplySD3 has an entry here.
NODE_DISPLAY_NAME_MAPPINGS = {
    # Conditioning / ControlNet (ControlNetApplySD3.CATEGORY is "conditioning/controlnet")
    "ControlNetApplySD3": "Apply Controlnet with VAE",
}
SD3 Support. 2024-06-10 17:26:25 +00:00			`import folder_paths`
			`import comfy.sd`
			`import comfy.model_management`
			`import nodes`
			`import torch`
Add a skip layer guidance node that can also skip single layers. This one should work for skipping the single layers of models like Flux and Auraflow. If you want to see how these models work and how many double/single layers they have see the "ModelMerge*" nodes for the specific model. 2024-11-18 07:20:43 +00:00			`import comfy_extras.nodes_slg`


SD3 Support. 2024-06-10 17:26:25 +00:00			`class TripleCLIPLoader:`
			`@classmethod`
			`def INPUT_TYPES(s):`
Update folder paths: "clip" -> "text_encoders" You can still use models/clip but the folder might get removed eventually on new installs of ComfyUI. 2024-11-02 19:35:38 +00:00			`return {"required": { "clip_name1": (folder_paths.get_filename_list("text_encoders"), ), "clip_name2": (folder_paths.get_filename_list("text_encoders"), ), "clip_name3": (folder_paths.get_filename_list("text_encoders"), )`
SD3 Support. 2024-06-10 17:26:25 +00:00			`}}`
			`RETURN_TYPES = ("CLIP",)`
			`FUNCTION = "load_clip"`

			`CATEGORY = "advanced/loaders"`

improve: add descriptions for clip loaders (#5576) 2024-11-11 10:37:23 +00:00			`DESCRIPTION = "[Recipes]\n\nsd3: clip-l, clip-g, t5"`

SD3 Support. 2024-06-10 17:26:25 +00:00			`def load_clip(self, clip_name1, clip_name2, clip_name3):`
Update folder paths: "clip" -> "text_encoders" You can still use models/clip but the folder might get removed eventually on new installs of ComfyUI. 2024-11-02 19:35:38 +00:00			`clip_path1 = folder_paths.get_full_path_or_raise("text_encoders", clip_name1)`
			`clip_path2 = folder_paths.get_full_path_or_raise("text_encoders", clip_name2)`
			`clip_path3 = folder_paths.get_full_path_or_raise("text_encoders", clip_name3)`
SD3 Support. 2024-06-10 17:26:25 +00:00			`clip = comfy.sd.load_clip(ckpt_paths=[clip_path1, clip_path2, clip_path3], embedding_directory=folder_paths.get_folder_paths("embeddings"))`
			`return (clip,)`

Add a skip layer guidance node that can also skip single layers. This one should work for skipping the single layers of models like Flux and Auraflow. If you want to see how these models work and how many double/single layers they have see the "ModelMerge*" nodes for the specific model. 2024-11-18 07:20:43 +00:00
SD3 Support. 2024-06-10 17:26:25 +00:00			`class EmptySD3LatentImage:`
			`def __init__(self):`
			`self.device = comfy.model_management.intermediate_device()`

			`@classmethod`
			`def INPUT_TYPES(s):`
Set the step in EmptySD3LatentImage to 16. These models work better when the res is a multiple of 16. 2024-08-04 19:59:02 +00:00			`return {"required": { "width": ("INT", {"default": 1024, "min": 16, "max": nodes.MAX_RESOLUTION, "step": 16}),`
			`"height": ("INT", {"default": 1024, "min": 16, "max": nodes.MAX_RESOLUTION, "step": 16}),`
SD3 Support. 2024-06-10 17:26:25 +00:00			`"batch_size": ("INT", {"default": 1, "min": 1, "max": 4096})}}`
			`RETURN_TYPES = ("LATENT",)`
			`FUNCTION = "generate"`

			`CATEGORY = "latent/sd3"`

			`def generate(self, width, height, batch_size=1):`
Make SD3 empty latent image zeros. This shouldn't change anything. The reason it was not zeros is because it did matter in early versions of the code. 2024-09-21 13:12:31 +00:00			`latent = torch.zeros([batch_size, 16, height // 8, width // 8], device=self.device)`
SD3 Support. 2024-06-10 17:26:25 +00:00			`return ({"samples":latent}, )`

Add a skip layer guidance node that can also skip single layers. This one should work for skipping the single layers of models like Flux and Auraflow. If you want to see how these models work and how many double/single layers they have see the "ModelMerge*" nodes for the specific model. 2024-11-18 07:20:43 +00:00
SD3 Support. 2024-06-10 17:26:25 +00:00			`class CLIPTextEncodeSD3:`
			`@classmethod`
			`def INPUT_TYPES(s):`
			`return {"required": {`
			`"clip": ("CLIP", ),`
			`"clip_l": ("STRING", {"multiline": True, "dynamicPrompts": True}),`
			`"clip_g": ("STRING", {"multiline": True, "dynamicPrompts": True}),`
			`"t5xxl": ("STRING", {"multiline": True, "dynamicPrompts": True}),`
			`"empty_padding": (["none", "empty_prompt"], )`
			`}}`
			`RETURN_TYPES = ("CONDITIONING",)`
			`FUNCTION = "encode"`

			`CATEGORY = "advanced/conditioning"`

			`def encode(self, clip, clip_l, clip_g, t5xxl, empty_padding):`
			`no_padding = empty_padding == "none"`

			`tokens = clip.tokenize(clip_g)`
			`if len(clip_g) == 0 and no_padding:`
			`tokens["g"] = []`

			`if len(clip_l) == 0 and no_padding:`
			`tokens["l"] = []`
			`else:`
			`tokens["l"] = clip.tokenize(clip_l)["l"]`

			`if len(t5xxl) == 0 and no_padding:`
			`tokens["t5xxl"] = []`
			`else:`
			`tokens["t5xxl"] = clip.tokenize(t5xxl)["t5xxl"]`
			`if len(tokens["l"]) != len(tokens["g"]):`
			`empty = clip.tokenize("")`
			`while len(tokens["l"]) < len(tokens["g"]):`
			`tokens["l"] += empty["l"]`
			`while len(tokens["l"]) > len(tokens["g"]):`
			`tokens["g"] += empty["g"]`
			`cond, pooled = clip.encode_from_tokens(tokens, return_pooled=True)`
			`return ([[cond, {"pooled_output": pooled}]], )`


ControlNetApplySD3 node can now be used to use SD3 controlnets. 2024-06-26 20:14:47 +00:00			`class ControlNetApplySD3(nodes.ControlNetApplyAdvanced):`
			`@classmethod`
			`def INPUT_TYPES(s):`
			`return {"required": {"positive": ("CONDITIONING", ),`
			`"negative": ("CONDITIONING", ),`
			`"control_net": ("CONTROL_NET", ),`
			`"vae": ("VAE", ),`
			`"image": ("IMAGE", ),`
			`"strength": ("FLOAT", {"default": 1.0, "min": 0.0, "max": 10.0, "step": 0.01}),`
			`"start_percent": ("FLOAT", {"default": 0.0, "min": 0.0, "max": 1.0, "step": 0.001}),`
			`"end_percent": ("FLOAT", {"default": 1.0, "min": 0.0, "max": 1.0, "step": 0.001})`
			`}}`
Move controlnet nodes to conditioning/controlnet. 2024-07-16 21:08:25 +00:00			`CATEGORY = "conditioning/controlnet"`
Add an optional VAE input to the ControlNetApplyAdvanced node. Deprecate the other controlnet nodes. 2024-09-22 05:24:52 +00:00			`DEPRECATED = True`
ControlNetApplySD3 node can now be used to use SD3 controlnets. 2024-06-26 20:14:47 +00:00
Add a skip layer guidance node that can also skip single layers. This one should work for skipping the single layers of models like Flux and Auraflow. If you want to see how these models work and how many double/single layers they have see the "ModelMerge*" nodes for the specific model. 2024-11-18 07:20:43 +00:00
			`class SkipLayerGuidanceSD3(comfy_extras.nodes_slg.SkipLayerGuidanceDiT):`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`'''`
			`Enhance guidance towards detailed dtructure by having another set of CFG negative with skipped layers.`
			`Inspired by Perturbed Attention Guidance (https://arxiv.org/abs/2403.17377)`
			`Experimental implementation by Dango233@StabilityAI.`
			`'''`
			`@classmethod`
			`def INPUT_TYPES(s):`
			`return {"required": {"model": ("MODEL", ),`
Cleanup SkipLayerGuidanceSD3 node. 2024-10-29 14:11:46 +00:00			`"layers": ("STRING", {"default": "7, 8, 9", "multiline": False}),`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`"scale": ("FLOAT", {"default": 3.0, "min": 0.0, "max": 10.0, "step": 0.1}),`
			`"start_percent": ("FLOAT", {"default": 0.01, "min": 0.0, "max": 1.0, "step": 0.001}),`
			`"end_percent": ("FLOAT", {"default": 0.15, "min": 0.0, "max": 1.0, "step": 0.001})`
			`}}`
			`RETURN_TYPES = ("MODEL",)`
Add a skip layer guidance node that can also skip single layers. This one should work for skipping the single layers of models like Flux and Auraflow. If you want to see how these models work and how many double/single layers they have see the "ModelMerge*" nodes for the specific model. 2024-11-18 07:20:43 +00:00			`FUNCTION = "skip_guidance_sd3"`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00
			`CATEGORY = "advanced/guidance"`

Add a skip layer guidance node that can also skip single layers. This one should work for skipping the single layers of models like Flux and Auraflow. If you want to see how these models work and how many double/single layers they have see the "ModelMerge*" nodes for the specific model. 2024-11-18 07:20:43 +00:00			`def skip_guidance_sd3(self, model, layers, scale, start_percent, end_percent):`
			`return self.skip_guidance(model=model, scale=scale, start_percent=start_percent, end_percent=end_percent, double_layers=layers)`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00

SD3 Support. 2024-06-10 17:26:25 +00:00			`NODE_CLASS_MAPPINGS = {`
			`"TripleCLIPLoader": TripleCLIPLoader,`
			`"EmptySD3LatentImage": EmptySD3LatentImage,`
			`"CLIPTextEncodeSD3": CLIPTextEncodeSD3,`
ControlNetApplySD3 node can now be used to use SD3 controlnets. 2024-06-26 20:14:47 +00:00			`"ControlNetApplySD3": ControlNetApplySD3,`
SLG first implementation for SD3.5 (#5404) * SLG first implementation for SD3.5 * * Simplify and align with comfy style 2024-10-29 13:59:21 +00:00			`"SkipLayerGuidanceSD3": SkipLayerGuidanceSD3,`
SD3 Support. 2024-06-10 17:26:25 +00:00			`}`
Cleanup HunyuanDit controlnets. Use the: ControlNetApply SD3 and HunyuanDiT node. 2024-08-09 06:35:19 +00:00
			`NODE_DISPLAY_NAME_MAPPINGS = {`
			`# Sampling`
Add an optional VAE input to the ControlNetApplyAdvanced node. Deprecate the other controlnet nodes. 2024-09-22 05:24:52 +00:00			`"ControlNetApplySD3": "Apply Controlnet with VAE",`
Cleanup HunyuanDit controlnets. Use the: ControlNetApply SD3 and HunyuanDiT node. 2024-08-09 06:35:19 +00:00			`}`