Update categories and add new blueprints

This commit is contained in:
ComfyUI Wiki 2026-05-25 18:01:48 +08:00
parent 1c8d4ca092
commit 577c56bb6b
24 changed files with 2370 additions and 32 deletions

View File

@ -1553,7 +1553,7 @@
"VHS_MetadataImage": true,
"VHS_KeepIntermediate": true
},
"category": "Image generation and editing/Canny to image",
"category": "Image generation and editing/Conditioned",
"description": "Generates an image from a Canny edge map using Z-Image-Turbo, with text conditioning."
}
]

View File

@ -3600,7 +3600,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Video generation and editing/Canny to video",
"category": "Video generation and editing/Conditioned",
"description": "Generates video from Canny edge maps using LTX-2, with optional synchronized audio."
}
]

View File

@ -1401,7 +1401,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Image generation and editing/ControlNet",
"category": "Image generation and editing/Conditioned",
"description": "Generates images from a text prompt and ControlNet conditioning (e.g. depth, canny) using Z-Image-Turbo."
}
]

View File

@ -1579,7 +1579,7 @@
"VHS_MetadataImage": true,
"VHS_KeepIntermediate": true
},
"category": "Image generation and editing/Depth to image",
"category": "Image generation and editing/Conditioned",
"description": "Generates an image from a depth map using Z-Image-Turbo with text conditioning."
},
{

View File

@ -4233,7 +4233,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Video generation and editing/Depth to video",
"category": "Video generation and editing/Conditioned",
"description": "Generates depth-controlled video with LTX-2: motion and structure follow a depth-reference video alongside text prompting, optional first-frame image conditioning, with optional synchronized audio."
},
{
@ -5194,8 +5194,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"description": "Estimates a monocular depth map from an input image using the Lotus depth estimation model.",
"category": "Video generation and editing/Depth to video"
"description": "Estimates a monocular depth map from an input image using the Lotus depth estimation model."
}
]
},

View File

@ -3350,7 +3350,7 @@
}
],
"extra": {},
"category": "Video generation and editing/First-Last-Frame to Video",
"category": "Video generation and editing/Conditioned",
"description": "Generates a video interpolating between first and last keyframes using LTX-2.3."
}
]

View File

@ -3350,7 +3350,7 @@
}
],
"extra": {},
"category": "Video generation and editing/First-Last-Frame to Video",
"category": "Video generation and editing/FLF2V",
"description": "Generates a video that interpolates between the first and last keyframes using LTX-2.3, including optional audio."
}
]

View File

@ -1256,6 +1256,8 @@
"type": "BOOLEAN"
}
],
"category": "3D/Geometry Estimation",
"description": "Estimates 3D scene geometry from an input image using MoGe, outputting a mesh plus OpenGL and DirectX normal maps.",
"extra": {}
}
]

View File

@ -310,9 +310,9 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Text generation/Image Captioning",
"category": "Image Tools",
"description": "Generates descriptive captions for images using Google's Gemini multimodal LLM."
}
]
}
}
}

View File

@ -15,7 +15,7 @@
330
],
"flags": {},
"order": 3,
"order": 0,
"mode": 0,
"inputs": [
{
@ -80,6 +80,7 @@
"links": []
}
],
"title": "Image Depth Estimation (MoGe)",
"properties": {
"proxyWidgets": [
[
@ -109,8 +110,7 @@
"secondTabOffset": 80,
"secondTabWidth": 65
},
"widgets_values": [],
"title": "Depth Estimation (MoGe)"
"widgets_values": []
}
],
"links": [],
@ -128,7 +128,8 @@
},
"revision": 0,
"config": {},
"name": "Depth Estimation (MoGe)",
"name": "Image Depth Estimation (MoGe)",
"description": "Estimates monocular depth from an input image using MoGe, outputting both raw and colorized depth maps plus a mask.",
"inputNode": {
"id": -10,
"bounding": [

View File

@ -15,7 +15,7 @@
400
],
"flags": {},
"order": 3,
"order": 0,
"mode": 0,
"inputs": [
{
@ -119,6 +119,7 @@
"links": []
}
],
"title": "Image Face Detection (Mediapipe)",
"properties": {
"proxyWidgets": [
[
@ -164,8 +165,7 @@
"secondTabOffset": 80,
"secondTabWidth": 65
},
"widgets_values": [],
"title": "Face Detection (Mediapipe)"
"widgets_values": []
}
],
"links": [],
@ -183,7 +183,8 @@
},
"revision": 0,
"config": {},
"name": "Face Detection (Mediapipe)",
"name": "Image Face Detection (Mediapipe)",
"description": "Detects facial landmarks from an image using MediaPipe, outputting landmark data, face bounding boxes, and an optional face-region mask.",
"inputNode": {
"id": -10,
"bounding": [
@ -769,7 +770,8 @@
"type": "COMBO"
}
],
"extra": {}
"extra": {},
"category": "Conditioning & Preprocessors/Face Detection"
}
]
},

View File

@ -703,7 +703,7 @@
}
],
"extra": {},
"category": "Image Tools/Image Segmentation",
"category": "Conditioning & Preprocessors/Segmentation & Mask",
"description": "Segments images into masks using Meta SAM3 from text prompts, points, or boxes."
}
]

View File

@ -948,7 +948,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Image Tools/Preprocessors",
"category": "Conditioning & Preprocessors/Depth",
"description": "Estimates a monocular depth map from an input image using the Lotus depth estimation model."
}
]

View File

@ -1197,7 +1197,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Image Tools/Preprocessors",
"category": "Conditioning & Preprocessors/Pose",
"description": "Detects multiple people in an image and outputs per-person pose keypoints, skeleton renders, and bounding boxes using SDPose."
}
]

View File

@ -877,7 +877,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Image Tools/Preprocessors",
"category": "Conditioning & Preprocessors/Pose",
"description": "Extracts human pose keypoints and stick-figure visuals from an image using SDPose-OOD, with optional bounding-box input per subject."
}
]

View File

@ -1298,7 +1298,7 @@
"VHS_MetadataImage": true,
"VHS_KeepIntermediate": true
},
"category": "Image generation and editing/Pose to image",
"category": "Image generation and editing/Conditioned",
"description": "Generates an image from pose keypoints using Z-Image-Turbo with text conditioning."
}
]

View File

@ -3870,7 +3870,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Video generation and editing/Pose to video",
"category": "Video generation and editing/Conditioned",
"description": "Generates video from pose reference frames using LTX-2, with optional synchronized audio."
}
]

View File

@ -270,7 +270,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Text generation/Prompt enhance",
"category": "Text Tools",
"description": "Expands short text prompts into detailed descriptions using a text generation model for better generation quality."
}
]

View File

@ -307,9 +307,9 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Text generation/Video Captioning",
"category": "Video Tools",
"description": "Generates descriptive captions for video input using Google's Gemini multimodal LLM."
}
]
}
}
}

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@ -3768,7 +3768,7 @@
}
],
"extra": {},
"category": "Video Tools",
"category": "Video generation and editing/Inpaint video",
"description": "Removes objects from video by inpainting masked regions using VOID (CogVideoX), with SAM3 text-guided segmentation and optional two-pass optical-flow refinement."
},
{

View File

@ -818,7 +818,7 @@
}
],
"extra": {},
"category": "Video Tools",
"category": "Conditioning & Preprocessors/Segmentation & Mask",
"description": "Segments video into temporally consistent masks using Meta SAM3 from text or interactive prompts."
}
]

View File

@ -1314,7 +1314,7 @@
"extra": {
"workflowRendererVersion": "LG"
},
"category": "Video Tools",
"category": "Conditioning & Preprocessors/Pose",
"description": "Extracts multi-person pose keypoints and skeleton frame sequences from video using SDPose with built-in person detection."
}
]