Update categories and add new blueprints

2026-06-16 21:09:48 +08:00 · 2026-05-25 18:01:48 +08:00 · 2026-05-25 18:01:48 +08:00 · 577c56bb6b
commit 577c56bb6b
parent 1c8d4ca092
24 changed files with 2370 additions and 32 deletions
--- a/(Z-Image-Turbo).json
+++ b/(Z-Image-Turbo).json
@@ -1553,7 +1553,7 @@
          "VHS_MetadataImage": true,
          "VHS_KeepIntermediate": true
        },
-        "category": "Image generation and editing/Canny to image",
+        "category": "Image generation and editing/Conditioned",
        "description": "Generates an image from a Canny edge map using Z-Image-Turbo, with text conditioning."
      }
    ]
--- a/blueprints/Canny
+++ b/blueprints/Canny
@@ -3600,7 +3600,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Video generation and editing/Canny to video",
+        "category": "Video generation and editing/Conditioned",
        "description": "Generates video from Canny edge maps using LTX-2, with optional synchronized audio."
      }
    ]
--- a/blueprints/ControlNet
+++ b/blueprints/ControlNet
@@ -1401,7 +1401,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Image generation and editing/ControlNet",
+        "category": "Image generation and editing/Conditioned",
        "description": "Generates images from a text prompt and ControlNet conditioning (e.g. depth, canny) using Z-Image-Turbo."
      }
    ]
--- a/(Z-Image-Turbo).json
+++ b/(Z-Image-Turbo).json
@@ -1579,7 +1579,7 @@
          "VHS_MetadataImage": true,
          "VHS_KeepIntermediate": true
        },
-        "category": "Image generation and editing/Depth to image",
+        "category": "Image generation and editing/Conditioned",
        "description": "Generates an image from a depth map using Z-Image-Turbo with text conditioning."
      },
      {
--- a/blueprints/Depth
+++ b/blueprints/Depth
@@ -4233,7 +4233,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Video generation and editing/Depth to video",
+        "category": "Video generation and editing/Conditioned",
        "description": "Generates depth-controlled video with LTX-2: motion and structure follow a depth-reference video alongside text prompting, optional first-frame image conditioning, with optional synchronized audio."
      },
      {
@@ -5194,8 +5194,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "description": "Estimates a monocular depth map from an input image using the Lotus depth estimation model.",
-        "category": "Video generation and editing/Depth to video"
+        "description": "Estimates a monocular depth map from an input image using the Lotus depth estimation model."
      }
    ]
  },
--- a/blueprints/First-Last-Frame
+++ b/blueprints/First-Last-Frame
@@ -3350,7 +3350,7 @@
          }
        ],
        "extra": {},
-        "category": "Video generation and editing/First-Last-Frame to Video",
+        "category": "Video generation and editing/Conditioned",
        "description": "Generates a video interpolating between first and last keyframes using LTX-2.3."
      }
    ]
--- a/blueprints/First-Last-Frame
+++ b/blueprints/First-Last-Frame
@@ -3350,7 +3350,7 @@
          }
        ],
        "extra": {},
-        "category": "Video generation and editing/First-Last-Frame to Video",
+        "category": "Video generation and editing/FLF2V",
        "description": "Generates a video that interpolates between the first and last keyframes using LTX-2.3, including optional audio."
      }
    ]
--- a/blueprints/Geometry
+++ b/blueprints/Geometry
@@ -1256,6 +1256,8 @@
            "type": "BOOLEAN"
          }
        ],
+        "category": "3D/Geometry Estimation",
+        "description": "Estimates 3D scene geometry from an input image using MoGe, outputting a mesh plus OpenGL and DirectX normal maps.",
        "extra": {}
      }
    ]
--- a/blueprints/Image
+++ b/blueprints/Image
@@ -310,9 +310,9 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Text generation/Image Captioning",
+        "category": "Image Tools",
        "description": "Generates descriptive captions for images using Google's Gemini multimodal LLM."
      }
    ]
  }
-}
+}
--- a/blueprints/Image
+++ b/blueprints/Image
@@ -15,7 +15,7 @@
        330
      ],
      "flags": {},
-      "order": 3,
+      "order": 0,
      "mode": 0,
      "inputs": [
        {
@@ -80,6 +80,7 @@
          "links": []
        }
      ],
+      "title": "Image Depth Estimation (MoGe)",
      "properties": {
        "proxyWidgets": [
          [
@@ -109,8 +110,7 @@
        "secondTabOffset": 80,
        "secondTabWidth": 65
      },
-      "widgets_values": [],
-      "title": "Depth Estimation (MoGe)"
+      "widgets_values": []
    }
  ],
  "links": [],
@@ -128,7 +128,8 @@
        },
        "revision": 0,
        "config": {},
-        "name": "Depth Estimation (MoGe)",
+        "name": "Image Depth Estimation (MoGe)",
+        "description": "Estimates monocular depth from an input image using MoGe, outputting both raw and colorized depth maps plus a mask.",
        "inputNode": {
          "id": -10,
          "bounding": [
--- a/(Mediapipe).json
+++ b/(Mediapipe).json
@@ -15,7 +15,7 @@
        400
      ],
      "flags": {},
-      "order": 3,
+      "order": 0,
      "mode": 0,
      "inputs": [
        {
@@ -119,6 +119,7 @@
          "links": []
        }
      ],
+      "title": "Image Face Detection (Mediapipe)",
      "properties": {
        "proxyWidgets": [
          [
@@ -164,8 +165,7 @@
        "secondTabOffset": 80,
        "secondTabWidth": 65
      },
-      "widgets_values": [],
-      "title": "Face Detection (Mediapipe)"
+      "widgets_values": []
    }
  ],
  "links": [],
@@ -183,7 +183,8 @@
        },
        "revision": 0,
        "config": {},
-        "name": "Face Detection (Mediapipe)",
+        "name": "Image Face Detection (Mediapipe)",
+        "description": "Detects facial landmarks from an image using MediaPipe, outputting landmark data, face bounding boxes, and an optional face-region mask.",
        "inputNode": {
          "id": -10,
          "bounding": [
@@ -769,7 +770,8 @@
            "type": "COMBO"
          }
        ],
-        "extra": {}
+        "extra": {},
+        "category": "Conditioning & Preprocessors/Face Detection"
      }
    ]
  },
--- a/blueprints/Image
+++ b/blueprints/Image
@@ -703,7 +703,7 @@
          }
        ],
        "extra": {},
-        "category": "Image Tools/Image Segmentation",
+        "category": "Conditioning & Preprocessors/Segmentation & Mask",
        "description": "Segments images into masks using Meta SAM3 from text prompts, points, or boxes."
      }
    ]
--- a/blueprints/Image
+++ b/blueprints/Image
@@ -948,7 +948,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Image Tools/Preprocessors",
+        "category": "Conditioning & Preprocessors/Depth",
        "description": "Estimates a monocular depth map from an input image using the Lotus depth estimation model."
      }
    ]
--- a/Multi-Person).json
+++ b/Multi-Person).json
@@ -1197,7 +1197,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Image Tools/Preprocessors",
+        "category": "Conditioning & Preprocessors/Pose",
        "description": "Detects multiple people in an image and outputs per-person pose keypoints, skeleton renders, and bounding boxes using SDPose."
      }
    ]
--- a/(SDPose-OOD).json
+++ b/(SDPose-OOD).json
@@ -877,7 +877,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Image Tools/Preprocessors",
+        "category": "Conditioning & Preprocessors/Pose",
        "description": "Extracts human pose keypoints and stick-figure visuals from an image using SDPose-OOD, with optional bounding-box input per subject."
      }
    ]
--- a/(Z-Image-Turbo).json
+++ b/(Z-Image-Turbo).json
@@ -1298,7 +1298,7 @@
          "VHS_MetadataImage": true,
          "VHS_KeepIntermediate": true
        },
-        "category": "Image generation and editing/Pose to image",
+        "category": "Image generation and editing/Conditioned",
        "description": "Generates an image from pose keypoints using Z-Image-Turbo with text conditioning."
      }
    ]
--- a/blueprints/Pose
+++ b/blueprints/Pose
@@ -3870,7 +3870,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Video generation and editing/Pose to video",
+        "category": "Video generation and editing/Conditioned",
        "description": "Generates video from pose reference frames using LTX-2, with optional synchronized audio."
      }
    ]
--- a/blueprints/Prompt
+++ b/blueprints/Prompt
@@ -270,7 +270,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Text generation/Prompt enhance",
+        "category": "Text Tools",
        "description": "Expands short text prompts into detailed descriptions using a text generation model for better generation quality."
      }
    ]
--- a/blueprints/Video
+++ b/blueprints/Video
@@ -307,9 +307,9 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Text generation/Video Captioning",
+        "category": "Video Tools",
        "description": "Generates descriptive captions for video input using Google's Gemini multimodal LLM."
      }
    ]
  }
-}
+}
--- a/blueprints/Video
+++ b/blueprints/Video
--- a/(Mediapipe).json
+++ b/(Mediapipe).json
--- a/blueprints/Video
+++ b/blueprints/Video
@@ -3768,7 +3768,7 @@
          }
        ],
        "extra": {},
-        "category": "Video Tools",
+        "category": "Video generation and editing/Inpaint video",
        "description": "Removes objects from video by inpainting masked regions using VOID (CogVideoX), with SAM3 text-guided segmentation and optional two-pass optical-flow refinement."
      },
      {
--- a/blueprints/Video
+++ b/blueprints/Video
@@ -818,7 +818,7 @@
          }
        ],
        "extra": {},
-        "category": "Video Tools",
+        "category": "Conditioning & Preprocessors/Segmentation & Mask",
        "description": "Segments video into temporally consistent masks using Meta SAM3 from text or interactive prompts."
      }
    ]
--- a/Multi-Person).json
+++ b/Multi-Person).json
@@ -1314,7 +1314,7 @@
        "extra": {
          "workflowRendererVersion": "LG"
        },
-        "category": "Video Tools",
+        "category": "Conditioning & Preprocessors/Pose",
        "description": "Extracts multi-person pose keypoints and skeleton frame sequences from video using SDPose with built-in person detection."
      }
    ]