fix scripts

2026-05-13 02:33:02 +08:00 · 2026-04-27 13:42:53 -07:00 · 2026-04-27 13:42:53 -07:00 · 978b962300
commit 978b962300
parent 8136fbbb4a
1 changed files with 130 additions and 218 deletions
--- a/benchmarks/benchmark_comfyui_serving.py
+++ b/benchmarks/benchmark_comfyui_serving.py
@ -2,7 +2,7 @@
 """
 Simple serving benchmark client for ComfyUI's HTTP API.
-This script is inspired by diffusion serving benchmarks and is designed to:
+This script is designed to:
  - submit prompts to ComfyUI (/prompt or /bench/prompt),
  - optionally shape request arrivals (fixed rate or Poisson),
  - poll completion via /history/{prompt_id},
@ -15,28 +15,26 @@ Step 1 — Generate prompt files (downloads images, writes JSONs, then exits):
  # Minimal: uses synthetic images, writes to prompts/wan22_i2v/
  python3 benchmarks/benchmark_comfyui_serving.py \\
-    --generate-wan22-prompts \\
+    --generate-prompts --model wan22 --task i2v \\
    --num-requests 50
  # With model download (needs ComfyUI root):
  python3 benchmarks/benchmark_comfyui_serving.py \\
-    --generate-wan22-prompts \\
+    --generate-prompts --model wan22 --task i2v \\
-    --download-models \\
+    --download-models --comfyui-base-dir /path/to/ComfyUI \\
    --comfyui-base-dir /path/to/ComfyUI \\
    --num-requests 50
-  # Custom image/output dirs (input dir must be ComfyUI's input/ folder):
+  # Custom image/output dirs (input-dir must be ComfyUI's input/ folder):
  python3 benchmarks/benchmark_comfyui_serving.py \\
-    --generate-wan22-prompts \\
+    --generate-prompts --model wan22 --task i2v \\
-    --wan22-input-dir /home/ubuntu/ComfyUI/input \\
+    --input-dir /home/ubuntu/ComfyUI/input \\
-    --wan22-output-dir /data/prompts/wan22 \\
+    --prompts-dir /home/ubuntu/ComfyUI/benchmarks/prompts/wan22_i2v \\
-    --wan22-num-images 30 \\
+    --num-images 30 --num-requests 50
    --num-requests 50
 Step 2 — Run the benchmark (point at any one of the generated prompt files):
  python3 benchmarks/benchmark_comfyui_serving.py \\
-    --prompt-file prompts/wan22_i2v/wan22_i2v_prompt_0000.json \\
+    --prompt-file benchmarks/prompts/wan22_i2v/wan22_i2v_prompt_0000.json \\
    --num-requests 50 \\
    --max-concurrency 4 \\
    --host http://127.0.0.1:8188
@ -64,10 +62,17 @@ import aiohttp
 # ──────────────────────────────────────────────────────────────────────────────
-# Wan 2.2 I2V benchmark setup helpers
+# Benchmark setup helpers
 # ──────────────────────────────────────────────────────────────────────────────
-_WAN22_MODELS: list[tuple[str, str]] = [
+# Workflow JSON files live in benchmarks/workflows/<model>_<task>.json.
 _WORKFLOWS_DIR = Path(__file__).parent / "workflows"
 # Placeholder in workflow JSON files that is replaced with the actual image filename.
 _IMAGE_PLACEHOLDER = "__INPUT_IMAGE__"
 # Model weight downloads for wan22/i2v.
 _WAN22_I2V_MODELS: list[tuple[str, str]] = [
    (
        "models/diffusion_models/wan2.2_i2v_low_noise_14B_fp8_scaled.safetensors",
        "https://huggingface.co/Comfy-Org/Wan_2.2_ComfyUI_Repackaged/resolve/main/split_files/diffusion_models/wan2.2_i2v_low_noise_14B_fp8_scaled.safetensors",
@ -94,175 +99,46 @@ _WAN22_MODELS: list[tuple[str, str]] = [
    ),
 ]
 # Placeholder sentinel replaced by generate_prompt_file.
 _IMAGE_PLACEHOLDER = "__INPUT_IMAGE__"
 _WAN22_I2V_GRAPH: dict[str, Any] = {
    "97": {
        "inputs": {"image": _IMAGE_PLACEHOLDER},
        "class_type": "LoadImage",
        "_meta": {"title": "Start Frame Image"},
    },
    "108": {
        "inputs": {
            "filename_prefix": "video/Wan2.2_image_to_video",
            "format": "auto",
            "codec": "auto",
            "video-preview": "",
            "video": ["130:117", 0],
        },
        "class_type": "SaveVideo",
        "_meta": {"title": "Save Video"},
    },
    "130:105": {
        "inputs": {
            "clip_name": "umt5_xxl_fp8_e4m3fn_scaled.safetensors",
            "type": "wan",
            "device": "default",
        },
        "class_type": "CLIPLoader",
        "_meta": {"title": "Load CLIP"},
    },
    "130:106": {
        "inputs": {"vae_name": "wan_2.1_vae.safetensors"},
        "class_type": "VAELoader",
        "_meta": {"title": "Load VAE"},
    },
    "130:107": {
        "inputs": {
            "text": "A felt-style little eagle cashier greeting, waving, and smiling at the camera.",
            "clip": ["130:105", 0],
        },
        "class_type": "CLIPTextEncode",
        "_meta": {"title": "CLIP Text Encode (Positive Prompt)"},
    },
    "130:109": {
        "inputs": {"shift": 5.000000000000001, "model": ["130:126", 0]},
        "class_type": "ModelSamplingSD3",
        "_meta": {"title": "ModelSamplingSD3"},
    },
    "130:110": {
        "inputs": {
            "add_noise": "enable",
            "noise_seed": 636787045983965,
            "steps": 4,
            "cfg": 1,
            "sampler_name": "euler",
            "scheduler": "simple",
            "start_at_step": 0,
            "end_at_step": 2,
            "return_with_leftover_noise": "enable",
            "model": ["130:109", 0],
            "positive": ["130:128", 0],
            "negative": ["130:128", 1],
            "latent_image": ["130:128", 2],
        },
        "class_type": "KSamplerAdvanced",
        "_meta": {"title": "KSampler (Advanced)"},
    },
    "130:111": {
        "inputs": {
            "add_noise": "disable",
            "noise_seed": 0,
            "steps": 4,
            "cfg": 1,
            "sampler_name": "euler",
            "scheduler": "simple",
            "start_at_step": 2,
            "end_at_step": 4,
            "return_with_leftover_noise": "disable",
            "model": ["130:124", 0],
            "positive": ["130:128", 0],
            "negative": ["130:128", 1],
            "latent_image": ["130:110", 0],
        },
        "class_type": "KSamplerAdvanced",
        "_meta": {"title": "KSampler (Advanced)"},
    },
    "130:117": {
        "inputs": {"fps": 16, "images": ["130:129", 0]},
        "class_type": "CreateVideo",
        "_meta": {"title": "Create Video"},
    },
    "130:122": {
        "inputs": {
            "unet_name": "wan2.2_i2v_high_noise_14B_fp8_scaled.safetensors",
            "weight_dtype": "default",
        },
        "class_type": "UNETLoader",
        "_meta": {"title": "Load Diffusion Model"},
    },
    "130:123": {
        "inputs": {
            "unet_name": "wan2.2_i2v_low_noise_14B_fp8_scaled.safetensors",
            "weight_dtype": "default",
        },
        "class_type": "UNETLoader",
        "_meta": {"title": "Load Diffusion Model"},
    },
    "130:124": {
        "inputs": {"shift": 5.000000000000001, "model": ["130:127", 0]},
        "class_type": "ModelSamplingSD3",
        "_meta": {"title": "ModelSamplingSD3"},
    },
    "130:125": {
        "inputs": {
            "text": (
                "色调艳丽，过曝，静态，细节模糊不清，字幕，风格，作品，画作，画面，静止，整体发灰，最差质量，低质量，"
                "JPEG压缩残留，丑陋的，残缺的，多余的手指，画得不好的手部，画得不好的脸部，畸形的，毁容的，"
                "形态畸形的肢体，手指融合，静止不动的画面，杂乱的背景，三条腿，背景人很多，倒着走"
            ),
            "clip": ["130:105", 0],
        },
        "class_type": "CLIPTextEncode",
        "_meta": {"title": "CLIP Text Encode (Negative Prompt)"},
    },
    "130:126": {
        "inputs": {
            "lora_name": "wan2.2_i2v_lightx2v_4steps_lora_v1_high_noise.safetensors",
            "strength_model": 1.0000000000000002,
            "model": ["130:122", 0],
        },
        "class_type": "LoraLoaderModelOnly",
        "_meta": {"title": "Load LoRA"},
    },
    "130:127": {
        "inputs": {
            "lora_name": "wan2.2_i2v_lightx2v_4steps_lora_v1_low_noise.safetensors",
            "strength_model": 1.0000000000000002,
            "model": ["130:123", 0],
        },
        "class_type": "LoraLoaderModelOnly",
        "_meta": {"title": "Load LoRA"},
    },
    "130:128": {
        "inputs": {
            "width": 720,
            "height": 720,
            "length": 81,
            "batch_size": 1,
            "positive": ["130:107", 0],
            "negative": ["130:125", 0],
            "vae": ["130:106", 0],
            "start_image": ["97", 0],
        },
        "class_type": "WanImageToVideo",
        "_meta": {"title": "WanImageToVideo"},
    },
    "130:129": {
        "inputs": {"samples": ["130:111", 0], "vae": ["130:106", 0]},
        "class_type": "VAEDecode",
        "_meta": {"title": "VAE Decode"},
    },
 }
 # Google Drive file IDs from VBench's vbench2_beta_i2v/download_data.sh
 _VBENCH_ORIGIN_ZIP_GDRIVE_ID = "1qhkLCSBkzll0dkKpwlDTwLL0nxdQ4nrY"
 # Registry mapping (model, task) → benchmark configuration.
 # To add a new model/task: drop a workflow JSON in benchmarks/workflows/ and
 # add an entry here.
 _MODEL_REGISTRY: dict[tuple[str, str], dict[str, Any]] = {
    ("wan22", "i2v"): {
        "workflow_file": "wan22_i2v.json",
        "model_files": _WAN22_I2V_MODELS,
        "image_source": "vbench_i2v",
    },
 }
-def download_wan22_models(base_dir: Path) -> None:
+_VALID_MODELS = sorted({m for m, _ in _MODEL_REGISTRY})
-    """Download Wan 2.2 I2V model files into *base_dir* using wget."""
+_VALID_TASKS = sorted({t for _, t in _MODEL_REGISTRY})
-    for rel_path, url in _WAN22_MODELS:
+
 def _replace_in_graph(obj: Any, placeholder: str, value: str) -> None:
    """Recursively replace every occurrence of *placeholder* with *value* in-place."""
    if isinstance(obj, dict):
        for k, v in obj.items():
            if v == placeholder:
                obj[k] = value
            else:
                _replace_in_graph(v, placeholder, value)
    elif isinstance(obj, list):
        for i, item in enumerate(obj):
            if item == placeholder:
                obj[i] = value
            else:
                _replace_in_graph(item, placeholder, value)
 def download_models(base_dir: Path, model: str, task: str) -> None:
    """Download model weights for *model*/*task* into *base_dir* using wget."""
    key = (model, task)
    if key not in _MODEL_REGISTRY:
        raise ValueError(f"No model files registered for {model}/{task}")
    for rel_path, url in _MODEL_REGISTRY[key]["model_files"]:
        dest = base_dir / rel_path
        if dest.exists():
            print(f"[setup] already exists, skipping: {dest}")
@ -328,13 +204,17 @@ def _generate_synthetic_images(input_dir: Path, num_images: int) -> list[str]:
    return filenames
-def prepare_input_images(input_dir: Path, num_images: int = 20) -> list[str]:
+def prepare_input_images(
    input_dir: Path,
    num_images: int = 20,
    image_source: str = "vbench_i2v",
 ) -> list[str]:
    """
    Prepare benchmark input images in *input_dir*.
    Priority:
      1. Reuse any images already present in the directory.
-      2. Download Vchitect/VBench_I2V dataset via huggingface_hub.
+      2. Fetch from the source specified by *image_source* (e.g. "vbench_i2v").
      3. Generate synthetic 720×720 white PNG placeholders with Pillow.
    Returns a list of image basenames (not full paths).
@ -349,9 +229,10 @@ def prepare_input_images(input_dir: Path, num_images: int = 20) -> list[str]:
        print(f"[setup] found {len(existing)} existing images in {input_dir}")
        return existing
-    filenames = _try_download_vbench_i2v(input_dir)
+    if image_source == "vbench_i2v":
-    if filenames:
+        filenames = _try_download_vbench_i2v(input_dir)
-        return filenames
+        if filenames:
            return filenames
    print(f"[setup] generating {num_images} synthetic 720×720 placeholder images ...")
    return _generate_synthetic_images(input_dir, num_images)
@ -359,57 +240,71 @@ def prepare_input_images(input_dir: Path, num_images: int = 20) -> list[str]:
 def generate_prompt_file(
    output_path: Path,
    workflow_path: Path,
    image_filename: str,
    positive_prompt: str | None = None,
 ) -> None:
    """
-    Write a single Wan 2.2 I2V ComfyUI prompt JSON to *output_path*.
+    Write a single ComfyUI prompt JSON to *output_path* from *workflow_path*.
-    *image_filename* is substituted into the LoadImage node (node "97").
+    Replaces every occurrence of the sentinel string "__INPUT_IMAGE__" in the
-    *positive_prompt* overrides the default positive text if provided.
+    workflow graph with *image_filename*.
    """
-    graph: dict[str, Any] = json.loads(json.dumps(_WAN22_I2V_GRAPH))
+    graph: dict[str, Any] = json.loads(workflow_path.read_text())
-    graph["97"]["inputs"]["image"] = image_filename
+    _replace_in_graph(graph, _IMAGE_PLACEHOLDER, image_filename)
    if positive_prompt is not None:
        graph["130:107"]["inputs"]["text"] = positive_prompt
    output_path.parent.mkdir(parents=True, exist_ok=True)
    output_path.write_text(json.dumps({"prompt": graph}, indent=2))
 def generate_prompt_files(
    model: str,
    task: str,
    output_dir: Path,
    input_dir: Path,
    num_prompts: int = 50,
    num_images: int = 20,
-    download_models: bool = False,
+    download_model_weights: bool = False,
    comfyui_base_dir: Path | None = None,
 ) -> list[Path]:
    """
-    Full Wan 2.2 I2V benchmark setup:
+    Full benchmark setup for a given *model*/*task*:
      1. Optionally download model weights into *comfyui_base_dir*.
-      2. Prepare input images in *input_dir* (VBench I2V or synthetic).
+      2. Prepare input images in *input_dir*.
      3. Generate *num_prompts* prompt JSON files in *output_dir*, cycling
         through the available images.
    Returns the list of generated prompt file paths.
    """
-    if download_models:
+    key = (model, task)
    if key not in _MODEL_REGISTRY:
        available = ", ".join(f"{m}/{t}" for m, t in _MODEL_REGISTRY)
        raise ValueError(f"Unknown --model {model!r} --task {task!r}. Available: {available}")
    cfg = _MODEL_REGISTRY[key]
    if download_model_weights:
        if comfyui_base_dir is None:
            raise ValueError("--comfyui-base-dir is required when --download-models is set")
-        download_wan22_models(comfyui_base_dir)
+        download_models(comfyui_base_dir, model, task)
-    image_filenames = prepare_input_images(input_dir, num_images=num_images)
+    image_filenames = prepare_input_images(
        input_dir,
        num_images=num_images,
        image_source=cfg.get("image_source", "synthetic"),
    )
    if not image_filenames:
        raise RuntimeError(f"No input images available in {input_dir}")
    workflow_path = _WORKFLOWS_DIR / cfg["workflow_file"]
    if not workflow_path.exists():
        raise FileNotFoundError(f"Workflow file not found: {workflow_path}")
    output_dir.mkdir(parents=True, exist_ok=True)
    generated: list[Path] = []
    for i in range(num_prompts):
        image_name = image_filenames[i % len(image_filenames)]
-        prompt_path = output_dir / f"wan22_i2v_prompt_{i:04d}.json"
+        prompt_path = output_dir / f"{model}_{task}_prompt_{i:04d}.json"
-        generate_prompt_file(prompt_path, image_name)
+        generate_prompt_file(prompt_path, workflow_path, image_name)
        generated.append(prompt_path)
    print(f"[setup] generated {len(generated)} prompt files in {output_dir}")
@ -705,35 +600,47 @@ def parse_args() -> argparse.Namespace:
        "--prompt-file",
        type=Path,
        default=None,
-        help="Path to prompt JSON. Required unless --generate-wan22-prompts is set.",
+        help="Path to prompt JSON. Required unless --generate-prompts is set.",
    )
    p.add_argument(
-        "--generate-wan22-prompts",
+        "--generate-prompts",
        action="store_true",
-        help="Generate Wan 2.2 I2V prompt files (steps: prepare images, write JSONs) then exit.",
+        help="Prepare input images and generate prompt JSON files, then exit.",
    )
    p.add_argument(
-        "--wan22-input-dir",
+        "--model",
        choices=_VALID_MODELS,
        default=None,
        help=f"Model to benchmark. Required with --generate-prompts. Choices: {_VALID_MODELS}.",
    )
    p.add_argument(
        "--task",
        choices=_VALID_TASKS,
        default=None,
        help=f"Task type. Required with --generate-prompts. Choices: {_VALID_TASKS}.",
    )
    p.add_argument(
        "--input-dir",
        type=Path,
        default=Path("input"),
-        help="Directory for benchmark input images. Must be ComfyUI's input/ folder so LoadImage can find them (default: input/).",
+        help="ComfyUI input image directory (default: input/). LoadImage resolves files from this folder.",
    )
    p.add_argument(
-        "--wan22-output-dir",
+        "--prompts-dir",
        type=Path,
-        default=Path("prompts/wan22_i2v"),
+        default=None,
-        help="Directory where generated prompt JSON files are written (default: prompts/wan22_i2v/).",
+        help="Directory where generated prompt JSON files are written (default: benchmarks/prompts/<model>_<task>/).",
    )
    p.add_argument(
-        "--wan22-num-images",
+        "--num-images",
        type=int,
        default=20,
-        help="Number of synthetic images to generate when VBench download is unavailable (default: 20).",
+        help="Number of synthetic images to generate when dataset download is unavailable (default: 20).",
    )
    p.add_argument(
        "--download-models",
        action="store_true",
-        help="Download Wan 2.2 model weights before generating prompts (requires --comfyui-base-dir).",
+        help="Download model weights before generating prompts (requires --comfyui-base-dir).",
    )
    p.add_argument(
        "--comfyui-base-dir",
@ -762,7 +669,7 @@ def parse_args() -> argparse.Namespace:
 async def async_main(args: argparse.Namespace) -> None:
    if args.prompt_file is None:
-        raise SystemExit("error: --prompt-file is required (or use --generate-wan22-prompts to create one)")
+        raise SystemExit("error: --prompt-file is required (or use --generate-prompts to create one)")
    prompt_template = load_prompt_template(args.prompt_file)
    schedule = build_arrival_schedule(
        num_requests=args.num_requests,
@ -807,13 +714,18 @@ async def async_main(args: argparse.Namespace) -> None:
 def main() -> None:
    args = parse_args()
-    if args.generate_wan22_prompts:
+    if args.generate_prompts:
        if not args.model or not args.task:
            raise SystemExit("error: --model and --task are required with --generate-prompts")
        prompts_dir = args.prompts_dir or Path("benchmarks/prompts") / f"{args.model}_{args.task}"
        generate_prompt_files(
-            output_dir=args.wan22_output_dir,
+            model=args.model,
-            input_dir=args.wan22_input_dir,
+            task=args.task,
            output_dir=prompts_dir,
            input_dir=args.input_dir,
            num_prompts=args.num_requests,
-            num_images=args.wan22_num_images,
+            num_images=args.num_images,
-            download_models=args.download_models,
+            download_model_weights=args.download_models,
            comfyui_base_dir=args.comfyui_base_dir,
        )
        return